Spaces:

FINAL-Bench
/

LiteRT-LM

Running

App Files Files Community

LiteRT-LM / runtime /executor /executor_settings_base_test.cc

SeaWolf-AI

Upload full LiteRT-LM codebase

5f923cd verified 3 days ago

raw

history blame contribute delete

6.97 kB

	// Copyright 2025 The ODML Authors.
	//
	// Licensed under the Apache License, Version 2.0 (the "License");
	// you may not use this file except in compliance with the License.
	// You may obtain a copy of the License at
	//
	// http://www.apache.org/licenses/LICENSE-2.0
	//
	// Unless required by applicable law or agreed to in writing, software
	// distributed under the License is distributed on an "AS IS" BASIS,
	// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
	// See the License for the specific language governing permissions and
	// limitations under the License.

	#include "runtime/executor/executor_settings_base.h"

	#include <memory>
	#include <sstream>
	#include <string>
	#include <utility>
	#include <variant>

	#include <gmock/gmock.h>
	#include <gtest/gtest.h>
	#include "absl/status/status.h" // from @com_google_absl
	#include "absl/strings/string_view.h" // from @com_google_absl
	#include "runtime/util/memory_mapped_file.h"
	#include "runtime/util/test_utils.h" // NOLINT

	namespace litert::lm {
	namespace {

	TEST(LlmExecutorConfigTest, Backend) {
	Backend backend;
	std::stringstream oss;
	backend = Backend::CPU_ARTISAN;
	oss << backend;
	EXPECT_EQ(oss.str(), "CPU_ARTISAN");

	backend = Backend::GPU_ARTISAN;
	oss.str("");
	oss << backend;
	EXPECT_EQ(oss.str(), "GPU_ARTISAN");

	backend = Backend::GPU;
	oss.str("");
	oss << backend;
	EXPECT_EQ(oss.str(), "GPU");

	backend = Backend::CPU;
	oss.str("");
	oss << backend;
	EXPECT_EQ(oss.str(), "CPU");

	backend = Backend::GOOGLE_TENSOR_ARTISAN;
	oss.str("");
	oss << backend;
	EXPECT_EQ(oss.str(), "GOOGLE_TENSOR_ARTISAN");

	backend = Backend::NPU;
	oss.str("");
	oss << backend;
	EXPECT_EQ(oss.str(), "NPU");
	}

	TEST(LlmExecutorConfigTest, StringToBackend) {
	auto backend = GetBackendFromString("cpu_artisan");
	EXPECT_EQ(*backend, Backend::CPU_ARTISAN);
	backend = GetBackendFromString("gpu_artisan");
	EXPECT_EQ(*backend, Backend::GPU_ARTISAN);
	backend = GetBackendFromString("gpu");
	EXPECT_EQ(*backend, Backend::GPU);
	backend = GetBackendFromString("cpu");
	EXPECT_EQ(*backend, Backend::CPU);
	backend = GetBackendFromString("google_tensor_artisan");
	EXPECT_EQ(*backend, Backend::GOOGLE_TENSOR_ARTISAN);
	backend = GetBackendFromString("npu");
	EXPECT_EQ(*backend, Backend::NPU);
	}

	TEST(LlmExecutorConfigTest, StringToActivationDataType) {
	auto activation_data_type = GetActivationDataTypeFromString("float32");
	EXPECT_EQ(*activation_data_type, ActivationDataType::FLOAT32);
	activation_data_type = GetActivationDataTypeFromString("float16");
	EXPECT_EQ(*activation_data_type, ActivationDataType::FLOAT16);
	activation_data_type = GetActivationDataTypeFromString("int16");
	EXPECT_EQ(*activation_data_type, ActivationDataType::INT16);
	activation_data_type = GetActivationDataTypeFromString("int8");
	EXPECT_EQ(*activation_data_type, ActivationDataType::INT8);
	activation_data_type = GetActivationDataTypeFromString("invalid");
	EXPECT_EQ(activation_data_type.status(),
	absl::InvalidArgumentError(
	"Unsupported activation data type: invalid. Supported "
	"activation data types are: [FLOAT32, "
	"FLOAT16, INT16, INT8]"));
	}

	TEST(LlmExecutorConfigTest, ActivatonDataType) {
	ActivationDataType act;
	std::stringstream oss;
	act = ActivationDataType::FLOAT32;
	oss << act;
	EXPECT_EQ(oss.str(), "FLOAT32");

	act = ActivationDataType::FLOAT16;
	oss.str("");
	oss << act;
	EXPECT_EQ(oss.str(), "FLOAT16");
	}

	TEST(LlmExecutorConfigTest, FakeWeightsMode) {
	FakeWeightsMode fake_weights_mode;
	std::stringstream oss;
	fake_weights_mode = FakeWeightsMode::FAKE_WEIGHTS_NONE;
	oss << fake_weights_mode;
	EXPECT_EQ(oss.str(), "FAKE_WEIGHTS_NONE");

	fake_weights_mode = FakeWeightsMode::FAKE_WEIGHTS_8BITS_ALL_LAYERS;
	oss.str("");
	oss << fake_weights_mode;
	EXPECT_EQ(oss.str(), "FAKE_WEIGHTS_8BITS_ALL_LAYERS");

	fake_weights_mode = FakeWeightsMode::FAKE_WEIGHTS_ATTN_8_FFN_4_EMB_4;
	oss.str("");
	oss << fake_weights_mode;
	EXPECT_EQ(oss.str(), "FAKE_WEIGHTS_ATTN_8_FFN_4_EMB_4");
	}

	TEST(LlmExecutorConfigTest, FileFormat) {
	std::stringstream oss;

	oss.str("");
	oss << FileFormat::TFLITE;
	EXPECT_EQ(oss.str(), "TFLITE");

	oss.str("");
	oss << FileFormat::TASK;
	EXPECT_EQ(oss.str(), "TASK");

	oss.str("");
	oss << FileFormat::LITERT_LM;
	EXPECT_EQ(oss.str(), "LITERT_LM");
	}

	TEST(LlmExecutorConfigTest, ModelAssets) {
	auto model_assets = ModelAssets::Create("/path/to/model1");
	ASSERT_OK(model_assets);
	std::stringstream oss;
	oss << *model_assets;
	const std::string expected_output = R"(model_path: /path/to/model1
	fake_weights_mode: FAKE_WEIGHTS_NONE
	)";
	EXPECT_EQ(oss.str(), expected_output);
	}

	TEST(LlmExecutorConfigTest, ModelAssetsMemoryMapped) {
	const std::string model_content = "some fake model content";
	ASSERT_OK_AND_ASSIGN(std::unique_ptr<MemoryMappedFile> memory_mapped_file,
	InMemoryFile::Create(model_content));
	MemoryMappedFile* raw_ptr = memory_mapped_file.get();
	auto model_assets = ModelAssets::Create(std::move(memory_mapped_file));
	ASSERT_OK(model_assets);
	EXPECT_TRUE(model_assets->HasMemoryMappedFile());
	ASSERT_OK_AND_ASSIGN(auto retrieved_mmf, model_assets->GetMemoryMappedFile());
	EXPECT_EQ(retrieved_mmf.get(), raw_ptr);
	EXPECT_EQ(retrieved_mmf->length(), model_content.length());
	EXPECT_EQ(
	absl::string_view(reinterpret_cast<const char*>(retrieved_mmf->data()),
	retrieved_mmf->length()),
	model_content);

	std::stringstream oss;
	oss << *model_assets;
	EXPECT_THAT(oss.str(), testing::HasSubstr("model_file memory mapped file"));
	EXPECT_THAT(oss.str(), testing::HasSubstr("FAKE_WEIGHTS_NONE"));
	}

	class TestExecutorSettings : public ExecutorSettingsBase {
	public:
	explicit TestExecutorSettings(ModelAssets model_assets)
	: ExecutorSettingsBase(std::move(model_assets)) {}
	};

	TEST(LlmExecutorConfigTest, GetProgramCacheFile) {
	auto model_assets = ModelAssets::Create("/path/to/model.tflite");
	ASSERT_OK(model_assets);
	TestExecutorSettings settings(*model_assets);
	settings.SetCacheDir("/cache/dir");

	auto result = settings.GetProgramCacheFile();
	ASSERT_OK(result);
	EXPECT_TRUE(std::holds_alternative<std::string>(*result));
	EXPECT_THAT(std::get<std::string>(*result),
	testing::HasSubstr("model.tflite.program_cache"));
	}

	TEST(LlmExecutorConfigTest, GetProgramCacheFileWithSuffix) {
	auto model_assets = ModelAssets::Create("/path/to/model.tflite");
	ASSERT_OK(model_assets);
	TestExecutorSettings settings(*model_assets);
	settings.SetCacheDir("/cache/dir");

	auto result = settings.GetProgramCacheFile(".mysuffix");
	ASSERT_OK(result);
	EXPECT_TRUE(std::holds_alternative<std::string>(*result));
	EXPECT_THAT(std::get<std::string>(*result),
	testing::HasSubstr("model.tflite.mysuffix"));
	}

	} // namespace
	} // namespace litert::lm