#include "runtime/components/constrained_decoding/constraint_provider_factory.h"
#include <string>
#include <vector>
#include <gmock/gmock.h>
#include <gtest/gtest.h>
#include "absl/status/status.h" // from @com_google_absl
#include "absl/status/statusor.h" // from @com_google_absl
#include "absl/strings/string_view.h" // from @com_google_absl
#include "runtime/components/constrained_decoding/constraint_provider_config.h"
#include "runtime/components/constrained_decoding/external_constraint_config.h"
#include "runtime/components/constrained_decoding/llg_constraint_config.h"
#include "runtime/components/tokenizer.h"
#include "runtime/util/test_utils.h" // NOLINT
namespace litert::lm {
namespace {
using ::testing::Return;
// gMock stand-in for the Tokenizer interface. Every overridden method is
// mocked, so a test can script return values without a real vocabulary.
class MockTokenizer : public Tokenizer {
 public:
  // Const queries.
  MOCK_METHOD(TokenizerType, GetTokenizerType, (), (const, override));
  MOCK_METHOD(std::vector<std::string>, GetTokens, (), (const, override));

  // Conversions between text, single tokens and token-id sequences.
  MOCK_METHOD(absl::StatusOr<TokenIds>, TextToTokenIds, (absl::string_view),
              (override));
  MOCK_METHOD(absl::StatusOr<std::string>, TokenIdsToText, (const TokenIds&),
              (override));
  MOCK_METHOD(absl::StatusOr<int>, TokenToId, (absl::string_view),
              (override));
};
// Fixture for the CreateConstraintProvider tests. It owns the mock tokenizer
// that each TEST_F hands to the factory.
class ConstraintProviderFactoryTest : public ::testing::Test {
 protected:
  // Mock tokenizer passed by the tests into CreateConstraintProvider.
  MockTokenizer tokenizer_;
};
// A default-constructed ExternalConstraintConfig with an empty stop-token list
// must produce an OK result holding a non-null provider.
TEST_F(ConstraintProviderFactoryTest, CreateExternalConstraintProvider) {
  ExternalConstraintConfig config;
  std::vector<std::vector<int>> stop_token_ids;

  auto provider = CreateConstraintProvider(config, tokenizer_, stop_token_ids);

  // Stream the status so that a failure reports why the factory rejected the
  // request instead of only "Actual: false".
  ASSERT_TRUE(provider.ok()) << provider.status();
  EXPECT_NE(provider.value(), nullptr);
}
// An LlGuidanceConfig with an explicit eos_id must produce an OK result
// holding a non-null provider. The tokenizer is expected to be asked for its
// token list exactly once.
TEST_F(ConstraintProviderFactoryTest, CreateLlgConstraintProvider) {
  LlGuidanceConfig config;
  config.eos_id = 1;
  std::vector<std::vector<int>> stop_token_ids;
  EXPECT_CALL(tokenizer_, GetTokens())
      .WillOnce(Return(std::vector<std::string>{"<pad>", "<eos>", "a", "b"}));

  auto provider = CreateConstraintProvider(config, tokenizer_, stop_token_ids);

  // Stream the status so that a failure reports why the factory rejected the
  // request instead of only "Actual: false".
  ASSERT_TRUE(provider.ok()) << provider.status();
  EXPECT_NE(provider.value(), nullptr);
}
// With eos_id left unset but a stop token sequence supplied, creation must
// still succeed and yield a non-null provider.
TEST_F(ConstraintProviderFactoryTest, CreateLlgConstraintProviderInferEosId) {
  LlGuidanceConfig config;
  // eos_id is missing, but stop_token_ids has a valid token.
  std::vector<std::vector<int>> stop_token_ids = {{2}};
  EXPECT_CALL(tokenizer_, GetTokens())
      .WillOnce(Return(std::vector<std::string>{"<pad>", "<eos>", "a", "b"}));

  auto provider = CreateConstraintProvider(config, tokenizer_, stop_token_ids);

  // Stream the status so that a failure reports why the factory rejected the
  // request instead of only "Actual: false".
  ASSERT_TRUE(provider.ok()) << provider.status();
  EXPECT_NE(provider.value(), nullptr);
}
// With eos_id left unset and no stop tokens supplied, the factory must refuse
// the request with kInvalidArgument.
TEST_F(ConstraintProviderFactoryTest, CreateLlgConstraintProviderMissingEosId) {
  // Arrange: eos_id is never assigned and the stop-token list stays empty.
  LlGuidanceConfig llg_config;
  std::vector<std::vector<int>> no_stop_tokens;

  // Act.
  auto result =
      CreateConstraintProvider(llg_config, tokenizer_, no_stop_tokens);

  // Assert: creation fails, and specifically as an invalid argument.
  EXPECT_FALSE(result.ok());
  EXPECT_EQ(result.status().code(), absl::StatusCode::kInvalidArgument);
}
} // namespace
} // namespace litert::lm
|