File size: 3,020 Bytes
5f923cd
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
#include "runtime/components/constrained_decoding/constraint_provider_factory.h"

#include <string>
#include <vector>

#include <gmock/gmock.h>
#include <gtest/gtest.h>
#include "absl/status/status.h"  // from @com_google_absl
#include "absl/status/statusor.h"  // from @com_google_absl
#include "absl/strings/string_view.h"  // from @com_google_absl
#include "runtime/components/constrained_decoding/constraint_provider_config.h"
#include "runtime/components/constrained_decoding/external_constraint_config.h"
#include "runtime/components/constrained_decoding/llg_constraint_config.h"
#include "runtime/components/tokenizer.h"
#include "runtime/util/test_utils.h"  // NOLINT

namespace litert::lm {
namespace {

using ::testing::Return;

// gMock implementation of the Tokenizer interface. It lets the tests below
// hand a tokenizer to CreateConstraintProvider and script its replies without
// a real vocabulary.
class MockTokenizer : public Tokenizer {
 public:
  // Tokenizer identity and vocabulary listing.
  MOCK_METHOD(TokenizerType, GetTokenizerType, (), (const, override));
  MOCK_METHOD(std::vector<std::string>, GetTokens, (), (const, override));

  // Conversions between text, single tokens and token ids.
  MOCK_METHOD(absl::StatusOr<int>, TokenToId, (absl::string_view token),
              (override));
  MOCK_METHOD(absl::StatusOr<TokenIds>, TextToTokenIds,
              (absl::string_view text), (override));
  MOCK_METHOD(absl::StatusOr<std::string>, TokenIdsToText,
              (const TokenIds& token_ids), (override));
};

// Test fixture for the CreateConstraintProvider tests in this file. It owns
// the mock tokenizer that each test passes to the factory.
class ConstraintProviderFactoryTest : public ::testing::Test {
 protected:
  // Mock handed to CreateConstraintProvider; tests add EXPECT_CALLs on it when
  // they need it to return a vocabulary.
  MockTokenizer tokenizer_;
};

// A default-constructed ExternalConstraintConfig with no stop tokens must
// yield an OK result holding a non-null provider. No tokenizer expectations
// are set for this path.
TEST_F(ConstraintProviderFactoryTest, CreateExternalConstraintProvider) {
  ExternalConstraintConfig config;
  std::vector<std::vector<int>> stop_token_ids;

  auto provider = CreateConstraintProvider(config, tokenizer_, stop_token_ids);

  // Stream the status so a failing run reports the actual error instead of
  // just "provider.ok() is false". ASSERT (not EXPECT) guards the value()
  // access below.
  ASSERT_TRUE(provider.ok()) << provider.status();
  EXPECT_NE(provider.value(), nullptr);
}

// An LlGuidanceConfig with an explicit eos_id and no stop tokens must yield an
// OK result holding a non-null provider.
TEST_F(ConstraintProviderFactoryTest, CreateLlgConstraintProvider) {
  LlGuidanceConfig config;
  config.eos_id = 1;
  std::vector<std::vector<int>> stop_token_ids;

  // The vocabulary is expected to be requested exactly once (WillOnce); the
  // mock answers with a four-entry vocabulary.
  EXPECT_CALL(tokenizer_, GetTokens())
      .WillOnce(Return(std::vector<std::string>{"<pad>", "<eos>", "a", "b"}));

  auto provider = CreateConstraintProvider(config, tokenizer_, stop_token_ids);

  // Stream the status so a failing run reports the actual error instead of
  // just "provider.ok() is false". ASSERT (not EXPECT) guards the value()
  // access below.
  ASSERT_TRUE(provider.ok()) << provider.status();
  EXPECT_NE(provider.value(), nullptr);
}

// An LlGuidanceConfig whose eos_id is not set by the test must still yield a
// non-null provider when stop_token_ids supplies a token. Per the test name,
// the factory presumably infers the EOS id from stop_token_ids; confirm
// against the factory implementation.
TEST_F(ConstraintProviderFactoryTest, CreateLlgConstraintProviderInferEosId) {
  LlGuidanceConfig config;
  // eos_id is missing, but stop_token_ids has a valid token.
  std::vector<std::vector<int>> stop_token_ids = {{2}};

  // The vocabulary is expected to be requested exactly once (WillOnce); the
  // mock answers with a four-entry vocabulary.
  EXPECT_CALL(tokenizer_, GetTokens())
      .WillOnce(Return(std::vector<std::string>{"<pad>", "<eos>", "a", "b"}));

  auto provider = CreateConstraintProvider(config, tokenizer_, stop_token_ids);

  // Stream the status so a failing run reports the actual error instead of
  // just "provider.ok() is false". ASSERT (not EXPECT) guards the value()
  // access below.
  ASSERT_TRUE(provider.ok()) << provider.status();
  EXPECT_NE(provider.value(), nullptr);
}

// Error path: with eos_id not set on the LlGuidanceConfig and no stop tokens
// supplied, the factory must fail with kInvalidArgument.
TEST_F(ConstraintProviderFactoryTest, CreateLlgConstraintProviderMissingEosId) {
  // Neither possible source of an EOS id is populated: the stop token list is
  // empty and the config is left default-constructed.
  std::vector<std::vector<int>> no_stop_tokens;
  LlGuidanceConfig config_without_eos;

  auto result =
      CreateConstraintProvider(config_without_eos, tokenizer_, no_stop_tokens);

  const absl::Status creation_status = result.status();
  EXPECT_FALSE(result.ok());
  EXPECT_EQ(creation_status.code(), absl::StatusCode::kInvalidArgument);
}

}  // namespace
}  // namespace litert::lm