Spaces:

FINAL-Bench
/

LiteRT-LM

Running

App Files Files Community

LiteRT-LM / runtime /components /stop_token_detector_test.cc

SeaWolf-AI

Upload full LiteRT-LM codebase

5f923cd verified 6 days ago

raw

history blame contribute delete

4.83 kB

	// Copyright 2025 The ODML Authors.
	//
	// Licensed under the Apache License, Version 2.0 (the "License");
	// you may not use this file except in compliance with the License.
	// You may obtain a copy of the License at
	//
	// http://www.apache.org/licenses/LICENSE-2.0
	//
	// Unless required by applicable law or agreed to in writing, software
	// distributed under the License is distributed on an "AS IS" BASIS,
	// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
	// See the License for the specific language governing permissions and
	// limitations under the License.

	#include "runtime/components/stop_token_detector.h"

	#include <cstddef>
	#include <vector>

	#include <gmock/gmock.h>
	#include <gtest/gtest.h>
	#include "absl/status/status.h" // from @com_google_absl
	#include "absl/types/span.h" // from @com_google_absl
	#include "runtime/util/test_utils.h" // NOLINT

	namespace litert::lm {
	namespace {

	TEST(StopTokenDetectorTest, AddStopSequence) {
	StopTokenDetector detector(1);
	EXPECT_TRUE(detector.AddStopTokenSequence({1, 2, 3}).ok());

	// Adding an empty sequence should fail
	EXPECT_EQ(absl::StatusCode::kInvalidArgument,
	detector.AddStopTokenSequence({}).code());

	// Adding a repeated sequence should be a no-op.
	EXPECT_EQ(absl::StatusCode::kOk,
	detector.AddStopTokenSequence({1, 2, 3}).code());

	EXPECT_TRUE(detector.AddStopTokenSequence({9}).ok());
	}

	TEST(StopTokenDetectorTest, ProcessTokensSingleStopToken) {
	StopTokenDetector detector(2); // Batch size 2
	EXPECT_OK(detector.AddStopTokenSequence({5}));

	std::vector<int> tokens_item0 = {3, 4, 5, 6, 7};
	std::vector<int> tokens_item1 = {1, 0, 6, 5, 99};

	// Simulate processing token by token
	size_t i;
	for (i = 0; i < tokens_item0.size(); ++i) {
	std::vector<int> current_batch_tokens = {tokens_item0[i], tokens_item1[i]};
	EXPECT_TRUE(
	detector.ProcessTokens(absl::MakeSpan(current_batch_tokens)).ok());
	if (detector.AllDone().value()) {
	break;
	}
	}
	// Stop token, 5, is found for all batch items at step 3.
	EXPECT_EQ(i, 3);

	const auto& steps_before_stop_tokens = detector.GetStepsBeforeStopTokens();
	EXPECT_EQ(2, steps_before_stop_tokens.size());
	// Batch item 0: stop token found at step 2, the current step is 3. So the
	// steps before stop token is 2 = (3 - 2 + 1(# stop tokens)).
	EXPECT_EQ(2, steps_before_stop_tokens[0]);

	// Batch item 1: stop token found at step 3, the current step is 3. So the
	// steps before stop token is = (3 - 3 + 1(# stop tokens)).
	EXPECT_EQ(1, steps_before_stop_tokens[1]);
	}


	TEST(StopTokenDetectorTest, ProcessTokensMultipleStopTokens) {
	StopTokenDetector detector(2); // Batch size 2
	EXPECT_OK(detector.AddStopTokenSequence({5}));
	EXPECT_OK(detector.AddStopTokenSequence({7, 8, 9}));

	std::vector<int> tokens_item0 = {3, 6, 7, 8, 9, 10, 11, 12};
	std::vector<int> tokens_item1 = {1, 0, 0, 0, 0, 6, 5, 99};

	// Simulate processing token by token
	size_t i;
	for (i = 0; i < tokens_item0.size(); ++i) {
	std::vector<int> current_batch_tokens = {tokens_item0[i], tokens_item1[i]};
	EXPECT_TRUE(
	detector.ProcessTokens(absl::MakeSpan(current_batch_tokens)).ok());
	if (detector.AllDone().value()) {
	break;
	}
	if (i < 2) {
	EXPECT_EQ(0, detector.MaxPartialStopTokenLength(0));
	} else if (i < 4) {
	EXPECT_EQ(i - 1, detector.MaxPartialStopTokenLength(0));
	} else {
	EXPECT_EQ(3, detector.MaxPartialStopTokenLength(0));
	}
	EXPECT_EQ(0, detector.MaxPartialStopTokenLength(1));
	}
	// Stop tokens are found for all batch items at step 6.
	EXPECT_EQ(i, 6);

	const auto& steps_before_stop_tokens = detector.GetStepsBeforeStopTokens();
	EXPECT_EQ(2, steps_before_stop_tokens.size());

	// Batch item 0: stop token found at step 5, the current step is 6. So the
	// steps before stop token is 4 = (6 - 5 + 3(# stop tokens)).
	EXPECT_EQ(5, steps_before_stop_tokens[0]);

	// Batch item 1: stop token found at step 6, the current step is 6. So the
	// steps before stop token is 1 = (6 - 6 + 1(# stop tokens)).
	EXPECT_EQ(1, steps_before_stop_tokens[1]);
	}

	TEST(StopTokenDetectorTest, ResetBatch) {
	StopTokenDetector detector(1);
	EXPECT_OK(detector.AddStopTokenSequence({1}));
	std::vector<int> tokens1 = {0, 2, 3, 1, 5};
	size_t i;
	for (i = 0; i < tokens1.size(); ++i) {
	std::vector<int> current_batch_tokens = {tokens1[i]};
	EXPECT_TRUE(
	detector.ProcessTokens(absl::MakeSpan(current_batch_tokens)).ok());
	if (detector.AllDone().value()) {
	break;
	}
	}
	EXPECT_EQ(i, 3);
	detector.ResetBatch();
	// Batch is not done after reset.
	EXPECT_FALSE(detector.AllDone().value());
	EXPECT_EQ(0, detector.GetStepsBeforeStopTokens()[0]);
	}

	} // namespace
	} // namespace litert::lm