GraphGen / graphgen /models /evaluator /qa /length_evaluator.py
github-actions[bot]
Auto-sync from demo at Fri Dec 26 08:29:01 UTC 2025
7566ac3
import os
from graphgen.bases import BaseEvaluator, QAPair
from graphgen.models.tokenizer import Tokenizer
class LengthEvaluator(BaseEvaluator):
def __init__(self, tokenizer_name: str = None):
tokenizer_model = tokenizer_name or os.environ.get("TOKENIZER_MODEL", "cl100k_base")
self.tokenizer: Tokenizer = Tokenizer(tokenizer_model)
def evaluate(self, pair: QAPair) -> float:
"""
Evaluate the length of the qa pair.
"""
content = pair.question + pair.answer
tokens = self.tokenizer.encode(content)
return len(tokens)