coding-llm-space / src /relevancy.py
girish00's picture
Upload folder using huggingface_hub
07a91a1 verified
raw
history blame contribute delete
649 Bytes
"""Lightweight relevancy scoring without heavy embedding backends."""
from __future__ import annotations
from sklearn.feature_extraction.text import TfidfVectorizer
from sklearn.metrics.pairwise import cosine_similarity
class RelevancyScorer:
    """Scores lexical overlap between a request and the generated code.

    The score is the cosine similarity of the TF-IDF vectors (unigrams and
    bigrams) of the two texts. This measures shared terms rather than
    meaning: two texts with no tokens in common score 0.0 even if they are
    paraphrases of each other.
    """

    def __init__(self):
        """Create the TF-IDF vectorizer used by :meth:`score`."""
        self.vectorizer = TfidfVectorizer(ngram_range=(1, 2), min_df=1)

    def score(self, query_text: str, generated_text: str) -> float:
        """Return the TF-IDF cosine similarity of the two texts.

        The vectorizer is refit on every call, so the vocabulary and IDF
        weights are derived from these two texts only.

        Args:
            query_text: The request text.
            generated_text: The generated text to compare against it.

        Returns:
            A float in ``[0.0, 1.0]``. ``0.0`` is returned when either text
            is blank or when neither text yields any token.
        """
        # A blank text has nothing to match against; answer directly rather
        # than letting the vectorizer fail on an all-blank corpus.
        if not query_text.strip() or not generated_text.strip():
            return 0.0

        try:
            matrix = self.vectorizer.fit_transform([query_text, generated_text])
        except ValueError as err:
            # Non-blank input can still produce no tokens (e.g. only
            # single-character words or punctuation); the vectorizer reports
            # that as an "empty vocabulary" ValueError. Anything else is a
            # genuine error and must propagate.
            if "empty vocabulary" not in str(err):
                raise
            return 0.0

        similarity = float(cosine_similarity(matrix[0], matrix[1])[0][0])
        # TF-IDF weights are non-negative, so the true value lies in [0, 1];
        # clamp away floating-point drift such as 1.0000000000000002.
        return min(1.0, max(0.0, similarity))