Spaces:

amiraghhh
/

rag

Build error

amiraghhh committed on Jan 1

Commit

ab46c35

verified ·

1 Parent(s): b30f331

Update utils.py

Files changed (1) hide show

utils.py CHANGED Viewed

@@ -133,41 +133,3 @@ A: Information unavailable."""
     full_prompt = f"{instruction_text}{the_context_block}{query_footer}"
     return full_prompt
-def normalize_text(text):
-    """Normalize text for duplicate detection by removing spaces and punctuation.
-    Returns: str"""
-    if not isinstance(text, str):
-        return ""
-    text = text.lower()  # Lowercase
-    text = re.sub(r'\s+', ' ', text)  # Remove extra whitespace
-    text = text.strip()  # Remove leading/trailing spaces
-    text = re.sub(r'[^\w\s]', '', text)  # Remove punctuation
-    return text
-def chunk_text(text, chunk_size=384, chunk_overlap=20):
-    """Split text into chunks for embeddings.
-    Returns: list(chunks)"""
-    splitter = RecursiveCharacterTextSplitter(
-        separators=["\n\n", "\n", " ", ""],
-        chunk_size=chunk_size,
-        chunk_overlap=chunk_overlap
-    )
-    return splitter.split_text(text)
-def create_embeddings(texts):
-    """Create embeddings for a list of texts.
-    Returns: list(embeddings)"""
-    embed_model = get_embed_model()
-    return embed_model.encode(
-        texts,
-        batch_size=64,
-        show_progress_bar=False,
-        convert_to_numpy=True,
-        normalize_embeddings=True
-    )


133	full_prompt = f"{instruction_text}{the_context_block}{query_footer}"
134
135	return full_prompt