Spaces:

amaherovskyi
/

Financial_RAG

Sleeping

App Files Community

amaherovskyi committed on Dec 15, 2025

Commit

a4bfffb

verified ·

1 Parent(s): 5b933aa

Update pipeline.py

Browse files

Files changed (1) hide show

pipeline.py +1 -12

pipeline.py CHANGED Viewed

@@ -1,4 +1,3 @@
-# pipeline.py
 import os
 import logging
 from typing import List, Dict
@@ -21,9 +20,7 @@ console_handler.setFormatter(formatter)
 logger.addHandler(console_handler)
-# ---------------------------
 # Initialization
-# ---------------------------
 def init_reranker(model_name: str = "cross-encoder/ms-marco-MiniLM-L-6-v2") -> CrossEncoder:
     """Initialize CrossEncoder for document reordering."""
     logger.info(f"CrossEncoder initialization: {model_name}")
@@ -39,9 +36,7 @@ def init_groq(api_key: str = None) -> Groq:
     return client
-# ---------------------------
 # Reranking
-# ---------------------------
 def rerank(query: str, docs: List[Dict], reranker: CrossEncoder, top_k: int = 5) -> List[Dict]:
     """Reranking documents using CrossEncoder based on a query."""
     if not docs:
@@ -57,9 +52,7 @@ def rerank(query: str, docs: List[Dict], reranker: CrossEncoder, top_k: int = 5)
     return ranked[:top_k]
-# ---------------------------
 # LLM answering
-# ---------------------------
 def llm_answer(query: str, context: List[Dict], client: Groq) -> str:
     """Forming an LLM response based on the provided document context."""
     context_text = "\n\n---\n\n".join(f"[{d['id']}] {d['text']}" for d in context)
@@ -84,9 +77,7 @@ Answer only using information from the context. If answer not found, say "I don'
     return completion.choices[0].message.content
-# ---------------------------
-# Retrieve documents (fixed!)
-# ---------------------------
 def retrieve_documents(
     query: str,
     documents: list,
@@ -123,9 +114,7 @@ def retrieve_documents(
     return docs
-# ---------------------------
 # Full RAG Pipeline
-# ---------------------------
 def rag_pipeline(
     query: str,
     reranker_model: CrossEncoder,

 import os
 import logging
 from typing import List, Dict
 logger.addHandler(console_handler)
 # Initialization
 def init_reranker(model_name: str = "cross-encoder/ms-marco-MiniLM-L-6-v2") -> CrossEncoder:
     """Initialize CrossEncoder for document reordering."""
     logger.info(f"CrossEncoder initialization: {model_name}")
     return client
 # Reranking
 def rerank(query: str, docs: List[Dict], reranker: CrossEncoder, top_k: int = 5) -> List[Dict]:
     """Reranking documents using CrossEncoder based on a query."""
     if not docs:
     return ranked[:top_k]
 # LLM answering
 def llm_answer(query: str, context: List[Dict], client: Groq) -> str:
     """Forming an LLM response based on the provided document context."""
     context_text = "\n\n---\n\n".join(f"[{d['id']}] {d['text']}" for d in context)
     return completion.choices[0].message.content
+# Retrieve documents
 def retrieve_documents(
     query: str,
     documents: list,
     return docs
 # Full RAG Pipeline
 def rag_pipeline(
     query: str,
     reranker_model: CrossEncoder,