Spaces:

Arif-Badhon
/

Generative_AI_Project

Sleeping

App Files Files Community

Arif committed on Oct 24, 2025

Commit

704b133

1 Parent(s): 92ab414

Demo data added for query test

Browse files

Files changed (11) hide show

app/core/llm.py +35 -41
app/core/vector_store.py +24 -17
app/models/schemas.py +0 -4
app/services/document_processor.py +0 -1
data/documents/ai_basics.txt +1 -0
data/documents/ml_concepts.txt +11 -0
data/documents/rag_explanation.txt +16 -0
main.py +141 -3
pyproject.toml +1 -0
scripts/demo_queries.py +56 -0
uv.lock +43 -31

app/core/llm.py CHANGED Viewed

@@ -1,22 +1,15 @@
-from langchain_ollama import ChatOllama
-try:
-    from langchain.prompts import PromptTemplate
-except ImportError:
-    from langchain_core.prompts import PromptTemplate
-from langchain_core.output_parsers import StrOutputParser
 class OllamaLLM:
     def __init__(self, base_url: str, model: str):
-        self.llm = ChatOllama(
-            base_url=base_url,
-            model=model,
-            temperature=0.2,  # Lower for more factual responses
-        )
-        # RAG-specific prompt template
-        self.prompt_template = PromptTemplate(
-            template="""You are a helpful AI assistant. Use the following context to answer the question accurately and concisely.
 Context:
 {context}
@@ -29,30 +22,31 @@ Instructions:
 - Keep your answer clear and concise (max 3-5 sentences)
 - Cite specific parts of the context when relevant
-Answer:""",
-            input_variables=["context", "question"]
-        )
-        self.chain = self.prompt_template | self.llm | StrOutputParser()
-    def generate(self, question: str, context: str) -> str:
-        """Generate answer using RAG context"""
-        return self.chain.invoke({
-            "question": question,
-            "context": context
-        })
-async def generate_stream(self, question: str, context: str):
-    """Stream LLM responses"""
-    async for chunk in self.chain.astream({
-        "question": question,
-        "context": context
-    }):
-        yield chunk
-from langchain.memory import ConversationBufferMemory
-class ConversationalRAG:
-    def __init__(self, rag_chain):
-        self.rag_chain = rag_chain
-        self.memory = ConversationBufferMemory()

+import requests
+import json
+from typing import Dict
 class OllamaLLM:
     def __init__(self, base_url: str, model: str):
+        self.base_url = base_url.rstrip('/')
+        self.model = model
+    def generate(self, question: str, context: str) -> str:
+        """Generate answer using RAG context"""
+        prompt = f"""You are a helpful AI assistant. Use the following context to answer the question accurately and concisely.
 Context:
 {context}
 - Keep your answer clear and concise (max 3-5 sentences)
 - Cite specific parts of the context when relevant
+Answer:"""
+        try:
+            response = requests.post(
+                f"{self.base_url}/api/generate",
+                json={
+                    "model": self.model,
+                    "prompt": prompt,
+                    "stream": False,
+                    "options": {
+                        "temperature": 0.2,
+                        "top_p": 0.9,
+                        "top_k": 40
+                    }
+                },
+                timeout=60
+            )
+            if response.status_code == 200:
+                result = response.json()
+                return result.get("response", "Error generating response")
+            else:
+                return f"Error: Ollama returned status {response.status_code}"
+        except requests.exceptions.RequestException as e:
+            return f"Error connecting to Ollama: {str(e)}"
+        except Exception as e:
+            return f"Unexpected error: {str(e)}"

app/core/vector_store.py CHANGED Viewed

@@ -12,17 +12,20 @@ class VectorStore:
     def _ensure_collection(self):
         """Create collection if it doesn't exist"""
-        collections = self.client.get_collections().collections
-        collection_names = [col.name for col in collections]
-        if self.collection_name not in collection_names:
-            self.client.create_collection(
-                collection_name=self.collection_name,
-                vectors_config=VectorParams(
-                    size=self.vector_size,
-                    distance=Distance.COSINE
                 )
-            )
     def add_documents(self, texts: List[str], embeddings: List[List[float]],
                      metadata: List[Dict] = None):
@@ -50,10 +53,14 @@ class VectorStore:
     def search(self, query_embedding: List[float], limit: int = 5,
               score_threshold: float = 0.7):
         """Search for similar documents"""
-        results = self.client.search(
-            collection_name=self.collection_name,
-            query_vector=query_embedding,
-            limit=limit,
-            score_threshold=score_threshold
-        )
-        return results

     def _ensure_collection(self):
         """Create collection if it doesn't exist"""
+        try:
+            collections = self.client.get_collections().collections
+            collection_names = [col.name for col in collections]
+            if self.collection_name not in collection_names:
+                self.client.create_collection(
+                    collection_name=self.collection_name,
+                    vectors_config=VectorParams(
+                        size=self.vector_size,
+                        distance=Distance.COSINE
+                    )
                 )
+        except Exception as e:
+            print(f"Warning: Could not connect to Qdrant: {e}")
     def add_documents(self, texts: List[str], embeddings: List[List[float]],
                      metadata: List[Dict] = None):
     def search(self, query_embedding: List[float], limit: int = 5,
               score_threshold: float = 0.7):
         """Search for similar documents"""
+        try:
+            results = self.client.search(
+                collection_name=self.collection_name,
+                query_vector=query_embedding,
+                limit=limit,
+                score_threshold=score_threshold
+            )
+            return results
+        except Exception as e:
+            print(f"Search error: {e}")
+            return []

app/models/schemas.py CHANGED Viewed

@@ -1,10 +1,6 @@
 from pydantic import BaseModel
 from typing import List, Optional
-class DocumentUpload(BaseModel):
-    filename: str
-    content: str
 class QueryRequest(BaseModel):
     question: str
     top_k: Optional[int] = 5

 from pydantic import BaseModel
 from typing import List, Optional
 class QueryRequest(BaseModel):
     question: str
     top_k: Optional[int] = 5

app/services/document_processor.py CHANGED Viewed

@@ -4,7 +4,6 @@ import pypdf
 from docx import Document
 from langchain_text_splitters import RecursiveCharacterTextSplitter
 class DocumentProcessor:
     def __init__(self, chunk_size: int = 500, chunk_overlap: int = 50):
         self.text_splitter = RecursiveCharacterTextSplitter(

 from docx import Document
 from langchain_text_splitters import RecursiveCharacterTextSplitter
 class DocumentProcessor:
     def __init__(self, chunk_size: int = 500, chunk_overlap: int = 50):
         self.text_splitter = RecursiveCharacterTextSplitter(

data/documents/ai_basics.txt ADDED Viewed

	@@ -0,0 +1 @@


1	+ Artificial Intelligence is transforming the world. Machine learning enables computers to learn from data. Deep learning uses neural networks with multiple layers. Natural language processing helps computers understand human language. Computer vision allows machines to interpret visual information.

data/documents/ml_concepts.txt ADDED Viewed

	@@ -0,0 +1,11 @@

+Machine Learning Fundamentals
+Supervised Learning: Training models with labeled data. Examples include classification and regression tasks.
+Unsupervised Learning: Finding patterns in unlabeled data. Clustering and dimensionality reduction are common techniques.
+Reinforcement Learning: Learning through trial and error with rewards and penalties. Used in robotics and game playing.
+Feature Engineering: The process of selecting and transforming variables to improve model performance.
+Model Evaluation: Using metrics like accuracy, precision, recall, and F1-score to assess model quality.

data/documents/rag_explanation.txt ADDED Viewed

	@@ -0,0 +1,16 @@

+Retrieval-Augmented Generation (RAG) System
+RAG combines retrieval and generation to create more accurate AI responses.
+The process works in three steps:
+1. Document Ingestion: Documents are split into chunks and converted to vector embeddings
+2. Retrieval: When a query comes in, relevant chunks are found using similarity search
+3. Generation: The LLM uses retrieved context to generate accurate, grounded answers
+Benefits of RAG:
+- Reduces hallucinations by grounding responses in actual documents
+- Enables knowledge updates without retraining models
+- Provides source citations for transparency
+- Works with private, domain-specific data
+RAG is ideal for enterprise knowledge bases, customer support, and research applications.

main.py CHANGED Viewed

@@ -1,6 +1,144 @@
-def main():
-    print("Hello from generative-ai-portfolio-project!")
 if __name__ == "__main__":
-    main()

+from fastapi import FastAPI, UploadFile, File, HTTPException
+from fastapi.middleware.cors import CORSMiddleware
+from app.config import get_settings
+from app.core.embeddings import EmbeddingGenerator
+from app.core.vector_store import VectorStore
+from app.core.llm import OllamaLLM
+from app.services.document_processor import DocumentProcessor
+from app.services.rag_chain import RAGChain
+from app.models.schemas import QueryRequest, QueryResponse, IngestResponse
+import tempfile
+import os
+# Initialize FastAPI app
+app = FastAPI(
+    title="RAG Portfolio Project",
+    description="Production-grade Retrieval-Augmented Generation system",
+    version="1.0.0"
+)
+# Add CORS middleware
+# NOTE(review): wildcard origins combined with allow_credentials=True is
+# very permissive - confirm whether credentialed cross-origin requests are
+# actually needed before deploying this publicly.
+app.add_middleware(
+    CORSMiddleware,
+    allow_origins=["*"],
+    allow_credentials=True,
+    allow_methods=["*"],
+    allow_headers=["*"],
+)
+# Initialize components
+# Everything below runs at import time; the settings object is also read
+# later by the /reset endpoint and the __main__ guard.
+settings = get_settings()
+try:
+    embedding_generator = EmbeddingGenerator(settings.embedding_model)
+    # The vector size is taken from the embedding generator's dimension.
+    vector_store = VectorStore(
+        host=settings.qdrant_host,
+        port=settings.qdrant_port,
+        collection_name=settings.qdrant_collection_name,
+        vector_size=embedding_generator.dimension
+    )
+    llm = OllamaLLM(settings.ollama_base_url, settings.ollama_model)
+    document_processor = DocumentProcessor()
+    rag_chain = RAGChain(embedding_generator, vector_store, llm)
+    print("✅ All components initialized successfully!")
+except Exception as e:
+    print(f"❌ Error initializing components: {e}")
+    # Fall back to None for every component so the module still imports;
+    # the endpoints check for this and answer 503 instead.
+    embedding_generator = None
+    vector_store = None
+    llm = None
+    document_processor = None
+    rag_chain = None
+@app.get("/")
+async def root():
+    return {
+        "message": "RAG Portfolio Project API",
+        "status": "running",
+        "docs": "/docs"
+    }
+@app.get("/health")
+async def health_check():
+    # Check if services are running
+    ollama_status = True
+    qdrant_status = True
+    try:
+        if llm:
+            # Test Ollama connection
+            test_response = llm.generate("test", "test context")
+            ollama_status = "Error" not in test_response
+    except:
+        ollama_status = False
+    try:
+        if vector_store:
+            # Test Qdrant connection
+            vector_store.client.get_collections()
+    except:
+        qdrant_status = False
+    return {
+        "status": "healthy" if (ollama_status and qdrant_status) else "degraded",
+        "ollama_connected": ollama_status,
+        "qdrant_connected": qdrant_status
+    }
+@app.post("/ingest/file", response_model=IngestResponse)
+async def ingest_file(file: UploadFile = File(...)):
+    """Upload and ingest a document into the RAG system"""
+    if not rag_chain:
+        raise HTTPException(status_code=503, detail="RAG system not initialized")
+    try:
+        # Save uploaded file temporarily
+        with tempfile.NamedTemporaryFile(delete=False, suffix=file.filename) as tmp:
+            content = await file.read()
+            tmp.write(content)
+            tmp_path = tmp.name
+        # Process document
+        chunks = document_processor.process_document(tmp_path)
+        # Ingest into RAG system
+        result = rag_chain.ingest_documents(chunks)
+        # Clean up
+        os.unlink(tmp_path)
+        return IngestResponse(**result, message=f"Successfully ingested {file.filename}")
+    except Exception as e:
+        raise HTTPException(status_code=500, detail=str(e))
+@app.post("/query", response_model=QueryResponse)
+async def query(request: QueryRequest):
+    """Query the RAG system"""
+    if not rag_chain:
+        raise HTTPException(status_code=503, detail="RAG system not initialized")
+    try:
+        result = rag_chain.query(request.question, request.top_k)
+        return QueryResponse(**result)
+    except Exception as e:
+        raise HTTPException(status_code=500, detail=str(e))
+@app.delete("/reset")
+async def reset_collection():
+    """Reset the vector collection (delete all documents)"""
+    if not vector_store:
+        raise HTTPException(status_code=503, detail="Vector store not initialized")
+    try:
+        vector_store.client.delete_collection(settings.qdrant_collection_name)
+        vector_store._ensure_collection()
+        return {"status": "success", "message": "Collection reset successfully"}
+    except Exception as e:
+        raise HTTPException(status_code=500, detail=str(e))
 if __name__ == "__main__":
+    # uvicorn is imported only when this module is executed directly.
+    import uvicorn
+    # Host and port come from the settings object loaded at import time.
+    uvicorn.run(app, host=settings.app_host, port=settings.app_port)

pyproject.toml CHANGED Viewed

@@ -16,6 +16,7 @@ dependencies = [
     "qdrant-client>=1.15.1",
     "ragas>=0.3.7",
     "rank-bm25>=0.2.2",
     "sentence-transformers>=5.1.2",
     "unstructured>=0.18.15",
     "uvicorn>=0.38.0",

     "qdrant-client>=1.15.1",
     "ragas>=0.3.7",
     "rank-bm25>=0.2.2",
+    "requests>=2.32.5",
     "sentence-transformers>=5.1.2",
     "unstructured>=0.18.15",
     "uvicorn>=0.38.0",

scripts/demo_queries.py ADDED Viewed

	@@ -0,0 +1,56 @@

+import requests
+import json
+from typing import Dict
+BASE_URL = "http://localhost:8000"
+def query_rag(question: str, top_k: int = 5) -> Dict:
+    """Query the RAG system"""
+    response = requests.post(
+        f"{BASE_URL}/query",
+        json={"question": question, "top_k": top_k}
+    )
+    return response.json()
+def print_result(question: str, result: Dict):
+    """Pretty print query results"""
+    print("\n" + "="*80)
+    print(f"❓ QUESTION: {question}")
+    print("="*80)
+    print(f"\n💡 ANSWER:\n{result['answer']}\n")
+    print(f"📚 SOURCES ({result['context_used']} chunks used):")
+    for idx, source in enumerate(result['sources'], 1):
+        print(f"  {idx}. {source['source']} (chunk {source['chunk_index']}, score: {source['score']:.3f})")
+    print("="*80)
+def main():
+    """Run demo queries"""
+    demo_queries = [
+        "What is deep learning and how does it work?",
+        "Explain the RAG process in simple terms",
+        "What are the benefits of using RAG systems?",
+        "What is supervised learning?",
+        "How does reinforcement learning work?",
+    ]
+    print("\n🚀 RAG SYSTEM DEMO")
+    print("="*80)
+    # Check health first
+    health = requests.get(f"{BASE_URL}/health").json()
+    print(f"\n✅ System Status: {health['status']}")
+    print(f"   Ollama: {'✓' if health['ollama_connected'] else '✗'}")
+    print(f"   Qdrant: {'✓' if health['qdrant_connected'] else '✗'}")
+    # Run queries
+    for question in demo_queries:
+        try:
+            result = query_rag(question)
+            print_result(question, result)
+        except Exception as e:
+            print(f"\n❌ Error: {e}")
+    print("\n✨ Demo complete!")
+if __name__ == "__main__":
+    main()

uv.lock CHANGED Viewed

@@ -159,6 +159,15 @@ wheels = [
     { url = "https://files.pythonhosted.org/packages/fb/76/641ae371508676492379f16e2fa48f4e2c11741bd63c48be4b12a6b09cba/aiosignal-1.4.0-py3-none-any.whl", hash = "sha256:053243f8b92b990551949e63930a839ff0cf0b0ebbe0597b0f3fb19e1a0fe82e", size = 7490, upload-time = "2025-07-03T22:54:42.156Z" },
 ]
 [[package]]
 name = "annotated-types"
 version = "0.7.0"
@@ -548,7 +557,7 @@ wheels = [
 [[package]]
 name = "datasets"
-version = "4.2.0"
 source = { registry = "https://pypi.org/simple" }
 dependencies = [
     { name = "dill" },
@@ -567,9 +576,9 @@ dependencies = [
     { name = "tqdm" },
     { name = "xxhash" },
 ]
-sdist = { url = "https://files.pythonhosted.org/packages/70/48/0186fbc4b86a4f9ecaf04eb01e877e78b53bfa0b03be9c84b2298431ba33/datasets-4.2.0.tar.gz", hash = "sha256:8333a7db9f3bb8044c1b819a35d4e3e2809596c837793b0921382efffdc36e78", size = 582256, upload-time = "2025-10-09T16:10:15.534Z" }
 wheels = [
-    { url = "https://files.pythonhosted.org/packages/91/9e/0bbbd09b116fd8ee2d3617e28e6598551d2f0f24d3a2ce99cc87ec85aeb0/datasets-4.2.0-py3-none-any.whl", hash = "sha256:fdc43aaf4a73b31f64f80f72f195ab413a1141ed15555d675b2fd17926f8b026", size = 506316, upload-time = "2025-10-09T16:10:13.375Z" },
 ]
 [[package]]
@@ -631,16 +640,17 @@ wheels = [
 [[package]]
 name = "fastapi"
-version = "0.119.1"
 source = { registry = "https://pypi.org/simple" }
 dependencies = [
     { name = "pydantic" },
     { name = "starlette" },
     { name = "typing-extensions" },
 ]
-sdist = { url = "https://files.pythonhosted.org/packages/a6/f4/152127681182e6413e7a89684c434e19e7414ed7ac0c632999c3c6980640/fastapi-0.119.1.tar.gz", hash = "sha256:a5e3426edce3fe221af4e1992c6d79011b247e3b03cc57999d697fe76cbf8ae0", size = 338616, upload-time = "2025-10-20T11:30:27.734Z" }
 wheels = [
-    { url = "https://files.pythonhosted.org/packages/b1/26/e6d959b4ac959fdb3e9c4154656fc160794db6af8e64673d52759456bf07/fastapi-0.119.1-py3-none-any.whl", hash = "sha256:0b8c2a2cce853216e150e9bd4faaed88227f8eb37de21cb200771f491586a27f", size = 108123, upload-time = "2025-10-20T11:30:26.185Z" },
 ]
 [[package]]
@@ -812,6 +822,7 @@ dependencies = [
     { name = "qdrant-client" },
     { name = "ragas" },
     { name = "rank-bm25" },
     { name = "sentence-transformers" },
     { name = "unstructured" },
     { name = "uvicorn" },
@@ -837,6 +848,7 @@ requires-dist = [
     { name = "qdrant-client", specifier = ">=1.15.1" },
     { name = "ragas", specifier = ">=0.3.7" },
     { name = "rank-bm25", specifier = ">=0.2.2" },
     { name = "sentence-transformers", specifier = ">=5.1.2" },
     { name = "unstructured", specifier = ">=0.18.15" },
     { name = "uvicorn", specifier = ">=0.38.0" },
@@ -1450,7 +1462,7 @@ wheels = [
 [[package]]
 name = "langsmith"
-version = "0.4.37"
 source = { registry = "https://pypi.org/simple" }
 dependencies = [
     { name = "httpx" },
@@ -1461,9 +1473,9 @@ dependencies = [
     { name = "requests-toolbelt" },
     { name = "zstandard" },
 ]
-sdist = { url = "https://files.pythonhosted.org/packages/09/51/58d561dd40ec564509724f0a6a7148aa8090143208ef5d06b73b7fc90d31/langsmith-0.4.37.tar.gz", hash = "sha256:d9a0eb6dd93f89843ac982c9f92be93cf2bcabbe19957f362c547766c7366c71", size = 959089, upload-time = "2025-10-15T22:33:59.465Z" }
 wheels = [
-    { url = "https://files.pythonhosted.org/packages/14/e8/edff4de49cf364eb9ee88d13da0a555844df32438413bf53d90d507b97cd/langsmith-0.4.37-py3-none-any.whl", hash = "sha256:e34a94ce7277646299e4703a0f6e2d2c43647a28e8b800bb7ef82fd87a0ec766", size = 396111, upload-time = "2025-10-15T22:33:57.392Z" },
 ]
 [[package]]
@@ -3469,28 +3481,28 @@ wheels = [
 [[package]]
 name = "ruff"
-version = "0.14.1"
-source = { registry = "https://pypi.org/simple" }
-sdist = { url = "https://files.pythonhosted.org/packages/9e/58/6ca66896635352812de66f71cdf9ff86b3a4f79071ca5730088c0cd0fc8d/ruff-0.14.1.tar.gz", hash = "sha256:1dd86253060c4772867c61791588627320abcb6ed1577a90ef432ee319729b69", size = 5513429, upload-time = "2025-10-16T18:05:41.766Z" }
-wheels = [
-    { url = "https://files.pythonhosted.org/packages/8d/39/9cc5ab181478d7a18adc1c1e051a84ee02bec94eb9bdfd35643d7c74ca31/ruff-0.14.1-py3-none-linux_armv6l.whl", hash = "sha256:083bfc1f30f4a391ae09c6f4f99d83074416b471775b59288956f5bc18e82f8b", size = 12445415, upload-time = "2025-10-16T18:04:48.227Z" },
-    { url = "https://files.pythonhosted.org/packages/ef/2e/1226961855ccd697255988f5a2474890ac7c5863b080b15bd038df820818/ruff-0.14.1-py3-none-macosx_10_12_x86_64.whl", hash = "sha256:f6fa757cd717f791009f7669fefb09121cc5f7d9bd0ef211371fad68c2b8b224", size = 12784267, upload-time = "2025-10-16T18:04:52.515Z" },
-    { url = "https://files.pythonhosted.org/packages/c1/ea/fd9e95863124ed159cd0667ec98449ae461de94acda7101f1acb6066da00/ruff-0.14.1-py3-none-macosx_11_0_arm64.whl", hash = "sha256:d6191903d39ac156921398e9c86b7354d15e3c93772e7dbf26c9fcae59ceccd5", size = 11781872, upload-time = "2025-10-16T18:04:55.396Z" },
-    { url = "https://files.pythonhosted.org/packages/1e/5a/e890f7338ff537dba4589a5e02c51baa63020acfb7c8cbbaea4831562c96/ruff-0.14.1-py3-none-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:ed04f0e04f7a4587244e5c9d7df50e6b5bf2705d75059f409a6421c593a35896", size = 12226558, upload-time = "2025-10-16T18:04:58.166Z" },
-    { url = "https://files.pythonhosted.org/packages/a6/7a/8ab5c3377f5bf31e167b73651841217542bcc7aa1c19e83030835cc25204/ruff-0.14.1-py3-none-manylinux_2_17_armv7l.manylinux2014_armv7l.whl", hash = "sha256:5c9e6cf6cd4acae0febbce29497accd3632fe2025c0c583c8b87e8dbdeae5f61", size = 12187898, upload-time = "2025-10-16T18:05:01.455Z" },
-    { url = "https://files.pythonhosted.org/packages/48/8d/ba7c33aa55406955fc124e62c8259791c3d42e3075a71710fdff9375134f/ruff-0.14.1-py3-none-manylinux_2_17_i686.manylinux2014_i686.whl", hash = "sha256:a6fa2458527794ecdfbe45f654e42c61f2503a230545a91af839653a0a93dbc6", size = 12939168, upload-time = "2025-10-16T18:05:04.397Z" },
-    { url = "https://files.pythonhosted.org/packages/b4/c2/70783f612b50f66d083380e68cbd1696739d88e9b4f6164230375532c637/ruff-0.14.1-py3-none-manylinux_2_17_ppc64.manylinux2014_ppc64.whl", hash = "sha256:39f1c392244e338b21d42ab29b8a6392a722c5090032eb49bb4d6defcdb34345", size = 14386942, upload-time = "2025-10-16T18:05:07.102Z" },
-    { url = "https://files.pythonhosted.org/packages/48/44/cd7abb9c776b66d332119d67f96acf15830d120f5b884598a36d9d3f4d83/ruff-0.14.1-py3-none-manylinux_2_17_ppc64le.manylinux2014_ppc64le.whl", hash = "sha256:7382fa12a26cce1f95070ce450946bec357727aaa428983036362579eadcc5cf", size = 13990622, upload-time = "2025-10-16T18:05:09.882Z" },
-    { url = "https://files.pythonhosted.org/packages/eb/56/4259b696db12ac152fe472764b4f78bbdd9b477afd9bc3a6d53c01300b37/ruff-0.14.1-py3-none-manylinux_2_17_s390x.manylinux2014_s390x.whl", hash = "sha256:dd0bf2be3ae8521e1093a487c4aa3b455882f139787770698530d28ed3fbb37c", size = 13431143, upload-time = "2025-10-16T18:05:13.46Z" },
-    { url = "https://files.pythonhosted.org/packages/e0/35/266a80d0eb97bd224b3265b9437bd89dde0dcf4faf299db1212e81824e7e/ruff-0.14.1-py3-none-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:cabcaa9ccf8089fb4fdb78d17cc0e28241520f50f4c2e88cb6261ed083d85151", size = 13132844, upload-time = "2025-10-16T18:05:16.1Z" },
-    { url = "https://files.pythonhosted.org/packages/65/6e/d31ce218acc11a8d91ef208e002a31acf315061a85132f94f3df7a252b18/ruff-0.14.1-py3-none-manylinux_2_31_riscv64.whl", hash = "sha256:747d583400f6125ec11a4c14d1c8474bf75d8b419ad22a111a537ec1a952d192", size = 13401241, upload-time = "2025-10-16T18:05:19.395Z" },
-    { url = "https://files.pythonhosted.org/packages/9f/b5/dbc4221bf0b03774b3b2f0d47f39e848d30664157c15b965a14d890637d2/ruff-0.14.1-py3-none-musllinux_1_2_aarch64.whl", hash = "sha256:5a6e74c0efd78515a1d13acbfe6c90f0f5bd822aa56b4a6d43a9ffb2ae6e56cd", size = 12132476, upload-time = "2025-10-16T18:05:22.163Z" },
-    { url = "https://files.pythonhosted.org/packages/98/4b/ac99194e790ccd092d6a8b5f341f34b6e597d698e3077c032c502d75ea84/ruff-0.14.1-py3-none-musllinux_1_2_armv7l.whl", hash = "sha256:0ea6a864d2fb41a4b6d5b456ed164302a0d96f4daac630aeba829abfb059d020", size = 12139749, upload-time = "2025-10-16T18:05:25.162Z" },
-    { url = "https://files.pythonhosted.org/packages/47/26/7df917462c3bb5004e6fdfcc505a49e90bcd8a34c54a051953118c00b53a/ruff-0.14.1-py3-none-musllinux_1_2_i686.whl", hash = "sha256:0826b8764f94229604fa255918d1cc45e583e38c21c203248b0bfc9a0e930be5", size = 12544758, upload-time = "2025-10-16T18:05:28.018Z" },
-    { url = "https://files.pythonhosted.org/packages/64/d0/81e7f0648e9764ad9b51dd4be5e5dac3fcfff9602428ccbae288a39c2c22/ruff-0.14.1-py3-none-musllinux_1_2_x86_64.whl", hash = "sha256:cbc52160465913a1a3f424c81c62ac8096b6a491468e7d872cb9444a860bc33d", size = 13221811, upload-time = "2025-10-16T18:05:30.707Z" },
-    { url = "https://files.pythonhosted.org/packages/c3/07/3c45562c67933cc35f6d5df4ca77dabbcd88fddaca0d6b8371693d29fd56/ruff-0.14.1-py3-none-win32.whl", hash = "sha256:e037ea374aaaff4103240ae79168c0945ae3d5ae8db190603de3b4012bd1def6", size = 12319467, upload-time = "2025-10-16T18:05:33.261Z" },
-    { url = "https://files.pythonhosted.org/packages/02/88/0ee4ca507d4aa05f67e292d2e5eb0b3e358fbcfe527554a2eda9ac422d6b/ruff-0.14.1-py3-none-win_amd64.whl", hash = "sha256:59d599cdff9c7f925a017f6f2c256c908b094e55967f93f2821b1439928746a1", size = 13401123, upload-time = "2025-10-16T18:05:35.984Z" },
-    { url = "https://files.pythonhosted.org/packages/b8/81/4b6387be7014858d924b843530e1b2a8e531846807516e9bea2ee0936bf7/ruff-0.14.1-py3-none-win_arm64.whl", hash = "sha256:e3b443c4c9f16ae850906b8d0a707b2a4c16f8d2f0a7fe65c475c5886665ce44", size = 12436636, upload-time = "2025-10-16T18:05:38.995Z" },
 ]
 [[package]]

     { url = "https://files.pythonhosted.org/packages/fb/76/641ae371508676492379f16e2fa48f4e2c11741bd63c48be4b12a6b09cba/aiosignal-1.4.0-py3-none-any.whl", hash = "sha256:053243f8b92b990551949e63930a839ff0cf0b0ebbe0597b0f3fb19e1a0fe82e", size = 7490, upload-time = "2025-07-03T22:54:42.156Z" },
 ]
+[[package]]
+name = "annotated-doc"
+version = "0.0.2"
+source = { registry = "https://pypi.org/simple" }
+sdist = { url = "https://files.pythonhosted.org/packages/c4/92/2974dba489541ed4af531d00a4df075bc3a455557d3b54fd6932c51c95cc/annotated_doc-0.0.2.tar.gz", hash = "sha256:f25664061aee278227abfaec5aeb398298be579b934758c16205d48e896e149c", size = 4452, upload-time = "2025-10-22T18:38:52.597Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/bd/ee/cc5109cdd46a6ccd3d923db3c5425383abe51b5c033647aad1b5e2452e82/annotated_doc-0.0.2-py3-none-any.whl", hash = "sha256:2188cb99e353fcb5c20f23b8bc6f5fa7c924b213fac733d4b44883f9edffa090", size = 4056, upload-time = "2025-10-22T18:38:51.24Z" },
+]
 [[package]]
 name = "annotated-types"
 version = "0.7.0"
 [[package]]
 name = "datasets"
+version = "4.3.0"
 source = { registry = "https://pypi.org/simple" }
 dependencies = [
     { name = "dill" },
     { name = "tqdm" },
     { name = "xxhash" },
 ]
+sdist = { url = "https://files.pythonhosted.org/packages/2a/47/325206ac160f7699ed9f1798afa8f8f8d5189b03bf3815654859ac1d5cba/datasets-4.3.0.tar.gz", hash = "sha256:bc9118ed9afd92346c5be7ed3aaa00177eb907c25467f9d072a0d22777efbd2b", size = 582801, upload-time = "2025-10-23T16:31:51.547Z" }
 wheels = [
+    { url = "https://files.pythonhosted.org/packages/ca/51/409a8184ed35453d9cbb3d6b20d524b1115c2c2d117b85d5e9b06cd70b45/datasets-4.3.0-py3-none-any.whl", hash = "sha256:0ea157e72138b3ca6c7d2415f19a164ecf7d4c4fa72da2a570da286882e96903", size = 506846, upload-time = "2025-10-23T16:31:49.965Z" },
 ]
 [[package]]
 [[package]]
 name = "fastapi"
+version = "0.120.0"
 source = { registry = "https://pypi.org/simple" }
 dependencies = [
+    { name = "annotated-doc" },
     { name = "pydantic" },
     { name = "starlette" },
     { name = "typing-extensions" },
 ]
+sdist = { url = "https://files.pythonhosted.org/packages/f7/0e/7f29e8f7219e4526747db182e1afb5a4b6abc3201768fb38d81fa2536241/fastapi-0.120.0.tar.gz", hash = "sha256:6ce2c1cfb7000ac14ffd8ddb2bc12e62d023a36c20ec3710d09d8e36fab177a0", size = 337603, upload-time = "2025-10-23T20:56:34.743Z" }
 wheels = [
+    { url = "https://files.pythonhosted.org/packages/1d/60/7a639ceaba54aec4e1d5676498c568abc654b95762d456095b6cb529b1ca/fastapi-0.120.0-py3-none-any.whl", hash = "sha256:84009182e530c47648da2f07eb380b44b69889a4acfd9e9035ee4605c5cfc469", size = 108243, upload-time = "2025-10-23T20:56:33.281Z" },
 ]
 [[package]]
     { name = "qdrant-client" },
     { name = "ragas" },
     { name = "rank-bm25" },
+    { name = "requests" },
     { name = "sentence-transformers" },
     { name = "unstructured" },
     { name = "uvicorn" },
     { name = "qdrant-client", specifier = ">=1.15.1" },
     { name = "ragas", specifier = ">=0.3.7" },
     { name = "rank-bm25", specifier = ">=0.2.2" },
+    { name = "requests", specifier = ">=2.32.5" },
     { name = "sentence-transformers", specifier = ">=5.1.2" },
     { name = "unstructured", specifier = ">=0.18.15" },
     { name = "uvicorn", specifier = ">=0.38.0" },
 [[package]]
 name = "langsmith"
+version = "0.4.38"
 source = { registry = "https://pypi.org/simple" }
 dependencies = [
     { name = "httpx" },
     { name = "requests-toolbelt" },
     { name = "zstandard" },
 ]
+sdist = { url = "https://files.pythonhosted.org/packages/37/21/f1ba48412c64bf3bb8feb532fc9d247b396935b5d8242332d44a4195ec2d/langsmith-0.4.38.tar.gz", hash = "sha256:3aa57f9c16a5880256cd1eab0452533c1fb5ee14ec5250e23ed919cc2b07f6d3", size = 942789, upload-time = "2025-10-23T22:28:20.458Z" }
 wheels = [
+    { url = "https://files.pythonhosted.org/packages/b4/2b/7e0248f65e35800ea8e4e3dbb3bcc36c61b81f5b8abeddaceec8320ab491/langsmith-0.4.38-py3-none-any.whl", hash = "sha256:326232a24b1c6dd308a3188557cc023adf8fb14144263b2982c115a6be5141e7", size = 397341, upload-time = "2025-10-23T22:28:18.333Z" },
 ]
 [[package]]
 [[package]]
 name = "ruff"
+version = "0.14.2"
+source = { registry = "https://pypi.org/simple" }
+sdist = { url = "https://files.pythonhosted.org/packages/ee/34/8218a19b2055b80601e8fd201ec723c74c7fe1ca06d525a43ed07b6d8e85/ruff-0.14.2.tar.gz", hash = "sha256:98da787668f239313d9c902ca7c523fe11b8ec3f39345553a51b25abc4629c96", size = 5539663, upload-time = "2025-10-23T19:37:00.956Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/16/dd/23eb2db5ad9acae7c845700493b72d3ae214dce0b226f27df89216110f2b/ruff-0.14.2-py3-none-linux_armv6l.whl", hash = "sha256:7cbe4e593505bdec5884c2d0a4d791a90301bc23e49a6b1eb642dd85ef9c64f1", size = 12533390, upload-time = "2025-10-23T19:36:18.044Z" },
+    { url = "https://files.pythonhosted.org/packages/5a/8c/5f9acff43ddcf3f85130d0146d0477e28ccecc495f9f684f8f7119b74c0d/ruff-0.14.2-py3-none-macosx_10_12_x86_64.whl", hash = "sha256:8d54b561729cee92f8d89c316ad7a3f9705533f5903b042399b6ae0ddfc62e11", size = 12887187, upload-time = "2025-10-23T19:36:22.664Z" },
+    { url = "https://files.pythonhosted.org/packages/99/fa/047646491479074029665022e9f3dc6f0515797f40a4b6014ea8474c539d/ruff-0.14.2-py3-none-macosx_11_0_arm64.whl", hash = "sha256:5c8753dfa44ebb2cde10ce5b4d2ef55a41fb9d9b16732a2c5df64620dbda44a3", size = 11925177, upload-time = "2025-10-23T19:36:24.778Z" },
+    { url = "https://files.pythonhosted.org/packages/15/8b/c44cf7fe6e59ab24a9d939493a11030b503bdc2a16622cede8b7b1df0114/ruff-0.14.2-py3-none-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:3d0bbeffb8d9f4fccf7b5198d566d0bad99a9cb622f1fc3467af96cb8773c9e3", size = 12358285, upload-time = "2025-10-23T19:36:26.979Z" },
+    { url = "https://files.pythonhosted.org/packages/45/01/47701b26254267ef40369aea3acb62a7b23e921c27372d127e0f3af48092/ruff-0.14.2-py3-none-manylinux_2_17_armv7l.manylinux2014_armv7l.whl", hash = "sha256:7047f0c5a713a401e43a88d36843d9c83a19c584e63d664474675620aaa634a8", size = 12303832, upload-time = "2025-10-23T19:36:29.192Z" },
+    { url = "https://files.pythonhosted.org/packages/2d/5c/ae7244ca4fbdf2bee9d6405dcd5bc6ae51ee1df66eb7a9884b77b8af856d/ruff-0.14.2-py3-none-manylinux_2_17_i686.manylinux2014_i686.whl", hash = "sha256:3bf8d2f9aa1602599217d82e8e0af7fd33e5878c4d98f37906b7c93f46f9a839", size = 13036995, upload-time = "2025-10-23T19:36:31.861Z" },
+    { url = "https://files.pythonhosted.org/packages/27/4c/0860a79ce6fd4c709ac01173f76f929d53f59748d0dcdd662519835dae43/ruff-0.14.2-py3-none-manylinux_2_17_ppc64.manylinux2014_ppc64.whl", hash = "sha256:1c505b389e19c57a317cf4b42db824e2fca96ffb3d86766c1c9f8b96d32048a7", size = 14512649, upload-time = "2025-10-23T19:36:33.915Z" },
+    { url = "https://files.pythonhosted.org/packages/7f/7f/d365de998069720a3abfc250ddd876fc4b81a403a766c74ff9bde15b5378/ruff-0.14.2-py3-none-manylinux_2_17_ppc64le.manylinux2014_ppc64le.whl", hash = "sha256:a307fc45ebd887b3f26b36d9326bb70bf69b01561950cdcc6c0bdf7bb8e0f7cc", size = 14088182, upload-time = "2025-10-23T19:36:36.983Z" },
+    { url = "https://files.pythonhosted.org/packages/6c/ea/d8e3e6b209162000a7be1faa41b0a0c16a133010311edc3329753cc6596a/ruff-0.14.2-py3-none-manylinux_2_17_s390x.manylinux2014_s390x.whl", hash = "sha256:61ae91a32c853172f832c2f40bd05fd69f491db7289fb85a9b941ebdd549781a", size = 13599516, upload-time = "2025-10-23T19:36:39.208Z" },
+    { url = "https://files.pythonhosted.org/packages/fa/ea/c7810322086db68989fb20a8d5221dd3b79e49e396b01badca07b433ab45/ruff-0.14.2-py3-none-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:bc1967e40286f63ee23c615e8e7e98098dedc7301568bd88991f6e544d8ae096", size = 13272690, upload-time = "2025-10-23T19:36:41.453Z" },
+    { url = "https://files.pythonhosted.org/packages/a9/39/10b05acf8c45786ef501d454e00937e1b97964f846bf28883d1f9619928a/ruff-0.14.2-py3-none-manylinux_2_31_riscv64.whl", hash = "sha256:2877f02119cdebf52a632d743a2e302dea422bfae152ebe2f193d3285a3a65df", size = 13496497, upload-time = "2025-10-23T19:36:43.61Z" },
+    { url = "https://files.pythonhosted.org/packages/59/a1/1f25f8301e13751c30895092485fada29076e5e14264bdacc37202e85d24/ruff-0.14.2-py3-none-musllinux_1_2_aarch64.whl", hash = "sha256:e681c5bc777de5af898decdcb6ba3321d0d466f4cb43c3e7cc2c3b4e7b843a05", size = 12266116, upload-time = "2025-10-23T19:36:45.625Z" },
+    { url = "https://files.pythonhosted.org/packages/5c/fa/0029bfc9ce16ae78164e6923ef392e5f173b793b26cc39aa1d8b366cf9dc/ruff-0.14.2-py3-none-musllinux_1_2_armv7l.whl", hash = "sha256:e21be42d72e224736f0c992cdb9959a2fa53c7e943b97ef5d081e13170e3ffc5", size = 12281345, upload-time = "2025-10-23T19:36:47.618Z" },
+    { url = "https://files.pythonhosted.org/packages/a5/ab/ece7baa3c0f29b7683be868c024f0838770c16607bea6852e46b202f1ff6/ruff-0.14.2-py3-none-musllinux_1_2_i686.whl", hash = "sha256:b8264016f6f209fac16262882dbebf3f8be1629777cf0f37e7aff071b3e9b92e", size = 12629296, upload-time = "2025-10-23T19:36:49.789Z" },
+    { url = "https://files.pythonhosted.org/packages/a4/7f/638f54b43f3d4e48c6a68062794e5b367ddac778051806b9e235dfb7aa81/ruff-0.14.2-py3-none-musllinux_1_2_x86_64.whl", hash = "sha256:5ca36b4cb4db3067a3b24444463ceea5565ea78b95fe9a07ca7cb7fd16948770", size = 13371610, upload-time = "2025-10-23T19:36:51.882Z" },
+    { url = "https://files.pythonhosted.org/packages/8d/35/3654a973ebe5b32e1fd4a08ed2d46755af7267da7ac710d97420d7b8657d/ruff-0.14.2-py3-none-win32.whl", hash = "sha256:41775927d287685e08f48d8eb3f765625ab0b7042cc9377e20e64f4eb0056ee9", size = 12415318, upload-time = "2025-10-23T19:36:53.961Z" },
+    { url = "https://files.pythonhosted.org/packages/71/30/3758bcf9e0b6a4193a6f51abf84254aba00887dfa8c20aba18aa366c5f57/ruff-0.14.2-py3-none-win_amd64.whl", hash = "sha256:0df3424aa5c3c08b34ed8ce099df1021e3adaca6e90229273496b839e5a7e1af", size = 13565279, upload-time = "2025-10-23T19:36:56.578Z" },
+    { url = "https://files.pythonhosted.org/packages/2e/5d/aa883766f8ef9ffbe6aa24f7192fb71632f31a30e77eb39aa2b0dc4290ac/ruff-0.14.2-py3-none-win_arm64.whl", hash = "sha256:ea9d635e83ba21569fbacda7e78afbfeb94911c9434aff06192d9bc23fd5495a", size = 12554956, upload-time = "2025-10-23T19:36:58.714Z" },
 ]
 [[package]]