Spaces:

TeamSAS
/

UB_VSA

Sleeping

SakshamLak committed on May 15, 2025

Commit

867fb31

verified ·

1 Parent(s): 2b03f76

Upload 2 files

Files changed (2) hide show

buffalo_rag/api/README.md ADDED Viewed


1	+ # API Directory
2	+
3	+ This directory contains the FastAPI backend for the UB-VSA project. It includes routes, schemas, and static assets for serving the API endpoints.

buffalo_rag/api/background_tasks.py ADDED Viewed

+from buffalo_rag.scraper.scraper import BuffaloScraper
+from buffalo_rag.embeddings.chunker import DocumentChunker
+from buffalo_rag.vector_store.db import VectorStore
+from buffalo_rag.model.rag import BuffaloRAG
+def run_scraper(seed_url: str, max_pages: int):
+    """Run the web scraper in the background."""
+    scraper = BuffaloScraper(seed_url=seed_url)
+    scraper.scrape(max_pages=max_pages)
+    # After scraping, update the embeddings and index
+    chunker = DocumentChunker()
+    chunks = chunker.create_chunks()
+    chunker.create_embeddings(chunks)
+    # Reload the vector store
+    global vector_store
+    vector_store = VectorStore()
+    # Update the RAG model
+    global rag
+    rag = BuffaloRAG(vector_store=vector_store)
+def refresh_index():
+    """Refresh the vector index in the background."""
+    chunker = DocumentChunker()
+    chunks = chunker.create_chunks()
+    chunker.create_embeddings(chunks)
+    # Reload the vector store
+    global vector_store
+    vector_store = VectorStore()
+    # Update the RAG model
+    global rag
+    rag = BuffaloRAG(vector_store=vector_store)