Spaces:

m97j
/

knowledge-engine

Sleeping

App Files Files Community

m97j committed 16 days ago

Commit

9496080

1 Parent(s): ee15d5b

fix(search): add missing return statement in search service

Browse files

Files changed (3) hide show

api/schemas/search.py +2 -1
api/v1/search.py +4 -2
services/search_service.py +13 -6

api/schemas/search.py CHANGED Viewed

@@ -13,7 +13,8 @@ class SearchRequest(BaseModel):
     top_k: int = Field(default=5, ge=1, le=50)
     # optional
-    use_reranker: Optional[bool] = True
 # ---------------------------
 # Document metadata

     top_k: int = Field(default=5, ge=1, le=50)
     # optional
+    use_reranking: Optional[bool] = True
+    include_llm_context: Optional[bool] = True
 # ---------------------------
 # Document metadata

api/v1/search.py CHANGED Viewed

@@ -28,7 +28,9 @@ async def execute_search(
     try:
         search_output = search_service.search(
             query=request_data.query,
-            top_k=request_data.top_k
         )
         return SearchResponse(
             query=search_output["query"],
@@ -66,7 +68,7 @@ async def demo_page_post(
     Handle form submission from the demo page, execute the search, and render results in the same template.
     """
     try:
-        search_output = search_service.search(query=query, top_k=5)
         return templates.TemplateResponse(
             "index.html",

     try:
         search_output = search_service.search(
             query=request_data.query,
+            top_k=request_data.top_k,
+            use_reranking=request_data.use_reranking,
+            include_llm_context=request_data.include_llm_context
         )
         return SearchResponse(
             query=search_output["query"],
     Handle form submission from the demo page, execute the search, and render results in the same template.
     """
     try:
+        search_output = search_service.search(query=query, top_k=5, use_reranking=False, include_llm_context=False)
         return templates.TemplateResponse(
             "index.html",

services/search_service.py CHANGED Viewed

@@ -24,13 +24,14 @@ class HybridSearchService:
         self.embedder = embedder
         self.reranker = reranker
-    def search(self, query: str, top_k: int = 5, limit: int = 50, include_llm_context: bool = True) -> Dict[str, Any]:
         """
         Receives user queries and performs hybrid search and reranking.
         :param query: User search query
         :param top_k: Number of documents to return (after reranking)
         :param limit: Number of candidate documents to fetch from Qdrant (after RRF fusion, before reranking)
         :param include_llm_context: Whether to include LLM context in the response (formatted text for LLM consumption)
         :return: A dictionary containing the original query, a list of search results, and latency information. Each search result includes chunk_id, text, relevance score, and metadata.
         """
@@ -80,11 +81,15 @@ class HybridSearchService:
             # 5. Perform Cross-Encoder Reranking
             # Return a list sorted in descending order after recalculating context-based precise scores
-            reranked_docs = self.reranker.rerank(
-                query=query,
-                documents=chunks_for_reranking,
-                text_key="text"
-            )
             # 6. Top-K Truncation and Mapping to Pydantic Schema (SearchResultItem) Specification
             final_results = []
@@ -108,6 +113,8 @@ class HybridSearchService:
             if include_llm_context:
                 # 7. Optional: Format results into LLM-friendly context (Markdown/XML mixed format)
                 response["llm_context"] = self.format_for_llm(final_results)
         except Exception as e:
             # Wrap unexpected errors in custom errors and throw them to the router

         self.embedder = embedder
         self.reranker = reranker
+    def search(self, query: str, top_k: int = 5, limit: int = 50, use_reranking: bool = True, include_llm_context: bool = True) -> Dict[str, Any]:
         """
         Receives user queries and performs hybrid search and reranking.
         :param query: User search query
         :param top_k: Number of documents to return (after reranking)
         :param limit: Number of candidate documents to fetch from Qdrant (after RRF fusion, before reranking)
+        :param use_reranking: Whether to use reranking (if False, it will skip the reranking step and return Qdrant results directly, still mapped with SQLite data)
         :param include_llm_context: Whether to include LLM context in the response (formatted text for LLM consumption)
         :return: A dictionary containing the original query, a list of search results, and latency information. Each search result includes chunk_id, text, relevance score, and metadata.
         """
             # 5. Perform Cross-Encoder Reranking
             # Return a list sorted in descending order after recalculating context-based precise scores
+            if use_reranking:
+                reranked_docs = self.reranker.rerank(
+                    query=query,
+                    documents=chunks_for_reranking,
+                    text_key="text"
+                )
+            else:
+                # If reranking is disabled, use the Qdrant results directly
+                reranked_docs = chunks_for_reranking
             # 6. Top-K Truncation and Mapping to Pydantic Schema (SearchResultItem) Specification
             final_results = []
             if include_llm_context:
                 # 7. Optional: Format results into LLM-friendly context (Markdown/XML mixed format)
                 response["llm_context"] = self.format_for_llm(final_results)
+            return response
         except Exception as e:
             # Wrap unexpected errors in custom errors and throw them to the router