Spaces:

alesamodio
/

Socrates_docker

Sleeping

App Files Files Community

alesamodio committed on Dec 5, 2025

Commit

ee157dc

1 Parent(s): 3ced307

remove streamlit from retrieve

Browse files

Files changed (2) hide show

Retrieve.py +10 -5
socrates_core.py +34 -4

Retrieve.py CHANGED Viewed

@@ -36,6 +36,7 @@ def retrieve_chunks_from_vdb(
     use_metadata_boost: bool = False,
     filter_keywords: List[str] = None,
     topic: str = None,
 ) -> List[Dict]:
     """
     Download FAISS index from Supabase, search it, return top-k results.
@@ -94,7 +95,8 @@ def retrieve_all_chunks(
     k: int = 10,
     filter_keywords: List[str] = None,
     topic: str = None,
-    topic_to_dbs: Dict[str, List[str]] = None
 ) -> List[Dict]:
     """
     Retrieve chunks across all Supabase sources (dbs + personal_info + chat_history).
@@ -136,11 +138,12 @@ def retrieve_all_chunks(
                 query_vector=query_vector,
                 model=model,
                 query=query,
-                username=username,   # ✅ FIX
                 k=k,
                 use_metadata_boost=use_metadata_boost,
                 filter_keywords=filter_keywords,
-                topic = topic,
             )
     return all_chunks
@@ -151,7 +154,8 @@ def retrieve_from_db(
     query: str,
     model,
     username: str,
-    k: int = 5
 ) -> List[Dict]:
     """
     Retrieve top-k chunks from a single Supabase FAISS db (e.g. db6).
@@ -163,7 +167,8 @@ def retrieve_from_db(
         model=model,
         query=query,
         username=username,
-        k=k
     )
 # used in retrieve_chunks_from_vdb
 def compute_metadata_boost(metadata: Dict, query: str, filter_keywords: List[str] = None) -> float:

     use_metadata_boost: bool = False,
     filter_keywords: List[str] = None,
     topic: str = None,
+    db6_override_store: Optional[FAISS] = None,  # NEW
 ) -> List[Dict]:
     """
     Download FAISS index from Supabase, search it, return top-k results.
     k: int = 10,
     filter_keywords: List[str] = None,
     topic: str = None,
+    topic_to_dbs: Dict[str, List[str]] = None,
+    db6_override_store: Optional[FAISS] = None  # NEW
 ) -> List[Dict]:
     """
     Retrieve chunks across all Supabase sources (dbs + personal_info + chat_history).
                 query_vector=query_vector,
                 model=model,
                 query=query,
+                username=username,
                 k=k,
                 use_metadata_boost=use_metadata_boost,
                 filter_keywords=filter_keywords,
+                topic=topic,
+                db6_override_store=db6_override_store,  # NEW: passed through
             )
     return all_chunks
     query: str,
     model,
     username: str,
+    k: int = 5,
+    db6_override_store: Optional[FAISS] = None,  # NEW (optional)
 ) -> List[Dict]:
     """
     Retrieve top-k chunks from a single Supabase FAISS db (e.g. db6).
         model=model,
         query=query,
         username=username,
+        k=k,
+        db6_override_store=db6_override_store,   # pass through
     )
 # used in retrieve_chunks_from_vdb
 def compute_metadata_boost(metadata: Dict, query: str, filter_keywords: List[str] = None) -> float:

socrates_core.py CHANGED Viewed

@@ -1,6 +1,6 @@
 # socrates_core.py
 from typing import Dict, Any, Optional, List
 from supabase import create_client
 from langchain_huggingface import HuggingFaceEmbeddings
@@ -80,21 +80,51 @@ def socrates_reply(
     except Exception:
         emotion_result = None
     # ---- Classify message ----
     analysis = analyze_message(user_id, user_msg_en)
     story_topic = analysis.get("topic_for_story")
-    # ---- Retrieval ----
     chunks = retrieve_all_chunks(
         query=user_msg_en,
         model=embeddings,
         user_id=user_id,
         username=username,
         k=10,
-        topic=analysis.get("topic"),
         topic_to_dbs=TOPIC_TO_DBS,
     )
     # ---- Story / anecdote selection ----
     socratic_story_dic = pick_story_with_fallback(user_id, story_topic)
     socratic_story_formatted = build_story_txt(

 # socrates_core.py
 from typing import Dict, Any, Optional, List
+from db7_pipeline import run_db7_pipeline
 from supabase import create_client
 from langchain_huggingface import HuggingFaceEmbeddings
     except Exception:
         emotion_result = None
+    # ---- Classify message ----
     # ---- Classify message ----
     analysis = analyze_message(user_id, user_msg_en)
     story_topic = analysis.get("topic_for_story")
+    topic = analysis.get("topic")
+    needs_news_fetch = analysis.get("needs_news_fetch", False)
+    # ---- Optional db7 news pipeline (build fresh db6) ----
+    db7_result = None  # we just store it for now, not used in retrieval yet
+    try:
+        # Simple gate to start with: run only when the topic is "news" and
+        # the analysis flags needs_news_fetch; refine later (e.g. by news_type).
+        if topic == "news" and needs_news_fetch:
+            db7_result = run_db7_pipeline(
+                news_topic=[user_msg_en],  # or a keyword list, we can refine later
+                user_query=user_msg_en,
+                username=username,
+                user_id=user_id,
+                user_countries=profile.get("countries_of_interest", []),
+                user_lang=user_lang_code,
+            )
+            # db7_result is a dict like:
+            # {
+            #   "status": "ok",
+            #   "keywords": ...,
+            #   "articles": ...,
+            #   "top_full": ...,
+            #   "faiss_object": <FAISS store for updated db6>
+            # }
+    except Exception as e:
+        print(f"⚠️ db7 pipeline failed or not configured: {e}")
+        db7_result = None
+    # ---- Retrieval (still old behaviour for now) ----
     chunks = retrieve_all_chunks(
         query=user_msg_en,
         model=embeddings,
         user_id=user_id,
         username=username,
         k=10,
+        topic=topic,
         topic_to_dbs=TOPIC_TO_DBS,
     )
     # ---- Story / anecdote selection ----
     socratic_story_dic = pick_story_with_fallback(user_id, story_topic)
     socratic_story_formatted = build_story_txt(