Spaces:

teofizzy
/

mshauri-fedha

Sleeping

App Files Files Community

teofizzy committed on Feb 2

Commit

f8266e7

1 Parent(s): c60e74e

Changed to use the Hugging Face serverless endpoint, with local CPU inference (Ollama) as a fallback

Browse files

Files changed (5) hide show

Dockerfile +5 -4
requirements.txt +2 -1
src/app.py +3 -5
src/load/mshauri_demo.py +56 -46
src/load/start_ollama.py +3 -3

Dockerfile CHANGED Viewed

@@ -34,15 +34,16 @@ COPY --chown=user . $HOME/app
 # 7. Startup
 #    We clone the dataset. git-lfs ensures we get the big files.
 CMD git clone https://huggingface.co/datasets/teofizzy/mshauri-data data_download && \
     mv data_download/mshauri_fedha_v6.db . && \
     mv data_download/mshauri_fedha_chroma_db . && \
     rm -rf data_download && \
-    echo "⬇️ Starting Ollama..." && \
     ollama serve & \
     sleep 10 && \
-    echo "⬇️ Pulling Models..." && \
-    ollama pull qwen2.5:7b && \
     ollama pull nomic-embed-text && \
-    echo "✅ Models Ready. Launching App..." && \
     streamlit run src/app.py --server.port 7860 --server.address 0.0.0.0

 # 7. Startup
 #    We clone the dataset. git-lfs ensures we get the big files.
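+#    CHANGE: Pulling 'qwen2.5:3b' instead of '7b' for a faster fallback.
+#    NOTE(review): the Ollama fallback in src/load/mshauri_demo.py must request
+#    this same tag; it currently hard-codes "qwen2.5:7b", which is not pulled here.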
 CMD git clone https://huggingface.co/datasets/teofizzy/mshauri-data data_download && \
     mv data_download/mshauri_fedha_v6.db . && \
     mv data_download/mshauri_fedha_chroma_db . && \
     rm -rf data_download && \
+    echo "Starting Ollama..." && \
     ollama serve & \
     sleep 10 && \
+    echo "Pulling Fallback Model (3B)..." && \
+    ollama pull qwen2.5:3b && \
     ollama pull nomic-embed-text && \
+    echo "Models Ready. Launching App..." && \
     streamlit run src/app.py --server.port 7860 --server.address 0.0.0.0

requirements.txt CHANGED Viewed

@@ -3,7 +3,8 @@ pandas
 numpy
 langchain-ollama
 langchain-community
 langchain-chroma
 chromadb
 huggingface_hub
-pysqlite3-binary

 numpy
 langchain-ollama
 langchain-community
+langchain-huggingface
 langchain-chroma
 chromadb
 huggingface_hub
+pysqlite3-binary

src/app.py CHANGED Viewed

@@ -28,7 +28,6 @@ if "messages" not in st.session_state:
 if "agent" not in st.session_state:
     with st.spinner("Initializing Mshauri Brain (Loading Models & Data)..."):
-        # --- THE FIX IS HERE ---
         # SQLAlchemy requires a URI starting with sqlite:///
         # We use 4 slashes (sqlite:////) because it is an absolute path on Linux
         sql_path = f"sqlite:///{os.path.join(current_dir, 'mshauri_fedha_v6.db')}"
@@ -37,15 +36,14 @@ if "agent" not in st.session_state:
         # Check if data exists (Debugging for Space deployment)
         real_db_path = os.path.join(current_dir, "mshauri_fedha_v6.db")
         if not os.path.exists(real_db_path):
-            st.error(f"❌ Database not found at {real_db_path}. Did the clone fail?")
             st.stop()
         try:
-            # Force the 7b model here to ensure CPU compatibility
             st.session_state.agent = create_mshauri_agent(
                 sql_db_path=sql_path,
-                vector_db_path=vector_path,
-                llm_model="qwen2.5:7b"
             )
             st.success("System Ready!")
         except Exception as e:

 if "agent" not in st.session_state:
     with st.spinner("Initializing Mshauri Brain (Loading Models & Data)..."):
         # SQLAlchemy requires a URI starting with sqlite:///
         # We use 4 slashes (sqlite:////) because it is an absolute path on Linux
         sql_path = f"sqlite:///{os.path.join(current_dir, 'mshauri_fedha_v6.db')}"
         # Check if data exists (Debugging for Space deployment)
         real_db_path = os.path.join(current_dir, "mshauri_fedha_v6.db")
         if not os.path.exists(real_db_path):
+            st.error(f"Database not found at {real_db_path}. Did the clone fail?")
             st.stop()
         try:
+            # No llm_model is passed: let mshauri_demo.py pick the API or local model.
             st.session_state.agent = create_mshauri_agent(
                 sql_db_path=sql_path,
+                vector_db_path=vector_path
             )
             st.success("System Ready!")
         except Exception as e:

src/load/mshauri_demo.py CHANGED Viewed

@@ -2,7 +2,8 @@ import os
 import re
 import sys
 import io
-from contextlib import redirect_stdout # <--- FIXED: Missing Import
 from langchain_ollama import ChatOllama
 from langchain_community.utilities import SQLDatabase
 from langchain_community.agent_toolkits.sql.toolkit import SQLDatabaseToolkit
@@ -56,39 +57,39 @@ class SimpleReActAgent:
         # IMPROVED PROMPT: Explicitly tells agent to switch strategies if SQL fails
         self.prompt_template = """You are Mshauri Fedha, a senior financial advisor for Kenya.
-Your goal is to provide accurate, data-backed advice.
-RULES:
-1. CITATIONS: You MUST cite your sources (,).
-    - SQL Data ->
-    - Text Data ->
-    - Code -> PythonREPLTool
-2. STRATEGY:
-    - First, check SQL tables ('sql_db_list_tables').
-    - IF the tables listed do NOT match the user's question, IMMEDIATELY switch to 'search_financial_reports_and_news'.
-    - Do NOT keep asking for tables if they are clearly not there.
-3. ADVICE: After presenting facts, add an "Advisory Opinion" section.
-4. CONFIDENCE: If data is old, state "Low Confidence".
-Tools Available:
-{tool_desc}
-Use the following format:
-Question: the input question you must answer
-Thought: you should always think about what to do
-Thought: look at the tools and the question. Which tool is best?
-Action: the action to take, should be one of [{tool_names}]
-Action Input: the input to the action
-Observation: the result of the action
-... (repeat Thought/Action/Observation as needed)
-Thought: I have enough info.
-Final Answer: the final answer with citations.
-Begin!
-Question: {input}
-Thought:{agent_scratchpad}"""
     def invoke(self, inputs):
         query = inputs["input"]
@@ -128,7 +129,7 @@ Thought:{agent_scratchpad}"""
                 if action_name in self.tools:
                     if self.verbose:
-                        print(f"🛠️  Calling '{action_name}' with: '{action_input}'")
                     try:
                         tool = self.tools[action_name]
@@ -142,7 +143,7 @@ Thought:{agent_scratchpad}"""
                     # --- ADDED LOGGING HERE ---
                     if self.verbose:
                         # Print first 200 chars so we can see if it worked
-                        print(f"👀 Observation: {str(tool_result)[:200]}...")
                     observation = f"\nObservation: {tool_result}\n"
                 else:
@@ -163,22 +164,31 @@ def create_mshauri_agent(
     sql_db_path=DEFAULT_SQL_DB,
     vector_db_path=DEFAULT_VECTOR_DB,
     llm_model=DEFAULT_LLM_MODEL,
-    ollama_url=DEFAULT_OLLAMA_URL
-):
     print(f"⚙️  Initializing Mshauri Fedha (Model: {llm_model})...")
     # 1. Initialize LLM
-    try:
-        llm = ChatOllama(model=llm_model, base_url=ollama_url, temperature=0.1)
-    except Exception as e:
-        print(f"❌ Error connecting to Ollama: {e}")
-        return None
     # 2. LEFT BRAIN (SQL)
     if "sqlite" in sql_db_path:
         real_path = sql_db_path.replace("sqlite:///", "")
         if not os.path.exists(real_path):
-             print(f"⚠️  Warning: SQL Database not found at {real_path}")
     db = SQLDatabase.from_uri(sql_db_path)
     sql_toolkit = SQLDatabaseToolkit(db=db, llm=llm)
@@ -205,7 +215,7 @@ def create_mshauri_agent(
     tools = sql_tools + [retriever_tool, repl_tool]
     agent = SimpleReActAgent(llm, tools)
-    print("✅ Mshauri Agent Ready (Zero-Dependency Mode).")
     return agent
 def ask_mshauri(agent, query):

 import re
 import sys
 import io
+from contextlib import redirect_stdout
+from langchain_huggingface import HuggingFaceEndpoint
 from langchain_ollama import ChatOllama
 from langchain_community.utilities import SQLDatabase
 from langchain_community.agent_toolkits.sql.toolkit import SQLDatabaseToolkit
         # IMPROVED PROMPT: Explicitly tells agent to switch strategies if SQL fails
         self.prompt_template = """You are Mshauri Fedha, a senior financial advisor for Kenya.
+        Your goal is to provide accurate, data-backed advice.
+        RULES:
+        1. CITATIONS: You MUST cite your sources (,).
+            - SQL Data ->
+            - Text Data ->
+            - Code -> PythonREPLTool
+        2. STRATEGY:
+            - First, check SQL tables ('sql_db_list_tables').
+            - IF the tables listed do NOT match the user's question, IMMEDIATELY switch to 'search_financial_reports_and_news'.
+            - Do NOT keep asking for tables if they are clearly not there.
+        3. ADVICE: After presenting facts, add an "Advisory Opinion" section.
+        4. CONFIDENCE: If data is old, state "Low Confidence".
+        Tools Available:
+        {tool_desc}
+        Use the following format:
+        Question: the input question you must answer
+        Thought: you should always think about what to do
+        Thought: look at the tools and the question. Which tool is best?
+        Action: the action to take, should be one of [{tool_names}]
+        Action Input: the input to the action
+        Observation: the result of the action
+        ... (repeat Thought/Action/Observation as needed)
+        Thought: I have enough info.
+        Final Answer: the final answer with citations.
+        Begin!
+        Question: {input}
+        Thought:{agent_scratchpad}"""
     def invoke(self, inputs):
         query = inputs["input"]
                 if action_name in self.tools:
                     if self.verbose:
+                        print(f"Calling '{action_name}' with: '{action_input}'")
                     try:
                         tool = self.tools[action_name]
                     # --- ADDED LOGGING HERE ---
                     if self.verbose:
                         # Print first 200 chars so we can see if it worked
+                        print(f"Observation: {str(tool_result)[:200]}...")
                     observation = f"\nObservation: {tool_result}\n"
                 else:
     sql_db_path=DEFAULT_SQL_DB,
     vector_db_path=DEFAULT_VECTOR_DB,
     llm_model=DEFAULT_LLM_MODEL,
+    ollama_url=DEFAULT_OLLAMA_URL):
     print(f"⚙️  Initializing Mshauri Fedha (Model: {llm_model})...")
     # 1. Initialize LLM
+    hf_token = os.getenv("HF_TOKEN")
+    if hf_token:
+        print("Using Hugging Face Serverless API")
+        # We can use the massive 72B model because we aren't hosting it!
+        llm = HuggingFaceEndpoint(
+            repo_id="Qwen/Qwen2.5-72B-Instruct",
+            task="text-generation",
+            max_new_tokens=512,
+            repetition_penalty=1.1,
+            temperature=0.2,
+            huggingfacehub_api_token=hf_token
+        )
+    else:
+        print("Using Local CPU Ollama (Slow)")
+        llm = ChatOllama(model="qwen2.5:7b", base_url=ollama_url, temperature=0.1)
     # 2. LEFT BRAIN (SQL)
     if "sqlite" in sql_db_path:
         real_path = sql_db_path.replace("sqlite:///", "")
         if not os.path.exists(real_path):
+             print(f"Warning: SQL Database not found at {real_path}")
     db = SQLDatabase.from_uri(sql_db_path)
     sql_toolkit = SQLDatabaseToolkit(db=db, llm=llm)
     tools = sql_tools + [retriever_tool, repl_tool]
     agent = SimpleReActAgent(llm, tools)
+    print(" Mshauri Agent Ready (Zero-Dependency Mode).")
     return agent
 def ask_mshauri(agent, query):

src/load/start_ollama.py CHANGED Viewed

@@ -2,6 +2,8 @@ import os
 import subprocess
 import time
 import requests
 from pathlib import Path
 def start_ollama_server():
@@ -49,9 +51,7 @@ def start_ollama_server():
         print(f" Failed to start server: {e}")
         return False
-import requests
-import json
-import sys
 def pull_embedding_model(model_name="nomic-embed-text"):
     url = "http://127.0.0.1:25000/api/pull"

 import subprocess
 import time
 import requests
+import json
+import sys
 from pathlib import Path
 def start_ollama_server():
         print(f" Failed to start server: {e}")
         return False
 def pull_embedding_model(model_name="nomic-embed-text"):
     url = "http://127.0.0.1:25000/api/pull"