NimrodDev committed on
Commit
74b9a8d
·
1 Parent(s): c66dd86
Files changed (2) hide show
  1. app.py +15 -8
  2. rag.py +87 -76
app.py CHANGED
@@ -1,16 +1,23 @@
1
- # app.py
2
- from flask import Flask, request, jsonify
3
  from rag import ask_question
4
 
5
  app = Flask(__name__)
6
 
7
  @app.route("/webhook", methods=["POST"])
8
  def webhook():
9
- payload = request.get_json(force=True)
10
- phone = payload["phone"]
11
- question = payload["question"]
12
- answer, docs = ask_question(phone, question)
13
- return jsonify({"answer": answer, "docs": len(docs)})
 
 
 
 
 
 
 
 
14
 
15
  if __name__ == "__main__":
16
- app.run(host="0.0.0.0", port=7860)
 
1
# app.py — Flask webhook entry point for the Amina RAG bot.
# Restored: this import was commented out, but Flask, request and jsonify
# are all used below, so the module failed with a NameError on import.
from flask import Flask, request, jsonify

from rag import ask_question

app = Flask(__name__)
5
 
6
@app.route("/webhook", methods=["POST"])
def webhook():
    """Handle an incoming message payload and reply with a RAG answer.

    Always responds HTTP 200; any failure is caught and answered with a
    canned fallback so the upstream messaging provider does not retry.
    """
    try:
        payload = request.get_json(force=True)
        answer, docs = ask_question(payload.get("phone", ""),
                                    payload.get("question", ""))
        return jsonify({"answer": answer, "docs": len(docs)})
    except Exception as e:
        print(f"❌ Webhook error: {e}")
        return jsonify({"answer": "Let me get back to you on that.", "docs": 0})
17
+
18
@app.route("/healthcheck")
def healthcheck():
    """Liveness probe: confirm the service is up and responding."""
    status = {"status": "ok", "message": "Amina bot running!"}
    return jsonify(status)
21
 
22
if __name__ == "__main__":
    # Bind on all interfaces; 7860 is the conventional Hugging Face Spaces port.
    app.run(host="0.0.0.0", port=7860)
rag.py CHANGED
@@ -1,73 +1,80 @@
1
- # rag.py — production-grade, Parquet-ready, FAISS-cached RAG pipeline
2
  from __future__ import annotations
3
- import os, re, json, pickle
4
  from typing import List, Tuple
5
  from functools import lru_cache
6
- import requests
7
  from supabase import create_client
8
-
9
- # LangChain + HF
10
  from datasets import load_dataset
11
  from langchain.text_splitter import RecursiveCharacterTextSplitter
12
  from langchain_community.vectorstores import FAISS
13
- from langchain_community.embeddings import HuggingFaceEmbeddings
14
  from langchain_huggingface import HuggingFaceEndpoint
15
- from langchain_core.prompts import PromptTemplate
16
  from langchain.chains import RetrievalQA
 
17
 
18
- # ------------------------------------------------------------------ CONFIG
19
  DATASET_ID = "NimrodDev/LD_Events2"
20
- HF_TOKEN = os.getenv("HF_TOKEN")
 
 
 
 
21
  SUPABASE_URL = os.getenv("SUPABASE_URL")
22
  SUPABASE_KEY = os.getenv("SUPABASE_KEY")
23
- LLM_MODEL = "mistralai/Mistral-7B-Instruct-v0.3" # stronger model
24
- CACHE_DIR = os.getenv("HF_HOME", "/tmp/hf_cache")
25
- FAISS_PATH = "/tmp/faiss_index.pkl"
26
-
27
- os.makedirs(CACHE_DIR, exist_ok=True)
28
- os.environ["TRANSFORMERS_CACHE"] = CACHE_DIR
29
- os.environ["HF_HOME"] = CACHE_DIR
30
- os.environ["HF_HUB_CACHE"] = CACHE_DIR
31
-
32
- supabase = create_client(SUPABASE_URL, SUPABASE_KEY)
33
 
34
- # ------------------------------------------------------------------ INTENT DETECTION
35
- GREETING_RE = re.compile(r"\b(hi|hello|hey|good morning|good afternoon|good evening)\b", re.I)
36
- THANKS_RE = re.compile(r"\b(thank|thanks|appreciate)\b", re.I)
37
- BYE_RE = re.compile(r"\b(bye|goodbye|see you|later)\b", re.I)
38
- MONEY_RE = re.compile(r"\b(price|cost|budget|cheap|expensive|money|usd|ksh|payment|deposit)\b", re.I)
39
- COMPLAIN_RE = re.compile(r"\b(complain|bad|terrible|awful|disappointed|angry|slow|rude)\b", re.I)
40
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
41
  FALLBACKS = {
42
  "LD Events": {
43
- "greeting": "Hello! 👋 I’m Amina, your assistant for *LD Events* (weddings, graduations, corporate events) "
44
- "and *Lamaki Designs* (construction & architectural plans).\n\n"
45
- "Which service would you like to know about?\n\n",
46
- "money": "Our pricing depends on venue / project size. Please share a few details so we can give you a tailored quote.",
47
- "complain": "We’re sorry to hear this. A senior agent will contact you within 30 minutes to resolve the issue.",
48
- "thanks": "You’re welcome! If you need anything else, just text back.",
49
- "bye": "Thanks for chatting. Have a lovely day!",
50
- "default": "I’m not sure about that, but a human agent will follow up shortly."
51
  },
52
  "Lamaki Designs": {
53
- "greeting": "Karibu! 🏗️ I’m Amina, your assistant for *Lamaki Designs* (construction, architectural plans, project management) "
54
- "and *LD Events* (weddings, graduations, corporate events).\n\n"
55
- "Which service would you like to know about?\n\n",
56
- "money": "Cost varies by project size and materials. Kindly share your plot size / plan so we can estimate for you.",
57
- "complain": "We apologise for the inconvenience. Our site manager will call you within 30 minutes to sort it out.",
58
- "thanks": "Asante! Feel free to text any time.",
59
- "bye": "Good-bye and stay safe!",
60
- "default": "Let me get back to you on that."
61
  }
62
  }
63
 
64
- # ------------------------------------------------------------------ HELPERS
65
  def _company_from_text(text: str) -> str:
66
  t = text.lower()
67
- if any(k in t for k in ("ld events", "event", "wedding", "venue", "graduation")):
68
- return "LD Events"
69
- if any(k in t for k in ("lamaki", "construction", "build", "site", "bungalow", "architect")):
70
  return "Lamaki Designs"
 
 
71
  return "LD Events"
72
 
73
  def _detect_intent(text: str) -> str:
@@ -76,65 +83,67 @@ def _detect_intent(text: str) -> str:
76
  if BYE_RE.search(text): return "bye"
77
  if MONEY_RE.search(text): return "money"
78
  if COMPLAIN_RE.search(text): return "complain"
 
79
  return "normal"
80
 
81
  def _fallback_answer(company: str, intent: str) -> str:
82
  return FALLBACKS[company].get(intent, FALLBACKS[company]["default"])
83
 
84
- # ------------------------------------------------------------------ DATA FETCH (Parquet)
85
  @lru_cache(maxsize=1)
86
  def get_texts() -> List[str]:
87
  try:
88
- print("🔍 Loading dataset from Parquet branch...")
89
  ds = load_dataset(DATASET_ID, split="train", revision="refs/convert/parquet")
90
  texts = [str(row["text"]) for row in ds if row.get("text")]
91
- print(f"✅ Loaded {len(texts)} rows from {DATASET_ID}")
92
  return texts
93
  except Exception as e:
94
- print(f"⚠️ Failed to load Parquet dataset: {e}")
95
  return []
96
 
97
- # ------------------------------------------------------------------ VECTORSTORE
98
  @lru_cache(maxsize=1)
99
  def get_vectorstore() -> FAISS:
100
  if os.path.exists(FAISS_PATH):
101
  try:
102
  with open(FAISS_PATH, "rb") as f:
103
- vs = pickle.load(f)
104
- print("📦 Loaded cached FAISS index.")
105
- return vs
106
- except Exception:
107
- print("⚠️ Cached FAISS corrupted, rebuilding...")
108
 
109
  texts = get_texts()
110
  if not texts:
111
- print("⚠️ No dataset found; creating dummy FAISS index.")
112
- return FAISS.from_texts(["No context available."], HuggingFaceEmbeddings(model_name="all-MiniLM-L6-v2"))
 
113
 
114
- embeddings = HuggingFaceEmbeddings(model_name="sentence-transformers/all-MiniLM-L6-v2")
115
- splitter = RecursiveCharacterTextSplitter(chunk_size=600, chunk_overlap=100)
116
  docs = splitter.create_documents(texts)
 
117
  vs = FAISS.from_documents(docs, embeddings)
118
-
119
  with open(FAISS_PATH, "wb") as f:
120
  pickle.dump(vs, f)
121
  print("✅ FAISS index created and cached.")
122
  return vs
123
 
124
- # ------------------------------------------------------------------ LLM
125
  @lru_cache(maxsize=1)
126
  def get_llm():
 
 
127
  return HuggingFaceEndpoint(
128
  repo_id=LLM_MODEL,
129
  huggingfacehub_api_token=HF_TOKEN,
130
- temperature=0.1,
131
- max_new_tokens=200
132
  )
133
 
134
  PROMPT = PromptTemplate.from_template("""
135
- You are Amina, assistant for {company}.
136
- Answer clearly and politely using the context below.
137
- If context lacks information, say: "Let me get back to you on that."
138
 
139
  Context:
140
  {context}
@@ -145,24 +154,25 @@ Question:
145
  Answer:
146
  """)
147
 
148
- # ------------------------------------------------------------------ MAIN LOGIC
149
  def ask_question(phone: str, question: str) -> Tuple[str, List]:
150
- intent = _detect_intent(question)
151
  company = _company_from_text(question)
152
 
153
- # Quick intents skip RAG
154
- if intent in ("greeting", "thanks", "bye"):
155
  answer = _fallback_answer(company, intent)
156
  _save_chat(phone, question, answer)
157
  return answer, []
158
 
159
  vs = get_vectorstore()
160
  retriever = vs.as_retriever(search_kwargs={"k": 4})
 
161
  qa = RetrievalQA.from_chain_type(
162
  llm=get_llm(),
163
  retriever=retriever,
164
  chain_type_kwargs={"prompt": PROMPT},
165
- return_source_documents=True
166
  )
167
 
168
  try:
@@ -170,20 +180,21 @@ def ask_question(phone: str, question: str) -> Tuple[str, List]:
170
  answer = result.get("result", "").strip()
171
  docs = result.get("source_documents", [])
172
  except Exception as e:
173
- print(f"❌ QA error: {e}")
174
  answer, docs = "", []
175
 
176
- # Fallback logic
177
- if not answer or len(answer.split()) < 3:
178
  answer = _fallback_answer(company, intent if intent in ("money", "complain") else "default")
179
 
180
  _save_chat(phone, question, answer)
181
  return answer, docs
182
 
183
- # ------------------------------------------------------------------ SUPABASE LOGGING
184
  def _save_chat(phone: str, q: str, a: str) -> None:
 
185
  try:
186
  supabase.table("chat_memory").insert({"user_phone": phone, "role": "user", "message": q}).execute()
187
  supabase.table("chat_memory").insert({"user_phone": phone, "role": "assistant", "message": a}).execute()
188
  except Exception as e:
189
- print(f"⚠️ Supabase logging failed: {e}")
 
1
+ # rag.py — Dual-company RAG pipeline (LD Events + Lamaki Designs)
2
  from __future__ import annotations
3
+ import os, re, json, pickle, tempfile
4
  from typing import List, Tuple
5
  from functools import lru_cache
 
6
  from supabase import create_client
 
 
7
  from datasets import load_dataset
8
  from langchain.text_splitter import RecursiveCharacterTextSplitter
9
  from langchain_community.vectorstores import FAISS
 
10
  from langchain_huggingface import HuggingFaceEndpoint
11
+ from langchain_community.embeddings import HuggingFaceEmbeddings
12
  from langchain.chains import RetrievalQA
13
+ from langchain_core.prompts import PromptTemplate
14
 
15
# ---------------------------------------------------------------- CONFIG
DATASET_ID = "NimrodDev/LD_Events2"                       # HF dataset holding the knowledge base
LLM_MODEL = "mistralai/Mistral-7B-Instruct-v0.3"          # hosted inference model id
CACHE_DIR = os.getenv("HF_HOME", tempfile.gettempdir())   # HF cache root; falls back to the system temp dir
FAISS_PATH = os.path.join(CACHE_DIR, "faiss_index.pkl")   # pickled FAISS index cache location

# Accept either env var name for the Hugging Face token; empty string if neither is set.
HF_TOKEN = os.getenv("HF_TOKEN", os.getenv("HUGGINGFACEHUB_API_TOKEN", ""))
SUPABASE_URL = os.getenv("SUPABASE_URL")
SUPABASE_KEY = os.getenv("SUPABASE_KEY")
 
 
 
 
 
 
 
 
 
 
24
 
25
# Supabase client is optional: if credentials are missing or init fails,
# `supabase` stays None and _save_chat becomes a no-op.
supabase = None
if SUPABASE_URL and SUPABASE_KEY:
    try:
        supabase = create_client(SUPABASE_URL, SUPABASE_KEY)
    except Exception as e:
        print(f"⚠️ Supabase init failed: {e}")

# Point every Hugging Face cache env var at the same writable directory.
os.makedirs(CACHE_DIR, exist_ok=True)
os.environ.update({
    "HF_HOME": CACHE_DIR,
    "HF_HUB_CACHE": CACHE_DIR,
    "TRANSFORMERS_CACHE": CACHE_DIR
})
38
+
39
# ---------------------------------------------------------------- INTENT DETECTION
# Case-insensitive keyword matchers used by _detect_intent for fast-path
# canned replies that skip the RAG pipeline entirely.
GREETING_RE = re.compile(r"\b(hi|hello|hey|good morning|good afternoon|good evening)\b", re.I)
THANKS_RE = re.compile(r"\b(thank|thanks|appreciate)\b", re.I)
BYE_RE = re.compile(r"\b(bye|goodbye|see you|later)\b", re.I)
MONEY_RE = re.compile(r"\b(price|cost|budget|cheap|expensive|money|usd|ksh|payment|deposit|fee|quote)\b", re.I)
COMPLAIN_RE = re.compile(r"\b(complain|bad|terrible|awful|disappointed|angry|slow|rude|issue|problem)\b", re.I)
HUMAN_RE = re.compile(r"\b(agent|human|representative|manager|someone|person)\b", re.I)  # user asks for a person
46
+
47
# ---------------------------------------------------------------- COMPANY FALLBACKS
# Canned replies per company, keyed by intent. _fallback_answer falls back
# to "default" for any intent not listed here.
FALLBACKS = {
    "LD Events": {
        "greeting": "Hello! 👋 I’m *Amina*, your assistant for **LD Events** (weddings, graduations, corporate events) "
                    "and **Lamaki Designs** (construction & architecture). How may I help you today?",
        "money": "Our event packages vary depending on venue and number of guests. Could you share a few details so we can estimate a quote?",
        # Fixed: the original read "our support team expect a call" — a dash
        # was missing between the two clauses.
        "complain": "I’m sorry to hear that 😔. I’ll alert our support team — expect a call from a senior agent shortly.",
        "thanks": "You’re most welcome! 💐",
        "bye": "Thanks for chatting with LD Events. Have a beautiful day!",
        "handoff": "Sure! I’ll connect you to a human representative now. Please hold on a moment.",
        "default": "Let me get back to you on that. I’ve forwarded your question to a senior planner."
    },
    "Lamaki Designs": {
        "greeting": "Karibu! 🏗️ I’m *Amina*, assistant for **Lamaki Designs** (construction, architectural plans, project management) "
                    "and **LD Events** (weddings, graduations, corporate events). How may I assist?",
        "money": "Construction costs depend on project scope and materials. Kindly share your plot size or design type for an accurate estimate.",
        "complain": "We’re truly sorry for the inconvenience. Our site supervisor will reach out within 30 minutes to help.",
        "thanks": "Asante! We appreciate your time.",
        "bye": "Goodbye 👋 and thank you for trusting Lamaki Designs.",
        "handoff": "No problem. A Lamaki Designs representative will join the chat soon.",
        "default": "Let me get back to you on that — I’ll forward this to our design team."
    }
}
70
 
71
+ # ---------------------------------------------------------------- HELPERS
72
  def _company_from_text(text: str) -> str:
73
  t = text.lower()
74
+ if any(k in t for k in ("lamaki", "construction", "architect", "plan", "bungalow", "site", "building")):
 
 
75
  return "Lamaki Designs"
76
+ if any(k in t for k in ("ld events", "event", "wedding", "graduation", "venue", "party")):
77
+ return "LD Events"
78
  return "LD Events"
79
 
80
  def _detect_intent(text: str) -> str:
 
83
  if BYE_RE.search(text): return "bye"
84
  if MONEY_RE.search(text): return "money"
85
  if COMPLAIN_RE.search(text): return "complain"
86
+ if HUMAN_RE.search(text): return "handoff"
87
  return "normal"
88
 
89
def _fallback_answer(company: str, intent: str) -> str:
    """Return the canned reply for *intent*, or the company's default reply."""
    replies = FALLBACKS[company]
    return replies.get(intent, replies["default"])
91
 
92
# ---------------------------------------------------------------- DATA FETCH
@lru_cache(maxsize=1)
def get_texts() -> List[str]:
    """Load knowledge-base rows from the HF dataset, cached for the process.

    Returns the non-empty "text" fields as strings, or [] when the dataset
    cannot be loaded — get_vectorstore then builds a dummy index instead.
    """
    try:
        print("🔍 Loading dataset from Parquet...")
        # refs/convert/parquet is the Hub's auto-converted Parquet branch.
        ds = load_dataset(DATASET_ID, split="train", revision="refs/convert/parquet")
        texts = [str(row["text"]) for row in ds if row.get("text")]
        print(f"✅ Loaded {len(texts)} text chunks from {DATASET_ID}")
        return texts
    except Exception as e:
        # Best-effort: callers treat the empty list as "no context".
        print(f"⚠️ Dataset load failed: {e}")
        return []
104
 
105
# ---------------------------------------------------------------- VECTORSTORE
@lru_cache(maxsize=1)
def get_vectorstore() -> FAISS:
    """Return the FAISS index, loading from the pickle cache or rebuilding.

    Order of preference: cached pickle at FAISS_PATH → fresh index built
    from the dataset → one-document dummy index when no data is available.
    """
    if os.path.exists(FAISS_PATH):
        try:
            with open(FAISS_PATH, "rb") as f:
                print("📦 Using cached FAISS index.")
                # NOTE(review): pickle.load is only safe because this file is
                # written by this process below; never point FAISS_PATH at an
                # untrusted location. FAISS's save_local/load_local would be a
                # more robust cache format — TODO consider migrating.
                return pickle.load(f)
        except Exception as e:
            # Corrupt/incompatible cache: fall through and rebuild from scratch.
            print(f"⚠️ Failed to load FAISS cache: {e}, rebuilding...")

    texts = get_texts()
    if not texts:
        # No dataset: return a minimal index so retrieval still works,
        # yielding the placeholder "No context available." document.
        print("⚠️ No dataset found; building dummy FAISS index.")
        return FAISS.from_texts(["No context available."],
                                HuggingFaceEmbeddings(model_name="sentence-transformers/all-MiniLM-L6-v2"))

    # Chunk, embed, and index the dataset texts.
    splitter = RecursiveCharacterTextSplitter(chunk_size=700, chunk_overlap=100)
    docs = splitter.create_documents(texts)
    embeddings = HuggingFaceEmbeddings(model_name="sentence-transformers/all-MiniLM-L6-v2")
    vs = FAISS.from_documents(docs, embeddings)

    # Persist so later processes can skip the (slow) embedding step.
    with open(FAISS_PATH, "wb") as f:
        pickle.dump(vs, f)
    print("✅ FAISS index created and cached.")
    return vs
130
 
131
# ---------------------------------------------------------------- LLM
@lru_cache(maxsize=1)
def get_llm():
    """Build the hosted-inference LLM client (one instance per process).

    Raises:
        ValueError: if no Hugging Face API token is configured.
    """
    if not HF_TOKEN:
        raise ValueError("Hugging Face token missing! Please set HF_TOKEN or HUGGINGFACEHUB_API_TOKEN.")
    return HuggingFaceEndpoint(
        repo_id=LLM_MODEL,
        huggingfacehub_api_token=HF_TOKEN,
        temperature=0.3,    # mildly creative but still grounded answers
        max_new_tokens=300  # cap reply length for chat-sized messages
    )
142
 
143
  PROMPT = PromptTemplate.from_template("""
144
+ You are Amina, a friendly virtual assistant for {company}.
145
+ Use the context below to answer questions concisely and politely.
146
+ If unsure, say: "Let me get back to you on that."
147
 
148
  Context:
149
  {context}
 
154
  Answer:
155
  """)
156
 
157
+ # ---------------------------------------------------------------- MAIN CHAT LOGIC
158
  def ask_question(phone: str, question: str) -> Tuple[str, List]:
159
+ intent = _detect_intent(question)
160
  company = _company_from_text(question)
161
 
162
+ # Fast fallback for simple intents
163
+ if intent in ("greeting", "thanks", "bye", "handoff"):
164
  answer = _fallback_answer(company, intent)
165
  _save_chat(phone, question, answer)
166
  return answer, []
167
 
168
  vs = get_vectorstore()
169
  retriever = vs.as_retriever(search_kwargs={"k": 4})
170
+
171
  qa = RetrievalQA.from_chain_type(
172
  llm=get_llm(),
173
  retriever=retriever,
174
  chain_type_kwargs={"prompt": PROMPT},
175
+ return_source_documents=True,
176
  )
177
 
178
  try:
 
180
  answer = result.get("result", "").strip()
181
  docs = result.get("source_documents", [])
182
  except Exception as e:
183
+ print(f"❌ QA pipeline error: {e}")
184
  answer, docs = "", []
185
 
186
+ # Smart fallback (pricing, complaints, or missing)
187
+ if not answer or len(answer.split()) < 4:
188
  answer = _fallback_answer(company, intent if intent in ("money", "complain") else "default")
189
 
190
  _save_chat(phone, question, answer)
191
  return answer, docs
192
 
193
# ---------------------------------------------------------------- SUPABASE LOGGING
def _save_chat(phone: str, q: str, a: str) -> None:
    """Persist the question/answer pair to chat_memory; no-op without a client."""
    if not supabase:
        return
    try:
        # Insert the user turn first, then the assistant turn.
        for role, message in (("user", q), ("assistant", a)):
            row = {"user_phone": phone, "role": role, "message": message}
            supabase.table("chat_memory").insert(row).execute()
    except Exception as e:
        # Logging is best-effort; never let it break the reply path.
        print(f"⚠️ Chat log failed: {e}")