Spaces:

NOVA-chatbot
/

chatbot-backend

Sleeping

App Files Files Community

Jaita committed on Dec 8, 2025

Commit

7bea0f0

verified ·

1 Parent(s): 0ef51b1

Create main.py

Browse files

Files changed (1) hide show

main.py +123 -0

main.py ADDED Viewed

	@@ -0,0 +1,123 @@

+import os
+import requests
+from fastapi import FastAPI, HTTPException
+from fastapi.middleware.cors import CORSMiddleware
+from pydantic import BaseModel
+from services.kb_creation import collection, ingest_documents, search_knowledge_base
+from contextlib import asynccontextmanager
+import google.generativeai as genai
+# NOTE(review): this assignment runs after the imports above have already executed,
+# so any library that reads POSTHOG_DISABLED at import time will not see it — confirm
+# whether it needs to move above the imports.
+os.environ["POSTHOG_DISABLED"] = "true"  # Disable PostHog telemetry
+# --- 0. Config ---
+# Fail fast at import time: the service cannot answer chats without an API key.
+GEMINI_API_KEY = os.getenv("GEMINI_API_KEY")
+if not GEMINI_API_KEY:
+    raise RuntimeError("GEMINI_API_KEY is not set in environment.")
+# Configure the SDK
+genai.configure(api_key=GEMINI_API_KEY)
+# Choose the model
+MODEL_NAME = "gemini-2.5-flash-lite"
+# NOTE(review): `model` is not referenced by the code visible in this file; the /chat
+# handler calls the REST endpoint through `requests` instead — confirm whether the
+# SDK client is still needed.
+model = genai.GenerativeModel(MODEL_NAME)
+# --- Initialize FastAPI ---
+#app = FastAPI()
+@asynccontextmanager
+async def lifespan(app: FastAPI):
+    """Populate the knowledge base at startup when it is empty.
+    Runs once before the application starts serving. Documents are ingested
+    from the ``documents`` folder under the current working directory only if
+    the collection reports zero entries. Ingestion is best-effort: any failure
+    is printed and the application still starts.
+    """
+    try:
+        folder_path = os.path.join(os.getcwd(), "documents")
+        # Query the collection once and reuse the value for both the check and the log line.
+        entry_count = collection.count()
+        if entry_count == 0:
+            print("🔍 KB empty. Running ingestion...")
+            ingest_documents(folder_path)
+        else:
+            print(f"✅ KB already populated with {entry_count} entries. Skipping ingestion.")
+    except Exception as e:
+        # Deliberately broad: a broken knowledge base must not prevent startup.
+        print(f"⚠️ KB ingestion failed: {e}")
+    yield
+app = FastAPI(lifespan=lifespan)
+# --- Configure CORS ---
+# Browser origins allowed to call this API. Each entry must be a bare origin
+# (scheme + host[:port]); a URL with a path such as ".../chat" never matches the
+# Origin header. Keep the trailing comma on every entry so that adding another
+# string cannot silently concatenate with the previous one.
+origins = [
+    "https://jaita-chatbot-react-frontend-v1.hf.space",
+]
+app.add_middleware(
+    CORSMiddleware,
+    allow_origins=origins,
+    allow_credentials=True,
+    allow_methods=["*"],
+    allow_headers=["*"],
+)
+# --- Define the Request Data Structure ---
+# JSON body accepted by POST /chat.
+class ChatInput(BaseModel):
+    # The user's message; used as the knowledge-base search query and inserted
+    # into the prompt sent to Gemini.
+    user_message: str
+# --- Gemini API Setup ---
+# REST endpoint for generateContent. GEMINI_API_KEY and MODEL_NAME are defined
+# (and the key validated) in the config section near the top of this module, so
+# they are reused here instead of being re-read or hard-coded a second time.
+# NOTE: the API key is part of the query string — never log or echo this URL.
+GEMINI_URL = (
+    "https://generativelanguage.googleapis.com/v1beta/models/"
+    f"{MODEL_NAME}:generateContent?key={GEMINI_API_KEY}"
+)
+# --- Endpoints ---
+@app.get("/")
+async def health_check():
+    # Liveness probe: always answers with a fixed payload and touches no dependencies.
+    status_payload = {"status": "ok"}
+    return status_payload
+# Upper bound (seconds) for one Gemini HTTP call so a stalled upstream cannot hang a request forever.
+_GEMINI_TIMEOUT_SECONDS = 30
+class _GeminiError(Exception):
+    """Raised when the Gemini API call fails; its message is safe to show to clients."""
+def _build_prompt(user_message, context):
+    """Return the prompt text, grounded in knowledge-base context when any was found."""
+    if not context:
+        return f"User Question: {user_message}\n\nAnswer:"
+    return f"""Use the following knowledge base context to answer the user's question accurately.
+If the context contains relevant information, base your answer on it.
+If the context doesn't help, say you're raising a ticket and provide a ticket number.
+Knowledge Base Context:
+{context}
+User Question: {user_message}
+Answer:"""
+def _call_gemini(prompt):
+    """Send the prompt to Gemini (blocking) and return the first candidate's text.
+    Raises:
+        _GeminiError: on network failure, a non-2xx status, an undecodable body,
+            or a response that carries no text candidate.
+    """
+    # Drop any "?key=..." query and authenticate through a header instead, so the
+    # key never appears in the URL that `requests` embeds in exception messages.
+    endpoint = GEMINI_URL.split("?", 1)[0]
+    headers = {
+        "Content-Type": "application/json",
+        "x-goog-api-key": GEMINI_API_KEY,
+    }
+    payload = {"contents": [{"parts": [{"text": prompt}]}]}
+    try:
+        # TLS verification is left at its default (enabled); verify=False would
+        # allow the prompt and API key to be intercepted.
+        response = requests.post(
+            endpoint,
+            headers=headers,
+            json=payload,
+            timeout=_GEMINI_TIMEOUT_SECONDS,
+        )
+        response.raise_for_status()
+        result = response.json()
+    except requests.HTTPError as exc:
+        raise _GeminiError(f"Gemini API returned HTTP {exc.response.status_code}") from exc
+    except (requests.RequestException, ValueError) as exc:
+        raise _GeminiError("Gemini API request failed") from exc
+    try:
+        return result["candidates"][0]["content"]["parts"][0]["text"]
+    except (KeyError, IndexError, TypeError) as exc:
+        # Seen when the body has no candidates or the candidate has no text part.
+        raise _GeminiError("Gemini API response contained no text") from exc
+@app.post("/chat")
+async def chat_with_ai(input_data: ChatInput):
+    """Handle chat interactions using Google Generative AI via requests."""
+    # Flow: search the knowledge base, build a prompt from the top 2 documents,
+    # call Gemini, and return {"bot_response": str, "debug": str}.
+    # Raises HTTPException 502 when the Gemini call fails and 500 for any other error.
+    # Local import keeps this block self-contained; fastapi is already a dependency.
+    from fastapi.concurrency import run_in_threadpool
+    try:
+        # Retrieve relevant documents from knowledge base
+        kb_results = search_knowledge_base(input_data.user_message, top_k=10)
+        # Extract relevant context from search results
+        context = ""
+        relevant_docs = []
+        if kb_results and kb_results.get("documents"):
+            # Limit context to avoid token limits - take top 2 most relevant
+            relevant_docs = kb_results["documents"][0][:2]
+            context = "\n\n".join(relevant_docs)
+        enhanced_prompt = _build_prompt(input_data.user_message, context)
+        # requests is blocking; run it in a worker thread so the event loop keeps
+        # serving other requests (including the health check) during the call.
+        bot_response = await run_in_threadpool(_call_gemini, enhanced_prompt)
+        # Include debug info in response
+        debug_info = f"Context found: {'Yes' if context else 'No'}"
+        if context:
+            debug_info += f" (Top {len(relevant_docs)} documents used)"
+        return {"bot_response": bot_response, "debug": debug_info}
+    except _GeminiError as e:
+        print(f"⚠️ Gemini request failed: {e}")
+        raise HTTPException(status_code=502, detail=str(e)) from e
+    except Exception as e:
+        raise HTTPException(status_code=500, detail=str(e)) from e