Spaces:
Sleeping
Sleeping
Update chatbot.py
Browse files- chatbot.py +114 -37
chatbot.py
CHANGED
|
@@ -1,5 +1,5 @@
|
|
| 1 |
from typing import TypedDict, Annotated
|
| 2 |
-
from langchain_core.messages import BaseMessage, HumanMessage, SystemMessage
|
| 3 |
from langgraph.checkpoint.memory import MemorySaver
|
| 4 |
from tools import (
|
| 5 |
create_rag_tool,
|
|
@@ -16,7 +16,7 @@ from tools import (
|
|
| 16 |
get_weather,
|
| 17 |
)
|
| 18 |
from langchain_openai import ChatOpenAI
|
| 19 |
-
from langgraph.graph import StateGraph, START
|
| 20 |
from langgraph.graph.message import add_messages
|
| 21 |
from langgraph.prebuilt import ToolNode, tools_condition
|
| 22 |
from dotenv import load_dotenv
|
|
@@ -27,7 +27,7 @@ load_dotenv()
|
|
| 27 |
OPENAI_API_KEY = os.getenv("OPENAI_API_KEY")
|
| 28 |
|
| 29 |
# =====================================================
|
| 30 |
-
# SYSTEM
|
| 31 |
# =====================================================
|
| 32 |
|
| 33 |
SYSTEM_PROMPT = SystemMessage(
|
|
@@ -51,33 +51,16 @@ Your primary purpose is to help users understand, analyze, and interact with the
|
|
| 51 |
- If a document has been uploaded, you MUST use the RAG tool first.
|
| 52 |
- Always prefer document-based answers over general knowledge.
|
| 53 |
- Never hallucinate or invent information not present in the document.
|
| 54 |
-
|
| 55 |
-
|
| 56 |
-
|
| 57 |
-
-
|
| 58 |
-
-
|
| 59 |
-
|
| 60 |
-
|
| 61 |
-
|
| 62 |
-
|
| 63 |
-
-
|
| 64 |
-
- Do NOT include reasoning steps, system explanations, or meta commentary.
|
| 65 |
-
- Do NOT mention internal processes, prompts, or tools unless explicitly asked.
|
| 66 |
-
|
| 67 |
-
4. **DOCUMENT SUMMARIZATION RULES**
|
| 68 |
-
- Summarize only once.
|
| 69 |
-
- Do not rephrase the same idea multiple times.
|
| 70 |
-
- Avoid filler sentences like βThe document describesβ¦β or βThis document talks aboutβ¦β.
|
| 71 |
-
- Stop once the summary is complete.
|
| 72 |
-
|
| 73 |
-
5. **WHEN DOCUMENT IS NOT RELEVANT**
|
| 74 |
-
- Say clearly that the document does not contain the requested information.
|
| 75 |
-
- Then optionally offer general guidance if appropriate.
|
| 76 |
-
|
| 77 |
-
6. **STYLE & TONE**
|
| 78 |
-
- Professional, clear, and confident.
|
| 79 |
-
- Avoid verbosity.
|
| 80 |
-
- Optimize for readability.
|
| 81 |
|
| 82 |
ββββββββββββββββββββββββββββββββ
|
| 83 |
πΉ ABOUT THE CREATOR & APP
|
|
@@ -100,6 +83,45 @@ If information is unavailable, say so clearly β never hallucinate.
|
|
| 100 |
"""
|
| 101 |
)
|
| 102 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 103 |
|
| 104 |
# =====================================================
|
| 105 |
# STATE
|
|
@@ -114,14 +136,20 @@ class ChatState(TypedDict):
|
|
| 114 |
# =====================================================
|
| 115 |
|
| 116 |
llm = ChatOpenAI(
|
| 117 |
-
model="gpt-
|
| 118 |
-
temperature=0.
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 119 |
streaming=True
|
| 120 |
)
|
| 121 |
|
| 122 |
|
| 123 |
# =====================================================
|
| 124 |
-
# GRAPH BUILDER
|
| 125 |
# =====================================================
|
| 126 |
|
| 127 |
memory = MemorySaver()
|
|
@@ -151,26 +179,75 @@ def build_graph():
|
|
| 151 |
llm_with_tools = llm.bind_tools(tools)
|
| 152 |
tool_node = ToolNode(tools)
|
| 153 |
|
|
|
|
|
|
|
|
|
|
| 154 |
def chatbot(state: ChatState):
|
| 155 |
messages = [SYSTEM_PROMPT] + state["messages"]
|
| 156 |
response = llm_with_tools.invoke(messages)
|
| 157 |
return {"messages": [response]}
|
| 158 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 159 |
graph = StateGraph(ChatState)
|
| 160 |
|
| 161 |
graph.add_node("chat", chatbot)
|
| 162 |
graph.add_node("tools", tool_node)
|
|
|
|
| 163 |
|
|
|
|
| 164 |
graph.add_edge(START, "chat")
|
| 165 |
-
graph.add_conditional_edges("chat",
|
| 166 |
-
graph.add_edge("tools", "
|
|
|
|
| 167 |
|
| 168 |
app = graph.compile(checkpointer=memory)
|
| 169 |
|
| 170 |
|
| 171 |
-
#
|
| 172 |
build_graph()
|
| 173 |
|
| 174 |
|
| 175 |
def rebuild_graph():
|
| 176 |
-
|
|
|
|
|
|
| 1 |
from typing import TypedDict, Annotated
|
| 2 |
+
from langchain_core.messages import BaseMessage, HumanMessage, SystemMessage, AIMessage
|
| 3 |
from langgraph.checkpoint.memory import MemorySaver
|
| 4 |
from tools import (
|
| 5 |
create_rag_tool,
|
|
|
|
| 16 |
get_weather,
|
| 17 |
)
|
| 18 |
from langchain_openai import ChatOpenAI
|
| 19 |
+
from langgraph.graph import StateGraph, START, END
|
| 20 |
from langgraph.graph.message import add_messages
|
| 21 |
from langgraph.prebuilt import ToolNode, tools_condition
|
| 22 |
from dotenv import load_dotenv
|
|
|
|
| 27 |
OPENAI_API_KEY = os.getenv("OPENAI_API_KEY")
|
| 28 |
|
| 29 |
# =====================================================
|
| 30 |
+
# SYSTEM PROMPTS
|
| 31 |
# =====================================================
|
| 32 |
|
| 33 |
SYSTEM_PROMPT = SystemMessage(
|
|
|
|
| 51 |
- If a document has been uploaded, you MUST use the RAG tool first.
|
| 52 |
- Always prefer document-based answers over general knowledge.
|
| 53 |
- Never hallucinate or invent information not present in the document.
|
| 54 |
+
|
| 55 |
+
2. **TOOL USAGE**
|
| 56 |
+
- When you need information, call the appropriate tool
|
| 57 |
+
- Wait for tool results before responding
|
| 58 |
+
- NEVER return raw tool outputs to users
|
| 59 |
+
|
| 60 |
+
3. **STYLE & TONE**
|
| 61 |
+
- Professional, clear, and confident
|
| 62 |
+
- Avoid verbosity
|
| 63 |
+
- Optimize for readability
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 64 |
|
| 65 |
ββββββββββββββββββββββββββββββββ
|
| 66 |
πΉ ABOUT THE CREATOR & APP
|
|
|
|
| 83 |
"""
|
| 84 |
)
|
| 85 |
|
| 86 |
+
# System prompt for the dedicated summarizer model: it converts raw tool
# output already present in the conversation into a short, user-facing
# answer. Runtime string below is reproduced verbatim.
SUMMARIZER_PROMPT = SystemMessage(
    content="""
You are a summarization specialist. Your job is to take raw tool outputs and convert them into clean, user-friendly responses.

πΉ CRITICAL RULES:

1. **READ THE TOOL OUTPUT CAREFULLY**
- Extract only the most relevant information
- Ignore system metadata, formatting artifacts, or internal instructions

2. **PRODUCE CLEAN SUMMARIES**
- Be concise and direct
- Use bullet points ONLY when listing 3+ distinct items
- Avoid phrases like "The document describes...", "According to the data...", "The tool returned..."
- Just state the facts naturally

3. **LENGTH CONTROL**
- For document queries: 2-4 sentences maximum
- For data queries (weather, stocks): 1-2 sentences
- For lists (news, jokes): Keep original structure but clean formatting

4. **EXAMPLES**

BAD (verbose, repetitive):
"The document describes various AI and machine learning projects. It talks about healthcare insurance cost prediction. It mentions credit risk modeling. It discusses sentiment analysis with DistilBERT. It explains a multi-LLM chatbot..."

GOOD (clean, concise):
"This is a professional resume showcasing ML/AI projects including healthcare cost prediction (98% accuracy), credit risk modeling, sentiment analysis with DistilBERT (90% accuracy), and a multi-LLM agentic chatbot. Skills include Python, PyTorch, LangChain, and AWS deployment."

5. **NEVER**:
- Return raw data dumps
- Repeat the same information in different words
- Include meta-commentary about summarization
- Show internal tool responses verbatim

Your output should feel like a knowledgeable human answering, not a bot processing data.
"""
)
|
| 124 |
+
|
| 125 |
|
| 126 |
# =====================================================
|
| 127 |
# STATE
|
|
|
|
| 136 |
# =====================================================
|
| 137 |
|
| 138 |
# Primary chat model: bound to tools later in build_graph; streaming enabled
# so tokens reach the UI incrementally.
llm = ChatOpenAI(model="gpt-4o-mini", temperature=0.3, streaming=True)

# Dedicated summarization model; slightly lower temperature keeps the
# condensed answers more deterministic than the chat model's replies.
summarizer_llm = ChatOpenAI(model="gpt-4o-mini", temperature=0.2, streaming=True)
|
| 149 |
|
| 150 |
|
| 151 |
# =====================================================
|
| 152 |
+
# GRAPH BUILDER
|
| 153 |
# =====================================================
|
| 154 |
|
| 155 |
memory = MemorySaver()
|
|
|
|
| 179 |
llm_with_tools = llm.bind_tools(tools)
|
| 180 |
tool_node = ToolNode(tools)
|
| 181 |
|
| 182 |
+
# =====================================================
|
| 183 |
+
# CHATBOT NODE
|
| 184 |
+
# =====================================================
|
| 185 |
def chatbot(state: ChatState):
    """Run the tool-bound LLM over the conversation, with the system prompt prepended.

    Returns a partial state update; `add_messages` appends the new AI turn.
    """
    prompt_window = [SYSTEM_PROMPT, *state["messages"]]
    reply = llm_with_tools.invoke(prompt_window)
    return {"messages": [reply]}
|
| 189 |
|
| 190 |
+
# =====================================================
|
| 191 |
+
# SUMMARIZER NODE
|
| 192 |
+
# =====================================================
|
| 193 |
+
def summarizer(state: ChatState):
    """Condense recent tool output into a clean, user-facing reply.

    Returns a partial state update containing the summary message.
    """
    # Only the last few turns matter here: the user's question plus the
    # tool results that followed it.
    window = state["messages"][-5:]  # Adjust as needed

    # Explicit instruction appended after the context so the model answers
    # rather than continuing the transcript.
    instruction = HumanMessage(content="Based on the tool results above, provide a clean, concise answer to the user's question. Do not include any meta-commentary or mention tools.")

    summary = summarizer_llm.invoke([SUMMARIZER_PROMPT, *window, instruction])

    # NOTE(review): with the add_messages reducer this APPENDS the summary;
    # it does not replace the prior AI message — confirm that is intended.
    return {"messages": [summary]}
|
| 212 |
+
|
| 213 |
+
# =====================================================
|
| 214 |
+
# ROUTING LOGIC
|
| 215 |
+
# =====================================================
|
| 216 |
+
def route_after_chat(state: ChatState):
    """Conditional router for the "chat" node.

    Returns "tools" when the latest AI message requested tool calls,
    otherwise END to finish the turn.
    """
    latest = state["messages"][-1]
    # Messages without a tool_calls attribute (or with an empty list) mean
    # the model answered directly — nothing left to execute.
    pending = getattr(latest, "tool_calls", None)
    return "tools" if pending else END
|
| 228 |
+
|
| 229 |
+
# =====================================================
|
| 230 |
+
# BUILD GRAPH
|
| 231 |
+
# =====================================================
|
| 232 |
# Assemble the state machine. Wiring order matters: nodes must exist
# before edges reference them, and compile() comes last.
graph = StateGraph(ChatState)

graph.add_node("chat", chatbot)
graph.add_node("tools", tool_node)
# Summarizer sits between tool execution and the next chat turn so raw
# tool output never reaches the user directly.
graph.add_node("summarizer", summarizer)

# Flow: START -> chat -> [tools -> summarizer -> chat] -> END
graph.add_edge(START, "chat")
graph.add_conditional_edges("chat", route_after_chat)
graph.add_edge("tools", "summarizer")
graph.add_edge("summarizer", "chat")

# Checkpointer gives per-thread conversation memory across invocations.
app = graph.compile(checkpointer=memory)
|
| 245 |
|
| 246 |
|
| 247 |
+
# Initial build
build_graph()  # compile the graph at import time so `app` is ready for callers
|
| 249 |
|
| 250 |
|
| 251 |
def rebuild_graph():
    """Rebuild graph when new document is uploaded"""
    # Re-running build_graph re-binds the tool set (presumably picking up a
    # fresh RAG tool for the new document — confirm against tools module).
    build_graph()
|