New_Final_Assignment

Sleeping

App Files Files Community

naman1102 committed on Jun 11, 2025

Commit

14fa0cc

1 Parent(s): 9af3089

React_graph

Browse files

Files changed (4) hide show

agent.py +16 -117
app.py +7 -3
tools.py +26 -48
toolsold.py +349 -0

agent.py CHANGED Viewed

@@ -6,19 +6,19 @@ from langchain.schema import HumanMessage, SystemMessage, AIMessage
 from state import AgentState
 from typing import Any, Dict, List, Optional
 import json
 # ─────────────────────────── External tools ──────────────────────────────
 from tools import (
     wikipedia_search_tool,
-    ocr_image_tool,
     audio_transcriber_tool,
-    parse_excel_tool,
     analyze_code_tool
 )
 # ─────────────────────────── Configuration ───────────────────────────────
-LLM = ChatOpenAI(model_name="gpt-4.1-mini", temperature=0.3)
 MAX_TOOL_CALLS = 5
 # ─────────────────────────── Helper utilities ────────────────────────────
@@ -29,122 +29,21 @@ MAX_TOOL_CALLS = 5
 # ------------- tool adapters -------------
-def wiki_tool(state: AgentState) -> AgentState:
-    out = wikipedia_search_tool({"wiki_query": state.query or ""})
-    state.tool_calls += 1
-    state.add(SystemMessage(content=f"WIKI_TOOL_OUT: {out}"))
-    state.next_action = None
-    return state
-def ocr_tool(state: AgentState) -> AgentState:
-    out = ocr_image_tool({"task_id": state.task_id, "ocr_path": ""})
-    state.tool_calls += 1
-    state.add(SystemMessage(content=f"OCR_TOOL_OUT: {out}"))
-    state.next_action = None
-    return state
-def audio_tool(state: AgentState) -> AgentState:
-    out = audio_transcriber_tool({"task_id": state.task_id, "audio_path": ""})
-    state.tool_calls += 1
-    state.add(SystemMessage(content=f"AUDIO_TOOL_OUT: {out}"))
-    state.next_action = None
-    return state
-def excel_tool(state: AgentState) -> AgentState:
-    result = parse_excel_tool({
-        "task_id": state.task_id,
-        "excel_sheet_name": ""
-    })
-    out = {"excel_result": result}
-    state.tool_calls += 1
-    state.add(SystemMessage(content=f"EXCEL_TOOL_OUT: {out}"))
-    state.next_action = None
-    return state
-def code_tool(state: AgentState) -> AgentState:
-    if state.snippet:
-        out = {"analysis": analyze_code_tool({
-            "task_id": state.task_id,
-            "snippet": state.snippet,
-        })}
-    else:
-        out = {"analysis": analyze_code_tool({
-            "task_id": state.task_id,
-            "snippet": ""
-        })}
-    state.tool_calls += 1
-    state.add(SystemMessage(content=f"CODE_TOOL_OUT: {out}"))
-    state.next_action = None
-    return state
-# ------------- final answer -------------
-def final_node(state: AgentState) -> AgentState:
-    print("reached final node")
-    wrap = SystemMessage(
-        content="Using everything so far, reply ONLY with {'final_answer':'…'}. YOUR FINAL ANSWER should be a number OR as few words as possible OR a comma separated list of numbers and/or strings. If you are asked for a number, don't use comma to write your number neither use units such as $ or percent sign unless specified otherwise. If you are asked for a string, don't use articles, neither abbreviations (e.g. for cities), and write the digits in plain text unless specified otherwise. If you are asked for a comma separated list, apply the above rules depending of whether the element to be put in the list is a number or a string. \n"
-        "reply **only** with "
-        "{\"final_answer\":\"…\"} (no markdown, no commentary)."
-    )
-    raw = LLM.invoke(state.messages + [wrap]).content.strip()
-    # print("raw : ", raw)
-    state.add(AIMessage(content=raw))
-    parsed = safe_json(raw)
-    # print("parsed : ", parsed, "type : ", type(parsed))
-    state.final_answer = parsed.get("final_answer") if parsed else "Unable to parse final answer."
-    # print("state.final_answer : ", state.final_answer)
-    return state
 # ─────────────────────────── Graph wiring ───────────────────────────────
 def build_graph():
     graph = StateGraph(AgentState)
-    # Register nodes
-    for name, fn in [
-        ("tool_selector", tool_selector),
-        ("wiki_tool", wiki_tool),
-        ("ocr_tool", ocr_tool),
-        ("audio_tool", audio_tool),
-        ("excel_tool", excel_tool),
-        ("code_tool", code_tool),
-        ("final_node", final_node),
-    ]:
-        graph.add_node(name, fn)
-    # Edges
-    graph.add_edge(START, "tool_selector")
-    def dispatch(state: AgentState) -> str:
-        return {
-            "wiki": "wiki_tool",
-            "ocr": "ocr_tool",
-            "audio": "audio_tool",
-            "excel": "excel_tool",
-            "code": "code_tool",
-            "final": "final_node",
-        }.get(state.next_action, "final_node")
-    graph.add_conditional_edges(
-        "tool_selector",
-        dispatch,
-        {
-            "wiki_tool": "wiki_tool",
-            "ocr_tool": "ocr_tool",
-            "audio_tool": "audio_tool",
-            "excel_tool": "excel_tool",
-            "code_tool": "code_tool",
-            "final_node": "final_node",
-        },
-    )
-    # tools loop back to selector
-    for tool_name in ("wiki_tool", "ocr_tool", "audio_tool", "excel_tool", "code_tool"):
-        graph.add_edge(tool_name, "tool_selector")
-    # final_answer → END
-    graph.add_edge("final_node", END)
-    return graph

 from state import AgentState
 from typing import Any, Dict, List, Optional
 import json
+from langgraph.prebuilt import create_react_agent
 # ─────────────────────────── External tools ──────────────────────────────
 from tools import (
     wikipedia_search_tool,
+    arxiv_search_tool,
     audio_transcriber_tool,
+    excel_tool,
     analyze_code_tool
 )
 # ─────────────────────────── Configuration ───────────────────────────────
+# Chat model that build_graph() wires into the ReAct agent.
+llm = ChatOpenAI(model_name="gpt-4.1-mini", temperature=0.3)
+# NOTE(review): not referenced by the build_graph() shown below; confirm it is still needed.
 MAX_TOOL_CALLS = 5
 # ─────────────────────────── Helper utilities ────────────────────────────
 # ------------- tool adapters -------------
 # ─────────────────────────── Graph wiring ───────────────────────────────
 def build_graph():
+    """Build the ReAct agent that answers questions with the external tools.
+
+    Returns:
+        The agent produced by ``create_react_agent`` from the module-level
+        ``llm`` and the tool list below.
+    """
+    llm_tools = [
+        wikipedia_search_tool,
+        arxiv_search_tool,
+        audio_transcriber_tool,
+        excel_tool,
+        analyze_code_tool,
+    ]
+    # Do not rebind ``llm`` here: assigning to it would make the name local to
+    # this function, so reading the module-level model on the right-hand side
+    # raises UnboundLocalError. create_react_agent is given the tools directly,
+    # so no separate bind_tools() call is made.
+    return create_react_agent(llm, llm_tools)

app.py CHANGED Viewed

@@ -12,12 +12,16 @@ from state import AgentState
 # --- Constants ---
 DEFAULT_API_URL = "https://agents-course-unit4-scoring.hf.space"
 class BasicAgent:
     def __init__(self):
         print("BasicAgent initialized.")
         graph = build_graph()
-        self.compiled_graph = graph.compile()
     def __call__(self, question: str, task_id: Optional[str] = None) -> str:
         """Run the agent and return whatever FINAL_ANSWER the graph produces."""
@@ -25,12 +29,12 @@ class BasicAgent:
         # The user_question argument for AgentState is the question.
         init_state = AgentState(user_question=question, task_id=task_id)
-        init_state.add(SystemMessage(content="You are a helpful assistant."))
         init_state.add(HumanMessage(content=question))
         # IMPORTANT: invoke() returns a **new** state instance (or an AddableValuesDict),
         # not the object we pass in.  Use the returned value to fetch final_answer.
-        out_state = self.compiled_graph.invoke(init_state)
         if isinstance(out_state, dict):        # AddableValuesDict behaves like a dict
             return out_state.get("final_answer", "No answer.")

 # --- Constants ---
 DEFAULT_API_URL = "https://agents-course-unit4-scoring.hf.space"
+# System prompt that BasicAgent.__call__ adds before the user's question; it
+# fixes the "FINAL ANSWER: ..." reply template and the answer formatting rules.
+SYSTEM_PROMPT = """
+You are a general AI assistant. I will ask you a question. Report your thoughts, and finish your answer with the following template: FINAL ANSWER: [YOUR FINAL ANSWER]. YOUR FINAL ANSWER should be a number OR as few words as possible OR a comma separated list of numbers and/or strings. If you are asked for a number, don't use comma to write your number neither use units such as $ or percent sign unless specified otherwise. If you are asked for a string, don't use articles, neither abbreviations (e.g. for cities), and write the digits in plain text unless specified otherwise. If you are asked for a comma separated list, apply the above rules depending of whether the element to be put in the list is a number or a string.
+"""
 class BasicAgent:
     def __init__(self):
+        """Build the agent graph once and keep it on the instance."""
         print("BasicAgent initialized.")
+        # __call__ invokes self.graph, so the built graph has to be stored on
+        # the instance rather than in a local variable.
+        self.graph = build_graph()
     def __call__(self, question: str, task_id: Optional[str] = None) -> str:
         """Run the agent and return whatever FINAL_ANSWER the graph produces."""
         # The user_question argument for AgentState is the question.
         init_state = AgentState(user_question=question, task_id=task_id)
+        init_state.add(SystemMessage(content=SYSTEM_PROMPT))
         init_state.add(HumanMessage(content=question))
         # IMPORTANT: invoke() returns a **new** state instance (or an AddableValuesDict),
         # not the object we pass in.  Use the returned value to fetch final_answer.
+        out_state = self.graph.invoke(init_state)
         if isinstance(out_state, dict):        # AddableValuesDict behaves like a dict
             return out_state.get("final_answer", "No answer.")

tools.py CHANGED Viewed

@@ -9,6 +9,8 @@ import time
 import os
 from duckduckgo_search import DDGS
 from langchain_core.tools import tool
 DEFAULT_API_URL = "https://agents-course-unit4-scoring.hf.space"
@@ -199,7 +201,7 @@ import requests
 @tool
 def wikipedia_search_tool(wiki_query: str) -> str:
     """
-    LangGraph wrapper for searching Wikipedia.
     Expects: wiki_query is a non‐empty string.
     Returns: text summary of first matching page or an error message>"
@@ -207,53 +209,29 @@ def wikipedia_search_tool(wiki_query: str) -> str:
     """
     print("reached wikipedia search tool")
     query = wiki_query
-    if not query:
-        return {}
-    try:
-        # 1) Use the MediaWiki API to search for page titles matching the query
-        search_params = {
-            "action": "query",
-            "list": "search",
-            "srsearch": query,
-            "format": "json",
-            "utf8": 1
-        }
-        search_resp = requests.get("https://en.wikipedia.org/w/api.php", params=search_params, timeout=10)
-        search_resp.raise_for_status()
-        search_data = search_resp.json()
-        search_results = search_data.get("query", {}).get("search", [])
-        # print("wikipedia: search_results",search_results)
-        if not search_results:
-            print(f"No Wikipedia page found for '{query}'.")
-            return f"No Wikipedia page found for '{query}'."
-        # 2) Take the first search result's title
-        first_title = search_results[0].get("title", "")
-        if not first_title:
-            print("Unexpected format from Wikipedia search.")
-            return "Unexpected format from Wikipedia search."
-        # 3) Fetch the page summary for that title via the REST summary endpoint
-        title_for_url = requests.utils.requote_uri(first_title)
-        summary_url = f"https://en.wikipedia.org/api/rest_v1/page/summary/{title_for_url}"
-        summary_resp = requests.get(summary_url, timeout=10)
-        summary_resp.raise_for_status()
-        summary_data = summary_resp.json()
-        # 4) Extract either the "extract" field or a fallback message
-        summary_text = summary_data.get("extract")
-        if not summary_text:
-            summary_text = summary_data.get("description", "No summary available.")
-        print(f"Title: {first_title}\n\n{summary_text}")
-        return f"Title: {first_title}\n\n{summary_text}"
-    except requests.exceptions.RequestException as e:
-        return f"Wikipedia search error: {e}"
-    except Exception as e:
-        return f"Unexpected error in wikipedia_search_tool: {e}"
 from langchain_openai import ChatOpenAI

 import os
 from duckduckgo_search import DDGS
 from langchain_core.tools import tool
+from langchain_community.document_loaders import WikipediaLoader, ArxivLoader
 DEFAULT_API_URL = "https://agents-course-unit4-scoring.hf.space"
 @tool
 def wikipedia_search_tool(wiki_query: str) -> str:
     """
+    Searches Wikipedia for the given query and returns up to 5 matching pages.
+    Expects: wiki_query is a non-empty string.
+    Returns: the pages concatenated as "DocumentN: <title>" blocks, each
+    followed by the page text, or an error message.
     """
     print("reached wikipedia search tool")
     query = wiki_query
+    if not query:
+        return "Error: wiki_query must be a non-empty string."
+    try:
+        docs = WikipediaLoader(query=query, load_max_docs=5).load()
+    except Exception as e:
+        # Tool boundary: report failures to the agent as text, as documented,
+        # instead of letting the loader's exception escape.
+        return f"Wikipedia search error: {e}"
+    if not docs:
+        return f"No Wikipedia page found for '{query}'."
+    # Number the documents from 1 and join once instead of growing a string.
+    return "".join(
+        f"\n\nDocument{counter}: {doc.metadata.get('title', 'Untitled')}\n. {doc.page_content}"
+        for counter, doc in enumerate(docs, start=1)
+    )
+@tool
+def arxiv_search_tool(arxiv_query: str) -> str:
+    """
+    Searches Arxiv for the given query and returns up to 5 matching papers.
+    Expects: arxiv_query is a non-empty string.
+    Returns: the papers concatenated as "DocumentN: <title>" blocks, each
+    followed by the paper text, or an error message.
+    """
+    print("reached arxiv_search_tool")
+    if not arxiv_query:
+        return "Error: arxiv_query must be a non-empty string."
+    try:
+        docs = ArxivLoader(query=arxiv_query, load_max_docs=5).load()
+    except Exception as e:
+        # Tool boundary: report failures to the agent as text, as documented,
+        # instead of letting the loader's exception escape.
+        return f"Arxiv search error: {e}"
+    if not docs:
+        return f"No Arxiv paper found for '{arxiv_query}'."
+    parts = []
+    for counter, doc in enumerate(docs, start=1):
+        # ArxivLoader documents the title under the capitalised "Title" key;
+        # fall back to "title" so a lowercase key keeps working too.
+        title = doc.metadata.get("Title") or doc.metadata.get("title") or "Untitled"
+        parts.append(f"\n\nDocument{counter}: {title}\n. {doc.page_content}")
+    return "".join(parts)
 from langchain_openai import ChatOpenAI

toolsold.py ADDED Viewed

	@@ -0,0 +1,349 @@

+# tools.py
+import pandas as pd
+from pathlib import Path
+import requests
+import regex as re
+import time
+import os
+from duckduckgo_search import DDGS
+from langchain_core.tools import tool
+DEFAULT_API_URL = "https://agents-course-unit4-scoring.hf.space"
+def _download_file_for_task(task_id: str, ext: str) -> str:
+    """
+    Helper: GET the remote file attached to task_id and save it locally.
+    The file is written to ./hf_files/{task_id}.{ext}. `ext` only names the
+    local file; the request URL is the same for every extension.
+    Returns the local path on success, or an empty string when the response is
+    not a non-empty HTTP 200 or the download/write fails.
+    """
+    print("reached _download_file_for_task")
+    os.makedirs("hf_files", exist_ok=True)
+    local_path = os.path.join("hf_files", f"{task_id}.{ext}")
+    url = f"{DEFAULT_API_URL}/files/{task_id}"
+    try:
+        resp = requests.get(url, timeout=10)
+        if resp.status_code == 200 and resp.content:
+            with open(local_path, "wb") as f:
+                f.write(resp.content)
+            # Report success only once the bytes are actually on disk.
+            print(f"Downloaded file from {url} to {local_path}")
+            return local_path
+    except Exception as exc:
+        # Best-effort helper: never raise, but keep the cause visible in logs.
+        print(f"Error downloading file from {url} to {local_path}: {exc}")
+    # If we get here: non-200 status, empty body, or a download/write error
+    return ""
+@tool
+def image_tool(task_id: str) -> str:
+    """
+    Downloads the image attached to a task and describes it.
+    Expects: task_id is a string
+    Returns: "OCR text + brief caption or an error message"
+    """
+    print("reached image_tool")
+    # 1) Try each supported extension until a download succeeds.
+    # Start from an empty path so the check below works when nothing downloads
+    # (previously the name was left unbound in that case).
+    local_img = ""
+    for ext in ("png", "jpg", "jpeg"):
+        candidate = _download_file_for_task(task_id, ext)
+        if candidate:
+            local_img = candidate
+            break
+    if not local_img or not os.path.exists(local_img):
+        # Return plain text, matching the declared str return type.
+        return "Error: No image file found (local nonexistent or download failed)."
+    # 2) Read raw bytes
+    try:
+        with open(local_img, "rb") as f:
+            image_bytes = f.read()
+    except Exception as e:
+        return f"Error reading image file: {e}"
+    # 3) Prepare HF Inference headers
+    hf_token = os.getenv("HF_TOKEN")
+    if not hf_token:
+        # Name the variable that is actually read above.
+        return "Error: HF_TOKEN not set in environment."
+    headers = {"Authorization": f"Bearer {hf_token}"}
+    # NOTE(review): both requests below upload the bytes as a multipart "file"
+    # field; the Inference API may expect them as the raw request body
+    # (data=...) instead - confirm against the API documentation.
+    # 4) Call the OCR model to extract text
+    ocr_text = ""
+    try:
+        ocr_resp = requests.post(
+            "https://api-inference.huggingface.co/models/google/vit-ocr",
+            headers=headers,
+            files={"file": image_bytes},
+            timeout=30
+        )
+        ocr_resp.raise_for_status()
+        ocr_json = ocr_resp.json()
+        # Collect the "text" of every entry under pages[*].lines[*].
+        lines = [
+            line.get("text", "").strip()
+            for page in ocr_json.get("pages", [])
+            for line in page.get("lines", [])
+        ]
+        ocr_text = "\n".join(lines).strip() or "(no visible text)"
+    except Exception as e:
+        # A failed OCR call must not prevent the caption attempt below.
+        ocr_text = f"Error during HF OCR: {e}"
+    # 5) Call the image-captioning model to get a brief description
+    caption = ""
+    try:
+        cap_resp = requests.post(
+            "https://api-inference.huggingface.co/models/Salesforce/blip-image-captioning-base",
+            headers=headers,
+            files={"file": image_bytes},
+            timeout=30
+        )
+        cap_resp.raise_for_status()
+        cap_json = cap_resp.json()
+        # Accept both {"generated_text": ...} and a list wrapping such a dict.
+        if isinstance(cap_json, list):
+            cap_json = cap_json[0] if cap_json else {}
+        caption = cap_json.get("generated_text", "").strip() or "(no caption returned)"
+    except Exception as e:
+        caption = f"Error during HF captioning: {e}"
+    # 6) Combine OCR + caption
+    combined = f"OCR text:\n{ocr_text}\n\nImage caption:\n{caption}"
+    print(f"combined: {combined}")
+    return combined
+@tool
+def excel_tool(task_id: str) -> str:
+    """
+    Downloads the spreadsheet attached to a task and returns one sheet as text.
+    Expects: task_id is a string (used to download <task_id>.xlsx).
+    Reads the sheet named "Sheet1" when the workbook has one, otherwise the
+    first sheet.  No fallback to user-supplied tables.
+    Returns: stringified list of row records from that sheet, or an error message.
+    """
+    print("reached excel_tool")
+    sheet = "Sheet1"
+    local_xlsx = _download_file_for_task(task_id, "xlsx")
+    if not local_xlsx or not os.path.exists(local_xlsx):
+        return "Error: Excel file not found for this task."
+    try:
+        xls = pd.ExcelFile(local_xlsx)
+        # Prefer the conventional default sheet name; otherwise take the first sheet.
+        target = sheet if sheet in xls.sheet_names else xls.sheet_names[0]
+        df = pd.read_excel(xls, sheet_name=target)
+        # Convert once and reuse the text for both the log line and the result.
+        records = str(df.to_dict(orient="records"))
+        print(f"Excel file read successfully: {records}")
+        return records
+    except Exception as e:
+        return f"Error reading Excel file: {e}"
+import openai
+@tool
+def audio_transcriber_tool(task_id: str) -> str:
+    """
+    LangGraph tool for transcribing audio via OpenAI's Whisper API.
+    Expects: task_id is a string
+    Returns:
+    "<text or error message>"
+    Always attempts to download the file for the given path or task ID.
+    """
+    # NOTE(review): the docstring above is kept verbatim because @tool
+    # presumably exposes it as the tool description at runtime - confirm.
+    print("reached audio_transcriber_tool")
+    # Probe the supported extensions in order; the generators are lazy, so no
+    # further download is attempted once one attempt returns a path.
+    attempts = (_download_file_for_task(task_id, ext) for ext in ("mp3", "wav", "m4a"))
+    local_audio = next((path for path in attempts if path), "")
+    if not (local_audio and os.path.exists(local_audio)):
+        return "Error: No audio file found (download failed)."
+    # Send to OpenAI Whisper; any failure becomes the returned text.
+    try:
+        openai.api_key = os.getenv("OPENAI_API_KEY")
+        if not openai.api_key:
+            raise RuntimeError("OPENAI_API_KEY is not set in environment.")
+        with open(local_audio, "rb") as audio_file:
+            print("reached openai.audio.transcriptions.create")
+            request = {"model": "whisper-1", "file": audio_file}
+            response = openai.audio.transcriptions.create(**request)
+            print("reached response")
+        text = response.text.strip()
+    except Exception as e:
+        text = f"Error during transcription: {e}"
+    print(f"Transcripted as transcript: {text}")
+    return text
+# tools.py
+import re
+import requests
+@tool
+def wikipedia_search_tool(wiki_query: str) -> str:
+    """
+    LangGraph wrapper for searching Wikipedia.
+    Expects: wiki_query is a non-empty string.
+    Returns: "Title: <title>" followed by the summary of the first matching
+    page, or an error message (also when wiki_query is empty).
+    """
+    # Local import keeps this block self-contained.
+    from urllib.parse import quote
+    print("reached wikipedia search tool")
+    query = wiki_query
+    if not query:
+        # Keep the declared str return type instead of returning an empty dict.
+        return "Error: wiki_query must be a non-empty string."
+    try:
+        # 1) Use the MediaWiki API to search for page titles matching the query
+        search_params = {
+            "action": "query",
+            "list": "search",
+            "srsearch": query,
+            "format": "json",
+            "utf8": 1
+        }
+        search_resp = requests.get("https://en.wikipedia.org/w/api.php", params=search_params, timeout=10)
+        search_resp.raise_for_status()
+        search_data = search_resp.json()
+        search_results = search_data.get("query", {}).get("search", [])
+        if not search_results:
+            print(f"No Wikipedia page found for '{query}'.")
+            return f"No Wikipedia page found for '{query}'."
+        # 2) Take the first search result's title
+        first_title = search_results[0].get("title", "")
+        if not first_title:
+            print("Unexpected format from Wikipedia search.")
+            return "Unexpected format from Wikipedia search."
+        # 3) Fetch the page summary for that title via the REST summary endpoint.
+        # Percent-encode the whole title, including "/", so it stays a single
+        # path segment; spaces are written as underscores first.
+        title_for_url = quote(first_title.replace(" ", "_"), safe="")
+        summary_url = f"https://en.wikipedia.org/api/rest_v1/page/summary/{title_for_url}"
+        summary_resp = requests.get(summary_url, timeout=10)
+        summary_resp.raise_for_status()
+        summary_data = summary_resp.json()
+        # 4) Extract either the "extract" field or a fallback message
+        summary_text = summary_data.get("extract")
+        if not summary_text:
+            summary_text = summary_data.get("description", "No summary available.")
+        print(f"Title: {first_title}\n\n{summary_text}")
+        return f"Title: {first_title}\n\n{summary_text}"
+    except requests.exceptions.RequestException as e:
+        return f"Wikipedia search error: {e}"
+    except Exception as e:
+        return f"Unexpected error in wikipedia_search_tool: {e}"
+from langchain_openai import ChatOpenAI
+from langchain.schema import SystemMessage, HumanMessage
+# Chat model that analyze_code_tool invokes to review downloaded code.
+LLM = ChatOpenAI(model_name="gpt-4.1-mini", temperature=0.2)
+@tool
+def analyze_code_tool(task_id: str) -> str:
+    """
+    Downloads the .py file attached to a task and asks the LLM to review it.
+    Expects: task_id is a non-empty string.
+    Reads the code (max 400 lines / 10,000 characters) and asks the LLM for:
+        - plain-language summary
+        - list of key functions/classes
+        - obvious bugs, performance issues or style smells
+        - the output of the code, when it can be determined
+    Returns that analysis as a string, or an error message.
+    """
+    print("reached analyze_code_tool")
+    if not task_id:
+        # Nothing to download: skip the LLM call rather than reviewing a placeholder.
+        return "Error: no task_id provided."
+    path = _download_file_for_task(task_id, "py")
+    if not path:
+        return "Error: .py file not found for this task."
+    code_txt = Path(path).read_text(encoding="utf-8", errors="ignore")
+    # Truncate for safety
+    lines = code_txt.splitlines()[:400]
+    code_sample = "\n".join(lines)[:10_000]
+    prompt = [
+        SystemMessage(content="You are a senior Python code reviewer."),
+        HumanMessage(content=(
+            "Please analyse the following code. "
+            "Summarise what it does, list key functions/classes, "
+            "and point out any obvious bugs, performance issues or style problems.\n\n"
+            # Close the fence on its own line so the next sentence is not glued to it.
+            f"```python\n{code_sample}\n```\n\n"
+            "If you can then find the output of the code and return it in the output."
+        ))
+    ]
+    return LLM.invoke(prompt).content.strip()
+# def web_search_tool(state: AgentState) -> AgentState:
+#     """
+#     Expects: state["web_search_query"] is a non‐empty string.
+#     Returns: {"web_search_query": None, "web_search_result": <string>}.
+#     Retries up to 5 times on either a DuckDuckGo “202 Ratelimit” response or any exception (e.g. timeout).
+#     """
+#     print("reached web_search_tool")
+#     query = state.get("web_search_query", "")
+#     if not query:
+#         return {}  # nothing to do
+#     ddg = DDGS()
+#     max_retries = 5
+#     result_text = ""
+#     for attempt in range(1, max_retries + 1):
+#         try:
+#             result_text = str(ddg.text(query, max_results=5))
+#         except Exception as e:
+#             # Network error or timeout—retry up to max_retries
+#             if attempt < max_retries:
+#                 print(f"web_search_tool: exception '{e}', retrying in 4 seconds ({attempt}/{max_retries})")
+#                 time.sleep(4)
+#                 continue
+#             else:
+#                 # Final attempt failed
+#                 return {
+#                     "web_search_query": None,
+#                     "web_search_result": f"Error during DuckDuckGo search: {e}"
+#                 }
+#         # Check for DuckDuckGo rate‐limit indicator
+#         if "202 Ratelimit" in result_text:
+#             if attempt < max_retries:
+#                 print(f"web_search_tool: received '202 Ratelimit', retrying in 4 seconds ({attempt}/{max_retries})")
+#                 time.sleep(4)
+#                 continue
+#             else:
+#                 # Final attempt still rate‐limited
+#                 break
+#         # Successful response (no exception and no rate‐limit text)
+#         break
+#     return {
+#         "web_search_query": None,
+#         "web_search_result": result_text
+#     }