Final_Assignment_Template

Sleeping

App Files Files Community

mrhenu committed on Jul 8, 2025

Commit

2c1cc68

verified ·

1 Parent(s): 662cd6f

Update app.py

Browse files

Files changed (1) hide show

app.py +54 -123

app.py CHANGED Viewed

@@ -9,161 +9,92 @@ from langchain.agents import AgentExecutor
 from langchain_experimental.tools import PythonREPLTool
 from langchain_community.tools.youtube.search import YouTubeSearchTool
 from langchain_community.tools.tavily_search import TavilySearchResults
 from langchain_openai import ChatOpenAI
-from langgraph.graph import StateGraph, END
 from langgraph.prebuilt import ToolNode, tools_condition
-# --- Main Application Logic ---
-# Agentin muisti
 class AgentState(TypedDict):
     messages: Annotated[Sequence[BaseMessage], operator.add]
-# Agentin rakentajafunktio
 def create_langgraph_agent():
-    print("Initializing Advanced LangGraph Agent…")
-    # 1. System prompt GAIA-tyyliin
     SYSTEM_PROMPT = """
-You are a general AI assistant. I will ask you a question. Report your thoughts, and finish your answer with the following template:
-FINAL ANSWER: [YOUR FINAL ANSWER].
-YOUR FINAL ANSWER should be a number OR as few words as possible OR a comma separated list of numbers and/or strings.
-If you are asked for a number, don't use comma to write your number neither use units such as $ or percent sign unless specified otherwise.
-If you are asked for a string, don't use articles, neither abbreviations (e.g. for cities), and write the digits in plain text unless specified otherwise.
-If you are asked for a comma separated list, apply the above rules depending on whether the element to be put in the list is a number or a string.
 """
-    # 2. LLM (ei system_message-parametria -> annetaan prompt SystemMessage-na)
     llm = ChatOpenAI(model="gpt-4o", temperature=0)
-    # 3. Perustyökalut
     tools = [
         TavilySearchResults(max_results=3),
         PythonREPLTool(),
         YouTubeSearchTool(),
     ]
-    # 4. Valinnainen FileManagement toolkit (kevyt, yleensä saatavilla)
     try:
         from langchain_community.agent_toolkits.file_management.toolkit import FileManagementToolkit
-        file_toolkit = FileManagementToolkit(root_dir=".")
-        tools.extend(file_toolkit.get_tools())
-        print("FileManagement tools loaded.")
-    except Exception as e:
-        print("FileManagement toolkit unavailable:", e)
-    # 5. Bind tools
     llm_with_tools = llm.bind_tools(tools)
-    print("LLM and tools initialized.")
-    # 6. Agent-solmu (lisää system prompt joka kierroksella)
     def agent_node(state):
-        print("Calling agent node…")
-        full_msgs = [SystemMessage(content=SYSTEM_PROMPT)] + list(state["messages"])
-        reply = llm_with_tools.invoke(full_msgs)
         return {"messages": [reply]}
-    # 7. Työkalusolmu
-    tool_node = ToolNode(tools)
-    # 8. Rakenna graafi
     graph = StateGraph(AgentState)
     graph.add_node("agent", agent_node)
-    graph.add_node("tools", tool_node)
     graph.set_entry_point("agent")
     graph.add_conditional_edges("agent", tools_condition)
     graph.add_edge("tools", "agent")
-    app = graph.compile()
-    print("LangGraph agent compiled and ready.")
-    return app
-# Agentin suoritusfunktio
-def run_agent(agent_executor, question: str) -> str:
-    print(f"Agent received question: {question}")
-    final_answer = ""
-    try:
-        response = agent_executor.invoke(
-            {"messages": [HumanMessage(content=question)]},
-            config={"recursion_limit": 15}
-        )
-        raw_answer = response['messages'][-1].content
-        if "FINAL ANSWER:" in raw_answer:
-            final_answer = raw_answer.split("FINAL ANSWER:")[-1].strip()
-        else:
-            final_answer = raw_answer
-    except Exception as e:
-        print(f"Error during agent execution: {e}")
-        final_answer = f"Error: Agent failed to execute. {e}"
-    print(f"Agent returning answer: {final_answer}")
-    return str(final_answer)
-# Evaluaation ajaminen ja tulosten lähetys
-def run_and_submit_all(profile: gr.OAuthProfile | None):
-    space_id = os.getenv("SPACE_ID")
-    if not profile:
-        return "Please login to Hugging Face.", None
-    username = f"{profile.username}"
-    if not os.getenv("TAVILY_API_KEY") or not os.getenv("OPENAI_API_KEY"):
-        return "API keys missing (TAVILY_API_KEY, OPENAI_API_KEY)", None
-    try:
-        agent_executor = create_langgraph_agent()
-    except Exception as e:
-        return f"Error initializing agent: {e}", None
-    agent_code = f"https://huggingface.co/spaces/{space_id}/tree/main"
-    questions_url = "https://agents-course-unit4-scoring.hf.space/questions"
-    try:
-        response = requests.get(questions_url, timeout=20)
-        response.raise_for_status()
-        questions_data = response.json()
-    except Exception as e:
-        return f"Error fetching questions: {e}", None
-    answers_payload = []
-    for item in questions_data:
-        task_id, question_text = item.get("task_id"), item.get("question")
-        if task_id and question_text:
-            submitted_answer = run_agent(agent_executor, question_text)
-            answers_payload.append({"task_id": task_id, "submitted_answer": submitted_answer})
-    submission_data = {
-        "username": username.strip(),
-        "agent_code": agent_code,
-        "answers": answers_payload,
-    }
-    submit_url = "https://agents-course-unit4-scoring.hf.space/submit"
-    try:
-        response = requests.post(submit_url, json=submission_data, timeout=240)
-        response.raise_for_status()
-        result_data = response.json()
-        final_status = (
-            f"Submission Successful!\n"
-            f"User: {result_data.get('username')}\n"
-            f"Overall Score: {result_data.get('score', 'N/A')}% "
-            f"({result_data.get('correct_count', '?')}/{result_data.get('total_attempted', '?')} correct)\n"
-            f"Message: {result_data.get('message', 'No message received.')}"
-        )
-        return final_status, pd.DataFrame(answers_payload)
-    except Exception as e:
-        return f"Error during submission: {e}", pd.DataFrame(answers_payload)
-# Gradio-käyttöliittymä
-with gr.Blocks() as demo:
-    gr.Markdown("# Agent Evaluation Runner (GAIA Prompt)")
-    gr.LoginButton()
-    run_button = gr.Button("Run Evaluation & Submit All Answers")
-    status_output = gr.Textbox(label="Run Status / Submission Result", lines=5, interactive=False)
-    results_table = gr.DataFrame(label="Questions and Agent Answers", wrap=True)
-    run_button.click(fn=run_and_submit_all, outputs=[status_output, results_table])
-if __name__ == "__main__":
-    demo.launch()

 from langchain_experimental.tools import PythonREPLTool
 from langchain_community.tools.youtube.search import YouTubeSearchTool
 from langchain_community.tools.tavily_search import TavilySearchResults
+from langchain_core.tools import tool
 from langchain_openai import ChatOpenAI
+from langgraph.graph import StateGraph
 from langgraph.prebuilt import ToolNode, tools_condition
+# --- Custom Image Analysis Tool ---------------------------------------------
+@tool("image_analysis", return_direct=True)
+def image_analysis(image_path: str, prompt: str) -> str:
+    """Analyze an image located at image_path and answer according to prompt.
+
+    image_path: local file path or http(s) URL of the image
+    prompt: the specific question or instruction about the image
+
+    Returns a textual answer, or a short error message when a local path
+    does not point to a file or the model returns no text.
+    """
+    import base64
+    import mimetypes
+
+    import openai
+
+    if image_path.startswith(("http://", "https://")):
+        # Remote images are passed by reference; the API fetches them itself.
+        image_url = image_path
+    else:
+        if not os.path.isfile(image_path):
+            return "Image path not found."
+        with open(image_path, "rb") as f:
+            img_b64 = base64.b64encode(f.read()).decode("ascii")
+        # Local files must be inlined as a base64 data URL: raw bytes are not
+        # JSON-serializable and cannot be sent in the request body.
+        mime_type = mimetypes.guess_type(image_path)[0] or "image/png"
+        image_url = f"data:{mime_type};base64,{img_b64}"
+    client = openai.OpenAI()
+    response = client.chat.completions.create(
+        model="gpt-4o-mini",  # vision-capable
+        messages=[
+            {
+                "role": "user",
+                "content": [
+                    {"type": "text", "text": prompt},
+                    # Chat Completions expects images as "image_url" parts.
+                    {"type": "image_url", "image_url": {"url": image_url}},
+                ],
+            }
+        ],
+    )
+    answer = response.choices[0].message.content
+    # content may be None (e.g. refusal); avoid calling .strip() on None.
+    return answer.strip() if answer else "No answer returned by the vision model."
+# --- Main Application Logic --------------------------------------------------
 class AgentState(TypedDict):
+    """State schema for the LangGraph agent."""
+    # Conversation history. The operator.add annotation is presumably used by
+    # LangGraph as the reducer, so the one-element message lists returned by
+    # agent_node are appended to the history rather than replacing it
+    # (NOTE(review): confirm against the LangGraph state documentation).
     messages: Annotated[Sequence[BaseMessage], operator.add]
 def create_langgraph_agent():
+    """Build and compile the tool-using LangGraph agent.
+
+    Creates a gpt-4o chat model (temperature 0), binds the search, Python
+    REPL, YouTube and image-analysis tools (plus file-management tools when
+    that toolkit can be loaded), and wires an "agent" node and a "tools"
+    node into a StateGraph over AgentState.
+
+    Returns the compiled graph.
+    """
+    print("Initializing Advanced LangGraph Agent with vision…")
     SYSTEM_PROMPT = """
+You are a general AI assistant for the GAIA test. I will ask you a question. Report your reasoning briefly, and finish with:
+FINAL ANSWER: [YOUR FINAL ANSWER]
+YOUR FINAL ANSWER should be a number OR as few words as possible OR a comma separated list of numbers and/or strings.
+If you are asked for a number, don't use comma to write your number neither use units such as $ or percent sign unless specified otherwise.
+If you are asked for a string, don't use articles, neither abbreviations (e.g. for cities), and write the digits in plain text unless specified otherwise.
+If you are asked for a comma separated list, apply the above rules depending on whether the element to be put in the list is a number or a string.
+Follow the formatting rules strictly.
 """
     llm = ChatOpenAI(model="gpt-4o", temperature=0)
     tools = [
         TavilySearchResults(max_results=3),
         PythonREPLTool(),
         YouTubeSearchTool(),
+        image_analysis,  # new vision tool
     ]
+    # Optional FileManagement tools: best-effort, but report why they are
+    # missing instead of failing silently.
     try:
         from langchain_community.agent_toolkits.file_management.toolkit import FileManagementToolkit
+        tools.extend(FileManagementToolkit(root_dir=".").get_tools())
+    except Exception as e:
+        print("FileManagement toolkit unavailable:", e)
     llm_with_tools = llm.bind_tools(tools)
     def agent_node(state):
+        # The system prompt is not stored in the state, so it is prepended
+        # to the history on every model call.
+        msgs = [SystemMessage(content=SYSTEM_PROMPT)] + list(state["messages"])
+        reply = llm_with_tools.invoke(msgs)
         return {"messages": [reply]}
     graph = StateGraph(AgentState)
     graph.add_node("agent", agent_node)
+    graph.add_node("tools", ToolNode(tools))
     graph.set_entry_point("agent")
     graph.add_conditional_edges("agent", tools_condition)
     graph.add_edge("tools", "agent")
+    return graph.compile()
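+# NOTE: the rest of the app (run_agent, run_and_submit_all, Gradio UI) is meant to remain identical to V2, but this change removes those definitions from the file; they must be restored from V2 for the app to run.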