Final_Assignment_Template

Sleeping

App Files Files Community

mianf4884 committed on 24 days ago

Commit

60a3312

verified ·

1 Parent(s): 44d9d68

Update app.py

Browse files

Files changed (1) hide show

app.py +16 -17

app.py CHANGED Viewed

@@ -2,7 +2,7 @@ import os
 import gradio as gr
 import requests
 import pandas as pd
-# 2026 standard: InferenceClientModel replaces HfApiModel for the free tier
 from smolagents import CodeAgent, DuckDuckGoSearchTool, InferenceClientModel, VisitWebpageTool
 # --- Constants ---
@@ -11,19 +11,22 @@ DEFAULT_API_URL = "https://agents-course-unit4-scoring.hf.space"
 # --- Agent Definition ---
 class AgentArchitect:
     def __init__(self):
-        # Fetch token from Space Secrets (Settings tab)
         hf_token = os.getenv("HF_TOKEN")
-        # InferenceClientModel is the gateway to the FREE Serverless API
-        # Qwen 2.5 Coder 32B is excellent for the Python tasks in GAIA
         self.model = InferenceClientModel(
             model_id="Qwen/Qwen2.5-Coder-32B-Instruct",
             token=hf_token
         )
         self.tools = [DuckDuckGoSearchTool(), VisitWebpageTool()]
-        # CodeAgent allows the LLM to write Python to solve the benchmark
         self.agent = CodeAgent(
             tools=self.tools,
             model=self.model,
@@ -32,11 +35,11 @@ class AgentArchitect:
     def __call__(self, question: str) -> str:
         try:
-            # We enforce conciseness. GAIA needs exact answers!
             prompt = (
                 f"{question}\n\n"
-                f"Instructions: Solve the task step-by-step using your tools. "
-                f"Provide ONLY the final result as a concise string."
             )
             result = self.agent.run(prompt)
             return str(result)
@@ -55,10 +58,8 @@ def run_and_submit_all(profile: gr.OAuthProfile | None):
     submit_url = f"{api_url}/submit"
     try:
-        # Initialize the new free-tier agent
         agent_instance = AgentArchitect()
-        # 1. Fetch Questions
         response = requests.get(questions_url, timeout=15)
         response.raise_for_status()
         questions_data = response.json()
@@ -66,18 +67,16 @@ def run_and_submit_all(profile: gr.OAuthProfile | None):
         results_log = []
         answers_payload = []
-        # 2. Process all 20 questions
         for item in questions_data:
             task_id = item.get("task_id")
             question_text = item.get("question")
-            # The agent will now actually THINK and SEARCH
             submitted_answer = agent_instance(question_text)
             answers_payload.append({"task_id": task_id, "submitted_answer": submitted_answer})
             results_log.append({"Task ID": task_id, "Question": question_text, "Submitted Answer": submitted_answer})
-        # 3. Submit to the course leaderboard
         agent_code_link = f"https://huggingface.co/spaces/{space_id}/tree/main"
         submission_data = {
             "username": username.strip(),
@@ -98,13 +97,13 @@ def run_and_submit_all(profile: gr.OAuthProfile | None):
         return final_status, pd.DataFrame(results_log)
     except Exception as e:
-        return f"Error: {e}", None
 # --- Gradio UI ---
-with gr.Blocks(theme=gr.themes.Monochrome()) as demo:
-    gr.Markdown("# 🚀 Final Mission: The 30% Score")
     gr.LoginButton()
-    run_button = gr.Button("Run Evaluation & Submit", variant="primary")
     status_output = gr.Textbox(label="Leaderboard Status", lines=4)
     results_table = gr.DataFrame(label="Agent Reasoning Trace", wrap=True)

 import gradio as gr
 import requests
 import pandas as pd
+# 2026 standard: InferenceClientModel is the robust way to access free models
 from smolagents import CodeAgent, DuckDuckGoSearchTool, InferenceClientModel, VisitWebpageTool
 # --- Constants ---
 # --- Agent Definition ---
 class AgentArchitect:
     def __init__(self):
+        # SECURE: Fetches the token from your Space Secrets
         hf_token = os.getenv("HF_TOKEN")
+        if not hf_token:
+            print("CRITICAL: HF_TOKEN is missing. Please add it to your Space Secrets!")
+        # InferenceClientModel is the 2026 gateway for free Serverless Inference.
+        # We use Qwen 2.5 Coder 32B because it has the highest reasoning-to-speed ratio.
         self.model = InferenceClientModel(
             model_id="Qwen/Qwen2.5-Coder-32B-Instruct",
             token=hf_token
         )
+        # This will now work perfectly because 'ddgs' is in your requirements.txt
         self.tools = [DuckDuckGoSearchTool(), VisitWebpageTool()]
         self.agent = CodeAgent(
             tools=self.tools,
             model=self.model,
     def __call__(self, question: str) -> str:
         try:
+            # We enforce a concise output format to satisfy the grader's 'Exact Match' logic.
             prompt = (
                 f"{question}\n\n"
+                f"Instructions: Think step-by-step. Solve the problem using your tools. "
+                f"Provide ONLY the final, concise answer."
             )
             result = self.agent.run(prompt)
             return str(result)
     submit_url = f"{api_url}/submit"
     try:
         agent_instance = AgentArchitect()
         response = requests.get(questions_url, timeout=15)
         response.raise_for_status()
         questions_data = response.json()
         results_log = []
         answers_payload = []
         for item in questions_data:
             task_id = item.get("task_id")
             question_text = item.get("question")
+            # The agent now has the 'ddgs' muscles to perform the search
             submitted_answer = agent_instance(question_text)
             answers_payload.append({"task_id": task_id, "submitted_answer": submitted_answer})
             results_log.append({"Task ID": task_id, "Question": question_text, "Submitted Answer": submitted_answer})
         agent_code_link = f"https://huggingface.co/spaces/{space_id}/tree/main"
         submission_data = {
             "username": username.strip(),
         return final_status, pd.DataFrame(results_log)
     except Exception as e:
+        return f"Submission Failed: {e}", None
 # --- Gradio UI ---
+with gr.Blocks(theme=gr.themes.Soft()) as demo:
+    gr.Markdown("# 🚀 Professional Agent Evaluator")
     gr.LoginButton()
+    run_button = gr.Button("Run Evaluation & Submit All Answers", variant="primary")
     status_output = gr.Textbox(label="Leaderboard Status", lines=4)
     results_table = gr.DataFrame(label="Agent Reasoning Trace", wrap=True)