Final_Assignment_Template

Paused

App Files Community

wahibtim committed 24 days ago

Commit

f05a776

verified ·

1 Parent(s): 341e0dc

Update app.py

Browse files

Files changed (1) hide show

app.py +46 -54

app.py CHANGED Viewed

@@ -2,7 +2,8 @@ import os
 import gradio as gr
 import requests
 import pandas as pd
-from smolagents import CodeAgent, HfApiModel, tool
 from PIL import Image
 import io
@@ -11,7 +12,7 @@ DEFAULT_API_URL = "https://agents-course-unit4-scoring.hf.space"
 # ====================== TOOLS ======================
 @tool
 def web_search(query: str) -> str:
-    """Search the web for information."""
     try:
         from duckduckgo_search import DDGS
         with DDGS() as ddgs:
@@ -20,73 +21,55 @@ def web_search(query: str) -> str:
     except:
         return "Search failed."
-@tool
-def calculate(expression: str) -> str:
-    """Calculate simple math."""
-    try:
-        import math
-        return str(eval(expression, {"__builtins__": {}}, {"math": math}))
-    except:
-        return "Calc failed."
 @tool
 def download_file(task_id: str) -> str:
-    """Download the file (image, csv, audio, etc.) attached to a question."""
     url = f"{DEFAULT_API_URL}/files/{task_id}"
     try:
         r = requests.get(url, timeout=20)
         r.raise_for_status()
-        content_type = r.headers.get("content-type", "")
-        if "image" in content_type:
             img = Image.open(io.BytesIO(r.content))
-            return f"Downloaded image: {img.size} {img.format}"
         else:
-            text = r.text[:1500]
-            return f"Downloaded file content:\n{text}"
-    except Exception as e:
-        return f"File download failed: {str(e)}"
 # ====================== AGENT ======================
 class BasicAgent:
     def __init__(self):
         self.model = HfApiModel(model_id="Qwen/Qwen2.5-Coder-32B-Instruct")
-        self.agent = CodeAgent(
-            model=self.model,
-            tools=[web_search, calculate, download_file],
-            add_base_tools=True,
-            verbosity_level=0,
-            max_steps=10,
-            planning_interval=3
-        )
     def __call__(self, question: str) -> str:
         try:
-            output = self.agent.run(question)
             answer = str(output).strip()
-            # Force clean final answer (this fixes 0%)
             if "Final Answer:" in answer:
                 answer = answer.split("Final Answer:")[-1].strip()
-            elif "Answer:" in answer:
                 answer = answer.split("Answer:")[-1].strip()
-            # Take last line if too long
-            if len(answer) > 400:
-                answer = answer.split("\n")[-1].strip()
-            return answer[:700].strip()
         except Exception as e:
-            return f"Error: {str(e)[:150]}"
-# ====================== SUBMISSION ======================
 def run_and_submit_all(profile: gr.OAuthProfile | None):
     if not profile:
-        return "Please login first.", None
     username = profile.username.strip()
     api_url = DEFAULT_API_URL
@@ -94,16 +77,18 @@ def run_and_submit_all(profile: gr.OAuthProfile | None):
     submit_url = f"{api_url}/submit"
     agent = BasicAgent()
     space_id = os.getenv("SPACE_ID")
     agent_code = f"https://huggingface.co/spaces/{space_id}/tree/main" if space_id else ""
-    response = requests.get(questions_url, timeout=20)
-    questions_data = response.json()
     answers_payload = []
     results_log = []
     for item in questions_data:
         task_id = item.get("task_id")
         question = item.get("question")
@@ -112,16 +97,23 @@ def run_and_submit_all(profile: gr.OAuthProfile | None):
         answer = agent(question)
         answers_payload.append({"task_id": task_id, "submitted_answer": answer})
-        results_log.append({"Task ID": task_id, "Question": question[:100]+"...", "Answer": answer[:150]+"..."})
     submission_data = {"username": username, "agent_code": agent_code, "answers": answers_payload}
     try:
-        response = requests.post(submit_url, json=submission_data, timeout=90)
-        response.raise_for_status()
-        result = response.json()
         score = result.get("score", 0)
-        status = f"✅ Done!\nScore: {score}% ({result.get('correct_count',0)}/20)\n{result.get('message','')}"
         return status, pd.DataFrame(results_log)
     except Exception as e:
         return f"Submission failed: {str(e)}", pd.DataFrame(results_log)
@@ -129,8 +121,8 @@ def run_and_submit_all(profile: gr.OAuthProfile | None):
 # ====================== UI ======================
 with gr.Blocks() as demo:
-    gr.Markdown("# Unit 4 - Final GAIA Agent (with file support)")
-    gr.Markdown("Login → Click button (takes 8-15 min)")
     gr.LoginButton()
     btn = gr.Button("🚀 Run Evaluation & Submit All Answers", variant="primary", size="large")

 import gradio as gr
 import requests
 import pandas as pd
+import time
+from smolagents import HfApiModel, tool
 from PIL import Image
 import io
 # ====================== TOOLS ======================
 @tool
 def web_search(query: str) -> str:
+    """Search the web."""
     try:
         from duckduckgo_search import DDGS
         with DDGS() as ddgs:
     except:
         return "Search failed."
 @tool
 def download_file(task_id: str) -> str:
+    """Download attached file (image, csv, audio...) for the task."""
     url = f"{DEFAULT_API_URL}/files/{task_id}"
     try:
         r = requests.get(url, timeout=20)
         r.raise_for_status()
+        if "image" in r.headers.get("content-type", ""):
             img = Image.open(io.BytesIO(r.content))
+            return f"Image downloaded: size {img.size}"
         else:
+            return f"File downloaded: {len(r.content)} bytes"
+    except:
+        return "File download failed."
 # ====================== AGENT ======================
 class BasicAgent:
     def __init__(self):
         self.model = HfApiModel(model_id="Qwen/Qwen2.5-Coder-32B-Instruct")
     def __call__(self, question: str) -> str:
+        # VERY STRICT PROMPT – this is what fixes the 0%
+        prompt = f"""You are answering a GAIA benchmark question.
+Answer with ONLY the final answer. No explanation, no reasoning, no "Final Answer", no quotes, no extra text.
+Question: {question}
+Final Answer:"""
         try:
+            output = self.model.generate(prompt, max_new_tokens=150)
             answer = str(output).strip()
+            # Extra cleaning
             if "Final Answer:" in answer:
                 answer = answer.split("Final Answer:")[-1].strip()
+            if "Answer:" in answer:
                 answer = answer.split("Answer:")[-1].strip()
+            return answer[:400].strip()   # keep it short and clean
         except Exception as e:
+            return f"Error: {str(e)[:100]}"
+# ====================== MAIN FUNCTION ======================
 def run_and_submit_all(profile: gr.OAuthProfile | None):
     if not profile:
+        return "Please login with Hugging Face first.", None
     username = profile.username.strip()
     api_url = DEFAULT_API_URL
     submit_url = f"{api_url}/submit"
     agent = BasicAgent()
     space_id = os.getenv("SPACE_ID")
     agent_code = f"https://huggingface.co/spaces/{space_id}/tree/main" if space_id else ""
+    # Fetch questions
+    resp = requests.get(questions_url, timeout=20)
+    questions_data = resp.json()
     answers_payload = []
     results_log = []
+    print(f"Running on {len(questions_data)} questions...")
     for item in questions_data:
         task_id = item.get("task_id")
         question = item.get("question")
         answer = agent(question)
         answers_payload.append({"task_id": task_id, "submitted_answer": answer})
+        results_log.append({
+            "Task ID": task_id,
+            "Question": question[:100] + "...",
+            "Answer": answer[:150] + "..." if len(answer) > 150 else answer
+        })
+        time.sleep(35)   # ← IMPORTANT: avoids rate limit
+    # Submit
     submission_data = {"username": username, "agent_code": agent_code, "answers": answers_payload}
     try:
+        r = requests.post(submit_url, json=submission_data, timeout=120)
+        r.raise_for_status()
+        result = r.json()
         score = result.get("score", 0)
+        status = f"✅ SUBMITTED!\nScore: {score}% ({result.get('correct_count',0)}/20)\n{result.get('message','')}"
         return status, pd.DataFrame(results_log)
     except Exception as e:
         return f"Submission failed: {str(e)}", pd.DataFrame(results_log)
 # ====================== UI ======================
 with gr.Blocks() as demo:
+    gr.Markdown("# Unit 4 – Final GAIA Agent (Clean Version)")
+    gr.Markdown("**Login → Click the button** (takes ~12-18 minutes)")
     gr.LoginButton()
     btn = gr.Button("🚀 Run Evaluation & Submit All Answers", variant="primary", size="large")