Spaces:

eigbney
/

AI-Unit2

Runtime error

App Files Files Community

eigbney committed 14 days ago

Commit

e919265

verified ·

1 Parent(s): 6689564

Update app.py

Browse files

Files changed (1) hide show

app.py +47 -43

app.py CHANGED Viewed

@@ -1,85 +1,78 @@
 import os
-import subprocess
-import sys
-try:
-    import duckduckgo_search
-except ImportError:
-    subprocess.check_call([sys.executable, "-m", "pip", "install", "duckduckgo-search==6.3.2"])
 import gradio as gr
 import requests
 import pandas as pd
 from smolagents import CodeAgent, HfApiModel
-try:
-    from smolagents import DuckDuckGoSearchTool
-    HAS_SEARCH = True
-except ImportError:
-    HAS_SEARCH = False
 DEFAULT_API_URL = "https://agents-course-unit4-scoring.hf.space"
 class BasicAgent:
     def __init__(self):
         self.model = HfApiModel(model_id="Qwen/Qwen2.5-72B-Instruct")
-        tools = []
-        if HAS_SEARCH:
-            try:
-                tools.append(DuckDuckGoSearchTool())
-            except Exception as e:
-                print(f"Could not init search tool: {e}")
         self.agent = CodeAgent(
-            tools=tools,
             model=self.model,
-            add_base_tools=True # Python interpreter for math/logic
         )
-        print(f"Agent initialized. Search available: {HAS_SEARCH}")
     def __call__(self, question: str) -> str:
         clean_prompt = (
-            f"Question: {question}\n\n"
-            "Instructions: Solve the question above. Provide ONLY the final answer "
-            "value. No explanation, no 'The answer is...', just the value."
         )
         try:
             result = self.agent.run(clean_prompt)
             return str(result).strip()
         except Exception as e:
-            return f"Error: {e}"
 def run_and_submit_all(profile: gr.OAuthProfile | None):
     space_id = os.getenv("SPACE_ID")
     if not profile:
         return "Please Login to Hugging Face with the button.", None
-    username = f"{profile.username}"
-    # Define agent code link
-    agent_code = f"https://huggingface.co/spaces/{space_id}/tree/main"
-    # 1. Fetch Questions
     try:
         response = requests.get(f"{DEFAULT_API_URL}/questions", timeout=15)
         questions_data = response.json()
     except Exception as e:
-        return f"Error fetching questions: {e}", None
-    # 2. Run Agent
     agent = BasicAgent()
     answers_payload = []
     results_log = []
-    # Process all questions
     for item in questions_data:
         task_id = item.get("task_id")
         question_text = item.get("question")
         if not task_id: continue
         submitted_answer = agent(question_text)
         answers_payload.append({"task_id": task_id, "submitted_answer": submitted_answer})
-        results_log.append({"Task ID": task_id, "Answer": submitted_answer})
     # 3. Submit
     submission_data = {
@@ -91,20 +84,31 @@ def run_and_submit_all(profile: gr.OAuthProfile | None):
     try:
         response = requests.post(f"{DEFAULT_API_URL}/submit", json=submission_data, timeout=60)
         result_data = response.json()
-        status = f"Success! Score: {result_data.get('score')}% ({result_data.get('correct_count')}/{result_data.get('total_attempted')})"
-        return status, pd.DataFrame(results_log)
     except Exception as e:
         return f"Submission Failed: {e}", pd.DataFrame(results_log)
 # --- Gradio Interface ---
 with gr.Blocks() as demo:
-    gr.Markdown("# GAIA Final Solver")
     gr.LoginButton()
-    run_button = gr.Button("Run Evaluation & Submit", variant="primary")
-    status_output = gr.Textbox(label="Status")
-    results_table = gr.DataFrame(label="Answers Generated")
-    run_button.click(fn=run_and_submit_all, outputs=[status_output, results_table])
 if __name__ == "__main__":
     demo.launch()

 import os
 import gradio as gr
 import requests
 import pandas as pd
 from smolagents import CodeAgent, HfApiModel
+# --- Constants ---
 DEFAULT_API_URL = "https://agents-course-unit4-scoring.hf.space"
 class BasicAgent:
     """Answer evaluation questions with a tool-free smolagents ``CodeAgent``.

     Instances are callable: ``agent(question)`` returns the stripped string
     form of the agent's result, or the literal ``"Error"`` when the question
     is missing/blank or the agent run raises.
     """

     def __init__(self):
         """Create the hosted model and the code-writing agent around it."""
         # NOTE(review): the original author's note says HfApiModel picks up
         # HF_TOKEN from the Space secrets automatically - confirm.
         self.model = HfApiModel(model_id="Qwen/Qwen2.5-72B-Instruct")
         # The agent is meant to run WITHOUT external tools such as search.
         # NOTE(review): on a CodeAgent, add_base_tools=True appears to register
         # smolagents' default toolbox (web search, page visit) rather than the
         # Python interpreter, which contradicts the "no search" intent and
         # needs a search package this app no longer installs. A CodeAgent
         # already solves tasks by writing and running Python, so the flag is
         # switched off - confirm against the installed smolagents version.
         self.agent = CodeAgent(
             tools=[],
             model=self.model,
             add_base_tools=False,
         )
         print("Clean Agent initialized (Python Interpreter enabled).")

     def __call__(self, question: str) -> str:
         """Run the agent on *question* and return its bare answer string.

         Args:
             question: Task text to solve.

         Returns:
             The agent's result converted with ``str`` and stripped, or
             ``"Error"`` if *question* is ``None``/blank or the run raises.
         """
         # A missing or blank question would otherwise reach the model as the
         # literal text "None"/"" and its made-up reply would be returned.
         if not question or not str(question).strip():
             print("Agent Error: empty question")
             return "Error"

         # Prompt wording written by the author for GAIA exact-match scoring:
         # ask for the raw value only.
         clean_prompt = (
             f"Solve this task: {question}\n\n"
             "Final Answer Requirement: Provide ONLY the numeric or text value. "
             "Do not include units, symbols, or conversational filler. "
             "No 'The answer is...', no 'FINAL ANSWER' text. Just the raw value."
         )
         try:
             result = self.agent.run(clean_prompt)
             return str(result).strip()
         except Exception as e:
             # Deliberate best-effort boundary: report the failure and hand
             # back a sentinel instead of propagating the exception.
             print(f"Agent Error: {e}")
             return "Error"
 def run_and_submit_all(profile: gr.OAuthProfile | None):
     space_id = os.getenv("SPACE_ID")
     if not profile:
         return "Please Login to Hugging Face with the button.", None
+    username = profile.username
+    agent_code = f"https://huggingface.co/spaces/{space_id}/tree/main" if space_id else ""
+    # 1. Fetch
     try:
         response = requests.get(f"{DEFAULT_API_URL}/questions", timeout=15)
         questions_data = response.json()
     except Exception as e:
+        return f"Fetch Error: {e}", None
+    # 2. Run
     agent = BasicAgent()
     answers_payload = []
     results_log = []
+    print(f"Starting evaluation for {len(questions_data)} questions...")
     for item in questions_data:
         task_id = item.get("task_id")
         question_text = item.get("question")
         if not task_id: continue
+        # Run agent
         submitted_answer = agent(question_text)
         answers_payload.append({"task_id": task_id, "submitted_answer": submitted_answer})
+        results_log.append({"Task ID": task_id, "Question": question_text[:100], "Answer": submitted_answer})
     # 3. Submit
     submission_data = {
     try:
         response = requests.post(f"{DEFAULT_API_URL}/submit", json=submission_data, timeout=60)
         result_data = response.json()
+        final_status = (
+            f"Submission Successful!\n"
+            f"Score: {result_data.get('score')}% "
+            f"({result_data.get('correct_count')}/{result_data.get('total_attempted')} correct)"
+        )
+        return final_status, pd.DataFrame(results_log)
     except Exception as e:
         return f"Submission Failed: {e}", pd.DataFrame(results_log)
 # --- Gradio Interface ---
 # Page layout: heading, login button, run button, then the two output widgets.
 with gr.Blocks() as demo:
     gr.Markdown("# GAIA Agent Evaluation Runner (Clean Version)")
     gr.Markdown("Uses `smolagents` with a built-in Python Interpreter to solve tasks.")
     gr.LoginButton()
     run_button = gr.Button("Run Evaluation & Submit All", variant="primary")
     status_output = gr.Textbox(label="Status", lines=4)
     results_table = gr.DataFrame(label="Generated Answers", wrap=True)
     # run_and_submit_all returns a (status text, results table) pair, matching
     # the two output components listed here.
     run_button.click(fn=run_and_submit_all, outputs=[status_output, results_table])

 # Start the app only when this file is executed directly.
 if __name__ == "__main__":
     demo.launch()