Final_Assignment_Template

Sleeping

App Files Files Community

wlchee committed on May 6, 2025

Commit

6b13ec1

verified ·

1 Parent(s): d9fc97b

Update app.py

Browse files

Files changed (1) hide show

app.py +29 -41

app.py CHANGED Viewed

@@ -9,7 +9,7 @@ from smolagents.models import InferenceClientModel
 # --- Constants ---
 DEFAULT_API_URL = "https://agents-course-unit4-scoring.hf.space"
-# --- Custom Tools with Proper Input/Output Specifications ---
 class CalculatorTool(Tool):
     name = "calculator"
     description = "Performs mathematical calculations"
@@ -35,21 +35,21 @@ class CalculatorTool(Tool):
 class TimeTool(Tool):
     name = "current_time"
     description = "Gets current UTC time"
-    input_schema = {}  # No inputs needed
     output_schema = {
         "time": {
             "type": "string",
-            "description": "Current time in UTC (YYYY-MM-DD HH:MM:SS)"
         }
     }
     def use(self) -> dict:
         return {"time": datetime.utcnow().strftime("%Y-%m-%d %H:%M:%S UTC")}
-# --- Enhanced Agent ---
 class LocalAgent:
     def __init__(self):
-        print("Initializing agent with smolagents...")
         self.tools = [CalculatorTool(), TimeTool()]
         self.agent = ToolCallingAgent(
             tools=self.tools,
@@ -60,42 +60,32 @@ class LocalAgent:
         )
     def __call__(self, question: str) -> str:
-        print(f"Processing: {question[:100]}...")
         question_lower = question.lower()
-        # Direct tool usage for simple queries
-        if any(word in question_lower for word in ["calculate", "what is", "how much is", "+", "-", "*", "/"]):
-            result = CalculatorTool().use(question.replace("?", ""))
-            return result["result"]
-        if any(word in question_lower for word in ["time", "current time"]):
-            result = TimeTool().use()
-            return result["time"]
-        # Use full agent for complex questions
         try:
-            response = self.agent.run(question)
-            return str(response)
         except Exception as e:
-            print(f"Agent error: {e}")
-            return "I couldn't process this question."
-# --- Evaluation Runner ---
 def run_and_submit_all(profile: gr.OAuthProfile | None):
     if not profile:
-        return "Please login first", None
     space_id = os.getenv("SPACE_ID", "local-test")
     api_url = os.getenv("API_URL", DEFAULT_API_URL)
     try:
         agent = LocalAgent()
-        response = requests.get(f"{api_url}/questions", timeout=15)
-        response.raise_for_status()
-        questions = response.json()
-        results = []
         answers = []
         for q in questions:
             try:
                 answer = agent(q["question"])
@@ -121,36 +111,34 @@ def run_and_submit_all(profile: gr.OAuthProfile | None):
             "answers": answers
         }
-        response = requests.post(f"{api_url}/submit", json=submission, timeout=60)
-        response.raise_for_status()
-        result = response.json()
         return (
-            f"Success! Score: {result.get('score', 'N/A')}%\n"
             f"Correct: {result.get('correct_count', '?')}/{result.get('total_attempted', '?')}",
             pd.DataFrame(results)
         )
     except Exception as e:
-        return f"Evaluation failed: {str(e)}", pd.DataFrame(results if 'results' in locals() else [])
-# --- Gradio Interface ---
 with gr.Blocks(title="Agent Evaluation Runner") as app:
-    gr.Markdown("""
-    ## Advanced Agent Evaluation
-    Uses smolagents with proper tool schemas
-    """)
-    profile = gr.OAuthProfile()
-    run_btn = gr.Button("Run Evaluation")
-    output = gr.Textbox(label="Results")
-    results_table = gr.DataFrame(label="Question Log")
     run_btn.click(
         fn=run_and_submit_all,
-        inputs=[profile],  # <-- Corrected: OAuthProfile passed in
         outputs=[output, results_table]
     )
 if __name__ == "__main__":
     app.launch()

 # --- Constants ---
 DEFAULT_API_URL = "https://agents-course-unit4-scoring.hf.space"
+# --- Custom Tools ---
 class CalculatorTool(Tool):
     name = "calculator"
     description = "Performs mathematical calculations"
 class TimeTool(Tool):
     name = "current_time"
     description = "Gets current UTC time"
+    input_schema = {}  # No input
     output_schema = {
         "time": {
             "type": "string",
+            "description": "Current UTC time (YYYY-MM-DD HH:MM:SS)"
         }
     }
     def use(self) -> dict:
         return {"time": datetime.utcnow().strftime("%Y-%m-%d %H:%M:%S UTC")}
+# --- Agent Setup ---
 class LocalAgent:
     def __init__(self):
+        print("Initializing agent...")
         self.tools = [CalculatorTool(), TimeTool()]
         self.agent = ToolCallingAgent(
             tools=self.tools,
         )
     def __call__(self, question: str) -> str:
         question_lower = question.lower()
+        if any(op in question_lower for op in ["calculate", "what is", "+", "-", "*", "/"]):
+            return CalculatorTool().use(question.replace("?", ""))["result"]
+        if "time" in question_lower:
+            return TimeTool().use()["time"]
         try:
+            return str(self.agent.run(question))
         except Exception as e:
+            return f"Error: {e}"
+# --- Evaluation Logic ---
 def run_and_submit_all(profile: gr.OAuthProfile | None):
     if not profile:
+        return "Please login first.", None
     space_id = os.getenv("SPACE_ID", "local-test")
     api_url = os.getenv("API_URL", DEFAULT_API_URL)
     try:
         agent = LocalAgent()
+        questions = requests.get(f"{api_url}/questions", timeout=15).json()
         answers = []
+        results = []
         for q in questions:
             try:
                 answer = agent(q["question"])
             "answers": answers
         }
+        result = requests.post(f"{api_url}/submit", json=submission, timeout=60).json()
         return (
+            f"✅ Score: {result.get('score', 'N/A')}%\n"
             f"Correct: {result.get('correct_count', '?')}/{result.get('total_attempted', '?')}",
             pd.DataFrame(results)
         )
     except Exception as e:
+        return f"Evaluation failed: {str(e)}", pd.DataFrame([])
+# --- Gradio UI ---
 with gr.Blocks(title="Agent Evaluation Runner") as app:
+    gr.Markdown("## 🤖 Agent Evaluation with smolagents")
+    gr.Markdown("Login, then run the evaluation to test your agent.")
+    gr.LoginButton()  # OAuth Login UI
+    run_btn = gr.Button("🚀 Run Evaluation")
+    output = gr.Textbox(label="Result Summary")
+    results_table = gr.DataFrame(label="Answers and Logs")
     run_btn.click(
         fn=run_and_submit_all,
+        inputs=[],  # Left empty: Gradio injects the gr.OAuthProfile argument from the handler's type hint
         outputs=[output, results_table]
     )
 if __name__ == "__main__":
     app.launch()