Final_Assignment

Sleeping

App Files Community

Shivangsinha committed 15 days ago

Commit

3098349

verified ·

1 Parent(s): 24811b1

Update app.py

Browse files

Files changed (1) hide show

app.py +30 -12

app.py CHANGED Viewed

@@ -24,13 +24,10 @@ class BasicAgent:
     def __init__(self):
         print("BasicAgent initialized.")
-        # 1. Fetch the NEW Hugging Face token from secrets
-        new_hf_token = os.getenv("HF_TOKEN")
         if not new_hf_token:
-            raise ValueError("HF_TOKEN environment variable not set in Space Secrets.")
-        # 2. Connect to Hugging Face's free Serverless Inference API
-        # Qwen2.5-Coder-32B-Instruct is the recommended model for this course
         self.model = InferenceClientModel(
             model_id="Qwen/Qwen2.5-Coder-32B-Instruct",
             token=new_hf_token,
@@ -46,8 +43,9 @@ class BasicAgent:
         self.agent = CodeAgent(
             tools=self.tools,
             model=self.model,
-            max_steps=7,
-            additional_authorized_imports=["datetime", "re", "json", "math", "collections"],
         )
         print("BasicAgent ready with Hugging Face (Qwen2.5-Coder-32B).")
@@ -65,7 +63,7 @@ class BasicAgent:
                 err_msg = str(e).lower()
                 if "429" in err_msg or "rate limit" in err_msg or "too many requests" in err_msg:
                     wait_time = 20 * (attempt + 1)
-                    print(f"Rate limit hit! Pausing for {wait_time} seconds before retrying (Attempt {attempt+1}/{max_retries})...")
                     time.sleep(wait_time)
                 else:
                     print(f"Agent error processing question: {e}")
@@ -111,11 +109,31 @@ def run_and_submit_all(profile: gr.OAuthProfile | None):
     for i, item in enumerate(questions_data):
         task_id = item.get("task_id")
         question_text = item.get("question")
         if not task_id or not question_text:
             continue
         try:
-            submitted_answer = agent(question_text)
             answers_payload.append({"task_id": task_id, "submitted_answer": submitted_answer})
             results_log.append({"Task ID": task_id, "Question": question_text, "Submitted Answer": submitted_answer})
         except Exception as e:
@@ -150,12 +168,12 @@ def run_and_submit_all(profile: gr.OAuthProfile | None):
 # --- Build Gradio UI ---
 with gr.Blocks() as demo:
-    gr.Markdown("# Basic Agent Evaluation Runner (Hugging Face Edition)")
     gr.Markdown(
         """
         **Instructions:**
-        1. Set `NEW_HF_TOKEN` in your Space Secrets using a secondary Hugging Face account.
-        2. Log in with your primary Hugging Face account below.
         3. Click 'Run Evaluation & Submit' to start.
         """
     )

     def __init__(self):
         print("BasicAgent initialized.")
+        new_hf_token = os.getenv("NEW_HF_TOKEN")
         if not new_hf_token:
+            raise ValueError("NEW_HF_TOKEN environment variable not set in Space Secrets.")
         self.model = InferenceClientModel(
             model_id="Qwen/Qwen2.5-Coder-32B-Instruct",
             token=new_hf_token,
         self.agent = CodeAgent(
             tools=self.tools,
             model=self.model,
+            max_steps=10,
+            # CRITICAL FIX: Added pandas and requests so the agent can download and read Excel/CSV files!
+            additional_authorized_imports=["datetime", "re", "json", "math", "collections", "pandas", "requests"],
         )
         print("BasicAgent ready with Hugging Face (Qwen2.5-Coder-32B).")
                 err_msg = str(e).lower()
                 if "429" in err_msg or "rate limit" in err_msg or "too many requests" in err_msg:
                     wait_time = 20 * (attempt + 1)
+                    print(f"Rate limit hit! Pausing for {wait_time} seconds before retrying...")
                     time.sleep(wait_time)
                 else:
                     print(f"Agent error processing question: {e}")
     for i, item in enumerate(questions_data):
         task_id = item.get("task_id")
         question_text = item.get("question")
+        # CRITICAL FIX 1: Grab the hidden file URL if the server provides one
+        file_url = item.get("file_url")
         if not task_id or not question_text:
             continue
+        # CRITICAL FIX 2: Inject the file URL into the agent's prompt so it can download it
+        if file_url:
+            question_text += f"\n\n[IMPORTANT: This task requires analyzing an attached file. You MUST download or read it directly from this URL: {file_url} using your Python tool.]"
+        # CRITICAL FIX 3: Append strict output-format instructions so the agent returns only the bare answer the automated grader expects
+        strict_prompt = (
+            f"{question_text}\n\n"
+            "CRITICAL SUBMISSION INSTRUCTIONS:\n"
+            "The system evaluating your answer is a strict automated parser.\n"
+            "1. You MUST output ONLY the final requested answer.\n"
+            "2. DO NOT include any conversational text, explanations, or reasoning in your final output.\n"
+            "3. If the answer is a name, number, or short string, output ONLY that exact string.\n"
+            "4. For numbers, do not include symbols unless explicitly requested."
+        )
         try:
+            # We pass the strict prompt instead of the raw question
+            submitted_answer = agent(strict_prompt)
             answers_payload.append({"task_id": task_id, "submitted_answer": submitted_answer})
             results_log.append({"Task ID": task_id, "Question": question_text, "Submitted Answer": submitted_answer})
         except Exception as e:
 # --- Build Gradio UI ---
 with gr.Blocks() as demo:
+    gr.Markdown("# Basic Agent Evaluation Runner")
     gr.Markdown(
         """
         **Instructions:**
+        1. Ensure your `NEW_HF_TOKEN` is set.
+        2. Log in below.
         3. Click 'Run Evaluation & Submit' to start.
         """
     )