Spaces:

Kavya988
/

API_DEBUG_SOLVER

Sleeping

Update tasks/rate_limit/grader.py

by Tarun-sar0ya - opened Apr 12

←

Files changed (1) hide show

tasks/rate_limit/grader.py CHANGED Viewed

@@ -1,9 +1,32 @@
 """Grader for rate_limit task: 429 Too Many Requests."""
-from tasks.grading_helper import run_agent_on_incident
-def grade() -> float:
-    """Grade the rate_limit task. Returns score between 0 and 1."""
-    score = run_agent_on_incident("rate_limit")
-    return max(0.001, min(0.999, score))

 """Grader for rate_limit task: 429 Too Many Requests."""
+def grade(trajectory) -> float:
+    """Grade the rate_limit task based on the agent trajectory.
+
+    A step may be an ``(action, observation, reward)`` list/tuple or a
+    mapping-like object with ``"action"`` and ``"reward"`` keys. Steps of any
+    other shape, steps with missing fields, and rewards that cannot be
+    compared with a number are treated as "no action" / "no reward" instead
+    of raising, so a single malformed step cannot crash grading.
+
+    Args:
+        trajectory: Sequence of steps from the episode.
+
+    Returns:
+        0.0 for an empty (or None) trajectory; otherwise 0.95 when
+        ``wait_retry`` was used and some step had a positive reward, 0.6 when
+        only ``wait_retry`` was used, 0.4 when only a positive reward was
+        seen, and 0.05 when neither happened.
+    """
+    if not trajectory:
+        # NOTE(review): the implementation this replaces clamped scores to
+        # [0.001, 0.999]; confirm that an exact 0.0 is acceptable to callers.
+        return 0.0
+
+    def _field(step, index, key, default):
+        """Read one field from a tuple-style or mapping-style step."""
+        if isinstance(step, (list, tuple)):
+            # Short tuples fall back to the default instead of IndexError.
+            return step[index] if len(step) > index else default
+        getter = getattr(step, "get", None)
+        if callable(getter):
+            return getter(key, default)
+        # Neither a sequence nor a mapping: nothing to read.
+        return default
+
+    def _is_positive(reward) -> bool:
+        """Return True when the reward compares greater than zero."""
+        try:
+            return bool(reward > 0)
+        except TypeError:
+            # None, strings and other non-orderable values count as no reward.
+            return False
+
+    # Check if the agent used wait_retry to fix the 429 error.
+    actions = [_field(step, 0, "action", "") for step in trajectory]
+    correct_action_used = "wait_retry" in actions
+    resolved = any(
+        _is_positive(_field(step, 2, "reward", 0)) for step in trajectory
+    )
+
+    if correct_action_used and resolved:
+        return 0.95
+    if correct_action_used:
+        return 0.6
+    if resolved:
+        return 0.4
+    return 0.05