Spaces:
Sleeping
Sleeping
Update inference.py
Browse files- inference.py +8 -1
inference.py
CHANGED
|
@@ -124,7 +124,14 @@ def run_baseline(task_level: str):
|
|
| 124 |
print(f"[STEP] step={step_count} action={action_str} reward={reward:.2f} done={done_str} error={error_msg}", flush=True)
|
| 125 |
|
| 126 |
# REQUIRED LOG FORMAT: END
|
| 127 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 128 |
success_str = str(score > 0.0).lower()
|
| 129 |
rewards_str = ",".join(f"{r:.2f}" for r in rewards_history)
|
| 130 |
|
|
|
|
| 124 |
print(f"[STEP] step={step_count} action={action_str} reward={reward:.2f} done={done_str} error={error_msg}", flush=True)
|
| 125 |
|
| 126 |
# REQUIRED LOG FORMAT: END
|
| 127 |
+
raw_score = info.get('score', 0.0)
|
| 128 |
+
|
| 129 |
+
# --- MINIMAL FIX FOR GRADER ---
|
| 130 |
+
# The grader requires strictly 0.0 < score < 1.0.
|
| 131 |
+
# We clamp the score so a 0.0 becomes 0.001 and a 1.0 becomes 0.999
|
| 132 |
+
score = max(0.001, min(0.999, raw_score))
|
| 133 |
+
# ------------------------------
|
| 134 |
+
|
| 135 |
success_str = str(score > 0.0).lower()
|
| 136 |
rewards_str = ",".join(f"{r:.2f}" for r in rewards_history)
|
| 137 |
|