Spaces:
Sleeping
Sleeping
chore: updating logs
Browse files
- inference.py +3 -2
inference.py
CHANGED
|
@@ -225,7 +225,7 @@ async def run_episode(
|
|
| 225 |
rewards.append(reward)
|
| 226 |
data_seen = json.dumps(obs.visible_data) if obs.visible_data else "{}"
|
| 227 |
history.append(f"Step {step}: {act_str} → reward={reward:.2f} | {obs.feedback}\n Data: {data_seen}")
|
| 228 |
-
print(f"[STEP] step={step} action={ … [remainder of the removed line was truncated in extraction]
|
| 229 |
|
| 230 |
if done:
|
| 231 |
break
|
|
@@ -254,7 +254,8 @@ async def run_episode(
|
|
| 254 |
|
| 255 |
finally:
|
| 256 |
steps_taken = len(rewards)
|
| 257 |
-
|
|
|
|
| 258 |
|
| 259 |
return {"scenario_key": scenario_key, "score": score, "steps": steps_taken, "success": success}, env
|
| 260 |
|
|
|
|
| 225 |
rewards.append(reward)
|
| 226 |
data_seen = json.dumps(obs.visible_data) if obs.visible_data else "{}"
|
| 227 |
history.append(f"Step {step}: {act_str} → reward={reward:.2f} | {obs.feedback}\n Data: {data_seen}")
|
| 228 |
+
print(f"[STEP] step={step} action={action.action_type} reward={reward:.2f} done={str(done).lower()} error=null", flush=True)
|
| 229 |
|
| 230 |
if done:
|
| 231 |
break
|
|
|
|
| 254 |
|
| 255 |
finally:
|
| 256 |
steps_taken = len(rewards)
|
| 257 |
+
rewards_str = ",".join(f"{r:.2f}" for r in rewards) if rewards else "0.00"
|
| 258 |
+
print(f"[END] success={str(success).lower()} steps={steps_taken} score={score:.2f} rewards={rewards_str}", flush=True)
|
| 259 |
|
| 260 |
return {"scenario_key": scenario_key, "score": score, "steps": steps_taken, "success": success}, env
|
| 261 |
|