Spaces:
Sleeping
Sleeping
chore: code cleanup
Browse files
- inference.py +1 -3
inference.py
CHANGED
|
@@ -212,8 +212,6 @@ async def run_episode(
|
|
| 212 |
obs = result.observation
|
| 213 |
reward = result.reward or 0.0
|
| 214 |
done = result.done
|
| 215 |
-
act_str = action.model_dump_json(exclude_none=True, exclude_defaults=True)
|
| 216 |
-
|
| 217 |
if action.action_type in ("inspect_logs", "inspect_config", "inspect_gradients"):
|
| 218 |
source = action.action_type.replace("inspect_", "")
|
| 219 |
if source not in inspection_order:
|
|
@@ -224,7 +222,7 @@ async def run_episode(
|
|
| 224 |
|
| 225 |
rewards.append(reward)
|
| 226 |
data_seen = json.dumps(obs.visible_data) if obs.visible_data else "{}"
|
| 227 |
-
history.append(f"Step {step}: {act_str} → reward={reward:.2f} | {obs.feedback}\n Data: {data_seen}")
|
| 228 |
print(f"[STEP] step={step} action={action.action_type} reward={reward:.2f} done={str(done).lower()} error=null", flush=True)
|
| 229 |
|
| 230 |
if done:
|
|
|
|
| 212 |
obs = result.observation
|
| 213 |
reward = result.reward or 0.0
|
| 214 |
done = result.done
|
|
|
|
|
|
|
| 215 |
if action.action_type in ("inspect_logs", "inspect_config", "inspect_gradients"):
|
| 216 |
source = action.action_type.replace("inspect_", "")
|
| 217 |
if source not in inspection_order:
|
|
|
|
| 222 |
|
| 223 |
rewards.append(reward)
|
| 224 |
data_seen = json.dumps(obs.visible_data) if obs.visible_data else "{}"
|
| 225 |
+
history.append(f"Step {step}: {action.action_type} → reward={reward:.2f} | {obs.feedback}\n Data: {data_seen}")
|
| 226 |
print(f"[STEP] step={step} action={action.action_type} reward={reward:.2f} done={str(done).lower()} error=null", flush=True)
|
| 227 |
|
| 228 |
if done:
|