samrat-rm committed on
Commit
2014a9f
·
1 Parent(s): e7b5e0d

chore: code cleanup

Browse files
Files changed (1) hide show
  1. inference.py +1 -3
inference.py CHANGED
@@ -212,8 +212,6 @@ async def run_episode(
212
  obs = result.observation
213
  reward = result.reward or 0.0
214
  done = result.done
215
- act_str = action.model_dump_json(exclude_none=True, exclude_defaults=True)
216
-
217
  if action.action_type in ("inspect_logs", "inspect_config", "inspect_gradients"):
218
  source = action.action_type.replace("inspect_", "")
219
  if source not in inspection_order:
@@ -224,7 +222,7 @@ async def run_episode(
224
 
225
  rewards.append(reward)
226
  data_seen = json.dumps(obs.visible_data) if obs.visible_data else "{}"
227
- history.append(f"Step {step}: {act_str} → reward={reward:.2f} | {obs.feedback}\n Data: {data_seen}")
228
  print(f"[STEP] step={step} action={action.action_type} reward={reward:.2f} done={str(done).lower()} error=null", flush=True)
229
 
230
  if done:
 
212
  obs = result.observation
213
  reward = result.reward or 0.0
214
  done = result.done
 
 
215
  if action.action_type in ("inspect_logs", "inspect_config", "inspect_gradients"):
216
  source = action.action_type.replace("inspect_", "")
217
  if source not in inspection_order:
 
222
 
223
  rewards.append(reward)
224
  data_seen = json.dumps(obs.visible_data) if obs.visible_data else "{}"
225
+ history.append(f"Step {step}: {action.action_type} → reward={reward:.2f} | {obs.feedback}\n Data: {data_seen}")
226
  print(f"[STEP] step={step} action={action.action_type} reward={reward:.2f} done={str(done).lower()} error=null", flush=True)
227
 
228
  if done: