samrat-rm committed on
Commit
faf4fb8
·
1 Parent(s): f74015b

chore: updating logs

Browse files
Files changed (1) hide show
  1. inference.py +3 -2
inference.py CHANGED
@@ -225,7 +225,7 @@ async def run_episode(
225
  rewards.append(reward)
226
  data_seen = json.dumps(obs.visible_data) if obs.visible_data else "{}"
227
  history.append(f"Step {step}: {act_str} → reward={reward:.2f} | {obs.feedback}\n Data: {data_seen}")
228
- print(f"[STEP] step={step} action={act_str} reward={reward:.2f} done={str(done).lower()} error=null", flush=True)
229
 
230
  if done:
231
  break
@@ -254,7 +254,8 @@ async def run_episode(
254
 
255
  finally:
256
  steps_taken = len(rewards)
257
- print(f"[END] success={str(success).lower()} steps={steps_taken} rewards={score:.2f}", flush=True)
 
258
 
259
  return {"scenario_key": scenario_key, "score": score, "steps": steps_taken, "success": success}, env
260
 
 
225
  rewards.append(reward)
226
  data_seen = json.dumps(obs.visible_data) if obs.visible_data else "{}"
227
  history.append(f"Step {step}: {act_str} → reward={reward:.2f} | {obs.feedback}\n Data: {data_seen}")
228
+ print(f"[STEP] step={step} action={action.action_type} reward={reward:.2f} done={str(done).lower()} error=null", flush=True)
229
 
230
  if done:
231
  break
 
254
 
255
  finally:
256
  steps_taken = len(rewards)
257
+ rewards_str = ",".join(f"{r:.2f}" for r in rewards) if rewards else "0.00"
258
+ print(f"[END] success={str(success).lower()} steps={steps_taken} score={score:.2f} rewards={rewards_str}", flush=True)
259
 
260
  return {"scenario_key": scenario_key, "score": score, "steps": steps_taken, "success": success}, env
261