UjjwalPardeshi committed on
Commit ·
006d13b
1
Parent(s): da20dfa
inference format fix
Browse files- inference.py +5 -2
inference.py
CHANGED
|
@@ -66,15 +66,18 @@ def log_start(task: str, env: str, model: str) -> None:
|
|
| 66 |
def log_step(
|
| 67 |
step: int, action: str, reward: float, done: bool, error: Optional[str]
|
| 68 |
) -> None:
|
|
|
|
|
|
|
| 69 |
print(
|
| 70 |
-
f"[STEP] step={step} action={action} reward={reward} done={
|
| 71 |
flush=True,
|
| 72 |
)
|
| 73 |
|
| 74 |
|
| 75 |
def log_end(success: bool, steps: int, score: float, rewards: list[float]) -> None:
|
|
|
|
| 76 |
print(
|
| 77 |
-
f"[END] success={success} steps={steps} score={score} rewards={
|
| 78 |
flush=True,
|
| 79 |
)
|
| 80 |
|
|
|
|
| 66 |
def log_step(
    step: int, action: str, reward: float, done: bool, error: Optional[str]
) -> None:
    """Print one ``[STEP]`` record to stdout as a single, flushed line.

    Args:
        step: Step index, printed as given.
        action: Action text, printed as given.
        reward: Step reward, formatted with two decimal places.
        done: Completion flag, printed as lowercase ``true``/``false``.
        error: Error message; ``None`` or an empty string prints as ``null``.
    """
    # Any falsy error (None or "") collapses to the literal "null".
    error_val = error if error else "null"
    # str(True) is "True"; the record uses lowercase booleans.
    done_val = str(done).lower()
    print(
        f"[STEP] step={step} action={action} reward={reward:.2f} done={done_val} error={error_val}",
        flush=True,
    )
|
| 75 |
|
| 76 |
|
| 77 |
def log_end(success: bool, steps: int, score: float, rewards: list[float]) -> None:
    """Print the closing ``[END]`` record to stdout as a single, flushed line.

    Args:
        success: Outcome flag, printed as lowercase ``true``/``false``.
        steps: Step count, printed as given.
        score: Final score, formatted with three decimal places.
        rewards: Per-step rewards, each formatted with two decimal places and
            joined with commas (no spaces); an empty list prints nothing
            after ``rewards=``.
    """
    rewards_str = ",".join(f"{r:.2f}" for r in rewards)
    print(
        f"[END] success={str(success).lower()} steps={steps} score={score:.3f} rewards={rewards_str}",
        flush=True,
    )
|
| 83 |
|