Spaces:
Sleeping
Sleeping
Update inference.py
Browse files- inference.py +7 -4
inference.py
CHANGED
|
@@ -116,7 +116,8 @@ def run_task(env: SupportTriageEnv, task_id: str):
|
|
| 116 |
rewards = []
|
| 117 |
steps = 0
|
| 118 |
success = False
|
| 119 |
-
|
|
|
|
| 120 |
# ── [START] ──
|
| 121 |
print(f"[START] task={task_id} env=support-triage model={MODEL_NAME}", flush=True)
|
| 122 |
|
|
@@ -172,17 +173,19 @@ def run_task(env: SupportTriageEnv, task_id: str):
|
|
| 172 |
|
| 173 |
# Summary check
|
| 174 |
summary = env.episode_summary()
|
| 175 |
-
|
|
|
|
| 176 |
|
| 177 |
except Exception as e:
|
|
|
|
| 178 |
# Emit one error step if reset fails
|
| 179 |
-
print(f"[STEP] step=1 action=null reward=0.
|
| 180 |
|
| 181 |
finally:
|
| 182 |
# ── [END] ──
|
| 183 |
success_str = "true" if success else "false"
|
| 184 |
rewards_str = ",".join([f"{r:.2f}" for r in rewards])
|
| 185 |
-
print(f"[END] success={success_str} steps={steps} rewards={rewards_str}", flush=True)
|
| 186 |
|
| 187 |
def main():
|
| 188 |
env = SupportTriageEnv()
|
|
|
|
| 116 |
rewards = []
|
| 117 |
steps = 0
|
| 118 |
success = False
|
| 119 |
+
task_score = 0.01 # default score if something goes wrong early
|
| 120 |
+
|
| 121 |
# ── [START] ──
|
| 122 |
print(f"[START] task={task_id} env=support-triage model={MODEL_NAME}", flush=True)
|
| 123 |
|
|
|
|
| 173 |
|
| 174 |
# Summary check
|
| 175 |
summary = env.episode_summary()
|
| 176 |
+
task_score = max(0.01, min(0.99, summary.score))
|
| 177 |
+
success = task_score >= 0.70 # Arbitrary success threshold for log
|
| 178 |
|
| 179 |
except Exception as e:
|
| 180 |
+
task_score = 0.01
|
| 181 |
# Emit one error step if reset fails
|
| 182 |
+
print(f"[STEP] step=1 action=null reward=0.01 done=true error={str(e)}", flush=True)
|
| 183 |
|
| 184 |
finally:
|
| 185 |
# ── [END] ──
|
| 186 |
success_str = "true" if success else "false"
|
| 187 |
rewards_str = ",".join([f"{r:.2f}" for r in rewards])
|
| 188 |
+
print(f"[END] success={success_str} steps={steps} score={task_score:.4f} rewards={rewards_str}", flush=True)
|
| 189 |
|
| 190 |
def main():
|
| 191 |
env = SupportTriageEnv()
|