Spaces:
Running
Running
Commit ·
f0a1ea3
1
Parent(s): 689050e
Changes in inference decimal
Browse files
- inference.py +2 -2
inference.py
CHANGED
|
@@ -70,7 +70,7 @@ def log_step(step: int, action: str, reward: float, done: bool, error: Optional[
|
|
| 70 |
def log_end(success: bool, steps: int, score: float, rewards: List[float]) -> None:
|
| 71 |
rewards_str = ",".join(f"{r:.2f}" for r in rewards)
|
| 72 |
print(
|
| 73 |
-
f"[END] success={str(success).lower()} steps={steps} score={score:.
|
| 74 |
flush=True,
|
| 75 |
)
|
| 76 |
|
|
@@ -91,7 +91,7 @@ def build_user_prompt(obs, step: int, history: List[str]) -> str:
|
|
| 91 |
Previous actions:
|
| 92 |
{history_block}
|
| 93 |
|
| 94 |
-
{"
|
| 95 |
|
| 96 |
Respond with ONLY a JSON object: {{"sql": "...", "query_type": "explore" or "submit"}}
|
| 97 |
""").strip()
|
|
|
|
| 70 |
def log_end(success: bool, steps: int, score: float, rewards: List[float]) -> None:
|
| 71 |
rewards_str = ",".join(f"{r:.2f}" for r in rewards)
|
| 72 |
print(
|
| 73 |
+
f"[END] success={str(success).lower()} steps={steps} score={score:.2f} rewards={rewards_str}",
|
| 74 |
flush=True,
|
| 75 |
)
|
| 76 |
|
|
|
|
| 91 |
Previous actions:
|
| 92 |
{history_block}
|
| 93 |
|
| 94 |
+
{"No more explore steps — you MUST submit now (query_type='submit')" if obs.explore_steps_remaining == 0 else "You can explore more or submit your final answer."}
|
| 95 |
|
| 96 |
Respond with ONLY a JSON object: {{"sql": "...", "query_type": "explore" or "submit"}}
|
| 97 |
""").strip()
|