UjjwalPardeshi committed on
Commit ·
ee366d9
1
Parent(s): e979357
fix: inference
Browse files — inference.py +21 -19
inference.py
CHANGED
|
@@ -196,30 +196,28 @@ def parse_action(raw: str) -> str:
|
|
| 196 |
|
| 197 |
|
| 198 |
async def main() -> None:
|
| 199 |
-
if not API_KEY:
|
| 200 |
-
print(
|
| 201 |
-
"Error: OPENAI_API_KEY or HF_TOKEN required.", flush=True
|
| 202 |
-
)
|
| 203 |
-
sys.exit(1)
|
| 204 |
-
|
| 205 |
-
client = OpenAI(base_url=API_BASE_URL, api_key=API_KEY)
|
| 206 |
-
|
| 207 |
-
# Connect to environment via standard OpenEnv client
|
| 208 |
-
if IMAGE_NAME:
|
| 209 |
-
env = await GenericEnvClient.from_docker_image(IMAGE_NAME)
|
| 210 |
-
else:
|
| 211 |
-
env = GenericEnvClient(base_url=ENV_URL, message_timeout_s=120.0)
|
| 212 |
-
await env.connect()
|
| 213 |
-
|
| 214 |
history: List[str] = []
|
| 215 |
rewards: List[float] = []
|
| 216 |
steps_taken = 0
|
| 217 |
score = 0.0
|
| 218 |
success = False
|
|
|
|
| 219 |
|
| 220 |
log_start(task=TASK_NAME, env=BENCHMARK, model=MODEL_NAME)
|
| 221 |
|
| 222 |
try:
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 223 |
result = await env.reset(task_id=TASK_NAME, seed=42)
|
| 224 |
obs = result.observation
|
| 225 |
last_reward = 0.0
|
|
@@ -259,11 +257,15 @@ async def main() -> None:
|
|
| 259 |
score = min(max(score, 0.0), 1.0) # clamp to [0, 1]
|
| 260 |
success = score >= SUCCESS_SCORE_THRESHOLD
|
| 261 |
|
|
|
|
|
|
|
|
|
|
| 262 |
finally:
|
| 263 |
-
|
| 264 |
-
|
| 265 |
-
|
| 266 |
-
|
|
|
|
| 267 |
log_end(success=success, steps=steps_taken, score=score, rewards=rewards)
|
| 268 |
|
| 269 |
|
|
|
|
| 196 |
|
| 197 |
|
| 198 |
async def main() -> None:
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 199 |
history: List[str] = []
|
| 200 |
rewards: List[float] = []
|
| 201 |
steps_taken = 0
|
| 202 |
score = 0.0
|
| 203 |
success = False
|
| 204 |
+
env = None
|
| 205 |
|
| 206 |
log_start(task=TASK_NAME, env=BENCHMARK, model=MODEL_NAME)
|
| 207 |
|
| 208 |
try:
|
| 209 |
+
if not API_KEY:
|
| 210 |
+
raise RuntimeError("OPENAI_API_KEY or HF_TOKEN required.")
|
| 211 |
+
|
| 212 |
+
client = OpenAI(base_url=API_BASE_URL, api_key=API_KEY)
|
| 213 |
+
|
| 214 |
+
# Connect to environment via standard OpenEnv client
|
| 215 |
+
if IMAGE_NAME:
|
| 216 |
+
env = await GenericEnvClient.from_docker_image(IMAGE_NAME)
|
| 217 |
+
else:
|
| 218 |
+
env = GenericEnvClient(base_url=ENV_URL, message_timeout_s=120.0)
|
| 219 |
+
await env.connect()
|
| 220 |
+
|
| 221 |
result = await env.reset(task_id=TASK_NAME, seed=42)
|
| 222 |
obs = result.observation
|
| 223 |
last_reward = 0.0
|
|
|
|
| 257 |
score = min(max(score, 0.0), 1.0) # clamp to [0, 1]
|
| 258 |
success = score >= SUCCESS_SCORE_THRESHOLD
|
| 259 |
|
| 260 |
+
except Exception as exc:
|
| 261 |
+
print(f"[DEBUG] Unhandled error: {exc}", flush=True)
|
| 262 |
+
|
| 263 |
finally:
|
| 264 |
+
if env is not None:
|
| 265 |
+
try:
|
| 266 |
+
await env.close()
|
| 267 |
+
except Exception as e:
|
| 268 |
+
print(f"[DEBUG] env.close() error (container cleanup): {e}", flush=True)
|
| 269 |
log_end(success=success, steps=steps_taken, score=score, rewards=rewards)
|
| 270 |
|
| 271 |
|