Files changed (1) hide show
  1. inference.py +19 -3
inference.py CHANGED
@@ -208,7 +208,14 @@ def get_model_answer(
208
  # ─── Main loop ──────────────────────────────────────────────────────────────
209
  async def main() -> None:
210
  client = OpenAI(base_url=API_BASE_URL, api_key=HF_TOKEN)
211
- env = await CodeAssessmentEnv.from_docker_image(LOCAL_IMAGE_NAME)
 
 
 
 
 
 
 
212
 
213
  rewards: List[float] = []
214
  history: List[dict] = []
@@ -242,8 +249,14 @@ async def main() -> None:
242
  user_context=obs.user_context,
243
  )
244
 
245
- result = await env.step(CodeAssessmentAction(answer=answer))
246
- obs = result.observation
 
 
 
 
 
 
247
 
248
  reward = result.reward or 0.0
249
  done = result.done
@@ -261,6 +274,9 @@ async def main() -> None:
261
  score = min(max(score, 0.0), 1.0)
262
  success = score >= SUCCESS_SCORE_THRESHOLD
263
 
 
 
 
264
  finally:
265
  try:
266
  await env.close()
 
208
  # ─── Main loop ──────────────────────────────────────────────────────────────
209
  async def main() -> None:
210
  client = OpenAI(base_url=API_BASE_URL, api_key=HF_TOKEN)
211
+
212
+ # Connect to an already-running server (the validator provides ENV_URL);
213
+ # otherwise, fall back to starting a Docker container for local testing.
214
+ env_url = os.getenv("ENV_URL")
215
+ if env_url:
216
+ env = CodeAssessmentEnv(base_url=env_url)
217
+ else:
218
+ env = await CodeAssessmentEnv.from_docker_image(LOCAL_IMAGE_NAME)
219
 
220
  rewards: List[float] = []
221
  history: List[dict] = []
 
249
  user_context=obs.user_context,
250
  )
251
 
252
+ try:
253
+ result = await env.step(CodeAssessmentAction(answer=answer))
254
+ obs = result.observation
255
+ except Exception as exc:
256
+ print(f"[DEBUG] env.step() failed: {exc}", flush=True)
257
+ log_step(step=step, action=answer[:60], reward=0.0, done=True, error=str(exc))
258
+ steps_taken = step
259
+ break
260
 
261
  reward = result.reward or 0.0
262
  done = result.done
 
274
  score = min(max(score, 0.0), 1.0)
275
  success = score >= SUCCESS_SCORE_THRESHOLD
276
 
277
+ except Exception as exc:
278
+ print(f"[DEBUG] Episode failed: {exc}", flush=True)
279
+
280
  finally:
281
  try:
282
  await env.close()