Spaces:
Sleeping
Sleeping
Update inference.py
#13
by rsaibhargav - opened
- inference.py +19 -3
inference.py
CHANGED
|
@@ -208,7 +208,14 @@ def get_model_answer(
|
|
| 208 |
# ─── Main loop ──────────────────────────────────────────────────────────────
|
| 209 |
async def main() -> None:
|
| 210 |
client = OpenAI(base_url=API_BASE_URL, api_key=HF_TOKEN)
|
| 211 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 212 |
|
| 213 |
rewards: List[float] = []
|
| 214 |
history: List[dict] = []
|
|
@@ -242,8 +249,14 @@ async def main() -> None:
|
|
| 242 |
user_context=obs.user_context,
|
| 243 |
)
|
| 244 |
|
| 245 |
-
|
| 246 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 247 |
|
| 248 |
reward = result.reward or 0.0
|
| 249 |
done = result.done
|
|
@@ -261,6 +274,9 @@ async def main() -> None:
|
|
| 261 |
score = min(max(score, 0.0), 1.0)
|
| 262 |
success = score >= SUCCESS_SCORE_THRESHOLD
|
| 263 |
|
|
|
|
|
|
|
|
|
|
| 264 |
finally:
|
| 265 |
try:
|
| 266 |
await env.close()
|
|
|
|
| 208 |
# ─── Main loop ──────────────────────────────────────────────────────────────
|
| 209 |
async def main() -> None:
|
| 210 |
client = OpenAI(base_url=API_BASE_URL, api_key=HF_TOKEN)
|
| 211 |
+
|
| 212 |
+
# Connect to already-running server (validator provides ENV_URL),
|
| 213 |
+
# fall back to starting a Docker container for local testing.
|
| 214 |
+
env_url = os.getenv("ENV_URL")
|
| 215 |
+
if env_url:
|
| 216 |
+
env = CodeAssessmentEnv(base_url=env_url)
|
| 217 |
+
else:
|
| 218 |
+
env = await CodeAssessmentEnv.from_docker_image(LOCAL_IMAGE_NAME)
|
| 219 |
|
| 220 |
rewards: List[float] = []
|
| 221 |
history: List[dict] = []
|
|
|
|
| 249 |
user_context=obs.user_context,
|
| 250 |
)
|
| 251 |
|
| 252 |
+
try:
|
| 253 |
+
result = await env.step(CodeAssessmentAction(answer=answer))
|
| 254 |
+
obs = result.observation
|
| 255 |
+
except Exception as exc:
|
| 256 |
+
print(f"[DEBUG] env.step() failed: {exc}", flush=True)
|
| 257 |
+
log_step(step=step, action=answer[:60], reward=0.0, done=True, error=str(exc))
|
| 258 |
+
steps_taken = step
|
| 259 |
+
break
|
| 260 |
|
| 261 |
reward = result.reward or 0.0
|
| 262 |
done = result.done
|
|
|
|
| 274 |
score = min(max(score, 0.0), 1.0)
|
| 275 |
success = score >= SUCCESS_SCORE_THRESHOLD
|
| 276 |
|
| 277 |
+
except Exception as exc:
|
| 278 |
+
print(f"[DEBUG] Episode failed: {exc}", flush=True)
|
| 279 |
+
|
| 280 |
finally:
|
| 281 |
try:
|
| 282 |
await env.close()
|