easy task fix

Files changed (15) hide show

.gitignore CHANGED Viewed

@@ -1,2 +1,3 @@
 .venv
 .env

 .venv
 .env
+__pycache__/

inference.py CHANGED Viewed

@@ -8,7 +8,8 @@ from openai import OpenAI
 from support_ops_env.env import SupportOpsEnv
 from support_ops_env.models import Action, Observation
 from support_ops_env.tasks import list_task_ids
 LOCAL_IMAGE_NAME = os.getenv("LOCAL_IMAGE_NAME")
 API_KEY = os.getenv("HF_TOKEN") or os.getenv("OPENAI_API_KEY") or os.getenv("API_KEY")
 API_BASE_URL = os.getenv("API_BASE_URL", "https://router.huggingface.co/v1")
@@ -102,9 +103,11 @@ def get_model_action(client: OpenAI, observation: Observation, step: int, reward
 def clamp_score(score: float) -> float:
-    """Clamp score to strictly open interval (0, 1) as required by the grader."""
-    _EPSILON = 1e-6
-    return min(max(float(score), _EPSILON), 1.0 - _EPSILON)
 def select_tasks(requested: str) -> List[str]:

 from support_ops_env.env import SupportOpsEnv
 from support_ops_env.models import Action, Observation
 from support_ops_env.tasks import list_task_ids
+from dotenv import load_dotenv
+load_dotenv()
 LOCAL_IMAGE_NAME = os.getenv("LOCAL_IMAGE_NAME")
 API_KEY = os.getenv("HF_TOKEN") or os.getenv("OPENAI_API_KEY") or os.getenv("API_KEY")
 API_BASE_URL = os.getenv("API_BASE_URL", "https://router.huggingface.co/v1")
 def clamp_score(score: float) -> float:
+    """Clamp score to the strictly open interval (0, 1).
+    Uses 0.001/0.999 so the value survives :.3f log formatting —
+    the submission parser reads that string, so 1e-6 would round
+    to '0.000' (and 1 - 1e-6 to '1.000') and be rejected as exactly 0.0 or 1.0."""
+    return min(max(float(score), 0.001), 0.999)
 def select_tasks(requested: str) -> List[str]:

support_ops_env/__pycache__/__init__.cpython-314.pyc ADDED Viewed

Binary file (447 Bytes). View file

support_ops_env/__pycache__/env.cpython-314.pyc ADDED Viewed

Binary file (18.2 kB). View file

support_ops_env/__pycache__/models.cpython-314.pyc ADDED Viewed

Binary file (5.46 kB). View file

support_ops_env/__pycache__/reward.cpython-314.pyc ADDED Viewed

Binary file (876 Bytes). View file

support_ops_env/__pycache__/state.cpython-314.pyc ADDED Viewed

Binary file (2.34 kB). View file

support_ops_env/graders/__pycache__/__init__.cpython-314.pyc ADDED Viewed

Binary file (1.17 kB). View file

support_ops_env/graders/__pycache__/common.cpython-314.pyc ADDED Viewed

Binary file (7.57 kB). View file

support_ops_env/graders/__pycache__/easy.cpython-314.pyc ADDED Viewed

Binary file (877 Bytes). View file

support_ops_env/graders/__pycache__/hard.cpython-314.pyc ADDED Viewed

Binary file (901 Bytes). View file

support_ops_env/graders/__pycache__/medium.cpython-314.pyc ADDED Viewed

Binary file (879 Bytes). View file

support_ops_env/graders/common.py CHANGED Viewed

@@ -7,8 +7,8 @@ from ..models import StateModel, TaskGrade, TaskSpec, TicketSpec
 # Scores must be strictly within (0, 1) — the submission grader rejects
 # exact 0.0 and 1.0.  Because all non-context components are binary,
 # a perfect or zero run would otherwise produce exactly 0.0 or 1.0.
-_SCORE_MIN = 1e-6
-_SCORE_MAX = 1.0 - 1e-6
 def _clamp(score: float) -> float:

 # Scores must be strictly within (0, 1) — the submission grader rejects
 # exact 0.0 and 1.0.  Because all non-context components are binary,
 # a perfect or zero run would otherwise produce exactly 0.0 or 1.0.
+_SCORE_MIN = 0.001
+_SCORE_MAX = 0.999
 def _clamp(score: float) -> float:

support_ops_env/tasks/__pycache__/__init__.cpython-314.pyc ADDED Viewed

Binary file (307 Bytes). View file

support_ops_env/tasks/__pycache__/loader.cpython-314.pyc ADDED Viewed

Binary file (2.61 kB). View file