Spaces:

Siteshcodes
/

bug-triage-env

Sleeping

App Files Files Community

Siteshcodes committed on Apr 4

Commit

6ff231e

1 Parent(s): 2824eb9

fix: auto-init bug in __init__ for stateless HTTP server

Browse files

Files changed (1) hide show

server/environment.py +15 -45

server/environment.py CHANGED Viewed

@@ -4,11 +4,9 @@ sys.path.insert(0, "/app")
 sys.path.insert(0, "/app/server")
 import uuid
-import random
-from typing import Optional
 from openenv.core.env_server.interfaces import Environment
 from model import TriageAction, TriageObservation, TriageState, BugReport
-from task import TASKS, grade_action, sample_bug
 TASK_PROGRESSION = ["easy", "medium", "hard"]
@@ -23,8 +21,8 @@ class BugTriageEnvironment(Environment):
       Step 2 → medium task (priority + labels + team)
       Step 3 → hard task   (priority + labels + team + milestone)
-    Each reset() picks a fresh random bug from each task pool,
-    so the agent never sees the same sequence twice.
     """
     def __init__(self):
@@ -34,24 +32,21 @@ class BugTriageEnvironment(Environment):
             step_count=0,
             total_score=0.0,
             tasks_completed=[],
-    )
-        self._current_bug: Optional[BugReport] = None
         self._current_task_key: str = "easy"
         self._episode_done: bool = False
-    # ─────────────────────────────────────────
-    # reset()
-    # ─────────────────────────────────────────
     def reset(self) -> TriageObservation:
-        """Start a fresh episode. Picks a random bug from the easy pool."""
         self._state = TriageState(
-           episode_id=str(uuid.uuid4()),
-           current_task="easy",
-           step_count=0,
-           total_score=0.0,
-           tasks_completed=[],
-    )
         self._current_task_key = "easy"
         self._episode_done = False
         self._current_bug = sample_bug("easy")
@@ -65,21 +60,9 @@ class BugTriageEnvironment(Environment):
             reward=0.0,
         )
-    # ─────────────────────────────────────────
-    # step()
-    # ─────────────────────────────────────────
     def step(self, action: TriageAction) -> TriageObservation:
-        """
-        Process the agent's triage action and return the next observation.
-        - Grades the current task
-        - Advances to next task (easy → medium → hard)
-        - Returns done=True after the hard task is graded
-        """
-        # Guard: prevent stepping after episode is over
         if self._episode_done:
-            assert self._current_bug is not None
             return TriageObservation(
                 bug_report=self._current_bug,
                 task_id=self._current_task_key,
@@ -89,28 +72,21 @@ class BugTriageEnvironment(Environment):
                 reward=0.0,
             )
-        # Guard: step() must be called after reset()
-        assert self._current_bug is not None, "step() called before reset()"
         self._state.step_count += 1
         task_key = self._current_task_key
-        # Grade the action for this task
         score, feedback = grade_action(task_key, self._current_bug, action)
         self._state.total_score += score
         self._state.tasks_completed.append(task_key)
-        # Determine progression
         current_idx = TASK_PROGRESSION.index(task_key)
-        done = current_idx == len(TASK_PROGRESSION) - 1  # True after hard task
         if done:
-            # Episode complete — keep current bug/task for final observation
             self._episode_done = True
             next_bug = self._current_bug
             next_task = self._current_task_key
         else:
-            # Advance to next task with a fresh random bug
             next_task = TASK_PROGRESSION[current_idx + 1]
             next_bug = sample_bug(next_task)
             self._current_task_key = next_task
@@ -127,15 +103,9 @@ class BugTriageEnvironment(Environment):
             reward=round(score, 3),
         )
-    # ─────────────────────────────────────────
-    # state() — both property and method forms
-    # ─────────────────────────────────────────
     @property
     def state(self) -> TriageState:
-        """Property form — used internally."""
         return self._state
     def get_state(self) -> TriageState:
-        """Method form — satisfies OpenEnv spec's state() interface."""
         return self._state

 sys.path.insert(0, "/app/server")
 import uuid
 from openenv.core.env_server.interfaces import Environment
 from model import TriageAction, TriageObservation, TriageState, BugReport
+from task import grade_action, sample_bug
 TASK_PROGRESSION = ["easy", "medium", "hard"]
       Step 2 → medium task (priority + labels + team)
       Step 3 → hard task   (priority + labels + team + milestone)
+    NOTE: OpenEnv HTTP server creates a new environment instance per
+    request. So __init__ auto-initializes a bug so step() always works.
     """
     def __init__(self):
             step_count=0,
             total_score=0.0,
             tasks_completed=[],
+        )
         self._current_task_key: str = "easy"
         self._episode_done: bool = False
+        # Auto-init bug so step() works on stateless HTTP server
+        self._current_bug: BugReport = sample_bug("easy")
     def reset(self) -> TriageObservation:
+        """Start a fresh episode."""
         self._state = TriageState(
+            episode_id=str(uuid.uuid4()),
+            current_task="easy",
+            step_count=0,
+            total_score=0.0,
+            tasks_completed=[],
+        )
         self._current_task_key = "easy"
         self._episode_done = False
         self._current_bug = sample_bug("easy")
             reward=0.0,
         )
     def step(self, action: TriageAction) -> TriageObservation:
+        """Process the agent's triage action."""
         if self._episode_done:
             return TriageObservation(
                 bug_report=self._current_bug,
                 task_id=self._current_task_key,
                 reward=0.0,
             )
         self._state.step_count += 1
         task_key = self._current_task_key
         score, feedback = grade_action(task_key, self._current_bug, action)
         self._state.total_score += score
         self._state.tasks_completed.append(task_key)
         current_idx = TASK_PROGRESSION.index(task_key)
+        done = current_idx == len(TASK_PROGRESSION) - 1
         if done:
             self._episode_done = True
             next_bug = self._current_bug
             next_task = self._current_task_key
         else:
             next_task = TASK_PROGRESSION[current_idx + 1]
             next_bug = sample_bug(next_task)
             self._current_task_key = next_task
             reward=round(score, 3),
         )
     @property
     def state(self) -> TriageState:
         return self._state
     def get_state(self) -> TriageState:
         return self._state

fix: auto-init bug in __init__ for stateless HTTP server

fix: auto-init bug in __init__ for stateless HTTP server