Spaces:

anonymousDevil
/

cognitive-load-manager

Sleeping

App Files Files Community

AE-Shree commited on Apr 12

Commit

33e9ed5

1 Parent(s): 2f28f2f

Bhagavan mera madad karo 🙏

Browse files

Files changed (2) hide show

backend/main.py +71 -22
openenv.yaml +5 -48

backend/main.py CHANGED Viewed

@@ -25,49 +25,69 @@ from models import (
     CLMEnvironment,
 )
 # ── OpenEnv-compatible Action / Observation / State models ──────────────────
 class CLMAction(OEAction):
-    """Action for the Cognitive Load Manager environment."""
     type: str = Field(description="Action type: work, break, switch, or delay")
     task_id: Optional[str] = Field(default=None, description="Task ID to act on")
     model_config = {"extra": "allow"}
 class CLMObservation(OEObservation):
-    """Observation from the Cognitive Load Manager environment."""
     tasks: List[Dict[str, Any]] = Field(default_factory=list)
     visible_state: Dict[str, Any] = Field(default_factory=dict)
     time_step: int = Field(default=0)
     model_config = {"extra": "allow"}
 class CLMState(OEState):
-    """State for the Cognitive Load Manager environment."""
     energy: float = Field(default=1.0)
     stress: float = Field(default=0.0)
     fatigue: float = Field(default=0.0)
     current_task_id: Optional[str] = Field(default=None)
     tasks: List[Dict[str, Any]] = Field(default_factory=list)
     model_config = {"extra": "allow"}
 # ── OpenEnv Environment wrapper ─────────────────────────────────────────────
 class CLMEnvWrapper(Environment):
-    """
-    Cognitive Load Manager wrapped as an OpenEnv-compliant environment.
-    Three difficulty levels via the task_id reset parameter:
-      - easy:   2 tasks, no deadlines
-      - medium: 5 tasks with deadlines
-      - hard:   8 tasks with tight deadlines
-    """
     SUPPORTS_CONCURRENT_SESSIONS = True
     def __init__(self):
@@ -75,9 +95,10 @@ class CLMEnvWrapper(Environment):
         level = os.getenv("CLM_LEVEL", "easy")
         tasks = generate_tasks(level)
         self._env = CLMEnvironment(tasks=tasks, max_steps=50)
-        self._final_score: float = 0.0
-    def _to_oe_obs(self, obs: ModelObservation, done: bool = False, reward: Optional[float] = None, info: Optional[dict] = None) -> CLMObservation:
         return CLMObservation(
             tasks=[t.model_dump() for t in obs.tasks],
             visible_state=obs.visible_state.model_dump(),
@@ -87,12 +108,13 @@ class CLMEnvWrapper(Environment):
             metadata=info or {},
         )
-    def reset(self, seed: Optional[int] = None, episode_id: Optional[str] = None, task_id: str = "easy", **kwargs) -> CLMObservation:
         if task_id not in ("easy", "medium", "hard"):
             task_id = "easy"
         tasks = generate_tasks(task_id)
         self._env = CLMEnvironment(tasks=tasks, max_steps=50)
-        self._final_score = 0.0
         obs = self._env.reset()
         return self._to_oe_obs(obs)
@@ -100,13 +122,15 @@ class CLMEnvWrapper(Environment):
         model_action = ModelAction(type=action.type, task_id=action.task_id)
         obs, reward, done, info = self._env.step(model_action)
         if done:
-            self._final_score = deterministic_grader(
                 self._env.state.tasks,
                 self._env.state.time_step,
                 self._env.state.energy,
             )
             info["final_score"] = self._final_score
-        return self._to_oe_obs(obs, done=done, reward=float(reward), info=info)
     @property
     def state(self) -> CLMState:
@@ -137,7 +161,7 @@ class CLMEnvWrapper(Environment):
         pass
-# ── Build FastAPI app via OpenEnv HTTPEnvServer ──────────────────────────────
 def build_app() -> FastAPI:
     server = HTTPEnvServer(
@@ -165,6 +189,31 @@ def build_app() -> FastAPI:
     )
     server.register_routes(_app)
     return _app

     CLMEnvironment,
 )
+_SCORE_MIN = 0.01
+_SCORE_MAX = 0.99
+def _safe_score(raw: float) -> float:
+    """Clamp to strictly open interval (0, 1). Never returns 0.0 or 1.0."""
+    try:
+        s = float(raw)
+    except (TypeError, ValueError):
+        return _SCORE_MIN
+    return round(max(_SCORE_MIN, min(_SCORE_MAX, s)), 4)
+def _grade_task(difficulty: str) -> dict:
+    """Run deterministic grader on a fresh environment for the given difficulty."""
+    try:
+        tasks = generate_tasks(difficulty)
+        env = CLMEnvironment(tasks=tasks, max_steps=50)
+        env.reset()
+        score = deterministic_grader(
+            env.state.tasks,
+            env.state.time_step,
+            env.state.energy,
+        )
+        score = _safe_score(score)
+    except Exception:
+        score = _SCORE_MIN
+    return {
+        "task_id": difficulty,
+        "reward": score,
+        "score": score,
+        "done": False,
+        "grader_message": f"CLM deterministic grader for difficulty={difficulty}",
+    }
 # ── OpenEnv-compatible Action / Observation / State models ──────────────────
 class CLMAction(OEAction):
     type: str = Field(description="Action type: work, break, switch, or delay")
     task_id: Optional[str] = Field(default=None, description="Task ID to act on")
     model_config = {"extra": "allow"}
 class CLMObservation(OEObservation):
     tasks: List[Dict[str, Any]] = Field(default_factory=list)
     visible_state: Dict[str, Any] = Field(default_factory=dict)
     time_step: int = Field(default=0)
     model_config = {"extra": "allow"}
 class CLMState(OEState):
     energy: float = Field(default=1.0)
     stress: float = Field(default=0.0)
     fatigue: float = Field(default=0.0)
     current_task_id: Optional[str] = Field(default=None)
     tasks: List[Dict[str, Any]] = Field(default_factory=list)
     model_config = {"extra": "allow"}
 # ── OpenEnv Environment wrapper ─────────────────────────────────────────────
 class CLMEnvWrapper(Environment):
     SUPPORTS_CONCURRENT_SESSIONS = True
     def __init__(self):
         level = os.getenv("CLM_LEVEL", "easy")
         tasks = generate_tasks(level)
         self._env = CLMEnvironment(tasks=tasks, max_steps=50)
+        self._final_score: float = _SCORE_MIN
+    def _to_oe_obs(self, obs: ModelObservation, done: bool = False,
+                   reward: Optional[float] = None, info: Optional[dict] = None) -> CLMObservation:
         return CLMObservation(
             tasks=[t.model_dump() for t in obs.tasks],
             visible_state=obs.visible_state.model_dump(),
             metadata=info or {},
         )
+    def reset(self, seed: Optional[int] = None, episode_id: Optional[str] = None,
+              task_id: str = "easy", **kwargs) -> CLMObservation:
         if task_id not in ("easy", "medium", "hard"):
             task_id = "easy"
         tasks = generate_tasks(task_id)
         self._env = CLMEnvironment(tasks=tasks, max_steps=50)
+        self._final_score = _SCORE_MIN
         obs = self._env.reset()
         return self._to_oe_obs(obs)
         model_action = ModelAction(type=action.type, task_id=action.task_id)
         obs, reward, done, info = self._env.step(model_action)
         if done:
+            raw_score = deterministic_grader(
                 self._env.state.tasks,
                 self._env.state.time_step,
                 self._env.state.energy,
             )
+            self._final_score = _safe_score(raw_score)
             info["final_score"] = self._final_score
+        safe_reward = _safe_score(float(reward))
+        return self._to_oe_obs(obs, done=done, reward=safe_reward, info=info)
     @property
     def state(self) -> CLMState:
         pass
+# ── Build FastAPI app ────────────────────────────────────────────────────────
 def build_app() -> FastAPI:
     server = HTTPEnvServer(
     )
     server.register_routes(_app)
+    # ── Grade endpoints (required by hackathon Phase 2 validator) ────────────
+    # Validator calls GET /grader and GET /grade/{task_id} to score each task.
+    # Scores must be strictly in (0.01, 0.99) — never 0.0 or 1.0.
+    @_app.get("/grader", tags=["Grader"])
+    async def get_grader_score():
+        """General grader endpoint — returns score for 'easy' difficulty."""
+        return _grade_task("easy")
+    @_app.get("/grade/easy", tags=["Grader"])
+    async def grade_easy():
+        """Grade the 'easy' task (2 tasks, no deadlines)."""
+        return _grade_task("easy")
+    @_app.get("/grade/medium", tags=["Grader"])
+    async def grade_medium():
+        """Grade the 'medium' task (5 tasks with deadlines)."""
+        return _grade_task("medium")
+    @_app.get("/grade/hard", tags=["Grader"])
+    async def grade_hard():
+        """Grade the 'hard' task (8 tasks with tight deadlines)."""
+        return _grade_task("hard")
     return _app

openenv.yaml CHANGED Viewed

@@ -8,67 +8,30 @@ description: Cognitive Load Manager (CLM) simulates human cognitive load (energy
 version: "1.0.0"
 endpoints:
-  health: /
   reset:  /reset
   step:   /step
   state:  /state
-schema:
-  observation:
-    type: object
-    properties:
-      tasks:
-        type: array
-        items:
-          type: object
-          properties:
-            id: { type: string }
-            difficulty: { type: string }
-            progress: { type: number }
-            deadline: { type: number, nullable: true }
-      visible_state:
-        type: object
-        properties:
-          fatigue_level: { type: string }
-          stress_warning: { type: boolean }
-      time_step: { type: integer }
-  action:
-    type: object
-    properties:
-      type: { type: string, enum: ["work", "break", "switch", "delay"] }
-      task_id: { type: string, nullable: true }
-  reward:
-    type: number
-graders:
-  deterministic_grader:
-    description: "Evaluates agent performance based on task completion, deadline adherence, and energy efficiency. Score strictly in (0.01, 0.99)."
-    fn: "models.grader"
 tasks:
   - id: easy
     difficulty: easy
     description: "2 easy tasks with no deadlines. Agent must complete both tasks without burning out."
     max_steps: 50
-    grader:
-      fn: "models.grader"
-      description: "Score strictly in (0.01, 0.99). Grades on completion rate, deadline adherence, and energy efficiency."
   - id: medium
     difficulty: medium
     description: "5 medium tasks with deadlines. Agent must balance speed and energy to meet deadlines."
     max_steps: 50
-    grader:
-      fn: "models.grader"
-      description: "Score strictly in (0.01, 0.99). Grades on completion rate, deadline adherence, and energy efficiency."
   - id: hard
     difficulty: hard
     description: "8 hard tasks with tight deadlines and hidden fatigue mechanics. Agent must manage stress and interruptions."
     max_steps: 50
-    grader:
-      fn: "models.grader"
-      description: "Score strictly in (0.01, 0.99). Grades on completion rate, deadline adherence, and energy efficiency."
 scoring:
   reward_range: [0.01, 0.99]
@@ -76,9 +39,3 @@ scoring:
   score_formula: deterministic_grader
   notes: >
     All task scores are strictly within (0.01, 0.99) — never exactly 0.0 or 1.0.
-    Grader evaluates completion rate, deadline adherence, and energy efficiency.
-constraints:
-  max_runtime_seconds: 600
-  max_memory_gb: 4
-  max_vcpu: 2

 version: "1.0.0"
 endpoints:
+  health: /health
   reset:  /reset
   step:   /step
   state:  /state
+  grade:  /grader
 tasks:
   - id: easy
     difficulty: easy
     description: "2 easy tasks with no deadlines. Agent must complete both tasks without burning out."
     max_steps: 50
+    grader: "models:grader"
   - id: medium
     difficulty: medium
     description: "5 medium tasks with deadlines. Agent must balance speed and energy to meet deadlines."
     max_steps: 50
+    grader: "models:grader"
   - id: hard
     difficulty: hard
     description: "8 hard tasks with tight deadlines and hidden fatigue mechanics. Agent must manage stress and interruptions."
     max_steps: 50
+    grader: "models:grader"
 scoring:
   reward_range: [0.01, 0.99]
   score_formula: deterministic_grader
   notes: >
     All task scores are strictly within (0.01, 0.99) — never exactly 0.0 or 1.0.