Update openenv.yaml
Browse files- openenv.yaml +18 -41
openenv.yaml
CHANGED
|
@@ -1,63 +1,40 @@
|
|
| 1 |
-
|
| 2 |
-
# OpenEnv Specification v1.0
|
| 3 |
-
# Meta x PyTorch Hackathon Submission
|
| 4 |
-
# ============================================================
|
| 5 |
-
|
| 6 |
-
name: email-gatekeeper
|
| 7 |
version: "1.0.0"
|
| 8 |
-
|
| 9 |
-
|
| 10 |
-
|
| 11 |
author: zerogravity
|
| 12 |
license: MIT
|
| 13 |
-
framework: gymnasium
|
| 14 |
python_requires: ">=3.10"
|
| 15 |
|
| 16 |
-
# ── Entry point ───────────────────────────────────────────────────────────────
|
| 17 |
-
# Note: 'env' is the name of your file and 'EmailTriageEnv' is the name of the class
|
| 18 |
entry_point: "env:EmailTriageEnv"
|
| 19 |
|
| 20 |
-
# ── Observation space ─────────────────────────────────────────────────────────
|
| 21 |
observation_space:
|
| 22 |
-
type:
|
| 23 |
-
|
| 24 |
-
|
| 25 |
-
|
| 26 |
-
|
|
|
|
|
|
|
|
|
|
| 27 |
|
| 28 |
-
# ── Action space ──────────────────────────────────────────────────────────────
|
| 29 |
action_space:
|
| 30 |
-
type:
|
| 31 |
-
|
|
|
|
|
|
|
| 32 |
|
| 33 |
-
# ── Tasks ─────────────────────────────────────────────────────────────────────
|
| 34 |
tasks:
|
| 35 |
- id: easy
|
| 36 |
-
difficulty: easy
|
| 37 |
-
num_emails: 4
|
| 38 |
-
target_score: 1.0
|
| 39 |
- id: medium
|
| 40 |
-
difficulty: medium
|
| 41 |
-
num_emails: 8
|
| 42 |
-
target_score: 1.0
|
| 43 |
- id: hard
|
| 44 |
-
difficulty: hard
|
| 45 |
-
num_emails: 16
|
| 46 |
-
target_score: 1.0
|
| 47 |
|
| 48 |
-
|
| 49 |
-
|
| 50 |
dependencies:
|
| 51 |
-
- gymnasium>=0.29.0
|
| 52 |
- numpy>=1.24.0
|
| 53 |
-
- pydantic>=2.0.0
|
| 54 |
-
- fastapi
|
| 55 |
-
- uvicorn
|
| 56 |
-
- gradio
|
| 57 |
-
- pyyaml
|
| 58 |
|
| 59 |
-
# ── Reproducibility ───────────────────────────────────────────────────────────
|
| 60 |
reproducibility:
|
| 61 |
-
seed: 42
|
| 62 |
deterministic: true
|
| 63 |
baseline_script: inference.py
|
|
|
|
| 1 |
+
name: email-triage-env
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 2 |
version: "1.0.0"
|
| 3 |
+
|
| 4 |
+
description: RL environment for email triage
|
| 5 |
+
|
| 6 |
author: zerogravity
|
| 7 |
license: MIT
|
|
|
|
| 8 |
python_requires: ">=3.10"
|
| 9 |
|
|
|
|
|
|
|
| 10 |
entry_point: "env:EmailTriageEnv"
|
| 11 |
|
|
|
|
| 12 |
observation_space:
|
| 13 |
+
type: object
|
| 14 |
+
properties:
|
| 15 |
+
description:
|
| 16 |
+
type: string
|
| 17 |
+
step:
|
| 18 |
+
type: integer
|
| 19 |
+
remaining:
|
| 20 |
+
type: integer
|
| 21 |
|
|
|
|
| 22 |
action_space:
|
| 23 |
+
type: array
|
| 24 |
+
items:
|
| 25 |
+
type: integer
|
| 26 |
+
length: 3
|
| 27 |
|
|
|
|
| 28 |
tasks:
|
| 29 |
- id: easy
|
|
|
|
|
|
|
|
|
|
| 30 |
- id: medium
|
|
|
|
|
|
|
|
|
|
| 31 |
- id: hard
|
|
|
|
|
|
|
|
|
|
| 32 |
|
| 33 |
+
reward_range: [0.0, 1.0]
|
| 34 |
+
|
| 35 |
dependencies:
|
|
|
|
| 36 |
- numpy>=1.24.0
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 37 |
|
|
|
|
| 38 |
reproducibility:
|
|
|
|
| 39 |
deterministic: true
|
| 40 |
baseline_script: inference.py
|