Spaces:
Sleeping
Sleeping
File size: 2,121 Bytes
6e72b95 e75c8ce 351158b e75c8ce 351158b e75c8ce 351158b e75c8ce 351158b 6e72b95 e75c8ce 6e72b95 e75c8ce | 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 | import random
from env.task_graders import TASK_AGENT_GRADERS
# Declared for GET /tasks + openenv.yaml (Phase 1 task/grader discovery).
# One manifest record per difficulty tier. Every record shares the same step
# budget, grader flags and score range; only the name/difficulty label, the
# description and the grader entry point differ between tiers.
TASK_MANIFEST = [
    {
        "name": tier,
        "description": blurb,
        "difficulty": tier,
        "max_steps": 10,
        "grader": True,
        "grader_kind": "programmatic",
        "grader_callable": grader_path,
        # Built inside the comprehension so each record owns its own list.
        "score_range": [0.0, 1.0],
    }
    for tier, blurb, grader_path in (
        (
            "easy",
            "Fewer cache items and low volatility; easier to infer staleness from noisy observations.",
            "env.task_graders:easy_agent_grader",
        ),
        (
            "medium",
            "More items and moderate volatility; invalidation vs keep tradeoffs matter more.",
            "env.task_graders:medium_agent_grader",
        ),
        (
            "hard",
            "Most items and high volatility; staleness signal is noisy and costly mistakes are easier.",
            "env.task_graders:hard_agent_grader",
        ),
    )
]
def get_task(task_id):
    """Return the ``num_items`` / ``volatility`` settings for *task_id*.

    Recognised ids are ``"easy"``, ``"medium"`` and ``"hard"``. Any other
    value yields the fallback settings (3 items, volatility 0.3) instead of
    raising. A new dict is built on every call.
    """
    presets = (
        ("easy", 2, 0.1),
        ("medium", 3, 0.4),
        ("hard", 4, 0.8),
    )
    # Compare with == in declaration order rather than hashing task_id, so
    # unhashable ids still reach the fallback below.
    for label, item_count, volatility in presets:
        if task_id == label:
            return {"num_items": item_count, "volatility": volatility}
    return {"num_items": 3, "volatility": 0.3}
def sample_task(rng=None):
    """Pick one of ``"easy"``, ``"medium"`` or ``"hard"``.

    Args:
        rng: Object exposing a ``choice(seq)`` method, used to make the
            pick. When ``None``, the ``random`` module itself is used.

    Returns:
        The task id chosen by ``choice``.
    """
    if rng is None:
        # No generator supplied: fall back to the module-level functions.
        rng = random
    candidates = ["easy", "medium", "hard"]
    return rng.choice(candidates)
def list_graders():
    """Describe every entry in ``TASK_AGENT_GRADERS``.

    Returns:
        A list with one dict per entry, in mapping order, holding:
        ``"task"`` (the mapping key), ``"grader_enabled"`` (``True`` when
        the mapped value is not ``None``) and ``"callable"`` (the value's
        ``__name__``, or ``str(value)`` when it has no such attribute).
    """
    summaries = []
    for task_name, grader in TASK_AGENT_GRADERS.items():
        entry = {
            "task": task_name,
            "grader_enabled": grader is not None,
            "callable": getattr(grader, "__name__", str(grader)),
        }
        summaries.append(entry)
    return summaries
|