File size: 1,650 Bytes
85768b6
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
openenv_v: 1.0
name: email_triage_assistant
description: "A real-world simulation of email triage and scheduling. Not a toy environment."
category: "Productivity"
tags: ["Agentic", "Email", "Scheduling", "Triage"]

tasks:
  - id: 1
    name: "Spam Guard (Level 1)"
    description: "Identify and archive a clear spam email ($1M claims) to the Spam folder."
    motivation: "Reduces inbox clutter and enhances cybersecurity posture by removing phishing threats."
    difficulty: "easy"
    reward_range: [0.0, 1.0]
    expected_behavior: "Agent identifies the sender 'spam@bott.io' and correctly applies the MOVE action to the 'Spam' target folder."
  - id: 2
    name: "Organization Workflow (Level 2)"
    description: "Categorize multi-topic emails from Inbox into 'Work' and 'Archive' folders."
    motivation: "Standard professional office workflow to maintain a clear organizational structure."
    difficulty: "medium"
    reward_range: [0.0, 1.0]
    expected_behavior: "Agent sorts 'Urgent: Project Update' and 'Daily Briefing' email IDs correctly in a single trajectory."
  - id: 3
    name: "Calendar Coordinator (Level 3)"
    description: "Schedule a meeting reply while avoiding conflicts (Busy 10 AM, Free 2 PM)."
    motivation: "Requires high-level logical reasoning and information extraction from the 'Calendar' observation field."
    difficulty: "hard"
    reward_range: [0.0, 1.0]
    expected_behavior: "Agent extracts busy times from the calendar and generates a SCHEDULE action at a non-conflicting time (2 PM)."

endpoints:
  reset: /reset
  step: /step
  state: /state

docker:
  build: ./Dockerfile
  memory: 8gb
  vcpu: 2