# OPENSPEC_Hackhathon / openenv.yaml
# SushCodex's picture
# Upload 14 files
# 85768b6 verified
# Top-level identity and catalog metadata for this environment.
# NOTE(review): openenv_v is an unquoted 1.0 and therefore loads as a float;
# quote it only if the consumer expects a version string — confirm first.
openenv_v: 1.0
name: email_triage_assistant
description: 'A real-world simulation of email triage and scheduling. Not a toy environment.'
category: 'Productivity'
# Free-form labels attached to the environment.
tags:
  - 'Agentic'
  - 'Email'
  - 'Scheduling'
  - 'Triage'
# Task catalog: three tasks ordered easy -> medium -> hard.
# Every entry carries the same set of keys, and each declares a reward_range
# of [0.0, 1.0]. Per-task keys are nested under their list item so they do not
# collide with the top-level `name` / `description` keys.
# Long prose values use folded scalars (`>-`): line breaks fold to single
# spaces and no trailing newline is kept, so each value is one line of text.
tasks:
  - id: 1
    name: "Spam Guard (Level 1)"
    description: "Identify and archive a clear spam email ($1M claims) to the Spam folder."
    motivation: >-
      Reduces inbox clutter and enhances cybersecurity posture by removing
      phishing threats.
    difficulty: "easy"
    reward_range: [0.0, 1.0]
    expected_behavior: >-
      Agent identifies the sender 'spam@bott.io' and correctly applies the MOVE
      action to the 'Spam' target folder.
  - id: 2
    name: "Organization Workflow (Level 2)"
    description: "Categorize multi-topic emails from Inbox into 'Work' and 'Archive' folders."
    motivation: >-
      Standard professional office workflow to maintain a clear organizational
      structure.
    difficulty: "medium"
    reward_range: [0.0, 1.0]
    expected_behavior: >-
      Agent sorts 'Urgent: Project Update' and 'Daily Briefing' email IDs
      correctly in a single trajectory.
  - id: 3
    name: "Calendar Coordinator (Level 3)"
    description: "Schedule a meeting reply while avoiding conflicts (Busy 10 AM, Free 2 PM)."
    motivation: >-
      Requires high-level logical reasoning and information extraction from the
      'Calendar' observation field.
    difficulty: "hard"
    reward_range: [0.0, 1.0]
    expected_behavior: >-
      Agent extracts busy times from the calendar and generates a SCHEDULE
      action at a non-conflicting time (2 PM).
# Route paths for the reset, step and state operations.
# NOTE(review): presumably HTTP paths served by the environment's server —
# confirm against the server implementation.
# The three routes are nested under `endpoints` so that the key is a mapping
# rather than null.
endpoints:
  reset: /reset
  step: /step
  state: /state
# Container settings: the Dockerfile to build from plus resource values.
# NOTE(review): `8gb` loads as a plain string and `2` as an integer; the units
# (presumably gigabytes of RAM and virtual CPU count) and whether these are
# requests or hard limits depend on the consuming platform — confirm.
docker:
  build: ./Dockerfile
  memory: 8gb
  vcpu: 2