[
  {
    "task_id": "hard_queue_triage",
    "difficulty": "hard",
    "title": "Mixed Support Queue Triage",
    "description": "Prioritize a small queue of heterogeneous support tickets under SLA pressure and route each one correctly.",
    "instruction": "Inspect the queue, gather missing context where useful, assign the right priority and route for each ticket, set a valid resolution, rank the queue from most urgent to least urgent, and finalize.",
    "max_steps": 24,
    "queue_mode": true,
    "gold_queue_order": [
      "T2",
      "T3",
      "T1"
    ],
    "grader_name": "hard_support_queue",
    "tickets": [
      {
        "ticket_id": "T1",
        "summary": "Customer reports a duplicate charge on a subscription renewal and asks when the refund will land.",
        "visible_context": {
          "customer_tier": "consumer",
          "surface": "subscriptions",
          "sla_hours_remaining": "24"
        },
        "hidden_context": {
          "payment_status": "The duplicate charge was confirmed and is automatically refundable.",
          "refund_status": "No refund has been issued yet.",
          "risk_flags": "No fraud indicators or account compromise signals are present."
        },
        "required_context": [
          "payment_status"
        ],
        "gold_priority": "normal",
        "gold_route": "billing_refunds",
        "gold_resolution": "approve_refund",
        "gold_escalation_team": null
      },
      {
        "ticket_id": "T2",
        "summary": "Advertiser cannot log in, says unfamiliar campaigns are spending rapidly, and fears the account was taken over.",
        "visible_context": {
          "customer_tier": "managed_advertiser",
          "surface": "ads_manager",
          "sla_hours_remaining": "1"
        },
        "hidden_context": {
          "account_security": "Two new devices were added and recovery email was changed 30 minutes ago.",
          "billing_activity": "Spending accelerated to $1,900 in the last hour.",
          "risk_flags": "Account takeover risk score is critical."
        },
        "required_context": [
          "account_security",
          "billing_activity"
        ],
        "gold_priority": "urgent",
        "gold_route": "account_security",
        "gold_resolution": "temporary_lock_and_manual_recovery",
        "gold_escalation_team": "security_specialist"
      },
      {
        "ticket_id": "T3",
        "summary": "Verified creator appeals a content moderation decision because a sponsored campaign launches tomorrow and monetization is paused.",
        "visible_context": {
          "customer_tier": "verified_creator",
          "surface": "content_appeals",
          "sla_hours_remaining": "4"
        },
        "hidden_context": {
          "appeal_state": "The content was auto-removed for policy ambiguity and has not been reviewed by a human yet.",
          "campaign_deadline": "The sponsored campaign begins in 18 hours.",
          "account_history": "No previous policy strikes or abuse reports."
        },
        "required_context": [
          "appeal_state",
          "campaign_deadline"
        ],
        "gold_priority": "high",
        "gold_route": "policy_appeals",
        "gold_resolution": "expedited_human_review",
        "gold_escalation_team": null
      }
    ]
  }
]