File size: 792 Bytes
36dac03
 
 
 
 
 
 
 
 
 
486044c
 
36dac03
 
 
 
 
 
 
 
 
 
 
486044c
36dac03
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
# Environment manifest: identity of the environment and how it is served.
# NOTE(review): field meanings below are inferred from the key names —
# confirm against the schema of the tool that consumes this file.
spec_version: 1
name: api_debug_env
type: space
runtime: fastapi
# Looks like a `module.path:attribute` reference to the application object
# (TODO confirm). Quoted so the embedded colon is unmistakably part of the
# string; the parsed value is unchanged.
app: 'server.app:app'
port: 8000

# Human-readable summary of the environment. Folded scalar (`>`): the line
# breaks below are joined with single spaces and one trailing newline is kept.
description: >
  API Integration Debugging Environment — an AI agent must diagnose and
  fix broken API integrations by reading error logs, inspecting
  configurations, and submitting corrected API calls. Supports 3
  difficulty levels with seed-based randomization for reproducible
  evaluation.

# Task catalogue: three entries (easy, medium, hard), each with an `id`, a
# one-line `description`, and a `max_steps` value that grows with difficulty.
# NOTE(review): `max_steps` is presumably the per-episode step budget —
# confirm against the consumer.
# Descriptions use `>-` (folded, no trailing newline) so each stays a single
# line at load time while fitting within 80 columns here.
tasks:
  - id: easy
    description: >-
      Fix missing Authorization header and wrong Content-Type in a
      payment API client
    max_steps: 15

  - id: medium
    description: >-
      Debug a webhook chain with rate limiting, retry, and signature
      validation failures
    max_steps: 25

  - id: hard
    description: >-
      Diagnose cascading failures across a 5-service order processing
      pipeline
    max_steps: 40