File size: 1,794 Bytes
d416acc
b9b1184
d416acc
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2fb512c
d416acc
 
 
 
2fb512c
d416acc
 
 
 
2fb512c
d416acc
 
 
 
2fb512c
d416acc
 
 
 
2fb512c
d416acc
 
 
 
2fb512c
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
# Manifest metadata: identifier, version and one-line summary of this package.
name: api-triage-agent
# Three dot-separated components, so YAML loads this as a string, not a float.
version: 1.0.0
description: AI agent debugs API failures using curriculum learning

# Environment binding.
# NOTE(review): `class` looks like a dotted import path to the environment
# implementation — confirm how the loader resolves it.
environment:
  class: environment.api_triage_env.APITriageEnv
  # Step cap handed to the environment; presumably per episode — TODO confirm.
  max_steps: 10

# Observation fields, each mapped to a type name.
# NOTE(review): the type names (int, str, list, bool) are ordinary strings at
# the YAML level; how the consumer interprets them is not visible here.
observation_space:
  step: int
  # Same name as environment.max_steps; presumably mirrors that value — confirm.
  max_steps: int
  incident_summary: str
  # Element type of the list is not declared here.
  logs: list
  response_code: int
  fix_applied: bool
  is_resolved: bool

# Names of the discrete actions available to the agent.
# NOTE(review): several names appear to line up with the fixes described in
# the `tasks` entries (refresh_token, add_field, wait_retry, change_endpoint,
# escalate) — confirm the mapping against the environment code.
action_space:
  - inspect_logs
  - inspect_request
  - refresh_token
  - add_field
  - wait_retry
  - change_endpoint
  - escalate
  - resolve

# Two-element list of integers; presumably [min, max] reward bounds.
# NOTE(review): whether this bounds per-step or cumulative reward is not
# stated here — confirm against the environment.
reward_range: [-20, 20]

# Task catalogue: one entry per API failure scenario.
# Each entry carries an id, a display name, a description, a difficulty label
# (easy / medium / hard) and a grader reference.
# NOTE(review): `grader` values use a `module.path:function` shape —
# presumably resolved by the evaluation harness; confirm.
tasks:
  # --- easy ---
  - id: 'auth_error'
    name: 'Authentication Error'
    description: 'Diagnose and fix a 401 Unauthorized error caused by an expired API key'
    difficulty: 'easy'
    grader: 'tasks.auth_error.grader:grade'

  - id: 'missing_fields'
    name: 'Missing Field Error'
    description: 'Diagnose and fix a 400 Bad Request error caused by a missing required field'
    difficulty: 'easy'
    grader: 'tasks.missing_fields.grader:grade'

  # --- medium ---
  - id: 'rate_limit'
    name: 'Rate Limit Error'
    description: 'Diagnose and fix a 429 Too Many Requests error by applying retry logic'
    difficulty: 'medium'
    grader: 'tasks.rate_limit.grader:grade'

  - id: 'timeout'
    name: 'Timeout Error'
    description: 'Diagnose and fix a 408 Request Timeout error by applying retry with backoff'
    difficulty: 'medium'
    grader: 'tasks.timeout.grader:grade'

  - id: 'wrong_endpoint'
    name: 'Wrong Endpoint Error'
    description: 'Diagnose and fix a 404 Not Found error by changing to the correct endpoint'
    difficulty: 'medium'
    grader: 'tasks.wrong_endpoint.grader:grade'

  # --- hard ---
  - id: 'server_error'
    name: 'Server Error'
    description: 'Diagnose and handle a 500 Internal Server Error by escalating appropriately'
    difficulty: 'hard'
    grader: 'tasks.server_error.grader:grade'