File size: 1,379 Bytes
f89b1ac
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
# Top-level manifest metadata: identity of the environment and how it is served.
spec_version: 1
name: dataops_env
# Quoted so the value stays a string even if it is later shortened to a
# float-looking form such as 1.0.
version: '1.0.0'
# Folded scalar (>-): the lines below are joined with single spaces and the
# trailing newline is stripped, so the parsed value is one line of text.
description: >-
  Seeded enterprise DataOps benchmark with isolated sessions,
  deterministic graders, and three escalating remediation tasks.
type: space
runtime: fastapi
# NOTE(review): looks like a "module:attribute" path to the application
# object; confirm against the consuming tool. Quoted because the value
# contains a colon.
app: 'server.app:app'
port: 7860
# Task catalogue: each entry declares an id, a difficulty tier, descriptive
# text, and the list of actions permitted for that task.
tasks:
  # Easy tier: ExecuteSQL is the only permitted action.
  - id: task_1_easy_anomaly
    name: Delete Corrupted Transaction Rows
    difficulty: easy
    # Folded scalar (>-): parsed as a single line with no trailing newline.
    description: >-
      Inspect a seeded transaction table and remove only the rows whose
      amount is NULL, preserving legitimate non-null edge values.
    benchmark_focus: Careful data cleanup without collateral damage.
    allowed_actions:
      - ExecuteSQL
  # Medium tier: file read/write and script execution are permitted; the
  # action list contains no SQL or email action.
  - id: task_2_medium_syntax
    name: Repair Seeded Pipeline Script
    difficulty: medium
    # Folded scalars (>-): each is parsed as a single line with no trailing
    # newline.
    description: >-
      Repair a seeded ETL normalization script and verify it against
      visible and hidden seeded batches.
    benchmark_focus: >-
      Code reading, precise repair, and generalization beyond the demo
      batch.
    allowed_actions:
      - ReadFile
      - WriteFile
      - RunScript
  # Hard tier: adds SendEmail on top of the SQL, file, and script actions.
  - id: task_3_hard_e2e
    name: Resolve Revenue Reporting Incident
    difficulty: hard
    # Folded scalars (>-): each is parsed as a single line with no trailing
    # newline.
    description: >-
      Extract a seeded reporting slice, repair the formatter, and send the
      exact generated report.
    benchmark_focus: >-
      End-to-end data extraction, file repair, and communication with
      provenance.
    allowed_actions:
      - ExecuteSQL
      - ReadFile
      - WriteFile
      - RunScript
      - SendEmail