File size: 1,679 Bytes
bcd8636
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
# Environment manifest: identity and human-readable summary.
name: data_detective
# Quoted so the version is always loaded as a string.
version: '1.0.0'
# Folded scalar (`>`): the lines below are joined with single spaces into one
# paragraph that ends with a single newline.
description: >
  DataDetective: A business incident investigation environment where
  AI agents use SQL queries to analyze a realistic e-commerce company
  database (TechMart) and uncover root causes of business problems.
  Covers 9 tasks spanning order analysis, product returns, customer
  churn, shipping ops, margin analysis, supplier quality, inventory
  stockouts, fraud detection, and retention.
# Maps each environment operation (reset, step, state) to the URL path
# registered for it.
# NOTE(review): presumably these are HTTP routes exposed by the environment
# server - confirm against the server implementation.
endpoints:
  reset: '/reset'
  step: '/step'
  state: '/state'
# Task catalog: one entry per investigation scenario.
# Each entry carries:
#   id          - unique snake_case identifier for the task
#   difficulty  - label; values used here: easy, medium, medium-hard, hard
#   description - one-line summary of the business incident
# Keep the task count quoted in the top-level `description` in sync when
# adding or removing entries.
tasks:
  - id: orders_drop
    difficulty: easy
    description: Order volume dropped sharply after a major promotion ended
  - id: returns_spike
    difficulty: medium
    description: Product returns spiking in a specific region due to defective SKU
  - id: customer_churn
    difficulty: hard
    description: Active customer count declining across specific segments
  - id: shipping_delay
    difficulty: medium-hard
    description: Customer satisfaction crisis driven by carrier delays in one region
  - id: revenue_paradox
    difficulty: hard
    # Separator restored: the original text had a bare double space where a
    # dash had been dropped.
    description: Revenue is up but profit is down - multi-causal margin erosion
  - id: supplier_quality
    difficulty: medium
    description: Systemic quality issues from a single supplier across multiple products
  - id: inventory_stockout
    difficulty: medium-hard
    description: Regional sales underperformance caused by warehouse stockout during promo
  - id: fraud_detection
    difficulty: hard
    description: Coordinated fraud ring of fake accounts placing high-value orders
  - id: repeat_purchase_decline
    difficulty: hard
    description: Repeat purchase rates collapsing while acquisition masks the problem