File size: 1,054 Bytes
569c142
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
# Environment manifest header: identity, packaging, and server entry point.
# NOTE(review): spec_version presumably selects the manifest schema
# revision — confirm against the tool that consumes this file.
spec_version: 1
name: disk_panic
description: 'SRE incident response RL environment — fix a production server with a full disk and crashing services without touching business-critical logs.'
# Quoted so the value is unambiguously a string for every parser.
version: '0.1.0'
author: yashppawar
type: space
runtime: fastapi
# NOTE(review): looks like a `module.path:attribute` reference to the
# server application object — confirm with the loader.
app: 'disk_panic.server.app:app'
port: 8000
# Task catalogue: one entry per task, each pairing a short id with a
# human-readable summary of what has to be accomplished.
tasks:
  - id: easy
    description: 'Free the disk by removing a bloated rotated log.'
  - id: medium
    description: 'Free the disk, restart the crashed app.service, preserve /var/log/audit.'
  # Per its description, this task includes the goals listed above it.
  - id: hard
    description: 'All of the above + tame a runaway writer via a logrotate config.'
# Shape of an action: a DiskPanicAction carrying a single field.
action_space:
  type: DiskPanicAction
  fields:
    # The value documents the field type and the commands it lists.
    command: 'str — a bash-like command (ls, df, du, cat, rm, find, sha256sum, systemctl, or `echo ... > path`)'
# Shape of an observation: a DiskPanicObservation with five fields.
# Each field value is a descriptive string that starts with the field type.
observation_space:
  type: DiskPanicObservation
  fields:
    stdout: 'str — output of the last command'
    df_output: 'str — simulated `df -h /` output'
    service_status: 'str — simulated systemctl state of app.service'
    task_id: 'str — current task (easy/medium/hard)'
    # Only the type is given; NOTE(review): presumably a step counter — confirm.
    step: 'int'