---
# Environment manifest for sysadmin-env.
#
# NOTE(review): this file was restored to block style from a version whose
# line breaks and indentation had been lost. Keys and values are unchanged;
# the nesting below was reconstructed from key order. In particular, confirm
# against the consumer's schema that entry_point and the *_endpoint keys
# belong under `runtime` and not at the top level.

name: sysadmin-env
# Quoted so the version stays a string.
version: "0.2.0"
description: reinforcement learning environment for linux server auto remediation

runtime:
  # Quoted so the interpreter version is not read as a float.
  python: "3.11"
  entry_point: inference.py
  server_entry_point: server.app:app
  # Paths exposed by the server.
  reset_endpoint: /reset
  step_endpoint: /step
  state_endpoint: /state
  websocket_endpoint: /ws
  healthcheck_endpoint: /health
  tasks_endpoint: /tasks

resources:
  vcpus: 2
  memory_gb: 8
  # `none` is a plain string here, not a YAML null.
  gpu: none
  # 20 minutes == evaluation.max_total_runtime_seconds (1200 s).
  max_runtime_minutes: 20

# Per-task time limits sum to 300 + 420 + 480 = 1200 seconds.
tasks:
  - id: nginx_crash
    difficulty: easy
    description: nginx crash with stale pid and config syntax error
    max_steps: 40
    time_limit_seconds: 300
  - id: disk_full
    difficulty: medium
    description: hidden sparse log file filling a loopback mount
    max_steps: 55
    time_limit_seconds: 420
  - id: network_broken
    difficulty: hard
    description: broken network namespace with corrupted routing tables
    max_steps: 70
    time_limit_seconds: 480

evaluation:
  protocol: sequential
  max_total_runtime_seconds: 1200
  # Every entry refers to an `id` declared under `tasks`.
  tasks_order:
    - nginx_crash
    - disk_full
    - network_broken