# cicd-debugger-env-final / openenv.yaml
# Lishika's picture
# final fix
# 32445fd
# Manifest identity. The version stays quoted so it is read as the string
# "0.2" rather than as a float.
version: '0.2'
name: 'cicd-debugger-env'
description: >-
  RL environment for CI/CD debugging with deterministic, hidden, and
  quality-aware scoring
# Descriptive metadata about the environment. The children are indented so
# they belong to `metadata` instead of becoming top-level keys.
# NOTE(review): `deployment` is assumed to be part of `metadata` because it
# directly follows the other metadata fields - confirm against the consumer.
metadata:
  domain: "devops"
  real_world_task: "ci-cd pipeline debugging"
  deployment: "huggingface-space-docker"
# Environment implementation reference.
# NOTE(review): the value looks like a `module.path:ClassName` import
# reference - confirm the format expected by the loader.
environment:
  entry_point: "env.environment:CICDDebuggerEnvironment"
# Agent-facing interface settings, nested under `interface` so the key is a
# mapping rather than null.
# NOTE(review): `max_steps` is assumed to belong to `interface` because it
# directly follows the interface fields - confirm against the consumer.
interface:
  observation_type: "json"
  action_type: "text"
  max_steps: 30
# Names of the tools listed in the action space. `tools` is indented so it
# is a child of `action_space` rather than a sibling top-level key.
action_space:
  tools:
    - read_file
    - read_logs
    - analyze_error
    - edit_config
    - run_pipeline_stage
    - run_tests
    - validate_fix
    - submit_solution
# Task catalogue: three tasks at each of the easy, medium, and hard
# difficulty levels. Every task references the same grader. Each task's
# fields are indented under its list item so they form one mapping per task
# instead of repeated top-level keys.
tasks:
  # Easy
  - id: "easy-command-typo"
    difficulty: "easy"
    failure_stage: "test"
    grader: "env.graders.deterministic:DeterministicGrader"
  - id: "easy-missing-checkout"
    difficulty: "easy"
    failure_stage: "build"
    grader: "env.graders.deterministic:DeterministicGrader"
  - id: "easy-yaml-indentation"
    difficulty: "easy"
    failure_stage: "build"
    grader: "env.graders.deterministic:DeterministicGrader"

  # Medium
  - id: "medium-python-version"
    difficulty: "medium"
    failure_stage: "build"
    grader: "env.graders.deterministic:DeterministicGrader"
  - id: "medium-cache-key"
    difficulty: "medium"
    failure_stage: "test"
    grader: "env.graders.deterministic:DeterministicGrader"
  - id: "medium-artifact-permissions"
    difficulty: "medium"
    failure_stage: "deploy"
    grader: "env.graders.deterministic:DeterministicGrader"

  # Hard
  - id: "hard-matrix-logic"
    difficulty: "hard"
    failure_stage: "test"
    grader: "env.graders.deterministic:DeterministicGrader"
  - id: "hard-conditional-deploy"
    difficulty: "hard"
    failure_stage: "deploy"
    grader: "env.graders.deterministic:DeterministicGrader"
  - id: "hard-needs-order"
    difficulty: "hard"
    failure_stage: "deploy"
    grader: "env.graders.deterministic:DeterministicGrader"