---
# Manifest for the "cicd-debugger-env" RL environment: identity, entry point,
# agent interface, available tools, and the catalogue of debugging tasks.
#
# NOTE(review): this file was reconstructed from a copy whose line breaks and
# indentation had been lost. Keys and values are unchanged; the nesting of
# `interface` and `max_steps` (flagged below) should be confirmed against the
# loader that consumes this file.

version: "0.2"
name: "cicd-debugger-env"
description: "RL environment for CI/CD debugging with deterministic, hidden, and quality-aware scoring"

metadata:
  domain: "devops"
  real_world_task: "ci-cd pipeline debugging"
  deployment: "huggingface-space-docker"

environment:
  # "module.path:ClassName" reference to the environment implementation.
  entry_point: "env.environment:CICDDebuggerEnvironment"
  # NOTE(review): assumed to be a child of `environment`; it may instead be a
  # top-level key - confirm.
  interface:
    observation_type: "json"
    action_type: "text"
    # NOTE(review): assumed to belong to `interface`; it may instead sit
    # directly under `environment` - confirm.
    max_steps: 30

action_space:
  # Tool names listed for the agent's action space.
  tools:
    - read_file
    - read_logs
    - analyze_error
    - edit_config
    - run_pipeline_stage
    - run_tests
    - validate_fix
    - submit_solution

# Each task declares an id, a difficulty tier, the pipeline stage named in
# `failure_stage`, and a "module.path:ClassName" grader reference.
tasks:
  # --- easy ---
  - id: "easy-command-typo"
    difficulty: "easy"
    failure_stage: "test"
    grader: "env.graders.deterministic:DeterministicGrader"
  - id: "easy-missing-checkout"
    difficulty: "easy"
    failure_stage: "build"
    grader: "env.graders.deterministic:DeterministicGrader"
  - id: "easy-yaml-indentation"
    difficulty: "easy"
    failure_stage: "build"
    grader: "env.graders.deterministic:DeterministicGrader"

  # --- medium ---
  - id: "medium-python-version"
    difficulty: "medium"
    failure_stage: "build"
    grader: "env.graders.deterministic:DeterministicGrader"
  - id: "medium-cache-key"
    difficulty: "medium"
    failure_stage: "test"
    grader: "env.graders.deterministic:DeterministicGrader"
  - id: "medium-artifact-permissions"
    difficulty: "medium"
    failure_stage: "deploy"
    grader: "env.graders.deterministic:DeterministicGrader"

  # --- hard ---
  - id: "hard-matrix-logic"
    difficulty: "hard"
    failure_stage: "test"
    grader: "env.graders.deterministic:DeterministicGrader"
  - id: "hard-conditional-deploy"
    difficulty: "hard"
    failure_stage: "deploy"
    grader: "env.graders.deterministic:DeterministicGrader"
  - id: "hard-needs-order"
    difficulty: "hard"
    failure_stage: "deploy"
    grader: "env.graders.deterministic:DeterministicGrader"