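# NOTE(review): the next three lines look like page-header residue (avatar
# alt text, commit title, short commit hash); kept as comments so the file
# parses as YAML.
# Krishna1107's picture
# full devops
# c8f3b98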
# Manifest identity and descriptive metadata.
name: cloud-native-devops-env
# Quoted so the version is always read as a string.
version: "1.0.0"
# Folded scalar: the indented lines below are joined into one paragraph.
description: >
  Debug broken GitHub Actions workflows, Dockerfiles, and Kubernetes manifests.
  AI agents identify and fix cloud-native deployment pipeline issues.
author: Krishna
license: MIT
# Topic labels attached to this environment.
tags:
  - devops
  - docker
  - github-actions
  - kubernetes
  - debugging
  - infrastructure
  - cloud-native
# Interaction settings for the environment.
# NOTE(review): nesting was reconstructed from a flattened source; all four
# keys are assumed to belong under `environment` - confirm against the
# consumer's schema.
environment:
  type: text
  observation_space: structured
  action_space: structured
  max_steps: 10
# Task catalogue: ten entries, each declaring five scenarios. Every `id` here
# also appears as a key under `graders` and under the baseline's
# `expected_scores`.
# Long descriptions use `>-` (folded, no trailing newline) so the value is the
# same single-line string while the source stays within the line limit.
tasks:
  - id: dockerfile_syntax
    name: Dockerfile Syntax Errors
    description: Fix syntax and instruction errors in Dockerfiles
    difficulty: easy
    num_scenarios: 5
  - id: dockerfile_runtime
    name: Dockerfile Runtime Errors
    description: Fix runtime/container execution issues in Dockerfiles
    difficulty: medium
    num_scenarios: 5
  - id: workflow_syntax_structure
    name: Workflow Syntax and Structure
    description: Fix GitHub Actions YAML syntax and job structure issues
    difficulty: easy
    num_scenarios: 5
  - id: workflow_secrets_permissions
    name: Workflow Secrets and Permissions
    description: Fix secret wiring, env usage, and permissions in workflows
    difficulty: medium
    num_scenarios: 5
  - id: ci_docker_integration
    name: CI and Docker Build Integration
    description: Debug combined workflow and Docker build integration failures
    difficulty: medium-hard
    num_scenarios: 5
  - id: multi_stage_pipeline_matrix
    name: Multi-Stage Pipeline and Matrix
    description: Debug complex multi-stage and matrix CI/CD pipelines
    difficulty: hard
    num_scenarios: 5
  - id: k8s_pod_failures
    name: Kubernetes Pod Failures
    description: >-
      Fix Kubernetes pod failures including CrashLoopBackOff,
      ImagePullBackOff, and resource issues
    difficulty: medium
    num_scenarios: 5
  - id: k8s_networking
    name: Kubernetes Service & Ingress Issues
    description: >-
      Fix Kubernetes networking issues including Service selectors, port
      mismatches, and Ingress configuration
    difficulty: hard
    num_scenarios: 5
  - id: pipeline_build_deploy
    name: CI/CD Build & Push Pipeline
    description: Debug GHA-to-Docker-to-Registry pipeline failures across multiple files
    difficulty: hard
    num_scenarios: 5
  - id: pipeline_full_stack
    name: Full Stack Deployment Pipeline
    description: >-
      Debug complex multi-error deployment pipelines across GHA workflows,
      Dockerfiles, and Kubernetes manifests
    difficulty: expert
    num_scenarios: 5
# One grader entry per task id. Every grader is declared `deterministic` with
# a score range of 0.0 to 1.0.
graders:
  dockerfile_syntax:
    type: deterministic
    score_range: [0.0, 1.0]
  dockerfile_runtime:
    type: deterministic
    score_range: [0.0, 1.0]
  workflow_syntax_structure:
    type: deterministic
    score_range: [0.0, 1.0]
  workflow_secrets_permissions:
    type: deterministic
    score_range: [0.0, 1.0]
  ci_docker_integration:
    type: deterministic
    score_range: [0.0, 1.0]
  multi_stage_pipeline_matrix:
    type: deterministic
    score_range: [0.0, 1.0]
  k8s_pod_failures:
    type: deterministic
    score_range: [0.0, 1.0]
  k8s_networking:
    type: deterministic
    score_range: [0.0, 1.0]
  pipeline_build_deploy:
    type: deterministic
    score_range: [0.0, 1.0]
  pipeline_full_stack:
    type: deterministic
    score_range: [0.0, 1.0]
# Baseline run: the script to execute and the expected score for each task id.
# NOTE(review): scores are presumably on the graders' 0.0-1.0 scale - confirm.
baseline:
  script: inference.py
  expected_scores:
    dockerfile_syntax: 0.70
    dockerfile_runtime: 0.55
    workflow_syntax_structure: 0.65
    workflow_secrets_permissions: 0.50
    ci_docker_integration: 0.45
    multi_stage_pipeline_matrix: 0.30
    k8s_pod_failures: 0.50
    k8s_networking: 0.40
    pipeline_build_deploy: 0.35
    pipeline_full_stack: 0.20
# Compute limits for the environment.
# NOTE(review): nesting was reconstructed from a flattened source; `resources`
# is assumed to be a top-level key - confirm against the consumer's schema.
resources:
  vcpu: 2
  memory: 8gb
  # NOTE(review): unit not stated in this file (presumably seconds) - confirm.
  timeout: 1200