name: stack-2.9 python_env: python_env.yaml entry_points: main: command: "python train.py --train_data data/final/train.jsonl --val_data data/final/val.jsonl" evaluate: command: "python evaluate_model.py --model models/checkpoint --eval_data data/final/test.jsonl" augment: command: "python scripts/augment_training_data.py --input training-data/tool_examples.jsonl --output training-data/augmented.jsonl --multiplier 3" validate: command: "python scripts/validate_training_data.py --input training-data/tool_examples.jsonl" parameters: - name: train_data default: data/final/train.jsonl - name: val_data default: data/final/val.jsonl - name: model_name default: Qwen/Qwen2.5-7B - name: batch_size default: 4 type: int - name: learning_rate default: 5.0e-5 type: float - name: num_epochs default: 3 type: int - name: warmup_steps default: 100 type: int - name: max_seq_length default: 8192 type: int - name: gradient_accumulation_steps default: 4 type: int - name: lora_rank default: 16 type: int - name: lora_alpha default: 32 type: int - name: lora_dropout default: 0.05 type: float - name: use_flash_attention default: true type: bool run_options: # Storage for MLflow tracking tracking_uri: ./mlruns # Experiment configuration experiment: name: stack-2.9-training description: "Stack 2.9 model training experiments" # Resource limits resources: gpu_count: 1 gpu_type: A100 # Logging configuration log_model: artifacts: true save_steps: 500 # Early stopping early_stopping: metric: eval_loss patience: 2 min_delta: 0.001