#!/bin/bash
#
# EXP-A: launches scripts/train_experiment.py for the "exp_a_json" experiment.
#
# Runs from ~/seriguela and uses venv/, scripts/, data/ and output/ relative
# to that directory.
#
# Environment:
#   HF_TOKEN       - exported to the training process (empty if unset)
#   WANDB_API_KEY  - exported to the training process (empty if unset)

# Abort as soon as any command fails.
set -e

# Single source of truth for names/paths that are used in several places.
readonly exp_name="exp_a_json"
readonly data_dir="./data/experiments/${exp_name}"
readonly train_file="${data_dir}/train.csv"
readonly validation_file="${data_dir}/validation.csv"
readonly output_dir="./output/${exp_name}"

echo "=============================================="
echo "EXP-A: JSON Format Training"
echo "=============================================="

# All paths below are relative to this directory.
cd ~/seriguela

# Activate the virtual environment.
source venv/bin/activate

# Fail early, before starting Python, if either input CSV is missing.
if [[ ! -f "${train_file}" ]]; then
  echo "ERROR: Training data not found!" >&2
  echo "Expected: ${train_file}" >&2
  exit 1
fi

if [[ ! -f "${validation_file}" ]]; then
  echo "ERROR: Validation data not found!" >&2
  echo "Expected: ${validation_file}" >&2
  exit 1
fi

# Report the size of the training set.
# NOTE(review): this is a raw line count of the CSV; if the file has a header
# row it is included in the number - confirm against the data format.
TRAIN_COUNT=$(wc -l < "${train_file}")
echo "Training samples: $TRAIN_COUNT"

# Environment for the training process. The ":-" defaults keep the two
# credentials defined (possibly empty) even when the caller did not set them.
export WANDB_PROJECT="seriguela_experiments"
export HF_TOKEN="${HF_TOKEN:-}"
export WANDB_API_KEY="${WANDB_API_KEY:-}"

echo ""
echo "Starting training..."
echo "Output: ${output_dir}"
echo ""

# The run name is suffixed with a timestamp so repeated launches get
# distinct names.
python scripts/train_experiment.py \
  --experiment_name "${exp_name}" \
  --train_file "${train_file}" \
  --validation_file "${validation_file}" \
  --output_dir "${output_dir}" \
  --end_marker "<|endofex|>" \
  --num_train_epochs 3 \
  --per_device_train_batch_size 8 \
  --gradient_accumulation_steps 4 \
  --learning_rate 5e-5 \
  --block_size 256 \
  --fp16 \
  --wandb_project "${WANDB_PROJECT}" \
  --wandb_run_name "${exp_name}_$(date +%Y%m%d_%H%M%S)"

echo ""
echo "=============================================="
echo "EXP-A Training Complete!"
echo "=============================================="
echo "Model saved to: ${output_dir}"