#!/usr/bin/env bash
# Launch the BLT pilot training run (v2) as a detached background job.
#
# v2: drops expandable_segments (suspected slowdown), uses tighter seq lengths.
# Identical training code; only env + config differ from v1.
#
# Side effects:
#   - truncates /home/ubuntu/work/blt_pilot1/run_v2.log
#   - starts the trainer under nohup, appending stdout+stderr to that log
#   - writes the trainer's PID to /home/ubuntu/work/blt_pilot1/run_v2.pid
# Exit status: 0 once the job has been handed to the background; non-zero if
# a pre-flight check fails (nothing is truncated or launched in that case).
set -euo pipefail

REPO_ROOT=/home/ubuntu
WORK_DIR=/home/ubuntu/work/blt_pilot1
CONFIG=/home/ubuntu/experiments/blt_reasoner/configs/pilot_qwen15b_gsm8k.json
LOG="$WORK_DIR/run_v2.log"
PID_FILE="$WORK_DIR/run_v2.pid"

# Print a diagnostic to stderr and abort.
die() {
  printf 'error: %s\n' "$*" >&2
  exit 1
}

# The trainer is started with `python3 -m experiments.blt_reasoner.train`;
# presumably the `experiments` package is resolved relative to this directory
# (the config lives under it) -- confirm if the layout changes.
cd "$REPO_ROOT" || die "cannot cd to $REPO_ROOT"

export TOKENIZERS_PARALLELISM=false
export TRANSFORMERS_NO_ADVISORY_WARNINGS=1
export HF_HUB_DISABLE_PROGRESS_BARS=1
# v2 drops expandable_segments: clear any allocator config inherited from the
# calling environment instead of overriding it.
unset PYTORCH_CUDA_ALLOC_CONF

# Pre-flight checks. The job is backgrounded, so `set -e` cannot see a failed
# launch; without these the script would still write a PID file and report
# success. They run before the log is truncated so a failed launch does not
# destroy the previous run's log.
command -v python3 >/dev/null || die "python3 not found on PATH"
[[ -r "$CONFIG" ]] || die "config not readable: $CONFIG"

mkdir -p "$WORK_DIR"
: > "$LOG" # truncate so progress is unambiguous in tail

# -u keeps Python's output unbuffered so the log can be followed live.
nohup python3 -u -m experiments.blt_reasoner.train \
  --config "$CONFIG" \
  >> "$LOG" 2>&1 &
PID=$!

echo "$PID" > "$PID_FILE"
echo "Launched BLT v2 pid=$PID log=$LOG"