#!/usr/bin/env bash # Chain: train 7B BLT-Reasoner → final n=200 z-ablation → push to HF under pilot7b/ set -uo pipefail REPO="LauraGG/blt-reasoner-pilot1" OUT="/home/ubuntu/work/blt_pilot7b" CFG="/home/ubuntu/experiments/blt_reasoner/configs/pilot7b_qwen_math_gsm8k.json" LOG="/home/ubuntu/work/queue_pilot7b.log" log() { echo "[$(date +%T)] $*" | tee -a "$LOG"; } mkdir -p "$OUT" cd /home/ubuntu export TOKENIZERS_PARALLELISM=false TRANSFORMERS_NO_ADVISORY_WARNINGS=1 HF_HUB_DISABLE_PROGRESS_BARS=1 export PYTORCH_CUDA_ALLOC_CONF=expandable_segments:True log "==========================================" log "7B PILOT: BLT-Reasoner on Qwen2.5-Math-7B-Instruct" log "==========================================" python3 -u -m experiments.blt_reasoner.train --config "$CFG" \ > "$OUT/train.log" 2>&1 rc=$? log "train exit=$rc" # Always try eval + push, even if train errored log "running n=200 K=16 z-ablation on final ckpt" python3 -u -m experiments.blt_reasoner.eval \ --ckpt "$OUT/final" --config "$CFG" \ --n 200 --K 16 --max_new_tokens 192 --temperature 0.0 \ --out "$OUT/final/ablation_n200_K16.json" \ > "$OUT/eval.log" 2>&1 log "eval exit=$?" # Push intermediate ckpts + final + ablation + logs to HF under pilot7b/ log "pushing to HF under pilot7b/" python3 - <