#!/bin/bash
# ─────────────────────────────────────────────────────────
# train.sh — Launch CXR VLM training (both stages)
# Usage: bash scripts/train.sh
# ─────────────────────────────────────────────────────────
# Strict mode: abort on any failing command (-e), on expansion of an unset
# variable (-u), and when any stage of a pipeline fails (pipefail).
set -euo pipefail
# Resolve the project root as the parent of the directory that holds this
# script, then switch to it so the relative paths used below do not depend
# on the caller's working directory.
PROJ_DIR="$(cd "$(dirname "${BASH_SOURCE[0]}")/.." && pwd)"
cd "$PROJ_DIR"
# ── Config ────────────────────────────────────────────────
# Every setting keeps its previous value as the default but may be overridden
# from the caller's environment, e.g.
#   RESUME_FROM=checkpoints/stage2_instruct/checkpoint-500 bash scripts/train.sh
MODEL_CONFIG="${MODEL_CONFIG:-configs/model_config.yaml}"
TRAIN_CONFIG="${TRAIN_CONFIG:-configs/train_config.yaml}"
# ── Optional: resume from checkpoint ──────────────────────
# Empty (the default) means --resume_from is not passed to the trainer.
RESUME_FROM="${RESUME_FROM:-}" # e.g. "checkpoints/stage2_instruct/checkpoint-500"
# ── WandB ─────────────────────────────────────────────────
# Exported so child processes inherit it; a value already present in the
# environment is respected instead of being overwritten.
export WANDB_PROJECT="${WANDB_PROJECT:-cxr-vlm-thesis}"
# ── Run both stages ───────────────────────────────────────
# Startup banner: one printf call emits one line per argument, showing the
# two config paths this run will hand to the trainer.
printf '%s\n' \
  "==========================================" \
  " CXR VLM Training" \
  " Model config: $MODEL_CONFIG" \
  " Train config: $TRAIN_CONFIG" \
  "=========================================="
# Assemble the trainer invocation once as an argument array; --resume_from is
# appended only when RESUME_FROM is non-empty, so both the fresh-run and the
# resume case share a single command line.
train_cmd=(
  python -m training.train
  --model_config "$MODEL_CONFIG"
  --train_config "$TRAIN_CONFIG"
)
if [[ -n "$RESUME_FROM" ]]; then
  train_cmd+=(--resume_from "$RESUME_FROM")
fi
"${train_cmd[@]}"
echo "Training complete!"
|