File size: 1,858 Bytes
28b13fc
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
#!/bin/bash
# ─────────────────────────────────────────────────────────
# train.sh — Launch CXR VLM training (both stages)
#
# Usage:
#   bash scripts/train.sh
#   RESUME_FROM="checkpoints/stage2_instruct/checkpoint-500" bash scripts/train.sh
#
# Environment:
#   RESUME_FROM   Optional checkpoint path. When non-empty it is forwarded
#                 to the trainer as --resume_from; when unset or empty the
#                 trainer is launched without that flag.
# ─────────────────────────────────────────────────────────

# Strict mode: abort on a failing command, on expansion of an unset
# variable, and on a failure in any stage of a pipeline.
set -euo pipefail

# Set project root: the parent of the directory holding this script.
# Changing into it makes the relative config paths below independent of
# the directory the script was invoked from.
PROJ_DIR="$(cd "$(dirname "${BASH_SOURCE[0]}")/.." && pwd)"
cd "$PROJ_DIR"

# ── Config ────────────────────────────────────────────────
MODEL_CONFIG="configs/model_config.yaml"
TRAIN_CONFIG="configs/train_config.yaml"

# ── Optional: resume from checkpoint ──────────────────────
# Taken from the environment when provided; defaults to empty (no resume).
RESUME_FROM="${RESUME_FROM:-}"   # e.g. "checkpoints/stage2_instruct/checkpoint-500"

# ── WandB ─────────────────────────────────────────────────
export WANDB_PROJECT="cxr-vlm-thesis"

# ── Run both stages ───────────────────────────────────────
echo "=========================================="
echo " CXR VLM Training"
echo " Model config: $MODEL_CONFIG"
echo " Train config: $TRAIN_CONFIG"
echo "=========================================="

# Build the trainer command once as an array so the resume and non-resume
# launches cannot drift apart, and so every argument stays a single word
# even if a path contains whitespace.
train_cmd=(
    python -m training.train
    --model_config "$MODEL_CONFIG"
    --train_config "$TRAIN_CONFIG"
)

# Only pass --resume_from when a checkpoint was actually requested.
if [[ -n "$RESUME_FROM" ]]; then
    train_cmd+=(--resume_from "$RESUME_FROM")
fi

# A non-zero exit from the trainer aborts the script here (set -e), so the
# completion message below is printed only after a successful run.
"${train_cmd[@]}"

echo "Training complete!"