#!/bin/bash
#
# Launch supervised fine-tuning (train_sft.py) on 4 GPUs via torchrun.
#
# Steps:
#   1. Load conda's shell hook and activate the `verl_new` environment.
#   2. cd into ~/RL4Phyx/SFT, where train_sft.py is expected to live.
#   3. Pin the job to physical GPUs 4-7 and start one worker per GPU.
#   4. Mirror combined stdout/stderr to the terminal and sft_training_v5.log.
#
# Exit status: that of torchrun (see `pipefail` below), or 1 if setup fails.

# Trace every command so the log records exactly what was launched.
set -x
# Without pipefail the pipeline's status would be tee's (almost always 0),
# hiding a crashed training run from schedulers and wrapper scripts.
# NOTE: `set -u` / `set -e` are intentionally not enabled; conda's activation
# hooks are third-party shell code that may not be written for strict mode, so
# critical steps are checked explicitly instead.
set -o pipefail

# Print a message to stderr and abort the script.
die() {
  printf 'error: %s\n' "$*" >&2
  exit 1
}

# `conda activate` only works after conda's shell functions are loaded.
# shellcheck source=/dev/null
source ~/miniconda3/etc/profile.d/conda.sh \
  || die "cannot source ~/miniconda3/etc/profile.d/conda.sh"
conda activate verl_new || die "cannot activate conda env 'verl_new'"

# train_sft.py and the log file are referenced relative to this directory.
cd ~/RL4Phyx/SFT || die "cannot cd to ~/RL4Phyx/SFT"

# Use GPUs 4,5,6,7 (four devices, matching --nproc_per_node=4 below).
export CUDA_VISIBLE_DEVICES=4,5,6,7
# Unbuffered Python output so lines reach tee/the log as they are printed.
export PYTHONUNBUFFERED=1

# Full fine-tuning with DeepSpeed ZeRO-2.
# NOTE(review): no DeepSpeed option is passed on this command line, so the
# ZeRO-2 setup is presumably configured inside train_sft.py — confirm.
# --master_port=29501 is used instead of torchrun's default rendezvous port
# (presumably to avoid clashing with another job on this host — confirm).
torchrun --nproc_per_node=4 --master_port=29501 \
  train_sft.py \
  2>&1 | tee sft_training_v5.log