neural-mesh-v2 / test /run_ttrlvr_azr_training.sh
hjkim00's picture
Restore all essential files - code, configs, and MBPP/HumanEval data
24c2665 verified
#!/bin/bash
#
# Launches a TTRLVR + AZR PPO training run on a single GPU and mirrors all
# trainer output to a timestamped log file.
#
# Environment:
#   GPU_ID  GPU index exported as CUDA_VISIBLE_DEVICES (default: 3).

# Trace every command so the log records exactly what was executed.
set -x

# GPU selection: honor a caller-supplied GPU_ID, otherwise fall back to 3.
GPU_ID=${GPU_ID:-3}
export CUDA_VISIBLE_DEVICES=$GPU_ID

# Runtime environment for the trainer.
export VLLM_ATTENTION_BACKEND=FLASH_ATTN
# NOTE(review): per Ray's documentation a refresh interval of 0 disables its
# memory monitor -- confirm this is intended for this workload.
export RAY_memory_monitor_refresh_ms=0
export RAY_LOGGING_LEVEL=DEBUG
export HYDRA_FULL_ERROR=1
# Append the project roots. The ${VAR:+...} form avoids a leading ':' (an
# empty path entry) when PYTHONPATH is unset or empty.
export PYTHONPATH="${PYTHONPATH:+${PYTHONPATH}:}/home/ubuntu/RLVR/verl:/home/ubuntu/RLVR/TestTime-RLVR-v2"

# Create the log directory if it does not exist yet.
LOG_DIR="/home/ubuntu/RLVR/TestTime-RLVR-v2/logs"
mkdir -p "$LOG_DIR"

# One log file per invocation, named by start time.
TIMESTAMP=$(date +"%Y%m%d_%H%M%S")
LOG_FILE="$LOG_DIR/ttrlvr_azr_training_${TIMESTAMP}.log"
echo "๐Ÿ“ Logging to: $LOG_FILE"

# TTRLVR data path, passed below as both the training and validation files.
TTRLVR_DATA_PATH="/home/ubuntu/RLVR/TestTime-RLVR-v2/tmp/batch_results/ttrlvr_azr_20250730_155352/mbpp/Mbpp_7/round_1/azr_training_data"
# Run main_azr_ppo directly; tee sends the combined stdout/stderr to both the
# console and the log file. Expansions are quoted so each Hydra override is
# always passed as exactly one argument.
python -m absolute_zero_reasoner.main_azr_ppo \
  --config-path=/home/ubuntu/RLVR/TestTime-RLVR-v2/test/configs \
  --config-name=ttrlvr_azr_ppo \
  "data.train_files=${TTRLVR_DATA_PATH}" \
  "data.val_files=${TTRLVR_DATA_PATH}" \
  "trainer.experiment_name=ttrlvr_azr_gpu${GPU_ID}" 2>&1 | tee "$LOG_FILE"
# Save the trainer's exit status (not tee's). This must stay the very next
# command after the pipeline, because PIPESTATUS is overwritten by every
# subsequent command.
EXITCODE=${PIPESTATUS[0]}
# Append a footer with the finish time and exit status to the log file.
{
  echo ""
  echo "========================================"
  echo "Execution finished at: $(date)"
  echo "Exit code: $EXITCODE"
} >> "$LOG_FILE"

# Print a summary to the console. The success banner is shown only when the
# trainer actually exited with status 0; failures are reported on stderr.
echo ""
if [[ "$EXITCODE" -eq 0 ]]; then
  echo "โœ… Training completed!"
else
  echo "Training failed with exit code $EXITCODE" >&2
fi
echo "๐Ÿ“„ Full log saved to: $LOG_FILE"
echo "๐Ÿ” Exit code: $EXITCODE"

# Propagate the trainer's status to the caller.
exit "$EXITCODE"