# Source: zero_tir_0727 / run_evaluation.sh
# htxu91's picture
# Upload folder using huggingface_hub
# c8140ad verified
# export step=600
# export MODEL_NAME_OR_PATH=/cpfs/user/chenhao/outputs/qwen25_7B_reinforce_baseline_zero_tir_fix_boxed_lr1e-6_warmup0.0_kl0.0_zero_tir_0426_nginx_prefetch_fix_env_mask_vllm083_xverify_dapo_async_iternum2/_actor/global_step250/ckpt/pytorch_model.bin/
# export MODEL_NAME_OR_PATH=/cpfs/user/chenhao/outputs/qwen25_7B_reinforce_baseline_zero_tir_fix_boxed_lr1e-6_warmup0.0_kl0.0_zero_tir_0426_nginx_prefetch_fix_env_mask_vllm083_xverify_deepmath_async_iternum2/_actor/global_step350/ckpt/pytorch_model.bin/
# export CUDA_VISIBLE_DEVICES="0"
# export INPUT_KEY='problem,question'
# export ANSWER_KEY='answer,final_answer'
# export PROMPT_TYPE='orz_tir'
# export DATA_NAME="aime25"
# export OUTPUT_DIR=${MODEL_NAME_OR_PATH}/math_eval
# export N_SAMPLING=2
# export TEMPERATURE=0.0
# export VLLM_USE_V1=0
# export USE_TIR='yes'
# export USE_SEPERATE='no'
# Dispatch to the evaluation script that matches the requested mode.
#
# Environment (read):
#   USE_TIR       exactly "yes" selects one of the TIR scripts; any other
#                 value (or unset) selects my_evaluation.sh.
#   USE_SEPERATE  exactly "yes", together with USE_TIR="yes", selects
#                 my_evaluation_tir_seperate.sh; ignored when USE_TIR is
#                 not "yes". (The spelling is part of the interface and is
#                 kept as-is.)
#
# The chosen script is started with `bash` using its bare relative name, so
# it is looked up relative to the current working directory.
# Exit status: that of the child script (it is the last command executed).

# Print the file name of the evaluation script selected by USE_TIR and
# USE_SEPERATE. Pure: reads the two variables, writes one line to stdout.
select_eval_script() {
  # ${VAR:-} keeps the comparison well-defined even when the variable is
  # unset and the shell runs with `set -u`.
  if [ "${USE_TIR:-}" != "yes" ]; then
    printf '%s\n' 'my_evaluation.sh'
  elif [ "${USE_SEPERATE:-}" = "yes" ]; then
    printf '%s\n' 'my_evaluation_tir_seperate.sh'
  else
    printf '%s\n' 'my_evaluation_tir.sh'
  fi
}

eval_script=$(select_eval_script)

# Announce the mode before starting; the fallback branch now logs as well so
# every run records which script was chosen.
case "$eval_script" in
  my_evaluation_tir_seperate.sh) echo "USING TIR and SEPERATE" ;;
  my_evaluation_tir.sh) echo "USING TIR" ;;
  *) echo "USING plain evaluation (no TIR)" ;;
esac

bash "$eval_script"