#!/usr/bin/env bash
#
# Evaluation launcher: picks one of three sibling evaluation scripts based on
# two environment switches and runs it with `bash`.
#
#   USE_TIR=yes and USE_SEPERATE=yes  -> my_evaluation_tir_seperate.sh
#   USE_TIR=yes (any other SEPERATE)  -> my_evaluation_tir.sh
#   anything else (including unset)   -> my_evaluation.sh
#
# Only USE_TIR and USE_SEPERATE are read here. The child scripts are invoked
# by bare file name (no directory component), so run this launcher from the
# directory that contains them.
#
# Sample configuration, kept commented out. Presumably these variables are
# consumed by the child scripts -- confirm against them before relying on it.
# export step=600
# export MODEL_NAME_OR_PATH=/cpfs/user/chenhao/outputs/qwen25_7B_reinforce_baseline_zero_tir_fix_boxed_lr1e-6_warmup0.0_kl0.0_zero_tir_0426_nginx_prefetch_fix_env_mask_vllm083_xverify_dapo_async_iternum2/_actor/global_step250/ckpt/pytorch_model.bin/
# export MODEL_NAME_OR_PATH=/cpfs/user/chenhao/outputs/qwen25_7B_reinforce_baseline_zero_tir_fix_boxed_lr1e-6_warmup0.0_kl0.0_zero_tir_0426_nginx_prefetch_fix_env_mask_vllm083_xverify_deepmath_async_iternum2/_actor/global_step350/ckpt/pytorch_model.bin/
# export CUDA_VISIBLE_DEVICES="0"
# export INPUT_KEY='problem,question'
# export ANSWER_KEY='answer,final_answer'
# export PROMPT_TYPE='orz_tir'
# export DATA_NAME="aime25"
# export OUTPUT_DIR=${MODEL_NAME_OR_PATH}/math_eval
# export N_SAMPLING=2
# export TEMPERATURE=0.0
# export VLLM_USE_V1=0
# export USE_TIR='yes'
# export USE_SEPERATE='no'

#######################################
# Run the evaluation script selected by USE_TIR / USE_SEPERATE.
# Globals:   USE_TIR (read), USE_SEPERATE (read)
# Arguments: none
# Outputs:   a one-line banner on stdout for the two TIR variants, followed by
#            whatever the chosen child script prints
# Returns:   the exit status of the chosen child script
#######################################
run_evaluation() {
  # ${VAR:-} keeps the comparison safe when the switch is unset, even if the
  # calling shell has `set -u` enabled; an unset switch simply is not "yes".
  if [ "${USE_TIR:-}" = "yes" ] && [ "${USE_SEPERATE:-}" = "yes" ]; then
    echo "USING TIR and SEPERATE"
    bash my_evaluation_tir_seperate.sh
  elif [ "${USE_TIR:-}" = "yes" ]; then
    echo "USING TIR"
    bash my_evaluation_tir.sh
  else
    bash my_evaluation.sh
  fi
}

# Must stay the last statement so the launcher's exit status is the child's.
run_evaluation