File size: 1,126 Bytes
c8140ad
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28


# export step=600
# export MODEL_NAME_OR_PATH=/cpfs/user/chenhao/outputs/qwen25_7B_reinforce_baseline_zero_tir_fix_boxed_lr1e-6_warmup0.0_kl0.0_zero_tir_0426_nginx_prefetch_fix_env_mask_vllm083_xverify_dapo_async_iternum2/_actor/global_step250/ckpt/pytorch_model.bin/
# export MODEL_NAME_OR_PATH=/cpfs/user/chenhao/outputs/qwen25_7B_reinforce_baseline_zero_tir_fix_boxed_lr1e-6_warmup0.0_kl0.0_zero_tir_0426_nginx_prefetch_fix_env_mask_vllm083_xverify_deepmath_async_iternum2/_actor/global_step350/ckpt/pytorch_model.bin/

# export CUDA_VISIBLE_DEVICES="0"
# export INPUT_KEY='problem,question'
# export ANSWER_KEY='answer,final_answer'
# export PROMPT_TYPE='orz_tir'
# export DATA_NAME="aime25"
# export OUTPUT_DIR=${MODEL_NAME_OR_PATH}/math_eval
# export N_SAMPLING=2
# export TEMPERATURE=0.0
# export VLLM_USE_V1=0
# export USE_TIR='yes'
# export USE_SEPERATE='no'

# Pick the evaluation entry point from two environment switches:
#   USE_TIR      - "yes" selects one of the TIR evaluation scripts; any other
#                  value (including unset/empty) selects my_evaluation.sh.
#   USE_SEPERATE - consulted only when USE_TIR is "yes"; "yes" selects
#                  my_evaluation_tir_seperate.sh, anything else selects
#                  my_evaluation_tir.sh.
# The scripts are invoked by bare relative name, and the exit status of the
# selected script becomes the exit status of this construct.
case "$USE_TIR" in
    yes)
        case "$USE_SEPERATE" in
            yes)
                echo "USING TIR and SEPERATE"
                bash my_evaluation_tir_seperate.sh
                ;;
            *)
                echo "USING TIR"
                bash my_evaluation_tir.sh
                ;;
        esac
        ;;
    *)
        # Default path: no banner is printed before the plain evaluation.
        bash my_evaluation.sh
        ;;
esac