# Two-stage inference test.
#
# Runs ./remaining_eval_multi_process.py once for each token budget in the
# list below, passing the budget as --max_tokens_per_call and giving every
# run its own --output_dir (./<modelname>/<budget>).
#
# Usage:
#   <this script> PROMPT_TYPE MODEL_NAME_OR_PATH DATA_NAME
#
# Arguments:
#   $1  PROMPT_TYPE         forwarded as --prompt_type
#   $2  MODEL_NAME_OR_PATH  forwarded as --model_name_or_path
#   $3  DATA_NAME           forwarded as --data_names and exported
#
# Optional environment:
#   modelname  top-level output directory name; when unset or empty it
#              defaults to the last path component of MODEL_NAME_OR_PATH.
#
# Only POSIX sh features are used, so the script behaves the same under
# `sh` and `bash`.
#
# -e: stop at the first failing run; -u: reject unset variables;
# -x: trace every command so the log shows the exact invocation.
set -eux

# Fail early with a usage message instead of handing empty values to Python.
PROMPT_TYPE=${1:?usage: $0 PROMPT_TYPE MODEL_NAME_OR_PATH DATA_NAME}
MODEL_NAME_OR_PATH=${2:?usage: $0 PROMPT_TYPE MODEL_NAME_OR_PATH DATA_NAME}
DATA_NAME=${3:?usage: $0 PROMPT_TYPE MODEL_NAME_OR_PATH DATA_NAME}
SPLIT="test"
NUM_TEST_SAMPLE=-1

# English open datasets
export DATA_NAME

# The output directory used to reference $modelname without ever assigning
# it, which silently produced ".//<budget>" for every model. Honour a value
# supplied through the environment, otherwise derive one from the model path
# (a trailing slash is dropped first so the basename is never empty).
model_path_trimmed=${MODEL_NAME_OR_PATH%/}
modelname=${modelname:-${model_path_trimmed##*/}}

# Values swept for max_tokens_per_call.
# Alternative sweep: 1000 2000 4000 6000 10000 30000
for tokens in 100 250 500 1000 2000 4000 6000 10000; do
  # printf instead of echo: echo's handling of "\n" differs between shells.
  printf 'max_tokens_per_call: %s \n\n' "$tokens"

  # BUDGET is exported for the child process
  # (presumably read by the evaluation script - TODO confirm).
  export BUDGET="$tokens"
  printf 'export BUDGET=%s \n\n' "$tokens"

  TOKENIZERS_PARALLELISM=true \
  python3 -u ./remaining_eval_multi_process.py \
    --model_name_or_path "${MODEL_NAME_OR_PATH}" \
    --data_names "${DATA_NAME}" \
    --output_dir "./${modelname}/${tokens}" \
    --split "${SPLIT}" \
    --prompt_type "${PROMPT_TYPE}" \
    --num_test_sample "${NUM_TEST_SAMPLE}" \
    --seed 0 \
    --temperature 0 \
    --n_sampling 1 \
    --top_p 1 \
    --start 0 \
    --end -1 \
    --use_safetensors \
    --save_outputs \
    --use_vllm \
    --overwrite \
    --max_tokens_per_call "$tokens"
done