#!/usr/bin/env bash
#
# Launch vllm_math_benchmark_eval.py (located next to this script) for one model.
#
# Usage:
#   bash verl/eval/run_vllm_math_benchmark_eval.sh /path/to/model [extra args...]
#
# Arguments:
#   $1     Model path, forwarded as --model (required).
#   $2...  Extra arguments appended verbatim after the built-in flags.
#
# Environment overrides (default used when unset or empty):
#   CONDA_ENV               conda environment to activate    (verl-qwen3)
#   CUDA_VISIBLE_DEVICES    exported to the evaluator        (0,1,2,3)
#   VLLM_USE_V1             exported to the evaluator        (1)
#   VLLM_LOGGING_LEVEL      exported to the evaluator        (WARN)
#   PYTORCH_CUDA_ALLOC_CONF exported to the evaluator        (expandable_segments:True)
#   NCCL_CUMEM_ENABLE       exported to the evaluator        (0)
#   TEMPERATURE             --temperature                    (0.6)
#   TOP_P                   --top-p                          (0.95)
#   TOP_K                   --top-k                          (0)
#   MAX_TOKENS              --max-tokens                     (2048)
#   SAMPLE_BATCH_SIZE       --sample-batch-size              (4)
#   TENSOR_PARALLEL_SIZE    --tensor-parallel-size           (4)
#   GPU_MEMORY_UTILIZATION  --gpu-memory-utilization         (0.75)
#   DTYPE                   --dtype                          (auto)
#   SEED                    --seed                           (0)
#   OUTPUT_DIR              --output-dir                     (<script dir>/data)
set -euo pipefail

# Absolute directory of this script, so it can be invoked from any cwd.
SCRIPT_DIR=$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)
MODEL_PATH=${1:?Usage: bash verl/eval/run_vllm_math_benchmark_eval.sh /path/to/model [extra args...]}
shift

# --- conda environment -------------------------------------------------------
# Fail with a clear message instead of trying to source "/etc/profile.d/conda.sh"
# when `conda info --base` produces nothing.
if ! command -v conda >/dev/null 2>&1; then
  printf 'error: conda not found on PATH; cannot activate "%s"\n' \
    "${CONDA_ENV:-verl-qwen3}" >&2
  exit 1
fi
# Separate assignment so a failing `conda info` is caught by `set -e`.
conda_base=$(conda info --base)

# conda's shell hook and per-package activate.d scripts are third-party code
# that may read unset variables; relax nounset only while they run.
set +u
# shellcheck source=/dev/null
source "${conda_base}/etc/profile.d/conda.sh"
conda activate "${CONDA_ENV:-verl-qwen3}"
set -u

# --- runtime environment -----------------------------------------------------
# Each value can be overridden by the caller's environment.
export CUDA_VISIBLE_DEVICES=${CUDA_VISIBLE_DEVICES:-0,1,2,3}
export VLLM_USE_V1=${VLLM_USE_V1:-1}
export VLLM_LOGGING_LEVEL=${VLLM_LOGGING_LEVEL:-WARN}
export PYTORCH_CUDA_ALLOC_CONF=${PYTORCH_CUDA_ALLOC_CONF:-expandable_segments:True}
export NCCL_CUMEM_ENABLE=${NCCL_CUMEM_ENABLE:-0}

# --- evaluator invocation ----------------------------------------------------
# Built-in flags are kept in an array; the caller's extra arguments are appended
# after them on the command line.
eval_args=(
  --model "${MODEL_PATH}"
  --benchmarks AIME24 AIME25 AMC23 MATH500 Minerva Olympiad
  --k 1 2 4 8 16 32
  --temperature "${TEMPERATURE:-0.6}"
  --top-p "${TOP_P:-0.95}"
  --top-k "${TOP_K:-0}"
  --max-tokens "${MAX_TOKENS:-2048}"
  --sample-batch-size "${SAMPLE_BATCH_SIZE:-4}"
  --tensor-parallel-size "${TENSOR_PARALLEL_SIZE:-4}"
  --gpu-memory-utilization "${GPU_MEMORY_UTILIZATION:-0.75}"
  --disable-custom-all-reduce
  --dtype "${DTYPE:-auto}"
  --seed "${SEED:-0}"
  --output-dir "${OUTPUT_DIR:-${SCRIPT_DIR}/data}"
)

# exec replaces this shell with the Python process, so signals sent to the
# wrapper's PID are delivered to the evaluator and its exit status is returned
# unchanged.
exec python "${SCRIPT_DIR}/vllm_math_benchmark_eval.py" "${eval_args[@]}" "$@"