#!/usr/bin/env bash
#
# Run the LiveCodeBench code-generation evaluation for a model.
#
# Usage:
#   <script> [-m MODEL] [-g GPU_IDS] [-n N] [-t TEMPERATURE] [-p TOP_P]
#            [-b BATCH_SIZE] [-k MAX_TOKENS]
#
# Options (each takes exactly one value):
#   -m, --model        value passed to --model and --custom_output_save_name
#   -g, --gpu          value exported as CUDA_VISIBLE_DEVICES for the run
#   -n, --n            value passed to --n
#   -t, --temperature  value passed to --temperature
#   -p, --top_p        value passed to --top_p
#   -b, --batch_size   accepted, but currently not forwarded to the runner
#   -k, --max_tokens   value passed to --max_tokens
#
# The LiveCodeBench directory below is a relative path, so the script must be
# started from a directory that contains it.

set -euo pipefail

# Default values
MODEL_PATH="andrewzh/Absolute_Zero_Reasoner-Coder-7b"
CUDA_GPU_ID="0"
NUM_GPUS=1 # no command-line flag; passed as --tensor_parallel_size
# NOTE(review): BATCH_SIZE can be set with -b/--batch_size but is never passed
# to the runner below -- confirm whether it should be forwarded or removed.
BATCH_SIZE=128
N=1
TEMPERATURE=0.0
TOP_P=1.0
MAX_TOKENS=8096

LCB_DIR="evaluation/code_eval/coding/LiveCodeBench"

# Print an error message to stderr and exit with a usage-error status.
die() {
  printf 'error: %s\n' "$*" >&2
  exit 2
}

# Abort unless the option named in $1 is followed by a value.
# $2 is the number of positional parameters still unparsed (including $1).
# Without this guard, `shift 2` on a trailing flag fails without shifting and
# the parsing loop would never terminate.
require_value() {
  if (($2 < 2)); then
    die "option '$1' requires a value"
  fi
}

# Parse command-line arguments
while [[ $# -gt 0 ]]; do
  case "$1" in
    -m | --model)
      require_value "$1" "$#"
      MODEL_PATH="$2"
      shift 2
      ;;
    -g | --gpu)
      require_value "$1" "$#"
      CUDA_GPU_ID="$2"
      shift 2
      ;;
    -n | --n)
      require_value "$1" "$#"
      N="$2"
      shift 2
      ;;
    -t | --temperature)
      require_value "$1" "$#"
      TEMPERATURE="$2"
      shift 2
      ;;
    -p | --top_p)
      require_value "$1" "$#"
      TOP_P="$2"
      shift 2
      ;;
    -b | --batch_size)
      require_value "$1" "$#"
      BATCH_SIZE="$2"
      shift 2
      ;;
    -k | --max_tokens)
      require_value "$1" "$#"
      MAX_TOKENS="$2"
      shift 2
      ;;
    *)
      # Unknown arguments are still skipped, but no longer silently.
      printf 'warning: ignoring unknown argument: %s\n' "$1" >&2
      shift
      ;;
  esac
done

# Never launch the runner from the wrong directory.
cd "$LCB_DIR" || {
  printf 'error: cannot cd to %s\n' "$LCB_DIR" >&2
  exit 1
}

# Run LiveCodeBench with the AZR template and a local model.
# Arguments are kept in an array so every value reaches the runner as exactly
# one word, even if it contains spaces or glob characters.
runner_args=(
  --model "$MODEL_PATH"
  --trust_remote_code
  --scenario codegeneration
  --release_version release_v6
  --tensor_parallel_size "$NUM_GPUS"
  --use_cache
  --n "$N"
  --temperature "$TEMPERATURE"
  --max_tokens "$MAX_TOKENS"
  --custom_output_save_name "$MODEL_PATH"
  --top_p "$TOP_P"
  --timeout 60
  --evaluate --continue_existing --continue_existing_with_eval
)

CUDA_VISIBLE_DEVICES="$CUDA_GPU_ID" python -m lcb_runner.runner.main "${runner_args[@]}"