Update README.md
Browse files
README.md
CHANGED
|
@@ -83,20 +83,12 @@ The GSM8K results were obtained using the lm-eval framework, based on the Docker
|
|
| 83 |
```
|
| 84 |
export VLLM_ROCM_USE_AITER=1
|
| 85 |
|
| 86 |
-
export
|
| 87 |
log_file=minimax25-lm_eval_gsm8k_mxfp4.txt
|
| 88 |
|
| 89 |
-
lm_eval --model vllm --model_args pretrained=$
|
| 90 |
--gen_kwargs temperature=1.0,top_p=0.95,top_k=40 \
|
| 91 |
--tasks gsm8k --num_fewshot 8 2>&1 | tee $log_file
|
| 92 |
-
|
| 93 |
-
|
| 94 |
-
export model_dir=MiniMaxAI/MiniMax-M2.5/
|
| 95 |
-
log_file=minimax25-lm_eval_gsm8k.txt
|
| 96 |
-
|
| 97 |
-
lm_eval --model vllm --model_args pretrained=$model_dir,enforce_eager=True,tensor_parallel_size=8,trust_remote_code=True,max_model_len=16384 \
|
| 98 |
-
--gen_kwargs temperature=0.8,top_p=0.95,top_k=40 \
|
| 99 |
-
--tasks gsm8k --num_fewshot 8 2>&1 | tee $log_file
|
| 100 |
```
|
| 101 |
|
| 102 |
|
|
|
|
| 83 |
```
|
| 84 |
export VLLM_ROCM_USE_AITER=1
|
| 85 |
|
| 86 |
+
export model_dir=MiniMaxAI/MiniMax-M2.5-mxfp4/
|
| 87 |
log_file=minimax25-lm_eval_gsm8k_mxfp4.txt
|
| 88 |
|
| 89 |
+
lm_eval --model vllm --model_args pretrained=$model_dir,enforce_eager=True,trust_remote_code=True,max_model_len=16384 \
|
| 90 |
--gen_kwargs temperature=1.0,top_p=0.95,top_k=40 \
|
| 91 |
--tasks gsm8k --num_fewshot 8 2>&1 | tee $log_file
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 92 |
```
|
| 93 |
|
| 94 |
|