Update README.md
Browse files
README.md
CHANGED
|
@@ -124,15 +124,27 @@ lm_eval --model local-completions \
|
|
| 124 |
--output_path output_data/DeepSeek-R1-MXFP4
|
| 125 |
```
|
| 126 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 127 |
#### GSM8K
|
| 128 |
```
|
| 129 |
-
lm_eval \
|
| 130 |
-
--model
|
| 131 |
-
--model_args pretrained=amd/DeepSeek-R1-MXFP4,dtype=auto,add_bos_token=True,tensor_parallel_size=8,gpu_memory_utilization=0.8,max_model_len=38768, \
|
| 132 |
--tasks gsm8k \
|
| 133 |
-
--num_fewshot
|
| 134 |
--batch_size auto \
|
| 135 |
-
--
|
|
|
|
| 136 |
```
|
| 137 |
|
| 138 |
|
|
|
|
| 124 |
--output_path output_data/DeepSeek-R1-MXFP4
|
| 125 |
```
|
| 126 |
|
| 127 |
+
#### GPQA Diamond
|
| 128 |
+
```
|
| 129 |
+
lm_eval --model local-completions \
|
| 130 |
+
--model_args model=amd/DeepSeek-R1-MXFP4,base_url=http://localhost:30000/v1/completions,num_concurrent=999999,timeout=999999,tokenized_requests=False,max_length=32000,temperature=0.6,top_p=0.95 \
|
| 131 |
+
--tasks gpqa_diamond_cot_zeroshot \
|
| 132 |
+
--num_fewshot 0 \
|
| 133 |
+
--gen_kwargs "do_sample=True,temperature=0.6,top_p=0.95,max_tokens=32000,max_gen_toks=32000" \
|
| 134 |
+
--batch_size auto \
|
| 135 |
+
--log_samples \
|
| 136 |
+
--output_path output_data/DeepSeek-R1-MXFP4
|
| 137 |
+
```
|
| 138 |
+
|
| 139 |
#### GSM8K
|
| 140 |
```
|
| 141 |
+
lm_eval --model local-completions \
|
| 142 |
+
--model_args model=amd/DeepSeek-R1-MXFP4,base_url=http://localhost:30000/v1/completions,num_concurrent=999999,timeout=999999,tokenized_requests=False,max_length=8096 \
|
|
|
|
| 143 |
--tasks gsm8k \
|
| 144 |
+
--num_fewshot 5 \
|
| 145 |
--batch_size auto \
|
| 146 |
+
--log_samples \
|
| 147 |
+
--output_path output_data/DeepSeek-R1-MXFP4
|
| 148 |
```
|
| 149 |
|
| 150 |
|