Update README.md
Browse files
README.md
CHANGED
|
@@ -246,7 +246,7 @@ The results were obtained using the following commands:
|
|
| 246 |
```
|
| 247 |
lm_eval \
|
| 248 |
--model vllm \
|
| 249 |
-
--model_args pretrained="neuralmagic/
|
| 250 |
--tasks mmlu_llama_3.1_instruct \
|
| 251 |
--fewshot_as_multiturn \
|
| 252 |
--apply_chat_template \
|
|
@@ -258,7 +258,7 @@ lm_eval \
|
|
| 258 |
```
|
| 259 |
lm_eval \
|
| 260 |
--model vllm \
|
| 261 |
-
--model_args pretrained="neuralmagic/
|
| 262 |
--tasks mmlu_cot_0shot_llama_3.1_instruct \
|
| 263 |
--apply_chat_template \
|
| 264 |
--num_fewshot 0 \
|
|
@@ -269,7 +269,7 @@ lm_eval \
|
|
| 269 |
```
|
| 270 |
lm_eval \
|
| 271 |
--model vllm \
|
| 272 |
-
--model_args pretrained="neuralmagic/
|
| 273 |
--tasks arc_challenge_llama_3.1_instruct \
|
| 274 |
--apply_chat_template \
|
| 275 |
--num_fewshot 0 \
|
|
@@ -280,7 +280,7 @@ lm_eval \
|
|
| 280 |
```
|
| 281 |
lm_eval \
|
| 282 |
--model vllm \
|
| 283 |
-
--model_args pretrained="neuralmagic/
|
| 284 |
--tasks gsm8k_cot_llama_3.1_instruct \
|
| 285 |
--fewshot_as_multiturn \
|
| 286 |
--apply_chat_template \
|
|
@@ -292,7 +292,7 @@ lm_eval \
|
|
| 292 |
```
|
| 293 |
lm_eval \
|
| 294 |
--model vllm \
|
| 295 |
-
--model_args pretrained="neuralmagic/
|
| 296 |
--tasks hellaswag \
|
| 297 |
--num_fewshot 10 \
|
| 298 |
--batch_size auto
|
|
@@ -302,7 +302,7 @@ lm_eval \
|
|
| 302 |
```
|
| 303 |
lm_eval \
|
| 304 |
--model vllm \
|
| 305 |
-
--model_args pretrained="neuralmagic/
|
| 306 |
--tasks winogrande \
|
| 307 |
--num_fewshot 5 \
|
| 308 |
--batch_size auto
|
|
@@ -312,7 +312,7 @@ lm_eval \
|
|
| 312 |
```
|
| 313 |
lm_eval \
|
| 314 |
--model vllm \
|
| 315 |
-
--model_args pretrained="neuralmagic/
|
| 316 |
--tasks truthfulqa \
|
| 317 |
--num_fewshot 0 \
|
| 318 |
--batch_size auto
|
|
|
|
| 246 |
```
|
| 247 |
lm_eval \
|
| 248 |
--model vllm \
|
| 249 |
+
--model_args pretrained="neuralmagic/Llama-3.2-1B-Instruct-FP8-dynamic",dtype=auto,add_bos_token=True,max_model_len=3850,max_gen_toks=10,tensor_parallel_size=1 \
|
| 250 |
--tasks mmlu_llama_3.1_instruct \
|
| 251 |
--fewshot_as_multiturn \
|
| 252 |
--apply_chat_template \
|
|
|
|
| 258 |
```
|
| 259 |
lm_eval \
|
| 260 |
--model vllm \
|
| 261 |
+
--model_args pretrained="neuralmagic/Llama-3.2-1B-Instruct-FP8-dynamic",dtype=auto,max_model_len=4064,max_gen_toks=1024,tensor_parallel_size=1 \
|
| 262 |
--tasks mmlu_cot_0shot_llama_3.1_instruct \
|
| 263 |
--apply_chat_template \
|
| 264 |
--num_fewshot 0 \
|
|
|
|
| 269 |
```
|
| 270 |
lm_eval \
|
| 271 |
--model vllm \
|
| 272 |
+
--model_args pretrained="neuralmagic/Llama-3.2-1B-Instruct-FP8-dynamic",dtype=auto,max_model_len=3940,max_gen_toks=100,tensor_parallel_size=1 \
|
| 273 |
--tasks arc_challenge_llama_3.1_instruct \
|
| 274 |
--apply_chat_template \
|
| 275 |
--num_fewshot 0 \
|
|
|
|
| 280 |
```
|
| 281 |
lm_eval \
|
| 282 |
--model vllm \
|
| 283 |
+
--model_args pretrained="neuralmagic/Llama-3.2-1B-Instruct-FP8-dynamic",dtype=auto,max_model_len=4096,max_gen_toks=1024,tensor_parallel_size=1 \
|
| 284 |
--tasks gsm8k_cot_llama_3.1_instruct \
|
| 285 |
--fewshot_as_multiturn \
|
| 286 |
--apply_chat_template \
|
|
|
|
| 292 |
```
|
| 293 |
lm_eval \
|
| 294 |
--model vllm \
|
| 295 |
+
--model_args pretrained="neuralmagic/Llama-3.2-1B-Instruct-FP8-dynamic",dtype=auto,add_bos_token=True,max_model_len=4096,tensor_parallel_size=1 \
|
| 296 |
--tasks hellaswag \
|
| 297 |
--num_fewshot 10 \
|
| 298 |
--batch_size auto
|
|
|
|
| 302 |
```
|
| 303 |
lm_eval \
|
| 304 |
--model vllm \
|
| 305 |
+
--model_args pretrained="neuralmagic/Llama-3.2-1B-Instruct-FP8-dynamic",dtype=auto,add_bos_token=True,max_model_len=4096,tensor_parallel_size=1 \
|
| 306 |
--tasks winogrande \
|
| 307 |
--num_fewshot 5 \
|
| 308 |
--batch_size auto
|
|
|
|
| 312 |
```
|
| 313 |
lm_eval \
|
| 314 |
--model vllm \
|
| 315 |
+
--model_args pretrained="neuralmagic/Llama-3.2-1B-Instruct-FP8-dynamic",dtype=auto,add_bos_token=True,max_model_len=4096,tensor_parallel_size=1 \
|
| 316 |
--tasks truthfulqa \
|
| 317 |
--num_fewshot 0 \
|
| 318 |
--batch_size auto
|