Update README.md
Browse files
README.md
CHANGED
|
@@ -217,7 +217,7 @@ The results were obtained using the following commands:
|
|
| 217 |
```
|
| 218 |
lm_eval --model local-chat-completions \
|
| 219 |
--tasks mmlu_pro \
|
| 220 |
-
--model_args "model=RedHatAI/
|
| 221 |
--num_fewshot 5 \
|
| 222 |
--apply_chat_template \
|
| 223 |
--fewshot_as_multiturn \
|
|
@@ -228,7 +228,7 @@ lm_eval --model local-chat-completions \
|
|
| 228 |
|
| 229 |
lm_eval --model local-chat-completions \
|
| 230 |
--tasks leaderboard_ifeval \
|
| 231 |
-
--model_args "model=RedHatAI/
|
| 232 |
--num_fewshot 5 \
|
| 233 |
--apply_chat_template \
|
| 234 |
--fewshot_as_multiturn \
|
|
@@ -244,7 +244,7 @@ litellm_config.yaml:
|
|
| 244 |
|
| 245 |
model_parameters:
|
| 246 |
provider: "hosted_vllm"
|
| 247 |
-
model_name: "hosted_vllm/
|
| 248 |
base_url: "http://0.0.0.0:3759/v1"
|
| 249 |
api_key: ""
|
| 250 |
timeout: 3600
|
|
|
|
| 217 |
```
|
| 218 |
lm_eval --model local-chat-completions \
|
| 219 |
--tasks mmlu_pro \
|
| 220 |
+
--model_args "model=RedHatAI/GLM-4.6-NVFP4,max_length=90000,base_url=http://0.0.0.0:3758/v1/chat/completions,num_concurrent=128,max_retries=3,tokenized_requests=False,tokenizer_backend=None,timeout=1200" \
|
| 221 |
--num_fewshot 5 \
|
| 222 |
--apply_chat_template \
|
| 223 |
--fewshot_as_multiturn \
|
|
|
|
| 228 |
|
| 229 |
lm_eval --model local-chat-completions \
|
| 230 |
--tasks leaderboard_ifeval \
|
| 231 |
+
--model_args "model=RedHatAI/GLM-4.6-NVFP4,max_length=90000,base_url=http://0.0.0.0:3758/v1/chat/completions,num_concurrent=128,max_retries=3,tokenized_requests=False,tokenizer_backend=None,timeout=1200" \
|
| 232 |
--num_fewshot 5 \
|
| 233 |
--apply_chat_template \
|
| 234 |
--fewshot_as_multiturn \
|
|
|
|
| 244 |
|
| 245 |
model_parameters:
|
| 246 |
provider: "hosted_vllm"
|
| 247 |
+
model_name: "hosted_vllm/redhatai-glm-4.6-nvfp4"
|
| 248 |
base_url: "http://0.0.0.0:3759/v1"
|
| 249 |
api_key: ""
|
| 250 |
timeout: 3600
|