Update README.md
Browse files
README.md
CHANGED
|
@@ -52,7 +52,7 @@ vllm serve Raderspace/RaDeR_Qwen25-7B_NuminaMath_MATH_allquerytypes \
|
|
| 52 |
--override-pooler-config '{"pooling_type": "LAST", "normalize": true}' \
|
| 53 |
--gpu-memory-utilization 0.9 \
|
| 54 |
--api-key abc \
|
| 55 |
-
--tokenizer Qwen/Qwen2.5-
|
| 56 |
--port 8001 \
|
| 57 |
--disable-log-requests \
|
| 58 |
--max-num-seqs 5000
|
|
|
|
| 52 |
--override-pooler-config '{"pooling_type": "LAST", "normalize": true}' \
|
| 53 |
--gpu-memory-utilization 0.9 \
|
| 54 |
--api-key abc \
|
| 55 |
+
--tokenizer Qwen/Qwen2.5-7B-Instruct \
|
| 56 |
--port 8001 \
|
| 57 |
--disable-log-requests \
|
| 58 |
--max-num-seqs 5000
|