Debrup-61 committed on
Commit
6c2f67e
·
verified ·
1 Parent(s): 1d804fc

Update README.md

Browse files
Files changed (1) hide show
  1. README.md +1 -1
README.md CHANGED
@@ -52,7 +52,7 @@ vllm serve Raderspace/RaDeR_Qwen25-7B_NuminaMath_MATH_allquerytypes \
52
  --override-pooler-config '{"pooling_type": "LAST", "normalize": true}' \
53
  --gpu-memory-utilization 0.9 \
54
  --api-key abc \
55
- --tokenizer Qwen/Qwen2.5-14B-Instruct \
56
  --port 8001 \
57
  --disable-log-requests \
58
  --max-num-seqs 5000
 
52
  --override-pooler-config '{"pooling_type": "LAST", "normalize": true}' \
53
  --gpu-memory-utilization 0.9 \
54
  --api-key abc \
55
+ --tokenizer Qwen/Qwen2.5-7B-Instruct \
56
  --port 8001 \
57
  --disable-log-requests \
58
  --max-num-seqs 5000