Create README.md
Browse files
README.md
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
```bash
|
| 2 |
+
vllm serve nvidia/NVIDIA-Nemotron-3-Nano-30B-A3B-BF16 \
|
| 3 |
+
--max-num-seqs 8 \
|
| 4 |
+
--tensor-parallel-size 1 \
|
| 5 |
+
--max-model-len 262144 \
|
| 6 |
+
--port 8000 \
|
| 7 |
+
--trust-remote-code \
|
| 8 |
+
--enable-auto-tool-choice \
|
| 9 |
+
--tool-call-parser qwen3_coder \
|
| 10 |
+
--reasoning-parser-plugin nano_v3_reasoning_parser.py \
|
| 11 |
+
--reasoning-parser nano_v3
|
| 12 |
+
```
|