Update README.md
Browse files
update sglang deploy cmd
README.md
CHANGED
|
@@ -220,12 +220,10 @@ pip install "sglang[all] @ git+https://github.com/sgl-project/sglang.git"
|
|
| 220 |
```
|
| 221 |
|
| 222 |
2. Launch the server.
|
|
|
|
| 223 |
|
| 224 |
```bash
|
| 225 |
-
|
| 226 |
-
SGLANG_ENABLE_SPEC_V2=1
|
| 227 |
-
python3 -m sglang.launch_server \
|
| 228 |
-
--model-path <MODEL_PATH_OR_HF_ID> \
|
| 229 |
--served-model-name step3p5-flash \
|
| 230 |
--tp-size 8 \
|
| 231 |
--tool-call-parser step3p5 \
|
|
@@ -240,9 +238,7 @@ python3 -m sglang.launch_server \
|
|
| 240 |
```
|
| 241 |
- For fp8 model
|
| 242 |
```bash
|
| 243 |
-
|
| 244 |
-
python3 -m sglang.launch_server \
|
| 245 |
-
--model-path <MODEL_PATH_OR_HF_ID> \
|
| 246 |
--served-model-name step3p5-flash \
|
| 247 |
--tp-size 8 \
|
| 248 |
--ep-size 8 \
|
|
|
|
| 220 |
```
|
| 221 |
|
| 222 |
2. Launch the server.
|
| 223 |
+
- For bf16 model
|
| 224 |
|
| 225 |
```bash
|
| 226 |
+
sglang serve --model-path <MODEL_PATH_OR_HF_ID> \
|
|
|
|
|
|
|
|
|
|
| 227 |
--served-model-name step3p5-flash \
|
| 228 |
--tp-size 8 \
|
| 229 |
--tool-call-parser step3p5 \
|
|
|
|
| 238 |
```
|
| 239 |
- For fp8 model
|
| 240 |
```bash
|
| 241 |
+
sglang serve --model-path <MODEL_PATH_OR_HF_ID> \
|
|
|
|
|
|
|
| 242 |
--served-model-name step3p5-flash \
|
| 243 |
--tp-size 8 \
|
| 244 |
--ep-size 8 \
|