Upload README.md with huggingface_hub
Browse files
README.md
CHANGED
|
@@ -170,7 +170,7 @@ def main():
|
|
| 170 |
llm = sgl.Engine(
|
| 171 |
model_path="Qwen/Qwen3-Coder-Next-FP8",
|
| 172 |
speculative_draft_model_path="togethercomputer/Aurora-Spec-Qwen3-Coder-Next-FP8",
|
| 173 |
-
speculative_algorithm="
|
| 174 |
speculative_num_steps=5,
|
| 175 |
speculative_eagle_topk=1,
|
| 176 |
speculative_num_draft_tokens=6,
|
|
@@ -199,7 +199,7 @@ if __name__ == "__main__":
|
|
| 199 |
python -m sglang.launch_server \
|
| 200 |
--model-path Qwen/Qwen3-Coder-Next-FP8 \
|
| 201 |
--speculative-draft-model-path togethercomputer/Aurora-Spec-Qwen3-Coder-Next-FP8 \
|
| 202 |
-
--speculative-algorithm
|
| 203 |
--speculative-num-steps 5 \
|
| 204 |
--speculative-eagle-topk 1 \
|
| 205 |
--speculative-num-draft-tokens 6 \
|
|
@@ -259,7 +259,7 @@ If you have downloaded the models locally, replace the HuggingFace model paths w
|
|
| 259 |
python -m sglang.launch_server \
|
| 260 |
--model-path /path/to/Qwen3-Coder-Next-FP8 \
|
| 261 |
--speculative-draft-model-path /path/to/Aurora-Spec-Qwen3-Coder-Next-FP8 \
|
| 262 |
-
--speculative-algorithm
|
| 263 |
--speculative-num-steps 5 \
|
| 264 |
--speculative-eagle-topk 1 \
|
| 265 |
--speculative-num-draft-tokens 6 \
|
|
|
|
| 170 |
llm = sgl.Engine(
|
| 171 |
model_path="Qwen/Qwen3-Coder-Next-FP8",
|
| 172 |
speculative_draft_model_path="togethercomputer/Aurora-Spec-Qwen3-Coder-Next-FP8",
|
| 173 |
+
speculative_algorithm="EAGLE3",
|
| 174 |
speculative_num_steps=5,
|
| 175 |
speculative_eagle_topk=1,
|
| 176 |
speculative_num_draft_tokens=6,
|
|
|
|
| 199 |
python -m sglang.launch_server \
|
| 200 |
--model-path Qwen/Qwen3-Coder-Next-FP8 \
|
| 201 |
--speculative-draft-model-path togethercomputer/Aurora-Spec-Qwen3-Coder-Next-FP8 \
|
| 202 |
+
--speculative-algorithm EAGLE3 \
|
| 203 |
--speculative-num-steps 5 \
|
| 204 |
--speculative-eagle-topk 1 \
|
| 205 |
--speculative-num-draft-tokens 6 \
|
|
|
|
| 259 |
python -m sglang.launch_server \
|
| 260 |
--model-path /path/to/Qwen3-Coder-Next-FP8 \
|
| 261 |
--speculative-draft-model-path /path/to/Aurora-Spec-Qwen3-Coder-Next-FP8 \
|
| 262 |
+
--speculative-algorithm EAGLE3 \
|
| 263 |
--speculative-num-steps 5 \
|
| 264 |
--speculative-eagle-topk 1 \
|
| 265 |
--speculative-num-draft-tokens 6 \
|