Update README.md
Browse files
README.md
CHANGED
|
@@ -25,7 +25,7 @@ sampling_params = SamplingParams(
|
|
| 25 |
temperature=0.80, top_p=0.95, max_tokens=40, min_tokens=10
|
| 26 |
)
|
| 27 |
llm = LLM(
|
| 28 |
-
"
|
| 29 |
tensor_parallel_size=4,
|
| 30 |
max_model_len=4096,
|
| 31 |
enforce_eager=True,
|
|
|
|
| 25 |
temperature=0.80, top_p=0.95, max_tokens=40, min_tokens=10
|
| 26 |
)
|
| 27 |
llm = LLM(
|
| 28 |
+
"inference-optimization/DeepSeek-R1-NVFP4-FP8-BLOCK",
|
| 29 |
tensor_parallel_size=4,
|
| 30 |
max_model_len=4096,
|
| 31 |
enforce_eager=True,
|