Spaces:
Running
Running
Heewon Oh Claude Opus 4.6 committed on
Commit ·
90d4f5a
1
Parent(s): 1c0fe42
fix(runpod): align sampling params with model card (top_k=40, top_p=0.95, rep=1.0)
Browse files
vela/tools/runpod_client.py
CHANGED
|
@@ -78,9 +78,9 @@ class RunPodClient:
|
|
| 78 |
"max_tokens": max_tokens,
|
| 79 |
"temperature": temperature,
|
| 80 |
# vLLM does not apply generation_config.json automatically, so pass these explicitly
|
| 81 |
-
"top_k":
|
| 82 |
-
"top_p": 0.
|
| 83 |
-
"repetition_penalty": 1.
|
| 84 |
}
|
| 85 |
if stop:
|
| 86 |
sampling_params["stop"] = stop
|
|
|
|
| 78 |
"max_tokens": max_tokens,
|
| 79 |
"temperature": temperature,
|
| 80 |
# vLLM does not apply generation_config.json automatically, so pass these explicitly
|
| 81 |
+
"top_k": 40,
|
| 82 |
+
"top_p": 0.95,
|
| 83 |
+
"repetition_penalty": 1.0,
|
| 84 |
}
|
| 85 |
if stop:
|
| 86 |
sampling_params["stop"] = stop
|