Heewon Oh Claude Opus 4.6 committed on
Commit
90d4f5a
·
1 Parent(s): 1c0fe42

fix(runpod): align sampling params with model card (top_k=40, top_p=0.95, rep=1.0)

Browse files
Files changed (1) hide show
  1. vela/tools/runpod_client.py +3 -3
vela/tools/runpod_client.py CHANGED
@@ -78,9 +78,9 @@ class RunPodClient:
78
  "max_tokens": max_tokens,
79
  "temperature": temperature,
80
  # vLLM์€ generation_config.json์„ ์ž๋™ ์ ์šฉํ•˜์ง€ ์•Š์œผ๋ฏ€๋กœ ๋ช…์‹œ์  ์ „๋‹ฌ
81
- "top_k": 20,
82
- "top_p": 0.8,
83
- "repetition_penalty": 1.1,
84
  }
85
  if stop:
86
  sampling_params["stop"] = stop
 
78
  "max_tokens": max_tokens,
79
  "temperature": temperature,
80
  # vLLM์€ generation_config.json์„ ์ž๋™ ์ ์šฉํ•˜์ง€ ์•Š์œผ๋ฏ€๋กœ ๋ช…์‹œ์  ์ „๋‹ฌ
81
+ "top_k": 40,
82
+ "top_p": 0.95,
83
+ "repetition_penalty": 1.0,
84
  }
85
  if stop:
86
  sampling_params["stop"] = stop