Luigi committed on
Commit
98badf8
·
1 Parent(s): bae5a29

fix: Sync TQ1_0 settings with official ERNIE 4.5 specs

Browse files

- Updated default_temperature: 0.6 -> 0.8 (matches UI display)
- Updated inference_settings to match official ERNIE 4.5:
  - temperature: 0.3 -> 0.8
  - top_p: 0.9 -> 0.95
  - top_k: 30 -> 40
  - repeat_penalty: 1.15 -> 1.1
- Now both UI and generation use consistent values

Files changed (1) hide show
  1. app.py +5 -5
app.py CHANGED
@@ -209,13 +209,13 @@ AVAILABLE_MODELS = {
209
  "repo_id": "unsloth/ERNIE-4.5-21B-A3B-Thinking-GGUF",
210
  "filename": "*TQ1_0.gguf",
211
  "max_context": 131072,
212
- "default_temperature": 0.6,
213
  "supports_toggle": False, # Thinking-only mode
214
  "inference_settings": {
215
- "temperature": 0.3,
216
- "top_p": 0.9,
217
- "top_k": 30,
218
- "repeat_penalty": 1.15,
219
  },
220
  },
221
  "ernie_21b_thinking_q2": {
 
209
  "repo_id": "unsloth/ERNIE-4.5-21B-A3B-Thinking-GGUF",
210
  "filename": "*TQ1_0.gguf",
211
  "max_context": 131072,
212
+ "default_temperature": 0.8,
213
  "supports_toggle": False, # Thinking-only mode
214
  "inference_settings": {
215
+ "temperature": 0.8,
216
+ "top_p": 0.95,
217
+ "top_k": 40,
218
+ "repeat_penalty": 1.1,
219
  },
220
  },
221
  "ernie_21b_thinking_q2": {