Luigi committed on
Commit
bae5a29
·
1 Parent(s): d335258

fix: Use official ERNIE 4.5 generation settings

Browse files

- Updated temperature: 0.3 -> 0.8 (per PaddlePaddle/ERNIE docs); default_temperature: 0.6 -> 0.8 to match
- Updated top_p: 0.9 -> 0.95 (per official recommendation)
- Updated top_k: 30 -> 40 (more exploration)
- Reduced repeat_penalty: 1.15 -> 1.1 (less restrictive)
- Reference: https://github.com/PaddlePaddle/ERNIE#offline-inference

Files changed (1) hide show
  1. app.py +5 -5
app.py CHANGED
@@ -223,13 +223,13 @@ AVAILABLE_MODELS = {
223
  "repo_id": "mradermacher/ERNIE-4.5-21B-A3B-Thinking-i1-GGUF",
224
  "filename": "*IQ3_XXS.gguf",
225
  "max_context": 131072,
226
- "default_temperature": 0.6,
227
  "supports_toggle": False,
228
  "inference_settings": {
229
- "temperature": 0.3,
230
- "top_p": 0.9,
231
- "top_k": 30,
232
- "repeat_penalty": 1.15,
233
  },
234
  },
235
  }
 
223
  "repo_id": "mradermacher/ERNIE-4.5-21B-A3B-Thinking-i1-GGUF",
224
  "filename": "*IQ3_XXS.gguf",
225
  "max_context": 131072,
226
+ "default_temperature": 0.8,
227
  "supports_toggle": False,
228
  "inference_settings": {
229
+ "temperature": 0.8,
230
+ "top_p": 0.95,
231
+ "top_k": 40,
232
+ "repeat_penalty": 1.1,
233
  },
234
  },
235
  }