Spaces:
Running
Running
fix: Sync TQ1_0 settings with official ERNIE 4.5 specs
Browse files
- Updated default_temperature: 0.6 -> 0.8 (matches UI display)
- Updated inference_settings to match official ERNIE 4.5:
  - temperature: 0.3 -> 0.8
  - top_p: 0.9 -> 0.95
  - top_k: 30 -> 40
  - repeat_penalty: 1.15 -> 1.1
- Now both UI and generation use consistent values
app.py
CHANGED
|
@@ -209,13 +209,13 @@ AVAILABLE_MODELS = {
|
|
| 209 |
"repo_id": "unsloth/ERNIE-4.5-21B-A3B-Thinking-GGUF",
|
| 210 |
"filename": "*TQ1_0.gguf",
|
| 211 |
"max_context": 131072,
|
| 212 |
-
"default_temperature": 0.6,
|
| 213 |
"supports_toggle": False, # Thinking-only mode
|
| 214 |
"inference_settings": {
|
| 215 |
-
"temperature": 0.3,
|
| 216 |
-
"top_p": 0.9,
|
| 217 |
-
"top_k": 30,
|
| 218 |
-
"repeat_penalty": 1.15,
|
| 219 |
},
|
| 220 |
},
|
| 221 |
"ernie_21b_thinking_q2": {
|
|
|
|
| 209 |
"repo_id": "unsloth/ERNIE-4.5-21B-A3B-Thinking-GGUF",
|
| 210 |
"filename": "*TQ1_0.gguf",
|
| 211 |
"max_context": 131072,
|
| 212 |
+
"default_temperature": 0.8,
|
| 213 |
"supports_toggle": False, # Thinking-only mode
|
| 214 |
"inference_settings": {
|
| 215 |
+
"temperature": 0.8,
|
| 216 |
+
"top_p": 0.95,
|
| 217 |
+
"top_k": 40,
|
| 218 |
+
"repeat_penalty": 1.1,
|
| 219 |
},
|
| 220 |
},
|
| 221 |
"ernie_21b_thinking_q2": {
|