presets : add GLM4.7 flash without thinking
Browse files - preset.ini +10 -1
preset.ini
CHANGED
|
@@ -165,7 +165,16 @@ batch-size = 4096
|
|
| 165 |
ubatch-size = 4096
|
| 166 |
top-p = 0.95
|
| 167 |
top-k = 0
|
| 168 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 169 |
temp = 1.0
|
| 170 |
|
| 171 |
[nemotron-nano-3-30b-hf]
|
|
|
|
| 165 |
ubatch-size = 4096
|
| 166 |
top-p = 0.95
|
| 167 |
top-k = 0
|
| 168 |
+
temp = 0.2
|
| 169 |
+
chat-template-kwargs = {"enable_thinking": false}
|
| 170 |
+
|
| 171 |
+
[glm-4.7-flash-hf-thinking]
|
| 172 |
+
hf = ggml-org/GLM-4.7-Flash-GGUF:Q8_0
|
| 173 |
+
ctx-size = 202752
|
| 174 |
+
batch-size = 4096
|
| 175 |
+
ubatch-size = 4096
|
| 176 |
+
top-p = 0.95
|
| 177 |
+
top-k = 0
|
| 178 |
temp = 1.0
|
| 179 |
|
| 180 |
[nemotron-nano-3-30b-hf]
|