ggerganov HF Staff committed on
Commit
3e4b4d8
·
verified ·
1 Parent(s): 8afd2c6

presets : add GLM4.7 flash without thinking

Browse files
Files changed (1) hide show
  1. preset.ini +10 -1
preset.ini CHANGED
@@ -165,7 +165,16 @@ batch-size = 4096
165
  ubatch-size = 4096
166
  top-p = 0.95
167
  top-k = 0
168
- min-p = 0.01
 
 
 
 
 
 
 
 
 
169
  temp = 1.0
170
 
171
  [nemotron-nano-3-30b-hf]
 
165
  ubatch-size = 4096
166
  top-p = 0.95
167
  top-k = 0
168
+ temp = 0.2
169
+ chat-template-kwargs = {"enable_thinking": false}
170
+
171
+ [glm-4.7-flash-hf-thinking]
172
+ hf = ggml-org/GLM-4.7-Flash-GGUF:Q8_0
173
+ ctx-size = 202752
174
+ batch-size = 4096
175
+ ubatch-size = 4096
176
+ top-p = 0.95
177
+ top-k = 0
178
  temp = 1.0
179
 
180
  [nemotron-nano-3-30b-hf]