Commit ·
efd2986
1
Parent(s): 9469fb1
Upload folder using huggingface_hub (#41)
Browse files
- Upload folder using huggingface_hub (bcb770fab8872fb48957551e84d33e53cd9e3637)
Co-authored-by: pathcosmos <somebody-to-love@users.noreply.huggingface.co>
- sampling_config.json +41 -0
sampling_config.json
ADDED
|
@@ -0,0 +1,41 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"description": "FRANKENSTALLM 3B v2 sampling/generation parameters (ORPO eval grid best)",
|
| 3 |
+
"default": {
|
| 4 |
+
"max_new_tokens": 512,
|
| 5 |
+
"temperature": 0.8,
|
| 6 |
+
"top_p": 0.9,
|
| 7 |
+
"do_sample": true,
|
| 8 |
+
"repetition_penalty": 1.05
|
| 9 |
+
},
|
| 10 |
+
"recommended": {
|
| 11 |
+
"comment": "ORPO repetition grid best: t0.7_rep1.2 (0% 3-gram rep, 100% EOS)",
|
| 12 |
+
"temperature": 0.7,
|
| 13 |
+
"repetition_penalty": 1.2,
|
| 14 |
+
"top_p": 0.9,
|
| 15 |
+
"max_new_tokens": 512,
|
| 16 |
+
"do_sample": true
|
| 17 |
+
},
|
| 18 |
+
"greedy": {
|
| 19 |
+
"temperature": 0.0,
|
| 20 |
+
"repetition_penalty": 1.0,
|
| 21 |
+
"do_sample": false,
|
| 22 |
+
"max_new_tokens": 256
|
| 23 |
+
},
|
| 24 |
+
"ollama": {
|
| 25 |
+
"comment": "Ollama Modelfile PARAMETER instructions or runtime options",
|
| 26 |
+
"temperature": 0.7,
|
| 27 |
+
"repeat_penalty": 1.2,
|
| 28 |
+
"top_p": 0.9,
|
| 29 |
+
"num_predict": 512
|
| 30 |
+
},
|
| 31 |
+
"grid_best": {
|
| 32 |
+
"name": "t0.7_rep1.2",
|
| 33 |
+
"temperature": 0.70,
|
| 34 |
+
"repetition_penalty": 1.20,
|
| 35 |
+
"top_p": 0.9,
|
| 36 |
+
"3gram_rep": 0.0,
|
| 37 |
+
"4gram_rep": 0.0,
|
| 38 |
+
"eos_rate": 1.0,
|
| 39 |
+
"avg_tokens": 189.2
|
| 40 |
+
}
|
| 41 |
+
}
|