frankenstallm / sampling_config.json
pathcosmos's picture
Upload folder using huggingface_hub (#41)
efd2986
raw
history blame contribute delete
981 Bytes
{
"description": "FRANKENSTALLM 3B v2 sampling/generation parameters (ORPO eval grid best)",
"default": {
"max_new_tokens": 512,
"temperature": 0.8,
"top_p": 0.9,
"do_sample": true,
"repetition_penalty": 1.05
},
"recommended": {
"comment": "ORPO repetition grid best: t0.7_rep1.2 (0% 3-gram rep, 100% EOS)",
"temperature": 0.7,
"repetition_penalty": 1.2,
"top_p": 0.9,
"max_new_tokens": 512,
"do_sample": true
},
"greedy": {
"temperature": 0.0,
"repetition_penalty": 1.0,
"do_sample": false,
"max_new_tokens": 256
},
"ollama": {
"comment": "Ollama Modelfile PARAMETERS or runtime options",
"temperature": 0.7,
"repeat_penalty": 1.2,
"top_p": 0.9,
"num_predict": 512
},
"grid_best": {
"name": "t0.7_rep1.2",
"temperature": 0.70,
"repetition_penalty": 1.20,
"top_p": 0.9,
"3gram_rep": 0.0,
"4gram_rep": 0.0,
"eos_rate": 1.0,
"avg_tokens": 189.2
}
}