sampling_config.json · pathcosmos/frankenstallm at main

frankenstallm / sampling_config.json

Upload folder using huggingface_hub (#41)

efd2986 6 days ago

981 Bytes

	{
	"description": "FRANKENSTALLM 3B v2 sampling/generation parameters (ORPO eval grid best)",
	"default": {
	"max_new_tokens": 512,
	"temperature": 0.8,
	"top_p": 0.9,
	"do_sample": true,
	"repetition_penalty": 1.05
	},
	"recommended": {
	"comment": "ORPO repetition grid best: t0.7_rep1.2 (0% 3-gram rep, 100% EOS)",
	"temperature": 0.7,
	"repetition_penalty": 1.2,
	"top_p": 0.9,
	"max_new_tokens": 512,
	"do_sample": true
	},
	"greedy": {
	"temperature": 0.0,
	"repetition_penalty": 1.0,
	"do_sample": false,
	"max_new_tokens": 256
	},
	"ollama": {
	"comment": "Ollama Modelfile PARAMETERS or runtime options",
	"temperature": 0.7,
	"repeat_penalty": 1.2,
	"top_p": 0.9,
	"num_predict": 512
	},
	"grid_best": {
	"name": "t0.7_rep1.2",
	"temperature": 0.70,
	"repetition_penalty": 1.20,
	"top_p": 0.9,
	"3gram_rep": 0.0,
	"4gram_rep": 0.0,
	"eos_rate": 1.0,
	"avg_tokens": 189.2
	}
	}