LFM2-350M-Extract-MNN / config.json
cyberfly
Add LFM2-350M MNN model files and inference script
c1e1bf3
raw
history blame contribute delete
502 Bytes
{
"llm_model": "llm.mnn",
"llm_weight": "llm.mnn.weight",
"backend_type": "cpu",
"thread_num": 4,
"precision": "low",
"memory": "low",
"sampler_type": "mixed",
"temperature": 0.8,
"top_k": 40,
"top_p": 0.9,
"min_p": 0.05,
"tfs_z": 1.0,
"typical": 0.95,
"repetition_penalty": 1.0,
"presence_penalty": 0.0,
"frequency_penalty": 0.0,
"penalty_window": 0,
"n_gram": 8,
"ngram_factor": 1.0,
"tokenizer_file": "tokenizer.mtok"
}