WhoIsShe's picture
Add MNN 4-bit quantized model with Model Card
52855b8 verified
{
"path": "/content/models/DS-R1-Qwen3-8B-ArliAI-RpR-v4-Small",
"type": null,
"tokenizer_path": "/content/models/DS-R1-Qwen3-8B-ArliAI-RpR-v4-Small",
"eagle_path": null,
"lora_path": null,
"gptq_path": null,
"dst_path": "/kaggle/working/mnn_output",
"verbose": true,
"test": null,
"export": "mnn",
"onnx_slim": false,
"quant_bit": 4,
"quant_block": 64,
"visual_quant_bit": null,
"visual_quant_block": null,
"lm_quant_bit": 4,
"lm_quant_block": 64,
"mnnconvert": "../../../build/MNNConvert",
"ppl": false,
"awq": false,
"hqq": false,
"omni": false,
"transformer_fuse": false,
"group_conv_native": false,
"smooth": false,
"sym": false,
"visual_sym": false,
"seperate_embed": false,
"lora_split": false,
"calib_data": null,
"act_bit": 16,
"embed_bit": 16,
"act_sym": false,
"generate_for_npu": false,
"skip_weight": false,
"omni_epochs": 20,
"omni_lr": 0.005,
"omni_wd": 0.0001,
"tie_word_embeddings": false
}