Add MNN 4-bit quantized model with Model Card

52855b8 verified 13 days ago

1.06 kB

	{
	"path": "/content/models/DS-R1-Qwen3-8B-ArliAI-RpR-v4-Small",
	"type": null,
	"tokenizer_path": "/content/models/DS-R1-Qwen3-8B-ArliAI-RpR-v4-Small",
	"eagle_path": null,
	"lora_path": null,
	"gptq_path": null,
	"dst_path": "/kaggle/working/mnn_output",
	"verbose": true,
	"test": null,
	"export": "mnn",
	"onnx_slim": false,
	"quant_bit": 4,
	"quant_block": 64,
	"visual_quant_bit": null,
	"visual_quant_block": null,
	"lm_quant_bit": 4,
	"lm_quant_block": 64,
	"mnnconvert": "../../../build/MNNConvert",
	"ppl": false,
	"awq": false,
	"hqq": false,
	"omni": false,
	"transformer_fuse": false,
	"group_conv_native": false,
	"smooth": false,
	"sym": false,
	"visual_sym": false,
	"seperate_embed": false,
	"lora_split": false,
	"calib_data": null,
	"act_bit": 16,
	"embed_bit": 16,
	"act_sym": false,
	"generate_for_npu": false,
	"skip_weight": false,
	"omni_epochs": 20,
	"omni_lr": 0.005,
	"omni_wd": 0.0001,
	"tie_word_embeddings": false
	}