{ "quant_cfg": { "*weight_quantizer": { "num_bits": [ 2, 1 ], "block_sizes": { "-1": 16, "type": "dynamic", "scale_bits": [ 4, 3 ] }, "enable": true }, "*input_quantizer": { "enable": false }, "nn.BatchNorm1d": { "*": { "enable": false } }, "nn.BatchNorm2d": { "*": { "enable": false } }, "nn.BatchNorm3d": { "*": { "enable": false } }, "nn.LeakyReLU": { "*": { "enable": false } }, "*lm_head*": { "enable": false }, "*proj_out.*": { "enable": false }, "*block_sparse_moe.gate*": { "enable": false }, "*router*": { "enable": false }, "*mlp.gate.*": { "enable": false }, "*mlp.shared_expert_gate.*": { "enable": false }, "*linear_attn.conv1d*": { "enable": false }, "*mixer.conv1d*": { "enable": false }, "*output_layer*": { "enable": false }, "output.*": { "enable": false }, "default": { "enable": false }, "*norm*": { "enable": false }, "*layernorm*": { "enable": false }, "*LayerNorm*": { "enable": false }, "*rotary*": { "enable": false }, "*bias*": { "enable": false }, "lm_head*": { "enable": false }, "lm_head.weight_quantizer": { "enable": false }, "*visual.blocks.*.mlp.linear_fc1*": { "enable": false }, "*visual.blocks.*.mlp.linear_fc2*": { "enable": false }, "model.visual.blocks.*.mlp.linear_fc1*": { "enable": false }, "model.visual.blocks.*.mlp.linear_fc2*": { "enable": false } }, "algorithm": null }