{
  "quant_cfg": {
    "*weight_quantizer": {
      "num_bits": [
        2,
        1
      ],
      "block_sizes": {
        "-1": 16,
        "type": "dynamic",
        "scale_bits": [
          4,
          3
        ]
      },
      "enable": true
    },
    "*input_quantizer": {
      "enable": false
    },
    "nn.BatchNorm1d": {
      "*": {
        "enable": false
      }
    },
    "nn.BatchNorm2d": {
      "*": {
        "enable": false
      }
    },
    "nn.BatchNorm3d": {
      "*": {
        "enable": false
      }
    },
    "nn.LeakyReLU": {
      "*": {
        "enable": false
      }
    },
    "*lm_head*": {
      "enable": false
    },
    "*proj_out.*": {
      "enable": false
    },
    "*block_sparse_moe.gate*": {
      "enable": false
    },
    "*router*": {
      "enable": false
    },
    "*mlp.gate.*": {
      "enable": false
    },
    "*mlp.shared_expert_gate.*": {
      "enable": false
    },
    "*linear_attn.conv1d*": {
      "enable": false
    },
    "*mixer.conv1d*": {
      "enable": false
    },
    "*output_layer*": {
      "enable": false
    },
    "output.*": {
      "enable": false
    },
    "default": {
      "enable": false
    },
    "*embed_tokens*": {
      "enable": false
    },
    "*norm*": {
      "enable": false
    },
    "*layernorm*": {
      "enable": false
    },
    "*LayerNorm*": {
      "enable": false
    },
    "*rotary*": {
      "enable": false
    },
    "*pos_embed*": {
      "enable": false
    },
    "*patch_embed*": {
      "enable": false
    },
    "*bias*": {
      "enable": false
    },
    "*final_layer2*": {
      "enable": false
    },
    "*t_embedder1*": {
      "enable": false
    },
    "*x_embedder*": {
      "enable": false
    },
    "*visual*": {
      "enable": false
    },
    "*visual.*": {
      "enable": false
    },
    "model.visual*": {
      "enable": false
    },
    "model.visual.*": {
      "enable": false
    },
    "*model.visual*": {
      "enable": false
    },
    "*model.visual.*": {
      "enable": false
    },
    "*visual*weight_quantizer": {
      "enable": false
    },
    "*visual*input_quantizer": {
      "enable": false
    },
    "model.visual*weight_quantizer": {
      "enable": false
    },
    "model.visual*input_quantizer": {
      "enable": false
    },
    "*visual.blocks*": {
      "enable": false
    },
    "*visual.blocks.*": {
      "enable": false
    },
    "*visual.blocks.*.attn.qkv*": {
      "enable": false
    }
  },
  "algorithm": null
}