# NOTE(review): nesting below was reconstructed from a flattened, pipe-wrapped
# copy of this config; keys, values and order are unchanged. Please confirm that
# `dataset`/`save` belong under `spec`, that `verified_model_types`/`verified_tags`
# belong under `metadata`, and that `default_mxfp4_e2m1` is a top-level key.
apiversion: modelslim_v1
spec:
  process:
    - type: flex_smooth_quant
      proxy_quant_dtype: mxfp4
      proxy_quant_axes: -1
      enable_subgraph_type:
        - up-down
      include:
        - '*'
      exclude:
        - model.layers.50*
        - model.layers.1.*
        - model.layers.2.*
        - model.layers.3.*
        - model.layers.0.*
        - '*mlp.shared_experts*'
    - type: linear_quant
      qconfig:
        act:
          scope: per_block
          dtype: mxfp4
          symmetric: true
          method: minmax
        weight:
          scope: per_block
          dtype: mxfp4
          symmetric: true
          method: minmax
      include:
        - '*'
      exclude:
        - model.layers.1.*
        - model.layers.2.*
        - model.layers.3.*
        - model.layers.0.*
        - '*attn*'
        - '*mlp.shared_experts*'
        - '*mlp.gate'
        - model.layers.50*
  dataset: mix_calib.jsonl
  save:
    - type: ascendv1_saver
      part_file_size: 4
metadata:
  config_id: openpangu_mxfp4_e2m1
  score: 50.0
  label:
    w_bit: 4
    a_bit: 4
    is_sparse: false
    kv_cache: false
  verified_model_types: []
  verified_tags: {}
default_mxfp4_e2m1:
  act:
    scope: per_block
    dtype: mxfp4
    symmetric: true
    method: minmax
  weight:
    scope: per_block
    dtype: mxfp4
    symmetric: true
    method: minmax