---
# Quantization recipe `openpangu_mxfp4_e2m1` (schema: modelslim_v1).
#
# Two processing steps are declared under `spec.process`, followed by the
# calibration dataset and the saver settings. Both steps select modules with
# `include` / `exclude` pattern lists (presumably glob patterns matched
# against module names -- confirm against the consuming tool).
apiversion: modelslim_v1

spec:
  process:
    # Step 1: flex_smooth_quant using an mxfp4 proxy quantizer.
    - type: flex_smooth_quant
      proxy_quant_dtype: mxfp4
      proxy_quant_axes: -1
      enable_subgraph_type:
        - up-down
      include:
        - '*'
      exclude:
        # NOTE(review): unlike the entries below, this pattern has no `.`
        # before the `*`, so under glob semantics it would match any name
        # that merely starts with `model.layers.50` -- confirm intended.
        - model.layers.50*
        - model.layers.1.*
        - model.layers.2.*
        - model.layers.3.*
        - model.layers.0.*
        - '*mlp.shared_experts*'

    # Step 2: linear_quant with identical settings for activations and
    # weights (per_block, mxfp4, symmetric, minmax).
    - type: linear_quant
      qconfig:
        act:
          scope: per_block
          dtype: mxfp4
          symmetric: true
          method: minmax
        weight:
          scope: per_block
          dtype: mxfp4
          symmetric: true
          method: minmax
      include:
        - '*'
      # Same exclusions as step 1, plus `*attn*` and `*mlp.gate`.
      exclude:
        - model.layers.1.*
        - model.layers.2.*
        - model.layers.3.*
        - model.layers.0.*
        - '*attn*'
        - '*mlp.shared_experts*'
        - '*mlp.gate'
        - model.layers.50*

  dataset: mix_calib.jsonl

  save:
    - type: ascendv1_saver
      part_file_size: 4

metadata:
  config_id: openpangu_mxfp4_e2m1
  score: 50.0
  label:
    w_bit: 4
    a_bit: 4
    is_sparse: false
    kv_cache: false
  # Explicit empty collections (not null).
  verified_model_types: []
  verified_tags: {}

# NOTE(review): this mapping is value-for-value identical to
# `spec.process[1].qconfig` above. It presumably served as a shared
# anchor/default before the file was serialized; keep the two copies in sync
# if either is edited -- confirm whether the consumer reads this key at all.
default_mxfp4_e2m1:
  act:
    scope: per_block
    dtype: mxfp4
    symmetric: true
    method: minmax
  weight:
    scope: per_block
    dtype: mxfp4
    symmetric: true
    method: minmax