| { |
| "one_external_file": true, |
| "opset": null, |
| "optimization": {}, |
| "optimum_version": "1.14.0.dev0", |
| "quantization": { |
| "activations_dtype": "QUInt8", |
| "activations_symmetric": false, |
| "format": "QDQ", |
| "is_static": true, |
| "mode": "QLinearOps", |
| "nodes_to_exclude": [ |
| "/proj_out/MatMul", |
| "/model/decoder/0/self_attn/q_proj/MatMul_smooth_mul", |
| "/model/decoder/0/self_attn/k_proj/MatMul_smooth_mul", |
| "/model/decoder/0/self_attn/v_proj/MatMul_smooth_mul", |
| "/model/decoder/0/self_attn/out_proj/MatMul_smooth_mul", |
| "/model/decoder/0/encoder_attn/q_proj/MatMul_smooth_mul", |
| "/model/decoder/0/encoder_attn/out_proj/MatMul_smooth_mul", |
| "/model/decoder/0/fc1/MatMul_smooth_mul", |
| "/model/decoder/0/fc2/MatMul_smooth_mul", |
| "/model/decoder/1/self_attn/q_proj/MatMul_smooth_mul", |
| "/model/decoder/1/self_attn/k_proj/MatMul_smooth_mul", |
| "/model/decoder/1/self_attn/v_proj/MatMul_smooth_mul", |
| "/model/decoder/1/self_attn/out_proj/MatMul_smooth_mul", |
| "/model/decoder/1/encoder_attn/MatMul_smooth_mul", |
| "/model/decoder/1/encoder_attn/MatMul_5_smooth_mul", |
| "/model/decoder/1/fc1/MatMul_smooth_mul", |
| "/model/decoder/1/fc2/MatMul_smooth_mul", |
| "/model/decoder/2/self_attn/q_proj/MatMul_smooth_mul", |
| "/model/decoder/2/self_attn/k_proj/MatMul_smooth_mul", |
| "/model/decoder/2/self_attn/v_proj/MatMul_smooth_mul", |
| "/model/decoder/2/self_attn/out_proj/MatMul_smooth_mul", |
| "/model/decoder/2/encoder_attn/MatMul_smooth_mul", |
| "/model/decoder/2/encoder_attn/MatMul_5_smooth_mul", |
| "/model/decoder/2/fc1/MatMul_smooth_mul", |
| "/model/decoder/2/fc2/MatMul_smooth_mul", |
| "/model/decoder/3/self_attn/q_proj/MatMul_smooth_mul", |
| "/model/decoder/3/self_attn/k_proj/MatMul_smooth_mul", |
| "/model/decoder/3/self_attn/v_proj/MatMul_smooth_mul", |
| "/model/decoder/3/self_attn/out_proj/MatMul_smooth_mul", |
| "/model/decoder/3/encoder_attn/MatMul_smooth_mul", |
| "/model/decoder/3/encoder_attn/MatMul_5_smooth_mul", |
| "/model/decoder/3/fc1/MatMul_smooth_mul", |
| "/model/decoder/3/fc2/MatMul_smooth_mul", |
| "/proj_out/MatMul_smooth_mul" |
| ], |
| "nodes_to_quantize": [], |
| "operators_to_quantize": [ |
| "MatMul" |
| ], |
| "per_channel": false, |
| "qdq_add_pair_to_weight": false, |
| "qdq_dedicated_pair": false, |
| "qdq_op_type_per_channel_support_to_axis": { |
| "MatMul": 1 |
| }, |
| "reduce_range": false, |
| "smooth_quant": false, |
| "smooth_quant_alpha": 0.5, |
| "smooth_quant_folding": true, |
| "smooth_quant_op_types": [ |
| "MatMul" |
| ], |
| "weights_dtype": "QInt8", |
| "weights_symmetric": true |
| }, |
| "transformers_version": "4.33.1", |
| "use_external_data_format": false |
| } |
|
|