{ "one_external_file": true, "opset": null, "optimization": {}, "optimum_version": "1.14.0.dev0", "quantization": { "activations_dtype": "QUInt8", "activations_symmetric": false, "format": "QDQ", "is_static": true, "mode": "QLinearOps", "nodes_to_exclude": [ "/proj_out/MatMul", "/model/decoder/0/self_attn/q_proj/MatMul_smooth_mul", "/model/decoder/0/self_attn/k_proj/MatMul_smooth_mul", "/model/decoder/0/self_attn/v_proj/MatMul_smooth_mul", "/model/decoder/0/self_attn/out_proj/MatMul_smooth_mul", "/model/decoder/0/encoder_attn/q_proj/MatMul_smooth_mul", "/model/decoder/0/encoder_attn/out_proj/MatMul_smooth_mul", "/model/decoder/0/fc1/MatMul_smooth_mul", "/model/decoder/0/fc2/MatMul_smooth_mul", "/model/decoder/1/self_attn/q_proj/MatMul_smooth_mul", "/model/decoder/1/self_attn/k_proj/MatMul_smooth_mul", "/model/decoder/1/self_attn/v_proj/MatMul_smooth_mul", "/model/decoder/1/self_attn/out_proj/MatMul_smooth_mul", "/model/decoder/1/encoder_attn/MatMul_smooth_mul", "/model/decoder/1/encoder_attn/MatMul_5_smooth_mul", "/model/decoder/1/fc1/MatMul_smooth_mul", "/model/decoder/1/fc2/MatMul_smooth_mul", "/model/decoder/2/self_attn/q_proj/MatMul_smooth_mul", "/model/decoder/2/self_attn/k_proj/MatMul_smooth_mul", "/model/decoder/2/self_attn/v_proj/MatMul_smooth_mul", "/model/decoder/2/self_attn/out_proj/MatMul_smooth_mul", "/model/decoder/2/encoder_attn/MatMul_smooth_mul", "/model/decoder/2/encoder_attn/MatMul_5_smooth_mul", "/model/decoder/2/fc1/MatMul_smooth_mul", "/model/decoder/2/fc2/MatMul_smooth_mul", "/model/decoder/3/self_attn/q_proj/MatMul_smooth_mul", "/model/decoder/3/self_attn/k_proj/MatMul_smooth_mul", "/model/decoder/3/self_attn/v_proj/MatMul_smooth_mul", "/model/decoder/3/self_attn/out_proj/MatMul_smooth_mul", "/model/decoder/3/encoder_attn/MatMul_smooth_mul", "/model/decoder/3/encoder_attn/MatMul_5_smooth_mul", "/model/decoder/3/fc1/MatMul_smooth_mul", "/model/decoder/3/fc2/MatMul_smooth_mul", "/proj_out/MatMul_smooth_mul" ], "nodes_to_quantize": [], "operators_to_quantize": [ "MatMul" ], "per_channel": false, "qdq_add_pair_to_weight": false, "qdq_dedicated_pair": false, "qdq_op_type_per_channel_support_to_axis": { "MatMul": 1 }, "reduce_range": false, "smooth_quant": false, "smooth_quant_alpha": 0.5, "smooth_quant_folding": true, "smooth_quant_op_types": [ "MatMul" ], "weights_dtype": "QInt8", "weights_symmetric": true }, "transformers_version": "4.33.1", "use_external_data_format": false }