{
"one_external_file": true,
"opset": null,
"optimization": {},
"optimum_version": "1.14.0.dev0",
"quantization": {
"activations_dtype": "QUInt8",
"activations_symmetric": false,
"format": "QDQ",
"is_static": true,
"mode": "QLinearOps",
"nodes_to_exclude": [
"/proj_out/MatMul",
"/model/decoder/0/self_attn/q_proj/MatMul_smooth_mul",
"/model/decoder/0/self_attn/k_proj/MatMul_smooth_mul",
"/model/decoder/0/self_attn/v_proj/MatMul_smooth_mul",
"/model/decoder/0/self_attn/out_proj/MatMul_smooth_mul",
"/model/decoder/0/encoder_attn/q_proj/MatMul_smooth_mul",
"/model/decoder/0/encoder_attn/out_proj/MatMul_smooth_mul",
"/model/decoder/0/fc1/MatMul_smooth_mul",
"/model/decoder/0/fc2/MatMul_smooth_mul",
"/model/decoder/1/self_attn/q_proj/MatMul_smooth_mul",
"/model/decoder/1/self_attn/k_proj/MatMul_smooth_mul",
"/model/decoder/1/self_attn/v_proj/MatMul_smooth_mul",
"/model/decoder/1/self_attn/out_proj/MatMul_smooth_mul",
"/model/decoder/1/encoder_attn/MatMul_smooth_mul",
"/model/decoder/1/encoder_attn/MatMul_5_smooth_mul",
"/model/decoder/1/fc1/MatMul_smooth_mul",
"/model/decoder/1/fc2/MatMul_smooth_mul",
"/model/decoder/2/self_attn/q_proj/MatMul_smooth_mul",
"/model/decoder/2/self_attn/k_proj/MatMul_smooth_mul",
"/model/decoder/2/self_attn/v_proj/MatMul_smooth_mul",
"/model/decoder/2/self_attn/out_proj/MatMul_smooth_mul",
"/model/decoder/2/encoder_attn/MatMul_smooth_mul",
"/model/decoder/2/encoder_attn/MatMul_5_smooth_mul",
"/model/decoder/2/fc1/MatMul_smooth_mul",
"/model/decoder/2/fc2/MatMul_smooth_mul",
"/model/decoder/3/self_attn/q_proj/MatMul_smooth_mul",
"/model/decoder/3/self_attn/k_proj/MatMul_smooth_mul",
"/model/decoder/3/self_attn/v_proj/MatMul_smooth_mul",
"/model/decoder/3/self_attn/out_proj/MatMul_smooth_mul",
"/model/decoder/3/encoder_attn/MatMul_smooth_mul",
"/model/decoder/3/encoder_attn/MatMul_5_smooth_mul",
"/model/decoder/3/fc1/MatMul_smooth_mul",
"/model/decoder/3/fc2/MatMul_smooth_mul",
"/proj_out/MatMul_smooth_mul"
],
"nodes_to_quantize": [],
"operators_to_quantize": [
"MatMul"
],
"per_channel": false,
"qdq_add_pair_to_weight": false,
"qdq_dedicated_pair": false,
"qdq_op_type_per_channel_support_to_axis": {
"MatMul": 1
},
"reduce_range": false,
"smooth_quant": false,
"smooth_quant_alpha": 0.5,
"smooth_quant_folding": true,
"smooth_quant_op_types": [
"MatMul"
],
"weights_dtype": "QInt8",
"weights_symmetric": true
},
"transformers_version": "4.33.1",
"use_external_data_format": false
}