File size: 2,771 Bytes
5acb56c
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
{
  "one_external_file": true,
  "opset": null,
  "optimization": {},
  "optimum_version": "1.14.0.dev0",
  "quantization": {
    "activations_dtype": "QUInt8",
    "activations_symmetric": false,
    "format": "QDQ",
    "is_static": true,
    "mode": "QLinearOps",
    "nodes_to_exclude": [
      "/proj_out/MatMul",
      "/model/decoder/0/self_attn/q_proj/MatMul_smooth_mul",
      "/model/decoder/0/self_attn/k_proj/MatMul_smooth_mul",
      "/model/decoder/0/self_attn/v_proj/MatMul_smooth_mul",
      "/model/decoder/0/self_attn/out_proj/MatMul_smooth_mul",
      "/model/decoder/0/encoder_attn/q_proj/MatMul_smooth_mul",
      "/model/decoder/0/encoder_attn/out_proj/MatMul_smooth_mul",
      "/model/decoder/0/fc1/MatMul_smooth_mul",
      "/model/decoder/0/fc2/MatMul_smooth_mul",
      "/model/decoder/1/self_attn/q_proj/MatMul_smooth_mul",
      "/model/decoder/1/self_attn/k_proj/MatMul_smooth_mul",
      "/model/decoder/1/self_attn/v_proj/MatMul_smooth_mul",
      "/model/decoder/1/self_attn/out_proj/MatMul_smooth_mul",
      "/model/decoder/1/encoder_attn/MatMul_smooth_mul",
      "/model/decoder/1/encoder_attn/MatMul_5_smooth_mul",
      "/model/decoder/1/fc1/MatMul_smooth_mul",
      "/model/decoder/1/fc2/MatMul_smooth_mul",
      "/model/decoder/2/self_attn/q_proj/MatMul_smooth_mul",
      "/model/decoder/2/self_attn/k_proj/MatMul_smooth_mul",
      "/model/decoder/2/self_attn/v_proj/MatMul_smooth_mul",
      "/model/decoder/2/self_attn/out_proj/MatMul_smooth_mul",
      "/model/decoder/2/encoder_attn/MatMul_smooth_mul",
      "/model/decoder/2/encoder_attn/MatMul_5_smooth_mul",
      "/model/decoder/2/fc1/MatMul_smooth_mul",
      "/model/decoder/2/fc2/MatMul_smooth_mul",
      "/model/decoder/3/self_attn/q_proj/MatMul_smooth_mul",
      "/model/decoder/3/self_attn/k_proj/MatMul_smooth_mul",
      "/model/decoder/3/self_attn/v_proj/MatMul_smooth_mul",
      "/model/decoder/3/self_attn/out_proj/MatMul_smooth_mul",
      "/model/decoder/3/encoder_attn/MatMul_smooth_mul",
      "/model/decoder/3/encoder_attn/MatMul_5_smooth_mul",
      "/model/decoder/3/fc1/MatMul_smooth_mul",
      "/model/decoder/3/fc2/MatMul_smooth_mul",
      "/proj_out/MatMul_smooth_mul"
    ],
    "nodes_to_quantize": [],
    "operators_to_quantize": [
      "MatMul"
    ],
    "per_channel": false,
    "qdq_add_pair_to_weight": false,
    "qdq_dedicated_pair": false,
    "qdq_op_type_per_channel_support_to_axis": {
      "MatMul": 1
    },
    "reduce_range": false,
    "smooth_quant": false,
    "smooth_quant_alpha": 0.5,
    "smooth_quant_folding": true,
    "smooth_quant_op_types": [
      "MatMul"
    ],
    "weights_dtype": "QInt8",
    "weights_symmetric": true
  },
  "transformers_version": "4.33.1",
  "use_external_data_format": false
}