File size: 3,850 Bytes
d702276
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
{
  "input": "/data/huichiwen/dev/cp/onnx_model/pointpillars.onnx",
  "output_dir": "./output",
  "output_name": "centerpoint.axmodel",
  "model_type": "ONNX",
  "target_hardware": "AX650",
  "npu_mode": "NPU3",

  "input_shapes": "input.1:1x10x30000x20;indices_input:1x30000x2",

  "quant": {
    "input_configs": [
      {
        "tensor_name": "input.1",
        "calibration_dataset": "/data/huichiwen/dev/cp/quant_data/features.tar.gz",
        "calibration_format": "Numpy",
        "calibration_size": 32
      },
      {
        "tensor_name": "indices_input",
        "calibration_dataset": "/data/huichiwen/dev/cp/quant_data/indices.tar.gz",
        "calibration_format": "Numpy",
        "calibration_size": 32
      }
    ],
    "calibration_method": "MinMax",
    "enable_smooth_quant": false,
    "smooth_quant_strength": 0.5,
    "layer_configs": [
      {
        "layer_names": [
          "pfe_/pfn_layers.0/linear/MatMul",
          "pfe_/pfn_layers.0/norm/BatchNormalization",
          "pfe_/pfn_layers.0/Relu",
          "pfe_/pfn_layers.0/ReduceMax",
          "pfe_/pfn_layers.1/linear/MatMul",
          "pfe_/pfn_layers.1/norm/BatchNormalization",
          "pfe_/pfn_layers.1/Relu",
          "pfe_/pfn_layers.1/ReduceMax",
          "ScatterND_1"
        ],
        "data_type": "FP32",
        "output_data_type": "FP32"
      },
      {
        "layer_names": [
          "/neck/blocks.0/blocks.0.1/Conv",
          "/neck/blocks.0/blocks.0.3/Relu",
          "/neck/blocks.0/blocks.0.4/Conv",
          "/neck/blocks.0/blocks.0.6/Relu",
          "/neck/blocks.0/blocks.0.7/Conv",
          "/neck/blocks.0/blocks.0.9/Relu",
          "/neck/blocks.0/blocks.0.10/Conv",
          "/neck/blocks.0/blocks.0.12/Relu",
          "/neck/deblocks.0/deblocks.0.0/Conv",
          "/neck/blocks.1/blocks.1.1/Conv",
          "/neck/deblocks.0/deblocks.0.2/Relu",
          "/neck/blocks.1/blocks.1.3/Relu",
          "/neck/blocks.1/blocks.1.4/Conv",
          "/neck/blocks.1/blocks.1.6/Relu",
          "/neck/blocks.1/blocks.1.7/Conv",
          "/neck/blocks.1/blocks.1.9/Relu",
          "/neck/blocks.1/blocks.1.10/Conv",
          "/neck/blocks.1/blocks.1.12/Relu",
          "/neck/blocks.1/blocks.1.13/Conv",
          "/neck/blocks.1/blocks.1.15/Relu",
          "/neck/blocks.1/blocks.1.16/Conv",
          "/neck/blocks.1/blocks.1.18/Relu",
          "/neck/deblocks.1/deblocks.1.0/Conv",
          "/neck/deblocks.1/deblocks.1.2/Relu",
          "/neck/blocks.2/blocks.2.1/Conv",
          "/neck/blocks.2/blocks.2.3/Relu",
          "/neck/blocks.2/blocks.2.4/Conv",
          "/neck/blocks.2/blocks.2.6/Relu",
          "/neck/blocks.2/blocks.2.7/Conv",
          "/neck/blocks.2/blocks.2.9/Relu",
          "/neck/blocks.2/blocks.2.10/Conv",
          "/neck/blocks.2/blocks.2.12/Relu",
          "/neck/blocks.2/blocks.2.13/Conv",
          "/neck/blocks.2/blocks.2.15/Relu",
          "/neck/blocks.2/blocks.2.16/Conv",
          "/neck/blocks.2/blocks.2.18/Relu"
        ],
        "data_type": "FP32",
        "output_data_type": "FP32"
      },
      {
        "layer_names": [
          "/Exp",
          "/Sigmoid",
          "/Exp_1",
          "/Sigmoid_1",
          "/Exp_2",
          "/Sigmoid_2",
          "/Exp_3",
          "/Sigmoid_3",
          "/Exp_4",
          "/Sigmoid_4",
          "/Exp_5",
          "/Sigmoid_5",
          "/ReduceMax",
          "/ReduceMax_1",
          "/ReduceMax_2",
          "/ReduceMax_3",
          "/ReduceMax_4",
          "/ReduceMax_5"
        ],
        "data_type": "FP32",
        "output_data_type": "FP32"
      }
    ]
  },
  "input_processors": [
    {
      "tensor_name": "input.1",
      "src_dtype": "FP32"
    },
    {
      "tensor_name": "indices_input",
      "src_dtype": "S32"
    }
  ],

  "compiler": {
    "check": 0
  }
}