{
  "model_type": "ONNX",
  "npu_mode": "NPU3",
  "quant": {
    "input_configs": [
      {
        "tensor_name": "DEFAULT",
        "calibration_dataset": "./onnx-calibration-no-controlnet/transformer.tar",
        "calibration_size": -1,
        "calibration_format": "NumpyObject"
      }
    ],
    "calibration_method": "MinMax",
    "precision_analysis": true,
    "precision_analysis_method": "PerLayer",
    "enable_smooth_quant": true,
    "conv_bias_data_type": "FP32",
    "layer_configs": [
      {
        "start_tensor_names": [
          "DEFAULT"
        ],
        "end_tensor_names": [
          "DEFAULT"
        ],
        "data_type": "U16"
      }
    ]
  },
  "input_processors": [
    {
      "tensor_name": "DEFAULT"
    }
  ],
  "compiler": {
    "check": 0
  }
}