{
  "model_type": "ONNX",
  "npu_mode": "NPU3",
  "quant": {
    "input_configs": [
      {
        "tensor_name": "speech",
        "calibration_dataset": "./calibration_dataset/speech.tar.gz",
        "calibration_size": -1,
        "calibration_format": "Numpy"
      },
      {
        "tensor_name": "speech_lengths",
        "calibration_dataset": "./calibration_dataset/speech_lengths.tar.gz",
        "calibration_size": -1,
        "calibration_format": "Numpy"
      }
    ],
    "layer_configs": [
      {
        "start_tensor_names": ["DEFAULT"],
        "end_tensor_names": ["DEFAULT"],
        "data_type": "U16"
      }
    ],
    "calibration_method": "MinMax",
    "conv_bias_data_type": "FP32",
    "disable_auto_refine_scale": true,
    "enable_smooth_quant": true,
    "precision_analysis": true,
    "precision_analysis_method": "EndToEnd",
    "transformer_opt_level": 1
  },
  "input_processors": [
    {
      "tensor_name": "speech",
      "src_dtype": "FP32"
    },
    {
      "tensor_name": "speech_lengths",
      "src_dtype": "S32"
    }
  ],
  "compiler": {
    "check": 0
  }
}