{
  "input": "../split_4cls/owlv2_text_4cls.onnx",
  "output_dir": "../text-output",
  "output_name": "owlv2_text_4cls_640.axmodel",
  "model_type": "ONNX",
  "target_hardware": "AX650",
  "npu_mode": "NPU3",
  "onnx_opt": {
    "disable_onnx_optimization": false,
    "enable_onnxsim": true
  },
  "quant": {
    "input_configs": [
      {
        "tensor_name": "input_ids",
        "calibration_dataset": "../calib_data/input_ids.tar",
        "calibration_size": -1,
        "calibration_format": "Numpy"
      },
      {
        "tensor_name": "attention_mask",
        "calibration_dataset": "../calib_data/attention_mask.tar",
        "calibration_size": -1,
        "calibration_format": "Numpy"
      }
    ],
    "calibration_method": "MinMax",
    "precision_analysis": false,
    "precision_analysis_method": "EndToEnd",
    "precision_analysis_mode": "Reference",
    "transformer_opt_level": 1,
    "enable_smooth_quant": true,
    "conv_bias_data_type": "FP32",
    "layer_configs": [
      {
        "start_tensor_names": ["DEFAULT"],
        "end_tensor_names": ["DEFAULT"],
        "data_type": "U16"
      },
      {
        "op_types": ["Add"],
        "data_type": "FP32"
      }
    ]
  },
  "compiler": {
    "check": 0
  }
}