# File size: 476 Bytes
# Revision: ece074a
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
import numpy as np
def quantize_onnx_model(onnx_model_path, quantized_model_path):
    """Dynamically quantize an ONNX model and write the result to disk.

    Runs onnxruntime's ``quantize_dynamic`` on the model file with the
    weight type set to ``QuantType.QInt8``, then prints the output path.

    Args:
        onnx_model_path: Path of the ONNX model file to quantize.
        quantized_model_path: Path the quantized model is written to.

    Returns:
        None.
    """
    # Imported lazily so onnxruntime is only required when this is called.
    from onnxruntime.quantization import QuantType, quantize_dynamic

    # quantize_dynamic reads the model from the given path itself, so the
    # model is not pre-loaded with onnx here (the loaded copy was unused).
    quantize_dynamic(
        onnx_model_path,
        quantized_model_path,
        weight_type=QuantType.QInt8,
    )

    print(f"quantized model saved to:{quantized_model_path}")



# Script entry: quantize "model.onnx" and write "model_quant.onnx"
# (both paths are relative to the current working directory).
quantize_onnx_model(
    onnx_model_path="model.onnx",
    quantized_model_path="model_quant.onnx",
)