Spaces:
Sleeping
Sleeping
File size: 476 Bytes
ece074a | 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 | import numpy as np
def quantize_onnx_model(onnx_model_path, quantized_model_path):
    """Dynamically quantize an ONNX model file using signed 8-bit weights.

    Args:
        onnx_model_path: Path of the ONNX model file to quantize.
        quantized_model_path: Path the quantized model is written to.

    Returns:
        None. The result is written to ``quantized_model_path`` and a
        confirmation line is printed to stdout.
    """
    from onnxruntime.quantization.quantize import quantize_dynamic, QuantType

    # quantize_dynamic is given the input path directly, so the model is not
    # pre-loaded here; a separate onnx.load() result would go unused and only
    # cost time and memory.
    quantize_dynamic(
        onnx_model_path,
        quantized_model_path,
        weight_type=QuantType.QInt8,
    )
    print(f"quantized model saved to:{quantized_model_path}")
# Script entry: quantize "model.onnx" and write the result to "model_quant.onnx".
quantize_onnx_model(
    onnx_model_path="model.onnx",
    quantized_model_path="model_quant.onnx",
)
|