Spaces:
Sleeping
Sleeping
| import numpy as np | |
| def quantize_onnx_model(onnx_model_path, quantized_model_path): | |
| from onnxruntime.quantization.quantize import quantize_dynamic, QuantType | |
| import onnx | |
| onnx_opt_model = onnx.load(onnx_model_path) | |
| quantize_dynamic(onnx_model_path, | |
| quantized_model_path, | |
| weight_type=QuantType.QInt8) | |
| print(f"quantized model saved to:{quantized_model_path}") | |
| quantize_onnx_model("model.onnx", "model_quant.onnx") | |