Link to this sectionReference for ultralytics/utils/export/onnx.py#
Improvements
This page is sourced from https://github.com/ultralytics/ultralytics/blob/main/ultralytics/utils/export/onnx.py. Have an improvement or example to add? Open a Pull Request — thank you! 🙏
Summary
Link to this section ultralytics.utils.export.onnx.onnx_calibration_reader#
def onnx_calibration_reader(dataset, transform_fn, input_name: str = "images")Create an ONNX Runtime calibration data reader from an Ultralytics calibration dataloader.
Args
| Name | Type | Description | Default |
|---|---|---|---|
dataset | required | ||
transform_fn | required | ||
input_name | str | "images" |
Source code in ultralytics/utils/export/onnx.py
def onnx_calibration_reader(dataset, transform_fn, input_name: str = "images"):
"""Create an ONNX Runtime calibration data reader from an Ultralytics calibration dataloader."""
from onnxruntime.quantization import CalibrationDataReader
class _CalibrationReader(CalibrationDataReader):
def __init__(self):
"""Materialize calibration inputs as `{input_name: float32_NCHW}` dicts."""
self.samples = [{input_name: transform_fn(batch)} for batch in dataset]
self.iterator = iter(self.samples)
def get_next(self):
"""Return the next calibration sample, or None when exhausted."""
return next(self.iterator, None)
def rewind(self):
"""Reset the iterator for an additional calibration pass."""
self.iterator = iter(self.samples)
return _CalibrationReader()Link to this section ultralytics.utils.export.onnx.onnx_int8_quantize#
def onnx_int8_quantize(
onnx_file,
output_file,
dataset,
transform_fn,
input_name: str = "images",
prefix: str = "",
) -> strQuantize an ONNX model to INT8 using ONNX Runtime static quantization.
Args
| Name | Type | Description | Default |
|---|---|---|---|
onnx_file | required | ||
output_file | required | ||
dataset | required | ||
transform_fn | required | ||
input_name | str | "images" | |
prefix | str | "" |
Source code in ultralytics/utils/export/onnx.py
def onnx_int8_quantize(
onnx_file,
output_file,
dataset,
transform_fn,
input_name: str = "images",
prefix: str = "",
) -> str:
"""Quantize an ONNX model to INT8 using ONNX Runtime static quantization."""
from onnxruntime.quantization import quantize_static
onnx_file, output_file = Path(onnx_file), Path(output_file)
LOGGER.info(f"{prefix} quantizing INT8 with ONNX Runtime...")
quantize_static(str(onnx_file), str(output_file), onnx_calibration_reader(dataset, transform_fn, input_name))
return str(output_file)