This repository has been archived on 2025-08-26. You can view files and clone it, but cannot push or open issues or pull requests.
Files
enginex-mr_series-sherpa-onnx/scripts/peng-cheng-starling/quantize_models.py
2025-02-10 18:23:40 +08:00

23 lines
553 B
Python
Executable File

#!/usr/bin/env python3
from onnxruntime.quantization import QuantType, quantize_dynamic
from pathlib import Path
def main():
    """Write int8 dynamically-quantized copies of the encoder and joiner models.

    For each component, the model ``./<component>-<tag>.onnx`` (relative to the
    current working directory) is passed to ``quantize_dynamic`` and the result
    is written to ``./<component>-<tag>.int8.onnx``. Quantization is restricted
    to ``MatMul`` operators and uses ``QuantType.QInt8`` weights.

    A component whose ``.int8.onnx`` file already exists is skipped, so the
    script can be re-run without redoing finished work.
    """
    checkpoint_tag = "epoch-75-avg-11-chunk-16-left-128"

    for component in ("encoder", "joiner"):
        stem = f"{component}-{checkpoint_tag}"

        # Only quantize when the int8 output is not already on disk.
        if not Path(f"{stem}.int8.onnx").is_file():
            quantize_dynamic(
                model_input=f"./{stem}.onnx",
                model_output=f"./{stem}.int8.onnx",
                op_types_to_quantize=["MatMul"],
                weight_type=QuantType.QInt8,
            )
# Run the quantization only when this file is executed as a script,
# not when it is imported as a module.
if __name__ == "__main__":
    main()