Support int8 quantization in decoder

2025-09-19 05:54:20 +00:00 · 2023-06-29 12:15:06 +08:00 · 2023-06-29 12:15:06 +08:00 · 3544665ace
commit 3544665ace
parent 9c2172c1c4
2 changed files with 2 additions and 2 deletions
--- a/egs/librispeech/ASR/zipformer/export-onnx-streaming.py
+++ b/egs/librispeech/ASR/zipformer/export-onnx-streaming.py
@@ -757,7 +757,7 @@ def main():
    quantize_dynamic(
        model_input=decoder_filename,
        model_output=decoder_filename_int8,
-        op_types_to_quantize=["MatMul"],
+        op_types_to_quantize=["MatMul", "Gather"],
        weight_type=QuantType.QInt8,
    )

--- a/egs/librispeech/ASR/zipformer/export-onnx.py
+++ b/egs/librispeech/ASR/zipformer/export-onnx.py
@@ -602,7 +602,7 @@ def main():
    quantize_dynamic(
        model_input=decoder_filename,
        model_output=decoder_filename_int8,
-        op_types_to_quantize=["MatMul"],
+        op_types_to_quantize=["MatMul", "Gather"],
        weight_type=QuantType.QInt8,
    )