From a175b6f59ac7f0a727ed5253670ab8efbae2f3df Mon Sep 17 00:00:00 2001
From: Devang Patel <47577486+devang-ml@users.noreply.github.com>
Date: Fri, 21 Feb 2025 11:40:09 -0800
Subject: [PATCH] Use OnnxDynamicQuantization for dynamic quantization

---
 olive/cli/auto_opt.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/olive/cli/auto_opt.py b/olive/cli/auto_opt.py
index 3d75469b0..5303da1b7 100644
--- a/olive/cli/auto_opt.py
+++ b/olive/cli/auto_opt.py
@@ -443,7 +443,7 @@ def _get_passes_config(self, config: Dict[str, Any], olive_config: OlivePackageC
             ("qnn_preprocess", {"type": "QNNPreprocess"}),
             ("mixed_precision_overrides", {"type": "MixedPrecisionOverrides", "overrides_config": None}),
             # quantization passes
-            ("dynamic_quant", {"type": "OnnxQuantization", "weight_type": "QInt8"}),
+            ("dynamic_quant", {"type": "OnnxDynamicQuantization", "weight_type": "QInt8"}),
             ("matmul4", {"type": "OnnxMatMul4Quantizer"}),
             ("bnb4", {"type": "OnnxBnb4Quantization", "quant_type": "nf4"}),
             # post processing passes