diff --git a/extension/llm/export/quantizer_lib.py b/extension/llm/export/quantizer_lib.py index 99499e34bb2..b94feb5a1ae 100644 --- a/extension/llm/export/quantizer_lib.py +++ b/extension/llm/export/quantizer_lib.py @@ -192,7 +192,7 @@ def get_qnn_quantizer( act_observer=MinMaxObserver, ) elif quant_config == "16a4w": - quant_dtype = QuantDtype.use_16a16w # pyre-fixme[16] + quant_dtype = QuantDtype.use_16a4w # pyre-fixme[16] qnn_quantizer.set_default_quant_config( quant_dtype, is_qat=is_qat,