We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 6e5e320 commit ec7aa63 — Copy full SHA for ec7aa63
onnxruntime/python/tools/quantization/matmul_4bits_quantizer.py
@@ -280,7 +280,7 @@ def __init__(
280
281
super().__init__(
282
algorithm="nvidia_awq",
283
- quant_format=quant_format,
+ quant_format=QuantFormat.QDQ,
284
op_types_to_quantize=None, # Assuming op_types_to_quantize is handled elsewhere
285
quant_axes=None, # Assuming quant_axes is handled elsewhere
286
)
0 commit comments