We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent b77b1e6 commit 42575fd · Copy full SHA for 42575fd
src/compressed_tensors/quantization/quant_scheme.py
@@ -111,7 +111,7 @@ def is_preset_scheme(name: str) -> bool:
111
weights=QuantizationArgs(), input_activations=QuantizationArgs(symmetric=True)
112
)
113
114
-W4A16 = dict(weights=QuantizationArgs(num_bits=4, symmetric=True))
+W4A16 = dict(weights=QuantizationArgs(num_bits=4, group_size=128))
115
116
PRESET_SCHEMES = {
117
"W8A8": W8A8,
0 commit comments