We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 6625cd3, commit 2dd1b62 (Copy full SHA for 2dd1b62)
src/compressed_tensors/quantization/utils/helpers.py
@@ -165,7 +165,7 @@ def compute_dynamic_scales_and_zp(
 
     keep_dims = True
     if args.strategy == QuantizationStrategy.TOKEN:
-        dim = {1, 2}
+        dim = {0, 1}
         reduce_dims = tuple(idx for idx in range(value.ndim) if idx not in dim)
     elif args.strategy == QuantizationStrategy.TENSOR:
         reduce_dims = None
0 commit comments