We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
2 parents d00675c + b2df366 commit 9e2b530Copy full SHA for 9e2b530
src/compressed_tensors/quantization/lifecycle/forward.py
@@ -124,8 +124,13 @@ def dequantize(
124
strategy=QuantizationStrategy.GROUP, group_size=group_size
125
)
126
else:
127
+ rows, cols = x_q.shape[-2], x_q.shape[-1]
128
+ block_height = rows // scale.shape[0] # Rows per block
129
+ block_width = cols // scale.shape[1] # Columns per block
130
+
131
args = QuantizationArgs(
- strategy=QuantizationStrategy.BLOCK, block_structure=scale.shape
132
+ strategy=QuantizationStrategy.BLOCK,
133
+ block_structure=[block_height, block_width],
134
135
136
raise ValueError(
0 commit comments