We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent c69c8bb · commit 957a1d1 · Copy full SHA for 957a1d1
src/compressed_tensors/quantization/lifecycle/forward.py
@@ -124,8 +124,13 @@ def dequantize(
124
strategy=QuantizationStrategy.GROUP, group_size=group_size
125
)
126
else:
127
+ rows, cols = x_q.shape[-2], x_q.shape[-1]
128
+ block_height = rows // scale.shape[0] # Rows per block
129
+ block_width = cols // scale.shape[1] # Columns per block
130
+
131
args = QuantizationArgs(
- strategy=QuantizationStrategy.BLOCK, block_structure=scale.shape
132
+ strategy=QuantizationStrategy.BLOCK,
133
+ block_structure=[block_height, block_width],
134
135
136
raise ValueError(
0 commit comments