File tree Expand file tree Collapse file tree 1 file changed +3
-2
lines changed
csrc/nv_internal/tensorrt_llm/kernels Expand file tree Collapse file tree 1 file changed +3
-2
lines changed Original file line number Diff line number Diff line change @@ -766,8 +766,9 @@ quantize_with_block_size(
766
766
bool isSfSwizzledLayout = layout == QuantizationSFLayout::SWIZZLED_128x4 ||
767
767
layout == QuantizationSFLayout::SWIZZLED_8x4;
768
768
769
- // The number of padded rows considering 128x4 SF layout.
770
- int numPaddedRowsForSf = isSfSwizzledLayout ? PadUpFn (numRows, 128 ) : numRows;
769
+ // The number of padded rows considering 128x4 or 8x4 SF layout.
770
+ int rowTile = (layout == QuantizationSFLayout::SWIZZLED_128x4) ? 128 : 8 ;
771
+ int numPaddedRowsForSf = isSfSwizzledLayout ? PadUpFn (numRows, rowTile) : numRows;
771
772
int numColsForSf = isSfSwizzledLayout ? PadUpFn (numPaddedCols, 4 * SF_VEC_SIZE) : numPaddedCols;
772
773
773
774
// The number of threads in the column dimension.
You can’t perform that action at this time.
0 commit comments