Skip to content

Commit c09e10e

Browse files
committed
Fix pitch restriction check and remove commented-out code
1 parent 8a4cab2 commit c09e10e

File tree

1 file changed

+2
-3
lines changed

1 file changed

+2
-3
lines changed

third_party/intel/lib/TritonIntelGPUTransforms/MaterializeBlockPointer.cpp

Lines changed: 2 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -71,9 +71,7 @@ struct TritonIntelGPUMaterializeBlockPointerPass
       }
       ArrayRef<int32_t> order = makeTensorPtrOp.getOrder();
 
-      // unsigned fastChangeDim = order[0];
       if (fastChangeDim >= (rank - 2)) {
-
         // HW 2D block read instruction only supports contiguous access.
         Value fastChangeStride = strides[fastChangeDim];
         LLVM_DEBUG({
@@ -89,7 +87,8 @@ struct TritonIntelGPUMaterializeBlockPointerPass
         Value pitch =
             strides[(fastChangeDim == rank - 1) ? rank - 2 : rank - 1];
         LDBG("Pitch: " << pitch);
-        if (!ttgi::isDivisible(pitch, 64 / tensorType.getElementTypeBitWidth()))
+        if (!ttgi::isDivisible(pitch,
+                               128 / tensorType.getElementTypeBitWidth()))
           return;
 
         loadOp->setAttr(ttgi::TritonIntelGPUDialect::getBlockIOAttrName(),

0 commit comments

Comments
 (0)