@@ -110,7 +110,7 @@ std::tuple<Value, Value, Value> emitHardwareTuple(Location loc,
110110 Value warpId = udiv (threadId, threadsPerWarp);
111111 Value blockId =
112112 withCTAOffset ? target.getClusterCTAId (rewriter, loc) : i32_val (0 );
113- return {blockId , warpId, laneId };
113+ return {laneId , warpId, blockId };
114114}
115115
116116SmallVector<SmallVector<Value>>
@@ -130,7 +130,7 @@ emitIndices(Location loc, RewriterBase &rewriter, const TargetInfoBase &target,
130130 StringAttr kWarp = str_attr (" warp" );
131131 StringAttr kBlock = str_attr (" block" );
132132
133- auto [blockId , warpId, laneId ] = emitHardwareTuple (
133+ auto [laneId , warpId, blockId ] = emitHardwareTuple (
134134 loc, rewriter, target, withCTAOffset, ll->getInDimSize (kLane ));
135135 unsigned rank = shape.size ();
136136 SmallVector<SmallVector<Value>> ret;
@@ -353,7 +353,7 @@ bool emitTransferBetweenRegistersAndShared(
353353 std::min (regToSharedLayout->getNumConsecutiveInOut (),
354354 maxVecElems.value_or (std::numeric_limits<int >::max ()));
355355
356- auto [blockId , warpId, laneId ] =
356+ auto [laneId , warpId, blockId ] =
357357 emitHardwareTuple (loc, rewriter, target, /* withCTAOffset=*/ false ,
358358 regToSharedLayout->getInDimSize (kLane ));
359359
@@ -746,7 +746,7 @@ SmallVector<Value> getMultiDimOffset(Attribute layout, Location loc,
746746 auto instrShape = mmaLayout.getInstrShape ();
747747 SmallVector<Value> mmaColIdx (2 );
748748 SmallVector<Value> mmaRowIdx (2 );
749- auto [blockId , warpId, laneId ] = emitHardwareTuple (
749+ auto [laneId , warpId, blockId ] = emitHardwareTuple (
750750 loc, rewriter, targetInfo, /* withCTAOffset=*/ false , 32 );
751751 // TODO: fix the bug in MMAEncodingAttr document
752752 SmallVector<Value> multiDimWarpId (2 );
0 commit comments