@@ -37,7 +37,7 @@ bool isSwizzled(SharedEncodingAttr layout) { return layout.getMaxPhase() != 1; }
3737SmallVector<Value> swizzleIndices (ConversionPatternRewriter &rewriter,
3838 Location loc, SmallVector<Value> rawIndices,
3939 SharedEncodingAttr layout) {
40- auto b = TritonLLVMOpBuilder (loc, rewriter);
40+ auto b = TritonLLVMOpBuilder (loc, & rewriter);
4141 const auto &order = layout.getOrder ();
4242 auto rank = order.size ();
4343
@@ -81,7 +81,7 @@ void storeValuesInLinearVector(PatternRewriter &rewriter, Location loc,
8181 unsigned kIdx , unsigned nonKIdx, unsigned bIdx,
8282 const DimIdx &dim, int vecDim,
8383 ArrayRef<unsigned > opOrder) {
84- auto b = TritonLLVMOpBuilder (loc, rewriter);
84+ auto b = TritonLLVMOpBuilder (loc, & rewriter);
8585 auto vecTy = cast<VectorType>(vec.getType ());
8686 auto vectorSize = vecTy.getNumElements ();
8787 auto elemTy = vecTy.getElementType ();
@@ -118,7 +118,7 @@ Value getUnswizzledFirstElemOffset(ConversionPatternRewriter &rewriter,
118118 Location loc, unsigned B, unsigned NonK,
119119 Value bTileOffset, Value nonKTileOffset,
120120 Value bStride, Value nonKStride) {
121- auto b = TritonLLVMOpBuilder (loc, rewriter);
121+ auto b = TritonLLVMOpBuilder (loc, & rewriter);
122122 auto bOffset = b.mul (b.urem (bTileOffset, b.i32_val (B)), bStride);
123123 auto nonKOffset = b.mul (b.urem (nonKTileOffset, b.i32_val (NonK)), nonKStride);
124124 Value threadIdDependantOffset = b.add (bOffset, nonKOffset);
@@ -157,7 +157,7 @@ Value computeSwizzledOffset(ConversionPatternRewriter &rewriter, Location loc,
157157 SharedEncodingAttr sharedLayout,
158158 ArrayRef<int64_t > opTensorShape,
159159 ArrayRef<Value> strides) {
160- auto b = TritonLLVMOpBuilder (loc, rewriter);
160+ auto b = TritonLLVMOpBuilder (loc, & rewriter);
161161 Value offset = b.i32_val (0 );
162162 // Compute unswizzled multi dim coordinates in shared memory object
163163 SmallVector<Value> elemMultiDimIndices (3 );
@@ -190,7 +190,7 @@ Value computeNonSwizzledOffset(ConversionPatternRewriter &rewriter,
190190 unsigned shapePerCTABTile,
191191 unsigned shapePerCTANonKTile,
192192 ArrayRef<Value> strides) {
193- auto b = TritonLLVMOpBuilder (loc, rewriter);
193+ auto b = TritonLLVMOpBuilder (loc, & rewriter);
194194 SmallVector<Value> offsetIndices (3 );
195195 offsetIndices[dim.batch ] =
196196 b.i32_val ((i.bTile * shapePerCTABTile + i.b ) % tensorShape[dim.batch ]);
@@ -219,7 +219,7 @@ Value loadFMAOp(Value srcVal, Value llVal, BlockedEncodingAttr dLayout,
219219 Value thread, Location loc,
220220 const LLVMTypeConverter *typeConverter,
221221 ConversionPatternRewriter &rewriter, const int dotOpNo) {
222- auto tb = TritonLLVMOpBuilder (loc, rewriter);
222+ auto tb = TritonLLVMOpBuilder (loc, & rewriter);
223223 if (!verifyCTALayout (dLayout.getCTALayout ()))
224224 return Value ();
225225
0 commit comments