@@ -153,7 +153,7 @@ void transform_dialect::VectorToWarpExecuteOnLane0Op::build(
153153// SCCP.
154154static LogicalResult
155155replaceAllUsesOfLaneWithin (RewriterBase &b,
156- vector ::WarpExecuteOnLane0Op executeOp) {
156+ gpu ::WarpExecuteOnLane0Op executeOp) {
157157 OpBuilder::InsertionGuard g (b);
158158 b.setInsertionPoint (executeOp);
159159 Value zero = b.create <arith::ConstantIndexOp>(executeOp.getLoc (), 0 );
@@ -225,7 +225,7 @@ static FailureOr<gpu::ThreadIdOp> isThreadIdxxZeroPredicate(scf::IfOp ifOp) {
225225}
226226
// Result wrapper holding a single warp-execute-on-lane-0 op handle (`warpOp`).
// It is used as the payload of a FailureOr<> return type by the function
// declared right after this struct.
// This diff changes the member type from vector::WarpExecuteOnLane0Op to
// gpu::WarpExecuteOnLane0Op; the member name is unchanged.
227227struct VectorDistributionResult {
228- vector ::WarpExecuteOnLane0Op warpOp;
228+ gpu ::WarpExecuteOnLane0Op warpOp;
229229};
230230
231231static FailureOr<VectorDistributionResult>
@@ -257,7 +257,7 @@ rewriteScfIfAsWarpExecuteOnLane0(RewriterBase &rewriter, Location loc,
257257 rewriter.create <scf::IfOp>(loc, predicate, /* withElseRegion=*/ false );
258258 rewriter.setInsertionPointToStart (&newIfOp.getThenRegion ().front ());
259259 }
260- auto warpOp = rewriter.create <vector ::WarpExecuteOnLane0Op>(
260+ auto warpOp = rewriter.create <gpu ::WarpExecuteOnLane0Op>(
261261 loc, TypeRange (), threadIdxx, warpSize);
262262
263263 // Move the code from the previous ifOp to the
@@ -270,7 +270,7 @@ rewriteScfIfAsWarpExecuteOnLane0(RewriterBase &rewriter, Location loc,
270270 sourceBlock.without_terminator ().begin (),
271271 sourceBlock.without_terminator ().end ());
272272 rewriter.setInsertionPointToEnd (&targetBlock);
273- rewriter.create <vector ::YieldOp>(loc);
273+ rewriter.create <gpu ::YieldOp>(loc);
274274
275275 // Erase old op.
276276 rewriter.eraseOp (ifOp);
@@ -358,7 +358,7 @@ void transform_dialect::VectorWarpDistributionOp::getEffects(
358358// / Emit shared local memory allocation in case it is needed when lowering the
359359// / warp operations.
360360static Value allocateGlobalSharedMemory (Location loc, OpBuilder &builder,
361- vector ::WarpExecuteOnLane0Op warpOp,
361+ gpu ::WarpExecuteOnLane0Op warpOp,
362362 Type type) {
363363 MemRefType memrefType;
364364 auto addressSpaceAttr = gpu::AddressSpaceAttr::get (
@@ -374,11 +374,11 @@ static Value allocateGlobalSharedMemory(Location loc, OpBuilder &builder,
374374 return builder.create <memref::AllocOp>(loc, memrefType);
375375}
376376
377- // / Return a value yielded by `warpOp` which statifies the filter lamdba
377+ // / Return a value yielded by `warpOp` which satisfies the filter lambda
378378// / condition and is not dead.
379- static OpOperand *getWarpResult (vector ::WarpExecuteOnLane0Op warpOp,
379+ static OpOperand *getWarpResult (gpu ::WarpExecuteOnLane0Op warpOp,
380380 function_ref<bool (Operation *)> fn) {
381- auto yield = cast<vector ::YieldOp>(
381+ auto yield = cast<gpu ::YieldOp>(
382382 warpOp.getBodyRegion ().getBlocks ().begin ()->getTerminator ());
383383 for (OpOperand &yieldOperand : yield->getOpOperands ()) {
384384 Value yieldValues = yieldOperand.get ();
@@ -426,9 +426,9 @@ class InsertElementToBroadcast final
426426// / }
427427// / gpu.synchronize
428428// / %0 = memref.load %src[%c0] : memref<1024xf32>
429- struct WarpOpLoad : public OpRewritePattern <vector ::WarpExecuteOnLane0Op> {
430- using OpRewritePattern<vector ::WarpExecuteOnLane0Op>::OpRewritePattern;
431- LogicalResult matchAndRewrite (vector ::WarpExecuteOnLane0Op warpOp,
429+ struct WarpOpLoad : public OpRewritePattern <gpu ::WarpExecuteOnLane0Op> {
430+ using OpRewritePattern<gpu ::WarpExecuteOnLane0Op>::OpRewritePattern;
431+ LogicalResult matchAndRewrite (gpu ::WarpExecuteOnLane0Op warpOp,
432432 PatternRewriter &rewriter) const override {
433433 OpOperand *operand = getWarpResult (warpOp, llvm::IsaPred<memref::LoadOp>);
434434 if (!operand)
@@ -476,7 +476,7 @@ struct HoistSharedMemoryAlloc : public OpRewritePattern<memref::AllocOp> {
476476 PatternRewriter &rewriter) const override {
477477 if (!iree_compiler::hasSharedMemoryAddressSpace (alloc.getType ()))
478478 return failure ();
479- auto warpParent = alloc->getParentOfType <vector ::WarpExecuteOnLane0Op>();
479+ auto warpParent = alloc->getParentOfType <gpu ::WarpExecuteOnLane0Op>();
480480 if (!warpParent)
481481 return failure ();
482482 alloc->moveBefore (warpParent);
@@ -561,7 +561,7 @@ static void populatePropagateVectorDistribution(Operation *target,
561561}
562562
// Synchronization callback: creates a gpu::BarrierOp at `loc` through
// `builder`. The `warpOp` argument is not used in the body.
// This diff only changes the type of `warpOp` from
// vector::WarpExecuteOnLane0Op to gpu::WarpExecuteOnLane0Op.
// NOTE(review): presumably the parameter exists to match a callback signature
// expected by the warp distribution patterns -- confirm against the caller.
563563static void warpSyncronizationFn (Location loc, OpBuilder &builder,
564- vector ::WarpExecuteOnLane0Op warpOp) {
564+ gpu ::WarpExecuteOnLane0Op warpOp) {
565565 builder.create <gpu::BarrierOp>(loc);
566566};
567567
0 commit comments