Skip to content

Commit c2fef8e

Browse files
authored
Some gpu tweaks (#160)
1 parent 40bf982 commit c2fef8e

File tree

1 file changed

+3
-2
lines changed

1 file changed

+3
-2
lines changed

numba_dpcomp/numba_dpcomp/mlir_compiler/lib/pipelines/lower_to_gpu.cpp

Lines changed: 3 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -3007,7 +3007,8 @@ class GpuLaunchSinkOpsPass
3007 3007 |   if (op->walk([](gpu::LaunchOp launch) {
3008 3008 |   auto isSinkingBeneficiary = [](mlir::Operation *op) -> bool {
3009 3009 |   return isa<arith::ConstantOp, ConstantOp, arith::SelectOp,
3010      | - arith::CmpIOp>(op);
     3010 | + arith::CmpIOp, arith::IndexCastOp, arith::MulIOp,
     3011 | + arith::SubIOp, arith::AddIOp>(op);
3011 3012 |   };
3012 3013 |
3013 3014 |   // Pull in instructions that can be sunk
@@ -3123,7 +3124,7 @@ static void populateLowerToGPUPipelineLow(mlir::OpPassManager &pm) {
3123 3124 |   commonOptPasses(funcPM);
3124 3125 |   funcPM.addPass(std::make_unique<KernelMemrefOpsMovementPass>());
3125 3126 |   funcPM.addPass(std::make_unique<GpuLaunchSinkOpsPass>());
3126      | - funcPM.addPass(std::make_unique<SinkGpuDimsPass>());
     3127 | + // funcPM.addPass(std::make_unique<SinkGpuDimsPass>());
3127 3128 |   pm.addPass(mlir::createGpuKernelOutliningPass());
3128 3129 |   pm.addPass(mlir::createSymbolDCEPass());
3129 3130 |
0 commit comments

Comments
 (0)