@@ -1,6 +1,6 @@
 // RUN: iree-opt --pass-pipeline="builtin.module(util.func(iree-dispatch-creation-form-dispatch-regions{fuse-pad-with-consumers}))" --split-input-file %s | FileCheck %s
 
-util.func public @fuse_with_consumer(%arg0 : tensor<?x?x?x?xf32>, %arg1 : index,
+util.func public @fuse_with_consumer_named_op(%arg0 : tensor<?x?x?x?xf32>, %arg1 : index,
     %arg2 : index, %arg3 : index, %arg4 : index,
     %arg5 : tensor<?x?x?x?xf32>, %arg6 : tensor<?x?x?x?xf32>) -> tensor<?x?x?x?xf32> {
   %cst = arith.constant 42.0 : f32
@@ -12,7 +12,7 @@ util.func public @fuse_with_consumer(%arg0 : tensor<?x?x?x?xf32>, %arg1 : index,
       outs(%arg6 : tensor<?x?x?x?xf32>) -> tensor<?x?x?x?xf32>
   util.return %1 : tensor<?x?x?x?xf32>
 }
-// CHECK-LABEL: util.func public @fuse_with_consumer
+// CHECK-LABEL: util.func public @fuse_with_consumer_named_op
 // CHECK-SAME: %[[ARG0:[a-zA-Z0-9]+]]: tensor<?x?x?x?xf32>
 // CHECK-SAME: %[[ARG5:[a-zA-Z0-9]+]]: tensor<?x?x?x?xf32>
 // CHECK-SAME: %[[ARG6:[a-zA-Z0-9]+]]: tensor<?x?x?x?xf32>
@@ -23,3 +23,30 @@ util.func public @fuse_with_consumer(%arg0 : tensor<?x?x?x?xf32>, %arg1 : index,
 // CHECK-SAME: outs(%[[ARG6]] :
 // CHECK: flow.return %[[CONV]]
 // CHECK: util.return %[[RETURN]]
+
+// -----
+
+util.func public @fuse_with_consumer_generalized(%arg0: tensor<?x?x?x?xf32>, %arg1: index, %arg2: index, %arg3: index, %arg4: index, %arg5: tensor<?x?x?x?xf32>, %arg6: tensor<?x?x?x?xf32>) -> tensor<?x?x?x?xf32> {
+  %cst = arith.constant 4.200000e+01 : f32
+  %padded = tensor.pad %arg0 low[0, 0, 0, 0] high[%arg1, %arg2, %arg3, %arg4] {
+  ^bb0(%arg7: index, %arg8: index, %arg9: index, %arg10: index):
+    tensor.yield %cst : f32
+  } : tensor<?x?x?x?xf32> to tensor<?x?x?x?xf32>
+  %0 = linalg.generic {indexing_maps = [affine_map<(d0, d1, d2, d3, d4, d5, d6) -> (d0, d1 + d4, d2 + d5, d6)>, affine_map<(d0, d1, d2, d3, d4, d5, d6) -> (d4, d5, d6, d3)>, affine_map<(d0, d1, d2, d3, d4, d5, d6) -> (d0, d1, d2, d3)>], iterator_types = ["parallel", "parallel", "parallel", "parallel", "reduction", "reduction", "reduction"]} ins(%padded, %arg5 : tensor<?x?x?x?xf32>, tensor<?x?x?x?xf32>) outs(%arg6 : tensor<?x?x?x?xf32>) {
+  ^bb0(%in: f32, %in_0: f32, %out: f32):
+    %1 = arith.mulf %in, %in_0 : f32
+    %2 = arith.addf %out, %1 : f32
+    linalg.yield %2 : f32 } -> tensor<?x?x?x?xf32>
+  util.return %0 : tensor<?x?x?x?xf32>
+}
+// CHECK-LABEL: util.func public @fuse_with_consumer_generalized
+// CHECK-SAME: %[[ARG0:[a-zA-Z0-9]+]]: tensor<?x?x?x?xf32>
+// CHECK-SAME: %[[ARG5:[a-zA-Z0-9]+]]: tensor<?x?x?x?xf32>
+// CHECK-SAME: %[[ARG6:[a-zA-Z0-9]+]]: tensor<?x?x?x?xf32>
+// CHECK: %[[RETURN:.+]] = flow.dispatch.region
+// CHECK: %[[PADDED:.+]] = tensor.pad %[[ARG0]]
+// CHECK: %[[CONV:.+]] = linalg.generic
+// CHECK-SAME: ins(%[[PADDED]], %[[ARG5]] :
+// CHECK-SAME: outs(%[[ARG6]] :
+// CHECK: flow.return %[[CONV]]
+// CHECK: util.return %[[RETURN]]