Commit b0cd290

canonicalize aten.convolution

1 parent 244f4b6 commit b0cd290

5 files changed: +153 -1 lines changed


include/torch-mlir/Dialect/Torch/IR/GeneratedTorchOps.td

Lines changed: 1 addition & 0 deletions
@@ -7119,6 +7119,7 @@ def Torch_AtenConvolutionOp : Torch_Op<"aten.convolution", [
       printDefaultTorchOp(printer, *this, 9, 1);
     }
   }];
+  let hasCanonicalizer = 1;
 }
 
 def Torch_Aten_ConvolutionOp : Torch_Op<"aten._convolution", [
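
(In MLIR ODS, setting hasCanonicalizer = 1 declares a getCanonicalizationPatterns hook on the generated op class; the TorchOps.cpp change below supplies its definition and registers the new pattern.)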

lib/Dialect/Torch/IR/TorchOps.cpp

Lines changed: 117 additions & 0 deletions
@@ -6,6 +6,7 @@
 // Also available under a BSD-style license. See LICENSE.
 //
 //===----------------------------------------------------------------------===//
+#include "llvm/ADT/SmallVector.h"
 #define DEBUG_TYPE "torch-mlir-torch-dialect"
 #include "torch-mlir/Dialect/Torch/IR/TorchOps.h"
 #include "torch-mlir/Dialect/Torch/Utils/Utils.h"
@@ -4721,6 +4722,122 @@ OpFoldResult Aten_ShapeAsTensorOp::fold(FoldAdaptor adaptor) {
   return DenseElementsAttr::get(attrty, attrs);
 }
 
+namespace {
+class CanonicalizeConvolutionWithSingleIntTuple
+    : public OpRewritePattern<AtenConvolutionOp> {
+public:
+  using OpRewritePattern<AtenConvolutionOp>::OpRewritePattern;
+
+  LogicalResult matchAndRewrite(AtenConvolutionOp op,
+                                PatternRewriter &rewriter) const override {
+
+    auto weight = op.getWeight();
+    auto weightType = dyn_cast<ValueTensorType>(weight.getType());
+
+    if (!weightType) {
+      return rewriter.notifyMatchFailure(op, "weight is not a vtensor");
+    }
+    auto optionalSizes = weightType.getOptionalSizes();
+    if (!optionalSizes.has_value()) {
+      return rewriter.notifyMatchFailure(op,
+                                         "unranked weight tensor unsupported!");
+    }
+
+    // The rank is the size of the dimensions array.
+    int64_t weightRank = optionalSizes.value().size();
+
+    // We canonicalize rank 4 (2D conv) or rank 5 (3D conv).
+    if (weightRank < 4 || weightRank > 5) {
+      return rewriter.notifyMatchFailure(
+          op, "unsupported weight rank (must be 4 or 5)");
+    }
+    int64_t requiredSpatialDims = weightRank - 2;
+
+    // Validate stride, padding, output_padding, and dilation are constant
+    // lists.
+    SmallVector<int64_t> strideInts;
+    if (!matchPattern(op.getStride(), m_TorchListOfConstantInts(strideInts))) {
+      return rewriter.notifyMatchFailure(op,
+                                         "non-const int stride unsupported!");
+    }
+    SmallVector<int64_t> paddingInts;
+    if (!matchPattern(op.getPadding(),
+                      m_TorchListOfConstantInts(paddingInts))) {
+      return rewriter.notifyMatchFailure(op,
+                                         "non-const int padding unsupported!");
+    }
+    SmallVector<int64_t> outputPaddingInts;
+    if (!matchPattern(op.getOutputPadding(),
+                      m_TorchListOfConstantInts(outputPaddingInts))) {
+      return rewriter.notifyMatchFailure(
+          op, "non-const int output_padding unsupported!");
+    }
+    SmallVector<int64_t> dilationInts;
+    if (!matchPattern(op.getDilation(),
+                      m_TorchListOfConstantInts(dilationInts))) {
+      return rewriter.notifyMatchFailure(op,
+                                         "non-const int dilation unsupported!");
+    }
+
+    // Canonicalization logic: only rewrite if the padding provided is 1
+    // element but the convolution requires 2 or 3 elements.
+    if (strideInts.size() == static_cast<size_t>(requiredSpatialDims)) {
+      return rewriter.notifyMatchFailure(op,
+                                         "stride is already fully specified");
+    }
+    if (paddingInts.size() == static_cast<size_t>(requiredSpatialDims)) {
+      return rewriter.notifyMatchFailure(op,
+                                         "padding is already fully specified");
+    }
+    if (outputPaddingInts.size() == static_cast<size_t>(requiredSpatialDims)) {
+      return rewriter.notifyMatchFailure(
+          op, "output_padding is already fully specified");
+    }
+    if (dilationInts.size() == static_cast<size_t>(requiredSpatialDims)) {
+      return rewriter.notifyMatchFailure(op,
+                                         "dilation is already fully specified");
+    }
+
+    // Construct the new padding list.
+    // If the user provided padding=[1] and we need 2 or 3 dims, we create
+    // padding=[1, 1] or padding=[1, 1, 1].
+    int64_t padVal = paddingInts[0];
+    Location loc = op.getLoc();
+
+    SmallVector<Value> newPaddingValues;
+    Value paddingConst = ConstantIntOp::create(
+        rewriter, loc, rewriter.getI64IntegerAttr(padVal));
+
+    for (int i = 0; i < requiredSpatialDims; ++i) {
+      newPaddingValues.push_back(paddingConst);
+    }
+
+    // Create the list construct op.
+    auto newListOp = PrimListConstructOp::create(
+        rewriter, loc,
+        Torch::ListType::get(rewriter.getType<Torch::IntType>()),
+        newPaddingValues);
+
+    // Replace the op: create a new convolution op, keeping all operands the
+    // same except padding.
+    rewriter.replaceOpWithNewOp<AtenConvolutionOp>(
+        op, op.getType(), op.getInput(), op.getWeight(), op.getBias(),
+        op.getStride(), newListOp.getResult(), op.getDilation(),
+        op.getTransposed(), op.getOutputPadding(), op.getGroups());
+
+    return success();
+  }
+};
+} // namespace
+
+//===----------------------------------------------------------------------===//
+// AtenConvolutionOp Registration
+//===----------------------------------------------------------------------===//
+void AtenConvolutionOp::getCanonicalizationPatterns(RewritePatternSet &results,
+                                                    MLIRContext *context) {
+  results.add<CanonicalizeConvolutionWithSingleIntTuple>(context);
+}
+
 //===----------------------------------------------------------------------===//
 // AtenIntTensorOp
 //===----------------------------------------------------------------------===//
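
For intuition, the rewrite relies on aten.convolution treating a single-element parameter list as shorthand that is broadcast across all spatial dimensions. A minimal eager-mode sketch of that equivalence for the 2D case (not part of the commit; names are illustrative):

import torch

inp = torch.rand(3, 3, 10, 10)
weight = torch.rand(3, 3, 2, 2)

# Single-element padding list, as in the new test module below.
single = torch.ops.aten.convolution(
    inp, weight, None, [4], [1], [1], False, [0, 0], 1
)
# Fully specified padding list, as the canonicalizer produces.
full = torch.ops.aten.convolution(
    inp, weight, None, [4], [1, 1], [1], False, [0, 0], 1
)
assert torch.equal(single, full)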

projects/pt1/e2e_testing/xfail_sets.py

Lines changed: 2 additions & 0 deletions
@@ -1131,6 +1131,7 @@
     "Conv2dWithPaddingDilationStrideStaticModule_grouped",
     "Conv2dWithPaddingDilationStrideStaticModule_grouped_multiplier",
     "Convolution2DStaticModule_basic",
+    "Convolution2DSingleIntTuplePaddingModule_basic",
     "ConvolutionBackwardModule2DStatic_basic",
     "ConvolutionModule2DTransposeStridedStatic_basic",
     "Conv_Transpose1dStaticModule_basic",
@@ -2166,6 +2167,7 @@
     "Conv2dWithValidPaddingModule_basic",
     "Conv2dWithSamePaddingModule_basic",
     "Convolution2DStaticModule_basic",
+    "Convolution2DSingleIntTuplePaddingModule_basic",
     "CosineSimilarityStaticModule_basic",
     "DetachModule_basic",
     "DropoutEvalFloatModule_basic",

projects/pt1/python/torch_mlir/jit_ir_importer/build_tools/torch_ods_gen.py

Lines changed: 2 additions & 1 deletion
@@ -612,7 +612,8 @@ def emit_with_mutating_variants(key, **kwargs):
         "aten::conv_tbc_backward : (Tensor, Tensor, Tensor, Tensor, int) -> (Tensor, Tensor, Tensor)"
     )
     emit(
-        "aten::convolution : (Tensor, Tensor, Tensor?, int[], int[], int[], bool, int[], int) -> (Tensor)"
+        "aten::convolution : (Tensor, Tensor, Tensor?, int[], int[], int[], bool, int[], int) -> (Tensor)",
+        has_canonicalizer=True,
    )
    emit(
        "aten::_convolution : (Tensor, Tensor, Tensor?, int[], int[], int[], bool, int[], int, bool, bool, bool, bool) -> (Tensor)"

projects/pt1/python/torch_mlir_e2e_test/test_suite/conv.py

Lines changed: 31 additions & 0 deletions
@@ -304,6 +304,37 @@ def Convolution2DStaticModule_basic(module, tu: TestUtils):
     module.forward(tu.rand(3, 3, 10, 10), tu.rand(3, 3, 2, 2))
 
 
+class Convolution2DSingleIntTuplePaddingModule(torch.nn.Module):
+    def __init__(self):
+        super().__init__()
+
+    @export
+    @annotate_args(
+        [
+            None,
+            ([3, 3, 10, 10], torch.float32, True),
+            ([3, 3, 2, 2], torch.float32, True),
+        ]
+    )
+    def forward(self, inputVec, weight):
+        return torch.ops.aten.convolution(
+            inputVec,
+            weight,
+            bias=None,
+            stride=(4,),
+            padding=(0,),
+            dilation=(1,),
+            transposed=False,
+            output_padding=[0, 0],
+            groups=1,
+        )
+
+
+@register_test_case(module_factory=lambda: Convolution2DSingleIntTuplePaddingModule())
+def Convolution2DSingleIntTuplePaddingModule_basic(module, tu: TestUtils):
+    module.forward(tu.rand(3, 3, 10, 10), tu.rand(3, 3, 2, 2))
+
+
 class Convolution2DStridedModule(torch.nn.Module):
     def __init__(self):
         super().__init__()
