64 changes: 47 additions & 17 deletions mlir/lib/Dialect/Linalg/Transforms/Vectorization.cpp
@@ -52,6 +52,12 @@ using namespace mlir::linalg;
#define DBGS() (llvm::dbgs() << '[' << DEBUG_TYPE << "] ")
#define LDBG(X) LLVM_DEBUG(DBGS() << X << "\n")

// Forward declaration of Conv1DGenerator and its validator
namespace {
struct Conv1DGenerator;
bool validateConv1DGenerator(RewriterBase &rewriter, LinalgOp linalgOp);
} // namespace

/// Try to vectorize `convOp` as a convolution.
static FailureOr<Operation *>
vectorizeConvolution(RewriterBase &rewriter, LinalgOp convOp,
@@ -1990,8 +1996,21 @@ static LogicalResult vectorizeLinalgOpPrecondition(
// TODO: isaConvolutionOpInterface that can also infer from generic
// features. But we will still need stride/dilation attributes that will be
// annoying to reverse-engineer...
if (isa<ConvolutionOpInterface>(linalgOp.getOperation()))
if (isa<ConvolutionOpInterface>(linalgOp.getOperation())) {
// Create a dummy rewriter first, a rewriter is not required for
// validation
IRRewriter dummyBuilder(linalgOp.getContext());
// Check if we can successfully construct a 1d convolution generator.
// For example, if it is 2d+ convolution, return failure because we don't
// support it. To use this pass on a 2d+ convolution, it should have already
// been decomposed to 1d convolution via
// DecomposeConvolutionToLowerDimOpsPass.
Contributor:

I couldn't find such a pass in-tree.

Member Author (@jerryyin), Mar 7, 2025:

Apologies, this is an IREE implementation detail and the referenced pass is also from IREE. I shouldn't reference such a pass upstream. Will remove.

I am proposing to re-use the high-level logic that's already available.

Let me use this thread to discuss it. This diff code block is the high-level pre-condition check around the linalg op. Please let me know if you are referring to a different location.

> From what I can tell, it would be totally fine to check the dims of conv ops very early on.

Could you elaborate? Are you referring to explicitly invoking inferConvolutionDims()? Then, to make sure this is a regular 2d convolution, I'd check for a combination of:

  • outputImage.size() == 2
  • batch.size() == 1
  • outputChannel.size() == 1

Reject if all of those are satisfied. I have no problem implementing this, but just want to make sure we are on the same page; a minimal sketch of such a check is below.
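For concreteness, a minimal sketch of that check (hypothetical placement inside the precondition hook, assuming inferConvolutionDims() is invoked directly on the op):

// Sketch only: reject regular 2d convolutions early.
FailureOr<linalg::ConvolutionDimensions> dims =
    linalg::inferConvolutionDims(linalgOp);
if (failed(dims))
  return failure();
// Two output-image dims plus single batch and output-channel dims
// characterize a regular 2d convolution.
if (dims->outputImage.size() == 2 && dims->batch.size() == 1 &&
    dims->outputChannel.size() == 1)
  return failure();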


Taking a step back, I don't have a lot of context about the history of the vectorization code around convolution. Since this PR does not intend a massive rewrite, I'm attempting to stay coherent with the existing code as much as possible.

One thing I've noticed, and @hanhanW rightly pointed out, is that we can fail to build a Conv1DGenerator and still allow a function (like vectorizeConvolution(), which constructs and uses the Conv1DGenerator) to invoke its member vectorization functions, which I find quite confusing. (If I were to implement this from scratch, I'd probably use singleton + initialize instead of the current approach (constructor + valid member variable). That way, a developer is required to invoke the initialize method and check the validity of the class before invoking anything on it.)

With this context, I find the most defensive approach is the one used in this PR right now:

  • With future implementations to be added and more flavors of convolution supported, it is very likely that the precondition check for vectorizing convolutions will grow out of sync (and this PR is a perfect example)
  • Now, instead of maintaining a separate function that does a subset of the constructor logic, why not re-use it and ensure we do the validity check? This looks reasonable, as the constructor is (if not cheaper, at least) no more expensive than having to infer the convolution dimensions.

With the above reasoning added up, it just looks to me like a better solution compared with inferring the convolution dimensions and rejecting a few corner cases (which can easily grow out of sync later).

Contributor:

> Let me use this thread to discuss it. This diff code block is the high-level pre-condition check around the linalg op. Please let me know if you are referring to a different location.

Similarly to Diego, I am suggesting to move the high level logic to vectorizeOpPrecondition. Also, like other "pre-condition" hooks, it should not require a rewriter.

> Could you elaborate? Are you referring to explicitly invoking inferConvolutionDims()? Then, to make sure this is a regular 2d convolution, I'd check for a combination of:

>   • outputImage.size() == 2
>   • batch.size() == 1
>   • outputChannel.size() == 1

> Reject if all of those are satisfied. I have no problem implementing this, but just want to make sure we are on the same page.

In my naivety, I was hoping that checking e.g. the rank of the filter or the input would be sufficient. But clearly not: the input for a non-channeled conv would be 1D, but for a channeled one it would be 2D. So on and so forth. IMO, you can just create something like this:

if (!isa<conv_type1, conv_type2, ...>(conv))
   return failure();

This will be a bit verbose, but there are just too many convs and whatever we try will be ... verbose 🤷🏻

> Taking a step back, I don't have a lot of context about the history of the vectorization code around convolution. Since this PR does not intend a massive rewrite, I'm attempting to stay coherent with the existing code as much as possible.

+1 to being coherent, thanks!

I was actually going to ask - do you have any plans regarding this code beyond this PR?

> One thing I've noticed, and @hanhanW rightly pointed out, is that we can fail to build a Conv1DGenerator and still allow a function (like vectorizeConvolution(), which constructs and uses the Conv1DGenerator) to invoke its member vectorization functions, which I find quite confusing. (If I were to implement this from scratch, I'd probably use singleton + initialize instead of the current approach (constructor + valid member variable). That way, a developer is required to invoke the initialize method and check the validity of the class before invoking anything on it.)

You should be able to simply add:

assert(isValid() && "Conv1DGenerator failed");

From what I can tell, that wouldn't break any tests and would make "validity" a strong prerequisite.
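For illustration, that guard would sit at the top of each vectorization entry point, e.g. (hypothetical placement):

// Sketch only: make "validity" a hard prerequisite of every entry point.
FailureOr<Operation *> generateNonChanneledConv() {
  assert(isValid() && "Conv1DGenerator failed");
  // ... existing vectorization logic ...
}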

> With this context, I find the most defensive approach is the one used in this PR right now:

>   • With future implementations to be added and more flavors of convolution supported, it is very likely that the precondition check for vectorizing convolutions will grow out of sync (and this PR is a perfect example)

There have been no new implementations in over 2 years. From what I can tell, we can safely assume that this will remain the case for the foreseeable future. So, I wouldn't worry about this.

>   • Now, instead of maintaining a separate function that does a subset of the constructor logic, why not re-use it and ensure we do the validity check? This looks reasonable, as the constructor is (if not cheaper, at least) no more expensive than having to infer the convolution dimensions.

That sounds good in theory, but in practice it means that we need an IR rewriter for the validation. "Validation"/"pre-conditioning" should not require a rewriter.

> With the above reasoning added up, it just looks to me like a better solution compared with inferring the convolution dimensions and rejecting a few corner cases (which can easily grow out of sync later).

How about my suggestion with isa?

Member Author (@jerryyin), Mar 10, 2025:

I really appreciate your thorough review comments, which give me a ton of useful information.

> I was actually going to ask - do you have any plans regarding this code beyond this PR?

Thanks for asking! I don't have any further plans... This was only meant to unblock myself from an unrelated crash that was failing downstream tests.

> That sounds good in theory, but in practice it means that we need an IR rewriter for the validation. "Validation"/"pre-conditioning" should not require a rewriter.

Agreed; I don't like having a redundant dummy rewriter just for the validation either. In fact, I took a second look at all the places where a Conv1DGenerator member function is invoked and found that all of them have access to a rewriter. The need for the rewriter really only comes from the base class StructuredGenerator constructor. I was also surprised to find that StructuredGenerator doesn't use the rewriter, yet unnecessarily stores it as state on the class. A slightly more aggressive fix would be to remove the field from the base class and pass the rewriter in on a case-by-case basis; then we'd have a clean way to construct the generator without requiring a rewriter. Sounds like a rabbit hole that I'd rather avoid in this PR :-p

> How about my suggestion with isa?

I'll adopt this; it is a cheap enough check that seems reasonable for a pre-condition. Although I'll refrain from being "complete" in this check, because in reality the linalg.conv_2d_* and linalg.conv_3d_* ops form a really long list once combined with the quantized, grouped, and non-channeled variants. I'm going to leave those other variants out and check only for the simple conv2d and conv3d cases; a sketch is below.
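For example, something along these lines (sketch only; the exact op list is to be decided):

// Sketch only: bail out early on the plain named 2d/3d convolutions;
// quantized, grouped, and non-channeled variants are deliberately left out.
if (isa<linalg::Conv2DOp, linalg::Conv2DNhwcHwcfOp, linalg::Conv2DNchwFchwOp,
        linalg::Conv3DOp, linalg::Conv3DNdhwcDhwcfOp>(linalgOp.getOperation()))
  return failure();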

Contributor:

> Similarly to Diego, I am suggesting to move the high level logic to vectorizeOpPrecondition. Also, like other "pre-condition" hooks, it should not require a rewriter.

I thought that it was moved to vectorizeOpPrecondition in this PR? The check is in vectorizeLinalgOpPrecondition, and the former calls this function. Do you suggest creating a different function like vectorizeConvPrecondition and using it in vectorizeOpPrecondition? That is okay with me, because convolution really takes a different path.

RE the verification issue: I totally agree that the verification should not depend on an IR rewriter. From what I can tell, we do not need it at all. The class needs it for StructuredGenerator, but we don't need it in the verification at all.

// Determine whether `linalgOp` can be generated with this generator
if (linalgOp.getNumDpsInputs() != 2 || linalgOp.getNumDpsInits() != 1)
  return;
lhsShaped = linalgOp.getDpsInputOperand(0)->get();
rhsShaped = linalgOp.getDpsInputOperand(1)->get();
resShaped = linalgOp.getDpsInitOperand(0)->get();
lhsShapedType = dyn_cast<ShapedType>(lhsShaped.getType());
rhsShapedType = dyn_cast<ShapedType>(rhsShaped.getType());
resShapedType = dyn_cast<ShapedType>(resShaped.getType());
if (!lhsShapedType || !rhsShapedType || !resShapedType)
  return;
// (LHS has dimension NCW/NWC and RES has dimension NFW/NCW/NWF/NWC) OR
// (non-channeled convolution -> LHS and RHS both have single dimensions).
if ((lhsShapedType.getRank() != 3 || resShapedType.getRank() != 3) &&
    (lhsShapedType.getRank() != 1 || resShapedType.getRank() != 1))
  return;
Operation *reduceOp = matchLinalgReduction(linalgOp.getDpsInitOperand(0));
if (!reduceOp)
  return;
redOp = reduceOp->getName().getIdentifier();
if (!setOperKind(reduceOp))
  return;
auto maybeKind = getCombinerOpKind(reduceOp);
// Typically convolution will have a `Add` CombiningKind but for i1 type it
// can get strength reduced to `OR` which is also supported. This strength
// reduction logic is in `buildBinaryFn` helper in the Linalg dialect.
if (!maybeKind || ((*maybeKind != vector::CombiningKind::ADD &&
                    *maybeKind != vector::CombiningKind::OR) &&
                   (oper != Pool || !isSupportedPoolKind(*maybeKind)))) {
  return;
}
reductionKind = maybeKind.value();
auto rhsRank = rhsShapedType.getRank();
switch (oper) {
case Conv:
  if (rhsRank != 1 && rhsRank != 2 && rhsRank != 3)
    return;
  break;
case Pool:
  if (rhsRank != 1)
    return;
  break;
}
// The op is now known to be valid.
valid = true;

The valid variable is only used in assertions in a few methods, e.g., depthwiseConv and conv. I think it was mainly created as a sanity check, and the new code did not take it into account; thus we crashed in the other place.

The code is quite old, and the precondition was added later than the conv code. I think that to structure it better, we can refactor the generator, because everything starts from the generator. How about we have a static class method which returns true when the given operation is supported? That is, we move the above logic check to a static method (e.g., vectorizePrecondition) without initializing any variables.

In the constructor, I'd suggest doing as little as possible, and we move the assertion out of the constructor; in this context, it is moved to an initializer method. This is because I'd prefer to avoid a crash in the constructor, and we can expose the failure handling to external users. (I don't know what the style is in LLVM, but it is quite common in environments where exceptions are disallowed. See https://abseil.io/tips/42 for more details.)

Thus, it can be something like

struct Conv1DGenerator : public StructuredGenerator<LinalgOp, utils::IteratorType> {
  // The constructor only takes the rewriter and the linalg op.
  Conv1DGenerator(RewriterBase &rewriter, LinalgOp linalgOp)
      : StructuredGenerator<LinalgOp, utils::IteratorType>(rewriter, linalgOp) {}

  // Vectorization pre-condition.
  bool/LogicalResult vectorizePrecondition(LinalgOp linalgOp) { ... }

  // The initialization method.
  LogicalResult init() {
    // Or do an assertion here.
    if (failed(vectorizePrecondition(...))) {
      return failure();
    }
    // Initialize the values for the class members.
  }
};
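A hypothetical call site under this pattern would then look like:

// Sketch only: construction stays trivial; init() performs the validity
// check before any vectorization entry point is used.
Conv1DGenerator gen(rewriter, linalgOp);
if (failed(gen.init()))
  return rewriter.notifyMatchFailure(linalgOp, "unsupported 1-D conv/pool");
FailureOr<Operation *> res = gen.generateNonChanneledConv();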

Does it look better structured?

if (!validateConv1DGenerator(dummyBuilder, linalgOp))
return failure();

return success();
}

// TODO: the common vector shape is equal to the static loop sizes only when
// all indexing maps are projected permutations. For convs and stencils the
// logic will need to evolve.
@@ -3125,10 +3144,8 @@ bool isSupportedPoolKind(vector::CombiningKind kind) {
/// kw is unrolled, w is unrolled iff dilationW > 1.
struct Conv1DGenerator
: public StructuredGenerator<LinalgOp, utils::IteratorType> {
Conv1DGenerator(RewriterBase &rewriter, LinalgOp linalgOp, int strideW,
int dilationW)
: StructuredGenerator<LinalgOp, utils::IteratorType>(rewriter, linalgOp),
strideW(strideW), dilationW(dilationW) {
Conv1DGenerator(RewriterBase &rewriter, LinalgOp linalgOp)
: StructuredGenerator<LinalgOp, utils::IteratorType>(rewriter, linalgOp) {
// Determine whether `linalgOp` can be generated with this generator
if (linalgOp.getNumDpsInputs() != 2 || linalgOp.getNumDpsInits() != 1)
return;
@@ -3175,10 +3192,22 @@ struct Conv1DGenerator
return;
break;
}

// The ConvolutionOpInterface gives us guarantees of existence for
// strides/dilations. However, we do not need to rely on those, we can
// simply use them if present, otherwise use the default and let the generic
// conv. matcher in the ConvGenerator succeed or fail.
auto strides = linalgOp->getAttrOfType<DenseIntElementsAttr>("strides");
auto dilations = linalgOp->getAttrOfType<DenseIntElementsAttr>("dilations");
strideW = strides ? *strides.getValues<uint64_t>().begin() : 1;
dilationW = dilations ? *dilations.getValues<uint64_t>().begin() : 1;

// The op is now known to be valid.
valid = true;
}

bool isValid() { return valid; }

/// Generate a vector implementation for:
/// ```
/// Op def: ( w, kw )
@@ -3889,22 +3918,21 @@
}
}
};

// Helper function to construct Conv1DGenerator
bool validateConv1DGenerator(RewriterBase &rewriter, LinalgOp linalgOp) {
Conv1DGenerator conv1dGen(rewriter, linalgOp);
return conv1dGen.isValid();
}

} // namespace

/// Helper function to vectorize a LinalgOp with convolution semantics.
// TODO: extend the generic vectorization to support windows and drop this.
static FailureOr<Operation *> vectorizeConvolution(
RewriterBase &rewriter, LinalgOp op, ArrayRef<int64_t> inputVecSizes,
ArrayRef<bool> inputScalableVecDims, bool flatten1DDepthwiseConv) {
// The ConvolutionOpInterface gives us guarantees of existence for
// strides/dilations. However, we do not need to rely on those, we can
// simply use them if present, otherwise use the default and let the generic
// conv. matcher in the ConvGenerator succeed or fail.
auto strides = op->getAttrOfType<DenseIntElementsAttr>("strides");
auto dilations = op->getAttrOfType<DenseIntElementsAttr>("dilations");
auto stride = strides ? *strides.getValues<uint64_t>().begin() : 1;
auto dilation = dilations ? *dilations.getValues<uint64_t>().begin() : 1;
Conv1DGenerator e(rewriter, op, stride, dilation);
Conv1DGenerator e(rewriter, op);
auto res = e.generateNonChanneledConv();
if (succeeded(res))
return res;
@@ -3929,9 +3957,11 @@ static FailureOr<Operation *> vectorizeConvolution(
if (!inputVecSizes.empty()) {
// Only use the input vector size corresponding to the channel dim. Other
// vector dims will be inferred from the Ops.
assert((isa<linalg::DepthwiseConv1DNwcWcOp>(*op) ||
isa<linalg::DepthwiseConv1DNcwCwOp>(*op)) &&
"Not a 1D depthwise conv!");
if (!isa<linalg::DepthwiseConv1DNwcWcOp>(*op) &&
!isa<linalg::DepthwiseConv1DNcwCwOp>(*op)) {
return rewriter.notifyMatchFailure(
op, "Unexpected convolution: expected 1D depthwise conv");
}
size_t chDimIdx =
TypeSwitch<Operation *, size_t>(op)
.Case<linalg::DepthwiseConv1DNwcWcOp>([](auto conv) { return 2; })
19 changes: 19 additions & 0 deletions mlir/test/Dialect/Linalg/vectorization-unsupported.mlir
@@ -112,6 +112,25 @@ module attributes {transform.with_named_sequence} {

// -----

func.func @conv2d(%3: tensor<1x64x58x58xf32>, %4: tensor<64x64x3x3xf32>) {
%cst = arith.constant 0.000000e+00 : f32
%5 = tensor.empty() : tensor<1x64x56x56xf32>
%6 = linalg.fill ins(%cst : f32) outs(%5 : tensor<1x64x56x56xf32>) -> tensor<1x64x56x56xf32>
// expected-error @+1 {{Attempted to vectorize, but failed}}
%7 = linalg.conv_2d_nchw_fchw {dilations = dense<1> : vector<2xi64>, strides = dense<1> : vector<2xi64>} ins(%3, %4 : tensor<1x64x58x58xf32>, tensor<64x64x3x3xf32>) outs(%6 : tensor<1x64x56x56xf32>) -> tensor<1x64x56x56xf32>
return
}

module attributes {transform.with_named_sequence} {
transform.named_sequence @__transform_main(%arg1: !transform.any_op {transform.readonly}) {
%0 = transform.structured.match ops{["linalg.conv_2d_nchw_fchw"]} in %arg1 : (!transform.any_op) -> !transform.any_op
transform.structured.vectorize %0 : !transform.any_op
transform.yield
}
}

// -----

func.func @test_pack_no_vectorize_dynamic_shape(%arg0: tensor<?xf32>, %arg1: tensor<4x16xf32>) -> tensor<4x16xf32> {
%pad = arith.constant 0.000000e+00 : f32
// expected-error @+1 {{Attempted to vectorize, but failed}}