Resolve merge conflicts and fix tests after bump

mgehre-amd · mgehre-amd · commit 081636148c86 · 2025-11-07T12:20:23.000+01:00
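Handle the upstream change that turned the tosa.mul shift from an attribute into an optional operand: the integer constant-folding path now accepts a shift operand only when it is a constant tensor whose elements are all zero, and otherwise reports a match failure. Relax the operand-count assertion in the shared binary folding helper from exactly two to at least two operands, so that tosa.mul with its extra shift operand no longer asserts. Update the TOSA constant-folding test cases: the integer cases spell out a constant zero-shift operand, the float cases drop the old shift attribute, and the non-zero-shift CHECK lines capture the new SSA values, including the shift constant. Also document these findings for future bump runs.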
diff --git a/mlir/lib/Dialect/Tosa/Transforms/TosaFolders.cpp b/mlir/lib/Dialect/Tosa/Transforms/TosaFolders.cpp
@@ -355,7 +355,8 @@ struct TosaFoldConstantBase : public OpRewritePattern<TosaOp> {
                                       DenseElementsAttr valuesSecond) const {
     if (!foldSplatOrSingleUseOnly)
       return true;
-    assert(binaryOp->getNumOperands() == 2);
+    assert(binaryOp->getNumOperands() >= 2 &&
+           "binary folding expects at least two operands");
     auto firstOp = binaryOp->getOperand(0);
     auto secondOp = binaryOp->getOperand(1);
 
@@ -750,10 +751,19 @@ struct TosaFoldConstantMul
   DenseElementsAttr computeInteger(DenseElementsAttr lhsValues,
                                    DenseElementsAttr rhsValues,
                                    PatternRewriter &rewriter, MulOp op) const {
-    if (op.getShift() > 0) {
-      (void)rewriter.notifyMatchFailure(
-          op, "Non-zero shift folding is currently not implemented.");
-      return {};
+    if (Value shiftVal = op.getShift()) {
+      ElementsAttr shiftAttr;
+      if (!matchPattern(shiftVal, m_Constant(&shiftAttr))) {
+        (void)rewriter.notifyMatchFailure(
+            op, "shift must be a constant for folding.");
+        return {};
+      }
+      if (llvm::any_of(shiftAttr.getValues<IntegerAttr>(),
+                       [](IntegerAttr attr) { return attr.getInt() != 0; })) {
+        (void)rewriter.notifyMatchFailure(
+            op, "Non-zero shift folding is currently not implemented.");
+        return {};
+      }
     }
 
     auto resultElementWidth =
diff --git a/mlir/test/Dialect/Tosa/constant-mul-opt.mlir b/mlir/test/Dialect/Tosa/constant-mul-opt.mlir
@@ -1,3 +1,5 @@
+// Modifications (c) Copyright 2023-2025 Advanced Micro Devices, Inc. or its
+// affiliates
 // RUN: mlir-opt --split-input-file -verify-diagnostics --tosa-layerwise-constant-fold %s | FileCheck %s
 
 // Float multiplications
@@ -15,7 +17,7 @@ func.func @mul_fold_float() -> tensor<4xf16> {
                         dense<[-132.7, -3.0, -0.0, 5.0]> :
                         tensor<4xf16>
                       } : () -> tensor<4xf16>
-  %2 = "tosa.mul"(%0, %1) {shift = 0 : i8} : (tensor<4xf16>, tensor<4xf16>) -> tensor<4xf16>
+  %2 = "tosa.mul"(%0, %1) : (tensor<4xf16>, tensor<4xf16>) -> tensor<4xf16>
   return %2 : tensor<4xf16>
 }
 
@@ -32,7 +34,7 @@ func.func @mul_fold_float_infinity_nan() -> tensor<7xf32> {
                         dense<[3.0, -3.0, -3.0, 3.0, 1.0, 0xFF800000, 0.0]> :
                         tensor<7xf32>
                       } : () -> tensor<7xf32>
-  %2 = "tosa.mul"(%0, %1) {shift = 0 : i8} : (tensor<7xf32>, tensor<7xf32>) -> tensor<7xf32>
+  %2 = "tosa.mul"(%0, %1) : (tensor<7xf32>, tensor<7xf32>) -> tensor<7xf32>
   return %2 : tensor<7xf32>
 }
 
@@ -49,7 +51,7 @@ func.func @add_fold_float_overflow() -> tensor<2xf32> {
                         dense<[2.1e+38, 1.1e+38]> :
                         tensor<2xf32>
                       } : () -> tensor<2xf32>
-  %2 = "tosa.mul"(%0, %1) {shift = 0 : i8} : (tensor<2xf32>, tensor<2xf32>) -> tensor<2xf32>
+  %2 = "tosa.mul"(%0, %1) : (tensor<2xf32>, tensor<2xf32>) -> tensor<2xf32>
   return %2 : tensor<2xf32>
 }
 
@@ -69,7 +71,8 @@ func.func @mul_fold_int() -> tensor<4xi32> {
                         dense<[-132, -3, 0, 5]> :
                         tensor<4xi32>
                       } : () -> tensor<4xi32>
-  %2 = "tosa.mul"(%0, %1) {shift = 0 : i8} : (tensor<4xi32>, tensor<4xi32>) -> tensor<4xi32>
+  %shift = "tosa.const"() <{value = dense<0> : tensor<1xi8>}> : () -> tensor<1xi8>
+  %2 = "tosa.mul"(%0, %1, %shift) : (tensor<4xi32>, tensor<4xi32>, tensor<1xi8>) -> tensor<4xi32>
   return %2 : tensor<4xi32>
 }
 
@@ -87,10 +90,12 @@ func.func @mul_fold_i8() -> tensor<4xi32> {
                         tensor<4xi8>
                       } : () -> tensor<4xi8>
   // TODO: This is wrongly rejected as illegal, see https://reviews.llvm.org/D150472#4484478
-  // %2 = "tosa.mul"(%0, %1) {shift = 0 : i8} : (tensor<4xi8>, tensor<4xi8>) -> tensor<4xi32>
+  // %zero_shift = "tosa.const"() <{value = dense<0> : tensor<1xi8>}> : () -> tensor<1xi8>
+  // %2 = "tosa.mul"(%0, %1, %zero_shift) : (tensor<4xi8>, tensor<4xi8>, tensor<1xi8>) -> tensor<4xi32>
   %a = "tosa.cast"(%0) : (tensor<4xi8>) -> tensor<4xi32>
   %b = "tosa.cast"(%1) : (tensor<4xi8>) -> tensor<4xi32>
-  %2 = "tosa.mul"(%a, %b) {shift = 0 : i8} : (tensor<4xi32>, tensor<4xi32>) -> tensor<4xi32>
+  %shift = "tosa.const"() <{value = dense<0> : tensor<1xi8>}> : () -> tensor<1xi8>
+  %2 = "tosa.mul"(%a, %b, %shift) : (tensor<4xi32>, tensor<4xi32>, tensor<1xi8>) -> tensor<4xi32>
 
   return %2 : tensor<4xi32>
 }
@@ -110,8 +115,9 @@ func.func @mul_fold_int_overflow() -> tensor<4xi32> {
                         dense<[1, 10, 1, 30]> :
                         tensor<4xi32>
                       } : () -> tensor<4xi32>
+  %shift = "tosa.const"() <{value = dense<0> : tensor<1xi8>}> : () -> tensor<1xi8>
   // expected-warning@below {{Multiplication did overflow. The results are unspecified.}}
-  %2 = "tosa.mul"(%0, %1) {shift = 0 : i8} : (tensor<4xi32>, tensor<4xi32>) -> tensor<4xi32>
+  %2 = "tosa.mul"(%0, %1, %shift) : (tensor<4xi32>, tensor<4xi32>, tensor<1xi8>) -> tensor<4xi32>
   return %2 : tensor<4xi32>
 }
 
@@ -127,7 +133,8 @@ func.func @mul_fold_equal_args() -> tensor<3xi32> {
                         dense<[-17, 4, 0]> :
                         tensor<3xi32>
                       } : () -> tensor<3xi32>
-  %2 = "tosa.mul"(%0, %0) {shift = 0 : i8} : (tensor<3xi32>, tensor<3xi32>) -> tensor<3xi32>
+  %shift = "tosa.const"() <{value = dense<0> : tensor<1xi8>}> : () -> tensor<1xi8>
+  %2 = "tosa.mul"(%0, %0, %shift) : (tensor<3xi32>, tensor<3xi32>, tensor<1xi8>) -> tensor<3xi32>
   return %2 : tensor<3xi32>
 }
 
@@ -147,7 +154,8 @@ func.func @mul_fold_int_broadcast_simple() -> tensor<3xi32> {
                         dense<-12> :
                         tensor<1xi32>
                       } : () -> tensor<1xi32>
-  %2 = "tosa.mul"(%0, %1) {shift = 0 : i8} : (tensor<3xi32>, tensor<1xi32>) -> tensor<3xi32>
+  %shift = "tosa.const"() <{value = dense<0> : tensor<1xi8>}> : () -> tensor<1xi8>
+  %2 = "tosa.mul"(%0, %1, %shift) : (tensor<3xi32>, tensor<1xi32>, tensor<1xi8>) -> tensor<3xi32>
   return %2 : tensor<3xi32>
 }
 
@@ -167,15 +175,17 @@ func.func @mul_fold_int_broadcast_complex() -> tensor<3x3xi32> {
                         dense<[[-12, 7, 4]]> :
                         tensor<1x3xi32>
                       } : () -> tensor<1x3xi32>
-  %2 = "tosa.mul"(%0, %1) {shift = 0 : i8} : (tensor<3x1xi32>, tensor<1x3xi32>) -> tensor<3x3xi32>
+  %shift = "tosa.const"() <{value = dense<0> : tensor<1xi8>}> : () -> tensor<1xi8>
+  %2 = "tosa.mul"(%0, %1, %shift) : (tensor<3x1xi32>, tensor<1x3xi32>, tensor<1xi8>) -> tensor<3x3xi32>
   return %2 : tensor<3x3xi32>
 }
 
 // CHECK-LABEL: @mul_fold_int_non_zero_shift
 func.func @mul_fold_int_non_zero_shift() -> tensor<4xi32> {
-  // CHECK: [[FIRST:]] ={{.*}}tosa.const
-  // CHECK-NEXT: [[SECOND:]] ={{.*}}tosa.const
-  // CHECK-NEXT: [[MUL:]] ={{.*}}tosa.mul{{.*}}[[FIRST]], [[SECOND]]
+  // CHECK: [[FIRST:%.*]] ={{.*}}tosa.const
+  // CHECK-NEXT: [[SECOND:%.*]] ={{.*}}tosa.const
+  // CHECK-NEXT: [[SHIFT:%.*]] ={{.*}}tosa.const
+  // CHECK-NEXT: [[MUL:%.*]] ={{.*}}tosa.mul{{.*}}[[FIRST]], [[SECOND]], [[SHIFT]]
   // CHECK-NEXT: return [[MUL]]
   %0 = "tosa.const"() {value =
                         dense<[-17, 4, 0, 0]> :
@@ -185,6 +195,7 @@ func.func @mul_fold_int_non_zero_shift() -> tensor<4xi32> {
                         dense<[-132, -3, 0, 5]> :
                         tensor<4xi32>
                       } : () -> tensor<4xi32>
-  %2 = "tosa.mul"(%0, %1) {shift = 1 : i8} : (tensor<4xi32>, tensor<4xi32>) -> tensor<4xi32>
+  %shift = "tosa.const"() <{value = dense<1> : tensor<1xi8>}> : () -> tensor<1xi8>
+  %2 = "tosa.mul"(%0, %1, %shift) : (tensor<4xi32>, tensor<4xi32>, tensor<1xi8>) -> tensor<4xi32>
   return %2 : tensor<4xi32>
 }