llvm
diff --git a/‎llvm/include/llvm/Analysis/ScalarEvolution.h‎
Lines changed: 8 additions & 0 deletions b/‎llvm/include/llvm/Analysis/ScalarEvolution.h‎
Lines changed: 8 additions & 0 deletions
diff --git a/‎llvm/lib/Analysis/Delinearization.cpp‎
Lines changed: 20 additions & 62 deletions b/‎llvm/lib/Analysis/Delinearization.cpp‎
Lines changed: 20 additions & 62 deletions
diff --git a/‎llvm/lib/Analysis/ScalarEvolution.cpp‎
Lines changed: 43 additions & 0 deletions b/‎llvm/lib/Analysis/ScalarEvolution.cpp‎
Lines changed: 43 additions & 0 deletions
diff --git a/‎llvm/test/Analysis/DependenceAnalysis/Banerjee.ll‎
Lines changed: 9 additions & 9 deletions b/‎llvm/test/Analysis/DependenceAnalysis/Banerjee.ll‎
Lines changed: 9 additions & 9 deletions
@@ -544,6 +544,14 @@ class ScalarEvolution {
                                 const SCEV *LHS, const SCEV *RHS,
                                 const Instruction *CtxI = nullptr);
 
+  /// Return a predicate that, if true at runtime, proves that \p LHS \p BinOp
+  /// \p RHS has no signed/unsigned overflow (depending on \p Signed). Returns
+  /// nullptr if no-overflow is already provable at compile time. Only Add,
+  /// Sub and Mul are supported; \p LHS must be integer-typed.
+  LLVM_ABI const SCEVPredicate *
+  getNoOverflowPredicate(Instruction::BinaryOps BinOp, bool Signed,
+                         const SCEV *LHS, const SCEV *RHS);
+
   /// Parse NSW/NUW flags from add/sub/mul IR binary operation \p Op into
   /// SCEV no-wrap flags, and deduce flag[s] that aren't known yet.
   /// Does not mutate the original instruction. Returns std::nullopt if it could
 
@@ -772,37 +772,19 @@ bool llvm::validateDelinearizationResult(
             SE.getNoopOrSignExtend(B, WiderType)};
   };
 
-  // Get a type with twice the bit width of T.
-  auto GetWiderType = [&](Type *T) -> Type * {
-    unsigned BitWidth = SE.getTypeSizeInBits(T);
-    return IntegerType::get(T->getContext(), BitWidth * 2);
-  };
-
   // Check if the result of A + B (signed) does not overflow. If it can be
   // proven at compile-time, return the result. If it might overflow and Assume
   // is provided, add a runtime equality predicate and return the result.
   // Otherwise return nullptr.
   auto AddNoOverflow = [&](const SCEV *A, const SCEV *B) -> const SCEV * {
     std::tie(A, B) = UnifyTypes(A, B);
-    if (SE.willNotOverflow(Instruction::Add, /*IsSigned=*/true, A, B))
-      return SE.getAddExpr(A, B);
-    if (!Assume)
-      return nullptr;
-
-    // Compute the addition in a wider type to detect overflow.
-    // If (sext A) + (sext B) == sext(A + B), then A + B does not overflow.
-    Type *OrigTy = A->getType();
-    Type *WiderTy = GetWiderType(OrigTy);
-    const SCEV *AWide = SE.getSignExtendExpr(A, WiderTy);
-    const SCEV *BWide = SE.getSignExtendExpr(B, WiderTy);
-    const SCEV *SumWide = SE.getAddExpr(AWide, BWide);
-    const SCEV *Sum = SE.getAddExpr(A, B);
-    const SCEV *SumExtended = SE.getSignExtendExpr(Sum, WiderTy);
-    // Add predicate: (sext A) + (sext B) == sext(A + B).
-    if (SumWide != SumExtended &&
-        !SE.isKnownPredicate(ICmpInst::ICMP_EQ, SumWide, SumExtended))
-      Assume->push_back(SE.getEqualPredicate(SumWide, SumExtended));
-    return Sum;
+    if (const auto *Pred = SE.getNoOverflowPredicate(Instruction::Add,
+                                                     /*Signed=*/true, A, B)) {
+      if (!Assume)
+        return nullptr; // No list to record the runtime predicate in.
+      Assume->push_back(Pred); // Defer the no-overflow proof to runtime.
+    }
+    return SE.getAddExpr(A, B);
   };
 
   // Check if the result of A * B (signed) does not overflow. If it can be
@@ -811,50 +793,26 @@ bool llvm::validateDelinearizationResult(
   // Otherwise return nullptr.
   auto MulNoOverflow = [&](const SCEV *A, const SCEV *B) -> const SCEV * {
     std::tie(A, B) = UnifyTypes(A, B);
-    if (SE.willNotOverflow(Instruction::Mul, /*IsSigned=*/true, A, B))
-      return SE.getMulExpr(A, B);
-    if (!Assume)
-      return nullptr;
-
-    // Compute the multiplication in a wider type to detect overflow.
-    // If (sext A) * (sext B) == sext(A * B), then A * B does not overflow.
-    Type *OrigTy = A->getType();
-    Type *WiderTy = GetWiderType(OrigTy);
-    const SCEV *AWide = SE.getSignExtendExpr(A, WiderTy);
-    const SCEV *BWide = SE.getSignExtendExpr(B, WiderTy);
-    const SCEV *ProdWide = SE.getMulExpr(AWide, BWide);
-    const SCEV *Prod = SE.getMulExpr(A, B);
-    const SCEV *ProdExtended = SE.getSignExtendExpr(Prod, WiderTy);
-    // Add predicate: (sext A) * (sext B) == sext(A * B).
-    if (ProdWide != ProdExtended &&
-        !SE.isKnownPredicate(ICmpInst::ICMP_EQ, ProdWide, ProdExtended))
-      Assume->push_back(SE.getEqualPredicate(ProdWide, ProdExtended));
-    return Prod;
+    if (const auto *Pred = SE.getNoOverflowPredicate(Instruction::Mul,
+                                                     /*Signed=*/true, A, B)) {
+      if (!Assume)
+        return nullptr; // No list to record the runtime predicate in.
+      Assume->push_back(Pred); // Defer the no-overflow proof to runtime.
+    }
+    return SE.getMulExpr(A, B);
   };
 
   // Check if the result of A - B (signed) does not overflow. If it can be
   // proven at compile-time or if Assume is provided (adding a runtime
   // predicate), return true. Otherwise return false.
   auto SubNoOverflow = [&](const SCEV *A, const SCEV *B) -> bool {
     std::tie(A, B) = UnifyTypes(A, B);
-    if (SE.willNotOverflow(Instruction::Sub, /*IsSigned=*/true, A, B))
-      return true;
-    if (!Assume)
-      return false;
-
-    // Compute the subtraction in a wider type to detect overflow.
-    // If (sext A) - (sext B) == sext(A - B), then A - B does not overflow.
-    Type *OrigTy = A->getType();
-    Type *WiderTy = GetWiderType(OrigTy);
-    const SCEV *AWide = SE.getSignExtendExpr(A, WiderTy);
-    const SCEV *BWide = SE.getSignExtendExpr(B, WiderTy);
-    const SCEV *DiffWide = SE.getMinusSCEV(AWide, BWide);
-    const SCEV *Diff = SE.getMinusSCEV(A, B);
-    const SCEV *DiffExtended = SE.getSignExtendExpr(Diff, WiderTy);
-    // Add predicate: (sext A) - (sext B) == sext(A - B).
-    if (DiffWide != DiffExtended &&
-        !SE.isKnownPredicate(ICmpInst::ICMP_EQ, DiffWide, DiffExtended))
-      Assume->push_back(SE.getEqualPredicate(DiffWide, DiffExtended));
+    if (const auto *Pred = SE.getNoOverflowPredicate(Instruction::Sub,
+                                                     /*Signed=*/true, A, B)) {
+      if (!Assume)
+        return false; // No list to record the runtime predicate in.
+      Assume->push_back(Pred); // Defer the no-overflow proof to runtime.
+    }
     return true;
   };
 
 
@@ -2376,6 +2376,49 @@ bool ScalarEvolution::willNotOverflow(Instruction::BinaryOps BinOp, bool Signed,
   }
 }
 
+const SCEVPredicate *
+ScalarEvolution::getNoOverflowPredicate(Instruction::BinaryOps BinOp,
+                                        bool Signed, const SCEV *LHS,
+                                        const SCEV *RHS) {
+  // Nothing needs to be assumed if no-overflow is provable at compile time.
+  if (willNotOverflow(BinOp, Signed, LHS, RHS))
+    return nullptr;
+
+  const SCEV *(ScalarEvolution::*Operation)(const SCEV *, const SCEV *,
+                                            SCEV::NoWrapFlags, unsigned);
+  switch (BinOp) { // Pick the SCEV builder matching BinOp.
+  default:
+    llvm_unreachable("Unsupported binary op"); // Only Add/Sub/Mul handled.
+  case Instruction::Add:
+    Operation = &ScalarEvolution::getAddExpr;
+    break;
+  case Instruction::Sub:
+    Operation = &ScalarEvolution::getMinusSCEV;
+    break;
+  case Instruction::Mul:
+    Operation = &ScalarEvolution::getMulExpr;
+    break;
+  }
+
+  const SCEV *(ScalarEvolution::*Extension)(const SCEV *, Type *, unsigned) =
+      Signed ? &ScalarEvolution::getSignExtendExpr
+             : &ScalarEvolution::getZeroExtendExpr;
+
+  // Build ext(LHS op RHS) == ext(LHS) op ext(RHS) at twice the bit width.
+  auto *NarrowTy = cast<IntegerType>(LHS->getType());
+  auto *WideTy =
+      IntegerType::get(NarrowTy->getContext(), NarrowTy->getBitWidth() * 2);
+
+  const SCEV *A = (this->*Extension)(
+      (this->*Operation)(LHS, RHS, SCEV::FlagAnyWrap, 0), WideTy, 0);
+  const SCEV *LHSB = (this->*Extension)(LHS, WideTy, 0);
+  const SCEV *RHSB = (this->*Extension)(RHS, WideTy, 0);
+  const SCEV *B = (this->*Operation)(LHSB, RHSB, SCEV::FlagAnyWrap, 0);
+
+  // If A == B holds at runtime, LHS op RHS does not overflow in NarrowTy.
+  return getEqualPredicate(A, B);
+}
+
 std::optional<SCEV::NoWrapFlags>
 ScalarEvolution::getStrengthenedNoWrapFlagsFromBinOp(
     const OverflowingBinaryOperator *OBO) {
 
@@ -139,27 +139,27 @@ define void @banerjee1(ptr %A, ptr %B, i64 %m, i64 %n) nounwind uwtable ssp {
 ; DELIN-NEXT:    da analyze - consistent output [0 0]!
 ; DELIN-NEXT:    Runtime Assumptions:
 ; DELIN-NEXT:    Compare predicate: {1,+,1}<nuw><nsw><%for.body3> slt) 10
-; DELIN-NEXT:    Equal predicate: {80,+,80}<nuw><nsw><%for.cond1.preheader> == (sext i64 {80,+,80}<%for.cond1.preheader> to i128)
-; DELIN-NEXT:    Equal predicate: (80 + (sext i64 {80,+,80}<%for.cond1.preheader> to i128))<nsw> == (sext i64 {160,+,80}<%for.cond1.preheader> to i128)
-; DELIN-NEXT:    Equal predicate: (-1 + (sext i64 {160,+,80}<%for.cond1.preheader> to i128))<nsw> == (15 + (sext i64 {144,+,80}<%for.cond1.preheader> to i128))<nuw><nsw>
+; DELIN-NEXT:    Equal predicate: (sext i64 {80,+,80}<%for.cond1.preheader> to i128) == {80,+,80}<nuw><nsw><%for.cond1.preheader>
+; DELIN-NEXT:    Equal predicate: (sext i64 {160,+,80}<%for.cond1.preheader> to i128) == (80 + (sext i64 {80,+,80}<%for.cond1.preheader> to i128))<nsw>
+; DELIN-NEXT:    Equal predicate: (15 + (sext i64 {144,+,80}<%for.cond1.preheader> to i128))<nuw><nsw> == (-1 + (sext i64 {160,+,80}<%for.cond1.preheader> to i128))<nsw>
 ; DELIN-NEXT:    Compare predicate: {1,+,1}<nuw><nsw><%for.body3> slt) 10
 ; DELIN-NEXT:  Src: store i64 0, ptr %arrayidx, align 8 --> Dst: %2 = load i64, ptr %arrayidx6, align 8
 ; DELIN-NEXT:    da analyze - consistent flow [0 1]!
 ; DELIN-NEXT:    Runtime Assumptions:
 ; DELIN-NEXT:    Compare predicate: {1,+,1}<nuw><nsw><%for.body3> slt) 10
-; DELIN-NEXT:    Equal predicate: {80,+,80}<nuw><nsw><%for.cond1.preheader> == (sext i64 {80,+,80}<%for.cond1.preheader> to i128)
-; DELIN-NEXT:    Equal predicate: (80 + (sext i64 {80,+,80}<%for.cond1.preheader> to i128))<nsw> == (sext i64 {160,+,80}<%for.cond1.preheader> to i128)
-; DELIN-NEXT:    Equal predicate: (-1 + (sext i64 {160,+,80}<%for.cond1.preheader> to i128))<nsw> == (15 + (sext i64 {144,+,80}<%for.cond1.preheader> to i128))<nuw><nsw>
+; DELIN-NEXT:    Equal predicate: (sext i64 {80,+,80}<%for.cond1.preheader> to i128) == {80,+,80}<nuw><nsw><%for.cond1.preheader>
+; DELIN-NEXT:    Equal predicate: (sext i64 {160,+,80}<%for.cond1.preheader> to i128) == (80 + (sext i64 {80,+,80}<%for.cond1.preheader> to i128))<nsw>
+; DELIN-NEXT:    Equal predicate: (15 + (sext i64 {144,+,80}<%for.cond1.preheader> to i128))<nuw><nsw> == (-1 + (sext i64 {160,+,80}<%for.cond1.preheader> to i128))<nsw>
 ; DELIN-NEXT:    Compare predicate: {0,+,1}<nuw><nsw><%for.body3> slt) 10
 ; DELIN-NEXT:  Src: store i64 0, ptr %arrayidx, align 8 --> Dst: store i64 %2, ptr %B.addr.12, align 8
 ; DELIN-NEXT:    da analyze - confused!
 ; DELIN-NEXT:  Src: %2 = load i64, ptr %arrayidx6, align 8 --> Dst: %2 = load i64, ptr %arrayidx6, align 8
 ; DELIN-NEXT:    da analyze - consistent input [0 0]!
 ; DELIN-NEXT:    Runtime Assumptions:
 ; DELIN-NEXT:    Compare predicate: {0,+,1}<nuw><nsw><%for.body3> slt) 10
-; DELIN-NEXT:    Equal predicate: {80,+,80}<nuw><nsw><%for.cond1.preheader> == (sext i64 {80,+,80}<%for.cond1.preheader> to i128)
-; DELIN-NEXT:    Equal predicate: (80 + (sext i64 {80,+,80}<%for.cond1.preheader> to i128))<nsw> == (sext i64 {160,+,80}<%for.cond1.preheader> to i128)
-; DELIN-NEXT:    Equal predicate: (-1 + (sext i64 {160,+,80}<%for.cond1.preheader> to i128))<nsw> == (15 + (sext i64 {144,+,80}<%for.cond1.preheader> to i128))<nuw><nsw>
+; DELIN-NEXT:    Equal predicate: (sext i64 {80,+,80}<%for.cond1.preheader> to i128) == {80,+,80}<nuw><nsw><%for.cond1.preheader>
+; DELIN-NEXT:    Equal predicate: (sext i64 {160,+,80}<%for.cond1.preheader> to i128) == (80 + (sext i64 {80,+,80}<%for.cond1.preheader> to i128))<nsw>
+; DELIN-NEXT:    Equal predicate: (15 + (sext i64 {144,+,80}<%for.cond1.preheader> to i128))<nuw><nsw> == (-1 + (sext i64 {160,+,80}<%for.cond1.preheader> to i128))<nsw>
 ; DELIN-NEXT:    Compare predicate: {0,+,1}<nuw><nsw><%for.body3> slt) 10
 ; DELIN-NEXT:  Src: %2 = load i64, ptr %arrayidx6, align 8 --> Dst: store i64 %2, ptr %B.addr.12, align 8
 ; DELIN-NEXT:    da analyze - confused!