[LV] Provide utility routine to find uncounted exit recipes #152530

huntergr-arm · 2025-08-07T15:20:31Z

Splitting out just the recipe finding code from #148626 into a utility function (along with the extra pattern matchers). Hopefully this makes reviewing a bit easier.

Added a gtest, since this isn't actually used anywhere yet.

llvmbot · 2025-08-07T15:21:08Z

@llvm/pr-subscribers-llvm-transforms

@llvm/pr-subscribers-vectorizers

Author: Graham Hunter (huntergr-arm)

Changes

Splitting out just the recipe finding code from #148626 into a utility function (along with the extra pattern matchers). Hopefully this makes reviewing a bit easier.

Added a gtest, since this isn't actually used anywhere yet.

Full diff: https://github.com/llvm/llvm-project/pull/152530.diff

6 Files Affected:

(modified) llvm/lib/Transforms/Vectorize/VPlanPatternMatch.h (+31)
(modified) llvm/lib/Transforms/Vectorize/VPlanUtils.cpp (+100)
(modified) llvm/lib/Transforms/Vectorize/VPlanUtils.h (+8)
(modified) llvm/lib/Transforms/Vectorize/VPlanValue.h (+2)
(modified) llvm/unittests/Transforms/Vectorize/CMakeLists.txt (+1)
(added) llvm/unittests/Transforms/Vectorize/VPlanUncountedExitTest.cpp (+99)

diff --git a/llvm/lib/Transforms/Vectorize/VPlanPatternMatch.h b/llvm/lib/Transforms/Vectorize/VPlanPatternMatch.h
index 8818843a30625..d7f9763c4d0c8 100644
--- a/llvm/lib/Transforms/Vectorize/VPlanPatternMatch.h
+++ b/llvm/lib/Transforms/Vectorize/VPlanPatternMatch.h
@@ -692,6 +692,37 @@ m_Intrinsic(const T0 &Op0, const T1 &Op1, const T2 &Op2, const T3 &Op3) {
   return m_CombineAnd(m_Intrinsic<IntrID>(Op0, Op1, Op2), m_Argument<3>(Op3));
 }
 
+struct loop_invariant_vpvalue {
+  template <typename ITy> bool match(ITy *V) const {
+    VPValue *Val = dyn_cast<VPValue>(V);
+    return Val && Val->isDefinedOutsideLoopRegions();
+  }
+};
+
+inline loop_invariant_vpvalue m_LoopInvVPValue() {
+  return loop_invariant_vpvalue();
+}
+
+template <typename Op0_t>
+inline UnaryVPInstruction_match<Op0_t, VPInstruction::AnyOf>
+m_AnyOf(const Op0_t &Op0) {
+  return m_VPInstruction<VPInstruction::AnyOf>(Op0);
+}
+
+template <typename SubPattern_t> struct OneUse_match {
+  SubPattern_t SubPattern;
+
+  OneUse_match(const SubPattern_t &SP) : SubPattern(SP) {}
+
+  template <typename OpTy> bool match(OpTy *V) {
+    return V->hasOneUse() && SubPattern.match(V);
+  }
+};
+
+template <typename T> inline OneUse_match<T> m_OneUse(const T &SubPattern) {
+  return SubPattern;
+}
+
 } // namespace VPlanPatternMatch
 } // namespace llvm
 
diff --git a/llvm/lib/Transforms/Vectorize/VPlanUtils.cpp b/llvm/lib/Transforms/Vectorize/VPlanUtils.cpp
index 14f20c65a7034..358c38f49405c 100644
--- a/llvm/lib/Transforms/Vectorize/VPlanUtils.cpp
+++ b/llvm/lib/Transforms/Vectorize/VPlanUtils.cpp
@@ -138,3 +138,103 @@ VPBasicBlock *vputils::getFirstLoopHeader(VPlan &Plan, VPDominatorTree &VPDT) {
   });
   return I == DepthFirst.end() ? nullptr : cast<VPBasicBlock>(*I);
 }
+
+std::optional<VPValue *> vputils::getRecipesForUncountedExit(
+    VPlan &Plan, SmallVectorImpl<VPRecipeBase *> &Recipes,
+    SmallVectorImpl<VPReplicateRecipe *> &GEPs) {
+  using namespace llvm::VPlanPatternMatch;
+  // Given a vplan like the following (just including the recipes contributing
+  // to loop control exiting here, not the actual work), we're looking to match
+  // the recipes contributing to the uncounted exit condition comparison
+  // (here, vp<%4>) back to the canonical induction for the vector body so that
+  // we can copy them to a preheader and rotate the address in the loop to the
+  // next vector iteration.
+  //
+  // VPlan ' for UF>=1' {
+  // Live-in vp<%0> = VF
+  // Live-in ir<64> = original trip-count
+  //
+  // entry:
+  // Successor(s): preheader, vector.ph
+  //
+  // vector.ph:
+  // Successor(s): vector loop
+  //
+  // <x1> vector loop: {
+  //   vector.body:
+  //     EMIT vp<%2> = CANONICAL-INDUCTION ir<0>
+  //     vp<%3> = SCALAR-STEPS vp<%2>, ir<1>, vp<%0>
+  //     CLONE ir<%ee.addr> = getelementptr ir<0>, vp<%3>
+  //     WIDEN ir<%ee.load> = load ir<%ee.addr>
+  //     WIDEN vp<%4> = icmp eq ir<%ee.load>, ir<0>
+  //     EMIT vp<%5> = any-of vp<%4>
+  //     EMIT vp<%6> = add vp<%2>, vp<%0>
+  //     EMIT vp<%7> = icmp eq vp<%6>, ir<64>
+  //     EMIT vp<%8> = or vp<%5>, vp<%7>
+  //     EMIT branch-on-cond vp<%8>
+  //   No successors
+  // }
+  // Successor(s): middle.block
+  //
+  // middle.block:
+  // Successor(s): preheader
+  //
+  // preheader:
+  // No successors
+  // }
+
+  // Find the uncounted loop exit condition.
+  auto *Region = Plan.getVectorLoopRegion();
+  VPValue *UncountedCondition = nullptr;
+  if (!match(
+          Region->getExitingBasicBlock()->getTerminator(),
+          m_BranchOnCond(m_OneUse(m_c_BinaryOr(
+              m_OneUse(m_AnyOf(m_VPValue(UncountedCondition))), m_VPValue())))))
+    return std::nullopt;
+
+  SmallVector<VPValue *, 4> Worklist;
+  bool LoadFound = false;
+  Worklist.push_back(UncountedCondition);
+  while (!Worklist.empty()) {
+    VPValue *V = Worklist.pop_back_val();
+
+    if (V->isDefinedOutsideLoopRegions())
+      continue;
+    if (V->getNumUsers() > 1)
+      return std::nullopt;
+
+    if (auto *Cmp = dyn_cast<VPWidenRecipe>(V)) {
+      if (Cmp->getOpcode() != Instruction::ICmp)
+        return std::nullopt;
+      Worklist.push_back(Cmp->getOperand(0));
+      Worklist.push_back(Cmp->getOperand(1));
+      Recipes.push_back(Cmp);
+    } else if (auto *Load = dyn_cast<VPWidenLoadRecipe>(V)) {
+      if (!Load->isConsecutive() || Load->isMasked())
+        return std::nullopt;
+      Worklist.push_back(Load->getAddr());
+      Recipes.push_back(Load);
+      LoadFound = true;
+    } else if (auto *VecPtr = dyn_cast<VPVectorPointerRecipe>(V)) {
+      Worklist.push_back(VecPtr->getOperand(0));
+      Recipes.push_back(VecPtr);
+    } else if (auto *GEP = dyn_cast<VPReplicateRecipe>(V)) {
+      if (GEP->getNumOperands() != 2)
+        return std::nullopt;
+      if (!match(GEP, m_GetElementPtr(
+                          m_LoopInvVPValue(),
+                          m_ScalarIVSteps(m_Specific(Plan.getCanonicalIV()),
+                                          m_SpecificInt(1),
+                                          m_Specific(&Plan.getVF())))))
+        return std::nullopt;
+      GEPs.push_back(GEP);
+      Recipes.push_back(GEP);
+    } else
+      return std::nullopt;
+  }
+
+  if (GEPs.empty() || !LoadFound)
+    return std::nullopt;
+
+  return UncountedCondition;
+}
diff --git a/llvm/lib/Transforms/Vectorize/VPlanUtils.h b/llvm/lib/Transforms/Vectorize/VPlanUtils.h
index 8dcd57f1b3598..631d7aa8da9ee 100644
--- a/llvm/lib/Transforms/Vectorize/VPlanUtils.h
+++ b/llvm/lib/Transforms/Vectorize/VPlanUtils.h
@@ -97,6 +97,14 @@ bool isUniformAcrossVFsAndUFs(VPValue *V);
 /// Returns the header block of the first, top-level loop, or null if none
 /// exist.
 VPBasicBlock *getFirstLoopHeader(VPlan &Plan, VPDominatorTree &VPDT);
+
+/// Returns the VPValue representing the uncounted exit comparison if all the
+/// recipes needed to form the condition within the vector loop body were
+/// matched.
+std::optional<VPValue *>
+getRecipesForUncountedExit(VPlan &Plan,
+                           SmallVectorImpl<VPRecipeBase *> &Recipes,
+                           SmallVectorImpl<VPReplicateRecipe *> &GEPs);
 } // namespace vputils
 
 //===----------------------------------------------------------------------===//
diff --git a/llvm/lib/Transforms/Vectorize/VPlanValue.h b/llvm/lib/Transforms/Vectorize/VPlanValue.h
index 24f6d61512ef6..5fecbbdef4b5b 100644
--- a/llvm/lib/Transforms/Vectorize/VPlanValue.h
+++ b/llvm/lib/Transforms/Vectorize/VPlanValue.h
@@ -148,6 +148,8 @@ class LLVM_ABI_FOR_TEST VPValue {
     return Current != user_end();
   }
 
+  bool hasOneUse() const { return getNumUsers() == 1; }
+
   void replaceAllUsesWith(VPValue *New);
 
   /// Go through the uses list for this VPValue and make each use point to \p
diff --git a/llvm/unittests/Transforms/Vectorize/CMakeLists.txt b/llvm/unittests/Transforms/Vectorize/CMakeLists.txt
index 53eeff28c185f..a7254922af007 100644
--- a/llvm/unittests/Transforms/Vectorize/CMakeLists.txt
+++ b/llvm/unittests/Transforms/Vectorize/CMakeLists.txt
@@ -14,5 +14,6 @@ add_llvm_unittest(VectorizeTests
   VPlanHCFGTest.cpp
   VPlanPatternMatchTest.cpp
   VPlanSlpTest.cpp
+  VPlanUncountedExitTest.cpp
   VPlanVerifierTest.cpp
   )
diff --git a/llvm/unittests/Transforms/Vectorize/VPlanUncountedExitTest.cpp b/llvm/unittests/Transforms/Vectorize/VPlanUncountedExitTest.cpp
new file mode 100644
index 0000000000000..81ef67a0fb923
--- /dev/null
+++ b/llvm/unittests/Transforms/Vectorize/VPlanUncountedExitTest.cpp
@@ -0,0 +1,99 @@
+//===- llvm/unittests/Transforms/Vectorize/VPlanUncountedExitTest.cpp -----===//
+//
+//
+// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
+// See https://llvm.org/LICENSE.txt for license information.
+// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
+//
+//===----------------------------------------------------------------------===//
+
+#include "../lib/Transforms/Vectorize/LoopVectorizationPlanner.h"
+#include "../lib/Transforms/Vectorize/VPlan.h"
+#include "../lib/Transforms/Vectorize/VPlanPatternMatch.h"
+#include "../lib/Transforms/Vectorize/VPlanUtils.h"
+#include "VPlanTestBase.h"
+#include "llvm/ADT/SmallVector.h"
+#include "llvm/IR/Instruction.h"
+#include "llvm/IR/Instructions.h"
+#include "gtest/gtest.h"
+
+namespace llvm {
+
+namespace {
+class VPUncountedExitTest : public VPlanTestBase {};
+
+TEST_F(VPUncountedExitTest, FindUncountedExitRecipes) {
+  // Create CFG skeleton.
+  VPlan &Plan = getPlan();
+  VPBasicBlock *ScalarPH = Plan.getEntry();
+  VPBasicBlock *Entry = Plan.createVPBasicBlock("entry");
+  Plan.setEntry(Entry);
+  VPBasicBlock *VectorPH = Plan.createVPBasicBlock("vector.ph");
+  VPBasicBlock *VecBody = Plan.createVPBasicBlock("vector.body");
+  VPRegionBlock *Region =
+      Plan.createVPRegionBlock(VecBody, VecBody, "vector loop");
+  VPBasicBlock *MiddleBlock = Plan.createVPBasicBlock("middle.block");
+  VPBlockUtils::connectBlocks(Entry, ScalarPH);
+  VPBlockUtils::connectBlocks(Entry, VectorPH);
+  VPBlockUtils::connectBlocks(VectorPH, Region);
+  VPBlockUtils::connectBlocks(Region, MiddleBlock);
+  VPBlockUtils::connectBlocks(MiddleBlock, ScalarPH);
+
+  // Live-Ins
+  IntegerType *I64Ty = IntegerType::get(C, 64);
+  IntegerType *I32Ty = IntegerType::get(C, 32);
+  PointerType *PTy = PointerType::get(C, 0);
+  VPValue *Zero = Plan.getOrAddLiveIn(ConstantInt::get(I64Ty, 0));
+  VPValue *Inc = Plan.getOrAddLiveIn(ConstantInt::get(I64Ty, 1));
+  VPValue *VF = &Plan.getVF();
+  Plan.setTripCount(Plan.getOrAddLiveIn(ConstantInt::get(I64Ty, 64)));
+
+  // Populate vector.body with the recipes for exiting.
+  auto *IV = new VPCanonicalIVPHIRecipe(Zero, {});
+  VecBody->appendRecipe(IV);
+  VPBuilder Builder(VecBody, VecBody->getFirstNonPhi());
+  auto *Steps = Builder.createScalarIVSteps(Instruction::Add, nullptr, IV, Inc,
+                                            VF, DebugLoc());
+
+  // Uncounted Exit; GEP -> Load -> Cmp
+  auto *DummyGEP = GetElementPtrInst::Create(I32Ty, Zero->getUnderlyingValue(),
+                                             {}, Twine("ee.addr"));
+  auto *GEP = new VPReplicateRecipe(DummyGEP, {Zero, Steps}, true, nullptr);
+  Builder.insert(GEP);
+  auto *DummyLoad =
+      new LoadInst(I32Ty, PoisonValue::get(PTy), "ee.load", false, Align(1));
+  VPValue *Load =
+      new VPWidenLoadRecipe(*DummyLoad, GEP, nullptr, true, false, {}, {});
+  Builder.insert(Load->getDefiningRecipe());
+  // Should really splat the zero, but we're not checking types here.
+  VPValue *Cmp = new VPWidenRecipe(Instruction::ICmp, {Load, Zero},
+                                   VPIRFlags(CmpInst::ICMP_EQ), {}, {});
+  Builder.insert(Cmp->getDefiningRecipe());
+  VPValue *AnyOf = Builder.createNaryOp(VPInstruction::AnyOf, Cmp);
+
+  // Counted Exit; Inc IV -> Cmp
+  VPValue *NextIV = Builder.createNaryOp(Instruction::Add, {IV, VF});
+  VPValue *Counted =
+      Builder.createICmp(CmpInst::ICMP_EQ, NextIV, Plan.getTripCount());
+
+  // Combine, and branch.
+  VPValue *Combined = Builder.createNaryOp(Instruction::Or, {AnyOf, Counted});
+  Builder.createNaryOp(VPInstruction::BranchOnCond, {Combined});
+
+  SmallVector<VPRecipeBase *, 8> Recipes;
+  SmallVector<VPReplicateRecipe *, 2> GEPs;
+
+  std::optional<VPValue *> UncountedCondition =
+      vputils::getRecipesForUncountedExit(Plan, Recipes, GEPs);
+  ASSERT_TRUE(UncountedCondition.has_value());
+  ASSERT_EQ(*UncountedCondition, Cmp);
+  ASSERT_EQ(GEPs.size(), 1ull);
+  ASSERT_EQ(GEPs[0], GEP);
+  ASSERT_EQ(Recipes.size(), 3ull);
+
+  delete DummyLoad;
+  delete DummyGEP;
+}
+
+} // namespace
+} // namespace llvm

llvm/lib/Transforms/Vectorize/VPlanUtils.h

llvm/lib/Transforms/Vectorize/VPlanUtils.cpp

david-arm · 2025-08-11T12:22:47Z

llvm/lib/Transforms/Vectorize/VPlanValue.h

The name of the function doesn't match the code, i.e. one use != one user. I think it should either be:

bool hasOneUser() const { return getNumUsers() == 1; }

or

bool hasOneUse() const { return getNumUses() == 1; }

Uses are not directly modeled in VPlan, afaict.

Instead, a User may be recorded multiple times for a given VPValue. See the function directly above this, hasMoreThanOneUniqueUser, which looks through the list of Users seeing if there's one that's different from the first.

Hi @fhahn, I think this is pretty confusing. Can we rename the existing getNumUsers to getNumUses to more closely match the naming conventions used for IR values? If a recipe has duplicate input operands then the number of uses != 1, but the number of users may still be 1. If so, I'd like to put up a patch to tidy this up a little.

david-arm · 2025-08-11T12:24:19Z

llvm/lib/Transforms/Vectorize/VPlanUtils.cpp

Is this function only ever intended to be called before we handle the uncountable exit, i.e. before we've introduced the middle split block? If it's after then the vplan in the comments below probably needs updating to reference the middle.split block.

It might be good to clarify in the comments where you expect this function to be called, as it seems to require the vplan CFG to be in a particular format.

It's intended to be called after the vplan has been created and the CFG simplified so there's only one exit. This is currently after the existing uncounted early exit transformation, but that is changed in the transform PR to not create the split.

We probably want to formalize the strategy as state in the VPlan so we know which parts of the transformations to apply.

david-arm · 2025-08-11T12:32:51Z

llvm/lib/Transforms/Vectorize/VPlanUtils.cpp

Does it matter if this is a loop with an uncountable early exit that doesn't match this pattern? If it's being called as part of VPlanTransforms::handleEarlyExits then it should be fine, but later on I can imagine a VPlanTransform may optimise some of this code. I assume that returning std::nullopt would mean it's game over for vectorisation of a loop with an uncountable early exit and a store?

If we can't match the expected recipes here, then the transform (from #148626) will abandon the vplan and vectorization will not proceed.

It's the reason I can do this as a vplan transform instead of manually planting recipes as part of the initial vplan creation based on what LoopVectorizationLegality finds -- I did it the latter way in 2015 when I originally prototyped early exit autovec.

david-arm · 2025-08-11T12:33:53Z

llvm/lib/Transforms/Vectorize/VPlanUtils.cpp

The IR above suggests we've already called handleUncountableEarlyExit and so this probably should be // Successor(s): middle.split

The transform PR explicitly avoids creating the split, since we won't have finished all iterations before leaving the vector body.

david-arm · 2025-08-11T12:42:13Z

llvm/lib/Transforms/Vectorize/VPlanUtils.cpp

In the general case, LoadFound could be set to true for a vplan where neither icmp input is a load, but you just happen to bump into a load in the loop before the early exit. Are you specifically interested in finding any load in the loop, or finding a specific load, i.e. the load that forms the input to the icmp? If it's the latter I think you need to check that the load forms the input to the icmp before setting the boolean to true.

I realise that some of the legality work you're doing requires something of the form:

%load = load i32, ptr %gep %icmp = icmp i32 %load, 3

but I don't think you should assume that here.

I only consider operands from each recipe; that's what the worklist is for. So I start with the input to AnyOf above, which happens to be an icmp in the loop I'm using for the prototype, confirm that it's valid then add the two operands to the worklist.

In the case of the test, one of those operands is a live-in constant, so is accepted immediately. The other is the load, which is checked and the address recipe is added to the worklist.

I am moving the load checking to be more strict for now, as discussed with Sander above.

Well, I was worried about perfectly valid recipes like this that you might encounter:

%icmp1 = icmp %load1, %load2 %icmp2 = icmp %load3, %load4 %icmp3 = icmp %icmp1, %icmp2 %any_of = any_of %icmp3

Yeah, that should be fine. As long as all the recipes contributing to the exit condition can be found and tracked back to the canonical IV or a live-in I don't see a problem with us matching more recipes.

If you want me to restrict it to a single comparison right now I can do so, but I wanted to show the basis of the transform approach -- using a worklist to handle vplan recipes instead of using IR directly during initial plan construction.

sdesmalen-arm · 2025-08-26T08:45:14Z

llvm/lib/Transforms/Vectorize/VPlanUtils.cpp

nit: Is there a reason this check is done after the above loop using a Loads array, rather than checking it right where it encounters the VPWidenLoadRecipe above?

fhahn · 2025-08-26T09:03:07Z

llvm/lib/Transforms/Vectorize/VPlanUtils.cpp

I think you can use the new m_ICmp matchers here

fhahn · 2025-08-26T09:04:12Z

llvm/lib/Transforms/Vectorize/VPlanUtils.cpp

Suggested change

// Given a vplan like the following (just including the recipes contributing

// Given a VPlan like the following (just including the recipes contributing

fhahn · 2025-08-26T09:08:13Z

llvm/lib/Transforms/Vectorize/VPlanUtils.cpp

Do we need to check for the restriction here? Would it be better to check them in the caller? If not, it would be good to document the restrictions in the doc-comment

fhahn · 2025-08-26T09:09:18Z

llvm/lib/Transforms/Vectorize/VPlanUtils.cpp

Suggested change

vputils::getRecipesForUncountedExit(VPlan &Plan,

vputils::getRecipesForUncountableExit(VPlan &Plan,

Uncounted -> Uncountable throughout to keep consistent with the existing terminology

fhahn · 2025-08-26T09:11:20Z

llvm/unittests/Transforms/Vectorize/VPlanUncountedExitTest.cpp

Can we use VPTestBase::buildVPlan to construct the initial VPlan from a simple CFG loop and then just create convert the Load VPInstructions to VPWidenLoadRecipes? That would ensure we keep things in-sync if the constructed VPlans change.

huntergr-arm · 2025-09-11T15:48:57Z

Rebased, will commit next week if there's no further comments.

fhahn · 2025-09-15T07:11:44Z

llvm/lib/Transforms/Vectorize/VPlanUtils.h

Suggested change

/// the canonical IV and it is deemed safe to copy those recipes into the

/// vector preheader. The recipes are stored in \p Recipes, and recipes

/// the canonical IV. The recipes are stored in \p Recipes, and recipes

I think the latest version doesn't check this?

fhahn · 2025-09-15T07:13:59Z

llvm/lib/Transforms/Vectorize/VPlanUtils.h

Should this mention loads as well? Looks like we stop also stop at them

Should probably also mention the special treatment of masked loads (or remove it)

I've changed it to note that it stops at the addresses of non-masked loads.

fhahn · 2025-09-15T07:16:47Z

llvm/lib/Transforms/Vectorize/VPlanPatternMatch.h

Do we hit pointer bases with recipes that are moved out of the vector loop in practice or would m_LiveIn suffice?

Changed to m_LiveIn, seems to work fine.

fhahn · 2025-09-15T07:17:11Z

llvm/lib/Transforms/Vectorize/VPlanPatternMatch.h

can you move this to the other VPInstruction matchers for consitency?

fhahn · 2025-09-17T08:28:09Z

llvm/lib/Transforms/Vectorize/VPlanUtils.cpp

+  // we can copy them to a preheader and rotate the address in the loop to the
+  // next vector iteration.
+  //
+  // Currently, the address of the load is restricted to a GEP with 2 terms and


Suggested change

// Currently, the address of the load is restricted to a GEP with 2 terms and

// Currently, the address of the load is restricted to a GEP with 2 operands and

fhahn · 2025-09-17T08:29:29Z

llvm/lib/Transforms/Vectorize/VPlanUtils.cpp

+  // Given a VPlan like the following (just including the recipes contributing
+  // to loop control exiting here, not the actual work), we're looking to match
+  // the recipes contributing to the uncountable exit condition comparison
+  // (here, vp<%4>) back to the canonical induction for the vector body so that


It looks this may be out-of-sync with the implementation, it looks like we don't check for a canonical induction, just for loads & live-ins as in the header comment?

fhahn · 2025-09-17T08:31:04Z

llvm/unittests/Transforms/Vectorize/VPlanUncountableExitTest.cpp

+  SmallVector<VPRecipeBase *, 8> Recipes;
+  SmallVector<VPRecipeBase *, 2> GEPs;
+
+  std::optional<VPValue *> UncountableCondition =


it would also be good to add a test without an early exit, to make sure that code path is also covered by the test

fhahn

LGTM, thanks! A few small suggestions left inline

llvm/lib/Transforms/Vectorize/VPlanUtils.cpp

llvm/unittests/Transforms/Vectorize/VPlanUncountableExitTest.cpp

Co-authored-by: Florian Hahn <[email protected]>

huntergr-arm · 2025-09-18T15:19:46Z

Thanks for the review!

llvm-ci · 2025-09-18T15:57:26Z

LLVM Buildbot has detected a new failure on builder openmp-s390x-linux running on systemz-1 while building llvm at step 6 "test-openmp".

Full details are available at: https://lab.llvm.org/buildbot/#/builders/88/builds/16223

Here is the relevant piece of the build log for the reference

Step 6 (test-openmp) failure: test (failure)
******************** TEST 'libomp :: tasking/issue-94260-2.c' FAILED ********************
Exit Code: -11

Command Output (stdout):
--
# RUN: at line 1
/home/uweigand/sandbox/buildbot/openmp-s390x-linux/llvm.build/./bin/clang -fopenmp   -I /home/uweigand/sandbox/buildbot/openmp-s390x-linux/llvm.build/runtimes/runtimes-bins/openmp/runtime/src -I /home/uweigand/sandbox/buildbot/openmp-s390x-linux/llvm.src/openmp/runtime/test -L /home/uweigand/sandbox/buildbot/openmp-s390x-linux/llvm.build/runtimes/runtimes-bins/openmp/runtime/src  -fno-omit-frame-pointer -mbackchain -I /home/uweigand/sandbox/buildbot/openmp-s390x-linux/llvm.src/openmp/runtime/test/ompt /home/uweigand/sandbox/buildbot/openmp-s390x-linux/llvm.src/openmp/runtime/test/tasking/issue-94260-2.c -o /home/uweigand/sandbox/buildbot/openmp-s390x-linux/llvm.build/runtimes/runtimes-bins/openmp/runtime/test/tasking/Output/issue-94260-2.c.tmp -lm -latomic && /home/uweigand/sandbox/buildbot/openmp-s390x-linux/llvm.build/runtimes/runtimes-bins/openmp/runtime/test/tasking/Output/issue-94260-2.c.tmp
# executed command: /home/uweigand/sandbox/buildbot/openmp-s390x-linux/llvm.build/./bin/clang -fopenmp -I /home/uweigand/sandbox/buildbot/openmp-s390x-linux/llvm.build/runtimes/runtimes-bins/openmp/runtime/src -I /home/uweigand/sandbox/buildbot/openmp-s390x-linux/llvm.src/openmp/runtime/test -L /home/uweigand/sandbox/buildbot/openmp-s390x-linux/llvm.build/runtimes/runtimes-bins/openmp/runtime/src -fno-omit-frame-pointer -mbackchain -I /home/uweigand/sandbox/buildbot/openmp-s390x-linux/llvm.src/openmp/runtime/test/ompt /home/uweigand/sandbox/buildbot/openmp-s390x-linux/llvm.src/openmp/runtime/test/tasking/issue-94260-2.c -o /home/uweigand/sandbox/buildbot/openmp-s390x-linux/llvm.build/runtimes/runtimes-bins/openmp/runtime/test/tasking/Output/issue-94260-2.c.tmp -lm -latomic
# executed command: /home/uweigand/sandbox/buildbot/openmp-s390x-linux/llvm.build/runtimes/runtimes-bins/openmp/runtime/test/tasking/Output/issue-94260-2.c.tmp
# note: command had no output on stdout or stderr
# error: command failed with exit status: -11

--

********************

llvm-ci · 2025-09-18T16:04:33Z

LLVM Buildbot has detected a new failure on builder clang-aarch64-quick running on linaro-clang-aarch64-quick while building llvm at step 5 "ninja check 1".

Full details are available at: https://lab.llvm.org/buildbot/#/builders/65/builds/22816

Here is the relevant piece of the build log for the reference

Step 5 (ninja check 1) failure: stage 1 checked (failure)
******************** TEST 'Clangd Unit Tests :: ./ClangdTests/163/332' FAILED ********************
Script(shard):
--
GTEST_OUTPUT=json:/home/tcwg-buildbot/worker/clang-aarch64-quick/stage1/tools/clang/tools/extra/clangd/unittests/./ClangdTests-Clangd Unit Tests-1100936-163-332.json GTEST_SHUFFLE=0 GTEST_TOTAL_SHARDS=332 GTEST_SHARD_INDEX=163 /home/tcwg-buildbot/worker/clang-aarch64-quick/stage1/tools/clang/tools/extra/clangd/unittests/./ClangdTests
--

Note: This is test shard 164 of 332.
[==========] Running 4 tests from 4 test suites.
[----------] Global test environment set-up.
[----------] 1 test from CompletionTest
[ RUN      ] CompletionTest.DeprecatedResults
Built preamble of size 707604 for file /clangd-test/foo.cpp version null in 0.12 seconds
Code complete: sema context Statement, query scopes [] (AnyScope=false), expected type <none>
Code complete: 2 results from Sema, 0 from Index, 0 matched, 0 from identifiers, 2 returned.
[       OK ] CompletionTest.DeprecatedResults (134 ms)
[----------] 1 test from CompletionTest (134 ms total)

[----------] 1 test from FileIndexTest
[ RUN      ] FileIndexTest.ReferencesInMainFileWithPreamble
Built preamble of size 710960 for file /clangd-test/TestTU.cpp version null in 0.09 seconds
indexed file AST for /clangd-test/TestTU.cpp version null:
  symbol slab: 1 symbols, 4448 bytes
  ref slab: 2 symbols, 2 refs, 4272 bytes
  relations slab: 0 relations, 24 bytes
Build dynamic index for main-file symbols with estimated memory usage of 11576 bytes
Built preamble of size 710960 for file /clangd-test/TestTU.cpp version null in 0.10 seconds
indexed preamble AST for /clangd-test/TestTU.cpp version null:
  symbol slab: 2 symbols, 4680 bytes
  ref slab: 0 symbols, 0 refs, 128 bytes
  relations slab: 0 relations, 24 bytes
[       OK ] FileIndexTest.ReferencesInMainFileWithPreamble (260 ms)
[----------] 1 test from FileIndexTest (260 ms total)

[----------] 1 test from JSONTransportTest
[ RUN      ] JSONTransportTest.EndOfFile
<<< {"jsonrpc":"2.0","method":"call","params":1234}

>>> {"id":42,"jsonrpc":"2.0","method":"echo call","params":1234}

[       OK ] JSONTransportTest.EndOfFile (3 ms)
[----------] 1 test from JSONTransportTest (5 ms total)

[----------] 1 test from GoToInclude
[ RUN      ] GoToInclude.All
ASTWorker building file /clangd-test/foo.h version null with command 
[/clangd-test]
clang -ffreestanding /clangd-test/foo.h
Driver produced command: cc1 -cc1 -triple aarch64-unknown-linux-gnu -fsyntax-only -disable-free -clear-ast-before-backend -main-file-name foo.h -mrelocation-model pic -pic-level 2 -pic-is-pie -mframe-pointer=non-leaf -fmath-errno -ffp-contract=on -fno-rounding-math -mconstructor-aliases -ffreestanding -enable-tlsdesc -target-cpu generic -target-feature +v8a -target-feature +fp-armv8 -target-feature +neon -target-abi aapcs -debugger-tuning=gdb -fdebug-compilation-dir=/clangd-test -fcoverage-compilation-dir=/clangd-test -resource-dir lib/clang/22 -internal-isystem lib/clang/22/include -internal-isystem /usr/local/include -internal-externc-isystem /include -internal-externc-isystem /usr/include -ferror-limit 19 -fno-signed-char -fgnuc-version=4.2.1 -fskip-odr-check-in-gmf -no-round-trip-args -target-feature -fmv -faddrsig -x c-header /clangd-test/foo.h
Building first preamble for /clangd-test/foo.h version null
Built preamble of size 730288 for file /clangd-test/foo.h version null in 0.11 seconds
...

huntergr-arm requested review from david-arm, fhahn and sdesmalen-arm August 7, 2025 15:20

llvmbot added vectorizers llvm:transforms labels Aug 7, 2025

sdesmalen-arm reviewed Aug 11, 2025

View reviewed changes

david-arm reviewed Aug 11, 2025

View reviewed changes

sdesmalen-arm approved these changes Aug 26, 2025

View reviewed changes

fhahn reviewed Aug 26, 2025

View reviewed changes

huntergr-arm force-pushed the identify-uncounted-exit-condition-recipes branch from 2debe28 to ebdb2b6 Compare September 3, 2025 14:32

huntergr-arm force-pushed the identify-uncounted-exit-condition-recipes branch from ebdb2b6 to 6f7ca85 Compare September 11, 2025 15:46

fhahn reviewed Sep 15, 2025

View reviewed changes

huntergr-arm added 4 commits September 16, 2025 13:27

WIP

7d75529

Improve comments, be stricter about matching inputs to loads

688eadb

Create test vplan from IR; minor cleanups

3ad198d

Switch to m_LiveIn, update comment

2f81520

huntergr-arm force-pushed the identify-uncounted-exit-condition-recipes branch from 6f7ca85 to 2f81520 Compare September 16, 2025 14:16

fhahn reviewed Sep 17, 2025

View reviewed changes

Add negative test, fix comment

2fd4504

fhahn approved these changes Sep 18, 2025

View reviewed changes

llvm/lib/Transforms/Vectorize/VPlanUtils.cpp Outdated Show resolved Hide resolved

llvm/unittests/Transforms/Vectorize/VPlanUncountableExitTest.cpp Outdated Show resolved Hide resolved

llvm/unittests/Transforms/Vectorize/VPlanUncountableExitTest.cpp Outdated Show resolved Hide resolved

huntergr-arm and others added 3 commits September 18, 2025 16:09

Apply suggestion from @fhahn

febf5ab

Co-authored-by: Florian Hahn <[email protected]>

Apply suggestion from @fhahn

eb82e1b

Co-authored-by: Florian Hahn <[email protected]>

Apply suggestion from @fhahn

8507a8d

Co-authored-by: Florian Hahn <[email protected]>

huntergr-arm enabled auto-merge (squash) September 18, 2025 15:12

huntergr-arm merged commit 6b99a7b into llvm:main Sep 18, 2025
9 checks passed

huntergr-arm deleted the identify-uncounted-exit-condition-recipes branch September 18, 2025 16:06

huntergr-arm mentioned this pull request Oct 29, 2025

[LV] Transform to handle exits in the scalar loop #148626

Open

huntergr-arm mentioned this pull request Nov 6, 2025

[LV] Initial support for stores in early exit loops #137774

Draft

	// Given a vplan like the following (just including the recipes contributing
	// Given a VPlan like the following (just including the recipes contributing

	vputils::getRecipesForUncountedExit(VPlan &Plan,
	vputils::getRecipesForUncountableExit(VPlan &Plan,

	/// the canonical IV and it is deemed safe to copy those recipes into the
	/// vector preheader. The recipes are stored in \p Recipes, and recipes
	/// the canonical IV. The recipes are stored in \p Recipes, and recipes

	// Currently, the address of the load is restricted to a GEP with 2 terms and
	// Currently, the address of the load is restricted to a GEP with 2 operands and

[LV] Provide utility routine to find uncounted exit recipes #152530

[LV] Provide utility routine to find uncounted exit recipes #152530

Uh oh!

Conversation

huntergr-arm commented Aug 7, 2025

Uh oh!

llvmbot commented Aug 7, 2025 • edited Loading Uh oh! There was an error while loading. Please reload this page.

Uh oh!

Uh oh!

Uh oh!

Uh oh!

Uh oh!

Uh oh!

Choose a reason for hiding this comment

Uh oh!

Choose a reason for hiding this comment

Uh oh!

david-arm Aug 11, 2025 • edited Loading Uh oh! There was an error while loading. Please reload this page.

Uh oh!

Choose a reason for hiding this comment

Uh oh!

Choose a reason for hiding this comment

Uh oh!

Choose a reason for hiding this comment

Uh oh!

Choose a reason for hiding this comment

Uh oh!

Choose a reason for hiding this comment

Uh oh!

Choose a reason for hiding this comment

Uh oh!

Choose a reason for hiding this comment

Uh oh!

Choose a reason for hiding this comment

Uh oh!

Choose a reason for hiding this comment

Uh oh!

Choose a reason for hiding this comment

Uh oh!

Choose a reason for hiding this comment

Uh oh!

Choose a reason for hiding this comment

Uh oh!

Choose a reason for hiding this comment

Uh oh!

Choose a reason for hiding this comment

Uh oh!

Choose a reason for hiding this comment

Uh oh!

Choose a reason for hiding this comment

Uh oh!

Choose a reason for hiding this comment

Uh oh!

huntergr-arm commented Sep 11, 2025

Uh oh!

Choose a reason for hiding this comment

Uh oh!

Choose a reason for hiding this comment

Uh oh!

Choose a reason for hiding this comment

Uh oh!

Choose a reason for hiding this comment

Uh oh!

Choose a reason for hiding this comment

Uh oh!

Choose a reason for hiding this comment

Uh oh!

Choose a reason for hiding this comment

Uh oh!

Choose a reason for hiding this comment

Uh oh!

Choose a reason for hiding this comment

Uh oh!

Choose a reason for hiding this comment

Uh oh!

Choose a reason for hiding this comment

Uh oh!

Choose a reason for hiding this comment

Uh oh!

Choose a reason for hiding this comment

llvmbot commented Aug 7, 2025 •

edited

Loading

david-arm Aug 11, 2025 •

edited

Loading