-
Notifications
You must be signed in to change notification settings - Fork 15.2k
[VPlan] Simplify branch on False in VPlan transform (NFC). #140409
New issue
Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.
By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.
Already on GitHub? Sign in to your account
Changes from 13 commits
063d70f
f5ee27b
74eddb5
61779cf
801b98d
069767b
d3df2c3
3f3f002
69ad1de
9233672
6ced27d
2b76566
5797781
761d4ca
ff89acf
fa0eab1
57652c7
File filter
Filter by extension
Conversations
Jump to
Diff view
Diff view
There are no files selected for viewing
| Original file line number | Diff line number | Diff line change | ||
|---|---|---|---|---|
|
|
@@ -2380,10 +2380,13 @@ void InnerLoopVectorizer::introduceCheckBlockInVPlan(BasicBlock *CheckIRBB) { | |||
|
|
||||
| // We just connected a new block to the scalar preheader. Update all | ||||
| // VPPhis by adding an incoming value for it, replicating the last value. | ||||
| unsigned NumPredecessors = ScalarPH->getNumPredecessors(); | ||||
| (void)NumPredecessors; | ||||
|
||||
| (void)NumPredecessors; |
There was a problem hiding this comment.
Choose a reason for hiding this comment
The reason will be displayed to describe this comment to others. Learn more.
Removed, thanks
| Original file line number | Diff line number | Diff line change | ||||
|---|---|---|---|---|---|---|
|
|
@@ -501,8 +501,10 @@ void VPlanTransforms::prepareForVectorization( | |||||
| cast<VPBasicBlock>(HeaderVPB), | ||||||
| cast<VPBasicBlock>(LatchVPB), Range); | ||||||
| HandledUncountableEarlyExit = true; | ||||||
| } else { | ||||||
| for (VPRecipeBase &R : EB->phis()) | ||||||
| cast<VPIRPhi>(&R)->removeIncomingValueFor(Pred); | ||||||
| } | ||||||
|
|
||||||
| cast<VPBasicBlock>(Pred)->getTerminator()->eraseFromParent(); | ||||||
| VPBlockUtils::disconnectBlocks(Pred, EB); | ||||||
| } | ||||||
|
|
@@ -526,32 +528,6 @@ void VPlanTransforms::prepareForVectorization( | |||||
| VPBasicBlock *ScalarPH = Plan.createVPBasicBlock("scalar.ph"); | ||||||
| VPBlockUtils::connectBlocks(ScalarPH, Plan.getScalarHeader()); | ||||||
|
|
||||||
| // If needed, add a check in the middle block to see if we have completed | ||||||
| // all of the iterations in the first vector loop. Three cases: | ||||||
| // 1) If we require a scalar epilogue, there is no conditional branch as | ||||||
| // we unconditionally branch to the scalar preheader. Remove the recipes | ||||||
| // from the exit blocks. | ||||||
| // 2) If (N - N%VF) == N, then we *don't* need to run the remainder. | ||||||
| // Thus if tail is to be folded, we know we don't need to run the | ||||||
| // remainder and we can set the condition to true. | ||||||
| // 3) Otherwise, construct a runtime check. | ||||||
|
|
||||||
| if (!RequiresScalarEpilogueCheck) { | ||||||
| if (auto *LatchExitVPB = MiddleVPBB->getSingleSuccessor()) | ||||||
| VPBlockUtils::disconnectBlocks(MiddleVPBB, LatchExitVPB); | ||||||
| VPBlockUtils::connectBlocks(MiddleVPBB, ScalarPH); | ||||||
| VPBlockUtils::connectBlocks(Plan.getEntry(), ScalarPH); | ||||||
| Plan.getEntry()->swapSuccessors(); | ||||||
|
|
||||||
| // The exit blocks are unreachable, remove their recipes to make sure no | ||||||
| // users remain that may pessimize transforms. | ||||||
| for (auto *EB : Plan.getExitBlocks()) { | ||||||
| for (VPRecipeBase &R : make_early_inc_range(*EB)) | ||||||
| R.eraseFromParent(); | ||||||
| } | ||||||
| return; | ||||||
| } | ||||||
|
|
||||||
| // The connection order corresponds to the operands of the conditional branch, | ||||||
| // with the middle block already connected to the exit block. | ||||||
| VPBlockUtils::connectBlocks(MiddleVPBB, ScalarPH); | ||||||
|
|
@@ -561,21 +537,45 @@ void VPlanTransforms::prepareForVectorization( | |||||
| VPBlockUtils::connectBlocks(Plan.getEntry(), ScalarPH); | ||||||
| Plan.getEntry()->swapSuccessors(); | ||||||
|
|
||||||
| auto *ScalarLatchTerm = TheLoop->getLoopLatch()->getTerminator(); | ||||||
| // Here we use the same DebugLoc as the scalar loop latch terminator instead | ||||||
| // of the corresponding compare because they may have ended up with | ||||||
| // different line numbers and we want to avoid awkward line stepping while | ||||||
| // debugging. Eg. if the compare has got a line number inside the loop. | ||||||
| // If MiddleVPBB has a single successor then the original loop does not exit | ||||||
| // via the latch and the single successor must be the scalar preheader. | ||||||
| // There's no need to add a runtime check to MiddleVPBB. | ||||||
| if (MiddleVPBB->getNumSuccessors() == 1) { | ||||||
| assert(MiddleVPBB->getSingleSuccessor() == ScalarPH && | ||||||
| "must have ScalarPH as single successor"); | ||||||
| return; | ||||||
| } | ||||||
|
|
||||||
| assert(MiddleVPBB->getNumSuccessors() == 2 && "must have 2 successors"); | ||||||
|
|
||||||
| // Add a check in the middle block to see if we have completed$ all of the | ||||||
|
||||||
| // Add a check in the middle block to see if we have completed$ all of the | |
| // Add a check in the middle block to see if we have completed all of the |
There was a problem hiding this comment.
Choose a reason for hiding this comment
The reason will be displayed to describe this comment to others. Learn more.
Removed, thanks!
| Original file line number | Diff line number | Diff line change |
|---|---|---|
|
|
@@ -1185,6 +1185,16 @@ void VPIRPhi::execute(VPTransformState &State) { | |
| State.Builder.SetInsertPoint(Phi->getParent(), std::next(Phi->getIterator())); | ||
| } | ||
|
|
||
| void VPPhiAccessors::removeIncomingValueFor(VPBlockBase *IncomingBlock) const { | ||
| VPRecipeBase *R = const_cast<VPRecipeBase *>(getAsRecipe()); | ||
| auto &Preds = R->getParent()->getPredecessors(); | ||
| assert(R->getNumOperands() == Preds.size() && | ||
| "Number of phi operands must match number of predecessors"); | ||
| unsigned Position = std::distance(Preds.begin(), find(Preds, IncomingBlock)); | ||
|
||
| R->getOperand(Position)->removeUser(*R); | ||
| R->removeOperand(Position); | ||
|
||
| } | ||
|
|
||
| #if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP) | ||
| void VPPhiAccessors::printPhiOperands(raw_ostream &O, | ||
| VPSlotTracker &SlotTracker) const { | ||
|
|
||
| Original file line number | Diff line number | Diff line change |
|---|---|---|
|
|
@@ -1841,43 +1841,39 @@ void VPlanTransforms::truncateToMinimalBitwidths( | |
| } | ||
| } | ||
|
|
||
| /// Remove BranchOnCond recipes with true conditions together with removing | ||
| /// dead edges to their successors. | ||
| static void removeBranchOnCondTrue(VPlan &Plan) { | ||
| /// Remove BranchOnCond recipes with true or false conditions together with | ||
| /// removing dead edges to their successors. | ||
| static void removeBranchOnConst(VPlan &Plan) { | ||
| using namespace llvm::VPlanPatternMatch; | ||
|
Collaborator
There was a problem hiding this comment. Choose a reason for hiding this comment. The reason will be displayed to describe this comment to others. Learn more. Name of
Contributor
Author
There was a problem hiding this comment. Choose a reason for hiding this comment. The reason will be displayed to describe this comment to others. Learn more. updated, thanks |
||
| for (VPBasicBlock *VPBB : VPBlockUtils::blocksOnly<VPBasicBlock>( | ||
| vp_depth_first_shallow(Plan.getEntry()))) { | ||
| VPValue *Cond; | ||
| if (VPBB->getNumSuccessors() != 2 || VPBB == Plan.getEntry() || | ||
|
Collaborator
There was a problem hiding this comment. Choose a reason for hiding this comment. The reason will be displayed to describe this comment to others. Learn more. Independent: why is the entry block excluded?
Contributor
Author
There was a problem hiding this comment. Choose a reason for hiding this comment. The reason will be displayed to describe this comment to others. Learn more. Entry has 2 successors without a branch recipe. This will be fixed by introducing a branch recipe, possibly on an opaque condition, when connecting entry to vector.ph/scalar.ph.
Collaborator
There was a problem hiding this comment. Choose a reason for hiding this comment. The reason will be displayed to describe this comment to others. Learn more. Ah, right, perhaps worth a clarifying TODO. |
||
| !match(&VPBB->back(), m_BranchOnCond(m_True()))) | ||
| !match(&VPBB->back(), m_BranchOnCond(m_VPValue(Cond)))) | ||
| continue; | ||
|
|
||
| VPBasicBlock *RemovedSucc = cast<VPBasicBlock>(VPBB->getSuccessors()[1]); | ||
| unsigned RemovedIdx; | ||
| if (match(Cond, m_True())) | ||
| RemovedIdx = 1; | ||
| else if (match(Cond, m_False())) | ||
| RemovedIdx = 0; | ||
| else | ||
| continue; | ||
|
|
||
| VPBasicBlock *RemovedSucc = | ||
| cast<VPBasicBlock>(VPBB->getSuccessors()[RemovedIdx]); | ||
| const auto &Preds = RemovedSucc->getPredecessors(); | ||
| assert(count(Preds, VPBB) == 1 && | ||
| "There must be a single edge between VPBB and its successor"); | ||
| unsigned DeadIdx = std::distance(Preds.begin(), find(Preds, VPBB)); | ||
|
|
||
| // Values coming from VPBB into ResumePhi recipes of RemoveSucc are removed | ||
| // from these recipes. | ||
| // Values coming from VPBB into phi recipes of RemovedSucc are removed from | ||
| // these recipes. | ||
| for (VPRecipeBase &R : make_early_inc_range(*RemovedSucc)) { | ||
|
||
| assert((!isa<VPIRInstruction>(&R) || | ||
| !isa<PHINode>(cast<VPIRInstruction>(&R)->getInstruction())) && | ||
| !isa<VPHeaderPHIRecipe>(&R) && | ||
| "Cannot update VPIRInstructions wrapping phis or header phis yet"); | ||
| auto *VPI = dyn_cast<VPPhi>(&R); | ||
| if (!VPI) | ||
| auto *Phi = dyn_cast<VPPhiAccessors>(&R); | ||
| if (!Phi) | ||
| break; | ||
|
||
| VPBuilder B(VPI); | ||
| SmallVector<VPValue *> NewOperands; | ||
| // Create new operand list, with the dead incoming value filtered out. | ||
| for (const auto &[Idx, Op] : enumerate(VPI->operands())) { | ||
| if (Idx == DeadIdx) | ||
| continue; | ||
| NewOperands.push_back(Op); | ||
| } | ||
| VPI->replaceAllUsesWith( | ||
| B.createScalarPhi(NewOperands, VPI->getDebugLoc(), VPI->getName())); | ||
| VPI->eraseFromParent(); | ||
| assert((!isa<VPIRPhi>(&R) || RemovedSucc->getNumPredecessors() == 1) && | ||
| "VPIRPhis must have a single predecessor"); | ||
| Phi->removeIncomingValueFor(VPBB); | ||
| } | ||
| // Disconnect blocks and remove the terminator. RemovedSucc will be deleted | ||
| // automatically on VPlan destruction if it becomes unreachable. | ||
|
|
@@ -1897,7 +1893,7 @@ void VPlanTransforms::optimize(VPlan &Plan) { | |
| runPass(legalizeAndOptimizeInductions, Plan); | ||
| runPass(removeRedundantExpandSCEVRecipes, Plan); | ||
| runPass(simplifyRecipes, Plan, *Plan.getCanonicalIV()->getScalarType()); | ||
| runPass(removeBranchOnCondTrue, Plan); | ||
| runPass(removeBranchOnConst, Plan); | ||
| runPass(removeDeadRecipes, Plan); | ||
|
|
||
| runPass(createAndOptimizeReplicateRegions, Plan); | ||
|
|
||
| Original file line number | Diff line number | Diff line change |
|---|---|---|
|
|
@@ -38,6 +38,7 @@ class VPSlotTracker; | |
| class VPUser; | ||
| class VPRecipeBase; | ||
| class VPInterleaveRecipe; | ||
| class VPPhiAccessors; | ||
|
|
||
| // This is the base class of the VPlan Def/Use graph, used for modeling the data | ||
| // flow into, within and out of the VPlan. VPValues can stand for live-ins | ||
|
|
@@ -199,8 +200,13 @@ raw_ostream &operator<<(raw_ostream &OS, const VPRecipeBase &R); | |
| /// This class augments VPValue with operands which provide the inverse def-use | ||
| /// edges from VPValue's users to their defs. | ||
| class VPUser { | ||
| /// Grant access to removeOperand for VPPhiAccessors, the only supported user. | ||
| friend class VPPhiAccessors; | ||
|
||
|
|
||
| SmallVector<VPValue *, 2> Operands; | ||
|
|
||
| void removeOperand(unsigned Idx) { Operands.erase(Operands.begin() + Idx); } | ||
|
|
||
| protected: | ||
| #if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP) | ||
| /// Print the operands to \p O. | ||
|
|
||
There was a problem hiding this comment.
Choose a reason for hiding this comment
The reason will be displayed to describe this comment to others. Learn more.
nit: take the number of ScalarPH predecessors once, here, reuse it repeatedly inside the loop, asserting it is one more than the number of ResumePhi's operands.
There was a problem hiding this comment.
Choose a reason for hiding this comment
The reason will be displayed to describe this comment to others. Learn more.
Updated, thanks