36#define DEBUG_TYPE "loop-simplifycfg"
42 "Number of terminators folded to unconditional branches");
44 "Number of loop blocks deleted");
46 "Number of loop exiting edges deleted");
54 if (BI->isUnconditional())
56 if (BI->getSuccessor(0) == BI->getSuccessor(1))
57 return BI->getSuccessor(0);
61 return Cond->isZero() ? BI->getSuccessor(1) : BI->getSuccessor(0);
68 for (
auto Case :
SI->cases())
69 if (Case.getCaseValue() == CI)
70 return Case.getCaseSuccessor();
71 return SI->getDefaultDest();
79 Loop *LastLoop =
nullptr) {
81 "First loop is supposed to be inside of last loop!");
83 for (
Loop *Current = FirstLoop; Current != LastLoop;
85 Current->removeBlockFromLoop(BB);
92 Loop *Innermost =
nullptr;
95 while (BBL && !BBL->
contains(L.getHeader()))
110class ConstantTerminatorFoldingImpl {
116 MemorySSAUpdater *MSSAU;
122 bool HasIrreducibleCFG =
false;
131 bool DeleteCurrentLoop =
false;
133 bool HasIndirectEntry =
false;
137 SmallPtrSet<BasicBlock *, 8> LiveLoopBlocks;
140 SmallVector<BasicBlock *, 8> DeadLoopBlocks;
143 SmallPtrSet<BasicBlock *, 8> LiveExitBlocks;
146 SmallVector<BasicBlock *, 8> DeadExitBlocks;
148 SmallPtrSet<BasicBlock *, 8> BlocksInLoopAfterFolding;
152 SmallVector<BasicBlock *, 8> FoldCandidates;
155 dbgs() <<
"Constant terminator folding for loop " << L <<
"\n";
156 dbgs() <<
"After terminator constant-folding, the loop will";
157 if (!DeleteCurrentLoop)
159 dbgs() <<
" be destroyed\n";
160 auto PrintOutVector = [&](
const char *Message,
161 const SmallVectorImpl<BasicBlock *> &S) {
162 dbgs() << Message <<
"\n";
163 for (
const BasicBlock *BB : S)
164 dbgs() <<
"\t" << BB->getName() <<
"\n";
166 auto PrintOutSet = [&](
const char *Message,
167 const SmallPtrSetImpl<BasicBlock *> &S) {
168 dbgs() << Message <<
"\n";
169 for (
const BasicBlock *BB : S)
170 dbgs() <<
"\t" << BB->getName() <<
"\n";
172 PrintOutVector(
"Blocks in which we can constant-fold terminator:",
174 PrintOutSet(
"Live blocks from the original loop:", LiveLoopBlocks);
175 PrintOutVector(
"Dead blocks from the original loop:", DeadLoopBlocks);
176 PrintOutSet(
"Live exit blocks:", LiveExitBlocks);
177 PrintOutVector(
"Dead exit blocks:", DeadExitBlocks);
178 if (!DeleteCurrentLoop)
179 PrintOutSet(
"The following blocks will still be part of the loop:",
180 BlocksInLoopAfterFolding);
184 bool hasIrreducibleCFG(LoopBlocksDFS &DFS) {
185 assert(DFS.isComplete() &&
"DFS is expected to be finished");
187 DenseMap<const BasicBlock *, unsigned> RPO;
188 unsigned Current = 0;
189 for (
auto I = DFS.beginRPO(),
E = DFS.endRPO();
I !=
E; ++
I)
192 for (
auto I = DFS.beginRPO(),
E = DFS.endRPO();
I !=
E; ++
I) {
195 if (L.contains(Succ) && !LI.isLoopHeader(Succ) && RPO[BB] > RPO[Succ])
208 assert(DFS.isComplete() &&
"DFS is expected to be finished");
217 if (hasIrreducibleCFG(DFS)) {
218 HasIrreducibleCFG =
true;
225 if (!L.getLoopPreheader()) {
227 [&](BasicBlock *Pred) {
228 return isa<IndirectBrInst>(Pred->getTerminator());
230 "Loop should have preheader if it is not entered indirectly");
231 HasIndirectEntry =
true;
236 LiveLoopBlocks.insert(L.getHeader());
237 for (
auto I = DFS.beginRPO(),
E = DFS.endRPO();
I !=
E; ++
I) {
241 if (!LiveLoopBlocks.count(BB)) {
242 DeadLoopBlocks.push_back(BB);
252 bool TakeFoldCandidate = TheOnlySucc && LI.getLoopFor(BB) == &L;
253 if (TakeFoldCandidate)
254 FoldCandidates.push_back(BB);
258 if (!TakeFoldCandidate || TheOnlySucc == Succ) {
259 if (L.contains(Succ))
260 LiveLoopBlocks.insert(Succ);
262 LiveExitBlocks.insert(Succ);
268 assert(L.getNumBlocks() == LiveLoopBlocks.size() + DeadLoopBlocks.size() &&
269 "Malformed block sets?");
274 SmallVector<BasicBlock *, 8> ExitBlocks;
275 L.getExitBlocks(ExitBlocks);
276 SmallPtrSet<BasicBlock *, 8> UniqueDeadExits;
277 for (
auto *ExitBlock : ExitBlocks)
278 if (!LiveExitBlocks.count(ExitBlock) &&
279 UniqueDeadExits.
insert(ExitBlock).second &&
281 [
this](BasicBlock *Pred) {
return L.contains(Pred); }))
282 DeadExitBlocks.push_back(ExitBlock);
287 if (!LiveLoopBlocks.count(From))
290 return !TheOnlySucc || TheOnlySucc == To || LI.getLoopFor(From) != &L;
294 DeleteCurrentLoop = !IsEdgeLive(L.getLoopLatch(), L.getHeader());
298 if (DeleteCurrentLoop)
303 BlocksInLoopAfterFolding.insert(L.getLoopLatch());
310 return BlocksInLoopAfterFolding.count(Succ) && IsEdgeLive(BB, Succ);
313 for (
auto I = DFS.beginPostorder(),
E = DFS.endPostorder();
I !=
E; ++
I) {
315 if (BlockIsInLoop(BB))
316 BlocksInLoopAfterFolding.insert(BB);
319 assert(BlocksInLoopAfterFolding.count(L.getHeader()) &&
320 "Header not in loop?");
321 assert(BlocksInLoopAfterFolding.size() <= LiveLoopBlocks.size() &&
322 "All blocks that stay in loop should be live!");
360 void handleDeadExits() {
362 if (DeadExitBlocks.empty())
372 SwitchInst *DummySwitch =
373 Builder.CreateSwitch(Builder.getInt32(0), NewPreheader);
376 unsigned DummyIdx = 1;
377 for (BasicBlock *BB : DeadExitBlocks) {
380 SmallVector<Instruction *, 4> DeadInstructions(
384 DeadInstructions.emplace_back(LandingPad);
386 for (Instruction *
I : DeadInstructions) {
389 I->eraseFromParent();
392 assert(DummyIdx != 0 &&
"Too many dead exits!");
393 DummySwitch->
addCase(Builder.getInt32(DummyIdx++), BB);
394 DTUpdates.push_back({DominatorTree::Insert, Preheader, BB});
395 ++NumLoopExitsDeleted;
402 if (DummySwitch->
getParent()->getParent()->hasProfileData()) {
403 SmallVector<uint32_t> DummyBranchWeights(1 + DummySwitch->
getNumCases());
405 DummyBranchWeights[0] = 1;
409 assert(L.getLoopPreheader() == NewPreheader &&
"Malformed CFG?");
410 if (Loop *OuterLoop = LI.getLoopFor(Preheader)) {
419 if (StillReachable != OuterLoop) {
420 LI.changeLoopFor(NewPreheader, StillReachable);
422 for (
auto *BB : L.blocks())
424 OuterLoop->removeChildLoop(&L);
428 LI.addTopLevelLoop(&L);
433 Loop *FixLCSSALoop = OuterLoop;
436 assert(FixLCSSALoop &&
"Should be a loop!");
439 MSSAU->applyUpdates(DTUpdates, DT,
true);
441 DTU.applyUpdates(DTUpdates);
444 SE.forgetBlockAndLoopDispositions();
450 MSSAU->applyUpdates(DTUpdates, DT,
true);
453 MSSAU->getMemorySSA()->verifyMemorySSA();
459 void deleteDeadLoopBlocks() {
461 SmallSetVector<BasicBlock *, 8> DeadLoopBlocksSet(DeadLoopBlocks.begin(),
462 DeadLoopBlocks.end());
463 MSSAU->removeBlocks(DeadLoopBlocksSet);
472 for (
auto *BB : DeadLoopBlocks)
473 if (LI.isLoopHeader(BB)) {
474 assert(LI.getLoopFor(BB) != &L &&
"Attempt to remove current loop!");
475 Loop *
DL = LI.getLoopFor(BB);
476 if (!
DL->isOutermost()) {
477 for (
auto *PL =
DL->getParentLoop(); PL; PL =
PL->getParentLoop())
478 for (
auto *BB :
DL->getBlocks())
479 PL->removeBlockFromLoop(BB);
480 DL->getParentLoop()->removeChildLoop(
DL);
481 LI.addTopLevelLoop(
DL);
486 for (
auto *BB : DeadLoopBlocks) {
487 assert(BB != L.getHeader() &&
488 "Header of the current loop cannot be dead!");
495 DTU.applyUpdates(DTUpdates);
497 for (
auto *BB : DeadLoopBlocks)
500 NumLoopBlocksDeleted += DeadLoopBlocks.size();
505 void foldTerminators() {
506 for (BasicBlock *BB : FoldCandidates) {
507 assert(LI.getLoopFor(BB) == &L &&
"Should be a loop block!");
509 assert(TheOnlySucc &&
"Should have one live successor!");
512 <<
" with an unconditional branch to the block "
513 << TheOnlySucc->
getName() <<
"\n");
515 SmallPtrSet<BasicBlock *, 2> DeadSuccessors;
517 unsigned TheOnlySuccDuplicates = 0;
519 if (Succ != TheOnlySucc) {
520 DeadSuccessors.
insert(Succ);
523 bool PreserveLCSSAPhi = !L.contains(Succ);
526 MSSAU->removeEdge(BB, Succ);
528 ++TheOnlySuccDuplicates;
530 assert(TheOnlySuccDuplicates > 0 &&
"Should be!");
534 bool PreserveLCSSAPhi = !L.contains(TheOnlySucc);
535 for (
unsigned Dup = 1; Dup < TheOnlySuccDuplicates; ++Dup)
537 if (MSSAU && TheOnlySuccDuplicates > 1)
538 MSSAU->removeDuplicatePhiEdgesBetween(BB, TheOnlySucc);
542 Builder.SetInsertPoint(Term);
543 Builder.CreateBr(TheOnlySucc);
544 Term->eraseFromParent();
546 for (
auto *DeadSucc : DeadSuccessors)
547 DTUpdates.push_back({DominatorTree::Delete, BB, DeadSucc});
549 ++NumTerminatorsFolded;
554 ConstantTerminatorFoldingImpl(Loop &L, LoopInfo &LI, DominatorTree &DT,
556 MemorySSAUpdater *MSSAU)
557 : L(L), LI(LI), DT(DT), SE(SE), MSSAU(MSSAU), DFS(&L),
558 DTU(DT, DomTreeUpdater::UpdateStrategy::Eager) {}
560 assert(L.getLoopLatch() &&
"Should be single latch!");
568 LLVM_DEBUG(
dbgs() <<
"In function " << Header->getParent()->getName()
571 if (HasIrreducibleCFG) {
572 LLVM_DEBUG(
dbgs() <<
"Loops with irreducible CFG are not supported!\n");
576 if (HasIndirectEntry) {
577 LLVM_DEBUG(
dbgs() <<
"Loops which can be entered indirectly are not"
583 if (FoldCandidates.empty()) {
585 dbgs() <<
"No constant terminator folding candidates found in loop "
586 << Header->getName() <<
"\n");
591 if (DeleteCurrentLoop) {
594 <<
"Give up constant terminator folding in loop " << Header->getName()
595 <<
": we don't currently support deletion of the current loop.\n");
601 if (BlocksInLoopAfterFolding.size() + DeadLoopBlocks.size() !=
604 dbgs() <<
"Give up constant terminator folding in loop "
605 << Header->getName() <<
": we don't currently"
606 " support blocks that are not dead, but will stop "
607 "being a part of the loop after constant-folding.\n");
614 if (!DeadExitBlocks.empty() && !L.isLCSSAForm(DT,
false)) {
615 assert(L.isLCSSAForm(DT,
true) &&
616 "LCSSA broken not by tokens?");
617 LLVM_DEBUG(
dbgs() <<
"Give up constant terminator folding in loop "
619 <<
": tokens uses potentially break LCSSA form.\n");
623 SE.forgetTopmostLoop(&L);
628 <<
" terminators in loop " << Header->getName() <<
"\n");
630 if (!DeadLoopBlocks.empty())
631 SE.forgetBlockAndLoopDispositions();
637 if (!DeadLoopBlocks.empty()) {
639 <<
" dead blocks in loop " << Header->getName() <<
"\n");
640 deleteDeadLoopBlocks();
643 DTU.applyUpdates(DTUpdates);
648 MSSAU->getMemorySSA()->verifyMemorySSA();
652#if defined(EXPENSIVE_CHECKS)
653 assert(DT.verify(DominatorTree::VerificationLevel::Full) &&
654 "DT broken after transform!");
656 assert(DT.verify(DominatorTree::VerificationLevel::Fast) &&
657 "DT broken after transform!");
659 assert(DT.isReachableFromEntry(Header));
666 bool foldingBreaksCurrentLoop()
const {
667 return DeleteCurrentLoop;
677 bool &IsLoopDeleted) {
683 if (!L.getLoopLatch())
686 ConstantTerminatorFoldingImpl
BranchFolder(L, LI, DT, SE, MSSAU);
701 for (
auto &
Block : Blocks) {
709 if (!Pred || !Pred->getSingleSuccessor() || LI.
getLoopFor(Pred) != &L)
729 bool &IsLoopDeleted) {
750 std::optional<MemorySSAUpdater> MSSAU;
753 bool DeleteCurrentLoop =
false;
758 if (DeleteCurrentLoop)
assert(UImm &&(UImm !=~static_cast< T >(0)) &&"Invalid immediate!")
MachineBasicBlock MachineBasicBlock::iterator DebugLoc DL
static GCRegistry::Add< CoreCLRGC > E("coreclr", "CoreCLR-compatible GC")
This header provides classes for managing a pipeline of passes over loops in LLVM IR.
static BasicBlock * getOnlyLiveSuccessor(BasicBlock *BB)
If BB is a switch or a conditional branch, but only one of its successors can be reached from this bl...
static bool constantFoldTerminators(Loop &L, DominatorTree &DT, LoopInfo &LI, ScalarEvolution &SE, MemorySSAUpdater *MSSAU, bool &IsLoopDeleted)
Turn branches and switches with known constant conditions into unconditional branches.
static Loop * getInnermostLoopFor(SmallPtrSetImpl< BasicBlock * > &BBs, Loop &L, LoopInfo &LI)
Find innermost loop that contains at least one block from BBs and contains the header of loop L.
static bool mergeBlocksIntoPredecessors(Loop &L, DominatorTree &DT, LoopInfo &LI, MemorySSAUpdater *MSSAU, ScalarEvolution &SE)
static bool simplifyLoopCFG(Loop &L, DominatorTree &DT, LoopInfo &LI, ScalarEvolution &SE, MemorySSAUpdater *MSSAU, bool &IsLoopDeleted)
static cl::opt< bool > EnableTermFolding("enable-loop-simplifycfg-term-folding", cl::init(true))
static void removeBlockFromLoops(BasicBlock *BB, Loop *FirstLoop, Loop *LastLoop=nullptr)
Removes BB from all loops from [FirstLoop, LastLoop) in parent chain.
This file exposes an interface to building/using memory SSA to walk memory instructions using a use/d...
This file contains the declarations for profiling metadata utility functions.
const SmallVectorImpl< MachineOperand > & Cond
This file defines the SmallVector class.
This file defines the 'Statistic' class, which is designed to be an easy way to expose various metric...
#define STATISTIC(VARNAME, DESC)
LLVM Basic Block Representation.
iterator_range< const_phi_iterator > phis() const
Returns a range that iterates over the phis in the basic block.
LLVM_ABI InstListType::const_iterator getFirstNonPHIIt() const
Returns an iterator to the first instruction in this block that is not a PHINode instruction.
LLVM_ABI const BasicBlock * getSinglePredecessor() const
Return the predecessor of this block if it has a single predecessor block.
LLVM_ABI LLVMContext & getContext() const
Get the context in which this basic block lives.
const Instruction * getTerminator() const LLVM_READONLY
Returns the terminator instruction if the block is well formed or null if the block is not well forme...
LLVM_ABI void removePredecessor(BasicBlock *Pred, bool KeepOneInputPHIs=false)
Update PHI nodes in this BasicBlock before removal of predecessor Pred.
Conditional or Unconditional Branch instruction.
This is the shared class of boolean and integer constants.
Concrete subclass of DominatorTreeBase that is used to compute a normal dominator tree.
LLVM_ABI InstListType::iterator eraseFromParent()
This method unlinks 'this' from the containing basic block and deletes it.
This class provides an interface for updating the loop pass manager based on mutations to the loop ne...
void markLoopAsDeleted(Loop &L, llvm::StringRef Name)
Loop passes should use this method to indicate they have deleted a loop from the nest.
bool contains(const LoopT *L) const
Return true if the specified loop is contained within in this loop.
BlockT * getHeader() const
unsigned getLoopDepth() const
Return the nesting level of this loop.
void addChildLoop(LoopT *NewChild)
Add the specified loop to be a child of this loop.
LoopT * getParentLoop() const
Return the parent loop if it exists or nullptr for top level loops.
LoopT * getLoopFor(const BlockT *BB) const
Return the inner most loop that BB lives in.
PreservedAnalyses run(Loop &L, LoopAnalysisManager &AM, LoopStandardAnalysisResults &AR, LPMUpdater &U)
Represents a single loop in the control flow graph.
LLVM_ABI instr_iterator erase(instr_iterator I)
Remove an instruction from the instruction list and delete it.
An analysis that produces MemorySSA for a function.
MemorySSA * getMemorySSA() const
Get handle on MemorySSA.
LLVM_ABI void verifyMemorySSA(VerificationLevel=VerificationLevel::Fast) const
Verify that MemorySSA is self consistent (IE definitions dominate all uses, uses appear in the right ...
static LLVM_ABI PoisonValue * get(Type *T)
Static factory methods - Return an 'poison' object of the specified type.
A set of analyses that are preserved following a run of a transformation pass.
static PreservedAnalyses all()
Construct a special preserved set that preserves all passes.
The main scalar evolution driver.
LLVM_ABI void forgetTopmostLoop(const Loop *L)
LLVM_ABI void forgetBlockAndLoopDispositions(Value *V=nullptr)
Called when the client has changed the disposition of values in a loop or block.
A templated base class for SmallPtrSet which provides the typesafe interface that is common across al...
std::pair< iterator, bool > insert(PtrType Ptr)
Inserts Ptr if and only if there is no element in the container equal to Ptr.
This is a 'vector' (really, a variable-sized array), optimized for the case when the array is small.
LLVM_ABI void addCase(ConstantInt *OnVal, BasicBlock *Dest)
Add an entry to the switch instruction.
unsigned getNumCases() const
Return the number of 'cases' in this switch instruction, excluding the default case.
LLVM_ABI StringRef getName() const
Return a constant reference to the value's name.
const ParentTy * getParent() const
@ BasicBlock
Various leaf nodes.
initializer< Ty > init(const Ty &Val)
PointerTypeMap run(const Module &M)
Compute the PointerTypeMap for the module M.
friend class Instruction
Iterator for Instructions in a `BasicBlock.
This is an optimization pass for GlobalISel generic memory operations.
void dump(const SparseBitVector< ElementSize > &LHS, raw_ostream &out)
bool all_of(R &&range, UnaryPredicate P)
Provide wrappers to std::all_of which take ranges instead of having to pass begin/end explicitly.
LLVM_ABI void detachDeadBlocks(ArrayRef< BasicBlock * > BBs, SmallVectorImpl< DominatorTree::UpdateType > *Updates, bool KeepOneInputPHIs=false)
Replace contents of every block in BBs with single unreachable instruction.
decltype(auto) dyn_cast(const From &Val)
dyn_cast<X> - Return the argument parameter cast to the specified type.
auto successors(const MachineBasicBlock *BB)
LLVM_ABI bool formLCSSARecursively(Loop &L, const DominatorTree &DT, const LoopInfo *LI, ScalarEvolution *SE)
Put a loop nest into LCSSA form.
auto cast_or_null(const Y &Val)
LLVM_ABI void setBranchWeights(Instruction &I, ArrayRef< uint32_t > Weights, bool IsExpected, bool ElideAllZero=false)
Create a new branch_weights metadata node and add or overwrite a prof metadata reference to instructi...
AnalysisManager< Loop, LoopStandardAnalysisResults & > LoopAnalysisManager
The loop analysis manager.
bool any_of(R &&range, UnaryPredicate P)
Provide wrappers to std::any_of which take ranges instead of having to pass begin/end explicitly.
LLVM_ABI raw_ostream & dbgs()
dbgs() - This returns a reference to a raw_ostream for debugging messages.
class LLVM_GSL_OWNER SmallVector
Forward declaration of SmallVector so that calculateSmallVectorDefaultInlinedElements can reference s...
IRBuilder(LLVMContext &, FolderTy, InserterTy, MDNode *, ArrayRef< OperandBundleDef >) -> IRBuilder< FolderTy, InserterTy >
LLVM_ABI bool VerifyMemorySSA
Enables verification of MemorySSA.
LLVM_ABI bool MergeBlockIntoPredecessor(BasicBlock *BB, DomTreeUpdater *DTU=nullptr, LoopInfo *LI=nullptr, MemorySSAUpdater *MSSAU=nullptr, MemoryDependenceResults *MemDep=nullptr, bool PredecessorWithTwoSuccessors=false, DominatorTree *DT=nullptr)
Attempts to merge a block into its predecessor, if possible.
LLVM_ABI BasicBlock * SplitBlock(BasicBlock *Old, BasicBlock::iterator SplitPt, DominatorTree *DT, LoopInfo *LI=nullptr, MemorySSAUpdater *MSSAU=nullptr, const Twine &BBName="", bool Before=false)
Split the specified block at the specified instruction.
LLVM_ABI PreservedAnalyses getLoopPassPreservedAnalyses()
Returns the minimum set of Analyses that all loop passes must preserve.
auto predecessors(const MachineBasicBlock *BB)
iterator_range< pointer_iterator< WrappedIteratorT > > make_pointer_range(RangeT &&Range)
The adaptor from a function pass to a loop pass computes these analyses and makes them available to t...