97#define DEBUG_TYPE "simplifycfg"
102 "simplifycfg-require-and-preserve-domtree",
cl::Hidden,
105 "Temporary development switch used to gradually uplift SimplifyCFG "
106 "into preserving DomTree,"));
115 "Control the amount of phi node folding to perform (default = 2)"));
119 cl::desc(
"Control the maximal total instruction cost that we are willing "
120 "to speculatively execute to fold a 2-entry PHI node into a "
121 "select (default = 4)"));
125 cl::desc(
"Hoist common instructions up to the parent block"));
129 cl::desc(
"Hoist loads if the target supports conditional faulting"));
133 cl::desc(
"Hoist stores if the target supports conditional faulting"));
137 cl::desc(
"Control the maximal conditional load/store that we are willing "
138 "to speculatively execute to eliminate conditional branch "
144 cl::desc(
"Allow reordering across at most this many "
145 "instructions when hoisting"));
149 cl::desc(
"Sink common instructions down to the end block"));
153 cl::desc(
"Hoist conditional stores if an unconditional store precedes"));
157 cl::desc(
"Hoist conditional stores even if an unconditional store does not "
158 "precede - hoist multiple conditional stores into a single "
159 "predicated store"));
163 cl::desc(
"When merging conditional stores, do so even if the resultant "
164 "basic blocks are unlikely to be if-converted as a result"));
168 cl::desc(
"Allow exactly one expensive instruction to be speculatively "
173 cl::desc(
"Limit maximum recursion depth when calculating costs of "
174 "speculatively executed instructions"));
179 cl::desc(
"Max size of a block which is still considered "
180 "small enough to thread through"));
186 cl::desc(
"Maximum cost of combining conditions when "
187 "folding branches"));
190 "simplifycfg-branch-fold-common-dest-vector-multiplier",
cl::Hidden,
192 cl::desc(
"Multiplier to apply to threshold when determining whether or not "
193 "to fold branch to common destination when vector operations are "
198 cl::desc(
"Allow SimplifyCFG to merge invokes together when appropriate"));
202 cl::desc(
"Limit cases to analyze when converting a switch to select"));
206 cl::desc(
"Limit number of blocks a define in a threaded block is allowed "
213STATISTIC(NumBitMaps,
"Number of switch instructions turned into bitmaps");
215 "Number of switch instructions turned into linear mapping");
217 "Number of switch instructions turned into lookup tables");
219 NumLookupTablesHoles,
220 "Number of switch instructions turned into lookup tables (holes checked)");
221STATISTIC(NumTableCmpReuses,
"Number of reused switch table lookup compares");
223 "Number of value comparisons folded into predecessor basic blocks");
225 "Number of branches folded into predecessor basic block");
228 "Number of common instruction 'blocks' hoisted up to the begin block");
230 "Number of common instructions hoisted up to the begin block");
232 "Number of common instruction 'blocks' sunk down to the end block");
234 "Number of common instructions sunk down to the end block");
235STATISTIC(NumSpeculations,
"Number of speculative executed instructions");
237 "Number of invokes with empty resume blocks simplified into calls");
238STATISTIC(NumInvokesMerged,
"Number of invokes that were merged together");
239STATISTIC(NumInvokeSetsFormed,
"Number of invoke sets that were formed");
246using SwitchCaseResultVectorTy =
255struct ValueEqualityComparisonCase {
267 bool operator==(BasicBlock *RHSDest)
const {
return Dest == RHSDest; }
270class SimplifyCFGOpt {
271 const TargetTransformInfo &TTI;
273 const DataLayout &DL;
275 const SimplifyCFGOptions &Options;
278 Value *isValueEqualityComparison(Instruction *TI);
280 Instruction *TI, std::vector<ValueEqualityComparisonCase> &Cases);
281 bool simplifyEqualityComparisonWithOnlyPredecessor(Instruction *TI,
284 bool performValueComparisonIntoPredecessorFolding(Instruction *TI,
Value *&CV,
287 bool foldValueComparisonIntoPredecessors(Instruction *TI,
290 bool simplifyResume(ResumeInst *RI,
IRBuilder<> &Builder);
291 bool simplifySingleResume(ResumeInst *RI);
292 bool simplifyCommonResume(ResumeInst *RI);
293 bool simplifyCleanupReturn(CleanupReturnInst *RI);
294 bool simplifyUnreachable(UnreachableInst *UI);
295 bool simplifySwitch(SwitchInst *SI,
IRBuilder<> &Builder);
296 bool simplifyDuplicateSwitchArms(SwitchInst *SI, DomTreeUpdater *DTU);
297 bool simplifyIndirectBr(IndirectBrInst *IBI);
298 bool simplifyUncondBranch(UncondBrInst *BI,
IRBuilder<> &Builder);
299 bool simplifyCondBranch(CondBrInst *BI,
IRBuilder<> &Builder);
300 bool foldCondBranchOnValueKnownInPredecessor(CondBrInst *BI);
302 bool tryToSimplifyUncondBranchWithICmpInIt(ICmpInst *ICI,
304 bool tryToSimplifyUncondBranchWithICmpSelectInIt(ICmpInst *ICI,
307 bool hoistCommonCodeFromSuccessors(Instruction *TI,
bool AllInstsEqOnly);
308 bool hoistSuccIdenticalTerminatorToSwitchOrIf(
309 Instruction *TI, Instruction *I1,
310 SmallVectorImpl<Instruction *> &OtherSuccTIs,
312 bool speculativelyExecuteBB(CondBrInst *BI, BasicBlock *ThenBB);
313 bool simplifyTerminatorOnSelect(Instruction *OldTerm,
Value *
Cond,
314 BasicBlock *TrueBB, BasicBlock *FalseBB,
315 uint32_t TrueWeight, uint32_t FalseWeight);
316 bool simplifyBranchOnICmpChain(CondBrInst *BI,
IRBuilder<> &Builder,
317 const DataLayout &DL);
318 bool simplifySwitchOnSelect(SwitchInst *SI, SelectInst *
Select);
319 bool simplifyIndirectBrOnSelect(IndirectBrInst *IBI, SelectInst *SI);
320 bool turnSwitchRangeIntoICmp(SwitchInst *SI,
IRBuilder<> &Builder);
321 bool simplifyDuplicatePredecessors(BasicBlock *Succ, DomTreeUpdater *DTU);
324 SimplifyCFGOpt(
const TargetTransformInfo &TTI, DomTreeUpdater *DTU,
326 const SimplifyCFGOptions &Opts)
327 : TTI(TTI), DTU(DTU), DL(DL), LoopHeaders(LoopHeaders), Options(Opts) {
328 assert((!DTU || !DTU->hasPostDomTree()) &&
329 "SimplifyCFG is not yet capable of maintaining validity of a "
330 "PostDomTree, so don't ask for it.");
333 bool simplifyOnce(BasicBlock *BB);
334 bool run(BasicBlock *BB);
337 bool requestResimplify() {
347isSelectInRoleOfConjunctionOrDisjunction(
const SelectInst *
SI) {
367 "Only for a pair of incoming blocks at the time!");
373 Value *IV0 = PN.getIncomingValueForBlock(IncomingBlocks[0]);
374 Value *IV1 = PN.getIncomingValueForBlock(IncomingBlocks[1]);
377 if (EquivalenceSet && EquivalenceSet->contains(IV0) &&
378 EquivalenceSet->contains(IV1))
401 if (!SI1Succs.
count(Succ))
407 FailBlocks->insert(Succ);
423 PN.addIncoming(PN.getIncomingValueForBlock(ExistPred), NewPred);
425 if (
auto *MPhi = MSSAU->getMemorySSA()->getMemoryAccess(Succ))
426 MPhi->addIncoming(MPhi->getIncomingValueForBlock(ExistPred), NewPred);
488 if (AggressiveInsts.
count(
I))
504 ZeroCostInstructions.
insert(OverflowInst);
506 }
else if (!ZeroCostInstructions.
contains(
I))
522 for (
Use &
Op :
I->operands())
524 TTI, AC, ZeroCostInstructions,
Depth + 1))
541 if (
DL.hasUnstableRepresentation(V->getType()))
550 return ConstantInt::get(
IntPtrTy, 0);
555 if (CE->getOpcode() == Instruction::IntToPtr)
579struct ConstantComparesGatherer {
580 const DataLayout &DL;
583 Value *CompValue =
nullptr;
586 Value *Extra =
nullptr;
592 unsigned UsedICmps = 0;
598 bool IgnoreFirstMatch =
false;
599 bool MultipleMatches =
false;
602 ConstantComparesGatherer(Instruction *
Cond,
const DataLayout &DL) : DL(DL) {
604 if (CompValue || !MultipleMatches)
609 IgnoreFirstMatch =
true;
613 ConstantComparesGatherer(
const ConstantComparesGatherer &) =
delete;
614 ConstantComparesGatherer &
615 operator=(
const ConstantComparesGatherer &) =
delete;
620 bool setValueOnce(
Value *NewVal) {
621 if (IgnoreFirstMatch) {
622 IgnoreFirstMatch =
false;
625 if (CompValue && CompValue != NewVal) {
626 MultipleMatches =
true;
640 bool matchInstruction(Instruction *
I,
bool isEQ) {
647 if (!setValueOnce(Val))
667 if (ICI->
getPredicate() == (isEQ ? ICmpInst::ICMP_EQ : ICmpInst::ICMP_NE)) {
711 if (
Mask.isPowerOf2() && (
C->getValue() & ~Mask) ==
C->getValue()) {
713 if (!setValueOnce(RHSVal))
718 ConstantInt::get(
C->getContext(),
719 C->getValue() | Mask));
734 if (
Mask.isPowerOf2() && (
C->getValue() | Mask) ==
C->getValue()) {
736 if (!setValueOnce(RHSVal))
740 Vals.push_back(ConstantInt::get(
C->getContext(),
741 C->getValue() & ~Mask));
762 Value *CandidateVal =
I->getOperand(0);
765 CandidateVal = RHSVal;
780 if (!setValueOnce(CandidateVal))
786 Vals.push_back(ConstantInt::get(
I->getContext(), Tmp));
798 void gather(
Value *V) {
807 SmallVector<Value *, 8> DFT{Op0, Op1};
808 SmallPtrSet<Value *, 8> Visited{
V, Op0, Op1};
810 while (!DFT.
empty()) {
817 if (Visited.
insert(Op1).second)
819 if (Visited.
insert(Op0).second)
826 if (matchInstruction(
I, IsEq))
870 if (!
SI->getParent()->hasNPredecessorsOrMore(128 /
SI->getNumSuccessors()))
871 CV =
SI->getCondition();
873 if (BI->getCondition()->hasOneUse()) {
878 if (Trunc->hasNoUnsignedWrap())
879 CV = Trunc->getOperand(0);
886 Value *Ptr = PTII->getPointerOperand();
887 if (
DL.hasUnstableRepresentation(Ptr->
getType()))
889 if (PTII->getType() ==
DL.getIntPtrType(Ptr->
getType()))
898BasicBlock *SimplifyCFGOpt::getValueEqualityComparisonCases(
899 Instruction *TI, std::vector<ValueEqualityComparisonCase> &Cases) {
901 Cases.reserve(
SI->getNumCases());
902 for (
auto Case :
SI->cases())
903 Cases.push_back(ValueEqualityComparisonCase(Case.getCaseValue(),
904 Case.getCaseSuccessor()));
905 return SI->getDefaultDest();
910 ICmpInst::Predicate Pred;
916 Pred = ICmpInst::ICMP_NE;
921 Cases.push_back(ValueEqualityComparisonCase(
C, Succ));
929 std::vector<ValueEqualityComparisonCase> &Cases) {
935 std::vector<ValueEqualityComparisonCase> &C2) {
936 std::vector<ValueEqualityComparisonCase> *
V1 = &C1, *V2 = &C2;
939 if (
V1->size() > V2->size())
944 if (
V1->size() == 1) {
947 for (
const ValueEqualityComparisonCase &
VECC : *V2)
948 if (TheVal ==
VECC.Value)
955 unsigned i1 = 0, i2 = 0, e1 =
V1->size(), e2 = V2->size();
956 while (i1 != e1 && i2 != e2) {
972bool SimplifyCFGOpt::simplifyEqualityComparisonWithOnlyPredecessor(
973 Instruction *TI, BasicBlock *Pred,
IRBuilder<> &Builder) {
978 Value *ThisVal = isValueEqualityComparison(TI);
979 assert(ThisVal &&
"This isn't a value comparison!!");
980 if (ThisVal != PredVal)
987 std::vector<ValueEqualityComparisonCase> PredCases;
989 getValueEqualityComparisonCases(Pred->
getTerminator(), PredCases);
993 std::vector<ValueEqualityComparisonCase> ThisCases;
994 BasicBlock *ThisDef = getValueEqualityComparisonCases(TI, ThisCases);
1009 assert(ThisCases.size() == 1 &&
"Branch can only have one case!");
1015 ThisCases[0].Dest->removePredecessor(PredDef);
1018 <<
"Through successor TI: " << *TI <<
"Leaving: " << *NI
1025 {{DominatorTree::Delete, PredDef, ThisCases[0].Dest}});
1032 SmallPtrSet<Constant *, 16> DeadCases;
1033 for (
const ValueEqualityComparisonCase &Case : PredCases)
1034 DeadCases.
insert(Case.Value);
1037 <<
"Through successor TI: " << *TI);
1039 SmallDenseMap<BasicBlock *, int, 8> NumPerSuccessorCases;
1042 auto *
Successor = i->getCaseSuccessor();
1045 if (DeadCases.
count(i->getCaseValue())) {
1054 std::vector<DominatorTree::UpdateType> Updates;
1055 for (
const std::pair<BasicBlock *, int> &
I : NumPerSuccessorCases)
1057 Updates.push_back({DominatorTree::Delete, PredDef,
I.first});
1067 ConstantInt *TIV =
nullptr;
1069 for (
const auto &[
Value, Dest] : PredCases)
1075 assert(TIV &&
"No edge from pred to succ?");
1080 for (
const auto &[
Value, Dest] : ThisCases)
1088 TheRealDest = ThisDef;
1090 SmallPtrSet<BasicBlock *, 2> RemovedSuccs;
1095 if (Succ != CheckEdge) {
1096 if (Succ != TheRealDest)
1097 RemovedSuccs.
insert(Succ);
1100 CheckEdge =
nullptr;
1107 <<
"Through successor TI: " << *TI <<
"Leaving: " << *NI
1112 SmallVector<DominatorTree::UpdateType, 2> Updates;
1114 for (
auto *RemovedSucc : RemovedSuccs)
1115 Updates.
push_back({DominatorTree::Delete, TIBB, RemovedSucc});
1126struct ConstantIntOrdering {
1127 bool operator()(
const ConstantInt *
LHS,
const ConstantInt *
RHS)
const {
1128 return LHS->getValue().ult(
RHS->getValue());
1140 return LHS->getValue().ult(
RHS->getValue()) ? 1 : -1;
1149 assert(MD &&
"Invalid branch-weight metadata");
1174 if (BonusInst.isTerminator())
1209 NewBonusInst->
takeName(&BonusInst);
1210 BonusInst.setName(NewBonusInst->
getName() +
".old");
1211 VMap[&BonusInst] = NewBonusInst;
1220 assert(UI->getParent() == BB && BonusInst.comesBefore(UI) &&
1221 "If the user is not a PHI node, then it should be in the same "
1222 "block as, and come after, the original bonus instruction.");
1226 if (PN->getIncomingBlock(U) == BB)
1230 assert(PN->getIncomingBlock(U) == PredBlock &&
1231 "Not in block-closed SSA form?");
1232 U.set(NewBonusInst);
1242 if (!PredDL->getAtomGroup() &&
DL &&
DL->getAtomGroup() &&
1243 PredDL.isSameSourceLocation(
DL)) {
1250bool SimplifyCFGOpt::performValueComparisonIntoPredecessorFolding(
1258 std::vector<ValueEqualityComparisonCase> BBCases;
1259 BasicBlock *BBDefault = getValueEqualityComparisonCases(TI, BBCases);
1261 std::vector<ValueEqualityComparisonCase> PredCases;
1262 BasicBlock *PredDefault = getValueEqualityComparisonCases(PTI, PredCases);
1267 SmallMapVector<BasicBlock *, int, 8> NewSuccessors;
1270 SmallVector<uint64_t, 8> Weights;
1274 if (PredHasWeights) {
1277 if (Weights.
size() != 1 + PredCases.size())
1278 PredHasWeights = SuccHasWeights =
false;
1279 }
else if (SuccHasWeights)
1283 Weights.
assign(1 + PredCases.size(), 1);
1285 SmallVector<uint64_t, 8> SuccWeights;
1286 if (SuccHasWeights) {
1289 if (SuccWeights.
size() != 1 + BBCases.size())
1290 PredHasWeights = SuccHasWeights =
false;
1291 }
else if (PredHasWeights)
1292 SuccWeights.
assign(1 + BBCases.size(), 1);
1294 if (PredDefault == BB) {
1297 std::set<ConstantInt *, ConstantIntOrdering> PTIHandled;
1298 for (
unsigned i = 0, e = PredCases.size(); i != e; ++i)
1299 if (PredCases[i].Dest != BB)
1300 PTIHandled.insert(PredCases[i].
Value);
1303 std::swap(PredCases[i], PredCases.back());
1305 if (PredHasWeights || SuccHasWeights) {
1307 Weights[0] += Weights[i + 1];
1312 PredCases.pop_back();
1318 if (PredDefault != BBDefault) {
1320 if (DTU && PredDefault != BB)
1321 Updates.
push_back({DominatorTree::Delete, Pred, PredDefault});
1322 PredDefault = BBDefault;
1323 ++NewSuccessors[BBDefault];
1326 unsigned CasesFromPred = Weights.
size();
1327 uint64_t ValidTotalSuccWeight = 0;
1328 for (
unsigned i = 0, e = BBCases.size(); i != e; ++i)
1329 if (!PTIHandled.count(BBCases[i].Value) && BBCases[i].Dest != BBDefault) {
1330 PredCases.push_back(BBCases[i]);
1331 ++NewSuccessors[BBCases[i].Dest];
1332 if (SuccHasWeights || PredHasWeights) {
1336 Weights.
push_back(Weights[0] * SuccWeights[i + 1]);
1337 ValidTotalSuccWeight += SuccWeights[i + 1];
1341 if (SuccHasWeights || PredHasWeights) {
1342 ValidTotalSuccWeight += SuccWeights[0];
1344 for (
unsigned i = 1; i < CasesFromPred; ++i)
1345 Weights[i] *= ValidTotalSuccWeight;
1347 Weights[0] *= SuccWeights[0];
1353 std::set<ConstantInt *, ConstantIntOrdering> PTIHandled;
1354 std::map<ConstantInt *, uint64_t> WeightsForHandled;
1355 for (
unsigned i = 0, e = PredCases.size(); i != e; ++i)
1356 if (PredCases[i].Dest == BB) {
1357 PTIHandled.insert(PredCases[i].
Value);
1359 if (PredHasWeights || SuccHasWeights) {
1360 WeightsForHandled[PredCases[i].Value] = Weights[i + 1];
1365 std::swap(PredCases[i], PredCases.back());
1366 PredCases.pop_back();
1373 for (
const ValueEqualityComparisonCase &Case : BBCases)
1374 if (PTIHandled.count(Case.Value)) {
1376 if (PredHasWeights || SuccHasWeights)
1377 Weights.
push_back(WeightsForHandled[Case.Value]);
1378 PredCases.push_back(Case);
1379 ++NewSuccessors[Case.Dest];
1380 PTIHandled.erase(Case.Value);
1385 for (ConstantInt *
I : PTIHandled) {
1386 if (PredHasWeights || SuccHasWeights)
1388 PredCases.push_back(ValueEqualityComparisonCase(
I, BBDefault));
1389 ++NewSuccessors[BBDefault];
1396 SmallPtrSet<BasicBlock *, 2> SuccsOfPred;
1401 for (
const std::pair<BasicBlock *, int /*Num*/> &NewSuccessor :
1403 for (
auto I :
seq(NewSuccessor.second)) {
1407 if (DTU && !SuccsOfPred.
contains(NewSuccessor.first))
1408 Updates.
push_back({DominatorTree::Insert, Pred, NewSuccessor.first});
1415 "Should not end up here with unstable pointers");
1421 SwitchInst *NewSI = Builder.
CreateSwitch(CV, PredDefault, PredCases.size());
1423 for (ValueEqualityComparisonCase &V : PredCases)
1426 if (PredHasWeights || SuccHasWeights)
1438 if (!InfLoopBlock) {
1446 {DominatorTree::Insert, InfLoopBlock, InfLoopBlock});
1453 Updates.
push_back({DominatorTree::Insert, Pred, InfLoopBlock});
1455 Updates.
push_back({DominatorTree::Delete, Pred, BB});
1460 ++NumFoldValueComparisonIntoPredecessors;
1468bool SimplifyCFGOpt::foldValueComparisonIntoPredecessors(Instruction *TI,
1471 Value *CV = isValueEqualityComparison(TI);
1472 assert(CV &&
"Not a comparison?");
1477 while (!Preds.empty()) {
1486 Value *PCV = isValueEqualityComparison(PTI);
1490 SmallSetVector<BasicBlock *, 4> FailBlocks;
1492 for (
auto *Succ : FailBlocks) {
1498 performValueComparisonIntoPredecessorFolding(TI, CV, PTI, Builder);
1512 Value *BB1V = PN.getIncomingValueForBlock(BB1);
1513 Value *BB2V = PN.getIncomingValueForBlock(BB2);
1514 if (BB1V != BB2V && (BB1V == I1 || BB2V == I2)) {
1536 if (
I->mayReadFromMemory())
1568 if (CB->getIntrinsicID() == Intrinsic::experimental_deoptimize)
1576 if (J->getParent() == BB)
1598 if (C1->isMustTailCall() != C2->isMustTailCall())
1601 if (!
TTI.isProfitableToHoist(I1) || !
TTI.isProfitableToHoist(I2))
1607 if (CB1->cannotMerge() || CB1->isConvergent())
1610 if (CB2->cannotMerge() || CB2->isConvergent())
1625 if (!I1->hasDbgRecords())
1627 using CurrentAndEndIt =
1628 std::pair<DbgRecord::self_iterator, DbgRecord::self_iterator>;
1634 auto atEnd = [](
const CurrentAndEndIt &Pair) {
1635 return Pair.first == Pair.second;
1641 return Itrs[0].first->isIdenticalToWhenDefined(*
I);
1647 {I1->getDbgRecordRange().begin(), I1->getDbgRecordRange().end()});
1649 if (!
Other->hasDbgRecords())
1652 {
Other->getDbgRecordRange().begin(),
Other->getDbgRecordRange().end()});
1659 while (
none_of(Itrs, atEnd)) {
1660 bool HoistDVRs = allIdentical(Itrs);
1661 for (CurrentAndEndIt &Pair : Itrs) {
1675 if (I1->isIdenticalToWhenDefined(I2,
true))
1680 return Cmp1->getPredicate() == Cmp2->getSwappedPredicate() &&
1681 Cmp1->getOperand(0) == Cmp2->getOperand(1) &&
1682 Cmp1->getOperand(1) == Cmp2->getOperand(0);
1684 if (I1->isCommutative() && I1->isSameOperationAs(I2)) {
1685 return I1->getOperand(0) == I2->
getOperand(1) &&
1751 auto &Context = BI->getParent()->getContext();
1756 Value *Mask =
nullptr;
1757 Value *MaskFalse =
nullptr;
1758 Value *MaskTrue =
nullptr;
1759 if (Invert.has_value()) {
1760 IRBuilder<> Builder(Sel ? Sel : SpeculatedConditionalLoadsStores.
back());
1761 Mask = Builder.CreateBitCast(
1766 MaskFalse = Builder.CreateBitCast(
1768 MaskTrue = Builder.CreateBitCast(
Cond, VCondTy);
1770 auto PeekThroughBitcasts = [](
Value *V) {
1772 V = BitCast->getOperand(0);
1775 for (
auto *
I : SpeculatedConditionalLoadsStores) {
1777 if (!Invert.has_value())
1778 Mask =
I->getParent() == BI->getSuccessor(0) ? MaskTrue : MaskFalse;
1783 auto *Op0 =
I->getOperand(0);
1784 CallInst *MaskedLoadStore =
nullptr;
1787 auto *Ty =
I->getType();
1789 Value *PassThru =
nullptr;
1790 if (Invert.has_value())
1791 for (
User *U :
I->users()) {
1793 PassThru = Builder.CreateBitCast(
1802 Builder.SetInsertPoint(Ins);
1805 MaskedLoadStore = Builder.CreateMaskedLoad(
1807 Value *NewLoadStore = Builder.CreateBitCast(MaskedLoadStore, Ty);
1810 I->replaceAllUsesWith(NewLoadStore);
1813 auto *StoredVal = Builder.CreateBitCast(
1815 MaskedLoadStore = Builder.CreateMaskedStore(
1826 if (
const MDNode *Ranges =
I->getMetadata(LLVMContext::MD_range))
1828 I->dropUBImplyingAttrsAndUnknownMetadata({LLVMContext::MD_annotation});
1832 I->eraseMetadataIf([](
unsigned MDKind,
MDNode *
Node) {
1833 return Node->getMetadataID() == Metadata::DIAssignIDKind;
1836 I->eraseFromParent();
1843 bool IsStore =
false;
1866bool SimplifyCFGOpt::hoistCommonCodeFromSuccessors(Instruction *TI,
1867 bool AllInstsEqOnly) {
1883 for (
auto *Succ : UniqueSuccessors) {
1899 using SuccIterPair = std::pair<BasicBlock::iterator, unsigned>;
1901 for (
auto *Succ : UniqueSuccessors) {
1905 SuccIterPairs.
push_back(SuccIterPair(SuccItr, 0));
1908 if (AllInstsEqOnly) {
1914 unsigned Size0 = UniqueSuccessors[0]->size();
1915 Instruction *Term0 = UniqueSuccessors[0]->getTerminator();
1919 Succ->
size() == Size0;
1923 LockstepReverseIterator<true> LRI(UniqueSuccessors.getArrayRef());
1924 while (LRI.isValid()) {
1926 if (
any_of(*LRI, [I0](Instruction *
I) {
1940 unsigned NumSkipped = 0;
1943 if (SuccIterPairs.
size() > 2) {
1946 if (SuccIterPairs.
size() < 2)
1953 auto *SuccIterPairBegin = SuccIterPairs.
begin();
1954 auto &BB1ItrPair = *SuccIterPairBegin++;
1955 auto OtherSuccIterPairRange =
1961 bool AllInstsAreIdentical =
true;
1962 bool HasTerminator =
I1->isTerminator();
1963 for (
auto &SuccIter : OtherSuccIterRange) {
1967 MMRAMetadata(*I1) != MMRAMetadata(*I2)))
1968 AllInstsAreIdentical =
false;
1971 SmallVector<Instruction *, 8> OtherInsts;
1972 for (
auto &SuccIter : OtherSuccIterRange)
1977 if (HasTerminator) {
1981 if (NumSkipped || !AllInstsAreIdentical) {
1986 return hoistSuccIdenticalTerminatorToSwitchOrIf(
1987 TI, I1, OtherInsts, UniqueSuccessors.getArrayRef()) ||
1991 if (AllInstsAreIdentical) {
1992 unsigned SkipFlagsBB1 = BB1ItrPair.second;
1993 AllInstsAreIdentical =
1995 all_of(OtherSuccIterPairRange, [=](
const auto &Pair) {
1997 unsigned SkipFlagsBB2 = Pair.second;
2012 AllInstsAreIdentical && CI && CI->isMustTailCall()) {
2013 AllInstsAreIdentical =
2014 NumSkipped == 0 &&
all_of(SuccIterPairs, [](
const SuccIterPair &
P) {
2019 if (AllInstsAreIdentical) {
2029 for (
auto &SuccIter : OtherSuccIterRange) {
2037 assert(
Success &&
"We should not be trying to hoist callbases "
2038 "with non-intersectable attributes");
2050 NumHoistCommonCode += SuccIterPairs.
size();
2052 NumHoistCommonInstrs += SuccIterPairs.
size();
2061 for (
auto &SuccIterPair : SuccIterPairs) {
2070bool SimplifyCFGOpt::hoistSuccIdenticalTerminatorToSwitchOrIf(
2071 Instruction *TI, Instruction *I1,
2072 SmallVectorImpl<Instruction *> &OtherSuccTIs,
2082 auto *I2 = *OtherSuccTIs.
begin();
2102 for (PHINode &PN : Succ->
phis()) {
2103 Value *BB1V = PN.getIncomingValueForBlock(BB1);
2104 for (Instruction *OtherSuccTI : OtherSuccTIs) {
2105 Value *BB2V = PN.getIncomingValueForBlock(OtherSuccTI->getParent());
2125 if (!
NT->getType()->isVoidTy()) {
2126 I1->replaceAllUsesWith(NT);
2127 for (Instruction *OtherSuccTI : OtherSuccTIs)
2128 OtherSuccTI->replaceAllUsesWith(NT);
2132 NumHoistCommonInstrs += OtherSuccTIs.size() + 1;
2138 for (
auto *OtherSuccTI : OtherSuccTIs)
2139 Locs.
push_back(OtherSuccTI->getDebugLoc());
2151 std::map<std::pair<Value *, Value *>, SelectInst *> InsertedSelects;
2153 for (PHINode &PN : Succ->
phis()) {
2154 Value *BB1V = PN.getIncomingValueForBlock(BB1);
2155 Value *BB2V = PN.getIncomingValueForBlock(BB2);
2161 SelectInst *&
SI = InsertedSelects[std::make_pair(BB1V, BB2V)];
2171 for (
unsigned i = 0, e = PN.getNumIncomingValues(); i != e; ++i)
2172 if (PN.getIncomingBlock(i) == BB1 || PN.getIncomingBlock(i) == BB2)
2173 PN.setIncomingValue(i, SI);
2184 Updates.
push_back({DominatorTree::Insert, TIParent, Succ});
2190 for (BasicBlock *Succ : UniqueSuccessors)
2191 Updates.
push_back({DominatorTree::Delete, TIParent, Succ});
2205 if (
I->isIntDivRem())
2220 std::optional<unsigned> NumUses;
2221 for (
auto *
I : Insts) {
2224 I->getType()->isTokenTy())
2229 if (
I->getParent()->getSingleSuccessor() ==
I->getParent())
2237 if (
C->isInlineAsm() ||
C->cannotMerge() ||
C->isConvergent())
2241 NumUses =
I->getNumUses();
2242 else if (NumUses !=
I->getNumUses())
2248 for (
auto *
I : Insts) {
2262 for (
const Use &U : I0->
uses()) {
2263 auto It = PHIOperands.find(&U);
2264 if (It == PHIOperands.end())
2267 if (!
equal(Insts, It->second))
2281 if (HaveIndirectCalls) {
2282 if (!AllCallsAreIndirect)
2286 Value *Callee =
nullptr;
2290 Callee = CurrCallee;
2291 else if (Callee != CurrCallee)
2297 for (
unsigned OI = 0, OE = I0->
getNumOperands(); OI != OE; ++OI) {
2303 if (!
all_of(Insts, SameAsI0)) {
2309 for (
auto *
I : Insts)
2310 Ops.push_back(
I->getOperand(OI));
2320 auto *BBEnd = Blocks[0]->getTerminator()->getSuccessor(0);
2325 for (
auto *BB : Blocks) {
2327 I =
I->getPrevNode();
2352 assert(!
Op->getType()->isTokenTy() &&
"Can't PHI tokens!");
2355 PN->insertBefore(BBEnd->begin());
2356 for (
auto *
I : Insts)
2357 PN->addIncoming(
I->getOperand(O),
I->getParent());
2366 I0->
moveBefore(*BBEnd, BBEnd->getFirstInsertionPt());
2369 for (
auto *
I : Insts)
2383 assert(
Success &&
"We should not be trying to sink callbases "
2384 "with non-intersectable attributes");
2395 PN->replaceAllUsesWith(I0);
2396 PN->eraseFromParent();
2400 for (
auto *
I : Insts) {
2405 assert(
I->user_empty() &&
"Inst unexpectedly still has non-dbg users");
2406 I->replaceAllUsesWith(I0);
2407 I->eraseFromParent();
2457 bool HaveNonUnconditionalPredecessors =
false;
2463 HaveNonUnconditionalPredecessors =
true;
2465 if (UnconditionalPreds.
size() < 2)
2478 for (
const Use &U : PN.incoming_values())
2479 IncomingVals.
insert({PN.getIncomingBlock(U), &U});
2480 auto &
Ops = PHIOperands[IncomingVals[UnconditionalPreds[0]]];
2482 Ops.push_back(*IncomingVals[Pred]);
2490 LLVM_DEBUG(
dbgs() <<
"SINK: instruction can be sunk: " << *(*LRI)[0]
2503 if (!followedByDeoptOrUnreachable) {
2505 auto IsMemOperand = [](
Use &U) {
2518 unsigned NumPHIInsts = 0;
2519 for (
Use &U : (*LRI)[0]->operands()) {
2520 auto It = PHIOperands.
find(&U);
2521 if (It != PHIOperands.
end() && !
all_of(It->second, [&](
Value *V) {
2522 return InstructionsToSink.contains(V);
2529 if (IsMemOperand(U) &&
2530 any_of(It->second, [](
Value *V) { return isa<GEPOperator>(V); }))
2537 LLVM_DEBUG(
dbgs() <<
"SINK: #phi insts: " << NumPHIInsts <<
"\n");
2538 return NumPHIInsts <= 1;
2555 while (Idx < ScanIdx) {
2556 if (!ProfitableToSinkInstruction(LRI)) {
2559 dbgs() <<
"SINK: stopping here, too many PHIs would be created!\n");
2572 if (Idx < ScanIdx) {
2575 InstructionsToSink = InstructionsProfitableToSink;
2581 !ProfitableToSinkInstruction(LRI) &&
2582 "We already know that the last instruction is unprofitable to sink");
2590 for (
auto *
I : *LRI)
2591 InstructionsProfitableToSink.
erase(
I);
2592 if (!ProfitableToSinkInstruction(LRI)) {
2595 InstructionsToSink = InstructionsProfitableToSink;
2609 if (HaveNonUnconditionalPredecessors) {
2610 if (!followedByDeoptOrUnreachable) {
2618 bool Profitable =
false;
2619 while (Idx < ScanIdx) {
2653 for (; SinkIdx != ScanIdx; ++SinkIdx) {
2655 << *UnconditionalPreds[0]->getTerminator()->getPrevNode()
2663 NumSinkCommonInstrs++;
2667 ++NumSinkCommonCode;
2673struct CompatibleSets {
2674 using SetTy = SmallVector<InvokeInst *, 2>;
2680 SetTy &getCompatibleSet(InvokeInst *
II);
2682 void insert(InvokeInst *
II);
2685CompatibleSets::SetTy &CompatibleSets::getCompatibleSet(InvokeInst *
II) {
2690 for (CompatibleSets::SetTy &Set : Sets) {
2691 if (CompatibleSets::shouldBelongToSameSet({
Set.front(),
II}))
2696 return Sets.emplace_back();
2699void CompatibleSets::insert(InvokeInst *
II) {
2700 getCompatibleSet(
II).emplace_back(
II);
2704 assert(Invokes.
size() == 2 &&
"Always called with exactly two candidates.");
2707 auto IsIllegalToMerge = [](InvokeInst *
II) {
2708 return II->cannotMerge() ||
II->isInlineAsm();
2710 if (
any_of(Invokes, IsIllegalToMerge))
2718 if (HaveIndirectCalls) {
2719 if (!AllCallsAreIndirect)
2724 for (InvokeInst *
II : Invokes) {
2725 Value *CurrCallee =
II->getCalledOperand();
2726 assert(CurrCallee &&
"There is always a called operand.");
2729 else if (Callee != CurrCallee)
2736 auto HasNormalDest = [](InvokeInst *
II) {
2739 if (
any_of(Invokes, HasNormalDest)) {
2742 if (!
all_of(Invokes, HasNormalDest))
2747 for (InvokeInst *
II : Invokes) {
2749 assert(CurrNormalBB &&
"There is always a 'continue to' basic block.");
2751 NormalBB = CurrNormalBB;
2752 else if (NormalBB != CurrNormalBB)
2760 NormalBB, {Invokes[0]->getParent(), Invokes[1]->getParent()},
2769 for (InvokeInst *
II : Invokes) {
2771 assert(CurrUnwindBB &&
"There is always an 'unwind to' basic block.");
2773 UnwindBB = CurrUnwindBB;
2775 assert(UnwindBB == CurrUnwindBB &&
"Unexpected unwind destination.");
2782 Invokes.front()->getUnwindDest(),
2783 {Invokes[0]->getParent(), Invokes[1]->getParent()}))
2788 const InvokeInst *II0 = Invokes.front();
2789 for (
auto *
II : Invokes.drop_front())
2794 auto IsIllegalToMergeArguments = [](
auto Ops) {
2795 Use &U0 = std::get<0>(
Ops);
2796 Use &U1 = std::get<1>(
Ops);
2802 assert(Invokes.size() == 2 &&
"Always called with exactly two candidates.");
2803 if (
any_of(
zip(Invokes[0]->data_ops(), Invokes[1]->data_ops()),
2804 IsIllegalToMergeArguments))
2816 assert(Invokes.
size() >= 2 &&
"Must have at least two invokes to merge.");
2822 bool HasNormalDest =
2827 InvokeInst *MergedInvoke = [&Invokes, HasNormalDest]() {
2831 II0->
getParent()->getIterator()->getNextNode();
2836 Ctx, II0BB->
getName() +
".invoke", Func, InsertBeforeBlock);
2840 MergedInvoke->
insertInto(MergedInvokeBB, MergedInvokeBB->
end());
2842 if (!HasNormalDest) {
2846 Ctx, II0BB->
getName() +
".cont", Func, InsertBeforeBlock);
2854 return MergedInvoke;
2868 SuccBBOfMergedInvoke});
2891 return II->getOperand(U.getOperandNo()) != U.get();
2910 Invokes.
front()->getParent());
2918 if (!MergedDebugLoc)
2919 MergedDebugLoc =
II->getDebugLoc();
2927 OrigSuccBB->removePredecessor(
II->getParent());
2931 BI->setDebugLoc(
II->getDebugLoc());
2933 assert(
Success &&
"Merged invokes with incompatible attributes");
2936 II->replaceAllUsesWith(MergedInvoke);
2937 II->eraseFromParent();
2941 ++NumInvokeSetsFormed;
2977 CompatibleSets Grouper;
2987 if (Invokes.
size() < 2)
2999class EphemeralValueTracker {
3000 SmallPtrSet<const Instruction *, 32> EphValues;
3002 bool isEphemeral(
const Instruction *
I) {
3005 return !
I->mayHaveSideEffects() && !
I->isTerminator() &&
3006 all_of(
I->users(), [&](
const User *U) {
3007 return EphValues.count(cast<Instruction>(U));
3012 bool track(
const Instruction *
I) {
3013 if (isEphemeral(
I)) {
3064 unsigned MaxNumInstToLookAt = 9;
3068 if (!MaxNumInstToLookAt)
3070 --MaxNumInstToLookAt;
3083 if (
SI->getPointerOperand() == StorePtr &&
3084 SI->getValueOperand()->getType() == StoreTy &&
SI->isSimple() &&
3087 return SI->getValueOperand();
3092 if (LI->getPointerOperand() == StorePtr && LI->
getType() == StoreTy &&
3093 LI->isSimple() && LI->getAlign() >= StoreToHoist->
getAlign()) {
3095 bool ExplicitlyDereferenceableOnly;
3103 (!ExplicitlyDereferenceableOnly ||
3121 unsigned &SpeculatedInstructions,
3129 bool HaveRewritablePHIs =
false;
3131 Value *OrigV = PN.getIncomingValueForBlock(BB);
3132 Value *ThenV = PN.getIncomingValueForBlock(ThenBB);
3139 Cost +=
TTI.getCmpSelInstrCost(Instruction::Select, PN.getType(),
3148 HaveRewritablePHIs =
true;
3151 if (!OrigCE && !ThenCE)
3158 if (OrigCost + ThenCost > MaxCost)
3165 ++SpeculatedInstructions;
3166 if (SpeculatedInstructions > 1)
3170 return HaveRewritablePHIs;
3174 std::optional<bool> Invert,
3178 if (BI->getMetadata(LLVMContext::MD_unpredictable))
3185 if (!Invert.has_value())
3188 uint64_t EndWeight = *Invert ? TWeight : FWeight;
3192 return BIEndProb < Likely;
3232bool SimplifyCFGOpt::speculativelyExecuteBB(CondBrInst *BI,
3233 BasicBlock *ThenBB) {
3249 bool Invert =
false;
3264 SmallDenseMap<Instruction *, unsigned, 4> SinkCandidateUseCounts;
3266 SmallVector<Instruction *, 4> SpeculatedPseudoProbes;
3268 unsigned SpeculatedInstructions = 0;
3269 bool HoistLoadsStores =
Options.HoistLoadsStoresWithCondFaulting;
3270 SmallVector<Instruction *, 2> SpeculatedConditionalLoadsStores;
3271 Value *SpeculatedStoreValue =
nullptr;
3272 StoreInst *SpeculatedStore =
nullptr;
3273 EphemeralValueTracker EphTracker;
3288 if (EphTracker.track(&
I))
3293 bool IsSafeCheapLoadStore = HoistLoadsStores &&
3295 SpeculatedConditionalLoadsStores.
size() <
3299 if (IsSafeCheapLoadStore)
3300 SpeculatedConditionalLoadsStores.
push_back(&
I);
3302 ++SpeculatedInstructions;
3304 if (SpeculatedInstructions > 1)
3308 if (!IsSafeCheapLoadStore &&
3311 (SpeculatedStoreValue =
3314 if (!IsSafeCheapLoadStore && !SpeculatedStoreValue &&
3320 if (!SpeculatedStore && SpeculatedStoreValue)
3326 for (Use &
Op :
I.operands()) {
3331 ++SinkCandidateUseCounts[OpI];
3338 for (
const auto &[Inst,
Count] : SinkCandidateUseCounts)
3339 if (Inst->hasNUses(
Count)) {
3340 ++SpeculatedInstructions;
3341 if (SpeculatedInstructions > 1)
3348 SpeculatedStore !=
nullptr || !SpeculatedConditionalLoadsStores.
empty();
3351 SpeculatedInstructions,
Cost,
TTI);
3352 if (!Convert ||
Cost > Budget)
3356 LLVM_DEBUG(
dbgs() <<
"SPECULATIVELY EXECUTING BB" << *ThenBB <<
"\n";);
3360 if (SpeculatedStoreValue) {
3364 Value *FalseV = SpeculatedStoreValue;
3368 BrCond, TrueV, FalseV,
"spec.store.select", BI);
3398 for (DbgVariableRecord *DbgAssign :
3401 DbgAssign->replaceVariableLocationOp(OrigV, S);
3411 if (!SpeculatedStoreValue || &
I != SpeculatedStore) {
3414 I.dropUBImplyingAttrsAndMetadata();
3417 if (EphTracker.contains(&
I)) {
3419 I.eraseFromParent();
3425 for (
auto &It : *ThenBB)
3430 !DVR || !DVR->isDbgAssign())
3431 It.dropOneDbgRecord(&DR);
3432 BB->
splice(BI->getIterator(), ThenBB, ThenBB->begin(),
3433 std::prev(ThenBB->end()));
3435 if (!SpeculatedConditionalLoadsStores.
empty())
3441 for (PHINode &PN : EndBB->
phis()) {
3442 unsigned OrigI = PN.getBasicBlockIndex(BB);
3443 unsigned ThenI = PN.getBasicBlockIndex(ThenBB);
3444 Value *OrigV = PN.getIncomingValue(OrigI);
3445 Value *ThenV = PN.getIncomingValue(ThenI);
3454 Value *TrueV = ThenV, *FalseV = OrigV;
3458 PN.setIncomingValue(OrigI, V);
3459 PN.setIncomingValue(ThenI, V);
3463 for (Instruction *
I : SpeculatedPseudoProbes)
3464 I->eraseFromParent();
3477 if (!ReachesNonLocalUses.
insert(BB).second)
3492 EphemeralValueTracker EphTracker;
3499 if (CI->cannotDuplicate() || CI->isConvergent())
3512 for (
User *U :
I.users()) {
3515 if (UsedInBB == BB) {
3519 NonLocalUseBlocks.
insert(UsedInBB);
3533 if (
I &&
I->getParent() == To)
3549static std::optional<bool>
3570 KnownValues[CB].
insert(Pred);
3574 if (KnownValues.
empty())
3599 if (!
findReaching(UseBB, BB, ReachesNonLocalUseBlocks))
3602 for (
const auto &Pair : KnownValues) {
3619 if (ReachesNonLocalUseBlocks.
contains(RealDest))
3624 <<
" has value " << *Pair.first <<
" in predecessors:\n";
3627 dbgs() <<
"Threading to destination " << RealDest->
getName() <<
".\n";
3637 EdgeBB->setName(RealDest->
getName() +
".critedge");
3638 EdgeBB->moveBefore(RealDest);
3648 TranslateMap[
Cond] = CB;
3661 N->insertInto(EdgeBB, InsertPt);
3664 N->setName(BBI->getName() +
".c");
3675 if (!BBI->use_empty())
3676 TranslateMap[&*BBI] = V;
3677 if (!
N->mayHaveSideEffects()) {
3678 N->eraseFromParent();
3683 if (!BBI->use_empty())
3684 TranslateMap[&*BBI] =
N;
3690 for (; SrcDbgCursor != BBI; ++SrcDbgCursor)
3691 N->cloneDebugInfoFrom(&*SrcDbgCursor);
3692 SrcDbgCursor = std::next(BBI);
3694 N->cloneDebugInfoFrom(&*BBI);
3703 for (; &*SrcDbgCursor != BI; ++SrcDbgCursor)
3704 InsertPt->cloneDebugInfoFrom(&*SrcDbgCursor);
3705 InsertPt->cloneDebugInfoFrom(BI);
3710 EdgeBI->setDebugLoc(BI->getDebugLoc());
3726 return std::nullopt;
3732bool SimplifyCFGOpt::foldCondBranchOnValueKnownInPredecessor(CondBrInst *BI) {
3739 std::optional<bool>
Result;
3740 bool EverChanged =
false;
3746 }
while (Result == std::nullopt);
3755 bool SpeculateUnpredictables) {
3777 return isa<UncondBrInst>(IfBlock->getTerminator());
3780 "Will have either one or two blocks to speculate.");
3787 bool IsUnpredictable = DomBI->getMetadata(LLVMContext::MD_unpredictable);
3788 if (!IsUnpredictable) {
3791 (TWeight + FWeight) != 0) {
3796 if (IfBlocks.
size() == 1) {
3798 DomBI->
getSuccessor(0) == BB ? BITrueProb : BIFalseProb;
3799 if (BIBBProb >= Likely)
3802 if (BITrueProb >= Likely || BIFalseProb >= Likely)
3811 if (IfCondPhiInst->getParent() == BB)
3819 unsigned NumPhis = 0;
3832 if (SpeculateUnpredictables && IsUnpredictable)
3833 Budget +=
TTI.getBranchMispredictPenalty();
3846 AggressiveInsts, Cost, Budget,
TTI, AC,
3847 ZeroCostInstructions) ||
3849 AggressiveInsts, Cost, Budget,
TTI, AC,
3850 ZeroCostInstructions))
3863 auto IsBinOpOrAndEq = [](
Value *V) {
3886 if (!AggressiveInsts.
count(&*
I) && !
I->isDebugOrPseudoInst()) {
3899 if (IsUnpredictable)
dbgs() <<
" (unpredictable)";
3901 <<
" F: " << IfFalse->
getName() <<
"\n");
3918 Value *Sel = Builder.CreateSelectFMF(IfCond, TrueVal, FalseVal,
3923 PN->eraseFromParent();
3929 Builder.CreateBr(BB);
3938 DomBI->eraseFromParent();
3950 return Builder.CreateBinOp(
Opc,
LHS,
RHS, Name);
3951 if (
Opc == Instruction::And)
3952 return Builder.CreateLogicalAnd(
LHS,
RHS, Name);
3953 if (
Opc == Instruction::Or)
3954 return Builder.CreateLogicalOr(
LHS,
RHS, Name);
3966 bool PredHasWeights =
3968 bool SuccHasWeights =
3970 if (PredHasWeights || SuccHasWeights) {
3971 if (!PredHasWeights)
3972 PredTrueWeight = PredFalseWeight = 1;
3973 if (!SuccHasWeights)
3974 SuccTrueWeight = SuccFalseWeight = 1;
3984static std::optional<std::tuple<BasicBlock *, Instruction::BinaryOps, bool>>
3987 assert(BI && PBI &&
"Both blocks must end with a conditional branches.");
3989 "PredBB must be a predecessor of BB.");
3995 if (
TTI && !PBI->getMetadata(LLVMContext::MD_unpredictable) &&
3997 (PTWeight + PFWeight) != 0) {
4000 Likely =
TTI->getPredictableBranchThreshold();
4005 if (PBITrueProb.
isUnknown() || PBITrueProb < Likely)
4006 return {{BI->
getSuccessor(0), Instruction::Or,
false}};
4010 return {{BI->
getSuccessor(1), Instruction::And,
false}};
4013 if (PBITrueProb.
isUnknown() || PBITrueProb < Likely)
4014 return {{BI->
getSuccessor(1), Instruction::And,
true}};
4020 return std::nullopt;
4033 bool InvertPredCond;
4034 std::tie(CommonSucc,
Opc, InvertPredCond) =
4037 LLVM_DEBUG(
dbgs() <<
"FOLDING BRANCH TO COMMON DEST:\n" << *PBI << *BB);
4045 I->copyMetadata(*BB->
getTerminator(), LLVMContext::MD_annotation);
4050 if (InvertPredCond) {
4063 uint64_t PredTrueWeight, PredFalseWeight, SuccTrueWeight, SuccFalseWeight;
4066 SuccTrueWeight, SuccFalseWeight)) {
4072 MDWeights.
push_back(PredTrueWeight * SuccTrueWeight);
4077 MDWeights.
push_back(PredFalseWeight * (SuccFalseWeight + SuccTrueWeight) +
4078 PredTrueWeight * SuccFalseWeight);
4084 MDWeights.
push_back(PredTrueWeight * (SuccFalseWeight + SuccTrueWeight) +
4085 PredFalseWeight * SuccTrueWeight);
4087 MDWeights.
push_back(PredFalseWeight * SuccFalseWeight);
4096 PBI->setMetadata(LLVMContext::MD_prof,
nullptr);
4107 if (
MDNode *LoopMD = BI->getMetadata(LLVMContext::MD_loop))
4108 PBI->setMetadata(LLVMContext::MD_loop, LoopMD);
4129 if (!MDWeights.
empty()) {
4130 assert(isSelectInRoleOfConjunctionOrDisjunction(
SI));
4135 ++NumFoldBranchToCommonDest;
4142 return I.getType()->isVectorTy() ||
any_of(
I.operands(), [](
Use &U) {
4143 return U->getType()->isVectorTy();
4154 unsigned BonusInstThreshold) {
4163 Cond->getParent() != BB || !
Cond->hasOneUse())
4184 bool InvertPredCond;
4186 std::tie(CommonSucc,
Opc, InvertPredCond) = *Recipe;
4218 unsigned NumBonusInsts = 0;
4219 bool SawVectorOp =
false;
4220 const unsigned PredCount = Preds.
size();
4224 PredCount == 1 ? Preds[0]->getTerminator() :
nullptr;
4244 NumBonusInsts += PredCount;
4252 auto IsBCSSAUse = [BB, &
I](
Use &U) {
4255 return PN->getIncomingBlock(U) == BB;
4256 return UI->
getParent() == BB &&
I.comesBefore(UI);
4260 if (!
all_of(
I.uses(), IsBCSSAUse))
4264 BonusInstThreshold *
4280 for (
auto *BB : {BB1, BB2}) {
4296 Value *AlternativeV =
nullptr) {
4322 BasicBlock *OtherPredBB = *PredI == BB ? *++PredI : *PredI;
4323 if (
PHI->getIncomingValueForBlock(OtherPredBB) == AlternativeV)
4331 if (!AlternativeV &&
4337 PHI->addIncoming(V, BB);
4347 BasicBlock *PostBB,
Value *Address,
bool InvertPCond,
bool InvertQCond,
4356 if (!PStore || !QStore)
4379 if (
I.mayReadOrWriteMemory())
4381 for (
auto &
I : *QFB)
4382 if (&
I != QStore &&
I.mayReadOrWriteMemory())
4385 for (
auto &
I : *QTB)
4386 if (&
I != QStore &&
I.mayReadOrWriteMemory())
4390 if (&*
I != PStore &&
I->mayReadOrWriteMemory())
4404 for (
auto &
I : *BB) {
4406 if (
I.isTerminator())
4424 "When we run out of budget we will eagerly return from within the "
4425 "per-instruction loop.");
4429 const std::array<StoreInst *, 2> FreeStores = {PStore, QStore};
4431 (!IsWorthwhile(PTB, FreeStores) || !IsWorthwhile(PFB, FreeStores) ||
4432 !IsWorthwhile(QTB, FreeStores) || !IsWorthwhile(QFB, FreeStores)))
4468 InvertPCond ^= (PStore->
getParent() != PTB);
4469 InvertQCond ^= (QStore->
getParent() != QTB);
4490 {CombinedWeights[0], CombinedWeights[1]},
4497 SI->copyMetadata(*QStore);
4503 DbgAssign->replaceVariableLocationOp(PStore->
getValueOperand(), QPHI);
4506 DbgAssign->replaceVariableLocationOp(QStore->
getValueOperand(), QPHI);
4569 bool InvertPCond =
false, InvertQCond =
false;
4571 if (PFB == QBI->getParent()) {
4575 if (QFB == PostBB) {
4582 if (PTB == QBI->getParent())
4593 if (!HasOnePredAndOneSucc(PFB, PBI->getParent(), QBI->getParent()) ||
4594 !HasOnePredAndOneSucc(QFB, QBI->getParent(), PostBB))
4596 if ((PTB && !HasOnePredAndOneSucc(PTB, PBI->getParent(), QBI->getParent())) ||
4597 (QTB && !HasOnePredAndOneSucc(QTB, QBI->getParent(), PostBB)))
4599 if (!QBI->getParent()->hasNUses(2))
4605 for (
auto *BB : {PTB, PFB}) {
4610 PStoreAddresses.
insert(
SI->getPointerOperand());
4612 for (
auto *BB : {QTB, QFB}) {
4617 QStoreAddresses.
insert(
SI->getPointerOperand());
4623 auto &CommonAddresses = PStoreAddresses;
4626 for (
auto *Address : CommonAddresses)
4629 InvertPCond, InvertQCond, DTU,
DL,
TTI);
4647 !BI->getParent()->getSinglePredecessor())
4649 if (!IfFalseBB->
phis().empty())
4659 return I.mayWriteToMemory() ||
I.mayHaveSideEffects();
4664 NoSideEffects(*BI->getParent())) {
4676 NoSideEffects(*BI->getParent())) {
4733 if (&*BB->
begin() != BI)
4761 if (!PBI->getMetadata(LLVMContext::MD_unpredictable) &&
4763 (
static_cast<uint64_t>(PredWeights[0]) + PredWeights[1]) != 0) {
4767 static_cast<uint64_t>(PredWeights[0]) + PredWeights[1]);
4770 if (CommonDestProb >= Likely)
4780 unsigned NumPhis = 0;
4791 <<
"AND: " << *BI->getParent());
4802 if (OtherDest == BB) {
4810 OtherDest = InfLoopBlock;
4822 PBICond = Builder.CreateNot(PBICond, PBICond->
getName() +
".not");
4826 BICond = Builder.CreateNot(BICond, BICond->
getName() +
".not");
4830 createLogicalOp(Builder, Instruction::Or, PBICond, BICond,
"brmerge");
4845 uint64_t PredTrueWeight, PredFalseWeight, SuccTrueWeight, SuccFalseWeight;
4846 uint64_t PredCommon, PredOther, SuccCommon, SuccOther;
4849 SuccTrueWeight, SuccFalseWeight);
4851 PredCommon = PBIOp ? PredFalseWeight : PredTrueWeight;
4852 PredOther = PBIOp ? PredTrueWeight : PredFalseWeight;
4853 SuccCommon = BIOp ? SuccFalseWeight : SuccTrueWeight;
4854 SuccOther = BIOp ? SuccTrueWeight : SuccFalseWeight;
4858 uint64_t NewWeights[2] = {PredCommon * (SuccCommon + SuccOther) +
4859 PredOther * SuccCommon,
4860 PredOther * SuccOther};
4868 assert(isSelectInRoleOfConjunctionOrDisjunction(
SI));
4870 assert(
SI->getCondition() == PBICond);
4887 Value *BIV = PN.getIncomingValueForBlock(BB);
4888 unsigned PBBIdx = PN.getBasicBlockIndex(PBI->getParent());
4889 Value *PBIV = PN.getIncomingValue(PBBIdx);
4893 Builder.CreateSelect(PBICond, PBIV, BIV, PBIV->
getName() +
".mux"));
4894 PN.setIncomingValue(PBBIdx, NV);
4898 uint64_t TrueWeight = PBIOp ? PredFalseWeight : PredTrueWeight;
4899 uint64_t FalseWeight = PBIOp ? PredTrueWeight : PredFalseWeight;
4919bool SimplifyCFGOpt::simplifyTerminatorOnSelect(Instruction *OldTerm,
4921 BasicBlock *FalseBB,
4922 uint32_t TrueWeight,
4923 uint32_t FalseWeight) {
4930 BasicBlock *KeepEdge2 = TrueBB != FalseBB ? FalseBB :
nullptr;
4932 SmallSetVector<BasicBlock *, 2> RemovedSuccessors;
4935 for (BasicBlock *Succ :
successors(OldTerm)) {
4937 if (Succ == KeepEdge1)
4938 KeepEdge1 =
nullptr;
4939 else if (Succ == KeepEdge2)
4940 KeepEdge2 =
nullptr;
4945 if (Succ != TrueBB && Succ != FalseBB)
4946 RemovedSuccessors.
insert(Succ);
4954 if (!KeepEdge1 && !KeepEdge2) {
4955 if (TrueBB == FalseBB) {
4966 }
else if (KeepEdge1 && (KeepEdge2 || TrueBB == FalseBB)) {
4986 SmallVector<DominatorTree::UpdateType, 2> Updates;
4988 for (
auto *RemovedSuccessor : RemovedSuccessors)
4989 Updates.
push_back({DominatorTree::Delete, BB, RemovedSuccessor});
5000bool SimplifyCFGOpt::simplifySwitchOnSelect(SwitchInst *SI,
5005 if (!TrueVal || !FalseVal)
5010 BasicBlock *TrueBB =
SI->findCaseValue(TrueVal)->getCaseSuccessor();
5011 BasicBlock *FalseBB =
SI->findCaseValue(FalseVal)->getCaseSuccessor();
5014 uint32_t TrueWeight = 0, FalseWeight = 0;
5015 SmallVector<uint64_t, 8> Weights;
5019 if (Weights.
size() == 1 +
SI->getNumCases()) {
5021 (uint32_t)Weights[
SI->findCaseValue(TrueVal)->getSuccessorIndex()];
5023 (uint32_t)Weights[
SI->findCaseValue(FalseVal)->getSuccessorIndex()];
5028 return simplifyTerminatorOnSelect(SI, Condition, TrueBB, FalseBB, TrueWeight,
5037bool SimplifyCFGOpt::simplifyIndirectBrOnSelect(IndirectBrInst *IBI,
5051 SmallVector<uint32_t> SelectBranchWeights(2);
5055 return simplifyTerminatorOnSelect(IBI,
SI->getCondition(), TrueBB, FalseBB,
5056 SelectBranchWeights[0],
5057 SelectBranchWeights[1]);
5077bool SimplifyCFGOpt::tryToSimplifyUncondBranchWithICmpInIt(
5081 return tryToSimplifyUncondBranchWithICmpSelectInIt(ICI,
nullptr, Builder);
5127bool SimplifyCFGOpt::tryToSimplifyUncondBranchWithICmpSelectInIt(
5146 ConstantInt *NewCaseVal;
5154 Value *SelectCond, *SelectTrueVal, *SelectFalseVal;
5160 SelectTrueVal = Builder.
getTrue();
5161 SelectFalseVal = Builder.
getFalse();
5164 SelectCond =
Select->getCondition();
5166 if (SelectCond != ICI)
5168 SelectTrueVal =
Select->getTrueValue();
5169 SelectFalseVal =
Select->getFalseValue();
5174 if (
SI->getCondition() != IcmpCond)
5180 if (
SI->getDefaultDest() != BB) {
5181 ConstantInt *VVal =
SI->findCaseDest(BB);
5182 assert(VVal &&
"Should have a unique destination value");
5190 return requestResimplify();
5196 if (
SI->findCaseValue(NewCaseVal) !=
SI->case_default()) {
5198 if (Predicate == ICmpInst::ICMP_EQ)
5206 return requestResimplify();
5213 if (PHIUse ==
nullptr || PHIUse != &SuccBlock->
front() ||
5219 Value *DefaultCst = SelectFalseVal;
5220 Value *NewCst = SelectTrueVal;
5228 Select->replaceAllUsesWith(DefaultCst);
5229 Select->eraseFromParent();
5235 SmallVector<DominatorTree::UpdateType, 2> Updates;
5242 SwitchInstProfUpdateWrapper SIW(*SI);
5243 auto W0 = SIW.getSuccessorWeight(0);
5246 NewW = ((uint64_t(*W0) + 1) >> 1);
5247 SIW.setSuccessorWeight(0, *NewW);
5249 SIW.addCase(NewCaseVal, NewBB, NewW);
5251 Updates.
push_back({DominatorTree::Insert, Pred, NewBB});
5260 Updates.
push_back({DominatorTree::Insert, NewBB, SuccBlock});
5268bool SimplifyCFGOpt::simplifyBranchOnICmpChain(CondBrInst *BI,
5270 const DataLayout &
DL) {
5280 ConstantComparesGatherer ConstantCompare(
Cond,
DL);
5282 SmallVectorImpl<ConstantInt *> &
Values = ConstantCompare.Vals;
5283 Value *CompVal = ConstantCompare.CompValue;
5284 unsigned UsedICmps = ConstantCompare.UsedICmps;
5285 Value *ExtraCase = ConstantCompare.Extra;
5286 bool TrueWhenEqual = ConstantCompare.IsEq;
5303 if (ExtraCase &&
Values.size() < 2)
5306 SmallVector<uint32_t> BranchWeights;
5313 if (!TrueWhenEqual) {
5316 std::swap(BranchWeights[0], BranchWeights[1]);
5322 <<
" cases into SWITCH. BB is:\n"
5325 SmallVector<DominatorTree::UpdateType, 2> Updates;
5332 nullptr,
"switch.early.test");
5343 AssumptionCache *AC =
Options.AC;
5349 auto *Br = TrueWhenEqual ? Builder.
CreateCondBr(ExtraCase, EdgeBB, NewBB)
5356 Updates.
push_back({DominatorTree::Insert, BB, EdgeBB});
5362 LLVM_DEBUG(
dbgs() <<
" ** 'icmp' chain unhandled condition: " << *ExtraCase
5363 <<
"\nEXTRABB = " << *BB);
5371 "Should not end up here with unstable pointers");
5373 CompVal,
DL.getIntPtrType(CompVal->
getType()),
"magicptr");
5378 if (
Values.front()->getValue() -
Values.back()->getValue() ==
5381 Values.back()->getValue(),
Values.front()->getValue() + 1);
5383 ICmpInst::Predicate Pred;
5401 SmallVector<uint32_t> NewWeights(
Values.size() + 1);
5402 NewWeights[0] = BranchWeights[1];
5405 V = BranchWeights[0] /
Values.size();
5410 for (ConstantInt *Val :
Values)
5411 New->addCase(Val, EdgeBB);
5419 for (
unsigned i = 0, e =
Values.size() - 1; i != e; ++i)
5429 LLVM_DEBUG(
dbgs() <<
" ** 'icmp' chain result is:\n" << *BB <<
'\n');
5433bool SimplifyCFGOpt::simplifyResume(ResumeInst *RI,
IRBuilder<> &Builder) {
5435 return simplifyCommonResume(RI);
5439 return simplifySingleResume(RI);
5452 switch (IntrinsicID) {
5453 case Intrinsic::dbg_declare:
5454 case Intrinsic::dbg_value:
5455 case Intrinsic::dbg_label:
5456 case Intrinsic::lifetime_end:
5466bool SimplifyCFGOpt::simplifyCommonResume(ResumeInst *RI) {
5475 SmallSetVector<BasicBlock *, 4> TrivialUnwindBlocks;
5479 for (
unsigned Idx = 0, End = PhiLPInst->getNumIncomingValues(); Idx != End;
5481 auto *IncomingBB = PhiLPInst->getIncomingBlock(Idx);
5482 auto *IncomingValue = PhiLPInst->getIncomingValue(Idx);
5486 if (IncomingBB->getUniqueSuccessor() != BB)
5491 if (IncomingValue != LandingPad)
5495 make_range(LandingPad->getNextNode(), IncomingBB->getTerminator())))
5496 TrivialUnwindBlocks.
insert(IncomingBB);
5500 if (TrivialUnwindBlocks.
empty())
5504 for (
auto *TrivialBB : TrivialUnwindBlocks) {
5508 while (PhiLPInst->getBasicBlockIndex(TrivialBB) != -1)
5511 for (BasicBlock *Pred :
5522 TrivialBB->getTerminator()->eraseFromParent();
5523 new UnreachableInst(RI->
getContext(), TrivialBB);
5525 DTU->
applyUpdates({{DominatorTree::Delete, TrivialBB, BB}});
5532 return !TrivialUnwindBlocks.empty();
5536bool SimplifyCFGOpt::simplifySingleResume(ResumeInst *RI) {
5540 "Resume must unwind the exception that caused control to here");
5596 int Idx = DestPN.getBasicBlockIndex(BB);
5610 Value *SrcVal = DestPN.getIncomingValue(Idx);
5613 bool NeedPHITranslation = SrcPN && SrcPN->
getParent() == BB;
5617 DestPN.addIncoming(Incoming, Pred);
5644 std::vector<DominatorTree::UpdateType> Updates;
5648 if (UnwindDest ==
nullptr) {
5689 if (!SuccessorCleanupPad)
5698 SuccessorCleanupPad->eraseFromParent();
5707bool SimplifyCFGOpt::simplifyCleanupReturn(CleanupReturnInst *RI) {
5724bool SimplifyCFGOpt::simplifyUnreachable(UnreachableInst *UI) {
5756 BBI->dropDbgRecords();
5760 BBI->eraseFromParent();
5766 if (&BB->
front() != UI)
5769 std::vector<DominatorTree::UpdateType> Updates;
5772 for (BasicBlock *Predecessor : Preds) {
5780 Updates.push_back({DominatorTree::Delete, Predecessor, BB});
5791 "The destinations are guaranteed to be different here.");
5792 CallInst *Assumption;
5808 Updates.push_back({DominatorTree::Delete, Predecessor, BB});
5810 SwitchInstProfUpdateWrapper SU(*SI);
5811 for (
auto i = SU->case_begin(), e = SU->case_end(); i != e;) {
5812 if (i->getCaseSuccessor() != BB) {
5817 i = SU.removeCase(i);
5822 if (DTU &&
SI->getDefaultDest() != BB)
5823 Updates.push_back({DominatorTree::Delete, Predecessor, BB});
5825 if (
II->getUnwindDest() == BB) {
5831 if (!CI->doesNotThrow())
5832 CI->setDoesNotThrow();
5836 if (CSI->getUnwindDest() == BB) {
5847 E = CSI->handler_end();
5850 CSI->removeHandler(
I);
5857 Updates.push_back({DominatorTree::Delete, Predecessor, BB});
5858 if (CSI->getNumHandlers() == 0) {
5859 if (CSI->hasUnwindDest()) {
5863 for (
auto *PredecessorOfPredecessor :
predecessors(Predecessor)) {
5864 Updates.push_back({DominatorTree::Insert,
5865 PredecessorOfPredecessor,
5866 CSI->getUnwindDest()});
5867 Updates.push_back({DominatorTree::Delete,
5868 PredecessorOfPredecessor, Predecessor});
5871 Predecessor->replaceAllUsesWith(CSI->getUnwindDest());
5878 SmallVector<BasicBlock *, 8> EHPreds(
predecessors(Predecessor));
5879 for (BasicBlock *EHPred : EHPreds)
5883 new UnreachableInst(CSI->getContext(), CSI->getIterator());
5884 CSI->eraseFromParent();
5889 assert(CRI->hasUnwindDest() && CRI->getUnwindDest() == BB &&
5890 "Expected to always have an unwind to BB.");
5892 Updates.push_back({DominatorTree::Delete, Predecessor, BB});
5920static std::optional<ContiguousCasesResult>
5927 const APInt &Min = Cases.
back()->getValue();
5928 const APInt &Max = Cases.
front()->getValue();
5930 size_t ContiguousOffset = Cases.
size() - 1;
5931 if (
Offset == ContiguousOffset) {
5950 std::adjacent_find(Cases.
begin(), Cases.
end(), [](
auto L,
auto R) {
5951 return L->getValue() != R->getValue() + 1;
5953 if (It == Cases.
end())
5954 return std::nullopt;
5955 auto [OtherMax, OtherMin] = std::make_pair(*It, *std::next(It));
5956 if ((Max - OtherMax->getValue()) + (OtherMin->getValue() - Min) ==
5960 ConstantInt::get(OtherMin->getType(), OtherMin->getValue() + 1)),
5963 ConstantInt::get(OtherMax->getType(), OtherMax->getValue() - 1)),
5971 return std::nullopt;
5976 bool RemoveOrigDefaultBlock =
true) {
5978 auto *BB = Switch->getParent();
5979 auto *OrigDefaultBlock = Switch->getDefaultDest();
5980 if (RemoveOrigDefaultBlock)
5981 OrigDefaultBlock->removePredecessor(BB);
5985 auto *UI =
new UnreachableInst(Switch->getContext(), NewDefaultBlock);
5987 Switch->setDefaultDest(&*NewDefaultBlock);
5991 if (RemoveOrigDefaultBlock &&
6001bool SimplifyCFGOpt::turnSwitchRangeIntoICmp(SwitchInst *SI,
6003 assert(
SI->getNumCases() > 1 &&
"Degenerate switch?");
6005 bool HasDefault = !
SI->defaultDestUnreachable();
6007 auto *BB =
SI->getParent();
6009 BasicBlock *DestA = HasDefault ?
SI->getDefaultDest() :
nullptr;
6014 for (
auto Case :
SI->cases()) {
6018 if (Dest == DestA) {
6024 if (Dest == DestB) {
6034 "Single-destination switch should have been folded.");
6036 assert(DestB !=
SI->getDefaultDest());
6037 assert(!CasesB.
empty() &&
"There must be non-default cases.");
6041 std::optional<ContiguousCasesResult> ContiguousCases;
6044 if (!HasDefault && CasesA.
size() == 1)
6045 ContiguousCases = ContiguousCasesResult{
6053 else if (CasesB.
size() == 1)
6054 ContiguousCases = ContiguousCasesResult{
6063 else if (!HasDefault)
6067 if (!ContiguousCases)
6071 if (!ContiguousCases)
6074 auto [Min,
Max, Dest, OtherDest, Cases, OtherCases] = *ContiguousCases;
6080 Max->getValue() - Min->getValue() + 1);
6083 assert(
Max->getValue() == Min->getValue());
6088 else if (NumCases->
isNullValue() && !Cases->empty()) {
6092 if (!
Offset->isNullValue())
6100 SmallVector<uint64_t, 8> Weights;
6102 if (Weights.
size() == 1 +
SI->getNumCases()) {
6103 uint64_t TrueWeight = 0;
6104 uint64_t FalseWeight = 0;
6105 for (
size_t I = 0,
E = Weights.
size();
I !=
E; ++
I) {
6106 if (
SI->getSuccessor(
I) == Dest)
6107 TrueWeight += Weights[
I];
6109 FalseWeight += Weights[
I];
6111 while (TrueWeight > UINT32_MAX || FalseWeight > UINT32_MAX) {
6122 unsigned PreviousEdges = Cases->size();
6123 if (Dest ==
SI->getDefaultDest())
6125 for (
unsigned I = 0,
E = PreviousEdges - 1;
I !=
E; ++
I)
6126 PHI.removeIncomingValue(
SI->getParent());
6129 unsigned PreviousEdges = OtherCases->size();
6130 if (OtherDest ==
SI->getDefaultDest())
6132 unsigned E = PreviousEdges - 1;
6136 for (
unsigned I = 0;
I !=
E; ++
I)
6137 PHI.removeIncomingValue(
SI->getParent());
6145 auto *UnreachableDefault =
SI->getDefaultDest();
6148 SI->eraseFromParent();
6150 if (!HasDefault && DTU)
6151 DTU->
applyUpdates({{DominatorTree::Delete, BB, UnreachableDefault}});
6169 unsigned MaxSignificantBitsInCond =
6176 for (
const auto &Case :
SI->cases()) {
6177 auto *
Successor = Case.getCaseSuccessor();
6188 (IsKnownValuesValid && !KnownValues.
contains(CaseC))) {
6194 }
else if (IsKnownValuesValid)
6195 KnownValues.
erase(CaseC);
6202 bool HasDefault = !
SI->defaultDestUnreachable();
6203 const unsigned NumUnknownBits =
6206 if (HasDefault && DeadCases.
empty()) {
6212 if (NumUnknownBits < 64 ) {
6213 uint64_t AllNumCases = 1ULL << NumUnknownBits;
6214 if (
SI->getNumCases() == AllNumCases) {
6221 if (
SI->getNumCases() == AllNumCases - 1) {
6222 assert(NumUnknownBits > 1 &&
"Should be canonicalized to a branch");
6224 if (CondTy->getIntegerBitWidth() > 64 ||
6225 !
DL.fitsInLegalInteger(CondTy->getIntegerBitWidth()))
6229 for (
const auto &Case :
SI->cases())
6230 MissingCaseVal ^= Case.getCaseValue()->getValue().getLimitedValue();
6232 ConstantInt::get(
Cond->getType(), MissingCaseVal));
6234 SIW.
addCase(MissingCase,
SI->getDefaultDest(),
6244 if (DeadCases.
empty())
6250 assert(CaseI !=
SI->case_default() &&
6251 "Case was not found. Probably mistake in DeadCases forming.");
6253 CaseI->getCaseSuccessor()->removePredecessor(
SI->getParent());
6258 std::vector<DominatorTree::UpdateType> Updates;
6259 for (
auto *
Successor : UniqueSuccessors)
6260 if (NumPerSuccessorCases[
Successor] == 0)
6287 int Idx =
PHI.getBasicBlockIndex(BB);
6288 assert(Idx >= 0 &&
"PHI has no entry for predecessor?");
6290 Value *InValue =
PHI.getIncomingValue(Idx);
6291 if (InValue != CaseValue)
6307 ForwardingNodesMap ForwardingNodes;
6310 for (
const auto &Case :
SI->cases()) {
6312 BasicBlock *CaseDest = Case.getCaseSuccessor();
6331 int SwitchBBIdx = Phi.getBasicBlockIndex(SwitchBlock);
6332 if (Phi.getIncomingValue(SwitchBBIdx) == CaseValue &&
6333 count(Phi.blocks(), SwitchBlock) == 1) {
6334 Phi.setIncomingValue(SwitchBBIdx,
SI->getCondition());
6342 ForwardingNodes[Phi].push_back(PhiIdx);
6345 for (
auto &ForwardingNode : ForwardingNodes) {
6346 PHINode *Phi = ForwardingNode.first;
6352 for (
int Index : Indexes)
6353 Phi->setIncomingValue(Index,
SI->getCondition());
6363 if (
C->isThreadDependent())
6365 if (
C->isDLLImportDependent())
6373 if (
C->getType()->isScalableTy())
6384 if (!
TTI.shouldBuildLookupTablesForConstant(
C))
6411 if (
A->isAllOnesValue())
6413 if (
A->isNullValue())
6419 for (
unsigned N = 0,
E =
I->getNumOperands();
N !=
E; ++
N) {
6444 ConstantPool.insert(std::make_pair(
SI->getCondition(), CaseVal));
6446 if (
I.isTerminator()) {
6448 if (
I.getNumSuccessors() != 1 ||
I.isSpecialTerminator())
6451 CaseDest =
I.getSuccessor(0);
6458 for (
auto &
Use :
I.uses()) {
6461 if (
I->getParent() == CaseDest)
6464 if (Phi->getIncomingBlock(
Use) == CaseDest)
6477 *CommonDest = CaseDest;
6479 if (CaseDest != *CommonDest)
6484 int Idx =
PHI.getBasicBlockIndex(Pred);
6497 Res.push_back(std::make_pair(&
PHI, ConstVal));
6500 return Res.
size() > 0;
6506 SwitchCaseResultVectorTy &UniqueResults,
6508 for (
auto &
I : UniqueResults) {
6509 if (
I.first == Result) {
6510 I.second.push_back(CaseVal);
6511 return I.second.size();
6514 UniqueResults.push_back(
6525 SwitchCaseResultVectorTy &UniqueResults,
6530 for (
const auto &
I :
SI->cases()) {
6544 const size_t NumCasesForResult =
6552 if (UniqueResults.size() > MaxUniqueResults)
6568 DefaultResults.
size() == 1 ? DefaultResults.
begin()->second :
nullptr;
6570 return DefaultResult ||
SI->defaultDestUnreachable();
6591 const bool HasBranchWeights =
6594 if (ResultVector.size() == 2 && ResultVector[0].second.size() == 1 &&
6595 ResultVector[1].second.size() == 1) {
6596 ConstantInt *FirstCase = ResultVector[0].second[0];
6597 ConstantInt *SecondCase = ResultVector[1].second[0];
6598 Value *SelectValue = ResultVector[1].first;
6599 if (DefaultResult) {
6600 Value *ValueCompare =
6601 Builder.CreateICmpEQ(Condition, SecondCase,
"switch.selectcmp");
6602 SelectValue = Builder.CreateSelect(ValueCompare, ResultVector[1].first,
6603 DefaultResult,
"switch.select");
6605 SI && HasBranchWeights) {
6612 *
SI, {BranchWeights[2], BranchWeights[0] + BranchWeights[1]},
6616 Value *ValueCompare =
6617 Builder.CreateICmpEQ(Condition, FirstCase,
"switch.selectcmp");
6618 Value *Ret = Builder.CreateSelect(ValueCompare, ResultVector[0].first,
6619 SelectValue,
"switch.select");
6625 size_t FirstCasePos = (Condition !=
nullptr);
6626 size_t SecondCasePos = FirstCasePos + 1;
6627 uint32_t DefaultCase = (Condition !=
nullptr) ? BranchWeights[0] : 0;
6629 {BranchWeights[FirstCasePos],
6630 DefaultCase + BranchWeights[SecondCasePos]},
6637 if (ResultVector.size() == 1 && DefaultResult) {
6639 unsigned CaseCount = CaseValues.
size();
6652 for (
auto *Case : CaseValues) {
6653 if (Case->getValue().slt(MinCaseVal->
getValue()))
6655 AndMask &= Case->getValue();
6665 if (FreeBits ==
Log2_32(CaseCount)) {
6666 Value *
And = Builder.CreateAnd(Condition, AndMask);
6667 Value *Cmp = Builder.CreateICmpEQ(
6670 Builder.CreateSelect(Cmp, ResultVector[0].first, DefaultResult);
6686 for (
auto *Case : CaseValues)
6687 BitMask |= (Case->getValue() - MinCaseVal->
getValue());
6693 Condition = Builder.CreateSub(Condition, MinCaseVal);
6694 Value *
And = Builder.CreateAnd(Condition, ~BitMask,
"switch.and");
6695 Value *Cmp = Builder.CreateICmpEQ(
6698 Builder.CreateSelect(Cmp, ResultVector[0].first, DefaultResult);
6711 if (CaseValues.
size() == 2) {
6712 Value *Cmp1 = Builder.CreateICmpEQ(Condition, CaseValues[0],
6713 "switch.selectcmp.case1");
6714 Value *Cmp2 = Builder.CreateICmpEQ(Condition, CaseValues[1],
6715 "switch.selectcmp.case2");
6716 Value *Cmp = Builder.CreateOr(Cmp1, Cmp2,
"switch.selectcmp");
6718 Builder.CreateSelect(Cmp, ResultVector[0].first, DefaultResult);
6738 std::vector<DominatorTree::UpdateType> Updates;
6745 Builder.CreateBr(DestBB);
6749 PHI->removeIncomingValueIf(
6750 [&](
unsigned Idx) {
return PHI->getIncomingBlock(Idx) == SelectBB; });
6751 PHI->addIncoming(SelectValue, SelectBB);
6754 for (
unsigned i = 0, e =
SI->getNumSuccessors(); i < e; ++i) {
6760 if (DTU && RemovedSuccessors.
insert(Succ).second)
6763 SI->eraseFromParent();
6778 SwitchCaseResultVectorTy UniqueResults;
6784 assert(
PHI !=
nullptr &&
"PHI for value select not found");
6785 Builder.SetInsertPoint(
SI);
6788 [[maybe_unused]]
auto HasWeights =
6793 (BranchWeights.
size() >=
6794 UniqueResults.size() + (DefaultResult !=
nullptr)));
6797 Builder,
DL, BranchWeights);
6809class SwitchReplacement {
6816 const SmallVectorImpl<std::pair<ConstantInt *, Constant *>> &
Values,
6817 Constant *DefaultValue,
const DataLayout &
DL,
6818 const TargetTransformInfo &
TTI,
const StringRef &FuncName);
6827 static bool wouldFitInRegister(
const DataLayout &
DL, uint64_t TableSize,
6834 bool isLookupTable();
6871 ConstantInt *BitMap =
nullptr;
6872 IntegerType *BitMapElementTy =
nullptr;
6875 ConstantInt *LinearOffset =
nullptr;
6876 ConstantInt *LinearMultiplier =
nullptr;
6877 bool LinearMapValWrapped =
false;
6885SwitchReplacement::SwitchReplacement(
6887 const SmallVectorImpl<std::pair<ConstantInt *, Constant *>> &
Values,
6888 Constant *DefaultValue,
const DataLayout &
DL,
6889 const TargetTransformInfo &
TTI,
const StringRef &FuncName)
6890 : DefaultValue(DefaultValue) {
6891 assert(
Values.size() &&
"Can't build lookup table without values!");
6892 assert(TableSize >=
Values.size() &&
"Can't fit values in table!");
6895 SingleValue =
Values.begin()->second;
6901 for (
const auto &[CaseVal, CaseRes] :
Values) {
6904 uint64_t Idx = (CaseVal->getValue() -
Offset->getValue()).getLimitedValue();
6905 TableContents[Idx] = CaseRes;
6912 if (
Values.size() < TableSize) {
6914 "Need a default value to fill the lookup table holes.");
6917 if (!TableContents[
I])
6918 TableContents[
I] = DefaultValue;
6924 if (DefaultValue != SingleValue && !DefaultValueIsPoison)
6925 SingleValue =
nullptr;
6931 Kind = SingleValueKind;
6938 bool LinearMappingPossible =
true;
6943 bool NonMonotonic =
false;
6944 assert(TableSize >= 2 &&
"Should be a SingleValue table.");
6961 LinearMappingPossible =
false;
6966 APInt Dist = Val - PrevVal;
6969 }
else if (Dist != DistToPrev) {
6970 LinearMappingPossible =
false;
6978 if (LinearMappingPossible) {
6980 LinearMultiplier = ConstantInt::get(M.getContext(), DistToPrev);
6981 APInt M = LinearMultiplier->getValue();
6982 bool MayWrap =
true;
6983 if (
isIntN(M.getBitWidth(), TableSize - 1))
6984 (void)M.
smul_ov(
APInt(M.getBitWidth(), TableSize - 1), MayWrap);
6985 LinearMapValWrapped = NonMonotonic || MayWrap;
6986 Kind = LinearMapKind;
6992 if (wouldFitInRegister(
DL, TableSize,
ValueType)) {
6994 APInt TableInt(TableSize *
IT->getBitWidth(), 0);
6996 TableInt <<=
IT->getBitWidth();
7000 TableInt |= Val->
getValue().
zext(TableInt.getBitWidth());
7003 BitMap = ConstantInt::get(M.getContext(), TableInt);
7004 BitMapElementTy =
IT;
7015 unsigned NeededBitWidth =
7016 std::max(
TTI.getMinimumLookupTableEntryBitWidth(),
7029 Kind = LookupTableKind;
7035 case SingleValueKind:
7037 case LinearMapKind: {
7041 false,
"switch.idx.cast");
7042 if (!LinearMultiplier->
isOne())
7043 Result = Builder.
CreateMul(Result, LinearMultiplier,
"switch.idx.mult",
7045 !LinearMapValWrapped);
7047 if (!LinearOffset->
isZero())
7050 !LinearMapValWrapped);
7067 ShiftAmt, ConstantInt::get(MapTy, BitMapElementTy->
getBitWidth()),
7068 "switch.shiftamt",
true,
true);
7071 Value *DownShifted =
7072 Builder.
CreateLShr(BitMap, ShiftAmt,
"switch.downshift");
7074 return Builder.
CreateTrunc(DownShifted, BitMapElementTy,
"switch.masked");
7076 case LookupTableKind: {
7079 new GlobalVariable(*
Func->getParent(), Initializer->
getType(),
7080 true, GlobalVariable::PrivateLinkage,
7081 Initializer,
"switch.table." +
Func->getName());
7082 Table->setUnnamedAddr(GlobalValue::UnnamedAddr::Global);
7085 Table->setAlignment(
DL.getPrefTypeAlign(
ValueType));
7086 Type *IndexTy =
DL.getIndexType(Table->getType());
7089 if (
Index->getType() != IndexTy) {
7090 unsigned OldBitWidth =
Index->getType()->getIntegerBitWidth();
7094 isUIntN(OldBitWidth - 1, ArrayTy->getNumElements() - 1));
7097 Value *GEPIndices[] = {ConstantInt::get(IndexTy, 0),
Index};
7101 Builder.
CreateLoad(ArrayTy->getElementType(),
GEP,
"switch.load");
7110bool SwitchReplacement::wouldFitInRegister(
const DataLayout &
DL,
7112 Type *ElementType) {
7120 if (TableSize >= UINT_MAX /
IT->getBitWidth())
7122 return DL.fitsInLegalInteger(TableSize *
IT->getBitWidth());
7128 if (
TTI.isTypeLegal(Ty))
7143 DL.fitsInLegalInteger(
IT->getBitWidth());
7146Constant *SwitchReplacement::getDefaultValue() {
return DefaultValue; }
7148bool SwitchReplacement::isLookupTable() {
return Kind == LookupTableKind; }
7150bool SwitchReplacement::isBitMap() {
return Kind == BitMapKind; }
7157 const uint64_t MinDensity = OptSize ? 40 : 10;
7162 return NumCases * 100 >= CaseRange * MinDensity;
7183 if (
SI->getNumCases() > TableSize)
7186 bool AllTablesFitInRegister =
true;
7187 bool HasIllegalType =
false;
7188 for (
const auto &Ty : ResultTypes) {
7193 AllTablesFitInRegister =
7194 AllTablesFitInRegister &&
7195 SwitchReplacement::wouldFitInRegister(
DL, TableSize, Ty);
7200 if (HasIllegalType && !AllTablesFitInRegister)
7205 if (AllTablesFitInRegister)
7213 SI->getFunction()->hasOptSize());
7223 MaxCaseVal.
getLimitedValue() == std::numeric_limits<uint64_t>::max() ||
7226 return all_of(ResultTypes, [&](
const auto &ResultType) {
7227 return SwitchReplacement::wouldFitInRegister(
7277 if (DefaultConst != TrueConst && DefaultConst != FalseConst)
7282 for (
auto ValuePair :
Values) {
7285 if (!CaseConst || CaseConst == DefaultConst ||
7286 (CaseConst != TrueConst && CaseConst != FalseConst))
7294 BasicBlock *BranchBlock = RangeCheckBranch->getParent();
7300 if (DefaultConst == FalseConst) {
7303 ++NumTableCmpReuses;
7306 Value *InvertedTableCmp = BinaryOperator::CreateXor(
7307 RangeCmp, ConstantInt::get(RangeCmp->
getType(), 1),
"inverted.cmp",
7308 RangeCheckBranch->getIterator());
7310 ++NumTableCmpReuses;
7320 bool ConvertSwitchToLookupTable) {
7321 assert(
SI->getNumCases() > 1 &&
"Degenerate switch?");
7335 if (
SI->getNumCases() < 3)
7357 MinCaseVal = CaseVal;
7359 MaxCaseVal = CaseVal;
7376 It->second.push_back(std::make_pair(CaseVal,
Value));
7384 bool HasDefaultResults =
7386 DefaultResultsList,
DL,
TTI);
7387 for (
const auto &
I : DefaultResultsList) {
7390 DefaultResults[
PHI] = Result;
7394 *MinCaseVal, *MaxCaseVal, HasDefaultResults, ResultTypes,
DL,
TTI);
7397 if (UseSwitchConditionAsTableIndex) {
7399 TableIndexOffset = ConstantInt::get(MaxCaseVal->
getIntegerType(), 0);
7404 TableIndexOffset = MinCaseVal;
7411 bool DefaultIsReachable = !
SI->defaultDestUnreachable();
7413 bool TableHasHoles = (NumResults < TableSize);
7418 bool AllHolesArePoison = TableHasHoles && !HasDefaultResults;
7426 bool NeedMask = AllHolesArePoison && DefaultIsReachable;
7429 if (
SI->getNumCases() < 4)
7431 if (!
DL.fitsInLegalInteger(TableSize))
7440 if (UseSwitchConditionAsTableIndex) {
7441 TableIndex =
SI->getCondition();
7442 if (HasDefaultResults) {
7454 all_of(ResultTypes, [&](
const auto &ResultType) {
7455 return SwitchReplacement::wouldFitInRegister(
DL, UpperBound,
7460 TableSize = std::max(UpperBound, TableSize);
7463 DefaultIsReachable =
false;
7471 const auto &ResultList = ResultLists[
PHI];
7473 Type *ResultType = ResultList.begin()->second->getType();
7478 SwitchReplacement Replacement(*Fn->
getParent(), TableSize, TableIndexOffset,
7479 ResultList, DefaultVal,
DL,
TTI, FuncName);
7480 PhiToReplacementMap.
insert({
PHI, Replacement});
7483 bool AnyLookupTables =
any_of(
7484 PhiToReplacementMap, [](
auto &KV) {
return KV.second.isLookupTable(); });
7485 bool AnyBitMaps =
any_of(PhiToReplacementMap,
7486 [](
auto &KV) {
return KV.second.isBitMap(); });
7494 if (AnyLookupTables &&
7495 (!
TTI.shouldBuildLookupTables() ||
7501 if (!ConvertSwitchToLookupTable &&
7502 (AnyLookupTables || AnyBitMaps || NeedMask))
7505 Builder.SetInsertPoint(
SI);
7508 if (!UseSwitchConditionAsTableIndex) {
7511 bool MayWrap =
true;
7512 if (!DefaultIsReachable) {
7517 TableIndex = Builder.CreateSub(
SI->getCondition(), TableIndexOffset,
7518 "switch.tableidx",
false,
7522 std::vector<DominatorTree::UpdateType> Updates;
7528 assert(MaxTableSize >= TableSize &&
7529 "It is impossible for a switch to have more entries than the max "
7530 "representable value of its input integer type's size.");
7535 Mod.getContext(),
"switch.lookup", CommonDest->
getParent(), CommonDest);
7540 Builder.SetInsertPoint(
SI);
7541 const bool GeneratingCoveredLookupTable = (MaxTableSize == TableSize);
7542 if (!DefaultIsReachable || GeneratingCoveredLookupTable) {
7543 Builder.CreateBr(LookupBB);
7549 Value *Cmp = Builder.CreateICmpULT(
7550 TableIndex, ConstantInt::get(MinCaseVal->
getType(), TableSize));
7552 Builder.CreateCondBr(Cmp, LookupBB,
SI->getDefaultDest());
7553 CondBranch = RangeCheckBranch;
7559 Builder.SetInsertPoint(LookupBB);
7565 MaskBB->
setName(
"switch.hole_check");
7572 APInt MaskInt(TableSizePowOf2, 0);
7573 APInt One(TableSizePowOf2, 1);
7575 const ResultListTy &ResultList = ResultLists[PHIs[0]];
7576 for (
const auto &Result : ResultList) {
7579 MaskInt |= One << Idx;
7581 ConstantInt *TableMask = ConstantInt::get(
Mod.getContext(), MaskInt);
7588 Builder.CreateZExtOrTrunc(TableIndex, MapTy,
"switch.maskindex");
7589 Value *Shifted = Builder.CreateLShr(TableMask, MaskIndex,
"switch.shifted");
7590 Value *LoBit = Builder.CreateTrunc(
7592 CondBranch = Builder.CreateCondBr(LoBit, LookupBB,
SI->getDefaultDest());
7597 Builder.SetInsertPoint(LookupBB);
7601 if (!DefaultIsReachable || GeneratingCoveredLookupTable) {
7604 SI->getDefaultDest()->removePredecessor(BB,
7611 const ResultListTy &ResultList = ResultLists[
PHI];
7612 auto Replacement = PhiToReplacementMap.
at(
PHI);
7613 auto *Result = Replacement.replaceSwitch(TableIndex, Builder,
DL, Fn);
7616 if (!TableHasHoles && HasDefaultResults && RangeCheckBranch) {
7619 for (
auto *
User :
PHI->users()) {
7621 Replacement.getDefaultValue(), ResultList);
7625 PHI->addIncoming(Result, LookupBB);
7628 Builder.CreateBr(CommonDest);
7640 for (
unsigned I = 0,
E =
SI->getNumSuccessors();
I <
E; ++
I) {
7643 if (Succ ==
SI->getDefaultDest()) {
7644 if (HasBranchWeights)
7645 ToDefaultWeight += BranchWeights[
I];
7649 if (DTU && RemovedSuccessors.
insert(Succ).second)
7651 if (HasBranchWeights)
7652 ToLookupWeight += BranchWeights[
I];
7654 SI->eraseFromParent();
7655 if (HasBranchWeights)
7662 ++NumLookupTablesHoles;
7678 if (CondTy->getIntegerBitWidth() > 64 ||
7679 !
DL.fitsInLegalInteger(CondTy->getIntegerBitWidth()))
7683 if (
SI->getNumCases() < 4)
7691 for (
const auto &
C :
SI->cases())
7692 Values.push_back(
C.getCaseValue()->getValue().getSExtValue());
7714 unsigned Shift = 64;
7720 V = (int64_t)((
uint64_t)V >> Shift);
7737 Builder.SetInsertPoint(
SI);
7740 Value *Rot = Builder.CreateIntrinsic(
7741 Ty, Intrinsic::fshl,
7742 {
Sub,
Sub, ConstantInt::get(Ty, Ty->getBitWidth() - Shift)});
7743 SI->replaceUsesOfWith(
SI->getCondition(), Rot);
7745 for (
auto Case :
SI->cases()) {
7746 auto *Orig = Case.getCaseValue();
7747 auto Sub = Orig->getValue() -
APInt(Ty->getBitWidth(),
Base,
true);
7792 for (
auto I =
SI->case_begin(),
E =
SI->case_end();
I !=
E;) {
7793 if (!
I->getCaseValue()->getValue().ugt(
Constant->getValue())) {
7809 if (!
SI->defaultDestUnreachable() || Case ==
SI->case_default()) {
7812 return !Updates.
empty();
7842 Value *Condition =
SI->getCondition();
7846 if (CondTy->getIntegerBitWidth() > 64 ||
7847 !
DL.fitsInLegalInteger(CondTy->getIntegerBitWidth()))
7859 if (
SI->getNumCases() < 4)
7864 for (
const auto &Case :
SI->cases()) {
7865 uint64_t CaseValue = Case.getCaseValue()->getValue().getZExtValue();
7867 Values.push_back(CaseValue);
7877 SI->getFunction()->hasOptSize()))
7881 Builder.SetInsertPoint(
SI);
7883 if (!
SI->defaultDestUnreachable()) {
7886 auto *PopC = Builder.CreateUnaryIntrinsic(Intrinsic::ctpop, Condition);
7887 auto *IsPow2 = Builder.CreateICmpEQ(PopC, ConstantInt::get(CondTy, 1));
7889 auto *OrigBB =
SI->getParent();
7890 auto *DefaultCaseBB =
SI->getDefaultDest();
7892 auto It = OrigBB->getTerminator()->getIterator();
7905 NewWeights[1] = Weights[0] / 2;
7906 NewWeights[0] = OrigDenominator - NewWeights[1];
7918 Weights[0] = NewWeights[1];
7919 uint64_t CasesDenominator = OrigDenominator - Weights[0];
7921 W = NewWeights[0] *
static_cast<double>(W) / CasesDenominator;
7926 BI->setDebugLoc(
SI->getDebugLoc());
7927 It->eraseFromParent();
7935 for (
auto &Case :
SI->cases()) {
7936 auto *OrigValue = Case.getCaseValue();
7937 Case.setValue(ConstantInt::get(OrigValue->getIntegerType(),
7938 OrigValue->getValue().countr_zero()));
7942 auto *ConditionTrailingZeros = Builder.CreateIntrinsic(
7945 SI->setCondition(ConditionTrailingZeros);
7955 if (!Cmp || !Cmp->hasOneUse())
7966 uint32_t SuccWeight = 0, OtherSuccWeight = 0;
7969 if (
SI->getNumCases() == 2) {
7976 Succ =
SI->getDefaultDest();
7977 SuccWeight = Weights[0];
7979 for (
auto &Case :
SI->cases()) {
7980 std::optional<int64_t> Val =
7984 if (!Missing.erase(*Val))
7989 OtherSuccWeight += Weights[Case.getSuccessorIndex()];
7992 assert(Missing.size() == 1 &&
"Should have one case left");
7993 Res = *Missing.begin();
7994 }
else if (
SI->getNumCases() == 3 &&
SI->defaultDestUnreachable()) {
7996 Unreachable =
SI->getDefaultDest();
7998 for (
auto &Case :
SI->cases()) {
7999 BasicBlock *NewSucc = Case.getCaseSuccessor();
8000 uint32_t Weight = Weights[Case.getSuccessorIndex()];
8003 OtherSuccWeight += Weight;
8006 SuccWeight = Weight;
8007 }
else if (Succ == NewSucc) {
8013 for (
auto &Case :
SI->cases()) {
8014 std::optional<int64_t> Val =
8016 if (!Val || (Val != 1 && Val != 0 && Val != -1))
8018 if (Case.getCaseSuccessor() == Succ) {
8040 if (Cmp->isSigned())
8043 MDNode *NewWeights =
nullptr;
8049 Builder.SetInsertPoint(
SI->getIterator());
8050 Value *ICmp = Builder.CreateICmp(Pred, Cmp->getLHS(), Cmp->getRHS());
8051 Builder.CreateCondBr(ICmp, Succ,
OtherSucc, NewWeights,
8052 SI->getMetadata(LLVMContext::MD_unpredictable));
8056 SI->eraseFromParent();
8057 Cmp->eraseFromParent();
8058 if (DTU && Unreachable)
8083 assert(
BB &&
"Expected non-null BB");
8085 if (
BB->isEntryBlock())
8098 if (
BB->hasAddressTaken() ||
BB->isEHPad())
8103 if (&
BB->front() != &
BB->back())
8118 assert(BB->
size() == 1 &&
"Expected just a single branch in the BB");
8129 return (*EBW->PhiPredIVs)[&Phi][BB];
8151 auto IfPhiIVMatch = [&](
PHINode &Phi) {
8154 auto &PredIVs = (*LHS->PhiPredIVs)[&Phi];
8155 return PredIVs[
A] == PredIVs[
B];
8164 if (Candidates.
size() < 2)
8179 assert(Succ &&
"Expected unconditional BB");
8189 PhiPredIVs.
try_emplace(Phi, Phi->getNumIncomingValues()).first->second;
8192 for (
auto &
IV : Phi->incoming_values())
8193 IVs.insert({Phi->getIncomingBlock(
IV),
IV.get()});
8211 bool MadeChange =
false;
8225 if (!LivePreds.
contains(PredOfDead))
8232 Live->printAsOperand(
dbgs());
dbgs() <<
" for ";
8233 Live->getSingleSuccessor()->printAsOperand(
dbgs());
8238 T->replaceSuccessorWith(
Dead, Live);
8243 for (
const auto &EBW : BBs2Merge) {
8246 const auto &[It, Inserted] =
Keep.insert(&EBW);
8255 if (KeepBB == DeadBB)
8259 RedirectIncomingEdges(DeadBB, KeepBB);
8268 if (DTU && !Updates.
empty())
8274bool SimplifyCFGOpt::simplifyDuplicateSwitchArms(SwitchInst *SI,
8275 DomTreeUpdater *DTU) {
8277 SmallSetVector<BasicBlock *, 16> FilteredArms(
8283bool SimplifyCFGOpt::simplifyDuplicatePredecessors(BasicBlock *BB,
8284 DomTreeUpdater *DTU) {
8295 SmallSetVector<BasicBlock *, 8> FilteredPreds(
8301bool SimplifyCFGOpt::simplifySwitch(SwitchInst *SI,
IRBuilder<> &Builder) {
8304 if (isValueEqualityComparison(SI)) {
8308 if (simplifyEqualityComparisonWithOnlyPredecessor(SI, OnlyPred, Builder))
8309 return requestResimplify();
8313 if (simplifySwitchOnSelect(SI,
Select))
8314 return requestResimplify();
8318 if (SI == &*BB->
begin())
8319 if (foldValueComparisonIntoPredecessors(SI, Builder))
8320 return requestResimplify();
8326 if (
Options.ConvertSwitchRangeToICmp && turnSwitchRangeIntoICmp(SI, Builder))
8327 return requestResimplify();
8331 return requestResimplify();
8334 return requestResimplify();
8337 return requestResimplify();
8340 return requestResimplify();
8345 if (
Options.ConvertSwitchToArithmetic ||
Options.ConvertSwitchToLookupTable)
8347 Options.ConvertSwitchToLookupTable))
8348 return requestResimplify();
8351 return requestResimplify();
8354 return requestResimplify();
8357 hoistCommonCodeFromSuccessors(SI, !
Options.HoistCommonInsts))
8358 return requestResimplify();
8362 if (simplifyDuplicateSwitchArms(SI, DTU))
8363 return requestResimplify();
8366 return requestResimplify();
8371bool SimplifyCFGOpt::simplifyIndirectBr(IndirectBrInst *IBI) {
8374 SmallVector<uint32_t> BranchWeights;
8378 DenseMap<const BasicBlock *, uint64_t> TargetWeight;
8379 if (HasBranchWeights)
8384 SmallPtrSet<Value *, 8> Succs;
8385 SmallSetVector<BasicBlock *, 8> RemovedSuccs;
8390 RemovedSuccs.
insert(Dest);
8400 std::vector<DominatorTree::UpdateType> Updates;
8401 Updates.reserve(RemovedSuccs.
size());
8402 for (
auto *RemovedSucc : RemovedSuccs)
8403 Updates.push_back({DominatorTree::Delete, BB, RemovedSucc});
8420 if (HasBranchWeights) {
8427 if (simplifyIndirectBrOnSelect(IBI, SI))
8428 return requestResimplify();
8464 if (BB == OtherPred)
8472 if (!BI2 || !BI2->isIdenticalTo(BI))
8475 std::vector<DominatorTree::UpdateType> Updates;
8482 assert(
II->getNormalDest() != BB &&
II->getUnwindDest() == BB &&
8483 "unexpected successor");
8484 II->setUnwindDest(OtherPred);
8499 Builder.CreateUnreachable();
8500 BI->eraseFromParent();
8508bool SimplifyCFGOpt::simplifyUncondBranch(UncondBrInst *BI,
8520 bool NeedCanonicalLoop =
8534 if (
I->isTerminator() &&
8535 tryToSimplifyUncondBranchWithICmpInIt(ICI, Builder))
8559 if (!PPred || (PredPred && PredPred != PPred))
8600 return Succ1 != Succ && Succ2 != Succ && Succ1 != BB && Succ2 != BB &&
8604 if (!IsSimpleSuccessor(BB1, BB1BI) || !IsSimpleSuccessor(BB2, BB2BI))
8630 bool HasWeight =
false;
8635 BBTWeight = BBFWeight = 1;
8640 BB1TWeight = BB1FWeight = 1;
8645 BB2TWeight = BB2FWeight = 1;
8647 uint64_t Weights[2] = {BBTWeight * BB1FWeight + BBFWeight * BB2TWeight,
8648 BBTWeight * BB1TWeight + BBFWeight * BB2FWeight};
8655bool SimplifyCFGOpt::simplifyCondBranch(CondBrInst *BI,
IRBuilder<> &Builder) {
8659 "Tautological conditional branch should have been eliminated already.");
8662 if (!
Options.SimplifyCondBranch ||
8663 BI->getFunction()->hasFnAttribute(Attribute::OptForFuzzing))
8667 if (isValueEqualityComparison(BI)) {
8672 if (simplifyEqualityComparisonWithOnlyPredecessor(BI, OnlyPred, Builder))
8673 return requestResimplify();
8677 for (
auto &
I : *BB) {
8682 if (foldValueComparisonIntoPredecessors(BI, Builder))
8683 return requestResimplify();
8689 if (simplifyBranchOnICmpChain(BI, Builder,
DL))
8702 return requestResimplify();
8708 if (
Options.SpeculateBlocks &&
8711 return requestResimplify();
8720 hoistCommonCodeFromSuccessors(BI, !
Options.HoistCommonInsts))
8721 return requestResimplify();
8723 if (BI &&
Options.HoistLoadsStoresWithCondFaulting &&
8725 SmallVector<Instruction *, 2> SpeculatedConditionalLoadsStores;
8726 auto CanSpeculateConditionalLoadsStores = [&]() {
8728 for (Instruction &
I : *Succ) {
8729 if (
I.isTerminator()) {
8730 if (
I.getNumSuccessors() > 1)
8734 SpeculatedConditionalLoadsStores.
size() ==
8738 SpeculatedConditionalLoadsStores.
push_back(&
I);
8741 return !SpeculatedConditionalLoadsStores.
empty();
8744 if (CanSpeculateConditionalLoadsStores()) {
8746 std::nullopt,
nullptr);
8747 return requestResimplify();
8757 return requestResimplify();
8766 return requestResimplify();
8772 if (foldCondBranchOnValueKnownInPredecessor(BI))
8773 return requestResimplify();
8780 return requestResimplify();
8788 return requestResimplify();
8792 return requestResimplify();
8799 assert(V->getType() ==
I->getType() &&
"Mismatched types");
8811 auto *Use = cast<Instruction>(U.getUser());
8814 if (Use->getParent() != I->getParent() || Use == I || Use->comesBefore(I))
8817 switch (Use->getOpcode()) {
8820 case Instruction::GetElementPtr:
8821 case Instruction::Ret:
8822 case Instruction::BitCast:
8823 case Instruction::Load:
8824 case Instruction::Store:
8825 case Instruction::Call:
8826 case Instruction::CallBr:
8827 case Instruction::Invoke:
8828 case Instruction::UDiv:
8829 case Instruction::URem:
8833 case Instruction::SDiv:
8834 case Instruction::SRem:
8838 if (FindUse ==
I->use_end())
8840 auto &
Use = *FindUse;
8854 if (
GEP->getPointerOperand() ==
I) {
8857 if (
GEP->getType()->isVectorTy())
8865 if (!
GEP->hasAllZeroIndices() &&
8866 (!
GEP->isInBounds() ||
8868 GEP->getPointerAddressSpace())))
8869 PtrValueMayBeModified =
true;
8875 bool HasNoUndefAttr =
8876 Ret->getFunction()->hasRetAttribute(Attribute::NoUndef);
8881 if (
C->isNullValue() && HasNoUndefAttr &&
8882 Ret->getFunction()->hasRetAttribute(Attribute::NonNull)) {
8883 return !PtrValueMayBeModified;
8889 if (!LI->isVolatile())
8891 LI->getPointerAddressSpace());
8895 if (!
SI->isVolatile())
8897 SI->getPointerAddressSpace())) &&
8898 SI->getPointerOperand() ==
I;
8903 if (
I == Assume->getArgOperand(0))
8911 if (CB->getCalledOperand() ==
I)
8914 if (CB->isArgOperand(&
Use)) {
8915 unsigned ArgIdx = CB->getArgOperandNo(&
Use);
8918 CB->paramHasNonNullAttr(ArgIdx,
false))
8919 return !PtrValueMayBeModified;
8938 for (
unsigned i = 0, e =
PHI.getNumIncomingValues(); i != e; ++i)
8946 Builder.CreateUnreachable();
8947 T->eraseFromParent();
8958 Assumption = Builder.CreateAssumption(Builder.CreateNot(
Cond));
8960 Assumption = Builder.CreateAssumption(
Cond);
8965 BI->eraseFromParent();
8974 Builder.SetInsertPoint(Unreachable);
8976 Builder.CreateUnreachable();
8977 for (
const auto &Case :
SI->cases())
8978 if (Case.getCaseSuccessor() == BB) {
8980 Case.setSuccessor(Unreachable);
8982 if (
SI->getDefaultDest() == BB) {
8984 SI->setDefaultDest(Unreachable);
8998bool SimplifyCFGOpt::simplifyOnce(BasicBlock *BB) {
9023 return requestResimplify();
9042 if (simplifyDuplicatePredecessors(BB, DTU))
9046 if (
Options.SpeculateBlocks &&
9053 Options.SpeculateUnpredictables))
9061 case Instruction::UncondBr:
9064 case Instruction::CondBr:
9067 case Instruction::Resume:
9070 case Instruction::CleanupRet:
9073 case Instruction::Switch:
9076 case Instruction::Unreachable:
9079 case Instruction::IndirectBr:
9087bool SimplifyCFGOpt::run(BasicBlock *BB) {
9097 }
while (Resimplify);
assert(UImm &&(UImm !=~static_cast< T >(0)) &&"Invalid immediate!")
AMDGPU Register Bank Select
This file implements a class to represent arbitrary precision integral constant values and operations...
static MachineBasicBlock * OtherSucc(MachineBasicBlock *MBB, MachineBasicBlock *Succ)
MachineBasicBlock MachineBasicBlock::iterator DebugLoc DL
static cl::opt< ITMode > IT(cl::desc("IT block support"), cl::Hidden, cl::init(DefaultIT), cl::values(clEnumValN(DefaultIT, "arm-default-it", "Generate any type of IT block"), clEnumValN(RestrictedIT, "arm-restrict-it", "Disallow complex IT blocks")))
Function Alias Analysis Results
This file contains the simple types necessary to represent the attributes associated with functions a...
static const Function * getParent(const Value *V)
static GCRegistry::Add< ErlangGC > A("erlang", "erlang-compatible garbage collector")
static GCRegistry::Add< CoreCLRGC > E("coreclr", "CoreCLR-compatible GC")
static GCRegistry::Add< OcamlGC > B("ocaml", "ocaml 3.10-compatible GC")
This file contains the declarations for the subclasses of Constant, which represent the different fla...
static cl::opt< OutputCostKind > CostKind("cost-kind", cl::desc("Target cost kind"), cl::init(OutputCostKind::RecipThroughput), cl::values(clEnumValN(OutputCostKind::RecipThroughput, "throughput", "Reciprocal throughput"), clEnumValN(OutputCostKind::Latency, "latency", "Instruction latency"), clEnumValN(OutputCostKind::CodeSize, "code-size", "Code size"), clEnumValN(OutputCostKind::SizeAndLatency, "size-latency", "Code size and latency"), clEnumValN(OutputCostKind::All, "all", "Print all cost kinds")))
This file defines the DenseMap class.
static bool IsIndirectCall(const MachineInstr *MI)
This file provides various utilities for inspecting and working with the control flow graph in LLVM I...
Module.h This file contains the declarations for the Module class.
This defines the Use class.
static Constant * getFalse(Type *Ty)
For a boolean type or a vector of boolean type, return false or a vector with every element false.
static constexpr Value * getValue(Ty &ValueOrUse)
const AbstractManglingParser< Derived, Alloc >::OperatorInfo AbstractManglingParser< Derived, Alloc >::Ops[]
Machine Check Debug Module
This file implements a map that provides insertion order iteration.
This file provides utility for Memory Model Relaxation Annotations (MMRAs).
This file exposes an interface to building/using memory SSA to walk memory instructions using a use/d...
MachineInstr unsigned OpIdx
ConstantRange Range(APInt(BitWidth, Low), APInt(BitWidth, High))
uint64_t IntrinsicInst * II
if(auto Err=PB.parsePassPipeline(MPM, Passes)) return wrap(std MPM run * Mod
This file contains the declarations for profiling metadata utility functions.
const SmallVectorImpl< MachineOperand > & Cond
static bool contains(SmallPtrSetImpl< ConstantExpr * > &Cache, ConstantExpr *Expr, Constant *C)
Provides some synthesis utilities to produce sequences of values.
This file defines generic set operations that may be used on set's of different types,...
This file implements a set that has insertion order iteration characteristics.
static std::optional< ContiguousCasesResult > findContiguousCases(Value *Condition, SmallVectorImpl< ConstantInt * > &Cases, SmallVectorImpl< ConstantInt * > &OtherCases, BasicBlock *Dest, BasicBlock *OtherDest)
static void addPredecessorToBlock(BasicBlock *Succ, BasicBlock *NewPred, BasicBlock *ExistPred, MemorySSAUpdater *MSSAU=nullptr)
Update PHI nodes in Succ to indicate that there will now be entries in it from the 'NewPred' block.
static bool validLookupTableConstant(Constant *C, const TargetTransformInfo &TTI)
Return true if the backend will be able to handle initializing an array of constants like C.
static StoreInst * findUniqueStoreInBlocks(BasicBlock *BB1, BasicBlock *BB2)
static bool isSwitchDense(uint64_t NumCases, uint64_t CaseRange, bool OptSize)
static bool validateAndCostRequiredSelects(BasicBlock *BB, BasicBlock *ThenBB, BasicBlock *EndBB, unsigned &SpeculatedInstructions, InstructionCost &Cost, const TargetTransformInfo &TTI)
Estimate the cost of the insertion(s) and check that the PHI nodes can be converted to selects.
static bool simplifySwitchLookup(SwitchInst *SI, IRBuilder<> &Builder, DomTreeUpdater *DTU, const DataLayout &DL, const TargetTransformInfo &TTI, bool ConvertSwitchToLookupTable)
If the switch is only used to initialize one or more phi nodes in a common successor block with diffe...
static void removeSwitchAfterSelectFold(SwitchInst *SI, PHINode *PHI, Value *SelectValue, IRBuilder<> &Builder, DomTreeUpdater *DTU)
static bool valuesOverlap(std::vector< ValueEqualityComparisonCase > &C1, std::vector< ValueEqualityComparisonCase > &C2)
Return true if there are any keys in C1 that exist in C2 as well.
static bool isProfitableToSpeculate(const CondBrInst *BI, std::optional< bool > Invert, const TargetTransformInfo &TTI)
static bool mergeConditionalStoreToAddress(BasicBlock *PTB, BasicBlock *PFB, BasicBlock *QTB, BasicBlock *QFB, BasicBlock *PostBB, Value *Address, bool InvertPCond, bool InvertQCond, DomTreeUpdater *DTU, const DataLayout &DL, const TargetTransformInfo &TTI)
static bool mergeCleanupPad(CleanupReturnInst *RI)
static bool isVectorOp(Instruction &I)
Return if an instruction's type or any of its operands' types are a vector type.
static BasicBlock * allPredecessorsComeFromSameSource(BasicBlock *BB)
static void cloneInstructionsIntoPredecessorBlockAndUpdateSSAUses(BasicBlock *BB, BasicBlock *PredBlock, ValueToValueMapTy &VMap)
static int constantIntSortPredicate(ConstantInt *const *P1, ConstantInt *const *P2)
static bool getCaseResults(SwitchInst *SI, ConstantInt *CaseVal, BasicBlock *CaseDest, BasicBlock **CommonDest, SmallVectorImpl< std::pair< PHINode *, Constant * > > &Res, const DataLayout &DL, const TargetTransformInfo &TTI)
Try to determine the resulting constant values in phi nodes at the common destination basic block,...
static bool passingValueIsAlwaysUndefined(Value *V, Instruction *I, bool PtrValueMayBeModified=false)
Check if passing a value to an instruction will cause undefined behavior.
static std::optional< std::tuple< BasicBlock *, Instruction::BinaryOps, bool > > shouldFoldCondBranchesToCommonDestination(CondBrInst *BI, CondBrInst *PBI, const TargetTransformInfo *TTI)
Determine if the two branches share a common destination and deduce a glue that joins the branches' c...
static bool isSafeToHoistInstr(Instruction *I, unsigned Flags)
static bool isSafeToHoistInvoke(BasicBlock *BB1, BasicBlock *BB2, Instruction *I1, Instruction *I2)
static ConstantInt * getConstantInt(Value *V, const DataLayout &DL)
Extract ConstantInt from value, looking through IntToPtr and PointerNullValue.
static bool simplifySwitchOfCmpIntrinsic(SwitchInst *SI, IRBuilderBase &Builder, DomTreeUpdater *DTU)
Fold switch over ucmp/scmp intrinsic to br if two of the switch arms have the same destination.
static bool shouldBuildLookupTable(SwitchInst *SI, uint64_t TableSize, const TargetTransformInfo &TTI, const DataLayout &DL, const SmallVector< Type * > &ResultTypes)
Determine whether a lookup table should be built for this switch, based on the number of cases,...
static Constant * constantFold(Instruction *I, const DataLayout &DL, const SmallDenseMap< Value *, Constant * > &ConstantPool)
Try to fold instruction I into a constant.
static bool areIdenticalUpToCommutativity(const Instruction *I1, const Instruction *I2)
static bool forwardSwitchConditionToPHI(SwitchInst *SI)
Try to forward the condition of a switch instruction to a phi node dominated by the switch,...
static PHINode * findPHIForConditionForwarding(ConstantInt *CaseValue, BasicBlock *BB, int *PhiIndex)
If BB would be eligible for simplification by TryToSimplifyUncondBranchFromEmptyBlock (i....
static bool simplifySwitchOfPowersOfTwo(SwitchInst *SI, IRBuilder<> &Builder, DomTreeUpdater *DTU, const DataLayout &DL, const TargetTransformInfo &TTI)
Tries to transform switch of powers of two to reduce switch range.
static bool isCleanupBlockEmpty(iterator_range< BasicBlock::iterator > R)
static Value * ensureValueAvailableInSuccessor(Value *V, BasicBlock *BB, Value *AlternativeV=nullptr)
static Value * createLogicalOp(IRBuilderBase &Builder, Instruction::BinaryOps Opc, Value *LHS, Value *RHS, const Twine &Name="")
static void hoistConditionalLoadsStores(CondBrInst *BI, SmallVectorImpl< Instruction * > &SpeculatedConditionalLoadsStores, std::optional< bool > Invert, Instruction *Sel)
If the target supports conditional faulting, we look for the following pattern:
static bool shouldHoistCommonInstructions(Instruction *I1, Instruction *I2, const TargetTransformInfo &TTI)
Helper function for hoistCommonCodeFromSuccessors.
static bool reduceSwitchRange(SwitchInst *SI, IRBuilder<> &Builder, const DataLayout &DL, const TargetTransformInfo &TTI)
Try to transform a switch that has "holes" in it to a contiguous sequence of cases.
static bool safeToMergeTerminators(Instruction *SI1, Instruction *SI2, SmallSetVector< BasicBlock *, 4 > *FailBlocks=nullptr)
Return true if it is safe to merge these two terminator instructions together.
@ SkipImplicitControlFlow
static bool incomingValuesAreCompatible(BasicBlock *BB, ArrayRef< BasicBlock * > IncomingBlocks, SmallPtrSetImpl< Value * > *EquivalenceSet=nullptr)
Return true if all the PHI nodes in the basic block BB receive compatible (identical) incoming values...
static bool trySwitchToSelect(SwitchInst *SI, IRBuilder<> &Builder, DomTreeUpdater *DTU, const DataLayout &DL, const TargetTransformInfo &TTI)
If a switch is only used to initialize one or more phi nodes in a common successor block with only tw...
static void createUnreachableSwitchDefault(SwitchInst *Switch, DomTreeUpdater *DTU, bool RemoveOrigDefaultBlock=true)
static Value * foldSwitchToSelect(const SwitchCaseResultVectorTy &ResultVector, Constant *DefaultResult, Value *Condition, IRBuilder<> &Builder, const DataLayout &DL, ArrayRef< uint32_t > BranchWeights)
static bool sinkCommonCodeFromPredecessors(BasicBlock *BB, DomTreeUpdater *DTU)
Check whether BB's predecessors end with unconditional branches.
static bool isTypeLegalForLookupTable(Type *Ty, const TargetTransformInfo &TTI, const DataLayout &DL)
static bool eliminateDeadSwitchCases(SwitchInst *SI, DomTreeUpdater *DTU, AssumptionCache *AC, const DataLayout &DL)
Compute masked bits for the condition of a switch and use it to remove dead cases.
static bool blockIsSimpleEnoughToThreadThrough(BasicBlock *BB, BlocksSet &NonLocalUseBlocks)
Return true if we can thread a branch across this block.
static Value * isSafeToSpeculateStore(Instruction *I, BasicBlock *BrBB, BasicBlock *StoreBB, BasicBlock *EndBB)
Determine if we can hoist sink a sole store instruction out of a conditional block.
static std::optional< bool > foldCondBranchOnValueKnownInPredecessorImpl(CondBrInst *BI, DomTreeUpdater *DTU, const DataLayout &DL, AssumptionCache *AC)
If we have a conditional branch on something for which we know the constant value in predecessors (e....
static bool foldTwoEntryPHINode(PHINode *PN, const TargetTransformInfo &TTI, DomTreeUpdater *DTU, AssumptionCache *AC, const DataLayout &DL, bool SpeculateUnpredictables)
Given a BB that starts with the specified two-entry PHI node, see if we can eliminate it.
static bool findReaching(BasicBlock *BB, BasicBlock *DefBB, BlocksSet &ReachesNonLocalUses)
static bool extractPredSuccWeights(CondBrInst *PBI, CondBrInst *BI, uint64_t &PredTrueWeight, uint64_t &PredFalseWeight, uint64_t &SuccTrueWeight, uint64_t &SuccFalseWeight)
Return true if either PBI or BI has branch weight available, and store the weights in {Pred|Succ}...
static bool initializeUniqueCases(SwitchInst *SI, PHINode *&PHI, BasicBlock *&CommonDest, SwitchCaseResultVectorTy &UniqueResults, Constant *&DefaultResult, const DataLayout &DL, const TargetTransformInfo &TTI, uintptr_t MaxUniqueResults)
static bool shouldUseSwitchConditionAsTableIndex(ConstantInt &MinCaseVal, const ConstantInt &MaxCaseVal, bool HasDefaultResults, const SmallVector< Type * > &ResultTypes, const DataLayout &DL, const TargetTransformInfo &TTI)
static InstructionCost computeSpeculationCost(const User *I, const TargetTransformInfo &TTI)
Compute an abstract "cost" of speculating the given instruction, which is assumed to be safe to specu...
static bool performBranchToCommonDestFolding(CondBrInst *BI, CondBrInst *PBI, DomTreeUpdater *DTU, MemorySSAUpdater *MSSAU, const TargetTransformInfo *TTI)
SmallPtrSet< BasicBlock *, 8 > BlocksSet
static unsigned skippedInstrFlags(Instruction *I)
static bool mergeCompatibleInvokes(BasicBlock *BB, DomTreeUpdater *DTU)
If this block is a landingpad exception handling block, categorize all the predecessor invokes into s...
static bool replacingOperandWithVariableIsCheap(const Instruction *I, int OpIdx)
static void eraseTerminatorAndDCECond(Instruction *TI, MemorySSAUpdater *MSSAU=nullptr)
static void eliminateBlockCases(BasicBlock *BB, std::vector< ValueEqualityComparisonCase > &Cases)
Given a vector of bb/value pairs, remove any entries in the list that match the specified block.
static bool mergeConditionalStores(CondBrInst *PBI, CondBrInst *QBI, DomTreeUpdater *DTU, const DataLayout &DL, const TargetTransformInfo &TTI)
static bool mergeNestedCondBranch(CondBrInst *BI, DomTreeUpdater *DTU)
Fold the following pattern: bb0: br i1 cond1, label bb1, label bb2 bb1: br i1 cond2,...
static void sinkLastInstruction(ArrayRef< BasicBlock * > Blocks)
static size_t mapCaseToResult(ConstantInt *CaseVal, SwitchCaseResultVectorTy &UniqueResults, Constant *Result)
static bool tryWidenCondBranchToCondBranch(CondBrInst *PBI, CondBrInst *BI, DomTreeUpdater *DTU)
If the previous block ended with a widenable branch, determine if reusing the target block is profita...
static void mergeCompatibleInvokesImpl(ArrayRef< InvokeInst * > Invokes, DomTreeUpdater *DTU)
static bool mergeIdenticalBBs(ArrayRef< BasicBlock * > Candidates, DomTreeUpdater *DTU)
static void getBranchWeights(Instruction *TI, SmallVectorImpl< uint64_t > &Weights)
Get Weights of a given terminator, the default weight is at the front of the vector.
static bool tryToMergeLandingPad(LandingPadInst *LPad, UncondBrInst *BI, BasicBlock *BB, DomTreeUpdater *DTU)
Given an block with only a single landing pad and a unconditional branch try to find another basic bl...
static Constant * lookupConstant(Value *V, const SmallDenseMap< Value *, Constant * > &ConstantPool)
If V is a Constant, return it.
static bool SimplifyCondBranchToCondBranch(CondBrInst *PBI, CondBrInst *BI, DomTreeUpdater *DTU, const DataLayout &DL, const TargetTransformInfo &TTI)
If we have a conditional branch as a predecessor of another block, this function tries to simplify it...
static bool canSinkInstructions(ArrayRef< Instruction * > Insts, DenseMap< const Use *, SmallVector< Value *, 4 > > &PHIOperands)
static void hoistLockstepIdenticalDbgVariableRecords(Instruction *TI, Instruction *I1, SmallVectorImpl< Instruction * > &OtherInsts)
Hoists DbgVariableRecords from I1 and OtherInstrs that are identical in lock-step to TI.
static bool removeEmptyCleanup(CleanupReturnInst *RI, DomTreeUpdater *DTU)
static bool removeUndefIntroducingPredecessor(BasicBlock *BB, DomTreeUpdater *DTU, AssumptionCache *AC)
If BB has an incoming value that will always trigger undefined behavior (eg.
static bool simplifySwitchWhenUMin(SwitchInst *SI, DomTreeUpdater *DTU)
Tries to transform the switch when the condition is umin with a constant.
static bool isSafeCheapLoadStore(const Instruction *I, const TargetTransformInfo &TTI)
static ConstantInt * getKnownValueOnEdge(Value *V, BasicBlock *From, BasicBlock *To)
static bool dominatesMergePoint(Value *V, BasicBlock *BB, Instruction *InsertPt, SmallPtrSetImpl< Instruction * > &AggressiveInsts, InstructionCost &Cost, InstructionCost Budget, const TargetTransformInfo &TTI, AssumptionCache *AC, SmallPtrSetImpl< Instruction * > &ZeroCostInstructions, unsigned Depth=0)
If we have a merge point of an "if condition" as accepted above, return true if the specified value d...
static void reuseTableCompare(User *PhiUser, BasicBlock *PhiBlock, CondBrInst *RangeCheckBranch, Constant *DefaultValue, const SmallVectorImpl< std::pair< ConstantInt *, Constant * > > &Values)
Try to reuse the switch table index compare.
This file defines the SmallPtrSet class.
This file defines the SmallVector class.
This file defines the 'Statistic' class, which is designed to be an easy way to expose various metric...
#define STATISTIC(VARNAME, DESC)
static SymbolRef::Type getType(const Symbol *Sym)
static unsigned getBitWidth(Type *Ty, const DataLayout &DL)
Returns the bitwidth of the given scalar or pointer type.
static const uint32_t IV[8]
Class for arbitrary precision integers.
static APInt getAllOnes(unsigned numBits)
Return an APInt of a specified width with all bits set.
LLVM_ABI APInt zext(unsigned width) const
Zero extend to a new width.
unsigned popcount() const
Count the number of bits set.
bool sgt(const APInt &RHS) const
Signed greater than comparison.
bool isZero() const
Determine if this value is zero, i.e. all bits are clear.
bool intersects(const APInt &RHS) const
This operation tests if there are any pairs of corresponding bits between this APInt and RHS that are...
bool sle(const APInt &RHS) const
Signed less or equal comparison.
unsigned getSignificantBits() const
Get the minimum bit size for this signed APInt.
bool isStrictlyPositive() const
Determine if this APInt Value is positive.
uint64_t getLimitedValue(uint64_t Limit=UINT64_MAX) const
If this value is smaller than the specified limit, return it, otherwise return the limit value.
LLVM_ABI APInt smul_ov(const APInt &RHS, bool &Overflow) const
bool isSubsetOf(const APInt &RHS) const
This operation checks that all bits set in this APInt are also set in RHS.
bool slt(const APInt &RHS) const
Signed less than comparison.
static APInt getZero(unsigned numBits)
Get the '0' value for the specified bit-width.
std::optional< int64_t > trySExtValue() const
Get sign extended value if possible.
LLVM_ABI APInt ssub_ov(const APInt &RHS, bool &Overflow) const
bool uge(const APInt &RHS) const
Unsigned greater or equal comparison.
Represent a constant reference to an array (0 or more elements consecutively in memory),...
const T & front() const
Get the first element.
size_t size() const
Get the array size.
bool empty() const
Check if the array is empty.
static LLVM_ABI ArrayType * get(Type *ElementType, uint64_t NumElements)
This static method is the primary way to construct an ArrayType.
A cache of @llvm.assume calls within a function.
LLVM_ABI void registerAssumption(AssumeInst *CI)
Add an @llvm.assume intrinsic to this function's cache.
LLVM_ABI bool getValueAsBool() const
Return the attribute's value as a boolean.
LLVM Basic Block Representation.
iterator begin()
Instruction iterator methods.
iterator_range< const_phi_iterator > phis() const
Returns a range that iterates over the phis in the basic block.
LLVM_ABI const_iterator getFirstInsertionPt() const
Returns an iterator to the first instruction in this block that is suitable for inserting a non-PHI i...
const Function * getParent() const
Return the enclosing method, or null if none.
bool hasAddressTaken() const
Returns true if there are any uses of this basic block other than direct branches,...
LLVM_ABI InstListType::const_iterator getFirstNonPHIIt() const
Returns an iterator to the first instruction in this block that is not a PHINode instruction.
static BasicBlock * Create(LLVMContext &Context, const Twine &Name="", Function *Parent=nullptr, BasicBlock *InsertBefore=nullptr)
Creates a new BasicBlock.
LLVM_ABI InstListType::const_iterator getFirstNonPHIOrDbg(bool SkipPseudoOp=true) const
Returns a pointer to the first instruction in this block that is not a PHINode or a debug intrinsic,...
LLVM_ABI bool hasNPredecessors(unsigned N) const
Return true if this block has exactly N predecessors.
LLVM_ABI const BasicBlock * getUniqueSuccessor() const
Return the successor of this block if it has a unique successor.
LLVM_ABI const BasicBlock * getSinglePredecessor() const
Return the predecessor of this block if it has a single predecessor block.
const Instruction & front() const
LLVM_ABI const CallInst * getTerminatingDeoptimizeCall() const
Returns the call instruction calling @llvm.experimental.deoptimize prior to the terminating return in...
LLVM_ABI const BasicBlock * getUniquePredecessor() const
Return the predecessor of this block if it has a unique predecessor block.
LLVM_ABI const BasicBlock * getSingleSuccessor() const
Return the successor of this block if it has a single successor.
LLVM_ABI void flushTerminatorDbgRecords()
Eject any debug-info trailing at the end of a block.
LLVM_ABI const DataLayout & getDataLayout() const
Get the data layout of the module this basic block belongs to.
InstListType::iterator iterator
Instruction iterators...
LLVM_ABI LLVMContext & getContext() const
Get the context in which this basic block lives.
LLVM_ABI bool isLandingPad() const
Return true if this basic block is a landing pad.
LLVM_ABI bool hasNPredecessorsOrMore(unsigned N) const
Return true if this block has N predecessors or more.
const Instruction * getTerminator() const LLVM_READONLY
Returns the terminator instruction; assumes that the block is well-formed.
void splice(BasicBlock::iterator ToIt, BasicBlock *FromBB)
Transfer all instructions from FromBB to this basic block at ToIt.
LLVM_ABI const Module * getModule() const
Return the module owning the function this basic block belongs to, or nullptr if the function does no...
LLVM_ABI void removePredecessor(BasicBlock *Pred, bool KeepOneInputPHIs=false)
Update PHI nodes in this BasicBlock before removal of predecessor Pred.
BasicBlock * getBasicBlock() const
static LLVM_ABI BranchProbability getBranchProbability(uint64_t Numerator, uint64_t Denominator)
BranchProbability getCompl() const
void addRangeRetAttr(const ConstantRange &CR)
adds the range attribute to the list of attributes.
bool isCallee(Value::const_user_iterator UI) const
Determine whether the passed iterator points to the callee operand's Use.
bool isDataOperand(const Use *U) const
bool tryIntersectAttributes(const CallBase *Other)
Try to intersect the attributes from 'this' CallBase and the 'Other' CallBase.
This class represents a function call, abstracting a target machine's calling convention.
mapped_iterator< op_iterator, DerefFnTy > handler_iterator
CleanupPadInst * getCleanupPad() const
Convenience accessor.
BasicBlock * getUnwindDest() const
This class is the base class for the comparison instructions.
static Type * makeCmpResultType(Type *opnd_type)
Create a result type for fcmp/icmp.
bool isEquality() const
Determine if this is an equals/not equals predicate.
Predicate
This enumeration lists the possible predicates for CmpInst subclasses.
@ ICMP_UGT
unsigned greater than
@ ICMP_ULT
unsigned less than
Predicate getPredicate() const
Return the predicate for this instruction.
An abstraction over a floating-point predicate, and a pack of an integer predicate with samesign info...
Conditional Branch instruction.
static CondBrInst * Create(Value *Cond, BasicBlock *IfTrue, BasicBlock *IfFalse, InsertPosition InsertBefore=nullptr)
void setSuccessor(unsigned idx, BasicBlock *NewSucc)
void setCondition(Value *V)
Value * getCondition() const
BasicBlock * getSuccessor(unsigned i) const
static LLVM_ABI Constant * get(ArrayType *T, ArrayRef< Constant * > V)
A vector constant whose element type is a simple 1/2/4/8-byte integer or float/double,...
A constant value that is initialized with an expression using other constant values.
static LLVM_ABI Constant * getNeg(Constant *C, bool HasNSW=false)
ConstantFP - Floating Point Values [float, double].
ConstantFolder - Create constants with minimum, target independent, folding.
This is the shared class of boolean and integer constants.
bool isOne() const
This is just a convenience method to make client code smaller for a common case.
uint64_t getLimitedValue(uint64_t Limit=~0ULL) const
getLimitedValue - If the value is smaller than the specified limit, return it, otherwise return the l...
IntegerType * getIntegerType() const
Variant of the getType() method to always return an IntegerType, which reduces the amount of casting ...
static LLVM_ABI ConstantInt * getTrue(LLVMContext &Context)
static ConstantInt * getSigned(IntegerType *Ty, int64_t V, bool ImplicitTrunc=false)
Return a ConstantInt with the specified value for the specified type.
bool isZero() const
This is just a convenience method to make client code smaller for a common code.
static LLVM_ABI ConstantInt * getFalse(LLVMContext &Context)
unsigned getBitWidth() const
getBitWidth - Return the scalar bitwidth of this constant.
uint64_t getZExtValue() const
Return the constant as a 64-bit unsigned integer value after it has been zero extended as appropriate...
const APInt & getValue() const
Return the constant as an APInt value reference.
A constant pointer value that points to null.
This class represents a range of values.
LLVM_ABI bool getEquivalentICmp(CmpInst::Predicate &Pred, APInt &RHS) const
Set up Pred and RHS such that ConstantRange::makeExactICmpRegion(Pred, RHS) == *this.
LLVM_ABI ConstantRange subtract(const APInt &CI) const
Subtract the specified constant from the endpoints of this constant range.
const APInt & getLower() const
Return the lower value for this range.
LLVM_ABI APInt getUnsignedMin() const
Return the smallest unsigned value contained in the ConstantRange.
LLVM_ABI bool isEmptySet() const
Return true if this set contains no members.
LLVM_ABI bool isSizeLargerThan(uint64_t MaxSize) const
Compare set size of this range with Value.
const APInt & getUpper() const
Return the upper value for this range.
LLVM_ABI bool isUpperWrapped() const
Return true if the exclusive upper bound wraps around the unsigned domain.
static LLVM_ABI ConstantRange makeExactICmpRegion(CmpInst::Predicate Pred, const APInt &Other)
Produce the exact range such that all values in the returned range satisfy the given predicate with a...
LLVM_ABI ConstantRange inverse() const
Return a new range that is the logical not of the current set.
LLVM_ABI APInt getUnsignedMax() const
Return the largest unsigned value contained in the ConstantRange.
static ConstantRange getNonEmpty(APInt Lower, APInt Upper)
Create non-empty constant range with the given bounds.
This is an important base class in LLVM.
static LLVM_ABI Constant * getIntegerValue(Type *Ty, const APInt &V)
Return the value for an integer or pointer constant, or a vector thereof, with the given scalar value...
bool isNullValue() const
Return true if this is the value that would be returned by getNullValue.
LLVM_ABI bool isOneValue() const
Returns true if the value is one.
static LLVM_ABI Constant * getNullValue(Type *Ty)
Constructor to create a '0' constant of arbitrary type.
A parsed version of the target data layout string in and methods for querying it.
Base class for non-instruction debug metadata records that have positions within IR.
LLVM_ABI void removeFromParent()
simple_ilist< DbgRecord >::iterator self_iterator
Record of a variable value-assignment, aka a non instruction representation of the dbg....
bool isSameSourceLocation(const DebugLoc &Other) const
Return true if the source locations match, ignoring isImplicitCode and source atom info.
static DebugLoc getTemporary()
static LLVM_ABI DebugLoc getMergedLocation(DebugLoc LocA, DebugLoc LocB)
When two instructions are combined into a single instruction we also need to combine the original loc...
static LLVM_ABI DebugLoc getMergedLocations(ArrayRef< DebugLoc > Locs)
Try to combine the vector of locations passed as input in a single one.
static DebugLoc getDropped()
ValueT & at(const_arg_type_t< KeyT > Val)
Return the entry for the specified key, or abort if no such entry exists.
iterator find(const_arg_type_t< KeyT > Val)
std::pair< iterator, bool > try_emplace(KeyT &&Key, Ts &&...Args)
std::pair< iterator, bool > insert(const std::pair< KeyT, ValueT > &KV)
void reserve(size_type NumEntries)
Grow the densemap so that it can contain at least NumEntries items before resizing again.
Implements a dense probed hash-table based set.
static constexpr UpdateKind Delete
static constexpr UpdateKind Insert
static LLVM_ABI FixedVectorType * get(Type *ElementType, unsigned NumElts)
const BasicBlock & getEntryBlock() const
Attribute getFnAttribute(Attribute::AttrKind Kind) const
Return the attribute for the given attribute kind.
bool hasMinSize() const
Optimize this function for minimum size (-Oz).
bool hasFnAttribute(Attribute::AttrKind Kind) const
Return true if the function has the attribute.
void applyUpdates(ArrayRef< UpdateT > Updates)
Submit updates to all available trees.
an instruction for type-safe pointer arithmetic to access elements of arrays and structs
Module * getParent()
Get the module that this global value is contained inside of...
This instruction compares its operands according to the predicate given to the constructor.
Predicate getSignedPredicate() const
For example, EQ->EQ, SLE->SLE, UGT->SGT, etc.
static bool isEquality(Predicate P)
Return true if this predicate is either EQ or NE.
Common base class shared among various IRBuilders.
Value * CreateICmpULT(Value *LHS, Value *RHS, const Twine &Name="")
Value * CreateZExtOrTrunc(Value *V, Type *DestTy, const Twine &Name="")
Create a ZExt or Trunc from the integer value V to DestTy.
CondBrInst * CreateCondBr(Value *Cond, BasicBlock *True, BasicBlock *False, MDNode *BranchWeights=nullptr, MDNode *Unpredictable=nullptr)
Create a conditional 'br Cond, TrueDest, FalseDest' instruction.
LLVM_ABI Value * CreateSelectFMF(Value *C, Value *True, Value *False, FMFSource FMFSource, const Twine &Name="", Instruction *MDFrom=nullptr)
ConstantInt * getTrue()
Get the constant value for i1 true.
LLVM_ABI Value * CreateSelect(Value *C, Value *True, Value *False, const Twine &Name="", Instruction *MDFrom=nullptr)
BasicBlock::iterator GetInsertPoint() const
Value * CreateFreeze(Value *V, const Twine &Name="")
void SetCurrentDebugLocation(const DebugLoc &L)
Set location information used by debugging information.
Value * CreateLShr(Value *LHS, Value *RHS, const Twine &Name="", bool isExact=false)
LLVM_ABI CallInst * CreateAssumption(Value *Cond)
Create an assume intrinsic call that allows the optimizer to assume that the provided condition will ...
Value * CreateInBoundsGEP(Type *Ty, Value *Ptr, ArrayRef< Value * > IdxList, const Twine &Name="")
UncondBrInst * CreateBr(BasicBlock *Dest)
Create an unconditional 'br label X' instruction.
Value * CreateNot(Value *V, const Twine &Name="")
SwitchInst * CreateSwitch(Value *V, BasicBlock *Dest, unsigned NumCases=10, MDNode *BranchWeights=nullptr, MDNode *Unpredictable=nullptr)
Create a switch instruction with the specified value, default dest, and with a hint for the number of...
Value * CreateICmpEQ(Value *LHS, Value *RHS, const Twine &Name="")
LoadInst * CreateLoad(Type *Ty, Value *Ptr, const char *Name)
Provided to resolve 'CreateLoad(Ty, Ptr, "...")' correctly, instead of converting the string to 'bool...
Value * CreateZExt(Value *V, Type *DestTy, const Twine &Name="", bool IsNonNeg=false)
StoreInst * CreateStore(Value *Val, Value *Ptr, bool isVolatile=false)
Value * CreateAdd(Value *LHS, Value *RHS, const Twine &Name="", bool HasNUW=false, bool HasNSW=false)
Value * CreatePtrToInt(Value *V, Type *DestTy, const Twine &Name="")
ConstantInt * getFalse()
Get the constant value for i1 false.
Value * CreateTrunc(Value *V, Type *DestTy, const Twine &Name="", bool IsNUW=false, bool IsNSW=false)
Value * CreateIntCast(Value *V, Type *DestTy, bool isSigned, const Twine &Name="")
void SetInsertPoint(BasicBlock *TheBB)
This specifies that created instructions should be appended to the end of the specified block.
Value * CreateICmp(CmpInst::Predicate P, Value *LHS, Value *RHS, const Twine &Name="")
Value * CreateOr(Value *LHS, Value *RHS, const Twine &Name="", bool IsDisjoint=false)
Value * CreateMul(Value *LHS, Value *RHS, const Twine &Name="", bool HasNUW=false, bool HasNSW=false)
Provides an 'InsertHelper' that calls a user-provided callback after performing the default insertion...
This provides a uniform API for creating instructions and inserting them into a basic block: either a...
Indirect Branch Instruction.
BasicBlock * getDestination(unsigned i)
Return the specified destination.
unsigned getNumDestinations() const
return the number of possible destinations in this indirectbr instruction.
LLVM_ABI void removeDestination(unsigned i)
This method removes the specified successor from the indirectbr instruction.
LLVM_ABI void dropUBImplyingAttrsAndMetadata(ArrayRef< unsigned > Keep={})
Drop any attributes or metadata that can cause immediate undefined behavior.
LLVM_ABI Instruction * clone() const
Create a copy of 'this' instruction that is identical in all ways except the following:
LLVM_ABI iterator_range< simple_ilist< DbgRecord >::iterator > cloneDebugInfoFrom(const Instruction *From, std::optional< simple_ilist< DbgRecord >::iterator > FromHere=std::nullopt, bool InsertAtHead=false)
Clone any debug-info attached to From onto this instruction.
LLVM_ABI unsigned getNumSuccessors() const LLVM_READONLY
Return the number of successors that this instruction has.
iterator_range< simple_ilist< DbgRecord >::iterator > getDbgRecordRange() const
Return a range over the DbgRecords attached to this instruction.
const DebugLoc & getDebugLoc() const
Return the debug location for this node as a DebugLoc.
LLVM_ABI const Module * getModule() const
Return the module owning the function this instruction belongs to or nullptr it the function does not...
LLVM_ABI void andIRFlags(const Value *V)
Logical 'and' of any supported wrapping, exact, and fast-math flags of V and this instruction.
LLVM_ABI void moveBefore(InstListType::iterator InsertPos)
Unlink this instruction from its current basic block and insert it into the basic block that MovePos ...
LLVM_ABI bool isAtomic() const LLVM_READONLY
Return true if this instruction has an AtomicOrdering of unordered or higher.
LLVM_ABI InstListType::iterator eraseFromParent()
This method unlinks 'this' from the containing basic block and deletes it.
Instruction * user_back()
Specialize the methods defined in Value, as we know that an instruction can only be used by other ins...
MDNode * getMetadata(unsigned KindID) const
Get the metadata of given kind attached to this Instruction.
LLVM_ABI BasicBlock * getSuccessor(unsigned Idx) const LLVM_READONLY
Return the specified successor. This instruction must be a terminator.
LLVM_ABI bool mayHaveSideEffects() const LLVM_READONLY
Return true if the instruction may have side effects.
bool isTerminator() const
LLVM_ABI bool isUsedOutsideOfBlock(const BasicBlock *BB) const LLVM_READONLY
Return true if there are any uses of this instruction in blocks other than the specified block.
@ CompareUsingIntersectedAttrs
Check for equivalence with intersected callbase attrs.
LLVM_ABI bool isIdenticalTo(const Instruction *I) const LLVM_READONLY
Return true if the specified instruction is exactly identical to the current one.
void setDebugLoc(DebugLoc Loc)
Set the debug location information for this instruction.
LLVM_ABI void copyMetadata(const Instruction &SrcInst, ArrayRef< unsigned > WL=ArrayRef< unsigned >())
Copy metadata from SrcInst to this instruction.
LLVM_ABI void applyMergedLocation(DebugLoc LocA, DebugLoc LocB)
Merge 2 debug locations and apply it to the Instruction.
LLVM_ABI void dropDbgRecords()
Erase any DbgRecords attached to this instruction.
LLVM_ABI InstListType::iterator insertInto(BasicBlock *ParentBB, InstListType::iterator It)
Inserts an unlinked instruction into ParentBB at position It and returns the iterator of the inserted...
Class to represent integer types.
static LLVM_ABI IntegerType * get(LLVMContext &C, unsigned NumBits)
This static method is the primary way of constructing an IntegerType.
unsigned getBitWidth() const
Get the number of bits in this IntegerType.
void setNormalDest(BasicBlock *B)
This is an important class for using LLVM in a threaded context.
The landingpad instruction holds all of the information necessary to generate correct exception handl...
An instruction for reading from memory.
static unsigned getPointerOperandIndex()
Iterates through instructions in a set of blocks in reverse order from the first non-terminator.
LLVM_ABI MDNode * createBranchWeights(uint32_t TrueWeight, uint32_t FalseWeight, bool IsExpected=false)
Return metadata containing two branch weights.
std::pair< iterator, bool > insert(const std::pair< KeyT, ValueT > &KV)
A Module instance is used to store all the information related to an LLVM module.
void addIncoming(Value *V, BasicBlock *BB)
Add an incoming value to the end of the PHI list.
iterator_range< const_block_iterator > blocks() const
op_range incoming_values()
void setIncomingValue(unsigned i, Value *V)
Value * getIncomingValueForBlock(const BasicBlock *BB) const
BasicBlock * getIncomingBlock(unsigned i) const
Return incoming basic block number i.
Value * getIncomingValue(unsigned i) const
Return incoming value number x.
int getBasicBlockIndex(const BasicBlock *BB) const
Return the first index of the specified basic block in the value list for this PHI.
unsigned getNumIncomingValues() const
Return the number of incoming edges.
static PHINode * Create(Type *Ty, unsigned NumReservedValues, const Twine &NameStr="", InsertPosition InsertBefore=nullptr)
Constructors - NumReservedValues is a hint for the number of incoming edges that this phi node will h...
static LLVM_ABI PoisonValue * get(Type *T)
Static factory methods - Return an 'poison' object of the specified type.
Value * getValue() const
Convenience accessor.
Return a value (possibly void), from a function.
This class represents the LLVM 'select' instruction.
size_type size() const
Determine the number of elements in the SetVector.
void insert_range(Range &&R)
bool empty() const
Determine if the SetVector is empty or not.
bool insert(const value_type &X)
Insert a new element into the SetVector.
A templated base class for SmallPtrSet which provides the typesafe interface that is common across al...
bool erase(PtrType Ptr)
Remove pointer from the set.
size_type count(ConstPtrType Ptr) const
count - Return 1 if the specified pointer is in the set, 0 otherwise.
void insert_range(Range &&R)
std::pair< iterator, bool > insert(PtrType Ptr)
Inserts Ptr if and only if there is no element in the container equal to Ptr.
bool contains(ConstPtrType Ptr) const
SmallPtrSet - This class implements a set which is optimized for holding SmallSize or less elements.
A SetVector that performs no allocations if smaller than a certain size.
SmallSet - This maintains a set of unique values, optimizing for the case when the set is small (less...
std::pair< const_iterator, bool > insert(const T &V)
insert - Insert an element into the set if it isn't already there.
This class consists of common code factored out of the SmallVector class to reduce code duplication b...
void assign(size_type NumElts, ValueParamT Elt)
reference emplace_back(ArgTypes &&... Args)
void reserve(size_type N)
void push_back(const T &Elt)
This is a 'vector' (really, a variable-sized array), optimized for the case when the array is small.
An instruction for storing to memory.
AtomicOrdering getOrdering() const
Returns the ordering constraint of this store instruction.
Value * getValueOperand()
static unsigned getPointerOperandIndex()
SyncScope::ID getSyncScopeID() const
Returns the synchronization scope ID of this store instruction.
Value * getPointerOperand()
Represent a constant reference to a string, i.e.
A wrapper class to simplify modification of SwitchInst cases along with their prof branch_weights met...
LLVM_ABI void setSuccessorWeight(unsigned idx, CaseWeightOpt W)
LLVM_ABI void addCase(ConstantInt *OnVal, BasicBlock *Dest, CaseWeightOpt W)
Delegate the call to the underlying SwitchInst::addCase() and set the specified branch weight for the...
LLVM_ABI CaseWeightOpt getSuccessorWeight(unsigned idx)
LLVM_ABI void replaceDefaultDest(SwitchInst::CaseIt I)
Replace the default destination by given case.
std::optional< uint32_t > CaseWeightOpt
LLVM_ABI SwitchInst::CaseIt removeCase(SwitchInst::CaseIt I)
Delegate the call to the underlying SwitchInst::removeCase() and remove correspondent branch weight.
CaseIt case_end()
Returns a read/write iterator that points one past the last in the SwitchInst.
BasicBlock * getSuccessor(unsigned idx) const
void setCondition(Value *V)
LLVM_ABI void addCase(ConstantInt *OnVal, BasicBlock *Dest)
Add an entry to the switch instruction.
CaseIteratorImpl< CaseHandle > CaseIt
void setSuccessor(unsigned idx, BasicBlock *NewSucc)
unsigned getNumSuccessors() const
Twine - A lightweight data structure for efficiently representing the concatenation of temporary valu...
The instances of the Type class are immutable: once they are created, they are never changed.
bool isPointerTy() const
True if this is an instance of PointerType.
LLVM_ABI TypeSize getPrimitiveSizeInBits() const LLVM_READONLY
Return the basic size of this type if it is a primitive type.
static LLVM_ABI IntegerType * getInt1Ty(LLVMContext &C)
bool isIntegerTy() const
True if this is an instance of IntegerType.
Unconditional Branch instruction.
void setSuccessor(BasicBlock *NewSucc)
static UncondBrInst * Create(BasicBlock *Target, InsertPosition InsertBefore=nullptr)
BasicBlock * getSuccessor(unsigned i=0) const
'undef' values are things that do not have specified contents.
This function has undefined behavior.
A Use represents the edge between a Value definition and its users.
LLVM_ABI unsigned getOperandNo() const
Return the operand # of this use in its User.
LLVM_ABI void set(Value *Val)
User * getUser() const
Returns the User that contains this Use.
const Use & getOperandUse(unsigned i) const
void setOperand(unsigned i, Value *Val)
LLVM_ABI bool replaceUsesOfWith(Value *From, Value *To)
Replace uses of one Value with another.
Value * getOperand(unsigned i) const
unsigned getNumOperands() const
LLVM Value Representation.
Type * getType() const
All values are typed, get the type of this value.
static constexpr uint64_t MaximumAlignment
LLVM_ABI Value(Type *Ty, unsigned scid)
LLVM_ABI void setName(const Twine &Name)
Change the name of the value.
bool hasOneUse() const
Return true if there is exactly one use of this value.
LLVM_ABI void replaceAllUsesWith(Value *V)
Change all uses of this to point to a new Value.
LLVMContext & getContext() const
All values hold a context through their type.
iterator_range< user_iterator > users()
iterator_range< use_iterator > uses()
LLVM_ABI StringRef getName() const
Return a constant reference to the value's name.
LLVM_ABI void takeName(Value *V)
Transfer the name from V to this value.
Represents an op.with.overflow intrinsic.
const ParentTy * getParent() const
self_iterator getIterator()
NodeTy * getNextNode()
Get the next node, or nullptr for the list tail.
A range adaptor for a pair of iterators.
#define llvm_unreachable(msg)
Marks that the current location is not supposed to be reachable.
constexpr std::underlying_type_t< E > Mask()
Get a bitmask with 1s in all places up to the high-order bit of E's largest value.
@ C
The default llvm calling convention, compatible with C.
@ BasicBlock
Various leaf nodes.
BinaryOp_match< SrcTy, SpecificConstantMatch, TargetOpcode::G_XOR, true > m_Not(const SrcTy &&Src)
Matches a register not-ed by a G_XOR.
OneUse_match< SubPat > m_OneUse(const SubPat &SP)
Predicate
Predicate - These are "(BI << 5) | BO" for various predicates.
match_combine_or< Ty... > m_CombineOr(const Ty &...Ps)
Combine pattern matchers matching any of Ps patterns.
BinaryOp_match< LHS, RHS, Instruction::And > m_And(const LHS &L, const RHS &R)
auto m_Cmp()
Matches any compare instruction and ignore it.
BinaryOp_match< LHS, RHS, Instruction::Add > m_Add(const LHS &L, const RHS &R)
ap_match< APInt > m_APInt(const APInt *&Res)
Match a ConstantInt or splatted ConstantVector, binding the specified pointer to the contained APInt.
bool match(Val *V, const Pattern &P)
match_bind< Instruction > m_Instruction(Instruction *&I)
Match an instruction, capturing it if we match.
auto m_UMin(const Opnd0 &Op0, const Opnd1 &Op1)
specificval_ty m_Specific(const Value *V)
Match if we have a specific specified value.
auto m_BinOp()
Match an arbitrary binary operation and ignore it.
ExtractValue_match< Ind, Val_t > m_ExtractValue(const Val_t &V)
Match a single index ExtractValue instruction.
auto m_Value()
Match an arbitrary value and ignore it.
auto m_LogicalOr()
Matches L || R where L and R are arbitrary values.
ThreeOps_match< decltype(m_Value()), LHS, RHS, Instruction::Select, true > m_c_Select(const LHS &L, const RHS &R)
Match Select(C, LHS, RHS) or Select(C, RHS, LHS)
match_bind< WithOverflowInst > m_WithOverflowInst(WithOverflowInst *&I)
Match a with overflow intrinsic, capturing it if we match.
match_immconstant_ty m_ImmConstant()
Match an arbitrary immediate Constant and ignore it.
NoWrapTrunc_match< OpTy, TruncInst::NoUnsignedWrap > m_NUWTrunc(const OpTy &Op)
Matches trunc nuw.
CmpClass_match< LHS, RHS, ICmpInst > m_ICmp(CmpPredicate &Pred, const LHS &L, const RHS &R)
auto m_LogicalAnd()
Matches L && R where L and R are arbitrary values.
BinaryOp_match< LHS, RHS, Instruction::Or > m_Or(const LHS &L, const RHS &R)
auto m_ConstantInt()
Match an arbitrary ConstantInt and ignore it.
SmallVector< DbgVariableRecord * > getDVRAssignmentMarkers(const Instruction *Inst)
Return a range of dbg_assign records for which Inst performs the assignment they encode.
LLVM_ABI void deleteAssignmentMarkers(const Instruction *Inst)
Delete the llvm.dbg.assign intrinsics linked to Inst.
initializer< Ty > init(const Ty &Val)
DXILDebugInfoMap run(Module &M)
@ User
could "use" a pointer
NodeAddr< UseNode * > Use
NodeAddr< FuncNode * > Func
Context & getContext() const
friend class Instruction
Iterator for Instructions in a `BasicBlock.
This is an optimization pass for GlobalISel generic memory operations.
auto drop_begin(T &&RangeOrContainer, size_t N=1)
Return a range covering RangeOrContainer with the first N elements excluded.
detail::zippy< detail::zip_shortest, T, U, Args... > zip(T &&t, U &&u, Args &&...args)
zip iterator for two or more iteratable types.
bool operator<(int64_t V1, const APSInt &V2)
constexpr auto not_equal_to(T &&Arg)
Functor variant of std::not_equal_to that can be used as a UnaryPredicate in functional algorithms li...
LLVM_ABI bool foldBranchToCommonDest(CondBrInst *BI, llvm::DomTreeUpdater *DTU=nullptr, MemorySSAUpdater *MSSAU=nullptr, const TargetTransformInfo *TTI=nullptr, AssumptionCache *AC=nullptr, unsigned BonusInstThreshold=1)
If this basic block is ONLY a setcc and a branch, and if a predecessor branches to us and one of our ...
auto find(R &&Range, const T &Val)
Provide wrappers to std::find which take ranges instead of having to pass begin/end explicitly.
LLVM_ABI cl::opt< bool > ProfcheckDisableMetadataFixes
bool all_of(R &&range, UnaryPredicate P)
Provide wrappers to std::all_of which take ranges instead of having to pass begin/end explicitly.
LLVM_ABI bool RecursivelyDeleteTriviallyDeadInstructions(Value *V, const TargetLibraryInfo *TLI=nullptr, MemorySSAUpdater *MSSAU=nullptr, std::function< void(Value *)> AboutToDeleteCallback=std::function< void(Value *)>())
If the specified value is a trivially dead instruction, delete it.
bool succ_empty(const Instruction *I)
LLVM_ABI bool IsBlockFollowedByDeoptOrUnreachable(const BasicBlock *BB)
Check if we can prove that all paths starting from this block converge to a block that either has a @...
LLVM_ABI bool ConstantFoldTerminator(BasicBlock *BB, bool DeleteDeadConditions=false, const TargetLibraryInfo *TLI=nullptr, DomTreeUpdater *DTU=nullptr)
If a terminator instruction is predicated on a constant value, convert it into an unconditional branc...
static cl::opt< unsigned > MaxSwitchCasesPerResult("max-switch-cases-per-result", cl::Hidden, cl::init(16), cl::desc("Limit cases to analyze when converting a switch to select"))
RelativeUniformCounterPtr Values
static cl::opt< bool > SpeculateOneExpensiveInst("speculate-one-expensive-inst", cl::Hidden, cl::init(true), cl::desc("Allow exactly one expensive instruction to be speculatively " "executed"))
auto pred_end(const MachineBasicBlock *BB)
void set_intersect(S1Ty &S1, const S2Ty &S2)
set_intersect(A, B) - Compute A := A ^ B Identical to set_intersection, except that it works on set<>...
LLVM_ABI void setExplicitlyUnknownBranchWeightsIfProfiled(Instruction &I, StringRef PassName, const Function *F=nullptr)
Like setExplicitlyUnknownBranchWeights(...), but only sets unknown branch weights in the new instruct...
decltype(auto) dyn_cast(const From &Val)
dyn_cast<X> - Return the argument parameter cast to the specified type.
auto successors(const MachineBasicBlock *BB)
auto accumulate(R &&Range, E &&Init)
Wrapper for std::accumulate.
constexpr from_range_t from_range
iterator_range< T > make_range(T x, T y)
Convenience function for iterating over sub-ranges.
LLVM_ABI MDNode * getBranchWeightMDNode(const Instruction &I)
Get the branch weights metadata node.
constexpr bool isUIntN(unsigned N, uint64_t x)
Checks if an unsigned integer fits into the given (dynamic) bit width.
LLVM_ABI Constant * ConstantFoldCompareInstOperands(unsigned Predicate, Constant *LHS, Constant *RHS, const DataLayout &DL, const TargetLibraryInfo *TLI=nullptr, const Instruction *I=nullptr)
Attempt to constant fold a compare instruction (icmp/fcmp) with the specified operands.
iterator_range< early_inc_iterator_impl< detail::IterOfRange< RangeT > > > make_early_inc_range(RangeT &&Range)
Make a range that does early increment to allow mutation of the underlying range without disrupting i...
Align getLoadStoreAlignment(const Value *I)
A helper function that returns the alignment of load or store instruction.
LLVM_ABI void DeleteDeadBlock(BasicBlock *BB, DomTreeUpdater *DTU=nullptr, bool KeepOneInputPHIs=false)
Delete the specified block, which must have no predecessors.
LLVM_ABI bool isSafeToSpeculativelyExecute(const Instruction *I, const Instruction *CtxI=nullptr, AssumptionCache *AC=nullptr, const DominatorTree *DT=nullptr, const TargetLibraryInfo *TLI=nullptr, bool UseVariableInfo=true, bool IgnoreUBImplyingAttrs=true)
Return true if the instruction does not have any effects besides calculating the result and does not ...
auto unique(Range &&R, Predicate P)
static cl::opt< unsigned > MaxSpeculationDepth("max-speculation-depth", cl::Hidden, cl::init(10), cl::desc("Limit maximum recursion depth when calculating costs of " "speculatively executed instructions"))
OutputIt copy_if(R &&Range, OutputIt Out, UnaryPredicate P)
Provide wrappers to std::copy_if which take ranges instead of having to pass begin/end explicitly.
static cl::opt< unsigned > PHINodeFoldingThreshold("phi-node-folding-threshold", cl::Hidden, cl::init(2), cl::desc("Control the amount of phi node folding to perform (default = 2)"))
bool operator==(const AddressRangeValuePair &LHS, const AddressRangeValuePair &RHS)
static cl::opt< bool > MergeCondStoresAggressively("simplifycfg-merge-cond-stores-aggressively", cl::Hidden, cl::init(false), cl::desc("When merging conditional stores, do so even if the resultant " "basic blocks are unlikely to be if-converted as a result"))
constexpr int popcount(T Value) noexcept
Count the number of set bits in a value.
LLVM_ABI ConstantRange getConstantRangeFromMetadata(const MDNode &RangeMD)
Parse out a conservative ConstantRange from !range metadata.
auto map_range(ContainerTy &&C, FuncTy F)
Return a range that applies F to the elements of C.
static cl::opt< unsigned > BranchFoldThreshold("simplifycfg-branch-fold-threshold", cl::Hidden, cl::init(2), cl::desc("Maximum cost of combining conditions when " "folding branches"))
RelativeUniformCounterPtr ValuesPtrExpr VTableAddr Value
uint64_t PowerOf2Ceil(uint64_t A)
Returns the power of two which is greater than or equal to the given value.
int countr_zero(T Val)
Count number of 0's from the least significant bit to the most stopping at the first 1.
LLVM_ABI Value * simplifyInstruction(Instruction *I, const SimplifyQuery &Q)
See if we can compute a simplified version of this instruction.
LLVM_ABI void setBranchWeights(Instruction &I, ArrayRef< uint32_t > Weights, bool IsExpected, bool ElideAllZero=false)
Create a new branch_weights metadata node and add or overwrite a prof metadata reference to instructi...
static cl::opt< bool > SinkCommon("simplifycfg-sink-common", cl::Hidden, cl::init(true), cl::desc("Sink common instructions down to the end block"))
void erase(Container &C, ValueType V)
Wrapper function to remove a value from a container:
constexpr bool has_single_bit(T Value) noexcept
static cl::opt< bool > HoistStoresWithCondFaulting("simplifycfg-hoist-stores-with-cond-faulting", cl::Hidden, cl::init(true), cl::desc("Hoist stores if the target supports conditional faulting"))
bool any_of(R &&range, UnaryPredicate P)
Provide wrappers to std::any_of which take ranges instead of having to pass begin/end explicitly.
constexpr detail::StaticCastFunc< To > StaticCastTo
Function objects corresponding to the Cast types defined above.
unsigned Log2_32(uint32_t Value)
Return the floor log base 2 of the specified value, -1 if the value is zero.
LLVM_ABI CondBrInst * GetIfCondition(BasicBlock *BB, BasicBlock *&IfTrue, BasicBlock *&IfFalse)
Check whether BB is the merge point of a if-region.
LLVM_ABI bool TryToSimplifyUncondBranchFromEmptyBlock(BasicBlock *BB, DomTreeUpdater *DTU=nullptr)
BB is known to contain an unconditional branch, and contains no instructions other than PHI nodes,...
void RemapDbgRecordRange(Module *M, iterator_range< DbgRecordIterator > Range, ValueToValueMapTy &VM, RemapFlags Flags=RF_None, ValueMapTypeRemapper *TypeMapper=nullptr, ValueMaterializer *Materializer=nullptr, const MetadataPredicate *IdentityMD=nullptr)
Remap the Values used in the DbgRecords Range using the value map VM.
LLVM_ABI void InvertBranch(CondBrInst *PBI, IRBuilderBase &Builder)
auto reverse(ContainerTy &&C)
constexpr bool isPowerOf2_32(uint32_t Value)
Return true if the argument is a power of two > 0.
LLVM_ABI bool impliesPoison(const Value *ValAssumedPoison, const Value *V)
Return true if V is poison given that ValAssumedPoison is already poison.
void sort(IteratorTy Start, IteratorTy End)
static cl::opt< bool > EnableMergeCompatibleInvokes("simplifycfg-merge-compatible-invokes", cl::Hidden, cl::init(true), cl::desc("Allow SimplifyCFG to merge invokes together when appropriate"))
@ RF_IgnoreMissingLocals
If this flag is set, the remapper ignores missing function-local entries (Argument,...
@ RF_NoModuleLevelChanges
If this flag is set, the remapper knows that only local values within a function (such as an instruct...
LLVM_ABI void computeKnownBits(const Value *V, KnownBits &Known, const DataLayout &DL, AssumptionCache *AC=nullptr, const Instruction *CxtI=nullptr, const DominatorTree *DT=nullptr, bool UseInstrInfo=true, unsigned Depth=0)
Determine which bits of V are known to be either zero or one and return them in the KnownZero/KnownOn...
LLVM_ABI bool NullPointerIsDefined(const Function *F, unsigned AS=0)
Check whether null pointer dereferencing is considered undefined behavior for a given function or an ...
LLVM_ABI raw_ostream & dbgs()
dbgs() - This returns a reference to a raw_ostream for debugging messages.
bool none_of(R &&Range, UnaryPredicate P)
Provide wrappers to std::none_of which take ranges instead of having to pass begin/end explicitly.
auto make_first_range(ContainerTy &&c)
Given a container of pairs, return a range over the first elements.
LLVM_ABI bool collectPossibleValues(const Value *V, SmallPtrSetImpl< const Constant * > &Constants, unsigned MaxCount, bool AllowUndefOrPoison=true)
Enumerates all possible immediate values of V and inserts them into the set Constants.
LLVM_ABI Instruction * removeUnwindEdge(BasicBlock *BB, DomTreeUpdater *DTU=nullptr)
Replace 'BB's terminator with one that does not have an unwind successor block.
auto succ_size(const MachineBasicBlock *BB)
iterator_range< filter_iterator< detail::IterOfRange< RangeT >, PredicateT > > make_filter_range(RangeT &&Range, PredicateT Pred)
Convenience function that takes a range of elements and a predicate, and return a new filter_iterator...
class LLVM_GSL_OWNER SmallVector
Forward declaration of SmallVector so that calculateSmallVectorDefaultInlinedElements can reference s...
bool isa(const From &Val)
isa<X> - Return true if the parameter to the template is an instance of one of the template type argu...
static cl::opt< unsigned > MaxJumpThreadingLiveBlocks("max-jump-threading-live-blocks", cl::Hidden, cl::init(24), cl::desc("Limit number of blocks a define in a threaded block is allowed " "to be live in"))
RNSuccIterator< NodeRef, BlockT, RegionT > succ_begin(NodeRef Node)
LLVM_ABI void combineMetadataForCSE(Instruction *K, const Instruction *J, bool DoesKMove)
Combine the metadata of two instructions so that K can replace J.
iterator_range(Container &&) -> iterator_range< llvm::detail::IterOfRange< Container > >
auto drop_end(T &&RangeOrContainer, size_t N=1)
Return a range covering RangeOrContainer with the last N elements excluded.
static cl::opt< int > MaxSmallBlockSize("simplifycfg-max-small-block-size", cl::Hidden, cl::init(10), cl::desc("Max size of a block which is still considered " "small enough to thread through"))
LLVM_ABI BasicBlock * SplitBlockPredecessors(BasicBlock *BB, ArrayRef< BasicBlock * > Preds, const char *Suffix, DominatorTree *DT, LoopInfo *LI=nullptr, MemorySSAUpdater *MSSAU=nullptr, bool PreserveLCSSA=false)
This method introduces at least one new basic block into the function and moves some of the predecess...
LLVM_ABI bool isWidenableBranch(const User *U)
Returns true iff U is a widenable branch (that is, extractWidenableCondition returns widenable condit...
static cl::opt< unsigned > HoistCommonSkipLimit("simplifycfg-hoist-common-skip-limit", cl::Hidden, cl::init(20), cl::desc("Allow reordering across at most this many " "instructions when hoisting"))
IRBuilder(LLVMContext &, FolderTy, InserterTy, MDNode *, ArrayRef< OperandBundleDef >) -> IRBuilder< FolderTy, InserterTy >
LLVM_ABI cl::opt< bool > RequireAndPreserveDomTree
This function is used to do simplification of a CFG.
static cl::opt< bool > MergeCondStores("simplifycfg-merge-cond-stores", cl::Hidden, cl::init(true), cl::desc("Hoist conditional stores even if an unconditional store does not " "precede - hoist multiple conditional stores into a single " "predicated store"))
static cl::opt< unsigned > BranchFoldToCommonDestVectorMultiplier("simplifycfg-branch-fold-common-dest-vector-multiplier", cl::Hidden, cl::init(2), cl::desc("Multiplier to apply to threshold when determining whether or not " "to fold branch to common destination when vector operations are " "present"))
RNSuccIterator< NodeRef, BlockT, RegionT > succ_end(NodeRef Node)
LLVM_ABI bool MergeBlockIntoPredecessor(BasicBlock *BB, DomTreeUpdater *DTU=nullptr, LoopInfo *LI=nullptr, MemorySSAUpdater *MSSAU=nullptr, MemoryDependenceResults *MemDep=nullptr, bool PredecessorWithTwoSuccessors=false, DominatorTree *DT=nullptr)
Attempts to merge a block into its predecessor, if possible.
LLVM_ABI void hoistAllInstructionsInto(BasicBlock *DomBlock, Instruction *InsertPt, BasicBlock *BB)
Hoist all of the instructions in the IfBlock to the dominant block DomBlock, by moving its instructio...
@ Sub
Subtraction of integers.
LLVM_ABI BasicBlock * SplitBlock(BasicBlock *Old, BasicBlock::iterator SplitPt, DominatorTree *DT, LoopInfo *LI=nullptr, MemorySSAUpdater *MSSAU=nullptr, const Twine &BBName="")
Split the specified block at the specified instruction.
RelativeUniformCounterPtr ValuesPtrExpr VTableAddr Count
auto count(R &&Range, const E &Element)
Wrapper function around std::count to count the number of times an element Element occurs in the give...
void RemapInstruction(Instruction *I, ValueToValueMapTy &VM, RemapFlags Flags=RF_None, ValueMapTypeRemapper *TypeMapper=nullptr, ValueMaterializer *Materializer=nullptr, const MetadataPredicate *IdentityMD=nullptr)
Convert the instruction operands from referencing the current values into those specified by VM.
LLVM_ABI bool canReplaceOperandWithVariable(const Instruction *I, unsigned OpIdx)
Given an instruction, is it legal to set operand OpIdx to a non-constant value?
DWARFExpression::Operation Op
LLVM_ABI bool PointerMayBeCaptured(const Value *V, bool ReturnCaptures, unsigned MaxUsesToExplore=0)
PointerMayBeCaptured - Return true if this pointer value may be captured by the enclosing function (w...
LLVM_ABI bool FoldSingleEntryPHINodes(BasicBlock *BB, MemoryDependenceResults *MemDep=nullptr)
We know that BB has one predecessor.
LLVM_ABI bool isGuaranteedNotToBeUndefOrPoison(const Value *V, AssumptionCache *AC=nullptr, const Instruction *CtxI=nullptr, const DominatorTree *DT=nullptr, unsigned Depth=0)
Return true if this function can prove that V does not have undef bits and is never poison.
void RemapDbgRecord(Module *M, DbgRecord *DR, ValueToValueMapTy &VM, RemapFlags Flags=RF_None, ValueMapTypeRemapper *TypeMapper=nullptr, ValueMaterializer *Materializer=nullptr, const MetadataPredicate *IdentityMD=nullptr)
Remap the Values used in the DbgRecord DR using the value map VM.
ArrayRef(const T &OneElt) -> ArrayRef< T >
constexpr unsigned BitWidth
auto sum_of(R &&Range, E Init=E{0})
Returns the sum of all values in Range with Init initial value.
ValueMap< const Value *, WeakTrackingVH > ValueToValueMapTy
LLVM_ABI bool isGuaranteedToTransferExecutionToSuccessor(const Instruction *I)
Return true if this function can prove that the instruction I will always transfer execution to one o...
static cl::opt< bool > HoistCondStores("simplifycfg-hoist-cond-stores", cl::Hidden, cl::init(true), cl::desc("Hoist conditional stores if an unconditional store precedes"))
LLVM_ABI bool extractBranchWeights(const MDNode *ProfileData, SmallVectorImpl< uint32_t > &Weights)
Extract branch weights from MD_prof metadata.
LLVM_ABI bool simplifyCFG(BasicBlock *BB, const TargetTransformInfo &TTI, DomTreeUpdater *DTU=nullptr, const SimplifyCFGOptions &Options={}, ArrayRef< WeakVH > LoopHeaders={})
auto pred_begin(const MachineBasicBlock *BB)
decltype(auto) cast(const From &Val)
cast<X> - Return the argument parameter cast to the specified type.
auto find_if(R &&Range, UnaryPredicate P)
Provide wrappers to std::find_if which take ranges instead of having to pass begin/end explicitly.
void erase_if(Container &C, UnaryPredicate P)
Provide a container algorithm similar to C++ Library Fundamentals v2's erase_if which is equivalent t...
constexpr bool isIntN(unsigned N, int64_t x)
Checks if an signed integer fits into the given (dynamic) bit width.
auto predecessors(const MachineBasicBlock *BB)
static cl::opt< unsigned > HoistLoadsStoresWithCondFaultingThreshold("hoist-loads-stores-with-cond-faulting-threshold", cl::Hidden, cl::init(6), cl::desc("Control the maximal conditional load/store that we are willing " "to speculatively execute to eliminate conditional branch " "(default = 6)"))
static cl::opt< bool > HoistCommon("simplifycfg-hoist-common", cl::Hidden, cl::init(true), cl::desc("Hoist common instructions up to the parent block"))
iterator_range< pointer_iterator< WrappedIteratorT > > make_pointer_range(RangeT &&Range)
LLVM_ABI unsigned ComputeMaxSignificantBits(const Value *Op, const DataLayout &DL, AssumptionCache *AC=nullptr, const Instruction *CxtI=nullptr, const DominatorTree *DT=nullptr, unsigned Depth=0)
Get the upper bound on bit size for this Value Op as a signed integer.
bool is_contained(R &&Range, const E &Element)
Returns true if Element is found in Range.
static cl::opt< unsigned > TwoEntryPHINodeFoldingThreshold("two-entry-phi-node-folding-threshold", cl::Hidden, cl::init(4), cl::desc("Control the maximal total instruction cost that we are willing " "to speculatively execute to fold a 2-entry PHI node into a " "select (default = 4)"))
Type * getLoadStoreType(const Value *I)
A helper function that returns the type of a load or store instruction.
PointerUnion< const Value *, const PseudoSourceValue * > ValueType
SmallVector< uint64_t, 2 > getDisjunctionWeights(const SmallVector< T1, 2 > &B1, const SmallVector< T2, 2 > &B2)
Get the branch weights of a branch conditioned on b1 || b2, where b1 and b2 are 2 booleans that are t...
bool pred_empty(const BasicBlock *BB)
LLVM_ABI Constant * ConstantFoldCastInstruction(unsigned opcode, Constant *V, Type *DestTy)
LLVM_ABI Instruction * SplitBlockAndInsertIfThen(Value *Cond, BasicBlock::iterator SplitBefore, bool Unreachable, MDNode *BranchWeights=nullptr, DomTreeUpdater *DTU=nullptr, LoopInfo *LI=nullptr, BasicBlock *ThenBlock=nullptr)
Split the containing block at the specified instruction - everything before SplitBefore stays in the ...
LLVM_ABI std::optional< bool > isImpliedByDomCondition(const Value *Cond, const Instruction *ContextI, const DataLayout &DL)
Return the boolean condition value in the context of the given instruction if it is known based on do...
auto seq(T Begin, T End)
Iterate over an integral type from Begin up to - but not including - End.
void array_pod_sort(IteratorTy Start, IteratorTy End)
array_pod_sort - This sorts an array with the specified start and end extent.
LLVM_ABI bool hasBranchWeightMD(const Instruction &I)
Checks if an instructions has Branch Weight Metadata.
hash_code hash_combine(const Ts &...args)
Combine values into a single hash_code.
LLVM_ABI bool isDereferenceablePointer(const Value *V, Type *Ty, const SimplifyQuery &Q, bool IgnoreFree=false)
Equivalent to isDereferenceableAndAlignedPointer with an alignment of 1.
bool equal(L &&LRange, R &&RRange)
Wrapper function around std::equal to detect if pair-wise elements between two ranges are the same.
static cl::opt< bool > HoistLoadsWithCondFaulting("simplifycfg-hoist-loads-with-cond-faulting", cl::Hidden, cl::init(true), cl::desc("Hoist loads if the target supports conditional faulting"))
LLVM_ABI Constant * ConstantFoldInstOperands(const Instruction *I, ArrayRef< Constant * > Ops, const DataLayout &DL, const TargetLibraryInfo *TLI=nullptr, bool AllowNonDeterministic=true)
ConstantFoldInstOperands - Attempt to constant fold an instruction with the specified operands.
LLVM_ABI void setFittedBranchWeights(Instruction &I, ArrayRef< uint64_t > Weights, bool IsExpected, bool ElideAllZero=false)
Variant of setBranchWeights where the Weights will be fit first to uint32_t by shifting right.
LLVM_ABI const Value * getUnderlyingObject(const Value *V, unsigned MaxLookup=MaxLookupSearchDepth)
This method strips off any GEP address adjustments, pointer casts or llvm.threadlocal....
LLVM_ABI Constant * ConstantFoldIntegerCast(Constant *C, Type *DestTy, bool IsSigned, const DataLayout &DL)
Constant fold a zext, sext or trunc, depending on IsSigned and whether the DestTy is wider or narrowe...
bool capturesNothing(CaptureComponents CC)
static auto filterDbgVars(iterator_range< simple_ilist< DbgRecord >::iterator > R)
Filter the DbgRecord range to DbgVariableRecord types only and downcast.
LLVM_ABI bool EliminateDuplicatePHINodes(BasicBlock *BB)
Check for and eliminate duplicate PHI nodes in this block.
@ Keep
No function return thunk.
constexpr detail::IsaCheckPredicate< Types... > IsaPred
Function object wrapper for the llvm::isa type check.
LLVM_ABI void RemapSourceAtom(Instruction *I, ValueToValueMapTy &VM)
Remap source location atom.
hash_code hash_combine_range(InputIteratorT first, InputIteratorT last)
Compute a hash_code for a sequence of values.
LLVM_ABI bool isWritableObject(const Value *Object, bool &ExplicitlyDereferenceableOnly)
Return true if the Object is writable, in the sense that any location based on this pointer that can ...
LLVM_ABI void mapAtomInstance(const DebugLoc &DL, ValueToValueMapTy &VMap)
Mark a cloned instruction as a new instance so that its source loc can be updated when remapped.
constexpr uint64_t NextPowerOf2(uint64_t A)
Returns the next power of two (in 64-bits) that is strictly greater than A.
LLVM_ABI void extractFromBranchWeightMD64(const MDNode *ProfileData, SmallVectorImpl< uint64_t > &Weights)
Faster version of extractBranchWeights() that skips checks and must only be called with "branch_weigh...
LLVM_ABI ConstantRange computeConstantRange(const Value *V, bool ForSigned, const SimplifyQuery &SQ, unsigned Depth=0)
Determine the possible constant range of an integer or vector of integer value.
void swap(llvm::BitVector &LHS, llvm::BitVector &RHS)
Implement std::swap in terms of BitVector swap.
SmallVectorImpl< ConstantInt * > * Cases
SmallVectorImpl< ConstantInt * > * OtherCases
Checking whether two BBs are equal depends on the contents of the BasicBlock and the incoming values ...
SmallDenseMap< BasicBlock *, Value *, 8 > BB2ValueMap
DenseMap< PHINode *, BB2ValueMap > Phi2IVsMap
static bool canBeMerged(const BasicBlock *BB)
static bool isEqual(const EqualBBWrapper *LHS, const EqualBBWrapper *RHS)
static unsigned getHashValue(const EqualBBWrapper *EBW)
An information struct used to provide DenseMap with the various necessary components for a given valu...
unsigned getBitWidth() const
Get the bit width of this value.
unsigned countMaxActiveBits() const
Returns the maximum number of bits needed to represent all possible unsigned values with these known ...
APInt getMaxValue() const
Return the maximal unsigned value possible given these KnownBits.
A MapVector that performs no allocations if smaller than a certain size.