97#define DEBUG_TYPE "simplifycfg"
102 "simplifycfg-require-and-preserve-domtree",
cl::Hidden,
105 "Temporary development switch used to gradually uplift SimplifyCFG "
106 "into preserving DomTree,"));
115 "Control the amount of phi node folding to perform (default = 2)"));
119 cl::desc(
"Control the maximal total instruction cost that we are willing "
120 "to speculatively execute to fold a 2-entry PHI node into a "
121 "select (default = 4)"));
125 cl::desc(
"Hoist common instructions up to the parent block"));
129 cl::desc(
"Hoist loads if the target supports conditional faulting"));
133 cl::desc(
"Hoist stores if the target supports conditional faulting"));
137 cl::desc(
"Control the maximal conditional load/store that we are willing "
138 "to speculatively execute to eliminate conditional branch "
144 cl::desc(
"Allow reordering across at most this many "
145 "instructions when hoisting"));
149 cl::desc(
"Sink common instructions down to the end block"));
153 cl::desc(
"Hoist conditional stores if an unconditional store precedes"));
157 cl::desc(
"Hoist conditional stores even if an unconditional store does not "
158 "precede - hoist multiple conditional stores into a single "
159 "predicated store"));
163 cl::desc(
"When merging conditional stores, do so even if the resultant "
164 "basic blocks are unlikely to be if-converted as a result"));
168 cl::desc(
"Allow exactly one expensive instruction to be speculatively "
173 cl::desc(
"Limit maximum recursion depth when calculating costs of "
174 "speculatively executed instructions"));
179 cl::desc(
"Max size of a block which is still considered "
180 "small enough to thread through"));
186 cl::desc(
"Maximum cost of combining conditions when "
187 "folding branches"));
190 "simplifycfg-branch-fold-common-dest-vector-multiplier",
cl::Hidden,
192 cl::desc(
"Multiplier to apply to threshold when determining whether or not "
193 "to fold branch to common destination when vector operations are "
198 cl::desc(
"Allow SimplifyCFG to merge invokes together when appropriate"));
202 cl::desc(
"Limit cases to analyze when converting a switch to select"));
206 cl::desc(
"Limit number of blocks a define in a threaded block is allowed "
213STATISTIC(NumBitMaps,
"Number of switch instructions turned into bitmaps");
215 "Number of switch instructions turned into linear mapping");
217 "Number of switch instructions turned into lookup tables");
219 NumLookupTablesHoles,
220 "Number of switch instructions turned into lookup tables (holes checked)");
221STATISTIC(NumTableCmpReuses,
"Number of reused switch table lookup compares");
223 "Number of value comparisons folded into predecessor basic blocks");
225 "Number of branches folded into predecessor basic block");
228 "Number of common instruction 'blocks' hoisted up to the begin block");
230 "Number of common instructions hoisted up to the begin block");
232 "Number of common instruction 'blocks' sunk down to the end block");
234 "Number of common instructions sunk down to the end block");
235STATISTIC(NumSpeculations,
"Number of speculative executed instructions");
237 "Number of invokes with empty resume blocks simplified into calls");
238STATISTIC(NumInvokesMerged,
"Number of invokes that were merged together");
239STATISTIC(NumInvokeSetsFormed,
"Number of invoke sets that were formed");
246using SwitchCaseResultVectorTy =
255struct ValueEqualityComparisonCase {
267 bool operator==(BasicBlock *RHSDest)
const {
return Dest == RHSDest; }
270class SimplifyCFGOpt {
271 const TargetTransformInfo &TTI;
273 const DataLayout &DL;
275 const SimplifyCFGOptions &Options;
278 Value *isValueEqualityComparison(Instruction *TI);
280 Instruction *TI, std::vector<ValueEqualityComparisonCase> &Cases);
281 bool simplifyEqualityComparisonWithOnlyPredecessor(Instruction *TI,
284 bool performValueComparisonIntoPredecessorFolding(Instruction *TI,
Value *&CV,
287 bool foldValueComparisonIntoPredecessors(Instruction *TI,
290 bool simplifyResume(ResumeInst *RI,
IRBuilder<> &Builder);
291 bool simplifySingleResume(ResumeInst *RI);
292 bool simplifyCommonResume(ResumeInst *RI);
293 bool simplifyCleanupReturn(CleanupReturnInst *RI);
294 bool simplifyUnreachable(UnreachableInst *UI);
295 bool simplifySwitch(SwitchInst *SI,
IRBuilder<> &Builder);
296 bool simplifyDuplicateSwitchArms(SwitchInst *SI, DomTreeUpdater *DTU);
297 bool simplifyIndirectBr(IndirectBrInst *IBI);
298 bool simplifyUncondBranch(UncondBrInst *BI,
IRBuilder<> &Builder);
299 bool simplifyCondBranch(CondBrInst *BI,
IRBuilder<> &Builder);
300 bool foldCondBranchOnValueKnownInPredecessor(BranchInst *BI);
302 bool tryToSimplifyUncondBranchWithICmpInIt(ICmpInst *ICI,
304 bool tryToSimplifyUncondBranchWithICmpSelectInIt(ICmpInst *ICI,
307 bool hoistCommonCodeFromSuccessors(Instruction *TI,
bool AllInstsEqOnly);
308 bool hoistSuccIdenticalTerminatorToSwitchOrIf(
309 Instruction *TI, Instruction *I1,
310 SmallVectorImpl<Instruction *> &OtherSuccTIs,
312 bool speculativelyExecuteBB(BranchInst *BI, BasicBlock *ThenBB);
313 bool simplifyTerminatorOnSelect(Instruction *OldTerm,
Value *
Cond,
314 BasicBlock *TrueBB, BasicBlock *FalseBB,
315 uint32_t TrueWeight, uint32_t FalseWeight);
316 bool simplifyBranchOnICmpChain(BranchInst *BI,
IRBuilder<> &Builder,
317 const DataLayout &DL);
318 bool simplifySwitchOnSelect(SwitchInst *SI, SelectInst *
Select);
319 bool simplifyIndirectBrOnSelect(IndirectBrInst *IBI, SelectInst *SI);
320 bool turnSwitchRangeIntoICmp(SwitchInst *SI,
IRBuilder<> &Builder);
323 SimplifyCFGOpt(
const TargetTransformInfo &TTI, DomTreeUpdater *DTU,
325 const SimplifyCFGOptions &Opts)
326 : TTI(TTI), DTU(DTU), DL(DL), LoopHeaders(LoopHeaders), Options(Opts) {
327 assert((!DTU || !DTU->hasPostDomTree()) &&
328 "SimplifyCFG is not yet capable of maintaining validity of a "
329 "PostDomTree, so don't ask for it.");
332 bool simplifyOnce(BasicBlock *BB);
333 bool run(BasicBlock *BB);
336 bool requestResimplify() {
346isSelectInRoleOfConjunctionOrDisjunction(
const SelectInst *
SI) {
366 "Only for a pair of incoming blocks at the time!");
372 Value *IV0 = PN.getIncomingValueForBlock(IncomingBlocks[0]);
373 Value *IV1 = PN.getIncomingValueForBlock(IncomingBlocks[1]);
376 if (EquivalenceSet && EquivalenceSet->contains(IV0) &&
377 EquivalenceSet->contains(IV1))
400 if (!SI1Succs.
count(Succ))
406 FailBlocks->insert(Succ);
422 PN.addIncoming(PN.getIncomingValueForBlock(ExistPred), NewPred);
424 if (
auto *MPhi = MSSAU->getMemorySSA()->getMemoryAccess(Succ))
425 MPhi->addIncoming(MPhi->getIncomingValueForBlock(ExistPred), NewPred);
487 if (AggressiveInsts.
count(
I))
503 ZeroCostInstructions.
insert(OverflowInst);
505 }
else if (!ZeroCostInstructions.
contains(
I))
521 for (
Use &
Op :
I->operands())
523 TTI, AC, ZeroCostInstructions,
Depth + 1))
540 if (
DL.hasUnstableRepresentation(V->getType()))
549 return ConstantInt::get(IntPtrTy, 0);
554 if (CE->getOpcode() == Instruction::IntToPtr)
578struct ConstantComparesGatherer {
579 const DataLayout &DL;
582 Value *CompValue =
nullptr;
585 Value *Extra =
nullptr;
591 unsigned UsedICmps = 0;
597 bool IgnoreFirstMatch =
false;
598 bool MultipleMatches =
false;
601 ConstantComparesGatherer(Instruction *
Cond,
const DataLayout &DL) : DL(DL) {
603 if (CompValue || !MultipleMatches)
608 IgnoreFirstMatch =
true;
612 ConstantComparesGatherer(
const ConstantComparesGatherer &) =
delete;
613 ConstantComparesGatherer &
614 operator=(
const ConstantComparesGatherer &) =
delete;
619 bool setValueOnce(
Value *NewVal) {
620 if (IgnoreFirstMatch) {
621 IgnoreFirstMatch =
false;
624 if (CompValue && CompValue != NewVal) {
625 MultipleMatches =
true;
639 bool matchInstruction(Instruction *
I,
bool isEQ) {
646 if (!setValueOnce(Val))
666 if (ICI->
getPredicate() == (isEQ ? ICmpInst::ICMP_EQ : ICmpInst::ICMP_NE)) {
710 if (
Mask.isPowerOf2() && (
C->getValue() & ~Mask) ==
C->getValue()) {
712 if (!setValueOnce(RHSVal))
717 ConstantInt::get(
C->getContext(),
718 C->getValue() | Mask));
733 if (
Mask.isPowerOf2() && (
C->getValue() | Mask) ==
C->getValue()) {
735 if (!setValueOnce(RHSVal))
739 Vals.push_back(ConstantInt::get(
C->getContext(),
740 C->getValue() & ~Mask));
761 Value *CandidateVal =
I->getOperand(0);
764 CandidateVal = RHSVal;
779 if (!setValueOnce(CandidateVal))
785 Vals.push_back(ConstantInt::get(
I->getContext(), Tmp));
797 void gather(
Value *V) {
806 SmallVector<Value *, 8> DFT{Op0, Op1};
807 SmallPtrSet<Value *, 8> Visited{
V, Op0, Op1};
809 while (!DFT.
empty()) {
816 if (Visited.
insert(Op1).second)
818 if (Visited.
insert(Op0).second)
825 if (matchInstruction(
I, IsEq))
852 if (BI->isConditional())
870 if (!
SI->getParent()->hasNPredecessorsOrMore(128 /
SI->getNumSuccessors()))
871 CV =
SI->getCondition();
873 if (BI->isConditional() && BI->getCondition()->hasOneUse()) {
878 if (Trunc->hasNoUnsignedWrap())
879 CV = Trunc->getOperand(0);
886 Value *Ptr = PTII->getPointerOperand();
887 if (
DL.hasUnstableRepresentation(Ptr->
getType()))
889 if (PTII->getType() ==
DL.getIntPtrType(Ptr->
getType()))
898BasicBlock *SimplifyCFGOpt::getValueEqualityComparisonCases(
899 Instruction *TI, std::vector<ValueEqualityComparisonCase> &Cases) {
901 Cases.reserve(
SI->getNumCases());
902 for (
auto Case :
SI->cases())
903 Cases.push_back(ValueEqualityComparisonCase(Case.getCaseValue(),
904 Case.getCaseSuccessor()));
905 return SI->getDefaultDest();
910 ICmpInst::Predicate Pred;
916 Pred = ICmpInst::ICMP_NE;
921 Cases.push_back(ValueEqualityComparisonCase(
C, Succ));
929 std::vector<ValueEqualityComparisonCase> &Cases) {
935 std::vector<ValueEqualityComparisonCase> &C2) {
936 std::vector<ValueEqualityComparisonCase> *V1 = &C1, *V2 = &C2;
939 if (V1->size() > V2->size())
944 if (V1->size() == 1) {
947 for (
const ValueEqualityComparisonCase &
VECC : *V2)
948 if (TheVal ==
VECC.Value)
955 unsigned i1 = 0, i2 = 0, e1 = V1->size(), e2 = V2->size();
956 while (i1 != e1 && i2 != e2) {
972bool SimplifyCFGOpt::simplifyEqualityComparisonWithOnlyPredecessor(
973 Instruction *TI, BasicBlock *Pred,
IRBuilder<> &Builder) {
978 Value *ThisVal = isValueEqualityComparison(TI);
979 assert(ThisVal &&
"This isn't a value comparison!!");
980 if (ThisVal != PredVal)
987 std::vector<ValueEqualityComparisonCase> PredCases;
989 getValueEqualityComparisonCases(Pred->
getTerminator(), PredCases);
993 std::vector<ValueEqualityComparisonCase> ThisCases;
994 BasicBlock *ThisDef = getValueEqualityComparisonCases(TI, ThisCases);
1009 assert(ThisCases.size() == 1 &&
"Branch can only have one case!");
1015 ThisCases[0].Dest->removePredecessor(PredDef);
1018 <<
"Through successor TI: " << *TI <<
"Leaving: " << *NI
1025 {{DominatorTree::Delete, PredDef, ThisCases[0].Dest}});
1032 SmallPtrSet<Constant *, 16> DeadCases;
1033 for (
const ValueEqualityComparisonCase &Case : PredCases)
1034 DeadCases.
insert(Case.Value);
1037 <<
"Through successor TI: " << *TI);
1039 SmallDenseMap<BasicBlock *, int, 8> NumPerSuccessorCases;
1042 auto *
Successor = i->getCaseSuccessor();
1045 if (DeadCases.
count(i->getCaseValue())) {
1054 std::vector<DominatorTree::UpdateType> Updates;
1055 for (
const std::pair<BasicBlock *, int> &
I : NumPerSuccessorCases)
1057 Updates.push_back({DominatorTree::Delete, PredDef,
I.first});
1067 ConstantInt *TIV =
nullptr;
1069 for (
const auto &[
Value, Dest] : PredCases)
1075 assert(TIV &&
"No edge from pred to succ?");
1080 for (
const auto &[
Value, Dest] : ThisCases)
1088 TheRealDest = ThisDef;
1090 SmallPtrSet<BasicBlock *, 2> RemovedSuccs;
1095 if (Succ != CheckEdge) {
1096 if (Succ != TheRealDest)
1097 RemovedSuccs.
insert(Succ);
1100 CheckEdge =
nullptr;
1107 <<
"Through successor TI: " << *TI <<
"Leaving: " << *NI
1112 SmallVector<DominatorTree::UpdateType, 2> Updates;
1114 for (
auto *RemovedSucc : RemovedSuccs)
1115 Updates.
push_back({DominatorTree::Delete, TIBB, RemovedSucc});
1126struct ConstantIntOrdering {
1127 bool operator()(
const ConstantInt *
LHS,
const ConstantInt *
RHS)
const {
1128 return LHS->getValue().ult(
RHS->getValue());
1140 return LHS->getValue().ult(
RHS->getValue()) ? 1 : -1;
1149 assert(MD &&
"Invalid branch-weight metadata");
1174 if (BonusInst.isTerminator())
1204 NewBonusInst->
takeName(&BonusInst);
1205 BonusInst.setName(NewBonusInst->
getName() +
".old");
1206 VMap[&BonusInst] = NewBonusInst;
1215 assert(UI->getParent() == BB && BonusInst.comesBefore(UI) &&
1216 "If the user is not a PHI node, then it should be in the same "
1217 "block as, and come after, the original bonus instruction.");
1221 if (PN->getIncomingBlock(U) == BB)
1225 assert(PN->getIncomingBlock(U) == PredBlock &&
1226 "Not in block-closed SSA form?");
1227 U.set(NewBonusInst);
1237 if (!PredDL->getAtomGroup() &&
DL &&
DL->getAtomGroup() &&
1238 PredDL.isSameSourceLocation(
DL)) {
1245bool SimplifyCFGOpt::performValueComparisonIntoPredecessorFolding(
1253 std::vector<ValueEqualityComparisonCase> BBCases;
1254 BasicBlock *BBDefault = getValueEqualityComparisonCases(TI, BBCases);
1256 std::vector<ValueEqualityComparisonCase> PredCases;
1257 BasicBlock *PredDefault = getValueEqualityComparisonCases(PTI, PredCases);
1262 SmallMapVector<BasicBlock *, int, 8> NewSuccessors;
1265 SmallVector<uint64_t, 8> Weights;
1269 if (PredHasWeights) {
1272 if (Weights.
size() != 1 + PredCases.size())
1273 PredHasWeights = SuccHasWeights =
false;
1274 }
else if (SuccHasWeights)
1278 Weights.
assign(1 + PredCases.size(), 1);
1280 SmallVector<uint64_t, 8> SuccWeights;
1281 if (SuccHasWeights) {
1284 if (SuccWeights.
size() != 1 + BBCases.size())
1285 PredHasWeights = SuccHasWeights =
false;
1286 }
else if (PredHasWeights)
1287 SuccWeights.
assign(1 + BBCases.size(), 1);
1289 if (PredDefault == BB) {
1292 std::set<ConstantInt *, ConstantIntOrdering> PTIHandled;
1293 for (
unsigned i = 0, e = PredCases.size(); i != e; ++i)
1294 if (PredCases[i].Dest != BB)
1295 PTIHandled.insert(PredCases[i].
Value);
1298 std::swap(PredCases[i], PredCases.back());
1300 if (PredHasWeights || SuccHasWeights) {
1302 Weights[0] += Weights[i + 1];
1307 PredCases.pop_back();
1313 if (PredDefault != BBDefault) {
1315 if (DTU && PredDefault != BB)
1316 Updates.
push_back({DominatorTree::Delete, Pred, PredDefault});
1317 PredDefault = BBDefault;
1318 ++NewSuccessors[BBDefault];
1321 unsigned CasesFromPred = Weights.
size();
1322 uint64_t ValidTotalSuccWeight = 0;
1323 for (
unsigned i = 0, e = BBCases.size(); i != e; ++i)
1324 if (!PTIHandled.count(BBCases[i].Value) && BBCases[i].Dest != BBDefault) {
1325 PredCases.push_back(BBCases[i]);
1326 ++NewSuccessors[BBCases[i].Dest];
1327 if (SuccHasWeights || PredHasWeights) {
1331 Weights.
push_back(Weights[0] * SuccWeights[i + 1]);
1332 ValidTotalSuccWeight += SuccWeights[i + 1];
1336 if (SuccHasWeights || PredHasWeights) {
1337 ValidTotalSuccWeight += SuccWeights[0];
1339 for (
unsigned i = 1; i < CasesFromPred; ++i)
1340 Weights[i] *= ValidTotalSuccWeight;
1342 Weights[0] *= SuccWeights[0];
1348 std::set<ConstantInt *, ConstantIntOrdering> PTIHandled;
1349 std::map<ConstantInt *, uint64_t> WeightsForHandled;
1350 for (
unsigned i = 0, e = PredCases.size(); i != e; ++i)
1351 if (PredCases[i].Dest == BB) {
1352 PTIHandled.insert(PredCases[i].
Value);
1354 if (PredHasWeights || SuccHasWeights) {
1355 WeightsForHandled[PredCases[i].Value] = Weights[i + 1];
1360 std::swap(PredCases[i], PredCases.back());
1361 PredCases.pop_back();
1368 for (
const ValueEqualityComparisonCase &Case : BBCases)
1369 if (PTIHandled.count(Case.Value)) {
1371 if (PredHasWeights || SuccHasWeights)
1372 Weights.
push_back(WeightsForHandled[Case.Value]);
1373 PredCases.push_back(Case);
1374 ++NewSuccessors[Case.Dest];
1375 PTIHandled.erase(Case.Value);
1380 for (ConstantInt *
I : PTIHandled) {
1381 if (PredHasWeights || SuccHasWeights)
1383 PredCases.push_back(ValueEqualityComparisonCase(
I, BBDefault));
1384 ++NewSuccessors[BBDefault];
1391 SmallPtrSet<BasicBlock *, 2> SuccsOfPred;
1396 for (
const std::pair<BasicBlock *, int /*Num*/> &NewSuccessor :
1398 for (
auto I :
seq(NewSuccessor.second)) {
1402 if (DTU && !SuccsOfPred.
contains(NewSuccessor.first))
1403 Updates.
push_back({DominatorTree::Insert, Pred, NewSuccessor.first});
1410 "Should not end up here with unstable pointers");
1416 SwitchInst *NewSI = Builder.
CreateSwitch(CV, PredDefault, PredCases.size());
1418 for (ValueEqualityComparisonCase &V : PredCases)
1421 if (PredHasWeights || SuccHasWeights)
1433 if (!InfLoopBlock) {
1441 {DominatorTree::Insert, InfLoopBlock, InfLoopBlock});
1448 Updates.
push_back({DominatorTree::Insert, Pred, InfLoopBlock});
1450 Updates.
push_back({DominatorTree::Delete, Pred, BB});
1455 ++NumFoldValueComparisonIntoPredecessors;
1463bool SimplifyCFGOpt::foldValueComparisonIntoPredecessors(Instruction *TI,
1466 Value *CV = isValueEqualityComparison(TI);
1467 assert(CV &&
"Not a comparison?");
1472 while (!Preds.empty()) {
1481 Value *PCV = isValueEqualityComparison(PTI);
1485 SmallSetVector<BasicBlock *, 4> FailBlocks;
1487 for (
auto *Succ : FailBlocks) {
1493 performValueComparisonIntoPredecessorFolding(TI, CV, PTI, Builder);
1507 Value *BB1V = PN.getIncomingValueForBlock(BB1);
1508 Value *BB2V = PN.getIncomingValueForBlock(BB2);
1509 if (BB1V != BB2V && (BB1V == I1 || BB2V == I2)) {
1528 if (
I->mayReadFromMemory())
1560 if (CB->getIntrinsicID() == Intrinsic::experimental_deoptimize)
1568 if (J->getParent() == BB)
1590 if (C1->isMustTailCall() != C2->isMustTailCall())
1593 if (!
TTI.isProfitableToHoist(I1) || !
TTI.isProfitableToHoist(I2))
1599 if (CB1->cannotMerge() || CB1->isConvergent())
1602 if (CB2->cannotMerge() || CB2->isConvergent())
1617 if (!I1->hasDbgRecords())
1619 using CurrentAndEndIt =
1620 std::pair<DbgRecord::self_iterator, DbgRecord::self_iterator>;
1626 auto atEnd = [](
const CurrentAndEndIt &Pair) {
1627 return Pair.first == Pair.second;
1633 return Itrs[0].first->isIdenticalToWhenDefined(*
I);
1639 {I1->getDbgRecordRange().begin(), I1->getDbgRecordRange().end()});
1641 if (!
Other->hasDbgRecords())
1644 {
Other->getDbgRecordRange().begin(),
Other->getDbgRecordRange().end()});
1651 while (
none_of(Itrs, atEnd)) {
1652 bool HoistDVRs = allIdentical(Itrs);
1653 for (CurrentAndEndIt &Pair : Itrs) {
1667 if (I1->isIdenticalToWhenDefined(I2,
true))
1672 return Cmp1->getPredicate() == Cmp2->getSwappedPredicate() &&
1673 Cmp1->getOperand(0) == Cmp2->getOperand(1) &&
1674 Cmp1->getOperand(1) == Cmp2->getOperand(0);
1676 if (I1->isCommutative() && I1->isSameOperationAs(I2)) {
1677 return I1->getOperand(0) == I2->
getOperand(1) &&
1743 auto &Context = BI->
getParent()->getContext();
1748 Value *Mask =
nullptr;
1749 Value *MaskFalse =
nullptr;
1750 Value *MaskTrue =
nullptr;
1751 if (Invert.has_value()) {
1752 IRBuilder<> Builder(Sel ? Sel : SpeculatedConditionalLoadsStores.
back());
1753 Mask = Builder.CreateBitCast(
1758 MaskFalse = Builder.CreateBitCast(
1760 MaskTrue = Builder.CreateBitCast(
Cond, VCondTy);
1762 auto PeekThroughBitcasts = [](
Value *V) {
1764 V = BitCast->getOperand(0);
1767 for (
auto *
I : SpeculatedConditionalLoadsStores) {
1769 if (!Invert.has_value())
1770 Mask =
I->getParent() == BI->getSuccessor(0) ? MaskTrue : MaskFalse;
1775 auto *Op0 =
I->getOperand(0);
1776 CallInst *MaskedLoadStore =
nullptr;
1779 auto *Ty =
I->getType();
1781 Value *PassThru =
nullptr;
1782 if (Invert.has_value())
1783 for (
User *U :
I->users()) {
1785 PassThru = Builder.CreateBitCast(
1794 Builder.SetInsertPoint(Ins);
1797 MaskedLoadStore = Builder.CreateMaskedLoad(
1799 Value *NewLoadStore = Builder.CreateBitCast(MaskedLoadStore, Ty);
1802 I->replaceAllUsesWith(NewLoadStore);
1805 auto *StoredVal = Builder.CreateBitCast(
1807 MaskedLoadStore = Builder.CreateMaskedStore(
1818 if (
const MDNode *Ranges =
I->getMetadata(LLVMContext::MD_range))
1820 I->dropUBImplyingAttrsAndUnknownMetadata({LLVMContext::MD_annotation});
1824 I->eraseMetadataIf([](
unsigned MDKind,
MDNode *
Node) {
1825 return Node->getMetadataID() == Metadata::DIAssignIDKind;
1828 I->eraseFromParent();
1835 bool IsStore =
false;
1858bool SimplifyCFGOpt::hoistCommonCodeFromSuccessors(Instruction *TI,
1859 bool AllInstsEqOnly) {
1875 for (
auto *Succ : UniqueSuccessors) {
1891 using SuccIterPair = std::pair<BasicBlock::iterator, unsigned>;
1893 for (
auto *Succ : UniqueSuccessors) {
1897 SuccIterPairs.
push_back(SuccIterPair(SuccItr, 0));
1900 if (AllInstsEqOnly) {
1906 unsigned Size0 = UniqueSuccessors[0]->size();
1907 Instruction *Term0 = UniqueSuccessors[0]->getTerminator();
1911 Succ->
size() == Size0;
1915 LockstepReverseIterator<true> LRI(UniqueSuccessors.getArrayRef());
1916 while (LRI.isValid()) {
1918 if (
any_of(*LRI, [I0](Instruction *
I) {
1932 unsigned NumSkipped = 0;
1935 if (SuccIterPairs.
size() > 2) {
1938 if (SuccIterPairs.
size() < 2)
1945 auto *SuccIterPairBegin = SuccIterPairs.
begin();
1946 auto &BB1ItrPair = *SuccIterPairBegin++;
1947 auto OtherSuccIterPairRange =
1953 bool AllInstsAreIdentical =
true;
1954 bool HasTerminator =
I1->isTerminator();
1955 for (
auto &SuccIter : OtherSuccIterRange) {
1959 MMRAMetadata(*I1) != MMRAMetadata(*I2)))
1960 AllInstsAreIdentical =
false;
1963 SmallVector<Instruction *, 8> OtherInsts;
1964 for (
auto &SuccIter : OtherSuccIterRange)
1969 if (HasTerminator) {
1973 if (NumSkipped || !AllInstsAreIdentical) {
1978 return hoistSuccIdenticalTerminatorToSwitchOrIf(
1979 TI, I1, OtherInsts, UniqueSuccessors.getArrayRef()) ||
1983 if (AllInstsAreIdentical) {
1984 unsigned SkipFlagsBB1 = BB1ItrPair.second;
1985 AllInstsAreIdentical =
1987 all_of(OtherSuccIterPairRange, [=](
const auto &Pair) {
1989 unsigned SkipFlagsBB2 = Pair.second;
1999 if (AllInstsAreIdentical) {
2009 for (
auto &SuccIter : OtherSuccIterRange) {
2017 assert(
Success &&
"We should not be trying to hoist callbases "
2018 "with non-intersectable attributes");
2030 NumHoistCommonCode += SuccIterPairs.
size();
2032 NumHoistCommonInstrs += SuccIterPairs.
size();
2041 for (
auto &SuccIterPair : SuccIterPairs) {
2050bool SimplifyCFGOpt::hoistSuccIdenticalTerminatorToSwitchOrIf(
2051 Instruction *TI, Instruction *I1,
2052 SmallVectorImpl<Instruction *> &OtherSuccTIs,
2062 auto *I2 = *OtherSuccTIs.
begin();
2082 for (PHINode &PN : Succ->
phis()) {
2083 Value *BB1V = PN.getIncomingValueForBlock(BB1);
2084 for (Instruction *OtherSuccTI : OtherSuccTIs) {
2085 Value *BB2V = PN.getIncomingValueForBlock(OtherSuccTI->getParent());
2105 if (!
NT->getType()->isVoidTy()) {
2106 I1->replaceAllUsesWith(NT);
2107 for (Instruction *OtherSuccTI : OtherSuccTIs)
2108 OtherSuccTI->replaceAllUsesWith(NT);
2112 NumHoistCommonInstrs += OtherSuccTIs.size() + 1;
2118 for (
auto *OtherSuccTI : OtherSuccTIs)
2119 Locs.
push_back(OtherSuccTI->getDebugLoc());
2131 std::map<std::pair<Value *, Value *>, SelectInst *> InsertedSelects;
2133 for (PHINode &PN : Succ->
phis()) {
2134 Value *BB1V = PN.getIncomingValueForBlock(BB1);
2135 Value *BB2V = PN.getIncomingValueForBlock(BB2);
2141 SelectInst *&
SI = InsertedSelects[std::make_pair(BB1V, BB2V)];
2151 for (
unsigned i = 0, e = PN.getNumIncomingValues(); i != e; ++i)
2152 if (PN.getIncomingBlock(i) == BB1 || PN.getIncomingBlock(i) == BB2)
2153 PN.setIncomingValue(i, SI);
2164 Updates.
push_back({DominatorTree::Insert, TIParent, Succ});
2170 for (BasicBlock *Succ : UniqueSuccessors)
2171 Updates.
push_back({DominatorTree::Delete, TIParent, Succ});
2185 if (
I->isIntDivRem())
2200 std::optional<unsigned> NumUses;
2201 for (
auto *
I : Insts) {
2204 I->getType()->isTokenTy())
2209 if (
I->getParent()->getSingleSuccessor() ==
I->getParent())
2217 if (
C->isInlineAsm() ||
C->cannotMerge() ||
C->isConvergent())
2221 NumUses =
I->getNumUses();
2222 else if (NumUses !=
I->getNumUses())
2228 for (
auto *
I : Insts) {
2242 for (
const Use &U : I0->
uses()) {
2243 auto It = PHIOperands.find(&U);
2244 if (It == PHIOperands.end())
2247 if (!
equal(Insts, It->second))
2261 if (HaveIndirectCalls) {
2262 if (!AllCallsAreIndirect)
2266 Value *Callee =
nullptr;
2270 Callee = CurrCallee;
2271 else if (Callee != CurrCallee)
2277 for (
unsigned OI = 0, OE = I0->
getNumOperands(); OI != OE; ++OI) {
2283 if (!
all_of(Insts, SameAsI0)) {
2289 for (
auto *
I : Insts)
2290 Ops.push_back(
I->getOperand(OI));
2300 auto *BBEnd = Blocks[0]->getTerminator()->getSuccessor(0);
2305 for (
auto *BB : Blocks) {
2307 I =
I->getPrevNode();
2332 assert(!
Op->getType()->isTokenTy() &&
"Can't PHI tokens!");
2335 PN->insertBefore(BBEnd->begin());
2336 for (
auto *
I : Insts)
2337 PN->addIncoming(
I->getOperand(O),
I->getParent());
2346 I0->
moveBefore(*BBEnd, BBEnd->getFirstInsertionPt());
2349 for (
auto *
I : Insts)
2363 assert(
Success &&
"We should not be trying to sink callbases "
2364 "with non-intersectable attributes");
2375 PN->replaceAllUsesWith(I0);
2376 PN->eraseFromParent();
2380 for (
auto *
I : Insts) {
2385 assert(
I->user_empty() &&
"Inst unexpectedly still has non-dbg users");
2386 I->replaceAllUsesWith(I0);
2387 I->eraseFromParent();
2437 bool HaveNonUnconditionalPredecessors =
false;
2440 if (PredBr && PredBr->isUnconditional())
2443 HaveNonUnconditionalPredecessors =
true;
2445 if (UnconditionalPreds.
size() < 2)
2458 for (
const Use &U : PN.incoming_values())
2459 IncomingVals.
insert({PN.getIncomingBlock(U), &U});
2460 auto &
Ops = PHIOperands[IncomingVals[UnconditionalPreds[0]]];
2462 Ops.push_back(*IncomingVals[Pred]);
2470 LLVM_DEBUG(
dbgs() <<
"SINK: instruction can be sunk: " << *(*LRI)[0]
2483 if (!followedByDeoptOrUnreachable) {
2485 auto IsMemOperand = [](
Use &U) {
2498 unsigned NumPHIInsts = 0;
2499 for (
Use &U : (*LRI)[0]->operands()) {
2500 auto It = PHIOperands.
find(&U);
2501 if (It != PHIOperands.
end() && !
all_of(It->second, [&](
Value *V) {
2502 return InstructionsToSink.contains(V);
2509 if (IsMemOperand(U) &&
2510 any_of(It->second, [](
Value *V) { return isa<GEPOperator>(V); }))
2517 LLVM_DEBUG(
dbgs() <<
"SINK: #phi insts: " << NumPHIInsts <<
"\n");
2518 return NumPHIInsts <= 1;
2535 while (Idx < ScanIdx) {
2536 if (!ProfitableToSinkInstruction(LRI)) {
2539 dbgs() <<
"SINK: stopping here, too many PHIs would be created!\n");
2552 if (Idx < ScanIdx) {
2555 InstructionsToSink = InstructionsProfitableToSink;
2561 !ProfitableToSinkInstruction(LRI) &&
2562 "We already know that the last instruction is unprofitable to sink");
2570 for (
auto *
I : *LRI)
2571 InstructionsProfitableToSink.
erase(
I);
2572 if (!ProfitableToSinkInstruction(LRI)) {
2575 InstructionsToSink = InstructionsProfitableToSink;
2589 if (HaveNonUnconditionalPredecessors) {
2590 if (!followedByDeoptOrUnreachable) {
2598 bool Profitable =
false;
2599 while (Idx < ScanIdx) {
2633 for (; SinkIdx != ScanIdx; ++SinkIdx) {
2635 << *UnconditionalPreds[0]->getTerminator()->getPrevNode()
2643 NumSinkCommonInstrs++;
2647 ++NumSinkCommonCode;
2653struct CompatibleSets {
2654 using SetTy = SmallVector<InvokeInst *, 2>;
2660 SetTy &getCompatibleSet(InvokeInst *
II);
2662 void insert(InvokeInst *
II);
2665CompatibleSets::SetTy &CompatibleSets::getCompatibleSet(InvokeInst *
II) {
2670 for (CompatibleSets::SetTy &Set : Sets) {
2671 if (CompatibleSets::shouldBelongToSameSet({
Set.front(),
II}))
2676 return Sets.emplace_back();
2679void CompatibleSets::insert(InvokeInst *
II) {
2680 getCompatibleSet(
II).emplace_back(
II);
2684 assert(Invokes.
size() == 2 &&
"Always called with exactly two candidates.");
2687 auto IsIllegalToMerge = [](InvokeInst *
II) {
2688 return II->cannotMerge() ||
II->isInlineAsm();
2690 if (
any_of(Invokes, IsIllegalToMerge))
2698 if (HaveIndirectCalls) {
2699 if (!AllCallsAreIndirect)
2704 for (InvokeInst *
II : Invokes) {
2705 Value *CurrCallee =
II->getCalledOperand();
2706 assert(CurrCallee &&
"There is always a called operand.");
2709 else if (Callee != CurrCallee)
2716 auto HasNormalDest = [](InvokeInst *
II) {
2719 if (
any_of(Invokes, HasNormalDest)) {
2722 if (!
all_of(Invokes, HasNormalDest))
2727 for (InvokeInst *
II : Invokes) {
2729 assert(CurrNormalBB &&
"There is always a 'continue to' basic block.");
2731 NormalBB = CurrNormalBB;
2732 else if (NormalBB != CurrNormalBB)
2740 NormalBB, {Invokes[0]->getParent(), Invokes[1]->getParent()},
2749 for (InvokeInst *
II : Invokes) {
2751 assert(CurrUnwindBB &&
"There is always an 'unwind to' basic block.");
2753 UnwindBB = CurrUnwindBB;
2755 assert(UnwindBB == CurrUnwindBB &&
"Unexpected unwind destination.");
2762 Invokes.front()->getUnwindDest(),
2763 {Invokes[0]->getParent(), Invokes[1]->getParent()}))
2768 const InvokeInst *II0 = Invokes.front();
2769 for (
auto *
II : Invokes.drop_front())
2774 auto IsIllegalToMergeArguments = [](
auto Ops) {
2775 Use &U0 = std::get<0>(
Ops);
2776 Use &U1 = std::get<1>(
Ops);
2782 assert(Invokes.size() == 2 &&
"Always called with exactly two candidates.");
2783 if (
any_of(
zip(Invokes[0]->data_ops(), Invokes[1]->data_ops()),
2784 IsIllegalToMergeArguments))
2796 assert(Invokes.
size() >= 2 &&
"Must have at least two invokes to merge.");
2802 bool HasNormalDest =
2807 InvokeInst *MergedInvoke = [&Invokes, HasNormalDest]() {
2811 II0->
getParent()->getIterator()->getNextNode();
2816 Ctx, II0BB->
getName() +
".invoke", Func, InsertBeforeBlock);
2820 MergedInvoke->
insertInto(MergedInvokeBB, MergedInvokeBB->
end());
2822 if (!HasNormalDest) {
2826 Ctx, II0BB->
getName() +
".cont", Func, InsertBeforeBlock);
2834 return MergedInvoke;
2848 SuccBBOfMergedInvoke});
2871 return II->getOperand(U.getOperandNo()) != U.get();
2890 Invokes.
front()->getParent());
2898 if (!MergedDebugLoc)
2899 MergedDebugLoc =
II->getDebugLoc();
2907 OrigSuccBB->removePredecessor(
II->getParent());
2913 assert(
Success &&
"Merged invokes with incompatible attributes");
2916 II->replaceAllUsesWith(MergedInvoke);
2917 II->eraseFromParent();
2921 ++NumInvokeSetsFormed;
2957 CompatibleSets Grouper;
2967 if (Invokes.
size() < 2)
2979class EphemeralValueTracker {
2980 SmallPtrSet<const Instruction *, 32> EphValues;
2982 bool isEphemeral(
const Instruction *
I) {
2985 return !
I->mayHaveSideEffects() && !
I->isTerminator() &&
2986 all_of(
I->users(), [&](
const User *U) {
2987 return EphValues.count(cast<Instruction>(U));
2992 bool track(
const Instruction *
I) {
2993 if (isEphemeral(
I)) {
3044 unsigned MaxNumInstToLookAt = 9;
3048 if (!MaxNumInstToLookAt)
3050 --MaxNumInstToLookAt;
3060 if (
SI->getPointerOperand() == StorePtr &&
3061 SI->getValueOperand()->getType() == StoreTy &&
SI->isSimple() &&
3064 return SI->getValueOperand();
3069 if (LI->getPointerOperand() == StorePtr && LI->
getType() == StoreTy &&
3070 LI->isSimple() && LI->getAlign() >= StoreToHoist->
getAlign()) {
3072 bool ExplicitlyDereferenceableOnly;
3077 (!ExplicitlyDereferenceableOnly ||
3079 LI->getDataLayout()))) {
3095 unsigned &SpeculatedInstructions,
3103 bool HaveRewritablePHIs =
false;
3105 Value *OrigV = PN.getIncomingValueForBlock(BB);
3106 Value *ThenV = PN.getIncomingValueForBlock(ThenBB);
3113 Cost +=
TTI.getCmpSelInstrCost(Instruction::Select, PN.getType(),
3122 HaveRewritablePHIs =
true;
3125 if (!OrigCE && !ThenCE)
3132 if (OrigCost + ThenCost > MaxCost)
3139 ++SpeculatedInstructions;
3140 if (SpeculatedInstructions > 1)
3144 return HaveRewritablePHIs;
3148 std::optional<bool> Invert,
3152 if (BI->
getMetadata(LLVMContext::MD_unpredictable))
3159 if (!Invert.has_value())
3162 uint64_t EndWeight = *Invert ? TWeight : FWeight;
3166 return BIEndProb < Likely;
3206bool SimplifyCFGOpt::speculativelyExecuteBB(BranchInst *BI,
3207 BasicBlock *ThenBB) {
3223 bool Invert =
false;
3238 SmallDenseMap<Instruction *, unsigned, 4> SinkCandidateUseCounts;
3240 SmallVector<Instruction *, 4> SpeculatedPseudoProbes;
3242 unsigned SpeculatedInstructions = 0;
3243 bool HoistLoadsStores =
Options.HoistLoadsStoresWithCondFaulting;
3244 SmallVector<Instruction *, 2> SpeculatedConditionalLoadsStores;
3245 Value *SpeculatedStoreValue =
nullptr;
3246 StoreInst *SpeculatedStore =
nullptr;
3247 EphemeralValueTracker EphTracker;
3262 if (EphTracker.track(&
I))
3267 bool IsSafeCheapLoadStore = HoistLoadsStores &&
3269 SpeculatedConditionalLoadsStores.
size() <
3273 if (IsSafeCheapLoadStore)
3274 SpeculatedConditionalLoadsStores.
push_back(&
I);
3276 ++SpeculatedInstructions;
3278 if (SpeculatedInstructions > 1)
3282 if (!IsSafeCheapLoadStore &&
3285 (SpeculatedStoreValue =
3288 if (!IsSafeCheapLoadStore && !SpeculatedStoreValue &&
3294 if (!SpeculatedStore && SpeculatedStoreValue)
3300 for (Use &
Op :
I.operands()) {
3305 ++SinkCandidateUseCounts[OpI];
3312 for (
const auto &[Inst,
Count] : SinkCandidateUseCounts)
3313 if (Inst->hasNUses(
Count)) {
3314 ++SpeculatedInstructions;
3315 if (SpeculatedInstructions > 1)
3322 SpeculatedStore !=
nullptr || !SpeculatedConditionalLoadsStores.
empty();
3325 SpeculatedInstructions,
Cost,
TTI);
3326 if (!Convert ||
Cost > Budget)
3330 LLVM_DEBUG(
dbgs() <<
"SPECULATIVELY EXECUTING BB" << *ThenBB <<
"\n";);
3334 if (SpeculatedStoreValue) {
3338 Value *FalseV = SpeculatedStoreValue;
3342 BrCond, TrueV, FalseV,
"spec.store.select", BI);
3372 for (DbgVariableRecord *DbgAssign :
3375 DbgAssign->replaceVariableLocationOp(OrigV, S);
3385 if (!SpeculatedStoreValue || &
I != SpeculatedStore) {
3388 I.dropUBImplyingAttrsAndMetadata();
3391 if (EphTracker.contains(&
I)) {
3393 I.eraseFromParent();
3399 for (
auto &It : *ThenBB)
3404 !DVR || !DVR->isDbgAssign())
3405 It.dropOneDbgRecord(&DR);
3407 std::prev(ThenBB->end()));
3409 if (!SpeculatedConditionalLoadsStores.
empty())
3415 for (PHINode &PN : EndBB->
phis()) {
3416 unsigned OrigI = PN.getBasicBlockIndex(BB);
3417 unsigned ThenI = PN.getBasicBlockIndex(ThenBB);
3418 Value *OrigV = PN.getIncomingValue(OrigI);
3419 Value *ThenV = PN.getIncomingValue(ThenI);
3428 Value *TrueV = ThenV, *FalseV = OrigV;
3432 PN.setIncomingValue(OrigI, V);
3433 PN.setIncomingValue(ThenI, V);
3437 for (Instruction *
I : SpeculatedPseudoProbes)
3438 I->eraseFromParent();
3451 if (!ReachesNonLocalUses.
insert(BB).second)
3466 EphemeralValueTracker EphTracker;
3473 if (CI->cannotDuplicate() || CI->isConvergent())
3486 for (
User *U :
I.users()) {
3489 if (UsedInBB == BB) {
3493 NonLocalUseBlocks.
insert(UsedInBB);
3507 if (
I &&
I->getParent() == To)
3523static std::optional<bool>
3544 KnownValues[CB].
insert(Pred);
3548 if (KnownValues.
empty())
3573 if (!
findReaching(UseBB, BB, ReachesNonLocalUseBlocks))
3576 for (
const auto &Pair : KnownValues) {
3593 if (ReachesNonLocalUseBlocks.
contains(RealDest))
3598 <<
" has value " << *Pair.first <<
" in predecessors:\n";
3601 dbgs() <<
"Threading to destination " << RealDest->
getName() <<
".\n";
3611 EdgeBB->setName(RealDest->
getName() +
".critedge");
3612 EdgeBB->moveBefore(RealDest);
3622 TranslateMap[
Cond] = CB;
3635 N->insertInto(EdgeBB, InsertPt);
3638 N->setName(BBI->getName() +
".c");
3649 if (!BBI->use_empty())
3650 TranslateMap[&*BBI] = V;
3651 if (!
N->mayHaveSideEffects()) {
3652 N->eraseFromParent();
3657 if (!BBI->use_empty())
3658 TranslateMap[&*BBI] =
N;
3664 for (; SrcDbgCursor != BBI; ++SrcDbgCursor)
3665 N->cloneDebugInfoFrom(&*SrcDbgCursor);
3666 SrcDbgCursor = std::next(BBI);
3668 N->cloneDebugInfoFrom(&*BBI);
3677 for (; &*SrcDbgCursor != BI; ++SrcDbgCursor)
3678 InsertPt->cloneDebugInfoFrom(&*SrcDbgCursor);
3679 InsertPt->cloneDebugInfoFrom(BI);
3700 return std::nullopt;
3706bool SimplifyCFGOpt::foldCondBranchOnValueKnownInPredecessor(BranchInst *BI) {
3713 std::optional<bool>
Result;
3714 bool EverChanged =
false;
3720 }
while (Result == std::nullopt);
3729 bool SpeculateUnpredictables) {
3751 return cast<BranchInst>(IfBlock->getTerminator())->isUnconditional();
3754 "Will have either one or two blocks to speculate.");
3761 bool IsUnpredictable = DomBI->
getMetadata(LLVMContext::MD_unpredictable);
3762 if (!IsUnpredictable) {
3765 (TWeight + FWeight) != 0) {
3770 if (IfBlocks.
size() == 1) {
3772 DomBI->
getSuccessor(0) == BB ? BITrueProb : BIFalseProb;
3773 if (BIBBProb >= Likely)
3776 if (BITrueProb >= Likely || BIFalseProb >= Likely)
3785 if (IfCondPhiInst->getParent() == BB)
3793 unsigned NumPhis = 0;
3806 if (SpeculateUnpredictables && IsUnpredictable)
3807 Budget +=
TTI.getBranchMispredictPenalty();
3820 AggressiveInsts, Cost, Budget,
TTI, AC,
3821 ZeroCostInstructions) ||
3823 AggressiveInsts, Cost, Budget,
TTI, AC,
3824 ZeroCostInstructions))
3836 auto CanHoistNotFromBothValues = [](
Value *V0,
Value *V1) {
3847 auto IsBinOpOrAnd = [](
Value *V) {
3864 if (!AggressiveInsts.
count(&*
I) && !
I->isDebugOrPseudoInst()) {
3877 if (IsUnpredictable)
dbgs() <<
" (unpredictable)";
3879 <<
" F: " << IfFalse->
getName() <<
"\n");
3896 Value *Sel = Builder.CreateSelectFMF(IfCond, TrueVal, FalseVal,
3901 PN->eraseFromParent();
3907 Builder.CreateBr(BB);
3928 return Builder.CreateBinOp(
Opc,
LHS,
RHS, Name);
3929 if (
Opc == Instruction::And)
3930 return Builder.CreateLogicalAnd(
LHS,
RHS, Name);
3931 if (
Opc == Instruction::Or)
3932 return Builder.CreateLogicalOr(
LHS,
RHS, Name);
3944 bool PredHasWeights =
3946 bool SuccHasWeights =
3948 if (PredHasWeights || SuccHasWeights) {
3949 if (!PredHasWeights)
3950 PredTrueWeight = PredFalseWeight = 1;
3951 if (!SuccHasWeights)
3952 SuccTrueWeight = SuccFalseWeight = 1;
3962static std::optional<std::tuple<BasicBlock *, Instruction::BinaryOps, bool>>
3966 "Both blocks must end with a conditional branches.");
3968 "PredBB must be a predecessor of BB.");
3976 (PTWeight + PFWeight) != 0) {
3979 Likely =
TTI->getPredictableBranchThreshold();
3984 if (PBITrueProb.
isUnknown() || PBITrueProb < Likely)
3985 return {{BI->
getSuccessor(0), Instruction::Or,
false}};
3989 return {{BI->
getSuccessor(1), Instruction::And,
false}};
3992 if (PBITrueProb.
isUnknown() || PBITrueProb < Likely)
3993 return {{BI->
getSuccessor(1), Instruction::And,
true}};
3999 return std::nullopt;
4012 bool InvertPredCond;
4013 std::tie(CommonSucc,
Opc, InvertPredCond) =
4016 LLVM_DEBUG(
dbgs() <<
"FOLDING BRANCH TO COMMON DEST:\n" << *PBI << *BB);
4023 {LLVMContext::MD_annotation});
4026 if (InvertPredCond) {
4039 uint64_t PredTrueWeight, PredFalseWeight, SuccTrueWeight, SuccFalseWeight;
4042 SuccTrueWeight, SuccFalseWeight)) {
4048 MDWeights.
push_back(PredTrueWeight * SuccTrueWeight);
4053 MDWeights.
push_back(PredFalseWeight * (SuccFalseWeight + SuccTrueWeight) +
4054 PredTrueWeight * SuccFalseWeight);
4060 MDWeights.
push_back(PredTrueWeight * (SuccFalseWeight + SuccTrueWeight) +
4061 PredFalseWeight * SuccTrueWeight);
4063 MDWeights.
push_back(PredFalseWeight * SuccFalseWeight);
4105 if (!MDWeights.
empty()) {
4106 assert(isSelectInRoleOfConjunctionOrDisjunction(
SI));
4111 ++NumFoldBranchToCommonDest;
4118 return I.getType()->isVectorTy() ||
any_of(
I.operands(), [](
Use &U) {
4119 return U->getType()->isVectorTy();
4129 unsigned BonusInstThreshold) {
4143 Cond->getParent() != BB || !
Cond->hasOneUse())
4164 bool InvertPredCond;
4166 std::tie(CommonSucc,
Opc, InvertPredCond) = *Recipe;
4198 unsigned NumBonusInsts = 0;
4199 bool SawVectorOp =
false;
4200 const unsigned PredCount = Preds.
size();
4217 NumBonusInsts += PredCount;
4225 auto IsBCSSAUse = [BB, &
I](
Use &U) {
4228 return PN->getIncomingBlock(U) == BB;
4229 return UI->
getParent() == BB &&
I.comesBefore(UI);
4233 if (!
all_of(
I.uses(), IsBCSSAUse))
4237 BonusInstThreshold *
4253 for (
auto *BB : {BB1, BB2}) {
4269 Value *AlternativeV =
nullptr) {
4295 BasicBlock *OtherPredBB = *PredI == BB ? *++PredI : *PredI;
4296 if (
PHI->getIncomingValueForBlock(OtherPredBB) == AlternativeV)
4304 if (!AlternativeV &&
4310 PHI->addIncoming(V, BB);
4320 BasicBlock *PostBB,
Value *Address,
bool InvertPCond,
bool InvertQCond,
4329 if (!PStore || !QStore)
4350 if (
I.mayReadOrWriteMemory())
4352 for (
auto &
I : *QFB)
4353 if (&
I != QStore &&
I.mayReadOrWriteMemory())
4356 for (
auto &
I : *QTB)
4357 if (&
I != QStore &&
I.mayReadOrWriteMemory())
4361 if (&*
I != PStore &&
I->mayReadOrWriteMemory())
4377 if (
I.isTerminator())
4395 "When we run out of budget we will eagerly return from within the "
4396 "per-instruction loop.");
4400 const std::array<StoreInst *, 2> FreeStores = {PStore, QStore};
4402 (!IsWorthwhile(PTB, FreeStores) || !IsWorthwhile(PFB, FreeStores) ||
4403 !IsWorthwhile(QTB, FreeStores) || !IsWorthwhile(QFB, FreeStores)))
4439 InvertPCond ^= (PStore->
getParent() != PTB);
4440 InvertQCond ^= (QStore->
getParent() != QTB);
4461 {CombinedWeights[0], CombinedWeights[1]},
4525 bool InvertPCond =
false, InvertQCond =
false;
4531 if (QFB == PostBB) {
4550 !HasOnePredAndOneSucc(QFB, QBI->
getParent(), PostBB))
4553 (QTB && !HasOnePredAndOneSucc(QTB, QBI->
getParent(), PostBB)))
4561 for (
auto *BB : {PTB, PFB}) {
4566 PStoreAddresses.
insert(
SI->getPointerOperand());
4568 for (
auto *BB : {QTB, QFB}) {
4573 QStoreAddresses.
insert(
SI->getPointerOperand());
4579 auto &CommonAddresses = PStoreAddresses;
4582 for (
auto *Address : CommonAddresses)
4585 InvertPCond, InvertQCond, DTU,
DL,
TTI);
4603 !BI->
getParent()->getSinglePredecessor())
4605 if (!IfFalseBB->
phis().empty())
4615 return I.mayWriteToMemory() ||
I.mayHaveSideEffects();
4718 if (!PBI->
getMetadata(LLVMContext::MD_unpredictable) &&
4720 (
static_cast<uint64_t>(PredWeights[0]) + PredWeights[1]) != 0) {
4724 static_cast<uint64_t>(PredWeights[0]) + PredWeights[1]);
4727 if (CommonDestProb >= Likely)
4737 unsigned NumPhis = 0;
4759 if (OtherDest == BB) {
4767 OtherDest = InfLoopBlock;
4779 PBICond = Builder.CreateNot(PBICond, PBICond->
getName() +
".not");
4783 BICond = Builder.CreateNot(BICond, BICond->
getName() +
".not");
4787 createLogicalOp(Builder, Instruction::Or, PBICond, BICond,
"brmerge");
4802 uint64_t PredTrueWeight, PredFalseWeight, SuccTrueWeight, SuccFalseWeight;
4803 uint64_t PredCommon, PredOther, SuccCommon, SuccOther;
4806 SuccTrueWeight, SuccFalseWeight);
4808 PredCommon = PBIOp ? PredFalseWeight : PredTrueWeight;
4809 PredOther = PBIOp ? PredTrueWeight : PredFalseWeight;
4810 SuccCommon = BIOp ? SuccFalseWeight : SuccTrueWeight;
4811 SuccOther = BIOp ? SuccTrueWeight : SuccFalseWeight;
4815 uint64_t NewWeights[2] = {PredCommon * (SuccCommon + SuccOther) +
4816 PredOther * SuccCommon,
4817 PredOther * SuccOther};
4825 assert(isSelectInRoleOfConjunctionOrDisjunction(
SI));
4844 Value *BIV = PN.getIncomingValueForBlock(BB);
4845 unsigned PBBIdx = PN.getBasicBlockIndex(PBI->
getParent());
4846 Value *PBIV = PN.getIncomingValue(PBBIdx);
4850 Builder.CreateSelect(PBICond, PBIV, BIV, PBIV->
getName() +
".mux"));
4851 PN.setIncomingValue(PBBIdx, NV);
4855 uint64_t TrueWeight = PBIOp ? PredFalseWeight : PredTrueWeight;
4856 uint64_t FalseWeight = PBIOp ? PredTrueWeight : PredFalseWeight;
4876bool SimplifyCFGOpt::simplifyTerminatorOnSelect(Instruction *OldTerm,
4878 BasicBlock *FalseBB,
4879 uint32_t TrueWeight,
4880 uint32_t FalseWeight) {
4887 BasicBlock *KeepEdge2 = TrueBB != FalseBB ? FalseBB :
nullptr;
4889 SmallSetVector<BasicBlock *, 2> RemovedSuccessors;
4892 for (BasicBlock *Succ :
successors(OldTerm)) {
4894 if (Succ == KeepEdge1)
4895 KeepEdge1 =
nullptr;
4896 else if (Succ == KeepEdge2)
4897 KeepEdge2 =
nullptr;
4902 if (Succ != TrueBB && Succ != FalseBB)
4903 RemovedSuccessors.
insert(Succ);
4911 if (!KeepEdge1 && !KeepEdge2) {
4912 if (TrueBB == FalseBB) {
4923 }
else if (KeepEdge1 && (KeepEdge2 || TrueBB == FalseBB)) {
4943 SmallVector<DominatorTree::UpdateType, 2> Updates;
4945 for (
auto *RemovedSuccessor : RemovedSuccessors)
4946 Updates.
push_back({DominatorTree::Delete, BB, RemovedSuccessor});
4957bool SimplifyCFGOpt::simplifySwitchOnSelect(SwitchInst *SI,
4962 if (!TrueVal || !FalseVal)
4967 BasicBlock *TrueBB =
SI->findCaseValue(TrueVal)->getCaseSuccessor();
4968 BasicBlock *FalseBB =
SI->findCaseValue(FalseVal)->getCaseSuccessor();
4971 uint32_t TrueWeight = 0, FalseWeight = 0;
4972 SmallVector<uint64_t, 8> Weights;
4976 if (Weights.
size() == 1 +
SI->getNumCases()) {
4978 (uint32_t)Weights[
SI->findCaseValue(TrueVal)->getSuccessorIndex()];
4980 (uint32_t)Weights[
SI->findCaseValue(FalseVal)->getSuccessorIndex()];
4985 return simplifyTerminatorOnSelect(SI, Condition, TrueBB, FalseBB, TrueWeight,
4994bool SimplifyCFGOpt::simplifyIndirectBrOnSelect(IndirectBrInst *IBI,
5008 SmallVector<uint32_t> SelectBranchWeights(2);
5012 return simplifyTerminatorOnSelect(IBI,
SI->getCondition(), TrueBB, FalseBB,
5013 SelectBranchWeights[0],
5014 SelectBranchWeights[1]);
5034bool SimplifyCFGOpt::tryToSimplifyUncondBranchWithICmpInIt(
5038 return tryToSimplifyUncondBranchWithICmpSelectInIt(ICI,
nullptr, Builder);
5084bool SimplifyCFGOpt::tryToSimplifyUncondBranchWithICmpSelectInIt(
5103 ConstantInt *NewCaseVal;
5111 Value *SelectCond, *SelectTrueVal, *SelectFalseVal;
5117 SelectTrueVal = Builder.
getTrue();
5118 SelectFalseVal = Builder.
getFalse();
5121 SelectCond =
Select->getCondition();
5123 if (SelectCond != ICI)
5125 SelectTrueVal =
Select->getTrueValue();
5126 SelectFalseVal =
Select->getFalseValue();
5131 if (
SI->getCondition() != IcmpCond)
5137 if (
SI->getDefaultDest() != BB) {
5138 ConstantInt *VVal =
SI->findCaseDest(BB);
5139 assert(VVal &&
"Should have a unique destination value");
5147 return requestResimplify();
5153 if (
SI->findCaseValue(NewCaseVal) !=
SI->case_default()) {
5155 if (Predicate == ICmpInst::ICMP_EQ)
5163 return requestResimplify();
5170 if (PHIUse ==
nullptr || PHIUse != &SuccBlock->
front() ||
5176 Value *DefaultCst = SelectFalseVal;
5177 Value *NewCst = SelectTrueVal;
5185 Select->replaceAllUsesWith(DefaultCst);
5186 Select->eraseFromParent();
5192 SmallVector<DominatorTree::UpdateType, 2> Updates;
5199 SwitchInstProfUpdateWrapper SIW(*SI);
5200 auto W0 = SIW.getSuccessorWeight(0);
5203 NewW = ((uint64_t(*W0) + 1) >> 1);
5204 SIW.setSuccessorWeight(0, *NewW);
5206 SIW.addCase(NewCaseVal, NewBB, NewW);
5208 Updates.
push_back({DominatorTree::Insert, Pred, NewBB});
5217 Updates.
push_back({DominatorTree::Insert, NewBB, SuccBlock});
5226bool SimplifyCFGOpt::simplifyBranchOnICmpChain(BranchInst *BI,
5228 const DataLayout &
DL) {
5238 ConstantComparesGatherer ConstantCompare(
Cond,
DL);
5240 SmallVectorImpl<ConstantInt *> &Values = ConstantCompare.Vals;
5241 Value *CompVal = ConstantCompare.CompValue;
5242 unsigned UsedICmps = ConstantCompare.UsedICmps;
5243 Value *ExtraCase = ConstantCompare.Extra;
5244 bool TrueWhenEqual = ConstantCompare.IsEq;
5261 if (ExtraCase && Values.
size() < 2)
5264 SmallVector<uint32_t> BranchWeights;
5271 if (!TrueWhenEqual) {
5274 std::swap(BranchWeights[0], BranchWeights[1]);
5280 <<
" cases into SWITCH. BB is:\n"
5283 SmallVector<DominatorTree::UpdateType, 2> Updates;
5290 nullptr,
"switch.early.test");
5301 AssumptionCache *AC =
Options.AC;
5307 auto *Br = TrueWhenEqual ? Builder.
CreateCondBr(ExtraCase, EdgeBB, NewBB)
5314 Updates.
push_back({DominatorTree::Insert, BB, EdgeBB});
5320 LLVM_DEBUG(
dbgs() <<
" ** 'icmp' chain unhandled condition: " << *ExtraCase
5321 <<
"\nEXTRABB = " << *BB);
5329 "Should not end up here with unstable pointers");
5331 CompVal,
DL.getIntPtrType(CompVal->
getType()),
"magicptr");
5336 if (Values.
front()->getValue() - Values.
back()->getValue() ==
5337 Values.
size() - 1) {
5339 Values.
back()->getValue(), Values.
front()->getValue() + 1);
5341 ICmpInst::Predicate Pred;
5359 SmallVector<uint32_t> NewWeights(Values.
size() + 1);
5360 NewWeights[0] = BranchWeights[1];
5363 V = BranchWeights[0] / Values.
size();
5368 for (ConstantInt *Val : Values)
5369 New->addCase(Val, EdgeBB);
5377 for (
unsigned i = 0, e = Values.size() - 1; i != e; ++i)
5387 LLVM_DEBUG(
dbgs() <<
" ** 'icmp' chain result is:\n" << *BB <<
'\n');
5391bool SimplifyCFGOpt::simplifyResume(ResumeInst *RI,
IRBuilder<> &Builder) {
5393 return simplifyCommonResume(RI);
5397 return simplifySingleResume(RI);
5410 switch (IntrinsicID) {
5411 case Intrinsic::dbg_declare:
5412 case Intrinsic::dbg_value:
5413 case Intrinsic::dbg_label:
5414 case Intrinsic::lifetime_end:
5424bool SimplifyCFGOpt::simplifyCommonResume(ResumeInst *RI) {
5433 SmallSetVector<BasicBlock *, 4> TrivialUnwindBlocks;
5437 for (
unsigned Idx = 0, End = PhiLPInst->getNumIncomingValues(); Idx != End;
5439 auto *IncomingBB = PhiLPInst->getIncomingBlock(Idx);
5440 auto *IncomingValue = PhiLPInst->getIncomingValue(Idx);
5444 if (IncomingBB->getUniqueSuccessor() != BB)
5449 if (IncomingValue != LandingPad)
5453 make_range(LandingPad->getNextNode(), IncomingBB->getTerminator())))
5454 TrivialUnwindBlocks.
insert(IncomingBB);
5458 if (TrivialUnwindBlocks.
empty())
5462 for (
auto *TrivialBB : TrivialUnwindBlocks) {
5466 while (PhiLPInst->getBasicBlockIndex(TrivialBB) != -1)
5469 for (BasicBlock *Pred :
5480 TrivialBB->getTerminator()->eraseFromParent();
5481 new UnreachableInst(RI->
getContext(), TrivialBB);
5483 DTU->
applyUpdates({{DominatorTree::Delete, TrivialBB, BB}});
5490 return !TrivialUnwindBlocks.empty();
5494bool SimplifyCFGOpt::simplifySingleResume(ResumeInst *RI) {
5498 "Resume must unwind the exception that caused control to here");
5554 int Idx = DestPN.getBasicBlockIndex(BB);
5568 Value *SrcVal = DestPN.getIncomingValue(Idx);
5571 bool NeedPHITranslation = SrcPN && SrcPN->
getParent() == BB;
5575 DestPN.addIncoming(
Incoming, Pred);
5602 std::vector<DominatorTree::UpdateType> Updates;
5606 if (UnwindDest ==
nullptr) {
5647 if (!SuccessorCleanupPad)
5656 SuccessorCleanupPad->eraseFromParent();
5665bool SimplifyCFGOpt::simplifyCleanupReturn(CleanupReturnInst *RI) {
5682bool SimplifyCFGOpt::simplifyUnreachable(UnreachableInst *UI) {
5714 BBI->dropDbgRecords();
5718 BBI->eraseFromParent();
5724 if (&BB->
front() != UI)
5727 std::vector<DominatorTree::UpdateType> Updates;
5730 for (BasicBlock *Predecessor : Preds) {
5737 [BB](
auto *
Successor) { return Successor == BB; })) {
5745 "The destinations are guaranteed to be different here.");
5746 CallInst *Assumption;
5762 Updates.push_back({DominatorTree::Delete, Predecessor, BB});
5764 SwitchInstProfUpdateWrapper SU(*SI);
5765 for (
auto i = SU->case_begin(), e = SU->case_end(); i != e;) {
5766 if (i->getCaseSuccessor() != BB) {
5771 i = SU.removeCase(i);
5776 if (DTU &&
SI->getDefaultDest() != BB)
5777 Updates.push_back({DominatorTree::Delete, Predecessor, BB});
5779 if (
II->getUnwindDest() == BB) {
5785 if (!CI->doesNotThrow())
5786 CI->setDoesNotThrow();
5790 if (CSI->getUnwindDest() == BB) {
5801 E = CSI->handler_end();
5804 CSI->removeHandler(
I);
5811 Updates.push_back({DominatorTree::Delete, Predecessor, BB});
5812 if (CSI->getNumHandlers() == 0) {
5813 if (CSI->hasUnwindDest()) {
5817 for (
auto *PredecessorOfPredecessor :
predecessors(Predecessor)) {
5818 Updates.push_back({DominatorTree::Insert,
5819 PredecessorOfPredecessor,
5820 CSI->getUnwindDest()});
5821 Updates.push_back({DominatorTree::Delete,
5822 PredecessorOfPredecessor, Predecessor});
5825 Predecessor->replaceAllUsesWith(CSI->getUnwindDest());
5832 SmallVector<BasicBlock *, 8> EHPreds(
predecessors(Predecessor));
5833 for (BasicBlock *EHPred : EHPreds)
5837 new UnreachableInst(CSI->getContext(), CSI->getIterator());
5838 CSI->eraseFromParent();
5843 assert(CRI->hasUnwindDest() && CRI->getUnwindDest() == BB &&
5844 "Expected to always have an unwind to BB.");
5846 Updates.push_back({DominatorTree::Delete, Predecessor, BB});
5874static std::optional<ContiguousCasesResult>
5881 const APInt &Min = Cases.
back()->getValue();
5882 const APInt &Max = Cases.
front()->getValue();
5884 size_t ContiguousOffset = Cases.
size() - 1;
5885 if (
Offset == ContiguousOffset) {
5903 std::adjacent_find(Cases.
begin(), Cases.
end(), [](
auto L,
auto R) {
5904 return L->getValue() != R->getValue() + 1;
5906 if (It == Cases.
end())
5907 return std::nullopt;
5908 auto [OtherMax, OtherMin] = std::make_pair(*It, *std::next(It));
5909 if ((Max - OtherMax->getValue()) + (OtherMin->getValue() - Min) ==
5913 ConstantInt::get(OtherMin->getType(), OtherMin->getValue() + 1)),
5916 ConstantInt::get(OtherMax->getType(), OtherMax->getValue() - 1)),
5924 return std::nullopt;
5929 bool RemoveOrigDefaultBlock =
true) {
5931 auto *BB = Switch->getParent();
5932 auto *OrigDefaultBlock = Switch->getDefaultDest();
5933 if (RemoveOrigDefaultBlock)
5934 OrigDefaultBlock->removePredecessor(BB);
5938 auto *UI =
new UnreachableInst(Switch->getContext(), NewDefaultBlock);
5940 Switch->setDefaultDest(&*NewDefaultBlock);
5944 if (RemoveOrigDefaultBlock &&
5954bool SimplifyCFGOpt::turnSwitchRangeIntoICmp(SwitchInst *SI,
5956 assert(
SI->getNumCases() > 1 &&
"Degenerate switch?");
5958 bool HasDefault = !
SI->defaultDestUnreachable();
5960 auto *BB =
SI->getParent();
5962 BasicBlock *DestA = HasDefault ?
SI->getDefaultDest() :
nullptr;
5967 for (
auto Case :
SI->cases()) {
5971 if (Dest == DestA) {
5977 if (Dest == DestB) {
5987 "Single-destination switch should have been folded.");
5989 assert(DestB !=
SI->getDefaultDest());
5990 assert(!CasesB.
empty() &&
"There must be non-default cases.");
5994 std::optional<ContiguousCasesResult> ContiguousCases;
5997 if (!HasDefault && CasesA.
size() == 1)
5998 ContiguousCases = ContiguousCasesResult{
6006 else if (CasesB.
size() == 1)
6007 ContiguousCases = ContiguousCasesResult{
6016 else if (!HasDefault)
6020 if (!ContiguousCases)
6024 if (!ContiguousCases)
6027 auto [Min,
Max, Dest, OtherDest, Cases, OtherCases] = *ContiguousCases;
6033 Max->getValue() - Min->getValue() + 1);
6036 assert(
Max->getValue() == Min->getValue());
6041 else if (NumCases->
isNullValue() && !Cases->empty()) {
6045 if (!
Offset->isNullValue())
6053 SmallVector<uint64_t, 8> Weights;
6055 if (Weights.
size() == 1 +
SI->getNumCases()) {
6056 uint64_t TrueWeight = 0;
6057 uint64_t FalseWeight = 0;
6058 for (
size_t I = 0,
E = Weights.
size();
I !=
E; ++
I) {
6059 if (
SI->getSuccessor(
I) == Dest)
6060 TrueWeight += Weights[
I];
6062 FalseWeight += Weights[
I];
6064 while (TrueWeight > UINT32_MAX || FalseWeight > UINT32_MAX) {
6075 unsigned PreviousEdges = Cases->size();
6076 if (Dest ==
SI->getDefaultDest())
6078 for (
unsigned I = 0,
E = PreviousEdges - 1;
I !=
E; ++
I)
6079 PHI.removeIncomingValue(
SI->getParent());
6082 unsigned PreviousEdges = OtherCases->size();
6083 if (OtherDest ==
SI->getDefaultDest())
6085 unsigned E = PreviousEdges - 1;
6089 for (
unsigned I = 0;
I !=
E; ++
I)
6090 PHI.removeIncomingValue(
SI->getParent());
6098 auto *UnreachableDefault =
SI->getDefaultDest();
6101 SI->eraseFromParent();
6103 if (!HasDefault && DTU)
6104 DTU->
applyUpdates({{DominatorTree::Delete, BB, UnreachableDefault}});
6122 unsigned MaxSignificantBitsInCond =
6129 for (
const auto &Case :
SI->cases()) {
6130 auto *
Successor = Case.getCaseSuccessor();
6141 (IsKnownValuesValid && !KnownValues.
contains(CaseC))) {
6147 }
else if (IsKnownValuesValid)
6148 KnownValues.
erase(CaseC);
6155 bool HasDefault = !
SI->defaultDestUnreachable();
6156 const unsigned NumUnknownBits =
6159 if (HasDefault && DeadCases.
empty()) {
6165 if (NumUnknownBits < 64 ) {
6166 uint64_t AllNumCases = 1ULL << NumUnknownBits;
6167 if (
SI->getNumCases() == AllNumCases) {
6174 if (
SI->getNumCases() == AllNumCases - 1) {
6175 assert(NumUnknownBits > 1 &&
"Should be canonicalized to a branch");
6177 if (CondTy->getIntegerBitWidth() > 64 ||
6178 !
DL.fitsInLegalInteger(CondTy->getIntegerBitWidth()))
6182 for (
const auto &Case :
SI->cases())
6183 MissingCaseVal ^= Case.getCaseValue()->getValue().getLimitedValue();
6185 ConstantInt::get(
Cond->getType(), MissingCaseVal));
6187 SIW.
addCase(MissingCase,
SI->getDefaultDest(),
6197 if (DeadCases.
empty())
6203 assert(CaseI !=
SI->case_default() &&
6204 "Case was not found. Probably mistake in DeadCases forming.");
6206 CaseI->getCaseSuccessor()->removePredecessor(
SI->getParent());
6211 std::vector<DominatorTree::UpdateType> Updates;
6212 for (
auto *
Successor : UniqueSuccessors)
6213 if (NumPerSuccessorCases[
Successor] == 0)
6234 if (!Branch || !Branch->isUnconditional())
6240 int Idx =
PHI.getBasicBlockIndex(BB);
6241 assert(Idx >= 0 &&
"PHI has no entry for predecessor?");
6243 Value *InValue =
PHI.getIncomingValue(Idx);
6244 if (InValue != CaseValue)
6260 ForwardingNodesMap ForwardingNodes;
6263 for (
const auto &Case :
SI->cases()) {
6265 BasicBlock *CaseDest = Case.getCaseSuccessor();
6284 int SwitchBBIdx = Phi.getBasicBlockIndex(SwitchBlock);
6285 if (Phi.getIncomingValue(SwitchBBIdx) == CaseValue &&
6286 count(Phi.blocks(), SwitchBlock) == 1) {
6287 Phi.setIncomingValue(SwitchBBIdx,
SI->getCondition());
6295 ForwardingNodes[Phi].push_back(PhiIdx);
6298 for (
auto &ForwardingNode : ForwardingNodes) {
6299 PHINode *Phi = ForwardingNode.first;
6305 for (
int Index : Indexes)
6306 Phi->setIncomingValue(Index,
SI->getCondition());
6316 if (
C->isThreadDependent())
6318 if (
C->isDLLImportDependent())
6326 if (
C->getType()->isScalableTy())
6337 if (!
TTI.shouldBuildLookupTablesForConstant(
C))
6364 if (
A->isAllOnesValue())
6366 if (
A->isNullValue())
6372 for (
unsigned N = 0,
E =
I->getNumOperands();
N !=
E; ++
N) {
6397 ConstantPool.insert(std::make_pair(
SI->getCondition(), CaseVal));
6399 if (
I.isTerminator()) {
6401 if (
I.getNumSuccessors() != 1 ||
I.isSpecialTerminator())
6404 CaseDest =
I.getSuccessor(0);
6411 for (
auto &
Use :
I.uses()) {
6414 if (
I->getParent() == CaseDest)
6417 if (Phi->getIncomingBlock(
Use) == CaseDest)
6430 *CommonDest = CaseDest;
6432 if (CaseDest != *CommonDest)
6437 int Idx =
PHI.getBasicBlockIndex(Pred);
6450 Res.push_back(std::make_pair(&
PHI, ConstVal));
6453 return Res.
size() > 0;
6459 SwitchCaseResultVectorTy &UniqueResults,
6461 for (
auto &
I : UniqueResults) {
6462 if (
I.first == Result) {
6463 I.second.push_back(CaseVal);
6464 return I.second.size();
6467 UniqueResults.push_back(
6478 SwitchCaseResultVectorTy &UniqueResults,
6482 uintptr_t MaxUniqueResults) {
6483 for (
const auto &
I :
SI->cases()) {
6497 const size_t NumCasesForResult =
6505 if (UniqueResults.size() > MaxUniqueResults)
6521 DefaultResults.
size() == 1 ? DefaultResults.
begin()->second :
nullptr;
6523 return DefaultResult ||
SI->defaultDestUnreachable();
6544 const bool HasBranchWeights =
6547 if (ResultVector.size() == 2 && ResultVector[0].second.size() == 1 &&
6548 ResultVector[1].second.size() == 1) {
6549 ConstantInt *FirstCase = ResultVector[0].second[0];
6550 ConstantInt *SecondCase = ResultVector[1].second[0];
6551 Value *SelectValue = ResultVector[1].first;
6552 if (DefaultResult) {
6553 Value *ValueCompare =
6554 Builder.CreateICmpEQ(Condition, SecondCase,
"switch.selectcmp");
6555 SelectValue = Builder.CreateSelect(ValueCompare, ResultVector[1].first,
6556 DefaultResult,
"switch.select");
6558 SI && HasBranchWeights) {
6565 *
SI, {BranchWeights[2], BranchWeights[0] + BranchWeights[1]},
6569 Value *ValueCompare =
6570 Builder.CreateICmpEQ(Condition, FirstCase,
"switch.selectcmp");
6571 Value *Ret = Builder.CreateSelect(ValueCompare, ResultVector[0].first,
6572 SelectValue,
"switch.select");
6578 size_t FirstCasePos = (Condition !=
nullptr);
6579 size_t SecondCasePos = FirstCasePos + 1;
6580 uint32_t DefaultCase = (Condition !=
nullptr) ? BranchWeights[0] : 0;
6582 {BranchWeights[FirstCasePos],
6583 DefaultCase + BranchWeights[SecondCasePos]},
6590 if (ResultVector.size() == 1 && DefaultResult) {
6592 unsigned CaseCount = CaseValues.
size();
6605 for (
auto *Case : CaseValues) {
6606 if (Case->getValue().slt(MinCaseVal->
getValue()))
6608 AndMask &= Case->getValue();
6618 if (FreeBits ==
Log2_32(CaseCount)) {
6619 Value *
And = Builder.CreateAnd(Condition, AndMask);
6620 Value *Cmp = Builder.CreateICmpEQ(
6623 Builder.CreateSelect(Cmp, ResultVector[0].first, DefaultResult);
6639 for (
auto *Case : CaseValues)
6640 BitMask |= (Case->getValue() - MinCaseVal->
getValue());
6646 Condition = Builder.CreateSub(Condition, MinCaseVal);
6647 Value *
And = Builder.CreateAnd(Condition, ~BitMask,
"switch.and");
6648 Value *Cmp = Builder.CreateICmpEQ(
6651 Builder.CreateSelect(Cmp, ResultVector[0].first, DefaultResult);
6664 if (CaseValues.
size() == 2) {
6665 Value *Cmp1 = Builder.CreateICmpEQ(Condition, CaseValues[0],
6666 "switch.selectcmp.case1");
6667 Value *Cmp2 = Builder.CreateICmpEQ(Condition, CaseValues[1],
6668 "switch.selectcmp.case2");
6669 Value *Cmp = Builder.CreateOr(Cmp1, Cmp2,
"switch.selectcmp");
6671 Builder.CreateSelect(Cmp, ResultVector[0].first, DefaultResult);
6691 std::vector<DominatorTree::UpdateType> Updates;
6698 Builder.CreateBr(DestBB);
6702 PHI->removeIncomingValueIf(
6703 [&](
unsigned Idx) {
return PHI->getIncomingBlock(Idx) == SelectBB; });
6704 PHI->addIncoming(SelectValue, SelectBB);
6707 for (
unsigned i = 0, e =
SI->getNumSuccessors(); i < e; ++i) {
6713 if (DTU && RemovedSuccessors.
insert(Succ).second)
6716 SI->eraseFromParent();
6731 SwitchCaseResultVectorTy UniqueResults;
6737 assert(
PHI !=
nullptr &&
"PHI for value select not found");
6738 Builder.SetInsertPoint(
SI);
6741 [[maybe_unused]]
auto HasWeights =
6746 (BranchWeights.
size() >=
6747 UniqueResults.size() + (DefaultResult !=
nullptr)));
6750 Builder,
DL, BranchWeights);
6762class SwitchReplacement {
6769 const SmallVectorImpl<std::pair<ConstantInt *, Constant *>> &Values,
6770 Constant *DefaultValue,
const DataLayout &
DL,
const StringRef &FuncName);
6779 static bool wouldFitInRegister(
const DataLayout &
DL, uint64_t TableSize,
6786 bool isLookupTable();
6823 ConstantInt *BitMap =
nullptr;
6824 IntegerType *BitMapElementTy =
nullptr;
6827 ConstantInt *LinearOffset =
nullptr;
6828 ConstantInt *LinearMultiplier =
nullptr;
6829 bool LinearMapValWrapped =
false;
6837SwitchReplacement::SwitchReplacement(
6839 const SmallVectorImpl<std::pair<ConstantInt *, Constant *>> &Values,
6840 Constant *DefaultValue,
const DataLayout &
DL,
const StringRef &FuncName)
6841 : DefaultValue(DefaultValue) {
6842 assert(Values.size() &&
"Can't build lookup table without values!");
6843 assert(TableSize >= Values.size() &&
"Can't fit values in table!");
6846 SingleValue = Values.begin()->second;
6848 ValueType = Values.begin()->second->getType();
6852 for (
const auto &[CaseVal, CaseRes] : Values) {
6855 uint64_t Idx = (CaseVal->getValue() -
Offset->getValue()).getLimitedValue();
6856 TableContents[Idx] = CaseRes;
6863 if (Values.size() < TableSize) {
6865 "Need a default value to fill the lookup table holes.");
6868 if (!TableContents[
I])
6869 TableContents[
I] = DefaultValue;
6875 if (DefaultValue != SingleValue && !DefaultValueIsPoison)
6876 SingleValue =
nullptr;
6882 Kind = SingleValueKind;
6889 bool LinearMappingPossible =
true;
6894 bool NonMonotonic =
false;
6895 assert(TableSize >= 2 &&
"Should be a SingleValue table.");
6912 LinearMappingPossible =
false;
6917 APInt Dist = Val - PrevVal;
6920 }
else if (Dist != DistToPrev) {
6921 LinearMappingPossible =
false;
6929 if (LinearMappingPossible) {
6931 LinearMultiplier = ConstantInt::get(M.getContext(), DistToPrev);
6932 APInt M = LinearMultiplier->getValue();
6933 bool MayWrap =
true;
6934 if (
isIntN(M.getBitWidth(), TableSize - 1))
6935 (void)M.
smul_ov(
APInt(M.getBitWidth(), TableSize - 1), MayWrap);
6936 LinearMapValWrapped = NonMonotonic || MayWrap;
6937 Kind = LinearMapKind;
6943 if (wouldFitInRegister(
DL, TableSize,
ValueType)) {
6945 APInt TableInt(TableSize *
IT->getBitWidth(), 0);
6947 TableInt <<=
IT->getBitWidth();
6951 TableInt |= Val->
getValue().
zext(TableInt.getBitWidth());
6954 BitMap = ConstantInt::get(M.getContext(), TableInt);
6955 BitMapElementTy =
IT;
6964 Kind = LookupTableKind;
6970 case SingleValueKind:
6972 case LinearMapKind: {
6976 false,
"switch.idx.cast");
6977 if (!LinearMultiplier->
isOne())
6978 Result = Builder.
CreateMul(Result, LinearMultiplier,
"switch.idx.mult",
6980 !LinearMapValWrapped);
6982 if (!LinearOffset->
isZero())
6985 !LinearMapValWrapped);
7002 ShiftAmt, ConstantInt::get(MapTy, BitMapElementTy->
getBitWidth()),
7003 "switch.shiftamt",
true,
true);
7006 Value *DownShifted =
7007 Builder.
CreateLShr(BitMap, ShiftAmt,
"switch.downshift");
7009 return Builder.
CreateTrunc(DownShifted, BitMapElementTy,
"switch.masked");
7011 case LookupTableKind: {
7014 new GlobalVariable(*
Func->getParent(), Initializer->
getType(),
7015 true, GlobalVariable::PrivateLinkage,
7016 Initializer,
"switch.table." +
Func->getName());
7017 Table->setUnnamedAddr(GlobalValue::UnnamedAddr::Global);
7020 Table->setAlignment(
DL.getPrefTypeAlign(
ValueType));
7021 Type *IndexTy =
DL.getIndexType(Table->getType());
7024 if (
Index->getType() != IndexTy) {
7025 unsigned OldBitWidth =
Index->getType()->getIntegerBitWidth();
7029 isUIntN(OldBitWidth - 1, ArrayTy->getNumElements() - 1));
7032 Value *GEPIndices[] = {ConstantInt::get(IndexTy, 0),
Index};
7035 return Builder.
CreateLoad(ArrayTy->getElementType(),
GEP,
"switch.load");
7041bool SwitchReplacement::wouldFitInRegister(
const DataLayout &
DL,
7043 Type *ElementType) {
7051 if (TableSize >= UINT_MAX /
IT->getBitWidth())
7053 return DL.fitsInLegalInteger(TableSize *
IT->getBitWidth());
7059 if (
TTI.isTypeLegal(Ty))
7074 DL.fitsInLegalInteger(
IT->getBitWidth());
7077Constant *SwitchReplacement::getDefaultValue() {
return DefaultValue; }
7079bool SwitchReplacement::isLookupTable() {
return Kind == LookupTableKind; }
7081bool SwitchReplacement::isBitMap() {
return Kind == BitMapKind; }
7092 return NumCases * 100 >= CaseRange * MinDensity;
7113 if (
SI->getNumCases() > TableSize)
7116 bool AllTablesFitInRegister =
true;
7117 bool HasIllegalType =
false;
7118 for (
const auto &Ty : ResultTypes) {
7123 AllTablesFitInRegister =
7124 AllTablesFitInRegister &&
7125 SwitchReplacement::wouldFitInRegister(
DL, TableSize, Ty);
7130 if (HasIllegalType && !AllTablesFitInRegister)
7135 if (AllTablesFitInRegister)
7152 MaxCaseVal.
getLimitedValue() == std::numeric_limits<uint64_t>::max() ||
7155 return all_of(ResultTypes, [&](
const auto &ResultType) {
7156 return SwitchReplacement::wouldFitInRegister(
7184 const SmallVectorImpl<std::pair<ConstantInt *, Constant *>> &Values) {
7206 if (DefaultConst != TrueConst && DefaultConst != FalseConst)
7211 for (
auto ValuePair : Values) {
7214 if (!CaseConst || CaseConst == DefaultConst ||
7215 (CaseConst != TrueConst && CaseConst != FalseConst))
7229 if (DefaultConst == FalseConst) {
7232 ++NumTableCmpReuses;
7235 Value *InvertedTableCmp = BinaryOperator::CreateXor(
7236 RangeCmp, ConstantInt::get(RangeCmp->
getType(), 1),
"inverted.cmp",
7239 ++NumTableCmpReuses;
7249 bool ConvertSwitchToLookupTable) {
7250 assert(
SI->getNumCases() > 1 &&
"Degenerate switch?");
7264 if (
SI->getNumCases() < 3)
7286 MinCaseVal = CaseVal;
7288 MaxCaseVal = CaseVal;
7305 It->second.push_back(std::make_pair(CaseVal,
Value));
7313 bool HasDefaultResults =
7315 DefaultResultsList,
DL,
TTI);
7316 for (
const auto &
I : DefaultResultsList) {
7319 DefaultResults[
PHI] = Result;
7323 *MinCaseVal, *MaxCaseVal, HasDefaultResults, ResultTypes,
DL,
TTI);
7326 if (UseSwitchConditionAsTableIndex) {
7328 TableIndexOffset = ConstantInt::get(MaxCaseVal->
getIntegerType(), 0);
7333 TableIndexOffset = MinCaseVal;
7340 bool DefaultIsReachable = !
SI->defaultDestUnreachable();
7342 bool TableHasHoles = (NumResults < TableSize);
7347 bool AllHolesArePoison = TableHasHoles && !HasDefaultResults;
7355 bool NeedMask = AllHolesArePoison && DefaultIsReachable;
7358 if (
SI->getNumCases() < 4)
7360 if (!
DL.fitsInLegalInteger(TableSize))
7369 if (UseSwitchConditionAsTableIndex) {
7370 TableIndex =
SI->getCondition();
7371 if (HasDefaultResults) {
7383 all_of(ResultTypes, [&](
const auto &ResultType) {
7384 return SwitchReplacement::wouldFitInRegister(
DL, UpperBound,
7389 TableSize = std::max(UpperBound, TableSize);
7392 DefaultIsReachable =
false;
7400 const auto &ResultList = ResultLists[
PHI];
7402 Type *ResultType = ResultList.begin()->second->getType();
7407 SwitchReplacement Replacement(*Fn->
getParent(), TableSize, TableIndexOffset,
7408 ResultList, DefaultVal,
DL, FuncName);
7409 PhiToReplacementMap.
insert({
PHI, Replacement});
7412 bool AnyLookupTables =
any_of(
7413 PhiToReplacementMap, [](
auto &KV) {
return KV.second.isLookupTable(); });
7414 bool AnyBitMaps =
any_of(PhiToReplacementMap,
7415 [](
auto &KV) {
return KV.second.isBitMap(); });
7423 if (AnyLookupTables &&
7424 (!
TTI.shouldBuildLookupTables() ||
7430 if (!ConvertSwitchToLookupTable &&
7431 (AnyLookupTables || AnyBitMaps || NeedMask))
7434 Builder.SetInsertPoint(
SI);
7437 if (!UseSwitchConditionAsTableIndex) {
7440 bool MayWrap =
true;
7441 if (!DefaultIsReachable) {
7446 TableIndex = Builder.CreateSub(
SI->getCondition(), TableIndexOffset,
7447 "switch.tableidx",
false,
7451 std::vector<DominatorTree::UpdateType> Updates;
7457 assert(MaxTableSize >= TableSize &&
7458 "It is impossible for a switch to have more entries than the max "
7459 "representable value of its input integer type's size.");
7464 Mod.getContext(),
"switch.lookup", CommonDest->
getParent(), CommonDest);
7469 Builder.SetInsertPoint(
SI);
7470 const bool GeneratingCoveredLookupTable = (MaxTableSize == TableSize);
7471 if (!DefaultIsReachable || GeneratingCoveredLookupTable) {
7472 Builder.CreateBr(LookupBB);
7478 Value *Cmp = Builder.CreateICmpULT(
7479 TableIndex, ConstantInt::get(MinCaseVal->
getType(), TableSize));
7481 Builder.CreateCondBr(Cmp, LookupBB,
SI->getDefaultDest());
7482 CondBranch = RangeCheckBranch;
7488 Builder.SetInsertPoint(LookupBB);
7494 MaskBB->
setName(
"switch.hole_check");
7501 APInt MaskInt(TableSizePowOf2, 0);
7502 APInt One(TableSizePowOf2, 1);
7504 const ResultListTy &ResultList = ResultLists[PHIs[0]];
7505 for (
const auto &Result : ResultList) {
7508 MaskInt |= One << Idx;
7510 ConstantInt *TableMask = ConstantInt::get(
Mod.getContext(), MaskInt);
7517 Builder.CreateZExtOrTrunc(TableIndex, MapTy,
"switch.maskindex");
7518 Value *Shifted = Builder.CreateLShr(TableMask, MaskIndex,
"switch.shifted");
7519 Value *LoBit = Builder.CreateTrunc(
7521 CondBranch = Builder.CreateCondBr(LoBit, LookupBB,
SI->getDefaultDest());
7526 Builder.SetInsertPoint(LookupBB);
7530 if (!DefaultIsReachable || GeneratingCoveredLookupTable) {
7533 SI->getDefaultDest()->removePredecessor(BB,
7540 const ResultListTy &ResultList = ResultLists[
PHI];
7541 auto Replacement = PhiToReplacementMap.
at(
PHI);
7542 auto *Result = Replacement.replaceSwitch(TableIndex, Builder,
DL, Fn);
7545 if (!TableHasHoles && HasDefaultResults && RangeCheckBranch) {
7548 for (
auto *
User :
PHI->users()) {
7550 Replacement.getDefaultValue(), ResultList);
7554 PHI->addIncoming(Result, LookupBB);
7557 Builder.CreateBr(CommonDest);
7569 for (
unsigned I = 0,
E =
SI->getNumSuccessors();
I <
E; ++
I) {
7572 if (Succ ==
SI->getDefaultDest()) {
7573 if (HasBranchWeights)
7574 ToDefaultWeight += BranchWeights[
I];
7578 if (DTU && RemovedSuccessors.
insert(Succ).second)
7580 if (HasBranchWeights)
7581 ToLookupWeight += BranchWeights[
I];
7583 SI->eraseFromParent();
7584 if (HasBranchWeights)
7591 ++NumLookupTablesHoles;
7607 if (CondTy->getIntegerBitWidth() > 64 ||
7608 !
DL.fitsInLegalInteger(CondTy->getIntegerBitWidth()))
7612 if (
SI->getNumCases() < 4)
7620 for (
const auto &
C :
SI->cases())
7621 Values.
push_back(
C.getCaseValue()->getValue().getSExtValue());
7629 int64_t
Base = Values[0];
7630 for (
auto &V : Values)
7643 unsigned Shift = 64;
7644 for (
auto &V : Values)
7648 for (
auto &V : Values)
7649 V = (int64_t)((
uint64_t)V >> Shift);
7666 Builder.SetInsertPoint(
SI);
7669 Value *Rot = Builder.CreateIntrinsic(
7670 Ty, Intrinsic::fshl,
7671 {
Sub,
Sub, ConstantInt::get(Ty, Ty->getBitWidth() - Shift)});
7672 SI->replaceUsesOfWith(
SI->getCondition(), Rot);
7674 for (
auto Case :
SI->cases()) {
7675 auto *Orig = Case.getCaseValue();
7676 auto Sub = Orig->getValue() -
APInt(Ty->getBitWidth(),
Base,
true);
7721 for (
auto I =
SI->case_begin(),
E =
SI->case_end();
I !=
E;) {
7722 if (!
I->getCaseValue()->getValue().ugt(
Constant->getValue())) {
7738 if (!
SI->defaultDestUnreachable() || Case ==
SI->case_default()) {
7741 return !Updates.
empty();
7771 Value *Condition =
SI->getCondition();
7775 if (CondTy->getIntegerBitWidth() > 64 ||
7776 !
DL.fitsInLegalInteger(CondTy->getIntegerBitWidth()))
7788 if (
SI->getNumCases() < 4)
7793 for (
const auto &Case :
SI->cases()) {
7794 uint64_t CaseValue = Case.getCaseValue()->getValue().getZExtValue();
7808 Builder.SetInsertPoint(
SI);
7810 if (!
SI->defaultDestUnreachable()) {
7813 auto *PopC = Builder.CreateUnaryIntrinsic(Intrinsic::ctpop, Condition);
7814 auto *IsPow2 = Builder.CreateICmpEQ(PopC, ConstantInt::get(CondTy, 1));
7816 auto *OrigBB =
SI->getParent();
7817 auto *DefaultCaseBB =
SI->getDefaultDest();
7819 auto It = OrigBB->getTerminator()->getIterator();
7832 NewWeights[1] = Weights[0] / 2;
7833 NewWeights[0] = OrigDenominator - NewWeights[1];
7845 Weights[0] = NewWeights[1];
7846 uint64_t CasesDenominator = OrigDenominator - Weights[0];
7848 W = NewWeights[0] *
static_cast<double>(W) / CasesDenominator;
7854 It->eraseFromParent();
7862 for (
auto &Case :
SI->cases()) {
7863 auto *OrigValue = Case.getCaseValue();
7864 Case.setValue(ConstantInt::get(OrigValue->getIntegerType(),
7865 OrigValue->getValue().countr_zero()));
7869 auto *ConditionTrailingZeros = Builder.CreateIntrinsic(
7872 SI->setCondition(ConditionTrailingZeros);
7882 if (!Cmp || !Cmp->hasOneUse())
7893 uint32_t SuccWeight = 0, OtherSuccWeight = 0;
7896 if (
SI->getNumCases() == 2) {
7903 Succ =
SI->getDefaultDest();
7904 SuccWeight = Weights[0];
7906 for (
auto &Case :
SI->cases()) {
7907 std::optional<int64_t> Val =
7911 if (!Missing.erase(*Val))
7916 OtherSuccWeight += Weights[Case.getSuccessorIndex()];
7919 assert(Missing.size() == 1 &&
"Should have one case left");
7920 Res = *Missing.begin();
7921 }
else if (
SI->getNumCases() == 3 &&
SI->defaultDestUnreachable()) {
7923 Unreachable =
SI->getDefaultDest();
7925 for (
auto &Case :
SI->cases()) {
7926 BasicBlock *NewSucc = Case.getCaseSuccessor();
7927 uint32_t Weight = Weights[Case.getSuccessorIndex()];
7930 OtherSuccWeight += Weight;
7933 SuccWeight = Weight;
7934 }
else if (Succ == NewSucc) {
7940 for (
auto &Case :
SI->cases()) {
7941 std::optional<int64_t> Val =
7943 if (!Val || (Val != 1 && Val != 0 && Val != -1))
7945 if (Case.getCaseSuccessor() == Succ) {
7967 if (Cmp->isSigned())
7970 MDNode *NewWeights =
nullptr;
7976 Builder.SetInsertPoint(
SI->getIterator());
7977 Value *ICmp = Builder.CreateICmp(Pred, Cmp->getLHS(), Cmp->getRHS());
7978 Builder.CreateCondBr(ICmp, Succ,
OtherSucc, NewWeights,
7979 SI->getMetadata(LLVMContext::MD_unpredictable));
7983 SI->eraseFromParent();
7984 Cmp->eraseFromParent();
7985 if (DTU && Unreachable)
8016 "Only supporting unconditional branches for now");
8018 "Expected unconditional branches to have one successor");
8019 assert(Succ->
size() == 1 &&
"Expected just a single branch in the BB");
8040 if (LHS == EKey || RHS == EKey || LHS == TKey || RHS == TKey)
8056 "Only supporting unconditional branches for now");
8063 auto &PredIVs = (*LHS->PhiPredIVs)[&Phi];
8064 if (PredIVs[
A] != PredIVs[
B])
8072bool SimplifyCFGOpt::simplifyDuplicateSwitchArms(
SwitchInst *
SI,
8086 for (
unsigned I = 0;
I <
SI->getNumSuccessors(); ++
I) {
8091 if (BB->
size() != 1)
8101 if (!Seen.
insert(BB).second) {
8102 auto It = BBToSuccessorIndexes.
find(BB);
8103 if (It != BBToSuccessorIndexes.
end())
8104 It->second.emplace_back(
I);
8118 Cases.
emplace_back(SwitchSuccWrapper{BB, &PhiPredIVs});
8119 BBToSuccessorIndexes[BB].emplace_back(
I);
8125 for (PHINode *Phi : Phis) {
8127 PhiPredIVs.
try_emplace(Phi,
Phi->getNumIncomingValues()).first->second;
8128 for (
auto &
IV :
Phi->incoming_values())
8129 IVs.insert({
Phi->getIncomingBlock(
IV),
IV.get()});
8140 DenseSet<const SwitchSuccWrapper *> ReplaceWith;
8145 bool MadeChange =
false;
8146 for (
auto &SSW : Cases) {
8153 Updates.
push_back({DominatorTree::Delete,
SI->getParent(), SSW.Dest});
8154 const auto &Successors = BBToSuccessorIndexes.
at(SSW.Dest);
8155 for (
unsigned Idx : Successors)
8156 SI->setSuccessor(Idx, (*It)->Dest);
8167bool SimplifyCFGOpt::simplifySwitch(SwitchInst *SI,
IRBuilder<> &Builder) {
8170 if (isValueEqualityComparison(SI)) {
8174 if (simplifyEqualityComparisonWithOnlyPredecessor(SI, OnlyPred, Builder))
8175 return requestResimplify();
8179 if (simplifySwitchOnSelect(SI,
Select))
8180 return requestResimplify();
8185 if (foldValueComparisonIntoPredecessors(SI, Builder))
8186 return requestResimplify();
8192 if (
Options.ConvertSwitchRangeToICmp && turnSwitchRangeIntoICmp(SI, Builder))
8193 return requestResimplify();
8197 return requestResimplify();
8200 return requestResimplify();
8203 return requestResimplify();
8206 return requestResimplify();
8211 if (
Options.ConvertSwitchToArithmetic ||
Options.ConvertSwitchToLookupTable)
8213 Options.ConvertSwitchToLookupTable))
8214 return requestResimplify();
8217 return requestResimplify();
8220 return requestResimplify();
8223 hoistCommonCodeFromSuccessors(SI, !
Options.HoistCommonInsts))
8224 return requestResimplify();
8226 if (simplifyDuplicateSwitchArms(SI, DTU))
8227 return requestResimplify();
8230 return requestResimplify();
8235bool SimplifyCFGOpt::simplifyIndirectBr(IndirectBrInst *IBI) {
8238 SmallVector<uint32_t> BranchWeights;
8242 DenseMap<const BasicBlock *, uint64_t> TargetWeight;
8243 if (HasBranchWeights)
8248 SmallPtrSet<Value *, 8> Succs;
8249 SmallSetVector<BasicBlock *, 8> RemovedSuccs;
8254 RemovedSuccs.
insert(Dest);
8264 std::vector<DominatorTree::UpdateType> Updates;
8265 Updates.reserve(RemovedSuccs.
size());
8266 for (
auto *RemovedSucc : RemovedSuccs)
8267 Updates.push_back({DominatorTree::Delete, BB, RemovedSucc});
8284 if (HasBranchWeights) {
8291 if (simplifyIndirectBrOnSelect(IBI, SI))
8292 return requestResimplify();
8328 if (BB == OtherPred)
8339 std::vector<DominatorTree::UpdateType> Updates;
8346 assert(
II->getNormalDest() != BB &&
II->getUnwindDest() == BB &&
8347 "unexpected successor");
8348 II->setUnwindDest(OtherPred);
8363 Builder.CreateUnreachable();
8372bool SimplifyCFGOpt::simplifyUncondBranch(UncondBrInst *BI,
8384 bool NeedCanonicalLoop =
8398 if (
I->isTerminator() &&
8399 tryToSimplifyUncondBranchWithICmpInIt(ICI, Builder))
8420 if (
Options.SpeculateBlocks &&
8423 return requestResimplify();
8431 if (!PPred || (PredPred && PredPred != PPred))
8468 if (!SuccBI || !SuccBI->isConditional())
8472 return Succ1 != Succ && Succ2 != Succ && Succ1 != BB && Succ2 != BB &&
8476 if (!IsSimpleSuccessor(BB1, BB1BI) || !IsSimpleSuccessor(BB2, BB2BI))
8502 bool HasWeight =
false;
8507 BBTWeight = BBFWeight = 1;
8512 BB1TWeight = BB1FWeight = 1;
8517 BB2TWeight = BB2FWeight = 1;
8519 uint64_t Weights[2] = {BBTWeight * BB1FWeight + BBFWeight * BB2TWeight,
8520 BBTWeight * BB1TWeight + BBFWeight * BB2FWeight};
8527bool SimplifyCFGOpt::simplifyCondBranch(CondBrInst *BI,
IRBuilder<> &Builder) {
8531 "Tautological conditional branch should have been eliminated already.");
8534 if (!
Options.SimplifyCondBranch ||
8539 if (isValueEqualityComparison(BI)) {
8544 if (simplifyEqualityComparisonWithOnlyPredecessor(BI, OnlyPred, Builder))
8545 return requestResimplify();
8551 if (foldValueComparisonIntoPredecessors(BI, Builder))
8552 return requestResimplify();
8555 if (&*
I == BI && foldValueComparisonIntoPredecessors(BI, Builder))
8556 return requestResimplify();
8561 if (simplifyBranchOnICmpChain(BI, Builder,
DL))
8574 return requestResimplify();
8580 if (
Options.SpeculateBlocks &&
8583 return requestResimplify();
8592 hoistCommonCodeFromSuccessors(BI, !
Options.HoistCommonInsts))
8593 return requestResimplify();
8595 if (BI &&
Options.HoistLoadsStoresWithCondFaulting &&
8597 SmallVector<Instruction *, 2> SpeculatedConditionalLoadsStores;
8598 auto CanSpeculateConditionalLoadsStores = [&]() {
8600 for (Instruction &
I : *Succ) {
8601 if (
I.isTerminator()) {
8602 if (
I.getNumSuccessors() > 1)
8606 SpeculatedConditionalLoadsStores.
size() ==
8610 SpeculatedConditionalLoadsStores.
push_back(&
I);
8613 return !SpeculatedConditionalLoadsStores.
empty();
8616 if (CanSpeculateConditionalLoadsStores()) {
8618 std::nullopt,
nullptr);
8619 return requestResimplify();
8629 return requestResimplify();
8638 return requestResimplify();
8644 if (foldCondBranchOnValueKnownInPredecessor(BI))
8645 return requestResimplify();
8650 if (PBI != BI && PBI->isConditional())
8652 return requestResimplify();
8658 if (PBI != BI && PBI->isConditional())
8660 return requestResimplify();
8664 return requestResimplify();
8671 assert(V->getType() ==
I->getType() &&
"Mismatched types");
8683 auto *Use = cast<Instruction>(U.getUser());
8685 switch (Use->getOpcode()) {
8688 case Instruction::GetElementPtr:
8689 case Instruction::Ret:
8690 case Instruction::BitCast:
8691 case Instruction::Load:
8692 case Instruction::Store:
8693 case Instruction::Call:
8694 case Instruction::CallBr:
8695 case Instruction::Invoke:
8696 case Instruction::UDiv:
8697 case Instruction::URem:
8701 case Instruction::SDiv:
8702 case Instruction::SRem:
8706 if (FindUse ==
I->use_end())
8708 auto &
Use = *FindUse;
8713 if (
User->getParent() !=
I->getParent() ||
User ==
I ||
8714 User->comesBefore(
I))
8728 if (
GEP->getPointerOperand() ==
I) {
8731 if (
GEP->getType()->isVectorTy())
8739 if (!
GEP->hasAllZeroIndices() &&
8740 (!
GEP->isInBounds() ||
8742 GEP->getPointerAddressSpace())))
8743 PtrValueMayBeModified =
true;
8749 bool HasNoUndefAttr =
8750 Ret->getFunction()->hasRetAttribute(Attribute::NoUndef);
8755 if (
C->isNullValue() && HasNoUndefAttr &&
8756 Ret->getFunction()->hasRetAttribute(Attribute::NonNull)) {
8757 return !PtrValueMayBeModified;
8763 if (!LI->isVolatile())
8765 LI->getPointerAddressSpace());
8769 if (!
SI->isVolatile())
8771 SI->getPointerAddressSpace())) &&
8772 SI->getPointerOperand() ==
I;
8777 if (
I == Assume->getArgOperand(0))
8785 if (CB->getCalledOperand() ==
I)
8788 if (CB->isArgOperand(&
Use)) {
8789 unsigned ArgIdx = CB->getArgOperandNo(&
Use);
8792 CB->paramHasNonNullAttr(ArgIdx,
false))
8793 return !PtrValueMayBeModified;
8812 for (
unsigned i = 0, e =
PHI.getNumIncomingValues(); i != e; ++i)
8821 if (BI->isUnconditional())
8822 Builder.CreateUnreachable();
8829 Assumption = Builder.CreateAssumption(Builder.CreateNot(
Cond));
8831 Assumption = Builder.CreateAssumption(
Cond);
8846 Builder.SetInsertPoint(Unreachable);
8848 Builder.CreateUnreachable();
8849 for (
const auto &Case :
SI->cases())
8850 if (Case.getCaseSuccessor() == BB) {
8852 Case.setSuccessor(Unreachable);
8854 if (
SI->getDefaultDest() == BB) {
8856 SI->setDefaultDest(Unreachable);
8870bool SimplifyCFGOpt::simplifyOnce(BasicBlock *BB) {
8895 return requestResimplify();
8916 if (
Options.SpeculateBlocks &&
8923 Options.SpeculateUnpredictables))
8930 case Instruction::UncondBr:
8933 case Instruction::CondBr:
8936 case Instruction::Resume:
8939 case Instruction::CleanupRet:
8942 case Instruction::Switch:
8945 case Instruction::Unreachable:
8948 case Instruction::IndirectBr:
8956bool SimplifyCFGOpt::run(BasicBlock *BB) {
8966 }
while (Resimplify);
assert(UImm &&(UImm !=~static_cast< T >(0)) &&"Invalid immediate!")
AMDGPU Register Bank Select
This file implements a class to represent arbitrary precision integral constant values and operations...
static MachineBasicBlock * OtherSucc(MachineBasicBlock *MBB, MachineBasicBlock *Succ)
MachineBasicBlock MachineBasicBlock::iterator DebugLoc DL
static cl::opt< ITMode > IT(cl::desc("IT block support"), cl::Hidden, cl::init(DefaultIT), cl::values(clEnumValN(DefaultIT, "arm-default-it", "Generate any type of IT block"), clEnumValN(RestrictedIT, "arm-restrict-it", "Disallow complex IT blocks")))
Function Alias Analysis Results
This file contains the simple types necessary to represent the attributes associated with functions a...
static const Function * getParent(const Value *V)
static GCRegistry::Add< ErlangGC > A("erlang", "erlang-compatible garbage collector")
static GCRegistry::Add< CoreCLRGC > E("coreclr", "CoreCLR-compatible GC")
static GCRegistry::Add< OcamlGC > B("ocaml", "ocaml 3.10-compatible GC")
This file contains the declarations for the subclasses of Constant, which represent the different fla...
static cl::opt< OutputCostKind > CostKind("cost-kind", cl::desc("Target cost kind"), cl::init(OutputCostKind::RecipThroughput), cl::values(clEnumValN(OutputCostKind::RecipThroughput, "throughput", "Reciprocal throughput"), clEnumValN(OutputCostKind::Latency, "latency", "Instruction latency"), clEnumValN(OutputCostKind::CodeSize, "code-size", "Code size"), clEnumValN(OutputCostKind::SizeAndLatency, "size-latency", "Code size and latency"), clEnumValN(OutputCostKind::All, "all", "Print all cost kinds")))
This file defines the DenseMap class.
static Value * getCondition(Instruction *I)
static bool IsIndirectCall(const MachineInstr *MI)
This file provides various utilities for inspecting and working with the control flow graph in LLVM I...
Module.h This file contains the declarations for the Module class.
This defines the Use class.
static Constant * getFalse(Type *Ty)
For a boolean type or a vector of boolean type, return false or a vector with every element false.
const AbstractManglingParser< Derived, Alloc >::OperatorInfo AbstractManglingParser< Derived, Alloc >::Ops[]
Machine Check Debug Module
This file implements a map that provides insertion order iteration.
This file provides utility for Memory Model Relaxation Annotations (MMRAs).
This file exposes an interface to building/using memory SSA to walk memory instructions using a use/d...
MachineInstr unsigned OpIdx
ConstantRange Range(APInt(BitWidth, Low), APInt(BitWidth, High))
uint64_t IntrinsicInst * II
if(auto Err=PB.parsePassPipeline(MPM, Passes)) return wrap(std MPM run * Mod
This file contains the declarations for profiling metadata utility functions.
const SmallVectorImpl< MachineOperand > & Cond
static bool contains(SmallPtrSetImpl< ConstantExpr * > &Cache, ConstantExpr *Expr, Constant *C)
Provides some synthesis utilities to produce sequences of values.
This file defines generic set operations that may be used on set's of different types,...
This file implements a set that has insertion order iteration characteristics.
static std::optional< ContiguousCasesResult > findContiguousCases(Value *Condition, SmallVectorImpl< ConstantInt * > &Cases, SmallVectorImpl< ConstantInt * > &OtherCases, BasicBlock *Dest, BasicBlock *OtherDest)
static void addPredecessorToBlock(BasicBlock *Succ, BasicBlock *NewPred, BasicBlock *ExistPred, MemorySSAUpdater *MSSAU=nullptr)
Update PHI nodes in Succ to indicate that there will now be entries in it from the 'NewPred' block.
static bool validLookupTableConstant(Constant *C, const TargetTransformInfo &TTI)
Return true if the backend will be able to handle initializing an array of constants like C.
static StoreInst * findUniqueStoreInBlocks(BasicBlock *BB1, BasicBlock *BB2)
static bool isProfitableToSpeculate(const BranchInst *BI, std::optional< bool > Invert, const TargetTransformInfo &TTI)
static bool validateAndCostRequiredSelects(BasicBlock *BB, BasicBlock *ThenBB, BasicBlock *EndBB, unsigned &SpeculatedInstructions, InstructionCost &Cost, const TargetTransformInfo &TTI)
Estimate the cost of the insertion(s) and check that the PHI nodes can be converted to selects.
static bool simplifySwitchLookup(SwitchInst *SI, IRBuilder<> &Builder, DomTreeUpdater *DTU, const DataLayout &DL, const TargetTransformInfo &TTI, bool ConvertSwitchToLookupTable)
If the switch is only used to initialize one or more phi nodes in a common successor block with diffe...
static void removeSwitchAfterSelectFold(SwitchInst *SI, PHINode *PHI, Value *SelectValue, IRBuilder<> &Builder, DomTreeUpdater *DTU)
static bool valuesOverlap(std::vector< ValueEqualityComparisonCase > &C1, std::vector< ValueEqualityComparisonCase > &C2)
Return true if there are any keys in C1 that exist in C2 as well.
static bool mergeConditionalStoreToAddress(BasicBlock *PTB, BasicBlock *PFB, BasicBlock *QTB, BasicBlock *QFB, BasicBlock *PostBB, Value *Address, bool InvertPCond, bool InvertQCond, DomTreeUpdater *DTU, const DataLayout &DL, const TargetTransformInfo &TTI)
static std::optional< std::tuple< BasicBlock *, Instruction::BinaryOps, bool > > shouldFoldCondBranchesToCommonDestination(BranchInst *BI, BranchInst *PBI, const TargetTransformInfo *TTI)
Determine if the two branches share a common destination and deduce a glue that joins the branches' c...
static bool mergeCleanupPad(CleanupReturnInst *RI)
static void hoistConditionalLoadsStores(BranchInst *BI, SmallVectorImpl< Instruction * > &SpeculatedConditionalLoadsStores, std::optional< bool > Invert, Instruction *Sel)
If the target supports conditional faulting, we look for the following pattern:
static bool isVectorOp(Instruction &I)
Return if an instruction's type or any of its operands' types are a vector type.
static BasicBlock * allPredecessorsComeFromSameSource(BasicBlock *BB)
static void cloneInstructionsIntoPredecessorBlockAndUpdateSSAUses(BasicBlock *BB, BasicBlock *PredBlock, ValueToValueMapTy &VMap)
static int constantIntSortPredicate(ConstantInt *const *P1, ConstantInt *const *P2)
static bool getCaseResults(SwitchInst *SI, ConstantInt *CaseVal, BasicBlock *CaseDest, BasicBlock **CommonDest, SmallVectorImpl< std::pair< PHINode *, Constant * > > &Res, const DataLayout &DL, const TargetTransformInfo &TTI)
Try to determine the resulting constant values in phi nodes at the common destination basic block,...
static bool performBranchToCommonDestFolding(BranchInst *BI, BranchInst *PBI, DomTreeUpdater *DTU, MemorySSAUpdater *MSSAU, const TargetTransformInfo *TTI)
static bool passingValueIsAlwaysUndefined(Value *V, Instruction *I, bool PtrValueMayBeModified=false)
Check if passing a value to an instruction will cause undefined behavior.
static bool isSafeToHoistInstr(Instruction *I, unsigned Flags)
static bool isSafeToHoistInvoke(BasicBlock *BB1, BasicBlock *BB2, Instruction *I1, Instruction *I2)
static ConstantInt * getConstantInt(Value *V, const DataLayout &DL)
Extract ConstantInt from value, looking through IntToPtr and PointerNullValue.
static bool simplifySwitchOfCmpIntrinsic(SwitchInst *SI, IRBuilderBase &Builder, DomTreeUpdater *DTU)
Fold switch over ucmp/scmp intrinsic to br if two of the switch arms have the same destination.
static bool shouldBuildLookupTable(SwitchInst *SI, uint64_t TableSize, const TargetTransformInfo &TTI, const DataLayout &DL, const SmallVector< Type * > &ResultTypes)
Determine whether a lookup table should be built for this switch, based on the number of cases,...
static bool extractPredSuccWeights(BranchInst *PBI, BranchInst *BI, uint64_t &PredTrueWeight, uint64_t &PredFalseWeight, uint64_t &SuccTrueWeight, uint64_t &SuccFalseWeight)
Return true if either PBI or BI has branch weight available, and store the weights in {Pred|Succ}...
static Constant * constantFold(Instruction *I, const DataLayout &DL, const SmallDenseMap< Value *, Constant * > &ConstantPool)
Try to fold instruction I into a constant.
static bool SimplifyCondBranchToCondBranch(BranchInst *PBI, BranchInst *BI, DomTreeUpdater *DTU, const DataLayout &DL, const TargetTransformInfo &TTI)
If we have a conditional branch as a predecessor of another block, this function tries to simplify it...
static bool tryToMergeLandingPad(LandingPadInst *LPad, BranchInst *BI, BasicBlock *BB, DomTreeUpdater *DTU)
Given an block with only a single landing pad and a unconditional branch try to find another basic bl...
static bool areIdenticalUpToCommutativity(const Instruction *I1, const Instruction *I2)
static bool forwardSwitchConditionToPHI(SwitchInst *SI)
Try to forward the condition of a switch instruction to a phi node dominated by the switch,...
static PHINode * findPHIForConditionForwarding(ConstantInt *CaseValue, BasicBlock *BB, int *PhiIndex)
If BB would be eligible for simplification by TryToSimplifyUncondBranchFromEmptyBlock (i....
static bool simplifySwitchOfPowersOfTwo(SwitchInst *SI, IRBuilder<> &Builder, DomTreeUpdater *DTU, const DataLayout &DL, const TargetTransformInfo &TTI)
Tries to transform switch of powers of two to reduce switch range.
static bool isCleanupBlockEmpty(iterator_range< BasicBlock::iterator > R)
static Value * ensureValueAvailableInSuccessor(Value *V, BasicBlock *BB, Value *AlternativeV=nullptr)
static Value * createLogicalOp(IRBuilderBase &Builder, Instruction::BinaryOps Opc, Value *LHS, Value *RHS, const Twine &Name="")
static bool shouldHoistCommonInstructions(Instruction *I1, Instruction *I2, const TargetTransformInfo &TTI)
Helper function for hoistCommonCodeFromSuccessors.
static bool reduceSwitchRange(SwitchInst *SI, IRBuilder<> &Builder, const DataLayout &DL, const TargetTransformInfo &TTI)
Try to transform a switch that has "holes" in it to a contiguous sequence of cases.
static bool mergeConditionalStores(BranchInst *PBI, BranchInst *QBI, DomTreeUpdater *DTU, const DataLayout &DL, const TargetTransformInfo &TTI)
static bool safeToMergeTerminators(Instruction *SI1, Instruction *SI2, SmallSetVector< BasicBlock *, 4 > *FailBlocks=nullptr)
Return true if it is safe to merge these two terminator instructions together.
@ SkipImplicitControlFlow
static bool incomingValuesAreCompatible(BasicBlock *BB, ArrayRef< BasicBlock * > IncomingBlocks, SmallPtrSetImpl< Value * > *EquivalenceSet=nullptr)
Return true if all the PHI nodes in the basic block BB receive compatible (identical) incoming values...
static bool trySwitchToSelect(SwitchInst *SI, IRBuilder<> &Builder, DomTreeUpdater *DTU, const DataLayout &DL, const TargetTransformInfo &TTI)
If a switch is only used to initialize one or more phi nodes in a common successor block with only tw...
static void createUnreachableSwitchDefault(SwitchInst *Switch, DomTreeUpdater *DTU, bool RemoveOrigDefaultBlock=true)
static Value * foldSwitchToSelect(const SwitchCaseResultVectorTy &ResultVector, Constant *DefaultResult, Value *Condition, IRBuilder<> &Builder, const DataLayout &DL, ArrayRef< uint32_t > BranchWeights)
static bool isSwitchDense(uint64_t NumCases, uint64_t CaseRange)
static bool sinkCommonCodeFromPredecessors(BasicBlock *BB, DomTreeUpdater *DTU)
Check whether BB's predecessors end with unconditional branches.
static bool isTypeLegalForLookupTable(Type *Ty, const TargetTransformInfo &TTI, const DataLayout &DL)
static bool eliminateDeadSwitchCases(SwitchInst *SI, DomTreeUpdater *DTU, AssumptionCache *AC, const DataLayout &DL)
Compute masked bits for the condition of a switch and use it to remove dead cases.
static bool blockIsSimpleEnoughToThreadThrough(BasicBlock *BB, BlocksSet &NonLocalUseBlocks)
Return true if we can thread a branch across this block.
static Value * isSafeToSpeculateStore(Instruction *I, BasicBlock *BrBB, BasicBlock *StoreBB, BasicBlock *EndBB)
Determine if we can hoist sink a sole store instruction out of a conditional block.
static bool foldTwoEntryPHINode(PHINode *PN, const TargetTransformInfo &TTI, DomTreeUpdater *DTU, AssumptionCache *AC, const DataLayout &DL, bool SpeculateUnpredictables)
Given a BB that starts with the specified two-entry PHI node, see if we can eliminate it.
static bool findReaching(BasicBlock *BB, BasicBlock *DefBB, BlocksSet &ReachesNonLocalUses)
static bool initializeUniqueCases(SwitchInst *SI, PHINode *&PHI, BasicBlock *&CommonDest, SwitchCaseResultVectorTy &UniqueResults, Constant *&DefaultResult, const DataLayout &DL, const TargetTransformInfo &TTI, uintptr_t MaxUniqueResults)
static bool shouldUseSwitchConditionAsTableIndex(ConstantInt &MinCaseVal, const ConstantInt &MaxCaseVal, bool HasDefaultResults, const SmallVector< Type * > &ResultTypes, const DataLayout &DL, const TargetTransformInfo &TTI)
static InstructionCost computeSpeculationCost(const User *I, const TargetTransformInfo &TTI)
Compute an abstract "cost" of speculating the given instruction, which is assumed to be safe to specu...
SmallPtrSet< BasicBlock *, 8 > BlocksSet
static unsigned skippedInstrFlags(Instruction *I)
static bool mergeCompatibleInvokes(BasicBlock *BB, DomTreeUpdater *DTU)
If this block is a landingpad exception handling block, categorize all the predecessor invokes into s...
static bool replacingOperandWithVariableIsCheap(const Instruction *I, int OpIdx)
static void eraseTerminatorAndDCECond(Instruction *TI, MemorySSAUpdater *MSSAU=nullptr)
static void eliminateBlockCases(BasicBlock *BB, std::vector< ValueEqualityComparisonCase > &Cases)
Given a vector of bb/value pairs, remove any entries in the list that match the specified block.
static void sinkLastInstruction(ArrayRef< BasicBlock * > Blocks)
static std::optional< bool > foldCondBranchOnValueKnownInPredecessorImpl(BranchInst *BI, DomTreeUpdater *DTU, const DataLayout &DL, AssumptionCache *AC)
If we have a conditional branch on something for which we know the constant value in predecessors (e....
static size_t mapCaseToResult(ConstantInt *CaseVal, SwitchCaseResultVectorTy &UniqueResults, Constant *Result)
static void mergeCompatibleInvokesImpl(ArrayRef< InvokeInst * > Invokes, DomTreeUpdater *DTU)
static void getBranchWeights(Instruction *TI, SmallVectorImpl< uint64_t > &Weights)
Get Weights of a given terminator, the default weight is at the front of the vector.
static void reuseTableCompare(User *PhiUser, BasicBlock *PhiBlock, BranchInst *RangeCheckBranch, Constant *DefaultValue, const SmallVectorImpl< std::pair< ConstantInt *, Constant * > > &Values)
Try to reuse the switch table index compare.
static bool tryWidenCondBranchToCondBranch(BranchInst *PBI, BranchInst *BI, DomTreeUpdater *DTU)
If the previous block ended with a widenable branch, determine if reusing the target block is profita...
static bool mergeNestedCondBranch(BranchInst *BI, DomTreeUpdater *DTU)
Fold the following pattern: bb0: br i1 cond1, label bb1, label bb2 bb1: br i1 cond2,...
static Constant * lookupConstant(Value *V, const SmallDenseMap< Value *, Constant * > &ConstantPool)
If V is a Constant, return it.
static bool canSinkInstructions(ArrayRef< Instruction * > Insts, DenseMap< const Use *, SmallVector< Value *, 4 > > &PHIOperands)
static void hoistLockstepIdenticalDbgVariableRecords(Instruction *TI, Instruction *I1, SmallVectorImpl< Instruction * > &OtherInsts)
Hoists DbgVariableRecords from I1 and OtherInstrs that are identical in lock-step to TI.
static bool removeEmptyCleanup(CleanupReturnInst *RI, DomTreeUpdater *DTU)
static bool removeUndefIntroducingPredecessor(BasicBlock *BB, DomTreeUpdater *DTU, AssumptionCache *AC)
If BB has an incoming value that will always trigger undefined behavior (eg.
static bool simplifySwitchWhenUMin(SwitchInst *SI, DomTreeUpdater *DTU)
Tries to transform the switch when the condition is umin with a constant.
static bool isSafeCheapLoadStore(const Instruction *I, const TargetTransformInfo &TTI)
static ConstantInt * getKnownValueOnEdge(Value *V, BasicBlock *From, BasicBlock *To)
static bool dominatesMergePoint(Value *V, BasicBlock *BB, Instruction *InsertPt, SmallPtrSetImpl< Instruction * > &AggressiveInsts, InstructionCost &Cost, InstructionCost Budget, const TargetTransformInfo &TTI, AssumptionCache *AC, SmallPtrSetImpl< Instruction * > &ZeroCostInstructions, unsigned Depth=0)
If we have a merge point of an "if condition" as accepted above, return true if the specified value d...
This file defines the SmallPtrSet class.
This file defines the SmallVector class.
This file defines the 'Statistic' class, which is designed to be an easy way to expose various metric...
#define STATISTIC(VARNAME, DESC)
static TableGen::Emitter::OptClass< SkeletonEmitter > X("gen-skeleton-class", "Generate example skeleton class")
static const uint32_t IV[8]
Class for arbitrary precision integers.
static APInt getAllOnes(unsigned numBits)
Return an APInt of a specified width with all bits set.
LLVM_ABI APInt zext(unsigned width) const
Zero extend to a new width.
unsigned popcount() const
Count the number of bits set.
bool sgt(const APInt &RHS) const
Signed greater than comparison.
bool isZero() const
Determine if this value is zero, i.e. all bits are clear.
bool intersects(const APInt &RHS) const
This operation tests if there are any pairs of corresponding bits between this APInt and RHS that are...
bool sle(const APInt &RHS) const
Signed less or equal comparison.
unsigned getSignificantBits() const
Get the minimum bit size for this signed APInt.
bool isStrictlyPositive() const
Determine if this APInt Value is positive.
uint64_t getLimitedValue(uint64_t Limit=UINT64_MAX) const
If this value is smaller than the specified limit, return it, otherwise return the limit value.
LLVM_ABI APInt smul_ov(const APInt &RHS, bool &Overflow) const
bool isSubsetOf(const APInt &RHS) const
This operation checks that all bits set in this APInt are also set in RHS.
bool slt(const APInt &RHS) const
Signed less than comparison.
static APInt getZero(unsigned numBits)
Get the '0' value for the specified bit-width.
std::optional< int64_t > trySExtValue() const
Get sign extended value if possible.
LLVM_ABI APInt ssub_ov(const APInt &RHS, bool &Overflow) const
bool uge(const APInt &RHS) const
Unsigned greater or equal comparison.
ArrayRef - Represent a constant reference to an array (0 or more elements consecutively in memory),...
const T & back() const
back - Get the last element.
const T & front() const
front - Get the first element.
size_t size() const
size - Get the array size.
bool empty() const
empty - Check if the array is empty.
static LLVM_ABI ArrayType * get(Type *ElementType, uint64_t NumElements)
This static method is the primary way to construct an ArrayType.
A cache of @llvm.assume calls within a function.
LLVM_ABI void registerAssumption(AssumeInst *CI)
Add an @llvm.assume intrinsic to this function's cache.
LLVM_ABI bool getValueAsBool() const
Return the attribute's value as a boolean.
LLVM Basic Block Representation.
iterator begin()
Instruction iterator methods.
iterator_range< const_phi_iterator > phis() const
Returns a range that iterates over the phis in the basic block.
LLVM_ABI const_iterator getFirstInsertionPt() const
Returns an iterator to the first instruction in this block that is suitable for inserting a non-PHI i...
const Function * getParent() const
Return the enclosing method, or null if none.
LLVM_ABI iterator_range< filter_iterator< BasicBlock::const_iterator, std::function< bool(const Instruction &)> > > instructionsWithoutDebug(bool SkipPseudoOp=true) const
Return a const iterator range over the instructions in the block, skipping any debug instructions.
bool hasAddressTaken() const
Returns true if there are any uses of this basic block other than direct branches,...
LLVM_ABI InstListType::const_iterator getFirstNonPHIIt() const
Returns an iterator to the first instruction in this block that is not a PHINode instruction.
static BasicBlock * Create(LLVMContext &Context, const Twine &Name="", Function *Parent=nullptr, BasicBlock *InsertBefore=nullptr)
Creates a new BasicBlock.
LLVM_ABI InstListType::const_iterator getFirstNonPHIOrDbg(bool SkipPseudoOp=true) const
Returns a pointer to the first instruction in this block that is not a PHINode or a debug intrinsic,...
LLVM_ABI bool hasNPredecessors(unsigned N) const
Return true if this block has exactly N predecessors.
LLVM_ABI const BasicBlock * getUniqueSuccessor() const
Return the successor of this block if it has a unique successor.
LLVM_ABI const BasicBlock * getSinglePredecessor() const
Return the predecessor of this block if it has a single predecessor block.
const Instruction & front() const
LLVM_ABI const CallInst * getTerminatingDeoptimizeCall() const
Returns the call instruction calling @llvm.experimental.deoptimize prior to the terminating return in...
LLVM_ABI const BasicBlock * getUniquePredecessor() const
Return the predecessor of this block if it has a unique predecessor block.
LLVM_ABI const BasicBlock * getSingleSuccessor() const
Return the successor of this block if it has a single successor.
LLVM_ABI void flushTerminatorDbgRecords()
Eject any debug-info trailing at the end of a block.
LLVM_ABI const DataLayout & getDataLayout() const
Get the data layout of the module this basic block belongs to.
InstListType::iterator iterator
Instruction iterators...
LLVM_ABI LLVMContext & getContext() const
Get the context in which this basic block lives.
LLVM_ABI bool isLandingPad() const
Return true if this basic block is a landing pad.
LLVM_ABI bool hasNPredecessorsOrMore(unsigned N) const
Return true if this block has N predecessors or more.
const Instruction * getTerminator() const LLVM_READONLY
Returns the terminator instruction if the block is well formed or null if the block is not well forme...
void splice(BasicBlock::iterator ToIt, BasicBlock *FromBB)
Transfer all instructions from FromBB to this basic block at ToIt.
LLVM_ABI const Module * getModule() const
Return the module owning the function this basic block belongs to, or nullptr if the function does no...
LLVM_ABI void removePredecessor(BasicBlock *Pred, bool KeepOneInputPHIs=false)
Update PHI nodes in this BasicBlock before removal of predecessor Pred.
BasicBlock * getBasicBlock() const
Conditional or Unconditional Branch instruction.
iterator_range< succ_op_iterator > successors()
void setCondition(Value *V)
static BranchInst * Create(BasicBlock *IfTrue, InsertPosition InsertBefore=nullptr)
bool isConditional() const
unsigned getNumSuccessors() const
BasicBlock * getSuccessor(unsigned i) const
bool isUnconditional() const
void setSuccessor(unsigned idx, BasicBlock *NewSucc)
Value * getCondition() const
static LLVM_ABI BranchProbability getBranchProbability(uint64_t Numerator, uint64_t Denominator)
BranchProbability getCompl() const
void addRangeRetAttr(const ConstantRange &CR)
adds the range attribute to the list of attributes.
bool isCallee(Value::const_user_iterator UI) const
Determine whether the passed iterator points to the callee operand's Use.
bool isDataOperand(const Use *U) const
bool tryIntersectAttributes(const CallBase *Other)
Try to intersect the attributes from 'this' CallBase and the 'Other' CallBase.
This class represents a function call, abstracting a target machine's calling convention.
mapped_iterator< op_iterator, DerefFnTy > handler_iterator
CleanupPadInst * getCleanupPad() const
Convenience accessor.
BasicBlock * getUnwindDest() const
This class is the base class for the comparison instructions.
static Type * makeCmpResultType(Type *opnd_type)
Create a result type for fcmp/icmp.
Predicate
This enumeration lists the possible predicates for CmpInst subclasses.
@ ICMP_UGT
unsigned greater than
@ ICMP_ULT
unsigned less than
Predicate getPredicate() const
Return the predicate for this instruction.
void setCondition(Value *V)
Value * getCondition() const
BasicBlock * getSuccessor(unsigned i) const
static LLVM_ABI Constant * get(ArrayType *T, ArrayRef< Constant * > V)
A vector constant whose element type is a simple 1/2/4/8-byte integer or float/double,...
A constant value that is initialized with an expression using other constant values.
static LLVM_ABI Constant * getNeg(Constant *C, bool HasNSW=false)
ConstantFP - Floating Point Values [float, double].
This is the shared class of boolean and integer constants.
bool isOne() const
This is just a convenience method to make client code smaller for a common case.
uint64_t getLimitedValue(uint64_t Limit=~0ULL) const
getLimitedValue - If the value is smaller than the specified limit, return it, otherwise return the l...
IntegerType * getIntegerType() const
Variant of the getType() method to always return an IntegerType, which reduces the amount of casting ...
static LLVM_ABI ConstantInt * getTrue(LLVMContext &Context)
static ConstantInt * getSigned(IntegerType *Ty, int64_t V, bool ImplicitTrunc=false)
Return a ConstantInt with the specified value for the specified type.
bool isZero() const
This is just a convenience method to make client code smaller for a common code.
static LLVM_ABI ConstantInt * getFalse(LLVMContext &Context)
unsigned getBitWidth() const
getBitWidth - Return the scalar bitwidth of this constant.
uint64_t getZExtValue() const
Return the constant as a 64-bit unsigned integer value after it has been zero extended as appropriate...
const APInt & getValue() const
Return the constant as an APInt value reference.
A constant pointer value that points to null.
This class represents a range of values.
LLVM_ABI bool getEquivalentICmp(CmpInst::Predicate &Pred, APInt &RHS) const
Set up Pred and RHS such that ConstantRange::makeExactICmpRegion(Pred, RHS) == *this.
LLVM_ABI ConstantRange subtract(const APInt &CI) const
Subtract the specified constant from the endpoints of this constant range.
const APInt & getLower() const
Return the lower value for this range.
LLVM_ABI APInt getUnsignedMin() const
Return the smallest unsigned value contained in the ConstantRange.
LLVM_ABI bool isEmptySet() const
Return true if this set contains no members.
LLVM_ABI bool isSizeLargerThan(uint64_t MaxSize) const
Compare set size of this range with Value.
const APInt & getUpper() const
Return the upper value for this range.
LLVM_ABI bool isUpperWrapped() const
Return true if the exclusive upper bound wraps around the unsigned domain.
static LLVM_ABI ConstantRange makeExactICmpRegion(CmpInst::Predicate Pred, const APInt &Other)
Produce the exact range such that all values in the returned range satisfy the given predicate with a...
LLVM_ABI ConstantRange inverse() const
Return a new range that is the logical not of the current set.
LLVM_ABI APInt getUnsignedMax() const
Return the largest unsigned value contained in the ConstantRange.
static ConstantRange getNonEmpty(APInt Lower, APInt Upper)
Create non-empty constant range with the given bounds.
This is an important base class in LLVM.
static LLVM_ABI Constant * getIntegerValue(Type *Ty, const APInt &V)
Return the value for an integer or pointer constant, or a vector thereof, with the given scalar value...
LLVM_ABI bool isOneValue() const
Returns true if the value is one.
static LLVM_ABI Constant * getNullValue(Type *Ty)
Constructor to create a '0' constant of arbitrary type.
LLVM_ABI bool isNullValue() const
Return true if this is the value that would be returned by getNullValue.
A parsed version of the target data layout string in and methods for querying it.
Base class for non-instruction debug metadata records that have positions within IR.
LLVM_ABI void removeFromParent()
simple_ilist< DbgRecord >::iterator self_iterator
Record of a variable value-assignment, aka a non instruction representation of the dbg....
bool isSameSourceLocation(const DebugLoc &Other) const
Return true if the source locations match, ignoring isImplicitCode and source atom info.
static DebugLoc getTemporary()
static LLVM_ABI DebugLoc getMergedLocation(DebugLoc LocA, DebugLoc LocB)
When two instructions are combined into a single instruction we also need to combine the original loc...
static LLVM_ABI DebugLoc getMergedLocations(ArrayRef< DebugLoc > Locs)
Try to combine the vector of locations passed as input in a single one.
static DebugLoc getDropped()
ValueT & at(const_arg_type_t< KeyT > Val)
at - Return the entry for the specified key, or abort if no such entry exists.
iterator find(const_arg_type_t< KeyT > Val)
std::pair< iterator, bool > try_emplace(KeyT &&Key, Ts &&...Args)
std::pair< iterator, bool > insert(const std::pair< KeyT, ValueT > &KV)
void reserve(size_type NumEntries)
Grow the densemap so that it can contain at least NumEntries items before resizing again.
static constexpr UpdateKind Delete
static constexpr UpdateKind Insert
static LLVM_ABI FixedVectorType * get(Type *ElementType, unsigned NumElts)
const BasicBlock & getEntryBlock() const
Attribute getFnAttribute(Attribute::AttrKind Kind) const
Return the attribute for the given attribute kind.
bool hasMinSize() const
Optimize this function for minimum size (-Oz).
bool hasFnAttribute(Attribute::AttrKind Kind) const
Return true if the function has the attribute.
void applyUpdates(ArrayRef< UpdateT > Updates)
Submit updates to all available trees.
an instruction for type-safe pointer arithmetic to access elements of arrays and structs
Module * getParent()
Get the module that this global value is contained inside of...
This instruction compares its operands according to the predicate given to the constructor.
Predicate getSignedPredicate() const
For example, EQ->EQ, SLE->SLE, UGT->SGT, etc.
static bool isEquality(Predicate P)
Return true if this predicate is either EQ or NE.
Common base class shared among various IRBuilders.
Value * CreateICmpULT(Value *LHS, Value *RHS, const Twine &Name="")
Value * CreateZExtOrTrunc(Value *V, Type *DestTy, const Twine &Name="")
Create a ZExt or Trunc from the integer value V to DestTy.
LLVM_ABI Value * CreateSelectFMF(Value *C, Value *True, Value *False, FMFSource FMFSource, const Twine &Name="", Instruction *MDFrom=nullptr)
LLVM_ABI CallInst * CreateAssumption(Value *Cond, ArrayRef< OperandBundleDef > OpBundles={})
Create an assume intrinsic call that allows the optimizer to assume that the provided condition will ...
ConstantInt * getTrue()
Get the constant value for i1 true.
LLVM_ABI Value * CreateSelect(Value *C, Value *True, Value *False, const Twine &Name="", Instruction *MDFrom=nullptr)
BasicBlock::iterator GetInsertPoint() const
Value * CreateFreeze(Value *V, const Twine &Name="")
Value * CreateLShr(Value *LHS, Value *RHS, const Twine &Name="", bool isExact=false)
void SetCurrentDebugLocation(DebugLoc L)
Set location information used by debugging information.
Value * CreateInBoundsGEP(Type *Ty, Value *Ptr, ArrayRef< Value * > IdxList, const Twine &Name="")
Value * CreateNot(Value *V, const Twine &Name="")
SwitchInst * CreateSwitch(Value *V, BasicBlock *Dest, unsigned NumCases=10, MDNode *BranchWeights=nullptr, MDNode *Unpredictable=nullptr)
Create a switch instruction with the specified value, default dest, and with a hint for the number of...
Value * CreateICmpEQ(Value *LHS, Value *RHS, const Twine &Name="")
BranchInst * CreateCondBr(Value *Cond, BasicBlock *True, BasicBlock *False, MDNode *BranchWeights=nullptr, MDNode *Unpredictable=nullptr)
Create a conditional 'br Cond, TrueDest, FalseDest' instruction.
LoadInst * CreateLoad(Type *Ty, Value *Ptr, const char *Name)
Provided to resolve 'CreateLoad(Ty, Ptr, "...")' correctly, instead of converting the string to 'bool...
StoreInst * CreateStore(Value *Val, Value *Ptr, bool isVolatile=false)
Value * CreateAdd(Value *LHS, Value *RHS, const Twine &Name="", bool HasNUW=false, bool HasNSW=false)
Value * CreatePtrToInt(Value *V, Type *DestTy, const Twine &Name="")
ConstantInt * getFalse()
Get the constant value for i1 false.
Value * CreateTrunc(Value *V, Type *DestTy, const Twine &Name="", bool IsNUW=false, bool IsNSW=false)
BranchInst * CreateBr(BasicBlock *Dest)
Create an unconditional 'br label X' instruction.
Value * CreateIntCast(Value *V, Type *DestTy, bool isSigned, const Twine &Name="")
void SetInsertPoint(BasicBlock *TheBB)
This specifies that created instructions should be appended to the end of the specified block.
Value * CreateICmp(CmpInst::Predicate P, Value *LHS, Value *RHS, const Twine &Name="")
Value * CreateOr(Value *LHS, Value *RHS, const Twine &Name="", bool IsDisjoint=false)
Value * CreateMul(Value *LHS, Value *RHS, const Twine &Name="", bool HasNUW=false, bool HasNSW=false)
This provides a uniform API for creating instructions and inserting them into a basic block: either a...
Indirect Branch Instruction.
BasicBlock * getDestination(unsigned i)
Return the specified destination.
unsigned getNumDestinations() const
return the number of possible destinations in this indirectbr instruction.
LLVM_ABI void removeDestination(unsigned i)
This method removes the specified successor from the indirectbr instruction.
LLVM_ABI void dropUBImplyingAttrsAndMetadata(ArrayRef< unsigned > Keep={})
Drop any attributes or metadata that can cause immediate undefined behavior.
LLVM_ABI Instruction * clone() const
Create a copy of 'this' instruction that is identical in all ways except the following:
LLVM_ABI iterator_range< simple_ilist< DbgRecord >::iterator > cloneDebugInfoFrom(const Instruction *From, std::optional< simple_ilist< DbgRecord >::iterator > FromHere=std::nullopt, bool InsertAtHead=false)
Clone any debug-info attached to From onto this instruction.
LLVM_ABI unsigned getNumSuccessors() const LLVM_READONLY
Return the number of successors that this instruction has.
iterator_range< simple_ilist< DbgRecord >::iterator > getDbgRecordRange() const
Return a range over the DbgRecords attached to this instruction.
const DebugLoc & getDebugLoc() const
Return the debug location for this node as a DebugLoc.
LLVM_ABI const Module * getModule() const
Return the module owning the function this instruction belongs to or nullptr it the function does not...
LLVM_ABI void andIRFlags(const Value *V)
Logical 'and' of any supported wrapping, exact, and fast-math flags of V and this instruction.
LLVM_ABI void moveBefore(InstListType::iterator InsertPos)
Unlink this instruction from its current basic block and insert it into the basic block that MovePos ...
LLVM_ABI InstListType::iterator eraseFromParent()
This method unlinks 'this' from the containing basic block and deletes it.
Instruction * user_back()
Specialize the methods defined in Value, as we know that an instruction can only be used by other ins...
LLVM_ABI const Function * getFunction() const
Return the function this instruction belongs to.
MDNode * getMetadata(unsigned KindID) const
Get the metadata of given kind attached to this Instruction.
LLVM_ABI BasicBlock * getSuccessor(unsigned Idx) const LLVM_READONLY
Return the specified successor. This instruction must be a terminator.
LLVM_ABI bool mayHaveSideEffects() const LLVM_READONLY
Return true if the instruction may have side effects.
bool isTerminator() const
LLVM_ABI bool isUsedOutsideOfBlock(const BasicBlock *BB) const LLVM_READONLY
Return true if there are any uses of this instruction in blocks other than the specified block.
LLVM_ABI void setMetadata(unsigned KindID, MDNode *Node)
Set the metadata of the specified kind to the specified node.
@ CompareUsingIntersectedAttrs
Check for equivalence with intersected callbase attrs.
LLVM_ABI AAMDNodes getAAMetadata() const
Returns the AA metadata for this instruction.
LLVM_ABI bool isIdenticalTo(const Instruction *I) const LLVM_READONLY
Return true if the specified instruction is exactly identical to the current one.
void setDebugLoc(DebugLoc Loc)
Set the debug location information for this instruction.
LLVM_ABI void copyMetadata(const Instruction &SrcInst, ArrayRef< unsigned > WL=ArrayRef< unsigned >())
Copy metadata from SrcInst to this instruction.
LLVM_ABI void applyMergedLocation(DebugLoc LocA, DebugLoc LocB)
Merge 2 debug locations and apply it to the Instruction.
LLVM_ABI void dropDbgRecords()
Erase any DbgRecords attached to this instruction.
LLVM_ABI InstListType::iterator insertInto(BasicBlock *ParentBB, InstListType::iterator It)
Inserts an unlinked instruction into ParentBB at position It and returns the iterator of the inserted...
Class to represent integer types.
unsigned getBitWidth() const
Get the number of bits in this IntegerType.
void setNormalDest(BasicBlock *B)
This is an important class for using LLVM in a threaded context.
The landingpad instruction holds all of the information necessary to generate correct exception handl...
An instruction for reading from memory.
static unsigned getPointerOperandIndex()
Iterates through instructions in a set of blocks in reverse order from the first non-terminator.
LLVM_ABI MDNode * createBranchWeights(uint32_t TrueWeight, uint32_t FalseWeight, bool IsExpected=false)
Return metadata containing two branch weights.
std::pair< iterator, bool > insert(const std::pair< KeyT, ValueT > &KV)
A Module instance is used to store all the information related to an LLVM module.
void addIncoming(Value *V, BasicBlock *BB)
Add an incoming value to the end of the PHI list.
iterator_range< const_block_iterator > blocks() const
op_range incoming_values()
void setIncomingValue(unsigned i, Value *V)
Value * getIncomingValueForBlock(const BasicBlock *BB) const
BasicBlock * getIncomingBlock(unsigned i) const
Return incoming basic block number i.
Value * getIncomingValue(unsigned i) const
Return incoming value number x.
int getBasicBlockIndex(const BasicBlock *BB) const
Return the first index of the specified basic block in the value list for this PHI.
unsigned getNumIncomingValues() const
Return the number of incoming edges.
static PHINode * Create(Type *Ty, unsigned NumReservedValues, const Twine &NameStr="", InsertPosition InsertBefore=nullptr)
Constructors - NumReservedValues is a hint for the number of incoming edges that this phi node will h...
static LLVM_ABI PoisonValue * get(Type *T)
Static factory methods - Return an 'poison' object of the specified type.
Value * getValue() const
Convenience accessor.
Return a value (possibly void), from a function.
This class represents the LLVM 'select' instruction.
size_type size() const
Determine the number of elements in the SetVector.
bool empty() const
Determine if the SetVector is empty or not.
bool insert(const value_type &X)
Insert a new element into the SetVector.
A templated base class for SmallPtrSet which provides the typesafe interface that is common across al...
bool erase(PtrType Ptr)
Remove pointer from the set.
size_type count(ConstPtrType Ptr) const
count - Return 1 if the specified pointer is in the set, 0 otherwise.
void insert_range(Range &&R)
std::pair< iterator, bool > insert(PtrType Ptr)
Inserts Ptr if and only if there is no element in the container equal to Ptr.
bool contains(ConstPtrType Ptr) const
SmallPtrSet - This class implements a set which is optimized for holding SmallSize or less elements.
A SetVector that performs no allocations if smaller than a certain size.
SmallSet - This maintains a set of unique values, optimizing for the case when the set is small (less...
std::pair< const_iterator, bool > insert(const T &V)
insert - Insert an element into the set if it isn't already there.
This class consists of common code factored out of the SmallVector class to reduce code duplication b...
void assign(size_type NumElts, ValueParamT Elt)
reference emplace_back(ArgTypes &&... Args)
void reserve(size_type N)
iterator erase(const_iterator CI)
void push_back(const T &Elt)
This is a 'vector' (really, a variable-sized array), optimized for the case when the array is small.
An instruction for storing to memory.
Value * getValueOperand()
static unsigned getPointerOperandIndex()
Value * getPointerOperand()
StringRef - Represent a constant reference to a string, i.e.
A wrapper class to simplify modification of SwitchInst cases along with their prof branch_weights met...
LLVM_ABI void setSuccessorWeight(unsigned idx, CaseWeightOpt W)
LLVM_ABI void addCase(ConstantInt *OnVal, BasicBlock *Dest, CaseWeightOpt W)
Delegate the call to the underlying SwitchInst::addCase() and set the specified branch weight for the...
LLVM_ABI CaseWeightOpt getSuccessorWeight(unsigned idx)
LLVM_ABI void replaceDefaultDest(SwitchInst::CaseIt I)
Replace the default destination by given case.
std::optional< uint32_t > CaseWeightOpt
LLVM_ABI SwitchInst::CaseIt removeCase(SwitchInst::CaseIt I)
Delegate the call to the underlying SwitchInst::removeCase() and remove correspondent branch weight.
CaseIt case_end()
Returns a read/write iterator that points one past the last in the SwitchInst.
BasicBlock * getSuccessor(unsigned idx) const
void setCondition(Value *V)
LLVM_ABI void addCase(ConstantInt *OnVal, BasicBlock *Dest)
Add an entry to the switch instruction.
CaseIteratorImpl< CaseHandle > CaseIt
void setSuccessor(unsigned idx, BasicBlock *NewSucc)
unsigned getNumSuccessors() const
Twine - A lightweight data structure for efficiently representing the concatenation of temporary valu...
The instances of the Type class are immutable: once they are created, they are never changed.
bool isPointerTy() const
True if this is an instance of PointerType.
LLVM_ABI TypeSize getPrimitiveSizeInBits() const LLVM_READONLY
Return the basic size of this type if it is a primitive type.
static LLVM_ABI IntegerType * getInt1Ty(LLVMContext &C)
bool isIntegerTy() const
True if this is an instance of IntegerType.
BasicBlock * getSuccessor(unsigned i=0) const
'undef' values are things that do not have specified contents.
This function has undefined behavior.
A Use represents the edge between a Value definition and its users.
LLVM_ABI unsigned getOperandNo() const
Return the operand # of this use in its User.
LLVM_ABI void set(Value *Val)
User * getUser() const
Returns the User that contains this Use.
const Use & getOperandUse(unsigned i) const
void setOperand(unsigned i, Value *Val)
LLVM_ABI bool replaceUsesOfWith(Value *From, Value *To)
Replace uses of one Value with another.
Value * getOperand(unsigned i) const
unsigned getNumOperands() const
LLVM Value Representation.
Type * getType() const
All values are typed, get the type of this value.
static constexpr uint64_t MaximumAlignment
LLVM_ABI Value(Type *Ty, unsigned scid)
LLVM_ABI void setName(const Twine &Name)
Change the name of the value.
bool hasOneUse() const
Return true if there is exactly one use of this value.
LLVM_ABI void replaceAllUsesWith(Value *V)
Change all uses of this to point to a new Value.
LLVMContext & getContext() const
All values hold a context through their type.
iterator_range< user_iterator > users()
iterator_range< use_iterator > uses()
LLVM_ABI StringRef getName() const
Return a constant reference to the value's name.
LLVM_ABI void takeName(Value *V)
Transfer the name from V to this value.
Represents an op.with.overflow intrinsic.
std::pair< iterator, bool > insert(const ValueT &V)
void reserve(size_t Size)
Grow the DenseSet so that it can contain at least NumEntries items before resizing again.
const ParentTy * getParent() const
self_iterator getIterator()
NodeTy * getNextNode()
Get the next node, or nullptr for the list tail.
A range adaptor for a pair of iterators.
#define llvm_unreachable(msg)
Marks that the current location is not supposed to be reachable.
constexpr std::underlying_type_t< E > Mask()
Get a bitmask with 1s in all places up to the high-order bit of E's largest value.
@ C
The default llvm calling convention, compatible with C.
@ BasicBlock
Various leaf nodes.
BinaryOp_match< SrcTy, SpecificConstantMatch, TargetOpcode::G_XOR, true > m_Not(const SrcTy &&Src)
Matches a register not-ed by a G_XOR.
OneUse_match< SubPat > m_OneUse(const SubPat &SP)
Predicate
Predicate - These are "(BI << 5) | BO" for various predicates.
BinaryOp_match< LHS, RHS, Instruction::And > m_And(const LHS &L, const RHS &R)
BinaryOp_match< LHS, RHS, Instruction::Add > m_Add(const LHS &L, const RHS &R)
class_match< BinaryOperator > m_BinOp()
Match an arbitrary binary operation and ignore it.
ap_match< APInt > m_APInt(const APInt *&Res)
Match a ConstantInt or splatted ConstantVector, binding the specified pointer to the contained APInt.
bool match(Val *V, const Pattern &P)
bind_ty< Instruction > m_Instruction(Instruction *&I)
Match an instruction, capturing it if we match.
specificval_ty m_Specific(const Value *V)
Match if we have a specific specified value.
class_match< ConstantInt > m_ConstantInt()
Match an arbitrary ConstantInt and ignore it.
ExtractValue_match< Ind, Val_t > m_ExtractValue(const Val_t &V)
Match a single index ExtractValue instruction.
cst_pred_ty< is_any_apint > m_AnyIntegralConstant()
Match an integer or vector with any integral constant.
bind_ty< WithOverflowInst > m_WithOverflowInst(WithOverflowInst *&I)
Match a with overflow intrinsic, capturing it if we match.
auto m_LogicalOr()
Matches L || R where L and R are arbitrary values.
ThreeOps_match< decltype(m_Value()), LHS, RHS, Instruction::Select, true > m_c_Select(const LHS &L, const RHS &R)
Match Select(C, LHS, RHS) or Select(C, RHS, LHS)
match_immconstant_ty m_ImmConstant()
Match an arbitrary immediate Constant and ignore it.
NoWrapTrunc_match< OpTy, TruncInst::NoUnsignedWrap > m_NUWTrunc(const OpTy &Op)
Matches trunc nuw.
class_match< Value > m_Value()
Match an arbitrary value and ignore it.
CmpClass_match< LHS, RHS, ICmpInst > m_ICmp(CmpPredicate &Pred, const LHS &L, const RHS &R)
auto m_LogicalAnd()
Matches L && R where L and R are arbitrary values.
BinaryOp_match< LHS, RHS, Instruction::Or > m_Or(const LHS &L, const RHS &R)
MaxMin_match< ICmpInst, LHS, RHS, umin_pred_ty > m_UMin(const LHS &L, const RHS &R)
match_combine_or< LTy, RTy > m_CombineOr(const LTy &L, const RTy &R)
Combine two pattern matchers matching L || R.
SmallVector< DbgVariableRecord * > getDVRAssignmentMarkers(const Instruction *Inst)
Return a range of dbg_assign records for which Inst performs the assignment they encode.
LLVM_ABI void deleteAssignmentMarkers(const Instruction *Inst)
Delete the llvm.dbg.assign intrinsics linked to Inst.
initializer< Ty > init(const Ty &Val)
PointerTypeMap run(const Module &M)
Compute the PointerTypeMap for the module M.
@ User
could "use" a pointer
NodeAddr< PhiNode * > Phi
NodeAddr< UseNode * > Use
NodeAddr< FuncNode * > Func
Context & getContext() const
friend class Instruction
Iterator for Instructions in a `BasicBlock.
This is an optimization pass for GlobalISel generic memory operations.
auto drop_begin(T &&RangeOrContainer, size_t N=1)
Return a range covering RangeOrContainer with the first N elements excluded.
detail::zippy< detail::zip_shortest, T, U, Args... > zip(T &&t, U &&u, Args &&...args)
zip iterator for two or more iteratable types.
bool operator<(int64_t V1, const APSInt &V2)
constexpr auto not_equal_to(T &&Arg)
Functor variant of std::not_equal_to that can be used as a UnaryPredicate in functional algorithms li...
FunctionAddr VTableAddr Value
auto find(R &&Range, const T &Val)
Provide wrappers to std::find which take ranges instead of having to pass begin/end explicitly.
cl::opt< bool > ProfcheckDisableMetadataFixes
bool all_of(R &&range, UnaryPredicate P)
Provide wrappers to std::all_of which take ranges instead of having to pass begin/end explicitly.
LLVM_ABI bool RecursivelyDeleteTriviallyDeadInstructions(Value *V, const TargetLibraryInfo *TLI=nullptr, MemorySSAUpdater *MSSAU=nullptr, std::function< void(Value *)> AboutToDeleteCallback=std::function< void(Value *)>())
If the specified value is a trivially dead instruction, delete it.
bool succ_empty(const Instruction *I)
LLVM_ABI bool IsBlockFollowedByDeoptOrUnreachable(const BasicBlock *BB)
Check if we can prove that all paths starting from this block converge to a block that either has a @...
LLVM_ABI bool ConstantFoldTerminator(BasicBlock *BB, bool DeleteDeadConditions=false, const TargetLibraryInfo *TLI=nullptr, DomTreeUpdater *DTU=nullptr)
If a terminator instruction is predicated on a constant value, convert it into an unconditional branc...
static cl::opt< unsigned > MaxSwitchCasesPerResult("max-switch-cases-per-result", cl::Hidden, cl::init(16), cl::desc("Limit cases to analyze when converting a switch to select"))
LLVM_ABI BranchInst * GetIfCondition(BasicBlock *BB, BasicBlock *&IfTrue, BasicBlock *&IfFalse)
Check whether BB is the merge point of a if-region.
static cl::opt< bool > SpeculateOneExpensiveInst("speculate-one-expensive-inst", cl::Hidden, cl::init(true), cl::desc("Allow exactly one expensive instruction to be speculatively " "executed"))
auto pred_end(const MachineBasicBlock *BB)
void set_intersect(S1Ty &S1, const S2Ty &S2)
set_intersect(A, B) - Compute A := A ^ B Identical to set_intersection, except that it works on set<>...
LLVM_ABI void setExplicitlyUnknownBranchWeightsIfProfiled(Instruction &I, StringRef PassName, const Function *F=nullptr)
Like setExplicitlyUnknownBranchWeights(...), but only sets unknown branch weights in the new instruct...
decltype(auto) dyn_cast(const From &Val)
dyn_cast<X> - Return the argument parameter cast to the specified type.
auto successors(const MachineBasicBlock *BB)
auto accumulate(R &&Range, E &&Init)
Wrapper for std::accumulate.
constexpr from_range_t from_range
iterator_range< T > make_range(T x, T y)
Convenience function for iterating over sub-ranges.
LLVM_ABI MDNode * getBranchWeightMDNode(const Instruction &I)
Get the branch weights metadata node.
constexpr bool isUIntN(unsigned N, uint64_t x)
Checks if an unsigned integer fits into the given (dynamic) bit width.
LLVM_ABI Constant * ConstantFoldCompareInstOperands(unsigned Predicate, Constant *LHS, Constant *RHS, const DataLayout &DL, const TargetLibraryInfo *TLI=nullptr, const Instruction *I=nullptr)
Attempt to constant fold a compare instruction (icmp/fcmp) with the specified operands.
iterator_range< early_inc_iterator_impl< detail::IterOfRange< RangeT > > > make_early_inc_range(RangeT &&Range)
Make a range that does early increment to allow mutation of the underlying range without disrupting i...
Align getLoadStoreAlignment(const Value *I)
A helper function that returns the alignment of load or store instruction.
LLVM_ABI void DeleteDeadBlock(BasicBlock *BB, DomTreeUpdater *DTU=nullptr, bool KeepOneInputPHIs=false)
Delete the specified block, which must have no predecessors.
LLVM_ABI bool isSafeToSpeculativelyExecute(const Instruction *I, const Instruction *CtxI=nullptr, AssumptionCache *AC=nullptr, const DominatorTree *DT=nullptr, const TargetLibraryInfo *TLI=nullptr, bool UseVariableInfo=true, bool IgnoreUBImplyingAttrs=true)
Return true if the instruction does not have any effects besides calculating the result and does not ...
auto unique(Range &&R, Predicate P)
static cl::opt< unsigned > MaxSpeculationDepth("max-speculation-depth", cl::Hidden, cl::init(10), cl::desc("Limit maximum recursion depth when calculating costs of " "speculatively executed instructions"))
OutputIt copy_if(R &&Range, OutputIt Out, UnaryPredicate P)
Provide wrappers to std::copy_if which take ranges instead of having to pass begin/end explicitly.
static cl::opt< unsigned > PHINodeFoldingThreshold("phi-node-folding-threshold", cl::Hidden, cl::init(2), cl::desc("Control the amount of phi node folding to perform (default = 2)"))
bool operator==(const AddressRangeValuePair &LHS, const AddressRangeValuePair &RHS)
static cl::opt< bool > MergeCondStoresAggressively("simplifycfg-merge-cond-stores-aggressively", cl::Hidden, cl::init(false), cl::desc("When merging conditional stores, do so even if the resultant " "basic blocks are unlikely to be if-converted as a result"))
constexpr int popcount(T Value) noexcept
Count the number of set bits in a value.
LLVM_ABI ConstantRange getConstantRangeFromMetadata(const MDNode &RangeMD)
Parse out a conservative ConstantRange from !range metadata.
auto map_range(ContainerTy &&C, FuncTy F)
Return a range that applies F to the elements of C.
static cl::opt< unsigned > BranchFoldThreshold("simplifycfg-branch-fold-threshold", cl::Hidden, cl::init(2), cl::desc("Maximum cost of combining conditions when " "folding branches"))
LLVM_ABI ConstantRange computeConstantRange(const Value *V, bool ForSigned, bool UseInstrInfo=true, AssumptionCache *AC=nullptr, const Instruction *CtxI=nullptr, const DominatorTree *DT=nullptr, unsigned Depth=0)
Determine the possible constant range of an integer or vector of integer value.
int countr_zero(T Val)
Count number of 0's from the least significant bit to the most stopping at the first 1.
LLVM_ABI Value * simplifyInstruction(Instruction *I, const SimplifyQuery &Q)
See if we can compute a simplified version of this instruction.
LLVM_ABI void setBranchWeights(Instruction &I, ArrayRef< uint32_t > Weights, bool IsExpected, bool ElideAllZero=false)
Create a new branch_weights metadata node and add or overwrite a prof metadata reference to instructi...
static cl::opt< bool > SinkCommon("simplifycfg-sink-common", cl::Hidden, cl::init(true), cl::desc("Sink common instructions down to the end block"))
void erase(Container &C, ValueType V)
Wrapper function to remove a value from a container:
constexpr bool has_single_bit(T Value) noexcept
static cl::opt< bool > HoistStoresWithCondFaulting("simplifycfg-hoist-stores-with-cond-faulting", cl::Hidden, cl::init(true), cl::desc("Hoist stores if the target supports conditional faulting"))
bool any_of(R &&range, UnaryPredicate P)
Provide wrappers to std::any_of which take ranges instead of having to pass begin/end explicitly.
constexpr detail::StaticCastFunc< To > StaticCastTo
Function objects corresponding to the Cast types defined above.
unsigned Log2_32(uint32_t Value)
Return the floor log base 2 of the specified value, -1 if the value is zero.
LLVM_ABI bool TryToSimplifyUncondBranchFromEmptyBlock(BasicBlock *BB, DomTreeUpdater *DTU=nullptr)
BB is known to contain an unconditional branch, and contains no instructions other than PHI nodes,...
void RemapDbgRecordRange(Module *M, iterator_range< DbgRecordIterator > Range, ValueToValueMapTy &VM, RemapFlags Flags=RF_None, ValueMapTypeRemapper *TypeMapper=nullptr, ValueMaterializer *Materializer=nullptr, const MetadataPredicate *IdentityMD=nullptr)
Remap the Values used in the DbgRecords Range using the value map VM.
auto reverse(ContainerTy &&C)
constexpr bool isPowerOf2_32(uint32_t Value)
Return true if the argument is a power of two > 0.
LLVM_ABI void InvertBranch(BranchInst *PBI, IRBuilderBase &Builder)
LLVM_ABI bool impliesPoison(const Value *ValAssumedPoison, const Value *V)
Return true if V is poison given that ValAssumedPoison is already poison.
void sort(IteratorTy Start, IteratorTy End)
static cl::opt< bool > EnableMergeCompatibleInvokes("simplifycfg-merge-compatible-invokes", cl::Hidden, cl::init(true), cl::desc("Allow SimplifyCFG to merge invokes together when appropriate"))
@ RF_IgnoreMissingLocals
If this flag is set, the remapper ignores missing function-local entries (Argument,...
@ RF_NoModuleLevelChanges
If this flag is set, the remapper knows that only local values within a function (such as an instruct...
LLVM_ABI void computeKnownBits(const Value *V, KnownBits &Known, const DataLayout &DL, AssumptionCache *AC=nullptr, const Instruction *CxtI=nullptr, const DominatorTree *DT=nullptr, bool UseInstrInfo=true, unsigned Depth=0)
Determine which bits of V are known to be either zero or one and return them in the KnownZero/KnownOn...
LLVM_ABI bool NullPointerIsDefined(const Function *F, unsigned AS=0)
Check whether null pointer dereferencing is considered undefined behavior for a given function or an ...
LLVM_ABI raw_ostream & dbgs()
dbgs() - This returns a reference to a raw_ostream for debugging messages.
bool none_of(R &&Range, UnaryPredicate P)
Provide wrappers to std::none_of which take ranges instead of having to pass begin/end explicitly.
auto make_first_range(ContainerTy &&c)
Given a container of pairs, return a range over the first elements.
LLVM_ABI bool collectPossibleValues(const Value *V, SmallPtrSetImpl< const Constant * > &Constants, unsigned MaxCount, bool AllowUndefOrPoison=true)
Enumerates all possible immediate values of V and inserts them into the set Constants.
LLVM_ABI Instruction * removeUnwindEdge(BasicBlock *BB, DomTreeUpdater *DTU=nullptr)
Replace 'BB's terminator with one that does not have an unwind successor block.
FunctionAddr VTableAddr Count
auto succ_size(const MachineBasicBlock *BB)
class LLVM_GSL_OWNER SmallVector
Forward declaration of SmallVector so that calculateSmallVectorDefaultInlinedElements can reference s...
bool isa(const From &Val)
isa<X> - Return true if the parameter to the template is an instance of one of the template type argu...
static cl::opt< unsigned > MaxJumpThreadingLiveBlocks("max-jump-threading-live-blocks", cl::Hidden, cl::init(24), cl::desc("Limit number of blocks a define in a threaded block is allowed " "to be live in"))
RNSuccIterator< NodeRef, BlockT, RegionT > succ_begin(NodeRef Node)
LLVM_ABI void combineMetadataForCSE(Instruction *K, const Instruction *J, bool DoesKMove)
Combine the metadata of two instructions so that K can replace J.
iterator_range(Container &&) -> iterator_range< llvm::detail::IterOfRange< Container > >
auto drop_end(T &&RangeOrContainer, size_t N=1)
Return a range covering RangeOrContainer with the last N elements excluded.
static cl::opt< int > MaxSmallBlockSize("simplifycfg-max-small-block-size", cl::Hidden, cl::init(10), cl::desc("Max size of a block which is still considered " "small enough to thread through"))
LLVM_ABI BasicBlock * SplitBlockPredecessors(BasicBlock *BB, ArrayRef< BasicBlock * > Preds, const char *Suffix, DominatorTree *DT, LoopInfo *LI=nullptr, MemorySSAUpdater *MSSAU=nullptr, bool PreserveLCSSA=false)
This method introduces at least one new basic block into the function and moves some of the predecess...
bool isWidenableBranch(const User *U)
Returns true iff U is a widenable branch (that is, extractWidenableCondition returns widenable condit...
static cl::opt< unsigned > HoistCommonSkipLimit("simplifycfg-hoist-common-skip-limit", cl::Hidden, cl::init(20), cl::desc("Allow reordering across at most this many " "instructions when hoisting"))
IRBuilder(LLVMContext &, FolderTy, InserterTy, MDNode *, ArrayRef< OperandBundleDef >) -> IRBuilder< FolderTy, InserterTy >
LLVM_ABI cl::opt< bool > RequireAndPreserveDomTree
This function is used to do simplification of a CFG.
static cl::opt< bool > MergeCondStores("simplifycfg-merge-cond-stores", cl::Hidden, cl::init(true), cl::desc("Hoist conditional stores even if an unconditional store does not " "precede - hoist multiple conditional stores into a single " "predicated store"))
static cl::opt< unsigned > BranchFoldToCommonDestVectorMultiplier("simplifycfg-branch-fold-common-dest-vector-multiplier", cl::Hidden, cl::init(2), cl::desc("Multiplier to apply to threshold when determining whether or not " "to fold branch to common destination when vector operations are " "present"))
RNSuccIterator< NodeRef, BlockT, RegionT > succ_end(NodeRef Node)
LLVM_ABI bool MergeBlockIntoPredecessor(BasicBlock *BB, DomTreeUpdater *DTU=nullptr, LoopInfo *LI=nullptr, MemorySSAUpdater *MSSAU=nullptr, MemoryDependenceResults *MemDep=nullptr, bool PredecessorWithTwoSuccessors=false, DominatorTree *DT=nullptr)
Attempts to merge a block into its predecessor, if possible.
LLVM_ABI void hoistAllInstructionsInto(BasicBlock *DomBlock, Instruction *InsertPt, BasicBlock *BB)
Hoist all of the instructions in the IfBlock to the dominant block DomBlock, by moving its instructio...
@ Sub
Subtraction of integers.
LLVM_ABI BasicBlock * SplitBlock(BasicBlock *Old, BasicBlock::iterator SplitPt, DominatorTree *DT, LoopInfo *LI=nullptr, MemorySSAUpdater *MSSAU=nullptr, const Twine &BBName="")
Split the specified block at the specified instruction.
auto count(R &&Range, const E &Element)
Wrapper function around std::count to count the number of times an element Element occurs in the give...
void RemapInstruction(Instruction *I, ValueToValueMapTy &VM, RemapFlags Flags=RF_None, ValueMapTypeRemapper *TypeMapper=nullptr, ValueMaterializer *Materializer=nullptr, const MetadataPredicate *IdentityMD=nullptr)
Convert the instruction operands from referencing the current values into those specified by VM.
LLVM_ABI bool canReplaceOperandWithVariable(const Instruction *I, unsigned OpIdx)
Given an instruction, is it legal to set operand OpIdx to a non-constant value?
DWARFExpression::Operation Op
LLVM_ABI bool PointerMayBeCaptured(const Value *V, bool ReturnCaptures, unsigned MaxUsesToExplore=0)
PointerMayBeCaptured - Return true if this pointer value may be captured by the enclosing function (w...
LLVM_ABI bool FoldSingleEntryPHINodes(BasicBlock *BB, MemoryDependenceResults *MemDep=nullptr)
We know that BB has one predecessor.
LLVM_ABI bool isGuaranteedNotToBeUndefOrPoison(const Value *V, AssumptionCache *AC=nullptr, const Instruction *CtxI=nullptr, const DominatorTree *DT=nullptr, unsigned Depth=0)
Return true if this function can prove that V does not have undef bits and is never poison.
void RemapDbgRecord(Module *M, DbgRecord *DR, ValueToValueMapTy &VM, RemapFlags Flags=RF_None, ValueMapTypeRemapper *TypeMapper=nullptr, ValueMaterializer *Materializer=nullptr, const MetadataPredicate *IdentityMD=nullptr)
Remap the Values used in the DbgRecord DR using the value map VM.
ArrayRef(const T &OneElt) -> ArrayRef< T >
constexpr unsigned BitWidth
auto sum_of(R &&Range, E Init=E{0})
Returns the sum of all values in Range with Init initial value.
ValueMap< const Value *, WeakTrackingVH > ValueToValueMapTy
LLVM_ABI bool isDereferenceablePointer(const Value *V, Type *Ty, const DataLayout &DL, const Instruction *CtxI=nullptr, AssumptionCache *AC=nullptr, const DominatorTree *DT=nullptr, const TargetLibraryInfo *TLI=nullptr)
Return true if this is always a dereferenceable pointer.
LLVM_ABI bool isGuaranteedToTransferExecutionToSuccessor(const Instruction *I)
Return true if this function can prove that the instruction I will always transfer execution to one o...
static cl::opt< bool > HoistCondStores("simplifycfg-hoist-cond-stores", cl::Hidden, cl::init(true), cl::desc("Hoist conditional stores if an unconditional store precedes"))
LLVM_ABI bool extractBranchWeights(const MDNode *ProfileData, SmallVectorImpl< uint32_t > &Weights)
Extract branch weights from MD_prof metadata.
LLVM_ABI bool simplifyCFG(BasicBlock *BB, const TargetTransformInfo &TTI, DomTreeUpdater *DTU=nullptr, const SimplifyCFGOptions &Options={}, ArrayRef< WeakVH > LoopHeaders={})
auto pred_begin(const MachineBasicBlock *BB)
decltype(auto) cast(const From &Val)
cast<X> - Return the argument parameter cast to the specified type.
auto find_if(R &&Range, UnaryPredicate P)
Provide wrappers to std::find_if which take ranges instead of having to pass begin/end explicitly.
void erase_if(Container &C, UnaryPredicate P)
Provide a container algorithm similar to C++ Library Fundamentals v2's erase_if which is equivalent t...
constexpr bool isIntN(unsigned N, int64_t x)
Checks if an signed integer fits into the given (dynamic) bit width.
auto predecessors(const MachineBasicBlock *BB)
static cl::opt< unsigned > HoistLoadsStoresWithCondFaultingThreshold("hoist-loads-stores-with-cond-faulting-threshold", cl::Hidden, cl::init(6), cl::desc("Control the maximal conditional load/store that we are willing " "to speculatively execute to eliminate conditional branch " "(default = 6)"))
static cl::opt< bool > HoistCommon("simplifycfg-hoist-common", cl::Hidden, cl::init(true), cl::desc("Hoist common instructions up to the parent block"))
iterator_range< pointer_iterator< WrappedIteratorT > > make_pointer_range(RangeT &&Range)
LLVM_ABI unsigned ComputeMaxSignificantBits(const Value *Op, const DataLayout &DL, AssumptionCache *AC=nullptr, const Instruction *CxtI=nullptr, const DominatorTree *DT=nullptr, unsigned Depth=0)
Get the upper bound on bit size for this Value Op as a signed integer.
bool is_contained(R &&Range, const E &Element)
Returns true if Element is found in Range.
static cl::opt< unsigned > TwoEntryPHINodeFoldingThreshold("two-entry-phi-node-folding-threshold", cl::Hidden, cl::init(4), cl::desc("Control the maximal total instruction cost that we are willing " "to speculatively execute to fold a 2-entry PHI node into a " "select (default = 4)"))
Type * getLoadStoreType(const Value *I)
A helper function that returns the type of a load or store instruction.
PointerUnion< const Value *, const PseudoSourceValue * > ValueType
SmallVector< uint64_t, 2 > getDisjunctionWeights(const SmallVector< T1, 2 > &B1, const SmallVector< T2, 2 > &B2)
Get the branch weights of a branch conditioned on b1 || b2, where b1 and b2 are 2 booleans that are t...
LLVM_ABI bool foldBranchToCommonDest(BranchInst *BI, llvm::DomTreeUpdater *DTU=nullptr, MemorySSAUpdater *MSSAU=nullptr, const TargetTransformInfo *TTI=nullptr, unsigned BonusInstThreshold=1)
If this basic block is ONLY a setcc and a branch, and if a predecessor branches to us and one of our ...
bool pred_empty(const BasicBlock *BB)
LLVM_ABI Instruction * SplitBlockAndInsertIfThen(Value *Cond, BasicBlock::iterator SplitBefore, bool Unreachable, MDNode *BranchWeights=nullptr, DomTreeUpdater *DTU=nullptr, LoopInfo *LI=nullptr, BasicBlock *ThenBlock=nullptr)
Split the containing block at the specified instruction - everything before SplitBefore stays in the ...
LLVM_ABI std::optional< bool > isImpliedByDomCondition(const Value *Cond, const Instruction *ContextI, const DataLayout &DL)
Return the boolean condition value in the context of the given instruction if it is known based on do...
auto seq(T Begin, T End)
Iterate over an integral type from Begin up to - but not including - End.
void array_pod_sort(IteratorTy Start, IteratorTy End)
array_pod_sort - This sorts an array with the specified start and end extent.
LLVM_ABI bool hasBranchWeightMD(const Instruction &I)
Checks if an instructions has Branch Weight Metadata.
hash_code hash_combine(const Ts &...args)
Combine values into a single hash_code.
bool equal(L &&LRange, R &&RRange)
Wrapper function around std::equal to detect if pair-wise elements between two ranges are the same.
static cl::opt< bool > HoistLoadsWithCondFaulting("simplifycfg-hoist-loads-with-cond-faulting", cl::Hidden, cl::init(true), cl::desc("Hoist loads if the target supports conditional faulting"))
LLVM_ABI Constant * ConstantFoldInstOperands(const Instruction *I, ArrayRef< Constant * > Ops, const DataLayout &DL, const TargetLibraryInfo *TLI=nullptr, bool AllowNonDeterministic=true)
ConstantFoldInstOperands - Attempt to constant fold an instruction with the specified operands.
LLVM_ABI void setFittedBranchWeights(Instruction &I, ArrayRef< uint64_t > Weights, bool IsExpected, bool ElideAllZero=false)
Variant of setBranchWeights where the Weights will be fit first to uint32_t by shifting right.
LLVM_ABI const Value * getUnderlyingObject(const Value *V, unsigned MaxLookup=MaxLookupSearchDepth)
This method strips off any GEP address adjustments, pointer casts or llvm.threadlocal....
LLVM_ABI Constant * ConstantFoldIntegerCast(Constant *C, Type *DestTy, bool IsSigned, const DataLayout &DL)
Constant fold a zext, sext or trunc, depending on IsSigned and whether the DestTy is wider or narrowe...
bool capturesNothing(CaptureComponents CC)
static auto filterDbgVars(iterator_range< simple_ilist< DbgRecord >::iterator > R)
Filter the DbgRecord range to DbgVariableRecord types only and downcast.
LLVM_ABI bool EliminateDuplicatePHINodes(BasicBlock *BB)
Check for and eliminate duplicate PHI nodes in this block.
constexpr detail::IsaCheckPredicate< Types... > IsaPred
Function object wrapper for the llvm::isa type check.
LLVM_ABI void RemapSourceAtom(Instruction *I, ValueToValueMapTy &VM)
Remap source location atom.
hash_code hash_combine_range(InputIteratorT first, InputIteratorT last)
Compute a hash_code for a sequence of values.
LLVM_ABI bool isWritableObject(const Value *Object, bool &ExplicitlyDereferenceableOnly)
Return true if the Object is writable, in the sense that any location based on this pointer that can ...
LLVM_ABI void mapAtomInstance(const DebugLoc &DL, ValueToValueMapTy &VMap)
Mark a cloned instruction as a new instance so that its source loc can be updated when remapped.
constexpr uint64_t NextPowerOf2(uint64_t A)
Returns the next power of two (in 64-bits) that is strictly greater than A.
LLVM_ABI void extractFromBranchWeightMD64(const MDNode *ProfileData, SmallVectorImpl< uint64_t > &Weights)
Faster version of extractBranchWeights() that skips checks and must only be called with "branch_weigh...
void swap(llvm::BitVector &LHS, llvm::BitVector &RHS)
Implement std::swap in terms of BitVector swap.
SmallVectorImpl< ConstantInt * > * Cases
SmallVectorImpl< ConstantInt * > * OtherCases
Checking whether two cases of SI are equal depends on the contents of the BasicBlock and the incoming...
DenseMap< PHINode *, SmallDenseMap< BasicBlock *, Value *, 8 > > * PhiPredIVs
LLVM_ABI AAMDNodes merge(const AAMDNodes &Other) const
Given two sets of AAMDNodes applying to potentially different locations, determine the best AAMDNodes...
static const SwitchSuccWrapper * getEmptyKey()
static const SwitchSuccWrapper * getTombstoneKey()
static unsigned getHashValue(const SwitchSuccWrapper *SSW)
static bool isEqual(const SwitchSuccWrapper *LHS, const SwitchSuccWrapper *RHS)
An information struct used to provide DenseMap with the various necessary components for a given valu...
Incoming for lane maks phi as machine instruction, incoming register Reg and incoming block Block are...
unsigned getBitWidth() const
Get the bit width of this value.
unsigned countMaxActiveBits() const
Returns the maximum number of bits needed to represent all possible unsigned values with these known ...
APInt getMaxValue() const
Return the maximal unsigned value possible given these KnownBits.
A MapVector that performs no allocations if smaller than a certain size.