14#ifndef LLVM_ANALYSIS_BLOCKFREQUENCYINFOIMPL_H
15#define LLVM_ANALYSIS_BLOCKFREQUENCYINFOIMPL_H
52#define DEBUG_TYPE "block-freq"
61class BranchProbabilityInfo;
65class MachineBasicBlock;
66class MachineBranchProbabilityInfo;
99 return BlockMass(std::numeric_limits<uint64_t>::max());
104 bool isFull()
const {
return Mass == std::numeric_limits<uint64_t>::max(); }
114 Mass = Sum < Mass ? std::numeric_limits<uint64_t>::max() : Sum;
124 Mass = Diff > Mass ? 0 : Diff;
129 Mass =
P.scale(Mass);
207 return std::numeric_limits<uint32_t>::max() - 1;
238 template <
class It1,
class It2>
243 Nodes.insert(
Nodes.end(), FirstOther, LastOther);
295 return Loop->Parent->Parent;
313 return L ? L->getHeader() :
Node;
320 while (L->Parent && L->Parent->IsPackaged)
335 return Loop->Parent->Mass;
466 std::list<LoopData>::iterator Insert);
521 Scaled64 getFloatingBlockFreq(
const BlockNode &
Node)
const;
524 std::optional<uint64_t>
525 getBlockProfileCount(
const Function &
F,
const BlockNode &
Node,
526 bool AllowSynthetic =
false)
const;
527 std::optional<uint64_t>
529 bool AllowSynthetic =
false)
const;
530 bool isIrrLoopHeader(
const BlockNode &
Node);
540namespace bfi_detail {
566 assert(BB &&
"Unexpected nullptr");
567 auto MachineName =
"BB" +
Twine(BB->getNumber());
568 if (BB->getBasicBlock())
569 return (MachineName +
"[" + BB->getName() +
"]").str();
570 return MachineName.str();
574 assert(BB &&
"Unexpected nullptr");
605 using iterator = std::deque<const IrrNode *>::const_iterator;
626 template <
class BlockEdgesAdder>
628 BlockEdgesAdder addBlockEdges) :
BFI(
BFI) {
632 template <
class BlockEdgesAdder>
633 void initialize(
const BFIBase::LoopData *OuterLoop,
634 BlockEdgesAdder addBlockEdges);
644 template <
class BlockEdgesAdder>
646 BlockEdgesAdder addBlockEdges);
648 const BFIBase::LoopData *OuterLoop);
651template <
class BlockEdgesAdder>
653 BlockEdgesAdder addBlockEdges) {
656 for (
auto N : OuterLoop->
Nodes)
660 for (
uint32_t Index = 0; Index <
BFI.Working.size(); ++Index)
661 addEdges(Index, OuterLoop, addBlockEdges);
666template <
class BlockEdgesAdder>
669 BlockEdgesAdder addBlockEdges) {
674 const auto &Working =
BFI.Working[
Node.Index];
676 if (Working.isAPackage())
677 for (
const auto &
I : Working.Loop->Exits)
680 addBlockEdges(*
this, Irr, OuterLoop);
841 using BranchProbabilityInfoT =
848 const BranchProbabilityInfoT *BPI =
nullptr;
849 const LoopInfoT *LI =
nullptr;
850 const FunctionT *F =
nullptr;
853 std::vector<const BlockT *> RPOT;
856 unsigned BlockNumberEpoch;
858 BlockNode getNode(
const BlockT *BB)
const {
859 assert(BlockNumberEpoch ==
862 return BlockNumber < Nodes.size() ? Nodes[BlockNumber] :
BlockNode();
867 return RPOT[
Node.Index];
873 void initializeRPOT();
882 void initializeLoops();
910 bool tryToComputeMassInFunction();
924 void computeIrreducibleMass(
LoopData *OuterLoop,
925 std::list<LoopData>::iterator Insert);
936 void computeMassInLoops();
944 void computeMassInFunction();
946 std::string getBlockName(
const BlockNode &
Node)
const override {
960 bool needIterativeInference()
const;
963 void applyIterativeInference();
965 using ProbMatrixType = std::vector<std::vector<std::pair<size_t, Scaled64>>>;
968 void iterativeInference(
const ProbMatrixType &ProbMatrix,
969 std::vector<Scaled64> &Freq)
const;
973 void findReachableBlocks(std::vector<const BlockT *> &Blocks)
const;
977 void initTransitionProbabilities(
978 const std::vector<const BlockT *> &Blocks,
980 ProbMatrixType &ProbMatrix)
const;
985 Scaled64 discrepancy(
const ProbMatrixType &ProbMatrix,
986 const std::vector<Scaled64> &Freq)
const;
994 void calculate(
const FunctionT &F,
const BranchProbabilityInfoT &BPI,
995 const LoopInfoT &LI);
1003 std::optional<uint64_t>
1005 bool AllowSynthetic =
false)
const {
1010 std::optional<uint64_t>
1012 bool AllowSynthetic =
false)
const {
1027 const BranchProbabilityInfoT &
getBPI()
const {
return *BPI; }
1049 const BranchProbabilityInfoT &BPI,
1050 const LoopInfoT &LI) {
1063 <<
"\n================="
1064 << std::string(F.getName().size(),
'=') <<
"\n");
1070 computeMassInLoops();
1071 computeMassInFunction();
1075 if (needIterativeInference())
1076 applyIterativeInference();
1083 for (
const BlockT &BB : F)
1096 if (Nodes.size() <= BlockNumber)
1099 if (!
Node.isValid()) {
1104 Freqs.emplace_back();
1109template <
class BT>
void BlockFrequencyInfoImpl<BT>::initializeRPOT() {
1110 const BlockT *Entry = &
F->front();
1111 RPOT.reserve(
F->size());
1113 RPOT.emplace_back(BB);
1114 std::reverse(RPOT.begin(), RPOT.end());
1116 assert(RPOT.size() - 1 <= BlockNode::getMaxIndex() &&
1117 "More nodes in function than Block Frequency Info supports");
1123 BlockNode
Node = BlockNode(Idx);
1128 Working.reserve(RPOT.size());
1129 for (
size_t Index = 0; Index < RPOT.size(); ++Index)
1130 Working.emplace_back(Index);
1131 Freqs.resize(RPOT.size());
1134template <
class BT>
void BlockFrequencyInfoImpl<BT>::initializeLoops() {
1140 std::deque<std::pair<const LoopT *, LoopData *>> Q;
1141 for (
const LoopT *L : *LI)
1142 Q.emplace_back(L,
nullptr);
1143 while (!Q.empty()) {
1144 const LoopT *
Loop = Q.front().first;
1145 LoopData *Parent = Q.front().second;
1149 assert(Header.isValid());
1151 Loops.emplace_back(Parent, Header);
1152 Working[Header.Index].Loop = &
Loops.back();
1155 for (
const LoopT *L : *
Loop)
1156 Q.emplace_back(L, &
Loops.back());
1161 for (
size_t Index = 0;
Index < RPOT.size(); ++
Index) {
1163 if (Working[Index].isLoopHeader()) {
1164 LoopData *ContainingLoop = Working[
Index].getContainingLoop();
1166 ContainingLoop->Nodes.push_back(Index);
1170 const LoopT *
Loop = LI->getLoopFor(RPOT[Index]);
1176 assert(Header.isValid());
1177 const auto &HeaderData = Working[Header.Index];
1178 assert(HeaderData.isLoopHeader());
1180 Working[
Index].Loop = HeaderData.Loop;
1181 HeaderData.Loop->Nodes.push_back(Index);
1187template <
class BT>
void BlockFrequencyInfoImpl<BT>::computeMassInLoops() {
1189 for (
auto L =
Loops.rbegin(),
E =
Loops.rend(); L !=
E; ++L) {
1190 if (computeMassInLoop(*L))
1192 auto Next = std::next(L);
1193 computeIrreducibleMass(&*L,
L.base());
1194 L = std::prev(
Next);
1195 if (computeMassInLoop(*L))
1202bool BlockFrequencyInfoImpl<BT>::computeMassInLoop(LoopData &
Loop) {
1206 if (
Loop.isIrreducible()) {
1209 unsigned NumHeadersWithWeight = 0;
1210 std::optional<uint64_t> MinHeaderWeight;
1213 for (uint32_t
H = 0;
H <
Loop.NumHeaders; ++
H) {
1214 auto &HeaderNode =
Loop.Nodes[
H];
1215 const BlockT *
Block = getBlock(HeaderNode);
1216 IsIrrLoopHeader.set(
Loop.Nodes[
H].Index);
1217 std::optional<uint64_t> HeaderWeight =
Block->getIrrLoopHeaderWeight();
1218 if (!HeaderWeight) {
1221 HeadersWithoutWeight.insert(
H);
1225 <<
" has irr loop header weight " << *HeaderWeight
1227 NumHeadersWithWeight++;
1228 uint64_t HeaderWeightValue = *HeaderWeight;
1229 if (!MinHeaderWeight || HeaderWeightValue < MinHeaderWeight)
1230 MinHeaderWeight = HeaderWeightValue;
1231 if (HeaderWeightValue) {
1232 Dist.addLocal(HeaderNode, HeaderWeightValue);
1241 if (!MinHeaderWeight)
1242 MinHeaderWeight = 1;
1243 for (uint32_t
H : HeadersWithoutWeight) {
1244 auto &HeaderNode =
Loop.Nodes[
H];
1245 assert(!getBlock(HeaderNode)->getIrrLoopHeaderWeight() &&
1246 "Shouldn't have a weight metadata");
1247 uint64_t MinWeight = *MinHeaderWeight;
1251 Dist.addLocal(HeaderNode, MinWeight);
1253 distributeIrrLoopHeaderMass(Dist);
1254 for (
const BlockNode &M :
Loop.Nodes)
1255 if (!propagateMassToSuccessors(&
Loop, M))
1257 if (NumHeadersWithWeight == 0)
1259 adjustLoopHeaderMass(
Loop);
1261 Working[
Loop.
getHeader().Index].getMass() = BlockMass::getFull();
1264 for (
const BlockNode &M :
Loop.members())
1265 if (!propagateMassToSuccessors(&
Loop, M))
1270 computeLoopScale(
Loop);
1276bool BlockFrequencyInfoImpl<BT>::tryToComputeMassInFunction() {
1279 assert(!Working.empty() &&
"no blocks in function");
1280 assert(!Working[0].isLoopHeader() &&
"entry block is a loop header");
1282 Working[0].getMass() = BlockMass::getFull();
1283 for (
size_t i = 0, n = RPOT.size(); i != n; ++i) {
1285 if (Working[i].isPackaged())
1288 if (!propagateMassToSuccessors(
nullptr, BlockNode(i)))
1294template <
class BT>
void BlockFrequencyInfoImpl<BT>::computeMassInFunction() {
1295 if (tryToComputeMassInFunction())
1297 computeIrreducibleMass(
nullptr,
Loops.begin());
1298 if (tryToComputeMassInFunction())
1304bool BlockFrequencyInfoImpl<BT>::needIterativeInference()
const {
1307 if (!
F->getFunction().hasProfileData())
1311 for (
auto L =
Loops.rbegin(),
E =
Loops.rend(); L !=
E; ++L) {
1312 if (
L->isIrreducible())
1318template <
class BT>
void BlockFrequencyInfoImpl<BT>::applyIterativeInference() {
1323 std::vector<const BlockT *> ReachableBlocks;
1324 findReachableBlocks(ReachableBlocks);
1325 if (ReachableBlocks.empty())
1332 auto Freq = std::vector<Scaled64>(ReachableBlocks.size());
1334 for (
size_t I = 0;
I < ReachableBlocks.size();
I++) {
1335 const BlockT *BB = ReachableBlocks[
I];
1337 Freq[
I] = getFloatingBlockFreq(BB);
1340 assert(!SumFreq.isZero() &&
"empty initial block frequencies");
1342 LLVM_DEBUG(
dbgs() <<
"Applying iterative inference for " <<
F->getName()
1343 <<
" with " << ReachableBlocks.size() <<
" blocks\n");
1346 for (
auto &
Value : Freq) {
1352 ProbMatrixType ProbMatrix;
1353 initTransitionProbabilities(ReachableBlocks, BlockIndex, ProbMatrix);
1356 iterativeInference(ProbMatrix, Freq);
1359 for (
const BlockT &BB : *
F) {
1361 if (!
Node.isValid())
1363 if (
auto It = BlockIndex.find(&BB); It != BlockIndex.end())
1364 Freqs[
Node.Index].Scaled = Freq[It->second];
1366 Freqs[
Node.Index].Scaled = Scaled64::getZero();
1371void BlockFrequencyInfoImpl<BT>::iterativeInference(
1372 const ProbMatrixType &ProbMatrix, std::vector<Scaled64> &Freq)
const {
1374 "incorrectly specified precision");
1376 const auto Precision =
1382 << discrepancy(ProbMatrix, Freq).
toString() <<
"\n");
1386 auto Successors = std::vector<std::vector<size_t>>(Freq.size());
1387 for (
size_t I = 0;
I < Freq.size();
I++) {
1388 for (
const auto &Jump : ProbMatrix[
I]) {
1389 Successors[Jump.first].push_back(
I);
1397 auto IsActive =
BitVector(Freq.size(),
false);
1398 std::queue<size_t> ActiveSet;
1399 for (
size_t I = 0;
I < Freq.size();
I++) {
1408 while (It++ < MaxIterations && !ActiveSet.empty()) {
1409 size_t I = ActiveSet.front();
1411 IsActive[
I] =
false;
1417 Scaled64 OneMinusSelfProb = Scaled64::getOne();
1418 for (
const auto &Jump : ProbMatrix[
I]) {
1419 if (Jump.first ==
I) {
1420 OneMinusSelfProb -= Jump.second;
1422 NewFreq += Freq[Jump.first] * Jump.second;
1425 if (OneMinusSelfProb != Scaled64::getOne())
1426 NewFreq /= OneMinusSelfProb;
1430 auto Change = Freq[
I] >= NewFreq ? Freq[
I] - NewFreq : NewFreq - Freq[
I];
1431 if (Change > Precision) {
1434 for (
size_t Succ : Successors[
I]) {
1435 if (!IsActive[Succ]) {
1436 ActiveSet.push(Succ);
1437 IsActive[Succ] =
true;
1446 LLVM_DEBUG(
dbgs() <<
" Completed " << It <<
" inference iterations"
1447 <<
format(
" (%0.0f per block)",
double(It) / Freq.size())
1451 << discrepancy(ProbMatrix, Freq).
toString() <<
"\n");
1456void BlockFrequencyInfoImpl<BT>::findReachableBlocks(
1457 std::vector<const BlockT *> &Blocks)
const {
1460 std::queue<const BlockT *>
Queue;
1462 const BlockT *
Entry = &
F->front();
1464 Reachable.insert(Entry);
1465 while (!
Queue.empty()) {
1466 const BlockT *SrcBB =
Queue.front();
1469 auto EP = BPI->getEdgeProbability(SrcBB, It.index());
1472 if (Reachable.insert(It.value()).second)
1473 Queue.push(It.value());
1480 for (
const BlockT &BB : *
F) {
1483 if (!HasSucc && Reachable.count(&BB)) {
1485 InverseReachable.insert(&BB);
1488 while (!
Queue.empty()) {
1489 const BlockT *SrcBB =
Queue.front();
1492 auto EP = BPI->getEdgeProbability(DstBB, SrcBB);
1495 if (InverseReachable.insert(DstBB).second)
1501 Blocks.reserve(
F->size());
1502 for (
const BlockT &BB : *
F) {
1503 if (Reachable.count(&BB) && InverseReachable.count(&BB)) {
1504 Blocks.push_back(&BB);
1510void BlockFrequencyInfoImpl<BT>::initTransitionProbabilities(
1511 const std::vector<const BlockT *> &Blocks,
1513 ProbMatrixType &ProbMatrix)
const {
1514 const size_t NumBlocks = Blocks.size();
1515 auto Succs = std::vector<std::vector<std::pair<size_t, Scaled64>>>(NumBlocks);
1516 auto SumProb = std::vector<Scaled64>(NumBlocks);
1519 for (
size_t Src = 0; Src < NumBlocks; Src++) {
1520 const BlockT *BB = Blocks[Src];
1523 const BlockT *
SI = It.value();
1525 auto BlockIndexIt = BlockIndex.find(
SI);
1526 if (BlockIndexIt == BlockIndex.end())
1529 if (!UniqueSuccs.insert(
SI).second)
1532 auto EP = BPI->getEdgeProbability(BB, It.index());
1537 Scaled64::getFraction(EP.getNumerator(), EP.getDenominator());
1538 size_t Dst = BlockIndexIt->second;
1539 Succs[Src].push_back(std::make_pair(Dst, EdgeProb));
1540 SumProb[Src] += EdgeProb;
1545 ProbMatrix = ProbMatrixType(NumBlocks);
1546 for (
size_t Src = 0; Src < NumBlocks; Src++) {
1548 if (Succs[Src].
empty())
1551 assert(!SumProb[Src].
isZero() &&
"Zero sum probability of non-exit block");
1552 for (
auto &Jump : Succs[Src]) {
1553 size_t Dst = Jump.first;
1554 Scaled64 Prob = Jump.second;
1555 ProbMatrix[Dst].push_back(std::make_pair(Src, Prob / SumProb[Src]));
1560 size_t EntryIdx = BlockIndex.find(&
F->front())->second;
1561 for (
size_t Src = 0; Src < NumBlocks; Src++) {
1562 if (Succs[Src].
empty()) {
1563 ProbMatrix[EntryIdx].push_back(std::make_pair(Src, Scaled64::getOne()));
1571 const ProbMatrixType &ProbMatrix,
const std::vector<Scaled64> &Freq)
const {
1572 assert(Freq[0] > 0 &&
"Incorrectly computed frequency of the entry block");
1573 Scaled64 Discrepancy;
1574 for (
size_t I = 0;
I < ProbMatrix.size();
I++) {
1576 for (
const auto &Jump : ProbMatrix[
I]) {
1577 Sum += Freq[Jump.first] * Jump.second;
1579 Discrepancy += Freq[
I] >= Sum ? Freq[
I] - Sum : Sum - Freq[
I];
1582 return Discrepancy / Freq[0];
1587void BlockFrequencyInfoImpl<BT>::computeIrreducibleMass(
1588 LoopData *OuterLoop, std::list<LoopData>::iterator Insert) {
1590 if (OuterLoop)
dbgs()
1591 <<
"loop: " << getLoopName(*OuterLoop) <<
"\n";
1592 else dbgs() <<
"function\n");
1596 auto addBlockEdges = [&](IrreducibleGraph &
G, IrreducibleGraph::IrrNode &Irr,
1597 const LoopData *OuterLoop) {
1598 const BlockT *BB = RPOT[Irr.Node.Index];
1600 G.addEdge(Irr,
getNode(Succ), OuterLoop);
1602 IrreducibleGraph
G(*
this, OuterLoop, addBlockEdges);
1604 for (
auto &L : analyzeIrreducible(
G, OuterLoop, Insert))
1605 computeMassInLoop(L);
1609 updateLoopWithIrreducible(*OuterLoop);
1619BlockFrequencyInfoImpl<BT>::propagateMassToSuccessors(LoopData *OuterLoop,
1620 const BlockNode &
Node) {
1624 if (
auto *Loop = Working[
Node.Index].getPackagedLoop()) {
1625 assert(Loop != OuterLoop &&
"Cannot propagate mass in a packaged loop");
1626 if (!addLoopSuccessorsToDist(OuterLoop, *Loop, Dist))
1630 const BlockT *BB = getBlock(Node);
1633 Dist, OuterLoop, Node,
getNode(It.value()),
1641 distributeMass(Node, OuterLoop, Dist);
1649 OS <<
"block-frequency-info: " << F->getName() <<
"\n";
1650 for (
const BlockT &BB : *F) {
1656 F->getFunction(), getNode(&BB)))
1658 if (std::optional<uint64_t> IrrLoopHeaderWeight =
1659 BB.getIrrLoopHeaderWeight())
1660 OS <<
", irr_loop_header_weight = " << *IrrLoopHeaderWeight;
1677 for (
const auto &BB : *F)
1680 size_t MinSize = std::min(Nodes.size(),
Other.Nodes.size());
1681 for (
size_t i = 0; i < MinSize; ++i) {
1687 <<
" existence mismatch.\n";
1688 }
else if (Nodes[i].
isValid()) {
1689 const auto &Freq =
Freqs[Nodes[i].Index];
1690 const auto &OtherFreq =
Other.Freqs[
Other.Nodes[i].Index];
1691 if (Freq.Integer != OtherFreq.Integer) {
1694 <<
" " << Freq.Integer <<
" vs " << OtherFreq.Integer <<
"\n";
1699 for (
size_t i = MinSize; i < Nodes.size(); ++i) {
1703 <<
" existence mismatch.\n";
1706 for (
size_t i = MinSize; i <
Other.Nodes.size(); ++i) {
1707 if (
Other.Nodes[i].isValid()) {
1710 <<
" existence mismatch.\n";
1717 dbgs() <<
"Other\n";
1720 assert(Match &&
"BFI mismatch");
1728template <
class BlockFrequencyInfoT,
class BranchProbabilityInfoT>
1741 return G->getFunction()->getName();
1745 unsigned HotPercentThreshold = 0) {
1747 if (!HotPercentThreshold)
1757 std::max(
MaxFrequency, Graph->getBlockFreq(
N).getFrequency());
1773 GVDAGType GType,
int layout_order = -1) {
1777 if (layout_order != -1)
1778 OS <<
Node->getName() <<
"[" << layout_order <<
"] : ";
1780 OS <<
Node->getName() <<
" : ";
1786 OS << Graph->getBlockFreq(
Node).getFrequency();
1789 auto Count = Graph->getBlockProfileCount(
Node);
1798 "never reach this point.");
1804 const BlockFrequencyInfoT *BFI,
1805 const BranchProbabilityInfoT *BPI,
1806 unsigned HotPercentThreshold = 0) {
1819 if (HotPercentThreshold) {
1824 if (EFreq >= HotFreq)
1825 OS <<
",color=\"red\"";
assert(UImm &&(UImm !=~static_cast< T >(0)) &&"Invalid immediate!")
static msgpack::DocNode getNode(msgpack::DocNode DN, msgpack::Type Type, MCValue Val)
static void print(raw_ostream &Out, object::Archive::Kind Kind, T Val)
This file implements the BitVector class.
static GCRegistry::Add< StatepointGC > D("statepoint-example", "an example strategy for statepoint")
static GCRegistry::Add< CoreCLRGC > E("coreclr", "CoreCLR-compatible GC")
static GCRegistry::Add< OcamlGC > B("ocaml", "ocaml 3.10-compatible GC")
This file defines the DenseMap class.
This file defines the DenseSet and SmallDenseSet classes.
This file defines the little GraphTraits<X> template class that should be specialized by classes that...
static bool isZero(Value *V, const DataLayout &DL, DominatorTree *DT, AssumptionCache *AC)
Branch Probability Basic Block static false std::string getBlockName(const MachineBasicBlock *BB)
Helper to print the name of a MBB.
This file builds on the ADT/GraphTraits.h file to build a generic graph post order iterator.
static bool isValid(const char C)
Returns true if C is a valid mangled character: <0-9a-zA-Z_>.
This file defines the SmallPtrSet class.
This file defines the SmallVector class.
This file defines the SparseBitVector class.
LLVM Basic Block Representation.
Base class for BlockFrequencyInfoImpl.
std::vector< WorkingData > Working
Loop data: see initializeLoops().
virtual ~BlockFrequencyInfoImplBase()=default
Virtual destructor.
std::list< LoopData > Loops
Indexed information about loops.
bool addLoopSuccessorsToDist(const LoopData *OuterLoop, LoopData &Loop, Distribution &Dist)
Add all edges out of a packaged loop to the distribution.
ScaledNumber< uint64_t > Scaled64
std::string getLoopName(const LoopData &Loop) const
bool isIrrLoopHeader(const BlockNode &Node)
void computeLoopScale(LoopData &Loop)
Compute the loop scale for a loop.
bfi_detail::BlockMass BlockMass
void packageLoop(LoopData &Loop)
Package up a loop.
virtual raw_ostream & print(raw_ostream &OS) const
void finalizeMetrics()
Finalize frequency metrics.
void setBlockFreq(const BlockNode &Node, BlockFrequency Freq)
BlockFrequency getEntryFreq() const
void updateLoopWithIrreducible(LoopData &OuterLoop)
Update a loop after packaging irreducible SCCs inside of it.
void clear()
Clear all memory.
std::optional< uint64_t > getBlockProfileCount(const Function &F, const BlockNode &Node, bool AllowSynthetic=false) const
BlockFrequency getBlockFreq(const BlockNode &Node) const
void distributeIrrLoopHeaderMass(Distribution &Dist)
iterator_range< std::list< LoopData >::iterator > analyzeIrreducible(const bfi_detail::IrreducibleGraph &G, LoopData *OuterLoop, std::list< LoopData >::iterator Insert)
Analyze irreducible SCCs.
bool addToDist(Distribution &Dist, const LoopData *OuterLoop, const BlockNode &Pred, const BlockNode &Succ, uint64_t Weight)
Add an edge to the distribution.
void unwrapLoops()
Unwrap loops.
std::optional< uint64_t > getProfileCountFromFreq(const Function &F, BlockFrequency Freq, bool AllowSynthetic=false) const
Scaled64 getFloatingBlockFreq(const BlockNode &Node) const
void distributeMass(const BlockNode &Source, LoopData *OuterLoop, Distribution &Dist)
Distribute mass according to a distribution.
SparseBitVector IsIrrLoopHeader
Whether each block is an irreducible loop header.
std::vector< FrequencyData > Freqs
Data about each block. This is used downstream.
void adjustLoopHeaderMass(LoopData &Loop)
Adjust the mass of all headers in an irreducible loop.
bool isIrrLoopHeader(const BlockT *BB)
std::optional< uint64_t > getBlockProfileCount(const Function &F, const BlockT *BB, bool AllowSynthetic=false) const
const BranchProbabilityInfoT & getBPI() const
const FunctionT * getFunction() const
void verifyMatch(BlockFrequencyInfoImpl< BT > &Other) const
Scaled64 getFloatingBlockFreq(const BlockT *BB) const
std::optional< uint64_t > getProfileCountFromFreq(const Function &F, BlockFrequency Freq, bool AllowSynthetic=false) const
void calculate(const FunctionT &F, const BranchProbabilityInfoT &BPI, const LoopInfoT &LI)
void setBlockFreq(const BlockT *BB, BlockFrequency Freq)
BlockFrequencyInfoImpl()=default
raw_ostream & print(raw_ostream &OS) const override
Print the frequencies for the current function.
BlockFrequency getBlockFreq(const BlockT *BB) const
Analysis providing branch probability information.
static LLVM_ABI BranchProbability getBranchProbability(uint64_t Numerator, uint64_t Denominator)
static uint32_t getDenominator()
uint32_t getNumerator() const
Implements a dense probed hash-table based set.
BlockT * getHeader() const
Represents a single loop in the control flow graph.
Simple representation of a scaled number.
SmallPtrSet - This class implements a set which is optimized for holding SmallSize or less elements.
typename SuperClass::const_iterator const_iterator
ptrdiff_t difference_type
This is a 'vector' (really, a variable-sized array), optimized for the case when the array is small.
Represent a constant reference to a string, i.e.
std::string str() const
Get the contents as an std::string.
Twine - A lightweight data structure for efficiently representing the concatenation of temporary valu...
The instances of the Type class are immutable: once they are created, they are never changed.
LLVM Value Representation.
LLVM_ABI StringRef getName() const
Return a constant reference to the value's name.
bool operator<(BlockMass X) const
bool operator>(BlockMass X) const
LLVM_ABI raw_ostream & print(raw_ostream &OS) const
bool operator==(BlockMass X) const
static BlockMass getEmpty()
LLVM_ABI void dump() const
BlockMass & operator-=(BlockMass X)
Subtract another mass.
bool operator<=(BlockMass X) const
BlockMass & operator*=(BranchProbability P)
static BlockMass getFull()
bool operator!=(BlockMass X) const
BlockMass & operator+=(BlockMass X)
Add another mass.
bool operator>=(BlockMass X) const
LLVM_ABI ScaledNumber< uint64_t > toScaled() const
Convert to scaled number.
void reserve(size_t Size)
Grow the DenseSet so that it can contain at least NumEntries items before resizing again.
A range adaptor for a pair of iterators.
This class implements an extremely fast bulk output stream that can only output to a stream.
A raw_ostream that writes to an std::string.
This provides a very simple, boring adaptor for a begin and end iterator into a range type.
#define llvm_unreachable(msg)
Marks that the current location is not supposed to be reachable.
std::string getBlockName(const BlockT *BB)
Get the name of a MachineBasicBlock.
BlockMass operator*(BlockMass L, BranchProbability R)
BlockMass operator+(BlockMass L, BlockMass R)
raw_ostream & operator<<(raw_ostream &OS, BlockMass X)
BlockMass operator-(BlockMass L, BlockMass R)
NodeAddr< NodeBase * > Node
This is an optimization pass for GlobalISel generic memory operations.
Printable print(const GCNRegPressure &RP, const GCNSubtarget *ST=nullptr, unsigned DynamicVGPRBlockSize=0)
uint32_t getWeightFromBranchProb(const BranchProbability Prob)
auto enumerate(FirstRange &&First, RestRanges &&...Rest)
Given two or more input ranges, returns a new range whose values are tuples (A, B,...
iterator_range< T > make_range(T x, T y)
Convenience function for iterating over sub-ranges.
LLVM_ABI llvm::cl::opt< unsigned > IterativeBFIMaxIterationsPerBlock
LLVM_ABI llvm::cl::opt< bool > UseIterativeBFIInference
LLVM_ABI raw_ostream & dbgs()
dbgs() - This returns a reference to a raw_ostream for debugging messages.
FunctionAddr VTableAddr Count
Function::ProfileCount ProfileCount
auto post_order(const T &G)
Post-order traversal of a graph.
format_object< Ts... > format(const char *Fmt, const Ts &... Vals)
These are helper functions used to produce formatted output.
LLVM_ABI llvm::cl::opt< bool > CheckBFIUnknownBlockQueries
RNSuccIterator< NodeRef, BlockT, RegionT > succ_begin(NodeRef Node)
constexpr NextUseDistance max(NextUseDistance A, NextUseDistance B)
iterator_range< typename GraphTraits< Inverse< GraphType > >::ChildIteratorType > inverse_children(const typename GraphTraits< GraphType >::NodeRef &G)
FunctionAddr VTableAddr Next
std::string toString(const APInt &I, unsigned Radix, bool Signed, bool formatAsCLiteral=false, bool UpperCase=true, bool InsertSeparators=false)
iterator_range< typename GraphTraits< GraphType >::ChildIteratorType > children(const typename GraphTraits< GraphType >::NodeRef &G)
LLVM_ABI Printable printBlockFreq(const BlockFrequencyInfo &BFI, BlockFrequency Freq)
Print the block frequency Freq relative to the current functions entry frequency.
LLVM_ABI llvm::cl::opt< double > IterativeBFIPrecision
Implement std::hash so that hash_code can be used in STL containers.
GraphTraits< BlockFrequencyInfoT * > GTraits
std::string getNodeAttributes(NodeRef Node, const BlockFrequencyInfoT *Graph, unsigned HotPercentThreshold=0)
typename GTraits::nodes_iterator NodeIter
typename GTraits::NodeRef NodeRef
typename GTraits::ChildIteratorType EdgeIter
std::string getNodeLabel(NodeRef Node, const BlockFrequencyInfoT *Graph, GVDAGType GType, int layout_order=-1)
std::string getEdgeAttributes(NodeRef Node, EdgeIter EI, const BlockFrequencyInfoT *BFI, const BranchProbabilityInfoT *BPI, unsigned HotPercentThreshold=0)
BFIDOTGraphTraitsBase(bool isSimple=false)
static StringRef getGraphName(const BlockFrequencyInfoT *G)
Representative of a block.
bool operator==(const BlockNode &X) const
bool operator!=(const BlockNode &X) const
bool operator<(const BlockNode &X) const
bool operator>=(const BlockNode &X) const
BlockNode(IndexType Index)
static size_t getMaxIndex()
bool operator<=(const BlockNode &X) const
bool operator>(const BlockNode &X) const
Distribution of unscaled probability weight.
void addBackedge(const BlockNode &Node, uint64_t Amount)
SmallVector< Weight, 4 > WeightList
WeightList Weights
Individual successor weights.
uint64_t Total
Sum of all weights.
void addExit(const BlockNode &Node, uint64_t Amount)
bool DidOverflow
Whether Total did overflow.
void addLocal(const BlockNode &Node, uint64_t Amount)
Stats about a block itself.
bool isHeader(const BlockNode &Node) const
SmallVector< std::pair< BlockNode, BlockMass >, 4 > ExitMap
LoopData * Parent
The parent loop.
LoopData(LoopData *Parent, It1 FirstHeader, It1 LastHeader, It2 FirstOther, It2 LastOther)
ExitMap Exits
Successor edges (and weights).
uint32_t NumHeaders
Number of headers.
bool IsPackaged
Whether this has been packaged.
LoopData(LoopData *Parent, const BlockNode &Header)
SmallVector< BlockNode, 4 > NodeList
NodeList::const_iterator members_end() const
NodeList::const_iterator members_begin() const
bool isIrreducible() const
BlockNode getHeader() const
SmallVector< BlockMass, 1 > HeaderMassList
NodeList Nodes
Header and the members of the loop.
HeaderMassList BackedgeMass
Mass returned to each loop header.
HeaderMassList::difference_type getHeaderIndex(const BlockNode &B)
iterator_range< NodeList::const_iterator > members() const
Unscaled probability weight.
Weight(DistType Type, BlockNode TargetNode, uint64_t Amount)
bool isPackaged() const
Has ContainingLoop been packaged up?
BlockMass Mass
Mass distribution from the entry block.
BlockMass & getMass()
Get the appropriate mass for a node.
WorkingData(const BlockNode &Node)
bool isAPackage() const
Has Loop been packaged up?
bool isLoopHeader() const
bool isDoubleLoopHeader() const
LoopData * Loop
The loop this block is inside.
LoopData * getContainingLoop() const
LoopData * getPackagedLoop() const
BlockNode getResolvedNode() const
Resolve a node to its representative.
bool isADoublePackage() const
Has Loop been packaged up twice?
DefaultDOTGraphTraits(bool simple=false)
static nodes_iterator nodes_end(const BlockFrequencyInfo *G)
static nodes_iterator nodes_begin(const BlockFrequencyInfo *G)
typename BlockFrequencyInfoT *::UnknownGraphTypeError NodeRef
iterator pred_end() const
IrrNode(const BlockNode &Node)
iterator pred_begin() const
iterator succ_begin() const
std::deque< const IrrNode * >::const_iterator iterator
std::deque< const IrrNode * > Edges
iterator succ_end() const
Graph of irreducible control flow.
LLVM_ABI void addNodesInFunction()
IrreducibleGraph(BFIBase &BFI, const BFIBase::LoopData *OuterLoop, BlockEdgesAdder addBlockEdges)
Construct an explicit graph containing irreducible control flow.
LLVM_ABI void indexNodes()
LLVM_ABI void addEdge(IrrNode &Irr, const BlockNode &Succ, const BFIBase::LoopData *OuterLoop)
BlockFrequencyInfoImplBase BFIBase
void addEdges(const BlockNode &Node, const BFIBase::LoopData *OuterLoop, BlockEdgesAdder addBlockEdges)
BFIBase::BlockNode BlockNode
std::vector< IrrNode > Nodes
SmallDenseMap< uint32_t, IrrNode *, 4 > Lookup
void initialize(const BFIBase::LoopData *OuterLoop, BlockEdgesAdder addBlockEdges)
void addNode(const BlockNode &Node)
LLVM_ABI void addNodesInLoop(const BFIBase::LoopData &OuterLoop)
BranchProbabilityInfo BranchProbabilityInfoT
MachineLoopInfo LoopInfoT
MachineFunction FunctionT
MachineBranchProbabilityInfo BranchProbabilityInfoT