67#define DEBUG_TYPE "inline"
69STATISTIC(NumInlined,
"Number of functions inlined");
70STATISTIC(NumDeleted,
"Number of functions deleted because all callers found");
75 "Cost multiplier to multiply onto inlined call sites where the "
76 "new call was previously an intra-SCC call (not relevant when the "
77 "original call was already intra-SCC). This can accumulate over "
78 "multiple inlinings (e.g. if a call site already had a cost "
79 "multiplier and one of its inlined calls was also subject to "
80 "this, the inlined call would have the original multiplier "
81 "multiplied by intra-scc-cost-multiplier). This is to prevent tons of "
82 "inlining through a child SCC which can cause terrible compile times"));
86 cl::desc(
"Maximum number of instructions to scan backward for "
87 "store-to-load forwarding in subsequent inlining decisions. "
88 "DefMaxInstsToScan=6 is not enough and misses inlining "
89 "opportunities (e.g. when class stores into mutiple members in "
90 "ctor and afterwards calls a function reading those members)"));
106 "Optimization remarks file containing inline remarks to be replayed "
107 "by cgscc inlining."),
111 "cgscc-inline-replay-scope",
114 "Replay on functions that have remarks associated "
115 "with them (default)"),
117 "Replay on the entire module")),
118 cl::desc(
"Whether inline replay should be applied to the entire "
119 "Module or just the Functions (default) that are present as "
120 "callers in remarks during cgscc inlining."),
124 "cgscc-inline-replay-fallback",
129 "All decisions not in replay send to original advisor (default)"),
131 "AlwaysInline",
"All decisions not in replay are inlined"),
133 "All decisions not in replay are not inlined")),
135 "How cgscc inline replay treats sites that don't come from the replay. "
136 "Original: defers to original advisor, AlwaysInline: inline all sites "
137 "not in replay, NeverInline: inline no sites not in replay"),
141 "cgscc-inline-replay-format",
146 "<Line Number>:<Column Number>"),
148 "LineDiscriminator",
"<Line Number>.<Discriminator>"),
150 "LineColumnDiscriminator",
151 "<Line Number>:<Column Number>.<Discriminator> (default)")),
155InlinerPass::getAdvisor(
const ModuleAnalysisManagerCGSCCProxy::Result &
MAM,
158 return *OwnedAdvisor;
170 OwnedAdvisor = std::make_unique<DefaultInlineAdvisor>(
176 M,
FAM,
M.getContext(), std::move(OwnedAdvisor),
177 ReplayInlinerSettings{CGSCCInlineReplayFile,
178 CGSCCInlineReplayScope,
179 CGSCCInlineReplayFallback,
180 {CGSCCInlineReplayFormat}},
184 return *OwnedAdvisor;
186 assert(IAA->getAdvisor() &&
187 "Expected a present InlineAdvisorAnalysis also have an "
188 "InlineAdvisor initialized");
189 return *IAA->getAdvisor();
193 F.dropAllReferences();
195 BB.eraseFromParent();
203 const auto &MAMProxy =
207 assert(InitialC.
size() > 0 &&
"Cannot handle an empty SCC!");
208 Module &M = *InitialC.
begin()->getFunction().getParent();
246 for (
auto &
N : InitialC) {
256 if (
Function *Callee = CB->getCalledFunction()) {
257 if (!Callee->isDeclaration())
264 << NV(
"Callee", Callee) <<
" will not be inlined into "
265 << NV(
"Caller", CB->getCaller())
266 <<
" because its definition is unavailable"
296 for (
int I = 0;
I < (int)Calls.
size(); ++
I) {
307 <<
" Function size: " <<
F.getInstructionCount()
317 bool DidInline =
false;
318 for (;
I < (int)Calls.
size() && Calls[
I]->getCaller() == &
F; ++
I) {
330 LLVM_DEBUG(
dbgs() <<
"Skipping inlining internal SCC edge from a node "
331 "previously split out of this SCC by inlining: "
332 <<
F.getName() <<
" -> " << Callee.getName() <<
"\n");
342 if (!LI || !LI->isSimple())
354 if (
C->getType() != LI->getType()) {
355 if (
C->isNullValue())
360 LI->replaceAllUsesWith(
C);
361 LI->eraseFromParent();
365 std::unique_ptr<InlineAdvice> Advice =
372 if (!Advice->isInliningRecommended()) {
373 Advice->recordUnattemptedInlining();
385 GetAssumptionCache, PSI,
396 bool TrackInlineHistory = CalleeSCC->
size() != 1 ||
398 CalleeN->
lookup(CalleeN) !=
nullptr;
403 TrackInlineHistory,
nullptr,
405 if (!
IR.isSuccess()) {
406 Advice->recordUnsuccessfulInlining(
IR);
414 InlinedCallees.
insert(&Callee);
418 <<
F.getInstructionCount() <<
"\n");
423 Function *NewCallee = ICB->getCalledFunction();
425 "Intrinsic calls should not be tracked.");
432 NewCallee = ICB->getCalledFunction();
446 if (CalleeSCC !=
C &&
452 ICB->addFnAttr(NewCBCostMult);
464 bool CalleeWasDeleted =
false;
465 if (Callee.isDiscardableIfUnused() && Callee.hasZeroLiveUses() &&
467 if (Callee.hasLocalLinkage() || !Callee.hasComdat()) {
470 return CB->getCaller() == &Callee;
476 Advice->recordInliningWithCalleeDeleted();
481 "Cannot put cause a function to become dead twice!");
483 CalleeWasDeleted =
true;
485 DeadFunctionsInComdats.
push_back(&Callee);
488 if (!CalleeWasDeleted)
489 Advice->recordInlining();
535 if ((
C != OldC || UR.
CWorklist.count(OldC)) &&
537 return CG.lookupSCC(*CG.lookup(*Callee)) == OldC;
539 LLVM_DEBUG(
dbgs() <<
"Inlined an internal call edge and split an SCC, "
540 "retaining this to avoid infinite inlining.\n");
543 InlinedCallees.
clear();
552 if (!DeadFunctionsInComdats.
empty()) {
554 for (
auto *Callee : DeadFunctionsInComdats)
556 DeadFunctions.
append(DeadFunctionsInComdats);
566 for (
Function *DeadF : DeadFunctions) {
571 FAM.clear(*DeadF, DeadF->getName());
572 AM.
clear(DeadC, DeadC.getName());
599 unsigned MaxDevirtIterations)
600 : Params(Params), IC(IC), Mode(Mode),
601 MaxDevirtIterations(MaxDevirtIterations) {
607 if (MandatoryFirst) {
620 if (!IAA.tryCreate(Params, Mode,
621 {CGSCCInlineReplayFile,
622 CGSCCInlineReplayScope,
623 CGSCCInlineReplayFallback,
624 {CGSCCInlineReplayFormat}},
626 M.getContext().emitError(
627 "Could not setup Inlining Advisor for the requested "
628 "mode and/or options");
645 MPM.addPass(std::move(AfterCGMPM));
659 OS, MapClassName2PassName);
661 OS <<
"<only-mandatory>";
669 if (!MPM.isEmpty()) {
670 MPM.printPipeline(OS, MapClassName2PassName);
674 if (MaxDevirtIterations != 0)
675 OS <<
"devirt<" << MaxDevirtIterations <<
">(";
676 PM.printPipeline(OS, MapClassName2PassName);
677 if (MaxDevirtIterations != 0)
assert(UImm &&(UImm !=~static_cast< T >(0)) &&"Invalid immediate!")
Expand Atomic instructions
This file contains the simple types necessary to represent the attributes associated with functions a...
This is the interface for LLVM's primary stateless and local alias analysis.
This header provides classes for managing passes over SCCs of the call graph.
#define clEnumValN(ENUMVAL, FLAGNAME, DESC)
@ Available
We know the block is fully available. This is a fixpoint.
Module.h This file contains the declarations for the Module class.
This header defines various interfaces for pass management in LLVM.
static cl::opt< unsigned > InlinerForwardingScanLimit("inliner-forwarding-scan-limit", cl::init(16), cl::Hidden, cl::desc("Maximum number of instructions to scan backward for " "store-to-load forwarding in subsequent inlining decisions. " "DefMaxInstsToScan=6 is not enough and misses inlining " "opportunities (e.g. when class stores into mutiple members in " "ctor and afterwards calls a function reading those members)"))
static cl::opt< ReplayInlinerSettings::Scope > CGSCCInlineReplayScope("cgscc-inline-replay-scope", cl::init(ReplayInlinerSettings::Scope::Function), cl::values(clEnumValN(ReplayInlinerSettings::Scope::Function, "Function", "Replay on functions that have remarks associated " "with them (default)"), clEnumValN(ReplayInlinerSettings::Scope::Module, "Module", "Replay on the entire module")), cl::desc("Whether inline replay should be applied to the entire " "Module or just the Functions (default) that are present as " "callers in remarks during cgscc inlining."), cl::Hidden)
static cl::opt< bool > KeepAdvisorForPrinting("keep-inline-advisor-for-printing", cl::init(false), cl::Hidden)
A flag for test, so we can print the content of the advisor when running it as part of the default (e...
static cl::opt< std::string > CGSCCInlineReplayFile("cgscc-inline-replay", cl::init(""), cl::value_desc("filename"), cl::desc("Optimization remarks file containing inline remarks to be replayed " "by cgscc inlining."), cl::Hidden)
static cl::opt< bool > EnablePostSCCAdvisorPrinting("enable-scc-inline-advisor-printing", cl::init(false), cl::Hidden)
Allows printing the contents of the advisor after each SCC inliner pass.
static cl::opt< int > IntraSCCCostMultiplier("intra-scc-cost-multiplier", cl::init(2), cl::Hidden, cl::desc("Cost multiplier to multiply onto inlined call sites where the " "new call was previously an intra-SCC call (not relevant when the " "original call was already intra-SCC). This can accumulate over " "multiple inlinings (e.g. if a call site already had a cost " "multiplier and one of its inlined calls was also subject to " "this, the inlined call would have the original multiplier " "multiplied by intra-scc-cost-multiplier). This is to prevent tons of " "inlining through a child SCC which can cause terrible compile times"))
static cl::opt< CallSiteFormat::Format > CGSCCInlineReplayFormat("cgscc-inline-replay-format", cl::init(CallSiteFormat::Format::LineColumnDiscriminator), cl::values(clEnumValN(CallSiteFormat::Format::Line, "Line", "<Line Number>"), clEnumValN(CallSiteFormat::Format::LineColumn, "LineColumn", "<Line Number>:<Column Number>"), clEnumValN(CallSiteFormat::Format::LineDiscriminator, "LineDiscriminator", "<Line Number>.<Discriminator>"), clEnumValN(CallSiteFormat::Format::LineColumnDiscriminator, "LineColumnDiscriminator", "<Line Number>:<Column Number>.<Discriminator> (default)")), cl::desc("How cgscc inline replay file is formatted"), cl::Hidden)
void makeFunctionBodyUnreachable(Function &F)
static cl::opt< ReplayInlinerSettings::Fallback > CGSCCInlineReplayFallback("cgscc-inline-replay-fallback", cl::init(ReplayInlinerSettings::Fallback::Original), cl::values(clEnumValN(ReplayInlinerSettings::Fallback::Original, "Original", "All decisions not in replay send to original advisor (default)"), clEnumValN(ReplayInlinerSettings::Fallback::AlwaysInline, "AlwaysInline", "All decisions not in replay are inlined"), clEnumValN(ReplayInlinerSettings::Fallback::NeverInline, "NeverInline", "All decisions not in replay are not inlined")), cl::desc("How cgscc inline replay treats sites that don't come from the replay. " "Original: defers to original advisor, AlwaysInline: inline all sites " "not in replay, NeverInline: inline no sites not in replay"), cl::Hidden)
Implements a lazy call graph analysis and related passes for the new pass manager.
Legalize the Machine IR a function's Machine IR
FunctionAnalysisManager FAM
ModuleAnalysisManager MAM
This file provides a priority worklist.
This file defines the make_scope_exit function, which executes user-defined cleanup logic at scope ex...
This file implements a set that has insertion order iteration characteristics.
This file defines the SmallPtrSet class.
This file defines the SmallVector class.
This file defines the 'Statistic' class, which is designed to be an easy way to expose various metric...
#define STATISTIC(VARNAME, DESC)
A manager for alias analyses.
This templated class represents "all analyses that operate over <a particular IR unit>" (e....
void clear(IRUnitT &IR, llvm::StringRef Name)
Clear any cached analysis results for a single unit of IR.
PassT::Result & getResult(IRUnitT &IR, ExtraArgTs... ExtraArgs)
Get the result of an analysis pass for a given IR unit.
A function analysis which provides an AssumptionCache.
A cache of @llvm.assume calls within a function.
Functions, function parameters, and return types can have attributes to indicate how they should be t...
static LLVM_ABI Attribute get(LLVMContext &Context, AttrKind Kind, uint64_t Val=0)
Return a uniquified Attribute object.
LLVM Basic Block Representation.
static BasicBlock * Create(LLVMContext &Context, const Twine &Name="", Function *Parent=nullptr, BasicBlock *InsertBefore=nullptr)
Creates a new BasicBlock.
InstListType::iterator iterator
Instruction iterators...
Analysis pass which computes BlockFrequencyInfo.
Base class for all callable instructions (InvokeInst and CallInst) Holds everything related to callin...
Function * getCalledFunction() const
Returns the function called, or null if this is an indirect function invocation or the function signa...
iterator_range< User::op_iterator > args()
Iteration adapter for range-for loops.
LLVM_ABI Function * getCaller()
Helper to get the caller (the parent function).
static LLVM_ABI Constant * getNullValue(Type *Ty)
Constructor to create a '0' constant of arbitrary type.
A proxy from a FunctionAnalysisManager to an SCC.
bool isIntrinsic() const
isIntrinsic - Returns true if the function's name starts with "llvm.".
LLVM_ABI bool isDeclaration() const
Return true if the primary definition of this global value is outside of the current translation unit...
Printer pass for the InlineAdvisorAnalysis results.
The InlineAdvisorAnalysis is a module pass because the InlineAdvisor needs to capture state right bef...
Result run(Module &M, ModuleAnalysisManager &MAM)
Interface for deciding whether to inline a call site or not.
virtual void onPassEntry(LazyCallGraph::SCC *SCC=nullptr)
This must be called when the Inliner pass is entered, to allow the InlineAdvisor to update internal stat...
virtual void onPassExit(LazyCallGraph::SCC *SCC=nullptr)
This must be called when the Inliner pass is exited, as function passes may be run subsequently.
std::unique_ptr< InlineAdvice > getAdvice(CallBase &CB, bool MandatoryOnly=false)
Get an InlineAdvice containing a recommendation on whether to inline or not.
This class captures the data input to the InlineFunction call, and records the auxiliary results prod...
SmallVector< CallBase *, 8 > InlinedCallSites
All of the new call sites inlined into the caller.
InlineResult is basically true or false.
The inliner pass for the new pass manager.
LLVM_ABI void printPipeline(raw_ostream &OS, function_ref< StringRef(StringRef)> MapClassName2PassName)
LLVM_ABI PreservedAnalyses run(LazyCallGraph::SCC &C, CGSCCAnalysisManager &AM, LazyCallGraph &CG, CGSCCUpdateResult &UR)
A node in the call graph.
An SCC of the call graph.
RefSCC & getOuterRefSCC() const
A lazily constructed view of the call graph of a module.
bool isLibFunction(Function &F) const
Test whether a function is a known and defined library function tracked by the call graph.
LLVM_ABI void markDeadFunction(Function &F)
Mark a function as dead to be removed later by removeDeadFunctions().
Node & get(Function &F)
Get a graph node for a given function, scanning it to populate the graph data as necessary.
SCC * lookupSCC(Node &N) const
Lookup a function's SCC in the graph.
Node * lookup(const Function &F) const
Lookup a function in the graph which has already been scanned and added.
LLVM_ABI PreservedAnalyses run(Module &, ModuleAnalysisManager &)
LLVM_ABI void printPipeline(raw_ostream &OS, function_ref< StringRef(StringRef)> MapClassName2PassName)
LLVM_ABI ModuleInlinerWrapperPass(InlineParams Params=getInlineParams(), bool MandatoryFirst=true, InlineContext IC={}, InliningAdvisorMode Mode=InliningAdvisorMode::Default, unsigned MaxDevirtIterations=0)
A Module instance is used to store all the information related to an LLVM module.
A set of analyses that are preserved following a run of a transformation pass.
static PreservedAnalyses none()
Convenience factory function for the empty preserved set.
static PreservedAnalyses all()
Construct a special preserved set that preserves all passes.
PreservedAnalyses & preserveSet()
Mark an analysis set as preserved.
PreservedAnalyses & preserve()
Mark an analysis as preserved.
An analysis pass based on the new PM to deliver ProfileSummaryInfo.
Analysis providing profile information.
void clear()
Completely clear the SetVector.
bool insert(const value_type &X)
Insert a new element into the SetVector.
A SetVector that performs no allocations if smaller than a certain size.
iterator erase(const_iterator CI)
void append(ItTy in_start, ItTy in_end)
Add the specified range to the end of the SmallVector.
void push_back(const T &Elt)
This is a 'vector' (really, a variable-sized array), optimized for the case when the array is small.
Represent a constant reference to a string, i.e.
This function has undefined behavior.
LLVM Value Representation.
An efficient, type-erasing, non-owning reference to a callable.
This class implements an extremely fast bulk output stream that can only output to a stream.
@ C
The default llvm calling convention, compatible with C.
const char FunctionInlineCostMultiplierAttributeName[]
ValuesClass values(OptsTy... Options)
Helper to build a ValuesClass by forwarding a variable number of arguments as an initializer list to ...
initializer< Ty > init(const Ty &Val)
Add a small namespace to avoid name clashes with the classes used in the streaming interface.
This is an optimization pass for GlobalISel generic memory operations.
decltype(auto) dyn_cast(const From &Val)
dyn_cast<X> - Return the argument parameter cast to the specified type.
InliningAdvisorMode
There are 4 scenarios in which we can use the InlineAdvisor:
LLVM_ABI std::optional< int > getStringFnAttrAsInt(CallBase &CB, StringRef AttrKind)
DevirtSCCRepeatedPass createDevirtSCCRepeatedPass(CGSCCPassT &&Pass, int MaxIterations)
A function to deduce a function pass type and wrap it in the templated adaptor.
LLVM_ABI LazyCallGraph::SCC & updateCGAndAnalysisManagerForCGSCCPass(LazyCallGraph &G, LazyCallGraph::SCC &C, LazyCallGraph::Node &N, CGSCCAnalysisManager &AM, CGSCCUpdateResult &UR, FunctionAnalysisManager &FAM)
Helper to update the call graph after running a CGSCC pass.
iterator_range< early_inc_iterator_impl< detail::IterOfRange< RangeT > > > make_early_inc_range(RangeT &&Range)
Make a range that does early increment to allow mutation of the underlying range without disrupting i...
LLVM_ABI void setInlineRemark(CallBase &CB, StringRef Message)
Set the inline-remark attribute.
LLVM_ABI Value * FindAvailableLoadedValue(LoadInst *Load, BasicBlock *ScanBB, BasicBlock::iterator &ScanFrom, unsigned MaxInstsToScan=DefMaxInstsToScan, BatchAAResults *AA=nullptr, bool *IsLoadCSE=nullptr, unsigned *NumScanedInst=nullptr)
Scan backwards to see if we have the value of the given load available locally within a small number ...
LLVM_ABI InlineResult InlineFunction(CallBase &CB, InlineFunctionInfo &IFI, bool MergeAttributes=false, AAResults *CalleeAAR=nullptr, bool InsertLifetime=true, bool TrackInlineHistory=false, Function *ForwardVarArgsTo=nullptr, OptimizationRemarkEmitter *ORE=nullptr)
This function inlines the called function into the basic block of the caller.
AnalysisManager< LazyCallGraph::SCC, LazyCallGraph & > CGSCCAnalysisManager
The CGSCC analysis manager.
bool any_of(R &&range, UnaryPredicate P)
Provide wrappers to std::any_of which take ranges instead of having to pass begin/end explicitly.
ModuleToPostOrderCGSCCPassAdaptor createModuleToPostOrderCGSCCPassAdaptor(CGSCCPassT &&Pass)
A function to deduce a function pass type and wrap it in the templated adaptor.
auto reverse(ContainerTy &&C)
LLVM_ABI raw_ostream & dbgs()
dbgs() - This returns a reference to a raw_ostream for debugging messages.
std::unique_ptr< InlineAdvisor > getReplayInlineAdvisor(Module &M, FunctionAnalysisManager &FAM, LLVMContext &Context, std::unique_ptr< InlineAdvisor > OriginalAdvisor, const ReplayInlinerSettings &ReplaySettings, bool EmitRemarks, InlineContext IC)
bool isa(const From &Val)
isa<X> - Return true if the parameter to the template is an instance of one of the template type argu...
OuterAnalysisManagerProxy< ModuleAnalysisManager, LazyCallGraph::SCC, LazyCallGraph & > ModuleAnalysisManagerCGSCCProxy
A proxy from a ModuleAnalysisManager to an SCC.
LLVM_ABI InlineParams getInlineParams()
Generate the parameters to tune the inline cost analysis based only on the commandline options.
bool is_contained(R &&Range, const E &Element)
Returns true if Element is found in Range.
LLVM_ABI void filterDeadComdatFunctions(SmallVectorImpl< Function * > &DeadComdatFunctions)
Filter out potentially dead comdat functions where other entries keep the entire comdat group alive.
LLVM_ABI bool tryPromoteCall(CallBase &CB)
Try to promote (devirtualize) a virtual call on an Alloca.
AnalysisManager< Function > FunctionAnalysisManager
Convenience typedef for the Function analysis manager.
cl::opt< unsigned > MaxDevirtIterations("max-devirt-iterations", cl::ReallyHidden, cl::init(4))
std::string itostr(int64_t X)
AnalysisManager< Module > ModuleAnalysisManager
Convenience typedef for the Module analysis manager.
Support structure for SCC passes to communicate updates to the call graph back to the CGSCC pass manager...
SmallPriorityWorklist< LazyCallGraph::SCC *, 1 > & CWorklist
Worklist of the SCCs queued for processing.
SmallDenseSet< std::pair< LazyCallGraph::Node *, LazyCallGraph::SCC * >, 4 > & InlinedInternalEdges
A hacky area where the inliner can retain history about inlining decisions that mutated the call grap...
SmallVector< Function *, 4 > & DeadFunctions
Functions that a pass has considered to be dead to be removed at the end of the call graph walk in ba...
SmallPtrSetImpl< LazyCallGraph::SCC * > & InvalidatedSCCs
The set of invalidated SCCs which should be skipped if they are found in CWorklist.
Provides context on when an inline advisor is constructed in the pipeline (e.g., link phase,...
Thresholds to tune inline cost analysis.
A CRTP mix-in to automatically provide informational APIs needed for passes.