21#ifndef LLVM_ANALYSIS_TARGETTRANSFORMINFO_H
22#define LLVM_ANALYSIS_TARGETTRANSFORMINFO_H
134 const Value *Ptr =
nullptr;
137 Type *DataTy =
nullptr;
144 bool VariableMask =
true;
147 unsigned AddressSpace = 0;
154 const Value *Ptr,
bool VariableMask,
157 : I(I), Ptr(Ptr), DataTy(DataTy), IID(Id), VariableMask(VariableMask),
158 Alignment(Alignment) {}
162 unsigned AddressSpace = 0)
163 : DataTy(DataTy), IID(Id), AddressSpace(AddressSpace),
164 Alignment(Alignment) {}
167 bool VariableMask,
Align Alignment,
169 : I(I), DataTy(DataTy), IID(Id), VariableMask(VariableMask),
170 Alignment(Alignment) {}
183 Type *RetTy =
nullptr;
196 bool TypeBasedOnly =
false);
221 return Arguments.empty();
265class TargetTransformInfo;
296 std::unique_ptr<const TargetTransformInfoImplBase> Impl);
319 FunctionAnalysisManager::Invalidator &) {
409 static_assert(
sizeof(PointersChainInfo) == 4,
"Was size increase justified?");
417 const PointersChainInfo &Info,
Type *AccessTy,
562 LLVM_ABI std::pair<KnownBits, KnownBits>
569 unsigned FromAS,
unsigned ToAS,
const KnownBits &FromPtrBits)
const;
590 unsigned DstAS)
const;
601 LLVM_ABI std::pair<const Value *, unsigned>
797 LLVM_ABI std::optional<Instruction *>
804 bool &KnownBitsComputed)
const;
811 SimplifyAndSetOp)
const;
855 int64_t BaseOffset,
bool HasBaseReg,
856 int64_t Scale,
unsigned AddrSpace = 0,
858 int64_t ScalableOffset = 0)
const;
932 Align Alignment)
const;
936 Align Alignment)
const;
940 Align Alignment)
const;
952 unsigned AddrSpace)
const;
956 Type *DataType)
const;
997 bool HasBaseReg, int64_t Scale,
998 unsigned AddrSpace = 0)
const;
1044 unsigned ScalarOpdIdx)
const;
1145 bool IsZeroCmp)
const;
1178 unsigned *
Fast =
nullptr)
const;
1312 return {MergeKind, MergeProp};
1335 Type *Ty =
nullptr)
const;
1398 unsigned AddrSpace)
const;
1404 const Instruction &
I,
bool &AllowPromotionWithoutCommonHeader)
const;
1452 unsigned NumStridedMemAccesses,
1453 unsigned NumPrefetches,
1454 bool HasCall)
const;
1492 unsigned Opcode,
Type *InputTypeA,
Type *InputTypeB,
Type *AccumType,
1528 unsigned Opcode,
Type *Ty,
1533 const TargetLibraryInfo *TLibInfo =
nullptr)
const;
1543 VectorType *VecTy,
unsigned Opcode0,
unsigned Opcode1,
1544 const SmallBitVector &OpcodeMask,
1555 ShuffleKind Kind, VectorType *DstTy, VectorType *SrcTy,
1556 ArrayRef<int> Mask = {},
1638 unsigned Index = -1,
const Value *Op0 =
nullptr,
1639 const Value *Op1 =
nullptr,
1654 ArrayRef<std::tuple<Value *, User *, int>> ScalarUserAndIdx,
1665 unsigned Index = -1,
1674 unsigned Index)
const;
1688 Type *EltTy,
int ReplicationFactor,
int VF,
const APInt &DemandedDstElts,
1711 unsigned Opcode,
Type *VecTy,
unsigned Factor, ArrayRef<unsigned> Indices,
1714 bool UseMaskForCond =
false,
bool UseMaskForGaps =
false)
const;
1719 return FMF && !(*FMF).allowReassoc();
1747 unsigned Opcode,
VectorType *Ty, std::optional<FastMathFlags> FMF,
1760 bool IsUnsigned,
unsigned RedOpcode,
Type *ResTy,
VectorType *Ty,
1769 std::optional<FastMathFlags> FMF,
1829 bool CanCreate =
true)
const;
1834 unsigned DestAddrSpace,
Align SrcAlign,
Align DestAlign,
1835 std::optional<uint32_t> AtomicElementSize = std::nullopt)
const;
1845 unsigned RemainingBytes,
unsigned SrcAddrSpace,
unsigned DestAddrSpace,
1847 std::optional<uint32_t> AtomicCpySize = std::nullopt)
const;
1862 unsigned DefaultCallPenalty)
const;
1906 unsigned AddrSpace)
const;
1911 unsigned AddrSpace)
const;
1923 unsigned ChainSizeInBytes,
1929 unsigned ChainSizeInBytes,
2103 std::unique_ptr<const TargetTransformInfoImplBase> TTIImpl;
2136 : TTICallback(Arg.TTICallback) {}
2138 : TTICallback(
std::
move(Arg.TTICallback)) {}
2140 TTICallback =
RHS.TTICallback;
2144 TTICallback = std::move(
RHS.TTICallback);
2176 std::optional<TargetTransformInfo> TTI;
2178 virtual void anchor();
This file implements a class to represent arbitrary precision integral constant values and operations...
MachineBasicBlock MachineBasicBlock::iterator DebugLoc DL
Atomic ordering constants.
static cl::opt< OutputCostKind > CostKind("cost-kind", cl::desc("Target cost kind"), cl::init(OutputCostKind::RecipThroughput), cl::values(clEnumValN(OutputCostKind::RecipThroughput, "throughput", "Reciprocal throughput"), clEnumValN(OutputCostKind::Latency, "latency", "Instruction latency"), clEnumValN(OutputCostKind::CodeSize, "code-size", "Code size"), clEnumValN(OutputCostKind::SizeAndLatency, "size-latency", "Code size and latency"), clEnumValN(OutputCostKind::All, "all", "Print all cost kinds")))
TargetTransformInfo::VPLegalization VPLegalization
static cl::opt< bool > ForceNestedLoop("force-nested-hardware-loop", cl::Hidden, cl::init(false), cl::desc("Force allowance of nested hardware loops"))
static cl::opt< bool > ForceHardwareLoopPHI("force-hardware-loop-phi", cl::Hidden, cl::init(false), cl::desc("Force hardware loop counter to be updated through a phi"))
This header defines various interfaces for pass management in LLVM.
This file defines an InstructionCost class that is used when calculating the cost of an instruction,...
const AbstractManglingParser< Derived, Alloc >::OperatorInfo AbstractManglingParser< Derived, Alloc >::Ops[]
uint64_t IntrinsicInst * II
static cl::opt< RegAllocEvictionAdvisorAnalysisLegacy::AdvisorMode > Mode("regalloc-enable-advisor", cl::Hidden, cl::init(RegAllocEvictionAdvisorAnalysisLegacy::AdvisorMode::Default), cl::desc("Enable regalloc advisor mode"), cl::values(clEnumValN(RegAllocEvictionAdvisorAnalysisLegacy::AdvisorMode::Default, "default", "Default"), clEnumValN(RegAllocEvictionAdvisorAnalysisLegacy::AdvisorMode::Release, "release", "precompiled"), clEnumValN(RegAllocEvictionAdvisorAnalysisLegacy::AdvisorMode::Development, "development", "for training")))
static TableGen::Emitter::Opt Y("gen-skeleton-entry", EmitSkeleton, "Generate example skeleton entry")
Class for arbitrary precision integers.
an instruction to allocate memory on the stack
ArrayRef - Represent a constant reference to an array (0 or more elements consecutively in memory),...
Class to represent array types.
A cache of @llvm.assume calls within a function.
Functions, function parameters, and return types can have attributes to indicate how they should be t...
LLVM Basic Block Representation.
BlockFrequencyInfo pass uses BlockFrequencyInfoImpl implementation to estimate IR basic block frequen...
Base class for all callable instructions (InvokeInst and CallInst) Holds everything related to callin...
Predicate
This enumeration lists the possible predicates for CmpInst subclasses.
Conditional Branch instruction.
This is an important base class in LLVM.
A parsed version of the target data layout string in and methods for querying it.
Concrete subclass of DominatorTreeBase that is used to compute a normal dominator tree.
Convenience struct for specifying and reasoning about fast-math flags.
ImmutablePass class - This class is used to provide information that does not need to be run.
The core instruction combiner logic.
static InstructionCost getInvalid(CostType Val=0)
Class to represent integer types.
Drive the analysis of interleaved memory accesses in the loop.
FastMathFlags getFlags() const
const SmallVectorImpl< Type * > & getArgTypes() const
Type * getReturnType() const
bool skipScalarizationCost() const
const SmallVectorImpl< const Value * > & getArgs() const
LLVM_ABI IntrinsicCostAttributes(Intrinsic::ID Id, const CallBase &CI, InstructionCost ScalarCost=InstructionCost::getInvalid(), bool TypeBasedOnly=false)
InstructionCost getScalarizationCost() const
const IntrinsicInst * getInst() const
Intrinsic::ID getID() const
bool isTypeBasedOnly() const
A wrapper class for inspecting calls to intrinsic functions.
This is an important class for using LLVM in a threaded context.
An instruction for reading from memory.
LoopVectorizationLegality checks if it is legal to vectorize a loop, and to what vectorization factor...
Represents a single loop in the control flow graph.
Information for memory intrinsic cost model.
Align getAlignment() const
unsigned getAddressSpace() const
Type * getDataType() const
const Value * getPointer() const
LLVM_ABI MemIntrinsicCostAttributes(Intrinsic::ID Id, Type *DataTy, bool VariableMask, Align Alignment, const Instruction *I=nullptr)
bool getVariableMask() const
LLVM_ABI MemIntrinsicCostAttributes(Intrinsic::ID Id, Type *DataTy, Align Alignment, unsigned AddressSpace=0)
Intrinsic::ID getID() const
const Instruction * getInst() const
LLVM_ABI MemIntrinsicCostAttributes(Intrinsic::ID Id, Type *DataTy, const Value *Ptr, bool VariableMask, Align Alignment, const Instruction *I=nullptr)
A set of analyses that are preserved following a run of a transformation pass.
Analysis providing profile information.
The RecurrenceDescriptor is used to identify recurrences variables in a loop.
This class represents an analyzed expression in the program.
The main scalar evolution driver.
This is a 'bitvector' (really, a variable-sized bit array), optimized for the case when the array is ...
This class consists of common code factored out of the SmallVector class to reduce code duplication b...
This is a 'vector' (really, a variable-sized array), optimized for the case when the array is small.
StackOffset holds a fixed and a scalable offset in bytes.
An instruction for storing to memory.
Analysis pass providing the TargetTransformInfo.
TargetIRAnalysis(const TargetIRAnalysis &Arg)
TargetIRAnalysis & operator=(const TargetIRAnalysis &RHS)
LLVM_ABI Result run(const Function &F, FunctionAnalysisManager &)
TargetTransformInfo Result
LLVM_ABI TargetIRAnalysis()
Default construct a target IR analysis.
TargetIRAnalysis & operator=(TargetIRAnalysis &&RHS)
TargetIRAnalysis(TargetIRAnalysis &&Arg)
Provides information about what library functions are available for the current target.
The instances of the Type class are immutable: once they are created, they are never changed.
This is the common base class for vector predication intrinsics.
LLVM Value Representation.
Base class of all SIMD vector types.
constexpr char Args[]
Key for Kernel::Metadata::mArgs.
unsigned ID
LLVM IR allows to use arbitrary numbers as calling convention identifiers.
@ Fast
Attempts to make calls as fast as possible (e.g.
@ C
The default llvm calling convention, compatible with C.
This namespace contains an enum with a value for every intrinsic/builtin function known by LLVM.
friend class Instruction
Iterator for Instructions in a `BasicBlock.
This is an optimization pass for GlobalISel generic memory operations.
FunctionAddr VTableAddr Value
@ LLVM_MARK_AS_BITMASK_ENUM
LLVM_ATTRIBUTE_VISIBILITY_DEFAULT AnalysisKey InnerAnalysisManagerProxy< AnalysisManagerT, IRUnitT, ExtraArgTs... >::Key
AtomicOrdering
Atomic ordering for LLVM's memory model.
FunctionAddr VTableAddr uintptr_t uintptr_t Data
LLVM_ABI ImmutablePass * createTargetTransformInfoWrapperPass(TargetIRAnalysis TIRA)
Create an analysis pass wrapper around a TTI object.
RecurKind
These are the kinds of recurrences that we support.
ArrayRef(const T &OneElt) -> ArrayRef< T >
constexpr unsigned BitWidth
OutputIt move(R &&Range, OutputIt Out)
Provide wrappers to std::move which take ranges instead of having to pass begin/end explicitly.
@ DataWithEVL
Use predicated EVL instructions for tail-folding.
@ DataAndControlFlow
Use predicate to control both data and control flow.
@ DataWithoutLaneMask
Same as Data, but avoids using the get.active.lane.mask intrinsic to calculate the mask and instead i...
AnalysisManager< Function > FunctionAnalysisManager
Convenience typedef for the Function analysis manager.
ValueUniformity
Enum describing how values behave with respect to uniformity and divergence, to answer the question: ...
Implement std::hash so that hash_code can be used in STL containers.
This struct is a compact representation of a valid (non-zero power of two) alignment.
A CRTP mix-in that provides informational APIs needed for analysis passes.
A special type used by analysis passes to provide an address that identifies that particular analysis...
Attributes of a target dependent hardware loop.
LLVM_ABI bool canAnalyze(LoopInfo &LI)
HardwareLoopInfo()=delete
LLVM_ABI bool isHardwareLoopCandidate(ScalarEvolution &SE, LoopInfo &LI, DominatorTree &DT, bool ForceNestedLoop=false, bool ForceHardwareLoopPHI=false)
Information about a load/store intrinsic defined by the target.
SmallVector< InterestingMemoryOperand, 1 > InterestingOperands
unsigned short MatchingId
Value * PtrVal
This is the pointer that the intrinsic is loading from or storing to.
InterleavedAccessInfo * IAI
TailFoldingInfo(TargetLibraryInfo *TLI, LoopVectorizationLegality *LVL, InterleavedAccessInfo *IAI)
LoopVectorizationLegality * LVL