14#ifndef LLVM_ANALYSIS_TARGETTRANSFORMINFOIMPL_H
15#define LLVM_ANALYSIS_TARGETTRANSFORMINFOIMPL_H
61 for (
const Value *Operand : Operands)
82 return SI.getNumCases();
156 virtual std::pair<KnownBits, KnownBits>
160 "expected pointer or pointer vector type");
163 if (
DL.isNonIntegralAddressSpace(FromAS))
164 return std::pair(
KnownBits(
DL.getPointerSizeInBits(FromAS)),
170 CastI->getDestAddressSpace(), *CastI->getPointerOperand());
171 FromPtrBits = KB.second;
179 return {FromPtrBits, ToPtrBits};
185 unsigned ToASBitSize =
DL.getPointerSizeInBits(ToAS);
187 if (
DL.isNonIntegralAddressSpace(FromAS))
197 unsigned DstAS)
const {
198 return {
DL.getPointerSizeInBits(SrcAS), 0};
210 virtual std::pair<const Value *, unsigned>
212 return std::make_pair(
nullptr, -1);
222 assert(
F &&
"A concrete function must be provided to this routine.");
229 if (
F->isIntrinsic())
232 if (
F->hasLocalLinkage() || !
F->hasName())
239 if (Name ==
"copysign" || Name ==
"copysignf" || Name ==
"copysignl" ||
240 Name ==
"fabs" || Name ==
"fabsf" || Name ==
"fabsl" ||
241 Name ==
"fmin" || Name ==
"fminf" || Name ==
"fminl" ||
242 Name ==
"fmax" || Name ==
"fmaxf" || Name ==
"fmaxl" ||
243 Name ==
"sin" || Name ==
"sinf" || Name ==
"sinl" ||
244 Name ==
"cos" || Name ==
"cosf" || Name ==
"cosl" ||
245 Name ==
"tan" || Name ==
"tanf" || Name ==
"tanl" ||
246 Name ==
"asin" || Name ==
"asinf" || Name ==
"asinl" ||
247 Name ==
"acos" || Name ==
"acosf" || Name ==
"acosl" ||
248 Name ==
"atan" || Name ==
"atanf" || Name ==
"atanl" ||
249 Name ==
"atan2" || Name ==
"atan2f" || Name ==
"atan2l"||
250 Name ==
"sinh" || Name ==
"sinhf" || Name ==
"sinhl" ||
251 Name ==
"cosh" || Name ==
"coshf" || Name ==
"coshl" ||
252 Name ==
"tanh" || Name ==
"tanhf" || Name ==
"tanhl" ||
253 Name ==
"sqrt" || Name ==
"sqrtf" || Name ==
"sqrtl" ||
254 Name ==
"exp10" || Name ==
"exp10l" || Name ==
"exp10f")
258 if (Name ==
"pow" || Name ==
"powf" || Name ==
"powl" || Name ==
"exp2" ||
259 Name ==
"exp2l" || Name ==
"exp2f" || Name ==
"floor" ||
260 Name ==
"floorf" || Name ==
"ceil" || Name ==
"round" ||
261 Name ==
"ffs" || Name ==
"ffsl" || Name ==
"abs" || Name ==
"labs" ||
285 virtual std::optional<Instruction *>
290 virtual std::optional<Value *>
293 bool &KnownBitsComputed)
const {
301 SimplifyAndSetOp)
const {
319 int64_t BaseOffset,
bool HasBaseReg,
320 int64_t Scale,
unsigned AddrSpace,
322 int64_t ScalableOffset = 0)
const {
325 return !BaseGV && BaseOffset == 0 && (Scale == 0 || Scale == 1);
372 unsigned DataSize =
DL.getTypeStoreSize(DataType);
379 unsigned DataSize =
DL.getTypeStoreSize(DataType);
397 Align Alignment)
const {
402 Align Alignment)
const {
407 Align Alignment)
const {
427 unsigned AddrSpace)
const {
432 Type *DataType)
const {
450 bool HasBaseReg, int64_t Scale,
451 unsigned AddrSpace)
const {
454 Scale, AddrSpace,
nullptr,
466 virtual bool useAA()
const {
return false; }
487 unsigned ScalarOpdIdx)
const {
562 unsigned *
Fast)
const {
618 Type *Ty =
nullptr)
const {
625 return "Generic::Unknown Register Class";
627 return "Generic::ScalarRC";
629 return "Generic::VectorRC";
652 virtual std::optional<unsigned>
getMaxVScale()
const {
return std::nullopt; }
666 virtual unsigned getMaximumVF(
unsigned ElemWidth,
unsigned Opcode)
const {
675 const Instruction &
I,
bool &AllowPromotionWithoutCommonHeader)
const {
676 AllowPromotionWithoutCommonHeader =
false;
681 virtual std::optional<unsigned>
692 virtual std::optional<unsigned>
708 unsigned NumStridedMemAccesses,
709 unsigned NumPrefetches,
710 bool HasCall)
const {
718 unsigned Opcode,
Type *InputTypeA,
Type *InputTypeB,
Type *AccumType,
733 auto IsWidenableCondition = [](
const Value *V) {
735 if (
II->getIntrinsicID() == Intrinsic::experimental_widenable_condition)
744 case Instruction::FDiv:
745 case Instruction::FRem:
746 case Instruction::SDiv:
747 case Instruction::SRem:
748 case Instruction::UDiv:
749 case Instruction::URem:
752 case Instruction::And:
753 case Instruction::Or:
754 if (
any_of(Args, IsWidenableCondition))
761 if (Ty->getScalarType()->isFloatingPointTy())
789 case Instruction::IntToPtr: {
790 unsigned SrcSize = Src->getScalarSizeInBits();
791 if (
DL.isLegalInteger(SrcSize) &&
792 SrcSize <=
DL.getPointerTypeSizeInBits(Dst))
796 case Instruction::PtrToAddr: {
797 unsigned DstSize = Dst->getScalarSizeInBits();
798 assert(DstSize ==
DL.getAddressSizeInBits(Src));
799 if (
DL.isLegalInteger(DstSize))
803 case Instruction::PtrToInt: {
804 unsigned DstSize = Dst->getScalarSizeInBits();
805 if (
DL.isLegalInteger(DstSize) &&
806 DstSize >=
DL.getPointerTypeSizeInBits(Src))
810 case Instruction::BitCast:
811 if (Dst == Src || (Dst->isPointerTy() && Src->isPointerTy()))
815 case Instruction::Trunc: {
864 ArrayRef<std::tuple<Value *, User *, int>> ScalarUserAndIdx,
879 unsigned Index)
const {
885 const APInt &DemandedDstElts,
896 if (Opcode == Instruction::InsertValue &&
912 bool UseMaskForCond,
bool UseMaskForGaps)
const {
919 switch (ICA.
getID()) {
922 case Intrinsic::allow_runtime_check:
923 case Intrinsic::allow_ubsan_check:
924 case Intrinsic::annotation:
925 case Intrinsic::assume:
926 case Intrinsic::sideeffect:
927 case Intrinsic::pseudoprobe:
928 case Intrinsic::arithmetic_fence:
929 case Intrinsic::dbg_assign:
930 case Intrinsic::dbg_declare:
931 case Intrinsic::dbg_value:
932 case Intrinsic::dbg_label:
933 case Intrinsic::invariant_start:
934 case Intrinsic::invariant_end:
935 case Intrinsic::launder_invariant_group:
936 case Intrinsic::strip_invariant_group:
937 case Intrinsic::is_constant:
938 case Intrinsic::lifetime_start:
939 case Intrinsic::lifetime_end:
940 case Intrinsic::experimental_noalias_scope_decl:
941 case Intrinsic::objectsize:
942 case Intrinsic::ptr_annotation:
943 case Intrinsic::var_annotation:
944 case Intrinsic::experimental_gc_result:
945 case Intrinsic::experimental_gc_relocate:
946 case Intrinsic::coro_alloc:
947 case Intrinsic::coro_begin:
948 case Intrinsic::coro_begin_custom_abi:
949 case Intrinsic::coro_dead:
950 case Intrinsic::coro_id:
951 case Intrinsic::coro_id_async:
952 case Intrinsic::coro_id_retcon:
953 case Intrinsic::coro_id_retcon_once:
954 case Intrinsic::coro_noop:
955 case Intrinsic::coro_free:
956 case Intrinsic::coro_end:
957 case Intrinsic::coro_frame:
958 case Intrinsic::coro_size:
959 case Intrinsic::coro_align:
960 case Intrinsic::coro_suspend:
961 case Intrinsic::coro_subfn_addr:
962 case Intrinsic::threadlocal_address:
963 case Intrinsic::experimental_widenable_condition:
964 case Intrinsic::ssa_copy:
967 case Intrinsic::bswap:
978 switch (MICA.
getID()) {
979 case Intrinsic::masked_scatter:
980 case Intrinsic::masked_gather:
981 case Intrinsic::masked_load:
982 case Intrinsic::masked_store:
983 case Intrinsic::vp_scatter:
984 case Intrinsic::vp_gather:
985 case Intrinsic::masked_compressstore:
986 case Intrinsic::masked_expandload:
1010 std::optional<FastMathFlags> FMF,
1023 VectorType *Ty, std::optional<FastMathFlags> FMF,
1055 bool CanCreate =
true)
const {
1061 unsigned SrcAddrSpace,
unsigned DestAddrSpace,
1063 std::optional<uint32_t> AtomicElementSize)
const {
1064 return AtomicElementSize ?
Type::getIntNTy(Context, *AtomicElementSize * 8)
1070 unsigned RemainingBytes,
unsigned SrcAddrSpace,
unsigned DestAddrSpace,
1072 std::optional<uint32_t> AtomicCpySize)
const {
1073 unsigned OpSizeInBytes = AtomicCpySize.value_or(1);
1075 for (
unsigned i = 0; i != RemainingBytes; i += OpSizeInBytes)
1081 return (Caller->getFnAttribute(
"target-cpu") ==
1082 Callee->getFnAttribute(
"target-cpu")) &&
1083 (Caller->getFnAttribute(
"target-features") ==
1084 Callee->getFnAttribute(
"target-features"));
1088 unsigned DefaultCallPenalty)
const {
1089 return DefaultCallPenalty;
1102 return (Caller->getFnAttribute(
"target-cpu") ==
1103 Callee->getFnAttribute(
"target-cpu")) &&
1104 (Caller->getFnAttribute(
"target-features") ==
1105 Callee->getFnAttribute(
"target-features"));
1126 unsigned AddrSpace)
const {
1132 unsigned AddrSpace)
const {
1146 unsigned ChainSizeInBytes,
1152 unsigned ChainSizeInBytes,
1258 unsigned MaxRequiredSize =
1259 VT->getElementType()->getPrimitiveSizeInBits().getFixedValue();
1261 unsigned MinRequiredSize = 0;
1262 for (
unsigned i = 0, e = VT->getNumElements(); i < e; ++i) {
1263 if (
auto *IntElement =
1265 bool signedElement = IntElement->getValue().isNegative();
1267 unsigned ElementMinRequiredSize =
1268 IntElement->getValue().getSignificantBits() - 1;
1272 MinRequiredSize = std::max(MinRequiredSize, ElementMinRequiredSize);
1275 return MaxRequiredSize;
1278 return MinRequiredSize;
1282 isSigned = CI->getValue().isNegative();
1283 return CI->getValue().getSignificantBits() - 1;
1288 return Cast->getSrcTy()->getScalarSizeInBits() - 1;
1293 return Cast->getSrcTy()->getScalarSizeInBits();
1305 const SCEV *Ptr)
const {
1313 int64_t MergeDistance)
const {
1327template <
typename T>
1339 assert(PointeeType && Ptr &&
"can't get GEPCost of nullptr");
1341 bool HasBaseReg = (BaseGV ==
nullptr);
1343 auto PtrSizeBits =
DL.getPointerTypeSizeInBits(Ptr->
getType());
1344 APInt BaseOffset(PtrSizeBits, 0);
1348 Type *TargetType =
nullptr;
1352 if (Operands.
empty())
1355 for (
auto I = Operands.
begin();
I != Operands.
end(); ++
I, ++GTI) {
1356 TargetType = GTI.getIndexedType();
1363 if (
StructType *STy = GTI.getStructTypeOrNull()) {
1365 assert(ConstIdx &&
"Unexpected GEP index");
1367 BaseOffset +=
DL.getStructLayout(STy)->getElementOffset(
Field);
1373 int64_t ElementSize =
1374 GTI.getSequentialElementStride(
DL).getFixedValue();
1383 Scale = ElementSize;
1398 AccessType = TargetType;
1429 for (
const Value *V : Ptrs) {
1433 if (Info.isSameBase() && V !=
Base) {
1434 if (
GEP->hasAllConstantIndices())
1438 {TTI::OK_AnyValue, TTI::OP_None}, {TTI::OK_AnyValue, TTI::OP_None},
1443 GEP->getSourceElementType(),
GEP->getPointerOperand(), Indices,
1455 auto *TargetTTI =
static_cast<const T *
>(
this);
1460 if (
const Function *
F = CB->getCalledFunction()) {
1461 if (!TargetTTI->isLoweredToCall(
F))
1470 Type *Ty = U->getType();
1476 case Instruction::Call: {
1480 return TargetTTI->getIntrinsicInstrCost(CostAttrs,
CostKind);
1482 case Instruction::UncondBr:
1483 case Instruction::CondBr:
1484 case Instruction::Ret:
1485 case Instruction::PHI:
1486 case Instruction::Switch:
1487 return TargetTTI->getCFInstrCost(Opcode,
CostKind,
I);
1488 case Instruction::Freeze:
1490 case Instruction::ExtractValue:
1491 case Instruction::InsertValue:
1492 return TargetTTI->getInsertExtractValueCost(Opcode,
CostKind);
1493 case Instruction::Alloca:
1497 case Instruction::GetElementPtr: {
1499 Type *AccessType =
nullptr;
1502 if (
GEP->hasOneUser() &&
I)
1503 AccessType =
I->user_back()->getAccessType();
1505 return TargetTTI->getGEPCost(
GEP->getSourceElementType(),
1509 case Instruction::Add:
1510 case Instruction::FAdd:
1511 case Instruction::Sub:
1512 case Instruction::FSub:
1513 case Instruction::Mul:
1514 case Instruction::FMul:
1515 case Instruction::UDiv:
1516 case Instruction::SDiv:
1517 case Instruction::FDiv:
1518 case Instruction::URem:
1519 case Instruction::SRem:
1520 case Instruction::FRem:
1521 case Instruction::Shl:
1522 case Instruction::LShr:
1523 case Instruction::AShr:
1524 case Instruction::And:
1525 case Instruction::Or:
1526 case Instruction::Xor:
1527 case Instruction::FNeg: {
1530 if (Opcode != Instruction::FNeg)
1532 return TargetTTI->getArithmeticInstrCost(Opcode, Ty,
CostKind, Op1Info,
1533 Op2Info, Operands,
I);
1535 case Instruction::IntToPtr:
1536 case Instruction::PtrToAddr:
1537 case Instruction::PtrToInt:
1538 case Instruction::SIToFP:
1539 case Instruction::UIToFP:
1540 case Instruction::FPToUI:
1541 case Instruction::FPToSI:
1542 case Instruction::Trunc:
1543 case Instruction::FPTrunc:
1544 case Instruction::BitCast:
1545 case Instruction::FPExt:
1546 case Instruction::SExt:
1547 case Instruction::ZExt:
1548 case Instruction::AddrSpaceCast: {
1549 Type *OpTy = Operands[0]->getType();
1550 return TargetTTI->getCastInstrCost(
1553 case Instruction::Store: {
1555 Type *ValTy = Operands[0]->getType();
1557 return TargetTTI->getMemoryOpCost(Opcode, ValTy,
SI->getAlign(),
1561 case Instruction::Load: {
1563 Type *LoadType = U->getType();
1574 LoadType = TI->getDestTy();
1576 return TargetTTI->getMemoryOpCost(Opcode, LoadType, LI->getAlign(),
1578 {TTI::OK_AnyValue, TTI::OP_None},
I);
1580 case Instruction::Select: {
1581 const Value *Op0, *Op1;
1592 return TargetTTI->getArithmeticInstrCost(
1594 CostKind, Op1Info, Op2Info, Operands,
I);
1598 Type *CondTy = Operands[0]->getType();
1599 return TargetTTI->getCmpSelInstrCost(Opcode, U->getType(), CondTy,
1603 case Instruction::ICmp:
1604 case Instruction::FCmp: {
1607 Type *ValTy = Operands[0]->getType();
1609 return TargetTTI->getCmpSelInstrCost(Opcode, ValTy, U->getType(),
1614 case Instruction::InsertElement: {
1620 if (CI->getValue().getActiveBits() <= 32)
1621 Idx = CI->getZExtValue();
1622 return TargetTTI->getVectorInstrCost(*IE, Ty,
CostKind, Idx,
1625 case Instruction::ShuffleVector: {
1633 int NumSubElts, SubIndex;
1636 if (
all_of(Mask, [](
int M) {
return M < 0; }))
1640 if (Shuffle->changesLength()) {
1642 if (Shuffle->increasesLength() && Shuffle->isIdentityWithPadding())
1645 if (Shuffle->isExtractSubvectorMask(SubIndex))
1647 VecSrcTy, Mask,
CostKind, SubIndex,
1648 VecTy, Operands, Shuffle);
1650 if (Shuffle->isInsertSubvectorMask(NumSubElts, SubIndex))
1651 return TargetTTI->getShuffleCost(
1657 int ReplicationFactor, VF;
1658 if (Shuffle->isReplicationMask(ReplicationFactor, VF)) {
1662 DemandedDstElts.
setBit(
I.index());
1664 return TargetTTI->getReplicationShuffleCost(
1665 VecSrcTy->getElementType(), ReplicationFactor, VF,
1670 NumSubElts = VecSrcTy->getElementCount().getKnownMinValue();
1676 if (Shuffle->increasesLength()) {
1677 for (
int &M : AdjustMask)
1678 M = M >= NumSubElts ? (M + (Mask.size() - NumSubElts)) : M;
1680 return TargetTTI->getShuffleCost(
1682 VecTy, AdjustMask,
CostKind, 0,
nullptr, Operands, Shuffle);
1693 VecSrcTy, VecSrcTy, AdjustMask,
CostKind, 0,
nullptr, Operands,
1697 std::iota(ExtractMask.
begin(), ExtractMask.
end(), 0);
1698 return ShuffleCost + TargetTTI->getShuffleCost(
1700 ExtractMask,
CostKind, 0, VecTy, {}, Shuffle);
1703 if (Shuffle->isIdentity())
1706 if (Shuffle->isReverse())
1707 return TargetTTI->getShuffleCost(
TTI::SK_Reverse, VecTy, VecSrcTy, Mask,
1711 if (Shuffle->isTranspose())
1713 Mask,
CostKind, 0,
nullptr, Operands,
1716 if (Shuffle->isZeroEltSplat())
1718 Mask,
CostKind, 0,
nullptr, Operands,
1721 if (Shuffle->isSingleSource())
1723 VecSrcTy, Mask,
CostKind, 0,
nullptr,
1726 if (Shuffle->isInsertSubvectorMask(NumSubElts, SubIndex))
1727 return TargetTTI->getShuffleCost(
1732 if (Shuffle->isSelect())
1733 return TargetTTI->getShuffleCost(
TTI::SK_Select, VecTy, VecSrcTy, Mask,
1737 if (Shuffle->isSplice(SubIndex))
1738 return TargetTTI->getShuffleCost(
TTI::SK_Splice, VecTy, VecSrcTy, Mask,
1739 CostKind, SubIndex,
nullptr, Operands,
1743 Mask,
CostKind, 0,
nullptr, Operands,
1746 case Instruction::ExtractElement: {
1752 if (CI->getValue().getActiveBits() <= 32)
1753 Idx = CI->getZExtValue();
1754 Type *DstTy = Operands[0]->getType();
1755 return TargetTTI->getVectorInstrCost(*EEI, DstTy,
CostKind, Idx);
1764 auto *TargetTTI =
static_cast<const T *
>(
this);
assert(UImm &&(UImm !=~static_cast< T >(0)) &&"Invalid immediate!")
static cl::opt< OutputCostKind > CostKind("cost-kind", cl::desc("Target cost kind"), cl::init(OutputCostKind::RecipThroughput), cl::values(clEnumValN(OutputCostKind::RecipThroughput, "throughput", "Reciprocal throughput"), clEnumValN(OutputCostKind::Latency, "latency", "Instruction latency"), clEnumValN(OutputCostKind::CodeSize, "code-size", "Code size"), clEnumValN(OutputCostKind::SizeAndLatency, "size-latency", "Code size and latency"), clEnumValN(OutputCostKind::All, "all", "Print all cost kinds")))
static bool isSigned(unsigned Opcode)
const AbstractManglingParser< Derived, Alloc >::OperatorInfo AbstractManglingParser< Derived, Alloc >::Ops[]
uint64_t IntrinsicInst * II
OptimizedStructLayoutField Field
static SymbolRef::Type getType(const Symbol *Sym)
static void computeKnownBits(const Value *V, const APInt &DemandedElts, KnownBits &Known, const SimplifyQuery &Q, unsigned Depth)
Determine which bits of V are known to be either zero or one and return them in the Known bit set.
Class for arbitrary precision integers.
void setBit(unsigned BitPosition)
Set the given bit to 1 whose position is given as "bitPosition".
unsigned getBitWidth() const
Return the number of bits in the APInt.
LLVM_ABI APInt sextOrTrunc(unsigned width) const
Sign extend or truncate to width.
static APInt getZero(unsigned numBits)
Get the '0' value for the specified bit-width.
int64_t getSExtValue() const
Get sign extended value.
This class represents a conversion between pointers from one address space to another.
an instruction to allocate memory on the stack
Represent a constant reference to an array (0 or more elements consecutively in memory),...
ArrayRef< T > drop_front(size_t N=1) const
Drop the first N elements of the array.
const T & front() const
Get the first element.
bool empty() const
Check if the array is empty.
Class to represent array types.
A cache of @llvm.assume calls within a function.
Functions, function parameters, and return types can have attributes to indicate how they should be t...
BlockFrequencyInfo pass uses BlockFrequencyInfoImpl implementation to estimate IR basic block frequen...
Base class for all callable instructions (InvokeInst and CallInst) Holds everything related to callin...
Predicate
This enumeration lists the possible predicates for CmpInst subclasses.
Conditional Branch instruction.
This is the shared class of boolean and integer constants.
uint64_t getZExtValue() const
Return the constant as a 64-bit unsigned integer value after it has been zero extended as appropriate...
const APInt & getValue() const
Return the constant as an APInt value reference.
This is an important base class in LLVM.
A parsed version of the target data layout string in and methods for querying it.
Concrete subclass of DominatorTreeBase that is used to compute a normal dominator tree.
static constexpr ElementCount get(ScalarTy MinVal, bool Scalable)
Convenience struct for specifying and reasoning about fast-math flags.
static LLVM_ABI FixedVectorType * get(Type *ElementType, unsigned NumElts)
The core instruction combiner logic.
static InstructionCost getInvalid(CostType Val=0)
Type * getReturnType() const
Intrinsic::ID getID() const
A wrapper class for inspecting calls to intrinsic functions.
This is an important class for using LLVM in a threaded context.
An instruction for reading from memory.
Represents a single loop in the control flow graph.
Information for memory intrinsic cost model.
Intrinsic::ID getID() const
unsigned getOpcode() const
Return the opcode for this Instruction or ConstantExpr.
Analysis providing profile information.
The RecurrenceDescriptor is used to identify recurrences variables in a loop.
This node represents a polynomial recurrence on the trip count of the specified loop.
SCEVUse getStepRecurrence(ScalarEvolution &SE) const
Constructs and returns the recurrence indicating how much this expression steps by.
This class represents a constant integer value.
const APInt & getAPInt() const
This class represents an analyzed expression in the program.
The main scalar evolution driver.
This is a 'bitvector' (really, a variable-sized bit array), optimized for the case when the array is ...
This class consists of common code factored out of the SmallVector class to reduce code duplication b...
void append(ItTy in_start, ItTy in_end)
Add the specified range to the end of the SmallVector.
void push_back(const T &Elt)
This is a 'vector' (really, a variable-sized array), optimized for the case when the array is small.
StackOffset holds a fixed and a scalable offset in bytes.
static StackOffset getScalable(int64_t Scalable)
static StackOffset getFixed(int64_t Fixed)
An instruction for storing to memory.
Represent a constant reference to a string, i.e.
Class to represent struct types.
Provides information about what library functions are available for the current target.
This class represents a truncation of integer types.
static constexpr TypeSize get(ScalarTy Quantity, bool Scalable)
The instances of the Type class are immutable: once they are created, they are never changed.
bool isVectorTy() const
True if this is an instance of VectorType.
LLVM_ABI bool isScalableTy(SmallPtrSetImpl< const Type * > &Visited) const
Return true if this is a type whose size is a known multiple of vscale.
LLVM_ABI unsigned getPointerAddressSpace() const
Get the address space of this pointer or pointer vector type.
static LLVM_ABI IntegerType * getInt8Ty(LLVMContext &C)
LLVM_ABI unsigned getScalarSizeInBits() const LLVM_READONLY
If this is a vector type, return the getPrimitiveSizeInBits value for the element type.
bool isPtrOrPtrVectorTy() const
Return true if this is a pointer type or a vector of pointer types.
static LLVM_ABI IntegerType * getIntNTy(LLVMContext &C, unsigned N)
This is the common base class for vector predication intrinsics.
LLVM Value Representation.
Type * getType() const
All values are typed, get the type of this value.
LLVM_ABI const Value * stripPointerCasts() const
Strip off pointer casts, all-zero GEPs and address space casts.
Base class of all SIMD vector types.
constexpr ScalarTy getFixedValue() const
constexpr bool isScalable() const
Returns whether the quantity is scaled by a runtime quantity (vscale).
#define llvm_unreachable(msg)
Marks that the current location is not supposed to be reachable.
unsigned ID
LLVM IR allows to use arbitrary numbers as calling convention identifiers.
@ Fast
Attempts to make calls as fast as possible (e.g.
@ C
The default llvm calling convention, compatible with C.
This namespace contains an enum with a value for every intrinsic/builtin function known by LLVM.
match_combine_or< Ty... > m_CombineOr(const Ty &...Ps)
Combine pattern matchers matching any of Ps patterns.
LogicalOp_match< LHS, RHS, Instruction::And > m_LogicalAnd(const LHS &L, const RHS &R)
Matches L && R either in the form of L & R or L ?
bool match(Val *V, const Pattern &P)
ThreeOps_match< Cond, LHS, RHS, Instruction::Select > m_Select(const Cond &C, const LHS &L, const RHS &R)
Matches SelectInst.
auto m_Value()
Match an arbitrary value and ignore it.
auto m_Constant()
Match an arbitrary Constant and ignore it.
auto m_LogicalOr()
Matches L || R where L and R are arbitrary values.
auto m_LogicalAnd()
Matches L && R where L and R are arbitrary values.
LogicalOp_match< LHS, RHS, Instruction::Or > m_LogicalOr(const LHS &L, const RHS &R)
Matches L || R either in the form of L | R or L ?
This is an optimization pass for GlobalISel generic memory operations.
bool all_of(R &&range, UnaryPredicate P)
Provide wrappers to std::all_of which take ranges instead of having to pass begin/end explicitly.
auto enumerate(FirstRange &&First, RestRanges &&...Rest)
Given two or more input ranges, returns a new range whose values are tuples (A, B,...
decltype(auto) dyn_cast(const From &Val)
dyn_cast<X> - Return the argument parameter cast to the specified type.
FunctionAddr VTableAddr uintptr_t uintptr_t DataSize
constexpr bool isPowerOf2_64(uint64_t Value)
Return true if the argument is a power of two > 0 (64 bit edition.)
LLVM_ABI Value * getSplatValue(const Value *V)
Get splat value if the input is a splat vector or return nullptr.
bool any_of(R &&range, UnaryPredicate P)
Provide wrappers to std::any_of which take ranges instead of having to pass begin/end explicitly.
constexpr bool isPowerOf2_32(uint32_t Value)
Return true if the argument is a power of two > 0.
bool isa(const From &Val)
isa<X> - Return true if the parameter to the template is an instance of one of the template type argu...
constexpr int PoisonMaskElem
RecurKind
These are the kinds of recurrences that we support.
constexpr unsigned BitWidth
decltype(auto) cast(const From &Val)
cast<X> - Return the argument parameter cast to the specified type.
gep_type_iterator gep_type_begin(const User *GEP)
@ DataWithoutLaneMask
Same as Data, but avoids using the get.active.lane.mask intrinsic to calculate the mask and instead i...
ValueUniformity
Enum describing how values behave with respect to uniformity and divergence, to answer the question: ...
@ Default
The result value is uniform if and only if all operands are uniform.
This struct is a compact representation of a valid (non-zero power of two) alignment.
Attributes of a target dependent hardware loop.
KnownBits anyextOrTrunc(unsigned BitWidth) const
Return known bits for an "any" extension or truncation of the value we're tracking.
Information about a load/store intrinsic defined by the target.