doxygen/X86TargetTransformInfo_8h_source.html

//===-- X86TargetTransformInfo.h - X86 specific TTI -------------*- C++ -*-===//

//

// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.

// See https://llvm.org/LICENSE.txt for license information.

// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception

//

//===----------------------------------------------------------------------===//

/// \file

/// This file defines a TargetTransformInfo::Concept conforming object specific

/// to the X86 target machine. It uses the target's detailed information to

/// provide more precise answers to certain TTI queries, while letting the

/// target independent and default TTI implementations handle the rest.

///

//===----------------------------------------------------------------------===//


#ifndef LLVM_LIB_TARGET_X86_X86TARGETTRANSFORMINFO_H

#define LLVM_LIB_TARGET_X86_X86TARGETTRANSFORMINFO_H


#include "X86TargetMachine.h"

#include "llvm/Analysis/TargetTransformInfo.h"

#include "llvm/CodeGen/BasicTTIImpl.h"

#include <optional>


namespace llvm {


class InstCombiner;


/// X86-specific TTI implementation built on the CRTP helper
/// BasicTTIImplBase<X86TTIImpl>. An instance holds the X86Subtarget selected
/// for the function it was constructed with, plus that subtarget's
/// X86TargetLowering. Apart from a few trivial inline forwarders, the member
/// functions are only declared here and are defined out of line.
class X86TTIImpl : public BasicTTIImplBase<X86TTIImpl> {

  // Shorthand for the CRTP base class.
  typedef BasicTTIImplBase<X86TTIImpl> BaseT;

  // Shorthand for TargetTransformInfo, used in the signatures below.
  typedef TargetTransformInfo TTI;

  // The base class is granted access to the private members of this class
  // (including getST() / getTLI() below).
  friend BaseT;


  // Subtarget that the target machine selected for the constructor's function.
  const X86Subtarget *ST;

  // Target lowering object obtained from ST in the constructor.
  const X86TargetLowering *TLI;


  // Private accessors for the two cached pointers above.
  const X86Subtarget *getST() const { return ST; }

  const X86TargetLowering *getTLI() const { return TLI; }


  // Per-instance set of subtarget feature bits, grouped below by category.
  // NOTE(review): presumably the features that are ignored when comparing
  // caller and callee in areInlineCompatible(); the use site is not visible
  // in this header -- confirm against the out-of-line definition.
  const FeatureBitset InlineFeatureIgnoreList = {

      // This indicates the CPU is 64 bit capable not that we are in 64-bit

      // mode.

      X86::FeatureX86_64,


      // These features don't have any intrinsics or ABI effect.

      X86::FeatureNOPL,

      X86::FeatureCX16,

      X86::FeatureLAHFSAHF64,


      // Some older targets can be setup to fold unaligned loads.

      X86::FeatureSSEUnalignedMem,


      // Codegen control options.

      X86::TuningFast11ByteNOP,

      X86::TuningFast15ByteNOP,

      X86::TuningFastBEXTR,

      X86::TuningFastHorizontalOps,

      X86::TuningFastLZCNT,

      X86::TuningFastScalarFSQRT,

      X86::TuningFastSHLDRotate,

      X86::TuningFastScalarShiftMasks,

      X86::TuningFastVectorShiftMasks,

      X86::TuningFastVariableCrossLaneShuffle,

      X86::TuningFastVariablePerLaneShuffle,

      X86::TuningFastVectorFSQRT,

      X86::TuningLEAForSP,

      X86::TuningLEAUsesAG,

      X86::TuningLZCNTFalseDeps,

      X86::TuningBranchFusion,

      X86::TuningMacroFusion,

      X86::TuningPadShortFunctions,

      X86::TuningPOPCNTFalseDeps,

      X86::TuningMULCFalseDeps,

      X86::TuningPERMFalseDeps,

      X86::TuningRANGEFalseDeps,

      X86::TuningGETMANTFalseDeps,

      X86::TuningMULLQFalseDeps,

      X86::TuningSlow3OpsLEA,

      X86::TuningSlowDivide32,

      X86::TuningSlowDivide64,

      X86::TuningSlowIncDec,

      X86::TuningSlowLEA,

      X86::TuningSlowPMADDWD,

      X86::TuningSlowPMULLD,

      X86::TuningSlowSHLD,

      X86::TuningSlowTwoMemOps,

      X86::TuningSlowUAMem16,

      X86::TuningPreferMaskRegisters,

      X86::TuningInsertVZEROUPPER,

      X86::TuningUseSLMArithCosts,

      X86::TuningUseGLMDivSqrtCosts,

      X86::TuningNoDomainDelay,

      X86::TuningNoDomainDelayMov,

      X86::TuningNoDomainDelayShuffle,

      X86::TuningNoDomainDelayBlend,

      X86::TuningPreferShiftShuffle,

      X86::TuningFastImmVectorShift,

      X86::TuningFastDPWSSD,


      // Perf-tuning flags.

      X86::TuningFastGather,

      X86::TuningSlowUAMem32,

      X86::TuningAllowLight256Bit,


      // Based on whether user set the -mprefer-vector-width command line.

      X86::TuningPrefer128Bit,

      X86::TuningPrefer256Bit,


      // CPU name enums. These just follow CPU string.

      X86::ProcIntelAtom

  };


public:

  /// Build the TTI for function \p F: forwards \p TM and F's DataLayout to
  /// the base class, then caches the subtarget \p TM selects for \p F and
  /// that subtarget's target lowering. ST is declared before TLI, so it is
  /// initialized first; the TLI initializer dereferences it.
  explicit X86TTIImpl(const X86TargetMachine *TM, const Function &F)

      : BaseT(TM, F.getDataLayout()), ST(TM->getSubtargetImpl(F)),

        TLI(ST->getTargetLowering()) {}


  /// \name Scalar TTI Implementations

  /// @{

  TTI::PopcntSupportKind getPopcntSupport(unsigned TyWidth);


  /// @}


  /// \name Cache TTI Implementation

  /// @{

  // Both cache queries are marked `override`, i.e. they replace virtual
  // functions inherited through BaseT, and return std::optional<unsigned>.
  std::optional<unsigned> getCacheSize(

    TargetTransformInfo::CacheLevel Level) const override;

  std::optional<unsigned> getCacheAssociativity(

    TargetTransformInfo::CacheLevel Level) const override;

  /// @}


  /// \name Vector TTI Implementations

  /// @{


  unsigned getNumberOfRegisters(unsigned ClassID) const;

  bool hasConditionalLoadStoreForType(Type *Ty = nullptr) const;

  TypeSize getRegisterBitWidth(TargetTransformInfo::RegisterKind K) const;

  unsigned getLoadStoreVecRegBitWidth(unsigned AS) const;

  unsigned getMaxInterleaveFactor(ElementCount VF);

  // Operand infos default to {OK_AnyValue, OP_None}; Args defaults to
  // std::nullopt and CxtI to nullptr.
  InstructionCost getArithmeticInstrCost(

      unsigned Opcode, Type *Ty, TTI::TargetCostKind CostKind,

      TTI::OperandValueInfo Op1Info = {TTI::OK_AnyValue, TTI::OP_None},

      TTI::OperandValueInfo Op2Info = {TTI::OK_AnyValue, TTI::OP_None},

      ArrayRef<const Value *> Args = std::nullopt,

      const Instruction *CxtI = nullptr);

  InstructionCost getAltInstrCost(VectorType *VecTy, unsigned Opcode0,

                                  unsigned Opcode1,

                                  const SmallBitVector &OpcodeMask,

                                  TTI::TargetCostKind CostKind) const;


  InstructionCost getShuffleCost(TTI::ShuffleKind Kind, VectorType *Tp,

                                 ArrayRef<int> Mask,

                                 TTI::TargetCostKind CostKind, int Index,

                                 VectorType *SubTp,

                                 ArrayRef<const Value *> Args = std::nullopt,

                                 const Instruction *CxtI = nullptr);

  InstructionCost getCastInstrCost(unsigned Opcode, Type *Dst, Type *Src,

                                   TTI::CastContextHint CCH,

                                   TTI::TargetCostKind CostKind,

                                   const Instruction *I = nullptr);

  InstructionCost getCmpSelInstrCost(unsigned Opcode, Type *ValTy, Type *CondTy,

                                     CmpInst::Predicate VecPred,

                                     TTI::TargetCostKind CostKind,

                                     const Instruction *I = nullptr);

  // Keep the base class overloads of getVectorInstrCost visible; the
  // declaration that follows would otherwise hide all of them.
  using BaseT::getVectorInstrCost;

  InstructionCost getVectorInstrCost(unsigned Opcode, Type *Val,

                                     TTI::TargetCostKind CostKind,

                                     unsigned Index, Value *Op0, Value *Op1);

  InstructionCost getScalarizationOverhead(VectorType *Ty,

                                           const APInt &DemandedElts,

                                           bool Insert, bool Extract,

                                           TTI::TargetCostKind CostKind);

  InstructionCost getReplicationShuffleCost(Type *EltTy, int ReplicationFactor,

                                            int VF,

                                            const APInt &DemandedDstElts,

                                            TTI::TargetCostKind CostKind);

  InstructionCost

  getMemoryOpCost(unsigned Opcode, Type *Src, MaybeAlign Alignment,

                  unsigned AddressSpace, TTI::TargetCostKind CostKind,

                  TTI::OperandValueInfo OpInfo = {TTI::OK_AnyValue, TTI::OP_None},

                  const Instruction *I = nullptr);

  InstructionCost getMaskedMemoryOpCost(unsigned Opcode, Type *Src,

                                        Align Alignment, unsigned AddressSpace,

                                        TTI::TargetCostKind CostKind);

  /// Calculate the cost of Gather / Scatter operation.
  InstructionCost getGatherScatterOpCost(unsigned Opcode, Type *DataTy,

                                         const Value *Ptr, bool VariableMask,

                                         Align Alignment,

                                         TTI::TargetCostKind CostKind,

                                         const Instruction *I);

  InstructionCost getPointersChainCost(ArrayRef<const Value *> Ptrs,

                                       const Value *Base,

                                       const TTI::PointersChainInfo &Info,

                                       Type *AccessTy,

                                       TTI::TargetCostKind CostKind);

  InstructionCost getAddressComputationCost(Type *PtrTy, ScalarEvolution *SE,

                                            const SCEV *Ptr);


  // InstCombine hooks. Each returns a std::optional; InstCombiner is only
  // forward-declared in this header.
  std::optional<Instruction *> instCombineIntrinsic(InstCombiner &IC,

                                                    IntrinsicInst &II) const;

  std::optional<Value *>

  simplifyDemandedUseBitsIntrinsic(InstCombiner &IC, IntrinsicInst &II,

                                   APInt DemandedMask, KnownBits &Known,

                                   bool &KnownBitsComputed) const;

  std::optional<Value *> simplifyDemandedVectorEltsIntrinsic(

      InstCombiner &IC, IntrinsicInst &II, APInt DemandedElts, APInt &UndefElts,

      APInt &UndefElts2, APInt &UndefElts3,

      std::function<void(Instruction *, unsigned, APInt, APInt &)>

          SimplifyAndSetOp) const;


  unsigned getAtomicMemIntrinsicMaxElementSize() const;


  InstructionCost getIntrinsicInstrCost(const IntrinsicCostAttributes &ICA,

                                        TTI::TargetCostKind CostKind);


  InstructionCost getArithmeticReductionCost(unsigned Opcode, VectorType *Ty,

                                             std::optional<FastMathFlags> FMF,

                                             TTI::TargetCostKind CostKind);


  InstructionCost getMinMaxCost(Intrinsic::ID IID, Type *Ty,

                                TTI::TargetCostKind CostKind,

                                FastMathFlags FMF);


  InstructionCost getMinMaxReductionCost(Intrinsic::ID IID, VectorType *Ty,

                                         FastMathFlags FMF,

                                         TTI::TargetCostKind CostKind);


  InstructionCost getInterleavedMemoryOpCost(

      unsigned Opcode, Type *VecTy, unsigned Factor, ArrayRef<unsigned> Indices,

      Align Alignment, unsigned AddressSpace, TTI::TargetCostKind CostKind,

      bool UseMaskForCond = false, bool UseMaskForGaps = false);

  // Same parameter list as getInterleavedMemoryOpCost except that VecTy is a
  // FixedVectorType. NOTE(review): presumably the AVX512 path taken by
  // getInterleavedMemoryOpCost -- confirm in the .cpp.
  InstructionCost getInterleavedMemoryOpCostAVX512(

      unsigned Opcode, FixedVectorType *VecTy, unsigned Factor,

      ArrayRef<unsigned> Indices, Align Alignment, unsigned AddressSpace,

      TTI::TargetCostKind CostKind, bool UseMaskForCond = false,

      bool UseMaskForGaps = false);


  /// Calculate the cost of materializing a 64-bit value.
  InstructionCost getIntImmCost(int64_t);


  InstructionCost getIntImmCost(const APInt &Imm, Type *Ty,

                                TTI::TargetCostKind CostKind);


  InstructionCost getCFInstrCost(unsigned Opcode, TTI::TargetCostKind CostKind,

                                 const Instruction *I = nullptr);


  InstructionCost getIntImmCostInst(unsigned Opcode, unsigned Idx,

                                    const APInt &Imm, Type *Ty,

                                    TTI::TargetCostKind CostKind,

                                    Instruction *Inst = nullptr);

  InstructionCost getIntImmCostIntrin(Intrinsic::ID IID, unsigned Idx,

                                      const APInt &Imm, Type *Ty,

                                      TTI::TargetCostKind CostKind);

  /// Return the cost of the scaling factor used in the addressing

  /// mode represented by AM for this target, for a load/store

  /// of the specified type.

  /// If the AM is supported, the return value must be >= 0.

  /// If the AM is not supported, it returns a negative value.

  InstructionCost getScalingFactorCost(Type *Ty, GlobalValue *BaseGV,

                                       StackOffset BaseOffset, bool HasBaseReg,

                                       int64_t Scale, unsigned AddrSpace) const;


  bool isLSRCostLess(const TargetTransformInfo::LSRCost &C1,

                     const TargetTransformInfo::LSRCost &C2);

  bool canMacroFuseCmp();

  bool isLegalMaskedLoad(Type *DataType, Align Alignment);

  bool isLegalMaskedStore(Type *DataType, Align Alignment);

  bool isLegalNTLoad(Type *DataType, Align Alignment);

  bool isLegalNTStore(Type *DataType, Align Alignment);

  bool isLegalBroadcastLoad(Type *ElementTy, ElementCount NumElements) const;

  bool forceScalarizeMaskedGather(VectorType *VTy, Align Alignment);

  /// Scatter gives the same answer as gather: this simply forwards to
  /// forceScalarizeMaskedGather() with the same arguments.
  bool forceScalarizeMaskedScatter(VectorType *VTy, Align Alignment) {

    return forceScalarizeMaskedGather(VTy, Alignment);

  }

  bool isLegalMaskedGatherScatter(Type *DataType, Align Alignment);

  bool isLegalMaskedGather(Type *DataType, Align Alignment);

  bool isLegalMaskedScatter(Type *DataType, Align Alignment);

  bool isLegalMaskedExpandLoad(Type *DataType, Align Alignment);

  bool isLegalMaskedCompressStore(Type *DataType, Align Alignment);

  bool isLegalAltInstr(VectorType *VecTy, unsigned Opcode0, unsigned Opcode1,

                       const SmallBitVector &OpcodeMask) const;

  bool hasDivRemOp(Type *DataType, bool IsSigned);

  bool isExpensiveToSpeculativelyExecute(const Instruction *I);

  bool isFCmpOrdCheaperThanFCmpZero(Type *Ty);

  bool areInlineCompatible(const Function *Caller,

                           const Function *Callee) const;

  // Note: the last parameter is itself named `Type`, the same identifier as
  // the class used in its ArrayRef<Type *> element type.
  bool areTypesABICompatible(const Function *Caller, const Function *Callee,

                             const ArrayRef<Type *> &Type) const;


  /// Returns whatever the cached subtarget reports from
  /// getMaxInlineSizeThreshold().
  uint64_t getMaxMemIntrinsicInlineSizeThreshold() const {

    return ST->getMaxInlineSizeThreshold();

  }


  TTI::MemCmpExpansionOptions enableMemCmpExpansion(bool OptSize,

                                                    bool IsZeroCmp) const;

  bool prefersVectorizedAddressing() const;

  bool supportsEfficientVectorElementLoadStore() const;

  bool enableInterleavedAccessVectorization();


  InstructionCost getBranchMispredictPenalty() const;


private:

  // Private helpers, declared only; their definitions are out of line.
  // NOTE(review): by their names these support the gather/scatter cost and
  // legality queries above -- confirm against the .cpp.
  bool supportsGather() const;

  InstructionCost getGSVectorCost(unsigned Opcode, TTI::TargetCostKind CostKind,

                                  Type *DataTy, const Value *Ptr,

                                  Align Alignment, unsigned AddressSpace);


  int getGatherOverhead() const;

  int getScatterOverhead() const;


  // The marker below closes the "Vector TTI Implementations" Doxygen group
  // that was opened in the public section.
  /// @}

};


} // end namespace llvm


#endif

BasicTTIImpl.h
This file provides a helper that implements much of the TTI interface in terms of the target-independ...

Info
Analysis containing CSE Info
Definition: CSEInfo.cpp:27

CostKind
static cl::opt< TargetTransformInfo::TargetCostKind > CostKind("cost-kind", cl::desc("Target cost kind"), cl::init(TargetTransformInfo::TCK_RecipThroughput), cl::values(clEnumValN(TargetTransformInfo::TCK_RecipThroughput, "throughput", "Reciprocal throughput"), clEnumValN(TargetTransformInfo::TCK_Latency, "latency", "Instruction latency"), clEnumValN(TargetTransformInfo::TCK_CodeSize, "code-size", "Code size"), clEnumValN(TargetTransformInfo::TCK_SizeAndLatency, "size-latency", "Code size and latency")))

Idx
Returns the sub type a function will return at a given Idx. Should correspond to the result type of an ExtractValue instruction executed with just that one unsigned Idx.
Definition: DeadArgumentElimination.cpp:352

F
#define F(x, y, z)
Definition: MD5.cpp:55

I
#define I(x, y, z)
Definition: MD5.cpp:58

InstCombiner
Machine InstCombiner
Definition: MachineCombiner.cpp:137

II
uint64_t IntrinsicInst * II
Definition: NVVMIntrRange.cpp:52

TM
const char LLVMTargetMachineRef TM
Definition: PassBuilderBindings.cpp:48

Ptr
@ Ptr
Definition: TargetLibraryInfo.cpp:77

TargetTransformInfo.h
This pass exposes codegen information to IR-level passes.

X86TargetMachine.h

VectorType
Definition: ItaniumDemangle.h:1149

llvm::ArrayRef
ArrayRef - Represent a constant reference to an array (0 or more elements consecutively in memory),...
Definition: ArrayRef.h:41

llvm::BasicTTIImplBase
Base class which can be used to help build a TTI implementation.
Definition: BasicTTIImpl.h:81

llvm::BasicTTIImplBase< X86TTIImpl >::getVectorInstrCost
InstructionCost getVectorInstrCost(unsigned Opcode, Type *Val, TTI::TargetCostKind CostKind, unsigned Index, Value *Op0, Value *Op1)
Definition: BasicTTIImpl.h:1279

llvm::CmpInst::Predicate
Predicate
This enumeration lists the possible predicates for CmpInst subclasses.
Definition: InstrTypes.h:757

llvm::ElementCount
Definition: TypeSize.h:300

llvm::FeatureBitset
Container class for subtarget features.
Definition: SubtargetFeature.h:41

llvm::Function
Definition: Function.h:64

llvm::InstructionCost
Definition: InstructionCost.h:29

llvm::Instruction
Definition: Instruction.h:68

llvm::SmallBitVector
This is a 'bitvector' (really, a variable-sized bit array), optimized for the case when the array is ...
Definition: SmallBitVector.h:35

llvm::TargetTransformInfoImplBase::getDataLayout
const DataLayout & getDataLayout() const
Definition: TargetTransformInfoImpl.h:48

llvm::TargetTransformInfo
This pass provides access to the codegen interfaces that are needed for IR-level transformations.
Definition: TargetTransformInfo.h:214

llvm::TargetTransformInfo::TargetCostKind
TargetCostKind
The kind of cost model.
Definition: TargetTransformInfo.h:259

llvm::TargetTransformInfo::OP_None
@ OP_None
Definition: TargetTransformInfo.h:1090

llvm::TargetTransformInfo::RegisterKind
RegisterKind
Definition: TargetTransformInfo.h:1143

llvm::TargetTransformInfo::PopcntSupportKind
PopcntSupportKind
Flags indicating the kind of support for population count.
Definition: TargetTransformInfo.h:702

llvm::TargetTransformInfo::ShuffleKind
ShuffleKind
The various kinds of shuffle patterns for vector queries.
Definition: TargetTransformInfo.h:1061

llvm::TargetTransformInfo::CastContextHint
CastContextHint
Represents a hint about the context in which a cast is used.
Definition: TargetTransformInfo.h:1338

llvm::TargetTransformInfo::OK_AnyValue
@ OK_AnyValue
Definition: TargetTransformInfo.h:1082

llvm::TargetTransformInfo::CacheLevel
CacheLevel
The possible cache levels.
Definition: TargetTransformInfo.h:1202

llvm::TypeSize
Definition: TypeSize.h:334

llvm::Type
The instances of the Type class are immutable: once they are created, they are never changed.
Definition: Type.h:45

llvm::Value
LLVM Value Representation.
Definition: Value.h:74

llvm::VectorType
Base class of all SIMD vector types.
Definition: DerivedTypes.h:403

llvm::X86Subtarget
Definition: X86Subtarget.h:53

llvm::X86TTIImpl
Definition: X86TargetTransformInfo.h:28

llvm::X86TTIImpl::getInterleavedMemoryOpCostAVX512
InstructionCost getInterleavedMemoryOpCostAVX512(unsigned Opcode, FixedVectorType *VecTy, unsigned Factor, ArrayRef< unsigned > Indices, Align Alignment, unsigned AddressSpace, TTI::TargetCostKind CostKind, bool UseMaskForCond=false, bool UseMaskForGaps=false)
Definition: X86TargetTransformInfo.cpp:6256

llvm::X86TTIImpl::isLegalMaskedGather
bool isLegalMaskedGather(Type *DataType, Align Alignment)
Definition: X86TargetTransformInfo.cpp:6068

llvm::X86TTIImpl::getAltInstrCost
InstructionCost getAltInstrCost(VectorType *VecTy, unsigned Opcode0, unsigned Opcode1, const SmallBitVector &OpcodeMask, TTI::TargetCostKind CostKind) const
Definition: X86TargetTransformInfo.cpp:1518

llvm::X86TTIImpl::getCacheAssociativity
std::optional< unsigned > getCacheAssociativity(TargetTransformInfo::CacheLevel Level) const override
Definition: X86TargetTransformInfo.cpp:143

llvm::X86TTIImpl::getPopcntSupport
TTI::PopcntSupportKind getPopcntSupport(unsigned TyWidth)
Definition: X86TargetTransformInfo.cpp:105

llvm::X86TTIImpl::isLegalNTStore
bool isLegalNTStore(Type *DataType, Align Alignment)
Definition: X86TargetTransformInfo.cpp:5974

llvm::X86TTIImpl::enableInterleavedAccessVectorization
bool enableInterleavedAccessVectorization()
Definition: X86TargetTransformInfo.cpp:6245

llvm::X86TTIImpl::getIntImmCostIntrin
InstructionCost getIntImmCostIntrin(Intrinsic::ID IID, unsigned Idx, const APInt &Imm, Type *Ty, TTI::TargetCostKind CostKind)
Definition: X86TargetTransformInfo.cpp:5750

llvm::X86TTIImpl::isLegalNTLoad
bool isLegalNTLoad(Type *DataType, Align Alignment)
Definition: X86TargetTransformInfo.cpp:5963

llvm::X86TTIImpl::X86TTIImpl
X86TTIImpl(const X86TargetMachine *TM, const Function &F)
Definition: X86TargetTransformInfo.h:113

llvm::X86TTIImpl::getIntImmCostInst
InstructionCost getIntImmCostInst(unsigned Opcode, unsigned Idx, const APInt &Imm, Type *Ty, TTI::TargetCostKind CostKind, Instruction *Inst=nullptr)
Definition: X86TargetTransformInfo.cpp:5651

llvm::X86TTIImpl::instCombineIntrinsic
std::optional< Instruction * > instCombineIntrinsic(InstCombiner &IC, IntrinsicInst &II) const
Definition: X86InstCombineIntrinsic.cpp:2146

llvm::X86TTIImpl::forceScalarizeMaskedScatter
bool forceScalarizeMaskedScatter(VectorType *VTy, Align Alignment)
Definition: X86TargetTransformInfo.h:269

llvm::X86TTIImpl::simplifyDemandedUseBitsIntrinsic
std::optional< Value * > simplifyDemandedUseBitsIntrinsic(InstCombiner &IC, IntrinsicInst &II, APInt DemandedMask, KnownBits &Known, bool &KnownBitsComputed) const
Definition: X86InstCombineIntrinsic.cpp:3060

llvm::X86TTIImpl::isLegalMaskedGatherScatter
bool isLegalMaskedGatherScatter(Type *DataType, Align Alignment)
Definition: X86TargetTransformInfo.cpp:6053

llvm::X86TTIImpl::getScalingFactorCost
InstructionCost getScalingFactorCost(Type *Ty, GlobalValue *BaseGV, StackOffset BaseOffset, bool HasBaseReg, int64_t Scale, unsigned AddrSpace) const
Return the cost of the scaling factor used in the addressing mode represented by AM for this target,...
Definition: X86TargetTransformInfo.cpp:6725

llvm::X86TTIImpl::isLegalMaskedLoad
bool isLegalMaskedLoad(Type *DataType, Align Alignment)
Definition: X86TargetTransformInfo.cpp:5929

llvm::X86TTIImpl::hasConditionalLoadStoreForType
bool hasConditionalLoadStoreForType(Type *Ty=nullptr) const
Definition: X86TargetTransformInfo.cpp:179

llvm::X86TTIImpl::supportsEfficientVectorElementLoadStore
bool supportsEfficientVectorElementLoadStore() const
Definition: X86TargetTransformInfo.cpp:6241

llvm::X86TTIImpl::enableMemCmpExpansion
TTI::MemCmpExpansionOptions enableMemCmpExpansion(bool OptSize, bool IsZeroCmp) const
Definition: X86TargetTransformInfo.cpp:6213

llvm::X86TTIImpl::prefersVectorizedAddressing
bool prefersVectorizedAddressing() const
Definition: X86TargetTransformInfo.cpp:6237

llvm::X86TTIImpl::getLoadStoreVecRegBitWidth
unsigned getLoadStoreVecRegBitWidth(unsigned AS) const
Definition: X86TargetTransformInfo.cpp:223

llvm::X86TTIImpl::isLegalBroadcastLoad
bool isLegalBroadcastLoad(Type *ElementTy, ElementCount NumElements) const
Definition: X86TargetTransformInfo.cpp:5998

llvm::X86TTIImpl::getMaxMemIntrinsicInlineSizeThreshold
uint64_t getMaxMemIntrinsicInlineSizeThreshold() const
Definition: X86TargetTransformInfo.h:287

llvm::X86TTIImpl::getMinMaxReductionCost
InstructionCost getMinMaxReductionCost(Intrinsic::ID IID, VectorType *Ty, FastMathFlags FMF, TTI::TargetCostKind CostKind)
Definition: X86TargetTransformInfo.cpp:5432

llvm::X86TTIImpl::forceScalarizeMaskedGather
bool forceScalarizeMaskedGather(VectorType *VTy, Align Alignment)
Definition: X86TargetTransformInfo.cpp:6041

llvm::X86TTIImpl::getCacheSize
std::optional< unsigned > getCacheSize(TargetTransformInfo::CacheLevel Level) const override
Definition: X86TargetTransformInfo.cpp:113

llvm::X86TTIImpl::isLegalMaskedStore
bool isLegalMaskedStore(Type *DataType, Align Alignment)
Definition: X86TargetTransformInfo.cpp:5959

llvm::X86TTIImpl::getReplicationShuffleCost
InstructionCost getReplicationShuffleCost(Type *EltTy, int ReplicationFactor, int VF, const APInt &DemandedDstElts, TTI::TargetCostKind CostKind)
Definition: X86TargetTransformInfo.cpp:4787

llvm::X86TTIImpl::getGatherScatterOpCost
InstructionCost getGatherScatterOpCost(unsigned Opcode, Type *DataTy, const Value *Ptr, bool VariableMask, Align Alignment, TTI::TargetCostKind CostKind, const Instruction *I)
Calculate the cost of Gather / Scatter operation.
Definition: X86TargetTransformInfo.cpp:5888

llvm::X86TTIImpl::getInterleavedMemoryOpCost
InstructionCost getInterleavedMemoryOpCost(unsigned Opcode, Type *VecTy, unsigned Factor, ArrayRef< unsigned > Indices, Align Alignment, unsigned AddressSpace, TTI::TargetCostKind CostKind, bool UseMaskForCond=false, bool UseMaskForGaps=false)
Definition: X86TargetTransformInfo.cpp:6410

llvm::X86TTIImpl::getMaxInterleaveFactor
unsigned getMaxInterleaveFactor(ElementCount VF)
Definition: X86TargetTransformInfo.cpp:228

llvm::X86TTIImpl::getRegisterBitWidth
TypeSize getRegisterBitWidth(TargetTransformInfo::RegisterKind K) const
Definition: X86TargetTransformInfo.cpp:203

llvm::X86TTIImpl::isLegalMaskedCompressStore
bool isLegalMaskedCompressStore(Type *DataType, Align Alignment)
Definition: X86TargetTransformInfo.cpp:6030

llvm::X86TTIImpl::getCastInstrCost
InstructionCost getCastInstrCost(unsigned Opcode, Type *Dst, Type *Src, TTI::CastContextHint CCH, TTI::TargetCostKind CostKind, const Instruction *I=nullptr)
Definition: X86TargetTransformInfo.cpp:2170

llvm::X86TTIImpl::getPointersChainCost
InstructionCost getPointersChainCost(ArrayRef< const Value * > Ptrs, const Value *Base, const TTI::PointersChainInfo &Info, Type *AccessTy, TTI::TargetCostKind CostKind)
Definition: X86TargetTransformInfo.cpp:5126

llvm::X86TTIImpl::getIntrinsicInstrCost
InstructionCost getIntrinsicInstrCost(const IntrinsicCostAttributes &ICA, TTI::TargetCostKind CostKind)
Definition: X86TargetTransformInfo.cpp:3461

llvm::X86TTIImpl::getNumberOfRegisters
unsigned getNumberOfRegisters(unsigned ClassID) const
Definition: X86TargetTransformInfo.cpp:164

llvm::X86TTIImpl::canMacroFuseCmp
bool canMacroFuseCmp()
Definition: X86TargetTransformInfo.cpp:5925

llvm::X86TTIImpl::getMemoryOpCost
InstructionCost getMemoryOpCost(unsigned Opcode, Type *Src, MaybeAlign Alignment, unsigned AddressSpace, TTI::TargetCostKind CostKind, TTI::OperandValueInfo OpInfo={TTI::OK_AnyValue, TTI::OP_None}, const Instruction *I=nullptr)
Definition: X86TargetTransformInfo.cpp:4892

llvm::X86TTIImpl::isLSRCostLess
bool isLSRCostLess(const TargetTransformInfo::LSRCost &C1, const TargetTransformInfo::LSRCost &C2)
Definition: X86TargetTransformInfo.cpp:5914

llvm::X86TTIImpl::isLegalMaskedExpandLoad
bool isLegalMaskedExpandLoad(Type *DataType, Align Alignment)
Definition: X86TargetTransformInfo.cpp:6006

llvm::X86TTIImpl::getArithmeticReductionCost
InstructionCost getArithmeticReductionCost(unsigned Opcode, VectorType *Ty, std::optional< FastMathFlags > FMF, TTI::TargetCostKind CostKind)
Definition: X86TargetTransformInfo.cpp:5174

llvm::X86TTIImpl::getAtomicMemIntrinsicMaxElementSize
unsigned getAtomicMemIntrinsicMaxElementSize() const
Definition: X86TargetTransformInfo.cpp:3458

llvm::X86TTIImpl::isLegalMaskedScatter
bool isLegalMaskedScatter(Type *DataType, Align Alignment)
Definition: X86TargetTransformInfo.cpp:6107

llvm::X86TTIImpl::getIntImmCost
InstructionCost getIntImmCost(int64_t)
Calculate the cost of materializing a 64-bit value.
Definition: X86TargetTransformInfo.cpp:5606

llvm::X86TTIImpl::getMaskedMemoryOpCost
InstructionCost getMaskedMemoryOpCost(unsigned Opcode, Type *Src, Align Alignment, unsigned AddressSpace, TTI::TargetCostKind CostKind)
Definition: X86TargetTransformInfo.cpp:5059

llvm::X86TTIImpl::getVectorInstrCost
InstructionCost getVectorInstrCost(unsigned Opcode, Type *Val, TTI::TargetCostKind CostKind, unsigned Index, Value *Op0, Value *Op1)
Definition: X86TargetTransformInfo.cpp:4476

llvm::X86TTIImpl::getScalarizationOverhead
InstructionCost getScalarizationOverhead(VectorType *Ty, const APInt &DemandedElts, bool Insert, bool Extract, TTI::TargetCostKind CostKind)
Definition: X86TargetTransformInfo.cpp:4623

llvm::X86TTIImpl::areInlineCompatible
bool areInlineCompatible(const Function *Caller, const Function *Callee) const
Definition: X86TargetTransformInfo.cpp:6132

llvm::X86TTIImpl::getCmpSelInstrCost
InstructionCost getCmpSelInstrCost(unsigned Opcode, Type *ValTy, Type *CondTy, CmpInst::Predicate VecPred, TTI::TargetCostKind CostKind, const Instruction *I=nullptr)
Definition: X86TargetTransformInfo.cpp:3161

llvm::X86TTIImpl::getBranchMispredictPenalty
InstructionCost getBranchMispredictPenalty() const
Definition: X86TargetTransformInfo.cpp:6760

llvm::X86TTIImpl::isExpensiveToSpeculativelyExecute
bool isExpensiveToSpeculativelyExecute(const Instruction *I)
Definition: X86TargetTransformInfo.cpp:6119

llvm::X86TTIImpl::getAddressComputationCost
InstructionCost getAddressComputationCost(Type *PtrTy, ScalarEvolution *SE, const SCEV *Ptr)
Definition: X86TargetTransformInfo.cpp:5145

llvm::X86TTIImpl::getShuffleCost
InstructionCost getShuffleCost(TTI::ShuffleKind Kind, VectorType *Tp, ArrayRef< int > Mask, TTI::TargetCostKind CostKind, int Index, VectorType *SubTp, ArrayRef< const Value * > Args=std::nullopt, const Instruction *CxtI=nullptr)
Definition: X86TargetTransformInfo.cpp:1526

llvm::X86TTIImpl::isLegalAltInstr
bool isLegalAltInstr(VectorType *VecTy, unsigned Opcode0, unsigned Opcode1, const SmallBitVector &OpcodeMask) const
Definition: X86TargetTransformInfo.cpp:6074

llvm::X86TTIImpl::getMinMaxCost
InstructionCost getMinMaxCost(Intrinsic::ID IID, Type *Ty, TTI::TargetCostKind CostKind, FastMathFlags FMF)
Definition: X86TargetTransformInfo.cpp:5424

llvm::X86TTIImpl::isFCmpOrdCheaperThanFCmpZero
bool isFCmpOrdCheaperThanFCmpZero(Type *Ty)
Definition: X86TargetTransformInfo.cpp:6128

llvm::X86TTIImpl::getCFInstrCost
InstructionCost getCFInstrCost(unsigned Opcode, TTI::TargetCostKind CostKind, const Instruction *I=nullptr)
Definition: X86TargetTransformInfo.cpp:5786

llvm::X86TTIImpl::getArithmeticInstrCost
InstructionCost getArithmeticInstrCost(unsigned Opcode, Type *Ty, TTI::TargetCostKind CostKind, TTI::OperandValueInfo Op1Info={TTI::OK_AnyValue, TTI::OP_None}, TTI::OperandValueInfo Op2Info={TTI::OK_AnyValue, TTI::OP_None}, ArrayRef< const Value * > Args=std::nullopt, const Instruction *CxtI=nullptr)
Definition: X86TargetTransformInfo.cpp:246

llvm::X86TTIImpl::areTypesABICompatible
bool areTypesABICompatible(const Function *Caller, const Function *Callee, const ArrayRef< Type * > &Type) const
Definition: X86TargetTransformInfo.cpp:6190

llvm::X86TTIImpl::hasDivRemOp
bool hasDivRemOp(Type *DataType, bool IsSigned)
Definition: X86TargetTransformInfo.cpp:6114

llvm::X86TTIImpl::simplifyDemandedVectorEltsIntrinsic
std::optional< Value * > simplifyDemandedVectorEltsIntrinsic(InstCombiner &IC, IntrinsicInst &II, APInt DemandedElts, APInt &UndefElts, APInt &UndefElts2, APInt &UndefElts3, std::function< void(Instruction *, unsigned, APInt, APInt &)> SimplifyAndSetOp) const
Definition: X86InstCombineIntrinsic.cpp:3100

llvm::X86TargetLowering
Definition: X86ISelLowering.h:978

llvm::X86TargetMachine
Definition: X86TargetMachine.h:28

uint64_t

llvm::AMDGPU::HSAMD::Kernel::Key::Args
constexpr char Args[]
Key for Kernel::Metadata::mArgs.
Definition: AMDGPUMetadata.h:395

llvm::Intrinsic::ID
unsigned ID
Definition: GenericSSAContext.h:28

llvm::dwarf::Index
Index
Definition: Dwarf.h:875

llvm::sampleprof::Base
@ Base
Definition: Discriminator.h:58

llvm
This is an optimization pass for GlobalISel generic memory operations.
Definition: AddressRanges.h:18

llvm::AddressSpace
AddressSpace
Definition: NVPTXBaseInfo.h:21

llvm::Align
This struct is a compact representation of a valid (non-zero power of two) alignment.
Definition: Alignment.h:39

llvm::TargetTransformInfo::MemCmpExpansionOptions
Returns options for expansion of memcmp. IsZeroCmp is.
Definition: TargetTransformInfo.h:925

llvm::TargetTransformInfo::OperandValueInfo
Definition: TargetTransformInfo.h:1098