// doxygen/TargetTransformInfoImpl_8h_source.html

//===- TargetTransformInfoImpl.h --------------------------------*- C++ -*-===//

//

// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.

// See https://llvm.org/LICENSE.txt for license information.

// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception

//

//===----------------------------------------------------------------------===//

/// \file

/// This file provides helpers for the implementation of

/// a TargetTransformInfo-conforming class.

///

//===----------------------------------------------------------------------===//


#ifndef LLVM_ANALYSIS_TARGETTRANSFORMINFOIMPL_H

#define LLVM_ANALYSIS_TARGETTRANSFORMINFOIMPL_H


#include "llvm/Analysis/ScalarEvolutionExpressions.h"

#include "llvm/Analysis/TargetTransformInfo.h"

#include "llvm/Analysis/VectorUtils.h"

#include "llvm/IR/DataLayout.h"

#include "llvm/IR/GetElementPtrTypeIterator.h"

#include "llvm/IR/IntrinsicInst.h"

#include "llvm/IR/Operator.h"

#include "llvm/IR/PatternMatch.h"

#include <optional>

#include <utility>


namespace llvm {


class Function;


/// Base class for use as a mix-in that aids implementing

/// a TargetTransformInfo-compatible class.

class TargetTransformInfoImplBase {

protected:

  typedef TargetTransformInfo TTI;


  const DataLayout &DL;


  /// Binds this implementation to \p DL. Only a reference is stored, so the
  /// DataLayout object has to outlive this instance.
  explicit TargetTransformInfoImplBase(const DataLayout &DL) : DL(DL) {}


public:

  // Provide value semantics. MSVC requires that we spell all of these out.

  /// Copy constructor (defaulted): the copy refers to the same DataLayout as
  /// \p Arg.
  TargetTransformInfoImplBase(const TargetTransformInfoImplBase &Arg) = default;

  /// Move constructor: re-binds the DataLayout reference from \p Arg, which is
  /// the only state initialised here, so \p Arg is left untouched.
  TargetTransformInfoImplBase(TargetTransformInfoImplBase &&Arg) : DL(Arg.DL) {}


  /// Returns the DataLayout this object was constructed with.
  const DataLayout &getDataLayout() const { return DL; }


  /// Basic GEP cost model.
  ///
  /// Returns TTI::TCC_Free when every entry of \p Operands is a Constant
  /// (including the case of no operands) and TTI::TCC_Basic otherwise.
  /// \p PointeeType, \p Ptr, \p AccessType and \p CostKind are not consulted.
  InstructionCost getGEPCost(Type *PointeeType, const Value *Ptr,
                             ArrayRef<const Value *> Operands, Type *AccessType,
                             TTI::TargetCostKind CostKind) const {
    // All-constant GEPs are assumed to fold into their users through
    // addressing modes.
    const bool AllConstant =
        all_of(Operands, [](const Value *Idx) { return isa<Constant>(Idx); });
    return AllConstant ? TTI::TCC_Free : TTI::TCC_Basic;
  }


  /// Default estimate of the number of case clusters of \p SI.
  ///
  /// Sets \p JTSize to 0 and returns the switch's case count. \p PSI and
  /// \p BFI are not used.
  unsigned getEstimatedNumberOfCaseClusters(const SwitchInst &SI,
                                            unsigned &JTSize,
                                            ProfileSummaryInfo *PSI,
                                            BlockFrequencyInfo *BFI) const {
    // Profile information plays no part in this basic model.
    (void)BFI;
    (void)PSI;

    const unsigned NumCases = SI.getNumCases();
    JTSize = 0;
    return NumCases;
  }


  /// Default implementation: returns a multiplier of 1.
  unsigned getInliningThresholdMultiplier() const { return 1; }

  /// Default implementation: returns a multiplier of 8.
  unsigned getInliningCostBenefitAnalysisSavingsMultiplier() const { return 8; }

  /// Default implementation: returns a multiplier of 8.
  unsigned getInliningCostBenefitAnalysisProfitableMultiplier() const {
    return 8;
  }

  /// Default implementation: returns 0 for every call site; \p CB is ignored.
  unsigned adjustInliningThreshold(const CallBase *CB) const { return 0; }

  /// Default implementation: returns a cost of 0; \p CB and \p AI are ignored.
  unsigned getCallerAllocaCost(const CallBase *CB, const AllocaInst *AI) const {
    return 0;
  }


  /// Default implementation: returns 150 (the name indicates a percentage).
  int getInlinerVectorBonusPercent() const { return 150; }


  /// Default implementation: returns TTI::TCC_Expensive; \p I is ignored.
  InstructionCost getMemcpyCost(const Instruction *I) const {
    return TTI::TCC_Expensive;
  }


  /// Default implementation: returns a threshold of 64.
  /// NOTE(review): the unit is presumably bytes - confirm against callers.
  uint64_t getMaxMemIntrinsicInlineSizeThreshold() const {
    return 64;
  }


  /// Default implementation: returns a probability of 99/100.
  ///
  /// Although this default value is arbitrary, it is not random. It is assumed
  /// that a condition that evaluates the same way by a higher percentage than
  /// this is best represented as control flow. Therefore, the default value N
  /// should be set such that the win from N% correct executions is greater than
  /// the loss from (100 - N)% mispredicted executions for the majority of
  /// intended targets.
  BranchProbability getPredictableBranchThreshold() const {
    return BranchProbability(99, 100);
  }


  /// Default implementation: always returns false; \p F is ignored.
  bool hasBranchDivergence(const Function *F = nullptr) const { return false; }


  /// Default implementation: always returns false; \p V is ignored.
  bool isSourceOfDivergence(const Value *V) const { return false; }


  /// Default implementation: always returns false; \p V is ignored.
  bool isAlwaysUniform(const Value *V) const { return false; }


  /// Default implementation: always returns false, whatever the address
  /// spaces \p FromAS and \p ToAS are.
  bool isValidAddrSpaceCast(unsigned FromAS, unsigned ToAS) const {
    return false;
  }


  /// Default implementation: always returns true, i.e. any pair of address
  /// spaces \p AS0 / \p AS1 is reported as possibly aliasing.
  bool addrspacesMayAlias(unsigned AS0, unsigned AS1) const {
    return true;
  }


  /// Default implementation: returns -1 converted to unsigned, i.e. the
  /// largest unsigned value.
  /// NOTE(review): presumably a "no flat address space" sentinel - confirm.
  unsigned getFlatAddressSpace() const { return -1; }


  /// Default implementation: leaves \p OpIndexes untouched and returns false;
  /// \p IID is ignored.
  bool collectFlatAddressOperands(SmallVectorImpl<int> &OpIndexes,
                                  Intrinsic::ID IID) const {
    return false;
  }


  /// Default implementation: always returns false; both (unnamed) address
  /// space arguments are ignored.
  bool isNoopAddrSpaceCast(unsigned, unsigned) const { return false; }

  /// Default implementation: returns true only for address space 0.
  bool canHaveNonUndefGlobalInitializerInAddressSpace(unsigned AS) const {
    return AS == 0;
  }


  /// Default implementation: returns -1 converted to unsigned (the largest
  /// unsigned value) for every \p V.
  /// NOTE(review): presumably a "nothing assumed" sentinel - confirm.
  unsigned getAssumedAddrSpace(const Value *V) const { return -1; }


  /// Default implementation: always returns false.
  bool isSingleThreaded() const { return false; }


  /// Default implementation: returns a pair holding a null Value pointer and
  /// -1 converted to unsigned; \p V is ignored.
  std::pair<const Value *, unsigned>
  getPredicatedAddrSpace(const Value *V) const {
    return std::make_pair(nullptr, -1);
  }


  /// Default implementation: performs no rewrite and returns nullptr; all
  /// arguments are ignored.
  Value *rewriteIntrinsicWithAddressSpace(IntrinsicInst *II, Value *OldV,
                                          Value *NewV) const {
    return nullptr;
  }


  bool isLoweredToCall(const Function *F) const {

    assert(F && "A concrete function must be provided to this routine.");


    // FIXME: These should almost certainly not be handled here, and instead

    // handled with the help of TLI or the target itself. This was largely

    // ported from existing analysis heuristics here so that such refactorings

    // can take place in the future.


    if (F->isIntrinsic())

      return false;


    if (F->hasLocalLinkage() || !F->hasName())

      return true;


    StringRef Name = F->getName();


    // These will all likely lower to a single selection DAG node.

    if (Name == "copysign" || Name == "copysignf" || Name == "copysignl" ||

        Name == "fabs" || Name == "fabsf" || Name == "fabsl" || Name == "sin" ||

        Name == "fmin" || Name == "fminf" || Name == "fminl" ||

        Name == "fmax" || Name == "fmaxf" || Name == "fmaxl" ||

        Name == "sinf" || Name == "sinl" || Name == "cos" || Name == "cosf" ||

        Name == "cosl" || Name == "sqrt" || Name == "sqrtf" || Name == "sqrtl")

      return false;


    // These are all likely to be optimized into something smaller.

    if (Name == "pow" || Name == "powf" || Name == "powl" || Name == "exp2" ||

        Name == "exp2l" || Name == "exp2f" || Name == "floor" ||

        Name == "floorf" || Name == "ceil" || Name == "round" ||

        Name == "ffs" || Name == "ffsl" || Name == "abs" || Name == "labs" ||

        Name == "llabs")

      return false;


    return true;

  }


  /// Default implementation: always returns false; \p HWLoopInfo is left
  /// untouched and the other arguments are ignored.
  bool isHardwareLoopProfitable(Loop *L, ScalarEvolution &SE,
                                AssumptionCache &AC, TargetLibraryInfo *LibInfo,
                                HardwareLoopInfo &HWLoopInfo) const {
    return false;
  }


  /// Default implementation: always returns false; \p TFI is ignored.
  bool preferPredicateOverEpilogue(TailFoldingInfo *TFI) const { return false; }


  /// Default implementation: returns TailFoldingStyle::DataWithoutLaneMask
  /// regardless of \p IVUpdateMayOverflow.
  TailFoldingStyle
  getPreferredTailFoldingStyle(bool IVUpdateMayOverflow = true) const {
    return TailFoldingStyle::DataWithoutLaneMask;
  }


  /// Default implementation: performs no combine and returns std::nullopt;
  /// \p IC and \p II are ignored.
  std::optional<Instruction *> instCombineIntrinsic(InstCombiner &IC,
                                                    IntrinsicInst &II) const {
    return std::nullopt;
  }


  /// Default implementation: returns std::nullopt without touching \p Known
  /// or \p KnownBitsComputed; the remaining arguments are ignored.
  std::optional<Value *>
  simplifyDemandedUseBitsIntrinsic(InstCombiner &IC, IntrinsicInst &II,
                                   APInt DemandedMask, KnownBits &Known,
                                   bool &KnownBitsComputed) const {
    return std::nullopt;
  }


  /// Default implementation: returns std::nullopt. None of the \p UndefElts*
  /// outputs is written and \p SimplifyAndSetOp is never invoked.
  std::optional<Value *> simplifyDemandedVectorEltsIntrinsic(
      InstCombiner &IC, IntrinsicInst &II, APInt DemandedElts, APInt &UndefElts,
      APInt &UndefElts2, APInt &UndefElts3,
      std::function<void(Instruction *, unsigned, APInt, APInt &)>
          SimplifyAndSetOp) const {
    return std::nullopt;
  }


  /// Default implementation: does nothing, so the UnrollingPreferences object
  /// passed in keeps whatever values the caller put there.
  void getUnrollingPreferences(Loop *, ScalarEvolution &,
                               TTI::UnrollingPreferences &,
                               OptimizationRemarkEmitter *) const {}


  /// Default implementation: does nothing, so the PeelingPreferences object
  /// passed in keeps whatever values the caller put there.
  void getPeelingPreferences(Loop *, ScalarEvolution &,
                             TTI::PeelingPreferences &) const {}


  /// Default implementation: always returns false; \p Imm is ignored.
  bool isLegalAddImmediate(int64_t Imm) const { return false; }


  /// Default implementation: always returns false; \p Imm is ignored.
  bool isLegalAddScalableImmediate(int64_t Imm) const { return false; }


  /// Default implementation: always returns false; \p Imm is ignored.
  bool isLegalICmpImmediate(int64_t Imm) const { return false; }


  /// Default addressing-mode legality check.
  ///
  /// Returns true only when there is no \p BaseGV, \p BaseOffset is 0 and
  /// \p Scale is 0 or 1. \p Ty, \p HasBaseReg, \p AddrSpace, \p I and
  /// \p ScalableOffset are not consulted.
  bool isLegalAddressingMode(Type *Ty, GlobalValue *BaseGV, int64_t BaseOffset,
                             bool HasBaseReg, int64_t Scale, unsigned AddrSpace,
                             Instruction *I = nullptr,
                             int64_t ScalableOffset = 0) const {
    // Guess that only reg and reg+reg addressing is allowed. This heuristic is
    // taken from the implementation of LSR.
    if (BaseGV || BaseOffset != 0)
      return false;
    return Scale == 0 || Scale == 1;
  }


  /// Returns true when \p C1 orders strictly before \p C2.
  ///
  /// The comparison is lexicographic over NumRegs, AddRecCost, NumIVMuls,
  /// NumBaseAdds, ScaleCost, ImmCost and SetupCost, in that order.
  bool isLSRCostLess(const TTI::LSRCost &C1, const TTI::LSRCost &C2) const {
    auto SortKey = [](const TTI::LSRCost &C) {
      return std::tie(C.NumRegs, C.AddRecCost, C.NumIVMuls, C.NumBaseAdds,
                      C.ScaleCost, C.ImmCost, C.SetupCost);
    };
    return SortKey(C1) < SortKey(C2);
  }


  /// Default implementation: always returns true.
  bool isNumRegsMajorCostOfLSR() const { return true; }


  /// Default implementation: always returns false.
  bool shouldFoldTerminatingConditionAfterLSR() const { return false; }


  /// Default implementation: always returns false; \p I is ignored.
  bool isProfitableLSRChainElement(Instruction *I) const { return false; }


  /// Default implementation: always returns false.
  bool canMacroFuseCmp() const { return false; }


  /// Default implementation: always returns false; \p BI is not written and
  /// the other arguments are ignored.
  bool canSaveCmp(Loop *L, BranchInst **BI, ScalarEvolution *SE, LoopInfo *LI,
                  DominatorTree *DT, AssumptionCache *AC,
                  TargetLibraryInfo *LibInfo) const {
    return false;
  }


  /// Default implementation: returns TTI::AMK_None; \p L and \p SE are
  /// ignored.
  TTI::AddressingModeKind
    getPreferredAddressingMode(const Loop *L, ScalarEvolution *SE) const {
    return TTI::AMK_None;
  }


  /// Default implementation: always returns false; \p DataType and
  /// \p Alignment are ignored.
  bool isLegalMaskedStore(Type *DataType, Align Alignment) const {
    return false;
  }


  /// Default implementation: always returns false; \p DataType and
  /// \p Alignment are ignored.
  bool isLegalMaskedLoad(Type *DataType, Align Alignment) const {
    return false;
  }


  /// Default legality check for a nontemporal store of \p DataType.
  ///
  /// By default, assume nontemporal memory stores are available for stores
  /// that are aligned and have a size that is a power of 2: returns true when
  /// the type's store size is a power of two and \p Alignment is at least
  /// that size.
  bool isLegalNTStore(Type *DataType, Align Alignment) const {
    unsigned DataSize = DL.getTypeStoreSize(DataType);
    // Check the power-of-two property first. It rejects a zero store size
    // before the Align-vs-integer comparison is evaluated; that comparison
    // expects a strictly positive right-hand side.
    return isPowerOf2_32(DataSize) && Alignment >= DataSize;
  }


  /// Default legality check for a nontemporal load of \p DataType.
  ///
  /// By default, assume nontemporal memory loads are available for loads that
  /// are aligned and have a size that is a power of 2: returns true when the
  /// type's store size is a power of two and \p Alignment is at least that
  /// size.
  bool isLegalNTLoad(Type *DataType, Align Alignment) const {
    unsigned DataSize = DL.getTypeStoreSize(DataType);
    // Check the power-of-two property first. It rejects a zero store size
    // before the Align-vs-integer comparison is evaluated; that comparison
    // expects a strictly positive right-hand side.
    return isPowerOf2_32(DataSize) && Alignment >= DataSize;
  }


  /// Default implementation: always returns false; \p ElementTy and
  /// \p NumElements are ignored.
  bool isLegalBroadcastLoad(Type *ElementTy, ElementCount NumElements) const {
    return false;
  }


  /// Default implementation: always returns false; \p DataType and
  /// \p Alignment are ignored.
  bool isLegalMaskedScatter(Type *DataType, Align Alignment) const {
    return false;
  }


  /// Default implementation: always returns false; \p DataType and
  /// \p Alignment are ignored.
  bool isLegalMaskedGather(Type *DataType, Align Alignment) const {
    return false;
  }


  /// Default implementation: always returns false; \p DataType and
  /// \p Alignment are ignored.
  bool forceScalarizeMaskedGather(VectorType *DataType, Align Alignment) const {
    return false;
  }


  /// Default implementation: always returns false; \p DataType and
  /// \p Alignment are ignored.
  bool forceScalarizeMaskedScatter(VectorType *DataType,
                                   Align Alignment) const {
    return false;
  }


  /// Default implementation: always returns false; \p DataType and
  /// \p Alignment are ignored.
  bool isLegalMaskedCompressStore(Type *DataType, Align Alignment) const {
    return false;
  }


  /// Default implementation: always returns false; all arguments are ignored.
  bool isLegalAltInstr(VectorType *VecTy, unsigned Opcode0, unsigned Opcode1,
                       const SmallBitVector &OpcodeMask) const {
    return false;
  }


  /// Default implementation: always returns false; \p DataType and
  /// \p Alignment are ignored.
  bool isLegalMaskedExpandLoad(Type *DataType, Align Alignment) const {
    return false;
  }


  /// Default implementation: always returns false; \p DataType and
  /// \p Alignment are ignored.
  bool isLegalStridedLoadStore(Type *DataType, Align Alignment) const {
    return false;
  }


  /// Default implementation: always returns false.
  bool enableOrderedReductions() const { return false; }


  /// Default implementation: always returns false; \p DataType and
  /// \p IsSigned are ignored.
  bool hasDivRemOp(Type *DataType, bool IsSigned) const { return false; }


  /// Default implementation: always returns false; \p I and \p AddrSpace are
  /// ignored.
  bool hasVolatileVariant(Instruction *I, unsigned AddrSpace) const {
    return false;
  }


  /// Default implementation: always returns true.
  bool prefersVectorizedAddressing() const { return true; }


  /// Default cost of the scaling factor in an addressing mode.
  ///
  /// Returns 0 when this class's isLegalAddressingMode() accepts the mode
  /// described by the arguments, and -1 otherwise.
  InstructionCost getScalingFactorCost(Type *Ty, GlobalValue *BaseGV,
                                       int64_t BaseOffset, bool HasBaseReg,
                                       int64_t Scale,
                                       unsigned AddrSpace) const {
    // Guess that all legal addressing modes are free.
    const bool IsLegal = isLegalAddressingMode(Ty, BaseGV, BaseOffset,
                                               HasBaseReg, Scale, AddrSpace);
    return IsLegal ? 0 : -1;
  }


  /// Default implementation: always returns false.
  bool LSRWithInstrQueries() const { return false; }


  /// Default implementation: always returns false; \p Ty1 and \p Ty2 are
  /// ignored.
  bool isTruncateFree(Type *Ty1, Type *Ty2) const { return false; }


  /// Default implementation: always returns true; \p I is ignored.
  bool isProfitableToHoist(Instruction *I) const { return true; }


  /// Default implementation: always returns false.
  bool useAA() const { return false; }


  /// Default implementation: always returns false; \p Ty is ignored.
  bool isTypeLegal(Type *Ty) const { return false; }


  /// Default implementation: returns 1 for every type; \p Ty is ignored.
  unsigned getRegUsageForType(Type *Ty) const { return 1; }


  /// Default implementation: always returns true.
  bool shouldBuildLookupTables() const { return true; }


  /// Default implementation: always returns true; \p C is ignored.
  bool shouldBuildLookupTablesForConstant(Constant *C) const { return true; }


  /// Default implementation: always returns false.
  bool shouldBuildRelLookupTables() const { return false; }


  /// Default implementation: always returns false; \p F is ignored.
  bool useColdCCForColdCall(Function &F) const { return false; }


  /// Default implementation: returns a cost of 0; all arguments are ignored.
  InstructionCost getScalarizationOverhead(VectorType *Ty,
                                           const APInt &DemandedElts,
                                           bool Insert, bool Extract,
                                           TTI::TargetCostKind CostKind) const {
    return 0;
  }


  /// Default implementation: returns a cost of 0; all arguments are ignored.
  InstructionCost
  getOperandsScalarizationOverhead(ArrayRef<const Value *> Args,
                                   ArrayRef<Type *> Tys,
                                   TTI::TargetCostKind CostKind) const {
    return 0;
  }


  /// Default implementation: always returns false.
  bool supportsEfficientVectorElementLoadStore() const { return false; }


  /// Default implementation: always returns true.
  bool supportsTailCalls() const { return true; }


  /// Default implementation: always returns false; \p LoopHasReductions is
  /// ignored.
  bool enableAggressiveInterleaving(bool LoopHasReductions) const {
    return false;
  }


  /// Default implementation: returns a value-initialised
  /// TTI::MemCmpExpansionOptions; \p OptSize and \p IsZeroCmp are ignored.
  TTI::MemCmpExpansionOptions enableMemCmpExpansion(bool OptSize,
                                                    bool IsZeroCmp) const {
    return {};
  }


  /// Default implementation: always returns true.
  bool enableSelectOptimize() const { return true; }


  bool shouldTreatInstructionLikeSelect(const Instruction *I) {

    // If the select is a logical-and/logical-or then it is better treated as a

    // and/or by the backend.

    using namespace llvm::PatternMatch;

    return isa<SelectInst>(I) &&

           !match(I, m_CombineOr(m_LogicalAnd(m_Value(), m_Value()),

                                 m_LogicalOr(m_Value(), m_Value())));

  }


  /// Default implementation: always returns false.
  bool enableInterleavedAccessVectorization() const { return false; }


  /// Default implementation: always returns false.
  bool enableMaskedInterleavedAccessVectorization() const { return false; }


  /// Default implementation: always returns false.
  bool isFPVectorizationPotentiallyUnsafe() const { return false; }


  /// Default implementation: always returns false. \p Fast is never written
  /// and the other arguments are ignored.
  bool allowsMisalignedMemoryAccesses(LLVMContext &Context, unsigned BitWidth,
                                      unsigned AddressSpace, Align Alignment,
                                      unsigned *Fast) const {
    return false;
  }


  /// Default implementation: returns TTI::PSK_Software for every width;
  /// \p IntTyWidthInBit is ignored.
  TTI::PopcntSupportKind getPopcntSupport(unsigned IntTyWidthInBit) const {
    return TTI::PSK_Software;
  }


  /// Default implementation: always returns false; \p Ty is ignored.
  bool haveFastSqrt(Type *Ty) const { return false; }


  bool isExpensiveToSpeculativelyExecute(const Instruction *I) { return true; }


  /// Default implementation: always returns true; \p Ty is ignored.
  bool isFCmpOrdCheaperThanFCmpZero(Type *Ty) const { return true; }


  /// Default implementation: returns TargetTransformInfo::TCC_Basic for every
  /// type; \p Ty is ignored.
  InstructionCost getFPOpCost(Type *Ty) const {
    return TargetTransformInfo::TCC_Basic;
  }


  /// Default implementation: returns a cost of 0; all arguments are ignored.
  InstructionCost getIntImmCodeSizeCost(unsigned Opcode, unsigned Idx,
                                        const APInt &Imm, Type *Ty) const {
    return 0;
  }


  /// Default implementation: returns TTI::TCC_Basic for every immediate; all
  /// arguments are ignored.
  InstructionCost getIntImmCost(const APInt &Imm, Type *Ty,
                                TTI::TargetCostKind CostKind) const {
    return TTI::TCC_Basic;
  }


  /// Default implementation: returns TTI::TCC_Free for every immediate
  /// operand; all arguments are ignored.
  InstructionCost getIntImmCostInst(unsigned Opcode, unsigned Idx,
                                    const APInt &Imm, Type *Ty,
                                    TTI::TargetCostKind CostKind,
                                    Instruction *Inst = nullptr) const {
    return TTI::TCC_Free;
  }


  /// Default implementation: returns TTI::TCC_Free for every immediate
  /// argument; all arguments are ignored.
  InstructionCost getIntImmCostIntrin(Intrinsic::ID IID, unsigned Idx,
                                      const APInt &Imm, Type *Ty,
                                      TTI::TargetCostKind CostKind) const {
    return TTI::TCC_Free;
  }


  /// Default implementation: always returns false; \p Inst and \p Fn are
  /// ignored.
  bool preferToKeepConstantsAttached(const Instruction &Inst,
                                     const Function &Fn) const {
    return false;
  }


  /// Default implementation: returns 8 for every register class; \p ClassID
  /// is ignored.
  unsigned getNumberOfRegisters(unsigned ClassID) const { return 8; }


  /// Default implementation: returns class ID 1 when \p Vector is true and
  /// class ID 0 otherwise; \p Ty is ignored.
  unsigned getRegisterClassForType(bool Vector, Type *Ty = nullptr) const {
    return Vector ? 1 : 0;
  }


  /// Returns a printable name for the generic register class \p ClassID.
  ///
  /// Class 0 is named "Generic::ScalarRC" and class 1 "Generic::VectorRC";
  /// every other ID yields "Generic::Unknown Register Class".
  const char *getRegisterClassName(unsigned ClassID) const {
    switch (ClassID) {
    case 0:
      return "Generic::ScalarRC";
    case 1:
      return "Generic::VectorRC";
    default:
      return "Generic::Unknown Register Class";
    }
  }


  /// Default implementation: returns a fixed size of 32 for every register
  /// kind; \p K is ignored.
  TypeSize getRegisterBitWidth(TargetTransformInfo::RegisterKind K) const {
    return TypeSize::getFixed(32);
  }


  /// Default implementation: returns 128.
  unsigned getMinVectorRegisterBitWidth() const { return 128; }


  /// Default implementation: returns std::nullopt.
  std::optional<unsigned> getMaxVScale() const { return std::nullopt; }

  /// Default implementation: returns std::nullopt.
  std::optional<unsigned> getVScaleForTuning() const { return std::nullopt; }

  /// Default implementation: always returns false.
  bool isVScaleKnownToBeAPowerOfTwo() const { return false; }


  /// Default implementation: always returns false; \p K is ignored.
  bool
  shouldMaximizeVectorBandwidth(TargetTransformInfo::RegisterKind K) const {
    return false;
  }


  /// Default implementation: returns an ElementCount of 0 whose scalable flag
  /// is \p IsScalable; \p ElemWidth is ignored.
  ElementCount getMinimumVF(unsigned ElemWidth, bool IsScalable) const {
    return ElementCount::get(0, IsScalable);
  }


  /// Default implementation: returns 0; \p ElemWidth and \p Opcode are
  /// ignored.
  unsigned getMaximumVF(unsigned ElemWidth, unsigned Opcode) const { return 0; }

  /// Default implementation: returns \p VF unchanged; the two (unnamed) type
  /// arguments are ignored.
  unsigned getStoreMinimumVF(unsigned VF, Type *, Type *) const { return VF; }


  /// Default implementation: sets \p AllowPromotionWithoutCommonHeader to
  /// false and returns false; \p I is ignored.
  bool shouldConsiderAddressTypePromotion(
      const Instruction &I, bool &AllowPromotionWithoutCommonHeader) const {
    AllowPromotionWithoutCommonHeader = false;
    return false;
  }


  /// Default implementation: returns 0.
  unsigned getCacheLineSize() const { return 0; }

  /// Default implementation: returns std::nullopt for both the L1D and the
  /// L2D cache level.
  ///
  /// The switch has no default label; a \p Level outside the listed
  /// enumerators reaches llvm_unreachable.
  std::optional<unsigned>
  getCacheSize(TargetTransformInfo::CacheLevel Level) const {
    switch (Level) {
    case TTI::CacheLevel::L1D:
    case TTI::CacheLevel::L2D:
      return std::nullopt;
    }
    llvm_unreachable("Unknown TargetTransformInfo::CacheLevel");
  }


  /// Default implementation: returns std::nullopt for both the L1D and the
  /// L2D cache level.
  ///
  /// The switch has no default label; a \p Level outside the listed
  /// enumerators reaches llvm_unreachable.
  std::optional<unsigned>
  getCacheAssociativity(TargetTransformInfo::CacheLevel Level) const {
    switch (Level) {
    case TTI::CacheLevel::L1D:
    case TTI::CacheLevel::L2D:
      return std::nullopt;
    }
    llvm_unreachable("Unknown TargetTransformInfo::CacheLevel");
  }


  /// Default implementation: returns an empty optional.
  std::optional<unsigned> getMinPageSize() const { return {}; }


  /// Default implementation: returns 0.
  unsigned getPrefetchDistance() const { return 0; }

  /// Default implementation: returns 1; all arguments are ignored.
  unsigned getMinPrefetchStride(unsigned NumMemAccesses,
                                unsigned NumStridedMemAccesses,
                                unsigned NumPrefetches, bool HasCall) const {
    return 1;
  }

  /// Default implementation: returns UINT_MAX.
  unsigned getMaxPrefetchIterationsAhead() const { return UINT_MAX; }

  /// Default implementation: always returns false.
  bool enableWritePrefetching() const { return false; }

  /// Default implementation: returns true only for address space 0.
  bool shouldPrefetchAddressSpace(unsigned AS) const { return !AS; }


  /// Default implementation: returns 1 for every \p VF.
  unsigned getMaxInterleaveFactor(ElementCount VF) const { return 1; }


  /// Basic cost model for arithmetic and logic instructions.
  ///
  /// - Division and remainder opcodes (FDiv, FRem, SDiv, SRem, UDiv, URem)
  ///   cost TTI::TCC_Expensive.
  /// - And/Or cost TTI::TCC_Free when any entry of \p Args is a call to the
  ///   experimental_widenable_condition intrinsic.
  /// - Otherwise the cost is 3 for a latency query on a floating-point
  ///   (scalar or vector element) type and 1 in every other case.
  ///
  /// \p Opd1Info, \p Opd2Info and \p CxtI are not consulted.
  InstructionCost getArithmeticInstrCost(
      unsigned Opcode, Type *Ty, TTI::TargetCostKind CostKind,
      TTI::OperandValueInfo Opd1Info, TTI::OperandValueInfo Opd2Info,
      ArrayRef<const Value *> Args,
      const Instruction *CxtI = nullptr) const {
    // Widenable conditions will eventually lower into constants, so some
    // operations with them will be trivially optimized away.
    auto IsWidenableCondition = [](const Value *V) {
      const auto *II = dyn_cast<IntrinsicInst>(V);
      return II &&
             II->getIntrinsicID() == Intrinsic::experimental_widenable_condition;
    };

    // FIXME: A number of transformation tests seem to require these values
    // which seems a little odd for how arbitrary they are.
    switch (Opcode) {
    case Instruction::And:
    case Instruction::Or:
      if (any_of(Args, IsWidenableCondition))
        return TTI::TCC_Free;
      break;
    case Instruction::FDiv:
    case Instruction::FRem:
    case Instruction::SDiv:
    case Instruction::SRem:
    case Instruction::UDiv:
    case Instruction::URem:
      // FIXME: Unlikely to be true for CodeSize.
      return TTI::TCC_Expensive;
    default:
      break;
    }

    // Assume a 3cy latency for fp arithmetic ops.
    const bool IsFPLatencyQuery = CostKind == TTI::TCK_Latency &&
                                  Ty->getScalarType()->isFloatingPointTy();
    return IsFPLatencyQuery ? 3 : 1;
  }


  /// Default implementation: returns an invalid InstructionCost; all
  /// arguments are ignored.
  InstructionCost getAltInstrCost(VectorType *VecTy, unsigned Opcode0,
                                  unsigned Opcode1,
                                  const SmallBitVector &OpcodeMask,
                                  TTI::TargetCostKind CostKind) const {
    return InstructionCost::getInvalid();
  }


  /// Default implementation: returns a cost of 1 for every shuffle; all
  /// arguments are ignored.
  InstructionCost getShuffleCost(TTI::ShuffleKind Kind, VectorType *Ty,
                                 ArrayRef<int> Mask,
                                 TTI::TargetCostKind CostKind, int Index,
                                 VectorType *SubTp,
                                 ArrayRef<const Value *> Args = std::nullopt,
                                 const Instruction *CxtI = nullptr) const {
    return 1;
  }


  /// Basic cost model for cast instructions: returns 0 for casts considered
  /// free and 1 for everything else.
  ///
  /// A cast is free when it is
  /// - an IntToPtr whose source scalar width is a legal integer no wider than
  ///   the destination pointer,
  /// - a PtrToInt whose destination scalar width is a legal integer at least
  ///   as wide as the source pointer,
  /// - a BitCast between identical types or between two pointer types, or
  /// - a Trunc to a fixed-size type whose bit width is a legal integer.
  ///
  /// \p CCH, \p CostKind and \p I are not consulted.
  InstructionCost getCastInstrCost(unsigned Opcode, Type *Dst, Type *Src,
                                   TTI::CastContextHint CCH,
                                   TTI::TargetCostKind CostKind,
                                   const Instruction *I) const {
    bool IsFree = false;
    switch (Opcode) {
    case Instruction::IntToPtr: {
      const unsigned SrcBits = Src->getScalarSizeInBits();
      IsFree = DL.isLegalInteger(SrcBits) &&
               SrcBits <= DL.getPointerTypeSizeInBits(Dst);
      break;
    }
    case Instruction::PtrToInt: {
      const unsigned DstBits = Dst->getScalarSizeInBits();
      IsFree = DL.isLegalInteger(DstBits) &&
               DstBits >= DL.getPointerTypeSizeInBits(Src);
      break;
    }
    case Instruction::BitCast:
      // Identity and pointer-to-pointer casts are free.
      IsFree = Dst == Src || (Dst->isPointerTy() && Src->isPointerTy());
      break;
    case Instruction::Trunc: {
      // trunc to a native type is free (assuming the target has compare and
      // shift-right of the same width).
      const TypeSize DstBits = DL.getTypeSizeInBits(Dst);
      IsFree = !DstBits.isScalable() &&
               DL.isLegalInteger(DstBits.getFixedValue());
      break;
    }
    default:
      break;
    }
    return IsFree ? 0 : 1;
  }


  /// Default implementation: returns a cost of 1; all arguments are ignored.
  InstructionCost getExtractWithExtendCost(unsigned Opcode, Type *Dst,
                                           VectorType *VecTy,
                                           unsigned Index) const {
    return 1;
  }


  /// Basic cost model for control-flow instructions.
  ///
  /// A PHI costs 0 unless \p CostKind is TTI::TCK_RecipThroughput; every
  /// other opcode/cost-kind combination costs 1. \p I is not consulted.
  InstructionCost getCFInstrCost(unsigned Opcode, TTI::TargetCostKind CostKind,
                                 const Instruction *I = nullptr) const {
    // A phi would be free, unless we're costing the throughput because it
    // will require a register.
    const bool IsFreePhi =
        Opcode == Instruction::PHI && CostKind != TTI::TCK_RecipThroughput;
    return IsFreePhi ? 0 : 1;
  }


  /// Default implementation: returns a cost of 1; all arguments are ignored.
  InstructionCost getCmpSelInstrCost(unsigned Opcode, Type *ValTy, Type *CondTy,
                                     CmpInst::Predicate VecPred,
                                     TTI::TargetCostKind CostKind,
                                     const Instruction *I) const {
    return 1;
  }


  /// Default implementation (opcode-based overload): returns a cost of 1; all
  /// arguments are ignored.
  InstructionCost getVectorInstrCost(unsigned Opcode, Type *Val,
                                     TTI::TargetCostKind CostKind,
                                     unsigned Index, Value *Op0,
                                     Value *Op1) const {
    return 1;
  }


  /// Default implementation (instruction-based overload): returns a cost of
  /// 1; all arguments are ignored.
  InstructionCost getVectorInstrCost(const Instruction &I, Type *Val,
                                     TTI::TargetCostKind CostKind,
                                     unsigned Index) const {
    return 1;
  }


  /// Default implementation: returns a cost of 1; all arguments are ignored.
  ///
  /// The query does not modify this object and is const-qualified like the
  /// other cost queries of this class, so it is callable through const
  /// references.
  unsigned getReplicationShuffleCost(Type *EltTy, int ReplicationFactor, int VF,
                                     const APInt &DemandedDstElts,
                                     TTI::TargetCostKind CostKind) const {
    return 1;
  }


  /// Default implementation: returns a cost of 1; all arguments are ignored.
  InstructionCost getMemoryOpCost(unsigned Opcode, Type *Src, Align Alignment,
                                  unsigned AddressSpace,
                                  TTI::TargetCostKind CostKind,
                                  TTI::OperandValueInfo OpInfo,
                                  const Instruction *I) const {
    return 1;
  }


  /// Default implementation: returns a cost of 1; all arguments are ignored.
  InstructionCost getVPMemoryOpCost(unsigned Opcode, Type *Src, Align Alignment,
                                    unsigned AddressSpace,
                                    TTI::TargetCostKind CostKind,
                                    const Instruction *I) const {
    return 1;
  }


  /// Default implementation: returns a cost of 1; all arguments are ignored.
  InstructionCost getMaskedMemoryOpCost(unsigned Opcode, Type *Src,
                                        Align Alignment, unsigned AddressSpace,
                                        TTI::TargetCostKind CostKind) const {
    return 1;
  }


  /// Default implementation: returns a cost of 1; all arguments are ignored.
  InstructionCost getGatherScatterOpCost(unsigned Opcode, Type *DataTy,
                                         const Value *Ptr, bool VariableMask,
                                         Align Alignment,
                                         TTI::TargetCostKind CostKind,
                                         const Instruction *I = nullptr) const {
    return 1;
  }


  /// Default implementation: returns an invalid InstructionCost; all
  /// arguments are ignored.
  InstructionCost getStridedMemoryOpCost(unsigned Opcode, Type *DataTy,
                                         const Value *Ptr, bool VariableMask,
                                         Align Alignment,
                                         TTI::TargetCostKind CostKind,
                                         const Instruction *I = nullptr) const {
    return InstructionCost::getInvalid();
  }


  /// Default implementation: returns a cost of 1; all arguments are ignored.
  unsigned getInterleavedMemoryOpCost(
      unsigned Opcode, Type *VecTy, unsigned Factor, ArrayRef<unsigned> Indices,
      Align Alignment, unsigned AddressSpace, TTI::TargetCostKind CostKind,
      bool UseMaskForCond, bool UseMaskForGaps) const {
    return 1;
  }


  /// Basic cost model for intrinsic calls.
  ///
  /// Returns 0 for the intrinsic IDs listed in the switch and 1 for every
  /// other intrinsic. Only the ID of \p ICA is inspected; \p CostKind is not
  /// consulted.
  InstructionCost getIntrinsicInstrCost(const IntrinsicCostAttributes &ICA,
                                        TTI::TargetCostKind CostKind) const {
    switch (ICA.getID()) {
    case Intrinsic::allow_runtime_check:
    case Intrinsic::allow_ubsan_check:
    case Intrinsic::annotation:
    case Intrinsic::assume:
    case Intrinsic::sideeffect:
    case Intrinsic::pseudoprobe:
    case Intrinsic::arithmetic_fence:
    case Intrinsic::dbg_assign:
    case Intrinsic::dbg_declare:
    case Intrinsic::dbg_value:
    case Intrinsic::dbg_label:
    case Intrinsic::invariant_start:
    case Intrinsic::invariant_end:
    case Intrinsic::launder_invariant_group:
    case Intrinsic::strip_invariant_group:
    case Intrinsic::is_constant:
    case Intrinsic::lifetime_start:
    case Intrinsic::lifetime_end:
    case Intrinsic::experimental_noalias_scope_decl:
    case Intrinsic::objectsize:
    case Intrinsic::ptr_annotation:
    case Intrinsic::var_annotation:
    case Intrinsic::experimental_gc_result:
    case Intrinsic::experimental_gc_relocate:
    case Intrinsic::coro_alloc:
    case Intrinsic::coro_begin:
    case Intrinsic::coro_free:
    case Intrinsic::coro_end:
    case Intrinsic::coro_frame:
    case Intrinsic::coro_size:
    case Intrinsic::coro_align:
    case Intrinsic::coro_suspend:
    case Intrinsic::coro_subfn_addr:
    case Intrinsic::threadlocal_address:
    case Intrinsic::experimental_widenable_condition:
    case Intrinsic::ssa_copy:
      // These intrinsics don't actually represent code after lowering.
      return 0;
    default:
      return 1;
    }
  }


  /// Default implementation: returns a cost of 1; all arguments are ignored.
  InstructionCost getCallInstrCost(Function *F, Type *RetTy,
                                   ArrayRef<Type *> Tys,
                                   TTI::TargetCostKind CostKind) const {
    return 1;
  }


  /// Default implementation: returns 1 for every type; \p Tp is ignored.
  // Assume that we have a register of the right size for the type.
  unsigned getNumberOfParts(Type *Tp) const { return 1; }


  /// Default implementation: returns a cost of 0; all arguments are ignored.
  InstructionCost getAddressComputationCost(Type *Tp, ScalarEvolution *,
                                            const SCEV *) const {
    return 0;
  }


  /// Default implementation: returns a cost of 1; all arguments are ignored.
  InstructionCost getArithmeticReductionCost(unsigned, VectorType *,
                                             std::optional<FastMathFlags> FMF,
                                             TTI::TargetCostKind) const {
    return 1;
  }


  /// Default implementation: returns a cost of 1; all arguments are ignored.
  InstructionCost getMinMaxReductionCost(Intrinsic::ID IID, VectorType *,
                                         FastMathFlags,
                                         TTI::TargetCostKind) const {
    return 1;
  }


  /// Default implementation: returns a cost of 1; all arguments are ignored.
  InstructionCost getExtendedReductionCost(unsigned Opcode, bool IsUnsigned,
                                           Type *ResTy, VectorType *Ty,
                                           FastMathFlags FMF,
                                           TTI::TargetCostKind CostKind) const {
    return 1;
  }


  /// Default implementation: returns a cost of 1; all arguments are ignored.
  InstructionCost getMulAccReductionCost(bool IsUnsigned, Type *ResTy,
                                         VectorType *Ty,
                                         TTI::TargetCostKind CostKind) const {
    return 1;
  }


  /// Default implementation: returns a cost of 0; \p Tys is ignored.
  InstructionCost getCostOfKeepingLiveOverCall(ArrayRef<Type *> Tys) const {
    return 0;
  }


  /// Default implementation: returns false without writing to \p Info;
  /// \p Inst is ignored.
  bool getTgtMemIntrinsic(IntrinsicInst *Inst, MemIntrinsicInfo &Info) const {
    return false;
  }


  /// Default implementation: returns 0.
  unsigned getAtomicMemIntrinsicMaxElementSize() const {
    // Note for overrides: You must ensure for all element unordered-atomic
    // memory intrinsics that all power-of-2 element sizes up to, and
    // including, the return value of this method have a corresponding
    // runtime lib call. These runtime lib call definitions can be found
    // in RuntimeLibcalls.h
    return 0;
  }


  /// Default implementation: creates nothing and returns nullptr; \p Inst and
  /// \p ExpectedType are ignored.
  Value *getOrCreateResultFromMemIntrinsic(IntrinsicInst *Inst,
                                           Type *ExpectedType) const {
    return nullptr;
  }


  /// Picks the element type used for the main loop of an expanded memcpy.
  ///
  /// Without \p AtomicElementSize the result is i8. With it, the result is an
  /// integer type of `*AtomicElementSize * 8` bits. \p Length, the address
  /// spaces and the alignments are not consulted.
  Type *
  getMemcpyLoopLoweringType(LLVMContext &Context, Value *Length,
                            unsigned SrcAddrSpace, unsigned DestAddrSpace,
                            unsigned SrcAlign, unsigned DestAlign,
                            std::optional<uint32_t> AtomicElementSize) const {
    if (!AtomicElementSize)
      return Type::getInt8Ty(Context);
    return Type::getIntNTy(Context, *AtomicElementSize * 8);
  }


  /// Appends to \p OpsOut the operand types used to copy the residual
  /// \p RemainingBytes bytes of an expanded memcpy.
  ///
  /// Every appended type is an integer of `OpSizeInBytes * 8` bits, where
  /// OpSizeInBytes is `*AtomicCpySize` when provided and 1 otherwise, and
  /// `RemainingBytes / OpSizeInBytes` entries are appended. The address
  /// spaces and alignments are not consulted.
  ///
  /// \p RemainingBytes must be a multiple of the element size and the element
  /// size must be non-zero (both asserted). In builds without assertions a
  /// zero element size appends nothing and a non-multiple remainder is
  /// rounded down, so the function always terminates.
  void getMemcpyLoopResidualLoweringType(
      SmallVectorImpl<Type *> &OpsOut, LLVMContext &Context,
      unsigned RemainingBytes, unsigned SrcAddrSpace, unsigned DestAddrSpace,
      unsigned SrcAlign, unsigned DestAlign,
      std::optional<uint32_t> AtomicCpySize) const {
    const unsigned OpSizeInBytes = AtomicCpySize ? *AtomicCpySize : 1;
    assert(OpSizeInBytes != 0 && "Residual copy element size must be non-zero");
    if (OpSizeInBytes == 0)
      return;
    assert(RemainingBytes % OpSizeInBytes == 0 &&
           "Residual byte count must be a multiple of the element size");

    // Counting elements up front bounds the work; stepping a byte offset until
    // it equals RemainingBytes would overshoot on a non-multiple remainder.
    Type *OpType = Type::getIntNTy(Context, OpSizeInBytes * 8);
    OpsOut.append(RemainingBytes / OpSizeInBytes, OpType);
  }


  bool areInlineCompatible(const Function *Caller,

                           const Function *Callee) const {

    return (Caller->getFnAttribute("target-cpu") ==

            Callee->getFnAttribute("target-cpu")) &&

           (Caller->getFnAttribute("target-features") ==

            Callee->getFnAttribute("target-features"));

  }


  /// Default implementation: returns \p DefaultCallPenalty unchanged; \p F and
  /// \p Call are ignored.
  unsigned getInlineCallPenalty(const Function *F, const CallBase &Call,
                                unsigned DefaultCallPenalty) const {
    return DefaultCallPenalty;
  }


  /// Default ABI-compatibility check between \p Caller and \p Callee.
  ///
  /// The answer is true exactly when both functions have equal "target-cpu"
  /// attributes and equal "target-features" attributes. \p Types is not
  /// examined by this default.
  bool areTypesABICompatible(const Function *Caller, const Function *Callee,
                             const ArrayRef<Type *> &Types) const {
    const bool SameCPU = Caller->getFnAttribute("target-cpu") ==
                         Callee->getFnAttribute("target-cpu");
    if (!SameCPU)
      return false;

    const bool SameFeatures = Caller->getFnAttribute("target-features") ==
                              Callee->getFnAttribute("target-features");
    return SameFeatures;
  }


  /// Default implementation: reports false for every \p Mode, \p Ty and
  /// \p DL combination.
  bool isIndexedLoadLegal(TTI::MemIndexedMode Mode, Type *Ty,
                          const DataLayout &DL) const {
    constexpr bool IsLegal = false;
    return IsLegal;
  }


  /// Default implementation: reports false for every \p Mode, \p Ty and
  /// \p DL combination.
  bool isIndexedStoreLegal(TTI::MemIndexedMode Mode, Type *Ty,
                           const DataLayout &DL) const {
    constexpr bool IsLegal = false;
    return IsLegal;
  }


  /// Default implementation: reports 128 regardless of \p AddrSpace.
  unsigned getLoadStoreVecRegBitWidth(unsigned AddrSpace) const {
    return 128;
  }


  /// Default implementation: answers true for any \p LI without inspecting
  /// it.
  bool isLegalToVectorizeLoad(LoadInst *LI) const {
    return true;
  }


  /// Default implementation: answers true for any \p SI without inspecting
  /// it.
  bool isLegalToVectorizeStore(StoreInst *SI) const {
    return true;
  }


  /// Default implementation: answers true; \p ChainSizeInBytes,
  /// \p Alignment and \p AddrSpace are all ignored.
  bool isLegalToVectorizeLoadChain(unsigned ChainSizeInBytes, Align Alignment,
                                   unsigned AddrSpace) const {
    constexpr bool IsLegal = true;
    return IsLegal;
  }


  /// Default implementation: answers true; \p ChainSizeInBytes,
  /// \p Alignment and \p AddrSpace are all ignored.
  bool isLegalToVectorizeStoreChain(unsigned ChainSizeInBytes, Align Alignment,
                                    unsigned AddrSpace) const {
    constexpr bool IsLegal = true;
    return IsLegal;
  }


  /// Default implementation: answers true for every \p RdxDesc and \p VF.
  bool isLegalToVectorizeReduction(const RecurrenceDescriptor &RdxDesc,
                                   ElementCount VF) const {
    constexpr bool IsLegal = true;
    return IsLegal;
  }


  /// Default implementation: answers true for any \p Ty.
  bool isElementTypeLegalForScalableVector(Type *Ty) const {
    return true;
  }


  /// Default implementation: returns \p VF unchanged. \p LoadSize,
  /// \p ChainSizeInBytes and \p VecTy play no part in the result.
  unsigned getLoadVectorFactor(unsigned VF, unsigned LoadSize,
                               unsigned ChainSizeInBytes,
                               VectorType *VecTy) const {
    const unsigned Factor = VF;
    return Factor;
  }


  /// Default implementation: returns \p VF unchanged. \p StoreSize,
  /// \p ChainSizeInBytes and \p VecTy play no part in the result.
  unsigned getStoreVectorFactor(unsigned VF, unsigned StoreSize,
                                unsigned ChainSizeInBytes,
                                VectorType *VecTy) const {
    const unsigned Factor = VF;
    return Factor;
  }


  /// Default implementation: answers false for every \p Opcode, \p Ty and
  /// \p Flags.
  bool preferInLoopReduction(unsigned Opcode, Type *Ty,
                             TTI::ReductionFlags Flags) const {
    constexpr bool Prefer = false;
    return Prefer;
  }


  /// Default implementation: answers false for every \p Opcode, \p Ty and
  /// \p Flags.
  bool preferPredicatedReductionSelect(unsigned Opcode, Type *Ty,
                                       TTI::ReductionFlags Flags) const {
    constexpr bool Prefer = false;
    return Prefer;
  }


  /// Default implementation: unconditionally answers true.
  bool preferEpilogueVectorization() const { return true; }


  /// Default implementation: answers true for any \p II without inspecting
  /// it.
  bool shouldExpandReduction(const IntrinsicInst *II) const {
    return true;
  }


  /// Default implementation: reports a fixed value of 1.
  unsigned getGISelRematGlobalCost() const {
    return 1;
  }


  /// Default implementation: reports a fixed threshold of 0.
  unsigned getMinTripCountTailFoldingThreshold() const {
    return 0;
  }


  /// Default implementation: unconditionally answers false.
  bool supportsScalableVectors() const {
    return false;
  }


  /// Default implementation: unconditionally answers false.
  bool enableScalableVectorization() const {
    return false;
  }


  /// Default implementation: answers false for every \p Opcode,
  /// \p DataType and \p Alignment.
  bool hasActiveVectorLength(unsigned Opcode, Type *DataType,
                             Align Alignment) const {
    constexpr bool HasAVL = false;
    return HasAVL;
  }


  /// Default legalization strategy for the vector-predication intrinsic
  /// \p PI: the EVL parameter strategy is Discard and the operator strategy
  /// is Convert. \p PI itself is not inspected.
  TargetTransformInfo::VPLegalization
  getVPLegalizationStrategy(const VPIntrinsic &PI) const {
    using VPLegalization = TargetTransformInfo::VPLegalization;
    return VPLegalization(/* EVLParamStrategy */ VPLegalization::Discard,
                          /* OperatorStrategy */ VPLegalization::Convert);
  }


  /// Default implementation: answers false; the (unnamed) bool argument is
  /// ignored.
  bool hasArmWideBranch(bool) const {
    return false;
  }


  /// Default implementation: reports UINT_MAX.
  unsigned getMaxNumArgs() const {
    return UINT_MAX;
  }


protected:

  // Obtain the minimum required size to hold the value (without the sign)

  // In case of a vector it returns the min required size for one element.

  unsigned minRequiredElementSize(const Value *Val, bool &isSigned) const {

    if (isa<ConstantDataVector>(Val) || isa<ConstantVector>(Val)) {

      const auto *VectorValue = cast<Constant>(Val);


      // In case of a vector need to pick the max between the min

      // required size for each element

      auto *VT = cast<FixedVectorType>(Val->getType());


      // Assume unsigned elements

      isSigned = false;


      // The max required size is the size of the vector element type

      unsigned MaxRequiredSize =

          VT->getElementType()->getPrimitiveSizeInBits().getFixedValue();


      unsigned MinRequiredSize = 0;

      for (unsigned i = 0, e = VT->getNumElements(); i < e; ++i) {

        if (auto *IntElement =

                dyn_cast<ConstantInt>(VectorValue->getAggregateElement(i))) {

          bool signedElement = IntElement->getValue().isNegative();

          // Get the element min required size.

          unsigned ElementMinRequiredSize =

              IntElement->getValue().getSignificantBits() - 1;

          // In case one element is signed then all the vector is signed.

          isSigned |= signedElement;

          // Save the max required bit size between all the elements.

          MinRequiredSize = std::max(MinRequiredSize, ElementMinRequiredSize);

        } else {

          // not an int constant element

          return MaxRequiredSize;

        }

      }

      return MinRequiredSize;

    }


    if (const auto *CI = dyn_cast<ConstantInt>(Val)) {

      isSigned = CI->getValue().isNegative();

      return CI->getValue().getSignificantBits() - 1;

    }


    if (const auto *Cast = dyn_cast<SExtInst>(Val)) {

      isSigned = true;

      return Cast->getSrcTy()->getScalarSizeInBits() - 1;

    }


    if (const auto *Cast = dyn_cast<ZExtInst>(Val)) {

      isSigned = false;

      return Cast->getSrcTy()->getScalarSizeInBits();

    }


    isSigned = false;

    return Val->getType()->getScalarSizeInBits();

  }


  // Returns true when \p Ptr is non-null and is a SCEVAddRecExpr.
  bool isStridedAccess(const SCEV *Ptr) const {
    if (!Ptr)
      return false;
    return isa<SCEVAddRecExpr>(Ptr);
  }


  // Returns the step recurrence of \p Ptr as a SCEVConstant, or nullptr when
  // \p Ptr is not a strided access (see isStridedAccess) or when its step is
  // not a SCEVConstant.
  const SCEVConstant *getConstantStrideStep(ScalarEvolution *SE,
                                            const SCEV *Ptr) const {
    if (isStridedAccess(Ptr)) {
      const auto *Rec = cast<SCEVAddRecExpr>(Ptr);
      return dyn_cast<SCEVConstant>(Rec->getStepRecurrence(*SE));
    }
    return nullptr;
  }


  // Returns true when \p Ptr has a constant stride step (see
  // getConstantStrideStep) that is at most 64 bits wide and whose
  // sign-extended value is strictly less than \p MergeDistance. Every other
  // case yields false.
  bool isConstantStridedAccessLessThan(ScalarEvolution *SE, const SCEV *Ptr,
                                       int64_t MergeDistance) const {
    if (const SCEVConstant *ConstStep = getConstantStrideStep(SE, Ptr)) {
      const APInt &Stride = ConstStep->getAPInt();
      // Only strides of up to 64 bits are read out as an int64_t.
      if (Stride.getBitWidth() <= 64) {
        // FIXME: Need to take absolute value for negative stride case.
        return Stride.getSExtValue() < MergeDistance;
      }
    }
    return false;
  }

};


/// CRTP base class for use as a mix-in that aids implementing

/// a TargetTransformInfo-compatible class.

template <typename T>

class TargetTransformInfoImplCRTPBase : public TargetTransformInfoImplBase {

private:

  typedef TargetTransformInfoImplBase BaseT;


protected:

  /// Construct the CRTP mix-in, forwarding \p DL to the BaseT constructor.
  explicit TargetTransformInfoImplCRTPBase(const DataLayout &DL)
      : BaseT(DL) {}


public:

  using BaseT::getGEPCost;


  /// Estimate the cost of a GEP with source element type \p PointeeType,
  /// base pointer \p Ptr and index list \p Operands.
  ///
  /// The indices are folded into a constant byte offset plus at most one
  /// variable-index scale, and the derived class \c T is then asked (via
  /// isLegalAddressingMode) whether that forms a legal addressing mode for
  /// \p AccessType. When \p AccessType is null, the type reached by the last
  /// index is used instead.
  ///
  /// \returns TTI::TCC_Free when the GEP has no indices and no global base,
  /// or when the resulting addressing mode is legal; TTI::TCC_Basic
  /// otherwise. \p CostKind is not consulted by this implementation.
  InstructionCost getGEPCost(Type *PointeeType, const Value *Ptr,
                             ArrayRef<const Value *> Operands, Type *AccessType,
                             TTI::TargetCostKind CostKind) {
    assert(PointeeType && Ptr && "can't get GEPCost of nullptr");
    // A global base (after stripping pointer casts) is passed to the
    // addressing-mode query directly; any other base counts as a base
    // register.
    auto *BaseGV = dyn_cast<GlobalValue>(Ptr->stripPointerCasts());
    bool HasBaseReg = (BaseGV == nullptr);

    // Accumulators for the addressing mode: constant offset (at pointer
    // width) and the scale of the single permitted variable index.
    auto PtrSizeBits = DL.getPointerTypeSizeInBits(Ptr->getType());
    APInt BaseOffset(PtrSizeBits, 0);
    int64_t Scale = 0;

    auto GTI = gep_type_begin(PointeeType, Operands);
    Type *TargetType = nullptr;

    // Handle the case where the GEP instruction has a single operand,
    // the basis, therefore TargetType is a nullptr.
    if (Operands.empty())
      return !BaseGV ? TTI::TCC_Free : TTI::TCC_Basic;

    // Walk the indices in lock-step with the GEP type iterator.
    for (auto I = Operands.begin(); I != Operands.end(); ++I, ++GTI) {
      TargetType = GTI.getIndexedType();
      // We assume that the cost of Scalar GEP with constant index and the
      // cost of Vector GEP with splat constant index are the same.
      const ConstantInt *ConstIdx = dyn_cast<ConstantInt>(*I);
      if (!ConstIdx)
        if (auto Splat = getSplatValue(*I))
          ConstIdx = dyn_cast<ConstantInt>(Splat);
      if (StructType *STy = GTI.getStructTypeOrNull()) {
        // For structures the index is always splat or scalar constant
        assert(ConstIdx && "Unexpected GEP index");
        // Struct field: add the field's byte offset from the struct layout.
        uint64_t Field = ConstIdx->getZExtValue();
        BaseOffset += DL.getStructLayout(STy)->getElementOffset(Field);
      } else {
        // If this operand is a scalable type, bail out early.
        // TODO: Make isLegalAddressingMode TypeSize aware.
        if (TargetType->isScalableTy())
          return TTI::TCC_Basic;
        int64_t ElementSize =
            GTI.getSequentialElementStride(DL).getFixedValue();
        if (ConstIdx) {
          // Constant sequential index: fold index * stride into the offset.
          BaseOffset +=
              ConstIdx->getValue().sextOrTrunc(PtrSizeBits) * ElementSize;
        } else {
          // Needs scale register.
          if (Scale != 0)
            // No addressing mode takes two scale registers.
            return TTI::TCC_Basic;
          Scale = ElementSize;
        }
      }
    }

    // If we haven't been provided a hint, use the target type for now.
    //
    // TODO: Take a look at potentially removing this: This is *slightly* wrong
    // as it's possible to have a GEP with a foldable target type but a memory
    // access that isn't foldable. For example, this load isn't foldable on
    // RISC-V:
    //
    // %p = getelementptr i32, ptr %base, i32 42
    // %x = load <2 x i32>, ptr %p
    if (!AccessType)
      AccessType = TargetType;

    // If the final address of the GEP is a legal addressing mode for the given
    // access type, then we can fold it into its users.
    if (static_cast<T *>(this)->isLegalAddressingMode(
            AccessType, const_cast<GlobalValue *>(BaseGV),
            BaseOffset.sextOrTrunc(64).getSExtValue(), HasBaseReg, Scale,
            Ptr->getType()->getPointerAddressSpace()))
      return TTI::TCC_Free;

    // TODO: Instead of returning TCC_Basic here, we should use
    // getArithmeticInstrCost. Or better yet, provide a hook to let the target
    // model it.
    return TTI::TCC_Basic;
  }


  /// Sum up the cost of the GEP instructions found in \p Ptrs.
  ///
  /// Only GetElementPtrInst entries contribute; every other kind of pointer
  /// in \p Ptrs (allocas, plain values, constants, constant expressions,
  /// PHIs, bitcasts, ...) is skipped. For each GEP:
  ///  - if \p Info reports a shared base and the GEP is not \p Base itself,
  ///    it is charged as a single Add, but only when at least one of its
  ///    indices is non-constant (all-constant GEPs cost nothing);
  ///  - otherwise (no known dependencies between the pointers, or the GEP is
  ///    \p Base) it is charged its full getGEPCost with \p AccessTy.
  /// Both queries are dispatched to the derived class \c T.
  InstructionCost getPointersChainCost(ArrayRef<const Value *> Ptrs,
                                       const Value *Base,
                                       const TTI::PointersChainInfo &Info,
                                       Type *AccessTy,
                                       TTI::TargetCostKind CostKind) {
    auto *Self = static_cast<T *>(this);
    InstructionCost Total = TTI::TCC_Free;

    for (const Value *P : Ptrs) {
      const auto *GEPInst = dyn_cast<GetElementPtrInst>(P);
      if (!GEPInst)
        continue;

      const bool IsOffsetFromSharedBase = Info.isSameBase() && P != Base;
      if (!IsOffsetFromSharedBase) {
        // Standalone GEP (or the base itself): charge the whole GEP.
        SmallVector<const Value *> Idxs(GEPInst->indices());
        Total += Self->getGEPCost(GEPInst->getSourceElementType(),
                                  GEPInst->getPointerOperand(), Idxs, AccessTy,
                                  CostKind);
        continue;
      }

      // Relative to the shared base: an Add, unless every index is constant.
      if (!GEPInst->hasAllConstantIndices())
        Total += Self->getArithmeticInstrCost(
            Instruction::Add, GEPInst->getType(), CostKind,
            {TTI::OK_AnyValue, TTI::OP_None}, {TTI::OK_AnyValue, TTI::OP_None},
            std::nullopt);
    }
    return Total;
  }


  /// Estimate the cost of the user \p U, given its operands \p Operands,
  /// for the cost model selected by \p CostKind.
  ///
  /// Non-intrinsic calls are costed directly from their parameter/argument
  /// count. Everything else is dispatched on Operator::getOpcode(U) to the
  /// matching cost hook of the derived class \c T. Opcodes without a case
  /// (and allocas that are not static) fall through to the default at the
  /// bottom: -1 for TCK_RecipThroughput, TTI::TCC_Basic otherwise.
  InstructionCost getInstructionCost(const User *U,
                                     ArrayRef<const Value *> Operands,
                                     TTI::TargetCostKind CostKind) {
    using namespace llvm::PatternMatch;

    auto *TargetTTI = static_cast<T *>(this);
    // Handle non-intrinsic calls, invokes, and callbr.
    // FIXME: Unlikely to be true for anything but CodeSize.
    auto *CB = dyn_cast<CallBase>(U);
    if (CB && !isa<IntrinsicInst>(U)) {
      if (const Function *F = CB->getCalledFunction()) {
        if (!TargetTTI->isLoweredToCall(F))
          return TTI::TCC_Basic; // Give a basic cost if it will be lowered

        // Known callee lowered to a call: one basic unit per declared
        // parameter, plus one.
        return TTI::TCC_Basic * (F->getFunctionType()->getNumParams() + 1);
      }
      // For indirect or other calls, scale cost by number of arguments.
      return TTI::TCC_Basic * (CB->arg_size() + 1);
    }

    Type *Ty = U->getType();
    unsigned Opcode = Operator::getOpcode(U);
    // I is null when U is not an Instruction.
    auto *I = dyn_cast<Instruction>(U);
    switch (Opcode) {
    default:
      break;
    case Instruction::Call: {
      // Only intrinsic calls get here; other calls returned above.
      assert(isa<IntrinsicInst>(U) && "Unexpected non-intrinsic call");
      auto *Intrinsic = cast<IntrinsicInst>(U);
      IntrinsicCostAttributes CostAttrs(Intrinsic->getIntrinsicID(), *CB);
      return TargetTTI->getIntrinsicInstrCost(CostAttrs, CostKind);
    }
    case Instruction::Br:
    case Instruction::Ret:
    case Instruction::PHI:
    case Instruction::Switch:
      return TargetTTI->getCFInstrCost(Opcode, CostKind, I);
    case Instruction::ExtractValue:
    case Instruction::Freeze:
      return TTI::TCC_Free;
    case Instruction::Alloca:
      // Static allocas are free; others take the default cost below.
      if (cast<AllocaInst>(U)->isStaticAlloca())
        return TTI::TCC_Free;
      break;
    case Instruction::GetElementPtr: {
      const auto *GEP = cast<GEPOperator>(U);
      Type *AccessType = nullptr;
      // For now, only provide the AccessType in the simple case where the GEP
      // only has one user.
      if (GEP->hasOneUser() && I)
        AccessType = I->user_back()->getAccessType();

      // Operands.front() is the base pointer; the rest are the indices.
      return TargetTTI->getGEPCost(GEP->getSourceElementType(),
                                   Operands.front(), Operands.drop_front(),
                                   AccessType, CostKind);
    }
    case Instruction::Add:
    case Instruction::FAdd:
    case Instruction::Sub:
    case Instruction::FSub:
    case Instruction::Mul:
    case Instruction::FMul:
    case Instruction::UDiv:
    case Instruction::SDiv:
    case Instruction::FDiv:
    case Instruction::URem:
    case Instruction::SRem:
    case Instruction::FRem:
    case Instruction::Shl:
    case Instruction::LShr:
    case Instruction::AShr:
    case Instruction::And:
    case Instruction::Or:
    case Instruction::Xor:
    case Instruction::FNeg: {
      const TTI::OperandValueInfo Op1Info = TTI::getOperandInfo(Operands[0]);
      TTI::OperandValueInfo Op2Info;
      // FNeg is the only opcode in this group without a second operand.
      if (Opcode != Instruction::FNeg)
        Op2Info = TTI::getOperandInfo(Operands[1]);
      return TargetTTI->getArithmeticInstrCost(Opcode, Ty, CostKind, Op1Info,
                                               Op2Info, Operands, I);
    }
    case Instruction::IntToPtr:
    case Instruction::PtrToInt:
    case Instruction::SIToFP:
    case Instruction::UIToFP:
    case Instruction::FPToUI:
    case Instruction::FPToSI:
    case Instruction::Trunc:
    case Instruction::FPTrunc:
    case Instruction::BitCast:
    case Instruction::FPExt:
    case Instruction::SExt:
    case Instruction::ZExt:
    case Instruction::AddrSpaceCast: {
      // Casts are costed from the destination type (Ty) and the source
      // operand's type.
      Type *OpTy = Operands[0]->getType();
      return TargetTTI->getCastInstrCost(
          Opcode, Ty, OpTy, TTI::getCastContextHint(I), CostKind, I);
    }
    case Instruction::Store: {
      auto *SI = cast<StoreInst>(U);
      // The stored value is operand 0; its type drives the memory-op cost.
      Type *ValTy = Operands[0]->getType();
      TTI::OperandValueInfo OpInfo = TTI::getOperandInfo(Operands[0]);
      return TargetTTI->getMemoryOpCost(Opcode, ValTy, SI->getAlign(),
                                        SI->getPointerAddressSpace(), CostKind,
                                        OpInfo, I);
    }
    case Instruction::Load: {
      // FIXME: Arbitrary cost which could come from the backend.
      if (CostKind == TTI::TCK_Latency)
        return 4;
      auto *LI = cast<LoadInst>(U);
      Type *LoadType = U->getType();
      // If there is a non-register sized type, the cost estimation may expand
      // it to be several instructions to load into multiple registers on the
      // target.  But, if the only use of the load is a trunc instruction to a
      // register sized type, the instruction selector can combine these
      // instructions to be a single load.  So, in this case, we use the
      // destination type of the trunc instruction rather than the load to
      // accurately estimate the cost of this load instruction.
      if (CostKind == TTI::TCK_CodeSize && LI->hasOneUse() &&
          !LoadType->isVectorTy()) {
        if (const TruncInst *TI = dyn_cast<TruncInst>(*LI->user_begin()))
          LoadType = TI->getDestTy();
      }
      return TargetTTI->getMemoryOpCost(Opcode, LoadType, LI->getAlign(),
                                        LI->getPointerAddressSpace(), CostKind,
                                        {TTI::OK_AnyValue, TTI::OP_None}, I);
    }
    case Instruction::Select: {
      const Value *Op0, *Op1;
      // Selects that encode a logical and/or are costed as the matching
      // bitwise instruction.
      if (match(U, m_LogicalAnd(m_Value(Op0), m_Value(Op1))) ||
          match(U, m_LogicalOr(m_Value(Op0), m_Value(Op1)))) {
        // select x, y, false --> x & y
        // select x, true, y --> x | y
        const auto Op1Info = TTI::getOperandInfo(Op0);
        const auto Op2Info = TTI::getOperandInfo(Op1);
        assert(Op0->getType()->getScalarSizeInBits() == 1 &&
               Op1->getType()->getScalarSizeInBits() == 1);

        // Note: this local deliberately shadows the Operands parameter with
        // the two matched operands.
        SmallVector<const Value *, 2> Operands{Op0, Op1};
        return TargetTTI->getArithmeticInstrCost(
            match(U, m_LogicalOr()) ? Instruction::Or : Instruction::And, Ty,
            CostKind, Op1Info, Op2Info, Operands, I);
      }
      // Any other select: operand 0 is the condition.
      Type *CondTy = Operands[0]->getType();
      return TargetTTI->getCmpSelInstrCost(Opcode, U->getType(), CondTy,
                                           CmpInst::BAD_ICMP_PREDICATE,
                                           CostKind, I);
    }
    case Instruction::ICmp:
    case Instruction::FCmp: {
      Type *ValTy = Operands[0]->getType();
      // TODO: Also handle ICmp/FCmp constant expressions.
      // The real predicate is only available when U is an instruction.
      return TargetTTI->getCmpSelInstrCost(Opcode, ValTy, U->getType(),
                                           I ? cast<CmpInst>(I)->getPredicate()
                                             : CmpInst::BAD_ICMP_PREDICATE,
                                           CostKind, I);
    }
    case Instruction::InsertElement: {
      auto *IE = dyn_cast<InsertElementInst>(U);
      if (!IE)
        return TTI::TCC_Basic; // FIXME
      // Idx stays at -1 (converted to unsigned) unless the index operand is
      // a ConstantInt with at most 32 active bits.
      unsigned Idx = -1;
      if (auto *CI = dyn_cast<ConstantInt>(Operands[2]))
        if (CI->getValue().getActiveBits() <= 32)
          Idx = CI->getZExtValue();
      return TargetTTI->getVectorInstrCost(*IE, Ty, CostKind, Idx);
    }
    case Instruction::ShuffleVector: {
      auto *Shuffle = dyn_cast<ShuffleVectorInst>(U);
      if (!Shuffle)
        return TTI::TCC_Basic; // FIXME

      // VecTy is the result type, VecSrcTy the type of the first source.
      auto *VecTy = cast<VectorType>(U->getType());
      auto *VecSrcTy = cast<VectorType>(Operands[0]->getType());
      ArrayRef<int> Mask = Shuffle->getShuffleMask();
      int NumSubElts, SubIndex;

      // TODO: move more of this inside improveShuffleKindFromMask.
      if (Shuffle->changesLength()) {
        // Treat a 'subvector widening' as a free shuffle.
        if (Shuffle->increasesLength() && Shuffle->isIdentityWithPadding())
          return 0;

        if (Shuffle->isExtractSubvectorMask(SubIndex))
          return TargetTTI->getShuffleCost(TTI::SK_ExtractSubvector, VecSrcTy,
                                           Mask, CostKind, SubIndex, VecTy,
                                           Operands, Shuffle);

        if (Shuffle->isInsertSubvectorMask(NumSubElts, SubIndex))
          return TargetTTI->getShuffleCost(
              TTI::SK_InsertSubvector, VecTy, Mask, CostKind, SubIndex,
              FixedVectorType::get(VecTy->getScalarType(), NumSubElts),
              Operands, Shuffle);

        int ReplicationFactor, VF;
        if (Shuffle->isReplicationMask(ReplicationFactor, VF)) {
          // Every mask lane that is not poison is a demanded destination
          // element.
          APInt DemandedDstElts = APInt::getZero(Mask.size());
          for (auto I : enumerate(Mask)) {
            if (I.value() != PoisonMaskElem)
              DemandedDstElts.setBit(I.index());
          }
          return TargetTTI->getReplicationShuffleCost(
              VecSrcTy->getElementType(), ReplicationFactor, VF,
              DemandedDstElts, CostKind);
        }

        // Generic length-changing shuffle. A shuffle whose second operand is
        // undef is treated as single-source.
        bool IsUnary = isa<UndefValue>(Operands[1]);
        NumSubElts = VecSrcTy->getElementCount().getKnownMinValue();
        SmallVector<int, 16> AdjustMask(Mask.begin(), Mask.end());

        // Widening shuffle - widening the source(s) to the new length
        // (treated as free - see above), and then perform the adjusted
        // shuffle at that width.
        if (Shuffle->increasesLength()) {
          // Indices at or beyond NumSubElts are shifted up by the amount the
          // vector grows.
          for (int &M : AdjustMask)
            M = M >= NumSubElts ? (M + (Mask.size() - NumSubElts)) : M;

          return TargetTTI->getShuffleCost(
              IsUnary ? TTI::SK_PermuteSingleSrc : TTI::SK_PermuteTwoSrc, VecTy,
              AdjustMask, CostKind, 0, nullptr, Operands, Shuffle);
        }

        // Narrowing shuffle - perform shuffle at original wider width and
        // then extract the lower elements.
        AdjustMask.append(NumSubElts - Mask.size(), PoisonMaskElem);

        InstructionCost ShuffleCost = TargetTTI->getShuffleCost(
            IsUnary ? TTI::SK_PermuteSingleSrc : TTI::SK_PermuteTwoSrc,
            VecSrcTy, AdjustMask, CostKind, 0, nullptr, Operands, Shuffle);

        // Identity mask 0..Mask.size()-1 describing the extraction of the
        // low elements.
        SmallVector<int, 16> ExtractMask(Mask.size());
        std::iota(ExtractMask.begin(), ExtractMask.end(), 0);
        return ShuffleCost + TargetTTI->getShuffleCost(
                                 TTI::SK_ExtractSubvector, VecSrcTy,
                                 ExtractMask, CostKind, 0, VecTy, {}, Shuffle);
      }

      // Same-length shuffles: the first matching classification below
      // decides the shuffle kind, so the order of these checks matters.
      if (Shuffle->isIdentity())
        return 0;

      if (Shuffle->isReverse())
        return TargetTTI->getShuffleCost(TTI::SK_Reverse, VecTy, Mask, CostKind,
                                         0, nullptr, Operands, Shuffle);

      if (Shuffle->isSelect())
        return TargetTTI->getShuffleCost(TTI::SK_Select, VecTy, Mask, CostKind,
                                         0, nullptr, Operands, Shuffle);

      if (Shuffle->isTranspose())
        return TargetTTI->getShuffleCost(TTI::SK_Transpose, VecTy, Mask,
                                         CostKind, 0, nullptr, Operands,
                                         Shuffle);

      if (Shuffle->isZeroEltSplat())
        return TargetTTI->getShuffleCost(TTI::SK_Broadcast, VecTy, Mask,
                                         CostKind, 0, nullptr, Operands,
                                         Shuffle);

      if (Shuffle->isSingleSource())
        return TargetTTI->getShuffleCost(TTI::SK_PermuteSingleSrc, VecTy, Mask,
                                         CostKind, 0, nullptr, Operands,
                                         Shuffle);

      if (Shuffle->isInsertSubvectorMask(NumSubElts, SubIndex))
        return TargetTTI->getShuffleCost(
            TTI::SK_InsertSubvector, VecTy, Mask, CostKind, SubIndex,
            FixedVectorType::get(VecTy->getScalarType(), NumSubElts), Operands,
            Shuffle);

      if (Shuffle->isSplice(SubIndex))
        return TargetTTI->getShuffleCost(TTI::SK_Splice, VecTy, Mask, CostKind,
                                         SubIndex, nullptr, Operands, Shuffle);

      // Nothing more specific matched: general two-source permute.
      return TargetTTI->getShuffleCost(TTI::SK_PermuteTwoSrc, VecTy, Mask,
                                       CostKind, 0, nullptr, Operands, Shuffle);
    }
    case Instruction::ExtractElement: {
      auto *EEI = dyn_cast<ExtractElementInst>(U);
      if (!EEI)
        return TTI::TCC_Basic; // FIXME
      // Idx stays at -1 (converted to unsigned) unless the index operand is
      // a ConstantInt with at most 32 active bits.
      unsigned Idx = -1;
      if (auto *CI = dyn_cast<ConstantInt>(Operands[1]))
        if (CI->getValue().getActiveBits() <= 32)
          Idx = CI->getZExtValue();
      // Despite its name, DstTy is the type of operand 0 (the vector being
      // extracted from).
      Type *DstTy = Operands[0]->getType();
      return TargetTTI->getVectorInstrCost(*EEI, DstTy, CostKind, Idx);
    }
    }

    // By default, just classify everything as 'basic', or use -1 to represent
    // that we don't know the throughput cost.
    return CostKind == TTI::TCK_RecipThroughput ? -1 : TTI::TCC_Basic;
  }


  bool isExpensiveToSpeculativelyExecute(const Instruction *I) {

    auto *TargetTTI = static_cast<T *>(this);

    SmallVector<const Value *, 4> Ops(I->operand_values());

    InstructionCost Cost = TargetTTI->getInstructionCost(

        I, Ops, TargetTransformInfo::TCK_SizeAndLatency);

    return Cost >= TargetTransformInfo::TCC_Expensive;

  }


  bool supportsTailCallFor(const CallBase *CB) const {

    return static_cast<const T *>(this)->supportsTailCalls();

  }

};

} // namespace llvm


#endif

Info
Analysis containing CSE Info
Definition: CSEInfo.cpp:27

CostKind
static cl::opt< TargetTransformInfo::TargetCostKind > CostKind("cost-kind", cl::desc("Target cost kind"), cl::init(TargetTransformInfo::TCK_RecipThroughput), cl::values(clEnumValN(TargetTransformInfo::TCK_RecipThroughput, "throughput", "Reciprocal throughput"), clEnumValN(TargetTransformInfo::TCK_Latency, "latency", "Instruction latency"), clEnumValN(TargetTransformInfo::TCK_CodeSize, "code-size", "Code size"), clEnumValN(TargetTransformInfo::TCK_SizeAndLatency, "size-latency", "Code size and latency")))

DataLayout.h

RetTy
return RetTy
Definition: DeadArgumentElimination.cpp:362

Idx
Returns the sub type a function will return at a given Idx Should correspond to the result type of an ExtractValue instruction executed with just that one unsigned Idx
Definition: DeadArgumentElimination.cpp:354

Name
std::string Name
Definition: ELFObjHandler.cpp:77

isSigned
static bool isSigned(unsigned int Opcode)
Definition: ExpandLargeDivRem.cpp:53

GetElementPtrTypeIterator.h

GEP
Hexagon Common GEP
Definition: HexagonCommonGEP.cpp:171

IntrinsicInst.h

F
#define F(x, y, z)
Definition: MD5.cpp:55

I
#define I(x, y, z)
Definition: MD5.cpp:58

Operands
mir Rename Register Operands
Definition: MIRNamerPass.cpp:74

Context
LLVMContext & Context
Definition: NVVMIntrRange.cpp:66

Operator.h

PatternMatch.h

Mode
static cl::opt< RegAllocEvictionAdvisorAnalysis::AdvisorMode > Mode("regalloc-enable-advisor", cl::Hidden, cl::init(RegAllocEvictionAdvisorAnalysis::AdvisorMode::Default), cl::desc("Enable regalloc advisor mode"), cl::values(clEnumValN(RegAllocEvictionAdvisorAnalysis::AdvisorMode::Default, "default", "Default"), clEnumValN(RegAllocEvictionAdvisorAnalysis::AdvisorMode::Release, "release", "precompiled"), clEnumValN(RegAllocEvictionAdvisorAnalysis::AdvisorMode::Development, "development", "for training")))

assert
assert(ImpDefSCC.getReg()==AMDGPU::SCC &&ImpDefSCC.isDef())

ScalarEvolutionExpressions.h

getType
static SymbolRef::Type getType(const Symbol *Sym)
Definition: TapiFile.cpp:40

Ptr
@ Ptr
Definition: TargetLibraryInfo.cpp:76

TargetTransformInfo.h
This pass exposes codegen information to IR-level passes.

VectorUtils.h

T

llvm::APInt
Class for arbitrary precision integers.
Definition: APInt.h:76

llvm::APInt::setBit
void setBit(unsigned BitPosition)
Set the given bit to 1 whose position is given as "bitPosition".
Definition: APInt.h:1308

llvm::APInt::getBitWidth
unsigned getBitWidth() const
Return the number of bits in the APInt.
Definition: APInt.h:1439

llvm::APInt::sextOrTrunc
APInt sextOrTrunc(unsigned width) const
Sign extend or truncate to width.
Definition: APInt.cpp:1010

llvm::APInt::getZero
static APInt getZero(unsigned numBits)
Get the '0' value for the specified bit-width.
Definition: APInt.h:178

llvm::APInt::getSExtValue
int64_t getSExtValue() const
Get sign extended value.
Definition: APInt.h:1513

llvm::AllocaInst
an instruction to allocate memory on the stack
Definition: Instructions.h:59

llvm::ArrayRef
ArrayRef - Represent a constant reference to an array (0 or more elements consecutively in memory),...
Definition: ArrayRef.h:41

llvm::AssumptionCache
A cache of @llvm.assume calls within a function.
Definition: AssumptionCache.h:42

llvm::BlockFrequencyInfo
BlockFrequencyInfo pass uses BlockFrequencyInfoImpl implementation to estimate IR basic block frequen...
Definition: BlockFrequencyInfo.h:38

llvm::BranchInst
Conditional or Unconditional Branch instruction.
Definition: Instructions.h:3439

llvm::BranchProbability
Definition: BranchProbability.h:30

llvm::CallBase
Base class for all callable instructions (InvokeInst and CallInst) Holds everything related to callin...
Definition: InstrTypes.h:1494

llvm::CmpInst::Predicate
Predicate
This enumeration lists the possible predicates for CmpInst subclasses.
Definition: InstrTypes.h:993

llvm::CmpInst::BAD_ICMP_PREDICATE
@ BAD_ICMP_PREDICATE
Definition: InstrTypes.h:1026

llvm::ConstantInt
This is the shared class of boolean and integer constants.
Definition: Constants.h:80

llvm::ConstantInt::getZExtValue
uint64_t getZExtValue() const
Return the constant as a 64-bit unsigned integer value after it has been zero extended as appropriate...
Definition: Constants.h:154

llvm::ConstantInt::getValue
const APInt & getValue() const
Return the constant as an APInt value reference.
Definition: Constants.h:145

llvm::Constant
This is an important base class in LLVM.
Definition: Constant.h:41

llvm::DataLayout
A parsed version of the target data layout string in and methods for querying it.
Definition: DataLayout.h:110

llvm::DataLayout::isLegalInteger
bool isLegalInteger(uint64_t Width) const
Returns true if the specified type is known to be a native integer type supported by the CPU.
Definition: DataLayout.h:260

llvm::DataLayout::getStructLayout
const StructLayout * getStructLayout(StructType *Ty) const
Returns a StructLayout object, indicating the alignment of the struct, its size, and the offsets of i...
Definition: DataLayout.cpp:720

llvm::DataLayout::getPointerTypeSizeInBits
unsigned getPointerTypeSizeInBits(Type *) const
Layout pointer size, in bits, based on the type.
Definition: DataLayout.cpp:763

llvm::DataLayout::getTypeSizeInBits
TypeSize getTypeSizeInBits(Type *Ty) const
Size examples:
Definition: DataLayout.h:672

llvm::DataLayout::getTypeStoreSize
TypeSize getTypeStoreSize(Type *Ty) const
Returns the maximum number of bytes that may be overwritten by storing the specified type.
Definition: DataLayout.h:472

llvm::DominatorTree
Concrete subclass of DominatorTreeBase that is used to compute a normal dominator tree.
Definition: Dominators.h:162

llvm::ElementCount
Definition: TypeSize.h:285

llvm::ElementCount::get
static constexpr ElementCount get(ScalarTy MinVal, bool Scalable)
Definition: TypeSize.h:302

llvm::FastMathFlags
Convenience struct for specifying and reasoning about fast-math flags.
Definition: FMF.h:20

llvm::FixedVectorType::get
static FixedVectorType * get(Type *ElementType, unsigned NumElts)
Definition: Type.cpp:692

llvm::Function
Definition: Function.h:63

llvm::GlobalValue
Definition: GlobalValue.h:48

llvm::InstCombiner
The core instruction combiner logic.
Definition: InstCombiner.h:47

llvm::InstructionCost
Definition: InstructionCost.h:29

llvm::InstructionCost::getInvalid
static InstructionCost getInvalid(CostType Val=0)
Definition: InstructionCost.h:73

llvm::Instruction
Definition: Instruction.h:49

llvm::IntrinsicCostAttributes
Definition: TargetTransformInfo.h:120

llvm::IntrinsicCostAttributes::getID
Intrinsic::ID getID() const
Definition: TargetTransformInfo.h:151

llvm::IntrinsicInst
A wrapper class for inspecting calls to intrinsic functions.
Definition: IntrinsicInst.h:47

llvm::IntrinsicInst::getIntrinsicID
Intrinsic::ID getIntrinsicID() const
Return the intrinsic ID of this intrinsic.
Definition: IntrinsicInst.h:54

llvm::LLVMContext
This is an important class for using LLVM in a threaded context.
Definition: LLVMContext.h:67

llvm::LoadInst
An instruction for reading from memory.
Definition: Instructions.h:184

llvm::LoopInfo
Definition: LoopInfo.h:407

llvm::Loop
Represents a single loop in the control flow graph.
Definition: LoopInfo.h:44

llvm::Operator::getOpcode
unsigned getOpcode() const
Return the opcode for this Instruction or ConstantExpr.
Definition: Operator.h:41

llvm::OptimizationRemarkEmitter
The optimization diagnostic interface.
Definition: OptimizationRemarkEmitter.h:33

llvm::ProfileSummaryInfo
Analysis providing profile information.
Definition: ProfileSummaryInfo.h:42

llvm::RecurrenceDescriptor
The RecurrenceDescriptor is used to identify recurrence variables in a loop.
Definition: IVDescriptors.h:71

llvm::SCEVAddRecExpr
This node represents a polynomial recurrence on the trip count of the specified loop.
Definition: ScalarEvolutionExpressions.h:347

llvm::SCEVAddRecExpr::getStepRecurrence
const SCEV * getStepRecurrence(ScalarEvolution &SE) const
Constructs and returns the recurrence indicating how much this expression steps by.
Definition: ScalarEvolutionExpressions.h:365

llvm::SCEVConstant
This class represents a constant integer value.
Definition: ScalarEvolutionExpressions.h:60

llvm::SCEVConstant::getAPInt
const APInt & getAPInt() const
Definition: ScalarEvolutionExpressions.h:70

llvm::SCEV
This class represents an analyzed expression in the program.
Definition: ScalarEvolution.h:75

llvm::ScalarEvolution
The main scalar evolution driver.
Definition: ScalarEvolution.h:452

llvm::SmallBitVector
This is a 'bitvector' (really, a variable-sized bit array), optimized for the case when the array is small.
Definition: SmallBitVector.h:35

llvm::SmallVectorImpl
This class consists of common code factored out of the SmallVector class to reduce code duplication based on the SmallVector 'N' template parameter.
Definition: SmallVector.h:586

llvm::SmallVectorImpl::append
void append(ItTy in_start, ItTy in_end)
Add the specified range to the end of the SmallVector.
Definition: SmallVector.h:696

llvm::SmallVectorTemplateBase::push_back
void push_back(const T &Elt)
Definition: SmallVector.h:426

llvm::SmallVectorTemplateCommon::end
iterator end()
Definition: SmallVector.h:282

llvm::SmallVectorTemplateCommon::begin
iterator begin()
Definition: SmallVector.h:280

llvm::SmallVector
This is a 'vector' (really, a variable-sized array), optimized for the case when the array is small.
Definition: SmallVector.h:1209

llvm::StoreInst
An instruction for storing to memory.
Definition: Instructions.h:317

llvm::StringRef
StringRef - Represent a constant reference to a string, i.e. a character array and a length, which need not be null terminated.
Definition: StringRef.h:50

llvm::StructLayout::getElementOffset
TypeSize getElementOffset(unsigned Idx) const
Definition: DataLayout.h:651

llvm::StructType
Class to represent struct types.
Definition: DerivedTypes.h:216

llvm::SwitchInst
Multiway switch.
Definition: Instructions.h:3598

llvm::TargetLibraryInfo
Provides information about what library functions are available for the current target.
Definition: TargetLibraryInfo.h:281

llvm::TargetTransformInfoImplBase
Base class for use as a mix-in that aids implementing a TargetTransformInfo-compatible class.
Definition: TargetTransformInfoImpl.h:34

llvm::TargetTransformInfoImplBase::getDataLayout
const DataLayout & getDataLayout() const
Definition: TargetTransformInfoImpl.h:47

llvm::TargetTransformInfoImplBase::isSingleThreaded
bool isSingleThreaded() const
Definition: TargetTransformInfoImpl.h:129

llvm::TargetTransformInfoImplBase::getMemcpyLoopResidualLoweringType
void getMemcpyLoopResidualLoweringType(SmallVectorImpl< Type * > &OpsOut, LLVMContext &Context, unsigned RemainingBytes, unsigned SrcAddrSpace, unsigned DestAddrSpace, unsigned SrcAlign, unsigned DestAlign, std::optional< uint32_t > AtomicCpySize) const
Definition: TargetTransformInfoImpl.h:831

llvm::TargetTransformInfoImplBase::isLegalToVectorizeStore
bool isLegalToVectorizeStore(StoreInst *SI) const
Definition: TargetTransformInfoImpl.h:877

llvm::TargetTransformInfoImplBase::addrspacesMayAlias
bool addrspacesMayAlias(unsigned AS0, unsigned AS1) const
Definition: TargetTransformInfoImpl.h:111

llvm::TargetTransformInfoImplBase::getNumberOfParts
unsigned getNumberOfParts(Type *Tp) const
Definition: TargetTransformInfoImpl.h:768

llvm::TargetTransformInfoImplBase::getAtomicMemIntrinsicMaxElementSize
unsigned getAtomicMemIntrinsicMaxElementSize() const
Definition: TargetTransformInfoImpl.h:808

llvm::TargetTransformInfoImplBase::shouldTreatInstructionLikeSelect
bool shouldTreatInstructionLikeSelect(const Instruction *I)
Definition: TargetTransformInfoImpl.h:388

llvm::TargetTransformInfoImplBase::isLegalToVectorizeLoad
bool isLegalToVectorizeLoad(LoadInst *LI) const
Definition: TargetTransformInfoImpl.h:875

llvm::TargetTransformInfoImplBase::isLegalBroadcastLoad
bool isLegalBroadcastLoad(Type *ElementTy, ElementCount NumElements) const
Definition: TargetTransformInfoImpl.h:280

llvm::TargetTransformInfoImplBase::getVScaleForTuning
std::optional< unsigned > getVScaleForTuning() const
Definition: TargetTransformInfoImpl.h:475

llvm::TargetTransformInfoImplBase::shouldMaximizeVectorBandwidth
bool shouldMaximizeVectorBandwidth(TargetTransformInfo::RegisterKind K) const
Definition: TargetTransformInfoImpl.h:479

llvm::TargetTransformInfoImplBase::canSaveCmp
bool canSaveCmp(Loop *L, BranchInst **BI, ScalarEvolution *SE, LoopInfo *LI, DominatorTree *DT, AssumptionCache *AC, TargetLibraryInfo *LibInfo) const
Definition: TargetTransformInfoImpl.h:247

llvm::TargetTransformInfoImplBase::isLegalStridedLoadStore
bool isLegalStridedLoadStore(Type *DataType, Align Alignment) const
Definition: TargetTransformInfoImpl.h:314

llvm::TargetTransformInfoImplBase::simplifyDemandedVectorEltsIntrinsic
std::optional< Value * > simplifyDemandedVectorEltsIntrinsic(InstCombiner &IC, IntrinsicInst &II, APInt DemandedElts, APInt &UndefElts, APInt &UndefElts2, APInt &UndefElts3, std::function< void(Instruction *, unsigned, APInt, APInt &)> SimplifyAndSetOp) const
Definition: TargetTransformInfoImpl.h:202

llvm::TargetTransformInfoImplBase::isLegalICmpImmediate
bool isLegalICmpImmediate(int64_t Imm) const
Definition: TargetTransformInfoImpl.h:221

llvm::TargetTransformInfoImplBase::haveFastSqrt
bool haveFastSqrt(Type *Ty) const
Definition: TargetTransformInfoImpl.h:413

llvm::TargetTransformInfoImplBase::getRegUsageForType
unsigned getRegUsageForType(Type *Ty) const
Definition: TargetTransformInfoImpl.h:349

llvm::TargetTransformInfoImplBase::getInterleavedMemoryOpCost
unsigned getInterleavedMemoryOpCost(unsigned Opcode, Type *VecTy, unsigned Factor, ArrayRef< unsigned > Indices, Align Alignment, unsigned AddressSpace, TTI::TargetCostKind CostKind, bool UseMaskForCond, bool UseMaskForGaps) const
Definition: TargetTransformInfoImpl.h:707

llvm::TargetTransformInfoImplBase::areTypesABICompatible
bool areTypesABICompatible(const Function *Caller, const Function *Callee, const ArrayRef< Type * > &Types) const
Definition: TargetTransformInfoImpl.h:855

llvm::TargetTransformInfoImplBase::getPeelingPreferences
void getPeelingPreferences(Loop *, ScalarEvolution &, TTI::PeelingPreferences &) const
Definition: TargetTransformInfoImpl.h:214

llvm::TargetTransformInfoImplBase::isAlwaysUniform
bool isAlwaysUniform(const Value *V) const
Definition: TargetTransformInfoImpl.h:105

llvm::TargetTransformInfoImplBase::isProfitableToHoist
bool isProfitableToHoist(Instruction *I) const
Definition: TargetTransformInfoImpl.h:343

llvm::TargetTransformInfoImplBase::getEstimatedNumberOfCaseClusters
unsigned getEstimatedNumberOfCaseClusters(const SwitchInst &SI, unsigned &JTSize, ProfileSummaryInfo *PSI, BlockFrequencyInfo *BFI) const
Definition: TargetTransformInfoImpl.h:61

llvm::TargetTransformInfoImplBase::getIntImmCostInst
InstructionCost getIntImmCostInst(unsigned Opcode, unsigned Idx, const APInt &Imm, Type *Ty, TTI::TargetCostKind CostKind, Instruction *Inst=nullptr) const
Definition: TargetTransformInfoImpl.h:433

llvm::TargetTransformInfoImplBase::isLSRCostLess
bool isLSRCostLess(const TTI::LSRCost &C1, const TTI::LSRCost &C2) const
Definition: TargetTransformInfoImpl.h:232

llvm::TargetTransformInfoImplBase::isExpensiveToSpeculativelyExecute
bool isExpensiveToSpeculativelyExecute(const Instruction *I)
Definition: TargetTransformInfoImpl.h:415

llvm::TargetTransformInfoImplBase::isTruncateFree
bool isTruncateFree(Type *Ty1, Type *Ty2) const
Definition: TargetTransformInfoImpl.h:341

llvm::TargetTransformInfoImplBase::enableOrderedReductions
bool enableOrderedReductions() const
Definition: TargetTransformInfoImpl.h:318

llvm::TargetTransformInfoImplBase::getFlatAddressSpace
unsigned getFlatAddressSpace() const
Definition: TargetTransformInfoImpl.h:115

llvm::TargetTransformInfoImplBase::isStridedAccess
bool isStridedAccess(const SCEV *Ptr) const
Definition: TargetTransformInfoImpl.h:1005

llvm::TargetTransformInfoImplBase::useAA
bool useAA() const
Definition: TargetTransformInfoImpl.h:345

llvm::TargetTransformInfoImplBase::enableInterleavedAccessVectorization
bool enableInterleavedAccessVectorization() const
Definition: TargetTransformInfoImpl.h:397

llvm::TargetTransformInfoImplBase::getCallInstrCost
InstructionCost getCallInstrCost(Function *F, Type *RetTy, ArrayRef< Type * > Tys, TTI::TargetCostKind CostKind) const
Definition: TargetTransformInfoImpl.h:761

llvm::TargetTransformInfoImplBase::getArithmeticReductionCost
InstructionCost getArithmeticReductionCost(unsigned, VectorType *, std::optional< FastMathFlags > FMF, TTI::TargetCostKind) const
Definition: TargetTransformInfoImpl.h:775

llvm::TargetTransformInfoImplBase::getFPOpCost
InstructionCost getFPOpCost(Type *Ty) const
Definition: TargetTransformInfoImpl.h:419

llvm::TargetTransformInfoImplBase::shouldConsiderAddressTypePromotion
bool shouldConsiderAddressTypePromotion(const Instruction &I, bool &AllowPromotionWithoutCommonHeader) const
Definition: TargetTransformInfoImpl.h:490

llvm::TargetTransformInfoImplBase::areInlineCompatible
bool areInlineCompatible(const Function *Caller, const Function *Callee) const
Definition: TargetTransformInfoImpl.h:842

llvm::TargetTransformInfoImplBase::getPredicatedAddrSpace
std::pair< const Value *, unsigned > getPredicatedAddrSpace(const Value *V) const
Definition: TargetTransformInfoImpl.h:132

llvm::TargetTransformInfoImplBase::getMemcpyCost
InstructionCost getMemcpyCost(const Instruction *I) const
Definition: TargetTransformInfoImpl.h:83

llvm::TargetTransformInfoImplBase::getCacheLineSize
unsigned getCacheLineSize() const
Definition: TargetTransformInfoImpl.h:496

llvm::TargetTransformInfoImplBase::getInliningCostBenefitAnalysisProfitableMultiplier
unsigned getInliningCostBenefitAnalysisProfitableMultiplier() const
Definition: TargetTransformInfoImpl.h:73

llvm::TargetTransformInfoImplBase::getStoreVectorFactor
unsigned getStoreVectorFactor(unsigned VF, unsigned StoreSize, unsigned ChainSizeInBytes, VectorType *VecTy) const
Definition: TargetTransformInfoImpl.h:902

llvm::TargetTransformInfoImplBase::getMaxNumArgs
unsigned getMaxNumArgs() const
Definition: TargetTransformInfoImpl.h:946

llvm::TargetTransformInfoImplBase::isFPVectorizationPotentiallyUnsafe
bool isFPVectorizationPotentiallyUnsafe() const
Definition: TargetTransformInfoImpl.h:401

llvm::TargetTransformInfoImplBase::getMaxVScale
std::optional< unsigned > getMaxVScale() const
Definition: TargetTransformInfoImpl.h:474

llvm::TargetTransformInfoImplBase::getPopcntSupport
TTI::PopcntSupportKind getPopcntSupport(unsigned IntTyWidthInBit) const
Definition: TargetTransformInfoImpl.h:409

llvm::TargetTransformInfoImplBase::getMinTripCountTailFoldingThreshold
unsigned getMinTripCountTailFoldingThreshold() const
Definition: TargetTransformInfoImpl.h:926

llvm::TargetTransformInfoImplBase::getCallerAllocaCost
unsigned getCallerAllocaCost(const CallBase *CB, const AllocaInst *AI) const
Definition: TargetTransformInfoImpl.h:77

llvm::TargetTransformInfoImplBase::isProfitableLSRChainElement
bool isProfitableLSRChainElement(Instruction *I) const
Definition: TargetTransformInfoImpl.h:243

llvm::TargetTransformInfoImplBase::getShuffleCost
InstructionCost getShuffleCost(TTI::ShuffleKind Kind, VectorType *Ty, ArrayRef< int > Mask, TTI::TargetCostKind CostKind, int Index, VectorType *SubTp, ArrayRef< const Value * > Args=std::nullopt, const Instruction *CxtI=nullptr) const
Definition: TargetTransformInfoImpl.h:582

llvm::TargetTransformInfoImplBase::getIntImmCodeSizeCost
InstructionCost getIntImmCodeSizeCost(unsigned Opcode, unsigned Idx, const APInt &Imm, Type *Ty) const
Definition: TargetTransformInfoImpl.h:423

llvm::TargetTransformInfoImplBase::preferToKeepConstantsAttached
bool preferToKeepConstantsAttached(const Instruction &Inst, const Function &Fn) const
Definition: TargetTransformInfoImpl.h:446

llvm::TargetTransformInfoImplBase::getOrCreateResultFromMemIntrinsic
Value * getOrCreateResultFromMemIntrinsic(IntrinsicInst *Inst, Type *ExpectedType) const
Definition: TargetTransformInfoImpl.h:817

llvm::TargetTransformInfoImplBase::getIntrinsicInstrCost
InstructionCost getIntrinsicInstrCost(const IntrinsicCostAttributes &ICA, TTI::TargetCostKind CostKind) const
Definition: TargetTransformInfoImpl.h:714

llvm::TargetTransformInfoImplBase::isVScaleKnownToBeAPowerOfTwo
bool isVScaleKnownToBeAPowerOfTwo() const
Definition: TargetTransformInfoImpl.h:476

llvm::TargetTransformInfoImplBase::isLegalMaskedStore
bool isLegalMaskedStore(Type *DataType, Align Alignment) const
Definition: TargetTransformInfoImpl.h:258

llvm::TargetTransformInfoImplBase::getGatherScatterOpCost
InstructionCost getGatherScatterOpCost(unsigned Opcode, Type *DataTy, const Value *Ptr, bool VariableMask, Align Alignment, TTI::TargetCostKind CostKind, const Instruction *I=nullptr) const
Definition: TargetTransformInfoImpl.h:691

llvm::TargetTransformInfoImplBase::enableWritePrefetching
bool enableWritePrefetching() const
Definition: TargetTransformInfoImpl.h:529

llvm::TargetTransformInfoImplBase::prefersVectorizedAddressing
bool prefersVectorizedAddressing() const
Definition: TargetTransformInfoImpl.h:326

llvm::TargetTransformInfoImplBase::getInlineCallPenalty
unsigned getInlineCallPenalty(const Function *F, const CallBase &Call, unsigned DefaultCallPenalty) const
Definition: TargetTransformInfoImpl.h:850

llvm::TargetTransformInfoImplBase::getVPMemoryOpCost
InstructionCost getVPMemoryOpCost(unsigned Opcode, Type *Src, Align Alignment, unsigned AddressSpace, TTI::TargetCostKind CostKind, const Instruction *I) const
Definition: TargetTransformInfoImpl.h:678

llvm::TargetTransformInfoImplBase::getStridedMemoryOpCost
InstructionCost getStridedMemoryOpCost(unsigned Opcode, Type *DataTy, const Value *Ptr, bool VariableMask, Align Alignment, TTI::TargetCostKind CostKind, const Instruction *I=nullptr) const
Definition: TargetTransformInfoImpl.h:699

llvm::TargetTransformInfoImplBase::supportsEfficientVectorElementLoadStore
bool supportsEfficientVectorElementLoadStore() const
Definition: TargetTransformInfoImpl.h:373

llvm::TargetTransformInfoImplBase::isNoopAddrSpaceCast
bool isNoopAddrSpaceCast(unsigned, unsigned) const
Definition: TargetTransformInfoImpl.h:122

llvm::TargetTransformInfoImplBase::getStoreMinimumVF
unsigned getStoreMinimumVF(unsigned VF, Type *, Type *) const
Definition: TargetTransformInfoImpl.h:488

llvm::TargetTransformInfoImplBase::LSRWithInstrQueries
bool LSRWithInstrQueries() const
Definition: TargetTransformInfoImpl.h:339

llvm::TargetTransformInfoImplBase::getVectorInstrCost
InstructionCost getVectorInstrCost(const Instruction &I, Type *Val, TTI::TargetCostKind CostKind, unsigned Index) const
Definition: TargetTransformInfoImpl.h:658

llvm::TargetTransformInfoImplBase::preferPredicatedReductionSelect
bool preferPredicatedReductionSelect(unsigned Opcode, Type *Ty, TTI::ReductionFlags Flags) const
Definition: TargetTransformInfoImpl.h:913

llvm::TargetTransformInfoImplBase::TargetTransformInfoImplBase
TargetTransformInfoImplBase(TargetTransformInfoImplBase &&Arg)
Definition: TargetTransformInfoImpl.h:45

llvm::TargetTransformInfoImplBase::getVPLegalizationStrategy
TargetTransformInfo::VPLegalization getVPLegalizationStrategy(const VPIntrinsic &PI) const
Definition: TargetTransformInfoImpl.h:938

llvm::TargetTransformInfoImplBase::getUnrollingPreferences
void getUnrollingPreferences(Loop *, ScalarEvolution &, TTI::UnrollingPreferences &, OptimizationRemarkEmitter *) const
Definition: TargetTransformInfoImpl.h:210

llvm::TargetTransformInfoImplBase::supportsTailCalls
bool supportsTailCalls() const
Definition: TargetTransformInfoImpl.h:375

llvm::TargetTransformInfoImplBase::isLegalToVectorizeLoadChain
bool isLegalToVectorizeLoadChain(unsigned ChainSizeInBytes, Align Alignment, unsigned AddrSpace) const
Definition: TargetTransformInfoImpl.h:879

llvm::TargetTransformInfoImplBase::isLegalAddImmediate
bool isLegalAddImmediate(int64_t Imm) const
Definition: TargetTransformInfoImpl.h:217

llvm::TargetTransformInfoImplBase::isLegalAddressingMode
bool isLegalAddressingMode(Type *Ty, GlobalValue *BaseGV, int64_t BaseOffset, bool HasBaseReg, int64_t Scale, unsigned AddrSpace, Instruction *I=nullptr, int64_t ScalableOffset=0) const
Definition: TargetTransformInfoImpl.h:223

llvm::TargetTransformInfoImplBase::isHardwareLoopProfitable
bool isHardwareLoopProfitable(Loop *L, ScalarEvolution &SE, AssumptionCache &AC, TargetLibraryInfo *LibInfo, HardwareLoopInfo &HWLoopInfo) const
Definition: TargetTransformInfoImpl.h:177

llvm::TargetTransformInfoImplBase::minRequiredElementSize
unsigned minRequiredElementSize(const Value *Val, bool &isSigned) const
Definition: TargetTransformInfoImpl.h:951

llvm::TargetTransformInfoImplBase::getMemcpyLoopLoweringType
Type * getMemcpyLoopLoweringType(LLVMContext &Context, Value *Length, unsigned SrcAddrSpace, unsigned DestAddrSpace, unsigned SrcAlign, unsigned DestAlign, std::optional< uint32_t > AtomicElementSize) const
Definition: TargetTransformInfoImpl.h:823

llvm::TargetTransformInfoImplBase::getCacheSize
std::optional< unsigned > getCacheSize(TargetTransformInfo::CacheLevel Level) const
Definition: TargetTransformInfoImpl.h:498

llvm::TargetTransformInfoImplBase::getAssumedAddrSpace
unsigned getAssumedAddrSpace(const Value *V) const
Definition: TargetTransformInfoImpl.h:127

llvm::TargetTransformInfoImplBase::enableScalableVectorization
bool enableScalableVectorization() const
Definition: TargetTransformInfoImpl.h:930

llvm::TargetTransformInfoImplBase::getGISelRematGlobalCost
unsigned getGISelRematGlobalCost() const
Definition: TargetTransformInfoImpl.h:924

llvm::TargetTransformInfoImplBase::isLegalMaskedExpandLoad
bool isLegalMaskedExpandLoad(Type *DataType, Align Alignment) const
Definition: TargetTransformInfoImpl.h:310

llvm::TargetTransformInfoImplBase::isLegalNTStore
bool isLegalNTStore(Type *DataType, Align Alignment) const
Definition: TargetTransformInfoImpl.h:266

llvm::TargetTransformInfoImplBase::getRegisterClassForType
unsigned getRegisterClassForType(bool Vector, Type *Ty=nullptr) const
Definition: TargetTransformInfoImpl.h:453

llvm::TargetTransformInfoImplBase::isLegalMaskedGather
bool isLegalMaskedGather(Type *DataType, Align Alignment) const
Definition: TargetTransformInfoImpl.h:288

llvm::TargetTransformInfoImplBase::adjustInliningThreshold
unsigned adjustInliningThreshold(const CallBase *CB) const
Definition: TargetTransformInfoImpl.h:76

llvm::TargetTransformInfoImplBase::getPredictableBranchThreshold
BranchProbability getPredictableBranchThreshold() const
Definition: TargetTransformInfoImpl.h:97

llvm::TargetTransformInfoImplBase::getMinPageSize
std::optional< unsigned > getMinPageSize() const
Definition: TargetTransformInfoImpl.h:520

llvm::TargetTransformInfoImplBase::collectFlatAddressOperands
bool collectFlatAddressOperands(SmallVectorImpl< int > &OpIndexes, Intrinsic::ID IID) const
Definition: TargetTransformInfoImpl.h:117

llvm::TargetTransformInfoImplBase::getExtendedReductionCost
InstructionCost getExtendedReductionCost(unsigned Opcode, bool IsUnsigned, Type *ResTy, VectorType *Ty, FastMathFlags FMF, TTI::TargetCostKind CostKind) const
Definition: TargetTransformInfoImpl.h:787

llvm::TargetTransformInfoImplBase::allowsMisalignedMemoryAccesses
bool allowsMisalignedMemoryAccesses(LLVMContext &Context, unsigned BitWidth, unsigned AddressSpace, Align Alignment, unsigned *Fast) const
Definition: TargetTransformInfoImpl.h:403

llvm::TargetTransformInfoImplBase::getConstantStrideStep
const SCEVConstant * getConstantStrideStep(ScalarEvolution *SE, const SCEV *Ptr) const
Definition: TargetTransformInfoImpl.h:1009

llvm::TargetTransformInfoImplBase::getMinPrefetchStride
unsigned getMinPrefetchStride(unsigned NumMemAccesses, unsigned NumStridedMemAccesses, unsigned NumPrefetches, bool HasCall) const
Definition: TargetTransformInfoImpl.h:523

llvm::TargetTransformInfoImplBase::getIntImmCostIntrin
InstructionCost getIntImmCostIntrin(Intrinsic::ID IID, unsigned Idx, const APInt &Imm, Type *Ty, TTI::TargetCostKind CostKind) const
Definition: TargetTransformInfoImpl.h:440

llvm::TargetTransformInfoImplBase::getLoadVectorFactor
unsigned getLoadVectorFactor(unsigned VF, unsigned LoadSize, unsigned ChainSizeInBytes, VectorType *VecTy) const
Definition: TargetTransformInfoImpl.h:896

llvm::TargetTransformInfoImplBase::isIndexedLoadLegal
bool isIndexedLoadLegal(TTI::MemIndexedMode Mode, Type *Ty, const DataLayout &DL) const
Definition: TargetTransformInfoImpl.h:863

llvm::TargetTransformInfoImplBase::shouldPrefetchAddressSpace
bool shouldPrefetchAddressSpace(unsigned AS) const
Definition: TargetTransformInfoImpl.h:530

llvm::TargetTransformInfoImplBase::getIntImmCost
InstructionCost getIntImmCost(const APInt &Imm, Type *Ty, TTI::TargetCostKind CostKind) const
Definition: TargetTransformInfoImpl.h:428

llvm::TargetTransformInfoImplBase::getMaxMemIntrinsicInlineSizeThreshold
uint64_t getMaxMemIntrinsicInlineSizeThreshold() const
Definition: TargetTransformInfoImpl.h:87

llvm::TargetTransformInfoImplBase::getReplicationShuffleCost
unsigned getReplicationShuffleCost(Type *EltTy, int ReplicationFactor, int VF, const APInt &DemandedDstElts, TTI::TargetCostKind CostKind)
Definition: TargetTransformInfoImpl.h:664

llvm::TargetTransformInfoImplBase::isSourceOfDivergence
bool isSourceOfDivergence(const Value *V) const
Definition: TargetTransformInfoImpl.h:103

llvm::TargetTransformInfoImplBase::enableAggressiveInterleaving
bool enableAggressiveInterleaving(bool LoopHasReductions) const
Definition: TargetTransformInfoImpl.h:377

llvm::TargetTransformInfoImplBase::getMaxInterleaveFactor
unsigned getMaxInterleaveFactor(ElementCount VF) const
Definition: TargetTransformInfoImpl.h:532

llvm::TargetTransformInfoImplBase::getCastInstrCost
InstructionCost getCastInstrCost(unsigned Opcode, Type *Dst, Type *Src, TTI::CastContextHint CCH, TTI::TargetCostKind CostKind, const Instruction *I) const
Definition: TargetTransformInfoImpl.h:591

llvm::TargetTransformInfoImplBase::getCacheAssociativity
std::optional< unsigned > getCacheAssociativity(TargetTransformInfo::CacheLevel Level) const
Definition: TargetTransformInfoImpl.h:509

llvm::TargetTransformInfoImplBase::hasVolatileVariant
bool hasVolatileVariant(Instruction *I, unsigned AddrSpace) const
Definition: TargetTransformInfoImpl.h:322

llvm::TargetTransformInfoImplBase::getArithmeticInstrCost
InstructionCost getArithmeticInstrCost(unsigned Opcode, Type *Ty, TTI::TargetCostKind CostKind, TTI::OperandValueInfo Opd1Info, TTI::OperandValueInfo Opd2Info, ArrayRef< const Value * > Args, const Instruction *CxtI=nullptr) const
Definition: TargetTransformInfoImpl.h:534

llvm::TargetTransformInfoImplBase::getPreferredAddressingMode
TTI::AddressingModeKind getPreferredAddressingMode(const Loop *L, ScalarEvolution *SE) const
Definition: TargetTransformInfoImpl.h:254

llvm::TargetTransformInfoImplBase::getMaxPrefetchIterationsAhead
unsigned getMaxPrefetchIterationsAhead() const
Definition: TargetTransformInfoImpl.h:528

llvm::TargetTransformInfoImplBase::forceScalarizeMaskedGather
bool forceScalarizeMaskedGather(VectorType *DataType, Align Alignment) const
Definition: TargetTransformInfoImpl.h:292

llvm::TargetTransformInfoImplBase::getTgtMemIntrinsic
bool getTgtMemIntrinsic(IntrinsicInst *Inst, MemIntrinsicInfo &Info) const
Definition: TargetTransformInfoImpl.h:804

llvm::TargetTransformInfoImplBase::getInliningCostBenefitAnalysisSavingsMultiplier
unsigned getInliningCostBenefitAnalysisSavingsMultiplier() const
Definition: TargetTransformInfoImpl.h:72

llvm::TargetTransformInfoImplBase::preferEpilogueVectorization
bool preferEpilogueVectorization() const
Definition: TargetTransformInfoImpl.h:918

llvm::TargetTransformInfoImplBase::canHaveNonUndefGlobalInitializerInAddressSpace
bool canHaveNonUndefGlobalInitializerInAddressSpace(unsigned AS) const
Definition: TargetTransformInfoImpl.h:123

llvm::TargetTransformInfoImplBase::getMulAccReductionCost
InstructionCost getMulAccReductionCost(bool IsUnsigned, Type *ResTy, VectorType *Ty, TTI::TargetCostKind CostKind) const
Definition: TargetTransformInfoImpl.h:794

llvm::TargetTransformInfoImplBase::hasArmWideBranch
bool hasArmWideBranch(bool) const
Definition: TargetTransformInfoImpl.h:944

llvm::TargetTransformInfoImplBase::isIndexedStoreLegal
bool isIndexedStoreLegal(TTI::MemIndexedMode Mode, Type *Ty, const DataLayout &DL) const
Definition: TargetTransformInfoImpl.h:868

llvm::TargetTransformInfoImplBase::hasDivRemOp
bool hasDivRemOp(Type *DataType, bool IsSigned) const
Definition: TargetTransformInfoImpl.h:320

llvm::TargetTransformInfoImplBase::getAddressComputationCost
InstructionCost getAddressComputationCost(Type *Tp, ScalarEvolution *, const SCEV *) const
Definition: TargetTransformInfoImpl.h:770

llvm::TargetTransformInfoImplBase::getInliningThresholdMultiplier
unsigned getInliningThresholdMultiplier() const
Definition: TargetTransformInfoImpl.h:71

llvm::TargetTransformInfoImplBase::isTypeLegal
bool isTypeLegal(Type *Ty) const
Definition: TargetTransformInfoImpl.h:347

llvm::TargetTransformInfoImplBase::getCmpSelInstrCost
InstructionCost getCmpSelInstrCost(unsigned Opcode, Type *ValTy, Type *CondTy, CmpInst::Predicate VecPred, TTI::TargetCostKind CostKind, const Instruction *I) const
Definition: TargetTransformInfoImpl.h:644

llvm::TargetTransformInfoImplBase::isNumRegsMajorCostOfLSR
bool isNumRegsMajorCostOfLSR() const
Definition: TargetTransformInfoImpl.h:239

llvm::TargetTransformInfoImplBase::enableMemCmpExpansion
TTI::MemCmpExpansionOptions enableMemCmpExpansion(bool OptSize, bool IsZeroCmp) const
Definition: TargetTransformInfoImpl.h:381

llvm::TargetTransformInfoImplBase::preferInLoopReduction
bool preferInLoopReduction(unsigned Opcode, Type *Ty, TTI::ReductionFlags Flags) const
Definition: TargetTransformInfoImpl.h:908

llvm::TargetTransformInfoImplBase::getOperandsScalarizationOverhead
InstructionCost getOperandsScalarizationOverhead(ArrayRef< const Value * > Args, ArrayRef< Type * > Tys, TTI::TargetCostKind CostKind) const
Definition: TargetTransformInfoImpl.h:367

llvm::TargetTransformInfoImplBase::shouldBuildLookupTables
bool shouldBuildLookupTables() const
Definition: TargetTransformInfoImpl.h:351

llvm::TargetTransformInfoImplBase::getRegisterBitWidth
TypeSize getRegisterBitWidth(TargetTransformInfo::RegisterKind K) const
Definition: TargetTransformInfoImpl.h:468

llvm::TargetTransformInfoImplBase::TTI
TargetTransformInfo TTI
Definition: TargetTransformInfoImpl.h:36

llvm::TargetTransformInfoImplBase::isConstantStridedAccessLessThan
bool isConstantStridedAccessLessThan(ScalarEvolution *SE, const SCEV *Ptr, int64_t MergeDistance) const
Definition: TargetTransformInfoImpl.h:1017

llvm::TargetTransformInfoImplBase::getMaskedMemoryOpCost
InstructionCost getMaskedMemoryOpCost(unsigned Opcode, Type *Src, Align Alignment, unsigned AddressSpace, TTI::TargetCostKind CostKind) const
Definition: TargetTransformInfoImpl.h:685

llvm::TargetTransformInfoImplBase::isLoweredToCall
bool isLoweredToCall(const Function *F) const
Definition: TargetTransformInfoImpl.h:141

llvm::TargetTransformInfoImplBase::hasBranchDivergence
bool hasBranchDivergence(const Function *F=nullptr) const
Definition: TargetTransformInfoImpl.h:101

llvm::TargetTransformInfoImplBase::TargetTransformInfoImplBase
TargetTransformInfoImplBase(const DataLayout &DL)
Definition: TargetTransformInfoImpl.h:40

llvm::TargetTransformInfoImplBase::shouldFoldTerminatingConditionAfterLSR
bool shouldFoldTerminatingConditionAfterLSR() const
Definition: TargetTransformInfoImpl.h:241

llvm::TargetTransformInfoImplBase::getMinVectorRegisterBitWidth
unsigned getMinVectorRegisterBitWidth() const
Definition: TargetTransformInfoImpl.h:472

llvm::TargetTransformInfoImplBase::getRegisterClassName
const char * getRegisterClassName(unsigned ClassID) const
Definition: TargetTransformInfoImpl.h:457

llvm::TargetTransformInfoImplBase::isElementTypeLegalForScalableVector
bool isElementTypeLegalForScalableVector(Type *Ty) const
Definition: TargetTransformInfoImpl.h:894

llvm::TargetTransformInfoImplBase::preferPredicateOverEpilogue
bool preferPredicateOverEpilogue(TailFoldingInfo *TFI) const
Definition: TargetTransformInfoImpl.h:183

llvm::TargetTransformInfoImplBase::isLegalToVectorizeReduction
bool isLegalToVectorizeReduction(const RecurrenceDescriptor &RdxDesc, ElementCount VF) const
Definition: TargetTransformInfoImpl.h:889

llvm::TargetTransformInfoImplBase::getScalarizationOverhead
InstructionCost getScalarizationOverhead(VectorType *Ty, const APInt &DemandedElts, bool Insert, bool Extract, TTI::TargetCostKind CostKind) const
Definition: TargetTransformInfoImpl.h:359

llvm::TargetTransformInfoImplBase::getMaximumVF
unsigned getMaximumVF(unsigned ElemWidth, unsigned Opcode) const
Definition: TargetTransformInfoImpl.h:487

llvm::TargetTransformInfoImplBase::getPreferredTailFoldingStyle
TailFoldingStyle getPreferredTailFoldingStyle(bool IVUpdateMayOverflow=true) const
Definition: TargetTransformInfoImpl.h:186

llvm::TargetTransformInfoImplBase::getCFInstrCost
InstructionCost getCFInstrCost(unsigned Opcode, TTI::TargetCostKind CostKind, const Instruction *I=nullptr) const
Definition: TargetTransformInfoImpl.h:635

llvm::TargetTransformInfoImplBase::getCostOfKeepingLiveOverCall
InstructionCost getCostOfKeepingLiveOverCall(ArrayRef< Type * > Tys) const
Definition: TargetTransformInfoImpl.h:800

llvm::TargetTransformInfoImplBase::shouldBuildRelLookupTables
bool shouldBuildRelLookupTables() const
Definition: TargetTransformInfoImpl.h:355

llvm::TargetTransformInfoImplBase::getMinMaxReductionCost
InstructionCost getMinMaxReductionCost(Intrinsic::ID IID, VectorType *, FastMathFlags, TTI::TargetCostKind) const
Definition: TargetTransformInfoImpl.h:781

llvm::TargetTransformInfoImplBase::getVectorInstrCost
InstructionCost getVectorInstrCost(unsigned Opcode, Type *Val, TTI::TargetCostKind CostKind, unsigned Index, Value *Op0, Value *Op1) const
Definition: TargetTransformInfoImpl.h:651

llvm::TargetTransformInfoImplBase::getLoadStoreVecRegBitWidth
unsigned getLoadStoreVecRegBitWidth(unsigned AddrSpace) const
Definition: TargetTransformInfoImpl.h:873

llvm::TargetTransformInfoImplBase::getMemoryOpCost
InstructionCost getMemoryOpCost(unsigned Opcode, Type *Src, Align Alignment, unsigned AddressSpace, TTI::TargetCostKind CostKind, TTI::OperandValueInfo OpInfo, const Instruction *I) const
Definition: TargetTransformInfoImpl.h:670

llvm::TargetTransformInfoImplBase::useColdCCForColdCall
bool useColdCCForColdCall(Function &F) const
Definition: TargetTransformInfoImpl.h:357

llvm::TargetTransformInfoImplBase::enableSelectOptimize
bool enableSelectOptimize() const
Definition: TargetTransformInfoImpl.h:386

llvm::TargetTransformInfoImplBase::shouldExpandReduction
bool shouldExpandReduction(const IntrinsicInst *II) const
Definition: TargetTransformInfoImpl.h:922

llvm::TargetTransformInfoImplBase::isLegalMaskedScatter
bool isLegalMaskedScatter(Type *DataType, Align Alignment) const
Definition: TargetTransformInfoImpl.h:284

llvm::TargetTransformInfoImplBase::getNumberOfRegisters
unsigned getNumberOfRegisters(unsigned ClassID) const
Definition: TargetTransformInfoImpl.h:451

llvm::TargetTransformInfoImplBase::getExtractWithExtendCost
InstructionCost getExtractWithExtendCost(unsigned Opcode, Type *Dst, VectorType *VecTy, unsigned Index) const
Definition: TargetTransformInfoImpl.h:629

llvm::TargetTransformInfoImplBase::supportsScalableVectors
bool supportsScalableVectors() const
Definition: TargetTransformInfoImpl.h:928

llvm::TargetTransformInfoImplBase::getGEPCost
InstructionCost getGEPCost(Type *PointeeType, const Value *Ptr, ArrayRef< const Value * > Operands, Type *AccessType, TTI::TargetCostKind CostKind) const
Definition: TargetTransformInfoImpl.h:49

llvm::TargetTransformInfoImplBase::isLegalNTLoad
bool isLegalNTLoad(Type *DataType, Align Alignment) const
Definition: TargetTransformInfoImpl.h:273

llvm::TargetTransformInfoImplBase::isFCmpOrdCheaperThanFCmpZero
bool isFCmpOrdCheaperThanFCmpZero(Type *Ty) const
Definition: TargetTransformInfoImpl.h:417

llvm::TargetTransformInfoImplBase::simplifyDemandedUseBitsIntrinsic
std::optional< Value * > simplifyDemandedUseBitsIntrinsic(InstCombiner &IC, IntrinsicInst &II, APInt DemandedMask, KnownBits &Known, bool &KnownBitsComputed) const
Definition: TargetTransformInfoImpl.h:196

llvm::TargetTransformInfoImplBase::forceScalarizeMaskedScatter
bool forceScalarizeMaskedScatter(VectorType *DataType, Align Alignment) const
Definition: TargetTransformInfoImpl.h:296

llvm::TargetTransformInfoImplBase::hasActiveVectorLength
bool hasActiveVectorLength(unsigned Opcode, Type *DataType, Align Alignment) const
Definition: TargetTransformInfoImpl.h:932

llvm::TargetTransformInfoImplBase::isLegalAltInstr
bool isLegalAltInstr(VectorType *VecTy, unsigned Opcode0, unsigned Opcode1, const SmallBitVector &OpcodeMask) const
Definition: TargetTransformInfoImpl.h:305

llvm::TargetTransformInfoImplBase::isLegalMaskedLoad
bool isLegalMaskedLoad(Type *DataType, Align Alignment) const
Definition: TargetTransformInfoImpl.h:262

llvm::TargetTransformInfoImplBase::DL
const DataLayout & DL
Definition: TargetTransformInfoImpl.h:38

llvm::TargetTransformInfoImplBase::isValidAddrSpaceCast
bool isValidAddrSpaceCast(unsigned FromAS, unsigned ToAS) const
Definition: TargetTransformInfoImpl.h:107

llvm::TargetTransformInfoImplBase::instCombineIntrinsic
std::optional< Instruction * > instCombineIntrinsic(InstCombiner &IC, IntrinsicInst &II) const
Definition: TargetTransformInfoImpl.h:190

llvm::TargetTransformInfoImplBase::getInlinerVectorBonusPercent
int getInlinerVectorBonusPercent() const
Definition: TargetTransformInfoImpl.h:81

llvm::TargetTransformInfoImplBase::getScalingFactorCost
InstructionCost getScalingFactorCost(Type *Ty, GlobalValue *BaseGV, int64_t BaseOffset, bool HasBaseReg, int64_t Scale, unsigned AddrSpace) const
Definition: TargetTransformInfoImpl.h:328

llvm::TargetTransformInfoImplBase::getPrefetchDistance
unsigned getPrefetchDistance() const
Definition: TargetTransformInfoImpl.h:522

llvm::TargetTransformInfoImplBase::isLegalAddScalableImmediate
bool isLegalAddScalableImmediate(int64_t Imm) const
Definition: TargetTransformInfoImpl.h:219

llvm::TargetTransformInfoImplBase::isLegalMaskedCompressStore
bool isLegalMaskedCompressStore(Type *DataType, Align Alignment) const
Definition: TargetTransformInfoImpl.h:301

llvm::TargetTransformInfoImplBase::getAltInstrCost
InstructionCost getAltInstrCost(VectorType *VecTy, unsigned Opcode0, unsigned Opcode1, const SmallBitVector &OpcodeMask, TTI::TargetCostKind CostKind) const
Definition: TargetTransformInfoImpl.h:575

llvm::TargetTransformInfoImplBase::canMacroFuseCmp
bool canMacroFuseCmp() const
Definition: TargetTransformInfoImpl.h:245

llvm::TargetTransformInfoImplBase::TargetTransformInfoImplBase
TargetTransformInfoImplBase(const TargetTransformInfoImplBase &Arg)=default

llvm::TargetTransformInfoImplBase::enableMaskedInterleavedAccessVectorization
bool enableMaskedInterleavedAccessVectorization() const
Definition: TargetTransformInfoImpl.h:399

llvm::TargetTransformInfoImplBase::isLegalToVectorizeStoreChain
bool isLegalToVectorizeStoreChain(unsigned ChainSizeInBytes, Align Alignment, unsigned AddrSpace) const
Definition: TargetTransformInfoImpl.h:884

llvm::TargetTransformInfoImplBase::getMinimumVF
ElementCount getMinimumVF(unsigned ElemWidth, bool IsScalable) const
Definition: TargetTransformInfoImpl.h:483

llvm::TargetTransformInfoImplBase::shouldBuildLookupTablesForConstant
bool shouldBuildLookupTablesForConstant(Constant *C) const
Definition: TargetTransformInfoImpl.h:353

llvm::TargetTransformInfoImplBase::rewriteIntrinsicWithAddressSpace
Value * rewriteIntrinsicWithAddressSpace(IntrinsicInst *II, Value *OldV, Value *NewV) const
Definition: TargetTransformInfoImpl.h:136

llvm::TargetTransformInfoImplCRTPBase
CRTP base class for use as a mix-in that aids implementing a TargetTransformInfo-compatible class.
Definition: TargetTransformInfoImpl.h:1033

llvm::TargetTransformInfoImplCRTPBase::TargetTransformInfoImplCRTPBase
TargetTransformInfoImplCRTPBase(const DataLayout &DL)
Definition: TargetTransformInfoImpl.h:1038

llvm::TargetTransformInfoImplCRTPBase::supportsTailCallFor
bool supportsTailCallFor(const CallBase *CB) const
Definition: TargetTransformInfoImpl.h:1462

llvm::TargetTransformInfoImplCRTPBase::getGEPCost
InstructionCost getGEPCost(Type *PointeeType, const Value *Ptr, ArrayRef< const Value * > Operands, Type *AccessType, TTI::TargetCostKind CostKind)
Definition: TargetTransformInfoImpl.h:1043

llvm::TargetTransformInfoImplCRTPBase::getPointersChainCost
InstructionCost getPointersChainCost(ArrayRef< const Value * > Ptrs, const Value *Base, const TTI::PointersChainInfo &Info, Type *AccessTy, TTI::TargetCostKind CostKind)
Definition: TargetTransformInfoImpl.h:1121

llvm::TargetTransformInfoImplCRTPBase::getInstructionCost
InstructionCost getInstructionCost(const User *U, ArrayRef< const Value * > Operands, TTI::TargetCostKind CostKind)
Definition: TargetTransformInfoImpl.h:1158

llvm::TargetTransformInfoImplCRTPBase::isExpensiveToSpeculativelyExecute
bool isExpensiveToSpeculativelyExecute(const Instruction *I)
Definition: TargetTransformInfoImpl.h:1454

llvm::TargetTransformInfo
This pass provides access to the codegen interfaces that are needed for IR-level transformations.
Definition: TargetTransformInfo.h:213

llvm::TargetTransformInfo::getCastContextHint
static CastContextHint getCastContextHint(const Instruction *I)
Calculates a CastContextHint from I.
Definition: TargetTransformInfo.cpp:927

llvm::TargetTransformInfo::getOperandInfo
static OperandValueInfo getOperandInfo(const Value *V)
Collect properties of V used in cost analysis, e.g. OP_PowerOf2.
Definition: TargetTransformInfo.cpp:820

llvm::TargetTransformInfo::TargetCostKind
TargetCostKind
The kind of cost model.
Definition: TargetTransformInfo.h:258

llvm::TargetTransformInfo::TCK_RecipThroughput
@ TCK_RecipThroughput
Reciprocal throughput.
Definition: TargetTransformInfo.h:259

llvm::TargetTransformInfo::TCK_CodeSize
@ TCK_CodeSize
Instruction code size.
Definition: TargetTransformInfo.h:261

llvm::TargetTransformInfo::TCK_SizeAndLatency
@ TCK_SizeAndLatency
The weighted sum of size and latency.
Definition: TargetTransformInfo.h:262

llvm::TargetTransformInfo::TCK_Latency
@ TCK_Latency
The latency of instruction.
Definition: TargetTransformInfo.h:260

llvm::TargetTransformInfo::OP_None
@ OP_None
Definition: TargetTransformInfo.h:1076

llvm::TargetTransformInfo::RegisterKind
RegisterKind
Definition: TargetTransformInfo.h:1125

llvm::TargetTransformInfo::PopcntSupportKind
PopcntSupportKind
Flags indicating the kind of support for population count.
Definition: TargetTransformInfo.h:695

llvm::TargetTransformInfo::PSK_Software
@ PSK_Software
Definition: TargetTransformInfo.h:695

llvm::TargetTransformInfo::TCC_Expensive
@ TCC_Expensive
The cost of a 'div' instruction on x86.
Definition: TargetTransformInfo.h:286

llvm::TargetTransformInfo::TCC_Free
@ TCC_Free
Expected to fold away in lowering.
Definition: TargetTransformInfo.h:284

llvm::TargetTransformInfo::TCC_Basic
@ TCC_Basic
The cost of a typical 'add' instruction.
Definition: TargetTransformInfo.h:285

llvm::TargetTransformInfo::MemIndexedMode
MemIndexedMode
The type of load/store indexing.
Definition: TargetTransformInfo.h:1609

llvm::TargetTransformInfo::AddressingModeKind
AddressingModeKind
Definition: TargetTransformInfo.h:757

llvm::TargetTransformInfo::AMK_None
@ AMK_None
Definition: TargetTransformInfo.h:760

llvm::TargetTransformInfo::ShuffleKind
ShuffleKind
The various kinds of shuffle patterns for vector queries.
Definition: TargetTransformInfo.h:1047

llvm::TargetTransformInfo::SK_InsertSubvector
@ SK_InsertSubvector
InsertSubvector. Index indicates start offset.
Definition: TargetTransformInfo.h:1054

llvm::TargetTransformInfo::SK_Select
@ SK_Select
Selects elements from the corresponding lane of either source operand.
Definition: TargetTransformInfo.h:1050

llvm::TargetTransformInfo::SK_PermuteSingleSrc
@ SK_PermuteSingleSrc
Shuffle elements of single source vector with any shuffle mask.
Definition: TargetTransformInfo.h:1058

llvm::TargetTransformInfo::SK_Transpose
@ SK_Transpose
Transpose two vectors.
Definition: TargetTransformInfo.h:1053

llvm::TargetTransformInfo::SK_Splice
@ SK_Splice
Concatenates elements from the first input vector with elements of the second input vector.
Definition: TargetTransformInfo.h:1060

llvm::TargetTransformInfo::SK_Broadcast
@ SK_Broadcast
Broadcast element 0 to all other elements.
Definition: TargetTransformInfo.h:1048

llvm::TargetTransformInfo::SK_PermuteTwoSrc
@ SK_PermuteTwoSrc
Merge elements from two source vectors into one with any shuffle mask.
Definition: TargetTransformInfo.h:1056

llvm::TargetTransformInfo::SK_Reverse
@ SK_Reverse
Reverse the order of the vector.
Definition: TargetTransformInfo.h:1049

llvm::TargetTransformInfo::SK_ExtractSubvector
@ SK_ExtractSubvector
ExtractSubvector. Index indicates start offset.
Definition: TargetTransformInfo.h:1055

llvm::TargetTransformInfo::CastContextHint
CastContextHint
Represents a hint about the context in which a cast is used.
Definition: TargetTransformInfo.h:1320

llvm::TargetTransformInfo::OK_AnyValue
@ OK_AnyValue
Definition: TargetTransformInfo.h:1068

llvm::TargetTransformInfo::CacheLevel
CacheLevel
The possible cache levels.
Definition: TargetTransformInfo.h:1184

llvm::TargetTransformInfo::CacheLevel::L1D
@ L1D

llvm::TargetTransformInfo::CacheLevel::L2D
@ L2D

llvm::TruncInst
This class represents a truncation of integer types.
Definition: Instructions.h:5349

llvm::TypeSize
Definition: TypeSize.h:319

llvm::TypeSize::getFixed
static constexpr TypeSize getFixed(ScalarTy ExactSize)
Definition: TypeSize.h:330

llvm::Type
The instances of the Type class are immutable: once they are created, they are never changed.
Definition: Type.h:45

llvm::Type::isVectorTy
bool isVectorTy() const
True if this is an instance of VectorType.
Definition: Type.h:265

llvm::Type::getPointerAddressSpace
unsigned getPointerAddressSpace() const
Get the address space of this pointer or pointer vector type.

llvm::Type::getIntNTy
static IntegerType * getIntNTy(LLVMContext &C, unsigned N)

llvm::Type::getScalarSizeInBits
unsigned getScalarSizeInBits() const LLVM_READONLY
If this is a vector type, return the getPrimitiveSizeInBits value for the element type.

llvm::Type::getInt8Ty
static IntegerType * getInt8Ty(LLVMContext &C)

llvm::Type::isFloatingPointTy
bool isFloatingPointTy() const
Return true if this is one of the floating-point types.
Definition: Type.h:185

llvm::Type::isScalableTy
bool isScalableTy() const
Return true if this is a type whose size is a known multiple of vscale.

llvm::Type::getScalarType
Type * getScalarType() const
If this is a vector type, return the element type, otherwise return 'this'.
Definition: Type.h:348

llvm::User
Definition: User.h:44

llvm::VPIntrinsic
This is the common base class for vector predication intrinsics.
Definition: IntrinsicInst.h:555

llvm::Value
LLVM Value Representation.
Definition: Value.h:74

llvm::Value::getType
Type * getType() const
All values are typed, get the type of this value.
Definition: Value.h:255

llvm::VectorType
Base class of all SIMD vector types.
Definition: DerivedTypes.h:403

llvm::details::FixedOrScalableQuantity::getFixedValue
constexpr ScalarTy getFixedValue() const
Definition: TypeSize.h:187

llvm::details::FixedOrScalableQuantity::isScalable
constexpr bool isScalable() const
Returns whether the quantity is scaled by a runtime quantity (vscale).
Definition: TypeSize.h:171

uint64_t

unsigned

llvm_unreachable
#define llvm_unreachable(msg)
Marks that the current location is not supposed to be reachable.
Definition: ErrorHandling.h:143

llvm::CallingConv::Fast
@ Fast
Attempts to make calls as fast as possible (e.g. by passing things in registers).
Definition: CallingConv.h:41

llvm::CallingConv::C
@ C
The default llvm calling convention, compatible with C.
Definition: CallingConv.h:34

llvm::PatternMatch
Definition: PatternMatch.h:47

llvm::PatternMatch::match
bool match(Val *V, const Pattern &P)
Definition: PatternMatch.h:49

llvm::PatternMatch::m_LogicalOr
auto m_LogicalOr()
Matches L || R where L and R are arbitrary values.
Definition: PatternMatch.h:2867

llvm::PatternMatch::m_Value
class_match< Value > m_Value()
Match an arbitrary value and ignore it.
Definition: PatternMatch.h:92

llvm::PatternMatch::m_LogicalAnd
auto m_LogicalAnd()
Matches L && R where L and R are arbitrary values.
Definition: PatternMatch.h:2849

llvm::PatternMatch::m_CombineOr
match_combine_or< LTy, RTy > m_CombineOr(const LTy &L, const RTy &R)
Combine two pattern matchers matching L || R.
Definition: PatternMatch.h:239

llvm::codeview::PublicSymFlags::Function
@ Function

llvm::dwarf::Index
Index
Definition: Dwarf.h:872

llvm::sampleprof::Base
@ Base
Definition: Discriminator.h:58

llvm
This is an optimization pass for GlobalISel generic memory operations.
Definition: AddressRanges.h:18

llvm::Length
@ Length
Definition: DWP.cpp:456

llvm::enumerate
auto enumerate(FirstRange &&First, RestRanges &&...Rest)
Given two or more input ranges, returns a new range whose values are tuples (A,...
Definition: STLExtras.h:2406

llvm::AddressSpace
AddressSpace
Definition: NVPTXBaseInfo.h:21

llvm::getSplatValue
Value * getSplatValue(const Value *V)
Get splat value if the input is a splat vector or return nullptr.
Definition: VectorUtils.cpp:250

llvm::any_of
bool any_of(R &&range, UnaryPredicate P)
Provide wrappers to std::any_of which take ranges instead of having to pass begin/end explicitly.
Definition: STLExtras.h:1729

llvm::isPowerOf2_32
constexpr bool isPowerOf2_32(uint32_t Value)
Return true if the argument is a power of two > 0.
Definition: MathExtras.h:275

llvm::ComplexDeinterleavingOperation::Splat
@ Splat

llvm::PoisonMaskElem
constexpr int PoisonMaskElem
Definition: Instructions.h:2159

llvm::BitWidth
constexpr unsigned BitWidth
Definition: BitmaskEnum.h:191

llvm::gep_type_begin
gep_type_iterator gep_type_begin(const User *GEP)
Definition: GetElementPtrTypeIterator.h:173

llvm::Cost
InstructionCost Cost
Definition: FunctionSpecialization.h:95

llvm::TailFoldingStyle
TailFoldingStyle
Definition: TargetTransformInfo.h:166

llvm::TailFoldingStyle::DataWithoutLaneMask
@ DataWithoutLaneMask
Same as Data, but avoids using the get.active.lane.mask intrinsic to calculate the mask and instead implements this with a splat/stepvector/cmp.

llvm::VFParamKind::Vector
@ Vector

llvm::Align
This struct is a compact representation of a valid (non-zero power of two) alignment.
Definition: Alignment.h:39

llvm::HardwareLoopInfo
Attributes of a target dependent hardware loop.
Definition: TargetTransformInfo.h:97

llvm::KnownBits
Definition: KnownBits.h:23

llvm::MemIntrinsicInfo
Information about a load/store intrinsic defined by the target.
Definition: TargetTransformInfo.h:72

llvm::OptimizedStructLayoutField
A field in a structure.
Definition: OptimizedStructLayout.h:45

llvm::TailFoldingInfo
Definition: TargetTransformInfo.h:199

llvm::TargetTransformInfo::LSRCost
Definition: TargetTransformInfo.h:510

llvm::TargetTransformInfo::LSRCost::NumIVMuls
unsigned NumIVMuls
Definition: TargetTransformInfo.h:516

llvm::TargetTransformInfo::LSRCost::ScaleCost
unsigned ScaleCost
Definition: TargetTransformInfo.h:520

llvm::TargetTransformInfo::LSRCost::ImmCost
unsigned ImmCost
Definition: TargetTransformInfo.h:518

llvm::TargetTransformInfo::LSRCost::AddRecCost
unsigned AddRecCost
Definition: TargetTransformInfo.h:515

llvm::TargetTransformInfo::LSRCost::NumRegs
unsigned NumRegs
Definition: TargetTransformInfo.h:514

llvm::TargetTransformInfo::LSRCost::NumBaseAdds
unsigned NumBaseAdds
Definition: TargetTransformInfo.h:517

llvm::TargetTransformInfo::LSRCost::SetupCost
unsigned SetupCost
Definition: TargetTransformInfo.h:519

llvm::TargetTransformInfo::MemCmpExpansionOptions
Returns options for expansion of memcmp. IsZeroCmp is true if this is the expansion of memcmp(p1, p2, s) == 0.
Definition: TargetTransformInfo.h:911

llvm::TargetTransformInfo::OperandValueInfo
Definition: TargetTransformInfo.h:1084

llvm::TargetTransformInfo::PeelingPreferences
Definition: TargetTransformInfo.h:639

llvm::TargetTransformInfo::PointersChainInfo
Describe known properties for a set of pointers.
Definition: TargetTransformInfo.h:306

llvm::TargetTransformInfo::ReductionFlags
Flags describing the kind of vector reduction.
Definition: TargetTransformInfo.h:1661

llvm::TargetTransformInfo::UnrollingPreferences
Parameters that control the generic loop unrolling transformation.
Definition: TargetTransformInfo.h:524

llvm::TargetTransformInfo::VPLegalization
Definition: TargetTransformInfo.h:1719

llvm::TargetTransformInfo::VPLegalization::Convert
@ Convert
Definition: TargetTransformInfo.h:1726

llvm::TargetTransformInfo::VPLegalization::Discard
@ Discard
Definition: TargetTransformInfo.h:1724