//===-- WebAssemblyTargetTransformInfo.cpp - WebAssembly-specific TTI -----===//
//
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
// See https://llvm.org/LICENSE.txt for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
//
//===----------------------------------------------------------------------===//
///
/// \file
/// This file defines the WebAssembly-specific TargetTransformInfo
/// implementation.
///
//===----------------------------------------------------------------------===//

#include "WebAssemblyTargetTransformInfo.h"

#include "llvm/CodeGen/CostTable.h"
#include "llvm/IR/IntrinsicsWebAssembly.h"
#include "llvm/IR/PatternMatch.h"
#include "llvm/Support/Debug.h"
#include "llvm/Transforms/InstCombine/InstCombiner.h"

using namespace llvm;

#define DEBUG_TYPE "wasmtti"

TTI::PopcntSupportKind
WebAssemblyTTIImpl::getPopcntSupport(unsigned TyWidth) const {
  assert(isPowerOf2_32(TyWidth) && "Ty width must be power of 2");
  return TargetTransformInfo::PSK_FastHardware;
}

unsigned WebAssemblyTTIImpl::getNumberOfRegisters(unsigned ClassID) const {
  unsigned Result = BaseT::getNumberOfRegisters(ClassID);

  // For SIMD, use at least 16 registers, as a rough guess.
  bool Vector = (ClassID == 1);
  if (Vector)
    Result = std::max(Result, 16u);

  return Result;
}

TypeSize WebAssemblyTTIImpl::getRegisterBitWidth(
    TargetTransformInfo::RegisterKind K) const {
  switch (K) {
  case TargetTransformInfo::RGK_Scalar:
    return TypeSize::getFixed(64);
  case TargetTransformInfo::RGK_FixedWidthVector:
    return TypeSize::getFixed(getST()->hasSIMD128() ? 128 : 64);
  case TargetTransformInfo::RGK_ScalableVector:
    return TypeSize::getScalable(0);
  }

  llvm_unreachable("Unsupported register kind");
}

InstructionCost WebAssemblyTTIImpl::getArithmeticInstrCost(
    unsigned Opcode, Type *Ty, TTI::TargetCostKind CostKind,
    TTI::OperandValueInfo Op1Info, TTI::OperandValueInfo Op2Info,
    ArrayRef<const Value *> Args, const Instruction *CxtI) const {

  InstructionCost Cost =
      BasicTTIImplBase<WebAssemblyTTIImpl>::getArithmeticInstrCost(
          Opcode, Ty, CostKind, Op1Info, Op2Info);

  if (auto *VTy = dyn_cast<VectorType>(Ty)) {
    switch (Opcode) {
    case Instruction::LShr:
    case Instruction::AShr:
    case Instruction::Shl:
      // SIMD128's shifts currently only accept a scalar shift count. For each
      // element, we'll need to extract, op, insert. The following is a rough
      // approximation.
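      // (Illustrative example: a non-uniform shift of a <4 x i32> is costed
      // below as 4 * (extract + scalar shift + insert).)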
      if (!Op2Info.isUniform())
        Cost =
            cast<FixedVectorType>(VTy)->getNumElements() *
            (TargetTransformInfo::TCC_Basic +
             getArithmeticInstrCost(Opcode, VTy->getElementType(), CostKind) +
             TargetTransformInfo::TCC_Basic);
      break;
    }
  }
  return Cost;
}

InstructionCost WebAssemblyTTIImpl::getCastInstrCost(
    unsigned Opcode, Type *Dst, Type *Src, TTI::CastContextHint CCH,
    TTI::TargetCostKind CostKind, const Instruction *I) const {
  int ISD = TLI->InstructionOpcodeToISD(Opcode);
  auto SrcTy = TLI->getValueType(DL, Src);
  auto DstTy = TLI->getValueType(DL, Dst);

  if (!SrcTy.isSimple() || !DstTy.isSimple()) {
    return BaseT::getCastInstrCost(Opcode, Dst, Src, CCH, CostKind, I);
  }

  if (!ST->hasSIMD128()) {
    return BaseT::getCastInstrCost(Opcode, Dst, Src, CCH, CostKind, I);
  }

  auto DstVT = DstTy.getSimpleVT();
  auto SrcVT = SrcTy.getSimpleVT();

  if (I && I->hasOneUser()) {
    auto *SingleUser = cast<Instruction>(*I->user_begin());
    int UserISD = TLI->InstructionOpcodeToISD(SingleUser->getOpcode());

    // extmul_low support
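    // (For example, a sign-extend from <8 x i8> to <8 x i16> whose only use
    // is a multiply can select to i16x8.extmul_low_i8x16_s, so the extension
    // itself adds no cost.)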
    if (UserISD == ISD::MUL &&
        (ISD == ISD::SIGN_EXTEND || ISD == ISD::ZERO_EXTEND)) {
      // Free low extensions.
      if ((SrcVT == MVT::v8i8 && DstVT == MVT::v8i16) ||
          (SrcVT == MVT::v4i16 && DstVT == MVT::v4i32) ||
          (SrcVT == MVT::v2i32 && DstVT == MVT::v2i64)) {
        return 0;
      }
      // Will require an additional extlow operation for the intermediate
      // i16/i32 value.
      if ((SrcVT == MVT::v4i8 && DstVT == MVT::v4i32) ||
          (SrcVT == MVT::v2i16 && DstVT == MVT::v2i64)) {
        return 1;
      }
    }
  }

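  // Each entry below is {ISD opcode, destination MVT, source MVT, cost}; the
  // cost roughly counts the SIMD instructions in the expected lowering, as
  // hinted by the per-group comments.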
  static constexpr TypeConversionCostTblEntry ConversionTbl[] = {
      // extend_low
      {ISD::SIGN_EXTEND, MVT::v2i64, MVT::v2i32, 1},
      {ISD::ZERO_EXTEND, MVT::v2i64, MVT::v2i32, 1},
      {ISD::SIGN_EXTEND, MVT::v4i32, MVT::v4i16, 1},
      {ISD::ZERO_EXTEND, MVT::v4i32, MVT::v4i16, 1},
      {ISD::SIGN_EXTEND, MVT::v8i16, MVT::v8i8, 1},
      {ISD::ZERO_EXTEND, MVT::v8i16, MVT::v8i8, 1},
      // 2 x extend_low
      {ISD::SIGN_EXTEND, MVT::v2i64, MVT::v2i16, 2},
      {ISD::ZERO_EXTEND, MVT::v2i64, MVT::v2i16, 2},
      {ISD::SIGN_EXTEND, MVT::v4i32, MVT::v4i8, 2},
      {ISD::ZERO_EXTEND, MVT::v4i32, MVT::v4i8, 2},
      // extend_low, extend_high
      {ISD::SIGN_EXTEND, MVT::v4i64, MVT::v4i32, 2},
      {ISD::ZERO_EXTEND, MVT::v4i64, MVT::v4i32, 2},
      {ISD::SIGN_EXTEND, MVT::v8i32, MVT::v8i16, 2},
      {ISD::ZERO_EXTEND, MVT::v8i32, MVT::v8i16, 2},
      {ISD::SIGN_EXTEND, MVT::v16i16, MVT::v16i8, 2},
      {ISD::ZERO_EXTEND, MVT::v16i16, MVT::v16i8, 2},
      // 2x extend_low, extend_high
      {ISD::SIGN_EXTEND, MVT::v8i64, MVT::v8i32, 4},
      {ISD::ZERO_EXTEND, MVT::v8i64, MVT::v8i32, 4},
      {ISD::SIGN_EXTEND, MVT::v16i32, MVT::v16i16, 4},
      {ISD::ZERO_EXTEND, MVT::v16i32, MVT::v16i16, 4},
      // shuffle
      {ISD::TRUNCATE, MVT::v2i16, MVT::v2i32, 2},
      {ISD::TRUNCATE, MVT::v2i8, MVT::v2i32, 4},
      {ISD::TRUNCATE, MVT::v4i16, MVT::v4i32, 2},
      {ISD::TRUNCATE, MVT::v4i8, MVT::v4i32, 4},
      // narrow, and
      {ISD::TRUNCATE, MVT::v8i16, MVT::v8i32, 2},
      {ISD::TRUNCATE, MVT::v8i8, MVT::v8i16, 2},
      // narrow, 2x and
      {ISD::TRUNCATE, MVT::v16i8, MVT::v16i16, 3},
      // 3x narrow, 4x and
      {ISD::TRUNCATE, MVT::v8i16, MVT::v8i64, 7},
      {ISD::TRUNCATE, MVT::v16i8, MVT::v16i32, 7},
      // 7x narrow, 8x and
      {ISD::TRUNCATE, MVT::v16i8, MVT::v16i64, 15},
      // convert_i32x4
      {ISD::SINT_TO_FP, MVT::v2f32, MVT::v2i32, 1},
      {ISD::UINT_TO_FP, MVT::v2f32, MVT::v2i32, 1},
      {ISD::SINT_TO_FP, MVT::v4f32, MVT::v4i32, 1},
      {ISD::UINT_TO_FP, MVT::v4f32, MVT::v4i32, 1},
      // extend_low, convert
      {ISD::SINT_TO_FP, MVT::v2f32, MVT::v2i16, 2},
      {ISD::UINT_TO_FP, MVT::v2f32, MVT::v2i16, 2},
      {ISD::SINT_TO_FP, MVT::v4f32, MVT::v4i16, 2},
      {ISD::UINT_TO_FP, MVT::v4f32, MVT::v4i16, 2},
      // extend_low x 2, convert
      {ISD::SINT_TO_FP, MVT::v2f32, MVT::v2i8, 3},
      {ISD::UINT_TO_FP, MVT::v2f32, MVT::v2i8, 3},
      {ISD::SINT_TO_FP, MVT::v4f32, MVT::v4i8, 3},
      {ISD::UINT_TO_FP, MVT::v4f32, MVT::v4i8, 3},
      // several shuffles
      {ISD::SINT_TO_FP, MVT::v8f32, MVT::v8i8, 10},
      {ISD::UINT_TO_FP, MVT::v8f32, MVT::v8i8, 10},
      {ISD::SINT_TO_FP, MVT::v8f32, MVT::v8i16, 10},
      {ISD::UINT_TO_FP, MVT::v8f32, MVT::v8i16, 10},
      /// trunc_sat, const, and, 3x narrow
      {ISD::FP_TO_SINT, MVT::v2i8, MVT::v2f32, 6},
      {ISD::FP_TO_UINT, MVT::v2i8, MVT::v2f32, 6},
      {ISD::FP_TO_SINT, MVT::v4i8, MVT::v4f32, 6},
      {ISD::FP_TO_UINT, MVT::v4i8, MVT::v4f32, 6},
      /// trunc_sat, const, and, narrow
      {ISD::FP_TO_UINT, MVT::v2i16, MVT::v2f32, 4},
      {ISD::FP_TO_SINT, MVT::v2i16, MVT::v2f32, 4},
      {ISD::FP_TO_SINT, MVT::v4i16, MVT::v4f32, 4},
      {ISD::FP_TO_UINT, MVT::v4i16, MVT::v4f32, 4},
      // 2x trunc_sat, const, 2x and, 3x narrow
      {ISD::FP_TO_SINT, MVT::v8i8, MVT::v8f32, 8},
      {ISD::FP_TO_UINT, MVT::v8i8, MVT::v8f32, 8},
      // 2x trunc_sat, const, 2x and, narrow
      {ISD::FP_TO_SINT, MVT::v8i16, MVT::v8f32, 6},
      {ISD::FP_TO_UINT, MVT::v8i16, MVT::v8f32, 6},
  };

  if (const auto *Entry =
          ConvertCostTableLookup(ConversionTbl, ISD, DstVT, SrcVT)) {
    return Entry->Cost;
  }

  return BaseT::getCastInstrCost(Opcode, Dst, Src, CCH, CostKind, I);
}

TTI::MemCmpExpansionOptions
WebAssemblyTTIImpl::enableMemCmpExpansion(bool OptSize, bool IsZeroCmp) const {
  TTI::MemCmpExpansionOptions Options;

  Options.AllowOverlappingLoads = true;

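  // Load widths the expansion may use, largest first; the 16-byte v128 load
  // is only offered when SIMD128 is available.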
  if (ST->hasSIMD128())
    Options.LoadSizes.push_back(16);

  Options.LoadSizes.append({8, 4, 2, 1});
  Options.MaxNumLoads = TLI->getMaxExpandSizeMemcmp(OptSize);
  Options.NumLoadsPerBlock = Options.MaxNumLoads;

  return Options;
}

InstructionCost WebAssemblyTTIImpl::getMemoryOpCost(
    unsigned Opcode, Type *Ty, Align Alignment, unsigned AddressSpace,
    TTI::TargetCostKind CostKind, TTI::OperandValueInfo OpInfo,
    const Instruction *I) const {
  if (!ST->hasSIMD128() || !isa<FixedVectorType>(Ty)) {
    return BaseT::getMemoryOpCost(Opcode, Ty, Alignment, AddressSpace,
                                  CostKind);
  }

  EVT VT = TLI->getValueType(DL, Ty, true);
  // Type legalization can't handle structs
  if (VT == MVT::Other)
    return BaseT::getMemoryOpCost(Opcode, Ty, Alignment, AddressSpace,
                                  CostKind);

  auto LT = getTypeLegalizationCost(Ty);
  if (!LT.first.isValid())
    return InstructionCost::getInvalid();

  int ISD = TLI->InstructionOpcodeToISD(Opcode);
  unsigned width = VT.getSizeInBits();
  if (ISD == ISD::LOAD) {
    // 128-bit loads are a single instruction. 32-bit and 64-bit vector loads
    // can be lowered to load32_zero and load64_zero respectively. Assume SIMD
    // loads are twice as expensive as scalar.
    switch (width) {
    default:
      break;
    case 32:
    case 64:
    case 128:
      return 2;
    }
  } else if (ISD == ISD::STORE) {
    // For stores, we can use store lane operations.
    switch (width) {
    default:
      break;
    case 8:
    case 16:
    case 32:
    case 64:
    case 128:
      return 2;
    }
  }

  return BaseT::getMemoryOpCost(Opcode, Ty, Alignment, AddressSpace, CostKind);
}

InstructionCost WebAssemblyTTIImpl::getInterleavedMemoryOpCost(
    unsigned Opcode, Type *Ty, unsigned Factor, ArrayRef<unsigned> Indices,
    Align Alignment, unsigned AddressSpace, TTI::TargetCostKind CostKind,
    bool UseMaskForCond, bool UseMaskForGaps) const {
  assert(Factor >= 2 && "Invalid interleave factor");

  auto *VecTy = cast<VectorType>(Ty);
  if (!ST->hasSIMD128() || !isa<FixedVectorType>(VecTy)) {
    return InstructionCost::getInvalid();
  }

  if (UseMaskForCond || UseMaskForGaps)
    return BaseT::getInterleavedMemoryOpCost(Opcode, Ty, Factor, Indices,
                                             Alignment, AddressSpace, CostKind,
                                             UseMaskForCond, UseMaskForGaps);

  constexpr unsigned MaxInterleaveFactor = 4;
  if (Factor <= MaxInterleaveFactor) {
    unsigned MinElts = VecTy->getElementCount().getKnownMinValue();
    // Ensure the number of vector elements is greater than 1.
    if (MinElts < 2 || MinElts % Factor != 0)
      return InstructionCost::getInvalid();

    unsigned ElSize = DL.getTypeSizeInBits(VecTy->getElementType());
    // Ensure the element type is legal.
    if (ElSize != 8 && ElSize != 16 && ElSize != 32 && ElSize != 64)
      return InstructionCost::getInvalid();

    auto *SubVecTy =
        VectorType::get(VecTy->getElementType(),
                        VecTy->getElementCount().divideCoefficientBy(Factor));
    InstructionCost MemCost =
        getMemoryOpCost(Opcode, SubVecTy, Alignment, AddressSpace, CostKind);

    unsigned VecSize = DL.getTypeSizeInBits(SubVecTy);
    unsigned MaxVecSize = 128;
    unsigned NumAccesses =
        std::max<unsigned>(1, (MinElts * ElSize + MaxVecSize - 1) / VecSize);
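    // (Worked example: a factor-2 deinterleave of <8 x i32> uses <4 x i32>
    // subvectors; MinElts * ElSize is 256 bits, so NumAccesses is 2 and the
    // result below is Entry->Cost + 2 * MemCost.)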

    // A stride of two is commonly supported via dedicated instructions, so it
    // should be relatively cheap for all element sizes. A stride of four is
    // more expensive as it will likely require more shuffles. Using two
    // simd128 inputs is considered more expensive and we mainly account for
    // shuffling two inputs (32 bytes), but we do model 4 x v4i32 to enable
    // arithmetic kernels.
    static const CostTblEntry ShuffleCostTbl[] = {
        // One reg.
        {2, MVT::v2i8, 1},  // interleave 2 x 2i8 into 4i8
        {2, MVT::v4i8, 1},  // interleave 2 x 4i8 into 8i8
        {2, MVT::v8i8, 1},  // interleave 2 x 8i8 into 16i8
        {2, MVT::v2i16, 1}, // interleave 2 x 2i16 into 4i16
        {2, MVT::v4i16, 1}, // interleave 2 x 4i16 into 8i16
        {2, MVT::v2i32, 1}, // interleave 2 x 2i32 into 4i32

        // Two regs.
        {2, MVT::v16i8, 2}, // interleave 2 x 16i8 into 32i8
        {2, MVT::v8i16, 2}, // interleave 2 x 8i16 into 16i16
        {2, MVT::v4i32, 2}, // interleave 2 x 4i32 into 8i32

        // One reg.
        {4, MVT::v2i8, 4},  // interleave 4 x 2i8 into 8i8
        {4, MVT::v4i8, 4},  // interleave 4 x 4i8 into 16i8
        {4, MVT::v2i16, 4}, // interleave 4 x 2i16 into 8i16

        // Two regs.
        {4, MVT::v8i8, 16}, // interleave 4 x 8i8 into 32i8
        {4, MVT::v4i16, 8}, // interleave 4 x 4i16 into 16i16
        {4, MVT::v2i32, 4}, // interleave 4 x 2i32 into 8i32

        // Four regs.
        {4, MVT::v4i32, 16}, // interleave 4 x 4i32 into 16i32
    };

    EVT ETy = TLI->getValueType(DL, SubVecTy);
    if (const auto *Entry =
            CostTableLookup(ShuffleCostTbl, Factor, ETy.getSimpleVT()))
      return Entry->Cost + (NumAccesses * MemCost);
  }

  return BaseT::getInterleavedMemoryOpCost(Opcode, VecTy, Factor, Indices,
                                           Alignment, AddressSpace, CostKind,
                                           UseMaskForCond, UseMaskForGaps);
}

InstructionCost WebAssemblyTTIImpl::getVectorInstrCost(
    unsigned Opcode, Type *Val, TTI::TargetCostKind CostKind, unsigned Index,
    const Value *Op0, const Value *Op1) const {
  InstructionCost Cost = BasicTTIImplBase::getVectorInstrCost(
      Opcode, Val, CostKind, Index, Op0, Op1);

  // SIMD128's insert/extract currently only take constant indices.
  if (Index == -1u)
    return Cost + 25 * TargetTransformInfo::TCC_Expensive;

  return Cost;
}

InstructionCost WebAssemblyTTIImpl::getPartialReductionCost(
    unsigned Opcode, Type *InputTypeA, Type *InputTypeB, Type *AccumType,
    ElementCount VF, TTI::PartialReductionExtendKind OpAExtend,
    TTI::PartialReductionExtendKind OpBExtend, std::optional<unsigned> BinOp,
    TTI::TargetCostKind CostKind) const {
  InstructionCost Invalid = InstructionCost::getInvalid();
  if (!VF.isFixed() || !ST->hasSIMD128())
    return Invalid;

  if (CostKind != TTI::TCK_RecipThroughput)
    return Invalid;

  if (Opcode != Instruction::Add)
    return Invalid;

  EVT AccumEVT = EVT::getEVT(AccumType);
  // TODO: Add i64 accumulator.
  if (AccumEVT != MVT::i32)
    return Invalid;

  // Possible options:
  // - i16x8.extadd_pairwise_i8x16_sx
  // - i32x4.extadd_pairwise_i16x8_sx
  // - i32x4.dot_i16x8_s
  // Only try to support dot, for now.
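  // (For instance, a sign-extended i16x8 multiply-accumulate maps onto
  // i32x4.dot_i16x8_s directly; the other supported shapes below pay a
  // multiplier for the extra widening work.)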

  EVT InputEVT = EVT::getEVT(InputTypeA);
  if (!((InputEVT == MVT::i16 && VF.getFixedValue() == 8) ||
        (InputEVT == MVT::i8 && VF.getFixedValue() == 16))) {
    return Invalid;
  }

  if (OpAExtend == TTI::PR_None)
    return Invalid;

  InstructionCost Cost(TTI::TCC_Basic);
  if (!BinOp)
    return Cost;

  if (OpAExtend != OpBExtend)
    return Invalid;

  if (*BinOp != Instruction::Mul)
    return Invalid;

  if (InputTypeA != InputTypeB)
    return Invalid;

  // Signed inputs can lower to dot
  if (InputEVT == MVT::i16 && VF.getFixedValue() == 8)
    return OpAExtend == TTI::PR_SignExtend ? Cost : Cost * 2;

  // Double the size of the lowered sequence.
  if (InputEVT == MVT::i8 && VF.getFixedValue() == 16)
    return OpAExtend == TTI::PR_SignExtend ? Cost * 2 : Cost * 4;

  return Invalid;
}

TTI::ReductionShuffle WebAssemblyTTIImpl::getPreferredExpandedReductionShuffle(
    const IntrinsicInst *II) const {

  switch (II->getIntrinsicID()) {
  default:
    break;
  case Intrinsic::vector_reduce_fadd:
    return TTI::ReductionShuffle::Pairwise;
  }
  return TTI::ReductionShuffle::SplitHalf;
}

void WebAssemblyTTIImpl::getUnrollingPreferences(
    Loop *L, ScalarEvolution &SE, TTI::UnrollingPreferences &UP,
    OptimizationRemarkEmitter *ORE) const {
  // Scan the loop: don't unroll loops with calls. This is a standard approach
  // for most (all?) targets.
  for (BasicBlock *BB : L->blocks())
    for (Instruction &I : *BB)
      if (isa<CallInst>(I) || isa<InvokeInst>(I))
        if (const Function *F = cast<CallBase>(I).getCalledFunction())
          if (isLoweredToCall(F))
            return;

  // The chosen threshold is within the range of 'LoopMicroOpBufferSize' of
  // the various microarchitectures that use the BasicTTI implementation and
  // has been selected through heuristics across multiple cores and runtimes.
  UP.Partial = UP.Runtime = UP.UpperBound = true;
  UP.PartialThreshold = 30;

  // Avoid unrolling when optimizing for size.
  UP.OptSizeThreshold = 0;
  UP.PartialOptSizeThreshold = 0;

  // Set number of instructions optimized when "back edge"
  // becomes "fall through" to default value of 2.
  UP.BEInsns = 2;
}

bool WebAssemblyTTIImpl::supportsTailCalls() const {
  return getST()->hasTailCall();
}

bool WebAssemblyTTIImpl::isProfitableToSinkOperands(
    Instruction *I, SmallVectorImpl<Use *> &Ops) const {
  using namespace llvm::PatternMatch;

  if (!I->getType()->isVectorTy() || !I->isShift())
    return false;

  Value *V = I->getOperand(1);
  // We don't need to sink a constant splat.
  if (isa<Constant>(V))
    return false;

  if (match(V, m_Shuffle(m_InsertElt(m_Value(), m_Value(), m_ZeroInt()),
                         m_Value(), m_ZeroMask()))) {
    // Sink insert
    Ops.push_back(&cast<Instruction>(V)->getOperandUse(0));
    // Sink shuffle
    Ops.push_back(&I->getOperandUse(1));
    return true;
  }

  return false;
}

/// Attempt to convert [relaxed_]swizzle to shufflevector if the mask is
/// constant.
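/// (For example, a call to llvm.wasm.swizzle with an all-in-range constant
/// mask becomes a single shufflevector of its first operand.)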
static Value *simplifyWasmSwizzle(const IntrinsicInst &II,
                                  InstCombiner::BuilderTy &Builder,
                                  bool IsRelaxed) {
  auto *V = dyn_cast<Constant>(II.getArgOperand(1));
  if (!V)
    return nullptr;

  auto *VecTy = cast<FixedVectorType>(II.getType());
  unsigned NumElts = VecTy->getNumElements();
  assert(NumElts == 16);

  // Construct a shuffle mask from constant integers or UNDEFs.
  int Indexes[16];
  bool AnyOutOfBounds = false;

  for (unsigned I = 0; I < NumElts; ++I) {
    Constant *COp = V->getAggregateElement(I);
    if (!COp || (!isa<UndefValue>(COp) && !isa<ConstantInt>(COp)))
      return nullptr;

    if (isa<UndefValue>(COp)) {
      Indexes[I] = -1;
      continue;
    }

    if (IsRelaxed && cast<ConstantInt>(COp)->getSExtValue() >= NumElts) {
      // The relaxed_swizzle operation always returns 0 if the lane index is
      // less than 0 when interpreted as a signed value. For lane indices
      // above 15, however, it can choose between returning 0 and the lane at
      // `Index % 16`, and the choice must be made consistently. As the
      // WebAssembly spec states:
      //
      // "The result of relaxed operators are implementation-dependent, because
      // the set of possible results may depend on properties of the host
      // environment, such as its hardware. Technically, their behaviour is
      // controlled by a set of global parameters to the semantics that an
      // implementation can instantiate in different ways. These choices are
      // fixed, that is, parameters are constant during the execution of any
      // given program."
      //
      // The WebAssembly runtime may choose differently from us, so we can't
      // optimize a relaxed swizzle with lane indices above 15.
      return nullptr;
    }

    uint64_t Index = cast<ConstantInt>(COp)->getZExtValue();
    if (Index >= NumElts) {
      AnyOutOfBounds = true;
      // If there are out-of-bounds indices, the swizzle instruction returns
      // zeroes in those lanes. We'll provide an all-zeroes vector as the
      // second argument to shufflevector and read the first element from it.
      Indexes[I] = NumElts;
      continue;
    }

    Indexes[I] = Index;
  }

  auto *V1 = II.getArgOperand(0);
  auto *V2 =
      AnyOutOfBounds ? Constant::getNullValue(VecTy) : PoisonValue::get(VecTy);

  return Builder.CreateShuffleVector(V1, V2, ArrayRef(Indexes, NumElts));
}

std::optional<Instruction *>
WebAssemblyTTIImpl::instCombineIntrinsic(InstCombiner &IC,
                                         IntrinsicInst &II) const {
  Intrinsic::ID IID = II.getIntrinsicID();
  switch (IID) {
  case Intrinsic::wasm_swizzle:
  case Intrinsic::wasm_relaxed_swizzle:
    if (Value *V = simplifyWasmSwizzle(
            II, IC.Builder, IID == Intrinsic::wasm_relaxed_swizzle)) {
      return IC.replaceInstUsesWith(II, V);
    }
    break;
  }

  return std::nullopt;
}