13#include "llvm/IR/IntrinsicsAMDGPU.h"
17using namespace MIPatternMatch;
21 switch (
MI.getOpcode()) {
27 case AMDGPU::G_FMINNUM:
28 case AMDGPU::G_FMAXNUM:
29 case AMDGPU::G_FMINNUM_IEEE:
30 case AMDGPU::G_FMAXNUM_IEEE:
33 case AMDGPU::G_INTRINSIC_TRUNC:
34 case AMDGPU::G_FPTRUNC:
36 case AMDGPU::G_FNEARBYINT:
37 case AMDGPU::G_INTRINSIC_ROUND:
38 case AMDGPU::G_INTRINSIC_ROUNDEVEN:
39 case AMDGPU::G_FCANONICALIZE:
40 case AMDGPU::G_AMDGPU_RCP_IFLAG:
41 case AMDGPU::G_AMDGPU_FMIN_LEGACY:
42 case AMDGPU::G_AMDGPU_FMAX_LEGACY:
44 case AMDGPU::G_INTRINSIC: {
45 unsigned IntrinsicID =
MI.getIntrinsicID();
46 switch (IntrinsicID) {
47 case Intrinsic::amdgcn_rcp:
48 case Intrinsic::amdgcn_rcp_legacy:
49 case Intrinsic::amdgcn_sin:
50 case Intrinsic::amdgcn_fmul_legacy:
51 case Intrinsic::amdgcn_fmed3:
52 case Intrinsic::amdgcn_fma_legacy:
69 return MI.getNumOperands() >
70 (
MI.getOpcode() == AMDGPU::G_INTRINSIC ? 4u : 3u) ||
77 if (!
MI.memoperands().empty())
80 switch (
MI.getOpcode()) {
82 case AMDGPU::G_SELECT:
85 case TargetOpcode::INLINEASM:
86 case TargetOpcode::INLINEASM_BR:
87 case AMDGPU::G_INTRINSIC_W_SIDE_EFFECTS:
88 case AMDGPU::G_BITCAST:
89 case AMDGPU::G_ANYEXT:
90 case AMDGPU::G_BUILD_VECTOR:
91 case AMDGPU::G_BUILD_VECTOR_TRUNC:
94 case AMDGPU::G_INTRINSIC: {
95 unsigned IntrinsicID =
MI.getIntrinsicID();
96 switch (IntrinsicID) {
97 case Intrinsic::amdgcn_interp_p1:
98 case Intrinsic::amdgcn_interp_p2:
99 case Intrinsic::amdgcn_interp_mov:
100 case Intrinsic::amdgcn_interp_p1_f16:
101 case Intrinsic::amdgcn_interp_p2_f16:
102 case Intrinsic::amdgcn_div_scale:
120 unsigned NumMayIncreaseSize = 0;
136 return Options.NoSignedZerosFPMath ||
MI.getFlag(MachineInstr::MIFlag::FmNsz);
140 static const APFloat KF16(APFloat::IEEEhalf(),
APInt(16, 0x3118));
141 static const APFloat KF32(APFloat::IEEEsingle(),
APInt(32, 0x3e22f983));
142 static const APFloat KF64(APFloat::IEEEdouble(),
143 APInt(64, 0x3fc45f306dc9c882));
153 std::optional<FPValueAndVReg> FPValReg;
155 if (FPValReg->Value.isZero() && !FPValReg->Value.isNegative())
159 if (ST.hasInv2PiInlineImm() &&
isInv2Pi(FPValReg->Value))
167 case AMDGPU::G_FMAXNUM:
168 return AMDGPU::G_FMINNUM;
169 case AMDGPU::G_FMINNUM:
170 return AMDGPU::G_FMAXNUM;
171 case AMDGPU::G_FMAXNUM_IEEE:
172 return AMDGPU::G_FMINNUM_IEEE;
173 case AMDGPU::G_FMINNUM_IEEE:
174 return AMDGPU::G_FMAXNUM_IEEE;
175 case AMDGPU::G_AMDGPU_FMAX_LEGACY:
176 return AMDGPU::G_AMDGPU_FMIN_LEGACY;
177 case AMDGPU::G_AMDGPU_FMIN_LEGACY:
178 return AMDGPU::G_AMDGPU_FMAX_LEGACY;
204 case AMDGPU::G_FMINNUM:
205 case AMDGPU::G_FMAXNUM:
206 case AMDGPU::G_FMINNUM_IEEE:
207 case AMDGPU::G_FMAXNUM_IEEE:
208 case AMDGPU::G_AMDGPU_FMIN_LEGACY:
209 case AMDGPU::G_AMDGPU_FMAX_LEGACY:
219 case AMDGPU::G_FPEXT:
220 case AMDGPU::G_INTRINSIC_TRUNC:
221 case AMDGPU::G_FPTRUNC:
222 case AMDGPU::G_FRINT:
223 case AMDGPU::G_FNEARBYINT:
224 case AMDGPU::G_INTRINSIC_ROUND:
225 case AMDGPU::G_INTRINSIC_ROUNDEVEN:
227 case AMDGPU::G_FCANONICALIZE:
228 case AMDGPU::G_AMDGPU_RCP_IFLAG:
230 case AMDGPU::G_INTRINSIC: {
232 switch (IntrinsicID) {
233 case Intrinsic::amdgcn_rcp:
234 case Intrinsic::amdgcn_rcp_legacy:
235 case Intrinsic::amdgcn_sin:
236 case Intrinsic::amdgcn_fmul_legacy:
237 case Intrinsic::amdgcn_fmed3:
239 case Intrinsic::amdgcn_fma_legacy:
300 case AMDGPU::G_FMINNUM:
301 case AMDGPU::G_FMAXNUM:
302 case AMDGPU::G_FMINNUM_IEEE:
303 case AMDGPU::G_FMAXNUM_IEEE:
304 case AMDGPU::G_AMDGPU_FMIN_LEGACY:
305 case AMDGPU::G_AMDGPU_FMAX_LEGACY: {
317 case AMDGPU::G_FPEXT:
318 case AMDGPU::G_INTRINSIC_TRUNC:
319 case AMDGPU::G_FRINT:
320 case AMDGPU::G_FNEARBYINT:
321 case AMDGPU::G_INTRINSIC_ROUND:
322 case AMDGPU::G_INTRINSIC_ROUNDEVEN:
324 case AMDGPU::G_FCANONICALIZE:
325 case AMDGPU::G_AMDGPU_RCP_IFLAG:
326 case AMDGPU::G_FPTRUNC:
329 case AMDGPU::G_INTRINSIC: {
331 switch (IntrinsicID) {
332 case Intrinsic::amdgcn_rcp:
333 case Intrinsic::amdgcn_rcp_legacy:
334 case Intrinsic::amdgcn_sin:
337 case Intrinsic::amdgcn_fmul_legacy:
340 case Intrinsic::amdgcn_fmed3:
345 case Intrinsic::amdgcn_fma_legacy:
381 MI.eraseFromParent();
389 if (Def->getOpcode() == TargetOpcode::G_FPEXT) {
390 Register SrcReg = Def->getOperand(1).getReg();
394 if (Def->getOpcode() == TargetOpcode::G_FCONSTANT) {
395 APFloat Val = Def->getOperand(1).getFPImm()->getValueAPF();
396 bool LosesInfo =
true;
397 Val.
convert(APFloat::IEEEhalf(), APFloat::rmNearestTiesToEven, &LosesInfo);
408 assert(
MI.getOpcode() == TargetOpcode::G_FPTRUNC);
434 MI.eraseFromParent();
unsigned const MachineRegisterInfo * MRI
static LLVM_READONLY bool hasSourceMods(const MachineInstr &MI)
static bool isInv2Pi(const APFloat &APF)
static bool isFPExtFromF16OrConst(const MachineRegisterInfo &MRI, Register Reg)
static bool mayIgnoreSignedZero(MachineInstr &MI)
static bool isConstantCostlierToNegate(MachineInstr &MI, Register Reg, MachineRegisterInfo &MRI)
static bool allUsesHaveSourceMods(MachineInstr &MI, MachineRegisterInfo &MRI, unsigned CostThreshold=4)
static LLVM_READONLY bool opMustUseVOP3Encoding(const MachineInstr &MI, const MachineRegisterInfo &MRI)
returns true if the operation will definitely need to use a 64-bit encoding, and thus will use a VOP3 encoding regardless of the source modifiers.
static unsigned inverseMinMax(unsigned Opc)
static LLVM_READNONE bool fnegFoldsIntoMI(const MachineInstr &MI)
This contains common combine transformations that may be used in a combine pass.
Provides AMDGPU specific target descriptions.
static cl::opt< unsigned > CostThreshold("dfa-cost-threshold", cl::desc("Maximum cost accepted for the transformation"), cl::Hidden, cl::init(50))
static GCMetadataPrinterRegistry::Add< ErlangGCPrinter > X("erlang", "erlang-compatible garbage collector")
AMD GCN specific subclass of TargetSubtarget.
Contains matchers for matching SSA Machine Instructions.
static unsigned getReg(const MCDisassembler *D, unsigned RC, unsigned RegNo)
static GCMetadataPrinterRegistry::Add< OcamlGCMetadataPrinter > Y("ocaml", "ocaml 3.10-compatible collector")
assert(ImpDefSCC.getReg()==AMDGPU::SCC &&ImpDefSCC.isDef())
void applyExpandPromotedF16FMed3(MachineInstr &MI, Register Src0, Register Src1, Register Src2)
bool matchFoldableFneg(MachineInstr &MI, MachineInstr *&MatchInfo)
bool matchExpandPromotedF16FMed3(MachineInstr &MI, Register Src0, Register Src1, Register Src2)
void applyFoldableFneg(MachineInstr &MI, MachineInstr *&MatchInfo)
opStatus convert(const fltSemantics &ToSemantics, roundingMode RM, bool *losesInfo)
bool bitwiseIsEqual(const APFloat &RHS) const
Class for arbitrary precision integers.
void replaceRegWith(MachineRegisterInfo &MRI, Register FromReg, Register ToReg) const
Calls MachineRegisterInfo::replaceRegWith() and informs the observer of the changes.
void replaceRegOpWith(MachineRegisterInfo &MRI, MachineOperand &FromRegOp, Register ToReg) const
Replace a single register operand with a new register and inform the observer of the changes.
void replaceOpcodeWith(MachineInstr &FromMI, unsigned ToOpcode) const
Replace the opcode in instruction with a new opcode and inform the observer of the changes.
MachineRegisterInfo & MRI
MachineIRBuilder & Builder
static constexpr LLT scalar(unsigned SizeInBits)
Get a low-level scalar or aggregate "bag of bits".
MachineInstrBuilder buildFMinNumIEEE(const DstOp &Dst, const SrcOp &Src0, const SrcOp &Src1, std::optional< unsigned > Flags=std::nullopt)
void setInstrAndDebugLoc(MachineInstr &MI)
Set the insertion point to before MI, and set the debug loc to MI's loc.
MachineInstrBuilder buildFNeg(const DstOp &Dst, const SrcOp &Src0, std::optional< unsigned > Flags=std::nullopt)
Build and insert Res = G_FNEG Op0.
MachineInstrBuilder buildFMaxNumIEEE(const DstOp &Dst, const SrcOp &Src0, const SrcOp &Src1, std::optional< unsigned > Flags=std::nullopt)
MachineInstrBuilder buildFPTrunc(const DstOp &Res, const SrcOp &Op, std::optional< unsigned > Flags=std::nullopt)
Build and insert Res = G_FPTRUNC Op.
Register getReg(unsigned Idx) const
Get the register for the operand index.
Representation of each machine instruction.
unsigned getOpcode() const
Returns the opcode of this MachineInstr.
const MachineOperand & getOperand(unsigned i) const
unsigned getIntrinsicID() const
Returns the Intrinsic::ID for this instruction.
MachineOperand class - Representation of each machine instruction operand.
Register getReg() const
getReg - Returns the register number.
MachineRegisterInfo - Keep track of information for virtual and physical registers,...
bool hasOneNonDBGUse(Register RegNo) const
hasOneNonDBGUse - Return true if there is exactly one non-Debug use of the specified register.
MachineInstr * getVRegDef(Register Reg) const
getVRegDef - Return the machine instr that defines the specified virtual register or null if none is found.
LLT getType(Register Reg) const
Get the low-level type of Reg or LLT{} if Reg is not a generic (target independent) virtual register.
Register createGenericVirtualRegister(LLT Ty, StringRef Name="")
Create and return a new generic virtual register with low-level type Ty.
Wrapper class representing virtual and physical registers.
The instances of the Type class are immutable: once they are created, they are never changed.
A Use represents the edge between a Value definition and its users.
self_iterator getIterator()
#define llvm_unreachable(msg)
Marks that the current location is not supposed to be reachable.
operand_type_match m_Reg()
bool mi_match(Reg R, const MachineRegisterInfo &MRI, Pattern &&P)
UnaryOp_match< SrcTy, TargetOpcode::G_FNEG > m_GFNeg(const SrcTy &Src)
GFCstOrSplatGFCstMatch m_GFCstOrSplat(std::optional< FPValueAndVReg > &FPValReg)
This is an optimization pass for GlobalISel generic memory operations.