doxygen/AArch64RegisterBankInfo_8cpp_source.html

//===- AArch64RegisterBankInfo.cpp ----------------------------------------===//

//

// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.

// See https://llvm.org/LICENSE.txt for license information.

// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception

//

//===----------------------------------------------------------------------===//

/// \file

/// This file implements the targeting of the RegisterBankInfo class for

/// AArch64.

/// \todo This should be generated by TableGen.

//===----------------------------------------------------------------------===//


#include "AArch64RegisterBankInfo.h"

#include "AArch64RegisterInfo.h"

#include "MCTargetDesc/AArch64MCTargetDesc.h"

#include "llvm/ADT/STLExtras.h"

#include "llvm/ADT/SmallVector.h"

#include "llvm/CodeGen/GlobalISel/GenericMachineInstrs.h"

#include "llvm/CodeGen/GlobalISel/MachineIRBuilder.h"

#include "llvm/CodeGen/GlobalISel/Utils.h"

#include "llvm/CodeGen/LowLevelTypeUtils.h"

#include "llvm/CodeGen/MachineFunction.h"

#include "llvm/CodeGen/MachineInstr.h"

#include "llvm/CodeGen/MachineOperand.h"

#include "llvm/CodeGen/MachineRegisterInfo.h"

#include "llvm/CodeGen/RegisterBank.h"

#include "llvm/CodeGen/RegisterBankInfo.h"

#include "llvm/CodeGen/TargetOpcodes.h"

#include "llvm/CodeGen/TargetRegisterInfo.h"

#include "llvm/CodeGen/TargetSubtargetInfo.h"

#include "llvm/IR/IntrinsicsAArch64.h"

#include "llvm/Support/ErrorHandling.h"

#include "llvm/Support/Threading.h"

#include <algorithm>

#include <cassert>


#define GET_TARGET_REGBANK_IMPL

#include "AArch64GenRegisterBank.inc"


// This file will be TableGen'ed at some point.

#include "AArch64GenRegisterBankInfo.def"


using namespace llvm;


AArch64RegisterBankInfo::AArch64RegisterBankInfo(

    const TargetRegisterInfo &TRI) {

  static llvm::once_flag InitializeRegisterBankFlag;


  static auto InitializeRegisterBankOnce = [&]() {

    // We have only one set of register banks, whatever the subtarget

    // is. Therefore, the initialization of the RegBanks table should be

    // done only once. Indeed the table of all register banks

    // (AArch64::RegBanks) is unique in the compiler. At some point, it

    // will get tablegen'ed and the whole constructor becomes empty.


    const RegisterBank &RBGPR = getRegBank(AArch64::GPRRegBankID);

    (void)RBGPR;

    assert(&AArch64::GPRRegBank == &RBGPR &&

           "The order in RegBanks is messed up");


    const RegisterBank &RBFPR = getRegBank(AArch64::FPRRegBankID);

    (void)RBFPR;

    assert(&AArch64::FPRRegBank == &RBFPR &&

           "The order in RegBanks is messed up");


    const RegisterBank &RBCCR = getRegBank(AArch64::CCRegBankID);

    (void)RBCCR;

    assert(&AArch64::CCRegBank == &RBCCR &&

           "The order in RegBanks is messed up");


    // The GPR register bank is fully defined by all the registers in

    // GR64all + its subclasses.

    assert(RBGPR.covers(*TRI.getRegClass(AArch64::GPR32RegClassID)) &&

           "Subclass not added?");

    assert(getMaximumSize(RBGPR.getID()) == 128 &&

           "GPRs should hold up to 128-bit");


    // The FPR register bank is fully defined by all the registers in

    // GR64all + its subclasses.

    assert(RBFPR.covers(*TRI.getRegClass(AArch64::QQRegClassID)) &&

           "Subclass not added?");

    assert(RBFPR.covers(*TRI.getRegClass(AArch64::FPR64RegClassID)) &&

           "Subclass not added?");

    assert(getMaximumSize(RBFPR.getID()) == 512 &&

           "FPRs should hold up to 512-bit via QQQQ sequence");


    assert(RBCCR.covers(*TRI.getRegClass(AArch64::CCRRegClassID)) &&

           "Class not added?");

    assert(getMaximumSize(RBCCR.getID()) == 32 &&

           "CCR should hold up to 32-bit");


    // Check that the TableGen'ed like file is in sync we our expectations.

    // First, the Idx.

    assert(checkPartialMappingIdx(PMI_FirstGPR, PMI_LastGPR,

                                  {PMI_GPR32, PMI_GPR64, PMI_GPR128}) &&

           "PartialMappingIdx's are incorrectly ordered");

    assert(checkPartialMappingIdx(PMI_FirstFPR, PMI_LastFPR,

                                  {PMI_FPR16, PMI_FPR32, PMI_FPR64, PMI_FPR128,

                                   PMI_FPR256, PMI_FPR512}) &&

           "PartialMappingIdx's are incorrectly ordered");

// Now, the content.

// Check partial mapping.

#define CHECK_PARTIALMAP(Idx, ValStartIdx, ValLength, RB)                      \

  do {                                                                         \

    assert(                                                                    \

        checkPartialMap(PartialMappingIdx::Idx, ValStartIdx, ValLength, RB) && \

        #Idx " is incorrectly initialized");                                   \

  } while (false)


    CHECK_PARTIALMAP(PMI_GPR32, 0, 32, RBGPR);

    CHECK_PARTIALMAP(PMI_GPR64, 0, 64, RBGPR);

    CHECK_PARTIALMAP(PMI_GPR128, 0, 128, RBGPR);

    CHECK_PARTIALMAP(PMI_FPR16, 0, 16, RBFPR);

    CHECK_PARTIALMAP(PMI_FPR32, 0, 32, RBFPR);

    CHECK_PARTIALMAP(PMI_FPR64, 0, 64, RBFPR);

    CHECK_PARTIALMAP(PMI_FPR128, 0, 128, RBFPR);

    CHECK_PARTIALMAP(PMI_FPR256, 0, 256, RBFPR);

    CHECK_PARTIALMAP(PMI_FPR512, 0, 512, RBFPR);


// Check value mapping.

#define CHECK_VALUEMAP_IMPL(RBName, Size, Offset)                              \

  do {                                                                         \

    assert(checkValueMapImpl(PartialMappingIdx::PMI_##RBName##Size,            \

                             PartialMappingIdx::PMI_First##RBName, Size,       \

                             Offset) &&                                        \

           #RBName #Size " " #Offset " is incorrectly initialized");           \

  } while (false)


#define CHECK_VALUEMAP(RBName, Size) CHECK_VALUEMAP_IMPL(RBName, Size, 0)


    CHECK_VALUEMAP(GPR, 32);

    CHECK_VALUEMAP(GPR, 64);

    CHECK_VALUEMAP(GPR, 128);

    CHECK_VALUEMAP(FPR, 16);

    CHECK_VALUEMAP(FPR, 32);

    CHECK_VALUEMAP(FPR, 64);

    CHECK_VALUEMAP(FPR, 128);

    CHECK_VALUEMAP(FPR, 256);

    CHECK_VALUEMAP(FPR, 512);


// Check the value mapping for 3-operands instructions where all the operands

// map to the same value mapping.

#define CHECK_VALUEMAP_3OPS(RBName, Size)                                      \

  do {                                                                         \

    CHECK_VALUEMAP_IMPL(RBName, Size, 0);                                      \

    CHECK_VALUEMAP_IMPL(RBName, Size, 1);                                      \

    CHECK_VALUEMAP_IMPL(RBName, Size, 2);                                      \

  } while (false)


    CHECK_VALUEMAP_3OPS(GPR, 32);

    CHECK_VALUEMAP_3OPS(GPR, 64);

    CHECK_VALUEMAP_3OPS(GPR, 128);

    CHECK_VALUEMAP_3OPS(FPR, 32);

    CHECK_VALUEMAP_3OPS(FPR, 64);

    CHECK_VALUEMAP_3OPS(FPR, 128);

    CHECK_VALUEMAP_3OPS(FPR, 256);

    CHECK_VALUEMAP_3OPS(FPR, 512);


#define CHECK_VALUEMAP_CROSSREGCPY(RBNameDst, RBNameSrc, Size)                 \

  do {                                                                         \

    unsigned PartialMapDstIdx = PMI_##RBNameDst##Size - PMI_Min;               \

    unsigned PartialMapSrcIdx = PMI_##RBNameSrc##Size - PMI_Min;               \

    (void)PartialMapDstIdx;                                                    \

    (void)PartialMapSrcIdx;                                                    \

    const ValueMapping *Map = getCopyMapping(AArch64::RBNameDst##RegBankID,    \

                                             AArch64::RBNameSrc##RegBankID,    \

                                             TypeSize::getFixed(Size));        \

    (void)Map;                                                                 \

    assert(Map[0].BreakDown ==                                                 \

               &AArch64GenRegisterBankInfo::PartMappings[PartialMapDstIdx] &&  \

           Map[0].NumBreakDowns == 1 &&                                        \

           #RBNameDst #Size " Dst is incorrectly initialized");                \

    assert(Map[1].BreakDown ==                                                 \

               &AArch64GenRegisterBankInfo::PartMappings[PartialMapSrcIdx] &&  \

           Map[1].NumBreakDowns == 1 &&                                        \

           #RBNameSrc #Size " Src is incorrectly initialized");                \

                                                                               \

  } while (false)


    CHECK_VALUEMAP_CROSSREGCPY(GPR, GPR, 32);

    CHECK_VALUEMAP_CROSSREGCPY(GPR, FPR, 32);

    CHECK_VALUEMAP_CROSSREGCPY(GPR, GPR, 64);

    CHECK_VALUEMAP_CROSSREGCPY(GPR, FPR, 64);

    CHECK_VALUEMAP_CROSSREGCPY(FPR, FPR, 32);

    CHECK_VALUEMAP_CROSSREGCPY(FPR, GPR, 32);

    CHECK_VALUEMAP_CROSSREGCPY(FPR, FPR, 64);

    CHECK_VALUEMAP_CROSSREGCPY(FPR, GPR, 64);


#define CHECK_VALUEMAP_FPEXT(DstSize, SrcSize)                                 \

  do {                                                                         \

    unsigned PartialMapDstIdx = PMI_FPR##DstSize - PMI_Min;                    \

    unsigned PartialMapSrcIdx = PMI_FPR##SrcSize - PMI_Min;                    \

    (void)PartialMapDstIdx;                                                    \

    (void)PartialMapSrcIdx;                                                    \

    const ValueMapping *Map = getFPExtMapping(DstSize, SrcSize);               \

    (void)Map;                                                                 \

    assert(Map[0].BreakDown ==                                                 \

               &AArch64GenRegisterBankInfo::PartMappings[PartialMapDstIdx] &&  \

           Map[0].NumBreakDowns == 1 && "FPR" #DstSize                         \

                                        " Dst is incorrectly initialized");    \

    assert(Map[1].BreakDown ==                                                 \

               &AArch64GenRegisterBankInfo::PartMappings[PartialMapSrcIdx] &&  \

           Map[1].NumBreakDowns == 1 && "FPR" #SrcSize                         \

                                        " Src is incorrectly initialized");    \

                                                                               \

  } while (false)


    CHECK_VALUEMAP_FPEXT(32, 16);

    CHECK_VALUEMAP_FPEXT(64, 16);

    CHECK_VALUEMAP_FPEXT(64, 32);

    CHECK_VALUEMAP_FPEXT(128, 64);


    assert(verify(TRI) && "Invalid register bank information");

  };


  llvm::call_once(InitializeRegisterBankFlag, InitializeRegisterBankOnce);

}


unsigned AArch64RegisterBankInfo::copyCost(const RegisterBank &A,

                                           const RegisterBank &B,

                                           const TypeSize Size) const {

  // What do we do with different size?

  // copy are same size.

  // Will introduce other hooks for different size:

  // * extract cost.

  // * build_sequence cost.


  // Copy from (resp. to) GPR to (resp. from) FPR involves FMOV.

  // FIXME: This should be deduced from the scheduling model.

  if (&A == &AArch64::GPRRegBank && &B == &AArch64::FPRRegBank)

    // FMOVXDr or FMOVWSr.

    return 5;

  if (&A == &AArch64::FPRRegBank && &B == &AArch64::GPRRegBank)

    // FMOVDXr or FMOVSWr.

    return 4;


  return RegisterBankInfo::copyCost(A, B, Size);

}


const RegisterBank &

AArch64RegisterBankInfo::getRegBankFromRegClass(const TargetRegisterClass &RC,

                                                LLT) const {

  switch (RC.getID()) {

  case AArch64::FPR8RegClassID:

  case AArch64::FPR16RegClassID:

  case AArch64::FPR16_loRegClassID:

  case AArch64::FPR32_with_hsub_in_FPR16_loRegClassID:

  case AArch64::FPR32RegClassID:

  case AArch64::FPR64RegClassID:

  case AArch64::FPR128RegClassID:

  case AArch64::FPR64_loRegClassID:

  case AArch64::FPR128_loRegClassID:

  case AArch64::FPR128_0to7RegClassID:

  case AArch64::DDRegClassID:

  case AArch64::DDDRegClassID:

  case AArch64::DDDDRegClassID:

  case AArch64::QQRegClassID:

  case AArch64::QQQRegClassID:

  case AArch64::QQQQRegClassID:

  case AArch64::ZPRRegClassID:

  case AArch64::ZPR_3bRegClassID:

    return getRegBank(AArch64::FPRRegBankID);

  case AArch64::GPR32commonRegClassID:

  case AArch64::GPR32RegClassID:

  case AArch64::GPR32spRegClassID:

  case AArch64::GPR32sponlyRegClassID:

  case AArch64::GPR32argRegClassID:

  case AArch64::GPR32allRegClassID:

  case AArch64::GPR64commonRegClassID:

  case AArch64::GPR64RegClassID:

  case AArch64::GPR64spRegClassID:

  case AArch64::GPR64sponlyRegClassID:

  case AArch64::GPR64argRegClassID:

  case AArch64::GPR64allRegClassID:

  case AArch64::GPR64noipRegClassID:

  case AArch64::GPR64common_and_GPR64noipRegClassID:

  case AArch64::GPR64noip_and_tcGPR64RegClassID:

  case AArch64::tcGPR64RegClassID:

  case AArch64::tcGPRx16x17RegClassID:

  case AArch64::tcGPRx17RegClassID:

  case AArch64::tcGPRnotx16RegClassID:

  case AArch64::WSeqPairsClassRegClassID:

  case AArch64::XSeqPairsClassRegClassID:

  case AArch64::MatrixIndexGPR32_8_11RegClassID:

  case AArch64::MatrixIndexGPR32_12_15RegClassID:

  case AArch64::GPR64_with_sub_32_in_MatrixIndexGPR32_8_11RegClassID:

  case AArch64::GPR64_with_sub_32_in_MatrixIndexGPR32_12_15RegClassID:

    return getRegBank(AArch64::GPRRegBankID);

  case AArch64::CCRRegClassID:

    return getRegBank(AArch64::CCRegBankID);

  default:

    llvm_unreachable("Register class not supported");

  }

}


RegisterBankInfo::InstructionMappings

AArch64RegisterBankInfo::getInstrAlternativeMappings(

    const MachineInstr &MI) const {

  const MachineFunction &MF = *MI.getParent()->getParent();

  const TargetSubtargetInfo &STI = MF.getSubtarget();

  const TargetRegisterInfo &TRI = *STI.getRegisterInfo();

  const MachineRegisterInfo &MRI = MF.getRegInfo();


  switch (MI.getOpcode()) {

  case TargetOpcode::G_OR: {

    // 32 and 64-bit or can be mapped on either FPR or

    // GPR for the same cost.

    TypeSize Size = getSizeInBits(MI.getOperand(0).getReg(), MRI, TRI);

    if (Size != 32 && Size != 64)

      break;


    // If the instruction has any implicit-defs or uses,

    // do not mess with it.

    if (MI.getNumOperands() != 3)

      break;

    InstructionMappings AltMappings;

    const InstructionMapping &GPRMapping = getInstructionMapping(

        /*ID*/ 1, /*Cost*/ 1, getValueMapping(PMI_FirstGPR, Size),

        /*NumOperands*/ 3);

    const InstructionMapping &FPRMapping = getInstructionMapping(

        /*ID*/ 2, /*Cost*/ 1, getValueMapping(PMI_FirstFPR, Size),

        /*NumOperands*/ 3);


    AltMappings.push_back(&GPRMapping);

    AltMappings.push_back(&FPRMapping);

    return AltMappings;

  }

  case TargetOpcode::G_BITCAST: {

    TypeSize Size = getSizeInBits(MI.getOperand(0).getReg(), MRI, TRI);

    if (Size != 32 && Size != 64)

      break;


    // If the instruction has any implicit-defs or uses,

    // do not mess with it.

    if (MI.getNumOperands() != 2)

      break;


    InstructionMappings AltMappings;

    const InstructionMapping &GPRMapping = getInstructionMapping(

        /*ID*/ 1, /*Cost*/ 1,

        getCopyMapping(AArch64::GPRRegBankID, AArch64::GPRRegBankID, Size),

        /*NumOperands*/ 2);

    const InstructionMapping &FPRMapping = getInstructionMapping(

        /*ID*/ 2, /*Cost*/ 1,

        getCopyMapping(AArch64::FPRRegBankID, AArch64::FPRRegBankID, Size),

        /*NumOperands*/ 2);

    const InstructionMapping &GPRToFPRMapping = getInstructionMapping(

        /*ID*/ 3,

        /*Cost*/

        copyCost(AArch64::GPRRegBank, AArch64::FPRRegBank,

                 TypeSize::getFixed(Size)),

        getCopyMapping(AArch64::FPRRegBankID, AArch64::GPRRegBankID, Size),

        /*NumOperands*/ 2);

    const InstructionMapping &FPRToGPRMapping = getInstructionMapping(

        /*ID*/ 3,

        /*Cost*/

        copyCost(AArch64::GPRRegBank, AArch64::FPRRegBank,

                 TypeSize::getFixed(Size)),

        getCopyMapping(AArch64::GPRRegBankID, AArch64::FPRRegBankID, Size),

        /*NumOperands*/ 2);


    AltMappings.push_back(&GPRMapping);

    AltMappings.push_back(&FPRMapping);

    AltMappings.push_back(&GPRToFPRMapping);

    AltMappings.push_back(&FPRToGPRMapping);

    return AltMappings;

  }

  case TargetOpcode::G_LOAD: {

    TypeSize Size = getSizeInBits(MI.getOperand(0).getReg(), MRI, TRI);

    if (Size != 64)

      break;


    // If the instruction has any implicit-defs or uses,

    // do not mess with it.

    if (MI.getNumOperands() != 2)

      break;


    InstructionMappings AltMappings;

    const InstructionMapping &GPRMapping = getInstructionMapping(

        /*ID*/ 1, /*Cost*/ 1,

        getOperandsMapping(

            {getValueMapping(PMI_FirstGPR, Size),

             // Addresses are GPR 64-bit.

             getValueMapping(PMI_FirstGPR, TypeSize::getFixed(64))}),

        /*NumOperands*/ 2);

    const InstructionMapping &FPRMapping = getInstructionMapping(

        /*ID*/ 2, /*Cost*/ 1,

        getOperandsMapping(

            {getValueMapping(PMI_FirstFPR, Size),

             // Addresses are GPR 64-bit.

             getValueMapping(PMI_FirstGPR, TypeSize::getFixed(64))}),

        /*NumOperands*/ 2);


    AltMappings.push_back(&GPRMapping);

    AltMappings.push_back(&FPRMapping);

    return AltMappings;

  }

  default:

    break;

  }

  return RegisterBankInfo::getInstrAlternativeMappings(MI);

}


void AArch64RegisterBankInfo::applyMappingImpl(

    MachineIRBuilder &Builder, const OperandsMapper &OpdMapper) const {

  MachineInstr &MI = OpdMapper.getMI();

  MachineRegisterInfo &MRI = OpdMapper.getMRI();


  switch (MI.getOpcode()) {

  case TargetOpcode::G_OR:

  case TargetOpcode::G_BITCAST:

  case TargetOpcode::G_LOAD:

    // Those ID must match getInstrAlternativeMappings.

    assert((OpdMapper.getInstrMapping().getID() >= 1 &&

            OpdMapper.getInstrMapping().getID() <= 4) &&

           "Don't know how to handle that ID");

    return applyDefaultMapping(OpdMapper);

  case TargetOpcode::G_INSERT_VECTOR_ELT: {

    // Extend smaller gpr operands to 32 bit.

    Builder.setInsertPt(*MI.getParent(), MI.getIterator());

    auto Ext = Builder.buildAnyExt(LLT::scalar(32), MI.getOperand(2).getReg());

    MRI.setRegBank(Ext.getReg(0), getRegBank(AArch64::GPRRegBankID));

    MI.getOperand(2).setReg(Ext.getReg(0));

    return applyDefaultMapping(OpdMapper);

  }

  default:

    llvm_unreachable("Don't know how to handle that operation");

  }

}


const RegisterBankInfo::InstructionMapping &

AArch64RegisterBankInfo::getSameKindOfOperandsMapping(

    const MachineInstr &MI) const {

  const unsigned Opc = MI.getOpcode();

  const MachineFunction &MF = *MI.getParent()->getParent();

  const MachineRegisterInfo &MRI = MF.getRegInfo();


  unsigned NumOperands = MI.getNumOperands();

  assert(NumOperands <= 3 &&

         "This code is for instructions with 3 or less operands");


  LLT Ty = MRI.getType(MI.getOperand(0).getReg());

  TypeSize Size = Ty.getSizeInBits();

  bool IsFPR = Ty.isVector() || isPreISelGenericFloatingPointOpcode(Opc);


  PartialMappingIdx RBIdx = IsFPR ? PMI_FirstFPR : PMI_FirstGPR;


#ifndef NDEBUG

  // Make sure all the operands are using similar size and type.

  // Should probably be checked by the machine verifier.

  // This code won't catch cases where the number of lanes is

  // different between the operands.

  // If we want to go to that level of details, it is probably

  // best to check that the types are the same, period.

  // Currently, we just check that the register banks are the same

  // for each types.

  for (unsigned Idx = 1; Idx != NumOperands; ++Idx) {

    LLT OpTy = MRI.getType(MI.getOperand(Idx).getReg());

    assert(

        AArch64GenRegisterBankInfo::getRegBankBaseIdxOffset(

            RBIdx, OpTy.getSizeInBits()) ==

            AArch64GenRegisterBankInfo::getRegBankBaseIdxOffset(RBIdx, Size) &&

        "Operand has incompatible size");

    bool OpIsFPR = OpTy.isVector() || isPreISelGenericFloatingPointOpcode(Opc);

    (void)OpIsFPR;

    assert(IsFPR == OpIsFPR && "Operand has incompatible type");

  }

#endif // End NDEBUG.


  return getInstructionMapping(DefaultMappingID, 1,

                               getValueMapping(RBIdx, Size), NumOperands);

}


/// \returns true if a given intrinsic only uses and defines FPRs.

static bool isFPIntrinsic(const MachineRegisterInfo &MRI,

                          const MachineInstr &MI) {

  // TODO: Add more intrinsics.

  switch (cast<GIntrinsic>(MI).getIntrinsicID()) {

  default:

    return false;

  case Intrinsic::aarch64_neon_uaddlv:

  case Intrinsic::aarch64_neon_uaddv:

  case Intrinsic::aarch64_neon_saddv:

  case Intrinsic::aarch64_neon_umaxv:

  case Intrinsic::aarch64_neon_smaxv:

  case Intrinsic::aarch64_neon_uminv:

  case Intrinsic::aarch64_neon_sminv:

  case Intrinsic::aarch64_neon_faddv:

  case Intrinsic::aarch64_neon_fmaxv:

  case Intrinsic::aarch64_neon_fminv:

  case Intrinsic::aarch64_neon_fmaxnmv:

  case Intrinsic::aarch64_neon_fminnmv:

    return true;

  case Intrinsic::aarch64_neon_saddlv: {

    const LLT SrcTy = MRI.getType(MI.getOperand(2).getReg());

    return SrcTy.getElementType().getSizeInBits() >= 16 &&

           SrcTy.getElementCount().getFixedValue() >= 4;

  }

  }

}


bool AArch64RegisterBankInfo::isPHIWithFPContraints(

    const MachineInstr &MI, const MachineRegisterInfo &MRI,

    const TargetRegisterInfo &TRI, const unsigned Depth) const {

  if (!MI.isPHI() || Depth > MaxFPRSearchDepth)

    return false;


  return any_of(MRI.use_nodbg_instructions(MI.getOperand(0).getReg()),

                [&](const MachineInstr &UseMI) {

                  if (onlyUsesFP(UseMI, MRI, TRI, Depth + 1))

                    return true;

                  return isPHIWithFPContraints(UseMI, MRI, TRI, Depth + 1);

                });

}


bool AArch64RegisterBankInfo::hasFPConstraints(const MachineInstr &MI,

                                               const MachineRegisterInfo &MRI,

                                               const TargetRegisterInfo &TRI,

                                               unsigned Depth) const {

  unsigned Op = MI.getOpcode();

  if (Op == TargetOpcode::G_INTRINSIC && isFPIntrinsic(MRI, MI))

    return true;


  // Do we have an explicit floating point instruction?

  if (isPreISelGenericFloatingPointOpcode(Op))

    return true;


  // No. Check if we have a copy-like instruction. If we do, then we could

  // still be fed by floating point instructions.

  if (Op != TargetOpcode::COPY && !MI.isPHI() &&

      !isPreISelGenericOptimizationHint(Op))

    return false;


  // Check if we already know the register bank.

  auto *RB = getRegBank(MI.getOperand(0).getReg(), MRI, TRI);

  if (RB == &AArch64::FPRRegBank)

    return true;

  if (RB == &AArch64::GPRRegBank)

    return false;


  // We don't know anything.

  //

  // If we have a phi, we may be able to infer that it will be assigned a FPR

  // based off of its inputs.

  if (!MI.isPHI() || Depth > MaxFPRSearchDepth)

    return false;


  return any_of(MI.explicit_uses(), [&](const MachineOperand &Op) {

    return Op.isReg() &&

           onlyDefinesFP(*MRI.getVRegDef(Op.getReg()), MRI, TRI, Depth + 1);

  });

}


bool AArch64RegisterBankInfo::onlyUsesFP(const MachineInstr &MI,

                                         const MachineRegisterInfo &MRI,

                                         const TargetRegisterInfo &TRI,

                                         unsigned Depth) const {

  switch (MI.getOpcode()) {

  case TargetOpcode::G_FPTOSI:

  case TargetOpcode::G_FPTOUI:

  case TargetOpcode::G_FCMP:

  case TargetOpcode::G_LROUND:

  case TargetOpcode::G_LLROUND:

    return true;

  default:

    break;

  }

  return hasFPConstraints(MI, MRI, TRI, Depth);

}


bool AArch64RegisterBankInfo::onlyDefinesFP(const MachineInstr &MI,

                                            const MachineRegisterInfo &MRI,

                                            const TargetRegisterInfo &TRI,

                                            unsigned Depth) const {

  switch (MI.getOpcode()) {

  case AArch64::G_DUP:

  case TargetOpcode::G_SITOFP:

  case TargetOpcode::G_UITOFP:

  case TargetOpcode::G_EXTRACT_VECTOR_ELT:

  case TargetOpcode::G_INSERT_VECTOR_ELT:

  case TargetOpcode::G_BUILD_VECTOR:

  case TargetOpcode::G_BUILD_VECTOR_TRUNC:

    return true;

  case TargetOpcode::G_INTRINSIC_W_SIDE_EFFECTS:

    switch (cast<GIntrinsic>(MI).getIntrinsicID()) {

    case Intrinsic::aarch64_neon_ld1x2:

    case Intrinsic::aarch64_neon_ld1x3:

    case Intrinsic::aarch64_neon_ld1x4:

    case Intrinsic::aarch64_neon_ld2:

    case Intrinsic::aarch64_neon_ld2lane:

    case Intrinsic::aarch64_neon_ld2r:

    case Intrinsic::aarch64_neon_ld3:

    case Intrinsic::aarch64_neon_ld3lane:

    case Intrinsic::aarch64_neon_ld3r:

    case Intrinsic::aarch64_neon_ld4:

    case Intrinsic::aarch64_neon_ld4lane:

    case Intrinsic::aarch64_neon_ld4r:

      return true;

    default:

      break;

    }

    break;

  default:

    break;

  }

  return hasFPConstraints(MI, MRI, TRI, Depth);

}


bool AArch64RegisterBankInfo::isLoadFromFPType(const MachineInstr &MI) const {

  // GMemOperation because we also want to match indexed loads.

  auto *MemOp = cast<GMemOperation>(&MI);

  const Value *LdVal = MemOp->getMMO().getValue();

  if (!LdVal)

    return false;


  Type *EltTy = nullptr;

  if (const GlobalValue *GV = dyn_cast<GlobalValue>(LdVal)) {

    EltTy = GV->getValueType();

    // Look at the first element of the struct to determine the type we are

    // loading

    while (StructType *StructEltTy = dyn_cast<StructType>(EltTy)) {

      if (StructEltTy->getNumElements() == 0)

        break;

      EltTy = StructEltTy->getTypeAtIndex(0U);

    }

    // Look at the first element of the array to determine its type

    if (isa<ArrayType>(EltTy))

      EltTy = EltTy->getArrayElementType();

  } else {

    // FIXME: grubbing around uses is pretty ugly, but with no more

    // `getPointerElementType` there's not much else we can do.

    for (const auto *LdUser : LdVal->users()) {

      if (isa<LoadInst>(LdUser)) {

        EltTy = LdUser->getType();

        break;

      }

      if (isa<StoreInst>(LdUser) && LdUser->getOperand(1) == LdVal) {

        EltTy = LdUser->getOperand(0)->getType();

        break;

      }

    }

  }

  return EltTy && EltTy->isFPOrFPVectorTy();

}


const RegisterBankInfo::InstructionMapping &

AArch64RegisterBankInfo::getInstrMapping(const MachineInstr &MI) const {

  const unsigned Opc = MI.getOpcode();


  // Try the default logic for non-generic instructions that are either copies

  // or already have some operands assigned to banks.

  if ((Opc != TargetOpcode::COPY && !isPreISelGenericOpcode(Opc)) ||

      Opc == TargetOpcode::G_PHI) {

    const RegisterBankInfo::InstructionMapping &Mapping =

        getInstrMappingImpl(MI);

    if (Mapping.isValid())

      return Mapping;

  }


  const MachineFunction &MF = *MI.getParent()->getParent();

  const MachineRegisterInfo &MRI = MF.getRegInfo();

  const TargetSubtargetInfo &STI = MF.getSubtarget();

  const TargetRegisterInfo &TRI = *STI.getRegisterInfo();


  switch (Opc) {

    // G_{F|S|U}REM are not listed because they are not legal.

    // Arithmetic ops.

  case TargetOpcode::G_ADD:

  case TargetOpcode::G_SUB:

  case TargetOpcode::G_PTR_ADD:

  case TargetOpcode::G_MUL:

  case TargetOpcode::G_SDIV:

  case TargetOpcode::G_UDIV:

    // Bitwise ops.

  case TargetOpcode::G_AND:

  case TargetOpcode::G_OR:

  case TargetOpcode::G_XOR:

    // Floating point ops.

  case TargetOpcode::G_FADD:

  case TargetOpcode::G_FSUB:

  case TargetOpcode::G_FMUL:

  case TargetOpcode::G_FDIV:

  case TargetOpcode::G_FMAXIMUM:

  case TargetOpcode::G_FMINIMUM:

    return getSameKindOfOperandsMapping(MI);

  case TargetOpcode::G_FPEXT: {

    LLT DstTy = MRI.getType(MI.getOperand(0).getReg());

    LLT SrcTy = MRI.getType(MI.getOperand(1).getReg());

    return getInstructionMapping(

        DefaultMappingID, /*Cost*/ 1,

        getFPExtMapping(DstTy.getSizeInBits(), SrcTy.getSizeInBits()),

        /*NumOperands*/ 2);

  }

    // Shifts.

  case TargetOpcode::G_SHL:

  case TargetOpcode::G_LSHR:

  case TargetOpcode::G_ASHR: {

    LLT ShiftAmtTy = MRI.getType(MI.getOperand(2).getReg());

    LLT SrcTy = MRI.getType(MI.getOperand(1).getReg());

    if (ShiftAmtTy.getSizeInBits() == 64 && SrcTy.getSizeInBits() == 32)

      return getInstructionMapping(DefaultMappingID, 1,

                                   &ValMappings[Shift64Imm], 3);

    return getSameKindOfOperandsMapping(MI);

  }

  case TargetOpcode::COPY: {

    Register DstReg = MI.getOperand(0).getReg();

    Register SrcReg = MI.getOperand(1).getReg();

    // Check if one of the register is not a generic register.

    if ((DstReg.isPhysical() || !MRI.getType(DstReg).isValid()) ||

        (SrcReg.isPhysical() || !MRI.getType(SrcReg).isValid())) {

      const RegisterBank *DstRB = getRegBank(DstReg, MRI, TRI);

      const RegisterBank *SrcRB = getRegBank(SrcReg, MRI, TRI);

      if (!DstRB)

        DstRB = SrcRB;

      else if (!SrcRB)

        SrcRB = DstRB;

      // If both RB are null that means both registers are generic.

      // We shouldn't be here.

      assert(DstRB && SrcRB && "Both RegBank were nullptr");

      TypeSize Size = getSizeInBits(DstReg, MRI, TRI);

      return getInstructionMapping(

          DefaultMappingID, copyCost(*DstRB, *SrcRB, Size),

          getCopyMapping(DstRB->getID(), SrcRB->getID(), Size),

          // We only care about the mapping of the destination.

          /*NumOperands*/ 1);

    }

    // Both registers are generic, use G_BITCAST.

    [[fallthrough]];

  }

  case TargetOpcode::G_BITCAST: {

    LLT DstTy = MRI.getType(MI.getOperand(0).getReg());

    LLT SrcTy = MRI.getType(MI.getOperand(1).getReg());

    TypeSize Size = DstTy.getSizeInBits();

    bool DstIsGPR = !DstTy.isVector() && DstTy.getSizeInBits() <= 64;

    bool SrcIsGPR = !SrcTy.isVector() && SrcTy.getSizeInBits() <= 64;

    const RegisterBank &DstRB =

        DstIsGPR ? AArch64::GPRRegBank : AArch64::FPRRegBank;

    const RegisterBank &SrcRB =

        SrcIsGPR ? AArch64::GPRRegBank : AArch64::FPRRegBank;

    return getInstructionMapping(

        DefaultMappingID, copyCost(DstRB, SrcRB, Size),

        getCopyMapping(DstRB.getID(), SrcRB.getID(), Size),

        // We only care about the mapping of the destination for COPY.

        /*NumOperands*/ Opc == TargetOpcode::G_BITCAST ? 2 : 1);

  }

  default:

    break;

  }


  unsigned NumOperands = MI.getNumOperands();

  unsigned MappingID = DefaultMappingID;


  // Track the size and bank of each register.  We don't do partial mappings.

  SmallVector<unsigned, 4> OpSize(NumOperands);

  SmallVector<PartialMappingIdx, 4> OpRegBankIdx(NumOperands);

  for (unsigned Idx = 0; Idx < NumOperands; ++Idx) {

    auto &MO = MI.getOperand(Idx);

    if (!MO.isReg() || !MO.getReg())

      continue;


    LLT Ty = MRI.getType(MO.getReg());

    if (!Ty.isValid())

      continue;

    OpSize[Idx] = Ty.getSizeInBits().getKnownMinValue();


    // As a top-level guess, vectors including both scalable and non-scalable

    // ones go in FPRs, scalars and pointers in GPRs.

    // For floating-point instructions, scalars go in FPRs.

    if (Ty.isVector())

      OpRegBankIdx[Idx] = PMI_FirstFPR;

    else if (isPreISelGenericFloatingPointOpcode(Opc) ||

             Ty.getSizeInBits() > 64)

      OpRegBankIdx[Idx] = PMI_FirstFPR;

    else

      OpRegBankIdx[Idx] = PMI_FirstGPR;

  }


  unsigned Cost = 1;

  // Some of the floating-point instructions have mixed GPR and FPR operands:

  // fine-tune the computed mapping.

  switch (Opc) {

  case AArch64::G_DUP: {

    Register ScalarReg = MI.getOperand(1).getReg();

    LLT ScalarTy = MRI.getType(ScalarReg);

    auto ScalarDef = MRI.getVRegDef(ScalarReg);

    // We want to select dup(load) into LD1R.

    if (ScalarDef->getOpcode() == TargetOpcode::G_LOAD)

      OpRegBankIdx = {PMI_FirstFPR, PMI_FirstFPR};

    // s8 is an exception for G_DUP, which we always want on gpr.

    else if (ScalarTy.getSizeInBits() != 8 &&

             (getRegBank(ScalarReg, MRI, TRI) == &AArch64::FPRRegBank ||

              onlyDefinesFP(*ScalarDef, MRI, TRI)))

      OpRegBankIdx = {PMI_FirstFPR, PMI_FirstFPR};

    else

      OpRegBankIdx = {PMI_FirstFPR, PMI_FirstGPR};

    break;

  }

  case TargetOpcode::G_TRUNC: {

    LLT SrcTy = MRI.getType(MI.getOperand(1).getReg());

    if (!SrcTy.isVector() && SrcTy.getSizeInBits() == 128)

      OpRegBankIdx = {PMI_FirstFPR, PMI_FirstFPR};

    break;

  }

  case TargetOpcode::G_SITOFP:

  case TargetOpcode::G_UITOFP: {

    if (MRI.getType(MI.getOperand(0).getReg()).isVector())

      break;

    // Integer to FP conversions don't necessarily happen between GPR -> FPR

    // regbanks. They can also be done within an FPR register.

    Register SrcReg = MI.getOperand(1).getReg();

    if (getRegBank(SrcReg, MRI, TRI) == &AArch64::FPRRegBank)

      OpRegBankIdx = {PMI_FirstFPR, PMI_FirstFPR};

    else

      OpRegBankIdx = {PMI_FirstFPR, PMI_FirstGPR};

    break;

  }

  case TargetOpcode::G_FPTOSI:

  case TargetOpcode::G_FPTOUI:

  case TargetOpcode::G_INTRINSIC_LRINT:

  case TargetOpcode::G_INTRINSIC_LLRINT:

    if (MRI.getType(MI.getOperand(0).getReg()).isVector())

      break;

    OpRegBankIdx = {PMI_FirstGPR, PMI_FirstFPR};

    break;

  case TargetOpcode::G_FCMP: {

    // If the result is a vector, it must use a FPR.

    AArch64GenRegisterBankInfo::PartialMappingIdx Idx0 =

        MRI.getType(MI.getOperand(0).getReg()).isVector() ? PMI_FirstFPR

                                                          : PMI_FirstGPR;

    OpRegBankIdx = {Idx0,

                    /* Predicate */ PMI_None, PMI_FirstFPR, PMI_FirstFPR};

    break;

  }

  case TargetOpcode::G_BITCAST:

    // This is going to be a cross register bank copy and this is expensive.

    if (OpRegBankIdx[0] != OpRegBankIdx[1])

      Cost = copyCost(

          *AArch64GenRegisterBankInfo::PartMappings[OpRegBankIdx[0]].RegBank,

          *AArch64GenRegisterBankInfo::PartMappings[OpRegBankIdx[1]].RegBank,

          TypeSize::getFixed(OpSize[0]));

    break;

  case TargetOpcode::G_LOAD: {

    // Loading in vector unit is slightly more expensive.

    // This is actually only true for the LD1R and co instructions,

    // but anyway for the fast mode this number does not matter and

    // for the greedy mode the cost of the cross bank copy will

    // offset this number.

    // FIXME: Should be derived from the scheduling model.

    if (OpRegBankIdx[0] != PMI_FirstGPR) {

      Cost = 2;

      break;

    }


    if (cast<GLoad>(MI).isAtomic()) {

      // Atomics always use GPR destinations. Don't refine any further.

      OpRegBankIdx[0] = PMI_FirstGPR;

      break;

    }


    // Try to guess the type of the load from the MMO.

    if (isLoadFromFPType(MI)) {

      OpRegBankIdx[0] = PMI_FirstFPR;

      break;

    }


    // Check if that load feeds fp instructions.

    // In that case, we want the default mapping to be on FPR

    // instead of blind map every scalar to GPR.

    if (any_of(MRI.use_nodbg_instructions(MI.getOperand(0).getReg()),

               [&](const MachineInstr &UseMI) {

                 // If we have at least one direct or indirect use

                 // in a FP instruction,

                 // assume this was a floating point load in the IR. If it was

                 // not, we would have had a bitcast before reaching that

                 // instruction.

                 //

                 // Int->FP conversion operations are also captured in

                 // onlyDefinesFP().


                 if (isPHIWithFPContraints(UseMI, MRI, TRI))

                   return true;


                 return onlyUsesFP(UseMI, MRI, TRI) ||

                        onlyDefinesFP(UseMI, MRI, TRI);

               }))

      OpRegBankIdx[0] = PMI_FirstFPR;

    break;

  }

  case TargetOpcode::G_STORE:

    // Check if that store is fed by fp instructions.

    if (OpRegBankIdx[0] == PMI_FirstGPR) {

      Register VReg = MI.getOperand(0).getReg();

      if (!VReg)

        break;

      MachineInstr *DefMI = MRI.getVRegDef(VReg);

      if (onlyDefinesFP(*DefMI, MRI, TRI))

        OpRegBankIdx[0] = PMI_FirstFPR;

      break;

    }

    break;

  case TargetOpcode::G_INDEXED_STORE:

    if (OpRegBankIdx[1] == PMI_FirstGPR) {

      Register VReg = MI.getOperand(1).getReg();

      if (!VReg)

        break;

      MachineInstr *DefMI = MRI.getVRegDef(VReg);

      if (onlyDefinesFP(*DefMI, MRI, TRI))

        OpRegBankIdx[1] = PMI_FirstFPR;

      break;

    }

    break;

  case TargetOpcode::G_INDEXED_SEXTLOAD:

  case TargetOpcode::G_INDEXED_ZEXTLOAD:

    // These should always be GPR.

    OpRegBankIdx[0] = PMI_FirstGPR;

    break;

  case TargetOpcode::G_INDEXED_LOAD: {

    if (isLoadFromFPType(MI))

      OpRegBankIdx[0] = PMI_FirstFPR;

    break;

  }

  case TargetOpcode::G_SELECT: {

    // If the destination is FPR, preserve that.

    if (OpRegBankIdx[0] != PMI_FirstGPR)

      break;


    // If we're taking in vectors, we have no choice but to put everything on

    // FPRs, except for the condition. The condition must always be on a GPR.

    LLT SrcTy = MRI.getType(MI.getOperand(2).getReg());

    if (SrcTy.isVector()) {

      OpRegBankIdx = {PMI_FirstFPR, PMI_FirstGPR, PMI_FirstFPR, PMI_FirstFPR};

      break;

    }


    // Try to minimize the number of copies. If we have more floating point

    // constrained values than not, then we'll put everything on FPR. Otherwise,

    // everything has to be on GPR.

    unsigned NumFP = 0;


    // Check if the uses of the result always produce floating point values.

    //

    // For example:

    //

    // %z = G_SELECT %cond %x %y

    // fpr = G_FOO %z ...

    if (any_of(MRI.use_nodbg_instructions(MI.getOperand(0).getReg()),

               [&](MachineInstr &MI) { return onlyUsesFP(MI, MRI, TRI); }))

      ++NumFP;


    // Check if the defs of the source values always produce floating point

    // values.

    //

    // For example:

    //

    // %x = G_SOMETHING_ALWAYS_FLOAT %a ...

    // %z = G_SELECT %cond %x %y

    //

    // Also check whether or not the sources have already been decided to be

    // FPR. Keep track of this.

    //

    // This doesn't check the condition, since it's just whatever is in NZCV.

    // This isn't passed explicitly in a register to fcsel/csel.

    for (unsigned Idx = 2; Idx < 4; ++Idx) {

      Register VReg = MI.getOperand(Idx).getReg();

      MachineInstr *DefMI = MRI.getVRegDef(VReg);

      if (getRegBank(VReg, MRI, TRI) == &AArch64::FPRRegBank ||

          onlyDefinesFP(*DefMI, MRI, TRI))

        ++NumFP;

    }


    // If we have more FP constraints than not, then move everything over to

    // FPR.

    if (NumFP >= 2)

      OpRegBankIdx = {PMI_FirstFPR, PMI_FirstGPR, PMI_FirstFPR, PMI_FirstFPR};


    break;

  }

  case TargetOpcode::G_UNMERGE_VALUES: {

    // If the first operand belongs to a FPR register bank, then make sure that

    // we preserve that.

    if (OpRegBankIdx[0] != PMI_FirstGPR)

      break;


    LLT SrcTy = MRI.getType(MI.getOperand(MI.getNumOperands()-1).getReg());

    // UNMERGE into scalars from a vector should always use FPR.

    // Likewise if any of the uses are FP instructions.

    if (SrcTy.isVector() || SrcTy == LLT::scalar(128) ||

        any_of(MRI.use_nodbg_instructions(MI.getOperand(0).getReg()),

               [&](MachineInstr &MI) { return onlyUsesFP(MI, MRI, TRI); })) {

      // Set the register bank of every operand to FPR.

      for (unsigned Idx = 0, NumOperands = MI.getNumOperands();

           Idx < NumOperands; ++Idx)

        OpRegBankIdx[Idx] = PMI_FirstFPR;

    }

    break;

  }

  case TargetOpcode::G_EXTRACT_VECTOR_ELT:

    // Destination and source need to be FPRs.

    OpRegBankIdx[0] = PMI_FirstFPR;

    OpRegBankIdx[1] = PMI_FirstFPR;


    // Index needs to be a GPR.

    OpRegBankIdx[2] = PMI_FirstGPR;

    break;

  case TargetOpcode::G_INSERT_VECTOR_ELT:

    OpRegBankIdx[0] = PMI_FirstFPR;

    OpRegBankIdx[1] = PMI_FirstFPR;


    // The element may be either a GPR or FPR. Preserve that behaviour.

    if (getRegBank(MI.getOperand(2).getReg(), MRI, TRI) == &AArch64::FPRRegBank)

      OpRegBankIdx[2] = PMI_FirstFPR;

    else {

      // If the type is i8/i16, and the regank will be GPR, then we change the

      // type to i32 in applyMappingImpl.

      LLT Ty = MRI.getType(MI.getOperand(2).getReg());

      if (Ty.getSizeInBits() == 8 || Ty.getSizeInBits() == 16)

        MappingID = 1;

      OpRegBankIdx[2] = PMI_FirstGPR;

    }


    // Index needs to be a GPR.

    OpRegBankIdx[3] = PMI_FirstGPR;

    break;

  case TargetOpcode::G_EXTRACT: {

    // For s128 sources we have to use fpr unless we know otherwise.

    auto Src = MI.getOperand(1).getReg();

    LLT SrcTy = MRI.getType(MI.getOperand(1).getReg());

    if (SrcTy.getSizeInBits() != 128)

      break;

    auto Idx = MRI.getRegClassOrNull(Src) == &AArch64::XSeqPairsClassRegClass

                   ? PMI_FirstGPR

                   : PMI_FirstFPR;

    OpRegBankIdx[0] = Idx;

    OpRegBankIdx[1] = Idx;

    break;

  }

  case TargetOpcode::G_BUILD_VECTOR: {

    // If the first source operand belongs to a FPR register bank, then make

    // sure that we preserve that.

    if (OpRegBankIdx[1] != PMI_FirstGPR)

      break;

    Register VReg = MI.getOperand(1).getReg();

    if (!VReg)

      break;


    // Get the instruction that defined the source operand reg, and check if

    // it's a floating point operation. Or, if it's a type like s16 which

    // doesn't have a exact size gpr register class. The exception is if the

    // build_vector has all constant operands, which may be better to leave as

    // gpr without copies, so it can be matched in imported patterns.

    MachineInstr *DefMI = MRI.getVRegDef(VReg);

    unsigned DefOpc = DefMI->getOpcode();

    const LLT SrcTy = MRI.getType(VReg);

    if (all_of(MI.operands(), [&](const MachineOperand &Op) {

          return Op.isDef() || MRI.getVRegDef(Op.getReg())->getOpcode() ==

                                   TargetOpcode::G_CONSTANT;

        }))

      break;

    if (isPreISelGenericFloatingPointOpcode(DefOpc) ||

        SrcTy.getSizeInBits() < 32 ||

        getRegBank(VReg, MRI, TRI) == &AArch64::FPRRegBank) {

      // Have a floating point op.

      // Make sure every operand gets mapped to a FPR register class.

      unsigned NumOperands = MI.getNumOperands();

      for (unsigned Idx = 0; Idx < NumOperands; ++Idx)

        OpRegBankIdx[Idx] = PMI_FirstFPR;

    }

    break;

  }

  case TargetOpcode::G_VECREDUCE_FADD:

  case TargetOpcode::G_VECREDUCE_FMUL:

  case TargetOpcode::G_VECREDUCE_FMAX:

  case TargetOpcode::G_VECREDUCE_FMIN:

  case TargetOpcode::G_VECREDUCE_FMAXIMUM:

  case TargetOpcode::G_VECREDUCE_FMINIMUM:

  case TargetOpcode::G_VECREDUCE_ADD:

  case TargetOpcode::G_VECREDUCE_MUL:

  case TargetOpcode::G_VECREDUCE_AND:

  case TargetOpcode::G_VECREDUCE_OR:

  case TargetOpcode::G_VECREDUCE_XOR:

  case TargetOpcode::G_VECREDUCE_SMAX:

  case TargetOpcode::G_VECREDUCE_SMIN:

  case TargetOpcode::G_VECREDUCE_UMAX:

  case TargetOpcode::G_VECREDUCE_UMIN:

    // Reductions produce a scalar value from a vector, the scalar should be on

    // FPR bank.

    OpRegBankIdx = {PMI_FirstFPR, PMI_FirstFPR};

    break;

  case TargetOpcode::G_VECREDUCE_SEQ_FADD:

  case TargetOpcode::G_VECREDUCE_SEQ_FMUL:

    // These reductions also take a scalar accumulator input.

    // Assign them FPR for now.

    OpRegBankIdx = {PMI_FirstFPR, PMI_FirstFPR, PMI_FirstFPR};

    break;

  case TargetOpcode::G_INTRINSIC:

  case TargetOpcode::G_INTRINSIC_W_SIDE_EFFECTS: {

    // Check if we know that the intrinsic has any constraints on its register

    // banks. If it does, then update the mapping accordingly.

    unsigned Idx = 0;

    if (onlyDefinesFP(MI, MRI, TRI))

      for (const auto &Op : MI.defs()) {

        if (Op.isReg())

          OpRegBankIdx[Idx] = PMI_FirstFPR;

        ++Idx;

      }

    else

      Idx += MI.getNumExplicitDefs();


    if (onlyUsesFP(MI, MRI, TRI))

      for (const auto &Op : MI.explicit_uses()) {

        if (Op.isReg())

          OpRegBankIdx[Idx] = PMI_FirstFPR;

        ++Idx;

      }

    break;

  }

  case TargetOpcode::G_LROUND:

  case TargetOpcode::G_LLROUND: {

    // Source is always floating point and destination is always integer.

    OpRegBankIdx = {PMI_FirstGPR, PMI_FirstFPR};

    break;

  }

  }


  // Finally construct the computed mapping.

  SmallVector<const ValueMapping *, 8> OpdsMapping(NumOperands);

  for (unsigned Idx = 0; Idx < NumOperands; ++Idx) {

    if (MI.getOperand(Idx).isReg() && MI.getOperand(Idx).getReg()) {

      LLT Ty = MRI.getType(MI.getOperand(Idx).getReg());

      if (!Ty.isValid())

        continue;

      auto Mapping =

          getValueMapping(OpRegBankIdx[Idx], TypeSize::getFixed(OpSize[Idx]));

      if (!Mapping->isValid())

        return getInvalidInstructionMapping();


      OpdsMapping[Idx] = Mapping;

    }

  }


  return getInstructionMapping(MappingID, Cost, getOperandsMapping(OpdsMapping),

                               NumOperands);

}

MRI
unsigned const MachineRegisterInfo * MRI
Definition: AArch64AdvSIMDScalarPass.cpp:105

UseMI
MachineInstrBuilder & UseMI
Definition: AArch64ExpandPseudoInsts.cpp:110

DefMI
MachineInstrBuilder MachineInstrBuilder & DefMI
Definition: AArch64ExpandPseudoInsts.cpp:111

getIntrinsicID
static unsigned getIntrinsicID(const SDNode *N)
Definition: AArch64ISelLowering.cpp:7145

AArch64MCTargetDesc.h

CHECK_VALUEMAP
#define CHECK_VALUEMAP(RBName, Size)

isFPIntrinsic
static bool isFPIntrinsic(const MachineRegisterInfo &MRI, const MachineInstr &MI)
Definition: AArch64RegisterBankInfo.cpp:476

CHECK_VALUEMAP_3OPS
#define CHECK_VALUEMAP_3OPS(RBName, Size)

CHECK_PARTIALMAP
#define CHECK_PARTIALMAP(Idx, ValStartIdx, ValLength, RB)

CHECK_VALUEMAP_CROSSREGCPY
#define CHECK_VALUEMAP_CROSSREGCPY(RBNameDst, RBNameSrc, Size)

CHECK_VALUEMAP_FPEXT
#define CHECK_VALUEMAP_FPEXT(DstSize, SrcSize)

AArch64RegisterBankInfo.h
This file declares the targeting of the RegisterBankInfo class for AArch64.

AArch64RegisterInfo.h

B
static GCRegistry::Add< OcamlGC > B("ocaml", "ocaml 3.10-compatible GC")

A
static GCRegistry::Add< ErlangGC > A("erlang", "erlang-compatible garbage collector")

Utils.h

Idx
Returns the sub type a function will return at a given Idx Should correspond to the result type of an ExtractValue instruction executed with just that one unsigned Idx
Definition: DeadArgumentElimination.cpp:352

Size
uint64_t Size
Definition: ELFObjHandler.cpp:81

GenericMachineInstrs.h
Declares convenience wrapper classes for interpreting MachineInstr instances as specific generic oper...

MI
IRTranslator LLVM IR MI
Definition: IRTranslator.cpp:113

LowLevelTypeUtils.h
Implement a low-level type suitable for MachineInstr level instruction selection.

MachineFunction.h

MachineIRBuilder.h
This file declares the MachineIRBuilder class.

MachineInstr.h

MachineOperand.h

MachineRegisterInfo.h

TRI
unsigned const TargetRegisterInfo * TRI
Definition: MachineSink.cpp:1928

verify
ppc ctr loops verify
Definition: PPCCTRLoopsVerify.cpp:74

FPR
static const MCPhysReg FPR[]
FPR - The set of FP registers that should be allocated for arguments on Darwin and AIX.
Definition: PPCISelLowering.cpp:4096

RegisterBankInfo.h

RegisterBank.h

assert
assert(ImpDefSCC.getReg()==AMDGPU::SCC &&ImpDefSCC.isDef())

STLExtras.h
This file contains some templates that are useful if you are working with the STL at all.

SmallVector.h
This file defines the SmallVector class.

TargetOpcodes.h

TargetRegisterInfo.h

TargetSubtargetInfo.h

Threading.h

llvm::AArch64GenRegisterBankInfo::PartialMappingIdx
PartialMappingIdx
Definition: AArch64RegisterBankInfo.h:28

llvm::AArch64GenRegisterBankInfo::PMI_FPR64
@ PMI_FPR64
Definition: AArch64RegisterBankInfo.h:32

llvm::AArch64GenRegisterBankInfo::PMI_GPR64
@ PMI_GPR64
Definition: AArch64RegisterBankInfo.h:37

llvm::AArch64GenRegisterBankInfo::PMI_GPR32
@ PMI_GPR32
Definition: AArch64RegisterBankInfo.h:36

llvm::AArch64GenRegisterBankInfo::PMI_GPR128
@ PMI_GPR128
Definition: AArch64RegisterBankInfo.h:38

llvm::AArch64GenRegisterBankInfo::PMI_FirstFPR
@ PMI_FirstFPR
Definition: AArch64RegisterBankInfo.h:41

llvm::AArch64GenRegisterBankInfo::PMI_FPR32
@ PMI_FPR32
Definition: AArch64RegisterBankInfo.h:31

llvm::AArch64GenRegisterBankInfo::PMI_FirstGPR
@ PMI_FirstGPR
Definition: AArch64RegisterBankInfo.h:39

llvm::AArch64GenRegisterBankInfo::PMI_FPR128
@ PMI_FPR128
Definition: AArch64RegisterBankInfo.h:33

llvm::AArch64GenRegisterBankInfo::PMI_FPR16
@ PMI_FPR16
Definition: AArch64RegisterBankInfo.h:30

llvm::AArch64GenRegisterBankInfo::PMI_FPR256
@ PMI_FPR256
Definition: AArch64RegisterBankInfo.h:34

llvm::AArch64GenRegisterBankInfo::PMI_LastGPR
@ PMI_LastGPR
Definition: AArch64RegisterBankInfo.h:40

llvm::AArch64GenRegisterBankInfo::PMI_None
@ PMI_None
Definition: AArch64RegisterBankInfo.h:29

llvm::AArch64GenRegisterBankInfo::PMI_FPR512
@ PMI_FPR512
Definition: AArch64RegisterBankInfo.h:35

llvm::AArch64GenRegisterBankInfo::PMI_LastFPR
@ PMI_LastFPR
Definition: AArch64RegisterBankInfo.h:42

llvm::AArch64GenRegisterBankInfo::getRegBankBaseIdxOffset
static unsigned getRegBankBaseIdxOffset(unsigned RBIdx, TypeSize Size)

llvm::AArch64GenRegisterBankInfo::getCopyMapping
static const RegisterBankInfo::ValueMapping * getCopyMapping(unsigned DstBankID, unsigned SrcBankID, TypeSize Size)
Get the pointer to the ValueMapping of the operands of a copy instruction from the SrcBankID register...

llvm::AArch64GenRegisterBankInfo::checkPartialMappingIdx
static bool checkPartialMappingIdx(PartialMappingIdx FirstAlias, PartialMappingIdx LastAlias, ArrayRef< PartialMappingIdx > Order)

llvm::AArch64GenRegisterBankInfo::Shift64Imm
@ Shift64Imm
Definition: AArch64RegisterBankInfo.h:62

llvm::AArch64GenRegisterBankInfo::PartMappings
static const RegisterBankInfo::PartialMapping PartMappings[]
Definition: AArch64RegisterBankInfo.h:46

llvm::AArch64GenRegisterBankInfo::getFPExtMapping
static const RegisterBankInfo::ValueMapping * getFPExtMapping(unsigned DstSize, unsigned SrcSize)
Get the instruction mapping for G_FPEXT.

llvm::AArch64GenRegisterBankInfo::getValueMapping
static const RegisterBankInfo::ValueMapping * getValueMapping(PartialMappingIdx RBIdx, TypeSize Size)
Get the pointer to the ValueMapping representing the RegisterBank at RBIdx with a size of Size.

llvm::AArch64GenRegisterBankInfo::ValMappings
static const RegisterBankInfo::ValueMapping ValMappings[]
Definition: AArch64RegisterBankInfo.h:47

llvm::AArch64RegisterBankInfo::getRegBankFromRegClass
const RegisterBank & getRegBankFromRegClass(const TargetRegisterClass &RC, LLT) const override
Get a register bank that covers RC.
Definition: AArch64RegisterBankInfo.cpp:242

llvm::AArch64RegisterBankInfo::getInstrAlternativeMappings
InstructionMappings getInstrAlternativeMappings(const MachineInstr &MI) const override
Get the alternative mappings for MI.
Definition: AArch64RegisterBankInfo.cpp:298

llvm::AArch64RegisterBankInfo::copyCost
unsigned copyCost(const RegisterBank &A, const RegisterBank &B, TypeSize Size) const override
Get the cost of a copy from B to A, or put differently, get the cost of A = COPY B.
Definition: AArch64RegisterBankInfo.cpp:220

llvm::AArch64RegisterBankInfo::AArch64RegisterBankInfo
AArch64RegisterBankInfo(const TargetRegisterInfo &TRI)
Definition: AArch64RegisterBankInfo.cpp:46

llvm::AArch64RegisterBankInfo::getInstrMapping
const InstructionMapping & getInstrMapping(const MachineInstr &MI) const override
Get the mapping of the different operands of MI on the register bank.
Definition: AArch64RegisterBankInfo.cpp:648

llvm::DWARFExpression::Operation
This class represents an Operation in the Expression.
Definition: DWARFExpression.h:32

llvm::GlobalValue
Definition: GlobalValue.h:48

llvm::InstructionCost
Definition: InstructionCost.h:29

llvm::LLT
Definition: LowLevelType.h:39

llvm::LLT::scalar
static constexpr LLT scalar(unsigned SizeInBits)
Get a low-level scalar or aggregate "bag of bits".
Definition: LowLevelType.h:42

llvm::LLT::isValid
constexpr bool isValid() const
Definition: LowLevelType.h:145

llvm::LLT::isVector
constexpr bool isVector() const
Definition: LowLevelType.h:148

llvm::LLT::getSizeInBits
constexpr TypeSize getSizeInBits() const
Returns the total size of the type. Must only be called on sized types.
Definition: LowLevelType.h:193

llvm::LLT::getElementType
constexpr LLT getElementType() const
Returns the vector's element type. Only valid for vector types.
Definition: LowLevelType.h:290

llvm::LLT::getElementCount
constexpr ElementCount getElementCount() const
Definition: LowLevelType.h:184

llvm::MachineFunction
Definition: MachineFunction.h:258

llvm::MachineFunction::getSubtarget
const TargetSubtargetInfo & getSubtarget() const
getSubtarget - Return the subtarget for which this machine code is being compiled.
Definition: MachineFunction.h:717

llvm::MachineFunction::getRegInfo
MachineRegisterInfo & getRegInfo()
getRegInfo - Return information about the registers currently in use.
Definition: MachineFunction.h:727

llvm::MachineIRBuilder
Helper class to build MachineInstr.
Definition: MachineIRBuilder.h:224

llvm::MachineIRBuilder::setInsertPt
void setInsertPt(MachineBasicBlock &MBB, MachineBasicBlock::iterator II)
Set the insertion point before the specified position.
Definition: MachineIRBuilder.h:327

llvm::MachineIRBuilder::buildAnyExt
MachineInstrBuilder buildAnyExt(const DstOp &Res, const SrcOp &Op)
Build and insert Res = G_ANYEXT Op0.
Definition: MachineIRBuilder.cpp:495

llvm::MachineInstr
Representation of each machine instruction.
Definition: MachineInstr.h:69

llvm::MachineInstr::getOpcode
unsigned getOpcode() const
Returns the opcode of this MachineInstr.
Definition: MachineInstr.h:569

llvm::MachineOperand
MachineOperand class - Representation of each machine instruction operand.
Definition: MachineOperand.h:48

llvm::MachineRegisterInfo
MachineRegisterInfo - Keep track of information for virtual and physical registers,...
Definition: MachineRegisterInfo.h:51

llvm::RegisterBankInfo::InstructionMapping
Helper class that represents how the value of an instruction may be mapped and what is the related co...
Definition: RegisterBankInfo.h:191

llvm::RegisterBankInfo::InstructionMapping::isValid
bool isValid() const
Check whether this object is valid.
Definition: RegisterBankInfo.h:255

llvm::RegisterBankInfo::getInstrAlternativeMappings
virtual InstructionMappings getInstrAlternativeMappings(const MachineInstr &MI) const
Get the alternative mappings for MI.
Definition: RegisterBankInfo.cpp:435

llvm::RegisterBankInfo::getInstructionMapping
const InstructionMapping & getInstructionMapping(unsigned ID, unsigned Cost, const ValueMapping *OperandsMapping, unsigned NumOperands) const
Method to get a uniquely generated InstructionMapping.
Definition: RegisterBankInfo.h:534

llvm::RegisterBankInfo::applyDefaultMapping
static void applyDefaultMapping(const OperandsMapper &OpdMapper)
Helper method to apply something that is like the default mapping.
Definition: RegisterBankInfo.cpp:440

llvm::RegisterBankInfo::getInvalidInstructionMapping
const InstructionMapping & getInvalidInstructionMapping() const
Method to get a uniquely generated invalid InstructionMapping.
Definition: RegisterBankInfo.h:542

llvm::RegisterBankInfo::getRegBank
const RegisterBank & getRegBank(unsigned ID)
Get the register bank identified by ID.
Definition: RegisterBankInfo.h:440

llvm::RegisterBankInfo::getMaximumSize
unsigned getMaximumSize(unsigned RegBankID) const
Get the maximum size in bits that fits in the given register bank.
Definition: RegisterBankInfo.h:590

llvm::RegisterBankInfo::getSizeInBits
TypeSize getSizeInBits(Register Reg, const MachineRegisterInfo &MRI, const TargetRegisterInfo &TRI) const
Get the size in bits of Reg.
Definition: RegisterBankInfo.cpp:499

llvm::RegisterBankInfo::getOperandsMapping
const ValueMapping * getOperandsMapping(Iterator Begin, Iterator End) const
Get the uniquely generated array of ValueMapping for the elements of between Begin and End.
Definition: RegisterBankInfo.cpp:334

llvm::RegisterBankInfo::DefaultMappingID
static const unsigned DefaultMappingID
Identifier used when the related instruction mapping instance is generated by target independent code...
Definition: RegisterBankInfo.h:672

llvm::RegisterBankInfo::copyCost
virtual unsigned copyCost(const RegisterBank &A, const RegisterBank &B, TypeSize Size) const
Get the cost of a copy from B to A, or put differently, get the cost of A = COPY B.
Definition: RegisterBankInfo.h:633

llvm::RegisterBankInfo::getInstrMappingImpl
const InstructionMapping & getInstrMappingImpl(const MachineInstr &MI) const
Try to get the mapping of MI.
Definition: RegisterBankInfo.cpp:164

llvm::RegisterBank
This class implements the register bank concept.
Definition: RegisterBank.h:28

llvm::RegisterBank::covers
bool covers(const TargetRegisterClass &RC) const
Check whether this register bank covers RC.
Definition: RegisterBank.cpp:52

llvm::RegisterBank::getID
unsigned getID() const
Get the identifier of this register bank.
Definition: RegisterBank.h:45

llvm::Register
Wrapper class representing virtual and physical registers.
Definition: Register.h:19

llvm::Register::isPhysical
constexpr bool isPhysical() const
Return true if the specified register number is in the physical register namespace.
Definition: Register.h:95

llvm::SmallVectorTemplateBase::push_back
void push_back(const T &Elt)
Definition: SmallVector.h:426

llvm::SmallVector
This is a 'vector' (really, a variable-sized array), optimized for the case when the array is small.
Definition: SmallVector.h:1209

llvm::StructType
Class to represent struct types.
Definition: DerivedTypes.h:216

llvm::TargetRegisterClass
Definition: TargetRegisterInfo.h:45

llvm::TargetRegisterClass::getID
unsigned getID() const
Return the register class ID number.
Definition: TargetRegisterInfo.h:74

llvm::TargetRegisterInfo
TargetRegisterInfo base class - We assume that the target defines a static array of TargetRegisterDes...
Definition: TargetRegisterInfo.h:238

llvm::TargetSubtargetInfo
TargetSubtargetInfo - Generic base class for all target subtargets.
Definition: TargetSubtargetInfo.h:63

llvm::TargetSubtargetInfo::getRegisterInfo
virtual const TargetRegisterInfo * getRegisterInfo() const
getRegisterInfo - If register information is available, return it.
Definition: TargetSubtargetInfo.h:128

llvm::TypeSize
Definition: TypeSize.h:334

llvm::TypeSize::getFixed
static constexpr TypeSize getFixed(ScalarTy ExactSize)
Definition: TypeSize.h:345

llvm::Type
The instances of the Type class are immutable: once they are created, they are never changed.
Definition: Type.h:45

llvm::Type::getArrayElementType
Type * getArrayElementType() const
Definition: Type.h:404

llvm::Type::isFPOrFPVectorTy
bool isFPOrFPVectorTy() const
Return true if this is a FP type or a vector of FP.
Definition: Type.h:216

llvm::Value
LLVM Value Representation.
Definition: Value.h:74

llvm::Value::users
iterator_range< user_iterator > users()
Definition: Value.h:421

llvm::details::FixedOrScalableQuantity::getFixedValue
constexpr ScalarTy getFixedValue() const
Definition: TypeSize.h:202

llvm::details::FixedOrScalableQuantity::getKnownMinValue
constexpr ScalarTy getKnownMinValue() const
Returns the minimum value this quantity can represent.
Definition: TypeSize.h:168

ErrorHandling.h

llvm_unreachable
#define llvm_unreachable(msg)
Marks that the current location is not supposed to be reachable.
Definition: ErrorHandling.h:143

llvm
This is an optimization pass for GlobalISel generic memory operations.
Definition: AddressRanges.h:18

llvm::all_of
bool all_of(R &&range, UnaryPredicate P)
Provide wrappers to std::all_of which take ranges instead of having to pass begin/end explicitly.
Definition: STLExtras.h:1722

llvm::Depth
@ Depth
Definition: SIMachineScheduler.h:36

llvm::isPreISelGenericOpcode
bool isPreISelGenericOpcode(unsigned Opcode)
Check whether the given Opcode is a generic opcode that is not supposed to appear after ISel.
Definition: TargetOpcodes.h:30

llvm::isPreISelGenericOptimizationHint
bool isPreISelGenericOptimizationHint(unsigned Opcode)
Definition: TargetOpcodes.h:42

llvm::any_of
bool any_of(R &&range, UnaryPredicate P)
Provide wrappers to std::any_of which take ranges instead of having to pass begin/end explicitly.
Definition: STLExtras.h:1729

llvm::call_once
void call_once(once_flag &flag, Function &&F, Args &&... ArgList)
Execute the function specified as a parameter once.
Definition: Threading.h:87

llvm::isPreISelGenericFloatingPointOpcode
bool isPreISelGenericFloatingPointOpcode(unsigned Opc)
Returns whether opcode Opc is a pre-isel generic floating-point opcode, having only floating-point op...
Definition: Utils.cpp:1690

llvm::MemOp
Definition: TargetLowering.h:115

llvm::once_flag
The llvm::once_flag structure.
Definition: Threading.h:68