doxygen/AMDGPUAsmBackend_8cpp_source.html

//===-- AMDGPUAsmBackend.cpp - AMDGPU Assembler Backend -------------------===//

//

// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.

// See https://llvm.org/LICENSE.txt for license information.

// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception

//

/// \file

//===----------------------------------------------------------------------===//


#include "MCTargetDesc/AMDGPUFixupKinds.h"

#include "MCTargetDesc/AMDGPUMCTargetDesc.h"

#include "Utils/AMDGPUBaseInfo.h"

#include "llvm/ADT/StringSwitch.h"

#include "llvm/BinaryFormat/ELF.h"

#include "llvm/MC/MCAsmBackend.h"

#include "llvm/MC/MCAssembler.h"

#include "llvm/MC/MCContext.h"

#include "llvm/MC/MCFixupKindInfo.h"

#include "llvm/MC/MCObjectWriter.h"

#include "llvm/MC/MCSubtargetInfo.h"

#include "llvm/MC/TargetRegistry.h"

#include "llvm/Support/EndianStream.h"

#include "llvm/TargetParser/TargetParser.h"


using namespace llvm;

using namespace llvm::AMDGPU;


namespace {


/// Assembler backend for AMDGPU.
///
/// Declares the fixup, relaxation and nop-emission hooks of MCAsmBackend that
/// are defined out of line later in this file. createObjectTargetWriter() is
/// not overridden here; it is provided by the derived ELFAMDGPUAsmBackend.
class AMDGPUAsmBackend : public MCAsmBackend {
public:
  /// Construct a little-endian backend. \p T is not used by this constructor.
  explicit AMDGPUAsmBackend(const Target &T)
      : MCAsmBackend(llvm::endianness::little) {}

  /// Number of target-specific fixup kinds (AMDGPU::NumTargetFixupKinds).
  unsigned getNumFixupKinds() const override {
    return AMDGPU::NumTargetFixupKinds;
  }

  /// Patch the bytes of \p Data addressed by \p Fixup with \p Value.
  void applyFixup(const MCAssembler &Asm, const MCFixup &Fixup,
                  const MCValue &Target, MutableArrayRef<char> Data,
                  uint64_t Value, bool IsResolved,
                  const MCSubtargetInfo *STI) const override;

  /// Whether a resolved fixup value requires the instruction to be relaxed.
  bool fixupNeedsRelaxation(const MCFixup &Fixup,
                            uint64_t Value) const override;

  /// Replace \p Inst with its relaxed form.
  void relaxInstruction(MCInst &Inst,
                        const MCSubtargetInfo &STI) const override;

  /// Whether \p Inst is a candidate for relaxation on subtarget \p STI.
  bool mayNeedRelaxation(const MCInst &Inst,
                         const MCSubtargetInfo &STI) const override;

  /// Minimum size in bytes of a nop on this target.
  unsigned getMinimumNopSize() const override;

  /// Emit \p Count bytes of padding to \p OS.
  bool writeNopData(raw_ostream &OS, uint64_t Count,
                    const MCSubtargetInfo *STI) const override;

  /// Map a relocation name to a fixup kind, if the name is known.
  std::optional<MCFixupKind> getFixupKind(StringRef Name) const override;

  /// Describe the fixup kind \p Kind (name, bit offset, bit size, flags).
  const MCFixupKindInfo &getFixupKindInfo(MCFixupKind Kind) const override;

  /// Whether \p Fixup must be emitted as a relocation even if resolvable.
  bool shouldForceRelocation(const MCAssembler &Asm, const MCFixup &Fixup,
                             const MCValue &Target,
                             const MCSubtargetInfo *STI) override;
};


} //End anonymous namespace


/// Replace \p Inst with a freshly built instruction that carries the relaxed
/// opcode returned by getSOPPWithRelaxation() and a copy of operand 0 only.
// NOTE(review): getSOPPWithRelaxation() returns int; this presumably relies on
// mayNeedRelaxation() having accepted the opcode beforehand - confirm.
void AMDGPUAsmBackend::relaxInstruction(MCInst &Inst,
                                        const MCSubtargetInfo &STI) const {
  // Resolve the replacement opcode while the original instruction is intact.
  const unsigned NewOpcode = AMDGPU::getSOPPWithRelaxation(Inst.getOpcode());

  MCInst Relaxed;
  Relaxed.setOpcode(NewOpcode);
  Relaxed.addOperand(Inst.getOperand(0));

  Inst = std::move(Relaxed);
}


/// Return true when the fixup value corresponds to a branch offset of 0x3f.
///
/// Such a branch has to be relaxed so that an s_nop 0 is placed right after
/// it, which effectively bumps the offset; this is a hardware workaround for
/// gfx1010.
bool AMDGPUAsmBackend::fixupNeedsRelaxation(const MCFixup &Fixup,
                                            uint64_t Value) const {
  const int64_t BranchOffset = int64_t(Value) / 4 - 1;
  return BranchOffset == 0x3f;
}


/// An instruction is a relaxation candidate only when the subtarget has
/// FeatureOffset3fBug and getSOPPWithRelaxation() yields a non-negative
/// opcode for it. The opcode lookup is skipped when the feature is absent.
bool AMDGPUAsmBackend::mayNeedRelaxation(const MCInst &Inst,
                                         const MCSubtargetInfo &STI) const {
  return STI.hasFeature(AMDGPU::FeatureOffset3fBug) &&
         AMDGPU::getSOPPWithRelaxation(Inst.getOpcode()) >= 0;
}


/// Return the number of bytes a fixup of kind \p Kind covers in the fragment.
/// Any kind that is not listed is treated as unreachable.
static unsigned getFixupKindNumBytes(unsigned Kind) {
  switch (Kind) {
  // One byte.
  case FK_Data_1:
  case FK_SecRel_1:
    return 1;

  // Two bytes, including the SOPP branch fixup.
  case FK_Data_2:
  case FK_SecRel_2:
  case AMDGPU::fixup_si_sopp_br:
    return 2;

  // Four bytes.
  case FK_Data_4:
  case FK_SecRel_4:
  case FK_PCRel_4:
    return 4;

  // Eight bytes.
  case FK_Data_8:
  case FK_SecRel_8:
    return 8;

  default:
    llvm_unreachable("Unknown fixup kind!");
  }
}


static uint64_t adjustFixupValue(const MCFixup &Fixup, uint64_t Value,

                                 MCContext *Ctx) {

  int64_t SignedValue = static_cast<int64_t>(Value);


  switch (Fixup.getTargetKind()) {

  case AMDGPU::fixup_si_sopp_br: {

    int64_t BrImm = (SignedValue - 4) / 4;


    if (Ctx && !isInt<16>(BrImm))

      Ctx->reportError(Fixup.getLoc(), "branch size exceeds simm16");


    return BrImm;

  }

  case FK_Data_1:

  case FK_Data_2:

  case FK_Data_4:

  case FK_Data_8:

  case FK_PCRel_4:

  case FK_SecRel_4:

    return Value;

  default:

    llvm_unreachable("unhandled fixup kind");

  }

}


void AMDGPUAsmBackend::applyFixup(const MCAssembler &Asm, const MCFixup &Fixup,

                                  const MCValue &Target,

                                  MutableArrayRef<char> Data, uint64_t Value,

                                  bool IsResolved,

                                  const MCSubtargetInfo *STI) const {

  if (Fixup.getKind() >= FirstLiteralRelocationKind)

    return;


  Value = adjustFixupValue(Fixup, Value, &Asm.getContext());

  if (!Value)

    return; // Doesn't change encoding.


  MCFixupKindInfo Info = getFixupKindInfo(Fixup.getKind());


  // Shift the value into position.

  Value <<= Info.TargetOffset;


  unsigned NumBytes = getFixupKindNumBytes(Fixup.getKind());

  uint32_t Offset = Fixup.getOffset();

  assert(Offset + NumBytes <= Data.size() && "Invalid fixup offset!");


  // For each byte of the fragment that the fixup touches, mask in the bits from

  // the fixup value.

  for (unsigned i = 0; i != NumBytes; ++i)

    Data[Offset + i] |= static_cast<uint8_t>((Value >> (i * 8)) & 0xff);

}


/// Translate a relocation name into a fixup kind.
///
/// Every ELF_RELOC(Name, Value) entry of ELFRelocs/AMDGPU.def contributes one
/// case that maps the spelled-out relocation name to
/// FirstLiteralRelocationKind + Value. Unknown names yield std::nullopt.
std::optional<MCFixupKind>
AMDGPUAsmBackend::getFixupKind(StringRef Name) const {
  StringSwitch<std::optional<MCFixupKind>> Lookup(Name);

  // Expand each .def entry into one Case() call on the switch object.
#define ELF_RELOC(Name, Value)                                                 \
  Lookup.Case(#Name, MCFixupKind(FirstLiteralRelocationKind + Value));
#include "llvm/BinaryFormat/ELFRelocs/AMDGPU.def"
#undef ELF_RELOC

  return Lookup.Default(std::nullopt);
}


/// Return the description of fixup kind \p Kind.
///
/// Kinds at or above FirstLiteralRelocationKind are described as FK_NONE by
/// the base class, kinds below FirstTargetFixupKind are forwarded to the base
/// class unchanged, and the remaining target kinds are looked up in a local
/// table indexed relative to FirstTargetFixupKind.
const MCFixupKindInfo &
AMDGPUAsmBackend::getFixupKindInfo(MCFixupKind Kind) const {
  if (Kind >= FirstLiteralRelocationKind)
    return MCAsmBackend::getFixupKindInfo(FK_NONE);

  if (Kind < FirstTargetFixupKind)
    return MCAsmBackend::getFixupKindInfo(Kind);

  static const MCFixupKindInfo TargetInfos[AMDGPU::NumTargetFixupKinds] = {
      // name               offset  bits  flags
      {"fixup_si_sopp_br", 0, 16, MCFixupKindInfo::FKF_IsPCRel},
  };

  assert(unsigned(Kind - FirstTargetFixupKind) < getNumFixupKinds() &&
         "Invalid kind!");
  return TargetInfos[Kind - FirstTargetFixupKind];
}


bool AMDGPUAsmBackend::shouldForceRelocation(const MCAssembler &,

                                             const MCFixup &Fixup,

                                             const MCValue &,

                                             const MCSubtargetInfo *STI) {

  return Fixup.getKind() >= FirstLiteralRelocationKind;

}


/// The smallest nop is 4 bytes, matching the 32-bit s_nop encoding that
/// writeNopData() emits.
unsigned AMDGPUAsmBackend::getMinimumNopSize() const {
  const unsigned NopSizeInBytes = 4;
  return NopSizeInBytes;
}


/// Emit \p Count bytes of padding to \p OS: first Count % 4 zero bytes, then
/// Count / 4 copies of the 32-bit "s_nop 0" encoding written with the
/// backend's endianness. Always returns true.
bool AMDGPUAsmBackend::writeNopData(raw_ostream &OS, uint64_t Count,
                                    const MCSubtargetInfo *STI) const {
  // A count that is not a multiple of 4 means we must be writing data into
  // the text section (otherwise instructions would be unaligned, which is a
  // far bigger problem), so the odd bytes are simply zero-filled.
  const uint64_t ZeroBytes = Count % 4;
  OS.write_zeros(ZeroBytes);

  // FIXME: R600 support.
  const uint32_t Encoded_S_NOP_0 = 0xbf800000; // s_nop 0

  // What is left is 4-byte aligned, so fill it with nops as requested.
  for (uint64_t Remaining = Count / 4; Remaining != 0; --Remaining)
    support::endian::write<uint32_t>(OS, Encoded_S_NOP_0, Endian);

  return true;
}


//===----------------------------------------------------------------------===//

// ELFAMDGPUAsmBackend class

//===----------------------------------------------------------------------===//


namespace {


/// ELF variant of the AMDGPU assembler backend.
///
/// Captures three ELF parameters from the target triple at construction time
/// and passes them to createAMDGPUELFObjectWriter() on request.
class ELFAMDGPUAsmBackend : public AMDGPUAsmBackend {
  bool Is64Bit;             // True when the triple's arch is amdgcn.
  bool HasRelocationAddend; // True when the triple's OS is AMDHSA.
  uint8_t OSABI = ELF::ELFOSABI_NONE;

  /// Pick the ELF OS/ABI value matching the OS of \p TT. AMDHSA, AMDPAL and
  /// Mesa3D have dedicated values; every other OS gets ELFOSABI_NONE.
  static uint8_t osABIFor(const Triple &TT) {
    switch (TT.getOS()) {
    case Triple::AMDHSA:
      return ELF::ELFOSABI_AMDGPU_HSA;
    case Triple::AMDPAL:
      return ELF::ELFOSABI_AMDGPU_PAL;
    case Triple::Mesa3D:
      return ELF::ELFOSABI_AMDGPU_MESA3D;
    default:
      return ELF::ELFOSABI_NONE;
    }
  }

public:
  ELFAMDGPUAsmBackend(const Target &T, const Triple &TT)
      : AMDGPUAsmBackend(T), Is64Bit(TT.getArch() == Triple::amdgcn),
        HasRelocationAddend(TT.getOS() == Triple::AMDHSA),
        OSABI(osABIFor(TT)) {}

  /// Create the ELF object target writer configured with the stored
  /// bitness, OS/ABI and relocation-addend setting.
  std::unique_ptr<MCObjectTargetWriter>
  createObjectTargetWriter() const override {
    return createAMDGPUELFObjectWriter(Is64Bit, OSABI, HasRelocationAddend);
  }
};


} // end anonymous namespace


/// Factory for the AMDGPU assembler backend.
///
/// Always builds an ELFAMDGPUAsmBackend from \p T and the target triple of
/// \p STI. \p MRI and \p Options are not used. The returned object is
/// heap-allocated with new.
MCAsmBackend *llvm::createAMDGPUAsmBackend(const Target &T,
                                           const MCSubtargetInfo &STI,
                                           const MCRegisterInfo &MRI,
                                           const MCTargetOptions &Options) {
  const Triple &TT = STI.getTargetTriple();
  return new ELFAMDGPUAsmBackend(T, TT);
}

MRI
unsigned const MachineRegisterInfo * MRI
Definition: AArch64AdvSIMDScalarPass.cpp:105

ELF_RELOC
#define ELF_RELOC(Name, Value)

adjustFixupValue
static uint64_t adjustFixupValue(const MCFixup &Fixup, uint64_t Value, MCContext *Ctx)
Definition: AMDGPUAsmBackend.cpp:112

getFixupKindNumBytes
static unsigned getFixupKindNumBytes(unsigned Kind)
Definition: AMDGPUAsmBackend.cpp:90

AMDGPUBaseInfo.h

AMDGPUFixupKinds.h

AMDGPUMCTargetDesc.h
Provides AMDGPU specific target descriptions.

ELF.h

Info
Analysis containing CSE Info
Definition: CSEInfo.cpp:27

Default
@ Default
Definition: DwarfDebug.cpp:87

Name
std::string Name
Definition: ELFObjHandler.cpp:77

EndianStream.h

Options
static LVOptions Options
Definition: LVOptions.cpp:25

MCAsmBackend.h

MCAssembler.h

MCContext.h

MCFixupKindInfo.h

MCObjectWriter.h

MCSubtargetInfo.h

I
#define I(x, y, z)
Definition: MD5.cpp:58

Fixup
PowerPC TLS Dynamic Call Fixup
Definition: PPCTLSDynamicCall.cpp:340

assert
assert(ImpDefSCC.getReg()==AMDGPU::SCC &&ImpDefSCC.isDef())

OS
raw_pwrite_stream & OS
Definition: SampleProfWriter.cpp:53

StringSwitch.h
This file implements the StringSwitch template, which mimics a switch() statement whose cases are str...

TargetParser.h

TargetRegistry.h

T

llvm::MCAsmBackend
Generic interface to target specific assembler backends.
Definition: MCAsmBackend.h:42

llvm::MCAsmBackend::getMinimumNopSize
virtual unsigned getMinimumNopSize() const
Returns the minimum size of a nop in bytes on this target.
Definition: MCAsmBackend.h:205

llvm::MCAsmBackend::writeNopData
virtual bool writeNopData(raw_ostream &OS, uint64_t Count, const MCSubtargetInfo *STI) const =0
Write an (optimal) nop sequence of Count bytes to the given output.

llvm::MCAsmBackend::relaxInstruction
virtual void relaxInstruction(MCInst &Inst, const MCSubtargetInfo &STI) const
Relax the instruction in the given fragment to the next wider instruction.
Definition: MCAsmBackend.h:177

llvm::MCAsmBackend::mayNeedRelaxation
virtual bool mayNeedRelaxation(const MCInst &Inst, const MCSubtargetInfo &STI) const
Check whether the given instruction may need relaxation.
Definition: MCAsmBackend.h:153

llvm::MCAsmBackend::fixupNeedsRelaxation
virtual bool fixupNeedsRelaxation(const MCFixup &Fixup, uint64_t Value) const
Simple predicate for targets where !Resolved implies requiring relaxation.
Definition: MCAsmBackend.h:167

llvm::MCAsmBackend::shouldForceRelocation
virtual bool shouldForceRelocation(const MCAssembler &Asm, const MCFixup &Fixup, const MCValue &Target, const MCSubtargetInfo *STI)
Hook to check if a relocation is needed for some target specific reason.
Definition: MCAsmBackend.h:94

llvm::MCAsmBackend::getNumFixupKinds
virtual unsigned getNumFixupKinds() const =0
Get the number of target specific fixup kinds.

llvm::MCAsmBackend::getFixupKindInfo
virtual const MCFixupKindInfo & getFixupKindInfo(MCFixupKind Kind) const
Get information on a fixup kind.
Definition: MCAsmBackend.cpp:90

llvm::MCAsmBackend::getFixupKind
virtual std::optional< MCFixupKind > getFixupKind(StringRef Name) const
Map a relocation name used in .reloc to a fixup kind.
Definition: MCAsmBackend.cpp:86

llvm::MCAsmBackend::applyFixup
virtual void applyFixup(const MCAssembler &Asm, const MCFixup &Fixup, const MCValue &Target, MutableArrayRef< char > Data, uint64_t Value, bool IsResolved, const MCSubtargetInfo *STI) const =0
Apply the Value for given Fixup into the provided data fragment, at the offset specified by the fixup...

llvm::MCAssembler
Definition: MCAssembler.h:53

llvm::MCContext
Context object for machine code objects.
Definition: MCContext.h:83

llvm::MCContext::reportError
void reportError(SMLoc L, const Twine &Msg)
Definition: MCContext.cpp:1067

llvm::MCFixup
Encode information on a single operation to perform on a byte sequence (e.g., an encoded instruction)...
Definition: MCFixup.h:71

llvm::MCInst
Instances of this class represent a single low-level machine instruction.
Definition: MCInst.h:184

llvm::MCInst::getOpcode
unsigned getOpcode() const
Definition: MCInst.h:198

llvm::MCInst::addOperand
void addOperand(const MCOperand Op)
Definition: MCInst.h:210

llvm::MCInst::setOpcode
void setOpcode(unsigned Op)
Definition: MCInst.h:197

llvm::MCInst::getOperand
const MCOperand & getOperand(unsigned i) const
Definition: MCInst.h:206

llvm::MCRegisterInfo
MCRegisterInfo base class - We assume that the target defines a static array of MCRegisterDesc object...
Definition: MCRegisterInfo.h:146

llvm::MCSubtargetInfo
Generic base class for all target subtargets.
Definition: MCSubtargetInfo.h:76

llvm::MCSubtargetInfo::hasFeature
bool hasFeature(unsigned Feature) const
Definition: MCSubtargetInfo.h:119

llvm::MCSubtargetInfo::getTargetTriple
const Triple & getTargetTriple() const
Definition: MCSubtargetInfo.h:108

llvm::MCTargetOptions
Definition: MCTargetOptions.h:39

llvm::MCValue
This represents an "assembler immediate".
Definition: MCValue.h:36

llvm::MutableArrayRef
MutableArrayRef - Represent a mutable reference to an array (0 or more elements consecutively in memo...
Definition: ArrayRef.h:307

llvm::StringRef
StringRef - Represent a constant reference to a string, i.e.
Definition: StringRef.h:50

llvm::StringSwitch
A switch()-like statement whose cases are string literals.
Definition: StringSwitch.h:44

llvm::Target
Target - Wrapper for Target specific information.
Definition: TargetRegistry.h:144

llvm::Triple
Triple - Helper class for working with autoconf configuration names.
Definition: Triple.h:44

llvm::Triple::AMDHSA
@ AMDHSA
Definition: Triple.h:223

llvm::Triple::AMDPAL
@ AMDPAL
Definition: Triple.h:233

llvm::Triple::Mesa3D
@ Mesa3D
Definition: Triple.h:232

llvm::Value
LLVM Value Representation.
Definition: Value.h:74

llvm::raw_ostream
This class implements an extremely fast bulk output stream that can only output to a stream.
Definition: raw_ostream.h:52

llvm::raw_ostream::write_zeros
raw_ostream & write_zeros(unsigned NumZeros)
write_zeros - Insert 'NumZeros' nulls.
Definition: raw_ostream.cpp:502

uint32_t

uint64_t

llvm_unreachable
#define llvm_unreachable(msg)
Marks that the current location is not supposed to be reachable.
Definition: ErrorHandling.h:143

llvm::AMDGPU
Definition: AMDGPUMetadataVerifier.h:33

llvm::AMDGPU::fixup_si_sopp_br
@ fixup_si_sopp_br
16-bit PC relative fixup for SOPP branch instructions.
Definition: AMDGPUFixupKinds.h:18

llvm::AMDGPU::NumTargetFixupKinds
@ NumTargetFixupKinds
Definition: AMDGPUFixupKinds.h:22

llvm::AMDGPU::getSOPPWithRelaxation
LLVM_READONLY int getSOPPWithRelaxation(uint16_t Opcode)

llvm::ARM::PredBlockMask::TT
@ TT

llvm::ELF::ELFOSABI_AMDGPU_HSA
@ ELFOSABI_AMDGPU_HSA
Definition: ELF.h:362

llvm::ELF::ELFOSABI_AMDGPU_MESA3D
@ ELFOSABI_AMDGPU_MESA3D
Definition: ELF.h:364

llvm::ELF::ELFOSABI_NONE
@ ELFOSABI_NONE
Definition: ELF.h:342

llvm::ELF::ELFOSABI_AMDGPU_PAL
@ ELFOSABI_AMDGPU_PAL
Definition: ELF.h:363

llvm::HexStyle::Asm
@ Asm
0ffh
Definition: MCInstPrinter.h:36

llvm::lltok::Kind
Kind
Definition: LLToken.h:18

llvm
This is an optimization pass for GlobalISel generic memory operations.
Definition: AddressRanges.h:18

llvm::Offset
@ Offset
Definition: DWP.cpp:480

llvm::createAMDGPUAsmBackend
MCAsmBackend * createAMDGPUAsmBackend(const Target &T, const MCSubtargetInfo &STI, const MCRegisterInfo &MRI, const MCTargetOptions &Options)
Definition: AMDGPUAsmBackend.cpp:261

llvm::createAMDGPUELFObjectWriter
std::unique_ptr< MCObjectTargetWriter > createAMDGPUELFObjectWriter(bool Is64Bit, uint8_t OSABI, bool HasRelocationAddend)
Definition: AMDGPUELFObjectWriter.cpp:99

llvm::MCFixupKind
MCFixupKind
Extensible enumeration to represent the type of a fixup.
Definition: MCFixup.h:21

llvm::FirstTargetFixupKind
@ FirstTargetFixupKind
Definition: MCFixup.h:45

llvm::FK_PCRel_4
@ FK_PCRel_4
A four-byte pc relative fixup.
Definition: MCFixup.h:30

llvm::FK_SecRel_2
@ FK_SecRel_2
A two-byte section relative fixup.
Definition: MCFixup.h:41

llvm::FirstLiteralRelocationKind
@ FirstLiteralRelocationKind
The range [FirstLiteralRelocationKind, MaxTargetFixupKind) is used for relocations coming from ....
Definition: MCFixup.h:50

llvm::FK_Data_8
@ FK_Data_8
A eight-byte fixup.
Definition: MCFixup.h:26

llvm::FK_Data_1
@ FK_Data_1
A one-byte fixup.
Definition: MCFixup.h:23

llvm::FK_Data_4
@ FK_Data_4
A four-byte fixup.
Definition: MCFixup.h:25

llvm::FK_SecRel_8
@ FK_SecRel_8
A eight-byte section relative fixup.
Definition: MCFixup.h:43

llvm::FK_NONE
@ FK_NONE
A no-op fixup.
Definition: MCFixup.h:22

llvm::FK_SecRel_4
@ FK_SecRel_4
A four-byte section relative fixup.
Definition: MCFixup.h:42

llvm::FK_SecRel_1
@ FK_SecRel_1
A one-byte section relative fixup.
Definition: MCFixup.h:40

llvm::FK_Data_2
@ FK_Data_2
A two-byte fixup.
Definition: MCFixup.h:24

llvm::endianness
endianness
Definition: bit.h:70

llvm::endianness::little
@ little

llvm::MCFixupKindInfo
Target independent information on a fixup kind.
Definition: MCFixupKindInfo.h:15

llvm::MCFixupKindInfo::FKF_IsPCRel
@ FKF_IsPCRel
Is this fixup kind PCrelative? This is used by the assembler backend to evaluate fixup values in a ta...
Definition: MCFixupKindInfo.h:19