LLVM 22.0.0git
NVPTXRegisterInfo.cpp
Go to the documentation of this file.
1//===- NVPTXRegisterInfo.cpp - NVPTX Register Information -----------------===//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//
7//===----------------------------------------------------------------------===//
8//
9// This file contains the NVPTX implementation of the TargetRegisterInfo class.
10//
11//===----------------------------------------------------------------------===//
12
13#include "NVPTXRegisterInfo.h"
15#include "NVPTX.h"
16#include "NVPTXTargetMachine.h"
17#include "llvm/ADT/BitVector.h"
21
22using namespace llvm;
23
24#define DEBUG_TYPE "nvptx-reg-info"
25
26namespace llvm {
28 if (RC == &NVPTX::B128RegClass)
29 return ".b128";
30 if (RC == &NVPTX::B64RegClass)
31 // We use untyped (.b) integer registers here as NVCC does.
32 // Correctness of generated code does not depend on register type,
33 // but using .s/.u registers runs into ptxas bug that prevents
34 // assembly of otherwise valid PTX into SASS. Despite PTX ISA
35 // specifying only argument size for fp16 instructions, ptxas does
36 // not allow using .s16 or .u16 arguments for .fp16
37 // instructions. At the same time it allows using .s32/.u32
38 // arguments for .fp16v2 instructions:
39 //
40 // .reg .b16 rb16
41 // .reg .s16 rs16
42 // add.f16 rb16,rb16,rb16; // OK
43 // add.f16 rs16,rs16,rs16; // Arguments mismatch for instruction 'add'
44 // but:
45 // .reg .b32 rb32
46 // .reg .s32 rs32
47 // add.f16v2 rb32,rb32,rb32; // OK
48 // add.f16v2 rs32,rs32,rs32; // OK
49 return ".b64";
50 if (RC == &NVPTX::B32RegClass)
51 return ".b32";
52 if (RC == &NVPTX::B16RegClass)
53 return ".b16";
54 if (RC == &NVPTX::B1RegClass)
55 return ".pred";
56 if (RC == &NVPTX::SpecialRegsRegClass)
57 return "!Special!";
58 return "INTERNAL";
59}
60
62 if (RC == &NVPTX::B128RegClass)
63 return "%rq";
64 if (RC == &NVPTX::B64RegClass)
65 return "%rd";
66 if (RC == &NVPTX::B32RegClass)
67 return "%r";
68 if (RC == &NVPTX::B16RegClass)
69 return "%rs";
70 if (RC == &NVPTX::B1RegClass)
71 return "%p";
72 if (RC == &NVPTX::SpecialRegsRegClass)
73 return "!Special!";
74 return "INTERNAL";
75}
76} // namespace llvm
77
80
81#define GET_REGINFO_TARGET_DESC
82#include "NVPTXGenRegisterInfo.inc"
83
84/// NVPTX Callee Saved Registers
85const MCPhysReg *
87 static const MCPhysReg CalleeSavedRegs[] = { 0 };
88 return CalleeSavedRegs;
89}
90
92 BitVector Reserved(getNumRegs());
93 for (unsigned Reg = NVPTX::ENVREG0; Reg <= NVPTX::ENVREG31; ++Reg) {
94 markSuperRegs(Reserved, Reg);
95 }
96 markSuperRegs(Reserved, NVPTX::VRFrame32);
97 markSuperRegs(Reserved, NVPTX::VRFrameLocal32);
98 markSuperRegs(Reserved, NVPTX::VRFrame64);
99 markSuperRegs(Reserved, NVPTX::VRFrameLocal64);
100 markSuperRegs(Reserved, NVPTX::VRDepot);
101 return Reserved;
102}
103
105 int SPAdj, unsigned FIOperandNum,
106 RegScavenger *) const {
107 assert(SPAdj == 0 && "Unexpected");
108
109 MachineInstr &MI = *II;
110 if (MI.isLifetimeMarker()) {
111 MI.eraseFromParent();
112 return true;
113 }
114
115 const int FrameIndex = MI.getOperand(FIOperandNum).getIndex();
116
117 const MachineFunction &MF = *MI.getParent()->getParent();
118 const int Offset = MF.getFrameInfo().getObjectOffset(FrameIndex) +
119 MI.getOperand(FIOperandNum + 1).getImm();
120
121 // Using I0 as the frame pointer
122 MI.getOperand(FIOperandNum).ChangeToRegister(getFrameRegister(MF), false);
123 MI.getOperand(FIOperandNum + 1).ChangeToImmediate(Offset);
124 return false;
125}
126
128 const NVPTXTargetMachine &TM =
129 static_cast<const NVPTXTargetMachine &>(MF.getTarget());
130 return TM.is64Bit() ? NVPTX::VRFrame64 : NVPTX::VRFrame32;
131}
132
135 const NVPTXTargetMachine &TM =
136 static_cast<const NVPTXTargetMachine &>(MF.getTarget());
137 return TM.is64Bit() ? NVPTX::VRFrameLocal64 : NVPTX::VRFrameLocal32;
138}
139
141 debugRegisterMap.clear();
142}
143
145 if (RegisterName.size() > 8)
146 // The name is more than 8 characters long, and so won't fit into 64 bits.
147 return 0;
148
149 // Encode the name string into a DWARF register number using cuda-gdb's
150 // encoding. See cuda_check_dwarf2_reg_ptx_virtual_register in cuda-tdep.c,
151 // https://github.com/NVIDIA/cuda-gdb/blob/e5cf3bddae520ffb326f95b4d98ce5c7474b828b/gdb/cuda/cuda-tdep.c#L353
152 // IE the bytes of the string are concatenated in reverse into a single
153 // number, which is stored in ULEB128, but in practice must be no more than 8
154 // bytes (excluding null terminator, which is not included).
155 uint64_t result = 0;
156 for (unsigned char c : RegisterName)
157 result = (result << 8) | c;
158 return result;
159}
160
162 uint64_t preEncodedVirtualRegister, StringRef RegisterName) const {
163 uint64_t mapped = encodeRegisterForDwarf(RegisterName);
164 if (mapped == 0)
165 return;
166 debugRegisterMap.insert({preEncodedVirtualRegister, mapped});
167}
168
169int64_t NVPTXRegisterInfo::getDwarfRegNum(MCRegister RegNum, bool isEH) const {
171 // In NVPTXFrameLowering.cpp, we do arrange for %Depot to be accessible from
172 // %SP. Using the %Depot register doesn't provide any debug info in
173 // cuda-gdb, but switching it to %SP does.
174 if (RegNum.id() == NVPTX::VRDepot)
175 Name = "%SP";
176 return encodeRegisterForDwarf(Name);
177}
178
180 bool isEH) const {
181 assert(RegNum.isVirtual());
182 uint64_t lookup = debugRegisterMap.lookup(RegNum.id());
183 if (lookup)
184 return lookup;
185 return -1;
186}
assert(UImm &&(UImm !=~static_cast< T >(0)) &&"Invalid immediate!")
This file implements the BitVector class.
IRTranslator LLVM IR MI
static bool lookup(const GsymReader &GR, DataExtractor &Data, uint64_t &Offset, uint64_t BaseAddr, uint64_t Addr, SourceLocations &SrcLocs, llvm::Error &Err)
A Lookup helper functions.
static uint64_t encodeRegisterForDwarf(StringRef RegisterName)
uint64_t IntrinsicInst * II
Wrapper class representing physical registers. Should be passed by value.
Definition MCRegister.h:33
constexpr unsigned id() const
Definition MCRegister.h:74
MachineInstrBundleIterator< MachineInstr > iterator
int64_t getObjectOffset(int ObjectIdx) const
Return the assigned stack offset of the specified object from the incoming stack pointer.
MachineFrameInfo & getFrameInfo()
getFrameInfo - Return the frame info object for the current function.
const TargetMachine & getTarget() const
getTarget - Return the target machine this machine code is compiled with
Representation of each machine instruction.
static const char * getRegisterName(MCRegister Reg)
Register getFrameLocalRegister(const MachineFunction &MF) const
const MCPhysReg * getCalleeSavedRegs(const MachineFunction *MF) const override
NVPTX Callee Saved Registers.
bool eliminateFrameIndex(MachineBasicBlock::iterator MI, int SPAdj, unsigned FIOperandNum, RegScavenger *RS=nullptr) const override
BitVector getReservedRegs(const MachineFunction &MF) const override
int64_t getDwarfRegNum(MCRegister RegNum, bool isEH) const override
Register getFrameRegister(const MachineFunction &MF) const override
void addToDebugRegisterMap(uint64_t preEncodedVirtualRegister, StringRef RegisterName) const
int64_t getDwarfRegNumForVirtReg(Register RegNum, bool isEH) const override
Wrapper class representing virtual and physical registers.
Definition Register.h:19
constexpr bool isVirtual() const
Return true if the specified register number is in the virtual register namespace.
Definition Register.h:74
constexpr unsigned id() const
Definition Register.h:95
StringRef - Represent a constant reference to a string, i.e.
Definition StringRef.h:55
constexpr size_t size() const
size - Get the string size.
Definition StringRef.h:154
This is an optimization pass for GlobalISel generic memory operations.
@ Offset
Definition DWP.cpp:477
StringRef getNVPTXRegClassStr(TargetRegisterClass const *RC)
StringRef getNVPTXRegClassName(TargetRegisterClass const *RC)
uint16_t MCPhysReg
An unsigned integer type large enough to represent all physical registers, but not necessarily virtua...
Definition MCRegister.h:21