LLVM 18.0.0git
NVPTXSubtarget.cpp
Go to the documentation of this file.
1//===- NVPTXSubtarget.cpp - NVPTX Subtarget Information -------------------===//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//
7//===----------------------------------------------------------------------===//
8//
9// This file implements the NVPTX specific subclass of TargetSubtarget.
10//
11//===----------------------------------------------------------------------===//
12
13#include "NVPTXSubtarget.h"
14#include "NVPTXTargetMachine.h"
15
16using namespace llvm;
17
18#define DEBUG_TYPE "nvptx-subtarget"
19
20#define GET_SUBTARGETINFO_ENUM
21#define GET_SUBTARGETINFO_TARGET_DESC
22#define GET_SUBTARGETINFO_CTOR
23#include "NVPTXGenSubtargetInfo.inc"
24
25static cl::opt<bool>
26 NoF16Math("nvptx-no-f16-math", cl::Hidden,
27 cl::desc("NVPTX Specific: Disable generation of f16 math ops."),
28 cl::init(false));
29// Pin the vtable to this file.
30void NVPTXSubtarget::anchor() {}
31
33 StringRef FS) {
34 // Provide the default CPU if we don't have one.
35 TargetName = std::string(CPU.empty() ? "sm_30" : CPU);
36
37 ParseSubtargetFeatures(TargetName, /*TuneCPU*/ TargetName, FS);
38
39 // Set default to PTX 6.0 (CUDA 9.0)
40 if (PTXVersion == 0) {
41 PTXVersion = 60;
42 }
43
44 return *this;
45}
46
47NVPTXSubtarget::NVPTXSubtarget(const Triple &TT, const std::string &CPU,
48 const std::string &FS,
50 : NVPTXGenSubtargetInfo(TT, CPU, /*TuneCPU*/ CPU, FS), PTXVersion(0),
51 SmVersion(20), TM(TM),
52 TLInfo(TM, initializeSubtargetDependencies(CPU, FS)) {}
53
55 // Enable handles for Kepler+, where CUDA supports indirect surfaces and
56 // textures
57 if (TM.getDrvInterface() == NVPTX::CUDA)
58 return (SmVersion >= 30);
59
60 // Disabled, otherwise
61 return false;
62}
63
65 return hasFP16Math() && NoF16Math == false;
66}
static cl::opt< bool > NoF16Math("nvptx-no-f16-math", cl::Hidden, cl::desc("NVPTX Specific: Disable generation of f16 math ops."), cl::init(false))
unsigned SmVersion
Definition: NVVMReflect.cpp:78
const char LLVMTargetMachineRef TM
bool hasImageHandles() const
void ParseSubtargetFeatures(StringRef CPU, StringRef TuneCPU, StringRef FS)
bool allowFP16Math() const
NVPTXSubtarget(const Triple &TT, const std::string &CPU, const std::string &FS, const NVPTXTargetMachine &TM)
This constructor initializes the data members to match that of the specified module.
NVPTXSubtarget & initializeSubtargetDependencies(StringRef CPU, StringRef FS)
bool hasFP16Math() const
NVPTX::DrvInterface getDrvInterface() const
StringRef - Represent a constant reference to a string, i.e. a character array and a length, which need not be null terminated.
Definition: StringRef.h:50
constexpr bool empty() const
empty - Check if the string is empty.
Definition: StringRef.h:134
Triple - Helper class for working with autoconf configuration names.
Definition: Triple.h:44
@ CUDA
Definition: NVPTX.h:79
initializer< Ty > init(const Ty &Val)
Definition: CommandLine.h:445
This is an optimization pass for GlobalISel generic memory operations.
Definition: AddressRanges.h:18