LLVM 23.0.0git
LoongArchTargetMachine.cpp
Go to the documentation of this file.
1//===-- LoongArchTargetMachine.cpp - Define TargetMachine for LoongArch ---===//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//
7//===----------------------------------------------------------------------===//
8//
9// Implements the info about LoongArch target spec.
10//
11//===----------------------------------------------------------------------===//
12
14#include "LoongArch.h"
21#include "llvm/CodeGen/Passes.h"
28#include <optional>
29
30using namespace llvm;
31
32#define DEBUG_TYPE "loongarch"
33
48
50 "loongarch-enable-dead-defs", cl::Hidden,
51 cl::desc("Enable the pass that removes dead"
52 " definitons and replaces stores to"
53 " them with stores to r0"),
54 cl::init(true));
55
56static cl::opt<bool>
57 EnableLoopDataPrefetch("loongarch-enable-loop-data-prefetch", cl::Hidden,
58 cl::desc("Enable the loop data prefetch pass"),
59 cl::init(false));
60
61static cl::opt<bool>
62 EnableMergeBaseOffset("loongarch-enable-merge-offset",
63 cl::desc("Enable the merge base offset pass"),
64 cl::init(true), cl::Hidden);
65
66static cl::opt<bool>
67 EnableSinkFold("loongarch-enable-sink-fold",
68 cl::desc("Enable sinking and folding of instruction copies"),
69 cl::init(true), cl::Hidden);
70
71static Reloc::Model getEffectiveRelocModel(std::optional<Reloc::Model> RM) {
72 return RM.value_or(Reloc::Static);
73}
74
77 std::optional<CodeModel::Model> CM) {
78 if (!CM)
79 return TT.isArch64Bit() ? CodeModel::Medium : CodeModel::Small;
80
81 switch (*CM) {
84 return *CM;
86 if (!TT.isArch64Bit())
87 report_fatal_error("Large code model requires LA64");
88 return *CM;
89 default:
91 "Only small, medium and large code models are allowed on LoongArch");
92 }
93}
94
96 const Target &T, const Triple &TT, StringRef CPU, StringRef FS,
97 const TargetOptions &Options, std::optional<Reloc::Model> RM,
98 std::optional<CodeModel::Model> CM, CodeGenOptLevel OL, bool JIT)
99 : CodeGenTargetMachineImpl(T, TT.computeDataLayout(), TT, CPU, FS, Options,
102 TLOF(std::make_unique<LoongArchELFTargetObjectFile>()) {
103 initAsmInfo();
104}
105
107
108const LoongArchSubtarget *
110 Attribute CPUAttr = F.getFnAttribute("target-cpu");
111 Attribute TuneAttr = F.getFnAttribute("tune-cpu");
112 Attribute FSAttr = F.getFnAttribute("target-features");
113
114 std::string CPU =
115 CPUAttr.isValid() ? CPUAttr.getValueAsString().str() : TargetCPU;
116 std::string TuneCPU =
117 TuneAttr.isValid() ? TuneAttr.getValueAsString().str() : CPU;
118 std::string FS =
119 FSAttr.isValid() ? FSAttr.getValueAsString().str() : TargetFS;
120
121 std::string Key = CPU + TuneCPU + FS;
122 auto &I = SubtargetMap[Key];
123 if (!I) {
124 // This needs to be done before we create a new subtarget since any
125 // creation will depend on the TM and the code generation flags on the
126 // function that reside in TargetOptions.
128 auto ABIName = Options.MCOptions.getABIName();
129 if (const MDString *ModuleTargetABI = dyn_cast_or_null<MDString>(
130 F.getParent()->getModuleFlag("target-abi"))) {
131 auto TargetABI = LoongArchABI::getTargetABI(ABIName);
132 if (TargetABI != LoongArchABI::ABI_Unknown &&
133 ModuleTargetABI->getString() != ABIName) {
134 report_fatal_error("-target-abi option != target-abi module flag");
135 }
136 ABIName = ModuleTargetABI->getString();
137 }
138 I = std::make_unique<LoongArchSubtarget>(TargetTriple, CPU, TuneCPU, FS,
139 ABIName, *this);
140 }
141 return I.get();
142}
143
150
151namespace {
152class LoongArchPassConfig : public TargetPassConfig {
153public:
154 LoongArchPassConfig(LoongArchTargetMachine &TM, PassManagerBase &PM)
155 : TargetPassConfig(TM, PM) {
156 setEnableSinkAndFold(EnableSinkFold);
157 }
158
159 LoongArchTargetMachine &getLoongArchTargetMachine() const {
161 }
162
163 void addIRPasses() override;
164 void addCodeGenPrepare() override;
165 bool addInstSelector() override;
166 void addPreEmitPass() override;
167 void addPreEmitPass2() override;
168 void addMachineSSAOptimization() override;
169 void addPreRegAlloc() override;
170 bool addRegAssignAndRewriteFast() override;
171 bool addRegAssignAndRewriteOptimized() override;
172};
173} // end namespace
174
177 return new LoongArchPassConfig(*this, PM);
178}
179
180void LoongArchPassConfig::addIRPasses() {
181 // Run LoopDataPrefetch
182 //
183 // Run this before LSR to remove the multiplies involved in computing the
184 // pointer values N iterations ahead.
185 if (TM->getOptLevel() != CodeGenOptLevel::None && EnableLoopDataPrefetch)
188
190}
191
192void LoongArchPassConfig::addCodeGenPrepare() {
193 if (getOptLevel() != CodeGenOptLevel::None)
196}
197
198bool LoongArchPassConfig::addInstSelector() {
199 addPass(createLoongArchISelDag(getLoongArchTargetMachine(), getOptLevel()));
200
201 return false;
202}
203
206 return TargetTransformInfo(std::make_unique<LoongArchTTIImpl>(this, F));
207}
208
209void LoongArchPassConfig::addPreEmitPass() { addPass(&BranchRelaxationPassID); }
210
211void LoongArchPassConfig::addPreEmitPass2() {
213 // Schedule the expansion of AtomicPseudos at the last possible moment,
214 // avoiding the possibility for other passes to break the requirements for
215 // forward progress in the LL/SC block.
217}
218
219void LoongArchPassConfig::addMachineSSAOptimization() {
221
222 if (TM->getTargetTriple().isLoongArch64()) {
224 }
225}
226
227void LoongArchPassConfig::addPreRegAlloc() {
229 if (TM->getOptLevel() != CodeGenOptLevel::None && EnableMergeBaseOffset)
231}
232
233bool LoongArchPassConfig::addRegAssignAndRewriteFast() {
234 if (TM->getOptLevel() != CodeGenOptLevel::None &&
238}
239
240bool LoongArchPassConfig::addRegAssignAndRewriteOptimized() {
241 if (TM->getOptLevel() != CodeGenOptLevel::None &&
245}
static cl::opt< bool > EnableSinkFold("aarch64-enable-sink-fold", cl::desc("Enable sinking and folding of instruction copies"), cl::init(true), cl::Hidden)
static cl::opt< bool > EnableLoopDataPrefetch("aarch64-enable-loop-data-prefetch", cl::Hidden, cl::desc("Enable the loop data prefetch pass"), cl::init(true))
static Reloc::Model getEffectiveRelocModel()
#define X(NUM, ENUM, NAME)
Definition ELF.h:853
#define LLVM_ABI
Definition Compiler.h:213
#define LLVM_EXTERNAL_VISIBILITY
Definition Compiler.h:132
static cl::opt< bool > EnableLoongArchDeadRegisterElimination("loongarch-enable-dead-defs", cl::Hidden, cl::desc("Enable the pass that removes dead" " definitons and replaces stores to" " them with stores to r0"), cl::init(true))
static cl::opt< bool > EnableMergeBaseOffset("loongarch-enable-merge-offset", cl::desc("Enable the merge base offset pass"), cl::init(true), cl::Hidden)
static cl::opt< bool > EnableLoopDataPrefetch("loongarch-enable-loop-data-prefetch", cl::Hidden, cl::desc("Enable the loop data prefetch pass"), cl::init(false))
LLVM_ABI LLVM_EXTERNAL_VISIBILITY void LLVMInitializeLoongArchTarget()
static CodeModel::Model getEffectiveLoongArchCodeModel(const Triple &TT, std::optional< CodeModel::Model > CM)
static cl::opt< bool > EnableSinkFold("loongarch-enable-sink-fold", cl::desc("Enable sinking and folding of instruction copies"), cl::init(true), cl::Hidden)
This file a TargetTransformInfoImplBase conforming object specific to the LoongArch target machine.
#define F(x, y, z)
Definition MD5.cpp:54
#define I(x, y, z)
Definition MD5.cpp:57
#define T
const GCNTargetMachine & getTM(const GCNSubtarget *STI)
static TableGen::Emitter::Opt Y("gen-skeleton-entry", EmitSkeleton, "Generate example skeleton entry")
Target-Independent Code Generator Pass Configuration Options pass.
This pass exposes codegen information to IR-level passes.
Functions, function parameters, and return types can have attributes to indicate how they should be t...
Definition Attributes.h:105
LLVM_ABI StringRef getValueAsString() const
Return the attribute's value as a string.
bool isValid() const
Return true if the attribute is any kind of attribute.
Definition Attributes.h:261
CodeGenTargetMachineImpl(const Target &T, StringRef DataLayoutString, const Triple &TT, StringRef CPU, StringRef FS, const TargetOptions &Options, Reloc::Model RM, CodeModel::Model CM, CodeGenOptLevel OL)
This implementation is used for LoongArch ELF targets.
LoongArchTargetMachine(const Target &T, const Triple &TT, StringRef CPU, StringRef FS, const TargetOptions &Options, std::optional< Reloc::Model > RM, std::optional< CodeModel::Model > CM, CodeGenOptLevel OL, bool JIT)
const LoongArchSubtarget * getSubtargetImpl() const =delete
TargetPassConfig * createPassConfig(PassManagerBase &PM) override
Create a pass configuration object to be used by addPassToEmitX methods for generating a pipeline of ...
TargetTransformInfo getTargetTransformInfo(const Function &F) const override
Get a TargetTransformInfo implementation for the target.
MachineFunctionInfo * createMachineFunctionInfo(BumpPtrAllocator &Allocator, const Function &F, const TargetSubtargetInfo *STI) const override
Create the target's instance of MachineFunctionInfo.
A single uniqued string.
Definition Metadata.h:722
static LLVM_ABI PassRegistry * getPassRegistry()
getPassRegistry - Access the global registry object, which is automatically initialized at applicatio...
Represent a constant reference to a string, i.e.
Definition StringRef.h:56
std::string str() const
Get the contents as an std::string.
Definition StringRef.h:222
Triple TargetTriple
Triple string, CPU name, and target feature strings the TargetMachine instance is created with.
std::unique_ptr< const MCSubtargetInfo > STI
TargetOptions Options
void resetTargetOptions(const Function &F) const
Reset the target options based on the function's attributes.
Target-Independent Code Generator Pass Configuration Options.
virtual void addCodeGenPrepare()
Add pass to prepare the LLVM IR for code generation.
virtual bool addRegAssignAndRewriteFast()
Add core register allocator passes which do the actual register assignment and rewriting.
virtual void addIRPasses()
Add common target configurable passes that perform LLVM IR to IR transforms following machine indepen...
virtual void addMachineSSAOptimization()
addMachineSSAOptimization - Add standard passes that optimize machine instructions in SSA form.
virtual bool addRegAssignAndRewriteOptimized()
TargetSubtargetInfo - Generic base class for all target subtargets.
This pass provides access to the codegen interfaces that are needed for IR-level transformations.
Target - Wrapper for Target specific information.
Triple - Helper class for working with autoconf configuration names.
Definition Triple.h:47
PassManagerBase - An abstract interface to allow code to add passes to a pass manager without having ...
ABI getTargetABI(StringRef ABIName)
initializer< Ty > init(const Ty &Val)
This is an optimization pass for GlobalISel generic memory operations.
Target & getTheLoongArch64Target()
FunctionPass * createLoongArchExpandAtomicPseudoPass()
FunctionPass * createLoongArchDeadRegisterDefinitionsPass()
void initializeLoongArchDAGToDAGISelLegacyPass(PassRegistry &)
LLVM_ABI FunctionPass * createTypePromotionLegacyPass()
Create IR Type Promotion pass.
void initializeLoongArchPreRAExpandPseudoPass(PassRegistry &)
auto dyn_cast_or_null(const Y &Val)
Definition Casting.h:753
void initializeLoongArchMergeBaseOffsetOptPass(PassRegistry &)
static Reloc::Model getEffectiveRelocModel(std::optional< Reloc::Model > RM)
void initializeLoongArchExpandAtomicPseudoPass(PassRegistry &)
LLVM_ABI char & BranchRelaxationPassID
BranchRelaxation - This pass replaces branches that need to jump further than is supported by a branc...
void initializeLoongArchExpandPseudoPass(PassRegistry &)
FunctionPass * createLoongArchOptWInstrsPass()
LLVM_ABI FunctionPass * createLoopDataPrefetchPass()
LLVM_ABI void report_fatal_error(Error Err, bool gen_crash_diag=true)
Definition Error.cpp:163
CodeGenOptLevel
Code generation optimization level.
Definition CodeGen.h:82
LLVM_ATTRIBUTE_VISIBILITY_DEFAULT AnalysisKey InnerAnalysisManagerProxy< AnalysisManagerT, IRUnitT, ExtraArgTs... >::Key
Target & getTheLoongArch32Target()
FunctionPass * createLoongArchISelDag(LoongArchTargetMachine &TM, CodeGenOptLevel OptLevel)
FunctionPass * createLoongArchPreRAExpandPseudoPass()
void initializeLoongArchOptWInstrsPass(PassRegistry &)
FunctionPass * createLoongArchExpandPseudoPass()
LLVM_ABI FunctionPass * createAtomicExpandLegacyPass()
AtomicExpandPass - At IR level this pass replace atomic instructions with __atomic_* library calls,...
BumpPtrAllocatorImpl<> BumpPtrAllocator
The standard BumpPtrAllocator which just uses the default template parameters.
Definition Allocator.h:383
void initializeLoongArchDeadRegisterDefinitionsPass(PassRegistry &)
FunctionPass * createLoongArchMergeBaseOffsetOptPass()
Returns an instance of the Merge Base Offset Optimization pass.
Implement std::hash so that hash_code can be used in STL containers.
Definition BitVector.h:874
MachineFunctionInfo - This class can be derived from and used by targets to hold private target-speci...
static FuncInfoTy * create(BumpPtrAllocator &Allocator, const Function &F, const SubtargetTy *STI)
Factory function: default behavior is to call new using the supplied allocator.
RegisterTargetMachine - Helper template for registering a target machine implementation,...