LLVM 23.0.0git
AMDGPURegBankLegalizeRules.h
Go to the documentation of this file.
1//===- AMDGPURegBankLegalizeRules --------------------------------*- C++ -*-==//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//
7//===----------------------------------------------------------------------===//
8
9#ifndef LLVM_LIB_TARGET_AMDGPU_AMDGPUREGBANKLEGALIZERULES_H
10#define LLVM_LIB_TARGET_AMDGPU_AMDGPUREGBANKLEGALIZERULES_H
11
12#include "llvm/ADT/DenseMap.h"
14#include <functional>
15
16namespace llvm {
17
18class LLT;
20class MachineInstr;
21class GCNSubtarget;
22class MachineFunction;
23template <typename T> class GenericUniformityInfo;
24template <typename T> class GenericSSAContext;
27
28namespace AMDGPU {
29
30/// \returns true if \p Ty is a pointer type with size \p Width.
31bool isAnyPtr(LLT Ty, unsigned Width);
32
33// IDs used to build predicate for RegBankLegalizeRule. Predicate can have one
34// or more IDs and each represents a check for 'uniform or divergent' + LLT or
35// just LLT on register operand.
36// Most often checking one operand is enough to decide which RegBankLLTMapping
37// to apply (see Fast Rules), IDs are useful when two or more operands need to
38// be checked.
143
144// How to apply register bank on register operand.
145// In most cases, this serves as a LLT and register bank assert.
146// Can change operands and insert copies, extends, truncs, and read-any-lanes.
147// Anything more complicated requires LoweringMethod.
154
155 // any LLT, bank-only apply IDs
158
159 // sgpr scalars, pointers, vectors and B-types
184
185 // vgpr scalars, pointers, vectors and B-types
214
215 // Dst only modifiers: read-any-lane and truncs
231
233
234 // Dst only modifiers: dst was assigned VGPR by RegBankSelect but the
235 // instruction result must be in SGPR. Replace dst with SGPR, then copy the
236 // result back to the original VGPR.
239
240 // Src only modifiers: execute in waterfall loop if divergent
243
244 // Src only modifiers: execute in waterfall loop for calls
247
248 // Src only modifiers: for operands that must end up in M0. If divergent,
249 // readfirstlane to SGPR. The result can then be copied to M0 in ISel.
251
252 // Src only modifiers: operand must be SGPR, if in VGPR, insert readfirstlane
253 // to move to SGPR.
257
258 // Src only modifiers: extends
266
270};
271
272// Instruction needs to be replaced with sequence of instructions. Lowering was
273// not done by legalizer since instructions is available in either sgpr or vgpr.
274// For example S64 AND is available on sgpr, for that reason S64 AND is legal in
275// context of Legalizer that only checks LLT. But S64 AND is not available on
276// vgpr. Lower it to two S32 vgpr ANDs.
316
319 Standard, // S16, S32, S64, V2S16
320 StandardB, // B32, B64, B96, B128
321 Vector, // S32, V2S32, V3S32, V4S32
322};
323
329 std::initializer_list<RegBankLLTMappingApplyID> DstOpMappingList,
330 std::initializer_list<RegBankLLTMappingApplyID> SrcOpMappingList,
332};
333
336 std::function<bool(const MachineInstr &)> TestFunc;
338 std::initializer_list<UniformityLLTOpPredicateID> OpList,
339 std::function<bool(const MachineInstr &)> TestFunc = nullptr);
340
341 bool match(const MachineInstr &MI, const MachineUniformityInfo &MUI,
342 const MachineRegisterInfo &MRI) const;
343};
344
349
351 // "Slow Rules". More complex 'Rules[i].Predicate', check them one by one.
353
354 // "Fast Rules"
355 // Instead of testing each 'Rules[i].Predicate' we do direct access to
356 // RegBankLLTMapping using getFastPredicateSlot. For example if:
357 // - FastTypes == Standard Uni[0] holds Mapping in case Op 0 is uniform S32
358 // - FastTypes == Vector Div[3] holds Mapping in case Op 0 is divergent V4S32
359 FastRulesTypes FastTypes = NoFastRules;
360#define InvMapping RegBankLLTMapping({InvalidMapping}, {InvalidMapping})
361 RegBankLLTMapping Uni[4] = {InvMapping, InvMapping, InvMapping, InvMapping};
362 RegBankLLTMapping Div[4] = {InvMapping, InvMapping, InvMapping, InvMapping};
363
364public:
367
368 const RegBankLLTMapping *
370 const MachineUniformityInfo &MUI) const;
371
372 void addRule(RegBankLegalizeRule Rule);
373
375 RegBankLLTMapping RuleApplyIDs);
377 RegBankLLTMapping RuleApplyIDs);
378
379private:
380 int getFastPredicateSlot(UniformityLLTOpPredicateID Ty) const;
381};
382
383// Essentially 'map<Opcode(or intrinsic_opcode), SetOfRulesForOpcode>' but a
384// little more efficient.
386 const GCNSubtarget *ST;
388 // Separate maps for G-opcodes and intrinsics since they are in different
389 // enums. Multiple opcodes can share same set of rules.
390 // RulesAlias = map<Opcode, KeyOpcode>
391 // Rules = map<KeyOpcode, SetOfRulesForOpcode>
396 class RuleSetInitializer {
397 SetOfRulesForOpcode *RuleSet;
398
399 public:
400 // Used for clang-format line breaks and to force writing all rules for
401 // opcode in same place.
402 template <class AliasMap, class RulesMap>
403 RuleSetInitializer(std::initializer_list<unsigned> OpcList,
404 AliasMap &RulesAlias, RulesMap &Rules,
405 FastRulesTypes FastTypes = NoFastRules) {
406 unsigned KeyOpcode = *OpcList.begin();
407 for (unsigned Opc : OpcList) {
408 [[maybe_unused]] auto [_, NewInput] =
409 RulesAlias.try_emplace(Opc, KeyOpcode);
410 assert(NewInput && "Can't redefine existing Rules");
411 }
412
413 auto [DenseMapIter, NewInput] = Rules.try_emplace(KeyOpcode, FastTypes);
414 assert(NewInput && "Can't redefine existing Rules");
415
416 RuleSet = &DenseMapIter->second;
417 }
418
419 RuleSetInitializer(const RuleSetInitializer &) = delete;
420 RuleSetInitializer &operator=(const RuleSetInitializer &) = delete;
421 RuleSetInitializer(RuleSetInitializer &&) = delete;
422 RuleSetInitializer &operator=(RuleSetInitializer &&) = delete;
423 ~RuleSetInitializer() = default;
424
425 RuleSetInitializer &Div(UniformityLLTOpPredicateID Ty,
426 RegBankLLTMapping RuleApplyIDs,
427 bool STPred = true) {
428 if (STPred)
429 RuleSet->addFastRuleDivergent(Ty, RuleApplyIDs);
430 return *this;
431 }
432
433 RuleSetInitializer &Uni(UniformityLLTOpPredicateID Ty,
434 RegBankLLTMapping RuleApplyIDs,
435 bool STPred = true) {
436 if (STPred)
437 RuleSet->addFastRuleUniform(Ty, RuleApplyIDs);
438 return *this;
439 }
440
441 RuleSetInitializer &Any(RegBankLegalizeRule Init, bool STPred = true) {
442 if (STPred)
443 RuleSet->addRule(Init);
444 return *this;
445 }
446 };
447
448 RuleSetInitializer addRulesForGOpcs(std::initializer_list<unsigned> OpcList,
449 FastRulesTypes FastTypes = NoFastRules);
450
451 RuleSetInitializer addRulesForIOpcs(std::initializer_list<unsigned> OpcList,
452 FastRulesTypes FastTypes = NoFastRules);
453
454public:
455 // Initialize rules for all opcodes.
457
458 // In case we don't want to regenerate same rules, we can use already
459 // generated rules but need to refresh references to objects that are
460 // created for this run.
462 ST = &_ST;
463 MRI = &_MRI;
464 };
465
467};
468
469} // end namespace AMDGPU
470} // end namespace llvm
471
472#endif
assert(UImm &&(UImm !=~static_cast< T >(0)) &&"Invalid immediate!")
#define InvMapping
This file defines the DenseMap class.
IRTranslator LLVM IR MI
This file defines the SmallVector class.
RegBankLegalizeRules(const GCNSubtarget &ST, MachineRegisterInfo &MRI)
const SetOfRulesForOpcode * getRulesForOpc(MachineInstr &MI) const
void refreshRefs(const GCNSubtarget &_ST, MachineRegisterInfo &_MRI)
const RegBankLLTMapping * findMappingForMI(const MachineInstr &MI, const MachineRegisterInfo &MRI, const MachineUniformityInfo &MUI) const
void addFastRuleDivergent(UniformityLLTOpPredicateID Ty, RegBankLLTMapping RuleApplyIDs)
void addFastRuleUniform(UniformityLLTOpPredicateID Ty, RegBankLLTMapping RuleApplyIDs)
Representation of each machine instruction.
MachineRegisterInfo - Keep track of information for virtual and physical registers,...
This is a 'vector' (really, a variable-sized array), optimized for the case when the array is small.
bool isAnyPtr(LLT Ty, unsigned Width)
This is an optimization pass for GlobalISel generic memory operations.
GenericUniformityInfo< MachineSSAContext > MachineUniformityInfo
GenericSSAContext< MachineFunction > MachineSSAContext
SmallVector< UniformityLLTOpPredicateID, 4 > OpUniformityAndTypes
PredicateMapping(std::initializer_list< UniformityLLTOpPredicateID > OpList, std::function< bool(const MachineInstr &)> TestFunc=nullptr)
bool match(const MachineInstr &MI, const MachineUniformityInfo &MUI, const MachineRegisterInfo &MRI) const
std::function< bool(const MachineInstr &)> TestFunc
RegBankLLTMapping(std::initializer_list< RegBankLLTMappingApplyID > DstOpMappingList, std::initializer_list< RegBankLLTMappingApplyID > SrcOpMappingList, LoweringMethodID LoweringMethod=DoNotLower)
SmallVector< RegBankLLTMappingApplyID, 2 > DstOpMapping
SmallVector< RegBankLLTMappingApplyID, 4 > SrcOpMapping