59 const auto &
Op = MdNode->getOperand(
OpIndex);
66getSymbolicOperandRequirements(SPIRV::OperandCategory::OperandCategory Category,
72 AvoidCaps.
S.
insert(SPIRV::Capability::Shader);
74 AvoidCaps.
S.
insert(SPIRV::Capability::Kernel);
79 bool MinVerOK = SPIRVVersion.
empty() || SPIRVVersion >= ReqMinVer;
81 ReqMaxVer.
empty() || SPIRVVersion.
empty() || SPIRVVersion <= ReqMaxVer;
84 if (ReqCaps.
empty()) {
85 if (ReqExts.
empty()) {
86 if (MinVerOK && MaxVerOK)
87 return {
true, {}, {}, ReqMinVer, ReqMaxVer};
90 }
else if (MinVerOK && MaxVerOK) {
91 if (ReqCaps.
size() == 1) {
92 auto Cap = ReqCaps[0];
95 SPIRV::OperandCategory::CapabilityOperand, Cap));
96 return {
true, {Cap}, std::move(ReqExts), ReqMinVer, ReqMaxVer};
106 for (
auto Cap : ReqCaps)
109 for (
size_t i = 0, Sz = UseCaps.
size(); i < Sz; ++i) {
110 auto Cap = UseCaps[i];
111 if (i == Sz - 1 || !AvoidCaps.
S.
contains(Cap)) {
113 SPIRV::OperandCategory::CapabilityOperand, Cap));
114 return {
true, {Cap}, std::move(ReqExts), ReqMinVer, ReqMaxVer};
122 if (
llvm::all_of(ReqExts, [&ST](
const SPIRV::Extension::Extension &Ext) {
123 return ST.canUseExtension(Ext);
134void SPIRVModuleAnalysis::setBaseInfo(
const Module &M) {
138 MAI.RegisterAliasTable.clear();
139 MAI.InstrsToDelete.clear();
141 MAI.GlobalVarList.clear();
142 MAI.ExtInstSetMap.clear();
144 MAI.Reqs.initAvailableCapabilities(*ST);
147 if (
auto MemModel =
M.getNamedMetadata(
"spirv.MemoryModel")) {
148 auto MemMD = MemModel->getOperand(0);
149 MAI.Addr =
static_cast<SPIRV::AddressingModel::AddressingModel
>(
150 getMetadataUInt(MemMD, 0));
152 static_cast<SPIRV::MemoryModel::MemoryModel
>(getMetadataUInt(MemMD, 1));
155 MAI.Mem = ST->isShader() ? SPIRV::MemoryModel::GLSL450
156 : SPIRV::MemoryModel::OpenCL;
157 if (
MAI.Mem == SPIRV::MemoryModel::OpenCL) {
158 unsigned PtrSize = ST->getPointerSize();
159 MAI.Addr = PtrSize == 32 ? SPIRV::AddressingModel::Physical32
160 : PtrSize == 64 ? SPIRV::AddressingModel::Physical64
161 : SPIRV::AddressingModel::Logical;
164 MAI.Addr = SPIRV::AddressingModel::Logical;
169 if (
auto VerNode =
M.getNamedMetadata(
"opencl.ocl.version")) {
170 MAI.SrcLang = SPIRV::SourceLanguage::OpenCL_C;
173 assert(VerNode->getNumOperands() > 0 &&
"Invalid SPIR");
174 auto VersionMD = VerNode->getOperand(0);
175 unsigned MajorNum = getMetadataUInt(VersionMD, 0, 2);
176 unsigned MinorNum = getMetadataUInt(VersionMD, 1);
177 unsigned RevNum = getMetadataUInt(VersionMD, 2);
180 (std::max(1U, MajorNum) * 100 + MinorNum) * 1000 + RevNum;
186 if (!ST->isShader()) {
187 MAI.SrcLang = SPIRV::SourceLanguage::OpenCL_CPP;
188 MAI.SrcLangVersion = 100000;
190 MAI.SrcLang = SPIRV::SourceLanguage::Unknown;
191 MAI.SrcLangVersion = 0;
195 if (
auto ExtNode =
M.getNamedMetadata(
"opencl.used.extensions")) {
196 for (
unsigned I = 0,
E = ExtNode->getNumOperands();
I !=
E; ++
I) {
197 MDNode *MD = ExtNode->getOperand(
I);
207 MAI.Reqs.getAndAddRequirements(SPIRV::OperandCategory::MemoryModelOperand,
209 MAI.Reqs.getAndAddRequirements(SPIRV::OperandCategory::SourceLanguageOperand,
211 MAI.Reqs.getAndAddRequirements(SPIRV::OperandCategory::AddressingModelOperand,
214 if (!ST->isShader()) {
216 MAI.ExtInstSetMap[
static_cast<unsigned>(
217 SPIRV::InstructionSet::OpenCL_std)] =
MAI.getNextIDRegister();
228 if (
UseMI.getOpcode() != SPIRV::OpDecorate &&
229 UseMI.getOpcode() != SPIRV::OpMemberDecorate)
232 for (
unsigned I = 0;
I <
UseMI.getNumOperands(); ++
I) {
250 for (
unsigned i = 0; i <
MI.getNumOperands(); ++i) {
259 unsigned Opcode =
MI.getOpcode();
260 if ((Opcode == SPIRV::OpDecorate) && i >= 2) {
261 unsigned DecorationID =
MI.getOperand(1).getImm();
262 if (DecorationID != SPIRV::Decoration::UserSemantic &&
263 DecorationID != SPIRV::Decoration::CacheControlLoadINTEL &&
264 DecorationID != SPIRV::Decoration::CacheControlStoreINTEL)
270 if (!UseDefReg && MO.
isDef()) {
278 dbgs() <<
"Unexpectedly, no global id found for the operand ";
280 dbgs() <<
"\nInstruction: ";
299 appendDecorationsForReg(
MI.getMF()->getRegInfo(), DefReg, Signature);
306 unsigned Opcode =
MI.getOpcode();
308 case SPIRV::OpTypeForwardPointer:
311 case SPIRV::OpVariable:
312 return static_cast<SPIRV::StorageClass::StorageClass
>(
313 MI.getOperand(2).
getImm()) != SPIRV::StorageClass::Function;
314 case SPIRV::OpFunction:
315 case SPIRV::OpFunctionParameter:
318 if (GR->hasConstFunPtr() && Opcode == SPIRV::OpUndef) {
320 for (MachineInstr &
UseMI :
MRI.use_instructions(DefReg)) {
321 if (
UseMI.getOpcode() != SPIRV::OpConstantFunctionPointerINTEL)
327 MAI.setSkipEmission(&
MI);
331 return TII->isTypeDeclInstr(
MI) || TII->isConstantInstr(
MI) ||
332 TII->isInlineAsmDefInstr(
MI);
338void SPIRVModuleAnalysis::visitFunPtrUse(
340 std::map<const Value *, unsigned> &GlobalToGReg,
const MachineFunction *MF,
342 const MachineOperand *OpFunDef =
343 GR->getFunctionDefinitionByUse(&
MI.getOperand(2));
346 const MachineInstr *OpDefMI = OpFunDef->
getParent();
349 const MachineRegisterInfo &FunDefMRI = FunDefMF->
getRegInfo();
351 visitDecl(FunDefMRI, SignatureToGReg, GlobalToGReg, FunDefMF, *OpDefMI);
353 }
while (OpDefMI && (OpDefMI->
getOpcode() == SPIRV::OpFunction ||
354 OpDefMI->
getOpcode() == SPIRV::OpFunctionParameter));
356 MCRegister GlobalFunDefReg =
357 MAI.getRegisterAlias(FunDefMF, OpFunDef->
getReg());
359 "Function definition must refer to a global register");
360 MAI.setRegisterAlias(MF, OpReg, GlobalFunDefReg);
365void SPIRVModuleAnalysis::visitDecl(
367 std::map<const Value *, unsigned> &GlobalToGReg,
const MachineFunction *MF,
369 unsigned Opcode =
MI.getOpcode();
372 for (
const MachineOperand &MO :
MI.operands()) {
377 if (Opcode == SPIRV::OpConstantFunctionPointerINTEL &&
378 MRI.getRegClass(OpReg) == &SPIRV::pIDRegClass) {
379 visitFunPtrUse(OpReg, SignatureToGReg, GlobalToGReg, MF,
MI);
383 if (
MAI.hasRegisterAlias(MF, MO.
getReg()))
386 if (
const MachineInstr *OpDefMI =
MRI.getUniqueVRegDef(OpReg)) {
387 if (isDeclSection(
MRI, *OpDefMI))
388 visitDecl(
MRI, SignatureToGReg, GlobalToGReg, MF, *OpDefMI);
394 dbgs() <<
"Unexpectedly, no unique definition for the operand ";
396 dbgs() <<
"\nInstruction: ";
401 "No unique definition is found for the virtual register");
405 bool IsFunDef =
false;
406 if (TII->isSpecConstantInstr(
MI)) {
407 GReg =
MAI.getNextIDRegister();
409 }
else if (Opcode == SPIRV::OpFunction ||
410 Opcode == SPIRV::OpFunctionParameter) {
411 GReg = handleFunctionOrParameter(MF,
MI, GlobalToGReg, IsFunDef);
412 }
else if (Opcode == SPIRV::OpTypeStruct ||
413 Opcode == SPIRV::OpConstantComposite) {
414 GReg = handleTypeDeclOrConstant(
MI, SignatureToGReg);
415 const MachineInstr *NextInstr =
MI.getNextNode();
417 ((Opcode == SPIRV::OpTypeStruct &&
418 NextInstr->
getOpcode() == SPIRV::OpTypeStructContinuedINTEL) ||
419 (Opcode == SPIRV::OpConstantComposite &&
421 SPIRV::OpConstantCompositeContinuedINTEL))) {
422 MCRegister Tmp = handleTypeDeclOrConstant(*NextInstr, SignatureToGReg);
424 MAI.setSkipEmission(NextInstr);
427 }
else if (TII->isTypeDeclInstr(
MI) || TII->isConstantInstr(
MI) ||
428 TII->isInlineAsmDefInstr(
MI)) {
429 GReg = handleTypeDeclOrConstant(
MI, SignatureToGReg);
430 }
else if (Opcode == SPIRV::OpVariable) {
431 GReg = handleVariable(MF,
MI, GlobalToGReg);
434 dbgs() <<
"\nInstruction: ";
440 MAI.setRegisterAlias(MF,
MI.getOperand(0).getReg(), GReg);
442 MAI.setSkipEmission(&
MI);
445MCRegister SPIRVModuleAnalysis::handleFunctionOrParameter(
447 std::map<const Value *, unsigned> &GlobalToGReg,
bool &IsFunDef) {
448 const Value *GObj = GR->getGlobalObject(MF,
MI.getOperand(0).getReg());
449 assert(GObj &&
"Unregistered global definition");
453 assert(
F &&
"Expected a reference to a function or an argument");
454 IsFunDef = !
F->isDeclaration();
455 auto [It,
Inserted] = GlobalToGReg.try_emplace(GObj);
458 MCRegister GReg =
MAI.getNextIDRegister();
466SPIRVModuleAnalysis::handleTypeDeclOrConstant(
const MachineInstr &
MI,
469 auto [It,
Inserted] = SignatureToGReg.try_emplace(MISign);
472 MCRegister GReg =
MAI.getNextIDRegister();
478MCRegister SPIRVModuleAnalysis::handleVariable(
480 std::map<const Value *, unsigned> &GlobalToGReg) {
481 MAI.GlobalVarList.push_back(&
MI);
482 const Value *GObj = GR->getGlobalObject(MF,
MI.getOperand(0).getReg());
483 assert(GObj &&
"Unregistered global definition");
484 auto [It,
Inserted] = GlobalToGReg.try_emplace(GObj);
487 MCRegister GReg =
MAI.getNextIDRegister();
493void SPIRVModuleAnalysis::collectDeclarations(
const Module &M) {
495 std::map<const Value *, unsigned> GlobalToGReg;
496 for (
auto F =
M.begin(),
E =
M.end();
F !=
E; ++
F) {
497 MachineFunction *MF = MMI->getMachineFunction(*
F);
501 unsigned PastHeader = 0;
502 for (MachineBasicBlock &
MBB : *MF) {
503 for (MachineInstr &
MI :
MBB) {
504 if (
MI.getNumOperands() == 0)
506 unsigned Opcode =
MI.getOpcode();
507 if (Opcode == SPIRV::OpFunction) {
508 if (PastHeader == 0) {
512 }
else if (Opcode == SPIRV::OpFunctionParameter) {
515 }
else if (PastHeader > 0) {
519 const MachineOperand &DefMO =
MI.getOperand(0);
521 case SPIRV::OpExtension:
522 MAI.Reqs.addExtension(SPIRV::Extension::Extension(DefMO.
getImm()));
523 MAI.setSkipEmission(&
MI);
525 case SPIRV::OpCapability:
526 MAI.Reqs.addCapability(SPIRV::Capability::Capability(DefMO.
getImm()));
527 MAI.setSkipEmission(&
MI);
532 if (DefMO.
isReg() && isDeclSection(
MRI,
MI) &&
533 !
MAI.hasRegisterAlias(MF, DefMO.
getReg()))
534 visitDecl(
MRI, SignatureToGReg, GlobalToGReg, MF,
MI);
547 if (
MI.getOpcode() == SPIRV::OpDecorate) {
549 auto Dec =
MI.getOperand(1).getImm();
550 if (Dec == SPIRV::Decoration::LinkageAttributes) {
551 auto Lnk =
MI.getOperand(
MI.getNumOperands() - 1).getImm();
552 if (Lnk == SPIRV::LinkageType::Import) {
557 MAI.FuncMap[ImportedFunc] =
MAI.getRegisterAlias(
MI.getMF(), Target);
560 }
else if (
MI.getOpcode() == SPIRV::OpFunction) {
563 MCRegister GlobalReg =
MAI.getRegisterAlias(
MI.getMF(),
Reg);
565 MAI.FuncMap[
F] = GlobalReg;
574 bool Append =
true) {
577 auto FoundMI = IS.insert(std::move(MISign));
578 if (!FoundMI.second) {
579 if (
MI.getOpcode() == SPIRV::OpDecorate) {
581 "Decoration instructions must have at least 2 operands");
583 "Only OpDecorate instructions can be duplicates");
588 if (
MI.getOperand(1).getImm() != SPIRV::Decoration::FPFastMathMode)
593 if (instrToSignature(*OrigMI, MAI,
true) == MISign) {
594 assert(OrigMI->getNumOperands() ==
MI.getNumOperands() &&
595 "Original instruction must have the same number of operands");
597 OrigMI->getNumOperands() == 3 &&
598 "FPFastMathMode decoration must have 3 operands for OpDecorate");
599 unsigned OrigFlags = OrigMI->getOperand(2).getImm();
600 unsigned NewFlags =
MI.getOperand(2).getImm();
601 if (OrigFlags == NewFlags)
605 unsigned FinalFlags = OrigFlags | NewFlags;
607 <<
"Warning: Conflicting FPFastMathMode decoration flags "
609 << *OrigMI <<
"Original flags: " << OrigFlags
610 <<
", new flags: " << NewFlags
611 <<
". They will be merged on a best effort basis, but not "
612 "validated. Final flags: "
613 << FinalFlags <<
"\n";
620 assert(
false &&
"No original instruction found for the duplicate "
621 "OpDecorate, but we found one in IS.");
634void SPIRVModuleAnalysis::processOtherInstrs(
const Module &M) {
636 for (
auto F =
M.begin(),
E =
M.end();
F !=
E; ++
F) {
637 if (
F->isDeclaration())
639 MachineFunction *MF = MMI->getMachineFunction(*
F);
642 for (MachineBasicBlock &
MBB : *MF)
643 for (MachineInstr &
MI :
MBB) {
644 if (
MAI.getSkipEmission(&
MI))
646 const unsigned OpCode =
MI.getOpcode();
647 if (OpCode == SPIRV::OpString) {
649 }
else if (OpCode == SPIRV::OpExtInst &&
MI.getOperand(2).isImm() &&
650 MI.getOperand(2).getImm() ==
651 SPIRV::InstructionSet::
652 NonSemantic_Shader_DebugInfo_100) {
653 MachineOperand
Ins =
MI.getOperand(3);
654 namespace NS = SPIRV::NonSemanticExtInst;
655 static constexpr int64_t GlobalNonSemanticDITy[] = {
656 NS::DebugSource, NS::DebugCompilationUnit, NS::DebugInfoNone,
657 NS::DebugTypeBasic, NS::DebugTypePointer};
658 bool IsGlobalDI =
false;
659 for (
unsigned Idx = 0; Idx < std::size(GlobalNonSemanticDITy); ++Idx)
660 IsGlobalDI |=
Ins.getImm() == GlobalNonSemanticDITy[Idx];
663 }
else if (OpCode == SPIRV::OpName || OpCode == SPIRV::OpMemberName) {
665 }
else if (OpCode == SPIRV::OpEntryPoint) {
667 }
else if (TII->isAliasingInstr(
MI)) {
669 }
else if (TII->isDecorationInstr(
MI)) {
671 collectFuncNames(
MI, &*
F);
672 }
else if (TII->isConstantInstr(
MI)) {
676 }
else if (OpCode == SPIRV::OpFunction) {
677 collectFuncNames(
MI, &*
F);
678 }
else if (OpCode == SPIRV::OpTypeForwardPointer) {
688void SPIRVModuleAnalysis::numberRegistersGlobally(
const Module &M) {
689 for (
auto F =
M.begin(),
E =
M.end();
F !=
E; ++
F) {
690 if ((*F).isDeclaration())
692 MachineFunction *MF = MMI->getMachineFunction(*
F);
694 for (MachineBasicBlock &
MBB : *MF) {
695 for (MachineInstr &
MI :
MBB) {
696 for (MachineOperand &
Op :
MI.operands()) {
700 if (
MAI.hasRegisterAlias(MF,
Reg))
702 MCRegister NewReg =
MAI.getNextIDRegister();
703 MAI.setRegisterAlias(MF,
Reg, NewReg);
705 if (
MI.getOpcode() != SPIRV::OpExtInst)
707 auto Set =
MI.getOperand(2).getImm();
708 auto [It,
Inserted] =
MAI.ExtInstSetMap.try_emplace(Set);
710 It->second =
MAI.getNextIDRegister();
718 SPIRV::OperandCategory::OperandCategory Category, uint32_t i,
720 addRequirements(getSymbolicOperandRequirements(Category, i, ST, *
this));
723void SPIRV::RequirementHandler::recursiveAddCapabilities(
725 for (
const auto &Cap : ToPrune) {
729 recursiveAddCapabilities(ImplicitDecls);
734 for (
const auto &Cap : ToAdd) {
735 bool IsNewlyInserted = AllCaps.insert(Cap).second;
736 if (!IsNewlyInserted)
740 recursiveAddCapabilities(ImplicitDecls);
741 MinimalCaps.push_back(Cap);
746 const SPIRV::Requirements &Req) {
750 if (Req.
Cap.has_value())
751 addCapabilities({Req.
Cap.value()});
753 addExtensions(Req.
Exts);
756 if (!MaxVersion.empty() && Req.
MinVer > MaxVersion) {
758 <<
" and <= " << MaxVersion <<
"\n");
762 if (MinVersion.empty() || Req.
MinVer > MinVersion)
767 if (!MinVersion.empty() && Req.
MaxVer < MinVersion) {
769 <<
" and >= " << MinVersion <<
"\n");
773 if (MaxVersion.empty() || Req.
MaxVer < MaxVersion)
779 const SPIRVSubtarget &ST)
const {
781 bool IsSatisfiable =
true;
782 auto TargetVer =
ST.getSPIRVVersion();
784 if (!MaxVersion.empty() && !TargetVer.empty() && MaxVersion < TargetVer) {
786 dbgs() <<
"Target SPIR-V version too high for required features\n"
787 <<
"Required max version: " << MaxVersion <<
" target version "
788 << TargetVer <<
"\n");
789 IsSatisfiable =
false;
792 if (!MinVersion.empty() && !TargetVer.empty() && MinVersion > TargetVer) {
793 LLVM_DEBUG(
dbgs() <<
"Target SPIR-V version too low for required features\n"
794 <<
"Required min version: " << MinVersion
795 <<
" target version " << TargetVer <<
"\n");
796 IsSatisfiable =
false;
799 if (!MinVersion.empty() && !MaxVersion.empty() && MinVersion > MaxVersion) {
802 <<
"Version is too low for some features and too high for others.\n"
803 <<
"Required SPIR-V min version: " << MinVersion
804 <<
" required SPIR-V max version " << MaxVersion <<
"\n");
805 IsSatisfiable =
false;
808 AvoidCapabilitiesSet AvoidCaps;
810 AvoidCaps.
S.
insert(SPIRV::Capability::Shader);
812 AvoidCaps.
S.
insert(SPIRV::Capability::Kernel);
814 for (
auto Cap : MinimalCaps) {
815 if (AvailableCaps.contains(Cap) && !AvoidCaps.
S.
contains(Cap))
819 OperandCategory::CapabilityOperand, Cap)
821 IsSatisfiable =
false;
824 for (
auto Ext : AllExtensions) {
825 if (
ST.canUseExtension(Ext))
829 OperandCategory::ExtensionOperand, Ext)
831 IsSatisfiable =
false;
840 for (
const auto Cap : ToAdd)
841 if (AvailableCaps.insert(Cap).second)
843 SPIRV::OperandCategory::CapabilityOperand, Cap));
847 const Capability::Capability
ToRemove,
848 const Capability::Capability IfPresent) {
849 if (AllCaps.contains(IfPresent))
857 addAvailableCaps({Capability::Shader, Capability::Linkage, Capability::Int8,
860 if (
ST.isAtLeastSPIRVVer(VersionTuple(1, 3)))
862 Capability::GroupNonUniformVote,
863 Capability::GroupNonUniformArithmetic,
864 Capability::GroupNonUniformBallot,
865 Capability::GroupNonUniformClustered,
866 Capability::GroupNonUniformShuffle,
867 Capability::GroupNonUniformShuffleRelative});
869 if (
ST.isAtLeastSPIRVVer(VersionTuple(1, 6)))
871 Capability::DotProductInput4x8Bit,
872 Capability::DotProductInput4x8BitPacked,
873 Capability::DemoteToHelperInvocation});
876 for (
auto Extension :
ST.getAllAvailableExtensions()) {
882 if (!
ST.isShader()) {
883 initAvailableCapabilitiesForOpenCL(ST);
888 initAvailableCapabilitiesForVulkan(ST);
895void RequirementHandler::initAvailableCapabilitiesForOpenCL(
896 const SPIRVSubtarget &ST) {
899 Capability::Kernel, Capability::Vector16,
900 Capability::Groups, Capability::GenericPointer,
901 Capability::StorageImageWriteWithoutFormat,
902 Capability::StorageImageReadWithoutFormat});
903 if (
ST.hasOpenCLFullProfile())
905 if (
ST.hasOpenCLImageSupport()) {
907 Capability::Image1D, Capability::SampledBuffer,
908 Capability::ImageBuffer});
909 if (
ST.isAtLeastOpenCLVer(VersionTuple(2, 0)))
912 if (
ST.isAtLeastSPIRVVer(VersionTuple(1, 1)) &&
913 ST.isAtLeastOpenCLVer(VersionTuple(2, 2)))
915 if (
ST.isAtLeastSPIRVVer(VersionTuple(1, 4)))
916 addAvailableCaps({Capability::DenormPreserve, Capability::DenormFlushToZero,
917 Capability::SignedZeroInfNanPreserve,
918 Capability::RoundingModeRTE,
919 Capability::RoundingModeRTZ});
926void RequirementHandler::initAvailableCapabilitiesForVulkan(
927 const SPIRVSubtarget &ST) {
930 addAvailableCaps({Capability::Int64, Capability::Float16, Capability::Float64,
931 Capability::GroupNonUniform, Capability::Image1D,
932 Capability::SampledBuffer, Capability::ImageBuffer,
933 Capability::UniformBufferArrayDynamicIndexing,
934 Capability::SampledImageArrayDynamicIndexing,
935 Capability::StorageBufferArrayDynamicIndexing,
936 Capability::StorageImageArrayDynamicIndexing});
939 if (
ST.isAtLeastSPIRVVer(VersionTuple(1, 5))) {
941 {Capability::ShaderNonUniformEXT, Capability::RuntimeDescriptorArrayEXT,
942 Capability::InputAttachmentArrayDynamicIndexingEXT,
943 Capability::UniformTexelBufferArrayDynamicIndexingEXT,
944 Capability::StorageTexelBufferArrayDynamicIndexingEXT,
945 Capability::UniformBufferArrayNonUniformIndexingEXT,
946 Capability::SampledImageArrayNonUniformIndexingEXT,
947 Capability::StorageBufferArrayNonUniformIndexingEXT,
948 Capability::StorageImageArrayNonUniformIndexingEXT,
949 Capability::InputAttachmentArrayNonUniformIndexingEXT,
950 Capability::UniformTexelBufferArrayNonUniformIndexingEXT,
951 Capability::StorageTexelBufferArrayNonUniformIndexingEXT});
955 if (
ST.isAtLeastSPIRVVer(VersionTuple(1, 6)))
957 Capability::StorageImageReadWithoutFormat});
965static void addOpDecorateReqs(
const MachineInstr &
MI,
unsigned DecIndex,
968 int64_t DecOp =
MI.getOperand(DecIndex).getImm();
969 auto Dec =
static_cast<SPIRV::Decoration::Decoration
>(DecOp);
971 SPIRV::OperandCategory::DecorationOperand, Dec, ST, Reqs));
973 if (Dec == SPIRV::Decoration::BuiltIn) {
974 int64_t BuiltInOp =
MI.getOperand(DecIndex + 1).getImm();
975 auto BuiltIn =
static_cast<SPIRV::BuiltIn::BuiltIn
>(BuiltInOp);
977 SPIRV::OperandCategory::BuiltInOperand, BuiltIn, ST, Reqs));
978 }
else if (Dec == SPIRV::Decoration::LinkageAttributes) {
979 int64_t LinkageOp =
MI.getOperand(
MI.getNumOperands() - 1).getImm();
980 SPIRV::LinkageType::LinkageType LnkType =
981 static_cast<SPIRV::LinkageType::LinkageType
>(LinkageOp);
982 if (LnkType == SPIRV::LinkageType::LinkOnceODR)
983 Reqs.
addExtension(SPIRV::Extension::SPV_KHR_linkonce_odr);
984 }
else if (Dec == SPIRV::Decoration::CacheControlLoadINTEL ||
985 Dec == SPIRV::Decoration::CacheControlStoreINTEL) {
986 Reqs.
addExtension(SPIRV::Extension::SPV_INTEL_cache_controls);
987 }
else if (Dec == SPIRV::Decoration::HostAccessINTEL) {
988 Reqs.
addExtension(SPIRV::Extension::SPV_INTEL_global_variable_host_access);
989 }
else if (Dec == SPIRV::Decoration::InitModeINTEL ||
990 Dec == SPIRV::Decoration::ImplementInRegisterMapINTEL) {
992 SPIRV::Extension::SPV_INTEL_global_variable_fpga_decorations);
993 }
else if (Dec == SPIRV::Decoration::NonUniformEXT) {
995 }
else if (Dec == SPIRV::Decoration::FPMaxErrorDecorationINTEL) {
997 Reqs.
addExtension(SPIRV::Extension::SPV_INTEL_fp_max_error);
998 }
else if (Dec == SPIRV::Decoration::FPFastMathMode) {
999 if (
ST.canUseExtension(SPIRV::Extension::SPV_KHR_float_controls2)) {
1001 Reqs.
addExtension(SPIRV::Extension::SPV_KHR_float_controls2);
1010 assert(
MI.getNumOperands() >= 8 &&
"Insufficient operands for OpTypeImage");
1013 int64_t ImgFormatOp =
MI.getOperand(7).getImm();
1014 auto ImgFormat =
static_cast<SPIRV::ImageFormat::ImageFormat
>(ImgFormatOp);
1018 bool IsArrayed =
MI.getOperand(4).getImm() == 1;
1019 bool IsMultisampled =
MI.getOperand(5).getImm() == 1;
1020 bool NoSampler =
MI.getOperand(6).getImm() == 2;
1023 switch (
MI.getOperand(2).getImm()) {
1024 case SPIRV::Dim::DIM_1D:
1026 : SPIRV::Capability::Sampled1D);
1028 case SPIRV::Dim::DIM_2D:
1029 if (IsMultisampled && NoSampler)
1032 case SPIRV::Dim::DIM_Cube:
1036 : SPIRV::Capability::SampledCubeArray);
1038 case SPIRV::Dim::DIM_Rect:
1040 : SPIRV::Capability::SampledRect);
1042 case SPIRV::Dim::DIM_Buffer:
1044 : SPIRV::Capability::SampledBuffer);
1046 case SPIRV::Dim::DIM_SubpassData:
1052 if (!
ST.isShader()) {
1053 if (
MI.getNumOperands() > 8 &&
1054 MI.getOperand(8).getImm() == SPIRV::AccessQualifier::ReadWrite)
1062#define ATOM_FLT_REQ_EXT_MSG(ExtName) \
1063 "The atomic float instruction requires the following SPIR-V " \
1064 "extension: SPV_EXT_shader_atomic_float" ExtName
1069 "Expect register operand in atomic float instruction");
1070 Register TypeReg =
MI.getOperand(1).getReg();
1071 SPIRVType *TypeDef =
MI.getMF()->getRegInfo().getVRegDef(TypeReg);
1072 if (TypeDef->
getOpcode() != SPIRV::OpTypeFloat)
1074 "floating-point type scalar");
1077 unsigned Op =
MI.getOpcode();
1078 if (
Op == SPIRV::OpAtomicFAddEXT) {
1079 if (!
ST.canUseExtension(SPIRV::Extension::SPV_EXT_shader_atomic_float_add))
1081 Reqs.
addExtension(SPIRV::Extension::SPV_EXT_shader_atomic_float_add);
1084 if (!
ST.canUseExtension(
1085 SPIRV::Extension::SPV_EXT_shader_atomic_float16_add))
1087 Reqs.
addExtension(SPIRV::Extension::SPV_EXT_shader_atomic_float16_add);
1098 "Unexpected floating-point type width in atomic float instruction");
1101 if (!
ST.canUseExtension(
1102 SPIRV::Extension::SPV_EXT_shader_atomic_float_min_max))
1104 Reqs.
addExtension(SPIRV::Extension::SPV_EXT_shader_atomic_float_min_max);
1107 Reqs.
addCapability(SPIRV::Capability::AtomicFloat16MinMaxEXT);
1110 Reqs.
addCapability(SPIRV::Capability::AtomicFloat32MinMaxEXT);
1113 Reqs.
addCapability(SPIRV::Capability::AtomicFloat64MinMaxEXT);
1117 "Unexpected floating-point type width in atomic float instruction");
1123 if (ImageInst->
getOpcode() != SPIRV::OpTypeImage)
1127 return Dim == SPIRV::Dim::DIM_Buffer && Sampled == 1;
1131 if (ImageInst->
getOpcode() != SPIRV::OpTypeImage)
1135 return Dim == SPIRV::Dim::DIM_Buffer && Sampled == 2;
1139 if (ImageInst->
getOpcode() != SPIRV::OpTypeImage)
1143 return Dim != SPIRV::Dim::DIM_Buffer && Sampled == 1;
1147 if (ImageInst->
getOpcode() != SPIRV::OpTypeImage)
1151 return Dim == SPIRV::Dim::DIM_SubpassData && Sampled == 2;
1155 if (ImageInst->
getOpcode() != SPIRV::OpTypeImage)
1159 return Dim != SPIRV::Dim::DIM_Buffer && Sampled == 2;
1162bool isCombinedImageSampler(
MachineInstr *SampledImageInst) {
1163 if (SampledImageInst->
getOpcode() != SPIRV::OpTypeSampledImage)
1168 auto *ImageInst =
MRI.getUniqueVRegDef(ImageReg);
1169 return isSampledImage(ImageInst);
1173 for (
const auto &
MI :
MRI.reg_instructions(
Reg)) {
1174 if (
MI.getOpcode() != SPIRV::OpDecorate)
1178 if (Dec == SPIRV::Decoration::NonUniformEXT)
1196 if (
StorageClass != SPIRV::StorageClass::StorageClass::UniformConstant &&
1197 StorageClass != SPIRV::StorageClass::StorageClass::Uniform &&
1198 StorageClass != SPIRV::StorageClass::StorageClass::StorageBuffer) {
1203 hasNonUniformDecoration(
Instr.getOperand(0).getReg(),
MRI);
1205 auto FirstIndexReg =
Instr.getOperand(3).getReg();
1206 bool FirstIndexIsConstant =
1209 if (
StorageClass == SPIRV::StorageClass::StorageClass::StorageBuffer) {
1212 SPIRV::Capability::StorageBufferArrayNonUniformIndexingEXT);
1213 else if (!FirstIndexIsConstant)
1215 SPIRV::Capability::StorageBufferArrayDynamicIndexing);
1221 if (PointeeType->
getOpcode() != SPIRV::OpTypeImage &&
1222 PointeeType->
getOpcode() != SPIRV::OpTypeSampledImage &&
1223 PointeeType->
getOpcode() != SPIRV::OpTypeSampler) {
1227 if (isUniformTexelBuffer(PointeeType)) {
1230 SPIRV::Capability::UniformTexelBufferArrayNonUniformIndexingEXT);
1231 else if (!FirstIndexIsConstant)
1233 SPIRV::Capability::UniformTexelBufferArrayDynamicIndexingEXT);
1234 }
else if (isInputAttachment(PointeeType)) {
1237 SPIRV::Capability::InputAttachmentArrayNonUniformIndexingEXT);
1238 else if (!FirstIndexIsConstant)
1240 SPIRV::Capability::InputAttachmentArrayDynamicIndexingEXT);
1241 }
else if (isStorageTexelBuffer(PointeeType)) {
1244 SPIRV::Capability::StorageTexelBufferArrayNonUniformIndexingEXT);
1245 else if (!FirstIndexIsConstant)
1247 SPIRV::Capability::StorageTexelBufferArrayDynamicIndexingEXT);
1248 }
else if (isSampledImage(PointeeType) ||
1249 isCombinedImageSampler(PointeeType) ||
1250 PointeeType->
getOpcode() == SPIRV::OpTypeSampler) {
1253 SPIRV::Capability::SampledImageArrayNonUniformIndexingEXT);
1254 else if (!FirstIndexIsConstant)
1256 SPIRV::Capability::SampledImageArrayDynamicIndexing);
1257 }
else if (isStorageImage(PointeeType)) {
1260 SPIRV::Capability::StorageImageArrayNonUniformIndexingEXT);
1261 else if (!FirstIndexIsConstant)
1263 SPIRV::Capability::StorageImageArrayDynamicIndexing);
1267static bool isImageTypeWithUnknownFormat(
SPIRVType *TypeInst) {
1268 if (TypeInst->
getOpcode() != SPIRV::OpTypeImage)
1277 if (
ST.canUseExtension(SPIRV::Extension::SPV_KHR_integer_dot_product))
1278 Reqs.
addExtension(SPIRV::Extension::SPV_KHR_integer_dot_product);
1282 assert(
MI.getOperand(2).isReg() &&
"Unexpected operand in dot");
1286 assert(
Input->getOperand(1).isReg() &&
"Unexpected operand in dot input");
1290 if (TypeDef->
getOpcode() == SPIRV::OpTypeInt) {
1292 Reqs.
addCapability(SPIRV::Capability::DotProductInput4x8BitPacked);
1293 }
else if (TypeDef->
getOpcode() == SPIRV::OpTypeVector) {
1298 "Dot operand of 8-bit integer type requires 4 components");
1299 Reqs.
addCapability(SPIRV::Capability::DotProductInput4x8Bit);
1314 unsigned AddrSpace = ASOp.
getImm();
1315 if (AddrSpace != SPIRV::StorageClass::UniformConstant) {
1316 if (!
ST.canUseExtension(
1318 SPV_EXT_relaxed_printf_string_address_space)) {
1320 "required because printf uses a format string not "
1321 "in constant address space.",
1325 SPIRV::Extension::SPV_EXT_relaxed_printf_string_address_space);
1331static bool isBFloat16Type(
const SPIRVType *TypeDef) {
1333 TypeDef->
getOpcode() == SPIRV::OpTypeFloat &&
1342 switch (
MI.getOpcode()) {
1343 case SPIRV::OpMemoryModel: {
1344 int64_t Addr =
MI.getOperand(0).getImm();
1347 int64_t Mem =
MI.getOperand(1).getImm();
1352 case SPIRV::OpEntryPoint: {
1353 int64_t
Exe =
MI.getOperand(0).getImm();
1358 case SPIRV::OpExecutionMode:
1359 case SPIRV::OpExecutionModeId: {
1360 int64_t
Exe =
MI.getOperand(1).getImm();
1365 case SPIRV::OpTypeMatrix:
1368 case SPIRV::OpTypeInt: {
1369 unsigned BitWidth =
MI.getOperand(1).getImm();
1378 case SPIRV::OpDot: {
1381 if (isBFloat16Type(TypeDef))
1382 Reqs.
addCapability(SPIRV::Capability::BFloat16DotProductKHR);
1385 case SPIRV::OpTypeFloat: {
1386 unsigned BitWidth =
MI.getOperand(1).getImm();
1390 if (isBFloat16Type(&
MI)) {
1391 if (!
ST.canUseExtension(SPIRV::Extension::SPV_KHR_bfloat16))
1393 "following SPIR-V extension: SPV_KHR_bfloat16",
1403 case SPIRV::OpTypeVector: {
1404 unsigned NumComponents =
MI.getOperand(2).getImm();
1405 if (NumComponents == 8 || NumComponents == 16)
1409 case SPIRV::OpTypePointer: {
1410 auto SC =
MI.getOperand(1).getImm();
1421 (TypeDef->
getOpcode() == SPIRV::OpTypeFloat) &&
1426 case SPIRV::OpExtInst: {
1427 if (
MI.getOperand(2).getImm() ==
1428 static_cast<int64_t
>(
1429 SPIRV::InstructionSet::NonSemantic_Shader_DebugInfo_100)) {
1430 Reqs.
addExtension(SPIRV::Extension::SPV_KHR_non_semantic_info);
1433 if (
MI.getOperand(3).getImm() ==
1434 static_cast<int64_t
>(SPIRV::OpenCLExtInst::printf)) {
1435 addPrintfRequirements(
MI, Reqs, ST);
1442 case SPIRV::OpAliasDomainDeclINTEL:
1443 case SPIRV::OpAliasScopeDeclINTEL:
1444 case SPIRV::OpAliasScopeListDeclINTEL: {
1445 Reqs.
addExtension(SPIRV::Extension::SPV_INTEL_memory_access_aliasing);
1446 Reqs.
addCapability(SPIRV::Capability::MemoryAccessAliasingINTEL);
1449 case SPIRV::OpBitReverse:
1450 case SPIRV::OpBitFieldInsert:
1451 case SPIRV::OpBitFieldSExtract:
1452 case SPIRV::OpBitFieldUExtract:
1453 if (!
ST.canUseExtension(SPIRV::Extension::SPV_KHR_bit_instructions)) {
1457 Reqs.
addExtension(SPIRV::Extension::SPV_KHR_bit_instructions);
1460 case SPIRV::OpTypeRuntimeArray:
1463 case SPIRV::OpTypeOpaque:
1464 case SPIRV::OpTypeEvent:
1467 case SPIRV::OpTypePipe:
1468 case SPIRV::OpTypeReserveId:
1471 case SPIRV::OpTypeDeviceEvent:
1472 case SPIRV::OpTypeQueue:
1473 case SPIRV::OpBuildNDRange:
1476 case SPIRV::OpDecorate:
1477 case SPIRV::OpDecorateId:
1478 case SPIRV::OpDecorateString:
1479 addOpDecorateReqs(
MI, 1, Reqs, ST);
1481 case SPIRV::OpMemberDecorate:
1482 case SPIRV::OpMemberDecorateString:
1483 addOpDecorateReqs(
MI, 2, Reqs, ST);
1485 case SPIRV::OpInBoundsPtrAccessChain:
1488 case SPIRV::OpConstantSampler:
1491 case SPIRV::OpInBoundsAccessChain:
1492 case SPIRV::OpAccessChain:
1493 addOpAccessChainReqs(
MI, Reqs, ST);
1495 case SPIRV::OpTypeImage:
1496 addOpTypeImageReqs(
MI, Reqs, ST);
1498 case SPIRV::OpTypeSampler:
1499 if (!
ST.isShader()) {
1503 case SPIRV::OpTypeForwardPointer:
1507 case SPIRV::OpAtomicFlagTestAndSet:
1508 case SPIRV::OpAtomicLoad:
1509 case SPIRV::OpAtomicStore:
1510 case SPIRV::OpAtomicExchange:
1511 case SPIRV::OpAtomicCompareExchange:
1512 case SPIRV::OpAtomicIIncrement:
1513 case SPIRV::OpAtomicIDecrement:
1514 case SPIRV::OpAtomicIAdd:
1515 case SPIRV::OpAtomicISub:
1516 case SPIRV::OpAtomicUMin:
1517 case SPIRV::OpAtomicUMax:
1518 case SPIRV::OpAtomicSMin:
1519 case SPIRV::OpAtomicSMax:
1520 case SPIRV::OpAtomicAnd:
1521 case SPIRV::OpAtomicOr:
1522 case SPIRV::OpAtomicXor: {
1525 if (
MI.getOpcode() == SPIRV::OpAtomicStore) {
1527 InstrPtr =
MRI.getVRegDef(
MI.getOperand(3).getReg());
1528 assert(InstrPtr &&
"Unexpected type instruction for OpAtomicStore");
1533 if (TypeDef->
getOpcode() == SPIRV::OpTypeInt) {
1540 case SPIRV::OpGroupNonUniformIAdd:
1541 case SPIRV::OpGroupNonUniformFAdd:
1542 case SPIRV::OpGroupNonUniformIMul:
1543 case SPIRV::OpGroupNonUniformFMul:
1544 case SPIRV::OpGroupNonUniformSMin:
1545 case SPIRV::OpGroupNonUniformUMin:
1546 case SPIRV::OpGroupNonUniformFMin:
1547 case SPIRV::OpGroupNonUniformSMax:
1548 case SPIRV::OpGroupNonUniformUMax:
1549 case SPIRV::OpGroupNonUniformFMax:
1550 case SPIRV::OpGroupNonUniformBitwiseAnd:
1551 case SPIRV::OpGroupNonUniformBitwiseOr:
1552 case SPIRV::OpGroupNonUniformBitwiseXor:
1553 case SPIRV::OpGroupNonUniformLogicalAnd:
1554 case SPIRV::OpGroupNonUniformLogicalOr:
1555 case SPIRV::OpGroupNonUniformLogicalXor: {
1557 int64_t GroupOp =
MI.getOperand(3).getImm();
1559 case SPIRV::GroupOperation::Reduce:
1560 case SPIRV::GroupOperation::InclusiveScan:
1561 case SPIRV::GroupOperation::ExclusiveScan:
1562 Reqs.
addCapability(SPIRV::Capability::GroupNonUniformArithmetic);
1564 case SPIRV::GroupOperation::ClusteredReduce:
1565 Reqs.
addCapability(SPIRV::Capability::GroupNonUniformClustered);
1567 case SPIRV::GroupOperation::PartitionedReduceNV:
1568 case SPIRV::GroupOperation::PartitionedInclusiveScanNV:
1569 case SPIRV::GroupOperation::PartitionedExclusiveScanNV:
1570 Reqs.
addCapability(SPIRV::Capability::GroupNonUniformPartitionedNV);
1575 case SPIRV::OpGroupNonUniformShuffle:
1576 case SPIRV::OpGroupNonUniformShuffleXor:
1577 Reqs.
addCapability(SPIRV::Capability::GroupNonUniformShuffle);
1579 case SPIRV::OpGroupNonUniformShuffleUp:
1580 case SPIRV::OpGroupNonUniformShuffleDown:
1581 Reqs.
addCapability(SPIRV::Capability::GroupNonUniformShuffleRelative);
1583 case SPIRV::OpGroupAll:
1584 case SPIRV::OpGroupAny:
1585 case SPIRV::OpGroupBroadcast:
1586 case SPIRV::OpGroupIAdd:
1587 case SPIRV::OpGroupFAdd:
1588 case SPIRV::OpGroupFMin:
1589 case SPIRV::OpGroupUMin:
1590 case SPIRV::OpGroupSMin:
1591 case SPIRV::OpGroupFMax:
1592 case SPIRV::OpGroupUMax:
1593 case SPIRV::OpGroupSMax:
1596 case SPIRV::OpGroupNonUniformElect:
1599 case SPIRV::OpGroupNonUniformAll:
1600 case SPIRV::OpGroupNonUniformAny:
1601 case SPIRV::OpGroupNonUniformAllEqual:
1604 case SPIRV::OpGroupNonUniformBroadcast:
1605 case SPIRV::OpGroupNonUniformBroadcastFirst:
1606 case SPIRV::OpGroupNonUniformBallot:
1607 case SPIRV::OpGroupNonUniformInverseBallot:
1608 case SPIRV::OpGroupNonUniformBallotBitExtract:
1609 case SPIRV::OpGroupNonUniformBallotBitCount:
1610 case SPIRV::OpGroupNonUniformBallotFindLSB:
1611 case SPIRV::OpGroupNonUniformBallotFindMSB:
1612 Reqs.
addCapability(SPIRV::Capability::GroupNonUniformBallot);
1614 case SPIRV::OpSubgroupShuffleINTEL:
1615 case SPIRV::OpSubgroupShuffleDownINTEL:
1616 case SPIRV::OpSubgroupShuffleUpINTEL:
1617 case SPIRV::OpSubgroupShuffleXorINTEL:
1618 if (
ST.canUseExtension(SPIRV::Extension::SPV_INTEL_subgroups)) {
1619 Reqs.
addExtension(SPIRV::Extension::SPV_INTEL_subgroups);
1620 Reqs.
addCapability(SPIRV::Capability::SubgroupShuffleINTEL);
1623 case SPIRV::OpSubgroupBlockReadINTEL:
1624 case SPIRV::OpSubgroupBlockWriteINTEL:
1625 if (
ST.canUseExtension(SPIRV::Extension::SPV_INTEL_subgroups)) {
1626 Reqs.
addExtension(SPIRV::Extension::SPV_INTEL_subgroups);
1627 Reqs.
addCapability(SPIRV::Capability::SubgroupBufferBlockIOINTEL);
1630 case SPIRV::OpSubgroupImageBlockReadINTEL:
1631 case SPIRV::OpSubgroupImageBlockWriteINTEL:
1632 if (
ST.canUseExtension(SPIRV::Extension::SPV_INTEL_subgroups)) {
1633 Reqs.
addExtension(SPIRV::Extension::SPV_INTEL_subgroups);
1634 Reqs.
addCapability(SPIRV::Capability::SubgroupImageBlockIOINTEL);
1637 case SPIRV::OpSubgroupImageMediaBlockReadINTEL:
1638 case SPIRV::OpSubgroupImageMediaBlockWriteINTEL:
1639 if (
ST.canUseExtension(SPIRV::Extension::SPV_INTEL_media_block_io)) {
1640 Reqs.
addExtension(SPIRV::Extension::SPV_INTEL_media_block_io);
1641 Reqs.
addCapability(SPIRV::Capability::SubgroupImageMediaBlockIOINTEL);
1644 case SPIRV::OpAssumeTrueKHR:
1645 case SPIRV::OpExpectKHR:
1646 if (
ST.canUseExtension(SPIRV::Extension::SPV_KHR_expect_assume)) {
1647 Reqs.
addExtension(SPIRV::Extension::SPV_KHR_expect_assume);
1651 case SPIRV::OpPtrCastToCrossWorkgroupINTEL:
1652 case SPIRV::OpCrossWorkgroupCastToPtrINTEL:
1653 if (
ST.canUseExtension(SPIRV::Extension::SPV_INTEL_usm_storage_classes)) {
1654 Reqs.
addExtension(SPIRV::Extension::SPV_INTEL_usm_storage_classes);
1655 Reqs.
addCapability(SPIRV::Capability::USMStorageClassesINTEL);
1658 case SPIRV::OpConstantFunctionPointerINTEL:
1659 if (
ST.canUseExtension(SPIRV::Extension::SPV_INTEL_function_pointers)) {
1660 Reqs.
addExtension(SPIRV::Extension::SPV_INTEL_function_pointers);
1661 Reqs.
addCapability(SPIRV::Capability::FunctionPointersINTEL);
1664 case SPIRV::OpGroupNonUniformRotateKHR:
1665 if (!
ST.canUseExtension(SPIRV::Extension::SPV_KHR_subgroup_rotate))
1667 "following SPIR-V extension: SPV_KHR_subgroup_rotate",
1669 Reqs.
addExtension(SPIRV::Extension::SPV_KHR_subgroup_rotate);
1670 Reqs.
addCapability(SPIRV::Capability::GroupNonUniformRotateKHR);
1673 case SPIRV::OpGroupIMulKHR:
1674 case SPIRV::OpGroupFMulKHR:
1675 case SPIRV::OpGroupBitwiseAndKHR:
1676 case SPIRV::OpGroupBitwiseOrKHR:
1677 case SPIRV::OpGroupBitwiseXorKHR:
1678 case SPIRV::OpGroupLogicalAndKHR:
1679 case SPIRV::OpGroupLogicalOrKHR:
1680 case SPIRV::OpGroupLogicalXorKHR:
1681 if (
ST.canUseExtension(
1682 SPIRV::Extension::SPV_KHR_uniform_group_instructions)) {
1683 Reqs.
addExtension(SPIRV::Extension::SPV_KHR_uniform_group_instructions);
1684 Reqs.
addCapability(SPIRV::Capability::GroupUniformArithmeticKHR);
1687 case SPIRV::OpReadClockKHR:
1688 if (!
ST.canUseExtension(SPIRV::Extension::SPV_KHR_shader_clock))
1690 "following SPIR-V extension: SPV_KHR_shader_clock",
1692 Reqs.
addExtension(SPIRV::Extension::SPV_KHR_shader_clock);
1695 case SPIRV::OpFunctionPointerCallINTEL:
1696 if (
ST.canUseExtension(SPIRV::Extension::SPV_INTEL_function_pointers)) {
1697 Reqs.
addExtension(SPIRV::Extension::SPV_INTEL_function_pointers);
1698 Reqs.
addCapability(SPIRV::Capability::FunctionPointersINTEL);
1701 case SPIRV::OpAtomicFAddEXT:
1702 case SPIRV::OpAtomicFMinEXT:
1703 case SPIRV::OpAtomicFMaxEXT:
1704 AddAtomicFloatRequirements(
MI, Reqs, ST);
1706 case SPIRV::OpConvertBF16ToFINTEL:
1707 case SPIRV::OpConvertFToBF16INTEL:
1708 if (
ST.canUseExtension(SPIRV::Extension::SPV_INTEL_bfloat16_conversion)) {
1709 Reqs.
addExtension(SPIRV::Extension::SPV_INTEL_bfloat16_conversion);
1710 Reqs.
addCapability(SPIRV::Capability::BFloat16ConversionINTEL);
1713 case SPIRV::OpRoundFToTF32INTEL:
1714 if (
ST.canUseExtension(
1715 SPIRV::Extension::SPV_INTEL_tensor_float32_conversion)) {
1716 Reqs.
addExtension(SPIRV::Extension::SPV_INTEL_tensor_float32_conversion);
1717 Reqs.
addCapability(SPIRV::Capability::TensorFloat32RoundingINTEL);
1720 case SPIRV::OpVariableLengthArrayINTEL:
1721 case SPIRV::OpSaveMemoryINTEL:
1722 case SPIRV::OpRestoreMemoryINTEL:
1723 if (
ST.canUseExtension(SPIRV::Extension::SPV_INTEL_variable_length_array)) {
1724 Reqs.
addExtension(SPIRV::Extension::SPV_INTEL_variable_length_array);
1725 Reqs.
addCapability(SPIRV::Capability::VariableLengthArrayINTEL);
1728 case SPIRV::OpAsmTargetINTEL:
1729 case SPIRV::OpAsmINTEL:
1730 case SPIRV::OpAsmCallINTEL:
1731 if (
ST.canUseExtension(SPIRV::Extension::SPV_INTEL_inline_assembly)) {
1732 Reqs.
addExtension(SPIRV::Extension::SPV_INTEL_inline_assembly);
1736 case SPIRV::OpTypeCooperativeMatrixKHR: {
1737 if (!
ST.canUseExtension(SPIRV::Extension::SPV_KHR_cooperative_matrix))
1739 "OpTypeCooperativeMatrixKHR type requires the "
1740 "following SPIR-V extension: SPV_KHR_cooperative_matrix",
1742 Reqs.
addExtension(SPIRV::Extension::SPV_KHR_cooperative_matrix);
1743 Reqs.
addCapability(SPIRV::Capability::CooperativeMatrixKHR);
1746 if (isBFloat16Type(TypeDef))
1747 Reqs.
addCapability(SPIRV::Capability::BFloat16CooperativeMatrixKHR);
1750 case SPIRV::OpArithmeticFenceEXT:
1751 if (!
ST.canUseExtension(SPIRV::Extension::SPV_EXT_arithmetic_fence))
1753 "following SPIR-V extension: SPV_EXT_arithmetic_fence",
1755 Reqs.
addExtension(SPIRV::Extension::SPV_EXT_arithmetic_fence);
1758 case SPIRV::OpControlBarrierArriveINTEL:
1759 case SPIRV::OpControlBarrierWaitINTEL:
1760 if (
ST.canUseExtension(SPIRV::Extension::SPV_INTEL_split_barrier)) {
1761 Reqs.
addExtension(SPIRV::Extension::SPV_INTEL_split_barrier);
1765 case SPIRV::OpCooperativeMatrixMulAddKHR: {
1766 if (!
ST.canUseExtension(SPIRV::Extension::SPV_KHR_cooperative_matrix))
1768 "following SPIR-V extension: "
1769 "SPV_KHR_cooperative_matrix",
1771 Reqs.
addExtension(SPIRV::Extension::SPV_KHR_cooperative_matrix);
1772 Reqs.
addCapability(SPIRV::Capability::CooperativeMatrixKHR);
1773 constexpr unsigned MulAddMaxSize = 6;
1774 if (
MI.getNumOperands() != MulAddMaxSize)
1776 const int64_t CoopOperands =
MI.getOperand(MulAddMaxSize - 1).getImm();
1778 SPIRV::CooperativeMatrixOperands::MatrixAAndBTF32ComponentsINTEL) {
1779 if (!
ST.canUseExtension(SPIRV::Extension::SPV_INTEL_joint_matrix))
1781 "require the following SPIR-V extension: "
1782 "SPV_INTEL_joint_matrix",
1784 Reqs.
addExtension(SPIRV::Extension::SPV_INTEL_joint_matrix);
1786 SPIRV::Capability::CooperativeMatrixTF32ComponentTypeINTEL);
1789 MatrixAAndBBFloat16ComponentsINTEL ||
1791 SPIRV::CooperativeMatrixOperands::MatrixCBFloat16ComponentsINTEL ||
1793 MatrixResultBFloat16ComponentsINTEL) {
1794 if (!
ST.canUseExtension(SPIRV::Extension::SPV_INTEL_joint_matrix))
1796 "require the following SPIR-V extension: "
1797 "SPV_INTEL_joint_matrix",
1799 Reqs.
addExtension(SPIRV::Extension::SPV_INTEL_joint_matrix);
1801 SPIRV::Capability::CooperativeMatrixBFloat16ComponentTypeINTEL);
1805 case SPIRV::OpCooperativeMatrixLoadKHR:
1806 case SPIRV::OpCooperativeMatrixStoreKHR:
1807 case SPIRV::OpCooperativeMatrixLoadCheckedINTEL:
1808 case SPIRV::OpCooperativeMatrixStoreCheckedINTEL:
1809 case SPIRV::OpCooperativeMatrixPrefetchINTEL: {
1810 if (!
ST.canUseExtension(SPIRV::Extension::SPV_KHR_cooperative_matrix))
1812 "following SPIR-V extension: "
1813 "SPV_KHR_cooperative_matrix",
1815 Reqs.
addExtension(SPIRV::Extension::SPV_KHR_cooperative_matrix);
1816 Reqs.
addCapability(SPIRV::Capability::CooperativeMatrixKHR);
1820 std::unordered_map<unsigned, unsigned> LayoutToInstMap = {
1821 {SPIRV::OpCooperativeMatrixLoadKHR, 3},
1822 {SPIRV::OpCooperativeMatrixStoreKHR, 2},
1823 {SPIRV::OpCooperativeMatrixLoadCheckedINTEL, 5},
1824 {SPIRV::OpCooperativeMatrixStoreCheckedINTEL, 4},
1825 {SPIRV::OpCooperativeMatrixPrefetchINTEL, 4}};
1827 const auto OpCode =
MI.getOpcode();
1828 const unsigned LayoutNum = LayoutToInstMap[OpCode];
1829 Register RegLayout =
MI.getOperand(LayoutNum).getReg();
1832 if (MILayout->
getOpcode() == SPIRV::OpConstantI) {
1835 static_cast<unsigned>(SPIRV::CooperativeMatrixLayout::PackedINTEL)) {
1836 if (!
ST.canUseExtension(SPIRV::Extension::SPV_INTEL_joint_matrix))
1838 "extension: SPV_INTEL_joint_matrix",
1840 Reqs.
addExtension(SPIRV::Extension::SPV_INTEL_joint_matrix);
1841 Reqs.
addCapability(SPIRV::Capability::PackedCooperativeMatrixINTEL);
1846 if (OpCode == SPIRV::OpCooperativeMatrixLoadKHR ||
1847 OpCode == SPIRV::OpCooperativeMatrixStoreKHR)
1850 std::string InstName;
1852 case SPIRV::OpCooperativeMatrixPrefetchINTEL:
1853 InstName =
"OpCooperativeMatrixPrefetchINTEL";
1855 case SPIRV::OpCooperativeMatrixLoadCheckedINTEL:
1856 InstName =
"OpCooperativeMatrixLoadCheckedINTEL";
1858 case SPIRV::OpCooperativeMatrixStoreCheckedINTEL:
1859 InstName =
"OpCooperativeMatrixStoreCheckedINTEL";
1863 if (!
ST.canUseExtension(SPIRV::Extension::SPV_INTEL_joint_matrix)) {
1864 const std::string ErrorMsg =
1865 InstName +
" instruction requires the "
1866 "following SPIR-V extension: SPV_INTEL_joint_matrix";
1869 Reqs.
addExtension(SPIRV::Extension::SPV_INTEL_joint_matrix);
1870 if (OpCode == SPIRV::OpCooperativeMatrixPrefetchINTEL) {
1871 Reqs.
addCapability(SPIRV::Capability::CooperativeMatrixPrefetchINTEL);
1875 SPIRV::Capability::CooperativeMatrixCheckedInstructionsINTEL);
1878 case SPIRV::OpCooperativeMatrixConstructCheckedINTEL:
1879 if (!
ST.canUseExtension(SPIRV::Extension::SPV_INTEL_joint_matrix))
1881 "instructions require the following SPIR-V extension: "
1882 "SPV_INTEL_joint_matrix",
1884 Reqs.
addExtension(SPIRV::Extension::SPV_INTEL_joint_matrix);
1886 SPIRV::Capability::CooperativeMatrixCheckedInstructionsINTEL);
1888 case SPIRV::OpCooperativeMatrixGetElementCoordINTEL:
1889 if (!
ST.canUseExtension(SPIRV::Extension::SPV_INTEL_joint_matrix))
1891 "following SPIR-V extension: SPV_INTEL_joint_matrix",
1893 Reqs.
addExtension(SPIRV::Extension::SPV_INTEL_joint_matrix);
1895 SPIRV::Capability::CooperativeMatrixInvocationInstructionsINTEL);
1897 case SPIRV::OpConvertHandleToImageINTEL:
1898 case SPIRV::OpConvertHandleToSamplerINTEL:
1899 case SPIRV::OpConvertHandleToSampledImageINTEL: {
1900 if (!
ST.canUseExtension(SPIRV::Extension::SPV_INTEL_bindless_images))
1902 "instructions require the following SPIR-V extension: "
1903 "SPV_INTEL_bindless_images",
1906 SPIRV::AddressingModel::AddressingModel AddrModel = MAI.
Addr;
1908 if (
MI.getOpcode() == SPIRV::OpConvertHandleToImageINTEL &&
1909 TyDef->
getOpcode() != SPIRV::OpTypeImage) {
1911 "OpConvertHandleToImageINTEL",
1913 }
else if (
MI.getOpcode() == SPIRV::OpConvertHandleToSamplerINTEL &&
1914 TyDef->
getOpcode() != SPIRV::OpTypeSampler) {
1916 "OpConvertHandleToSamplerINTEL",
1918 }
else if (
MI.getOpcode() == SPIRV::OpConvertHandleToSampledImageINTEL &&
1919 TyDef->
getOpcode() != SPIRV::OpTypeSampledImage) {
1921 "OpConvertHandleToSampledImageINTEL",
1926 if (!(Bitwidth == 32 && AddrModel == SPIRV::AddressingModel::Physical32) &&
1927 !(Bitwidth == 64 && AddrModel == SPIRV::AddressingModel::Physical64)) {
1929 "Parameter value must be a 32-bit scalar in case of "
1930 "Physical32 addressing model or a 64-bit scalar in case of "
1931 "Physical64 addressing model",
1934 Reqs.
addExtension(SPIRV::Extension::SPV_INTEL_bindless_images);
1938 case SPIRV::OpSubgroup2DBlockLoadINTEL:
1939 case SPIRV::OpSubgroup2DBlockLoadTransposeINTEL:
1940 case SPIRV::OpSubgroup2DBlockLoadTransformINTEL:
1941 case SPIRV::OpSubgroup2DBlockPrefetchINTEL:
1942 case SPIRV::OpSubgroup2DBlockStoreINTEL: {
1943 if (!
ST.canUseExtension(SPIRV::Extension::SPV_INTEL_2d_block_io))
1945 "Prefetch/Store]INTEL instructions require the "
1946 "following SPIR-V extension: SPV_INTEL_2d_block_io",
1948 Reqs.
addExtension(SPIRV::Extension::SPV_INTEL_2d_block_io);
1949 Reqs.
addCapability(SPIRV::Capability::Subgroup2DBlockIOINTEL);
1951 const auto OpCode =
MI.getOpcode();
1952 if (OpCode == SPIRV::OpSubgroup2DBlockLoadTransposeINTEL) {
1953 Reqs.
addCapability(SPIRV::Capability::Subgroup2DBlockTransposeINTEL);
1956 if (OpCode == SPIRV::OpSubgroup2DBlockLoadTransformINTEL) {
1957 Reqs.
addCapability(SPIRV::Capability::Subgroup2DBlockTransformINTEL);
1962 case SPIRV::OpKill: {
1965 case SPIRV::OpDemoteToHelperInvocation:
1966 Reqs.
addCapability(SPIRV::Capability::DemoteToHelperInvocation);
1968 if (
ST.canUseExtension(
1969 SPIRV::Extension::SPV_EXT_demote_to_helper_invocation)) {
1972 SPIRV::Extension::SPV_EXT_demote_to_helper_invocation);
1977 case SPIRV::OpSUDot:
1978 case SPIRV::OpSDotAccSat:
1979 case SPIRV::OpUDotAccSat:
1980 case SPIRV::OpSUDotAccSat:
1981 AddDotProductRequirements(
MI, Reqs, ST);
1983 case SPIRV::OpImageRead: {
1984 Register ImageReg =
MI.getOperand(2).getReg();
1985 SPIRVType *TypeDef =
ST.getSPIRVGlobalRegistry()->getResultType(
1993 if (isImageTypeWithUnknownFormat(TypeDef) &&
ST.isShader())
1994 Reqs.
addCapability(SPIRV::Capability::StorageImageReadWithoutFormat);
1997 case SPIRV::OpImageWrite: {
1998 Register ImageReg =
MI.getOperand(0).getReg();
1999 SPIRVType *TypeDef =
ST.getSPIRVGlobalRegistry()->getResultType(
2007 if (isImageTypeWithUnknownFormat(TypeDef) &&
ST.isShader())
2008 Reqs.
addCapability(SPIRV::Capability::StorageImageWriteWithoutFormat);
2011 case SPIRV::OpTypeStructContinuedINTEL:
2012 case SPIRV::OpConstantCompositeContinuedINTEL:
2013 case SPIRV::OpSpecConstantCompositeContinuedINTEL:
2014 case SPIRV::OpCompositeConstructContinuedINTEL: {
2015 if (!
ST.canUseExtension(SPIRV::Extension::SPV_INTEL_long_composites))
2017 "Continued instructions require the "
2018 "following SPIR-V extension: SPV_INTEL_long_composites",
2020 Reqs.
addExtension(SPIRV::Extension::SPV_INTEL_long_composites);
2024 case SPIRV::OpSubgroupMatrixMultiplyAccumulateINTEL: {
2025 if (!
ST.canUseExtension(
2026 SPIRV::Extension::SPV_INTEL_subgroup_matrix_multiply_accumulate))
2028 "OpSubgroupMatrixMultiplyAccumulateINTEL instruction requires the "
2030 "extension: SPV_INTEL_subgroup_matrix_multiply_accumulate",
2033 SPIRV::Extension::SPV_INTEL_subgroup_matrix_multiply_accumulate);
2035 SPIRV::Capability::SubgroupMatrixMultiplyAccumulateINTEL);
2038 case SPIRV::OpBitwiseFunctionINTEL: {
2039 if (!
ST.canUseExtension(
2040 SPIRV::Extension::SPV_INTEL_ternary_bitwise_function))
2042 "OpBitwiseFunctionINTEL instruction requires the following SPIR-V "
2043 "extension: SPV_INTEL_ternary_bitwise_function",
2045 Reqs.
addExtension(SPIRV::Extension::SPV_INTEL_ternary_bitwise_function);
2046 Reqs.
addCapability(SPIRV::Capability::TernaryBitwiseFunctionINTEL);
2049 case SPIRV::OpCopyMemorySized: {
2054 case SPIRV::OpPredicatedLoadINTEL:
2055 case SPIRV::OpPredicatedStoreINTEL: {
2056 if (!
ST.canUseExtension(SPIRV::Extension::SPV_INTEL_predicated_io))
2058 "OpPredicated[Load/Store]INTEL instructions require "
2059 "the following SPIR-V extension: SPV_INTEL_predicated_io",
2061 Reqs.
addExtension(SPIRV::Extension::SPV_INTEL_predicated_io);
2065 case SPIRV::OpFAddS:
2066 case SPIRV::OpFSubS:
2067 case SPIRV::OpFMulS:
2068 case SPIRV::OpFDivS:
2069 case SPIRV::OpFRemS:
2071 case SPIRV::OpFNegate:
2072 case SPIRV::OpFAddV:
2073 case SPIRV::OpFSubV:
2074 case SPIRV::OpFMulV:
2075 case SPIRV::OpFDivV:
2076 case SPIRV::OpFRemV:
2077 case SPIRV::OpFNegateV: {
2080 if (TypeDef->
getOpcode() == SPIRV::OpTypeVector)
2082 if (isBFloat16Type(TypeDef)) {
2083 if (!
ST.canUseExtension(SPIRV::Extension::SPV_INTEL_bfloat16_arithmetic))
2085 "Arithmetic instructions with bfloat16 arguments require the "
2086 "following SPIR-V extension: SPV_INTEL_bfloat16_arithmetic",
2088 Reqs.
addExtension(SPIRV::Extension::SPV_INTEL_bfloat16_arithmetic);
2089 Reqs.
addCapability(SPIRV::Capability::BFloat16ArithmeticINTEL);
2093 case SPIRV::OpOrdered:
2094 case SPIRV::OpUnordered:
2095 case SPIRV::OpFOrdEqual:
2096 case SPIRV::OpFOrdNotEqual:
2097 case SPIRV::OpFOrdLessThan:
2098 case SPIRV::OpFOrdLessThanEqual:
2099 case SPIRV::OpFOrdGreaterThan:
2100 case SPIRV::OpFOrdGreaterThanEqual:
2101 case SPIRV::OpFUnordEqual:
2102 case SPIRV::OpFUnordNotEqual:
2103 case SPIRV::OpFUnordLessThan:
2104 case SPIRV::OpFUnordLessThanEqual:
2105 case SPIRV::OpFUnordGreaterThan:
2106 case SPIRV::OpFUnordGreaterThanEqual: {
2110 if (TypeDef->
getOpcode() == SPIRV::OpTypeVector)
2112 if (isBFloat16Type(TypeDef)) {
2113 if (!
ST.canUseExtension(SPIRV::Extension::SPV_INTEL_bfloat16_arithmetic))
2115 "Relational instructions with bfloat16 arguments require the "
2116 "following SPIR-V extension: SPV_INTEL_bfloat16_arithmetic",
2118 Reqs.
addExtension(SPIRV::Extension::SPV_INTEL_bfloat16_arithmetic);
2119 Reqs.
addCapability(SPIRV::Capability::BFloat16ArithmeticINTEL);
2131 SPIRV::Capability::Shader);
2137 for (
auto F = M.begin(),
E = M.end();
F !=
E; ++
F) {
2143 addInstrRequirements(
MI, MAI, ST);
2146 auto Node = M.getNamedMetadata(
"spirv.ExecutionMode");
2148 bool RequireFloatControls =
false, RequireIntelFloatControls2 =
false,
2149 RequireKHRFloatControls2 =
false,
2151 bool HasIntelFloatControls2 =
2152 ST.canUseExtension(SPIRV::Extension::SPV_INTEL_float_controls2);
2153 bool HasKHRFloatControls2 =
2154 ST.canUseExtension(SPIRV::Extension::SPV_KHR_float_controls2);
2155 for (
unsigned i = 0; i <
Node->getNumOperands(); i++) {
2161 auto EM =
Const->getZExtValue();
2165 case SPIRV::ExecutionMode::DenormPreserve:
2166 case SPIRV::ExecutionMode::DenormFlushToZero:
2167 case SPIRV::ExecutionMode::RoundingModeRTE:
2168 case SPIRV::ExecutionMode::RoundingModeRTZ:
2169 RequireFloatControls = VerLower14;
2171 SPIRV::OperandCategory::ExecutionModeOperand, EM, ST);
2173 case SPIRV::ExecutionMode::RoundingModeRTPINTEL:
2174 case SPIRV::ExecutionMode::RoundingModeRTNINTEL:
2175 case SPIRV::ExecutionMode::FloatingPointModeALTINTEL:
2176 case SPIRV::ExecutionMode::FloatingPointModeIEEEINTEL:
2177 if (HasIntelFloatControls2) {
2178 RequireIntelFloatControls2 =
true;
2180 SPIRV::OperandCategory::ExecutionModeOperand, EM, ST);
2183 case SPIRV::ExecutionMode::FPFastMathDefault: {
2184 if (HasKHRFloatControls2) {
2185 RequireKHRFloatControls2 =
true;
2187 SPIRV::OperandCategory::ExecutionModeOperand, EM, ST);
2191 case SPIRV::ExecutionMode::ContractionOff:
2192 case SPIRV::ExecutionMode::SignedZeroInfNanPreserve:
2193 if (HasKHRFloatControls2) {
2194 RequireKHRFloatControls2 =
true;
2196 SPIRV::OperandCategory::ExecutionModeOperand,
2197 SPIRV::ExecutionMode::FPFastMathDefault, ST);
2200 SPIRV::OperandCategory::ExecutionModeOperand, EM, ST);
2205 SPIRV::OperandCategory::ExecutionModeOperand, EM, ST);
2210 if (RequireFloatControls &&
2211 ST.canUseExtension(SPIRV::Extension::SPV_KHR_float_controls))
2213 if (RequireIntelFloatControls2)
2215 if (RequireKHRFloatControls2)
2218 for (
auto FI = M.begin(),
E = M.end(); FI !=
E; ++FI) {
2220 if (
F.isDeclaration())
2222 if (
F.getMetadata(
"reqd_work_group_size"))
2224 SPIRV::OperandCategory::ExecutionModeOperand,
2225 SPIRV::ExecutionMode::LocalSize, ST);
2226 if (
F.getFnAttribute(
"hlsl.numthreads").isValid()) {
2228 SPIRV::OperandCategory::ExecutionModeOperand,
2229 SPIRV::ExecutionMode::LocalSize, ST);
2231 if (
F.getFnAttribute(
"enable-maximal-reconvergence").getValueAsBool()) {
2234 if (
F.getMetadata(
"work_group_size_hint"))
2236 SPIRV::OperandCategory::ExecutionModeOperand,
2237 SPIRV::ExecutionMode::LocalSizeHint, ST);
2238 if (
F.getMetadata(
"intel_reqd_sub_group_size"))
2240 SPIRV::OperandCategory::ExecutionModeOperand,
2241 SPIRV::ExecutionMode::SubgroupSize, ST);
2242 if (
F.getMetadata(
"max_work_group_size"))
2244 SPIRV::OperandCategory::ExecutionModeOperand,
2245 SPIRV::ExecutionMode::MaxWorkgroupSizeINTEL, ST);
2246 if (
F.getMetadata(
"vec_type_hint"))
2248 SPIRV::OperandCategory::ExecutionModeOperand,
2249 SPIRV::ExecutionMode::VecTypeHint, ST);
2251 if (
F.hasOptNone()) {
2252 if (
ST.canUseExtension(SPIRV::Extension::SPV_INTEL_optnone)) {
2255 }
else if (
ST.canUseExtension(SPIRV::Extension::SPV_EXT_optnone)) {
2265 unsigned Flags = SPIRV::FPFastMathMode::None;
2266 bool CanUseKHRFloatControls2 =
2267 ST.canUseExtension(SPIRV::Extension::SPV_KHR_float_controls2);
2269 Flags |= SPIRV::FPFastMathMode::NotNaN;
2271 Flags |= SPIRV::FPFastMathMode::NotInf;
2273 Flags |= SPIRV::FPFastMathMode::NSZ;
2275 Flags |= SPIRV::FPFastMathMode::AllowRecip;
2277 Flags |= SPIRV::FPFastMathMode::AllowContract;
2279 if (CanUseKHRFloatControls2)
2287 Flags |= SPIRV::FPFastMathMode::NotNaN | SPIRV::FPFastMathMode::NotInf |
2288 SPIRV::FPFastMathMode::NSZ | SPIRV::FPFastMathMode::AllowRecip |
2289 SPIRV::FPFastMathMode::AllowTransform |
2290 SPIRV::FPFastMathMode::AllowReassoc |
2291 SPIRV::FPFastMathMode::AllowContract;
2293 Flags |= SPIRV::FPFastMathMode::Fast;
2296 if (CanUseKHRFloatControls2) {
2298 assert(!(Flags & SPIRV::FPFastMathMode::Fast) &&
2299 "SPIRV::FPFastMathMode::Fast is deprecated and should not be used "
2304 assert((!(Flags & SPIRV::FPFastMathMode::AllowTransform) ||
2305 ((Flags & SPIRV::FPFastMathMode::AllowReassoc &&
2306 Flags & SPIRV::FPFastMathMode::AllowContract))) &&
2307 "SPIRV::FPFastMathMode::AllowTransform requires AllowReassoc and "
2308 "AllowContract flags to be enabled as well.");
2319 return ST.canUseExtension(SPIRV::Extension::SPV_KHR_float_controls2);
2322static void handleMIFlagDecoration(
2327 getSymbolicOperandRequirements(SPIRV::OperandCategory::DecorationOperand,
2328 SPIRV::Decoration::NoSignedWrap, ST, Reqs)
2331 SPIRV::Decoration::NoSignedWrap, {});
2334 getSymbolicOperandRequirements(SPIRV::OperandCategory::DecorationOperand,
2335 SPIRV::Decoration::NoUnsignedWrap, ST,
2339 SPIRV::Decoration::NoUnsignedWrap, {});
2341 if (!
TII.canUseFastMathFlags(
2342 I,
ST.canUseExtension(SPIRV::Extension::SPV_KHR_float_controls2)))
2345 unsigned FMFlags = getFastMathFlags(
I, ST);
2346 if (FMFlags == SPIRV::FPFastMathMode::None) {
2349 if (FPFastMathDefaultInfoVec.
empty())
2365 assert(
I.getNumOperands() >= 3 &&
"Expected at least 3 operands");
2366 Register ResReg =
I.getOpcode() == SPIRV::OpExtInst
2367 ?
I.getOperand(1).getReg()
2368 :
I.getOperand(2).getReg();
2376 if (Ty == Elem.Ty) {
2377 FMFlags = Elem.FastMathFlags;
2378 Emit = Elem.ContractionOff || Elem.SignedZeroInfNanPreserve ||
2379 Elem.FPFastMathDefault;
2384 if (FMFlags == SPIRV::FPFastMathMode::None && !Emit)
2387 if (isFastMathModeAvailable(ST)) {
2388 Register DstReg =
I.getOperand(0).getReg();
2399 for (
auto F = M.begin(),
E = M.end();
F !=
E; ++
F) {
2404 for (
auto &
MBB : *MF)
2405 for (
auto &
MI :
MBB)
2406 handleMIFlagDecoration(
MI, ST,
TII, MAI.
Reqs, GR,
2414 for (
auto F = M.begin(),
E = M.end();
F !=
E; ++
F) {
2419 for (
auto &
MBB : *MF) {
2420 if (!
MBB.hasName() ||
MBB.empty())
2424 MRI.setRegClass(
Reg, &SPIRV::IDRegClass);
2435 for (
auto F = M.begin(),
E = M.end();
F !=
E; ++
F) {
2439 for (
auto &
MBB : *MF) {
2441 MI.setDesc(
TII.get(SPIRV::OpPhi));
2444 MI.insert(
MI.operands_begin() + 1,
2445 {MachineOperand::CreateReg(ResTypeReg, false)});
2464 SPIRV::FPFastMathMode::None);
2466 SPIRV::FPFastMathMode::None);
2468 SPIRV::FPFastMathMode::None);
2475 size_t BitWidth = Ty->getScalarSizeInBits();
2479 assert(Index >= 0 && Index < 3 &&
2480 "Expected FPFastMathDefaultInfo for half, float, or double");
2481 assert(FPFastMathDefaultInfoVec.
size() == 3 &&
2482 "Expected FPFastMathDefaultInfoVec to have exactly 3 elements");
2483 return FPFastMathDefaultInfoVec[Index];
2486static void collectFPFastMathDefaults(
const Module &M,
2489 if (!
ST.canUseExtension(SPIRV::Extension::SPV_KHR_float_controls2))
2498 auto Node = M.getNamedMetadata(
"spirv.ExecutionMode");
2502 for (
unsigned i = 0; i <
Node->getNumOperands(); i++) {
2511 if (EM == SPIRV::ExecutionMode::FPFastMathDefault) {
2513 "Expected 4 operands for FPFastMathDefault");
2524 Info.FastMathFlags = Flags;
2525 Info.FPFastMathDefault =
true;
2526 }
else if (EM == SPIRV::ExecutionMode::ContractionOff) {
2528 "Expected no operands for ContractionOff");
2535 Info.ContractionOff =
true;
2537 }
else if (EM == SPIRV::ExecutionMode::SignedZeroInfNanPreserve) {
2539 "Expected 1 operand for SignedZeroInfNanPreserve");
2540 unsigned TargetWidth =
2549 assert(Index >= 0 && Index < 3 &&
2550 "Expected FPFastMathDefaultInfo for half, float, or double");
2551 assert(FPFastMathDefaultInfoVec.
size() == 3 &&
2552 "Expected FPFastMathDefaultInfoVec to have exactly 3 elements");
2553 FPFastMathDefaultInfoVec[Index].SignedZeroInfNanPreserve =
true;