26#include "llvm/IR/IntrinsicsDirectX.h"
83 case Intrinsic::dx_wave_is_first_lane:
84 case Intrinsic::dx_wave_getlaneindex:
85 case Intrinsic::dx_wave_any:
86 case Intrinsic::dx_wave_all_equal:
87 case Intrinsic::dx_wave_all:
88 case Intrinsic::dx_wave_readlane:
89 case Intrinsic::dx_wave_active_countbits:
90 case Intrinsic::dx_wave_ballot:
91 case Intrinsic::dx_wave_prefix_bit_count:
93 case Intrinsic::dx_wave_reduce_or:
94 case Intrinsic::dx_wave_reduce_xor:
95 case Intrinsic::dx_wave_reduce_and:
96 case Intrinsic::dx_wave_reduce_sum:
97 case Intrinsic::dx_wave_reduce_usum:
98 case Intrinsic::dx_wave_product:
99 case Intrinsic::dx_wave_uproduct:
100 case Intrinsic::dx_wave_reduce_max:
101 case Intrinsic::dx_wave_reduce_umax:
102 case Intrinsic::dx_wave_reduce_min:
103 case Intrinsic::dx_wave_reduce_umin:
105 case Intrinsic::dx_wave_prefix_sum:
106 case Intrinsic::dx_wave_prefix_usum:
107 case Intrinsic::dx_wave_prefix_product:
108 case Intrinsic::dx_wave_prefix_uproduct:
110 case Intrinsic::dx_quad_read_across_x:
111 case Intrinsic::dx_quad_read_across_y:
112 case Intrinsic::dx_quad_read_across_diagonal:
129 return Flag->getValue().getBoolValue();
138 assert(IID == Intrinsic::dx_resource_load_typedbuffer ||
139 IID == Intrinsic::dx_resource_load_rawbuffer &&
140 "unexpected intrinsic ID");
141 for (
const User *U :
II.users()) {
145 if (EVI->getNumIndices() == 1 && EVI->getIndices()[0] == 1)
161 CSF.Doubles =
I.getType()->getScalarType()->isDoubleTy();
164 for (
const Value *
Op :
I.operands()) {
165 if (
Op->getType()->getScalarType()->isDoubleTy()) {
173 switch (
I.getOpcode()) {
174 case Instruction::FDiv:
175 case Instruction::UIToFP:
176 case Instruction::SIToFP:
177 case Instruction::FPToUI:
178 case Instruction::FPToSI:
179 CSF.DX11_1_DoubleExtensions =
true;
184 if (!CSF.LowPrecisionPresent)
185 CSF.LowPrecisionPresent =
I.getType()->getScalarType()->isIntegerTy(16) ||
186 I.getType()->getScalarType()->isHalfTy();
188 if (!CSF.LowPrecisionPresent) {
189 for (
const Value *
Op :
I.operands()) {
190 if (
Op->getType()->getScalarType()->isIntegerTy(16) ||
191 Op->getType()->getScalarType()->isHalfTy()) {
192 CSF.LowPrecisionPresent =
true;
198 if (CSF.LowPrecisionPresent) {
199 if (CSF.NativeLowPrecisionMode)
200 CSF.NativeLowPrecision =
true;
202 CSF.MinimumPrecision =
true;
206 CSF.Int64Ops =
I.getType()->getScalarType()->isIntegerTy(64);
209 for (
const Value *
Op :
I.operands()) {
210 if (
Op->getType()->getScalarType()->isIntegerTy(64)) {
218 switch (
II->getIntrinsicID()) {
221 case Intrinsic::dx_resource_handlefrombinding: {
226 if (!CSF.ResMayNotAlias && CanSetResMayNotAlias &&
228 CSF.ResMayNotAlias =
true;
233 CSF.EnableRawAndStructuredBuffers =
true;
240 case Intrinsic::dx_resource_load_typedbuffer: {
241 dxil::ResourceTypeInfo &RTI =
246 CSF.TiledResources =
true;
249 case Intrinsic::dx_resource_load_rawbuffer: {
251 CSF.TiledResources =
true;
258 const Function *CF = CI->getCalledFunction();
260 if (FunctionFlags.contains(CF))
261 CSF.
merge(FunctionFlags[CF]);
263 CSF.DX11_1_DoubleExtensions |=
271ModuleShaderFlags::gatherGlobalModuleFlags(
const Module &M,
272 const DXILResourceMap &DRM,
275 ComputedShaderFlags CSF;
282 uint32_t NumUAVs = 0;
287 uint32_t
Size =
UAV.getBinding().Size;
288 uint32_t NewNum = NumUAVs + (
Size == 0 ? ~0
U :
Size);
289 if (NewNum < NumUAVs)
294 CSF.Max64UAVs =
true;
304 M.getModuleFlag(
"dx.nativelowprec")))
306 CSF.NativeLowPrecisionMode = NativeLowPrec->getValue().getBoolValue();
311 CSF.ResMayNotAlias = !DRM.
uavs().
empty();
316 M.getModuleFlag(
"dx.allresourcesbound")))
317 if (AllResourcesBound->getValue().getBoolValue())
318 CSF.AllResourcesBound =
true;
332 M.getModuleFlag(
"dx.resmayalias")))
333 if (ResMayAlias->getValue().getBoolValue())
334 CanSetResMayNotAlias =
false;
344 const std::vector<CallGraphNode *> &CurSCC = *SCCI;
356 if (
F->isDeclaration()) {
357 assert(!
F->getName().starts_with(
"dx.op.") &&
358 "DXIL Shader Flag analysis should not be run post-lowering.");
363 for (
const auto &BB : *
F)
364 for (
const auto &
I : BB)
365 updateFunctionFlags(CSF,
I, DRTM, MMDI);
373 CombinedSFMask.merge(SCCSF);
381 FunctionFlags[
F].merge(SCCSF);
387 OS <<
formatv(
"; Shader Flags Value: {0:x8}\n;\n", FlagVal);
390 OS <<
"; Note: shader requires additional functionality:\n";
391#define SHADER_FEATURE_FLAG(FeatureBit, DxilModuleNum, FlagName, Str) \
393 (OS << ";").indent(7) << Str << "\n";
394#include "llvm/BinaryFormat/DXContainerConstants.def"
395 OS <<
"; Note: extra DXIL module flags:\n";
396#define DXIL_MODULE_FLAG(DxilModuleBit, FlagName, Str) \
398 (OS << ";").indent(7) << Str << "\n";
399#include "llvm/BinaryFormat/DXContainerConstants.def"
406 auto Iter = FunctionFlags.find(Func);
407 assert((Iter != FunctionFlags.end() && Iter->first == Func) &&
408 "Get Shader Flags : No Shader Flags Mask exists for function");
434 OS <<
"; Combined Shader Flags for Module\n";
437 OS <<
"; Shader Flags for Module Functions\n";
438 for (
const auto &
F : M.getFunctionList()) {
439 if (
F.isDeclaration())
442 OS <<
formatv(
"; Function {0} : {1:x8}\n;\n",
F.getName(),
460 MSFI.initialize(M, DRTM, DRM, MMDI);
474 "DXIL Shader Flag Analysis",
true,
true)
assert(UImm &&(UImm !=~static_cast< T >(0)) &&"Invalid immediate!")
This file contains the simple types necessary to represent the attributes associated with functions a...
This file provides interfaces used to build and manipulate a call graph, which is a very useful tool ...
bool checkIfStatusIsExtracted(const IntrinsicInst &II)
static bool isOptimizationDisabled(const Module &M)
static bool hasUAVsAtEveryStage(const DXILResourceMap &DRM, const ModuleMetadataInfo &MMDI)
static bool checkDoubleExtensionOps(Intrinsic::ID IID)
static bool checkWaveOps(Intrinsic::ID IID)
Module.h This file contains the declarations for the Module class.
Machine Check Debug Module
uint64_t IntrinsicInst * II
#define INITIALIZE_PASS_DEPENDENCY(depName)
#define INITIALIZE_PASS_END(passName, arg, name, cfg, analysis)
#define INITIALIZE_PASS_BEGIN(passName, arg, name, cfg, analysis)
This builds on the llvm/ADT/GraphTraits.h file to find the strongly connected components (SCCs) of a ...
This file defines the SmallVector class.
PassT::Result & getResult(IRUnitT &IR, ExtraArgTs... ExtraArgs)
Get the result of an analysis pass for a given IR unit.
Represent the analysis usage information of a pass.
AnalysisUsage & addRequired()
void setPreservesAll()
Set by analyses that do not transform their input at all.
AnalysisUsage & addRequiredTransitive()
A node in the call graph for a module.
The basic data container for the call graph of a Module of IR.
iterator_range< iterator > uavs()
A wrapper class for inspecting calls to intrinsic functions.
A Module instance is used to store all the information related to an LLVM module.
AnalysisType & getAnalysis() const
getAnalysis<AnalysisType>() - This function is used by subclasses to get to the analysis information ...
A set of analyses that are preserved following a run of a transformation pass.
static PreservedAnalyses all()
Construct a special preserved set that preserves all passes.
void push_back(const T &Elt)
This is a 'vector' (really, a variable-sized array), optimized for the case when the array is small.
Represent a constant reference to a string, i.e.
Represents a version number in the form major[.minor[.subminor[.build]]].
LLVM_ABI bool isUAV() const
LLVM_ABI bool isTyped() const
LLVM_ABI TypedInfo getTyped() const
dxil::ResourceKind getResourceKind() const
PreservedAnalyses run(Module &M, ModuleAnalysisManager &AM)
Wrapper pass for the legacy pass manager.
void getAnalysisUsage(AnalysisUsage &AU) const override
getAnalysisUsage - This function should be overriden by passes that need analysis information to do t...
bool runOnModule(Module &M) override
runOnModule - Virtual method overriden by subclasses to process the module being operated on.
ModuleShaderFlags run(Module &M, ModuleAnalysisManager &AM)
This class implements an extremely fast bulk output stream that can only output to a stream.
Enumerate the SCCs of a directed graph in reverse topological order of the SCC DAG.
bool isAtEnd() const
Direct loop termination test which is more efficient than comparison with end().
std::enable_if_t< detail::IsValidPointer< X, Y >::value, X * > extract_or_null(Y &&MD)
Extract a Value from Metadata, allowing null.
This is an optimization pass for GlobalISel generic memory operations.
FunctionAddr VTableAddr Value
decltype(auto) dyn_cast(const From &Val)
dyn_cast<X> - Return the argument parameter cast to the specified type.
scc_iterator< T > scc_begin(const T &G)
Construct the begin iterator for a deduced graph type T.
auto formatv(bool Validate, const char *Fmt, Ts &&...Vals)
bool isa(const From &Val)
isa<X> - Return true if the parameter to the template is an instance of one of the template type argu...
LLVM_ATTRIBUTE_VISIBILITY_DEFAULT AnalysisKey InnerAnalysisManagerProxy< AnalysisManagerT, IRUnitT, ExtraArgTs... >::Key
DWARFExpression::Operation Op
decltype(auto) cast(const From &Val)
cast<X> - Return the argument parameter cast to the specified type.
AnalysisManager< Module > ModuleAnalysisManager
Convenience typedef for the Module analysis manager.
A special type used by analysis passes to provide an address that identifies that particular analysis...
void merge(const ComputedShaderFlags CSF)
void print(raw_ostream &OS=dbgs()) const
const ComputedShaderFlags & getFunctionFlags(const Function *) const
Return the shader flags mask of the specified function Func.
void initialize(Module &, DXILResourceTypeMap &DRTM, const DXILResourceMap &DRM, const ModuleMetadataInfo &MMDI)
Construct ModuleShaderFlags for module Module M.
const ComputedShaderFlags & getCombinedFlags() const