23#include "llvm/IR/IntrinsicsDirectX.h"
30#define DEBUG_TYPE "dxil-resource-access"
43 for (
auto *Handle : Handles) {
44 std::string HandleStr;
46 Handle->print(HandleOS);
51 "Resource access is not guaranteed to map to a unique global resource"));
60 assert(
II->getIntrinsicID() == Intrinsic::dx_resource_getpointer &&
61 "Resource access through unexpected intrinsic");
62 return Offset ?
Offset : ConstantInt::get(Builder.getInt32Ty(), 0);
66 assert(
GEP &&
"Resource access through unexpected instruction");
68 unsigned NumIndices =
GEP->getNumIndices();
69 uint64_t IndexScale =
DL.getTypeAllocSize(
GEP->getSourceElementType());
70 APInt ConstantOffset(
DL.getIndexTypeSizeInBits(
GEP->getType()), 0);
72 if (
GEP->accumulateConstantOffset(
DL, ConstantOffset)) {
75 ConstantInt::get(
DL.getIndexType(
GEP->getType()), ConstantOffset);
77 }
else if (NumIndices == 1) {
80 GEPOffset = *
GEP->idx_begin();
81 }
else if (NumIndices == 2) {
83 auto *IndexIt =
GEP->idx_begin();
85 "GEP is not indexing through pointer");
86 GEPOffset = *(++IndexIt);
91 if (!(IndexScale % ElemSize)) {
94 IndexScale /= ElemSize;
98 GEPOffset = Builder.CreateMul(
99 GEPOffset, ConstantInt::get(Builder.getInt32Ty(), IndexScale));
101 GEPOffset = Builder.CreateUDiv(
102 GEPOffset, ConstantInt::get(Builder.getInt32Ty(), ElemSize));
105 Ptr =
GEP->getPointerOperand();
119 Value *V =
SI->getValueOperand();
120 if (V->getType() == ContainedType) {
123 "Store of whole element has mismatched address to store to");
124 }
else if (V->getType() == ScalarType) {
127 auto *Load = Builder.CreateIntrinsic(
128 LoadType, Intrinsic::dx_resource_load_typedbuffer,
129 {
II->getOperand(0),
II->getOperand(1)});
130 auto *Struct = Builder.CreateExtractValue(Load, {0});
132 uint64_t AccessSize =
DL.getTypeSizeInBits(ScalarType) / 8;
135 V = Builder.CreateInsertElement(Struct, V,
Offset);
140 auto *Inst = Builder.CreateIntrinsic(
141 Builder.getVoidTy(), Intrinsic::dx_resource_store_typedbuffer,
142 {II->getOperand(0), II->getOperand(1), V});
143 SI->replaceAllUsesWith(Inst);
152 if (!ConstantOffset || !ConstantOffset->isZero())
153 Index = Builder.CreateAdd(Index,
Offset);
157 Builder.CreateIntrinsic(Builder.getVoidTy(),
158 Intrinsic::dx_resource_store_rawbuffer,
159 {Buffer, Index, Offset, V});
167 Value *V =
SI->getValueOperand();
168 assert(!V->getType()->isAggregateType() &&
169 "Resource store should be scalar or vector type");
171 Value *Index =
II->getOperand(1);
178 if (VT && VT->getNumElements() > 4) {
180 Type *EltTy = VT->getElementType();
181 Value *Stride = ConstantInt::get(Builder.getInt32Ty(),
182 4 * (
DL.getTypeSizeInBits(EltTy) / 8));
185 for (
unsigned int I = 0,
N = VT->getNumElements();
I <
N;
I += 4) {
189 for (
unsigned int J =
I,
E = std::min(
N, J + 4); J <
E; ++J)
191 Value *Part = Builder.CreateShuffleVector(V, Indices);
240 Builder.CreateIntrinsic(LoadType, Intrinsic::dx_resource_load_typedbuffer,
241 {
II->getOperand(0),
II->getOperand(1)});
242 V = Builder.CreateExtractValue(V, {0});
245 uint64_t AccessSize =
DL.getTypeSizeInBits(ScalarType) / 8;
249 if (!ConstantOffset || !ConstantOffset->isZero())
250 V = Builder.CreateExtractElement(V,
Offset);
257 Builder.getInt32(0));
269 if (!ConstantOffset || !ConstantOffset->isZero())
270 Index = Builder.CreateAdd(Index,
Offset);
277 Value *V = Builder.CreateIntrinsic(TypeWithCheck,
278 Intrinsic::dx_resource_load_rawbuffer,
280 return Builder.CreateExtractValue(V, {0});
288 Value *Index =
II->getOperand(1);
298 "Resource load should be scalar or vector type");
303 Type *EltTy = VT->getElementType();
304 Value *Stride = ConstantInt::get(Builder.getInt32Ty(),
305 4 * (
DL.getTypeSizeInBits(EltTy) / 8));
308 for (
unsigned int I = 0,
N = VT->getNumElements();
I <
N;
I += 4) {
326struct CBufferRowIntrin {
329 unsigned int EltSize;
330 unsigned int NumElts;
332 CBufferRowIntrin(
const DataLayout &
DL,
Type *Ty) {
335 switch (
DL.getTypeSizeInBits(Ty)) {
337 IID = Intrinsic::dx_resource_load_cbufferrow_8;
343 IID = Intrinsic::dx_resource_load_cbufferrow_4;
349 IID = Intrinsic::dx_resource_load_cbufferrow_2;
367 CBufferRowIntrin Intrin(
DL, Ty->getScalarType());
370 Value *Handle =
II->getOperand(0);
375 assert(GlobalOffset &&
"CBuffer getpointer index must be constant");
378 Value *CurrentRow = ConstantInt::get(
380 unsigned int CurrentIndex =
390 "Unexpected indirect access to resource without GEP");
394 CurrentRow = Builder.CreateAdd(GEPOffset, CurrentRow);
396 APInt ConstantOffset(
DL.getIndexTypeSizeInBits(LastGEP->getType()), 0);
397 if (LastGEP->accumulateConstantOffset(
DL, ConstantOffset)) {
398 APInt Remainder(
DL.getIndexTypeSizeInBits(LastGEP->getType()),
400 APInt::udivrem(ConstantOffset, Remainder, ConstantOffset, Remainder);
401 CurrentRow = Builder.CreateAdd(
402 CurrentRow, ConstantInt::get(Builder.getInt32Ty(), ConstantOffset));
405 assert(LastGEP->getNumIndices() == 1 &&
406 "Last GEP of cbuffer access is not array or struct access");
412 ? *LastGEP->idx_begin()
413 : Builder.CreateAdd(CurrentRow, *LastGEP->idx_begin());
418 auto *CBufLoad = Builder.CreateIntrinsic(
419 Intrin.RetTy, Intrin.IID, {Handle, CurrentRow},
nullptr, Name +
".load");
421 Builder.CreateExtractValue(CBufLoad, {CurrentIndex++}, Name +
".extract");
425 unsigned int Remaining =
426 ((
DL.getTypeSizeInBits(Ty) / 8) / Intrin.EltSize) - 1;
427 if (Remaining == 0) {
433 assert(VT->getNumElements() == 1 &&
"Can't have multiple elements here");
435 Builder.getInt32(0), Name);
443 while (Remaining--) {
444 CurrentIndex %= Intrin.NumElts;
446 if (CurrentIndex == 0) {
447 CurrentRow = Builder.CreateAdd(CurrentRow,
448 ConstantInt::get(Builder.getInt32Ty(), 1));
449 CBufLoad = Builder.CreateIntrinsic(Intrin.RetTy, Intrin.IID,
450 {Handle, CurrentRow},
nullptr,
454 Extracts.
push_back(Builder.CreateExtractValue(CBufLoad, {CurrentIndex++},
460 for (
int I = 0,
E = Extracts.
size();
I <
E; ++
I)
461 Result = Builder.CreateInsertElement(
462 Result, Extracts[
I], Builder.getInt32(
I), Name +
formatv(
".upto{}",
I));
509 Intrinsic::dx_resource_handlefrombinding,
510 Intrinsic::dx_resource_handlefromimplicitbinding,
517 while (!Worklist.
empty()) {
520 if (!
X->getType()->isPointerTy() && !
X->getType()->isTargetExtTy())
524 for (
Use &V : Phi->incoming_values())
532 if (IID == Intrinsic::dx_resource_getpointer)
546 "Only expects a Handle as determined from collectUsedHandles.");
554 uint32_t UpperBound =
Size == UINT32_MAX ? UINT32_MAX : LowerBound +
Size - 1;
556 return hlsl::Binding(Class, Space, LowerBound, UpperBound,
nullptr);
561struct AccessIndices {
565 bool hasGetPtrIdx() {
return GetPtrIdx !=
nullptr; }
566 bool hasHandleIdx() {
return HandleIdx !=
nullptr; }
580 return {
nullptr,
II->getArgOperand(3)};
583 if (
II->getIntrinsicID() == Intrinsic::dx_resource_getpointer) {
586 assert(!AccessIdx.hasGetPtrIdx() &&
587 "Encountered multiple dx.resource.getpointers in ptr chain?");
588 AccessIdx.GetPtrIdx =
II->getArgOperand(1);
596 unsigned NumEdges = Phi->getNumIncomingValues();
597 assert(NumEdges != 0 &&
"Malformed Phi Node");
603 bool HasGetPtr =
true;
604 for (
unsigned Idx = 0; Idx < NumEdges; Idx++) {
605 auto *BB = Phi->getIncomingBlock(Idx);
608 HasGetPtr &= AccessIdx.hasGetPtrIdx();
615 Builder.Insert(GetPtrPhi);
619 Builder.Insert(HandlePhi);
622 return {GetPtrPhi, HandlePhi};
633 Value *GetPtrSelect =
nullptr;
635 if (TrueAccessIdx.hasGetPtrIdx() && FalseAccessIdx.hasGetPtrIdx())
637 Builder.CreateSelect(
Select->getCondition(), TrueAccessIdx.GetPtrIdx,
638 FalseAccessIdx.GetPtrIdx);
641 Builder.CreateSelect(
Select->getCondition(), TrueAccessIdx.HandleIdx,
642 FalseAccessIdx.HandleIdx);
644 return {GetPtrSelect, HandleSelect};
654 assert(AccessIdx.hasGetPtrIdx() && AccessIdx.hasHandleIdx() &&
655 "Couldn't retrieve indices. This is guaranteed by getAccessIndices");
660 Builder.Insert(Handle);
663 Builder.CreateIntrinsic(Ptr->
getType(), Intrinsic::dx_resource_getpointer,
664 {Handle, AccessIdx.GetPtrIdx});
686 unsigned NumHandles = Handles.
size();
690 bool SameGlobalBinding =
true;
692 for (
unsigned Idx = 1; Idx < NumHandles; Idx++)
696 if (!SameGlobalBinding) {
706 bool MadeChanges =
false;
709 if (
I->hasNUses(0)) {
710 I->eraseFromParent();
719 for (
User *U :
II->users())
723 while (!Worklist.
empty()) {
733 assert(
SI->getValueOperand() !=
II &&
"Pointer escaped!");
746 Dead->eraseFromParent();
747 II->eraseFromParent();
755 if (
II->getIntrinsicID() == Intrinsic::dx_resource_getpointer) {
760 for (
auto &[
II, RI] : Resources)
763 return !Resources.
empty();
771 assert(DRTM &&
"DXILResourceTypeAnalysis must be available");
775 if (!(MadeHandleChanges || MadeResourceChanges))
789 getAnalysis<DXILResourceTypeWrapperPass>().getResourceTypeMap();
792 return MadeHandleChanges || MadeResourceChanges;
794 StringRef getPassName()
const override {
return "DXIL Resource Access"; }
795 DXILResourceAccessLegacy() : FunctionPass(
ID) {}
798 void getAnalysisUsage(llvm::AnalysisUsage &AU)
const override {
803char DXILResourceAccessLegacy::ID = 0;
807 "DXIL Resource Access",
false,
false)
813 return new DXILResourceAccessLegacy();
assert(UImm &&(UImm !=~static_cast< T >(0)) &&"Invalid immediate!")
AMDGPU Register Bank Select
MachineBasicBlock MachineBasicBlock::iterator DebugLoc DL
static GCRegistry::Add< CoreCLRGC > E("coreclr", "CoreCLR-compatible GC")
static GCRegistry::Add< OcamlGC > B("ocaml", "ocaml 3.10-compatible GC")
static void diagnoseNonUniqueResourceAccess(Instruction *I, ArrayRef< IntrinsicInst * > Handles)
static void createLoadIntrinsic(IntrinsicInst *II, LoadInst *LI, dxil::ResourceTypeInfo &RTI)
static Value * emitRawLoad(IRBuilder<> &Builder, Type *Ty, Value *Buffer, Value *Index, Value *Offset, dxil::ResourceTypeInfo &RTI)
static bool legalizeResourceHandles(Function &F, DXILResourceTypeMap &DRTM)
static AccessIndices getAccessIndices(Instruction *I, SmallSetVector< Instruction *, 16 > &DeadInsts)
static void createTypedBufferLoad(IntrinsicInst *II, LoadInst *LI, dxil::ResourceTypeInfo &RTI)
static void createTypedBufferStore(IntrinsicInst *II, StoreInst *SI, dxil::ResourceTypeInfo &RTI)
static SmallVector< IntrinsicInst * > collectUsedHandles(Value *Ptr)
static const std::array< Intrinsic::ID, 2 > HandleIntrins
static bool transformResourcePointers(Function &F, DXILResourceTypeMap &DRTM)
static void replaceHandleWithIndices(Instruction *Ptr, IntrinsicInst *OldHandle, SmallSetVector< Instruction *, 16 > &DeadInsts)
static void emitRawStore(IRBuilder<> &Builder, Value *Buffer, Value *Index, Value *Offset, Value *V, dxil::ResourceTypeInfo &RTI)
static Value * traverseGEPOffsets(const DataLayout &DL, IRBuilder<> &Builder, Value *Ptr, uint64_t AccessSize)
static hlsl::Binding getHandleIntrinsicBinding(IntrinsicInst *Handle, DXILResourceTypeMap &DRTM)
static void createStoreIntrinsic(IntrinsicInst *II, StoreInst *SI, dxil::ResourceTypeInfo &RTI)
static void createCBufferLoad(IntrinsicInst *II, LoadInst *LI, dxil::ResourceTypeInfo &RTI)
static void createRawStores(IntrinsicInst *II, StoreInst *SI, dxil::ResourceTypeInfo &RTI)
static void createRawLoads(IntrinsicInst *II, LoadInst *LI, dxil::ResourceTypeInfo &RTI)
static Instruction * getStoreLoadPointerOperand(Instruction *AI)
static void replaceAccess(IntrinsicInst *II, dxil::ResourceTypeInfo &RTI)
static bool runOnFunction(Function &F, bool PostInlining)
uint64_t IntrinsicInst * II
FunctionAnalysisManager FAM
#define INITIALIZE_PASS_DEPENDENCY(depName)
#define INITIALIZE_PASS_END(passName, arg, name, cfg, analysis)
#define INITIALIZE_PASS_BEGIN(passName, arg, name, cfg, analysis)
This file implements a set that has insertion order iteration characteristics.
Class for arbitrary precision integers.
LLVM_ABI APInt udiv(const APInt &RHS) const
Unsigned division operation.
static LLVM_ABI void udivrem(const APInt &LHS, const APInt &RHS, APInt &Quotient, APInt &Remainder)
Dual division/remainder interface.
uint64_t getZExtValue() const
Get zero extended value.
AnalysisUsage & addRequired()
AnalysisUsage & addPreserved()
Add the specified Pass class to the set of analyses preserved by this pass.
ArrayRef - Represent a constant reference to an array (0 or more elements consecutively in memory),...
LLVM Basic Block Representation.
Value * getArgOperand(unsigned i) const
void setArgOperand(unsigned i, Value *v)
This is the shared class of boolean and integer constants.
uint64_t getZExtValue() const
Return the constant as a 64-bit unsigned integer value after it has been zero extended as appropriate...
PreservedAnalyses run(Function &F, FunctionAnalysisManager &AM)
A parsed version of the target data layout string in and methods for querying it.
Analysis pass which computes a DominatorTree.
static LLVM_ABI FixedVectorType * get(Type *ElementType, unsigned NumElts)
FunctionPass class - This class is used to implement most global optimizations.
This provides a uniform API for creating instructions and inserting them into a basic block: either a...
LLVM_ABI Instruction * clone() const
Create a copy of 'this' instruction that is identical in all ways except the following:
LLVM_ABI const DataLayout & getDataLayout() const
Get the data layout of the module this instruction belongs to.
A wrapper class for inspecting calls to intrinsic functions.
Intrinsic::ID getIntrinsicID() const
Return the intrinsic ID of this intrinsic.
This is an important class for using LLVM in a threaded context.
An instruction for reading from memory.
Value * getPointerOperand()
void addIncoming(Value *V, BasicBlock *BB)
Add an incoming value to the end of the PHI list.
static PHINode * Create(Type *Ty, unsigned NumReservedValues, const Twine &NameStr="", InsertPosition InsertBefore=nullptr)
Constructors - NumReservedValues is a hint for the number of incoming edges that this phi node will h...
static LLVM_ABI PoisonValue * get(Type *T)
Static factory methods - Return an 'poison' object of the specified type.
A set of analyses that are preserved following a run of a transformation pass.
static PreservedAnalyses all()
Construct a special preserved set that preserves all passes.
PreservedAnalyses & preserve()
Mark an analysis as preserved.
bool insert(const value_type &X)
Insert a new element into the SetVector.
A SetVector that performs no allocations if smaller than a certain size.
reference emplace_back(ArgTypes &&... Args)
void push_back(const T &Elt)
This is a 'vector' (really, a variable-sized array), optimized for the case when the array is small.
An instruction for storing to memory.
StringRef - Represent a constant reference to a string, i.e.
static LLVM_ABI StructType * get(LLVMContext &Context, ArrayRef< Type * > Elements, bool isPacked=false)
This static method is the primary way to create a literal StructType.
Type * getTypeParameter(unsigned i) const
Twine - A lightweight data structure for efficiently representing the concatenation of temporary valu...
The instances of the Type class are immutable: once they are created, they are never changed.
Type * getScalarType() const
If this is a vector type, return the element type, otherwise return 'this'.
bool isAggregateType() const
Return true if the type is an aggregate type.
static LLVM_ABI IntegerType * getInt1Ty(LLVMContext &C)
A Use represents the edge between a Value definition and its users.
LLVM Value Representation.
Type * getType() const
All values are typed, get the type of this value.
LLVM_ABI void replaceAllUsesWith(Value *V)
Change all uses of this to point to a new Value.
LLVM_ABI StringRef getName() const
Return a constant reference to the value's name.
TargetExtType * getHandleTy() const
LLVM_ABI bool isStruct() const
dxil::ResourceKind getResourceKind() const
A raw_ostream that writes to an std::string.
#define llvm_unreachable(msg)
Marks that the current location is not supposed to be reachable.
unsigned ID
LLVM IR allows to use arbitrary numbers as calling convention identifiers.
@ RTAccelerationStructure
const unsigned CBufferRowSizeInBytes
This is an optimization pass for GlobalISel generic memory operations.
FunctionAddr VTableAddr Value
decltype(auto) dyn_cast(const From &Val)
dyn_cast<X> - Return the argument parameter cast to the specified type.
OuterAnalysisManagerProxy< ModuleAnalysisManager, Function > ModuleAnalysisManagerFunctionProxy
Provide the ModuleAnalysisManager to Function proxy.
iterator_range< early_inc_iterator_impl< detail::IterOfRange< RangeT > > > make_early_inc_range(RangeT &&Range)
Make a range that does early increment to allow mutation of the underlying range without disrupting i...
LLVM_ABI Value * concatenateVectors(IRBuilderBase &Builder, ArrayRef< Value * > Vecs)
Concatenate a list of vectors.
auto formatv(bool Validate, const char *Fmt, Ts &&...Vals)
auto reverse(ContainerTy &&C)
FunctionPass * createDXILResourceAccessLegacyPass()
Pass to update resource accesses to use load/store directly.
bool isa(const From &Val)
isa<X> - Return true if the parameter to the template is an instance of one of the template type argu...
decltype(auto) cast(const From &Val)
cast<X> - Return the argument parameter cast to the specified type.
bool is_contained(R &&Range, const E &Element)
Returns true if Element is found in Range.
AnalysisManager< Function > FunctionAnalysisManager
Convenience typedef for the Function analysis manager.
LLVM_ABI void reportFatalUsageError(Error Err)
Report a fatal error that does not indicate a bug in LLVM.