52#include "llvm/IR/IntrinsicsSPIRV.h"
66 {Arg->
getType()}, OfType, Arg, {},
B);
67 GR->addAssignPtrTypeInstr(Arg, AssignCI);
70 static FixedVectorType *makeVectorFromTotalBits(
Type *ElemTy,
73 assert(ElemBits && TotalBits % ElemBits == 0 &&
74 "TotalBits must be divisible by element bit size");
79 FixedVectorType *DstTy) {
82 "shuffle resize expects identical element types");
85 const unsigned NumSource = SrcTy->getNumElements();
87 SmallVector<int>
Mask(NumNeeded);
88 for (
unsigned I = 0;
I < NumNeeded; ++
I)
89 Mask[
I] = (
I < NumSource) ?
static_cast<int>(
I) : -1;
91 Value *Resized =
B.CreateShuffleVector(V, V, Mask);
92 buildAssignType(
B, DstTy, Resized);
101 FixedVectorType *TargetType,
Value *Source) {
102 LoadInst *NewLoad =
B.CreateLoad(SourceType, Source);
103 buildAssignType(
B, SourceType, NewLoad);
104 Value *AssignValue = NewLoad;
106 const DataLayout &
DL =
B.GetInsertBlock()->getModule()->getDataLayout();
107 TypeSize TargetTypeSize =
DL.getTypeSizeInBits(TargetType);
108 TypeSize SourceTypeSize =
DL.getTypeSizeInBits(SourceType);
110 Value *BitcastSrcVal = NewLoad;
111 FixedVectorType *BitcastSrcTy =
113 FixedVectorType *BitcastDstTy = TargetType;
115 if (TargetTypeSize != SourceTypeSize) {
116 unsigned TargetElemBits =
118 if (SourceTypeSize % TargetElemBits == 0) {
121 BitcastDstTy = makeVectorFromTotalBits(TargetType->
getElementType(),
125 BitcastSrcTy = makeVectorFromTotalBits(SourceType->
getElementType(),
127 BitcastSrcVal = resizeVectorBitsWithShuffle(
B, NewLoad, BitcastSrcTy);
131 B.CreateIntrinsic(Intrinsic::spv_bitcast,
132 {BitcastDstTy, BitcastSrcTy}, {BitcastSrcVal});
133 buildAssignType(
B, BitcastDstTy, AssignValue);
134 if (BitcastDstTy == TargetType)
142 Value *Output =
B.CreateShuffleVector(AssignValue, AssignValue, Mask);
143 buildAssignType(
B, TargetType, Output);
151 Value *Source, LoadInst *BadLoad) {
154 SmallVector<Value *, 8>
Args{
B.getInt1(
false),
Source};
156 Type *AggregateType = GR->findDeducedElementType(Source);
157 assert(AggregateType &&
"Could not deduce aggregate type");
158 buildGEPIndexChain(
B, ElementType, AggregateType, Args);
160 auto *
GEP =
B.CreateIntrinsic(Intrinsic::spv_gep, {
Types}, {
Args});
161 GR->buildAssignPtr(
B, ElementType,
GEP);
163 LoadInst *LI =
B.CreateLoad(ElementType,
GEP);
165 buildAssignType(
B, ElementType, LI);
173 SmallVector<Value *, 4> LoadedElements;
177 SmallVector<Value *, 4>
Args;
178 Args.push_back(
B.getInt1(
false));
179 Args.push_back(Source);
180 Args.push_back(
B.getInt32(0));
181 Args.push_back(ConstantInt::get(
B.getInt32Ty(), i));
182 auto *ElementPtr =
B.CreateIntrinsic(Intrinsic::spv_gep, {
Types}, {
Args});
193 buildAssignType(
B, TargetType, NewVector);
201 NewVector =
B.CreateIntrinsic(Intrinsic::spv_insertelt, {
Types}, {
Args});
202 buildAssignType(
B, TargetType, NewVector);
209 Value *DstArrayPtr, ArrayType *ArrTy,
214 assert(VecTy->getElementType() == ArrTy->getElementType() &&
215 "Element types of array and vector must be the same.");
217 const DataLayout &
DL =
B.GetInsertBlock()->getModule()->getDataLayout();
218 uint64_t ElemSize =
DL.getTypeAllocSize(ArrTy->getElementType());
220 for (
unsigned i = 0; i < VecTy->getNumElements(); ++i) {
224 SmallVector<Value *, 4>
Args;
225 Args.push_back(
B.getInt1(
false));
226 Args.push_back(DstArrayPtr);
227 Args.push_back(
B.getInt32(0));
228 Args.push_back(ConstantInt::get(
B.getInt32Ty(), i));
229 auto *ElementPtr =
B.CreateIntrinsic(Intrinsic::spv_gep, {
Types}, {
Args});
230 GR->buildAssignPtr(
B, ArrTy->getElementType(), ElementPtr);
236 SmallVector<Value *, 2> EltArgs = {SrcVector,
Index};
238 B.CreateIntrinsic(Intrinsic::spv_extractelt, {EltTypes}, {EltArgs});
239 buildAssignType(
B, VecTy->getElementType(), Element);
243 Args = {Element, ElementPtr,
B.getInt16(2),
B.getInt32(NewAlign.
value())};
244 B.CreateIntrinsic(Intrinsic::spv_store, {
Types}, {
Args});
251 Value *OriginalOperand) {
252 Type *FromTy = GR->findDeducedElementType(OriginalOperand);
253 Type *ToTy = GR->findDeducedElementType(CastedOperand);
254 Value *Output =
nullptr;
260 B.SetInsertPoint(LI);
265 if (isTypeFirstElementAggregate(ToTy, FromTy))
266 Output = loadFirstValueFromAggregate(
B, ToTy, OriginalOperand, LI);
271 Output = loadVectorFromVector(
B, SVT, DVT, OriginalOperand);
272 else if (
SAT && DVT &&
SAT->getElementType() == DVT->getElementType())
273 Output = loadVectorFromArray(
B, DVT, OriginalOperand);
277 GR->replaceAllUsesWith(LI, Output,
true);
278 DeadInstructions.push_back(LI);
289 B.CreateIntrinsic(Intrinsic::spv_insertelt, {
Types}, {
Args});
290 buildAssignType(
B,
Vector->getType(), NewI);
302 B.CreateIntrinsic(Intrinsic::spv_extractelt, {
Types}, {
Args});
303 buildAssignType(
B, ElementType, NewI);
312 FixedVectorType *DstType =
321 [[maybe_unused]]
auto dstBitWidth =
323 [[maybe_unused]]
auto srcBitWidth =
325 assert(dstBitWidth == srcBitWidth &&
326 "Unsupported bitcast between vectors of different sizes.");
329 B.CreateIntrinsic(Intrinsic::spv_bitcast, {DstType, SrcType}, {Src});
330 buildAssignType(
B, DstType, Src);
333 StoreInst *
SI =
B.CreateStore(Src, Dst);
334 SI->setAlignment(Alignment);
339 LoadInst *LI =
B.CreateLoad(DstType, Dst);
341 Value *OldValues = LI;
342 buildAssignType(
B, OldValues->
getType(), OldValues);
343 Value *NewValues = Src;
348 OldValues = makeInsertElement(
B, OldValues, Element,
I);
351 StoreInst *
SI =
B.CreateStore(OldValues, Dst);
352 SI->setAlignment(Alignment);
357 SmallVectorImpl<Value *> &Indices) {
360 if (Search == Aggregate)
364 buildGEPIndexChain(
B, Search,
ST->getTypeAtIndex(0u), Indices);
366 buildGEPIndexChain(
B, Search, AT->getElementType(), Indices);
368 buildGEPIndexChain(
B, Search, VT->getElementType(), Indices);
375 Type *DstPointeeType, Align Alignment) {
377 SmallVector<Value *, 8>
Args{
B.getInt1(
true), Dst};
378 buildGEPIndexChain(
B, Src->getType(), DstPointeeType, Args);
379 auto *
GEP =
B.CreateIntrinsic(Intrinsic::spv_gep, {
Types}, {
Args});
380 GR->buildAssignPtr(
B, Src->getType(),
GEP);
381 StoreInst *
SI =
B.CreateStore(Src,
GEP);
382 SI->setAlignment(Alignment);
386 bool isTypeFirstElementAggregate(
Type *Search,
Type *Aggregate) {
387 if (Search == Aggregate)
390 return isTypeFirstElementAggregate(Search,
ST->getTypeAtIndex(0u));
392 return isTypeFirstElementAggregate(Search, VT->getElementType());
394 return isTypeFirstElementAggregate(Search, AT->getElementType());
401 Value *Dst, Align Alignment) {
402 Type *ToTy = GR->findDeducedElementType(Dst);
403 Type *FromTy = Src->getType();
409 B.SetInsertPoint(BadStore);
410 if (isTypeFirstElementAggregate(FromTy, ToTy))
411 storeToFirstValueAggregate(
B, Src, Dst, ToTy, Alignment);
412 else if (D_VT && S_VT)
413 storeVectorFromVector(
B, Src, Dst, Alignment);
414 else if (D_VT && !S_VT && FromTy == D_VT->getElementType())
415 storeToFirstValueAggregate(
B, Src, Dst, D_VT, Alignment);
416 else if (D_AT && S_VT && S_VT->getElementType() == D_AT->getElementType())
417 storeArrayFromVector(
B, Src, Dst, D_AT, Alignment);
421 DeadInstructions.push_back(BadStore);
424 void legalizePointerCast(IntrinsicInst *
II) {
426 Value *OriginalOperand =
II->getOperand(0);
429 std::vector<Value *>
Users;
430 for (Use &U :
II->uses())
431 Users.push_back(
U.getUser());
435 transformLoad(
B, LI, CastedOperand, OriginalOperand);
440 transformStore(
B, SI,
SI->getValueOperand(), OriginalOperand,
446 if (Intrin->getIntrinsicID() == Intrinsic::spv_assign_ptr_type) {
447 DeadInstructions.push_back(Intrin);
451 if (Intrin->getIntrinsicID() == Intrinsic::spv_gep) {
452 GR->replaceAllUsesWith(CastedOperand, OriginalOperand,
457 if (Intrin->getIntrinsicID() == Intrinsic::spv_store) {
460 Alignment =
Align(
C->getZExtValue());
461 transformStore(
B, Intrin, Intrin->getArgOperand(0), OriginalOperand,
470 DeadInstructions.push_back(
II);
474 SPIRVLegalizePointerCast(SPIRVTargetMachine *TM) : FunctionPass(ID), TM(TM) {}
477 const SPIRVSubtarget &
ST = TM->getSubtarget<SPIRVSubtarget>(
F);
478 GR =
ST.getSPIRVGlobalRegistry();
479 DeadInstructions.clear();
481 std::vector<IntrinsicInst *> WorkList;
485 if (
II &&
II->getIntrinsicID() == Intrinsic::spv_ptrcast)
486 WorkList.push_back(
II);
490 for (IntrinsicInst *
II : WorkList)
491 legalizePointerCast(
II);
493 for (Instruction *
I : DeadInstructions)
494 I->eraseFromParent();
496 return DeadInstructions.size() != 0;
500 SPIRVTargetMachine *TM =
nullptr;
501 SPIRVGlobalRegistry *GR =
nullptr;
502 std::vector<Instruction *> DeadInstructions;
509char SPIRVLegalizePointerCast::ID = 0;
511 "SPIRV legalize bitcast pass",
false,
false)
514 return new SPIRVLegalizePointerCast(TM);
assert(UImm &&(UImm !=~static_cast< T >(0)) &&"Invalid immediate!")
MachineBasicBlock MachineBasicBlock::iterator DebugLoc DL
static GCRegistry::Add< OcamlGC > B("ocaml", "ocaml 3.10-compatible GC")
static bool runOnFunction(Function &F, bool PostInlining)
iv Induction Variable Users
uint64_t IntrinsicInst * II
#define INITIALIZE_PASS(passName, arg, name, cfg, analysis)
unsigned getNumElements() const
static LLVM_ABI FixedVectorType * get(Type *ElementType, unsigned NumElts)
FunctionPass class - This class is used to implement most global optimizations.
void setAlignment(Align Align)
Type * getPointerOperandType() const
Align getAlign() const
Return the alignment of the access that is being performed.
static LLVM_ABI PoisonValue * get(Type *T)
Static factory methods - Return an 'poison' object of the specified type.
void push_back(const T &Elt)
LLVM_ABI unsigned getScalarSizeInBits() const LLVM_READONLY
If this is a vector type, return the getPrimitiveSizeInBits value for the element type.
Type * getType() const
All values are typed, get the type of this value.
Type * getElementType() const
#define llvm_unreachable(msg)
Marks that the current location is not supposed to be reachable.
constexpr char Align[]
Key for Kernel::Arg::Metadata::mAlign.
constexpr char Args[]
Key for Kernel::Metadata::mArgs.
constexpr std::underlying_type_t< E > Mask()
Get a bitmask with 1s in all places up to the high-order bit of E's largest value.
@ C
The default llvm calling convention, compatible with C.
ElementType
The element type of an SRV or UAV resource.
friend class Instruction
Iterator for Instructions in a `BasicBlock.
This is an optimization pass for GlobalISel generic memory operations.
FunctionAddr VTableAddr Value
decltype(auto) dyn_cast(const From &Val)
dyn_cast<X> - Return the argument parameter cast to the specified type.
FunctionAddr VTableAddr uintptr_t uintptr_t Int32Ty
CallInst * buildIntrWithMD(Intrinsic::ID IntrID, ArrayRef< Type * > Types, Value *Arg, Value *Arg2, ArrayRef< Constant * > Imms, IRBuilder<> &B)
class LLVM_GSL_OWNER SmallVector
Forward declaration of SmallVector so that calculateSmallVectorDefaultInlinedElements can reference s...
IRBuilder(LLVMContext &, FolderTy, InserterTy, MDNode *, ArrayRef< OperandBundleDef >) -> IRBuilder< FolderTy, InserterTy >
decltype(auto) cast(const From &Val)
cast<X> - Return the argument parameter cast to the specified type.
Align commonAlignment(Align A, uint64_t Offset)
Returns the alignment that satisfies both alignments.
FunctionPass * createSPIRVLegalizePointerCastPass(SPIRVTargetMachine *TM)
constexpr uint64_t value() const
This is a hole in the type system and should not be abused.