LLVM 23.0.0git
SPIRVLegalizerInfo.cpp
Go to the documentation of this file.
1//===- SPIRVLegalizerInfo.cpp --- SPIR-V Legalization Rules ------*- C++ -*-==//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//
7//===----------------------------------------------------------------------===//
8//
9// This file implements the targeting of the Machinelegalizer class for SPIR-V.
10//
11//===----------------------------------------------------------------------===//
12
13#include "SPIRVLegalizerInfo.h"
14#include "SPIRV.h"
15#include "SPIRVGlobalRegistry.h"
16#include "SPIRVSubtarget.h"
17#include "SPIRVUtils.h"
24#include "llvm/IR/IntrinsicsSPIRV.h"
25#include "llvm/Support/Debug.h"
27
28using namespace llvm;
29using namespace llvm::LegalizeActions;
30using namespace llvm::LegalityPredicates;
31
32#define DEBUG_TYPE "spirv-legalizer"
33
34LegalityPredicate typeOfExtendedScalars(unsigned TypeIdx, bool IsExtendedInts) {
35 return [IsExtendedInts, TypeIdx](const LegalityQuery &Query) {
36 const LLT Ty = Query.Types[TypeIdx];
37 return IsExtendedInts && Ty.isValid() && Ty.isScalar();
38 };
39}
40
42 using namespace TargetOpcode;
43
44 this->ST = &ST;
45 GR = ST.getSPIRVGlobalRegistry();
46
47 const LLT s1 = LLT::scalar(1);
48 const LLT s8 = LLT::scalar(8);
49 const LLT s16 = LLT::scalar(16);
50 const LLT s32 = LLT::scalar(32);
51 const LLT s64 = LLT::scalar(64);
52 const LLT s128 = LLT::scalar(128);
53
54 const LLT v16s64 = LLT::fixed_vector(16, 64);
55 const LLT v16s32 = LLT::fixed_vector(16, 32);
56 const LLT v16s16 = LLT::fixed_vector(16, 16);
57 const LLT v16s8 = LLT::fixed_vector(16, 8);
58 const LLT v16s1 = LLT::fixed_vector(16, 1);
59
60 const LLT v8s64 = LLT::fixed_vector(8, 64);
61 const LLT v8s32 = LLT::fixed_vector(8, 32);
62 const LLT v8s16 = LLT::fixed_vector(8, 16);
63 const LLT v8s8 = LLT::fixed_vector(8, 8);
64 const LLT v8s1 = LLT::fixed_vector(8, 1);
65
66 const LLT v4s64 = LLT::fixed_vector(4, 64);
67 const LLT v4s32 = LLT::fixed_vector(4, 32);
68 const LLT v4s16 = LLT::fixed_vector(4, 16);
69 const LLT v4s8 = LLT::fixed_vector(4, 8);
70 const LLT v4s1 = LLT::fixed_vector(4, 1);
71
72 const LLT v3s64 = LLT::fixed_vector(3, 64);
73 const LLT v3s32 = LLT::fixed_vector(3, 32);
74 const LLT v3s16 = LLT::fixed_vector(3, 16);
75 const LLT v3s8 = LLT::fixed_vector(3, 8);
76 const LLT v3s1 = LLT::fixed_vector(3, 1);
77
78 const LLT v2s64 = LLT::fixed_vector(2, 64);
79 const LLT v2s32 = LLT::fixed_vector(2, 32);
80 const LLT v2s16 = LLT::fixed_vector(2, 16);
81 const LLT v2s8 = LLT::fixed_vector(2, 8);
82 const LLT v2s1 = LLT::fixed_vector(2, 1);
83
84 const unsigned PSize = ST.getPointerSize();
85 const LLT p0 = LLT::pointer(0, PSize); // Function
86 const LLT p1 = LLT::pointer(1, PSize); // CrossWorkgroup
87 const LLT p2 = LLT::pointer(2, PSize); // UniformConstant
88 const LLT p3 = LLT::pointer(3, PSize); // Workgroup
89 const LLT p4 = LLT::pointer(4, PSize); // Generic
90 const LLT p5 =
91 LLT::pointer(5, PSize); // Input, SPV_INTEL_usm_storage_classes (Device)
92 const LLT p6 = LLT::pointer(6, PSize); // SPV_INTEL_usm_storage_classes (Host)
93 const LLT p7 = LLT::pointer(7, PSize); // Input
94 const LLT p8 = LLT::pointer(8, PSize); // Output
95 const LLT p9 =
96 LLT::pointer(9, PSize); // CodeSectionINTEL, SPV_INTEL_function_pointers
97 const LLT p10 = LLT::pointer(10, PSize); // Private
98 const LLT p11 = LLT::pointer(11, PSize); // StorageBuffer
99 const LLT p12 = LLT::pointer(12, PSize); // Uniform
100 const LLT p13 = LLT::pointer(13, PSize); // PushConstant
101
102 // TODO: remove copy-pasting here by using concatenation in some way.
103 auto allPtrsScalarsAndVectors = {
104 p0, p1, p2, p3, p4, p5, p6, p7, p8,
105 p9, p10, p11, p12, p13, s1, s8, s16, s32,
106 s64, s128, v2s1, v2s8, v2s16, v2s32, v2s64, v3s1, v3s8,
107 v3s16, v3s32, v3s64, v4s1, v4s8, v4s16, v4s32, v4s64, v8s1,
108 v8s8, v8s16, v8s32, v8s64, v16s1, v16s8, v16s16, v16s32, v16s64};
109
110 auto allVectors = {v2s1, v2s8, v2s16, v2s32, v2s64, v3s1, v3s8,
111 v3s16, v3s32, v3s64, v4s1, v4s8, v4s16, v4s32,
112 v4s64, v8s1, v8s8, v8s16, v8s32, v8s64, v16s1,
113 v16s8, v16s16, v16s32, v16s64};
114
115 auto allShaderVectors = {v2s1, v2s8, v2s16, v2s32, v2s64,
116 v3s1, v3s8, v3s16, v3s32, v3s64,
117 v4s1, v4s8, v4s16, v4s32, v4s64};
118
119 auto allScalars = {s1, s8, s16, s32, s64};
120
121 auto allScalarsAndVectors = {
122 s1, s8, s16, s32, s64, s128, v2s1, v2s8,
123 v2s16, v2s32, v2s64, v3s1, v3s8, v3s16, v3s32, v3s64,
124 v4s1, v4s8, v4s16, v4s32, v4s64, v8s1, v8s8, v8s16,
125 v8s32, v8s64, v16s1, v16s8, v16s16, v16s32, v16s64};
126
127 auto allIntScalarsAndVectors = {
128 s8, s16, s32, s64, s128, v2s8, v2s16, v2s32, v2s64,
129 v3s8, v3s16, v3s32, v3s64, v4s8, v4s16, v4s32, v4s64, v8s8,
130 v8s16, v8s32, v8s64, v16s8, v16s16, v16s32, v16s64};
131
132 auto allBoolScalarsAndVectors = {s1, v2s1, v3s1, v4s1, v8s1, v16s1};
133
134 auto allIntScalars = {s8, s16, s32, s64, s128};
135
136 auto allFloatScalarsAndF16Vector2AndVector4s = {s16, s32, s64, v2s16, v4s16};
137
138 auto allFloatScalars = {s16, s32, s64};
139
140 auto allFloatScalarsAndVectors = {
141 s16, s32, s64, v2s16, v2s32, v2s64, v3s16, v3s32, v3s64,
142 v4s16, v4s32, v4s64, v8s16, v8s32, v8s64, v16s16, v16s32, v16s64};
143
144 auto allShaderFloatVectors = {v2s16, v2s32, v2s64, v3s16, v3s32,
145 v3s64, v4s16, v4s32, v4s64};
146
147 auto allFloatVectors = {v2s16, v2s32, v2s64, v3s16, v3s32,
148 v3s64, v4s16, v4s32, v4s64, v8s16,
149 v8s32, v8s64, v16s16, v16s32, v16s64};
150
151 auto &allowedFloatVectorTypes =
152 ST.isShader() ? allShaderFloatVectors : allFloatVectors;
153
154 auto allFloatAndIntScalarsAndPtrs = {s8, s16, s32, s64, p0, p1,
155 p2, p3, p4, p5, p6, p7,
156 p8, p9, p10, p11, p12, p13};
157
158 auto allPtrs = {p0, p1, p2, p3, p4, p5, p6, p7, p8, p9, p10, p11, p12, p13};
159
160 auto &allowedVectorTypes = ST.isShader() ? allShaderVectors : allVectors;
161
162 bool IsExtendedInts =
163 ST.canUseExtension(
164 SPIRV::Extension::SPV_ALTERA_arbitrary_precision_integers) ||
165 ST.canUseExtension(SPIRV::Extension::SPV_KHR_bit_instructions) ||
166 ST.canUseExtension(SPIRV::Extension::SPV_INTEL_int4);
167 auto extendedScalarsAndVectors =
168 [IsExtendedInts](const LegalityQuery &Query) {
169 const LLT Ty = Query.Types[0];
170 return IsExtendedInts && Ty.isValid() && !Ty.isPointerOrPointerVector();
171 };
172 auto extendedScalarsAndVectorsProduct = [IsExtendedInts](
173 const LegalityQuery &Query) {
174 const LLT Ty1 = Query.Types[0], Ty2 = Query.Types[1];
175 return IsExtendedInts && Ty1.isValid() && Ty2.isValid() &&
176 !Ty1.isPointerOrPointerVector() && !Ty2.isPointerOrPointerVector();
177 };
178 auto extendedPtrsScalarsAndVectors =
179 [IsExtendedInts](const LegalityQuery &Query) {
180 const LLT Ty = Query.Types[0];
181 return IsExtendedInts && Ty.isValid();
182 };
183
184 // The universal validation rules in the SPIR-V specification state that
185 // vector sizes are typically limited to 2, 3, or 4. However, larger vector
186 // sizes (8 and 16) are enabled when the Kernel capability is present. For
187 // shader execution models, vector sizes are strictly limited to 4. In
188 // non-shader contexts, vector sizes of 8 and 16 are also permitted, but
189 // arbitrary sizes (e.g., 6 or 11) are not.
190 uint32_t MaxVectorSize = ST.isShader() ? 4 : 16;
191 LLVM_DEBUG(dbgs() << "MaxVectorSize: " << MaxVectorSize << "\n");
192
193 for (auto Opc : getTypeFoldingSupportedOpcodes()) {
194 switch (Opc) {
195 case G_EXTRACT_VECTOR_ELT:
196 case G_UREM:
197 case G_SREM:
198 case G_UDIV:
199 case G_SDIV:
200 case G_FREM:
201 break;
202 default:
204 .customFor(allScalars)
205 .customFor(allowedVectorTypes)
209 0, ElementCount::getFixed(MaxVectorSize)))
210 .custom();
211 break;
212 }
213 }
214
215 getActionDefinitionsBuilder({G_UREM, G_SREM, G_SDIV, G_UDIV, G_FREM})
216 .customFor(allScalars)
217 .customFor(allowedVectorTypes)
221 0, ElementCount::getFixed(MaxVectorSize)))
222 .custom();
223
224 getActionDefinitionsBuilder({G_FMA, G_STRICT_FMA})
225 .legalFor(allScalars)
226 .legalFor(allowedVectorTypes)
230 0, ElementCount::getFixed(MaxVectorSize)))
231 .alwaysLegal();
232
233 getActionDefinitionsBuilder(G_INTRINSIC_W_SIDE_EFFECTS).custom();
234
235 getActionDefinitionsBuilder(G_SHUFFLE_VECTOR)
236 .legalForCartesianProduct(allowedVectorTypes, allowedVectorTypes)
238 .lowerIf(vectorElementCountIsGreaterThan(0, MaxVectorSize))
240 .lowerIf(vectorElementCountIsGreaterThan(1, MaxVectorSize));
241
242 getActionDefinitionsBuilder(G_EXTRACT_VECTOR_ELT)
246 1, ElementCount::getFixed(MaxVectorSize)))
247 .custom();
248
249 getActionDefinitionsBuilder(G_INSERT_VECTOR_ELT)
253 0, ElementCount::getFixed(MaxVectorSize)))
254 .custom();
255
256 // Illegal G_UNMERGE_VALUES instructions should be handled
257 // during the combine phase.
258 getActionDefinitionsBuilder(G_BUILD_VECTOR)
260
261 // When entering the legalizer, there should be no G_BITCAST instructions.
262 // They should all be calls to the `spv_bitcast` intrinsic. The call to
263 // the intrinsic will be converted to a G_BITCAST during legalization if
264 // the vectors are not legal. After using the rules to legalize a G_BITCAST,
265 // we turn it back into a call to the intrinsic with a custom rule to avoid
266 // potential machine verifier failures.
272 0, ElementCount::getFixed(MaxVectorSize)))
273 .lowerIf(vectorElementCountIsGreaterThan(1, MaxVectorSize))
274 .custom();
275
276 // If the result is still illegal, the combiner should be able to remove it.
277 getActionDefinitionsBuilder(G_CONCAT_VECTORS)
278 .legalForCartesianProduct(allowedVectorTypes, allowedVectorTypes);
279
280 getActionDefinitionsBuilder(G_SPLAT_VECTOR)
281 .legalFor(allowedVectorTypes)
285 .alwaysLegal();
286
287 // Vector Reduction Operations
289 {G_VECREDUCE_SMIN, G_VECREDUCE_SMAX, G_VECREDUCE_UMIN, G_VECREDUCE_UMAX,
290 G_VECREDUCE_ADD, G_VECREDUCE_MUL, G_VECREDUCE_FMUL, G_VECREDUCE_FMIN,
291 G_VECREDUCE_FMAX, G_VECREDUCE_FMINIMUM, G_VECREDUCE_FMAXIMUM,
292 G_VECREDUCE_OR, G_VECREDUCE_AND, G_VECREDUCE_XOR})
293 .legalFor(allowedVectorTypes)
294 .scalarize(1)
295 .lower();
296
297 getActionDefinitionsBuilder({G_VECREDUCE_SEQ_FADD, G_VECREDUCE_SEQ_FMUL})
298 .scalarize(2)
299 .lower();
300
301 // Illegal G_UNMERGE_VALUES instructions should be handled
302 // during the combine phase.
303 getActionDefinitionsBuilder(G_UNMERGE_VALUES)
305
306 getActionDefinitionsBuilder({G_MEMCPY, G_MEMCPY_INLINE, G_MEMMOVE})
307 .unsupportedIf(LegalityPredicates::any(typeIs(0, p9), typeIs(1, p9)))
308 .legalIf(all(typeInSet(0, allPtrs), typeInSet(1, allPtrs)));
309
310 getActionDefinitionsBuilder({G_MEMSET, G_MEMSET_INLINE})
311 .unsupportedIf(typeIs(0, p9))
312 .legalIf(all(typeInSet(0, allPtrs), typeInSet(1, allIntScalars)));
313
314 getActionDefinitionsBuilder(G_ADDRSPACE_CAST)
315 .legalForCartesianProduct(allPtrs, allPtrs);
316
317 // Should we be legalizing bad scalar sizes like s5 here instead
318 // of handling them in the instruction selector?
319 getActionDefinitionsBuilder({G_LOAD, G_STORE})
320 .unsupportedIf(typeIs(1, p9))
321 .legalForCartesianProduct(allowedVectorTypes, allPtrs)
322 .legalForCartesianProduct(allPtrs, allPtrs)
323 .legalIf(isScalar(0))
324 .custom();
325
326 getActionDefinitionsBuilder({G_SMIN, G_SMAX, G_UMIN, G_UMAX, G_ABS,
327 G_BITREVERSE, G_SADDSAT, G_UADDSAT, G_SSUBSAT,
328 G_USUBSAT, G_SCMP, G_UCMP})
329 .legalFor(allIntScalarsAndVectors)
330 .legalIf(extendedScalarsAndVectors);
331
332 getActionDefinitionsBuilder(G_STRICT_FLDEXP)
333 .legalForCartesianProduct(allFloatScalarsAndVectors, allIntScalars);
334
335 getActionDefinitionsBuilder({G_FPTOSI, G_FPTOUI})
336 .legalForCartesianProduct(allIntScalarsAndVectors,
337 allFloatScalarsAndVectors);
338
339 getActionDefinitionsBuilder({G_FPTOSI_SAT, G_FPTOUI_SAT})
340 .legalForCartesianProduct(allIntScalarsAndVectors,
341 allFloatScalarsAndVectors);
342
343 getActionDefinitionsBuilder({G_SITOFP, G_UITOFP})
344 .legalForCartesianProduct(allFloatScalarsAndVectors,
345 allScalarsAndVectors);
346
348 .legalForCartesianProduct(allIntScalarsAndVectors)
349 .legalIf(extendedScalarsAndVectorsProduct);
350
351 // Extensions.
352 getActionDefinitionsBuilder({G_TRUNC, G_ZEXT, G_SEXT, G_ANYEXT})
353 .legalForCartesianProduct(allScalarsAndVectors)
354 .legalIf(extendedScalarsAndVectorsProduct);
355
357 .legalFor(allPtrsScalarsAndVectors)
358 .legalIf(extendedPtrsScalarsAndVectors)
362 0, ElementCount::getFixed(MaxVectorSize)));
363
365 all(typeInSet(0, allPtrsScalarsAndVectors),
366 typeInSet(1, allPtrsScalarsAndVectors)));
367
368 getActionDefinitionsBuilder({G_IMPLICIT_DEF, G_FREEZE})
369 .legalFor({s1, s128})
370 .legalFor(allFloatAndIntScalarsAndPtrs)
371 .legalFor(allowedVectorTypes)
372 .legalIf([](const LegalityQuery &Query) {
373 return Query.Types[0].isPointerVector();
374 })
375 .moreElementsToNextPow2(0)
376 .fewerElementsIf(vectorElementCountIsGreaterThan(0, MaxVectorSize),
378 0, ElementCount::getFixed(MaxVectorSize)));
379
380 getActionDefinitionsBuilder({G_STACKSAVE, G_STACKRESTORE}).alwaysLegal();
381
383 .legalForCartesianProduct(allPtrs, allIntScalars)
384 .legalIf(
385 all(typeInSet(0, allPtrs), typeOfExtendedScalars(1, IsExtendedInts)))
386 .legalIf([](const LegalityQuery &Query) {
387 const LLT DstTy = Query.Types[0];
388 const LLT SrcTy = Query.Types[1];
389 return DstTy.isPointerVector() && SrcTy.isVector() &&
390 !SrcTy.isPointer() &&
391 DstTy.getNumElements() == SrcTy.getNumElements();
392 });
394 .legalForCartesianProduct(allIntScalars, allPtrs)
395 .legalIf(
396 all(typeOfExtendedScalars(0, IsExtendedInts), typeInSet(1, allPtrs)))
397 .legalIf([](const LegalityQuery &Query) {
398 const LLT DstTy = Query.Types[0];
399 const LLT SrcTy = Query.Types[1];
400 return SrcTy.isPointerVector() && DstTy.isVector() &&
401 !DstTy.isPointer() &&
402 DstTy.getNumElements() == SrcTy.getNumElements();
403 });
405 .legalForCartesianProduct(allPtrs, allIntScalars)
406 .legalIf(
407 all(typeInSet(0, allPtrs), typeOfExtendedScalars(1, IsExtendedInts)));
408
410 .legalForCartesianProduct(allPtrs, allIntScalars)
411 .legalIf(
412 all(typeInSet(0, allPtrs), typeOfExtendedScalars(1, IsExtendedInts)))
413 .legalIf([](const LegalityQuery &Query) {
414 const LLT PtrTy = Query.Types[0];
415 const LLT MaskTy = Query.Types[1];
416 return PtrTy.isPointerVector() && MaskTy.isVector() &&
417 !MaskTy.isPointer() &&
418 PtrTy.getNumElements() == MaskTy.getNumElements();
419 });
420
421 // ST.canDirectlyComparePointers() for pointer args is supported in
422 // legalizeCustom().
425 all(typeIs(0, p9), typeInSet(1, allPtrs), typeIsNot(1, p9)),
426 all(typeInSet(0, allPtrs), typeIsNot(0, p9), typeIs(1, p9))))
427 .legalIf([IsExtendedInts](const LegalityQuery &Query) {
428 const LLT Ty = Query.Types[1];
429 return IsExtendedInts && Ty.isValid() && !Ty.isPointerOrPointerVector();
430 })
431 .customIf(all(typeInSet(0, allBoolScalarsAndVectors),
432 typeInSet(1, allPtrsScalarsAndVectors)));
433
435 all(typeInSet(0, allBoolScalarsAndVectors),
436 typeInSet(1, allFloatScalarsAndVectors)));
437
438 getActionDefinitionsBuilder({G_ATOMICRMW_OR, G_ATOMICRMW_ADD, G_ATOMICRMW_AND,
439 G_ATOMICRMW_MAX, G_ATOMICRMW_MIN,
440 G_ATOMICRMW_SUB, G_ATOMICRMW_XOR,
441 G_ATOMICRMW_UMAX, G_ATOMICRMW_UMIN})
442 .legalForCartesianProduct(allIntScalars, allPtrs);
443
445 {G_ATOMICRMW_FADD, G_ATOMICRMW_FSUB, G_ATOMICRMW_FMIN, G_ATOMICRMW_FMAX})
446 .legalForCartesianProduct(allFloatScalarsAndF16Vector2AndVector4s,
447 allPtrs);
448
449 getActionDefinitionsBuilder(G_ATOMICRMW_XCHG)
450 .legalForCartesianProduct(allFloatAndIntScalarsAndPtrs, allPtrs);
451
452 getActionDefinitionsBuilder(G_ATOMIC_CMPXCHG_WITH_SUCCESS).lower();
453 // TODO: add proper legalization rules.
454 getActionDefinitionsBuilder(G_ATOMIC_CMPXCHG).alwaysLegal();
455
456 getActionDefinitionsBuilder({G_UADDO, G_USUBO, G_UMULO, G_SMULO})
457 .alwaysLegal();
458
459 getActionDefinitionsBuilder({G_SADDO, G_SSUBO}).lower();
460
461 getActionDefinitionsBuilder({G_LROUND, G_LLROUND})
462 .legalForCartesianProduct(allFloatScalarsAndVectors,
463 allIntScalarsAndVectors);
464
465 // FP conversions.
466 getActionDefinitionsBuilder({G_FPTRUNC, G_FPEXT})
467 .legalForCartesianProduct(allFloatScalarsAndVectors);
468
469 // Pointer-handling.
470 getActionDefinitionsBuilder(G_FRAME_INDEX).legalFor({p0});
471
472 getActionDefinitionsBuilder(G_GLOBAL_VALUE).legalFor(allPtrs);
473
474 // Control-flow. In some cases (e.g. constants) s1 may be promoted to s32.
476 getActionDefinitionsBuilder(G_BRCOND).legalFor({s1, s32});
477
479 allFloatScalarsAndVectors, {s32, v2s32, v3s32, v4s32, v8s32, v16s32});
480
481 // TODO: Review the target OpenCL and GLSL Extended Instruction Set specs to
482 // tighten these requirements. Many of these math functions are only legal on
483 // specific bitwidths, so they are not selectable for
484 // allFloatScalarsAndVectors.
485 // clang-format off
486 getActionDefinitionsBuilder({G_STRICT_FSQRT,
487 G_FPOW,
488 G_FEXP,
489 G_FMODF,
490 G_FSINCOS,
491 G_FEXP2,
492 G_FEXP10,
493 G_FLOG,
494 G_FLOG2,
495 G_FLOG10,
496 G_FABS,
497 G_FMINNUM,
498 G_FMAXNUM,
499 G_FCEIL,
500 G_FCOS,
501 G_FSIN,
502 G_FTAN,
503 G_FACOS,
504 G_FASIN,
505 G_FATAN,
506 G_FATAN2,
507 G_FCOSH,
508 G_FSINH,
509 G_FTANH,
510 G_FSQRT,
511 G_FFLOOR,
512 G_FRINT,
513 G_FNEARBYINT,
514 G_INTRINSIC_ROUND,
515 G_INTRINSIC_TRUNC,
516 G_FMINIMUM,
517 G_FMAXIMUM,
518 G_INTRINSIC_ROUNDEVEN})
519 .legalFor(allFloatScalars)
520 .legalFor(allowedFloatVectorTypes)
524 0, ElementCount::getFixed(MaxVectorSize)));
525 // clang-format on
526
527 getActionDefinitionsBuilder(G_FCOPYSIGN)
528 .legalForCartesianProduct(allFloatScalarsAndVectors,
529 allFloatScalarsAndVectors);
530
532 allFloatScalarsAndVectors, allIntScalarsAndVectors);
533
534 if (ST.canUseExtInstSet(SPIRV::InstructionSet::OpenCL_std)) {
536 {G_CTTZ, G_CTTZ_ZERO_POISON, G_CTLZ, G_CTLZ_ZERO_POISON})
537 .legalForCartesianProduct(allIntScalarsAndVectors,
538 allIntScalarsAndVectors);
539
540 // Struct return types become a single scalar, so cannot easily legalize.
541 getActionDefinitionsBuilder({G_SMULH, G_UMULH}).alwaysLegal();
542 }
543
544 getActionDefinitionsBuilder(G_IS_FPCLASS).custom();
545
546 getActionDefinitionsBuilder({G_INTRINSIC, G_INTRINSIC_CONVERGENT,
547 G_INTRINSIC_CONVERGENT_W_SIDE_EFFECTS})
548 .alwaysLegal();
550 getActionDefinitionsBuilder({G_TRAP, G_DEBUGTRAP, G_UBSANTRAP}).alwaysLegal();
551
553 verify(*ST.getInstrInfo());
554}
555
558 MachineIRBuilder &MIRBuilder = Helper.MIRBuilder;
559 Register DstReg = MI.getOperand(0).getReg();
560 Register SrcReg = MI.getOperand(1).getReg();
561 Register IdxReg = MI.getOperand(2).getReg();
562
563 MIRBuilder
564 .buildIntrinsic(Intrinsic::spv_extractelt, ArrayRef<Register>{DstReg})
565 .addUse(SrcReg)
566 .addUse(IdxReg);
567 MI.eraseFromParent();
568 return true;
569}
570
573 MachineIRBuilder &MIRBuilder = Helper.MIRBuilder;
574 Register DstReg = MI.getOperand(0).getReg();
575 Register SrcReg = MI.getOperand(1).getReg();
576 Register ValReg = MI.getOperand(2).getReg();
577 Register IdxReg = MI.getOperand(3).getReg();
578
579 MIRBuilder
580 .buildIntrinsic(Intrinsic::spv_insertelt, ArrayRef<Register>{DstReg})
581 .addUse(SrcReg)
582 .addUse(ValReg)
583 .addUse(IdxReg);
584 MI.eraseFromParent();
585 return true;
586}
587
589 LegalizerHelper &Helper,
592 Register ConvReg = MRI.createGenericVirtualRegister(ConvTy);
593 MRI.setRegClass(ConvReg, GR->getRegClass(SpvType));
594 GR->assignSPIRVTypeToVReg(SpvType, ConvReg, Helper.MIRBuilder.getMF());
595 Helper.MIRBuilder.buildInstr(TargetOpcode::G_PTRTOINT)
596 .addDef(ConvReg)
597 .addUse(Reg);
598 return ConvReg;
599}
600
601static bool needsVectorLegalization(const LLT &Ty, const SPIRVSubtarget &ST) {
602 if (!Ty.isVector())
603 return false;
604 unsigned NumElements = Ty.getNumElements();
605 unsigned MaxVectorSize = ST.isShader() ? 4 : 16;
606 return (NumElements > 4 && !isPowerOf2_32(NumElements)) ||
607 NumElements > MaxVectorSize;
608}
609
612 MachineRegisterInfo &MRI = MI.getMF()->getRegInfo();
613 MachineIRBuilder &MIRBuilder = Helper.MIRBuilder;
614 Register DstReg = MI.getOperand(0).getReg();
615 Register PtrReg = MI.getOperand(1).getReg();
616 LLT DstTy = MRI.getType(DstReg);
617
618 if (!DstTy.isVector())
619 return true;
620
621 const SPIRVSubtarget &ST = MI.getMF()->getSubtarget<SPIRVSubtarget>();
622 if (!needsVectorLegalization(DstTy, ST))
623 return true;
624
625 SmallVector<Register, 8> SplitRegs;
626 LLT EltTy = DstTy.getElementType();
627 unsigned NumElts = DstTy.getNumElements();
628
629 LLT PtrTy = MRI.getType(PtrReg);
630 auto Zero = MIRBuilder.buildConstant(LLT::scalar(32), 0);
631
632 for (unsigned i = 0; i < NumElts; ++i) {
633 auto Idx = MIRBuilder.buildConstant(LLT::scalar(32), i);
634 Register EltPtr = MRI.createGenericVirtualRegister(PtrTy);
635
636 MIRBuilder.buildIntrinsic(Intrinsic::spv_gep, ArrayRef<Register>{EltPtr})
637 .addImm(1) // InBounds
638 .addUse(PtrReg)
639 .addUse(Zero.getReg(0))
640 .addUse(Idx.getReg(0));
641
642 MachinePointerInfo EltPtrInfo;
643 Align EltAlign = Align(1);
644 if (!MI.memoperands_empty()) {
645 MachineMemOperand *MMO = *MI.memoperands_begin();
646 EltPtrInfo =
647 MMO->getPointerInfo().getWithOffset(i * EltTy.getSizeInBytes());
648 EltAlign = commonAlignment(MMO->getAlign(), i * EltTy.getSizeInBytes());
649 }
650
651 Register EltReg = MRI.createGenericVirtualRegister(EltTy);
652 MIRBuilder.buildLoad(EltReg, EltPtr, EltPtrInfo, EltAlign);
653 SplitRegs.push_back(EltReg);
654 }
655
656 MIRBuilder.buildBuildVector(DstReg, SplitRegs);
657 MI.eraseFromParent();
658 return true;
659}
660
663 MachineRegisterInfo &MRI = MI.getMF()->getRegInfo();
664 MachineIRBuilder &MIRBuilder = Helper.MIRBuilder;
665 Register ValReg = MI.getOperand(0).getReg();
666 Register PtrReg = MI.getOperand(1).getReg();
667 LLT ValTy = MRI.getType(ValReg);
668
669 assert(ValTy.isVector() && "Expected vector store");
670
671 SmallVector<Register, 8> SplitRegs;
672 LLT EltTy = ValTy.getElementType();
673 unsigned NumElts = ValTy.getNumElements();
674
675 for (unsigned i = 0; i < NumElts; ++i)
676 SplitRegs.push_back(MRI.createGenericVirtualRegister(EltTy));
677
678 MIRBuilder.buildUnmerge(SplitRegs, ValReg);
679
680 LLT PtrTy = MRI.getType(PtrReg);
681 auto Zero = MIRBuilder.buildConstant(LLT::scalar(32), 0);
682
683 for (unsigned i = 0; i < NumElts; ++i) {
684 auto Idx = MIRBuilder.buildConstant(LLT::scalar(32), i);
685 Register EltPtr = MRI.createGenericVirtualRegister(PtrTy);
686
687 MIRBuilder.buildIntrinsic(Intrinsic::spv_gep, ArrayRef<Register>{EltPtr})
688 .addImm(1) // InBounds
689 .addUse(PtrReg)
690 .addUse(Zero.getReg(0))
691 .addUse(Idx.getReg(0));
692
693 MachinePointerInfo EltPtrInfo;
694 Align EltAlign = Align(1);
695 if (!MI.memoperands_empty()) {
696 MachineMemOperand *MMO = *MI.memoperands_begin();
697 EltPtrInfo =
698 MMO->getPointerInfo().getWithOffset(i * EltTy.getSizeInBytes());
699 EltAlign = commonAlignment(MMO->getAlign(), i * EltTy.getSizeInBytes());
700 }
701
702 MIRBuilder.buildStore(SplitRegs[i], EltPtr, EltPtrInfo, EltAlign);
703 }
704
705 MI.eraseFromParent();
706 return true;
707}
708
711 LostDebugLocObserver &LocObserver) const {
712 MachineRegisterInfo &MRI = MI.getMF()->getRegInfo();
713 switch (MI.getOpcode()) {
714 default:
715 // TODO: implement legalization for other opcodes.
716 return true;
717 case TargetOpcode::G_BITCAST:
718 return legalizeBitcast(Helper, MI);
719 case TargetOpcode::G_EXTRACT_VECTOR_ELT:
720 return legalizeExtractVectorElt(Helper, MI, GR);
721 case TargetOpcode::G_INSERT_VECTOR_ELT:
722 return legalizeInsertVectorElt(Helper, MI, GR);
723 case TargetOpcode::G_INTRINSIC:
724 case TargetOpcode::G_INTRINSIC_W_SIDE_EFFECTS:
725 return legalizeIntrinsic(Helper, MI);
726 case TargetOpcode::G_IS_FPCLASS:
727 return legalizeIsFPClass(Helper, MI, LocObserver);
728 case TargetOpcode::G_ICMP: {
729 auto &Op0 = MI.getOperand(2);
730 auto &Op1 = MI.getOperand(3);
731 Register Reg0 = Op0.getReg();
732 Register Reg1 = Op1.getReg();
734 static_cast<CmpInst::Predicate>(MI.getOperand(1).getPredicate());
735 if ((!ST->canDirectlyComparePointers() ||
737 MRI.getType(Reg0).isPointer() && MRI.getType(Reg1).isPointer()) {
738 LLT ConvT = LLT::scalar(ST->getPointerSize());
739 Type *LLVMTy = IntegerType::get(MI.getMF()->getFunction().getContext(),
740 ST->getPointerSize());
741 SPIRVTypeInst SpirvTy = GR->getOrCreateSPIRVType(
742 LLVMTy, Helper.MIRBuilder, SPIRV::AccessQualifier::ReadWrite, true);
743 Op0.setReg(convertPtrToInt(Reg0, ConvT, SpirvTy, Helper, MRI, GR));
744 Op1.setReg(convertPtrToInt(Reg1, ConvT, SpirvTy, Helper, MRI, GR));
745 }
746 return true;
747 }
748 case TargetOpcode::G_LOAD:
749 return legalizeLoad(Helper, MI, GR);
750 case TargetOpcode::G_STORE:
751 return legalizeStore(Helper, MI, GR);
752 }
753}
754
757 Register SrcReg, LLT SrcTy,
758 MachinePointerInfo &PtrInfo, Align &VecAlign) {
759 MachineIRBuilder &MIRBuilder = Helper.MIRBuilder;
760 MachineRegisterInfo &MRI = *MIRBuilder.getMRI();
761
762 VecAlign = Helper.getStackTemporaryAlignment(SrcTy);
763 auto StackTemp = Helper.createStackTemporary(
764 TypeSize::getFixed(SrcTy.getSizeInBytes()), VecAlign, PtrInfo);
765
766 // Set the type of StackTemp to a pointer to an array of the element type.
767 SPIRVTypeInst SpvSrcTy = GR->getSPIRVTypeForVReg(SrcReg);
768 SPIRVTypeInst EltSpvTy = GR->getScalarOrVectorComponentType(SpvSrcTy);
769 const Type *LLVMEltTy = GR->getTypeForSPIRVType(EltSpvTy);
770 const Type *LLVMArrTy =
771 ArrayType::get(const_cast<Type *>(LLVMEltTy), SrcTy.getNumElements());
772 SPIRVTypeInst ArrSpvTy = GR->getOrCreateSPIRVType(
773 LLVMArrTy, MIRBuilder, SPIRV::AccessQualifier::ReadWrite, true);
774 SPIRVTypeInst PtrToArrSpvTy = GR->getOrCreateSPIRVPointerType(
775 ArrSpvTy, MIRBuilder, SPIRV::StorageClass::Function);
776
777 Register StackReg = StackTemp.getReg(0);
778 MRI.setRegClass(StackReg, GR->getRegClass(PtrToArrSpvTy));
779 GR->assignSPIRVTypeToVReg(PtrToArrSpvTy, StackReg, MIRBuilder.getMF());
780
781 return StackTemp;
782}
783
786 LLVM_DEBUG(dbgs() << "Found a bitcast instruction\n");
787 MachineIRBuilder &MIRBuilder = Helper.MIRBuilder;
788 MachineRegisterInfo &MRI = *MIRBuilder.getMRI();
789 const SPIRVSubtarget &ST = MI.getMF()->getSubtarget<SPIRVSubtarget>();
790
791 Register DstReg = MI.getOperand(0).getReg();
792 Register SrcReg = MI.getOperand(2).getReg();
793 LLT DstTy = MRI.getType(DstReg);
794 LLT SrcTy = MRI.getType(SrcReg);
795
796 // If an spv_bitcast needs to be legalized, we convert it to G_BITCAST to
797 // allow using the generic legalization rules.
798 if (needsVectorLegalization(DstTy, ST) ||
799 needsVectorLegalization(SrcTy, ST)) {
800 LLVM_DEBUG(dbgs() << "Replacing with a G_BITCAST\n");
801 MIRBuilder.buildBitcast(DstReg, SrcReg);
802 MI.eraseFromParent();
803 }
804 return true;
805}
806
809 MachineIRBuilder &MIRBuilder = Helper.MIRBuilder;
810 MachineRegisterInfo &MRI = *MIRBuilder.getMRI();
811 const SPIRVSubtarget &ST = MI.getMF()->getSubtarget<SPIRVSubtarget>();
812
813 Register DstReg = MI.getOperand(0).getReg();
814 LLT DstTy = MRI.getType(DstReg);
815
816 if (needsVectorLegalization(DstTy, ST)) {
817 Register SrcReg = MI.getOperand(2).getReg();
818 Register ValReg = MI.getOperand(3).getReg();
819 LLT SrcTy = MRI.getType(SrcReg);
820 MachineOperand &IdxOperand = MI.getOperand(4);
821
822 if (getImm(IdxOperand, &MRI)) {
823 uint64_t IdxVal = foldImm(IdxOperand, &MRI);
824 if (IdxVal < SrcTy.getNumElements()) {
826 SPIRVTypeInst ElementType =
828 LLT ElementLLTTy = GR->getRegType(ElementType);
829 for (unsigned I = 0, E = SrcTy.getNumElements(); I < E; ++I) {
830 Register Reg = MRI.createGenericVirtualRegister(ElementLLTTy);
831 MRI.setRegClass(Reg, GR->getRegClass(ElementType));
832 GR->assignSPIRVTypeToVReg(ElementType, Reg, *MI.getMF());
833 Regs.push_back(Reg);
834 }
835 MIRBuilder.buildUnmerge(Regs, SrcReg);
836 Regs[IdxVal] = ValReg;
837 MIRBuilder.buildBuildVector(DstReg, Regs);
838 MI.eraseFromParent();
839 return true;
840 }
841 }
842
843 LLT EltTy = SrcTy.getElementType();
844 Align VecAlign;
845 MachinePointerInfo PtrInfo;
846 auto StackTemp = createStackTemporaryForVector(Helper, GR, SrcReg, SrcTy,
847 PtrInfo, VecAlign);
848
849 MIRBuilder.buildStore(SrcReg, StackTemp, PtrInfo, VecAlign);
850
851 Register IdxReg = IdxOperand.getReg();
852 LLT PtrTy = MRI.getType(StackTemp.getReg(0));
853 Register EltPtr = MRI.createGenericVirtualRegister(PtrTy);
854 auto Zero = MIRBuilder.buildConstant(LLT::scalar(32), 0);
855
856 MIRBuilder.buildIntrinsic(Intrinsic::spv_gep, ArrayRef<Register>{EltPtr})
857 .addImm(1) // InBounds
858 .addUse(StackTemp.getReg(0))
859 .addUse(Zero.getReg(0))
860 .addUse(IdxReg);
861
863 Align EltAlign = Helper.getStackTemporaryAlignment(EltTy);
864 MIRBuilder.buildStore(ValReg, EltPtr, EltPtrInfo, EltAlign);
865
866 MIRBuilder.buildLoad(DstReg, StackTemp, PtrInfo, VecAlign);
867 MI.eraseFromParent();
868 return true;
869 }
870 return true;
871}
872
875 MachineIRBuilder &MIRBuilder = Helper.MIRBuilder;
876 MachineRegisterInfo &MRI = *MIRBuilder.getMRI();
877 const SPIRVSubtarget &ST = MI.getMF()->getSubtarget<SPIRVSubtarget>();
878
879 Register SrcReg = MI.getOperand(2).getReg();
880 LLT SrcTy = MRI.getType(SrcReg);
881
882 if (needsVectorLegalization(SrcTy, ST)) {
883 Register DstReg = MI.getOperand(0).getReg();
884 MachineOperand &IdxOperand = MI.getOperand(3);
885
886 if (getImm(IdxOperand, &MRI)) {
887 uint64_t IdxVal = foldImm(IdxOperand, &MRI);
888 if (IdxVal < SrcTy.getNumElements()) {
889 LLT DstTy = MRI.getType(DstReg);
891 SPIRVTypeInst DstSpvTy = GR->getSPIRVTypeForVReg(DstReg);
892 for (unsigned I = 0, E = SrcTy.getNumElements(); I < E; ++I) {
893 if (I == IdxVal) {
894 Regs.push_back(DstReg);
895 } else {
897 MRI.setRegClass(Reg, GR->getRegClass(DstSpvTy));
898 GR->assignSPIRVTypeToVReg(DstSpvTy, Reg, *MI.getMF());
899 Regs.push_back(Reg);
900 }
901 }
902 MIRBuilder.buildUnmerge(Regs, SrcReg);
903 MI.eraseFromParent();
904 return true;
905 }
906 }
907
908 LLT EltTy = SrcTy.getElementType();
909 Align VecAlign;
910 MachinePointerInfo PtrInfo;
911 auto StackTemp = createStackTemporaryForVector(Helper, GR, SrcReg, SrcTy,
912 PtrInfo, VecAlign);
913
914 MIRBuilder.buildStore(SrcReg, StackTemp, PtrInfo, VecAlign);
915
916 Register IdxReg = IdxOperand.getReg();
917 LLT PtrTy = MRI.getType(StackTemp.getReg(0));
918 Register EltPtr = MRI.createGenericVirtualRegister(PtrTy);
919 auto Zero = MIRBuilder.buildConstant(LLT::scalar(32), 0);
920
921 MIRBuilder.buildIntrinsic(Intrinsic::spv_gep, ArrayRef<Register>{EltPtr})
922 .addImm(1) // InBounds
923 .addUse(StackTemp.getReg(0))
924 .addUse(Zero.getReg(0))
925 .addUse(IdxReg);
926
928 Align EltAlign = Helper.getStackTemporaryAlignment(EltTy);
929 MIRBuilder.buildLoad(DstReg, EltPtr, EltPtrInfo, EltAlign);
930
931 MI.eraseFromParent();
932 return true;
933 }
934 return true;
935}
936
939 MachineIRBuilder &MIRBuilder = Helper.MIRBuilder;
940 MachineRegisterInfo &MRI = *MIRBuilder.getMRI();
941 const SPIRVSubtarget &ST = MI.getMF()->getSubtarget<SPIRVSubtarget>();
942
943 Register DstReg = MI.getOperand(0).getReg();
944 LLT DstTy = MRI.getType(DstReg);
945
946 if (!needsVectorLegalization(DstTy, ST))
947 return true;
948
950 if (MI.getNumOperands() == 2) {
951 // The "null" case: no values are attached.
952 LLT EltTy = DstTy.getElementType();
953 auto Zero = MIRBuilder.buildConstant(EltTy, 0);
954 SPIRVTypeInst SpvDstTy = GR->getSPIRVTypeForVReg(DstReg);
955 SPIRVTypeInst SpvEltTy = GR->getScalarOrVectorComponentType(SpvDstTy);
956 GR->assignSPIRVTypeToVReg(SpvEltTy, Zero.getReg(0), MIRBuilder.getMF());
957 for (unsigned i = 0; i < DstTy.getNumElements(); ++i)
958 SrcRegs.push_back(Zero.getReg(0));
959 } else {
960 for (unsigned i = 2; i < MI.getNumOperands(); ++i) {
961 SrcRegs.push_back(MI.getOperand(i).getReg());
962 }
963 }
964 MIRBuilder.buildBuildVector(DstReg, SrcRegs);
965 MI.eraseFromParent();
966 return true;
967}
968
970 MachineInstr &MI) const {
971 LLVM_DEBUG(dbgs() << "legalizeIntrinsic: " << MI);
972 auto IntrinsicID = cast<GIntrinsic>(MI).getIntrinsicID();
973 switch (IntrinsicID) {
974 case Intrinsic::spv_bitcast:
975 return legalizeSpvBitcast(Helper, MI, GR);
976 case Intrinsic::spv_insertelt:
977 return legalizeSpvInsertElt(Helper, MI, GR);
978 case Intrinsic::spv_extractelt:
979 return legalizeSpvExtractElt(Helper, MI, GR);
980 case Intrinsic::spv_const_composite:
981 return legalizeSpvConstComposite(Helper, MI, GR);
982 }
983 return true;
984}
985
986bool SPIRVLegalizerInfo::legalizeBitcast(LegalizerHelper &Helper,
987 MachineInstr &MI) const {
988 // Once the G_BITCAST is using vectors that are allowed, we turn it back into
989 // an spv_bitcast to avoid verifier problems when the register types are the
990 // same for the source and the result. Note that the SPIR-V types associated
991 // with the bitcast can be different even if the register types are the same.
992 MachineIRBuilder &MIRBuilder = Helper.MIRBuilder;
993 Register DstReg = MI.getOperand(0).getReg();
994 Register SrcReg = MI.getOperand(1).getReg();
995 SmallVector<Register, 1> DstRegs = {DstReg};
996 MIRBuilder.buildIntrinsic(Intrinsic::spv_bitcast, DstRegs).addUse(SrcReg);
997 MI.eraseFromParent();
998 return true;
999}
1000
1001// Note this code was copied from LegalizerHelper::lowerISFPCLASS and adjusted
1002// to ensure that all instructions created during the lowering have SPIR-V types
1003// assigned to them.
1004bool SPIRVLegalizerInfo::legalizeIsFPClass(
1006 LostDebugLocObserver &LocObserver) const {
1007 auto [DstReg, DstTy, SrcReg, SrcTy] = MI.getFirst2RegLLTs();
1008 FPClassTest Mask = static_cast<FPClassTest>(MI.getOperand(2).getImm());
1009
1010 auto &MIRBuilder = Helper.MIRBuilder;
1011 auto &MF = MIRBuilder.getMF();
1012 MachineRegisterInfo &MRI = MF.getRegInfo();
1013
1014 Type *LLVMDstTy =
1015 IntegerType::get(MIRBuilder.getContext(), DstTy.getScalarSizeInBits());
1016 if (DstTy.isVector())
1017 LLVMDstTy = VectorType::get(LLVMDstTy, DstTy.getElementCount());
1018 SPIRVTypeInst SPIRVDstTy = GR->getOrCreateSPIRVType(
1019 LLVMDstTy, MIRBuilder, SPIRV::AccessQualifier::ReadWrite,
1020 /*EmitIR*/ true);
1021
1022 unsigned BitSize = SrcTy.getScalarSizeInBits();
1023 const fltSemantics &Semantics = getFltSemanticForLLT(SrcTy.getScalarType());
1024
1025 LLT IntTy = LLT::scalar(BitSize);
1026 Type *LLVMIntTy = IntegerType::get(MIRBuilder.getContext(), BitSize);
1027 if (SrcTy.isVector()) {
1028 IntTy = LLT::vector(SrcTy.getElementCount(), IntTy);
1029 LLVMIntTy = VectorType::get(LLVMIntTy, SrcTy.getElementCount());
1030 }
1031 SPIRVTypeInst SPIRVIntTy = GR->getOrCreateSPIRVType(
1032 LLVMIntTy, MIRBuilder, SPIRV::AccessQualifier::ReadWrite,
1033 /*EmitIR*/ true);
1034
1035 // Clang doesn't support capture of structured bindings:
1036 LLT DstTyCopy = DstTy;
1037 const auto assignSPIRVTy = [&](MachineInstrBuilder &&MI) {
1038 // Assign this MI's (assumed only) destination to one of the two types we
1039 // expect: either the G_IS_FPCLASS's destination type, or the integer type
1040 // bitcast from the source type.
1041 LLT MITy = MRI.getType(MI.getReg(0));
1042 assert((MITy == IntTy || MITy == DstTyCopy) &&
1043 "Unexpected LLT type while lowering G_IS_FPCLASS");
1044 SPIRVTypeInst SPVTy = MITy == IntTy ? SPIRVIntTy : SPIRVDstTy;
1045 GR->assignSPIRVTypeToVReg(SPVTy, MI.getReg(0), MF);
1046 return MI;
1047 };
1048
1049 // Helper to build and assign a constant in one go
1050 const auto buildSPIRVConstant = [&](LLT Ty, auto &&C) -> MachineInstrBuilder {
1051 if (!Ty.isFixedVector())
1052 return assignSPIRVTy(MIRBuilder.buildConstant(Ty, C));
1053 auto ScalarC = MIRBuilder.buildConstant(Ty.getScalarType(), C);
1054 assert((Ty == IntTy || Ty == DstTyCopy) &&
1055 "Unexpected LLT type while lowering constant for G_IS_FPCLASS");
1056 SPIRVTypeInst VecEltTy = GR->getOrCreateSPIRVType(
1057 (Ty == IntTy ? LLVMIntTy : LLVMDstTy)->getScalarType(), MIRBuilder,
1058 SPIRV::AccessQualifier::ReadWrite,
1059 /*EmitIR*/ true);
1060 GR->assignSPIRVTypeToVReg(VecEltTy, ScalarC.getReg(0), MF);
1061 return assignSPIRVTy(MIRBuilder.buildSplatBuildVector(Ty, ScalarC));
1062 };
1063
1064 if (Mask == fcNone) {
1065 MIRBuilder.buildCopy(DstReg, buildSPIRVConstant(DstTy, 0));
1066 MI.eraseFromParent();
1067 return true;
1068 }
1069 if (Mask == fcAllFlags) {
1070 MIRBuilder.buildCopy(DstReg, buildSPIRVConstant(DstTy, 1));
1071 MI.eraseFromParent();
1072 return true;
1073 }
1074
1075 // Note that rather than creating a COPY here (between a floating-point and
1076 // integer type of the same size) we create a SPIR-V bitcast immediately. We
1077 // can't create a G_BITCAST because the LLTs are the same, and we can't seem
1078 // to correctly lower COPYs to SPIR-V bitcasts at this moment.
1079 Register ResVReg = MRI.createGenericVirtualRegister(IntTy);
1080 MRI.setRegClass(ResVReg, GR->getRegClass(SPIRVIntTy));
1081 GR->assignSPIRVTypeToVReg(SPIRVIntTy, ResVReg, Helper.MIRBuilder.getMF());
1082 auto AsInt = MIRBuilder.buildInstr(SPIRV::OpBitcast)
1083 .addDef(ResVReg)
1084 .addUse(GR->getSPIRVTypeID(SPIRVIntTy))
1085 .addUse(SrcReg);
1086 AsInt = assignSPIRVTy(std::move(AsInt));
1087
1088 // Various masks.
1089 APInt SignBit = APInt::getSignMask(BitSize);
1090 APInt ValueMask = APInt::getSignedMaxValue(BitSize); // All bits but sign.
1091 APInt Inf = APFloat::getInf(Semantics).bitcastToAPInt(); // Exp and int bit.
1092 APInt ExpMask = Inf;
1093 APInt AllOneMantissa = APFloat::getLargest(Semantics).bitcastToAPInt() & ~Inf;
1094 APInt QNaNBitMask =
1095 APInt::getOneBitSet(BitSize, AllOneMantissa.getActiveBits() - 1);
1096 APInt InversionMask = APInt::getAllOnes(DstTy.getScalarSizeInBits());
1097
1098 auto SignBitC = buildSPIRVConstant(IntTy, SignBit);
1099 auto ValueMaskC = buildSPIRVConstant(IntTy, ValueMask);
1100 auto InfC = buildSPIRVConstant(IntTy, Inf);
1101 auto ExpMaskC = buildSPIRVConstant(IntTy, ExpMask);
1102 auto ZeroC = buildSPIRVConstant(IntTy, 0);
1103
1104 auto Abs = assignSPIRVTy(MIRBuilder.buildAnd(IntTy, AsInt, ValueMaskC));
1105 auto Sign = assignSPIRVTy(
1106 MIRBuilder.buildICmp(CmpInst::Predicate::ICMP_NE, DstTy, AsInt, Abs));
1107
1108 auto Res = buildSPIRVConstant(DstTy, 0);
1109
1110 const auto appendToRes = [&](MachineInstrBuilder &&ToAppend) {
1111 Res = assignSPIRVTy(
1112 MIRBuilder.buildOr(DstTyCopy, Res, assignSPIRVTy(std::move(ToAppend))));
1113 };
1114
1115 // Tests that involve more than one class should be processed first.
1116 if ((Mask & fcFinite) == fcFinite) {
1117 // finite(V) ==> abs(V) u< exp_mask
1118 appendToRes(MIRBuilder.buildICmp(CmpInst::Predicate::ICMP_ULT, DstTy, Abs,
1119 ExpMaskC));
1120 Mask &= ~fcFinite;
1121 } else if ((Mask & fcFinite) == fcPosFinite) {
1122 // finite(V) && V > 0 ==> V u< exp_mask
1123 appendToRes(MIRBuilder.buildICmp(CmpInst::Predicate::ICMP_ULT, DstTy, AsInt,
1124 ExpMaskC));
1125 Mask &= ~fcPosFinite;
1126 } else if ((Mask & fcFinite) == fcNegFinite) {
1127 // finite(V) && V < 0 ==> abs(V) u< exp_mask && signbit == 1
1128 auto Cmp = assignSPIRVTy(MIRBuilder.buildICmp(CmpInst::Predicate::ICMP_ULT,
1129 DstTy, Abs, ExpMaskC));
1130 appendToRes(MIRBuilder.buildAnd(DstTy, Cmp, Sign));
1131 Mask &= ~fcNegFinite;
1132 }
1133
1134 if (FPClassTest PartialCheck = Mask & (fcZero | fcSubnormal)) {
1135 // fcZero | fcSubnormal => test all exponent bits are 0
1136 // TODO: Handle sign bit specific cases
1137 // TODO: Handle inverted case
1138 if (PartialCheck == (fcZero | fcSubnormal)) {
1139 auto ExpBits = assignSPIRVTy(MIRBuilder.buildAnd(IntTy, AsInt, ExpMaskC));
1140 appendToRes(MIRBuilder.buildICmp(CmpInst::Predicate::ICMP_EQ, DstTy,
1141 ExpBits, ZeroC));
1142 Mask &= ~PartialCheck;
1143 }
1144 }
1145
1146 // Check for individual classes.
1147 if (FPClassTest PartialCheck = Mask & fcZero) {
1148 if (PartialCheck == fcPosZero)
1149 appendToRes(MIRBuilder.buildICmp(CmpInst::Predicate::ICMP_EQ, DstTy,
1150 AsInt, ZeroC));
1151 else if (PartialCheck == fcZero)
1152 appendToRes(
1153 MIRBuilder.buildICmp(CmpInst::Predicate::ICMP_EQ, DstTy, Abs, ZeroC));
1154 else // fcNegZero
1155 appendToRes(MIRBuilder.buildICmp(CmpInst::Predicate::ICMP_EQ, DstTy,
1156 AsInt, SignBitC));
1157 }
1158
1159 if (FPClassTest PartialCheck = Mask & fcSubnormal) {
1160 // issubnormal(V) ==> unsigned(abs(V) - 1) u< (all mantissa bits set)
1161 // issubnormal(V) && V>0 ==> unsigned(V - 1) u< (all mantissa bits set)
1162 auto V = (PartialCheck == fcPosSubnormal) ? AsInt : Abs;
1163 auto OneC = buildSPIRVConstant(IntTy, 1);
1164 auto VMinusOne = MIRBuilder.buildSub(IntTy, V, OneC);
1165 auto SubnormalRes = assignSPIRVTy(
1166 MIRBuilder.buildICmp(CmpInst::Predicate::ICMP_ULT, DstTy, VMinusOne,
1167 buildSPIRVConstant(IntTy, AllOneMantissa)));
1168 if (PartialCheck == fcNegSubnormal)
1169 SubnormalRes = MIRBuilder.buildAnd(DstTy, SubnormalRes, Sign);
1170 appendToRes(std::move(SubnormalRes));
1171 }
1172
1173 if (FPClassTest PartialCheck = Mask & fcInf) {
1174 if (PartialCheck == fcPosInf)
1175 appendToRes(MIRBuilder.buildICmp(CmpInst::Predicate::ICMP_EQ, DstTy,
1176 AsInt, InfC));
1177 else if (PartialCheck == fcInf)
1178 appendToRes(
1179 MIRBuilder.buildICmp(CmpInst::Predicate::ICMP_EQ, DstTy, Abs, InfC));
1180 else { // fcNegInf
1181 APInt NegInf = APFloat::getInf(Semantics, true).bitcastToAPInt();
1182 auto NegInfC = buildSPIRVConstant(IntTy, NegInf);
1183 appendToRes(MIRBuilder.buildICmp(CmpInst::Predicate::ICMP_EQ, DstTy,
1184 AsInt, NegInfC));
1185 }
1186 }
1187
1188 if (FPClassTest PartialCheck = Mask & fcNan) {
1189 auto InfWithQnanBitC =
1190 buildSPIRVConstant(IntTy, std::move(Inf) | QNaNBitMask);
1191 if (PartialCheck == fcNan) {
1192 // isnan(V) ==> abs(V) u> int(inf)
1193 appendToRes(
1194 MIRBuilder.buildICmp(CmpInst::Predicate::ICMP_UGT, DstTy, Abs, InfC));
1195 } else if (PartialCheck == fcQNan) {
1196 // isquiet(V) ==> abs(V) u>= (unsigned(Inf) | quiet_bit)
1197 appendToRes(MIRBuilder.buildICmp(CmpInst::Predicate::ICMP_UGE, DstTy, Abs,
1198 InfWithQnanBitC));
1199 } else { // fcSNan
1200 // issignaling(V) ==> abs(V) u> unsigned(Inf) &&
1201 // abs(V) u< (unsigned(Inf) | quiet_bit)
1202 auto IsNan = assignSPIRVTy(
1203 MIRBuilder.buildICmp(CmpInst::Predicate::ICMP_UGT, DstTy, Abs, InfC));
1204 auto IsNotQnan = assignSPIRVTy(MIRBuilder.buildICmp(
1205 CmpInst::Predicate::ICMP_ULT, DstTy, Abs, InfWithQnanBitC));
1206 appendToRes(MIRBuilder.buildAnd(DstTy, IsNan, IsNotQnan));
1207 }
1208 }
1209
1210 if (FPClassTest PartialCheck = Mask & fcNormal) {
1211 // isnormal(V) ==> (0 u< exp u< max_exp) ==> (unsigned(exp-1) u<
1212 // (max_exp-1))
1213 APInt ExpLSB = ExpMask & ~(ExpMask.shl(1));
1214 auto ExpMinusOne = assignSPIRVTy(
1215 MIRBuilder.buildSub(IntTy, Abs, buildSPIRVConstant(IntTy, ExpLSB)));
1216 APInt MaxExpMinusOne = std::move(ExpMask) - ExpLSB;
1217 auto NormalRes = assignSPIRVTy(
1218 MIRBuilder.buildICmp(CmpInst::Predicate::ICMP_ULT, DstTy, ExpMinusOne,
1219 buildSPIRVConstant(IntTy, MaxExpMinusOne)));
1220 if (PartialCheck == fcNegNormal)
1221 NormalRes = MIRBuilder.buildAnd(DstTy, NormalRes, Sign);
1222 else if (PartialCheck == fcPosNormal) {
1223 auto PosSign = assignSPIRVTy(MIRBuilder.buildXor(
1224 DstTy, Sign, buildSPIRVConstant(DstTy, InversionMask)));
1225 NormalRes = MIRBuilder.buildAnd(DstTy, NormalRes, PosSign);
1226 }
1227 appendToRes(std::move(NormalRes));
1228 }
1229
1230 MIRBuilder.buildCopy(DstReg, Res);
1231 MI.eraseFromParent();
1232 return true;
1233}
assert(UImm &&(UImm !=~static_cast< T >(0)) &&"Invalid immediate!")
static GCRegistry::Add< CoreCLRGC > E("coreclr", "CoreCLR-compatible GC")
static void scalarize(Instruction *I, SmallVectorImpl< Instruction * > &Worklist)
Declares convenience wrapper classes for interpreting MachineInstr instances as specific generic oper...
IRTranslator LLVM IR MI
#define I(x, y, z)
Definition MD5.cpp:57
This file declares the MachineIRBuilder class.
Register Reg
Promote Memory to Register
Definition Mem2Reg.cpp:110
ppc ctr loops verify
const SmallVectorImpl< MachineOperand > & Cond
static bool legalizeSpvInsertElt(LegalizerHelper &Helper, MachineInstr &MI, SPIRVGlobalRegistry *GR)
static bool needsVectorLegalization(const LLT &Ty, const SPIRVSubtarget &ST)
static MachineInstrBuilder createStackTemporaryForVector(LegalizerHelper &Helper, SPIRVGlobalRegistry *GR, Register SrcReg, LLT SrcTy, MachinePointerInfo &PtrInfo, Align &VecAlign)
static Register convertPtrToInt(Register Reg, LLT ConvTy, SPIRVTypeInst SpvType, LegalizerHelper &Helper, MachineRegisterInfo &MRI, SPIRVGlobalRegistry *GR)
LegalityPredicate typeOfExtendedScalars(unsigned TypeIdx, bool IsExtendedInts)
static bool legalizeExtractVectorElt(LegalizerHelper &Helper, MachineInstr &MI, SPIRVGlobalRegistry *GR)
static bool legalizeStore(LegalizerHelper &Helper, MachineInstr &MI, SPIRVGlobalRegistry *GR)
static bool legalizeSpvExtractElt(LegalizerHelper &Helper, MachineInstr &MI, SPIRVGlobalRegistry *GR)
static bool legalizeSpvBitcast(LegalizerHelper &Helper, MachineInstr &MI, SPIRVGlobalRegistry *GR)
static bool legalizeSpvConstComposite(LegalizerHelper &Helper, MachineInstr &MI, SPIRVGlobalRegistry *GR)
static bool legalizeLoad(LegalizerHelper &Helper, MachineInstr &MI, SPIRVGlobalRegistry *GR)
static bool legalizeInsertVectorElt(LegalizerHelper &Helper, MachineInstr &MI, SPIRVGlobalRegistry *GR)
#define LLVM_DEBUG(...)
Definition Debug.h:119
APInt bitcastToAPInt() const
Definition APFloat.h:1436
static APFloat getLargest(const fltSemantics &Sem, bool Negative=false)
Returns the largest finite number in the given semantics.
Definition APFloat.h:1203
static APFloat getInf(const fltSemantics &Sem, bool Negative=false)
Factory for Positive and Negative Infinity.
Definition APFloat.h:1163
static APInt getAllOnes(unsigned numBits)
Return an APInt of a specified width with all bits set.
Definition APInt.h:235
static APInt getSignMask(unsigned BitWidth)
Get the SignMask for a specific bit width.
Definition APInt.h:230
unsigned getActiveBits() const
Compute the number of active bits in the value.
Definition APInt.h:1535
static APInt getSignedMaxValue(unsigned numBits)
Gets maximum signed value of APInt for a specific bit width.
Definition APInt.h:210
APInt shl(unsigned shiftAmt) const
Left-shift function.
Definition APInt.h:880
static APInt getOneBitSet(unsigned numBits, unsigned BitNo)
Return an APInt with exactly one bit set in the result.
Definition APInt.h:240
Represent a constant reference to an array (0 or more elements consecutively in memory),...
Definition ArrayRef.h:40
static LLVM_ABI ArrayType * get(Type *ElementType, uint64_t NumElements)
This static method is the primary way to construct an ArrayType.
Predicate
This enumeration lists the possible predicates for CmpInst subclasses.
Definition InstrTypes.h:740
@ ICMP_UGE
unsigned greater or equal
Definition InstrTypes.h:764
@ ICMP_UGT
unsigned greater than
Definition InstrTypes.h:763
@ ICMP_ULT
unsigned less than
Definition InstrTypes.h:765
@ ICMP_NE
not equal
Definition InstrTypes.h:762
static constexpr ElementCount getFixed(ScalarTy MinVal)
Definition TypeSize.h:309
static LLVM_ABI IntegerType * get(LLVMContext &C, unsigned NumBits)
This static method is the primary way of constructing an IntegerType.
Definition Type.cpp:350
static constexpr LLT vector(ElementCount EC, unsigned ScalarSizeInBits)
Get a low-level vector of some number of elements and element width.
LLT getScalarType() const
constexpr bool isPointerVector() const
static constexpr LLT scalar(unsigned SizeInBits)
Get a low-level scalar or aggregate "bag of bits".
constexpr bool isValid() const
constexpr uint16_t getNumElements() const
Returns the number of elements in a vector LLT.
constexpr bool isVector() const
static constexpr LLT pointer(unsigned AddressSpace, unsigned SizeInBits)
Get a low-level pointer in the given address space.
constexpr bool isPointer() const
constexpr unsigned getAddressSpace() const
static constexpr LLT fixed_vector(unsigned NumElements, unsigned ScalarSizeInBits)
Get a low-level fixed-width vector of some number of elements and element width.
constexpr bool isPointerOrPointerVector() const
constexpr bool isFixedVector() const
Returns true if the LLT is a fixed vector.
constexpr TypeSize getSizeInBytes() const
Returns the total size of the type in bytes, i.e.
LLT getElementType() const
Returns the vector's element type. Only valid for vector types.
LLVM_ABI void computeTables()
Compute any ancillary tables needed to quickly decide how an operation should be handled.
LegalizeRuleSet & legalFor(std::initializer_list< LLT > Types)
The instruction is legal when type index 0 is any type in the given list.
LegalizeRuleSet & fewerElementsIf(LegalityPredicate Predicate, LegalizeMutation Mutation)
Remove elements to reach the type selected by the mutation if the predicate is true.
LegalizeRuleSet & moreElementsToNextPow2(unsigned TypeIdx)
Add more elements to the vector to reach the next power of two.
LegalizeRuleSet & lower()
The instruction is lowered.
LegalizeRuleSet & scalarizeIf(LegalityPredicate Predicate, unsigned TypeIdx)
LegalizeRuleSet & lowerIf(LegalityPredicate Predicate)
The instruction is lowered if predicate is true.
LegalizeRuleSet & custom()
Unconditionally custom lower.
LegalizeRuleSet & unsupportedIf(LegalityPredicate Predicate)
LegalizeRuleSet & alwaysLegal()
LegalizeRuleSet & scalarize(unsigned TypeIdx)
LegalizeRuleSet & legalForCartesianProduct(std::initializer_list< LLT > Types)
The instruction is legal when type indexes 0 and 1 are both in the given list.
LegalizeRuleSet & legalIf(LegalityPredicate Predicate)
The instruction is legal if predicate is true.
LegalizeRuleSet & customFor(std::initializer_list< LLT > Types)
LLVM_ABI MachineInstrBuilder createStackTemporary(TypeSize Bytes, Align Alignment, MachinePointerInfo &PtrInfo)
Create a stack temporary based on the size in bytes and the alignment.
MachineIRBuilder & MIRBuilder
Expose MIRBuilder so clients can set their own RecordInsertInstruction functions.
LLVM_ABI Align getStackTemporaryAlignment(LLT Type, Align MinAlign=Align()) const
Return the alignment to use for a stack temporary object with the given type.
LegalizeRuleSet & getActionDefinitionsBuilder(unsigned Opcode)
Get the action definition builder for the given opcode.
const LegacyLegalizerInfo & getLegacyLegalizerInfo() const
MachineRegisterInfo & getRegInfo()
getRegInfo - Return information about the registers currently in use.
Helper class to build MachineInstr.
LLVMContext & getContext() const
MachineInstrBuilder buildUnmerge(ArrayRef< LLT > Res, const SrcOp &Op)
Build and insert Res0, ... = G_UNMERGE_VALUES Op.
MachineInstrBuilder buildAnd(const DstOp &Dst, const SrcOp &Src0, const SrcOp &Src1)
Build and insert Res = G_AND Op0, Op1.
MachineInstrBuilder buildICmp(CmpInst::Predicate Pred, const DstOp &Res, const SrcOp &Op0, const SrcOp &Op1, std::optional< unsigned > Flags=std::nullopt)
Build and insert a Res = G_ICMP Pred, Op0, Op1.
MachineInstrBuilder buildSub(const DstOp &Dst, const SrcOp &Src0, const SrcOp &Src1, std::optional< unsigned > Flags=std::nullopt)
Build and insert Res = G_SUB Op0, Op1.
MachineInstrBuilder buildIntrinsic(Intrinsic::ID ID, ArrayRef< Register > Res, bool HasSideEffects, bool isConvergent)
Build and insert a G_INTRINSIC instruction.
MachineInstrBuilder buildSplatBuildVector(const DstOp &Res, const SrcOp &Src)
Build and insert Res = G_BUILD_VECTOR with Src replicated to fill the number of elements.
MachineInstrBuilder buildBuildVector(const DstOp &Res, ArrayRef< Register > Ops)
Build and insert Res = G_BUILD_VECTOR Op0, ...
MachineInstrBuilder buildLoad(const DstOp &Res, const SrcOp &Addr, MachineMemOperand &MMO)
Build and insert Res = G_LOAD Addr, MMO.
MachineInstrBuilder buildStore(const SrcOp &Val, const SrcOp &Addr, MachineMemOperand &MMO)
Build and insert G_STORE Val, Addr, MMO.
MachineInstrBuilder buildInstr(unsigned Opcode)
Build and insert <empty> = Opcode <empty>.
MachineFunction & getMF()
Getter for the function we currently build.
MachineInstrBuilder buildBitcast(const DstOp &Dst, const SrcOp &Src)
Build and insert Dst = G_BITCAST Src.
MachineRegisterInfo * getMRI()
Getter for MRI.
MachineInstrBuilder buildOr(const DstOp &Dst, const SrcOp &Src0, const SrcOp &Src1, std::optional< unsigned > Flags=std::nullopt)
Build and insert Res = G_OR Op0, Op1.
MachineInstrBuilder buildCopy(const DstOp &Res, const SrcOp &Op)
Build and insert Res = COPY Op.
MachineInstrBuilder buildXor(const DstOp &Dst, const SrcOp &Src0, const SrcOp &Src1)
Build and insert Res = G_XOR Op0, Op1.
virtual MachineInstrBuilder buildConstant(const DstOp &Res, const ConstantInt &Val)
Build and insert Res = G_CONSTANT Val.
const MachineInstrBuilder & addUse(Register RegNo, RegState Flags={}, unsigned SubReg=0) const
Add a virtual register use operand.
const MachineInstrBuilder & addDef(Register RegNo, RegState Flags={}, unsigned SubReg=0) const
Add a virtual register definition operand.
Representation of each machine instruction.
A description of a memory reference used in the backend.
const MachinePointerInfo & getPointerInfo() const
LLVM_ABI Align getAlign() const
Return the minimum known alignment in bytes of the actual memory reference.
MachineOperand class - Representation of each machine instruction operand.
Register getReg() const
getReg - Returns the register number.
MachineRegisterInfo - Keep track of information for virtual and physical registers,...
LLT getType(Register Reg) const
Get the low-level type of Reg or LLT{} if Reg is not a generic (target independent) virtual register.
LLVM_ABI void setRegClass(Register Reg, const TargetRegisterClass *RC)
setRegClass - Set the register class of the specified virtual register.
LLVM_ABI Register createGenericVirtualRegister(LLT Ty, StringRef Name="")
Create and return a new generic virtual register with low-level type Ty.
Wrapper class representing virtual and physical registers.
Definition Register.h:20
void assignSPIRVTypeToVReg(SPIRVTypeInst Type, Register VReg, const MachineFunction &MF)
const TargetRegisterClass * getRegClass(SPIRVTypeInst SpvType) const
const Type * getTypeForSPIRVType(SPIRVTypeInst Ty) const
LLT getRegType(SPIRVTypeInst SpvType) const
SPIRVTypeInst getOrCreateSPIRVPointerType(const Type *BaseType, MachineIRBuilder &MIRBuilder, SPIRV::StorageClass::StorageClass SC)
SPIRVTypeInst getScalarOrVectorComponentType(SPIRVTypeInst Type) const
SPIRVTypeInst getOrCreateSPIRVType(const Type *Type, MachineInstr &I, SPIRV::AccessQualifier::AccessQualifier AQ, bool EmitIR)
SPIRVTypeInst getSPIRVTypeForVReg(Register VReg, const MachineFunction *MF=nullptr) const
SPIRVLegalizerInfo(const SPIRVSubtarget &ST)
bool legalizeCustom(LegalizerHelper &Helper, MachineInstr &MI, LostDebugLocObserver &LocObserver) const override
Called for instructions with the Custom LegalizationAction.
bool legalizeIntrinsic(LegalizerHelper &Helper, MachineInstr &MI) const override
SPIRVGlobalRegistry * getSPIRVGlobalRegistry() const
void push_back(const T &Elt)
This is a 'vector' (really, a variable-sized array), optimized for the case when the array is small.
static constexpr TypeSize getFixed(ScalarTy ExactSize)
Definition TypeSize.h:343
The instances of the Type class are immutable: once they are created, they are never changed.
Definition Type.h:46
static LLVM_ABI VectorType * get(Type *ElementType, ElementCount EC)
This static method is the primary way to construct an VectorType.
constexpr std::underlying_type_t< E > Mask()
Get a bitmask with 1s in all places up to the high-order bit of E's largest value.
@ C
The default llvm calling convention, compatible with C.
Definition CallingConv.h:34
LLVM_ABI LegalityPredicate isScalar(unsigned TypeIdx)
True iff the specified type index is a scalar.
LLVM_ABI LegalityPredicate numElementsNotPow2(unsigned TypeIdx)
True iff the specified type index is a vector whose element count is not a power of 2.
LLVM_ABI LegalityPredicate vectorElementCountIsLessThanOrEqualTo(unsigned TypeIdx, unsigned Size)
True iff the specified type index is a vector with a number of elements that's less than or equal to ...
LLVM_ABI LegalityPredicate typeInSet(unsigned TypeIdx, std::initializer_list< LLT > TypesInit)
True iff the given type index is one of the specified types.
LLVM_ABI LegalityPredicate vectorElementCountIsGreaterThan(unsigned TypeIdx, unsigned Size)
True iff the specified type index is a vector with a number of elements that's greater than the given...
Predicate any(Predicate P0, Predicate P1)
True iff P0 or P1 are true.
LegalityPredicate typeIsNot(unsigned TypeIdx, LLT Type)
True iff the given type index is not the specified type.
Predicate all(Predicate P0, Predicate P1)
True iff P0 and P1 are true.
LLVM_ABI LegalityPredicate typeIs(unsigned TypeIdx, LLT TypesInit)
True iff the given type index is the specified type.
LLVM_ABI LegalizeMutation changeElementCountTo(unsigned TypeIdx, unsigned FromTypeIdx)
Keep the same scalar or element type as TypeIdx, but take the number of elements from FromTypeIdx.
LLVM_ABI LegalizeMutation changeElementSizeTo(unsigned TypeIdx, unsigned FromTypeIdx)
Change the scalar size or element size to have the same scalar size as type index FromIndex.
Invariant opcodes: All instruction sets have these as their low opcodes.
This is an optimization pass for GlobalISel generic memory operations.
LLVM_ABI const llvm::fltSemantics & getFltSemanticForLLT(LLT Ty)
Get the appropriate floating point arithmetic semantic based on the bit size of the given scalar LLT.
std::function< bool(const LegalityQuery &)> LegalityPredicate
MachineInstr * getImm(const MachineOperand &MO, const MachineRegisterInfo *MRI)
constexpr bool isPowerOf2_32(uint32_t Value)
Return true if the argument is a power of two > 0.
Definition MathExtras.h:279
FPClassTest
Floating-point class tests, supported by 'is_fpclass' intrinsic.
LLVM_ABI raw_ostream & dbgs()
dbgs() - This returns a reference to a raw_ostream for debugging messages.
Definition Debug.cpp:209
const std::set< unsigned > & getTypeFoldingSupportedOpcodes()
int64_t foldImm(const MachineOperand &MO, const MachineRegisterInfo *MRI)
decltype(auto) cast(const From &Val)
cast<X> - Return the argument parameter cast to the specified type.
Definition Casting.h:559
Align commonAlignment(Align A, uint64_t Offset)
Returns the alignment that satisfies both alignments.
Definition Alignment.h:201
This struct is a compact representation of a valid (non-zero power of two) alignment.
Definition Alignment.h:39
The LegalityQuery object bundles together all the information that's needed to decide whether a given...
ArrayRef< LLT > Types
This class contains a discriminated union of information about pointers in memory operands,...
MachinePointerInfo getWithOffset(int64_t O) const