106 std::initializer_list<LLT> PackedVectorAllTypeList = {
112 std::initializer_list<LLT> ScalarAndPtrTypesList = {s8, s16, s32, s64, p0};
116 const TargetMachine &TM = ST.getTargetLowering()->getTargetMachine();
119 if (!ST.hasNEON() || !ST.hasFPARMv8()) {
126 const bool HasFP16 = ST.hasFullFP16();
127 const LLT &MinFPScalar = HasFP16 ? f16 : f32;
129 const bool HasCSSC = ST.hasCSSC();
130 const bool HasRCPC3 = ST.hasRCPC3();
131 const bool HasSVE = ST.hasSVE();
134 {G_IMPLICIT_DEF, G_FREEZE, G_CONSTANT_FOLD_BARRIER})
135 .legalFor({p0, s8, s16, s32, s64})
136 .legalFor({v2s8, v4s8, v8s8, v16s8, v2s16, v4s16, v8s16, v2s32, v4s32,
138 .widenScalarToNextPow2(0)
151 .legalFor(PackedVectorAllTypeList)
165 .widenScalarToNextPow2(0)
170 .maxScalarIf(
typeInSet(0, {s64, p0}), 1, s32);
175 .widenScalarToNextPow2(1)
180 .maxScalarIf(
typeInSet(1, {s64, p0}), 0, s32)
181 .maxScalarIf(
typeInSet(1, {s128}), 0, s64);
184 .legalFor({i32, i64, v8i8, v16i8, v4i16, v8i16, v2i32, v4i32, v2i64})
185 .legalFor(HasSVE, {nxv16i8, nxv8i16, nxv4i32, nxv2i64})
186 .widenScalarToNextPow2(0)
194 return Query.
Types[0].getNumElements() <= 2;
199 return Query.
Types[0].getNumElements() <= 4;
204 return Query.
Types[0].getNumElements() <= 16;
211 .
legalFor({i32, i64, v8i8, v16i8, v4i16, v8i16, v2i32, v4i32, v2i64})
212 .widenScalarToNextPow2(0)
220 return Query.
Types[0].getNumElements() <= 2;
225 return Query.
Types[0].getNumElements() <= 4;
230 return Query.
Types[0].getNumElements() <= 16;
238 const auto &SrcTy = Query.
Types[0];
239 const auto &AmtTy = Query.
Types[1];
240 return !SrcTy.isVector() && SrcTy.getSizeInBits() == 32 &&
241 AmtTy.getSizeInBits() == 32;
255 .widenScalarToNextPow2(0)
269 .
legalFor({{p0, i64}, {v2p0, v2i64}})
270 .clampScalarOrElt(1, s64, s64)
276 .legalFor({i32, i64})
278 .clampScalar(0, s32, s64)
283 .lowerFor({i8, i16, i32, i64, v2i32, v4i32, v2i64})
292 .widenScalarToNextPow2(0, 32)
297 .legalFor({i64, v16i8, v8i16, v4i32})
303 .legalFor({v8i8, v16i8, v4i16, v8i16, v2i32, v4i32})
304 .legalFor(HasCSSC, {i32, i64})
305 .minScalar(HasCSSC, 0, s32)
314 .legalFor({v16i8, v8i16, v4i32, v2i64, v2p0, v8i8, v4i16, v2i32})
318 return SrcTy.isScalar() && SrcTy.getSizeInBits() < 128;
322 [=](
const LegalityQuery &Query) {
return std::make_pair(0, v4i16); })
325 [=](
const LegalityQuery &Query) {
return std::make_pair(0, v2i32); })
326 .clampNumElements(0, v8s8, v16s8)
334 {G_ABDS, G_ABDU, G_UAVGFLOOR, G_UAVGCEIL, G_SAVGFLOOR, G_SAVGCEIL})
335 .legalFor({v8i8, v16i8, v4i16, v8i16, v2i32, v4i32})
339 {G_SADDE, G_SSUBE, G_UADDE, G_USUBE, G_SADDO, G_SSUBO, G_UADDO, G_USUBO})
340 .legalFor({{i32, i32}, {i64, i32}})
341 .clampScalar(0, s32, s64)
346 .customFor({{i32, i32}, {i32, i64}, {i64, i64}})
352 return Q.
Types[0].isScalar() && Q.
Types[1].getScalarSizeInBits() < 64;
358 .customFor({{s32, s32}, {s64, s64}});
362 .
legalFor(HasCSSC, {{i32, i32}, {i64, i64}})
363 .legalFor({{v8i8, v8i8}, {v16i8, v16i8}})
364 .customFor(!HasCSSC, {{s32, s32}, {s64, s64}})
365 .customFor({{s128, s128},
371 .clampScalar(0, s32, s128)
384 .legalFor({{i32, i32},
392 .widenScalarToNextPow2(1, 32)
410 .customFor(!HasCSSC, {s32, s64});
416 .widenScalarToNextPow2(0, 32)
428 .
legalFor({i32, i64, v4i16, v8i16, v2i32, v4i32, v2i64})
437 .legalFor({v8i8, v16i8, v4i16, v8i16, v2i32, v4i32, v2i64})
438 .legalFor(HasSVE, {nxv16i8, nxv8i16, nxv4i32, nxv2i64})
439 .clampNumElements(0, v8s8, v16s8)
448 {G_FADD, G_FSUB, G_FMUL, G_FDIV, G_FMA, G_FSQRT, G_FMAXNUM, G_FMINNUM,
449 G_FMAXIMUM, G_FMINIMUM, G_FCEIL, G_FFLOOR, G_FRINT, G_FNEARBYINT,
450 G_INTRINSIC_TRUNC, G_INTRINSIC_ROUND, G_INTRINSIC_ROUNDEVEN})
451 .legalFor({f32, f64, v2f32, v4f32, v2f64})
452 .legalFor(HasFP16, {f16, v4f16, v8f16})
457 return (!HasFP16 && Q.
Types[0].getScalarType().isFloat16()) ||
458 Q.
Types[0].getScalarType().isBFloat16();
461 .clampNumElements(0, v4s16, v8s16)
467 .legalFor({f32, f64, v2f32, v4f32, v2f64})
468 .legalFor(HasFP16, {f16, v4f16, v8f16})
483 G_FLOG10, G_FTAN, G_FEXP, G_FEXP2, G_FEXP10,
484 G_FACOS, G_FASIN, G_FATAN, G_FATAN2, G_FCOSH,
485 G_FSINH, G_FTANH, G_FMODF})
494 .
libcallFor({{f32, i32}, {f64, i32}, {f128, i32}});
497 .legalFor({{i32, f32}, {i32, f64}, {i64, f32}, {i64, f64}})
498 .legalFor(HasFP16, {{i32, f16}, {i64, f16}})
503 .legalFor({{i64, f32}, {i64, f64}})
504 .legalFor(HasFP16, {{i64, f16}})
522 for (
unsigned Op : {G_SEXTLOAD, G_ZEXTLOAD}) {
525 if (
Op == G_SEXTLOAD)
530 .legalForTypesWithMemDesc({{s32, p0, s8, 8},
538 {v2s32, p0, s64, 8}})
539 .widenScalarToNextPow2(0)
540 .clampScalar(0, s32, s64)
543 .unsupportedIfMemSizeNotPow2()
555 return HasRCPC3 && Query.
Types[0] == s128 &&
559 return Query.
Types[0] == s128 &&
562 .legalForTypesWithMemDesc({{s8, p0, s8, 8},
569 {v16s8, p0, s128, 8},
571 {v8s16, p0, s128, 8},
573 {v4s32, p0, s128, 8},
574 {v2s64, p0, s128, 8}})
576 .legalForTypesWithMemDesc(
577 {{s32, p0, s8, 8}, {s32, p0, s16, 8}, {s64, p0, s32, 8}})
578 .legalForTypesWithMemDesc({
580 {nxv16s8, p0, nxv16s8, 8},
581 {nxv8s16, p0, nxv8s16, 8},
582 {nxv4s32, p0, nxv4s32, 8},
583 {nxv2s64, p0, nxv2s64, 8},
585 .widenScalarToNextPow2(0, 8)
596 return Query.
Types[0].isScalar() &&
598 Query.
Types[0].getSizeInBits() > 32;
607 .customIf(IsPtrVecPred)
613 return HasRCPC3 && Query.
Types[0] == s128 &&
617 return Query.
Types[0] == s128 &&
625 {{s8, p0, s8, 8}, {s16, p0, s8, 8},
628 {s16, p0, s16, 8}, {s32, p0, s16, 8},
630 {s32, p0, s8, 8}, {s32, p0, s16, 8}, {s32, p0, s32, 8},
631 {s64, p0, s64, 8}, {s64, p0, s32, 8},
632 {p0, p0, s64, 8}, {s128, p0, s128, 8}, {v16s8, p0, s128, 8},
633 {v8s8, p0, s64, 8}, {v4s16, p0, s64, 8}, {v8s16, p0, s128, 8},
634 {v2s32, p0, s64, 8}, {v4s32, p0, s128, 8}, {v2s64, p0, s128, 8}})
635 .legalForTypesWithMemDesc({
640 {nxv16s8, p0, nxv16s8, 8},
641 {nxv8s16, p0, nxv8s16, 8},
642 {nxv4s32, p0, nxv4s32, 8},
643 {nxv2s64, p0, nxv2s64, 8},
645 .clampScalar(0, s8, s64)
648 return Query.
Types[0].isScalar() &&
652 .clampMaxNumElements(0, s8, 16)
661 return Query.
Types[0].getSizeInBits() ==
662 Query.
MMODescrs[0].MemoryTy.getSizeInBits();
668 .customIf(IsPtrVecPred)
686 {p0, v16s8, v16s8, 8},
687 {p0, v4s16, v4s16, 8},
688 {p0, v8s16, v8s16, 8},
689 {p0, v2s32, v2s32, 8},
690 {p0, v4s32, v4s32, 8},
691 {p0, v2s64, v2s64, 8},
697 auto IndexedLoadBasicPred = [=](
const LegalityQuery &Query) {
725 return MemTy == s8 || MemTy == s16;
727 return MemTy == s8 || MemTy == s16 || MemTy == s32;
735 .widenScalarToNextPow2(0)
742 .
legalFor({{i32, i32}, {i32, i64}, {i32, p0}})
752 return Ty.isVector() && !SrcTy.isPointerVector() &&
753 Ty.getElementType() != SrcTy.getElementType();
761 return Query.
Types[1].isPointerVector();
778 .legalFor(HasFP16, {{i32, f16}, {v4i16, v4f16}, {v8i16, v8f16}})
783 return (!HasFP16 && Q.
Types[1].getScalarType().isFloat16()) ||
784 Q.
Types[1].getScalarType().isBFloat16();
792 return Ty.isVector() && !SrcTy.isPointerVector() &&
793 Ty.getElementType() != SrcTy.getElementType();
796 .clampNumElements(1, v4s16, v8s16)
804 unsigned DstSize = Query.
Types[0].getSizeInBits();
807 if (Query.
Types[0].isVector())
810 if (DstSize < 8 || DstSize >= 128 || !
isPowerOf2_32(DstSize))
818 unsigned SrcSize = SrcTy.getSizeInBits();
825 .legalIf(ExtLegalFunc)
826 .
legalFor({{v8s16, v8s8}, {v4s32, v4s16}, {v2s64, v2s32}})
827 .clampScalar(0, s64, s64)
834 return (Query.
Types[0].getScalarSizeInBits() >
835 Query.
Types[1].getScalarSizeInBits() * 2) &&
836 Query.
Types[0].isVector() &&
837 (Query.
Types[1].getScalarSizeInBits() == 8 ||
838 Query.
Types[1].getScalarSizeInBits() == 16);
840 .clampMinNumElements(1, s8, 8)
845 .
legalFor({{v8s8, v8s16}, {v4s16, v4s32}, {v2s32, v2s64}})
856 return DstTy.
isVector() && SrcTy.getSizeInBits() > 128 &&
859 .clampMinNumElements(0, s8, 8)
864 .legalFor({{v8i8, v8i16}, {v4i16, v4i32}, {v2i32, v2i64}})
865 .clampNumElements(0, v2s32, v2s32);
868 .
legalFor({i32, i64, v8i8, v16i8, v4i16, v8i16, v2i32, v4i32, v2i64})
879 {{f16, f32}, {f16, f64}, {f32, f64}, {v4f16, v4f32}, {v2f32, v2f64}})
880 .legalFor(ST.hasBF16(), {{bf16, f32}, {v4bf16, v4f32}})
881 .libcallFor({{f16, f128}, {f32, f128}, {f64, f128}})
889 .lowerFor({{bf16, f32}, {v4bf16, v4f32}})
891 .clampNumElements(1, v4s32, v4s32)
895 getActionDefinitionsBuilder(G_FPEXT)
903 .libcallFor({{f128, f64}, {f128, f32}, {f128, f16}})
914 .clampNumElements(0, v4s32, v4s32)
919 getActionDefinitionsBuilder({G_FPTOSI, G_FPTOUI})
920 .legalFor({{i32, f32},
928 {{i32, f16}, {i64, f16}, {v4i16, v4f16}, {v8i16, v8f16}})
935 return Query.
Types[1] == f16 && Query.
Types[0].getSizeInBits() > 64;
944 return Query.
Types[0].getScalarSizeInBits() <= 64 &&
945 Query.
Types[0].getScalarSizeInBits() >
946 Query.
Types[1].getScalarSizeInBits();
951 return Query.
Types[1].getScalarSizeInBits() <= 64 &&
952 Query.
Types[0].getScalarSizeInBits() <
953 Query.
Types[1].getScalarSizeInBits();
956 .clampNumElements(0, v4s16, v8s16)
960 {{i32, f128}, {i64, f128}, {i128, f128}, {i128, f32}, {i128, f64}});
962 getActionDefinitionsBuilder({G_FPTOSI_SAT, G_FPTOUI_SAT})
963 .legalFor({{i32, f32},
972 {{i16, f16}, {i32, f16}, {i64, f16}, {v4i16, v4f16}, {v8i16, v8f16}})
980 return Query.
Types[1] == f16 && Query.
Types[0].getSizeInBits() > 64;
990 unsigned ITySize = Query.
Types[0].getScalarSizeInBits();
991 return (ITySize == 16 || ITySize == 32 || ITySize == 64) &&
992 ITySize > Query.
Types[1].getScalarSizeInBits();
997 unsigned FTySize = Query.
Types[1].getScalarSizeInBits();
998 return (FTySize == 16 || FTySize == 32 || FTySize == 64) &&
999 Query.
Types[0].getScalarSizeInBits() < FTySize;
1007 getActionDefinitionsBuilder({G_SITOFP, G_UITOFP})
1008 .legalFor({{f32, i32},
1016 {{f16, i32}, {f16, i64}, {v4f16, v4i16}, {v8f16, v8i16}})
1018 return Query.
Types[0].getScalarType().isBFloat16();
1026 return Query.
Types[1].isVector() &&
1027 Query.
Types[1].getScalarSizeInBits() == 64 &&
1028 Query.
Types[0].getScalarSizeInBits() == 16;
1030 .widenScalarOrEltToNextPow2OrMinSize(0, HasFP16 ? 16 : 32)
1034 return Query.
Types[0].getScalarSizeInBits() == 32 &&
1035 Query.
Types[1].getScalarSizeInBits() == 64;
1040 return Query.
Types[1].getScalarSizeInBits() <= 64 &&
1041 Query.
Types[0].getScalarSizeInBits() <
1042 Query.
Types[1].getScalarSizeInBits();
1047 return Query.
Types[0].getScalarSizeInBits() <= 64 &&
1048 Query.
Types[0].getScalarSizeInBits() >
1049 Query.
Types[1].getScalarSizeInBits();
1052 .clampNumElements(0, v4s16, v8s16)
1064 getActionDefinitionsBuilder(G_BRCOND)
1066 .clampScalar(0, s32, s32);
1067 getActionDefinitionsBuilder(G_BRINDIRECT).
legalFor({p0});
1069 getActionDefinitionsBuilder(G_SELECT)
1070 .
legalFor({{s32, s32}, {s64, s32}, {p0, s32}})
1071 .widenScalarToNextPow2(0)
1079 getActionDefinitionsBuilder(G_FRAME_INDEX).
legalFor({p0});
1082 getActionDefinitionsBuilder(G_GLOBAL_VALUE).
custom();
1084 getActionDefinitionsBuilder(G_GLOBAL_VALUE).
legalFor({p0});
1086 getActionDefinitionsBuilder(G_PTRAUTH_GLOBAL_VALUE)
1089 getActionDefinitionsBuilder(G_PTRTOINT)
1090 .
legalFor({{i64, p0}, {v2i64, v2p0}})
1091 .widenScalarToNextPow2(0, 64)
1095 getActionDefinitionsBuilder(G_INTTOPTR)
1097 return Query.
Types[0].getSizeInBits() != Query.
Types[1].getSizeInBits();
1099 .legalFor({{p0, i64}, {v2p0, v2i64}})
1100 .clampMaxNumElements(1, s64, 2);
1104 getActionDefinitionsBuilder(G_BITCAST)
1107 .legalForCartesianProduct({s32, v2s16, v4s8})
1108 .legalForCartesianProduct({s64, v8s8, v4s16, v2s32})
1109 .legalForCartesianProduct({s128, v16s8, v8s16, v4s32, v2s64, v2p0})
1118 return Query.
Types[0].isVector() != Query.
Types[1].isVector();
1127 getActionDefinitionsBuilder(G_VASTART).
legalFor({p0});
1131 getActionDefinitionsBuilder(G_VAARG)
1133 .clampScalar(0, s8, s64)
1136 getActionDefinitionsBuilder(G_ATOMIC_CMPXCHG_WITH_SUCCESS)
1140 bool UseOutlineAtomics =
ST.outlineAtomics() && !
ST.hasLSE();
1142 getActionDefinitionsBuilder(G_ATOMIC_CMPXCHG)
1143 .legalFor(!UseOutlineAtomics, {{s32, p0}, {s64, p0}})
1144 .customFor(!UseOutlineAtomics, {{s128, p0}})
1145 .libcallFor(UseOutlineAtomics,
1146 {{s8, p0}, {s16, p0}, {s32, p0}, {s64, p0}, {s128, p0}})
1147 .clampScalar(0, s32, s64);
1149 getActionDefinitionsBuilder({G_ATOMICRMW_XCHG, G_ATOMICRMW_ADD,
1150 G_ATOMICRMW_SUB, G_ATOMICRMW_AND, G_ATOMICRMW_OR,
1152 .legalFor(!UseOutlineAtomics, {{s32, p0}, {s64, p0}})
1153 .libcallFor(UseOutlineAtomics,
1154 {{s8, p0}, {s16, p0}, {s32, p0}, {s64, p0}})
1155 .clampScalar(0, s32, s64);
1159 getActionDefinitionsBuilder(
1160 {G_ATOMICRMW_MIN, G_ATOMICRMW_MAX, G_ATOMICRMW_UMIN, G_ATOMICRMW_UMAX})
1162 .clampScalar(0, s32, s64);
1164 getActionDefinitionsBuilder(G_BLOCK_ADDR).legalFor({p0});
1167 for (
unsigned Op : {G_MERGE_VALUES, G_UNMERGE_VALUES}) {
1168 unsigned BigTyIdx =
Op == G_MERGE_VALUES ? 0 : 1;
1169 unsigned LitTyIdx =
Op == G_MERGE_VALUES ? 1 : 0;
1170 getActionDefinitionsBuilder(
Op)
1171 .widenScalarToNextPow2(LitTyIdx, 8)
1172 .widenScalarToNextPow2(BigTyIdx, 32)
1173 .clampScalar(LitTyIdx, s8, s64)
1174 .clampScalar(BigTyIdx, s32, s128)
1176 switch (Q.
Types[BigTyIdx].getSizeInBits()) {
1184 switch (Q.
Types[LitTyIdx].getSizeInBits()) {
1197 getActionDefinitionsBuilder(G_EXTRACT_VECTOR_ELT)
1198 .legalFor(HasSVE, {{s16, nxv16s8, s64},
1199 {s16, nxv8s16, s64},
1200 {s32, nxv4s32, s64},
1201 {s64, nxv2s64, s64}})
1203 const LLT &EltTy = Query.
Types[1].getElementType();
1204 if (Query.
Types[1].isScalableVector())
1206 return Query.
Types[0] != EltTy;
1211 return VecTy == v8s8 || VecTy == v16s8 || VecTy == v2s16 ||
1212 VecTy == v4s16 || VecTy == v8s16 || VecTy == v2s32 ||
1213 VecTy == v4s32 || VecTy == v2s64 || VecTy == v2p0;
1219 return Query.
Types[1].isFixedVector() &&
1220 Query.
Types[1].getNumElements() <= 2;
1225 return Query.
Types[1].isFixedVector() &&
1226 Query.
Types[1].getNumElements() <= 4;
1231 return Query.
Types[1].isFixedVector() &&
1232 Query.
Types[1].getNumElements() <= 8;
1237 return Query.
Types[1].isFixedVector() &&
1238 Query.
Types[1].getNumElements() <= 16;
1241 .minScalarOrElt(0, s8)
1242 .moreElementsToNextPow2(1)
1243 .clampMaxNumElements(1, s64, 2)
1244 .clampMaxNumElements(1, s32, 4)
1245 .clampMaxNumElements(1, s16, 8)
1246 .clampMaxNumElements(1, s8, 16)
1247 .clampMaxNumElements(1, p0, 2)
1250 getActionDefinitionsBuilder(G_INSERT_VECTOR_ELT)
1252 typeInSet(0, {v8s8, v16s8, v4s16, v8s16, v2s32, v4s32, v2s64, v2p0}))
1253 .legalFor(HasSVE, {{nxv16s8, s32, s64},
1254 {nxv8s16, s32, s64},
1255 {nxv4s32, s32, s64},
1256 {nxv2s64, s64, s64}})
1258 .widenVectorEltsToVectorMinSize(0, 64)
1259 .clampNumElements(0, v8s8, v16s8)
1260 .clampNumElements(0, v4s16, v8s16)
1261 .clampNumElements(0, v2s32, v4s32)
1262 .clampMaxNumElements(0, s64, 2)
1263 .clampMaxNumElements(0, p0, 2)
1266 getActionDefinitionsBuilder(G_BUILD_VECTOR)
1267 .legalFor({{v8s8, s8},
1275 .clampNumElements(0, v4s32, v4s32)
1276 .clampNumElements(0, v2s64, v2s64)
1277 .minScalarOrElt(0, s8)
1278 .widenVectorEltsToVectorMinSize(0, 64)
1279 .widenScalarOrEltToNextPow2(0)
1280 .minScalarSameAs(1, 0);
1282 getActionDefinitionsBuilder(G_BUILD_VECTOR_TRUNC).lower();
1284 getActionDefinitionsBuilder(G_SHUFFLE_VECTOR)
1293 {v8s8, v16s8, v4s16, v8s16, v2s32, v4s32, v2s64}, DstTy);
1297 return Query.
Types[0].getNumElements() >
1298 Query.
Types[1].getNumElements();
1304 return Query.
Types[0].getNumElements() <
1305 Query.
Types[1].getNumElements();
1308 .widenScalarOrEltToNextPow2OrMinSize(0, 8)
1309 .clampNumElements(0, v8s8, v16s8)
1310 .clampNumElements(0, v4s16, v8s16)
1311 .clampNumElements(0, v4s32, v4s32)
1312 .clampNumElements(0, v2s64, v2s64)
1321 getActionDefinitionsBuilder(G_CONCAT_VECTORS)
1322 .legalFor({{v16s8, v8s8}, {v8s16, v4s16}, {v4s32, v2s32}})
1324 return Query.
Types[0].isFixedVector() &&
1325 Query.
Types[0].getScalarSizeInBits() < 8;
1329 return Query.
Types[0].isFixedVector() &&
1330 Query.
Types[1].isFixedVector() &&
1331 Query.
Types[0].getScalarSizeInBits() >= 8 &&
1333 Query.
Types[0].getSizeInBits() <= 128 &&
1334 Query.
Types[1].getSizeInBits() <= 64;
1346 getActionDefinitionsBuilder(G_EXTRACT_SUBVECTOR)
1347 .legalFor({{v8s8, v16s8}, {v4s16, v8s16}, {v2s32, v4s32}})
1352 getActionDefinitionsBuilder(G_SPLAT_VECTOR)
1353 .legalFor(HasSVE, {{nxv4s32, s32}, {nxv2s64, s64}});
1355 getActionDefinitionsBuilder(G_JUMP_TABLE).legalFor({p0});
1357 getActionDefinitionsBuilder(G_BRJT).legalFor({{p0, s64}});
1359 getActionDefinitionsBuilder({G_TRAP, G_DEBUGTRAP, G_UBSANTRAP}).alwaysLegal();
1361 getActionDefinitionsBuilder(G_DYN_STACKALLOC).custom();
1363 getActionDefinitionsBuilder({G_STACKSAVE, G_STACKRESTORE}).lower();
1368 getActionDefinitionsBuilder(G_BZERO).unsupported();
1370 getActionDefinitionsBuilder(G_MEMSET)
1371 .legalForCartesianProduct({p0}, {s64}, {s64})
1372 .customForCartesianProduct({p0}, {s8}, {s64})
1375 getActionDefinitionsBuilder({G_MEMCPY, G_MEMMOVE})
1376 .legalForCartesianProduct({p0}, {p0}, {s64})
1380 getActionDefinitionsBuilder(G_MEMCPY_INLINE)
1381 .legalForCartesianProduct({p0}, {p0}, {s64});
1384 getActionDefinitionsBuilder({G_BZERO, G_MEMCPY, G_MEMMOVE, G_MEMSET})
1391 getActionDefinitionsBuilder(G_VECREDUCE_FADD)
1392 .legalFor({{f32, v2f32}, {f32, v4f32}, {f64, v2f64}})
1393 .legalFor(HasFP16, {{f16, v4f16}, {f16, v8f16}})
1394 .minScalarOrElt(0, MinFPScalar)
1395 .clampMaxNumElements(1, s64, 2)
1396 .clampMaxNumElements(1, s32, 4)
1397 .clampMaxNumElements(1, s16, 8)
1398 .moreElementsToNextPow2(1)
1405 getActionDefinitionsBuilder(G_VECREDUCE_FMUL)
1406 .minScalarOrElt(0, MinFPScalar)
1407 .clampMaxNumElements(1, s64, 2)
1408 .clampMaxNumElements(1, s32, 4)
1409 .clampMaxNumElements(1, s16, 8)
1410 .clampMaxNumElements(1, s32, 2)
1411 .clampMaxNumElements(1, s16, 4)
1415 getActionDefinitionsBuilder({G_VECREDUCE_SEQ_FADD, G_VECREDUCE_SEQ_FMUL})
1419 getActionDefinitionsBuilder(G_VECREDUCE_ADD)
1420 .legalFor({{i8, v8i8},
1428 .clampMaxNumElements(1, s64, 2)
1429 .clampMaxNumElements(1, s32, 4)
1430 .clampMaxNumElements(1, s16, 8)
1431 .clampMaxNumElements(1, s8, 16)
1432 .widenVectorEltsToVectorMinSize(1, 64)
1435 getActionDefinitionsBuilder({G_VECREDUCE_FMIN, G_VECREDUCE_FMAX,
1436 G_VECREDUCE_FMINIMUM, G_VECREDUCE_FMAXIMUM})
1437 .legalFor({{f32, v2f32}, {f32, v4f32}, {f64, v2f64}})
1438 .legalFor(HasFP16, {{f16, v4f16}, {f16, v8f16}})
1439 .minScalarOrElt(0, MinFPScalar)
1440 .clampMaxNumElements(1, s64, 2)
1441 .clampMaxNumElements(1, s32, 4)
1442 .clampMaxNumElements(1, s16, 8)
1446 getActionDefinitionsBuilder(G_VECREDUCE_MUL)
1447 .clampMaxNumElements(1, s32, 2)
1448 .clampMaxNumElements(1, s16, 4)
1449 .clampMaxNumElements(1, s8, 8)
1453 getActionDefinitionsBuilder(
1454 {G_VECREDUCE_SMIN, G_VECREDUCE_SMAX, G_VECREDUCE_UMIN, G_VECREDUCE_UMAX})
1455 .legalFor({{i8, v8i8},
1463 return Query.
Types[1].isVector() &&
1464 Query.
Types[1].getElementType() != s8 &&
1465 Query.
Types[1].getNumElements() & 1;
1468 .clampMaxNumElements(1, s64, 2)
1469 .clampMaxNumElements(1, s32, 4)
1470 .clampMaxNumElements(1, s16, 8)
1471 .clampMaxNumElements(1, s8, 16)
1475 getActionDefinitionsBuilder(
1476 {G_VECREDUCE_OR, G_VECREDUCE_AND, G_VECREDUCE_XOR})
1492 return std::make_pair(1, SrcTy.
divide(2));
1498 getActionDefinitionsBuilder(G_VECTOR_COMPRESS).lower();
1501 getActionDefinitionsBuilder({G_GET_FPENV, G_SET_FPENV, G_RESET_FPENV,
1502 G_GET_FPMODE, G_SET_FPMODE, G_RESET_FPMODE})
1505 getActionDefinitionsBuilder(G_IS_FPCLASS).lower();
1507 getActionDefinitionsBuilder(G_PREFETCH).custom();
1509 getActionDefinitionsBuilder({G_SCMP, G_UCMP}).lower();
1511 getActionDefinitionsBuilder({G_INTRINSIC, G_INTRINSIC_W_SIDE_EFFECTS})
1513 getActionDefinitionsBuilder(G_FENCE).alwaysLegal();
1514 getActionDefinitionsBuilder(G_INVOKE_REGION_START).alwaysLegal();
1516 getLegacyLegalizerInfo().computeTables();
1762 auto LowerUnaryOp = [&
MI, &MIB](
unsigned Opcode) {
1764 MI.eraseFromParent();
1767 auto LowerBinOp = [&
MI, &MIB](
unsigned Opcode) {
1769 {
MI.getOperand(2),
MI.getOperand(3)});
1770 MI.eraseFromParent();
1773 auto LowerTriOp = [&
MI, &MIB](
unsigned Opcode) {
1775 {
MI.getOperand(2),
MI.getOperand(3),
MI.getOperand(4)});
1776 MI.eraseFromParent();
1781 switch (IntrinsicID) {
1782 case Intrinsic::vacopy: {
1783 unsigned PtrSize = ST->isTargetILP32() ? 4 : 8;
1784 unsigned VaListSize =
1785 (ST->isTargetDarwin() || ST->isTargetWindows())
1787 : ST->isTargetILP32() ? 20 : 32;
1795 VaListSize,
Align(PtrSize)));
1799 VaListSize,
Align(PtrSize)));
1800 MI.eraseFromParent();
1803 case Intrinsic::get_dynamic_area_offset: {
1805 MI.eraseFromParent();
1808 case Intrinsic::aarch64_mops_memset_tag: {
1809 assert(
MI.getOpcode() == TargetOpcode::G_INTRINSIC_W_SIDE_EFFECTS);
1812 auto &
Value =
MI.getOperand(3);
1814 Value.setReg(ExtValueReg);
1817 case Intrinsic::aarch64_prefetch: {
1818 auto &AddrVal =
MI.getOperand(1);
1820 int64_t IsWrite =
MI.getOperand(2).getImm();
1821 int64_t
Target =
MI.getOperand(3).getImm();
1822 int64_t IsStream =
MI.getOperand(4).getImm();
1823 int64_t IsData =
MI.getOperand(5).getImm();
1825 unsigned PrfOp = (IsWrite << 4) |
1831 MI.eraseFromParent();
1834 case Intrinsic::aarch64_range_prefetch: {
1835 auto &AddrVal =
MI.getOperand(1);
1837 int64_t IsWrite =
MI.getOperand(2).getImm();
1838 int64_t IsStream =
MI.getOperand(3).getImm();
1839 unsigned PrfOp = (IsStream << 2) | IsWrite;
1841 MIB.
buildInstr(AArch64::G_AARCH64_RANGE_PREFETCH)
1844 .
addUse(
MI.getOperand(4).getReg());
1845 MI.eraseFromParent();
1848 case Intrinsic::aarch64_prefetch_ir: {
1849 auto &AddrVal =
MI.getOperand(1);
1851 MI.eraseFromParent();
1854 case Intrinsic::aarch64_neon_uaddv:
1855 case Intrinsic::aarch64_neon_saddv:
1856 case Intrinsic::aarch64_neon_umaxv:
1857 case Intrinsic::aarch64_neon_smaxv:
1858 case Intrinsic::aarch64_neon_uminv:
1859 case Intrinsic::aarch64_neon_sminv: {
1860 bool IsSigned = IntrinsicID == Intrinsic::aarch64_neon_saddv ||
1861 IntrinsicID == Intrinsic::aarch64_neon_smaxv ||
1862 IntrinsicID == Intrinsic::aarch64_neon_sminv;
1864 auto OldDst =
MI.getOperand(0).getReg();
1865 auto OldDstTy = MRI.
getType(OldDst);
1867 if (OldDstTy == NewDstTy)
1873 MI.getOperand(0).setReg(NewDst);
1877 MIB.
buildExtOrTrunc(IsSigned ? TargetOpcode::G_SEXT : TargetOpcode::G_ZEXT,
1882 case Intrinsic::aarch64_neon_uaddlp:
1883 case Intrinsic::aarch64_neon_saddlp: {
1884 unsigned Opc = IntrinsicID == Intrinsic::aarch64_neon_uaddlp
1886 : AArch64::G_SADDLP;
1888 MI.eraseFromParent();
1892 case Intrinsic::aarch64_neon_uaddlv:
1893 case Intrinsic::aarch64_neon_saddlv: {
1894 unsigned Opc = IntrinsicID == Intrinsic::aarch64_neon_uaddlv
1896 : AArch64::G_SADDLV;
1923 MI.eraseFromParent();
1927 case Intrinsic::aarch64_neon_smax:
1928 return LowerBinOp(TargetOpcode::G_SMAX);
1929 case Intrinsic::aarch64_neon_smin:
1930 return LowerBinOp(TargetOpcode::G_SMIN);
1931 case Intrinsic::aarch64_neon_umax:
1932 return LowerBinOp(TargetOpcode::G_UMAX);
1933 case Intrinsic::aarch64_neon_umin:
1934 return LowerBinOp(TargetOpcode::G_UMIN);
1935 case Intrinsic::aarch64_neon_fmax:
1936 return LowerBinOp(TargetOpcode::G_FMAXIMUM);
1937 case Intrinsic::aarch64_neon_fmin:
1938 return LowerBinOp(TargetOpcode::G_FMINIMUM);
1939 case Intrinsic::aarch64_neon_fmaxnm:
1940 return LowerBinOp(TargetOpcode::G_FMAXNUM);
1941 case Intrinsic::aarch64_neon_fminnm:
1942 return LowerBinOp(TargetOpcode::G_FMINNUM);
1943 case Intrinsic::aarch64_neon_pmull:
1944 case Intrinsic::aarch64_neon_pmull64:
1945 return LowerBinOp(AArch64::G_PMULL);
1946 case Intrinsic::aarch64_neon_smull:
1947 return LowerBinOp(AArch64::G_SMULL);
1948 case Intrinsic::aarch64_neon_umull:
1949 return LowerBinOp(AArch64::G_UMULL);
1950 case Intrinsic::aarch64_neon_sabd:
1951 return LowerBinOp(TargetOpcode::G_ABDS);
1952 case Intrinsic::aarch64_neon_uabd:
1953 return LowerBinOp(TargetOpcode::G_ABDU);
1954 case Intrinsic::aarch64_neon_uhadd:
1955 return LowerBinOp(TargetOpcode::G_UAVGFLOOR);
1956 case Intrinsic::aarch64_neon_urhadd:
1957 return LowerBinOp(TargetOpcode::G_UAVGCEIL);
1958 case Intrinsic::aarch64_neon_shadd:
1959 return LowerBinOp(TargetOpcode::G_SAVGFLOOR);
1960 case Intrinsic::aarch64_neon_srhadd:
1961 return LowerBinOp(TargetOpcode::G_SAVGCEIL);
1962 case Intrinsic::aarch64_neon_sqshrn: {
1967 {MRI.
getType(
MI.getOperand(2).getReg())},
1968 {
MI.getOperand(2),
MI.getOperand(3).getImm()});
1970 MIB.
buildInstr(TargetOpcode::G_TRUNC_SSAT_S, {
MI.getOperand(0)}, {Shr});
1971 MI.eraseFromParent();
1974 case Intrinsic::aarch64_neon_sqshrun: {
1979 {MRI.
getType(
MI.getOperand(2).getReg())},
1980 {
MI.getOperand(2),
MI.getOperand(3).getImm()});
1982 MIB.
buildInstr(TargetOpcode::G_TRUNC_SSAT_U, {
MI.getOperand(0)}, {Shr});
1983 MI.eraseFromParent();
1986 case Intrinsic::aarch64_neon_sqrshrn: {
1990 auto Shr = MIB.
buildInstr(AArch64::G_SRSHR_I,
1991 {MRI.
getType(
MI.getOperand(2).getReg())},
1992 {
MI.getOperand(2),
MI.getOperand(3).getImm()});
1994 MIB.
buildInstr(TargetOpcode::G_TRUNC_SSAT_S, {
MI.getOperand(0)}, {Shr});
1995 MI.eraseFromParent();
1998 case Intrinsic::aarch64_neon_sqrshrun: {
2002 auto Shr = MIB.
buildInstr(AArch64::G_SRSHR_I,
2003 {MRI.
getType(
MI.getOperand(2).getReg())},
2004 {
MI.getOperand(2),
MI.getOperand(3).getImm()});
2006 MIB.
buildInstr(TargetOpcode::G_TRUNC_SSAT_U, {
MI.getOperand(0)}, {Shr});
2007 MI.eraseFromParent();
2010 case Intrinsic::aarch64_neon_uqrshrn: {
2014 auto Shr = MIB.
buildInstr(AArch64::G_URSHR_I,
2015 {MRI.
getType(
MI.getOperand(2).getReg())},
2016 {
MI.getOperand(2),
MI.getOperand(3).getImm()});
2018 MIB.
buildInstr(TargetOpcode::G_TRUNC_USAT_U, {
MI.getOperand(0)}, {Shr});
2019 MI.eraseFromParent();
2022 case Intrinsic::aarch64_neon_uqshrn: {
2027 {MRI.
getType(
MI.getOperand(2).getReg())},
2028 {
MI.getOperand(2),
MI.getOperand(3).getImm()});
2030 MIB.
buildInstr(TargetOpcode::G_TRUNC_USAT_U, {
MI.getOperand(0)}, {Shr});
2031 MI.eraseFromParent();
2034 case Intrinsic::aarch64_neon_sqshlu: {
2040 MIB.
buildInstr(AArch64::G_SQSHLU_I, {
MI.getOperand(0)},
2042 .addImm(ShiftAmount->getSExtValue());
2043 MI.eraseFromParent();
2048 case Intrinsic::aarch64_neon_vsli: {
2050 AArch64::G_SLI, {
MI.getOperand(0)},
2051 {
MI.getOperand(2),
MI.getOperand(3),
MI.getOperand(4).getImm()});
2052 MI.eraseFromParent();
2055 case Intrinsic::aarch64_neon_vsri: {
2057 AArch64::G_SRI, {
MI.getOperand(0)},
2058 {
MI.getOperand(2),
MI.getOperand(3),
MI.getOperand(4).getImm()});
2059 MI.eraseFromParent();
2062 case Intrinsic::aarch64_neon_abs: {
2064 MIB.
buildInstr(TargetOpcode::G_ABS, {
MI.getOperand(0)}, {
MI.getOperand(2)});
2065 MI.eraseFromParent();
2068 case Intrinsic::aarch64_neon_sqadd: {
2070 return LowerBinOp(TargetOpcode::G_SADDSAT);
2073 case Intrinsic::aarch64_neon_sqsub: {
2075 return LowerBinOp(TargetOpcode::G_SSUBSAT);
2078 case Intrinsic::aarch64_neon_uqadd: {
2080 return LowerBinOp(TargetOpcode::G_UADDSAT);
2083 case Intrinsic::aarch64_neon_uqsub: {
2085 return LowerBinOp(TargetOpcode::G_USUBSAT);
2088 case Intrinsic::aarch64_neon_udot:
2089 return LowerTriOp(AArch64::G_UDOT);
2090 case Intrinsic::aarch64_neon_sdot:
2091 return LowerTriOp(AArch64::G_SDOT);
2092 case Intrinsic::aarch64_neon_usdot:
2093 return LowerTriOp(AArch64::G_USDOT);
2094 case Intrinsic::aarch64_neon_sqxtn:
2095 return LowerUnaryOp(TargetOpcode::G_TRUNC_SSAT_S);
2096 case Intrinsic::aarch64_neon_sqxtun:
2097 return LowerUnaryOp(TargetOpcode::G_TRUNC_SSAT_U);
2098 case Intrinsic::aarch64_neon_uqxtn:
2099 return LowerUnaryOp(TargetOpcode::G_TRUNC_USAT_U);
2100 case Intrinsic::aarch64_neon_fcvtzu:
2101 return LowerUnaryOp(TargetOpcode::G_FPTOUI_SAT);
2102 case Intrinsic::aarch64_neon_fcvtzs:
2103 return LowerUnaryOp(TargetOpcode::G_FPTOSI_SAT);
2105 case Intrinsic::vector_reverse: