42#define DEBUG_TYPE "gisel-known-bits"
50 "Analysis for ComputingKnownBits",
false,
true)
53 : MF(MF), MRI(MF.getRegInfo()), TL(*MF.getSubtarget().getTargetLowering()),
58 switch (
MI->getOpcode()) {
59 case TargetOpcode::COPY:
61 case TargetOpcode::G_ASSERT_ALIGN: {
63 return Align(
MI->getOperand(2).getImm());
65 case TargetOpcode::G_FRAME_INDEX: {
66 int FrameIdx =
MI->getOperand(1).getIndex();
67 return MF.getFrameInfo().getObjectAlign(FrameIdx);
69 case TargetOpcode::G_INTRINSIC:
70 case TargetOpcode::G_INTRINSIC_W_SIDE_EFFECTS:
71 case TargetOpcode::G_INTRINSIC_CONVERGENT:
72 case TargetOpcode::G_INTRINSIC_CONVERGENT_W_SIDE_EFFECTS:
74 return TL.computeKnownAlignForTargetInstr(*
this, R, MRI,
Depth + 1);
79 assert(
MI.getNumExplicitDefs() == 1 &&
80 "expected single return generic instruction");
85 const LLT Ty = MRI.getType(R);
95 const APInt &DemandedElts,
103 LLT Ty = MRI.getType(R);
104 unsigned BitWidth = Ty.getScalarSizeInBits();
116[[maybe_unused]]
static void
119 <<
"] Computed for: " <<
MI <<
"[" <<
Depth <<
"] Known: 0x"
130 const APInt &DemandedElts,
161 const APInt &DemandedElts,
164 unsigned Opcode =
MI.getOpcode();
165 LLT DstTy = MRI.getType(R);
179 "DemandedElt width should equal the fixed vector number of elements");
182 "DemandedElt width should be 1 for scalars or scalable vectors");
207 TL.computeKnownBitsForTargetInstr(*
this, R, Known, DemandedElts, MRI,
210 case TargetOpcode::G_BUILD_VECTOR: {
215 if (!DemandedElts[
I])
229 case TargetOpcode::G_SPLAT_VECTOR: {
237 case TargetOpcode::COPY:
238 case TargetOpcode::G_PHI:
239 case TargetOpcode::PHI: {
245 assert(
MI.getOperand(0).getSubReg() == 0 &&
"Is this code in SSA?");
248 for (
unsigned Idx = 1; Idx <
MI.getNumOperands(); Idx += 2) {
251 LLT SrcTy = MRI.getType(SrcReg);
259 if (SrcReg.
isVirtual() && Src.getSubReg() == 0 &&
261 APInt NowDemandedElts;
262 if (!SrcTy.isFixedVector()) {
263 NowDemandedElts =
APInt(1, 1);
266 NowDemandedElts = DemandedElts;
273 Depth + (Opcode != TargetOpcode::COPY));
288 case TargetOpcode::G_STEP_VECTOR: {
289 APInt Step =
MI.getOperand(1).getCImm()->getValue();
297 const APInt MinNumElts =
303 .
umul_ov(MinNumElts, Overflow);
306 const APInt MaxValue = (MaxNumElts - 1).
umul_ov(Step, Overflow);
312 case TargetOpcode::G_CONSTANT: {
316 case TargetOpcode::G_FRAME_INDEX: {
317 int FrameIdx =
MI.getOperand(1).getIndex();
318 TL.computeKnownBitsForFrameIndex(FrameIdx, Known, MF);
321 case TargetOpcode::G_SUB: {
330 case TargetOpcode::G_XOR: {
339 case TargetOpcode::G_PTR_ADD: {
343 LLT Ty = MRI.getType(
MI.getOperand(1).getReg());
344 if (DL.isNonIntegralAddressSpace(Ty.getAddressSpace()))
348 case TargetOpcode::G_ADD: {
356 case TargetOpcode::G_AND: {
366 case TargetOpcode::G_OR: {
376 case TargetOpcode::G_MUL: {
384 case TargetOpcode::G_UMULH: {
392 case TargetOpcode::G_SMULH: {
400 case TargetOpcode::G_ABDU: {
408 case TargetOpcode::G_ABDS: {
417 if (SignBits1 == 1) {
426 case TargetOpcode::G_UDIV: {
435 case TargetOpcode::G_SDIV: {
444 case TargetOpcode::G_UREM: {
456 case TargetOpcode::G_SREM: {
468 case TargetOpcode::G_SELECT: {
469 computeKnownBitsMin(
MI.getOperand(2).getReg(),
MI.getOperand(3).getReg(),
470 Known, DemandedElts,
Depth + 1);
473 case TargetOpcode::G_SMIN: {
483 case TargetOpcode::G_SMAX: {
493 case TargetOpcode::G_UMIN: {
502 case TargetOpcode::G_UMAX: {
511 case TargetOpcode::G_FCMP:
512 case TargetOpcode::G_ICMP: {
515 if (TL.getBooleanContents(DstTy.
isVector(),
516 Opcode == TargetOpcode::G_FCMP) ==
522 case TargetOpcode::G_SEXT: {
530 case TargetOpcode::G_ASSERT_SEXT:
531 case TargetOpcode::G_SEXT_INREG: {
534 Known = Known.
sextInReg(
MI.getOperand(2).getImm());
537 case TargetOpcode::G_ANYEXT: {
543 case TargetOpcode::G_LOAD: {
551 case TargetOpcode::G_SEXTLOAD:
552 case TargetOpcode::G_ZEXTLOAD: {
559 Known = Opcode == TargetOpcode::G_SEXTLOAD
564 case TargetOpcode::G_ASHR: {
573 case TargetOpcode::G_LSHR: {
582 case TargetOpcode::G_SHL: {
591 case TargetOpcode::G_ROTL:
592 case TargetOpcode::G_ROTR: {
593 MachineInstr *AmtOpMI = MRI.getVRegDef(
MI.getOperand(2).getReg());
601 unsigned Amt = MaybeAmtOp->urem(
BitWidth);
604 if (Opcode == TargetOpcode::G_ROTL)
611 case TargetOpcode::G_FSHL:
612 case TargetOpcode::G_FSHR: {
613 MachineInstr *AmtOpMI = MRI.getVRegDef(
MI.getOperand(3).getReg());
618 const APInt Amt = *MaybeAmtOp;
623 Known = Opcode == TargetOpcode::G_FSHL
628 case TargetOpcode::G_INTTOPTR:
629 case TargetOpcode::G_PTRTOINT:
634 case TargetOpcode::G_ZEXT:
635 case TargetOpcode::G_TRUNC: {
641 case TargetOpcode::G_ASSERT_ZEXT: {
645 unsigned SrcBitWidth =
MI.getOperand(2).getImm();
646 assert(SrcBitWidth &&
"SrcBitWidth can't be zero");
648 Known.
Zero |= (~InMask);
649 Known.
One &= (~Known.Zero);
652 case TargetOpcode::G_ASSERT_ALIGN: {
653 int64_t LogOfAlign =
Log2_64(
MI.getOperand(2).getImm());
662 case TargetOpcode::G_MERGE_VALUES: {
663 unsigned NumOps =
MI.getNumOperands();
664 unsigned OpSize = MRI.getType(
MI.getOperand(1).getReg()).getSizeInBits();
666 for (
unsigned I = 0;
I !=
NumOps - 1; ++
I) {
669 DemandedElts,
Depth + 1);
674 case TargetOpcode::G_UNMERGE_VALUES: {
675 unsigned NumOps =
MI.getNumOperands();
677 LLT SrcTy = MRI.getType(SrcReg);
679 if (SrcTy.isVector() && SrcTy.getScalarType() != DstTy.
getScalarType())
684 for (; DstIdx !=
NumOps - 1 &&
MI.getOperand(DstIdx).
getReg() != R;
688 APInt SubDemandedElts = DemandedElts;
689 if (SrcTy.isVector()) {
692 DemandedElts.
zext(SrcTy.getNumElements()).
shl(DstIdx * DstLanes);
698 if (SrcTy.isVector())
699 Known = std::move(SrcOpKnown);
704 case TargetOpcode::G_BSWAP: {
710 case TargetOpcode::G_BITREVERSE: {
716 case TargetOpcode::G_CTPOP: {
728 case TargetOpcode::G_UBFX: {
729 KnownBits SrcOpKnown, OffsetKnown, WidthKnown;
739 case TargetOpcode::G_SBFX: {
740 KnownBits SrcOpKnown, OffsetKnown, WidthKnown;
757 case TargetOpcode::G_UADDO:
758 case TargetOpcode::G_UADDE:
759 case TargetOpcode::G_SADDO:
760 case TargetOpcode::G_SADDE: {
761 if (
MI.getOperand(1).getReg() == R) {
764 if (TL.getBooleanContents(DstTy.
isVector(),
false) ==
771 assert(
MI.getOperand(0).getReg() == R &&
772 "We only compute knownbits for the sum here.");
775 if (Opcode == TargetOpcode::G_UADDE || Opcode == TargetOpcode::G_SADDE) {
779 Carry = Carry.
trunc(1);
791 case TargetOpcode::G_USUBO:
792 case TargetOpcode::G_USUBE:
793 case TargetOpcode::G_SSUBO:
794 case TargetOpcode::G_SSUBE:
795 case TargetOpcode::G_UMULO:
796 case TargetOpcode::G_SMULO: {
797 if (
MI.getOperand(1).getReg() == R) {
800 if (TL.getBooleanContents(DstTy.
isVector(),
false) ==
807 case TargetOpcode::G_CTTZ:
808 case TargetOpcode::G_CTTZ_ZERO_POISON: {
818 case TargetOpcode::G_CTLZ:
819 case TargetOpcode::G_CTLZ_ZERO_POISON: {
829 case TargetOpcode::G_CTLS: {
833 unsigned MaxUpperRedundantSignBits = MRI.getType(Reg).getScalarSizeInBits();
838 Known =
Range.toKnownBits();
841 case TargetOpcode::G_EXTRACT_VECTOR_ELT: {
848 LLT VecVT = MRI.getType(InVec);
866 if (ConstEltNo && ConstEltNo->ult(NumSrcElts))
873 case TargetOpcode::G_SHUFFLE_VECTOR: {
874 APInt DemandedLHS, DemandedRHS;
877 unsigned NumElts = MRI.getType(
MI.getOperand(1).getReg()).getNumElements();
879 DemandedElts, DemandedLHS, DemandedRHS))
900 case TargetOpcode::G_CONCAT_VECTORS: {
901 if (MRI.getType(
MI.getOperand(0).getReg()).isScalableVector())
906 unsigned NumSubVectorElts =
907 MRI.getType(
MI.getOperand(1).getReg()).getNumElements();
911 DemandedElts.
extractBits(NumSubVectorElts,
I * NumSubVectorElts);
923 case TargetOpcode::G_ABS: {
954void GISelValueTracking::computeKnownFPClassForFPTrunc(
962 KnownFPClass KnownSrc;
963 computeKnownFPClass(Val, DemandedElts, InterestedClasses, KnownSrc,
968void GISelValueTracking::computeKnownFPClass(
Register R,
969 const APInt &DemandedElts,
973 assert(Known.
isUnknown() &&
"should not be called with known information");
983 MachineInstr &
MI = *MRI.getVRegDef(R);
984 unsigned Opcode =
MI.getOpcode();
985 LLT DstTy = MRI.getType(R);
993 switch (Cst->getKind()) {
995 auto APF = Cst->getScalarValue();
997 Known.
SignBit = APF.isNegative();
1002 bool SignBitAllZero =
true;
1003 bool SignBitAllOne =
true;
1005 for (
auto C : *Cst) {
1008 SignBitAllZero =
false;
1010 SignBitAllOne =
false;
1013 if (SignBitAllOne != SignBitAllZero)
1014 Known.
SignBit = SignBitAllOne;
1029 KnownNotFromFlags |=
fcNan;
1031 KnownNotFromFlags |=
fcInf;
1035 InterestedClasses &= ~KnownNotFromFlags;
1038 [=, &Known] { Known.
knownNot(KnownNotFromFlags); });
1044 const MachineFunction *MF =
MI.getMF();
1048 TL.computeKnownFPClassForTargetInstr(*
this, R, Known, DemandedElts, MRI,
1051 case TargetOpcode::G_FNEG: {
1053 computeKnownFPClass(Val, DemandedElts, InterestedClasses, Known,
Depth + 1);
1057 case TargetOpcode::G_SELECT: {
1080 bool LookThroughFAbsFNeg = CmpLHS !=
LHS && CmpLHS !=
RHS;
1081 std::tie(TestedValue, MaskIfTrue, MaskIfFalse) =
1087 MaskIfTrue = TestedMask;
1088 MaskIfFalse = ~TestedMask;
1091 if (TestedValue ==
LHS) {
1093 FilterLHS = MaskIfTrue;
1094 }
else if (TestedValue ==
RHS) {
1096 FilterRHS = MaskIfFalse;
1099 KnownFPClass Known2;
1100 computeKnownFPClass(
LHS, DemandedElts, InterestedClasses & FilterLHS, Known,
1104 computeKnownFPClass(
RHS, DemandedElts, InterestedClasses & FilterRHS,
1111 case TargetOpcode::G_FCOPYSIGN: {
1112 Register Magnitude =
MI.getOperand(1).getReg();
1115 KnownFPClass KnownSign;
1117 computeKnownFPClass(Magnitude, DemandedElts, InterestedClasses, Known,
1119 computeKnownFPClass(Sign, DemandedElts, InterestedClasses, KnownSign,
1124 case TargetOpcode::G_FMA:
1125 case TargetOpcode::G_STRICT_FMA:
1126 case TargetOpcode::G_FMAD: {
1139 KnownFPClass KnownSrc, KnownAddend;
1140 computeKnownFPClass(
C, DemandedElts, InterestedClasses, KnownAddend,
1142 computeKnownFPClass(
A, DemandedElts, InterestedClasses, KnownSrc,
1144 if (KnownNotFromFlags) {
1145 KnownSrc.
knownNot(KnownNotFromFlags);
1146 KnownAddend.
knownNot(KnownNotFromFlags);
1150 KnownFPClass KnownSrc[3];
1151 computeKnownFPClass(
A, DemandedElts, InterestedClasses, KnownSrc[0],
1153 if (KnownSrc[0].isUnknown())
1155 computeKnownFPClass(
B, DemandedElts, InterestedClasses, KnownSrc[1],
1157 if (KnownSrc[1].isUnknown())
1159 computeKnownFPClass(
C, DemandedElts, InterestedClasses, KnownSrc[2],
1161 if (KnownSrc[2].isUnknown())
1163 if (KnownNotFromFlags) {
1164 KnownSrc[0].
knownNot(KnownNotFromFlags);
1165 KnownSrc[1].
knownNot(KnownNotFromFlags);
1166 KnownSrc[2].
knownNot(KnownNotFromFlags);
1172 case TargetOpcode::G_FSQRT:
1173 case TargetOpcode::G_STRICT_FSQRT: {
1174 KnownFPClass KnownSrc;
1176 if (InterestedClasses &
fcNan)
1180 computeKnownFPClass(Val, DemandedElts, InterestedSrcs, KnownSrc,
Depth + 1);
1189 case TargetOpcode::G_FABS: {
1194 computeKnownFPClass(Val, DemandedElts, InterestedClasses, Known,
1200 case TargetOpcode::G_FATAN2: {
1203 KnownFPClass KnownY, KnownX;
1204 computeKnownFPClass(
Y, DemandedElts, InterestedClasses, KnownY,
Depth + 1);
1205 computeKnownFPClass(
X, DemandedElts, InterestedClasses, KnownX,
Depth + 1);
1209 case TargetOpcode::G_FSINH: {
1211 KnownFPClass KnownSrc;
1212 computeKnownFPClass(Val, DemandedElts, InterestedClasses, KnownSrc,
1217 case TargetOpcode::G_FCOSH: {
1219 KnownFPClass KnownSrc;
1220 computeKnownFPClass(Val, DemandedElts, InterestedClasses, KnownSrc,
1225 case TargetOpcode::G_FTANH: {
1227 KnownFPClass KnownSrc;
1228 computeKnownFPClass(Val, DemandedElts, InterestedClasses, KnownSrc,
1233 case TargetOpcode::G_FASIN: {
1235 KnownFPClass KnownSrc;
1236 computeKnownFPClass(Val, DemandedElts, InterestedClasses, KnownSrc,
1241 case TargetOpcode::G_FACOS: {
1243 KnownFPClass KnownSrc;
1244 computeKnownFPClass(Val, DemandedElts, InterestedClasses, KnownSrc,
1249 case TargetOpcode::G_FATAN: {
1251 KnownFPClass KnownSrc;
1252 computeKnownFPClass(Val, DemandedElts, InterestedClasses, KnownSrc,
1257 case TargetOpcode::G_FTAN: {
1259 KnownFPClass KnownSrc;
1260 computeKnownFPClass(Val, DemandedElts, InterestedClasses, KnownSrc,
1265 case TargetOpcode::G_FSIN:
1266 case TargetOpcode::G_FCOS: {
1269 KnownFPClass KnownSrc;
1270 computeKnownFPClass(Val, DemandedElts, InterestedClasses, KnownSrc,
1273 : KnownFPClass::sin(KnownSrc);
1276 case TargetOpcode::G_FSINCOS: {
1279 KnownFPClass KnownSrc;
1280 computeKnownFPClass(Src, DemandedElts, InterestedClasses, KnownSrc,
1282 if (R ==
MI.getOperand(0).getReg())
1288 case TargetOpcode::G_FMAXNUM:
1289 case TargetOpcode::G_FMINNUM:
1290 case TargetOpcode::G_FMINNUM_IEEE:
1291 case TargetOpcode::G_FMAXIMUM:
1292 case TargetOpcode::G_FMINIMUM:
1293 case TargetOpcode::G_FMAXNUM_IEEE:
1294 case TargetOpcode::G_FMAXIMUMNUM:
1295 case TargetOpcode::G_FMINIMUMNUM: {
1298 KnownFPClass KnownLHS, KnownRHS;
1300 computeKnownFPClass(
LHS, DemandedElts, InterestedClasses, KnownLHS,
1302 computeKnownFPClass(
RHS, DemandedElts, InterestedClasses, KnownRHS,
1307 case TargetOpcode::G_FMINIMUM:
1310 case TargetOpcode::G_FMAXIMUM:
1313 case TargetOpcode::G_FMINIMUMNUM:
1316 case TargetOpcode::G_FMAXIMUMNUM:
1319 case TargetOpcode::G_FMINNUM:
1320 case TargetOpcode::G_FMINNUM_IEEE:
1323 case TargetOpcode::G_FMAXNUM:
1324 case TargetOpcode::G_FMAXNUM_IEEE:
1336 case TargetOpcode::G_FCANONICALIZE: {
1338 KnownFPClass KnownSrc;
1339 computeKnownFPClass(Val, DemandedElts, InterestedClasses, KnownSrc,
1344 DenormalMode DenormMode = MF->getDenormalMode(FPType);
1348 case TargetOpcode::G_VECREDUCE_FMAX:
1349 case TargetOpcode::G_VECREDUCE_FMIN:
1350 case TargetOpcode::G_VECREDUCE_FMAXIMUM:
1351 case TargetOpcode::G_VECREDUCE_FMINIMUM: {
1357 computeKnownFPClass(Val,
MI.getFlags(), InterestedClasses,
Depth + 1);
1363 case TargetOpcode::G_FFLOOR:
1364 case TargetOpcode::G_FCEIL:
1365 case TargetOpcode::G_FRINT:
1366 case TargetOpcode::G_FNEARBYINT:
1367 case TargetOpcode::G_INTRINSIC_FPTRUNC_ROUND:
1368 case TargetOpcode::G_INTRINSIC_ROUND:
1369 case TargetOpcode::G_INTRINSIC_ROUNDEVEN:
1370 case TargetOpcode::G_INTRINSIC_TRUNC: {
1372 KnownFPClass KnownSrc;
1378 computeKnownFPClass(Val, DemandedElts, InterestedSrcs, KnownSrc,
Depth + 1);
1381 bool IsTrunc = Opcode == TargetOpcode::G_INTRINSIC_TRUNC;
1386 case TargetOpcode::G_FEXP:
1387 case TargetOpcode::G_FEXP2:
1388 case TargetOpcode::G_FEXP10: {
1390 KnownFPClass KnownSrc;
1391 computeKnownFPClass(Val, DemandedElts, InterestedClasses, KnownSrc,
1396 case TargetOpcode::G_FLOG:
1397 case TargetOpcode::G_FLOG2:
1398 case TargetOpcode::G_FLOG10: {
1413 KnownFPClass KnownSrc;
1414 computeKnownFPClass(Val, DemandedElts, InterestedSrcs, KnownSrc,
Depth + 1);
1418 DenormalMode
Mode = MF->getDenormalMode(FltSem);
1422 case TargetOpcode::G_FPOWI: {
1427 LLT ExpTy = MRI.getType(Exp);
1429 Exp, ExpTy.
isVector() ? DemandedElts : APInt(1, 1),
Depth + 1);
1432 if (InterestedClasses &
fcNan)
1433 InterestedSrcs |=
fcNan;
1434 if (!ExponentKnownBits.
isZero()) {
1435 if (InterestedClasses &
fcInf)
1441 KnownFPClass KnownSrc;
1442 if (InterestedSrcs !=
fcNone) {
1444 computeKnownFPClass(Val, DemandedElts, InterestedSrcs, KnownSrc,
1451 case TargetOpcode::G_FLDEXP:
1452 case TargetOpcode::G_STRICT_FLDEXP: {
1454 KnownFPClass KnownSrc;
1455 computeKnownFPClass(Val, DemandedElts, InterestedClasses, KnownSrc,
1463 LLT ExpTy = MRI.getType(ExpReg);
1465 ExpReg, ExpTy.
isVector() ? DemandedElts : APInt(1, 1),
Depth + 1);
1470 DenormalMode
Mode = MF->getDenormalMode(Flt);
1474 case TargetOpcode::G_FADD:
1475 case TargetOpcode::G_STRICT_FADD:
1476 case TargetOpcode::G_FSUB:
1477 case TargetOpcode::G_STRICT_FSUB: {
1480 bool IsAdd = (Opcode == TargetOpcode::G_FADD ||
1481 Opcode == TargetOpcode::G_STRICT_FADD);
1485 bool WantNaN = (InterestedClasses &
fcNan) !=
fcNone;
1488 if (!WantNaN && !WantNegative && !WantNegZero) {
1498 if (InterestedClasses &
fcNan)
1499 InterestedSrcs |=
fcInf;
1503 KnownFPClass KnownSelf;
1504 computeKnownFPClass(
LHS, DemandedElts, InterestedSrcs, KnownSelf,
1510 KnownFPClass KnownLHS, KnownRHS;
1511 computeKnownFPClass(
RHS, DemandedElts, InterestedSrcs, KnownRHS,
Depth + 1);
1515 WantNegZero || !IsAdd) {
1518 computeKnownFPClass(
LHS, DemandedElts, InterestedSrcs, KnownLHS,
1528 case TargetOpcode::G_FMUL:
1529 case TargetOpcode::G_STRICT_FMUL: {
1537 KnownFPClass KnownSrc;
1544 KnownFPClass KnownLHS;
1548 KnownFPClass KnownLHS, KnownRHS;
1564 case TargetOpcode::G_FDIV:
1565 case TargetOpcode::G_FREM: {
1569 if (Opcode == TargetOpcode::G_FREM)
1576 if (Opcode == TargetOpcode::G_FDIV) {
1577 const bool WantNan = (InterestedClasses &
fcNan) !=
fcNone;
1583 KnownFPClass KnownSrc;
1584 computeKnownFPClass(
LHS, DemandedElts,
1589 const bool WantNan = (InterestedClasses &
fcNan) !=
fcNone;
1595 KnownFPClass KnownSrc;
1596 computeKnownFPClass(
LHS, DemandedElts,
1604 const bool WantNan = (InterestedClasses &
fcNan) !=
fcNone;
1606 const bool WantPositive = Opcode == TargetOpcode::G_FREM &&
1608 if (!WantNan && !WantNegative && !WantPositive) {
1612 KnownFPClass KnownLHS, KnownRHS;
1615 KnownRHS,
Depth + 1);
1621 if (KnowSomethingUseful || WantPositive) {
1625 if (Opcode == TargetOpcode::G_FDIV) {
1649 case TargetOpcode::G_FFREXP: {
1651 if (R !=
MI.getOperand(0).getReg())
1654 KnownFPClass KnownSrc;
1655 computeKnownFPClass(Src, DemandedElts, InterestedClasses, KnownSrc,
1662 case TargetOpcode::G_FPEXT: {
1664 KnownFPClass KnownSrc;
1665 computeKnownFPClass(Src, DemandedElts, InterestedClasses, KnownSrc,
1670 LLT SrcTy = MRI.getType(Src).getScalarType();
1676 case TargetOpcode::G_FPTRUNC: {
1677 computeKnownFPClassForFPTrunc(
MI, DemandedElts, InterestedClasses, Known,
1681 case TargetOpcode::G_SITOFP:
1682 case TargetOpcode::G_UITOFP: {
1693 if (Opcode == TargetOpcode::G_UITOFP)
1701 LLT Ty = MRI.getType(Val);
1703 Val, Ty.
isVector() ? DemandedElts : APInt(1, 1),
Depth + 1);
1709 if (Opcode == TargetOpcode::G_SITOFP) {
1719 if (InterestedClasses &
fcInf) {
1726 if (Opcode == TargetOpcode::G_UITOFP)
1740 case TargetOpcode::G_BUILD_VECTOR:
1741 case TargetOpcode::G_CONCAT_VECTORS: {
1748 for (
unsigned Idx = 0; Idx <
Merge.getNumSources(); ++Idx) {
1750 bool NeedsElt = DemandedElts[Idx];
1756 computeKnownFPClass(Src, Known, InterestedClasses,
Depth + 1);
1759 KnownFPClass Known2;
1760 computeKnownFPClass(Src, Known2, InterestedClasses,
Depth + 1);
1772 case TargetOpcode::G_EXTRACT_VECTOR_ELT: {
1782 LLT VecTy = MRI.getType(Vec);
1787 if (CIdx && CIdx->ult(NumElts))
1789 return computeKnownFPClass(Vec, DemandedVecElts, InterestedClasses, Known,
1795 case TargetOpcode::G_INSERT_VECTOR_ELT: {
1801 LLT VecTy = MRI.getType(Vec);
1809 APInt DemandedVecElts = DemandedElts;
1810 bool NeedsElt =
true;
1812 if (CIdx && CIdx->ult(NumElts)) {
1813 DemandedVecElts.
clearBit(CIdx->getZExtValue());
1814 NeedsElt = DemandedElts[CIdx->getZExtValue()];
1819 computeKnownFPClass(Elt, Known, InterestedClasses,
Depth + 1);
1828 if (!DemandedVecElts.
isZero()) {
1829 KnownFPClass Known2;
1830 computeKnownFPClass(Vec, DemandedVecElts, InterestedClasses, Known2,
1837 case TargetOpcode::G_SHUFFLE_VECTOR: {
1841 APInt DemandedLHS, DemandedRHS;
1843 assert(DemandedElts == APInt(1, 1));
1844 DemandedLHS = DemandedRHS = DemandedElts;
1846 unsigned NumElts = MRI.getType(Shuf.
getSrc1Reg()).getNumElements();
1848 DemandedLHS, DemandedRHS)) {
1854 if (!!DemandedLHS) {
1856 computeKnownFPClass(
LHS, DemandedLHS, InterestedClasses, Known,
1866 if (!!DemandedRHS) {
1867 KnownFPClass Known2;
1869 computeKnownFPClass(
RHS, DemandedRHS, InterestedClasses, Known2,
1875 case TargetOpcode::G_PHI: {
1884 for (
unsigned Idx = 1; Idx <
MI.getNumOperands(); Idx += 2) {
1885 const MachineOperand &Src =
MI.getOperand(Idx);
1888 computeKnownFPClass(SrcReg, DemandedElts, InterestedClasses, Known,
1892 KnownFPClass Known2;
1893 computeKnownFPClass(SrcReg, DemandedElts, InterestedClasses, Known2,
1902 case TargetOpcode::COPY: {
1905 if (!Src.isVirtual())
1908 computeKnownFPClass(Src, DemandedElts, InterestedClasses, Known,
Depth + 1);
1919 computeKnownFPClass(R, DemandedElts, InterestedClasses, KnownClasses,
Depth);
1920 return KnownClasses;
1926 computeKnownFPClass(R, Known, InterestedClasses,
Depth);
1934 InterestedClasses &=
~fcNan;
1936 InterestedClasses &=
~fcInf;
1939 computeKnownFPClass(R, DemandedElts, InterestedClasses,
Depth);
1942 Result.KnownFPClasses &=
~fcNan;
1944 Result.KnownFPClasses &=
~fcInf;
1950 LLT Ty = MRI.getType(R);
1951 APInt DemandedElts =
1953 return computeKnownFPClass(R, DemandedElts, Flags, InterestedClasses,
Depth);
1968 switch (
DefMI->getOpcode()) {
1971 case TargetOpcode::G_FADD:
1972 case TargetOpcode::G_STRICT_FADD:
1973 case TargetOpcode::G_FSUB:
1974 case TargetOpcode::G_STRICT_FSUB:
1975 case TargetOpcode::G_FMUL:
1976 case TargetOpcode::G_STRICT_FMUL:
1977 case TargetOpcode::G_FDIV:
1978 case TargetOpcode::G_FREM:
1979 case TargetOpcode::G_FMA:
1980 case TargetOpcode::G_STRICT_FMA:
1981 case TargetOpcode::G_FMAD:
1982 case TargetOpcode::G_FSQRT:
1983 case TargetOpcode::G_STRICT_FSQRT:
1987 case TargetOpcode::G_FSIN:
1988 case TargetOpcode::G_FCOS:
1989 case TargetOpcode::G_FSINCOS:
1990 case TargetOpcode::G_FTAN:
1991 case TargetOpcode::G_FASIN:
1992 case TargetOpcode::G_FACOS:
1993 case TargetOpcode::G_FATAN:
1994 case TargetOpcode::G_FATAN2:
1995 case TargetOpcode::G_FSINH:
1996 case TargetOpcode::G_FCOSH:
1997 case TargetOpcode::G_FTANH:
1998 case TargetOpcode::G_FEXP:
1999 case TargetOpcode::G_FEXP2:
2000 case TargetOpcode::G_FEXP10:
2001 case TargetOpcode::G_FLOG:
2002 case TargetOpcode::G_FLOG2:
2003 case TargetOpcode::G_FLOG10:
2004 case TargetOpcode::G_FPOWI:
2005 case TargetOpcode::G_FLDEXP:
2006 case TargetOpcode::G_STRICT_FLDEXP:
2007 case TargetOpcode::G_FFREXP:
2008 case TargetOpcode::G_INTRINSIC_TRUNC:
2009 case TargetOpcode::G_INTRINSIC_ROUND:
2010 case TargetOpcode::G_INTRINSIC_ROUNDEVEN:
2011 case TargetOpcode::G_FFLOOR:
2012 case TargetOpcode::G_FCEIL:
2013 case TargetOpcode::G_FRINT:
2014 case TargetOpcode::G_FNEARBYINT:
2015 case TargetOpcode::G_FPEXT:
2016 case TargetOpcode::G_FPTRUNC:
2017 case TargetOpcode::G_FCANONICALIZE:
2018 case TargetOpcode::G_FMINNUM:
2019 case TargetOpcode::G_FMAXNUM:
2020 case TargetOpcode::G_FMINNUM_IEEE:
2021 case TargetOpcode::G_FMAXNUM_IEEE:
2022 case TargetOpcode::G_FMINIMUM:
2023 case TargetOpcode::G_FMAXIMUM:
2024 case TargetOpcode::G_FMINIMUMNUM:
2025 case TargetOpcode::G_FMAXIMUMNUM:
2039unsigned GISelValueTracking::computeNumSignBitsMin(
Register Src0,
Register Src1,
2040 const APInt &DemandedElts,
2044 if (Src1SignBits == 1)
2061 case TargetOpcode::G_SEXTLOAD:
2064 case TargetOpcode::G_ZEXTLOAD:
2077 const APInt &DemandedElts,
2080 unsigned Opcode =
MI.getOpcode();
2082 if (Opcode == TargetOpcode::G_CONSTANT)
2083 return MI.getOperand(1).getCImm()->getValue().getNumSignBits();
2091 LLT DstTy = MRI.getType(R);
2101 unsigned FirstAnswer = 1;
2103 case TargetOpcode::COPY: {
2105 if (Src.getReg().isVirtual() && Src.getSubReg() == 0 &&
2106 MRI.getType(Src.getReg()).isValid()) {
2113 case TargetOpcode::G_SEXT: {
2115 LLT SrcTy = MRI.getType(Src);
2119 case TargetOpcode::G_ASSERT_SEXT:
2120 case TargetOpcode::G_SEXT_INREG: {
2123 unsigned SrcBits =
MI.getOperand(2).getImm();
2124 unsigned InRegBits = TyBits - SrcBits + 1;
2128 case TargetOpcode::G_LOAD: {
2135 case TargetOpcode::G_SEXTLOAD: {
2150 case TargetOpcode::G_ZEXTLOAD: {
2165 case TargetOpcode::G_AND:
2166 case TargetOpcode::G_OR:
2167 case TargetOpcode::G_XOR: {
2169 unsigned Src1NumSignBits =
2171 if (Src1NumSignBits != 1) {
2173 unsigned Src2NumSignBits =
2175 FirstAnswer = std::min(Src1NumSignBits, Src2NumSignBits);
2179 case TargetOpcode::G_ASHR: {
2184 FirstAnswer = std::min<uint64_t>(FirstAnswer + *
C, TyBits);
2187 case TargetOpcode::G_SHL: {
2190 if (std::optional<ConstantRange> ShAmtRange =
2192 uint64_t MaxShAmt = ShAmtRange->getUnsignedMax().getZExtValue();
2193 uint64_t MinShAmt = ShAmtRange->getUnsignedMin().getZExtValue();
2203 if (ExtOpc == TargetOpcode::G_SEXT || ExtOpc == TargetOpcode::G_ZEXT ||
2204 ExtOpc == TargetOpcode::G_ANYEXT) {
2205 LLT ExtTy = MRI.getType(Src1);
2207 LLT ExtendeeTy = MRI.getType(Extendee);
2211 if (SizeDiff <= MinShAmt) {
2215 return Tmp - MaxShAmt;
2221 return Tmp - MaxShAmt;
2225 case TargetOpcode::G_SREM: {
2233 case TargetOpcode::G_TRUNC: {
2235 LLT SrcTy = MRI.getType(Src);
2239 unsigned NumSrcBits = SrcTy.getScalarSizeInBits();
2241 if (NumSrcSignBits > (NumSrcBits - DstTyBits))
2242 return NumSrcSignBits - (NumSrcBits - DstTyBits);
2245 case TargetOpcode::G_SELECT: {
2246 return computeNumSignBitsMin(
MI.getOperand(2).getReg(),
2247 MI.getOperand(3).getReg(), DemandedElts,
2250 case TargetOpcode::G_SMIN:
2251 case TargetOpcode::G_SMAX:
2252 case TargetOpcode::G_UMIN:
2253 case TargetOpcode::G_UMAX:
2255 return computeNumSignBitsMin(
MI.getOperand(1).getReg(),
2256 MI.getOperand(2).getReg(), DemandedElts,
2258 case TargetOpcode::G_SADDO:
2259 case TargetOpcode::G_SADDE:
2260 case TargetOpcode::G_UADDO:
2261 case TargetOpcode::G_UADDE:
2262 case TargetOpcode::G_SSUBO:
2263 case TargetOpcode::G_SSUBE:
2264 case TargetOpcode::G_USUBO:
2265 case TargetOpcode::G_USUBE:
2266 case TargetOpcode::G_SMULO:
2267 case TargetOpcode::G_UMULO: {
2271 if (
MI.getOperand(1).getReg() == R) {
2272 if (TL.getBooleanContents(DstTy.
isVector(),
false) ==
2279 case TargetOpcode::G_SUB: {
2281 unsigned Src2NumSignBits =
2283 if (Src2NumSignBits == 1)
2293 if ((Known2.
Zero | 1).isAllOnes())
2300 FirstAnswer = Src2NumSignBits;
2307 unsigned Src1NumSignBits =
2309 if (Src1NumSignBits == 1)
2314 FirstAnswer = std::min(Src1NumSignBits, Src2NumSignBits) - 1;
2317 case TargetOpcode::G_ADD: {
2319 unsigned Src2NumSignBits =
2321 if (Src2NumSignBits <= 2)
2325 unsigned Src1NumSignBits =
2327 if (Src1NumSignBits == 1)
2336 if ((Known1.
Zero | 1).isAllOnes())
2342 FirstAnswer = Src1NumSignBits;
2351 FirstAnswer = std::min(Src1NumSignBits, Src2NumSignBits) - 1;
2354 case TargetOpcode::G_FCMP:
2355 case TargetOpcode::G_ICMP: {
2356 bool IsFP = Opcode == TargetOpcode::G_FCMP;
2359 auto BC = TL.getBooleanContents(DstTy.
isVector(), IsFP);
2366 case TargetOpcode::G_BUILD_VECTOR: {
2368 FirstAnswer = TyBits;
2369 APInt SingleDemandedElt(1, 1);
2371 if (!DemandedElts[
I])
2376 FirstAnswer = std::min(FirstAnswer, Tmp2);
2379 if (FirstAnswer == 1)
2384 case TargetOpcode::G_CONCAT_VECTORS: {
2385 if (MRI.getType(
MI.getOperand(0).getReg()).isScalableVector())
2387 FirstAnswer = TyBits;
2390 unsigned NumSubVectorElts =
2391 MRI.getType(
MI.getOperand(1).getReg()).getNumElements();
2394 DemandedElts.
extractBits(NumSubVectorElts,
I * NumSubVectorElts);
2399 FirstAnswer = std::min(FirstAnswer, Tmp2);
2402 if (FirstAnswer == 1)
2407 case TargetOpcode::G_SHUFFLE_VECTOR: {
2410 APInt DemandedLHS, DemandedRHS;
2412 unsigned NumElts = MRI.getType(Src1).getNumElements();
2414 DemandedElts, DemandedLHS, DemandedRHS))
2420 if (FirstAnswer == 1)
2422 if (!!DemandedRHS) {
2425 FirstAnswer = std::min(FirstAnswer, Tmp2);
2429 case TargetOpcode::G_SPLAT_VECTOR: {
2433 unsigned NumSrcBits = MRI.getType(Src).getSizeInBits();
2434 if (NumSrcSignBits > (NumSrcBits - TyBits))
2435 return NumSrcSignBits - (NumSrcBits - TyBits);
2438 case TargetOpcode::G_INTRINSIC:
2439 case TargetOpcode::G_INTRINSIC_W_SIDE_EFFECTS:
2440 case TargetOpcode::G_INTRINSIC_CONVERGENT:
2441 case TargetOpcode::G_INTRINSIC_CONVERGENT_W_SIDE_EFFECTS:
2444 TL.computeNumSignBitsForTargetInstr(*
this, R, DemandedElts, MRI,
Depth);
2446 FirstAnswer = std::max(FirstAnswer, NumBits);
2466 Mask <<= Mask.getBitWidth() - TyBits;
2467 return std::max(FirstAnswer, Mask.countl_one());
2471 LLT Ty = MRI.getType(R);
2472 APInt DemandedElts =
2481 unsigned Opcode =
MI.getOpcode();
2483 LLT Ty = MRI.getType(R);
2484 unsigned BitWidth = Ty.getScalarSizeInBits();
2486 if (Opcode == TargetOpcode::G_CONSTANT) {
2487 const APInt &ShAmt =
MI.getOperand(1).getCImm()->getValue();
2489 return std::nullopt;
2493 if (Opcode == TargetOpcode::G_BUILD_VECTOR) {
2494 const APInt *MinAmt =
nullptr, *MaxAmt =
nullptr;
2495 for (
unsigned I = 0, E =
MI.getNumOperands() - 1;
I != E; ++
I) {
2496 if (!DemandedElts[
I])
2499 if (
Op->getOpcode() != TargetOpcode::G_CONSTANT) {
2500 MinAmt = MaxAmt =
nullptr;
2504 const APInt &ShAmt =
Op->getOperand(1).getCImm()->getValue();
2506 return std::nullopt;
2507 if (!MinAmt || MinAmt->
ugt(ShAmt))
2509 if (!MaxAmt || MaxAmt->ult(ShAmt))
2512 assert(((!MinAmt && !MaxAmt) || (MinAmt && MaxAmt)) &&
2513 "Failed to find matching min/max shift amounts");
2514 if (MinAmt && MaxAmt)
2524 return std::nullopt;
2529 if (std::optional<ConstantRange> AmtRange =
2531 return AmtRange->getUnsignedMin().getZExtValue();
2532 return std::nullopt;
2550 Info = std::make_unique<GISelValueTracking>(MF, MaxDepth);
2575 if (!MO.isReg() || MO.getReg().isPhysical())
2578 if (!MRI.getType(Reg).isValid())
2580 KnownBits Known = VTA.getKnownBits(Reg);
2581 unsigned SignedBits = VTA.computeNumSignBits(Reg);
2582 OS <<
" " << MO <<
" KnownBits:" << Known <<
" SignBits:" << SignedBits
MachineInstrBuilder MachineInstrBuilder & DefMI
assert(UImm &&(UImm !=~static_cast< T >(0)) &&"Invalid immediate!")
This file declares a class to represent arbitrary precision floating point values and provide a varie...
MachineBasicBlock MachineBasicBlock::iterator DebugLoc DL
static GCRegistry::Add< ErlangGC > A("erlang", "erlang-compatible garbage collector")
static GCRegistry::Add< OcamlGC > B("ocaml", "ocaml 3.10-compatible GC")
Utilities for dealing with flags related to floating point properties and mode controls.
static void dumpResult(const MachineInstr &MI, const KnownBits &Known, unsigned Depth)
static unsigned computeNumSignBitsFromRangeMetadata(const GAnyLoad *Ld, unsigned TyBits)
Compute the known number of sign bits with attached range metadata in the memory operand.
Provides analysis for querying information about KnownBits during GISel passes.
Declares convenience wrapper classes for interpreting MachineInstr instances as specific generic oper...
const size_t AbstractManglingParser< Derived, Alloc >::NumOps
Implement a low-level type suitable for MachineInstr level instruction selection.
Contains matchers for matching SSA Machine Instructions.
Promote Memory to Register
static MCRegister getReg(const MCDisassembler *D, unsigned RC, unsigned RegNo)
ConstantRange Range(APInt(BitWidth, Low), APInt(BitWidth, High))
#define INITIALIZE_PASS(passName, arg, name, cfg, analysis)
const SmallVectorImpl< MachineOperand > & Cond
static cl::opt< RegAllocEvictionAdvisorAnalysisLegacy::AdvisorMode > Mode("regalloc-enable-advisor", cl::Hidden, cl::init(RegAllocEvictionAdvisorAnalysisLegacy::AdvisorMode::Default), cl::desc("Enable regalloc advisor mode"), cl::values(clEnumValN(RegAllocEvictionAdvisorAnalysisLegacy::AdvisorMode::Default, "default", "Default"), clEnumValN(RegAllocEvictionAdvisorAnalysisLegacy::AdvisorMode::Release, "release", "precompiled"), clEnumValN(RegAllocEvictionAdvisorAnalysisLegacy::AdvisorMode::Development, "development", "for training")))
static uint64_t umul_ov(uint64_t i, uint64_t j, bool &Overflow)
This file defines the make_scope_exit function, which executes user-defined cleanup logic at scope ex...
static TableGen::Emitter::Opt Y("gen-skeleton-entry", EmitSkeleton, "Generate example skeleton entry")
This file describes how to lower LLVM code to machine code.
static bool isAbsoluteValueULEOne(const Value *V)
static Function * getFunction(FunctionType *Ty, const Twine &Name, Module *M)
static APFloat getLargest(const fltSemantics &Sem, bool Negative=false)
Returns the largest finite number in the given semantics.
Class for arbitrary precision integers.
LLVM_ABI APInt umul_ov(const APInt &RHS, bool &Overflow) const
static APInt getAllOnes(unsigned numBits)
Return an APInt of a specified width with all bits set.
void clearBit(unsigned BitPosition)
Set a given bit to 0.
LLVM_ABI APInt zext(unsigned width) const
Zero extend to a new width.
static APInt getSignMask(unsigned BitWidth)
Get the SignMask for a specific bit width.
void setHighBits(unsigned hiBits)
Set the top hiBits bits.
void setBitsFrom(unsigned loBit)
Set the top bits starting from loBit.
bool ugt(const APInt &RHS) const
Unsigned greater than comparison.
bool isZero() const
Determine if this value is zero, i.e. all bits are clear.
unsigned getBitWidth() const
Return the number of bits in the APInt.
bool ult(const APInt &RHS) const
Unsigned less than comparison.
LLVM_ABI APInt rotr(unsigned rotateAmt) const
Rotate right by rotateAmt.
unsigned getNumSignBits() const
Computes the number of leading bits of this APInt that are equal to its sign bit.
unsigned countl_zero() const
The APInt version of std::countl_zero.
void clearLowBits(unsigned loBits)
Set bottom loBits bits to 0.
unsigned logBase2() const
uint64_t getLimitedValue(uint64_t Limit=UINT64_MAX) const
If this value is smaller than the specified limit, return it, otherwise return the limit value.
void setAllBits()
Set every bit to 1.
APInt shl(unsigned shiftAmt) const
Left-shift function.
bool isPowerOf2() const
Check if this APInt's value is a power of two greater than zero.
static APInt getLowBitsSet(unsigned numBits, unsigned loBitsSet)
Constructs an APInt value that has the bottom loBitsSet bits set.
void setLowBits(unsigned loBits)
Set the bottom loBits bits.
LLVM_ABI APInt extractBits(unsigned numBits, unsigned bitPosition) const
Return an APInt with the extracted bits [bitPosition,bitPosition+numBits).
static APInt getBitsSetFrom(unsigned numBits, unsigned loBit)
Constructs an APInt value that has a contiguous range of bits set.
static APInt getOneBitSet(unsigned numBits, unsigned BitNo)
Return an APInt with exactly one bit set in the result.
bool uge(const APInt &RHS) const
Unsigned greater or equal comparison.
PassT::Result & getResult(IRUnitT &IR, ExtraArgTs... ExtraArgs)
Get the result of an analysis pass for a given IR unit.
Represent the analysis usage information of a pass.
void setPreservesAll()
Set by analyses that do not transform their input at all.
Predicate
This enumeration lists the possible predicates for CmpInst subclasses.
This class represents a range of values.
static LLVM_ABI ConstantRange fromKnownBits(const KnownBits &Known, bool IsSigned)
Initialize a range based on a known bits constraint.
LLVM_ABI ConstantRange zeroExtend(uint32_t BitWidth) const
Return a new range in the specified integer type, which must be strictly larger than the current type...
LLVM_ABI APInt getSignedMin() const
Return the smallest signed value contained in the ConstantRange.
LLVM_ABI ConstantRange signExtend(uint32_t BitWidth) const
Return a new range in the specified integer type, which must be strictly larger than the current type...
LLVM_ABI APInt getUnsignedMax() const
Return the largest unsigned value contained in the ConstantRange.
LLVM_ABI APInt getSignedMax() const
Return the largest signed value contained in the ConstantRange.
uint32_t getBitWidth() const
Get the bit width of this ConstantRange.
Represents any generic load, including sign/zero extending variants.
const MDNode * getRanges() const
Returns the Ranges that describes the dereference.
static LLVM_ABI std::optional< GFConstant > getConstant(Register Const, const MachineRegisterInfo &MRI)
To use KnownBitsInfo analysis in a pass, KnownBitsInfo &Info = getAnalysis<GISelValueTrackingInfoAnal...
GISelValueTracking & get(MachineFunction &MF)
bool runOnMachineFunction(MachineFunction &MF) override
runOnMachineFunction - This method must be overloaded to perform the desired machine code transformat...
void getAnalysisUsage(AnalysisUsage &AU) const override
getAnalysisUsage - This function should be overriden by passes that need analysis information to do t...
GISelValueTracking Result
LLVM_ABI Result run(MachineFunction &MF, MachineFunctionAnalysisManager &MFAM)
LLVM_ABI PreservedAnalyses run(MachineFunction &MF, MachineFunctionAnalysisManager &MFAM)
unsigned getMaxDepth() const
KnownBits getKnownBits(Register R)
Align computeKnownAlignment(Register R, unsigned Depth=0)
std::optional< ConstantRange > getValidShiftAmountRange(Register R, const APInt &DemandedElts, unsigned Depth)
If a G_SHL/G_ASHR/G_LSHR node with shift operand R has shift amounts that are all less than the eleme...
bool maskedValueIsZero(Register Val, const APInt &Mask)
std::optional< uint64_t > getValidMinimumShiftAmount(Register R, const APInt &DemandedElts, unsigned Depth=0)
If a G_SHL/G_ASHR/G_LSHR node with shift operand R has shift amounts that are all less than the eleme...
bool signBitIsZero(Register Op)
const DataLayout & getDataLayout() const
unsigned computeNumSignBits(Register R, const APInt &DemandedElts, unsigned Depth=0)
const MachineFunction & getMachineFunction() const
bool isKnownNeverNaN(Register Val, bool SNaN=false)
Returns true if Val can be assumed to never be a NaN.
APInt getKnownOnes(Register R)
APInt getKnownZeroes(Register R)
void computeKnownBitsImpl(Register R, KnownBits &Known, const APInt &DemandedElts, unsigned Depth=0)
Register getCondReg() const
Register getFalseReg() const
Register getTrueReg() const
Register getSrc2Reg() const
Register getSrc1Reg() const
ArrayRef< int > getMask() const
constexpr bool isScalableVector() const
Returns true if the LLT is a scalable vector.
constexpr unsigned getScalarSizeInBits() const
LLT getScalarType() const
constexpr bool isValid() const
constexpr uint16_t getNumElements() const
Returns the number of elements in a vector LLT.
constexpr bool isVector() const
constexpr ElementCount getElementCount() const
constexpr bool isFixedVector() const
Returns true if the LLT is a fixed vector.
TypeSize getValue() const
void getAnalysisUsage(AnalysisUsage &AU) const override
getAnalysisUsage - Subclasses that override getAnalysisUsage must call this.
MachineRegisterInfo & getRegInfo()
getRegInfo - Return information about the registers currently in use.
Function & getFunction()
Return the LLVM function that this machine code represents.
const TargetMachine & getTarget() const
getTarget - Return the target machine this machine code is compiled with
Representation of each machine instruction.
unsigned getOpcode() const
Returns the opcode of this MachineInstr.
const MachineOperand & getOperand(unsigned i) const
A description of a memory reference used in the backend.
LLT getMemoryType() const
Return the memory type of the memory reference.
const MDNode * getRanges() const
Return the range tag for the memory reference.
LocationSize getSizeInBits() const
Return the size in bits of the memory reference.
MachineOperand class - Representation of each machine instruction operand.
Register getReg() const
getReg - Returns the register number.
MachineRegisterInfo - Keep track of information for virtual and physical registers,...
LLT getType(Register Reg) const
Get the low-level type of Reg or LLT{} if Reg is not a generic (target independent) virtual register.
A set of analyses that are preserved following a run of a transformation pass.
static PreservedAnalyses all()
Construct a special preserved set that preserves all passes.
Wrapper class representing virtual and physical registers.
constexpr bool isVirtual() const
Return true if the specified register number is in the virtual register namespace.
@ ZeroOrOneBooleanContent
@ ZeroOrNegativeOneBooleanContent
CodeGenOptLevel getOptLevel() const
Returns the optimization level: None, Less, Default, or Aggressive.
LLVM_ABI void printAsOperand(raw_ostream &O, bool PrintType=true, const Module *M=nullptr) const
Print the name of this Value out to the specified raw_ostream.
constexpr ScalarTy getKnownMinValue() const
Returns the minimum value this quantity can represent.
#define llvm_unreachable(msg)
Marks that the current location is not supposed to be reachable.
@ C
The default llvm calling convention, compatible with C.
operand_type_match m_Reg()
UnaryOp_match< SrcTy, TargetOpcode::G_FFLOOR > m_GFFloor(const SrcTy &Src)
operand_type_match m_Pred()
bind_ty< FPClassTest > m_FPClassTest(FPClassTest &T)
deferred_ty< Register > m_DeferredReg(Register &R)
Similar to m_SpecificReg/Type, but the specific value to match originated from an earlier sub-pattern...
BinaryOp_match< LHS, RHS, TargetOpcode::G_FSUB, false > m_GFSub(const LHS &L, const RHS &R)
bool mi_match(Reg R, const MachineRegisterInfo &MRI, Pattern &&P)
ClassifyOp_match< LHS, Test, TargetOpcode::G_IS_FPCLASS > m_GIsFPClass(const LHS &L, const Test &T)
Matches the register and immediate used in a fpclass test G_IS_FPCLASS val, 96.
CompareOp_match< Pred, LHS, RHS, TargetOpcode::G_FCMP > m_GFCmp(const Pred &P, const LHS &L, const RHS &R)
This is an optimization pass for GlobalISel generic memory operations.
auto drop_begin(T &&RangeOrContainer, size_t N=1)
Return a range covering RangeOrContainer with the first N elements excluded.
LLVM_ABI KnownFPClass computeKnownFPClass(const Value *V, const APInt &DemandedElts, FPClassTest InterestedClasses, const SimplifyQuery &SQ, unsigned Depth=0)
Determine which floating-point classes are valid for V, and return them in KnownFPClass bit sets.
LLVM_ABI std::optional< APInt > getIConstantVRegVal(Register VReg, const MachineRegisterInfo &MRI)
If VReg is defined by a G_CONSTANT, return the corresponding value.
auto enumerate(FirstRange &&First, RestRanges &&...Rest)
Given two or more input ranges, returns a new range whose values are tuples (A, B,...
LLVM_ABI const llvm::fltSemantics & getFltSemanticForLLT(LLT Ty)
Get the appropriate floating point arithmetic semantic based on the bit size of the given scalar LLT.
scope_exit(Callable) -> scope_exit< Callable >
int bit_width(T Value)
Returns the number of bits needed to represent Value if Value is nonzero.
constexpr bool isUIntN(unsigned N, uint64_t x)
Checks if an unsigned integer fits into the given (dynamic) bit width.
AnalysisManager< MachineFunction > MachineFunctionAnalysisManager
int ilogb(const APFloat &Arg)
Returns the exponent of the internal representation of the APFloat.
LLVM_ABI std::optional< APInt > isConstantOrConstantSplatVector(MachineInstr &MI, const MachineRegisterInfo &MRI)
Determines if MI defines a constant integer or a splat vector of constant integers.
unsigned Log2_64(uint64_t Value)
Return the floor log base 2 of the specified value, -1 if the value is zero.
LLVM_ABI bool isGuaranteedNotToBeUndef(const Value *V, AssumptionCache *AC=nullptr, const Instruction *CtxI=nullptr, const DominatorTree *DT=nullptr, unsigned Depth=0)
Returns true if V cannot be undef, but may be poison.
LLVM_ABI ConstantRange getConstantRangeFromMetadata(const MDNode &RangeMD)
Parse out a conservative ConstantRange from !range metadata.
std::tuple< Value *, FPClassTest, FPClassTest > fcmpImpliesClass(CmpInst::Predicate Pred, const Function &F, Value *LHS, FPClassTest RHSClass, bool LookThroughSrc=true)
LLVM_ABI bool getShuffleDemandedElts(int SrcWidth, ArrayRef< int > Mask, const APInt &DemandedElts, APInt &DemandedLHS, APInt &DemandedRHS, bool AllowUndefElts=false)
Transform a shuffle mask's output demanded element mask into demanded element masks for the 2 operand...
constexpr unsigned MaxAnalysisRecursionDepth
FPClassTest
Floating-point class tests, supported by 'is_fpclass' intrinsic.
LLVM_ABI raw_ostream & dbgs()
dbgs() - This returns a reference to a raw_ostream for debugging messages.
LLVM_ABI ConstantRange getVScaleRange(const Function *F, unsigned BitWidth)
Determine the possible constant range of vscale with the given bit width, based on the vscale_range f...
@ First
Helpers to iterate all locations in the MemoryEffectsBase class.
DWARFExpression::Operation Op
std::string toString(const APInt &I, unsigned Radix, bool Signed, bool formatAsCLiteral=false, bool UpperCase=true, bool InsertSeparators=false)
constexpr unsigned BitWidth
decltype(auto) cast(const From &Val)
cast<X> - Return the argument parameter cast to the specified type.
static uint32_t extractBits(uint64_t Val, uint32_t Hi, uint32_t Lo)
LLVM_ABI void computeKnownBitsFromRangeMetadata(const MDNode &Ranges, KnownBits &Known)
Compute known bits from the range metadata.
This struct is a compact representation of a valid (non-zero power of two) alignment.
A special type used by analysis passes to provide an address that identifies that particular analysis...
static KnownBits makeConstant(const APInt &C)
Create known bits from a known constant.
KnownBits anyextOrTrunc(unsigned BitWidth) const
Return known bits for an "any" extension or truncation of the value we're tracking.
LLVM_ABI KnownBits sextInReg(unsigned SrcBitWidth) const
Return known bits for a in-register sign extension of the value we're tracking.
static LLVM_ABI KnownBits mulhu(const KnownBits &LHS, const KnownBits &RHS)
Compute known bits from zero-extended multiply-hi.
unsigned countMinSignBits() const
Returns the number of times the sign bit is replicated into the other bits.
static LLVM_ABI KnownBits smax(const KnownBits &LHS, const KnownBits &RHS)
Compute known bits for smax(LHS, RHS).
bool isNonNegative() const
Returns true if this value is known to be non-negative.
bool isZero() const
Returns true if value is all zero.
static LLVM_ABI KnownBits ashr(const KnownBits &LHS, const KnownBits &RHS, bool ShAmtNonZero=false, bool Exact=false)
Compute known bits for ashr(LHS, RHS).
static LLVM_ABI KnownBits urem(const KnownBits &LHS, const KnownBits &RHS)
Compute known bits for urem(LHS, RHS).
bool isUnknown() const
Returns true if we don't know any bits.
unsigned countMaxTrailingZeros() const
Returns the maximum number of trailing zero bits possible.
KnownBits trunc(unsigned BitWidth) const
Return known bits for a truncation of the value we're tracking.
KnownBits byteSwap() const
static LLVM_ABI KnownBits fshl(const KnownBits &LHS, const KnownBits &RHS, const APInt &Amt)
Compute known bits for fshl(LHS, RHS, Amt).
unsigned countMaxPopulation() const
Returns the maximum number of bits that could be one.
void setAllZero()
Make all bits known to be zero and discard any previous information.
KnownBits reverseBits() const
unsigned getBitWidth() const
Get the bit width of this value.
static LLVM_ABI KnownBits umax(const KnownBits &LHS, const KnownBits &RHS)
Compute known bits for umax(LHS, RHS).
KnownBits zext(unsigned BitWidth) const
Return known bits for a zero extension of the value we're tracking.
static KnownBits add(const KnownBits &LHS, const KnownBits &RHS, bool NSW=false, bool NUW=false, bool SelfAdd=false)
Compute knownbits resulting from addition of LHS and RHS.
static LLVM_ABI KnownBits lshr(const KnownBits &LHS, const KnownBits &RHS, bool ShAmtNonZero=false, bool Exact=false)
Compute known bits for lshr(LHS, RHS).
bool isNonZero() const
Returns true if this value is known to be non-zero.
static LLVM_ABI KnownBits abdu(const KnownBits &LHS, const KnownBits &RHS)
Compute known bits for abdu(LHS, RHS).
bool isEven() const
Return if the value is known even (the low bit is 0).
KnownBits extractBits(unsigned NumBits, unsigned BitPosition) const
Return a subset of the known bits from [bitPosition,bitPosition+numBits).
KnownBits intersectWith(const KnownBits &RHS) const
Returns KnownBits information that is known to be true for both this and RHS.
KnownBits sext(unsigned BitWidth) const
Return known bits for a sign extension of the value we're tracking.
KnownBits zextOrTrunc(unsigned BitWidth) const
Return known bits for a zero extension or truncation of the value we're tracking.
unsigned countMinLeadingZeros() const
Returns the minimum number of leading zero bits.
APInt getMaxValue() const
Return the maximal unsigned value possible given these KnownBits.
static LLVM_ABI KnownBits fshr(const KnownBits &LHS, const KnownBits &RHS, const APInt &Amt)
Compute known bits for fshr(LHS, RHS, Amt).
static LLVM_ABI KnownBits abds(KnownBits LHS, KnownBits RHS)
Compute known bits for abds(LHS, RHS).
static LLVM_ABI KnownBits smin(const KnownBits &LHS, const KnownBits &RHS)
Compute known bits for smin(LHS, RHS).
static LLVM_ABI KnownBits mulhs(const KnownBits &LHS, const KnownBits &RHS)
Compute known bits from sign-extended multiply-hi.
static LLVM_ABI KnownBits srem(const KnownBits &LHS, const KnownBits &RHS)
Compute known bits for srem(LHS, RHS).
static LLVM_ABI KnownBits udiv(const KnownBits &LHS, const KnownBits &RHS, bool Exact=false)
Compute known bits for udiv(LHS, RHS).
APInt getMinValue() const
Return the minimal unsigned value possible given these KnownBits.
static LLVM_ABI KnownBits sdiv(const KnownBits &LHS, const KnownBits &RHS, bool Exact=false)
Compute known bits for sdiv(LHS, RHS).
bool isNegative() const
Returns true if this value is known to be negative.
static LLVM_ABI KnownBits computeForAddCarry(const KnownBits &LHS, const KnownBits &RHS, const KnownBits &Carry)
Compute known bits resulting from adding LHS, RHS and a 1-bit Carry.
static KnownBits sub(const KnownBits &LHS, const KnownBits &RHS, bool NSW=false, bool NUW=false)
Compute knownbits resulting from subtraction of LHS and RHS.
unsigned countMaxLeadingZeros() const
Returns the maximum number of leading zero bits possible.
void insertBits(const KnownBits &SubBits, unsigned BitPosition)
Insert the bits from a smaller known bits starting at bitPosition.
static LLVM_ABI KnownBits mul(const KnownBits &LHS, const KnownBits &RHS, bool NoUndefSelfMultiply=false)
Compute known bits resulting from multiplying LHS and RHS.
KnownBits anyext(unsigned BitWidth) const
Return known bits for an "any" extension of the value we're tracking, where we don't know anything ab...
LLVM_ABI KnownBits abs(bool IntMinIsPoison=false) const
Compute known bits for the absolute value.
static LLVM_ABI KnownBits shl(const KnownBits &LHS, const KnownBits &RHS, bool NUW=false, bool NSW=false, bool ShAmtNonZero=false)
Compute known bits for shl(LHS, RHS).
static LLVM_ABI KnownBits umin(const KnownBits &LHS, const KnownBits &RHS)
Compute known bits for umin(LHS, RHS).
bool isAllOnes() const
Returns true if value is all one bits.
FPClassTest KnownFPClasses
Floating-point classes the value could be one of.
bool isKnownNeverInfinity() const
Return true if it's known this can never be an infinity.
bool cannotBeOrderedGreaterThanZero() const
Return true if we can prove that the analyzed floating-point value is either NaN or never greater tha...
static LLVM_ABI KnownFPClass sin(const KnownFPClass &Src)
Report known values for sin.
static LLVM_ABI KnownFPClass fdiv_self(const KnownFPClass &Src, DenormalMode Mode=DenormalMode::getDynamic())
Report known values for fdiv x, x.
static constexpr FPClassTest OrderedGreaterThanZeroMask
static constexpr FPClassTest OrderedLessThanZeroMask
void knownNot(FPClassTest RuleOut)
static LLVM_ABI KnownFPClass fmul(const KnownFPClass &LHS, const KnownFPClass &RHS, DenormalMode Mode=DenormalMode::getDynamic())
Report known values for fmul.
static LLVM_ABI KnownFPClass fadd_self(const KnownFPClass &Src, DenormalMode Mode=DenormalMode::getDynamic())
Report known values for fadd x, x.
void copysign(const KnownFPClass &Sign)
static KnownFPClass square(const KnownFPClass &Src, DenormalMode Mode=DenormalMode::getDynamic())
static LLVM_ABI KnownFPClass fsub(const KnownFPClass &LHS, const KnownFPClass &RHS, DenormalMode Mode=DenormalMode::getDynamic())
Report known values for fsub.
static LLVM_ABI KnownFPClass canonicalize(const KnownFPClass &Src, DenormalMode DenormMode=DenormalMode::getDynamic())
Apply the canonicalize intrinsic to this value.
LLVM_ABI bool isKnownNeverLogicalZero(DenormalMode Mode) const
Return true if it's known this can never be interpreted as a zero.
static LLVM_ABI KnownFPClass log(const KnownFPClass &Src, DenormalMode Mode=DenormalMode::getDynamic())
Propagate known class for log/log2/log10.
static LLVM_ABI KnownFPClass atan(const KnownFPClass &Src)
Report known values for atan.
static LLVM_ABI KnownFPClass atan2(const KnownFPClass &LHS, const KnownFPClass &RHS)
Report known values for atan2.
static LLVM_ABI KnownFPClass fdiv(const KnownFPClass &LHS, const KnownFPClass &RHS, DenormalMode Mode=DenormalMode::getDynamic())
Report known values for fdiv.
static LLVM_ABI KnownFPClass roundToIntegral(const KnownFPClass &Src, bool IsTrunc, bool IsMultiUnitFPType)
Propagate known class for rounding intrinsics (trunc, floor, ceil, rint, nearbyint,...
static LLVM_ABI KnownFPClass cos(const KnownFPClass &Src)
Report known values for cos.
static LLVM_ABI KnownFPClass ldexp(const KnownFPClass &Src, const KnownBits &N, const fltSemantics &Flt, DenormalMode Mode=DenormalMode::getDynamic())
Propagate known class for ldexp.
static LLVM_ABI KnownFPClass cosh(const KnownFPClass &Src)
Report known values for cosh.
static LLVM_ABI KnownFPClass minMaxLike(const KnownFPClass &LHS, const KnownFPClass &RHS, MinMaxKind Kind, DenormalMode DenormMode=DenormalMode::getDynamic())
KnownFPClass intersectWith(const KnownFPClass &RHS) const
static LLVM_ABI KnownFPClass exp(const KnownFPClass &Src)
Report known values for exp, exp2 and exp10.
static LLVM_ABI KnownFPClass frexp_mant(const KnownFPClass &Src, DenormalMode Mode=DenormalMode::getDynamic())
Propagate known class for mantissa component of frexp.
std::optional< bool > SignBit
std::nullopt if the sign bit is unknown, true if the sign bit is definitely set or false if the sign ...
static LLVM_ABI KnownFPClass asin(const KnownFPClass &Src)
Report known values for asin.
bool isKnownNeverNaN() const
Return true if it's known this can never be a nan.
bool isKnownNever(FPClassTest Mask) const
Return true if it's known this can never be one of the mask entries.
static LLVM_ABI KnownFPClass fpext(const KnownFPClass &KnownSrc, const fltSemantics &DstTy, const fltSemantics &SrcTy)
Propagate known class for fpext.
static LLVM_ABI KnownFPClass fma(const KnownFPClass &LHS, const KnownFPClass &RHS, const KnownFPClass &Addend, DenormalMode Mode=DenormalMode::getDynamic())
Report known values for fma.
static LLVM_ABI KnownFPClass tan(const KnownFPClass &Src)
Report known values for tan.
static LLVM_ABI KnownFPClass fptrunc(const KnownFPClass &KnownSrc)
Propagate known class for fptrunc.
bool cannotBeOrderedLessThanZero() const
Return true if we can prove that the analyzed floating-point value is either NaN or never less than -...
void signBitMustBeOne()
Assume the sign bit is one.
void signBitMustBeZero()
Assume the sign bit is zero.
static LLVM_ABI KnownFPClass sqrt(const KnownFPClass &Src, DenormalMode Mode=DenormalMode::getDynamic())
Propagate known class for sqrt.
static LLVM_ABI KnownFPClass fadd(const KnownFPClass &LHS, const KnownFPClass &RHS, DenormalMode Mode=DenormalMode::getDynamic())
Report known values for fadd.
static LLVM_ABI KnownFPClass fma_square(const KnownFPClass &Squared, const KnownFPClass &Addend, DenormalMode Mode=DenormalMode::getDynamic())
Report known values for fma squared, squared, addend.
static LLVM_ABI KnownFPClass acos(const KnownFPClass &Src)
Report known values for acos.
static LLVM_ABI KnownFPClass frem_self(const KnownFPClass &Src, DenormalMode Mode=DenormalMode::getDynamic())
Report known values for frem.
static LLVM_ABI KnownFPClass powi(const KnownFPClass &Src, const KnownBits &N)
Propagate known class for powi.
static LLVM_ABI KnownFPClass sinh(const KnownFPClass &Src)
Report known values for sinh.
static LLVM_ABI KnownFPClass tanh(const KnownFPClass &Src)
Report known values for tanh.