33#define DEBUG_TYPE "hexbit"
45 cl::init(std::numeric_limits<unsigned>::max()));
48 cl::init(std::numeric_limits<unsigned>::max()));
59 explicit RegisterSet(
unsigned s,
bool t =
false) : Bits(s, t) {}
67 unsigned count()
const {
71 unsigned find_first()
const {
78 unsigned find_next(
unsigned Prev)
const {
79 int Next =
Bits.find_next(v2x(Prev));
86 unsigned Idx = v2x(R);
88 bool Exists =
Bits.test(Idx);
93 unsigned T = LRU.front();
101 unsigned Idx = v2x(R);
102 if (Idx <
Bits.size()) {
103 bool Exists =
Bits.test(Idx);
115 for (
unsigned R = Rs.find_first(); R; R = Rs.find_next(R))
120 for (
unsigned R = Rs.find_first(); R; R = Rs.find_next(R))
125 bool operator[](
unsigned R)
const {
126 unsigned Idx = v2x(R);
127 return Idx <
Bits.size() ?
Bits[Idx] :
false;
129 bool has(
unsigned R)
const {
130 unsigned Idx = v2x(R);
131 if (Idx >=
Bits.size())
133 return Bits.test(Idx);
143 return Bits.anyCommon(Rs.Bits);
148 std::deque<unsigned> LRU;
150 void ensure(
unsigned Idx) {
151 if (
Bits.size() <= Idx)
152 Bits.resize(std::max(Idx+1, 32U));
155 static inline unsigned v2x(
unsigned v) {
159 static inline unsigned x2v(
unsigned x) {
160 return Register::index2VirtReg(x);
165 PrintRegSet(
const RegisterSet &S,
const TargetRegisterInfo *RI)
168 friend raw_ostream &
operator<< (raw_ostream &OS,
169 const PrintRegSet &
P);
173 const TargetRegisterInfo *TRI;
177 const PrintRegSet &
P);
180 for (
unsigned R =
P.RS.find_first(); R; R =
P.RS.find_next(R))
186 class Transformation;
192 HexagonBitSimplify() : MachineFunctionPass(ID) {}
194 StringRef getPassName()
const override {
195 return "Hexagon bit simplification";
198 void getAnalysisUsage(AnalysisUsage &AU)
const override {
204 bool runOnMachineFunction(MachineFunction &MF)
override;
206 static void getInstrDefs(
const MachineInstr &
MI,
RegisterSet &Defs);
208 static bool isEqual(
const BitTracker::RegisterCell &RC1, uint16_t B1,
209 const BitTracker::RegisterCell &RC2, uint16_t B2, uint16_t W);
210 static bool isZero(
const BitTracker::RegisterCell &RC, uint16_t
B,
212 static bool getConst(
const BitTracker::RegisterCell &RC, uint16_t
B,
213 uint16_t W, uint64_t &U);
215 MachineRegisterInfo &
MRI);
216 static bool getSubregMask(
const BitTracker::RegisterRef &RR,
217 unsigned &Begin,
unsigned &Width, MachineRegisterInfo &
MRI);
219 MachineRegisterInfo &
MRI);
221 unsigned NewSR, MachineRegisterInfo &
MRI);
222 static bool parseRegSequence(
const MachineInstr &
I,
223 BitTracker::RegisterRef &SL, BitTracker::RegisterRef &SH,
224 const MachineRegisterInfo &
MRI);
226 static bool getUsedBitsInStore(
unsigned Opc, BitVector &Bits,
228 static bool getUsedBits(
unsigned Opc,
unsigned OpN, BitVector &Bits,
229 uint16_t Begin,
const HexagonInstrInfo &HII);
231 static const TargetRegisterClass *getFinalVRegClass(
232 const BitTracker::RegisterRef &RR, MachineRegisterInfo &
MRI);
233 static bool isTransparentCopy(
const BitTracker::RegisterRef &RD,
234 const BitTracker::RegisterRef &RS, MachineRegisterInfo &
MRI);
237 MachineDominatorTree *MDT =
nullptr;
239 bool visitBlock(MachineBasicBlock &
B, Transformation &
T,
RegisterSet &AVs);
240 static bool hasTiedUse(
unsigned Reg, MachineRegisterInfo &
MRI,
241 unsigned NewSub = Hexagon::NoSubRegister);
244 using HBS = HexagonBitSimplify;
249 class Transformation {
253 Transformation(
bool TD) : TopDown(TD) {}
254 virtual ~Transformation() =
default;
256 virtual bool processBlock(MachineBasicBlock &
B,
const RegisterSet &AVs) = 0;
261char HexagonBitSimplify::ID = 0;
264 "Hexagon bit simplification",
false,
false)
278 getInstrDefs(
I, Defs);
279 RegisterSet NewAVs = AVs;
283 Changed |= visitBlock(*(DTN->getBlock()),
T, NewAVs);
296 for (
auto &
Op :
MI.operands()) {
297 if (!
Op.isReg() || !
Op.isDef())
306void HexagonBitSimplify::getInstrUses(
const MachineInstr &
MI,
308 for (
auto &
Op :
MI.operands()) {
309 if (!
Op.isReg() || !
Op.isUse())
319bool HexagonBitSimplify::isEqual(
const BitTracker::RegisterCell &RC1,
320 uint16_t B1,
const BitTracker::RegisterCell &RC2, uint16_t B2,
322 for (uint16_t i = 0; i <
W; ++i) {
329 if (RC1[B1+i] != RC2[B2+i])
335bool HexagonBitSimplify::isZero(
const BitTracker::RegisterCell &RC,
336 uint16_t
B, uint16_t W) {
338 for (uint16_t i =
B; i <
B+
W; ++i)
344bool HexagonBitSimplify::getConst(
const BitTracker::RegisterCell &RC,
345 uint16_t
B, uint16_t W, uint64_t &U) {
348 for (uint16_t i =
B+W; i >
B; --i) {
349 const BitTracker::BitValue &BV = RC[i-1];
361 MachineRegisterInfo &
MRI) {
364 auto Begin =
MRI.use_begin(OldR), End =
MRI.use_end();
366 for (
auto I = Begin;
I != End;
I = NextI) {
367 NextI = std::next(
I);
375 MachineRegisterInfo &
MRI) {
378 if (hasTiedUse(OldR,
MRI, NewSR))
380 auto Begin =
MRI.use_begin(OldR), End =
MRI.use_end();
382 for (
auto I = Begin;
I != End;
I = NextI) {
383 NextI = std::next(
I);
390bool HexagonBitSimplify::replaceSubWithSub(
Register OldR,
unsigned OldSR,
392 MachineRegisterInfo &
MRI) {
395 if (OldSR != NewSR && hasTiedUse(OldR,
MRI, NewSR))
397 auto Begin =
MRI.use_begin(OldR), End =
MRI.use_end();
399 for (
auto I = Begin;
I != End;
I = NextI) {
400 NextI = std::next(
I);
401 if (
I->getSubReg() != OldSR)
412bool HexagonBitSimplify::getSubregMask(
const BitTracker::RegisterRef &RR,
413 unsigned &Begin,
unsigned &Width, MachineRegisterInfo &
MRI) {
414 const TargetRegisterClass *RC =
MRI.getRegClass(RR.
Reg);
417 Width =
MRI.getTargetRegisterInfo()->getRegSizeInBits(*RC);
423 switch (RC->
getID()) {
424 case Hexagon::DoubleRegsRegClassID:
425 case Hexagon::HvxWRRegClassID:
426 Width =
MRI.getTargetRegisterInfo()->getRegSizeInBits(*RC) / 2;
427 if (RR.
Sub == Hexagon::isub_hi || RR.
Sub == Hexagon::vsub_hi)
439bool HexagonBitSimplify::parseRegSequence(
const MachineInstr &
I,
440 BitTracker::RegisterRef &SL, BitTracker::RegisterRef &SH,
441 const MachineRegisterInfo &
MRI) {
442 assert(
I.getOpcode() == TargetOpcode::REG_SEQUENCE);
443 unsigned Sub1 =
I.getOperand(2).getImm(), Sub2 =
I.getOperand(4).getImm();
444 auto &DstRC = *
MRI.getRegClass(
I.getOperand(0).getReg());
445 auto &HRI =
static_cast<const HexagonRegisterInfo&
>(
446 *
MRI.getTargetRegisterInfo());
449 assert((Sub1 == SubLo && Sub2 == SubHi) || (Sub1 == SubHi && Sub2 == SubLo));
450 if (Sub1 == SubLo && Sub2 == SubHi) {
451 SL =
I.getOperand(1);
452 SH =
I.getOperand(3);
455 if (Sub1 == SubHi && Sub2 == SubLo) {
456 SH =
I.getOperand(1);
457 SL =
I.getOperand(3);
469bool HexagonBitSimplify::getUsedBitsInStore(
unsigned Opc, BitVector &Bits,
471 using namespace Hexagon;
476 case S2_storerbnew_io:
477 case S2_pstorerbt_io:
478 case S2_pstorerbf_io:
479 case S4_pstorerbtnew_io:
480 case S4_pstorerbfnew_io:
481 case S2_pstorerbnewt_io:
482 case S2_pstorerbnewf_io:
483 case S4_pstorerbnewtnew_io:
484 case S4_pstorerbnewfnew_io:
486 case S2_storerbnew_pi:
487 case S2_pstorerbt_pi:
488 case S2_pstorerbf_pi:
489 case S2_pstorerbtnew_pi:
490 case S2_pstorerbfnew_pi:
491 case S2_pstorerbnewt_pi:
492 case S2_pstorerbnewf_pi:
493 case S2_pstorerbnewtnew_pi:
494 case S2_pstorerbnewfnew_pi:
496 case S4_storerbnew_ap:
498 case S2_storerbnew_pr:
500 case S4_storerbnew_ur:
502 case S2_storerbnew_pbr:
504 case S2_storerbnew_pci:
506 case S2_storerbnew_pcr:
508 case S4_storerbnew_rr:
509 case S4_pstorerbt_rr:
510 case S4_pstorerbf_rr:
511 case S4_pstorerbtnew_rr:
512 case S4_pstorerbfnew_rr:
513 case S4_pstorerbnewt_rr:
514 case S4_pstorerbnewf_rr:
515 case S4_pstorerbnewtnew_rr:
516 case S4_pstorerbnewfnew_rr:
518 case S2_storerbnewgp:
519 case S4_pstorerbt_abs:
520 case S4_pstorerbf_abs:
521 case S4_pstorerbtnew_abs:
522 case S4_pstorerbfnew_abs:
523 case S4_pstorerbnewt_abs:
524 case S4_pstorerbnewf_abs:
525 case S4_pstorerbnewtnew_abs:
526 case S4_pstorerbnewfnew_abs:
527 Bits.set(Begin, Begin+8);
532 case S2_storerhnew_io:
533 case S2_pstorerht_io:
534 case S2_pstorerhf_io:
535 case S4_pstorerhtnew_io:
536 case S4_pstorerhfnew_io:
537 case S2_pstorerhnewt_io:
538 case S2_pstorerhnewf_io:
539 case S4_pstorerhnewtnew_io:
540 case S4_pstorerhnewfnew_io:
542 case S2_storerhnew_pi:
543 case S2_pstorerht_pi:
544 case S2_pstorerhf_pi:
545 case S2_pstorerhtnew_pi:
546 case S2_pstorerhfnew_pi:
547 case S2_pstorerhnewt_pi:
548 case S2_pstorerhnewf_pi:
549 case S2_pstorerhnewtnew_pi:
550 case S2_pstorerhnewfnew_pi:
552 case S4_storerhnew_ap:
554 case S2_storerhnew_pr:
556 case S4_storerhnew_ur:
558 case S2_storerhnew_pbr:
560 case S2_storerhnew_pci:
562 case S2_storerhnew_pcr:
564 case S4_pstorerht_rr:
565 case S4_pstorerhf_rr:
566 case S4_pstorerhtnew_rr:
567 case S4_pstorerhfnew_rr:
568 case S4_storerhnew_rr:
569 case S4_pstorerhnewt_rr:
570 case S4_pstorerhnewf_rr:
571 case S4_pstorerhnewtnew_rr:
572 case S4_pstorerhnewfnew_rr:
574 case S2_storerhnewgp:
575 case S4_pstorerht_abs:
576 case S4_pstorerhf_abs:
577 case S4_pstorerhtnew_abs:
578 case S4_pstorerhfnew_abs:
579 case S4_pstorerhnewt_abs:
580 case S4_pstorerhnewf_abs:
581 case S4_pstorerhnewtnew_abs:
582 case S4_pstorerhnewfnew_abs:
583 Bits.set(Begin, Begin+16);
588 case S2_pstorerft_io:
589 case S2_pstorerff_io:
590 case S4_pstorerftnew_io:
591 case S4_pstorerffnew_io:
593 case S2_pstorerft_pi:
594 case S2_pstorerff_pi:
595 case S2_pstorerftnew_pi:
596 case S2_pstorerffnew_pi:
604 case S4_pstorerft_rr:
605 case S4_pstorerff_rr:
606 case S4_pstorerftnew_rr:
607 case S4_pstorerffnew_rr:
609 case S4_pstorerft_abs:
610 case S4_pstorerff_abs:
611 case S4_pstorerftnew_abs:
612 case S4_pstorerffnew_abs:
613 Bits.set(Begin+16, Begin+32);
628bool HexagonBitSimplify::getUsedBits(
unsigned Opc,
unsigned OpN,
629 BitVector &Bits, uint16_t Begin,
const HexagonInstrInfo &HII) {
630 using namespace Hexagon;
632 const MCInstrDesc &
D = HII.get(
Opc);
634 if (OpN ==
D.getNumOperands()-1)
635 return getUsedBitsInStore(
Opc, Bits, Begin);
647 Bits.set(Begin, Begin+8);
660 Bits.set(Begin, Begin+16);
668 Bits.set(Begin+16, Begin+32);
678 Bits.set(Begin, Begin+8);
688 case A2_addh_h16_sat_ll:
690 case A2_addh_l16_sat_ll:
693 case A2_subh_h16_sat_ll:
695 case A2_subh_l16_sat_ll:
696 case M2_mpy_acc_ll_s0:
697 case M2_mpy_acc_ll_s1:
698 case M2_mpy_acc_sat_ll_s0:
699 case M2_mpy_acc_sat_ll_s1:
702 case M2_mpy_nac_ll_s0:
703 case M2_mpy_nac_ll_s1:
704 case M2_mpy_nac_sat_ll_s0:
705 case M2_mpy_nac_sat_ll_s1:
706 case M2_mpy_rnd_ll_s0:
707 case M2_mpy_rnd_ll_s1:
708 case M2_mpy_sat_ll_s0:
709 case M2_mpy_sat_ll_s1:
710 case M2_mpy_sat_rnd_ll_s0:
711 case M2_mpy_sat_rnd_ll_s1:
712 case M2_mpyd_acc_ll_s0:
713 case M2_mpyd_acc_ll_s1:
716 case M2_mpyd_nac_ll_s0:
717 case M2_mpyd_nac_ll_s1:
718 case M2_mpyd_rnd_ll_s0:
719 case M2_mpyd_rnd_ll_s1:
720 case M2_mpyu_acc_ll_s0:
721 case M2_mpyu_acc_ll_s1:
724 case M2_mpyu_nac_ll_s0:
725 case M2_mpyu_nac_ll_s1:
726 case M2_mpyud_acc_ll_s0:
727 case M2_mpyud_acc_ll_s1:
730 case M2_mpyud_nac_ll_s0:
731 case M2_mpyud_nac_ll_s1:
732 if (OpN == 1 || OpN == 2) {
733 Bits.set(Begin, Begin+16);
740 case A2_addh_h16_sat_lh:
743 case A2_subh_h16_sat_lh:
744 case M2_mpy_acc_lh_s0:
745 case M2_mpy_acc_lh_s1:
746 case M2_mpy_acc_sat_lh_s0:
747 case M2_mpy_acc_sat_lh_s1:
750 case M2_mpy_nac_lh_s0:
751 case M2_mpy_nac_lh_s1:
752 case M2_mpy_nac_sat_lh_s0:
753 case M2_mpy_nac_sat_lh_s1:
754 case M2_mpy_rnd_lh_s0:
755 case M2_mpy_rnd_lh_s1:
756 case M2_mpy_sat_lh_s0:
757 case M2_mpy_sat_lh_s1:
758 case M2_mpy_sat_rnd_lh_s0:
759 case M2_mpy_sat_rnd_lh_s1:
760 case M2_mpyd_acc_lh_s0:
761 case M2_mpyd_acc_lh_s1:
764 case M2_mpyd_nac_lh_s0:
765 case M2_mpyd_nac_lh_s1:
766 case M2_mpyd_rnd_lh_s0:
767 case M2_mpyd_rnd_lh_s1:
768 case M2_mpyu_acc_lh_s0:
769 case M2_mpyu_acc_lh_s1:
772 case M2_mpyu_nac_lh_s0:
773 case M2_mpyu_nac_lh_s1:
774 case M2_mpyud_acc_lh_s0:
775 case M2_mpyud_acc_lh_s1:
778 case M2_mpyud_nac_lh_s0:
779 case M2_mpyud_nac_lh_s1:
782 case A2_addh_l16_sat_hl:
784 case A2_subh_l16_sat_hl:
786 Bits.set(Begin, Begin+16);
790 Bits.set(Begin+16, Begin+32);
797 case A2_addh_h16_sat_hl:
800 case A2_subh_h16_sat_hl:
801 case M2_mpy_acc_hl_s0:
802 case M2_mpy_acc_hl_s1:
803 case M2_mpy_acc_sat_hl_s0:
804 case M2_mpy_acc_sat_hl_s1:
807 case M2_mpy_nac_hl_s0:
808 case M2_mpy_nac_hl_s1:
809 case M2_mpy_nac_sat_hl_s0:
810 case M2_mpy_nac_sat_hl_s1:
811 case M2_mpy_rnd_hl_s0:
812 case M2_mpy_rnd_hl_s1:
813 case M2_mpy_sat_hl_s0:
814 case M2_mpy_sat_hl_s1:
815 case M2_mpy_sat_rnd_hl_s0:
816 case M2_mpy_sat_rnd_hl_s1:
817 case M2_mpyd_acc_hl_s0:
818 case M2_mpyd_acc_hl_s1:
821 case M2_mpyd_nac_hl_s0:
822 case M2_mpyd_nac_hl_s1:
823 case M2_mpyd_rnd_hl_s0:
824 case M2_mpyd_rnd_hl_s1:
825 case M2_mpyu_acc_hl_s0:
826 case M2_mpyu_acc_hl_s1:
829 case M2_mpyu_nac_hl_s0:
830 case M2_mpyu_nac_hl_s1:
831 case M2_mpyud_acc_hl_s0:
832 case M2_mpyud_acc_hl_s1:
835 case M2_mpyud_nac_hl_s0:
836 case M2_mpyud_nac_hl_s1:
838 Bits.set(Begin+16, Begin+32);
842 Bits.set(Begin, Begin+16);
849 case A2_addh_h16_sat_hh:
852 case A2_subh_h16_sat_hh:
853 case M2_mpy_acc_hh_s0:
854 case M2_mpy_acc_hh_s1:
855 case M2_mpy_acc_sat_hh_s0:
856 case M2_mpy_acc_sat_hh_s1:
859 case M2_mpy_nac_hh_s0:
860 case M2_mpy_nac_hh_s1:
861 case M2_mpy_nac_sat_hh_s0:
862 case M2_mpy_nac_sat_hh_s1:
863 case M2_mpy_rnd_hh_s0:
864 case M2_mpy_rnd_hh_s1:
865 case M2_mpy_sat_hh_s0:
866 case M2_mpy_sat_hh_s1:
867 case M2_mpy_sat_rnd_hh_s0:
868 case M2_mpy_sat_rnd_hh_s1:
869 case M2_mpyd_acc_hh_s0:
870 case M2_mpyd_acc_hh_s1:
873 case M2_mpyd_nac_hh_s0:
874 case M2_mpyd_nac_hh_s1:
875 case M2_mpyd_rnd_hh_s0:
876 case M2_mpyd_rnd_hh_s1:
877 case M2_mpyu_acc_hh_s0:
878 case M2_mpyu_acc_hh_s1:
881 case M2_mpyu_nac_hh_s0:
882 case M2_mpyu_nac_hh_s1:
883 case M2_mpyud_acc_hh_s0:
884 case M2_mpyud_acc_hh_s1:
887 case M2_mpyud_nac_hh_s0:
888 case M2_mpyud_nac_hh_s1:
889 if (OpN == 1 || OpN == 2) {
890 Bits.set(Begin+16, Begin+32);
902const TargetRegisterClass *HexagonBitSimplify::getFinalVRegClass(
903 const BitTracker::RegisterRef &RR, MachineRegisterInfo &
MRI) {
906 auto *RC =
MRI.getRegClass(RR.
Reg);
909 auto &HRI =
static_cast<const HexagonRegisterInfo&
>(
910 *
MRI.getTargetRegisterInfo());
912 auto VerifySR = [&HRI] (
const TargetRegisterClass *RC,
unsigned Sub) ->
void {
918 switch (RC->
getID()) {
919 case Hexagon::DoubleRegsRegClassID:
920 VerifySR(RC, RR.
Sub);
921 return &Hexagon::IntRegsRegClass;
922 case Hexagon::HvxWRRegClassID:
923 VerifySR(RC, RR.
Sub);
924 return &Hexagon::HvxVRRegClass;
933bool HexagonBitSimplify::isTransparentCopy(
const BitTracker::RegisterRef &RD,
934 const BitTracker::RegisterRef &RS, MachineRegisterInfo &
MRI) {
938 auto *DRC = getFinalVRegClass(RD,
MRI);
942 return DRC == getFinalVRegClass(RS,
MRI);
945bool HexagonBitSimplify::hasTiedUse(
unsigned Reg, MachineRegisterInfo &
MRI,
950 [NewSub] (
const MachineOperand &
Op) ->
bool {
951 return Op.getSubReg() != NewSub && Op.isTied();
957 class DeadCodeElimination {
959 DeadCodeElimination(MachineFunction &mf, MachineDominatorTree &mdt)
960 : MF(mf), HII(*MF.getSubtarget<HexagonSubtarget>().getInstrInfo()),
961 MDT(mdt),
MRI(mf.getRegInfo()) {}
968 bool isDead(
unsigned R)
const;
972 const HexagonInstrInfo &HII;
973 MachineDominatorTree &MDT;
974 MachineRegisterInfo &
MRI;
979bool DeadCodeElimination::isDead(
unsigned R)
const {
980 for (
const MachineOperand &MO :
MRI.use_operands(R)) {
981 const MachineInstr *UseI = MO.getParent();
1001 MachineBasicBlock *
B =
N->getBlock();
1002 std::vector<MachineInstr*> Instrs;
1004 Instrs.push_back(&
MI);
1006 for (
auto *
MI : Instrs) {
1007 unsigned Opc =
MI->getOpcode();
1010 if (
Opc == TargetOpcode::LIFETIME_START ||
1011 Opc == TargetOpcode::LIFETIME_END)
1014 if (
MI->isInlineAsm())
1017 if (!
MI->isPHI() && !
MI->isSafeToMove(Store))
1020 bool AllDead =
true;
1021 SmallVector<unsigned,2> Regs;
1022 for (
auto &
Op :
MI->operands()) {
1023 if (!
Op.isReg() || !
Op.isDef())
1026 if (!
R.isVirtual() || !
isDead(R)) {
1036 for (
unsigned Reg : Regs)
1037 MRI.markUsesInDebugValueAsUndef(
Reg);
1056 class RedundantInstrElimination :
public Transformation {
1058 RedundantInstrElimination(BitTracker &bt,
const HexagonInstrInfo &hii,
1059 const HexagonRegisterInfo &hri, MachineRegisterInfo &mri)
1060 : Transformation(
true), HII(hii), HRI(hri),
MRI(mri),
BT(bt) {}
1062 bool processBlock(MachineBasicBlock &
B,
const RegisterSet &AVs)
override;
1065 bool isLossyShiftLeft(
const MachineInstr &
MI,
unsigned OpN,
1066 unsigned &LostB,
unsigned &LostE);
1067 bool isLossyShiftRight(
const MachineInstr &
MI,
unsigned OpN,
1068 unsigned &LostB,
unsigned &LostE);
1069 bool computeUsedBits(
unsigned Reg, BitVector &Bits);
1070 bool computeUsedBits(
const MachineInstr &
MI,
unsigned OpN, BitVector &Bits,
1072 bool usedBitsEqual(BitTracker::RegisterRef RD, BitTracker::RegisterRef RS);
1074 const HexagonInstrInfo &HII;
1075 const HexagonRegisterInfo &HRI;
1076 MachineRegisterInfo &
MRI;
1085bool RedundantInstrElimination::isLossyShiftLeft(
const MachineInstr &
MI,
1086 unsigned OpN,
unsigned &LostB,
unsigned &LostE) {
1087 using namespace Hexagon;
1089 unsigned Opc =
MI.getOpcode();
1090 unsigned ImN, RegN, Width;
1097 case S2_asl_i_p_acc:
1098 case S2_asl_i_p_and:
1099 case S2_asl_i_p_nac:
1101 case S2_asl_i_p_xacc:
1111 case S2_addasl_rrri:
1112 case S4_andi_asl_ri:
1114 case S4_addi_asl_ri:
1115 case S4_subi_asl_ri:
1116 case S2_asl_i_r_acc:
1117 case S2_asl_i_r_and:
1118 case S2_asl_i_r_nac:
1120 case S2_asl_i_r_sat:
1121 case S2_asl_i_r_xacc:
1133 assert(
MI.getOperand(ImN).isImm());
1134 unsigned S =
MI.getOperand(ImN).getImm();
1145bool RedundantInstrElimination::isLossyShiftRight(
const MachineInstr &
MI,
1146 unsigned OpN,
unsigned &LostB,
unsigned &LostE) {
1147 using namespace Hexagon;
1149 unsigned Opc =
MI.getOpcode();
1157 case S2_asr_i_p_acc:
1158 case S2_asr_i_p_and:
1159 case S2_asr_i_p_nac:
1161 case S2_lsr_i_p_acc:
1162 case S2_lsr_i_p_and:
1163 case S2_lsr_i_p_nac:
1165 case S2_lsr_i_p_xacc:
1174 case S4_andi_lsr_ri:
1176 case S4_addi_lsr_ri:
1177 case S4_subi_lsr_ri:
1178 case S2_asr_i_r_acc:
1179 case S2_asr_i_r_and:
1180 case S2_asr_i_r_nac:
1182 case S2_lsr_i_r_acc:
1183 case S2_lsr_i_r_and:
1184 case S2_lsr_i_r_nac:
1186 case S2_lsr_i_r_xacc:
1198 assert(
MI.getOperand(ImN).isImm());
1199 unsigned S =
MI.getOperand(ImN).getImm();
1209bool RedundantInstrElimination::computeUsedBits(
unsigned Reg, BitVector &Bits) {
1212 std::vector<unsigned> Pending;
1213 Pending.push_back(
Reg);
1215 for (
unsigned i = 0; i < Pending.size(); ++i) {
1216 unsigned R = Pending[i];
1220 for (
auto I =
MRI.use_begin(R),
E =
MRI.use_end();
I !=
E; ++
I) {
1221 BitTracker::RegisterRef UR = *
I;
1223 if (!HBS::getSubregMask(UR,
B, W,
MRI))
1230 Pending.push_back(DefR);
1232 if (!computeUsedBits(UseI,
I.getOperandNo(), Used,
B))
1255bool RedundantInstrElimination::computeUsedBits(
const MachineInstr &
MI,
1256 unsigned OpN, BitVector &Bits, uint16_t Begin) {
1257 unsigned Opc =
MI.getOpcode();
1258 BitVector
T(
Bits.size());
1259 bool GotBits = HBS::getUsedBits(
Opc, OpN,
T, Begin, HII);
1264 if (isLossyShiftLeft(
MI, OpN, LB, LE) || isLossyShiftRight(
MI, OpN, LB, LE)) {
1265 assert(
MI.getOperand(OpN).isReg());
1266 BitTracker::RegisterRef RR =
MI.getOperand(OpN);
1267 const TargetRegisterClass *RC = HBS::getFinalVRegClass(RR,
MRI);
1268 uint16_t Width = HRI.getRegSizeInBits(*RC);
1271 T.set(Begin, Begin+Width);
1272 assert(LB <= LE && LB < Width && LE <= Width);
1273 T.reset(Begin+LB, Begin+LE);
1283bool RedundantInstrElimination::usedBitsEqual(BitTracker::RegisterRef RD,
1284 BitTracker::RegisterRef RS) {
1285 const BitTracker::RegisterCell &DC =
BT.
lookup(RD.
Reg);
1286 const BitTracker::RegisterCell &SC =
BT.
lookup(
RS.Reg);
1289 if (!HBS::getSubregMask(RD, DB, DW,
MRI))
1292 if (!HBS::getSubregMask(RS, SB, SW,
MRI))
1298 if (!computeUsedBits(RD.
Reg, Used))
1301 for (
unsigned i = 0; i != DW; ++i)
1302 if (Used[i+DB] && DC[DB+i] != SC[SB+i])
1307bool RedundantInstrElimination::processBlock(MachineBasicBlock &
B,
1313 for (
auto I =
B.begin(),
E =
B.end();
I !=
E; ++
I) {
1314 MachineInstr *
MI = &*
I;
1316 if (
MI->getOpcode() == TargetOpcode::COPY)
1318 if (
MI->isPHI() ||
MI->hasUnmodeledSideEffects() ||
MI->isInlineAsm())
1320 unsigned NumD =
MI->getDesc().getNumDefs();
1324 BitTracker::RegisterRef RD =
MI->getOperand(0);
1327 const BitTracker::RegisterCell &DC =
BT.
lookup(RD.
Reg);
1331 for (
auto &
Op :
MI->uses()) {
1334 BitTracker::RegisterRef
RS =
Op;
1337 if (!HBS::isTransparentCopy(RD, RS,
MRI))
1341 if (!HBS::getSubregMask(RS, BN, BW,
MRI))
1344 const BitTracker::RegisterCell &SC =
BT.
lookup(
RS.Reg);
1345 if (!usedBitsEqual(RD, RS) && !HBS::isEqual(DC, 0, SC, BN, BW))
1350 const TargetRegisterClass *FRC = HBS::getFinalVRegClass(RD,
MRI);
1352 MachineInstr *CopyI =
1353 BuildMI(
B, At,
DL, HII.get(TargetOpcode::COPY), NewR)
1355 HBS::replaceSubWithSub(RD.
Reg, RD.
Sub, NewR, 0,
MRI);
1378 class ConstGeneration :
public Transformation {
1380 ConstGeneration(BitTracker &bt,
const HexagonInstrInfo &hii,
1381 MachineRegisterInfo &mri)
1382 : Transformation(
true), HII(hii),
MRI(mri),
BT(bt) {}
1384 bool processBlock(MachineBasicBlock &
B,
const RegisterSet &AVs)
override;
1385 static bool isTfrConst(
const MachineInstr &
MI);
1388 Register genTfrConst(
const TargetRegisterClass *RC, int64_t
C,
1392 const HexagonInstrInfo &HII;
1393 MachineRegisterInfo &
MRI;
1399bool ConstGeneration::isTfrConst(
const MachineInstr &
MI) {
1400 unsigned Opc =
MI.getOpcode();
1402 case Hexagon::A2_combineii:
1403 case Hexagon::A4_combineii:
1404 case Hexagon::A2_tfrsi:
1405 case Hexagon::A2_tfrpi:
1406 case Hexagon::PS_true:
1407 case Hexagon::PS_false:
1408 case Hexagon::CONST32:
1409 case Hexagon::CONST64:
1417Register ConstGeneration::genTfrConst(
const TargetRegisterClass *RC, int64_t
C,
1418 MachineBasicBlock &
B,
1422 if (RC == &Hexagon::IntRegsRegClass) {
1428 if (RC == &Hexagon::DoubleRegsRegClass) {
1438 : Hexagon::A4_combineii;
1444 MachineFunction *MF =
B.getParent();
1448 if (!HST.isTinyCore() ||
1456 if (RC == &Hexagon::PredRegsRegClass) {
1459 Opc = Hexagon::PS_false;
1460 else if ((
C & 0xFF) == 0xFF)
1461 Opc = Hexagon::PS_true;
1471bool ConstGeneration::processBlock(MachineBasicBlock &
B,
const RegisterSet&) {
1477 for (
auto I =
B.begin(),
E =
B.end();
I !=
E; ++
I) {
1481 HBS::getInstrDefs(*
I, Defs);
1482 if (Defs.count() != 1)
1488 const BitTracker::RegisterCell &DRC =
BT.
lookup(DR);
1489 if (HBS::getConst(DRC, 0, DRC.
width(), U)) {
1492 auto At =
I->isPHI() ?
B.getFirstNonPHI() :
I;
1495 HBS::replaceReg(DR, ImmReg,
MRI);
1496 BT.
put(ImmReg, DRC);
1509 class CopyGeneration :
public Transformation {
1511 CopyGeneration(BitTracker &bt,
const HexagonInstrInfo &hii,
1512 const HexagonRegisterInfo &hri, MachineRegisterInfo &mri)
1513 : Transformation(
true), HII(hii), HRI(hri),
MRI(mri),
BT(bt) {}
1515 bool processBlock(MachineBasicBlock &
B,
const RegisterSet &AVs)
override;
1518 bool findMatch(
const BitTracker::RegisterRef &Inp,
1519 BitTracker::RegisterRef &Out,
const RegisterSet &AVs);
1521 const HexagonInstrInfo &HII;
1522 const HexagonRegisterInfo &HRI;
1523 MachineRegisterInfo &
MRI;
1530 class CopyPropagation :
public Transformation {
1532 CopyPropagation(
const HexagonRegisterInfo &hri, MachineRegisterInfo &mri)
1533 : Transformation(
false), HRI(hri),
MRI(mri) {}
1535 bool processBlock(MachineBasicBlock &
B,
const RegisterSet &AVs)
override;
1537 static bool isCopyReg(
unsigned Opc,
bool NoConv);
1540 bool propagateRegCopy(MachineInstr &
MI);
1542 const HexagonRegisterInfo &HRI;
1543 MachineRegisterInfo &
MRI;
1550bool CopyGeneration::findMatch(
const BitTracker::RegisterRef &Inp,
1551 BitTracker::RegisterRef &Out,
const RegisterSet &AVs) {
1554 const BitTracker::RegisterCell &InpRC =
BT.
lookup(Inp.
Reg);
1555 auto *FRC = HBS::getFinalVRegClass(Inp,
MRI);
1557 if (!HBS::getSubregMask(Inp,
B, W,
MRI))
1560 for (
Register R = AVs.find_first(); R; R = AVs.find_next(R)) {
1561 if (!
BT.
has(R) || Forbidden[R])
1563 const BitTracker::RegisterCell &RC =
BT.
lookup(R);
1564 unsigned RW = RC.
width();
1566 if (FRC !=
MRI.getRegClass(R))
1568 if (!HBS::isTransparentCopy(R, Inp,
MRI))
1570 if (!HBS::isEqual(InpRC,
B, RC, 0, W))
1581 if (
MRI.getRegClass(R) != &Hexagon::DoubleRegsRegClass)
1584 if (HBS::isEqual(InpRC,
B, RC, 0, W))
1585 Out.
Sub = Hexagon::isub_lo;
1586 else if (HBS::isEqual(InpRC,
B, RC, W, W))
1587 Out.
Sub = Hexagon::isub_hi;
1591 if (HBS::isTransparentCopy(Out, Inp,
MRI))
1597bool CopyGeneration::processBlock(MachineBasicBlock &
B,
1605 for (
auto I =
B.begin(),
E =
B.end();
I !=
E; ++
I, AVB.insert(Defs)) {
1607 HBS::getInstrDefs(*
I, Defs);
1609 unsigned Opc =
I->getOpcode();
1610 if (CopyPropagation::isCopyReg(
Opc,
false) ||
1611 ConstGeneration::isTfrConst(*
I))
1615 auto At =
I->isPHI() ?
B.getFirstNonPHI() :
I;
1617 for (
Register R = Defs.find_first(); R; R = Defs.find_next(R)) {
1618 BitTracker::RegisterRef MR;
1619 auto *FRC = HBS::getFinalVRegClass(R,
MRI);
1621 if (findMatch(R, MR, AVB)) {
1623 BuildMI(
B, At,
DL, HII.get(TargetOpcode::COPY), NewR)
1625 BT.
put(BitTracker::RegisterRef(NewR),
BT.
get(MR));
1626 HBS::replaceReg(R, NewR,
MRI);
1627 Forbidden.insert(R);
1631 if (FRC == &Hexagon::DoubleRegsRegClass ||
1632 FRC == &Hexagon::HvxWRRegClass) {
1636 BitTracker::RegisterRef TL = {
R, SubLo };
1637 BitTracker::RegisterRef
TH = {
R, SubHi };
1638 BitTracker::RegisterRef
ML, MH;
1639 if (findMatch(TL,
ML, AVB) && findMatch(TH, MH, AVB)) {
1640 auto *FRC = HBS::getFinalVRegClass(R,
MRI);
1642 BuildMI(
B, At,
DL, HII.get(TargetOpcode::REG_SEQUENCE), NewR)
1647 BT.
put(BitTracker::RegisterRef(NewR),
BT.
get(R));
1648 HBS::replaceReg(R, NewR,
MRI);
1649 Forbidden.insert(R);
1658bool CopyPropagation::isCopyReg(
unsigned Opc,
bool NoConv) {
1660 case TargetOpcode::COPY:
1661 case TargetOpcode::REG_SEQUENCE:
1662 case Hexagon::A4_combineir:
1663 case Hexagon::A4_combineri:
1665 case Hexagon::A2_tfr:
1666 case Hexagon::A2_tfrp:
1667 case Hexagon::A2_combinew:
1668 case Hexagon::V6_vcombine:
1676bool CopyPropagation::propagateRegCopy(MachineInstr &
MI) {
1678 unsigned Opc =
MI.getOpcode();
1679 BitTracker::RegisterRef RD =
MI.getOperand(0);
1680 assert(
MI.getOperand(0).getSubReg() == 0);
1683 case TargetOpcode::COPY:
1684 case Hexagon::A2_tfr:
1685 case Hexagon::A2_tfrp: {
1686 BitTracker::RegisterRef
RS =
MI.getOperand(1);
1687 if (!HBS::isTransparentCopy(RD, RS,
MRI))
1695 case TargetOpcode::REG_SEQUENCE: {
1696 BitTracker::RegisterRef SL, SH;
1697 if (HBS::parseRegSequence(
MI, SL, SH,
MRI)) {
1698 const TargetRegisterClass &RC = *
MRI.getRegClass(RD.
Reg);
1706 case Hexagon::A2_combinew:
1707 case Hexagon::V6_vcombine: {
1708 const TargetRegisterClass &RC = *
MRI.getRegClass(RD.
Reg);
1711 BitTracker::RegisterRef RH =
MI.getOperand(1), RL =
MI.getOperand(2);
1712 Changed = HBS::replaceSubWithSub(RD.
Reg, SubLo, RL.Reg, RL.Sub,
MRI);
1716 case Hexagon::A4_combineir:
1717 case Hexagon::A4_combineri: {
1718 unsigned SrcX = (
Opc == Hexagon::A4_combineir) ? 2 : 1;
1719 unsigned Sub = (
Opc == Hexagon::A4_combineir) ? Hexagon::isub_lo
1721 BitTracker::RegisterRef
RS =
MI.getOperand(SrcX);
1729bool CopyPropagation::processBlock(MachineBasicBlock &
B,
const RegisterSet&) {
1730 std::vector<MachineInstr*> Instrs;
1732 Instrs.push_back(&
MI);
1735 for (
auto *
I : Instrs) {
1736 unsigned Opc =
I->getOpcode();
1737 if (!CopyPropagation::isCopyReg(
Opc,
true))
1750 class BitSimplification :
public Transformation {
1752 BitSimplification(BitTracker &bt,
const MachineDominatorTree &mdt,
1753 const HexagonInstrInfo &hii,
1754 const HexagonRegisterInfo &hri, MachineRegisterInfo &mri,
1755 MachineFunction &mf)
1756 : Transformation(
true), MDT(mdt), HII(hii), HRI(hri),
MRI(mri),
BT(bt) {
1759 bool processBlock(MachineBasicBlock &
B,
const RegisterSet &AVs)
override;
1762 struct RegHalf :
public BitTracker::RegisterRef {
1766 bool matchHalf(
unsigned SelfR,
const BitTracker::RegisterCell &RC,
1767 unsigned B, RegHalf &RH);
1768 bool validateReg(BitTracker::RegisterRef R,
unsigned Opc,
unsigned OpNum);
1770 bool matchPackhl(
unsigned SelfR,
const BitTracker::RegisterCell &RC,
1771 BitTracker::RegisterRef &Rs, BitTracker::RegisterRef &Rt);
1772 unsigned getCombineOpcode(
bool HLow,
bool LLow);
1774 bool genStoreUpperHalf(MachineInstr *
MI);
1775 bool genStoreImmediate(MachineInstr *
MI);
1776 bool genPackhl(MachineInstr *
MI, BitTracker::RegisterRef RD,
1777 const BitTracker::RegisterCell &RC);
1778 bool genExtractHalf(MachineInstr *
MI, BitTracker::RegisterRef RD,
1779 const BitTracker::RegisterCell &RC);
1780 bool genCombineHalf(MachineInstr *
MI, BitTracker::RegisterRef RD,
1781 const BitTracker::RegisterCell &RC);
1782 bool genExtractLow(MachineInstr *
MI, BitTracker::RegisterRef RD,
1783 const BitTracker::RegisterCell &RC);
1784 bool genBitSplit(MachineInstr *
MI, BitTracker::RegisterRef RD,
1785 const BitTracker::RegisterCell &RC,
const RegisterSet &AVs);
1786 bool simplifyTstbit(MachineInstr *
MI, BitTracker::RegisterRef RD,
1787 const BitTracker::RegisterCell &RC);
1788 bool simplifyExtractLow(MachineInstr *
MI, BitTracker::RegisterRef RD,
1789 const BitTracker::RegisterCell &RC,
const RegisterSet &AVs);
1790 bool simplifyRCmp0(MachineInstr *
MI, BitTracker::RegisterRef RD);
1794 std::vector<MachineInstr*> NewMIs;
1796 const MachineDominatorTree &MDT;
1797 const HexagonInstrInfo &HII;
1798 [[maybe_unused]]
const HexagonRegisterInfo &HRI;
1799 MachineRegisterInfo &
MRI;
1808bool BitSimplification::matchHalf(
unsigned SelfR,
1809 const BitTracker::RegisterCell &RC,
unsigned B, RegHalf &RH) {
1819 while (
I <
B+16 && RC[
I].num())
1825 unsigned P = RC[
I].RefI.Pos;
1828 unsigned Pos =
P - (
I-
B);
1830 if (
Reg == 0 ||
Reg == SelfR)
1837 const BitTracker::RegisterCell &SC =
BT.
lookup(
Reg);
1838 if (Pos+16 > SC.
width())
1841 for (
unsigned i = 0; i < 16; ++i) {
1842 const BitTracker::BitValue &RV = RC[i+
B];
1850 if (RC[i+
B] != SC[i+Pos])
1857 Sub = Hexagon::isub_lo;
1861 Sub = Hexagon::isub_lo;
1865 Sub = Hexagon::isub_hi;
1869 Sub = Hexagon::isub_hi;
1880 if (!HBS::getFinalVRegClass(RH,
MRI))
1886bool BitSimplification::validateReg(BitTracker::RegisterRef R,
unsigned Opc,
1888 auto *OpRC = HII.getRegClass(HII.get(
Opc), OpNum);
1889 auto *RRC = HBS::getFinalVRegClass(R,
MRI);
1890 return OpRC->hasSubClassEq(RRC);
1895bool BitSimplification::matchPackhl(
unsigned SelfR,
1896 const BitTracker::RegisterCell &RC, BitTracker::RegisterRef &Rs,
1897 BitTracker::RegisterRef &Rt) {
1898 RegHalf L1, H1, L2, H2;
1900 if (!matchHalf(SelfR, RC, 0, L2) || !matchHalf(SelfR, RC, 16, L1))
1902 if (!matchHalf(SelfR, RC, 32, H2) || !matchHalf(SelfR, RC, 48, H1))
1906 if (H1.Reg != L1.Reg || H1.Sub != L1.Sub || H1.Low || !L1.Low)
1908 if (H2.Reg != L2.Reg || H2.Sub != L2.Sub || H2.Low || !L2.Low)
1916unsigned BitSimplification::getCombineOpcode(
bool HLow,
bool LLow) {
1917 return HLow ? LLow ? Hexagon::A2_combine_ll
1918 : Hexagon::A2_combine_lh
1919 : LLow ? Hexagon::A2_combine_hl
1920 : Hexagon::A2_combine_hh;
1926bool BitSimplification::genStoreUpperHalf(MachineInstr *
MI) {
1927 unsigned Opc =
MI->getOpcode();
1928 if (
Opc != Hexagon::S2_storerh_io)
1931 MachineOperand &ValOp =
MI->getOperand(2);
1932 BitTracker::RegisterRef
RS = ValOp;
1935 const BitTracker::RegisterCell &RC =
BT.
lookup(
RS.Reg);
1937 unsigned B = (
RS.Sub == Hexagon::isub_hi) ? 32 : 0;
1938 if (!matchHalf(0, RC,
B,
H))
1942 MI->setDesc(HII.get(Hexagon::S2_storerf_io));
1950bool BitSimplification::genStoreImmediate(MachineInstr *
MI) {
1951 unsigned Opc =
MI->getOpcode();
1954 case Hexagon::S2_storeri_io:
1957 case Hexagon::S2_storerh_io:
1960 case Hexagon::S2_storerb_io:
1967 if (!
MI->getOperand(0).isReg())
1969 MachineOperand &OffOp =
MI->getOperand(1);
1975 if (!
isUIntN(6+Align, Off) || (Off & ((1<<Align)-1)))
1978 BitTracker::RegisterRef
RS =
MI->getOperand(2);
1981 const BitTracker::RegisterCell &RC =
BT.
lookup(
RS.Reg);
1983 if (!HBS::getConst(RC, 0, RC.
width(), U))
1989 case Hexagon::S2_storerb_io:
1992 case Hexagon::S2_storerh_io:
1995 case Hexagon::S2_storeri_io:
2006 MI->removeOperand(2);
2008 case Hexagon::S2_storerb_io:
2009 MI->setDesc(HII.get(Hexagon::S4_storeirb_io));
2011 case Hexagon::S2_storerh_io:
2012 MI->setDesc(HII.get(Hexagon::S4_storeirh_io));
2014 case Hexagon::S2_storeri_io:
2015 MI->setDesc(HII.get(Hexagon::S4_storeiri_io));
2026bool BitSimplification::genPackhl(MachineInstr *
MI,
2027 BitTracker::RegisterRef RD,
const BitTracker::RegisterCell &RC) {
2028 unsigned Opc =
MI->getOpcode();
2029 if (
Opc == Hexagon::S2_packhl)
2031 BitTracker::RegisterRef Rs, Rt;
2032 if (!matchPackhl(RD.
Reg, RC, Rs, Rt))
2034 if (!validateReg(Rs, Hexagon::S2_packhl, 1) ||
2035 !validateReg(Rt, Hexagon::S2_packhl, 2))
2038 MachineBasicBlock &
B = *
MI->getParent();
2039 Register NewR =
MRI.createVirtualRegister(&Hexagon::DoubleRegsRegClass);
2041 auto At =
MI->isPHI() ?
B.getFirstNonPHI()
2043 BuildMI(
B, At,
DL, HII.get(Hexagon::S2_packhl), NewR)
2046 HBS::replaceSubWithSub(RD.
Reg, RD.
Sub, NewR, 0,
MRI);
2047 BT.
put(BitTracker::RegisterRef(NewR), RC);
2053bool BitSimplification::genExtractHalf(MachineInstr *
MI,
2054 BitTracker::RegisterRef RD,
const BitTracker::RegisterCell &RC) {
2057 if (!matchHalf(RD.
Reg, RC, 0, L) || !HBS::isZero(RC, 16, 16))
2060 unsigned Opc =
MI->getOpcode();
2061 MachineBasicBlock &
B = *
MI->getParent();
2067 auto At =
MI->isPHI() ?
B.getFirstNonPHI()
2069 if (
L.Low &&
Opc != Hexagon::A2_zxth) {
2070 if (validateReg(L, Hexagon::A2_zxth, 1)) {
2071 NewR =
MRI.createVirtualRegister(&Hexagon::IntRegsRegClass);
2072 BuildMI(
B, At,
DL, HII.get(Hexagon::A2_zxth), NewR)
2075 }
else if (!
L.Low &&
Opc != Hexagon::S2_lsr_i_r) {
2076 if (validateReg(L, Hexagon::S2_lsr_i_r, 1)) {
2077 NewR =
MRI.createVirtualRegister(&Hexagon::IntRegsRegClass);
2085 HBS::replaceSubWithSub(RD.
Reg, RD.
Sub, NewR, 0,
MRI);
2086 BT.
put(BitTracker::RegisterRef(NewR), RC);
2092bool BitSimplification::genCombineHalf(MachineInstr *
MI,
2093 BitTracker::RegisterRef RD,
const BitTracker::RegisterCell &RC) {
2096 if (!matchHalf(RD.
Reg, RC, 0, L) || !matchHalf(RD.
Reg, RC, 16,
H))
2099 if (
L.Reg ==
H.Reg &&
L.Sub ==
H.Sub && !
H.Low &&
L.Low)
2102 unsigned Opc =
MI->getOpcode();
2103 unsigned COpc = getCombineOpcode(
H.Low,
L.Low);
2106 if (!validateReg(
H, COpc, 1) || !validateReg(L, COpc, 2))
2109 MachineBasicBlock &
B = *
MI->getParent();
2111 Register NewR =
MRI.createVirtualRegister(&Hexagon::IntRegsRegClass);
2112 auto At =
MI->isPHI() ?
B.getFirstNonPHI()
2117 HBS::replaceSubWithSub(RD.
Reg, RD.
Sub, NewR, 0,
MRI);
2118 BT.
put(BitTracker::RegisterRef(NewR), RC);
2124bool BitSimplification::genExtractLow(MachineInstr *
MI,
2125 BitTracker::RegisterRef RD,
const BitTracker::RegisterCell &RC) {
2126 unsigned Opc =
MI->getOpcode();
2128 case Hexagon::A2_zxtb:
2129 case Hexagon::A2_zxth:
2130 case Hexagon::S2_extractu:
2133 if (
Opc == Hexagon::A2_andir &&
MI->getOperand(2).isImm()) {
2134 int32_t
Imm =
MI->getOperand(2).getImm();
2139 if (
MI->hasUnmodeledSideEffects() ||
MI->isInlineAsm())
2142 while (W > 0 && RC[W-1].is(0))
2144 if (W == 0 || W == RC.
width())
2146 unsigned NewOpc = (
W == 8) ? Hexagon::A2_zxtb
2147 : (
W == 16) ? Hexagon::A2_zxth
2148 : (
W < 10) ? Hexagon::A2_andir
2149 : Hexagon::S2_extractu;
2150 MachineBasicBlock &
B = *
MI->getParent();
2153 for (
auto &
Op :
MI->uses()) {
2156 BitTracker::RegisterRef RS = Op;
2157 if (!BT.has(RS.Reg))
2159 const BitTracker::RegisterCell &SC = BT.lookup(RS.Reg);
2161 if (!HBS::getSubregMask(RS, BN, BW, MRI))
2163 if (BW < W || !HBS::isEqual(RC, 0, SC, BN, W))
2165 if (!validateReg(RS, NewOpc, 1))
2168 Register NewR = MRI.createVirtualRegister(&Hexagon::IntRegsRegClass);
2169 auto At = MI->isPHI() ? B.getFirstNonPHI()
2170 : MachineBasicBlock::iterator(MI);
2171 auto MIB = BuildMI(B, At, DL, HII.get(NewOpc), NewR)
2172 .addReg(RS.Reg, 0, RS.Sub);
2173 if (NewOpc == Hexagon::A2_andir)
2174 MIB.addImm((1 << W) - 1);
2175 else if (NewOpc == Hexagon::S2_extractu)
2176 MIB.addImm(W).addImm(0);
2177 HBS::replaceSubWithSub(RD.Reg, RD.Sub, NewR, 0, MRI);
2178 BT.put(BitTracker::RegisterRef(NewR), RC);
2184bool BitSimplification::genBitSplit(MachineInstr *
MI,
2185 BitTracker::RegisterRef RD,
const BitTracker::RegisterCell &RC,
2194 unsigned Opc =
MI->getOpcode();
2196 case Hexagon::A4_bitsplit:
2197 case Hexagon::A4_bitspliti:
2205 auto ctlz = [] (
const BitTracker::RegisterCell &
C) ->
unsigned {
2206 unsigned Z =
C.width();
2207 while (Z > 0 &&
C[Z-1].is(0))
2209 return C.width() -
Z;
2213 unsigned Z = ctlz(RC);
2214 if (Z == 0 || Z == W)
2219 const BitTracker::BitValue &B0 = RC[0];
2228 for (
unsigned i = 1; i <
W-
Z; ++i) {
2229 const BitTracker::BitValue &
V = RC[i];
2232 if (
V.RefI.Reg != SrcR ||
V.RefI.Pos != Pos+i)
2237 for (
unsigned S = AVs.find_first(); S; S = AVs.find_next(S)) {
2240 unsigned SRC =
MRI.getRegClass(S)->getID();
2241 if (SRC != Hexagon::IntRegsRegClassID &&
2242 SRC != Hexagon::DoubleRegsRegClassID)
2246 const BitTracker::RegisterCell &SC =
BT.
lookup(S);
2247 if (SC.
width() != W || ctlz(SC) != W-Z)
2250 const BitTracker::BitValue &S0 = SC[0];
2255 if (Pos <=
P && (Pos + W-Z) !=
P)
2257 if (
P < Pos && (
P + Z) != Pos)
2260 if (std::min(
P, Pos) != 0 && std::min(
P, Pos) != 32)
2264 for (
I = 1;
I <
Z; ++
I) {
2265 const BitTracker::BitValue &
V = SC[
I];
2268 if (
V.RefI.Reg != SrcR ||
V.RefI.Pos !=
P+
I)
2277 MachineInstr *DefS =
MRI.getVRegDef(S);
2281 auto At = DefS->
isPHI() ?
B.getFirstNonPHI()
2283 if (
MRI.getRegClass(SrcR)->getID() == Hexagon::DoubleRegsRegClassID)
2284 SrcSR = (std::min(Pos,
P) == 32) ? Hexagon::isub_hi : Hexagon::isub_lo;
2285 if (!validateReg({SrcR,SrcSR}, Hexagon::A4_bitspliti, 1))
2287 unsigned ImmOp = Pos <=
P ?
W-
Z :
Z;
2291 for (MachineInstr *In : NewMIs) {
2292 if (
In->getOpcode() != Hexagon::A4_bitspliti)
2294 MachineOperand &Op1 =
In->getOperand(1);
2297 if (
In->getOperand(2).getImm() != ImmOp)
2300 MachineOperand &Op0 =
In->getOperand(0);
2301 MachineInstr *DefI =
MRI.getVRegDef(Op0.
getReg());
2312 NewR =
MRI.createVirtualRegister(&Hexagon::DoubleRegsRegClass);
2313 auto NewBS =
BuildMI(
B, At,
DL, HII.get(Hexagon::A4_bitspliti), NewR)
2316 NewMIs.push_back(NewBS);
2319 HBS::replaceRegWithSub(RD.
Reg, NewR, Hexagon::isub_lo,
MRI);
2320 HBS::replaceRegWithSub(S, NewR, Hexagon::isub_hi,
MRI);
2322 HBS::replaceRegWithSub(S, NewR, Hexagon::isub_lo,
MRI);
2323 HBS::replaceRegWithSub(RD.
Reg, NewR, Hexagon::isub_hi,
MRI);
2337bool BitSimplification::simplifyTstbit(MachineInstr *
MI,
2338 BitTracker::RegisterRef RD,
const BitTracker::RegisterCell &RC) {
2339 unsigned Opc =
MI->getOpcode();
2340 if (
Opc != Hexagon::S2_tstbit_i)
2343 unsigned BN =
MI->getOperand(2).getImm();
2344 BitTracker::RegisterRef
RS =
MI->getOperand(1);
2347 if (!
BT.
has(
RS.Reg) || !HBS::getSubregMask(RS,
F, W,
MRI))
2349 MachineBasicBlock &
B = *
MI->getParent();
2350 auto At =
MI->isPHI() ?
B.getFirstNonPHI()
2353 const BitTracker::RegisterCell &SC =
BT.
lookup(
RS.Reg);
2354 const BitTracker::BitValue &
V = SC[
F+BN];
2356 const TargetRegisterClass *TC =
MRI.getRegClass(
V.RefI.Reg);
2360 unsigned P = std::numeric_limits<unsigned>::max();
2361 BitTracker::RegisterRef RR(
V.RefI.Reg, 0);
2362 if (TC == &Hexagon::DoubleRegsRegClass) {
2364 RR.
Sub = Hexagon::isub_lo;
2367 RR.
Sub = Hexagon::isub_hi;
2369 }
else if (TC == &Hexagon::IntRegsRegClass) {
2372 if (
P != std::numeric_limits<unsigned>::max()) {
2373 Register NewR =
MRI.createVirtualRegister(&Hexagon::PredRegsRegClass);
2374 BuildMI(
B, At,
DL, HII.get(Hexagon::S2_tstbit_i), NewR)
2377 HBS::replaceReg(RD.
Reg, NewR,
MRI);
2381 }
else if (
V.is(0) ||
V.is(1)) {
2382 Register NewR =
MRI.createVirtualRegister(&Hexagon::PredRegsRegClass);
2383 unsigned NewOpc =
V.is(0) ? Hexagon::PS_false : Hexagon::PS_true;
2385 HBS::replaceReg(RD.
Reg, NewR,
MRI);
2397bool BitSimplification::simplifyExtractLow(MachineInstr *
MI,
2398 BitTracker::RegisterRef RD,
const BitTracker::RegisterCell &RC,
2416 const TargetRegisterClass *FRC = HBS::getFinalVRegClass(RD,
MRI);
2417 if (FRC != &Hexagon::IntRegsRegClass && FRC != &Hexagon::DoubleRegsRegClass)
2431 const BitTracker::BitValue &TopV = RC[
W-1];
2437 for (
unsigned I = 0;
I !=
W; ++
I) {
2438 const BitTracker::BitValue &
V = RC[
I];
2446 if (TopV.
is(0) || TopV.
is(1)) {
2447 bool S = TopV.
is(1);
2448 for (--W;
W > 0 && RC[
W-1].is(S); --
W)
2460 for (--W;
W > 0 && RC[
W-1] == TopV; --
W)
2475 dbgs() <<
"Cell: " << RC <<
'\n';
2476 dbgs() <<
"Expected bitfield size: " <<
Len <<
" bits, "
2477 << (
Signed ?
"sign" :
"zero") <<
"-extended\n";
2482 for (
unsigned R = AVs.find_first(); R != 0; R = AVs.find_next(R)) {
2485 const BitTracker::RegisterCell &SC =
BT.
lookup(R);
2486 unsigned SW = SC.
width();
2492 if (SW < RW || (SW % RW) != 0)
2499 while (Off <= SW-Len) {
2500 unsigned OE = (
Off+
Len)/RW;
2511 if (HBS::isEqual(RC, 0, SC, Off, Len))
2520 unsigned ExtOpc = 0;
2523 ExtOpc =
Signed ? Hexagon::A2_sxtb : Hexagon::A2_zxtb;
2525 ExtOpc =
Signed ? Hexagon::A2_sxth : Hexagon::A2_zxth;
2526 else if (Len < 10 && !
Signed)
2527 ExtOpc = Hexagon::A2_andir;
2531 Signed ? (RW == 32 ? Hexagon::S4_extract : Hexagon::S4_extractp)
2532 : (RW == 32 ? Hexagon::S2_extractu : Hexagon::S2_extractup);
2536 if (RW != SW && RW*2 != SW)
2539 SR = (
Off/RW == 0) ? Hexagon::isub_lo : Hexagon::isub_hi;
2542 if (!validateReg({
R,SR}, ExtOpc, 1))
2546 if (
MI->getOpcode() == ExtOpc) {
2548 const MachineOperand &SrcOp =
MI->getOperand(1);
2554 MachineBasicBlock &
B = *
MI->getParent();
2556 auto At =
MI->isPHI() ?
B.getFirstNonPHI()
2558 auto MIB =
BuildMI(
B, At,
DL, HII.get(ExtOpc), NewR)
2561 case Hexagon::A2_sxtb:
2562 case Hexagon::A2_zxtb:
2563 case Hexagon::A2_sxth:
2564 case Hexagon::A2_zxth:
2566 case Hexagon::A2_andir:
2567 MIB.addImm((1u << Len) - 1);
2569 case Hexagon::S4_extract:
2570 case Hexagon::S2_extractu:
2571 case Hexagon::S4_extractp:
2572 case Hexagon::S2_extractup:
2580 HBS::replaceReg(RD.
Reg, NewR,
MRI);
2581 BT.
put(BitTracker::RegisterRef(NewR), RC);
2589bool BitSimplification::simplifyRCmp0(MachineInstr *
MI,
2590 BitTracker::RegisterRef RD) {
2591 unsigned Opc =
MI->getOpcode();
2592 if (
Opc != Hexagon::A4_rcmpeqi &&
Opc != Hexagon::A4_rcmpneqi)
2594 MachineOperand &CmpOp =
MI->getOperand(2);
2598 const TargetRegisterClass *FRC = HBS::getFinalVRegClass(RD,
MRI);
2599 if (FRC != &Hexagon::IntRegsRegClass && FRC != &Hexagon::DoubleRegsRegClass)
2603 MachineBasicBlock &
B = *
MI->getParent();
2605 auto At =
MI->isPHI() ?
B.getFirstNonPHI()
2608 bool KnownNZ =
false;
2610 BitTracker::RegisterRef SR =
MI->getOperand(1);
2613 const BitTracker::RegisterCell &SC =
BT.
lookup(SR.
Reg);
2615 if (!HBS::getSubregMask(SR,
F, W,
MRI))
2618 for (uint16_t
I =
F;
I !=
F+
W; ++
I) {
2619 const BitTracker::BitValue &
V = SC[
I];
2626 auto ReplaceWithConst = [&](
int C) {
2628 BuildMI(
B, At,
DL, HII.get(Hexagon::A2_tfrsi), NewR)
2630 HBS::replaceReg(RD.
Reg, NewR,
MRI);
2631 BitTracker::RegisterCell NewRC(W);
2632 for (uint16_t
I = 0;
I !=
W; ++
I) {
2633 NewRC[
I] = BitTracker::BitValue(
C & 1);
2634 C = unsigned(
C) >> 1;
2636 BT.
put(BitTracker::RegisterRef(NewR), NewRC);
2640 auto IsNonZero = [] (
const MachineOperand &
Op) {
2641 if (
Op.isGlobal() ||
Op.isBlockAddress())
2644 return Op.getImm() != 0;
2646 return !
Op.getCImm()->isZero();
2648 return !
Op.getFPImm()->isZero();
2652 auto IsZero = [] (
const MachineOperand &
Op) {
2653 if (
Op.isGlobal() ||
Op.isBlockAddress())
2656 return Op.getImm() == 0;
2658 return Op.getCImm()->isZero();
2660 return Op.getFPImm()->isZero();
2666 if (KnownZ || KnownNZ) {
2667 assert(KnownZ != KnownNZ &&
"Register cannot be both 0 and non-0");
2668 return ReplaceWithConst(KnownZ == (
Opc == Hexagon::A4_rcmpeqi));
2673 MachineInstr *InpDef =
MRI.getVRegDef(SR.
Reg);
2676 if (SR.
Sub == 0 && InpDef->
getOpcode() == Hexagon::C2_muxii) {
2677 MachineOperand &Src1 = InpDef->
getOperand(2);
2678 MachineOperand &Src2 = InpDef->
getOperand(3);
2680 bool KnownNZ1 = IsNonZero(Src1), KnownNZ2 = IsNonZero(Src2);
2681 if (KnownNZ1 && KnownNZ2)
2682 return ReplaceWithConst(
Opc == Hexagon::A4_rcmpneqi);
2684 bool KnownZ1 = IsZero(Src1), KnownZ2 = IsZero(Src2);
2685 if (KnownZ1 && KnownZ2)
2686 return ReplaceWithConst(
Opc == Hexagon::A4_rcmpeqi);
2691 if ((KnownZ1 || KnownNZ1) && (KnownZ2 || KnownNZ2)) {
2693 BuildMI(
B, At,
DL, HII.get(Hexagon::C2_muxii), NewR)
2695 .
addImm(KnownZ1 == (
Opc == Hexagon::A4_rcmpeqi))
2696 .
addImm(KnownZ2 == (
Opc == Hexagon::A4_rcmpeqi));
2697 HBS::replaceReg(RD.
Reg, NewR,
MRI);
2699 BitTracker::RegisterCell NewRC(W);
2702 BT.
put(BitTracker::RegisterRef(NewR), NewRC);
2710bool BitSimplification::processBlock(MachineBasicBlock &
B,
2718 for (
auto I =
B.begin(),
E =
B.end();
I !=
E; ++
I, AVB.insert(Defs)) {
2719 MachineInstr *
MI = &*
I;
2721 HBS::getInstrDefs(*
MI, Defs);
2723 unsigned Opc =
MI->getOpcode();
2724 if (
Opc == TargetOpcode::COPY ||
Opc == TargetOpcode::REG_SEQUENCE)
2727 if (
MI->mayStore()) {
2728 bool T = genStoreUpperHalf(
MI);
2729 T =
T || genStoreImmediate(
MI);
2734 if (Defs.count() != 1)
2736 const MachineOperand &Op0 =
MI->getOperand(0);
2739 BitTracker::RegisterRef RD = Op0;
2742 const TargetRegisterClass *FRC = HBS::getFinalVRegClass(RD,
MRI);
2743 const BitTracker::RegisterCell &RC =
BT.
lookup(RD.
Reg);
2745 if (FRC->
getID() == Hexagon::DoubleRegsRegClassID) {
2746 bool T = genPackhl(
MI, RD, RC);
2747 T =
T || simplifyExtractLow(
MI, RD, RC, AVB);
2752 if (FRC->
getID() == Hexagon::IntRegsRegClassID) {
2753 bool T = genBitSplit(
MI, RD, RC, AVB);
2754 T =
T || simplifyExtractLow(
MI, RD, RC, AVB);
2755 T =
T || genExtractHalf(
MI, RD, RC);
2756 T =
T || genCombineHalf(
MI, RD, RC);
2757 T =
T || genExtractLow(
MI, RD, RC);
2758 T =
T || simplifyRCmp0(
MI, RD);
2763 if (FRC->
getID() == Hexagon::PredRegsRegClassID) {
2764 bool T = simplifyTstbit(
MI, RD, RC);
2772bool HexagonBitSimplify::runOnMachineFunction(MachineFunction &MF) {
2778 auto &HII = *HST.getInstrInfo();
2780 MDT = &getAnalysis<MachineDominatorTreeWrapperPass>().getDomTree();
2784 Changed = DeadCodeElimination(MF, *MDT).run();
2786 const HexagonEvaluator HE(HRI,
MRI, HII, MF);
2787 BitTracker
BT(HE, MF);
2794 ConstGeneration ImmG(
BT, HII,
MRI);
2795 Changed |= visitBlock(Entry, ImmG, AIG);
2798 RedundantInstrElimination RIE(
BT, HII, HRI,
MRI);
2799 bool Ried = visitBlock(Entry, RIE, ARE);
2806 CopyGeneration CopyG(
BT, HII, HRI,
MRI);
2807 Changed |= visitBlock(Entry, CopyG, ACG);
2810 CopyPropagation CopyP(HRI,
MRI);
2811 Changed |= visitBlock(Entry, CopyP, ACP);
2817 BitSimplification BitS(
BT, *MDT, HII, HRI,
MRI, MF);
2818 Changed |= visitBlock(Entry, BitS, ABS);
2826 DeadCodeElimination(MF, *MDT).run();
2895 class HexagonLoopRescheduling :
public MachineFunctionPass {
2899 HexagonLoopRescheduling() : MachineFunctionPass(
ID) {}
2901 bool runOnMachineFunction(MachineFunction &MF)
override;
2904 const HexagonInstrInfo *HII =
nullptr;
2905 const HexagonRegisterInfo *HRI =
nullptr;
2906 MachineRegisterInfo *
MRI =
nullptr;
2907 BitTracker *BTP =
nullptr;
2910 LoopCand(MachineBasicBlock *lb, MachineBasicBlock *pb,
2911 MachineBasicBlock *eb) : LB(lb),
PB(pb), EB(eb) {}
2913 MachineBasicBlock *LB, *
PB, *EB;
2915 using InstrList = std::vector<MachineInstr *>;
2917 BitTracker::RegisterRef Inp, Out;
2921 PhiInfo(MachineInstr &
P, MachineBasicBlock &
B);
2924 BitTracker::RegisterRef LR, PR;
2925 MachineBasicBlock *LB, *
PB;
2928 static unsigned getDefReg(
const MachineInstr *
MI);
2930 bool isBitShuffle(
const MachineInstr *
MI,
unsigned DefR)
const;
2931 bool isStoreInput(
const MachineInstr *
MI,
unsigned DefR)
const;
2932 bool isShuffleOf(
unsigned OutR,
unsigned InpR)
const;
2933 bool isSameShuffle(
unsigned OutR1,
unsigned InpR1,
unsigned OutR2,
2934 unsigned &InpR2)
const;
2935 void moveGroup(InstrGroup &
G, MachineBasicBlock &LB, MachineBasicBlock &
PB,
2937 bool processLoop(LoopCand &
C);
2942char HexagonLoopRescheduling::ID = 0;
2945 "Hexagon Loop Rescheduling",
false,
false)
2949 DefR = HexagonLoopRescheduling::getDefReg(&
P);
2952 for (
unsigned i = 1, n =
P.getNumOperands(); i < n; i += 2) {
2955 LR =
P.getOperand(i);
2959 PR =
P.getOperand(i);
2963unsigned HexagonLoopRescheduling::getDefReg(
const MachineInstr *
MI) {
2965 HBS::getInstrDefs(*
MI, Defs);
2966 if (Defs.count() != 1)
2968 return Defs.find_first();
2971bool HexagonLoopRescheduling::isConst(
unsigned Reg)
const {
2974 const BitTracker::RegisterCell &RC = BTP->
lookup(
Reg);
2975 for (
unsigned i = 0, w = RC.
width(); i < w; ++i) {
2976 const BitTracker::BitValue &
V = RC[i];
2977 if (!
V.is(0) && !
V.is(1))
2983bool HexagonLoopRescheduling::isBitShuffle(
const MachineInstr *
MI,
2984 unsigned DefR)
const {
2985 unsigned Opc =
MI->getOpcode();
2987 case TargetOpcode::COPY:
2988 case Hexagon::S2_lsr_i_r:
2989 case Hexagon::S2_asr_i_r:
2990 case Hexagon::S2_asl_i_r:
2991 case Hexagon::S2_lsr_i_p:
2992 case Hexagon::S2_asr_i_p:
2993 case Hexagon::S2_asl_i_p:
2994 case Hexagon::S2_insert:
2995 case Hexagon::A2_or:
2996 case Hexagon::A2_orp:
2997 case Hexagon::A2_and:
2998 case Hexagon::A2_andp:
2999 case Hexagon::A2_combinew:
3000 case Hexagon::A4_combineri:
3001 case Hexagon::A4_combineir:
3002 case Hexagon::A2_combineii:
3003 case Hexagon::A4_combineii:
3004 case Hexagon::A2_combine_ll:
3005 case Hexagon::A2_combine_lh:
3006 case Hexagon::A2_combine_hl:
3007 case Hexagon::A2_combine_hh:
3013bool HexagonLoopRescheduling::isStoreInput(
const MachineInstr *
MI,
3014 unsigned InpR)
const {
3015 for (
unsigned i = 0, n =
MI->getNumOperands(); i < n; ++i) {
3016 const MachineOperand &
Op =
MI->getOperand(i);
3019 if (
Op.getReg() == InpR)
3025bool HexagonLoopRescheduling::isShuffleOf(
unsigned OutR,
unsigned InpR)
const {
3026 if (!BTP->
has(OutR) || !BTP->
has(InpR))
3028 const BitTracker::RegisterCell &OutC = BTP->
lookup(OutR);
3029 for (
unsigned i = 0, w = OutC.
width(); i < w; ++i) {
3030 const BitTracker::BitValue &
V = OutC[i];
3033 if (
V.RefI.Reg != InpR)
3039bool HexagonLoopRescheduling::isSameShuffle(
unsigned OutR1,
unsigned InpR1,
3040 unsigned OutR2,
unsigned &InpR2)
const {
3041 if (!BTP->
has(OutR1) || !BTP->
has(InpR1) || !BTP->
has(OutR2))
3043 const BitTracker::RegisterCell &OutC1 = BTP->
lookup(OutR1);
3044 const BitTracker::RegisterCell &OutC2 = BTP->
lookup(OutR2);
3045 unsigned W = OutC1.
width();
3046 unsigned MatchR = 0;
3047 if (W != OutC2.
width())
3049 for (
unsigned i = 0; i <
W; ++i) {
3050 const BitTracker::BitValue &V1 = OutC1[i], &V2 = OutC2[i];
3055 if (V1.
RefI.
Pos != V2.RefI.Pos)
3059 if (V2.RefI.Reg == 0 || V2.RefI.Reg == OutR2)
3062 MatchR = V2.RefI.Reg;
3063 else if (V2.RefI.Reg != MatchR)
3070void HexagonLoopRescheduling::moveGroup(InstrGroup &
G, MachineBasicBlock &LB,
3072 unsigned NewPredR) {
3073 DenseMap<unsigned,unsigned> RegMap;
3075 const TargetRegisterClass *PhiRC =
MRI->getRegClass(NewPredR);
3076 Register PhiR =
MRI->createVirtualRegister(PhiRC);
3077 BuildMI(LB, At, At->getDebugLoc(), HII->get(TargetOpcode::PHI), PhiR)
3082 RegMap.
insert(std::make_pair(
G.Inp.Reg, PhiR));
3085 unsigned DR = getDefReg(SI);
3086 const TargetRegisterClass *RC =
MRI->getRegClass(DR);
3090 auto MIB =
BuildMI(LB, At,
DL, HII->get(
SI->getOpcode()), NewDR);
3091 for (
const MachineOperand &
Op :
SI->operands()) {
3098 unsigned UseR = RegMap[
Op.getReg()];
3099 MIB.addReg(UseR, 0,
Op.getSubReg());
3101 RegMap.
insert(std::make_pair(DR, NewDR));
3104 HBS::replaceReg(OldPhiR, RegMap[
G.Out.Reg], *
MRI);
3107bool HexagonLoopRescheduling::processLoop(LoopCand &
C) {
3110 std::vector<PhiInfo> Phis;
3111 for (
auto &
I : *
C.LB) {
3114 unsigned PR = getDefReg(&
I);
3117 bool BadUse =
false, GoodUse =
false;
3118 for (
const MachineOperand &MO :
MRI->use_operands(PR)) {
3119 const MachineInstr *UseI = MO.
getParent();
3124 if (isBitShuffle(UseI, PR) || isStoreInput(UseI, PR))
3127 if (BadUse || !GoodUse)
3130 Phis.push_back(PhiInfo(
I, *
C.LB));
3134 dbgs() <<
"Phis: {";
3135 for (
auto &
I : Phis) {
3137 <<
printReg(
I.PR.Reg, HRI,
I.PR.Sub) <<
":b" <<
I.PB->getNumber()
3138 <<
',' <<
printReg(
I.LR.Reg, HRI,
I.LR.Sub) <<
":b"
3139 <<
I.LB->getNumber() <<
')';
3155 if (
MI.isTerminator())
3161 HBS::getInstrDefs(
MI, Defs);
3162 if (Defs.count() != 1)
3167 if (!isBitShuffle(&
MI, DefR))
3170 bool BadUse =
false;
3171 for (
auto UI =
MRI->use_begin(DefR), UE =
MRI->use_end(); UI != UE; ++UI) {
3174 if (UseI->
isPHI()) {
3177 unsigned Idx = UI.getOperandNo();
3187 if (
C.EB ==
nullptr)
3196 ShufIns.push_back(&
MI);
3208 using InstrGroupList = std::vector<InstrGroup>;
3211 for (
unsigned i = 0, n = ShufIns.size(); i < n; ++i) {
3212 MachineInstr *
SI = ShufIns[i];
3217 G.Ins.push_back(SI);
3218 G.Out.Reg = getDefReg(SI);
3220 HBS::getInstrUses(*SI, Inputs);
3222 for (
unsigned j = i+1;
j < n; ++
j) {
3223 MachineInstr *
MI = ShufIns[
j];
3227 HBS::getInstrDefs(*
MI, Defs);
3229 if (!Defs.intersects(Inputs))
3233 G.Ins.push_back(
MI);
3234 Inputs.remove(Defs);
3236 HBS::getInstrUses(*
MI, Inputs);
3237 ShufIns[
j] =
nullptr;
3241 if (Inputs.count() > 1)
3243 auto LoopInpEq = [
G] (
const PhiInfo &
P) ->
bool {
3244 return G.Out.Reg ==
P.LR.Reg;
3249 G.Inp.Reg = Inputs.find_first();
3254 for (
unsigned i = 0, n =
Groups.size(); i < n; ++i) {
3256 dbgs() <<
"Group[" << i <<
"] inp: "
3258 <<
" out: " <<
printReg(
G.Out.Reg, HRI,
G.Out.Sub) <<
"\n";
3259 for (
const MachineInstr *
MI :
G.Ins)
3264 for (InstrGroup &
G :
Groups) {
3265 if (!isShuffleOf(
G.Out.Reg,
G.Inp.Reg))
3267 auto LoopInpEq = [
G] (
const PhiInfo &
P) ->
bool {
3268 return G.Out.Reg ==
P.LR.Reg;
3271 if (
F == Phis.end())
3274 if (!isSameShuffle(
G.Out.Reg,
G.Inp.Reg,
F->PR.Reg, PrehR)) {
3275 const MachineInstr *DefPrehR =
MRI->getVRegDef(
F->PR.Reg);
3277 if (
Opc != Hexagon::A2_tfrsi &&
Opc != Hexagon::A2_tfrpi)
3283 const TargetRegisterClass *RC =
MRI->getRegClass(
G.Inp.Reg);
3284 if (RC !=
MRI->getRegClass(
F->PR.Reg)) {
3285 PrehR =
MRI->createVirtualRegister(RC);
3286 unsigned TfrI = (RC == &Hexagon::IntRegsRegClass) ? Hexagon::A2_tfrsi
3287 : Hexagon::A2_tfrpi;
3288 auto T =
C.PB->getFirstTerminator();
3301 if (
MRI->getRegClass(PrehR) !=
MRI->getRegClass(
G.Inp.Reg))
3303 moveGroup(
G, *
F->LB, *
F->PB,
F->LB->getFirstNonPHI(),
F->DefR, PrehR);
3310bool HexagonLoopRescheduling::runOnMachineFunction(MachineFunction &MF) {
3315 HII = HST.getInstrInfo();
3318 const HexagonEvaluator HE(*HRI, *
MRI, *HII, MF);
3319 BitTracker
BT(HE, MF);
3324 std::vector<LoopCand> Cand;
3326 for (
auto &
B : MF) {
3327 if (
B.pred_size() != 2 ||
B.succ_size() != 2)
3329 MachineBasicBlock *
PB =
nullptr;
3330 bool IsLoop =
false;
3331 for (MachineBasicBlock *Pred :
B.predecessors()) {
3340 MachineBasicBlock *EB =
nullptr;
3341 for (MachineBasicBlock *Succ :
B.successors()) {
3346 if (Succ->pred_size() == 1)
3351 Cand.push_back(LoopCand(&
B,
PB, EB));
3355 for (
auto &
C : Cand)
3366 return new HexagonLoopRescheduling();
3370 return new HexagonBitSimplify();
unsigned const MachineRegisterInfo * MRI
for(const MachineOperand &MO :llvm::drop_begin(OldMI.operands(), Desc.getNumOperands()))
assert(UImm &&(UImm !=~static_cast< T >(0)) &&"Invalid immediate!")
MachineBasicBlock MachineBasicBlock::iterator DebugLoc DL
Function Alias Analysis false
This file implements the BitVector class.
static GCRegistry::Add< StatepointGC > D("statepoint-example", "an example strategy for statepoint")
static GCRegistry::Add< CoreCLRGC > E("coreclr", "CoreCLR-compatible GC")
static GCRegistry::Add< OcamlGC > B("ocaml", "ocaml 3.10-compatible GC")
static std::optional< ArrayRef< InsnRange >::iterator > intersects(const MachineInstr *StartMI, const MachineInstr *EndMI, ArrayRef< InsnRange > Ranges, const InstructionOrdering &Ordering)
Check if the instruction range [StartMI, EndMI] intersects any instruction range in Ranges.
static unsigned CountBitSplit
static cl::opt< bool > PreserveTiedOps("hexbit-keep-tied", cl::Hidden, cl::init(true), cl::desc("Preserve subregisters in tied operands"))
static cl::opt< bool > GenExtract("hexbit-extract", cl::Hidden, cl::init(true), cl::desc("Generate extract instructions"))
static cl::opt< unsigned > MaxBitSplit("hexbit-max-bitsplit", cl::Hidden, cl::init(std::numeric_limits< unsigned >::max()))
static cl::opt< bool > GenBitSplit("hexbit-bitsplit", cl::Hidden, cl::init(true), cl::desc("Generate bitsplit instructions"))
static cl::opt< unsigned > MaxExtract("hexbit-max-extract", cl::Hidden, cl::init(std::numeric_limits< unsigned >::max()))
static cl::opt< unsigned > RegisterSetLimit("hexbit-registerset-limit", cl::Hidden, cl::init(1000))
static unsigned CountExtract
static bool isZero(Value *V, const DataLayout &DL, DominatorTree *DT, AssumptionCache *AC)
Promote Memory to Register
PassBuilder PB(Machine, PassOpts->PTO, std::nullopt, &PIC)
#define INITIALIZE_PASS_DEPENDENCY(depName)
#define INITIALIZE_PASS_END(passName, arg, name, cfg, analysis)
#define INITIALIZE_PASS_BEGIN(passName, arg, name, cfg, analysis)
#define INITIALIZE_PASS(passName, arg, name, cfg, analysis)
Remove Loads Into Fake Uses
bool isDead(const MachineInstr &MI, const MachineRegisterInfo &MRI)
This file defines the SmallVector class.
SmallSet< unsigned, 4 > RegisterSet
static const X86InstrFMA3Group Groups[]
AnalysisUsage & addRequired()
AnalysisUsage & addPreserved()
Add the specified Pass class to the set of analyses preserved by this pass.
bool subsetOf(const BitVector &RHS) const
subsetOf - Check if This is a subset of RHS.
std::pair< iterator, bool > insert(const std::pair< KeyT, ValueT > &KV)
DomTreeNodeBase< NodeT > * getRootNode()
getRootNode - This returns the entry node for the CFG of the function.
FunctionPass class - This class is used to implement most global optimizations.
bool hasOptSize() const
Optimize this function for size (-Os) or minimum size (-Oz).
unsigned getHexagonSubRegIndex(const TargetRegisterClass &RC, unsigned GenIdx) const
const HexagonRegisterInfo * getRegisterInfo() const override
MachineInstrBundleIterator< MachineInstr > iterator
Analysis pass which computes a MachineDominatorTree.
bool dominates(const MachineInstr *A, const MachineInstr *B) const
MachineFunctionPass - This class adapts the FunctionPass interface to allow convenient creation of pa...
void getAnalysisUsage(AnalysisUsage &AU) const override
getAnalysisUsage - Subclasses that override getAnalysisUsage must call this.
const TargetSubtargetInfo & getSubtarget() const
getSubtarget - Return the subtarget for which this machine code is being compiled.
MachineRegisterInfo & getRegInfo()
getRegInfo - Return information about the registers currently in use.
Function & getFunction()
Return the LLVM function that this machine code represents.
const MachineBasicBlock & front() const
const MachineInstrBuilder & addImm(int64_t Val) const
Add a new immediate operand.
const MachineInstrBuilder & addReg(Register RegNo, unsigned flags=0, unsigned SubReg=0) const
Add a new virtual register operand.
const MachineInstrBuilder & addMBB(MachineBasicBlock *MBB, unsigned TargetFlags=0) const
Representation of each machine instruction.
unsigned getOpcode() const
Returns the opcode of this MachineInstr.
const MachineBasicBlock * getParent() const
bool isDebugInstr() const
const DebugLoc & getDebugLoc() const
Returns the debug location id of this MachineInstr.
const MachineOperand & getOperand(unsigned i) const
MachineOperand class - Representation of each machine instruction operand.
void setSubReg(unsigned subReg)
unsigned getSubReg() const
bool isReg() const
isReg - Tests if this is a MO_Register operand.
MachineBasicBlock * getMBB() const
LLVM_ABI void setReg(Register Reg)
Change the register this operand corresponds to.
bool isImm() const
isImm - Tests if this is a MO_Immediate operand.
static MachineOperand CreateImm(int64_t Val)
Register getReg() const
getReg - Returns the register number.
constexpr bool isVirtual() const
Return true if the specified register number is in the virtual register namespace.
std::pair< const_iterator, bool > insert(const unsigned &V)
void push_back(const T &Elt)
unsigned getID() const
Return the register class ID number.
virtual const TargetRegisterInfo * getRegisterInfo() const =0
Return the target's register information.
This class implements an extremely fast bulk output stream that can only output to a stream.
#define llvm_unreachable(msg)
Marks that the current location is not supposed to be reachable.
constexpr char Align[]
Key for Kernel::Arg::Metadata::mAlign.
constexpr char IsConst[]
Key for Kernel::Arg::Metadata::mIsConst.
unsigned ID
LLVM IR allows to use arbitrary numbers as calling convention identifiers.
@ C
The default llvm calling convention, compatible with C.
@ ABS
ABS - Determine the unsigned absolute value of a signed integer value of the same bitwidth.
SmallVector< const MachineInstr * > InstrList
bool isConst(unsigned Opc)
initializer< Ty > init(const Ty &Val)
PointerTypeMap run(const Module &M)
Compute the PointerTypeMap for the module M.
LLVM_ABI std::error_code remove(const Twine &path, bool IgnoreNonExisting=true)
Remove path.
This is an optimization pass for GlobalISel generic memory operations.
@ Low
Lower the current thread's priority such that it does not affect foreground tasks significantly.
auto find(R &&Range, const T &Val)
Provide wrappers to std::find which take ranges instead of having to pass begin/end explicitly.
bool includes(R1 &&Range1, R2 &&Range2)
Provide wrappers to std::includes which take ranges instead of having to pass begin/end explicitly.
bool isEqual(const GCNRPTracker::LiveRegSet &S1, const GCNRPTracker::LiveRegSet &S2)
MachineInstrBuilder BuildMI(MachineFunction &MF, const MIMetadata &MIMD, const MCInstrDesc &MCID)
Builder interface. Specify how to create the initial instruction itself.
constexpr bool isInt(int64_t x)
Checks if an integer fits into the given bit width.
constexpr bool isUIntN(unsigned N, uint64_t x)
Checks if an unsigned integer fits into the given (dynamic) bit width.
FunctionPass * createHexagonBitSimplify()
bool any_of(R &&range, UnaryPredicate P)
Provide wrappers to std::any_of which take ranges instead of having to pass begin/end explicitly.
auto reverse(ContainerTy &&C)
constexpr uint32_t Hi_32(uint64_t Value)
Return the high 32 bits of a 64 bit value.
LLVM_ABI raw_ostream & dbgs()
dbgs() - This returns a reference to a raw_ostream for debugging messages.
bool none_of(R &&Range, UnaryPredicate P)
Provide wrappers to std::none_of which take ranges instead of having to pass begin/end explicitly.
constexpr uint32_t Lo_32(uint64_t Value)
Return the low 32 bits of a 64 bit value.
DomTreeNodeBase< MachineBasicBlock > MachineDomTreeNode
FunctionPass * createHexagonLoopRescheduling()
@ First
Helpers to iterate all locations in the MemoryEffectsBase class.
@ Sub
Subtraction of integers.
FunctionAddr VTableAddr Next
auto count(R &&Range, const E &Element)
Wrapper function around std::count to count the number of times an element Element occurs in the give...
DWARFExpression::Operation Op
raw_ostream & operator<<(raw_ostream &OS, const APFixedPoint &FX)
auto find_if(R &&Range, UnaryPredicate P)
Provide wrappers to std::find_if which take ranges instead of having to pass begin/end explicitly.
iterator_range< typename GraphTraits< GraphType >::ChildIteratorType > children(const typename GraphTraits< GraphType >::NodeRef &G)
bool is_contained(R &&Range, const E &Element)
Returns true if Element is found in Range.
LLVM_ABI Printable printReg(Register Reg, const TargetRegisterInfo *TRI=nullptr, unsigned SubIdx=0, const MachineRegisterInfo *MRI=nullptr)
Prints virtual and physical registers with or without a TRI instance.
LLVM_ABI Printable printMBBReference(const MachineBasicBlock &MBB)
Prints a machine basic block reference.
Maximum remaining allocation size observed for a phi node, and how often the allocation size has alre...
bool is(unsigned T) const
static BitValue self(const BitRef &Self=BitRef())
bool has(unsigned Reg) const
const RegisterCell & lookup(unsigned Reg) const
bool reached(const MachineBasicBlock *B) const
void trace(bool On=false)
void put(RegisterRef RR, const RegisterCell &RC)
void visit(const MachineInstr &MI)
RegisterCell get(RegisterRef RR) const