62#define PASS_KEY "x86-flags-copy-lowering"
63#define DEBUG_TYPE PASS_KEY
65STATISTIC(NumCopiesEliminated,
"Number of copies of EFLAGS eliminated");
66STATISTIC(NumSetCCsInserted,
"Number of setCC instructions inserted");
67STATISTIC(NumTestsInserted,
"Number of test instructions inserted");
68STATISTIC(NumAddsInserted,
"Number of adds instructions inserted");
69STATISTIC(NumNFsConvertedTo,
"Number of NF instructions converted to");
76using CondRegArray = std::array<Register, X86::LAST_VALID_COND + 1>;
78class X86FlagsCopyLoweringImpl {
82 bool runOnMachineFunction(MachineFunction &MF);
85 MachineRegisterInfo *MRI =
nullptr;
86 const X86Subtarget *Subtarget =
nullptr;
87 const X86InstrInfo *TII =
nullptr;
88 const TargetRegisterInfo *TRI =
nullptr;
89 const TargetRegisterClass *PromoteRC =
nullptr;
90 MachineDominatorTree *MDT =
nullptr;
92 CondRegArray collectCondsInRegs(MachineBasicBlock &
MBB,
98 std::pair<Register, bool> getCondOrInverseInReg(
106 CondRegArray &CondRegs);
107 void rewriteArithmetic(MachineBasicBlock &
MBB,
109 MachineInstr &
MI, CondRegArray &CondRegs);
111 const DebugLoc &Loc, MachineInstr &
MI, CondRegArray &CondRegs);
116 X86FlagsCopyLoweringLegacy() : MachineFunctionPass(ID) {}
118 StringRef getPassName()
const override {
return "X86 EFLAGS copy lowering"; }
119 bool runOnMachineFunction(MachineFunction &MF)
override;
120 void getAnalysisUsage(AnalysisUsage &AU)
const override;
129 "X86 EFLAGS copy lowering",
false,
false)
134 return new X86FlagsCopyLoweringLegacy();
137char X86FlagsCopyLoweringLegacy::ID = 0;
139void X86FlagsCopyLoweringLegacy::getAnalysisUsage(
AnalysisUsage &AU)
const {
145 return X86::isADC(
Opc) || X86::isSBB(
Opc) || X86::isRCL(
Opc) ||
146 X86::isRCR(
Opc) || (
Opc == X86::SETB_C32r ||
Opc == X86::SETB_C64r);
155 "Split instruction must be in the split block!");
157 "Only designed to split a tail of branch instructions!");
159 "Must split on an actual jCC instruction!");
165 "Must split after an actual jCC instruction!");
167 "Must only have this one terminator prior to the split!");
178 assert(MI.isTerminator() &&
179 "Should only have spliced terminators!");
181 MI.operands(), [&](MachineOperand &MOp) {
182 return MOp.isMBB() && MOp.getMBB() == &UnsplitSucc;
187 MachineBasicBlock &NewMBB = *MF.CreateMachineBasicBlock();
199 if (IsEdgeSplit || *SI != &UnsplitSucc)
207 for (MachineBasicBlock *Succ : NewMBB.
successors())
208 if (Succ != &UnsplitSucc)
209 MBB.replaceSuccessor(Succ, &NewMBB);
213 "Failed to make the new block a successor!");
216 for (MachineBasicBlock *Succ : NewMBB.
successors()) {
217 for (MachineInstr &
MI : *Succ) {
223 MachineOperand &OpV =
MI.getOperand(
OpIdx);
224 MachineOperand &OpMBB =
MI.getOperand(
OpIdx + 1);
225 assert(OpMBB.
isMBB() &&
"Block operand to a PHI is not a block!");
230 if (!IsEdgeSplit || Succ != &UnsplitSucc) {
239 MI.addOperand(MF, OpV);
253 MI.findRegisterDefOperand(X86::EFLAGS,
nullptr);
270bool X86FlagsCopyLoweringImpl::runOnMachineFunction(MachineFunction &MF) {
278 PromoteRC = &X86::GR8RegClass;
284 if (
none_of(
MRI->def_instructions(X86::EFLAGS), [](
const MachineInstr &
MI) {
285 return MI.getOpcode() == TargetOpcode::COPY;
293 std::unique_ptr<MachineDominatorTree> OwnedMDT;
295 OwnedMDT = std::make_unique<MachineDominatorTree>(MF);
296 MDT = OwnedMDT.get();
303 SmallSetVector<MachineInstr *, 4>
Copies;
304 ReversePostOrderTraversal<MachineFunction *> RPOT(&MF);
305 for (MachineBasicBlock *
MBB : RPOT)
306 for (MachineInstr &
MI : *
MBB)
307 if (
MI.getOpcode() == TargetOpcode::COPY &&
308 MI.getOperand(0).getReg() == X86::EFLAGS)
323 if (Subtarget->hasNF()) {
324 SmallSetVector<MachineInstr *, 4> RemovedCopies;
327 while (CopyIIt != CopyIEnd) {
328 auto NCopyIIt = std::next(CopyIIt);
329 SmallSetVector<MachineInstr *, 4> EvitableClobbers;
330 MachineInstr *CopyI = *CopyIIt;
332 MachineInstr *CopyDefI =
MRI->getVRegDef(VOp.
getReg());
333 MachineBasicBlock *CopyIMBB = CopyI->
getParent();
334 MachineBasicBlock *CopyDefIMBB = CopyDefI->
getParent();
342 MachineBasicBlock *
MBB = *BI;
343 for (
auto I = (
MBB != CopyDefIMBB)
349 MachineInstr &
MI = *
I;
355 goto ProcessNextCopyI;
362 RemovedCopies.
insert(CopyI);
365 RemovedCopies.
insert(CopyDefI);
368 ++NumCopiesEliminated;
369 for (
auto *Clobber : EvitableClobbers) {
371 assert(NewOpc &&
"evitable clobber must have a NF variant");
372 Clobber->setDesc(
TII->get(NewOpc));
373 Clobber->removeOperand(
374 Clobber->findRegisterDefOperand(X86::EFLAGS,
nullptr)
381 if (*BI != CopyDefIMBB)
382 BI->addLiveIn(X86::EFLAGS);
386 Copies.set_subtract(RemovedCopies);
404 for (MachineInstr *CopyI :
Copies) {
409 "The input to the copy for EFLAGS should always be a register!");
410 MachineInstr &CopyDefI = *
MRI->getVRegDef(VOp.
getReg());
411 if (CopyDefI.
getOpcode() != TargetOpcode::COPY) {
427 dbgs() <<
"ERROR: Encountered unexpected def of an eflags copy: ";
430 "Cannot lower EFLAGS copy unless it is defined in turn by a copy!");
439 ++NumCopiesEliminated;
443 assert(DOp.isDef() &&
"Expected register def!");
444 assert(DOp.getReg() == X86::EFLAGS &&
"Unexpected copy def register!");
448 MachineBasicBlock *TestMBB = CopyDefI.
getParent();
472 return &
MI != CopyI &&
473 MI.findRegisterDefOperand(X86::EFLAGS,
nullptr);
476 auto HasEFLAGSClobberPath = [&](MachineBasicBlock *BeginMBB,
477 MachineBasicBlock *EndMBB) {
479 "Only support paths down the dominator tree!");
480 SmallPtrSet<MachineBasicBlock *, 4> Visited;
481 SmallVector<MachineBasicBlock *, 4> Worklist;
488 if (!Visited.
insert(PredMBB).second)
490 if (HasEFLAGSClobber(PredMBB->begin(), PredMBB->end()))
495 }
while (!Worklist.
empty());
500 !HasEFLAGSClobber(TestMBB->
begin(), TestPos)) {
503 MachineBasicBlock *HoistMBB =
506 [&](MachineBasicBlock *
LHS, MachineBasicBlock *
RHS) {
507 return MDT->findNearestCommonDominator(LHS, RHS);
513 if (HasEFLAGSClobberPath(HoistMBB, TestMBB))
530 [&](MachineInstr &
MI) {
531 return MI.findRegisterDefOperand(X86::EFLAGS, nullptr);
534 dbgs() <<
" Using EFLAGS defined by: ";
537 dbgs() <<
" Using live-in flags for BB:\n";
545 SmallVector<MachineInstr *, 4> JmpIs;
552 CondRegArray CondRegs = collectCondsInRegs(*TestMBB, TestPos);
565 bool FlagsKilled =
false;
581 MachineInstr &
MI = *MII++;
586 if (&
MI == CopyI || &
MI == &CopyDefI) {
588 "Should only encounter these on the second pass over the "
593 MachineOperand *FlagUse =
594 MI.findRegisterUseOperand(X86::EFLAGS,
nullptr);
595 FlagsKilled =
MI.modifiesRegister(X86::EFLAGS,
TRI);
597 if (!FlagUse && FlagsKilled)
617 auto JmpIt =
MI.getIterator();
619 JmpIs.push_back(&*JmpIt);
627 unsigned Opc =
MI.getOpcode();
628 if (
Opc == TargetOpcode::COPY) {
630 MRI->replaceRegWith(
MI.getOperand(0).getReg(),
632 MI.eraseFromParent();
633 }
else if (X86::isSETCC(
Opc) || X86::isSETZUCC(
Opc)) {
634 rewriteSetCC(*TestMBB, TestPos, TestLoc,
MI, CondRegs);
636 rewriteArithmetic(*TestMBB, TestPos, TestLoc,
MI, CondRegs);
638 rewriteMI(*TestMBB, TestPos, TestLoc,
MI, CondRegs);
652 for (MachineBasicBlock *SuccMBB : UseMBB.
successors())
653 if (SuccMBB->isLiveIn(X86::EFLAGS) &&
668 if (SuccMBB == TestMBB || !MDT->
dominates(TestMBB, SuccMBB)) {
671 <<
"ERROR: Encountered use that is not dominated by our test "
672 "basic block! Rewriting this would require inserting PHI "
673 "nodes to track the flag state across the CFG.\n\nTest "
676 dbgs() <<
"Use block:\n";
680 "Cannot lower EFLAGS copy when original copy def "
681 "does not dominate all uses.");
687 SuccMBB->removeLiveIn(X86::EFLAGS);
689 }
while (!Blocks.
empty());
694 MachineBasicBlock *LastJmpMBB =
nullptr;
695 for (MachineInstr *JmpI : JmpIs) {
698 if (JmpI->getParent() == LastJmpMBB)
703 rewriteMI(*TestMBB, TestPos, TestLoc, *JmpI, CondRegs);
711 for (MachineBasicBlock &
MBB : MF)
712 for (MachineInstr &
MI :
MBB)
713 if (
MI.getOpcode() == TargetOpcode::COPY &&
714 (
MI.getOperand(0).getReg() == X86::EFLAGS ||
715 MI.getOperand(1).getReg() == X86::EFLAGS)) {
727CondRegArray X86FlagsCopyLoweringImpl::collectCondsInRegs(
729 CondRegArray CondRegs = {};
732 for (MachineInstr &
MI :
736 MI.getOperand(0).isReg() &&
MI.getOperand(0).getReg().isVirtual()) {
738 "A non-storing SETcc should always define a register!");
739 CondRegs[
Cond] =
MI.getOperand(0).getReg();
744 if (
MI.findRegisterDefOperand(X86::EFLAGS,
nullptr))
750Register X86FlagsCopyLoweringImpl::promoteCondToReg(
755 BuildMI(TestMBB, TestPos, TestLoc,
756 TII->get((!Subtarget->hasZU() || Subtarget->preferLegacySetCC())
767std::pair<Register, bool> X86FlagsCopyLoweringImpl::getCondOrInverseInReg(
772 if (!CondReg && !InvCondReg)
773 CondReg = promoteCondToReg(TestMBB, TestPos, TestLoc,
Cond);
776 return {CondReg,
false};
778 return {InvCondReg,
true};
781void X86FlagsCopyLoweringImpl::insertTest(MachineBasicBlock &
MBB,
791void X86FlagsCopyLoweringImpl::rewriteSetCC(MachineBasicBlock &
MBB,
795 CondRegArray &CondRegs) {
802 CondReg = promoteCondToReg(
MBB, Pos, Loc,
Cond);
806 if (!
MI.mayStore()) {
808 "Cannot have a non-register defined operand to SETcc!");
812 MRI->clearKillFlags(OldReg);
813 MRI->replaceRegWith(OldReg, CondReg);
814 MI.eraseFromParent();
819 auto MIB =
BuildMI(*
MI.getParent(),
MI.getIterator(),
MI.getDebugLoc(),
820 TII->get(X86::MOV8mr));
823 MIB.add(
MI.getOperand(i));
826 MIB.setMemRefs(
MI.memoperands());
827 MI.eraseFromParent();
830void X86FlagsCopyLoweringImpl::rewriteArithmetic(
832 const DebugLoc &Loc, MachineInstr &
MI, CondRegArray &CondRegs) {
845 CondReg = promoteCondToReg(
MBB, Pos, Loc,
Cond);
848 Register TmpReg =
MRI->createVirtualRegister(PromoteRC);
851 TII->get(Subtarget->hasNDD() ? X86::ADD8ri_ND : X86::ADD8ri))
858 MI.findRegisterUseOperand(X86::EFLAGS,
nullptr)->setIsKill(
true);
862#define FROM_TO(A, B) \
863 case X86::CMOV##A##_Fp32: \
864 case X86::CMOV##A##_Fp64: \
865 case X86::CMOV##A##_Fp80: \
866 return X86::COND_##B;
886 case X86::CMOVB_##A: \
887 case X86::CMOVE_##A: \
888 case X86::CMOVP_##A: \
889 case X86::CMOVBE_##A: \
890 case X86::CMOVNB_##A: \
891 case X86::CMOVNE_##A: \
892 case X86::CMOVNP_##A: \
893 case X86::CMOVNBE_##A: \
894 return (CC == X86::COND_E) ? X86::CMOVE_##A : X86::CMOVNE_##A;
905void X86FlagsCopyLoweringImpl::rewriteMI(MachineBasicBlock &
MBB,
908 CondRegArray &CondRegs) {
910 bool IsImplicitCC =
false;
919 std::tie(CondReg, Inverted) =
920 getCondOrInverseInReg(
MBB, Pos, Loc, CC, CondRegs);
923 insertTest(*
MI.getParent(),
MI.getIterator(),
MI.getDebugLoc(), CondReg);
931 MI.getOperand(
MI.getDesc().getNumOperands() - 1).setImm(NewCC);
933 MI.findRegisterUseOperand(X86::EFLAGS,
nullptr)->setIsKill(
true);
937bool X86FlagsCopyLoweringLegacy::runOnMachineFunction(MachineFunction &MF) {
938 auto *MDTWrapper = getAnalysisIfAvailable<MachineDominatorTreeWrapperPass>();
939 MachineDominatorTree *MDT = MDTWrapper ? &MDTWrapper->getDomTree() :
nullptr;
940 return X86FlagsCopyLoweringImpl(MDT).runOnMachineFunction(MF);
948 bool Changed = X86FlagsCopyLoweringImpl(MDT).runOnMachineFunction(MF);
unsigned const MachineRegisterInfo * MRI
assert(UImm &&(UImm !=~static_cast< T >(0)) &&"Invalid immediate!")
#define CASE(ATTRNAME, AANAME,...)
static GCRegistry::Add< ErlangGC > A("erlang", "erlang-compatible garbage collector")
static GCRegistry::Add< CoreCLRGC > E("coreclr", "CoreCLR-compatible GC")
static GCRegistry::Add< OcamlGC > B("ocaml", "ocaml 3.10-compatible GC")
SmallPtrSet< const BasicBlock *, 8 > VisitedBlocks
This file builds on the ADT/GraphTraits.h file to build generic depth first graph iterator.
static const HTTPClientCleanup Cleanup
const HexagonInstrInfo * TII
const size_t AbstractManglingParser< Derived, Alloc >::NumOps
This file declares the MachineConstantPool class which is an abstract constant pool to keep track of ...
Register const TargetRegisterInfo * TRI
Promote Memory to Register
MachineInstr unsigned OpIdx
#define INITIALIZE_PASS_END(passName, arg, name, cfg, analysis)
#define INITIALIZE_PASS_BEGIN(passName, arg, name, cfg, analysis)
This file builds on the ADT/GraphTraits.h file to build a generic graph post order iterator.
const SmallVectorImpl< MachineOperand > & Cond
static void splitBlock(MachineBasicBlock &MBB, MachineInstr &MI, MachineDominatorTree *MDT)
This file defines the make_scope_exit function, which executes user-defined cleanup logic at scope ex...
This file defines the SmallPtrSet class.
This file defines the SmallVector class.
This file defines the 'Statistic' class, which is designed to be an easy way to expose various metric...
#define STATISTIC(VARNAME, DESC)
#define FROM_TO(FROM, TO)
cl::opt< bool > X86EnableAPXForRelocation
static X86::CondCode getImplicitCondFromMI(unsigned Opc)
static unsigned getOpcodeWithCC(unsigned Opc, X86::CondCode CC)
static bool isArithmeticOp(unsigned Opc)
static EFLAGSClobber getClobberType(const MachineInstr &MI)
PassT::Result * getCachedResult(IRUnitT &IR) const
Get the cached result of an analysis pass for a given IR unit.
Represent the analysis usage information of a pass.
AnalysisUsage & addUsedIfAvailable()
Add the specified Pass class to the set of analyses used by this pass.
FunctionPass class - This class is used to implement most global optimizations.
void normalizeSuccProbs()
Normalize probabilities of all successors so that the sum of them becomes one.
instr_iterator instr_begin()
LLVM_ABI MachineBasicBlock * getFallThrough(bool JumpToFallThrough=true)
Return the fallthrough block if the block can implicitly transfer control to the block after it by fa...
LLVM_ABI instr_iterator insert(instr_iterator I, MachineInstr *M)
Insert MI into the instruction list before I, possibly inside a bundle.
succ_iterator succ_begin()
LLVM_ABI iterator getFirstTerminator()
Returns an iterator to the first terminator instruction of this basic block.
LLVM_ABI void dump() const
LLVM_ABI void copySuccessor(const MachineBasicBlock *Orig, succ_iterator I)
Copy a successor (and any probability info) from original block to this block's.
pred_iterator pred_begin()
instr_iterator instr_end()
const MachineFunction * getParent() const
Return the MachineFunction containing this basic block.
iterator_range< succ_iterator > successors()
LLVM_ABI bool isSuccessor(const MachineBasicBlock *MBB) const
Return true if the specified MBB is a successor of this block.
iterator_range< pred_iterator > predecessors()
void splice(iterator Where, MachineBasicBlock *Other, iterator From)
Take an instruction from MBB 'Other' at the position From, and insert it into this MBB right before '...
MachineInstrBundleIterator< MachineInstr > iterator
LLVM_ABI bool isLiveIn(MCRegister Reg, LaneBitmask LaneMask=LaneBitmask::getAll()) const
Return true if the specified register is in the live in set.
Analysis pass which computes a MachineDominatorTree.
Analysis pass which computes a MachineDominatorTree.
DominatorTree Class - Concrete subclass of DominatorTreeBase that is used to compute a normal dominat...
bool dominates(const MachineInstr *A, const MachineInstr *B) const
MachineFunctionPass - This class adapts the FunctionPass interface to allow convenient creation of pa...
void getAnalysisUsage(AnalysisUsage &AU) const override
getAnalysisUsage - Subclasses that override getAnalysisUsage must call this.
const TargetSubtargetInfo & getSubtarget() const
getSubtarget - Return the subtarget for which this machine code is being compiled.
StringRef getName() const
getName - Return the name of the corresponding LLVM function.
MachineRegisterInfo & getRegInfo()
getRegInfo - Return information about the registers currently in use.
BasicBlockListType::iterator iterator
const MachineInstrBuilder & addImm(int64_t Val) const
Add a new immediate operand.
const MachineInstrBuilder & addReg(Register RegNo, unsigned flags=0, unsigned SubReg=0) const
Add a new virtual register operand.
const MachineInstrBuilder & addDef(Register RegNo, unsigned Flags=0, unsigned SubReg=0) const
Add a virtual register definition operand.
Representation of each machine instruction.
unsigned getOpcode() const
Returns the opcode of this MachineInstr.
const MachineBasicBlock * getParent() const
bool isBranch(QueryType Type=AnyInBundle) const
Returns true if this is a conditional, unconditional, or indirect branch.
const DebugLoc & getDebugLoc() const
Returns the debug location id of this MachineInstr.
LLVM_ABI void eraseFromParent()
Unlink 'this' from the containing basic block and delete it.
LLVM_ABI void dump() const
const MachineOperand & getOperand(unsigned i) const
MachineOperand class - Representation of each machine instruction operand.
bool isReg() const
isReg - Tests if this is a MO_Register operand.
MachineBasicBlock * getMBB() const
void setMBB(MachineBasicBlock *MBB)
Register getReg() const
getReg - Returns the register number.
static MachineOperand CreateMBB(MachineBasicBlock *MBB, unsigned TargetFlags=0)
bool isMBB() const
isMBB - Tests if this is a MO_MachineBasicBlock operand.
static PreservedAnalyses all()
Construct a special preserved set that preserves all passes.
bool insert(const value_type &X)
Insert a new element into the SetVector.
size_type count(ConstPtrType Ptr) const
count - Return 1 if the specified pointer is in the set, 0 otherwise.
std::pair< iterator, bool > insert(PtrType Ptr)
Inserts Ptr if and only if there is no element in the container equal to Ptr.
void push_back(const T &Elt)
PreservedAnalyses run(MachineFunction &MF, MachineFunctionAnalysisManager &MFAM)
const X86InstrInfo * getInstrInfo() const override
const X86RegisterInfo * getRegisterInfo() const override
self_iterator getIterator()
Pass manager infrastructure for declaring and invalidating analyses.
#define llvm_unreachable(msg)
Marks that the current location is not supposed to be reachable.
CondCode getCondFromBranch(const MachineInstr &MI)
CondCode getCondFromMI(const MachineInstr &MI)
Return the condition code of the instruction.
CondCode GetOppositeBranchCondition(CondCode CC)
GetOppositeBranchCondition - Return the inverse of the specified cond, e.g.
CondCode getCondFromSETCC(const MachineInstr &MI)
unsigned getNFVariant(unsigned Opc)
This is an optimization pass for GlobalISel generic memory operations.
static bool isAddMemInstrWithRelocation(const MachineInstr &MI)
MachineInstrBuilder BuildMI(MachineFunction &MF, const MIMetadata &MIMD, const MCInstrDesc &MCID)
Builder interface. Specify how to create the initial instruction itself.
auto successors(const MachineBasicBlock *BB)
scope_exit(Callable) -> scope_exit< Callable >
iterator_range< T > make_range(T x, T y)
Convenience function for iterating over sub-ranges.
AnalysisManager< MachineFunction > MachineFunctionAnalysisManager
LLVM_ABI PreservedAnalyses getMachineFunctionPassPreservedAnalyses()
Returns the minimum set of Analyses that all machine function passes must preserve.
bool any_of(R &&range, UnaryPredicate P)
Provide wrappers to std::any_of which take ranges instead of having to pass begin/end explicitly.
auto reverse(ContainerTy &&C)
LLVM_ABI raw_ostream & dbgs()
dbgs() - This returns a reference to a raw_ostream for debugging messages.
bool none_of(R &&Range, UnaryPredicate P)
Provide wrappers to std::none_of which take ranges instead of having to pass begin/end explicitly.
LLVM_ABI void report_fatal_error(Error Err, bool gen_crash_diag=true)
idf_iterator< T > idf_end(const T &G)
class LLVM_GSL_OWNER SmallVector
Forward declaration of SmallVector so that calculateSmallVectorDefaultInlinedElements can reference s...
FunctionPass * createX86FlagsCopyLoweringLegacyPass()
idf_iterator< T > idf_begin(const T &G)
auto find_if(R &&Range, UnaryPredicate P)
Provide wrappers to std::find_if which take ranges instead of having to pass begin/end explicitly.