32#define DEBUG_TYPE "riscv-opt-w-instrs"
33#define RISCV_OPT_W_INSTRS_NAME "RISC-V Optimize W Instructions"
35STATISTIC(NumRemovedSExtW,
"Number of removed sign-extensions");
37 "Number of instructions transformed to W-ops");
40 cl::desc(
"Disable removal of sext.w"),
72char RISCVOptWInstrs::ID = 0;
77 return new RISCVOptWInstrs();
90 Worklist.
push_back(std::make_pair(&OrigMI, OrigBits));
92 while (!Worklist.
empty()) {
95 unsigned Bits =
P.second;
101 if (
MI->getNumExplicitDefs() != 1)
104 for (
auto &UserOp :
MRI.use_operands(
MI->getOperand(0).getReg())) {
106 unsigned OpIdx = UserOp.getOperandNo();
134 case RISCV::FCVT_H_W:
135 case RISCV::FCVT_H_WU:
136 case RISCV::FCVT_S_W:
137 case RISCV::FCVT_S_WU:
138 case RISCV::FCVT_D_W:
139 case RISCV::FCVT_D_WU:
150 case RISCV::ZEXT_H_RV32:
151 case RISCV::ZEXT_H_RV64:
158 if (Bits >= (ST.getXLen() / 2))
168 Worklist.
push_back(std::make_pair(UserMI, Bits - ShAmt));
179 Worklist.
push_back(std::make_pair(UserMI, Bits));
185 Worklist.
push_back(std::make_pair(UserMI, Bits));
190 if (Bits >= (
unsigned)llvm::bit_width<uint64_t>(~Imm))
192 Worklist.
push_back(std::make_pair(UserMI, Bits));
202 if (Bits >=
Log2_32(ST.getXLen()))
206 Worklist.
push_back(std::make_pair(UserMI, Bits));
214 if (OpIdx == 2 && Bits >=
Log2_32(ST.getXLen()))
219 case RISCV::SH1ADD_UW:
220 case RISCV::SH2ADD_UW:
221 case RISCV::SH3ADD_UW:
223 if (OpIdx == 1 && Bits >= 32)
225 Worklist.
push_back(std::make_pair(UserMI, Bits));
235 if (OpIdx == 0 && Bits >= 8)
240 if (OpIdx == 0 && Bits >= 16)
245 if (OpIdx == 0 && Bits >= 32)
275 Worklist.
push_back(std::make_pair(UserMI, Bits));
278 case RISCV::PseudoCCMOVGPR:
282 if (OpIdx != 4 && OpIdx != 5)
284 Worklist.
push_back(std::make_pair(UserMI, Bits));
287 case RISCV::CZERO_EQZ:
288 case RISCV::CZERO_NEZ:
289 case RISCV::VT_MASKC:
290 case RISCV::VT_MASKCN:
293 Worklist.
push_back(std::make_pair(UserMI, Bits));
318 switch (
MI.getOpcode()) {
321 return MI.getOperand(2).getImm() >= 32;
323 return MI.getOperand(2).getImm() > 32;
326 return MI.getOperand(1).isReg() &&
MI.getOperand(1).getReg() == RISCV::X0;
329 return isUInt<11>(
MI.getOperand(2).getImm());
332 return !isUInt<11>(
MI.getOperand(2).getImm());
335 return MI.getOperand(1).getReg() == RISCV::X0;
348 auto AddRegDefToWorkList = [&](
Register SrcReg) {
359 if (!AddRegDefToWorkList(SrcReg))
362 while (!Worklist.
empty()) {
374 switch (
MI->getOpcode()) {
385 if (
MI->getParent() == &MF->
front()) {
391 Register CopySrcReg =
MI->getOperand(1).getReg();
392 if (CopySrcReg == RISCV::X10) {
402 auto II =
MI->getIterator();
404 (--II)->
getOpcode() != RISCV::ADJCALLSTACKUP)
416 auto *IntTy = dyn_cast<IntegerType>(CalleeFn->getReturnType());
420 const AttributeSet &Attrs = CalleeFn->getAttributes().getRetAttrs();
421 unsigned BitWidth = IntTy->getBitWidth();
422 if ((
BitWidth <= 32 && Attrs.hasAttribute(Attribute::SExt)) ||
423 (
BitWidth < 32 && Attrs.hasAttribute(Attribute::ZExt)))
427 if (!AddRegDefToWorkList(CopySrcReg))
437 if (
MI->getOperand(2).getImm() >= 31)
447 if (!AddRegDefToWorkList(
MI->getOperand(1).getReg()))
451 case RISCV::PseudoCCADDW:
452 case RISCV::PseudoCCSUBW:
455 if (!AddRegDefToWorkList(
MI->getOperand(4).getReg()))
469 case RISCV::PseudoCCMOVGPR:
470 case RISCV::PseudoCCAND:
471 case RISCV::PseudoCCOR:
472 case RISCV::PseudoCCXOR:
481 unsigned B = 1,
E = 3,
D = 1;
482 switch (
MI->getOpcode()) {
484 E =
MI->getNumOperands();
487 case RISCV::PseudoCCMOVGPR:
491 case RISCV::PseudoCCAND:
492 case RISCV::PseudoCCOR:
493 case RISCV::PseudoCCXOR:
499 for (
unsigned I =
B;
I !=
E;
I +=
D) {
500 if (!
MI->getOperand(
I).isReg())
503 if (!AddRegDefToWorkList(
MI->getOperand(
I).getReg()))
510 case RISCV::CZERO_EQZ:
511 case RISCV::CZERO_NEZ:
512 case RISCV::VT_MASKC:
513 case RISCV::VT_MASKCN:
516 if (!AddRegDefToWorkList(
MI->getOperand(1).getReg()))
524 if (
MI->getOperand(2).getImm() >= 32)
573 bool MadeChange =
false;
594 if (!
MRI.constrainRegClass(SrcReg,
MRI.getRegClass(DstReg)))
600 Fixable->setDesc(
TII.get(
getWOp(Fixable->getOpcode())));
601 Fixable->clearFlag(MachineInstr::MIFlag::NoSWrap);
602 Fixable->clearFlag(MachineInstr::MIFlag::NoUWrap);
603 Fixable->clearFlag(MachineInstr::MIFlag::IsExact);
605 ++NumTransformedToWInstrs;
609 MRI.replaceRegWith(DstReg, SrcReg);
610 MRI.clearKillFlags(SrcReg);
611 MI->eraseFromParent();
627 bool MadeChange =
false;
633 switch (
MI.getOpcode()) {
636 case RISCV::ADDW: Opc = RISCV::ADD;
break;
637 case RISCV::MULW: Opc = RISCV::MUL;
break;
638 case RISCV::SLLIW: Opc = RISCV::SLLI;
break;
642 MI.setDesc(
TII.get(Opc));
662 bool MadeChange =
false;
663 MadeChange |= removeSExtWInstrs(MF,
TII, ST,
MRI);
664 MadeChange |= stripWSuffixes(MF,
TII, ST,
MRI);
unsigned const MachineRegisterInfo * MRI
static GCRegistry::Add< OcamlGC > B("ocaml", "ocaml 3.10-compatible GC")
static GCRegistry::Add< StatepointGC > D("statepoint-example", "an example strategy for statepoint")
static GCRegistry::Add< CoreCLRGC > E("coreclr", "CoreCLR-compatible GC")
const HexagonInstrInfo * TII
#define INITIALIZE_PASS(passName, arg, name, cfg, analysis)
static bool isSignExtendingOpW(const MachineInstr &MI, const MachineRegisterInfo &MRI)
static bool isSignExtendedW(Register SrcReg, const RISCVSubtarget &ST, const MachineRegisterInfo &MRI, SmallPtrSetImpl< MachineInstr * > &FixableDef)
static bool hasAllWUsers(const MachineInstr &OrigMI, const RISCVSubtarget &ST, const MachineRegisterInfo &MRI)
static cl::opt< bool > DisableStripWSuffix("riscv-disable-strip-w-suffix", cl::desc("Disable strip W suffix"), cl::init(false), cl::Hidden)
static bool hasAllNBitUsers(const MachineInstr &OrigMI, const RISCVSubtarget &ST, const MachineRegisterInfo &MRI, unsigned OrigBits)
#define RISCV_OPT_W_INSTRS_NAME
static cl::opt< bool > DisableSExtWRemoval("riscv-disable-sextw-removal", cl::desc("Disable removal of sext.w"), cl::init(false), cl::Hidden)
static unsigned getWOp(unsigned Opcode)
This file defines the SmallSet class.
This file defines the 'Statistic' class, which is designed to be an easy way to expose various metric...
#define STATISTIC(VARNAME, DESC)
static std::optional< unsigned > getOpcode(ArrayRef< VPValue * > Values)
Returns the opcode of Values or ~0 if they do not all agree.
Represent the analysis usage information of a pass.
void setPreservesCFG()
This function should be called by the pass, iff they do not:
FunctionPass class - This class is used to implement most global optimizations.
instr_iterator instr_begin()
MachineFunctionPass - This class adapts the FunctionPass interface to allow convenient creation of pa...
void getAnalysisUsage(AnalysisUsage &AU) const override
getAnalysisUsage - Subclasses that override getAnalysisUsage must call this.
virtual bool runOnMachineFunction(MachineFunction &MF)=0
runOnMachineFunction - This method must be overloaded to perform the desired machine code transformat...
const TargetSubtargetInfo & getSubtarget() const
getSubtarget - Return the subtarget for which this machine code is being compiled.
MachineRegisterInfo & getRegInfo()
getRegInfo - Return information about the registers currently in use.
Function & getFunction()
Return the LLVM function that this machine code represents.
Ty * getInfo()
getInfo - Keep track of various per-function pieces of information for backends that would like to do...
const MachineBasicBlock & front() const
Representation of each machine instruction.
unsigned getOpcode() const
Returns the opcode of this MachineInstr.
const MachineBasicBlock * getParent() const
bool isCall(QueryType Type=AnyInBundle) const
const MachineOperand & getOperand(unsigned i) const
const GlobalValue * getGlobal() const
bool isGlobal() const
isGlobal - Tests if this is a MO_GlobalAddress operand.
MachineRegisterInfo - Keep track of information for virtual and physical registers,...
bool isLiveIn(Register Reg) const
static PassRegistry * getPassRegistry()
getPassRegistry - Access the global registry object, which is automatically initialized at applicatio...
virtual StringRef getPassName() const
getPassName - Return a nice clean name for a pass.
RISCVMachineFunctionInfo - This class is derived from MachineFunctionInfo and contains private RISCV-...
bool isSExt32Register(Register Reg) const
Wrapper class representing virtual and physical registers.
constexpr bool isVirtual() const
Return true if the specified register number is in the virtual register namespace.
A templated base class for SmallPtrSet which provides the typesafe interface that is common across al...
std::pair< iterator, bool > insert(PtrType Ptr)
Inserts Ptr if and only if there is no element in the container equal to Ptr.
SmallPtrSet - This class implements a set which is optimized for holding SmallSize or less elements.
SmallSet - This maintains a set of unique values, optimizing for the case when the set is small (less...
std::pair< const_iterator, bool > insert(const T &V)
insert - Insert an element into the set if it isn't already there.
void push_back(const T &Elt)
This is a 'vector' (really, a variable-sized array), optimized for the case when the array is small.
StringRef - Represent a constant reference to a string, i.e.
#define llvm_unreachable(msg)
Marks that the current location is not supposed to be reachable.
unsigned ID
LLVM IR allows to use arbitrary numbers as calling convention identifiers.
bool isSEXT_W(const MachineInstr &MI)
initializer< Ty > init(const Ty &Val)
This is an optimization pass for GlobalISel generic memory operations.
int bit_width(T Value)
Returns the number of bits needed to represent Value if Value is nonzero.
unsigned Log2_32(uint32_t Value)
Return the floor log base 2 of the specified value, -1 if the value is zero.
raw_ostream & dbgs()
dbgs() - This returns a reference to a raw_ostream for debugging messages.
FunctionPass * createRISCVOptWInstrsPass()
void initializeRISCVOptWInstrsPass(PassRegistry &)
constexpr unsigned BitWidth