LLVM 18.0.0git
AMDGPUISelLowering.h
Go to the documentation of this file.
1//===-- AMDGPUISelLowering.h - AMDGPU Lowering Interface --------*- C++ -*-===//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//
7//===----------------------------------------------------------------------===//
8//
9/// \file
10/// Interface definition of the TargetLowering class that is common
11/// to all AMD GPUs.
12//
13//===----------------------------------------------------------------------===//
14
15#ifndef LLVM_LIB_TARGET_AMDGPU_AMDGPUISELLOWERING_H
16#define LLVM_LIB_TARGET_AMDGPU_AMDGPUISELLOWERING_H
17
20
21namespace llvm {
22
23class AMDGPUMachineFunction;
24class AMDGPUSubtarget;
25struct ArgDescriptor;
26
28private:
29 const AMDGPUSubtarget *Subtarget;
30
31 /// \returns AMDGPUISD::FFBH_U32 node if the incoming \p Op may have been
32 /// legalized from a smaller type VT. Need to match pre-legalized type because
33 /// the generic legalization inserts the add/sub between the select and
34 /// compare.
35 SDValue getFFBX_U32(SelectionDAG &DAG, SDValue Op, const SDLoc &DL, unsigned Opc) const;
36
37public:
38 /// \returns The minimum number of bits needed to store the value of \Op as an
39 /// unsigned integer. Truncating to this size and then zero-extending to the
40 /// original size will not change the value.
41 static unsigned numBitsUnsigned(SDValue Op, SelectionDAG &DAG);
42
43 /// \returns The minimum number of bits needed to store the value of \Op as a
44 /// signed integer. Truncating to this size and then sign-extending to the
45 /// original size will not change the value.
46 static unsigned numBitsSigned(SDValue Op, SelectionDAG &DAG);
47
48protected:
51 /// Split a vector store into multiple scalar stores.
52 /// \returns The resulting chain.
53
59
63
64 static bool allowApproxFunc(const SelectionDAG &DAG, SDNodeFlags Flags);
65 static bool needsDenormHandlingF32(const SelectionDAG &DAG, SDValue Src,
66 SDNodeFlags Flags);
68 SDNodeFlags Flags) const;
70 std::pair<SDValue, SDValue> getScaledLogInput(SelectionDAG &DAG,
71 const SDLoc SL, SDValue Op,
72 SDNodeFlags Flags) const;
73
78 bool IsLog10, SDNodeFlags Flags) const;
80
82 SDNodeFlags Flags) const;
84
86
91
95
97
98protected:
99 bool shouldCombineMemoryType(EVT VT) const;
104
106 unsigned Opc, SDValue LHS,
107 uint32_t ValLo, uint32_t ValHi) const;
117 SDValue RHS, DAGCombinerInfo &DCI) const;
118
120 SDValue N) const;
122
125
131
133
135 SelectionDAG &DAG) const;
136
137 /// Return 64-bit value Op as two 32-bit integers.
138 std::pair<SDValue, SDValue> split64BitValue(SDValue Op,
139 SelectionDAG &DAG) const;
142
143 /// Split a vector type into two parts. The first part is a power of two
144 /// vector. The second part is whatever is left over, and is a scalar if it
145 /// would otherwise be a 1-vector.
146 std::pair<EVT, EVT> getSplitDestVTs(const EVT &VT, SelectionDAG &DAG) const;
147
148 /// Split a vector value into two parts of types LoVT and HiVT. HiVT could be
149 /// scalar.
150 std::pair<SDValue, SDValue> splitVector(const SDValue &N, const SDLoc &DL,
151 const EVT &LoVT, const EVT &HighVT,
152 SelectionDAG &DAG) const;
153
154 /// Split a vector load into 2 loads of half the vector.
156
157 /// Widen a suitably aligned v3 load. For all other cases, split the input
158 /// vector load.
160
161 /// Split a vector store into 2 stores of half the vector.
163
167 SDValue LowerDIVREM24(SDValue Op, SelectionDAG &DAG, bool sign) const;
170
172 CCState &State,
173 const SmallVectorImpl<ISD::InputArg> &Ins) const;
174
175public:
177
178 bool mayIgnoreSignedZero(SDValue Op) const;
179
180 static inline SDValue stripBitcast(SDValue Val) {
181 return Val.getOpcode() == ISD::BITCAST ? Val.getOperand(0) : Val;
182 }
183
184 static bool shouldFoldFNegIntoSrc(SDNode *FNeg, SDValue FNegSrc);
185 static bool allUsesHaveSourceMods(const SDNode *N,
186 unsigned CostThreshold = 4);
187 bool isFAbsFree(EVT VT) const override;
188 bool isFNegFree(EVT VT) const override;
189 bool isTruncateFree(EVT Src, EVT Dest) const override;
190 bool isTruncateFree(Type *Src, Type *Dest) const override;
191
192 bool isZExtFree(Type *Src, Type *Dest) const override;
193 bool isZExtFree(EVT Src, EVT Dest) const override;
194
196 bool LegalOperations, bool ForCodeSize,
198 unsigned Depth) const override;
199
200 bool isNarrowingProfitable(EVT SrcVT, EVT DestVT) const override;
201
203 CombineLevel Level) const override;
204
206 ISD::NodeType ExtendKind) const override;
207
208 MVT getVectorIdxTy(const DataLayout &) const override;
209 bool isSelectSupported(SelectSupportKind) const override;
210
211 bool isFPImmLegal(const APFloat &Imm, EVT VT,
212 bool ForCodeSize) const override;
213 bool ShouldShrinkFPConstant(EVT VT) const override;
214 bool shouldReduceLoadWidth(SDNode *Load,
215 ISD::LoadExtType ExtType,
216 EVT ExtVT) const override;
217
219 const MachineMemOperand &MMO) const final;
220
221 bool storeOfVectorConstantIsCheap(bool IsZero, EVT MemVT,
222 unsigned NumElem,
223 unsigned AS) const override;
224 bool aggressivelyPreferBuildVectorSources(EVT VecVT) const override;
225 bool isCheapToSpeculateCttz(Type *Ty) const override;
226 bool isCheapToSpeculateCtlz(Type *Ty) const override;
227
228 bool isSDNodeAlwaysUniform(const SDNode *N) const override;
229 static CCAssignFn *CCAssignFnForCall(CallingConv::ID CC, bool IsVarArg);
230 static CCAssignFn *CCAssignFnForReturn(CallingConv::ID CC, bool IsVarArg);
231
232 SDValue LowerReturn(SDValue Chain, CallingConv::ID CallConv, bool isVarArg,
234 const SmallVectorImpl<SDValue> &OutVals, const SDLoc &DL,
235 SelectionDAG &DAG) const override;
236
238 SelectionDAG &DAG,
239 MachineFrameInfo &MFI,
240 int ClobberedFI) const;
241
242 SDValue lowerUnhandledCall(CallLoweringInfo &CLI,
244 StringRef Reason) const;
245 SDValue LowerCall(CallLoweringInfo &CLI,
246 SmallVectorImpl<SDValue> &InVals) const override;
247
249 SDValue LowerOperation(SDValue Op, SelectionDAG &DAG) const override;
250 SDValue PerformDAGCombine(SDNode *N, DAGCombinerInfo &DCI) const override;
253 SelectionDAG &DAG) const override;
254
256 SDValue RHS, SDValue True, SDValue False,
257 SDValue CC, DAGCombinerInfo &DCI) const;
258
260 SDValue RHS, SDValue True, SDValue False,
261 SDValue CC, DAGCombinerInfo &DCI) const;
262
263 const char* getTargetNodeName(unsigned Opcode) const override;
264
265 // FIXME: Turn off MergeConsecutiveStores() before Instruction Selection for
266 // AMDGPU. Commit r319036,
267 // (https://github.com/llvm/llvm-project/commit/db77e57ea86d941a4262ef60261692f4cb6893e6)
268 // turned on MergeConsecutiveStores() before Instruction Selection for all
269 // targets. Enough AMDGPU compiles go into an infinite loop (
270 // MergeConsecutiveStores() merges two stores; LegalizeStoreOps() un-merges;
271 // MergeConsecutiveStores() re-merges, etc. ) to warrant turning it off for
272 // now.
273 bool mergeStoresAfterLegalization(EVT) const override { return false; }
274
275 bool isFsqrtCheap(SDValue Operand, SelectionDAG &DAG) const override {
276 return true;
277 }
279 int &RefinementSteps, bool &UseOneConstNR,
280 bool Reciprocal) const override;
282 int &RefinementSteps) const override;
283
285 SelectionDAG &DAG) const = 0;
286
287 /// Determine which of the bits specified in \p Mask are known to be
288 /// either zero or one and return them in the \p KnownZero and \p KnownOne
289 /// bitsets.
291 KnownBits &Known,
292 const APInt &DemandedElts,
293 const SelectionDAG &DAG,
294 unsigned Depth = 0) const override;
295
296 unsigned ComputeNumSignBitsForTargetNode(SDValue Op, const APInt &DemandedElts,
297 const SelectionDAG &DAG,
298 unsigned Depth = 0) const override;
299
301 Register R,
302 const APInt &DemandedElts,
304 unsigned Depth = 0) const override;
305
307 const SelectionDAG &DAG,
308 bool SNaN = false,
309 unsigned Depth = 0) const override;
310
312 Register N1) const override;
313
314 /// Helper function that adds Reg to the LiveIn list of the DAG's
315 /// MachineFunction.
316 ///
317 /// \returns a RegisterSDNode representing Reg if \p RawReg is true, otherwise
318 /// a copy from the register.
320 const TargetRegisterClass *RC,
321 Register Reg, EVT VT,
322 const SDLoc &SL,
323 bool RawReg = false) const;
325 const TargetRegisterClass *RC,
326 Register Reg, EVT VT) const {
327 return CreateLiveInRegister(DAG, RC, Reg, VT, SDLoc(DAG.getEntryNode()));
328 }
329
330 // Returns the raw live in register rather than a copy from it.
332 const TargetRegisterClass *RC,
333 Register Reg, EVT VT) const {
334 return CreateLiveInRegister(DAG, RC, Reg, VT, SDLoc(DAG.getEntryNode()), true);
335 }
336
337 /// Similar to CreateLiveInRegister, except value maybe loaded from a stack
338 /// slot rather than passed in a register.
340 EVT VT,
341 const SDLoc &SL,
342 int64_t Offset) const;
343
345 const SDLoc &SL,
346 SDValue Chain,
347 SDValue ArgVal,
348 int64_t Offset) const;
349
351 const TargetRegisterClass *RC,
352 EVT VT, const SDLoc &SL,
353 const ArgDescriptor &Arg) const;
354
360 };
361
362 /// Helper function that returns the byte offset of the given
363 /// type of implicit parameter.
365 const ImplicitParameter Param) const;
366 uint32_t getImplicitParameterOffset(const uint64_t ExplicitKernArgSize,
367 const ImplicitParameter Param) const;
368
369 MVT getFenceOperandTy(const DataLayout &DL) const override {
370 return MVT::i32;
371 }
372
374
376 SmallVectorImpl<Use *> &Ops) const override;
377};
378
379namespace AMDGPUISD {
380
381enum NodeType : unsigned {
382 // AMDIL ISD Opcodes
384 UMUL, // 32bit unsigned multiplication
386 // End AMDIL ISD Opcodes
387
388 // Function call.
394
395 // Masked control flow nodes.
399
400 // A uniform kernel return that terminates the wavefront.
402
403 // s_endpgm, but we may want to insert it in the middle of the block.
405
406 // Return to a shader part's epilog code.
408
409 // Return with values from a non-entry function.
411
412 // Convert a unswizzled wave uniform stack address to an address compatible
413 // with a vector offset for use in stack access.
415
418
419 /// CLAMP value between 0.0 and 1.0. NaN clamped to 0, following clamp output
420 /// modifier behavior with dx10_enable.
422
423 // This is SETCC with the full mask result which is used for a compare with a
424 // result bit per item in the wavefront.
427
429
430 // FP ops with input and output chain.
433
434 // SIN_HW, COS_HW - f32 for SI, 1 ULP max error, valid from -100 pi to 100 pi.
435 // Denormals handled on some parts.
440
455 // For emitting ISD::FMAD when f32 denormals are enabled because mac/mad is
456 // treated as an illegal operation.
458
459 // RCP, RSQ - For f32, 1 ULP max error, no denormal handling.
460 // For f64, max error 2^29 ULP, handles denormals.
465
466 // log2, no denormal handling for f32.
468
469 // exp2, no denormal handling for f32.
471
478 BFE_U32, // Extract range of bits with zero extension to 32-bits.
479 BFE_I32, // Extract range of bits with sign extension to 32-bits.
480 BFI, // (src0 & src1) | (~src0 & src2)
481 BFM, // Insert a range of bits into a 32-bit word.
482 FFBH_U32, // ctlz with -1 if input is zero.
484 FFBL_B32, // cttz with -1 if input is zero.
503
504 // These cvt_f32_ubyte* nodes need to remain consecutive and in order.
509
510 // Convert two float 32 numbers into a single register holding two packed f16
511 // with round to zero.
517
518 // Same as the standard node, except the high bits of the resulting integer
519 // are known 0.
521
522 /// This node is for VLIW targets and it is used to represent a vector
523 /// that is stored in consecutive registers with the same channel.
524 /// For example:
525 /// |X |Y|Z|W|
526 /// T0|v.x| | | |
527 /// T1|v.y| | | |
528 /// T2|v.z| | | |
529 /// T3|v.w| | | |
531 /// Pointer to the start of the shader's constant data.
537
546
588
591
592} // End namespace AMDGPUISD
593
594} // End namespace llvm
595
596#endif
unsigned const MachineRegisterInfo * MRI
MachineBasicBlock MachineBasicBlock::iterator DebugLoc DL
#define AMDGPUSubtarget
Function Alias Analysis Results
block Block Frequency Analysis
static cl::opt< unsigned > CostThreshold("dfa-cost-threshold", cl::desc("Maximum cost accepted for the transformation"), cl::Hidden, cl::init(50))
#define I(x, y, z)
Definition: MD5.cpp:58
unsigned Reg
LLVMContext & Context
const SmallVectorImpl< MachineOperand > & Cond
This file describes how to lower LLVM code to machine code.
Value * RHS
Value * LHS
static constexpr uint32_t Opcode
Definition: aarch32.h:200
static unsigned numBitsSigned(SDValue Op, SelectionDAG &DAG)
SDValue combineFMinMaxLegacy(const SDLoc &DL, EVT VT, SDValue LHS, SDValue RHS, SDValue True, SDValue False, SDValue CC, DAGCombinerInfo &DCI) const
Generate Min/Max node.
unsigned ComputeNumSignBitsForTargetNode(SDValue Op, const APInt &DemandedElts, const SelectionDAG &DAG, unsigned Depth=0) const override
This method can be implemented by targets that want to expose additional information about sign bits ...
SDValue performMulhuCombine(SDNode *N, DAGCombinerInfo &DCI) const
EVT getTypeForExtReturn(LLVMContext &Context, EVT VT, ISD::NodeType ExtendKind) const override
Return the type that should be used to zero or sign extend a zeroext/signext integer return value.
SDValue SplitVectorLoad(SDValue Op, SelectionDAG &DAG) const
Split a vector load into 2 loads of half the vector.
SDValue LowerCONCAT_VECTORS(SDValue Op, SelectionDAG &DAG) const
SDValue performLoadCombine(SDNode *N, DAGCombinerInfo &DCI) const
void analyzeFormalArgumentsCompute(CCState &State, const SmallVectorImpl< ISD::InputArg > &Ins) const
The SelectionDAGBuilder will automatically promote function arguments with illegal types.
SDValue LowerFROUND(SDValue Op, SelectionDAG &DAG) const
SDValue storeStackInputValue(SelectionDAG &DAG, const SDLoc &SL, SDValue Chain, SDValue ArgVal, int64_t Offset) const
bool storeOfVectorConstantIsCheap(bool IsZero, EVT MemVT, unsigned NumElem, unsigned AS) const override
Return true if it is expected to be cheaper to do a store of vector constant with the given size and ...
SDValue LowerEXTRACT_SUBVECTOR(SDValue Op, SelectionDAG &DAG) const
void computeKnownBitsForTargetNode(const SDValue Op, KnownBits &Known, const APInt &DemandedElts, const SelectionDAG &DAG, unsigned Depth=0) const override
Determine which of the bits specified in Mask are known to be either zero or one and return them in t...
bool shouldCombineMemoryType(EVT VT) const
SDValue splitBinaryBitConstantOpImpl(DAGCombinerInfo &DCI, const SDLoc &SL, unsigned Opc, SDValue LHS, uint32_t ValLo, uint32_t ValHi) const
Split the 64-bit value LHS into two 32-bit components, and perform the binary operation Opc to it wit...
SDValue lowerUnhandledCall(CallLoweringInfo &CLI, SmallVectorImpl< SDValue > &InVals, StringRef Reason) const
SDValue performAssertSZExtCombine(SDNode *N, DAGCombinerInfo &DCI) const
SDValue LowerSTORE(SDValue Op, SelectionDAG &DAG) const
bool isTruncateFree(EVT Src, EVT Dest) const override
bool aggressivelyPreferBuildVectorSources(EVT VecVT) const override
SDValue LowerFCEIL(SDValue Op, SelectionDAG &DAG) const
TargetLowering::NegatibleCost getConstantNegateCost(const ConstantFPSDNode *C) const
SDValue LowerFLOGUnsafe(SDValue Op, const SDLoc &SL, SelectionDAG &DAG, bool IsLog10, SDNodeFlags Flags) const
SDValue performMulhsCombine(SDNode *N, DAGCombinerInfo &DCI) const
AtomicExpansionKind shouldExpandAtomicRMWInIR(AtomicRMWInst *) const override
Returns how the IR-level AtomicExpand pass should expand the given AtomicRMW, if at all.
bool isSDNodeAlwaysUniform(const SDNode *N) const override
bool isDesirableToCommuteWithShift(const SDNode *N, CombineLevel Level) const override
Return true if it is profitable to move this shift by a constant amount through its operand,...
SDValue LowerFREM(SDValue Op, SelectionDAG &DAG) const
Split a vector store into multiple scalar stores.
virtual SDNode * PostISelFolding(MachineSDNode *N, SelectionDAG &DAG) const =0
SDValue performShlCombine(SDNode *N, DAGCombinerInfo &DCI) const
bool isCheapToSpeculateCtlz(Type *Ty) const override
Return true if it is cheap to speculate a call to intrinsic ctlz.
SDValue LowerSDIVREM(SDValue Op, SelectionDAG &DAG) const
bool isFNegFree(EVT VT) const override
Return true if an fneg operation is free to the point where it is never worthwhile to replace it with...
SDValue LowerFLOG10(SDValue Op, SelectionDAG &DAG) const
SDValue LowerINT_TO_FP64(SDValue Op, SelectionDAG &DAG, bool Signed) const
SDValue LowerOperation(SDValue Op, SelectionDAG &DAG) const override
This callback is invoked for operations that are unsupported by the target, which are registered to u...
SDValue LowerFP_TO_FP16(SDValue Op, SelectionDAG &DAG) const
SDValue addTokenForArgument(SDValue Chain, SelectionDAG &DAG, MachineFrameInfo &MFI, int ClobberedFI) const
bool isConstantCheaperToNegate(SDValue N) const
bool isReassocProfitable(MachineRegisterInfo &MRI, Register N0, Register N1) const override
static bool needsDenormHandlingF32(const SelectionDAG &DAG, SDValue Src, SDNodeFlags Flags)
MVT getFenceOperandTy(const DataLayout &DL) const override
Return the type for operands of fence.
uint32_t getImplicitParameterOffset(const MachineFunction &MF, const ImplicitParameter Param) const
Helper function that returns the byte offset of the given type of implicit parameter.
SDValue LowerFFLOOR(SDValue Op, SelectionDAG &DAG) const
SDValue performSelectCombine(SDNode *N, DAGCombinerInfo &DCI) const
SDValue performFNegCombine(SDNode *N, DAGCombinerInfo &DCI) const
SDValue LowerFP_TO_INT(SDValue Op, SelectionDAG &DAG) const
virtual SDValue LowerGlobalAddress(AMDGPUMachineFunction *MFI, SDValue Op, SelectionDAG &DAG) const
bool isConstantCostlierToNegate(SDValue N) const
SDValue loadInputValue(SelectionDAG &DAG, const TargetRegisterClass *RC, EVT VT, const SDLoc &SL, const ArgDescriptor &Arg) const
SDValue LowerDIVREM24(SDValue Op, SelectionDAG &DAG, bool sign) const
SDValue LowerUINT_TO_FP(SDValue Op, SelectionDAG &DAG) const
SDValue CreateLiveInRegisterRaw(SelectionDAG &DAG, const TargetRegisterClass *RC, Register Reg, EVT VT) const
bool isCheapToSpeculateCttz(Type *Ty) const override
Return true if it is cheap to speculate a call to intrinsic cttz.
SDValue performCtlz_CttzCombine(const SDLoc &SL, SDValue Cond, SDValue LHS, SDValue RHS, DAGCombinerInfo &DCI) const
SDValue performSraCombine(SDNode *N, DAGCombinerInfo &DCI) const
bool isSelectSupported(SelectSupportKind) const override
bool isZExtFree(Type *Src, Type *Dest) const override
Return true if any actual instruction that defines a value of type FromTy implicitly zero-extends the...
SDValue lowerFEXP2(SDValue Op, SelectionDAG &DAG) const
SDValue LowerCall(CallLoweringInfo &CLI, SmallVectorImpl< SDValue > &InVals) const override
This hook must be implemented to lower calls into the specified DAG.
SDValue performSrlCombine(SDNode *N, DAGCombinerInfo &DCI) const
SDValue lowerFEXP(SDValue Op, SelectionDAG &DAG) const
SDValue getIsLtSmallestNormal(SelectionDAG &DAG, SDValue Op, SDNodeFlags Flags) const
bool mayIgnoreSignedZero(SDValue Op) const
SDValue getIsFinite(SelectionDAG &DAG, SDValue Op, SDNodeFlags Flags) const
bool isLoadBitCastBeneficial(EVT, EVT, const SelectionDAG &DAG, const MachineMemOperand &MMO) const final
Return true if the following transform is beneficial: fold (conv (load x)) -> (load (conv*)x) On arch...
bool shouldReduceLoadWidth(SDNode *Load, ISD::LoadExtType ExtType, EVT ExtVT) const override
Return true if it is profitable to reduce a load to a smaller type.
MVT getVectorIdxTy(const DataLayout &) const override
Returns the type to be used for the index operand of: ISD::INSERT_VECTOR_ELT, ISD::EXTRACT_VECTOR_ELT...
std::pair< SDValue, SDValue > splitVector(const SDValue &N, const SDLoc &DL, const EVT &LoVT, const EVT &HighVT, SelectionDAG &DAG) const
Split a vector value into two parts of types LoVT and HiVT.
SDValue LowerFLOGCommon(SDValue Op, SelectionDAG &DAG) const
SDValue foldFreeOpFromSelect(TargetLowering::DAGCombinerInfo &DCI, SDValue N) const
bool shouldSinkOperands(Instruction *I, SmallVectorImpl< Use * > &Ops) const override
Whether it is profitable to sink the operands of an Instruction I to the basic block of I.
SDValue LowerINT_TO_FP32(SDValue Op, SelectionDAG &DAG, bool Signed) const
bool isFAbsFree(EVT VT) const override
Return true if an fabs operation is free to the point where it is never worthwhile to replace it with...
SDValue loadStackInputValue(SelectionDAG &DAG, EVT VT, const SDLoc &SL, int64_t Offset) const
Similar to CreateLiveInRegister, except value maybe loaded from a stack slot rather than passed in a ...
bool isNarrowingProfitable(EVT SrcVT, EVT DestVT) const override
Return true if it's profitable to narrow operations of type SrcVT to DestVT.
SDValue LowerFLOG2(SDValue Op, SelectionDAG &DAG) const
static EVT getEquivalentMemType(LLVMContext &Context, EVT VT)
SDValue getSqrtEstimate(SDValue Operand, SelectionDAG &DAG, int Enabled, int &RefinementSteps, bool &UseOneConstNR, bool Reciprocal) const override
Hooks for building estimates in place of slower divisions and square roots.
unsigned computeNumSignBitsForTargetInstr(GISelKnownBits &Analysis, Register R, const APInt &DemandedElts, const MachineRegisterInfo &MRI, unsigned Depth=0) const override
This method can be implemented by targets that want to expose additional information about sign bits ...
SDValue performTruncateCombine(SDNode *N, DAGCombinerInfo &DCI) const
SDValue LowerSINT_TO_FP(SDValue Op, SelectionDAG &DAG) const
static SDValue stripBitcast(SDValue Val)
SDValue CreateLiveInRegister(SelectionDAG &DAG, const TargetRegisterClass *RC, Register Reg, EVT VT, const SDLoc &SL, bool RawReg=false) const
Helper function that adds Reg to the LiveIn list of the DAG's MachineFunction.
SDValue SplitVectorStore(SDValue Op, SelectionDAG &DAG) const
Split a vector store into 2 stores of half the vector.
SDValue LowerCTLZ_CTTZ(SDValue Op, SelectionDAG &DAG) const
SDValue getNegatedExpression(SDValue Op, SelectionDAG &DAG, bool LegalOperations, bool ForCodeSize, NegatibleCost &Cost, unsigned Depth) const override
Return the newly negated expression if the cost is not expensive and set the cost in Cost to indicate...
std::pair< SDValue, SDValue > split64BitValue(SDValue Op, SelectionDAG &DAG) const
Return 64-bit value Op as two 32-bit integers.
SDValue performMulCombine(SDNode *N, DAGCombinerInfo &DCI) const
SDValue getRecipEstimate(SDValue Operand, SelectionDAG &DAG, int Enabled, int &RefinementSteps) const override
Return a reciprocal estimate value for the input operand.
SDValue CreateLiveInRegister(SelectionDAG &DAG, const TargetRegisterClass *RC, Register Reg, EVT VT) const
SDValue LowerFNEARBYINT(SDValue Op, SelectionDAG &DAG) const
const char * getTargetNodeName(unsigned Opcode) const override
This method returns the name of a target specific DAG node.
SDValue LowerSIGN_EXTEND_INREG(SDValue Op, SelectionDAG &DAG) const
static CCAssignFn * CCAssignFnForReturn(CallingConv::ID CC, bool IsVarArg)
std::pair< SDValue, SDValue > getScaledLogInput(SelectionDAG &DAG, const SDLoc SL, SDValue Op, SDNodeFlags Flags) const
If denormal handling is required return the scaled input to FLOG2, and the check for denormal range.
static CCAssignFn * CCAssignFnForCall(CallingConv::ID CC, bool IsVarArg)
Selects the correct CCAssignFn for a given CallingConvention value.
static bool allUsesHaveSourceMods(const SDNode *N, unsigned CostThreshold=4)
SDValue LowerFROUNDEVEN(SDValue Op, SelectionDAG &DAG) const
bool isFPImmLegal(const APFloat &Imm, EVT VT, bool ForCodeSize) const override
Returns true if the target can instruction select the specified FP immediate natively.
bool isKnownNeverNaNForTargetNode(SDValue Op, const SelectionDAG &DAG, bool SNaN=false, unsigned Depth=0) const override
If SNaN is false,.
static unsigned numBitsUnsigned(SDValue Op, SelectionDAG &DAG)
SDValue lowerFEXPUnsafe(SDValue Op, const SDLoc &SL, SelectionDAG &DAG, SDNodeFlags Flags) const
SDValue LowerFTRUNC(SDValue Op, SelectionDAG &DAG) const
SDValue LowerDYNAMIC_STACKALLOC(SDValue Op, SelectionDAG &DAG) const
static bool allowApproxFunc(const SelectionDAG &DAG, SDNodeFlags Flags)
bool ShouldShrinkFPConstant(EVT VT) const override
If true, then instruction selection should seek to shrink the FP constant of the specified type to a ...
SDValue LowerReturn(SDValue Chain, CallingConv::ID CallConv, bool isVarArg, const SmallVectorImpl< ISD::OutputArg > &Outs, const SmallVectorImpl< SDValue > &OutVals, const SDLoc &DL, SelectionDAG &DAG) const override
This hook must be implemented to lower outgoing return values, described by the Outs array,...
SDValue performStoreCombine(SDNode *N, DAGCombinerInfo &DCI) const
void ReplaceNodeResults(SDNode *N, SmallVectorImpl< SDValue > &Results, SelectionDAG &DAG) const override
This callback is invoked when a node result type is illegal for the target, and the operation was reg...
SDValue performRcpCombine(SDNode *N, DAGCombinerInfo &DCI) const
SDValue getLoHalf64(SDValue Op, SelectionDAG &DAG) const
SDValue performFAbsCombine(SDNode *N, DAGCombinerInfo &DCI) const
SDValue LowerFP_TO_INT64(SDValue Op, SelectionDAG &DAG, bool Signed) const
static bool shouldFoldFNegIntoSrc(SDNode *FNeg, SDValue FNegSrc)
SDValue LowerFRINT(SDValue Op, SelectionDAG &DAG) const
SDValue performIntrinsicWOChainCombine(SDNode *N, DAGCombinerInfo &DCI) const
SDValue LowerUDIVREM(SDValue Op, SelectionDAG &DAG) const
SDValue performMulLoHiCombine(SDNode *N, DAGCombinerInfo &DCI) const
SDValue PerformDAGCombine(SDNode *N, DAGCombinerInfo &DCI) const override
This method will be invoked for all target nodes and for any target-independent nodes that the target...
void LowerUDIVREM64(SDValue Op, SelectionDAG &DAG, SmallVectorImpl< SDValue > &Results) const
SDValue WidenOrSplitVectorLoad(SDValue Op, SelectionDAG &DAG) const
Widen a suitably aligned v3 load.
bool mergeStoresAfterLegalization(EVT) const override
Allow store merging for the specified type after legalization in addition to before legalization.
std::pair< EVT, EVT > getSplitDestVTs(const EVT &VT, SelectionDAG &DAG) const
Split a vector type into two parts.
SDValue getHiHalf64(SDValue Op, SelectionDAG &DAG) const
bool isFsqrtCheap(SDValue Operand, SelectionDAG &DAG) const override
Return true if SQRT(X) shouldn't be replaced with X*RSQRT(X).
SDValue combineFMinMaxLegacyImpl(const SDLoc &DL, EVT VT, SDValue LHS, SDValue RHS, SDValue True, SDValue False, SDValue CC, DAGCombinerInfo &DCI) const
Class for arbitrary precision integers.
Definition: APInt.h:76
an instruction that atomically reads a memory location, combines it with another value,...
Definition: Instructions.h:726
CCState - This class holds information needed while lowering arguments and return values.
This class represents an Operation in the Expression.
A parsed version of the target data layout string in and methods for querying it.
Definition: DataLayout.h:110
This is an important class for using LLVM in a threaded context.
Definition: LLVMContext.h:67
Machine Value Type.
The MachineFrameInfo class represents an abstract stack frame until prolog/epilog code is inserted.
A description of a memory reference used in the backend.
MachineRegisterInfo - Keep track of information for virtual and physical registers,...
An SDNode that represents everything that will be needed to construct a MachineInstr.
Wrapper class representing virtual and physical registers.
Definition: Register.h:19
Wrapper class for IR location info (IR ordering and DebugLoc) to be passed into SDNode creation funct...
Represents one node in the SelectionDAG.
Unlike LLVM values, Selection DAG nodes may return multiple values as the result of a computation.
const SDValue & getOperand(unsigned i) const
unsigned getOpcode() const
This is used to represent a portion of an LLVM function in a low-level Data Dependence DAG representa...
Definition: SelectionDAG.h:225
SDValue getEntryNode() const
Return the token chain corresponding to the entry of the function.
Definition: SelectionDAG.h:554
This class consists of common code factored out of the SmallVector class to reduce code duplication b...
Definition: SmallVector.h:577
StringRef - Represent a constant reference to a string, i.e.
Definition: StringRef.h:50
SelectSupportKind
Enum that describes what type of support for selects the target has.
AtomicExpansionKind
Enum that specifies what an atomic load/AtomicRMWInst is expanded to, if at all.
NegatibleCost
Enum that specifies when a float negation is beneficial.
This class defines information used to lower LLVM code to legal SelectionDAG operators that the targe...
Primary interface to the complete machine description for the target machine.
Definition: TargetMachine.h:78
The instances of the Type class are immutable: once they are created, they are never changed.
Definition: Type.h:45
@ BUILD_VERTICAL_VECTOR
This node is for VLIW targets and it is used to represent a vector that is stored in consecutive regi...
@ CONST_DATA_PTR
Pointer to the start of the shader's constant data.
@ CLAMP
CLAMP value between 0.0 and 1.0.
@ C
The default llvm calling convention, compatible with C.
Definition: CallingConv.h:34
NodeType
ISD::NodeType enum - This enum defines the target-independent operators for a SelectionDAG.
Definition: ISDOpcodes.h:40
@ BITCAST
BITCAST - This operator converts between integer, vector and FP values, as if the value was stored to...
Definition: ISDOpcodes.h:903
@ BUILTIN_OP_END
BUILTIN_OP_END - This must be the last enum value in this list.
Definition: ISDOpcodes.h:1383
static const int FIRST_TARGET_MEMORY_OPCODE
FIRST_TARGET_MEMORY_OPCODE - Target-specific pre-isel operations which do not reference a specific me...
Definition: ISDOpcodes.h:1395
LoadExtType
LoadExtType enum - This enum defines the three variants of LOADEXT (load with extension).
Definition: ISDOpcodes.h:1486
This is an optimization pass for GlobalISel generic memory operations.
Definition: AddressRanges.h:18
@ Offset
Definition: DWP.cpp:440
bool CCAssignFn(unsigned ValNo, MVT ValVT, MVT LocVT, CCValAssign::LocInfo LocInfo, ISD::ArgFlagsTy ArgFlags, CCState &State)
CCAssignFn - This function assigns a location for Val, updating State to reflect the change.
CombineLevel
Definition: DAGCombine.h:15
#define N
Extended Value Type.
Definition: ValueTypes.h:34
These are IR-level optimization flags that may be propagated to SDNodes.