#include "NVPTXISelDAGToDAG.h"
#include "NVPTX.h"
#include "NVPTXUtilities.h"
#include "llvm/ADT/APInt.h"
#include "llvm/Analysis/ValueTracking.h"
#include "llvm/CodeGen/ISDOpcodes.h"
#include "llvm/CodeGen/MachineJumpTableInfo.h"
#include "llvm/CodeGen/SelectionDAG.h"
#include "llvm/CodeGen/SelectionDAGNodes.h"
#include "llvm/IR/GlobalValue.h"
#include "llvm/IR/Instructions.h"
#include "llvm/IR/IntrinsicsNVPTX.h"
#include "llvm/IR/NVVMIntrinsicUtils.h"
#include "llvm/Support/AtomicOrdering.h"
#include "llvm/Support/CommandLine.h"
#include "llvm/Support/ErrorHandling.h"
#include "llvm/Support/FormatVariadic.h"
#include "llvm/Support/MathExtras.h"
#include <optional>

Macros
#define	DEBUG_TYPE "nvptx-isel"
#define	PASS_NAME "NVPTX DAG->DAG Pattern Instruction Selection"
#define	TCGEN05_LD_OPCODE(SHAPE, NUM)
#define	CP_ASYNC_BULK_TENSOR_OPCODE(dir, dim, mode, is_s32, suffix)
#define	GET_CP_ASYNC_BULK_TENSOR_OPCODE_S2G_RED(dim, mode, is_ch, is_s32)
#define	TCGEN05_ST_OPCODE(SHAPE, NUM)

Functions
static unsigned	getTcgen05LdOpcode (unsigned IID, bool enablePack)
static NVPTX::Scope	resolveScope (NVPTX::Scope S, const NVPTXSubtarget *T)
static bool	canLowerToLDG (const MemSDNode &N, const NVPTXSubtarget &Subtarget, NVPTX::AddressSpace CodeAddrSpace)
static unsigned int	getFenceOp (NVPTX::Ordering O, NVPTX::Scope S, NVPTXSubtarget const *T)
static std::optional< unsigned >	pickOpcodeForVT (MVT::SimpleValueType VT, std::optional< unsigned > Opcode_i16, std::optional< unsigned > Opcode_i32, std::optional< unsigned > Opcode_i64)
static bool	isAddLike (const SDValue V)
static SDValue	stripAssertAlign (SDValue N)
static SDValue	selectBaseADDR (SDValue N, SelectionDAG *DAG)
static SDValue	accumulateOffset (SDValue &Addr, SDLoc DL, SelectionDAG *DAG)
static std::pair< SDValue, SDValue >	selectADDR (SDValue Addr, SelectionDAG *DAG)
static unsigned	getStoreVectorNumElts (SDNode *N)
static unsigned	GetCpAsyncBulkTensorS2GReductionOpcode (size_t Dim, bool IsShared32, bool IsCacheHint, bool IsIm2Col)
static unsigned	getTcgen05StOpcode (unsigned IID, bool enableUnpack)

Variables
static cl::opt< bool >	EnableRsqrtOpt ("nvptx-rsqrt-approx-opt", cl::init(true), cl::Hidden, cl::desc("Enable reciprocal sqrt optimization"))
static cl::opt< bool >	EnableMADWide ("nvptx-mad-wide-opt", cl::init(false), cl::Hidden, cl::desc("Enable MAD wide optimization"))

Macro Definition Documentation

◆ CP_ASYNC_BULK_TENSOR_OPCODE

#define CP_ASYNC_BULK_TENSOR_OPCODE	(	dir,
		dim,
		mode,
		is_s32,
		suffix )

Value:

  (is_s32                                                                      \
       ? NVPTX::CP_ASYNC_BULK_TENSOR_##dir##_##dim##_SHARED32_##mode##suffix   \
       : NVPTX::CP_ASYNC_BULK_TENSOR_##dir##_##dim##_##mode##suffix)

Definition at line 1913 of file NVPTXISelDAGToDAG.cpp.

◆ DEBUG_TYPE

#define DEBUG_TYPE "nvptx-isel"

Definition at line 35 of file NVPTXISelDAGToDAG.cpp.

◆ GET_CP_ASYNC_BULK_TENSOR_OPCODE_S2G_RED

#define GET_CP_ASYNC_BULK_TENSOR_OPCODE_S2G_RED	(	dim,
		mode,
		is_ch,
		is_s32 )

Value:

(is_ch ? (CP_ASYNC_BULK_TENSOR_OPCODE(RED, dim, mode, is_s32, _CH))           \
       : (CP_ASYNC_BULK_TENSOR_OPCODE(RED, dim, mode, is_s32, )))

CP_ASYNC_BULK_TENSOR_OPCODE

#define CP_ASYNC_BULK_TENSOR_OPCODE(dir, dim, mode, is_s32, suffix)

Definition NVPTXISelDAGToDAG.cpp:1913

Definition at line 1918 of file NVPTXISelDAGToDAG.cpp.

Referenced by GetCpAsyncBulkTensorS2GReductionOpcode().

◆ PASS_NAME

#define PASS_NAME "NVPTX DAG->DAG Pattern Instruction Selection"

Definition at line 36 of file NVPTXISelDAGToDAG.cpp.

◆ TCGEN05_LD_OPCODE

#define TCGEN05_LD_OPCODE	(		SHAPE,
			NUM )

Value:

(enablePack ? NVPTX::TCGEN05_LD_##SHAPE##_##NUM##_PACK                         \
            : NVPTX::TCGEN05_LD_##SHAPE##_##NUM)

Definition at line 202 of file NVPTXISelDAGToDAG.cpp.

Referenced by getTcgen05LdOpcode().

◆ TCGEN05_ST_OPCODE

#define TCGEN05_ST_OPCODE	(		SHAPE,
			NUM )

Value:

(enableUnpack ? NVPTX::TCGEN05_ST_##SHAPE##_##NUM##_UNPACK                     \
              : NVPTX::TCGEN05_ST_##SHAPE##_##NUM)

Definition at line 1989 of file NVPTXISelDAGToDAG.cpp.

Referenced by getTcgen05StOpcode().

Function Documentation

◆ accumulateOffset()

SDValue accumulateOffset	(	SDValue &	Addr,
		SDLoc	DL,
		SelectionDAG *	DAG )

static

Definition at line 1073 of file NVPTXISelDAGToDAG.cpp.

References DL, llvm::dyn_cast(), llvm::SDNode::getOperand(), llvm::SDValue::getOperand(), llvm::APInt::getSExtValue(), llvm::SelectionDAG::getSignedTargetConstant(), isAddLike(), llvm::APInt::sext(), and stripAssertAlign().

Referenced by selectADDR().

◆ canLowerToLDG()

bool canLowerToLDG	(	const MemSDNode &	N,
		const NVPTXSubtarget &	Subtarget,
		NVPTX::AddressSpace	CodeAddrSpace )

static

Definition at line 781 of file NVPTXISelDAGToDAG.cpp.

References llvm::NVPTX::Global, llvm::NVPTXSubtarget::hasLDG(), and N.

◆ GetCpAsyncBulkTensorS2GReductionOpcode()

unsigned GetCpAsyncBulkTensorS2GReductionOpcode	(	size_t	Dim,
		bool	IsShared32,
		bool	IsCacheHint,
		bool	IsIm2Col )

static

Definition at line 1922 of file NVPTXISelDAGToDAG.cpp.

References D(), GET_CP_ASYNC_BULK_TENSOR_OPCODE_S2G_RED, and llvm_unreachable.

◆ getFenceOp()

unsigned int getFenceOp	(	NVPTX::Ordering	O,
		NVPTX::Scope	S,
		NVPTXSubtarget const *	T )

static

◆ getStoreVectorNumElts()

unsigned getStoreVectorNumElts ( SDNode * N )

static

Definition at line 1182 of file NVPTXISelDAGToDAG.cpp.

References llvm_unreachable, N, llvm::NVPTXISD::StoreV2, llvm::NVPTXISD::StoreV4, and llvm::NVPTXISD::StoreV8.

◆ getTcgen05LdOpcode()

unsigned getTcgen05LdOpcode	(	unsigned	IID,
		bool	enablePack )

static

Definition at line 206 of file NVPTXISelDAGToDAG.cpp.

References llvm_unreachable, and TCGEN05_LD_OPCODE.

◆ getTcgen05StOpcode()

unsigned getTcgen05StOpcode	(	unsigned	IID,
		bool	enableUnpack )

static

Definition at line 1993 of file NVPTXISelDAGToDAG.cpp.

References llvm_unreachable, and TCGEN05_ST_OPCODE.

◆ isAddLike()

bool isAddLike ( const SDValue V )

inline static

Definition at line 1045 of file NVPTXISelDAGToDAG.cpp.

References llvm::ISD::ADD, and llvm::ISD::OR.

Referenced by accumulateOffset().

◆ pickOpcodeForVT()

std::optional< unsigned > pickOpcodeForVT	(	MVT::SimpleValueType	VT,
		std::optional< unsigned >	Opcode_i16,
		std::optional< unsigned >	Opcode_i32,
		std::optional< unsigned >	Opcode_i64 )

static

Definition at line 1020 of file NVPTXISelDAGToDAG.cpp.

◆ resolveScope()

NVPTX::Scope resolveScope	(	NVPTX::Scope	S,
		const NVPTXSubtarget *	T )

static

Definition at line 540 of file NVPTXISelDAGToDAG.cpp.

References llvm::NVPTX::Block, llvm::NVPTX::Cluster, and T.

Referenced by getFenceOp().

◆ selectADDR()

std::pair< SDValue, SDValue > selectADDR	(	SDValue	Addr,
		SelectionDAG *	DAG )

static

Definition at line 1092 of file NVPTXISelDAGToDAG.cpp.

References accumulateOffset(), llvm::sampleprof::Base, llvm::Offset, and selectBaseADDR().

Referenced by llvm::NVPTXDAGToDAGISel::SelectInlineAsmMemoryOperand().

◆ selectBaseADDR()

SDValue selectBaseADDR	(	SDValue	N,
		SelectionDAG *	DAG )

static

Definition at line 1058 of file NVPTXISelDAGToDAG.cpp.

References llvm::dyn_cast(), llvm::SelectionDAG::getTargetExternalSymbol(), llvm::SelectionDAG::getTargetFrameIndex(), llvm::SelectionDAG::getTargetGlobalAddress(), N, and stripAssertAlign().

Referenced by selectADDR().

◆ stripAssertAlign()

SDValue stripAssertAlign ( SDValue N )

static

Definition at line 1050 of file NVPTXISelDAGToDAG.cpp.

References llvm::ISD::AssertAlign, and N.

Referenced by accumulateOffset(), and selectBaseADDR().

Variable Documentation

◆ EnableMADWide

cl::opt< bool > EnableMADWide("nvptx-mad-wide-opt", cl::init(false), cl::Hidden, cl::desc("Enable MAD wide optimization"))

static

◆ EnableRsqrtOpt

cl::opt< bool > EnableRsqrtOpt("nvptx-rsqrt-approx-opt", cl::init(true), cl::Hidden, cl::desc("Enable reciprocal sqrt optimization"))

static

Macros

Functions

Variables

Macro Definition Documentation

◆ CP_ASYNC_BULK_TENSOR_OPCODE

◆ DEBUG_TYPE

◆ GET_CP_ASYNC_BULK_TENSOR_OPCODE_S2G_RED

◆ PASS_NAME

◆ TCGEN05_LD_OPCODE

◆ TCGEN05_ST_OPCODE

Function Documentation

◆ accumulateOffset()

◆ canLowerToLDG()

◆ GetCpAsyncBulkTensorS2GReductionOpcode()

◆ getFenceOp()

◆ getStoreVectorNumElts()

◆ getTcgen05LdOpcode()

◆ getTcgen05StOpcode()

◆ isAddLike()

◆ pickOpcodeForVT()

◆ resolveScope()

◆ selectADDR()

◆ selectBaseADDR()

◆ stripAssertAlign()

Variable Documentation

◆ EnableMADWide

◆ EnableRsqrtOpt