doxygen/AMDGPULowerKernelArguments_8cpp_source.html

//===-- AMDGPULowerKernelArguments.cpp ------------------------------------------===//

//

// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.

// See https://llvm.org/LICENSE.txt for license information.

// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception

//

//===----------------------------------------------------------------------===//

//

/// \file This pass replaces accesses to kernel arguments with loads from

/// offsets from the kernarg base pointer.

//

//===----------------------------------------------------------------------===//


#include "AMDGPU.h"

#include "GCNSubtarget.h"

#include "llvm/CodeGen/TargetPassConfig.h"

#include "llvm/IR/IRBuilder.h"

#include "llvm/IR/IntrinsicsAMDGPU.h"

#include "llvm/IR/MDBuilder.h"

#include "llvm/Target/TargetMachine.h"


#define DEBUG_TYPE "amdgpu-lower-kernel-arguments"


using namespace llvm;


namespace {


class PreloadKernelArgInfo {

private:

  Function &F;

  const GCNSubtarget &ST;

  unsigned NumFreeUserSGPRs;


public:

  SmallVector<llvm::Metadata *, 8> KernelArgMetadata;


  PreloadKernelArgInfo(Function &F, const GCNSubtarget &ST) : F(F), ST(ST) {

    setInitialFreeUserSGPRsCount();

  }


  // Returns the maximum number of user SGPRs that we have available to preload

  // arguments.

  void setInitialFreeUserSGPRsCount() {

    const unsigned MaxUserSGPRs = ST.getMaxNumUserSGPRs();

    GCNUserSGPRUsageInfo UserSGPRInfo(F, ST);


    NumFreeUserSGPRs = MaxUserSGPRs - UserSGPRInfo.getNumUsedUserSGPRs();

  }


  bool tryAllocPreloadSGPRs(unsigned AllocSize, uint64_t ArgOffset,

                            uint64_t LastExplicitArgOffset) {

    //  Check if this argument may be loaded into the same register as the

    //  previous argument.

    if (!isAligned(Align(4), ArgOffset) && AllocSize < 4)

      return true;


    // Pad SGPRs for kernarg alignment.

    unsigned Padding = ArgOffset - LastExplicitArgOffset;

    unsigned PaddingSGPRs = alignTo(Padding, 4) / 4;

    unsigned NumPreloadSGPRs = alignTo(AllocSize, 4) / 4;

    if (NumPreloadSGPRs + PaddingSGPRs > NumFreeUserSGPRs)

      return false;


    NumFreeUserSGPRs -= (NumPreloadSGPRs + PaddingSGPRs);

    return true;

  }

};


/// Legacy pass-manager wrapper; the actual work is done by the file-local
/// lowerKernelArguments() helper, reached through runOnFunction().
class AMDGPULowerKernelArguments : public FunctionPass {
public:
  /// Pass identifier handed to the FunctionPass base class.
  static char ID;

  AMDGPULowerKernelArguments() : FunctionPass(ID) {}

  /// Requires TargetPassConfig (used to reach the TargetMachine) and declares
  /// all analyses preserved.
  void getAnalysisUsage(AnalysisUsage &AU) const override {
    AU.addRequired<TargetPassConfig>();
    AU.setPreservesAll();
  }

  bool runOnFunction(Function &F) override;
};


} // end anonymous namespace


// skip allocas

/// Returns the position in \p BB where kernarg loads should be inserted:
/// the first insertion point, advanced past any leading run of static
/// allocas. May return BB.end() if the block holds nothing else.
static BasicBlock::iterator getInsertPt(BasicBlock &BB) {
  BasicBlock::iterator Pos = BB.getFirstInsertionPt();
  BasicBlock::iterator End = BB.end();

  while (Pos != End) {
    AllocaInst *Alloca = dyn_cast<AllocaInst>(&*Pos);

    // Stop at the first non-alloca. Also stop at a dynamic alloca: its size
    // may depend on the loaded kernargs, so the loads must precede it.
    const bool IsStaticAlloca = Alloca && Alloca->isStaticAlloca();
    if (!IsStaticAlloca)
      break;

    ++Pos;
  }

  return Pos;
}


/// Rewrites uses of the arguments of an AMDGPU_KERNEL function \p F into
/// explicit loads from the kernarg segment pointer.
///
/// A call to the amdgcn_kernarg_segment_ptr intrinsic is emitted in the entry
/// block (after any leading static allocas), and each used argument is
/// replaced by a load at its computed byte offset from that pointer. Arguments
/// that are successfully assigned preload SGPRs, unused arguments, noalias
/// pointers, and LDS/region pointers on subtargets without a usable DS offset
/// are left untouched.
///
/// \returns false (without modifying \p F) if \p F is not an AMDGPU_KERNEL,
/// has no arguments, or has a zero-sized kernarg segment; true otherwise.
static bool lowerKernelArguments(Function &F, const TargetMachine &TM) {

  CallingConv::ID CC = F.getCallingConv();

  if (CC != CallingConv::AMDGPU_KERNEL || F.arg_empty())

    return false;


  const GCNSubtarget &ST = TM.getSubtarget<GCNSubtarget>(F);

  LLVMContext &Ctx = F.getParent()->getContext();

  const DataLayout &DL = F.getParent()->getDataLayout();

  BasicBlock &EntryBlock = *F.begin();

  // All new instructions go into the entry block, after leading static allocas.
  IRBuilder<> Builder(&EntryBlock, getInsertPt(EntryBlock));


  const Align KernArgBaseAlign(16); // FIXME: Increase if necessary

  // Offset added to every argument's position within the kernarg segment.
  const uint64_t BaseOffset = ST.getExplicitKernelArgOffset();


  Align MaxAlign;

  // FIXME: Alignment is broken with explicit arg offset.

  const uint64_t TotalKernArgSize = ST.getKernArgSegmentSize(F, MaxAlign);

  if (TotalKernArgSize == 0)

    return false;


  CallInst *KernArgSegment =

      Builder.CreateIntrinsic(Intrinsic::amdgcn_kernarg_segment_ptr, {}, {},

                              nullptr, F.getName() + ".kernarg.segment");


  // The segment pointer is known non-null and dereferenceable for the whole
  // kernarg segment size.
  KernArgSegment->addRetAttr(Attribute::NonNull);

  KernArgSegment->addRetAttr(

      Attribute::getWithDereferenceableBytes(Ctx, TotalKernArgSize));


  // Running end offset of the explicit arguments laid out so far (BaseOffset
  // not included).
  uint64_t ExplicitArgOffset = 0;

  // Preloaded kernel arguments must be sequential.

  bool InPreloadSequence = true;

  PreloadKernelArgInfo PreloadInfo(F, ST);


  for (Argument &Arg : F.args()) {

    const bool IsByRef = Arg.hasByRefAttr();

    Type *ArgTy = IsByRef ? Arg.getParamByRefType() : Arg.getType();

    MaybeAlign ParamAlign = IsByRef ? Arg.getParamAlign() : std::nullopt;

    Align ABITypeAlign = DL.getValueOrABITypeAlignment(ParamAlign, ArgTy);


    uint64_t Size = DL.getTypeSizeInBits(ArgTy);

    uint64_t AllocSize = DL.getTypeAllocSize(ArgTy);


    // EltOffset: byte offset of this argument from the segment pointer.
    // LastExplicitArgOffset: where the previous argument ended, before
    // alignment padding for this one.
    uint64_t EltOffset = alignTo(ExplicitArgOffset, ABITypeAlign) + BaseOffset;

    uint64_t LastExplicitArgOffset = ExplicitArgOffset;

    ExplicitArgOffset = alignTo(ExplicitArgOffset, ABITypeAlign) + AllocSize;


    // Try to preload this argument into user SGPRs.

    if (Arg.hasInRegAttr() && InPreloadSequence && ST.hasKernargPreload() &&

        !Arg.getType()->isAggregateType())

      if (PreloadInfo.tryAllocPreloadSGPRs(AllocSize, EltOffset,

                                           LastExplicitArgOffset))

        continue;


    // The first argument that is not preloaded ends the preload sequence.
    InPreloadSequence = false;


    if (Arg.use_empty())

      continue;


    // If this is byref, the loads are already explicit in the function. We just

    // need to rewrite the pointer values.

    if (IsByRef) {

      Value *ArgOffsetPtr = Builder.CreateConstInBoundsGEP1_64(

          Builder.getInt8Ty(), KernArgSegment, EltOffset,

          Arg.getName() + ".byval.kernarg.offset");


      Value *CastOffsetPtr =

          Builder.CreateAddrSpaceCast(ArgOffsetPtr, Arg.getType());

      Arg.replaceAllUsesWith(CastOffsetPtr);

      continue;

    }


    if (PointerType *PT = dyn_cast<PointerType>(ArgTy)) {

      // FIXME: Hack. We rely on AssertZext to be able to fold DS addressing

      // modes on SI to know the high bits are 0 so pointer adds don't wrap. We

      // can't represent this with range metadata because it's only allowed for

      // integer types.

      if ((PT->getAddressSpace() == AMDGPUAS::LOCAL_ADDRESS ||

           PT->getAddressSpace() == AMDGPUAS::REGION_ADDRESS) &&

          !ST.hasUsableDSOffset())

        continue;


      // FIXME: We can replace this with equivalent alias.scope/noalias

      // metadata, but this appears to be a lot of work.

      if (Arg.hasNoAliasAttr())

        continue;

    }


    auto *VT = dyn_cast<FixedVectorType>(ArgTy);

    bool IsV3 = VT && VT->getNumElements() == 3;

    // Sub-dword, non-aggregate arguments are loaded as a full i32 and the
    // relevant bits extracted afterwards.
    bool DoShiftOpt = Size < 32 && !ArgTy->isAggregateType();


    VectorType *V4Ty = nullptr;


    // Dword-aligned offset at or below EltOffset, and the byte distance
    // between the two (used as the shift amount in the DoShiftOpt path).
    int64_t AlignDownOffset = alignDown(EltOffset, 4);

    int64_t OffsetDiff = EltOffset - AlignDownOffset;

    Align AdjustedAlign = commonAlignment(

        KernArgBaseAlign, DoShiftOpt ? AlignDownOffset : EltOffset);


    Value *ArgPtr;

    Type *AdjustedArgTy;

    if (DoShiftOpt) { // FIXME: Handle aggregate types

      // Since we don't have sub-dword scalar loads, avoid doing an extload by

      // loading earlier than the argument address, and extracting the relevant

      // bits.

      // TODO: Update this for GFX12 which does have scalar sub-dword loads.

      //

      // Additionally widen any sub-dword load to i32 even if suitably aligned,

      // so that CSE between different argument loads works easily.

      ArgPtr = Builder.CreateConstInBoundsGEP1_64(

          Builder.getInt8Ty(), KernArgSegment, AlignDownOffset,

          Arg.getName() + ".kernarg.offset.align.down");

      AdjustedArgTy = Builder.getInt32Ty();

    } else {

      ArgPtr = Builder.CreateConstInBoundsGEP1_64(

          Builder.getInt8Ty(), KernArgSegment, EltOffset,

          Arg.getName() + ".kernarg.offset");

      AdjustedArgTy = ArgTy;

    }


    // 3-element vectors of at least 32 bits are loaded as 4-element vectors
    // and narrowed with a shuffle below.
    if (IsV3 && Size >= 32) {

      V4Ty = FixedVectorType::get(VT->getElementType(), 4);

      // Use the hack that clang uses to avoid SelectionDAG ruining v3 loads

      AdjustedArgTy = V4Ty;

    }


    LoadInst *Load =

        Builder.CreateAlignedLoad(AdjustedArgTy, ArgPtr, AdjustedAlign);

    // Every kernarg load is tagged with !invariant.load.
    Load->setMetadata(LLVMContext::MD_invariant_load, MDNode::get(Ctx, {}));


    MDBuilder MDB(Ctx);


    // For pointer arguments, carry the argument's nonnull, dereferenceable,
    // dereferenceable_or_null and align attributes over to the load as
    // metadata.
    if (isa<PointerType>(ArgTy)) {

      if (Arg.hasNonNullAttr())

        Load->setMetadata(LLVMContext::MD_nonnull, MDNode::get(Ctx, {}));


      uint64_t DerefBytes = Arg.getDereferenceableBytes();

      if (DerefBytes != 0) {

        Load->setMetadata(

          LLVMContext::MD_dereferenceable,

          MDNode::get(Ctx,

                      MDB.createConstant(

                        ConstantInt::get(Builder.getInt64Ty(), DerefBytes))));

      }


      uint64_t DerefOrNullBytes = Arg.getDereferenceableOrNullBytes();

      if (DerefOrNullBytes != 0) {

        Load->setMetadata(

          LLVMContext::MD_dereferenceable_or_null,

          MDNode::get(Ctx,

                      MDB.createConstant(ConstantInt::get(Builder.getInt64Ty(),

                                                          DerefOrNullBytes))));

      }


      if (MaybeAlign ParamAlign = Arg.getParamAlign()) {

        Load->setMetadata(

            LLVMContext::MD_align,

            MDNode::get(Ctx, MDB.createConstant(ConstantInt::get(

                                 Builder.getInt64Ty(), ParamAlign->value()))));

      }

    }


    // TODO: Convert noalias arg to !noalias


    // Replace the argument's uses with the loaded value. DoShiftOpt is tested
    // first, so a sub-dword 3-element vector takes the shift path rather than
    // the shuffle path.
    if (DoShiftOpt) {

      // Shift the wanted bytes down to bit 0, truncate to the argument's bit
      // width, then bitcast to the argument type.
      Value *ExtractBits = OffsetDiff == 0 ?

        Load : Builder.CreateLShr(Load, OffsetDiff * 8);


      IntegerType *ArgIntTy = Builder.getIntNTy(Size);

      Value *Trunc = Builder.CreateTrunc(ExtractBits, ArgIntTy);

      Value *NewVal = Builder.CreateBitCast(Trunc, ArgTy,

                                            Arg.getName() + ".load");

      Arg.replaceAllUsesWith(NewVal);

    } else if (IsV3) {

      // Keep the first three lanes of the widened 4-element load.
      Value *Shuf = Builder.CreateShuffleVector(Load, ArrayRef<int>{0, 1, 2},

                                                Arg.getName() + ".load");

      Arg.replaceAllUsesWith(Shuf);

    } else {

      Load->setName(Arg.getName() + ".load");

      Arg.replaceAllUsesWith(Load);

    }

  }


  // Advertise the segment pointer's alignment: at least KernArgBaseAlign, or
  // MaxAlign as reported by getKernArgSegmentSize if that is larger.
  KernArgSegment->addRetAttr(

      Attribute::getWithAlignment(Ctx, std::max(KernArgBaseAlign, MaxAlign)));


  return true;

}


/// Legacy pass entry point: fetches the TargetMachine from the required
/// TargetPassConfig analysis and forwards to lowerKernelArguments().
/// \returns whatever lowerKernelArguments() returns for \p F.
bool AMDGPULowerKernelArguments::runOnFunction(Function &F) {
  const TargetMachine &Machine =
      getAnalysis<TargetPassConfig>().getTM<TargetMachine>();
  return lowerKernelArguments(F, Machine);
}


// Legacy pass registration for AMDGPULowerKernelArguments. The macro
// arguments are (passName, arg, name, cfg, analysis): the pass is registered
// under DEBUG_TYPE ("amdgpu-lower-kernel-arguments") with the description
// "AMDGPU Lower Kernel Arguments", and both the cfg and analysis flags are
// false. Nothing is declared between BEGIN and END.
INITIALIZE_PASS_BEGIN(AMDGPULowerKernelArguments, DEBUG_TYPE,

                      "AMDGPU Lower Kernel Arguments", false, false)

INITIALIZE_PASS_END(AMDGPULowerKernelArguments, DEBUG_TYPE, "AMDGPU Lower Kernel Arguments",

                    false, false)


// Out-of-class definition of the static pass ID that the constructor passes to
// FunctionPass. NOTE(review): presumably only its address matters, not the
// value 0 -- confirm against the pass infrastructure.
char AMDGPULowerKernelArguments::ID = 0;


/// Factory for the legacy-pass-manager version of this pass.
/// \returns a newly heap-allocated AMDGPULowerKernelArguments instance.
/// NOTE(review): presumably the pass manager it is added to takes ownership --
/// confirm at the call sites.
FunctionPass *llvm::createAMDGPULowerKernelArgumentsPass() {
  return new AMDGPULowerKernelArguments;
}


/// New pass-manager entry point: lowers the kernel arguments of \p F using the
/// pass's TM member.
/// \returns PreservedAnalyses::all() when nothing changed; otherwise a set
/// that preserves only the CFG analyses.
PreservedAnalyses
AMDGPULowerKernelArgumentsPass::run(Function &F, FunctionAnalysisManager &AM) {
  if (!lowerKernelArguments(F, TM))
    return PreservedAnalyses::all();

  // TODO: Preserves a lot more.
  PreservedAnalyses PA;
  PA.preserveSet<CFGAnalyses>();
  return PA;
}

DL
MachineBasicBlock MachineBasicBlock::iterator DebugLoc DL
Definition: AArch64SLSHardening.cpp:74

Arguments
AMDGPU Lower Kernel Arguments
Definition: AMDGPULowerKernelArguments.cpp:296

getInsertPt
static BasicBlock::iterator getInsertPt(BasicBlock &BB)
Definition: AMDGPULowerKernelArguments.cpp:86

lowerKernelArguments
static bool lowerKernelArguments(Function &F, const TargetMachine &TM)
Definition: AMDGPULowerKernelArguments.cpp:100

DEBUG_TYPE
#define DEBUG_TYPE
Definition: AMDGPULowerKernelArguments.cpp:22

AMDGPU.h

Size
uint64_t Size
Definition: ELFObjHandler.cpp:81

GCNSubtarget.h
AMD GCN specific subclass of TargetSubtarget.

IRBuilder.h

F
#define F(x, y, z)
Definition: MD5.cpp:55

MDBuilder.h

TM
const char LLVMTargetMachineRef TM
Definition: PassBuilderBindings.cpp:47

INITIALIZE_PASS_END
#define INITIALIZE_PASS_END(passName, arg, name, cfg, analysis)
Definition: PassSupport.h:59

INITIALIZE_PASS_BEGIN
#define INITIALIZE_PASS_BEGIN(passName, arg, name, cfg, analysis)
Definition: PassSupport.h:52

CC
auto CC
Definition: RISCVRedundantCopyElimination.cpp:79

TargetPassConfig.h
Target-Independent Code Generator Pass Configuration Options pass.

PointerType
Definition: ItaniumDemangle.h:612

VectorType
Definition: ItaniumDemangle.h:1149

llvm::AMDGPULowerKernelArgumentsPass::run
PreservedAnalyses run(Function &, FunctionAnalysisManager &)
Definition: AMDGPULowerKernelArguments.cpp:306

llvm::AllocaInst
an instruction to allocate memory on the stack
Definition: Instructions.h:59

llvm::AllocaInst::isStaticAlloca
bool isStaticAlloca() const
Return true if this alloca is in the entry block of the function and is a constant size.
Definition: Instructions.cpp:1539

llvm::AnalysisManager
A container for analyses that lazily runs them and caches their results.
Definition: PassManager.h:321

llvm::AnalysisUsage
Represent the analysis usage information of a pass.
Definition: PassAnalysisSupport.h:47

llvm::AnalysisUsage::addRequired
AnalysisUsage & addRequired()
Definition: PassAnalysisSupport.h:75

llvm::AnalysisUsage::setPreservesAll
void setPreservesAll()
Set by analyses that do not transform their input at all.
Definition: PassAnalysisSupport.h:130

llvm::Argument
This class represents an incoming formal argument to a Function.
Definition: Argument.h:31

llvm::ArrayRef
ArrayRef - Represent a constant reference to an array (0 or more elements consecutively in memory),...
Definition: ArrayRef.h:41

llvm::Attribute::getWithDereferenceableBytes
static Attribute getWithDereferenceableBytes(LLVMContext &Context, uint64_t Bytes)
Definition: Attributes.cpp:204

llvm::Attribute::getWithAlignment
static Attribute getWithAlignment(LLVMContext &Context, Align Alignment)
Return a uniquified Attribute object that has the specific alignment set.
Definition: Attributes.cpp:194

llvm::BasicBlock
LLVM Basic Block Representation.
Definition: BasicBlock.h:60

llvm::BasicBlock::end
iterator end()
Definition: BasicBlock.h:443

llvm::BasicBlock::getFirstInsertionPt
const_iterator getFirstInsertionPt() const
Returns an iterator to the first instruction in this block that is suitable for inserting a non-PHI i...
Definition: BasicBlock.cpp:409

llvm::BasicBlock::iterator
InstListType::iterator iterator
Instruction iterators...
Definition: BasicBlock.h:165

llvm::CFGAnalyses
Represents analyses that only rely on functions' control flow.
Definition: Analysis.h:70

llvm::CallBase::addRetAttr
void addRetAttr(Attribute::AttrKind Kind)
Adds the attribute to the return value.
Definition: InstrTypes.h:1861

llvm::CallInst
This class represents a function call, abstracting a target machine's calling convention.
Definition: Instructions.h:1565

llvm::DataLayout
A parsed version of the target data layout string, and methods for querying it.
Definition: DataLayout.h:110

llvm::FixedVectorType::get
static FixedVectorType * get(Type *ElementType, unsigned NumElts)
Definition: Type.cpp:692

llvm::FunctionPass
FunctionPass class - This class is used to implement most global optimizations.
Definition: Pass.h:311

llvm::FunctionPass::runOnFunction
virtual bool runOnFunction(Function &F)=0
runOnFunction - Virtual method overridden by subclasses to do the per-function processing of the pass.

llvm::Function
Definition: Function.h:62

llvm::GCNSubtarget
Definition: GCNSubtarget.h:35

llvm::GCNUserSGPRUsageInfo
Definition: GCNSubtarget.h:1527

llvm::GCNUserSGPRUsageInfo::getNumUsedUserSGPRs
unsigned getNumUsedUserSGPRs() const
Definition: GCNSubtarget.h:1545

llvm::IRBuilderBase::getIntNTy
IntegerType * getIntNTy(unsigned N)
Fetch the type representing an N-bit integer.
Definition: IRBuilder.h:539

llvm::IRBuilderBase::CreateAlignedLoad
LoadInst * CreateAlignedLoad(Type *Ty, Value *Ptr, MaybeAlign Align, const char *Name)
Definition: IRBuilder.h:1807

llvm::IRBuilderBase::CreateIntrinsic
CallInst * CreateIntrinsic(Intrinsic::ID ID, ArrayRef< Type * > Types, ArrayRef< Value * > Args, Instruction *FMFSource=nullptr, const Twine &Name="")
Create a call to intrinsic ID with Args, mangled using Types.
Definition: IRBuilder.cpp:932

llvm::IRBuilderBase::CreateLShr
Value * CreateLShr(Value *LHS, Value *RHS, const Twine &Name="", bool isExact=false)
Definition: IRBuilder.h:1437

llvm::IRBuilderBase::getInt32Ty
IntegerType * getInt32Ty()
Fetch the type representing a 32-bit integer.
Definition: IRBuilder.h:526

llvm::IRBuilderBase::getInt64Ty
IntegerType * getInt64Ty()
Fetch the type representing a 64-bit integer.
Definition: IRBuilder.h:531

llvm::IRBuilderBase::CreateBitCast
Value * CreateBitCast(Value *V, Type *DestTy, const Twine &Name="")
Definition: IRBuilder.h:2127

llvm::IRBuilderBase::CreateShuffleVector
Value * CreateShuffleVector(Value *V1, Value *V2, Value *Mask, const Twine &Name="")
Definition: IRBuilder.h:2494

llvm::IRBuilderBase::CreateTrunc
Value * CreateTrunc(Value *V, Type *DestTy, const Twine &Name="", bool IsNUW=false, bool IsNSW=false)
Definition: IRBuilder.h:2007

llvm::IRBuilderBase::CreateConstInBoundsGEP1_64
Value * CreateConstInBoundsGEP1_64(Type *Ty, Value *Ptr, uint64_t Idx0, const Twine &Name="")
Definition: IRBuilder.h:1937

llvm::IRBuilderBase::getInt8Ty
IntegerType * getInt8Ty()
Fetch the type representing an 8-bit integer.
Definition: IRBuilder.h:516

llvm::IRBuilderBase::CreateAddrSpaceCast
Value * CreateAddrSpaceCast(Value *V, Type *DestTy, const Twine &Name="")
Definition: IRBuilder.h:2132

llvm::IRBuilder
This provides a uniform API for creating instructions and inserting them into a basic block: either a...
Definition: IRBuilder.h:2666

llvm::IntegerType
Class to represent integer types.
Definition: DerivedTypes.h:40

llvm::LLVMContext
This is an important class for using LLVM in a threaded context.
Definition: LLVMContext.h:67

llvm::LoadInst
An instruction for reading from memory.
Definition: Instructions.h:184

llvm::MDBuilder
Definition: MDBuilder.h:36

llvm::MDBuilder::createConstant
ConstantAsMetadata * createConstant(Constant *C)
Return the given constant as metadata.
Definition: MDBuilder.cpp:24

llvm::MDNode::get
static MDTuple * get(LLVMContext &Context, ArrayRef< Metadata * > MDs)
Definition: Metadata.h:1541

llvm::Pass::getAnalysisUsage
virtual void getAnalysisUsage(AnalysisUsage &) const
getAnalysisUsage - This function should be overridden by passes that need analysis information to do t...
Definition: Pass.cpp:98

llvm::PreservedAnalyses
A set of analyses that are preserved following a run of a transformation pass.
Definition: Analysis.h:109

llvm::PreservedAnalyses::all
static PreservedAnalyses all()
Construct a special preserved set that preserves all passes.
Definition: Analysis.h:115

llvm::PreservedAnalyses::preserveSet
void preserveSet()
Mark an analysis set as preserved.
Definition: Analysis.h:144

llvm::SmallVector
This is a 'vector' (really, a variable-sized array), optimized for the case when the array is small.
Definition: SmallVector.h:1209

llvm::TargetMachine
Primary interface to the complete machine description for the target machine.
Definition: TargetMachine.h:76

llvm::TargetPassConfig
Target-Independent Code Generator Pass Configuration Options.
Definition: TargetPassConfig.h:85

llvm::Type
The instances of the Type class are immutable: once they are created, they are never changed.
Definition: Type.h:45

llvm::Type::isAggregateType
bool isAggregateType() const
Return true if the type is an aggregate type.
Definition: Type.h:295

llvm::Value
LLVM Value Representation.
Definition: Value.h:74

llvm::Value::getType
Type * getType() const
All values are typed, get the type of this value.
Definition: Value.h:255

llvm::Value::replaceAllUsesWith
void replaceAllUsesWith(Value *V)
Change all uses of this to point to a new Value.
Definition: Value.cpp:534

llvm::Value::getName
StringRef getName() const
Return a constant reference to the value's name.
Definition: Value.cpp:309

uint64_t

unsigned

TargetMachine.h

false
Definition: StackSlotColoring.cpp:184

llvm::AMDGPUAS::REGION_ADDRESS
@ REGION_ADDRESS
Address space for region memory. (GDS)
Definition: AMDGPUAddrSpace.h:32

llvm::AMDGPUAS::LOCAL_ADDRESS
@ LOCAL_ADDRESS
Address space for local memory.
Definition: AMDGPUAddrSpace.h:35

llvm::CallingConv::ID
unsigned ID
LLVM IR allows to use arbitrary numbers as calling convention identifiers.
Definition: CallingConv.h:24

llvm::CallingConv::AMDGPU_KERNEL
@ AMDGPU_KERNEL
Used for AMDGPU code object kernels.
Definition: CallingConv.h:200

llvm
This is an optimization pass for GlobalISel generic memory operations.
Definition: AddressRanges.h:18

llvm::isAligned
bool isAligned(Align Lhs, uint64_t SizeInBytes)
Checks that SizeInBytes is a multiple of the alignment.
Definition: Alignment.h:145

llvm::HexPrintStyle::Lower
@ Lower

llvm::createAMDGPULowerKernelArgumentsPass
FunctionPass * createAMDGPULowerKernelArgumentsPass()
Definition: AMDGPULowerKernelArguments.cpp:301

llvm::alignTo
uint64_t alignTo(uint64_t Size, Align A)
Returns a multiple of A needed to store Size bytes.
Definition: Alignment.h:155

llvm::commonAlignment
Align commonAlignment(Align A, uint64_t Offset)
Returns the alignment that satisfies both alignments.
Definition: Alignment.h:212

llvm::alignDown
uint64_t alignDown(uint64_t Value, uint64_t Align, uint64_t Skew=0)
Returns the largest uint64_t less than or equal to Value and is Skew mod Align.
Definition: MathExtras.h:439

llvm::Align
This struct is a compact representation of a valid (non-zero power of two) alignment.
Definition: Alignment.h:39

llvm::MaybeAlign
This struct is a compact representation of a valid (power of two) or undefined (0) alignment.
Definition: Alignment.h:117