doxygen/MatrixBuilder_8h_source.html

//===- llvm/MatrixBuilder.h - Builder to lower matrix ops -------*- C++ -*-===//

//

// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.

// See https://llvm.org/LICENSE.txt for license information.

// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception

//

//===----------------------------------------------------------------------===//

//

// This file defines the MatrixBuilder class, which is used as a convenient way

// to lower matrix operations to LLVM IR.

//

//===----------------------------------------------------------------------===//


#ifndef LLVM_IR_MATRIXBUILDER_H

#define LLVM_IR_MATRIXBUILDER_H


#include "llvm/IR/Constant.h"

#include "llvm/IR/Constants.h"

#include "llvm/IR/IRBuilder.h"

#include "llvm/IR/InstrTypes.h"

#include "llvm/IR/Instruction.h"

#include "llvm/IR/IntrinsicInst.h"

#include "llvm/IR/Type.h"

#include "llvm/IR/Value.h"

#include "llvm/Support/Alignment.h"


namespace llvm {


class Function;

class Twine;

class Module;


class MatrixBuilder {

  IRBuilderBase &B;

  Module *getModule() { return B.GetInsertBlock()->getParent()->getParent(); }


  std::pair<Value *, Value *> splatScalarOperandIfNeeded(Value *LHS,

                                                         Value *RHS) {

    assert((LHS->getType()->isVectorTy() || RHS->getType()->isVectorTy()) &&

           "One of the operands must be a matrix (embedded in a vector)");

    if (LHS->getType()->isVectorTy() && !RHS->getType()->isVectorTy()) {

      assert(!isa<ScalableVectorType>(LHS->getType()) &&

             "LHS Assumed to be fixed width");

      RHS = B.CreateVectorSplat(

          cast<VectorType>(LHS->getType())->getElementCount(), RHS,

          "scalar.splat");

    } else if (!LHS->getType()->isVectorTy() && RHS->getType()->isVectorTy()) {

      assert(!isa<ScalableVectorType>(RHS->getType()) &&

             "RHS Assumed to be fixed width");

      LHS = B.CreateVectorSplat(

          cast<VectorType>(RHS->getType())->getElementCount(), LHS,

          "scalar.splat");

    }

    return {LHS, RHS};

  }


public:

  MatrixBuilder(IRBuilderBase &Builder) : B(Builder) {}


  /// Create a column major, strided matrix load.

  /// \p EltTy   - Matrix element type

  /// \p DataPtr - Start address of the matrix read

  /// \p Rows    - Number of rows in matrix (must be a constant)

  /// \p Columns - Number of columns in matrix (must be a constant)

  /// \p Stride  - Space between columns

  CallInst *CreateColumnMajorLoad(Type *EltTy, Value *DataPtr, Align Alignment,

                                  Value *Stride, bool IsVolatile, unsigned Rows,

                                  unsigned Columns, const Twine &Name = "") {

    auto *RetType = FixedVectorType::get(EltTy, Rows * Columns);


    Value *Ops[] = {DataPtr, Stride, B.getInt1(IsVolatile), B.getInt32(Rows),

                    B.getInt32(Columns)};

    Type *OverloadedTypes[] = {RetType, Stride->getType()};


    Function *TheFn = Intrinsic::getDeclaration(

        getModule(), Intrinsic::matrix_column_major_load, OverloadedTypes);


    CallInst *Call = B.CreateCall(TheFn->getFunctionType(), TheFn, Ops, Name);

    Attribute AlignAttr =

        Attribute::getWithAlignment(Call->getContext(), Alignment);

    Call->addParamAttr(0, AlignAttr);

    return Call;

  }


  /// Create a column major, strided matrix store.

  /// \p Matrix  - Matrix to store

  /// \p Ptr     - Pointer to write back to

  /// \p Stride  - Space between columns

  CallInst *CreateColumnMajorStore(Value *Matrix, Value *Ptr, Align Alignment,

                                   Value *Stride, bool IsVolatile,

                                   unsigned Rows, unsigned Columns,

                                   const Twine &Name = "") {

    Value *Ops[] = {Matrix,           Ptr,

                    Stride,           B.getInt1(IsVolatile),

                    B.getInt32(Rows), B.getInt32(Columns)};

    Type *OverloadedTypes[] = {Matrix->getType(), Stride->getType()};


    Function *TheFn = Intrinsic::getDeclaration(

        getModule(), Intrinsic::matrix_column_major_store, OverloadedTypes);


    CallInst *Call = B.CreateCall(TheFn->getFunctionType(), TheFn, Ops, Name);

    Attribute AlignAttr =

        Attribute::getWithAlignment(Call->getContext(), Alignment);

    Call->addParamAttr(1, AlignAttr);

    return Call;

  }


  /// Create a llvm.matrix.transpose call, transposing \p Matrix with \p Rows

  /// rows and \p Columns columns.

  CallInst *CreateMatrixTranspose(Value *Matrix, unsigned Rows,

                                  unsigned Columns, const Twine &Name = "") {

    auto *OpType = cast<VectorType>(Matrix->getType());

    auto *ReturnType =

        FixedVectorType::get(OpType->getElementType(), Rows * Columns);


    Type *OverloadedTypes[] = {ReturnType};

    Value *Ops[] = {Matrix, B.getInt32(Rows), B.getInt32(Columns)};

    Function *TheFn = Intrinsic::getDeclaration(

        getModule(), Intrinsic::matrix_transpose, OverloadedTypes);


    return B.CreateCall(TheFn->getFunctionType(), TheFn, Ops, Name);

  }


  /// Create a llvm.matrix.multiply call, multiplying matrixes \p LHS and \p

  /// RHS.

  CallInst *CreateMatrixMultiply(Value *LHS, Value *RHS, unsigned LHSRows,

                                 unsigned LHSColumns, unsigned RHSColumns,

                                 const Twine &Name = "") {

    auto *LHSType = cast<VectorType>(LHS->getType());

    auto *RHSType = cast<VectorType>(RHS->getType());


    auto *ReturnType =

        FixedVectorType::get(LHSType->getElementType(), LHSRows * RHSColumns);


    Value *Ops[] = {LHS, RHS, B.getInt32(LHSRows), B.getInt32(LHSColumns),

                    B.getInt32(RHSColumns)};

    Type *OverloadedTypes[] = {ReturnType, LHSType, RHSType};


    Function *TheFn = Intrinsic::getDeclaration(

        getModule(), Intrinsic::matrix_multiply, OverloadedTypes);

    return B.CreateCall(TheFn->getFunctionType(), TheFn, Ops, Name);

  }


  /// Insert a single element \p NewVal into \p Matrix at indices (\p RowIdx, \p

  /// ColumnIdx).

  Value *CreateMatrixInsert(Value *Matrix, Value *NewVal, Value *RowIdx,

                            Value *ColumnIdx, unsigned NumRows) {

    return B.CreateInsertElement(

        Matrix, NewVal,

        B.CreateAdd(B.CreateMul(ColumnIdx, ConstantInt::get(

                                               ColumnIdx->getType(), NumRows)),

                    RowIdx));

  }


  /// Add matrixes \p LHS and \p RHS. Support both integer and floating point

  /// matrixes.

  Value *CreateAdd(Value *LHS, Value *RHS) {

    assert(LHS->getType()->isVectorTy() || RHS->getType()->isVectorTy());

    if (LHS->getType()->isVectorTy() && !RHS->getType()->isVectorTy()) {

      assert(!isa<ScalableVectorType>(LHS->getType()) &&

             "LHS Assumed to be fixed width");

      RHS = B.CreateVectorSplat(

          cast<VectorType>(LHS->getType())->getElementCount(), RHS,

          "scalar.splat");

    } else if (!LHS->getType()->isVectorTy() && RHS->getType()->isVectorTy()) {

      assert(!isa<ScalableVectorType>(RHS->getType()) &&

             "RHS Assumed to be fixed width");

      LHS = B.CreateVectorSplat(

          cast<VectorType>(RHS->getType())->getElementCount(), LHS,

          "scalar.splat");

    }


    return cast<VectorType>(LHS->getType())

                   ->getElementType()

                   ->isFloatingPointTy()

               ? B.CreateFAdd(LHS, RHS)

               : B.CreateAdd(LHS, RHS);

  }


  /// Subtract matrixes \p LHS and \p RHS. Support both integer and floating

  /// point matrixes.

  Value *CreateSub(Value *LHS, Value *RHS) {

    assert(LHS->getType()->isVectorTy() || RHS->getType()->isVectorTy());

    if (LHS->getType()->isVectorTy() && !RHS->getType()->isVectorTy()) {

      assert(!isa<ScalableVectorType>(LHS->getType()) &&

             "LHS Assumed to be fixed width");

      RHS = B.CreateVectorSplat(

          cast<VectorType>(LHS->getType())->getElementCount(), RHS,

          "scalar.splat");

    } else if (!LHS->getType()->isVectorTy() && RHS->getType()->isVectorTy()) {

      assert(!isa<ScalableVectorType>(RHS->getType()) &&

             "RHS Assumed to be fixed width");

      LHS = B.CreateVectorSplat(

          cast<VectorType>(RHS->getType())->getElementCount(), LHS,

          "scalar.splat");

    }


    return cast<VectorType>(LHS->getType())

                   ->getElementType()

                   ->isFloatingPointTy()

               ? B.CreateFSub(LHS, RHS)

               : B.CreateSub(LHS, RHS);

  }


  /// Multiply matrix \p LHS with scalar \p RHS or scalar \p LHS with matrix \p

  /// RHS.

  Value *CreateScalarMultiply(Value *LHS, Value *RHS) {

    std::tie(LHS, RHS) = splatScalarOperandIfNeeded(LHS, RHS);

    if (LHS->getType()->getScalarType()->isFloatingPointTy())

      return B.CreateFMul(LHS, RHS);

    return B.CreateMul(LHS, RHS);

  }


  /// Divide matrix \p LHS by scalar \p RHS. If the operands are integers, \p

  /// IsUnsigned indicates whether UDiv or SDiv should be used.

  Value *CreateScalarDiv(Value *LHS, Value *RHS, bool IsUnsigned) {

    assert(LHS->getType()->isVectorTy() && !RHS->getType()->isVectorTy());

    assert(!isa<ScalableVectorType>(LHS->getType()) &&

           "LHS Assumed to be fixed width");

    RHS =

        B.CreateVectorSplat(cast<VectorType>(LHS->getType())->getElementCount(),

                            RHS, "scalar.splat");

    return cast<VectorType>(LHS->getType())

                   ->getElementType()

                   ->isFloatingPointTy()

               ? B.CreateFDiv(LHS, RHS)

               : (IsUnsigned ? B.CreateUDiv(LHS, RHS) : B.CreateSDiv(LHS, RHS));

  }


  /// Create an assumption that \p Idx is less than \p NumElements.

  void CreateIndexAssumption(Value *Idx, unsigned NumElements,

                             Twine const &Name = "") {

    Value *NumElts =

        B.getIntN(Idx->getType()->getScalarSizeInBits(), NumElements);

    auto *Cmp = B.CreateICmpULT(Idx, NumElts);

    if (isa<ConstantInt>(Cmp))

      assert(cast<ConstantInt>(Cmp)->isOne() && "Index must be valid!");

    else

      B.CreateAssumption(Cmp);

  }


  /// Compute the index to access the element at (\p RowIdx, \p ColumnIdx) from

  /// a matrix with \p NumRows embedded in a vector.

  Value *CreateIndex(Value *RowIdx, Value *ColumnIdx, unsigned NumRows,

                     Twine const &Name = "") {

    unsigned MaxWidth = std::max(RowIdx->getType()->getScalarSizeInBits(),

                                 ColumnIdx->getType()->getScalarSizeInBits());

    Type *IntTy = IntegerType::get(RowIdx->getType()->getContext(), MaxWidth);

    RowIdx = B.CreateZExt(RowIdx, IntTy);

    ColumnIdx = B.CreateZExt(ColumnIdx, IntTy);

    Value *NumRowsV = B.getIntN(MaxWidth, NumRows);

    return B.CreateAdd(B.CreateMul(ColumnIdx, NumRowsV), RowIdx);

  }

};


} // end namespace llvm


#endif // LLVM_IR_MATRIXBUILDER_H

Alignment.h

Constant.h

Constants.h
This file contains the declarations for the subclasses of Constant, which represent the different fla...

Idx
Returns the sub type a function will return at a given Idx Should correspond to the result type of an ExtractValue instruction executed with just that one unsigned Idx
Definition: DeadArgumentElimination.cpp:352

Name
std::string Name
Definition: ELFObjHandler.cpp:77

IRBuilder.h

Instruction.h

InstrTypes.h

IntrinsicInst.h

Matrix
Live Register Matrix
Definition: LiveRegMatrix.cpp:44

Module
Machine Check Debug Module
Definition: MachineCheckDebugify.cpp:124

assert
assert(ImpDefSCC.getReg()==AMDGPU::SCC &&ImpDefSCC.isDef())

Ptr
@ Ptr
Definition: TargetLibraryInfo.cpp:77

Type.h

Value.h

RHS
Value * RHS
Definition: X86PartialReduction.cpp:76

LHS
Value * LHS
Definition: X86PartialReduction.cpp:75

llvm::Attribute
Definition: Attributes.h:67

llvm::Attribute::getWithAlignment
static Attribute getWithAlignment(LLVMContext &Context, Align Alignment)
Return a uniquified Attribute object that has the specific alignment set.
Definition: Attributes.cpp:232

llvm::CallInst
This class represents a function call, abstracting a target machine's calling convention.
Definition: Instructions.h:1398

llvm::FixedVectorType::get
static FixedVectorType * get(Type *ElementType, unsigned NumElts)
Definition: Type.cpp:692

llvm::Function
Definition: Function.h:64

llvm::Function::getFunctionType
FunctionType * getFunctionType() const
Returns the FunctionType for me.
Definition: Function.h:207

llvm::IRBuilderBase
Common base class shared among various IRBuilders.
Definition: IRBuilder.h:91

llvm::IntegerType::get
static IntegerType * get(LLVMContext &C, unsigned NumBits)
This static method is the primary way of constructing an IntegerType.
Definition: Type.cpp:278

llvm::MatrixBuilder
Definition: MatrixBuilder.h:33

llvm::MatrixBuilder::CreateScalarMultiply
Value * CreateScalarMultiply(Value *LHS, Value *RHS)
Multiply matrix LHS with scalar RHS or scalar LHS with matrix RHS.
Definition: MatrixBuilder.h:207

llvm::MatrixBuilder::CreateScalarDiv
Value * CreateScalarDiv(Value *LHS, Value *RHS, bool IsUnsigned)
Divide matrix LHS by scalar RHS.
Definition: MatrixBuilder.h:216

llvm::MatrixBuilder::CreateSub
Value * CreateSub(Value *LHS, Value *RHS)
Subtract matrixes LHS and RHS.
Definition: MatrixBuilder.h:182

llvm::MatrixBuilder::MatrixBuilder
MatrixBuilder(IRBuilderBase &Builder)
Definition: MatrixBuilder.h:58

llvm::MatrixBuilder::CreateMatrixTranspose
CallInst * CreateMatrixTranspose(Value *Matrix, unsigned Rows, unsigned Columns, const Twine &Name="")
Create a llvm.matrix.transpose call, transposing Matrix with Rows rows and Columns columns.
Definition: MatrixBuilder.h:110

llvm::MatrixBuilder::CreateColumnMajorStore
CallInst * CreateColumnMajorStore(Value *Matrix, Value *Ptr, Align Alignment, Value *Stride, bool IsVolatile, unsigned Rows, unsigned Columns, const Twine &Name="")
Create a column major, strided matrix store.
Definition: MatrixBuilder.h:89

llvm::MatrixBuilder::CreateMatrixInsert
Value * CreateMatrixInsert(Value *Matrix, Value *NewVal, Value *RowIdx, Value *ColumnIdx, unsigned NumRows)
Insert a single element NewVal into Matrix at indices (RowIdx, ColumnIdx).
Definition: MatrixBuilder.h:146

llvm::MatrixBuilder::CreateMatrixMultiply
CallInst * CreateMatrixMultiply(Value *LHS, Value *RHS, unsigned LHSRows, unsigned LHSColumns, unsigned RHSColumns, const Twine &Name="")
Create a llvm.matrix.multiply call, multiplying matrixes LHS and RHS.
Definition: MatrixBuilder.h:126

llvm::MatrixBuilder::CreateIndexAssumption
void CreateIndexAssumption(Value *Idx, unsigned NumElements, Twine const &Name="")
Create an assumption that Idx is less than NumElements.
Definition: MatrixBuilder.h:231

llvm::MatrixBuilder::CreateIndex
Value * CreateIndex(Value *RowIdx, Value *ColumnIdx, unsigned NumRows, Twine const &Name="")
Compute the index to access the element at (RowIdx, ColumnIdx) from a matrix with NumRows embedded in...
Definition: MatrixBuilder.h:244

llvm::MatrixBuilder::CreateColumnMajorLoad
CallInst * CreateColumnMajorLoad(Type *EltTy, Value *DataPtr, Align Alignment, Value *Stride, bool IsVolatile, unsigned Rows, unsigned Columns, const Twine &Name="")
Create a column major, strided matrix load.
Definition: MatrixBuilder.h:66

llvm::MatrixBuilder::CreateAdd
Value * CreateAdd(Value *LHS, Value *RHS)
Add matrixes LHS and RHS.
Definition: MatrixBuilder.h:157

llvm::Module
A Module instance is used to store all the information related to an LLVM module.
Definition: Module.h:65

llvm::Twine
Twine - A lightweight data structure for efficiently representing the concatenation of temporary valu...
Definition: Twine.h:81

llvm::Type
The instances of the Type class are immutable: once they are created, they are never changed.
Definition: Type.h:45

llvm::Type::getScalarSizeInBits
unsigned getScalarSizeInBits() const LLVM_READONLY
If this is a vector type, return the getPrimitiveSizeInBits value for the element type.

llvm::Type::getContext
LLVMContext & getContext() const
Return the LLVMContext in which this type was uniqued.
Definition: Type.h:129

llvm::Value
LLVM Value Representation.
Definition: Value.h:74

llvm::Value::getType
Type * getType() const
All values are typed, get the type of this value.
Definition: Value.h:255

llvm::Intrinsic::getDeclaration
Function * getDeclaration(Module *M, ID id, ArrayRef< Type * > Tys=std::nullopt)
Create or insert an LLVM Function declaration for an intrinsic, and return it.
Definition: Function.cpp:1513

llvm::codeview::PublicSymFlags::Function
@ Function

llvm
This is an optimization pass for GlobalISel generic memory operations.
Definition: AddressRanges.h:18

llvm::Align
This struct is a compact representation of a valid (non-zero power of two) alignment.
Definition: Alignment.h:39