blob: ab92f86ebb4eed437e8bdaa08ac4081a340fef8d [file] [log] [blame]
//===- llvm/MatrixBuilder.h - Builder to lower matrix ops -------*- C++ -*-===//
//
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
// See https://llvm.org/LICENSE.txt for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
//
//===----------------------------------------------------------------------===//
//
// This file defines the MatrixBuilder class, which is used as a convenient way
// to lower matrix operations to LLVM IR.
//
//===----------------------------------------------------------------------===//
#ifndef LLVM_IR_MATRIXBUILDER_H
#define LLVM_IR_MATRIXBUILDER_H
#include "llvm/IR/Constant.h"
#include "llvm/IR/Constants.h"
#include "llvm/IR/IRBuilder.h"
#include "llvm/IR/InstrTypes.h"
#include "llvm/IR/Instruction.h"
#include "llvm/IR/IntrinsicInst.h"
#include "llvm/IR/Type.h"
#include "llvm/IR/Value.h"
namespace llvm {
class Function;
class Twine;
class Module;
template <class IRBuilderTy> class MatrixBuilder {
IRBuilderTy &B;
Module *getModule() { return B.GetInsertBlock()->getParent()->getParent(); }
public:
MatrixBuilder(IRBuilderTy &Builder) : B(Builder) {}
/// Create a columnwise, strided matrix load.
/// \p DataPtr - Start address of the matrix read
/// \p Rows - Number of rows in matrix (must be a constant)
/// \p Columns - Number of columns in matrix (must be a constant)
/// \p Stride - Space between columns
CallInst *CreateMatrixColumnwiseLoad(Value *DataPtr, unsigned Rows,
unsigned Columns, Value *Stride,
const Twine &Name = "") {
// Deal with the pointer
PointerType *PtrTy = cast<PointerType>(DataPtr->getType());
Type *EltTy = PtrTy->getElementType();
Type *RetType = VectorType::get(EltTy, Rows * Columns);
Value *Ops[] = {DataPtr, Stride, B.getInt32(Rows), B.getInt32(Columns)};
Type *OverloadedTypes[] = {RetType, PtrTy};
Function *TheFn = Intrinsic::getDeclaration(
getModule(), Intrinsic::matrix_columnwise_load, OverloadedTypes);
return B.CreateCall(TheFn->getFunctionType(), TheFn, Ops, Name);
}
/// Create a columnwise, strided matrix store.
/// \p Matrix - Matrix to store
/// \p Ptr - Pointer to write back to
/// \p Stride - Space between columns
CallInst *CreateMatrixColumnwiseStore(Value *Matrix, Value *Ptr,
Value *Stride, unsigned Rows,
unsigned Columns,
const Twine &Name = "") {
Value *Ops[] = {Matrix, Ptr, Stride, B.getInt32(Rows), B.getInt32(Columns)};
Type *OverloadedTypes[] = {Matrix->getType(), Ptr->getType()};
Function *TheFn = Intrinsic::getDeclaration(
getModule(), Intrinsic::matrix_columnwise_store, OverloadedTypes);
return B.CreateCall(TheFn->getFunctionType(), TheFn, Ops, Name);
}
/// Create a llvm.matrix.transpose call, transposing \p Matrix with \p Rows
/// rows and \p Columns columns.
CallInst *CreateMatrixTranspose(Value *Matrix, unsigned Rows,
unsigned Columns, const Twine &Name = "") {
auto *OpType = cast<VectorType>(Matrix->getType());
Type *ReturnType =
VectorType::get(OpType->getElementType(), Rows * Columns);
Type *OverloadedTypes[] = {ReturnType};
Value *Ops[] = {Matrix, B.getInt32(Rows), B.getInt32(Columns)};
Function *TheFn = Intrinsic::getDeclaration(
getModule(), Intrinsic::matrix_transpose, OverloadedTypes);
return B.CreateCall(TheFn->getFunctionType(), TheFn, Ops, Name);
}
/// Create a llvm.matrix.multiply call, multiplying matrixes \p LHS and \p
/// RHS.
CallInst *CreateMatrixMultiply(Value *LHS, Value *RHS, unsigned LHSRows,
unsigned LHSColumns, unsigned RHSColumns,
const Twine &Name = "") {
auto *LHSType = cast<VectorType>(LHS->getType());
auto *RHSType = cast<VectorType>(RHS->getType());
Type *ReturnType =
VectorType::get(LHSType->getElementType(), LHSRows * RHSColumns);
Value *Ops[] = {LHS, RHS, B.getInt32(LHSRows), B.getInt32(LHSColumns),
B.getInt32(RHSColumns)};
Type *OverloadedTypes[] = {ReturnType, LHSType, RHSType};
Function *TheFn = Intrinsic::getDeclaration(
getModule(), Intrinsic::matrix_multiply, OverloadedTypes);
return B.CreateCall(TheFn->getFunctionType(), TheFn, Ops, Name);
}
/// Insert a single element \p NewVal into \p Matrix at indices (\p RowIdx, \p
/// ColumnIdx).
Value *CreateMatrixInsert(Value *Matrix, Value *NewVal, Value *RowIdx,
Value *ColumnIdx, unsigned NumRows) {
return B.CreateInsertElement(
Matrix, NewVal,
B.CreateAdd(B.CreateMul(ColumnIdx, ConstantInt::get(
ColumnIdx->getType(), NumRows)),
RowIdx));
}
/// Add matrixes \p LHS and \p RHS. Support both integer and floating point
/// matrixes.
Value *CreateAdd(Value *LHS, Value *RHS) {
return cast<VectorType>(LHS->getType())
->getElementType()
->isFloatingPointTy()
? B.CreateFAdd(LHS, RHS)
: B.CreateAdd(LHS, RHS);
}
/// Subtract matrixes \p LHS and \p RHS. Support both integer and floating
/// point matrixes.
Value *CreateSub(Value *LHS, Value *RHS) {
return cast<VectorType>(LHS->getType())
->getElementType()
->isFloatingPointTy()
? B.CreateFSub(LHS, RHS)
: B.CreateSub(LHS, RHS);
}
/// Multiply matrix \p LHS with scalar \p RHS.
Value *CreateScalarMultiply(Value *LHS, Value *RHS) {
Value *ScalarVector =
B.CreateVectorSplat(cast<VectorType>(LHS->getType())->getNumElements(),
RHS, "scalar.splat");
if (RHS->getType()->isFloatingPointTy())
return B.CreateFMul(LHS, ScalarVector);
return B.CreateMul(LHS, ScalarVector);
}
/// Extracts the element at (\p Row, \p Column) from \p Matrix.
Value *CreateExtractMatrix(Value *Matrix, Value *Row, Value *Column,
unsigned NumRows, Twine const &Name = "") {
return B.CreateExtractElement(
Matrix,
B.CreateAdd(
B.CreateMul(Column, ConstantInt::get(Column->getType(), NumRows)),
Row));
}
};
} // end namespace llvm
#endif // LLVM_IR_MATRIXBUILDER_H