//===- MemRefUtils.h - Memref helpers to invoke MLIR JIT code ---*- C++ -*-===//
//
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
// See https://llvm.org/LICENSE.txt for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
//
//===----------------------------------------------------------------------===//
//
// Utils for MLIR ABI interfacing with frameworks.
//
// The templated free functions below make it possible to allocate dense
// contiguous buffers with shapes that interoperate properly with the MLIR
// codegen ABI.
//
//===----------------------------------------------------------------------===//
#include "mlir/ExecutionEngine/CRunnerUtils.h"
#include "mlir/Support/LLVM.h"
#include "llvm/ADT/ArrayRef.h"
#include "llvm/ADT/Optional.h"
#include "llvm/ADT/STLExtras.h"
#include "llvm/Support/raw_ostream.h"
#include <algorithm>
#include <array>
#include <cassert>
#include <functional>
#include <initializer_list>
#include <memory>
#ifndef MLIR_EXECUTIONENGINE_MEMREFUTILS_H_
#define MLIR_EXECUTIONENGINE_MEMREFUTILS_H_
namespace mlir {
using AllocFunType = llvm::function_ref<void *(size_t)>;
namespace detail {
/// Given a shape with sizes greater than 0 along all dimensions, returns the
/// distance, in number of elements, between a slice in a dimension and the next
/// slice in the same dimension.
/// e.g. shape[3, 4, 5] -> strides[20, 5, 1]
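/// The strides describe a dense row-major layout: with strides[20, 5, 1], the
/// element at index (i, j, k) sits at linear offset i * 20 + j * 5 + k.
/// A minimal sketch of a call (the shape is illustrative):
///
///   std::array<int64_t, 3> strides = makeStrides<3>({3, 4, 5});
///   // strides == {20, 5, 1}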
template <size_t N>
inline std::array<int64_t, N> makeStrides(ArrayRef<int64_t> shape) {
assert(shape.size() == N && "expect shape specification to match rank");
std::array<int64_t, N> res;
int64_t running = 1;
for (int64_t idx = N - 1; idx >= 0; --idx) {
assert(shape[idx] > 0 && "size must be greater than 0 for all shape dimensions");
res[idx] = running;
running *= shape[idx];
}
return res;
}
/// Build a `StridedMemRefType<T, N>` descriptor that matches the MLIR ABI.
/// This is an implementation detail that is kept in sync with MLIR codegen
/// conventions. Additionally takes a `shapeAlloc` array which
/// is used instead of `shape` to allocate "more aligned" data and compute the
/// corresponding strides.
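/// For illustration, a minimal sketch building a 3x4 descriptor over a buffer
/// padded to 3x8 elements per row (the padding values are hypothetical):
///
///   auto buffers = allocAligned<float>(/*nElements=*/3 * 8);
///   auto desc = makeStridedMemRefDescriptor<2>(
///       buffers.first, buffers.second, /*shape=*/{3, 4},
///       /*shapeAlloc=*/{3, 8});
///   // desc.sizes == {3, 4}, desc.strides == {8, 1}, desc.offset == 0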
template <int N, typename T>
typename std::enable_if<(N >= 1), StridedMemRefType<T, N>>::type
makeStridedMemRefDescriptor(T *ptr, T *alignedPtr, ArrayRef<int64_t> shape,
ArrayRef<int64_t> shapeAlloc) {
assert(shape.size() == N);
assert(shapeAlloc.size() == N);
StridedMemRefType<T, N> descriptor;
descriptor.basePtr = static_cast<T *>(ptr);
descriptor.data = static_cast<T *>(alignedPtr);
descriptor.offset = 0;
std::copy(shape.begin(), shape.end(), descriptor.sizes);
auto strides = makeStrides<N>(shapeAlloc);
std::copy(strides.begin(), strides.end(), descriptor.strides);
return descriptor;
}
/// Build a `StridedMemRefType<T, 0>` descriptor that matches the MLIR ABI.
/// This is an implementation detail that is kept in sync with MLIR codegen
/// conventions. Additionally takes a `shapeAlloc` array which
/// is used instead of `shape` to allocate "more aligned" data and compute the
/// corresponding strides.
template <int N, typename T>
typename std::enable_if<(N == 0), StridedMemRefType<T, 0>>::type
makeStridedMemRefDescriptor(T *ptr, T *alignedPtr, ArrayRef<int64_t> shape = {},
ArrayRef<int64_t> shapeAlloc = {}) {
assert(shape.size() == N);
assert(shapeAlloc.size() == N);
StridedMemRefType<T, 0> descriptor;
descriptor.basePtr = static_cast<T *>(ptr);
descriptor.data = static_cast<T *>(alignedPtr);
descriptor.offset = 0;
return descriptor;
}
/// Allocate a buffer holding `nElements` of type T, aligned to an optional
/// `alignment`. This serves as a portable replacement for `posix_memalign`.
/// `alignment` must be a power of 2 and at least sizeof(T). By default the
/// alignment is the smallest power of 2 that is greater than or equal to
/// sizeof(T). Returns the pair (allocated pointer, aligned pointer).
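/// A minimal usage sketch (the element count and alignment are illustrative):
///
///   float *data, *alignedData;
///   std::tie(data, alignedData) = allocAligned<float>(
///       /*nElements=*/128, &::malloc, /*alignment=*/uint64_t(64));
///   // Use `alignedData`; pass `data` to ::free when done.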
template <typename T>
std::pair<T *, T *>
allocAligned(size_t nElements, AllocFunType allocFun = &::malloc,
llvm::Optional<uint64_t> alignment = llvm::Optional<uint64_t>()) {
assert(sizeof(T) < (1ul << 32) && "Elemental type overflows");
auto size = nElements * sizeof(T);
auto desiredAlignment = alignment.getValueOr(nextPowerOf2(sizeof(T)));
assert((desiredAlignment & (desiredAlignment - 1)) == 0);
assert(desiredAlignment >= sizeof(T));
T *data = reinterpret_cast<T *>(allocFun(size + desiredAlignment));
uintptr_t addr = reinterpret_cast<uintptr_t>(data);
uintptr_t rem = addr % desiredAlignment;
T *alignedData = (rem == 0)
? data
: reinterpret_cast<T *>(addr + (desiredAlignment - rem));
assert(reinterpret_cast<uintptr_t>(alignedData) % desiredAlignment == 0);
return std::make_pair(data, alignedData);
}
} // namespace detail
//===----------------------------------------------------------------------===//
// Public API
//===----------------------------------------------------------------------===//
/// Convenient callback to "visit" a memref element by element.
/// This takes a reference to an individual element as well as the coordinates.
/// It can be used in conjunction with a StridedMemrefIterator.
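/// For example, a visitor for a rank-2 float memref might look like this
/// (the lambda shown is purely illustrative):
///
///   auto initVisitor = [](float &elt, ArrayRef<int64_t> indices) {
///     elt = static_cast<float>(indices[0] + indices[1]);
///   };
///   // `initVisitor` converts to ElementWiseVisitor<float> at call sites.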
template <typename T>
using ElementWiseVisitor = llvm::function_ref<void(T &ptr, ArrayRef<int64_t>)>;
/// Owning MemRef type that abstracts over the runtime type for ranked strided
/// memref.
template <typename T, unsigned Rank>
class OwningMemRef {
public:
using DescriptorType = StridedMemRefType<T, Rank>;
using FreeFunType = std::function<void(DescriptorType)>;
/// Allocate a new dense StridedMemRef with a given `shape`. An optional
/// `shapeAlloc` array can be supplied to "pad" every dimension individually.
/// If an ElementWiseVisitor is provided, it is used to initialize the data;
/// otherwise the memory is zero-initialized. The alloc and free functions
/// used to manage the data allocation can be optionally provided and default
/// to malloc/free.
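/// A minimal usage sketch (shape, visitor, and values are illustrative):
///
///   OwningMemRef<float, 2> memref(
///       /*shape=*/{3, 4}, /*shapeAlloc=*/{},
///       [](float &elt, ArrayRef<int64_t> indices) {
///         elt = static_cast<float>(indices[0] * 10 + indices[1]);
///       });
///   float value = memref[{2, 3}]; // value == 23.0f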
OwningMemRef(
ArrayRef<int64_t> shape, ArrayRef<int64_t> shapeAlloc = {},
ElementWiseVisitor<T> init = {},
llvm::Optional<uint64_t> alignment = llvm::Optional<uint64_t>(),
AllocFunType allocFun = &::malloc,
std::function<void(StridedMemRefType<T, Rank>)> freeFun =
[](StridedMemRefType<T, Rank> descriptor) {
// `data` may be offset into the allocation for alignment; free
// `basePtr`, which is the pointer returned by the allocator.
::free(descriptor.basePtr);
})
: freeFunc(freeFun) {
if (shapeAlloc.empty())
shapeAlloc = shape;
assert(shape.size() == Rank);
assert(shapeAlloc.size() == Rank);
for (unsigned i = 0; i < Rank; ++i)
assert(shape[i] <= shapeAlloc[i] &&
"shapeAlloc must be greater than or equal to shape");
int64_t nElements = 1;
for (int64_t s : shapeAlloc)
nElements *= s;
T *data, *alignedData;
std::tie(data, alignedData) =
detail::allocAligned<T>(nElements, allocFun, alignment);
descriptor = detail::makeStridedMemRefDescriptor<Rank>(data, alignedData,
shape, shapeAlloc);
if (init) {
for (StridedMemrefIterator<T, Rank> it = descriptor.begin(),
end = descriptor.end();
it != end; ++it)
init(*it, it.getIndices());
} else {
// Zero-initialize exactly the `nElements` elements reachable from the
// aligned data pointer; writing additional alignment padding could run
// past the end of the allocation.
memset(descriptor.data, 0, nElements * sizeof(T));
}
}
/// Take ownership of an existing descriptor with a custom deleter.
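/// For instance, wrapping a descriptor received from JIT-compiled code with a
/// custom deleter (sketch; `existingDesc` is assumed to be provided by the
/// caller):
///
///   OwningMemRef<float, 2> owned(
///       existingDesc,
///       [](StridedMemRefType<float, 2> d) { ::free(d.basePtr); });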
OwningMemRef(DescriptorType descriptor, FreeFunType freeFunc)
: freeFunc(freeFunc), descriptor(descriptor) {}
~OwningMemRef() {
if (freeFunc)
freeFunc(descriptor);
}
OwningMemRef(const OwningMemRef &) = delete;
OwningMemRef &operator=(const OwningMemRef &) = delete;
OwningMemRef &operator=(OwningMemRef &&other) {
freeFunc = other.freeFunc;
descriptor = other.descriptor;
other.freeFunc = nullptr;
memset(&other.descriptor, 0, sizeof(other.descriptor));
return *this;
}
OwningMemRef(OwningMemRef &&other) { *this = std::move(other); }
DescriptorType &operator*() { return descriptor; }
DescriptorType *operator->() { return &descriptor; }
T &operator[](std::initializer_list<int64_t> indices) {
return descriptor[std::move(indices)];
}
private:
/// Custom deleter used to release the data buffer managed with the descriptor
/// below.
FreeFunType freeFunc;
/// The descriptor is an instance of StridedMemRefType<T, rank>.
DescriptorType descriptor;
};
} // namespace mlir
#endif // MLIR_EXECUTIONENGINE_MEMREFUTILS_H_