blob: 85afda09e347ae4be9d9ba7f2cfa1e989dda4d44 [file] [log] [blame]
//===-- include/flang/Runtime/CUDA/kernel.h ---------------------*- C++ -*-===//
//
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
// See https://llvm.org/LICENSE.txt for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
//
//===----------------------------------------------------------------------===//
#ifndef FORTRAN_RUNTIME_CUDA_KERNEL_H_
#define FORTRAN_RUNTIME_CUDA_KERNEL_H_
#include "flang/Runtime/entry-names.h"
#include <cstddef>
#include <stdint.h>
extern "C" {
// These functions use intptr_t instead of CUDA's unsigned int to match
// the type of MLIR's index type. This avoids the need for casts in the
// generated MLIR code.
void RTDEF(CUFLaunchKernel)(const void *kernelName, intptr_t gridX,
intptr_t gridY, intptr_t gridZ, intptr_t blockX, intptr_t blockY,
intptr_t blockZ, int32_t smem, void **params, void **extra);
void RTDEF(CUFLaunchClusterKernel)(const void *kernelName, intptr_t clusterX,
intptr_t clusterY, intptr_t clusterZ, intptr_t gridX, intptr_t gridY,
intptr_t gridZ, intptr_t blockX, intptr_t blockY, intptr_t blockZ,
int32_t smem, void **params, void **extra);
} // extern "C"
#endif // FORTRAN_RUNTIME_CUDA_KERNEL_H_