| //===- GPUToSPIRVPass.cpp - GPU to SPIR-V Passes --------------------------===// |
| // |
| // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. |
| // See https://llvm.org/LICENSE.txt for license information. |
| // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception |
| // |
| //===----------------------------------------------------------------------===// |
| // |
| // This file implements a pass to convert a kernel function in the GPU Dialect |
| // into a spirv.module operation. |
| // |
| //===----------------------------------------------------------------------===// |
| |
| #include "mlir/Conversion/GPUToSPIRV/GPUToSPIRVPass.h" |
| |
| #include "mlir/Conversion/ArithToSPIRV/ArithToSPIRV.h" |
| #include "mlir/Conversion/FuncToSPIRV/FuncToSPIRV.h" |
| #include "mlir/Conversion/GPUToSPIRV/GPUToSPIRV.h" |
| #include "mlir/Conversion/MemRefToSPIRV/MemRefToSPIRV.h" |
| #include "mlir/Dialect/Func/IR/FuncOps.h" |
| #include "mlir/Dialect/GPU/IR/GPUDialect.h" |
| #include "mlir/Dialect/SPIRV/IR/SPIRVDialect.h" |
| #include "mlir/Dialect/SPIRV/IR/SPIRVOps.h" |
| #include "mlir/Dialect/SPIRV/Transforms/SPIRVConversion.h" |
| |
| namespace mlir { |
| #define GEN_PASS_DEF_CONVERTGPUTOSPIRV |
| #include "mlir/Conversion/Passes.h.inc" |
| } // namespace mlir |
| |
| using namespace mlir; |
| |
| namespace { |
| /// Lowers the GPU dialect to SPIR-V. Only gpu.func ops nested inside |
| /// gpu.module ops are converted, i.e., the functions that are referenced by |
| /// gpu.launch_func ops. For every such gpu.module the pass: |
| /// |
| /// 1) Clones the gpu.module, because the original is still needed by the |
| ///    gpu::LaunchKernelOp and therefore cannot be replaced in place. |
| /// |
| /// 2) Converts the clone, lowering its body to SPIR-V. |
| struct GPUToSPIRVPass final : impl::ConvertGPUToSPIRVBase<GPUToSPIRVPass> { |
|   /// `enableMemorySpaceMapping` selects whether MemRef memory spaces are |
|   /// mapped to SPIR-V storage classes before the main conversion runs. |
|   explicit GPUToSPIRVPass(bool enableMemorySpaceMapping) |
|       : mapMemorySpace{enableMemorySpaceMapping} {} |
| |
|   void runOnOperation() override; |
| |
| private: |
|   /// When true, memory spaces are mapped to storage classes first. |
|   bool mapMemorySpace; |
| }; |
| |
| /// Converts every gpu.module nested under the top-level module to SPIR-V. |
| /// |
| /// The work is done in three phases: |
| ///   1) Clone each gpu.module; the clone is the op that gets converted. |
| ///   2) Run a full conversion on each clone independently, optionally |
| ///      preceded by a memory-space-to-storage-class conversion. |
| ///   3) For target environments that allow the Kernel capability, replace |
| ///      each gpu.func in the original gpu.module with an empty func.func |
| ///      carrying the gpu.kernel attribute. |
| /// |
| /// Any conversion failure signals pass failure and returns immediately. |
| void GPUToSPIRVPass::runOnOperation() { |
|   MLIRContext *context = &getContext(); |
|   ModuleOp module = getOperation(); |
| |
|   SmallVector<Operation *, 1> gpuModules; |
|   OpBuilder builder(context); |
| |
|   // Returns true if the target environment attached to (or defaulted for) |
|   // the given gpu.module allows the SPIR-V Kernel capability. |
|   auto targetEnvSupportsKernelCapability = [](gpu::GPUModuleOp moduleOp) { |
|     Operation *gpuModule = moduleOp.getOperation(); |
|     auto targetAttr = spirv::lookupTargetEnvOrDefault(gpuModule); |
|     spirv::TargetEnv targetEnv(targetAttr); |
|     return targetEnv.allows(spirv::Capability::Kernel); |
|   }; |
| |
|   module.walk([&](gpu::GPUModuleOp moduleOp) { |
|     // Clone each GPU kernel module for conversion, given that the GPU |
|     // launch op still needs the original GPU kernel module. |
|     // For Vulkan Shader capabilities, we insert the newly converted SPIR-V |
|     // module right after the original GPU module, as that's the expectation of |
|     // the in-tree Vulkan runner. |
|     // For OpenCL Kernel capabilities, we insert the newly converted SPIR-V |
|     // module inside the original GPU module, as that's the expectation of the |
|     // normal GPU compilation pipeline. |
|     if (targetEnvSupportsKernelCapability(moduleOp)) { |
|       builder.setInsertionPoint(moduleOp.getBody(), |
|                                 moduleOp.getBody()->begin()); |
|     } else { |
|       builder.setInsertionPoint(moduleOp.getOperation()); |
|     } |
|     gpuModules.push_back(builder.clone(*moduleOp.getOperation())); |
|   }); |
| |
|   // Run conversion for each module independently as they can have different |
|   // TargetEnv attributes. |
|   for (Operation *gpuModule : gpuModules) { |
|     spirv::TargetEnvAttr targetAttr = |
|         spirv::lookupTargetEnvOrDefault(gpuModule); |
| |
|     // Map MemRef memory space to SPIR-V storage class first if requested. |
|     if (mapMemorySpace) { |
|       std::unique_ptr<ConversionTarget> target = |
|           spirv::getMemorySpaceToStorageClassTarget(*context); |
|       // Every entry of `gpuModules` is a clone of a gpu.module, so use the |
|       // asserting cast<> instead of a dyn_cast<> whose result is never |
|       // checked for null. |
|       spirv::MemorySpaceToStorageClassMap memorySpaceMap = |
|           targetEnvSupportsKernelCapability( |
|               cast<gpu::GPUModuleOp>(gpuModule)) |
|               ? spirv::mapMemorySpaceToOpenCLStorageClass |
|               : spirv::mapMemorySpaceToVulkanStorageClass; |
|       spirv::MemorySpaceToStorageClassConverter converter(memorySpaceMap); |
| |
|       RewritePatternSet patterns(context); |
|       spirv::populateMemorySpaceToStorageClassPatterns(converter, patterns); |
| |
|       if (failed(applyFullConversion(gpuModule, *target, std::move(patterns)))) |
|         return signalPassFailure(); |
|     } |
| |
|     std::unique_ptr<ConversionTarget> target = |
|         SPIRVConversionTarget::get(targetAttr); |
| |
|     SPIRVConversionOptions options; |
|     options.use64bitIndex = this->use64bitIndex; |
|     SPIRVTypeConverter typeConverter(targetAttr, options); |
|     populateMMAToSPIRVCoopMatrixTypeConversion(typeConverter, |
|                                                this->useCoopMatrixNV); |
| |
|     RewritePatternSet patterns(context); |
|     populateGPUToSPIRVPatterns(typeConverter, patterns); |
|     // Select the cooperative-matrix lowering flavor (NV vs. KHR) based on the |
|     // pass option. |
|     if (this->useCoopMatrixNV) { |
|       populateGpuWMMAToSPIRVCoopMatrixNVConversionPatterns(typeConverter, |
|                                                            patterns); |
|     } else { |
|       populateGpuWMMAToSPIRVCoopMatrixKHRConversionPatterns(typeConverter, |
|                                                             patterns); |
|     } |
| |
|     // TODO: Change SPIR-V conversion to be progressive and remove the following |
|     // patterns. |
|     mlir::arith::populateArithToSPIRVPatterns(typeConverter, patterns); |
|     populateMemRefToSPIRVPatterns(typeConverter, patterns); |
|     populateFuncToSPIRVPatterns(typeConverter, patterns); |
| |
|     if (failed(applyFullConversion(gpuModule, *target, std::move(patterns)))) |
|       return signalPassFailure(); |
|   } |
| |
|   // For OpenCL, the gpu.func op in the original gpu.module op needs to be |
|   // replaced with an empty func.func op with the same arguments as the gpu.func |
|   // op. The func.func op needs gpu.kernel attribute set. |
|   module.walk([&](gpu::GPUModuleOp moduleOp) { |
|     if (targetEnvSupportsKernelCapability(moduleOp)) { |
|       moduleOp.walk([&](gpu::GPUFuncOp funcOp) { |
|         builder.setInsertionPoint(funcOp); |
|         auto newFuncOp = builder.create<func::FuncOp>( |
|             funcOp.getLoc(), funcOp.getName(), funcOp.getFunctionType()); |
|         // The stub body consists solely of a return. |
|         Block *entryBlock = newFuncOp.addEntryBlock(); |
|         builder.setInsertionPointToEnd(entryBlock); |
|         builder.create<func::ReturnOp>(funcOp.getLoc()); |
|         newFuncOp->setAttr(gpu::GPUDialect::getKernelFuncAttrName(), |
|                            builder.getUnitAttr()); |
|         funcOp.erase(); |
|       }); |
|     } |
|   }); |
| } |
| |
| } // namespace |
| |
| /// Creates a pass instance that converts GPU dialect ops to SPIR-V. |
| /// `mapMemorySpace` is forwarded unchanged to the GPUToSPIRVPass constructor. |
| std::unique_ptr<OperationPass<ModuleOp>> |
| mlir::createConvertGPUToSPIRVPass(bool mapMemorySpace) { |
|   std::unique_ptr<OperationPass<ModuleOp>> pass = |
|       std::make_unique<GPUToSPIRVPass>(mapMemorySpace); |
|   return pass; |
| } |