blob: 94b9f90052769e04369cebaaf8bd57f1811af58e [file] [edit]
// RUN: mlir-opt %s -split-input-file -convert-gpu-to-rocdl | FileCheck %s --check-prefixes=ROCDL
// RUN: mlir-opt %s -split-input-file -convert-gpu-to-nvvm | FileCheck %s --check-prefixes=NVVM
gpu.module @kernel {
gpu.func @gpu_global_id() -> (index) {
%global_id_x = gpu.global_id x
gpu.return %global_id_x : index
}
}
// ROCDL-LABEL: llvm.func @gpu_global_id() -> i64 {
// ROCDL: %[[WORKGROUP_0:.*]] = rocdl.workgroup.id.x : i32
// ROCDL: %[[SEXT_0:.*]] = llvm.sext %[[WORKGROUP_0]] : i32 to i64
// ROCDL: %[[DIM64:.*]] = llvm.call @__ockl_get_local_size(%{{.*}}) : (i32) -> (i64 {llvm.range = #llvm.constant_range<i64, 1, 1025>})
// ROCDL: %[[MUL_0:.*]] = llvm.mul %[[SEXT_0]], %[[DIM64]] : i64
// ROCDL: %[[WORKITEM_0:.*]] = rocdl.workitem.id.x : i32
// ROCDL: %[[SEXT_2:.*]] = llvm.sext %[[WORKITEM_0]] : i32 to i64
// ROCDL: %[[ADD_0:.*]] = llvm.add %[[SEXT_2]], %[[MUL_0]] : i64
// ROCDL: llvm.return %[[ADD_0]] : i64
// ROCDL: }
// NVVM-LABEL: llvm.func @gpu_global_id() -> i64 {
// NVVM: %[[READ_0:.*]] = nvvm.read.ptx.sreg.ctaid.x : i32
// NVVM: %[[SEXT_0:.*]] = llvm.sext %[[READ_0]] : i32 to i64
// NVVM: %[[READ_1:.*]] = nvvm.read.ptx.sreg.ntid.x : i32
// NVVM: %[[SEXT_1:.*]] = llvm.sext %[[READ_1]] : i32 to i64
// NVVM: %[[MUL_0:.*]] = llvm.mul %[[SEXT_0]], %[[SEXT_1]] : i64
// NVVM: %[[READ_2:.*]] = nvvm.read.ptx.sreg.tid.x : i32
// NVVM: %[[SEXT_2:.*]] = llvm.sext %[[READ_2]] : i32 to i64
// NVVM: %[[ADD_0:.*]] = llvm.add %[[SEXT_2]], %[[MUL_0]] : i64
// NVVM: llvm.return %[[ADD_0]] : i64
// NVVM: }