| ; RUN: llc -verify-machineinstrs -O0 -mtriple=spirv64-unknown-unknown %s -o - | FileCheck %s --check-prefix=CHECK-SPIRV |
| ; RUN: %if spirv-tools %{ llc -O0 -mtriple=spirv64-unknown-unknown %s -o - -filetype=obj | spirv-val %} |
| |
| ; RUN: llc -verify-machineinstrs -O0 -mtriple=spirv32-unknown-unknown %s -o - | FileCheck %s --check-prefix=CHECK-SPIRV |
| ; RUN: %if spirv-tools %{ llc -O0 -mtriple=spirv32-unknown-unknown %s -o - -filetype=obj | spirv-val %} |
| |
| ; CHECK-SPIRV-DAG: %[[#int:]] = OpTypeInt 32 0 |
| ; CHECK-SPIRV-DAG: %[[#intv2:]] = OpTypeVector %[[#int]] 2 |
| ; CHECK-SPIRV-DAG: %[[#intv3:]] = OpTypeVector %[[#int]] 3 |
| ; CHECK-SPIRV-DAG: %[[#float:]] = OpTypeFloat 32 |
| ; CHECK-SPIRV-DAG: %[[#ScopeCrossWorkgroup:]] = OpConstantNull %[[#int]] |
| ; CHECK-SPIRV-DAG: %[[#ScopeWorkgroup:]] = OpConstant %[[#int]] 2{{$}} |
| ; CHECK-SPIRV-DAG: %[[#ScopeSubgroup:]] = OpConstant %[[#int]] 3{{$}} |
| |
| ; CHECK-SPIRV: OpFunction |
| ; CHECK-SPIRV: %[[#]] = OpGroupFMax %[[#float]] %[[#ScopeWorkgroup]] Reduce |
| ; CHECK-SPIRV: OpFunctionEnd |
| |
| ;; kernel void testWorkGroupFMax(float a, global float *res) { |
| ;; res[0] = work_group_reduce_max(a); |
| ;; } |
| |
| define dso_local spir_kernel void @testWorkGroupFMax(float noundef %a, float addrspace(1)* nocapture noundef writeonly %res) local_unnamed_addr { |
| entry: |
| %call = call spir_func float @_Z21work_group_reduce_maxf(float noundef %a) |
| store float %call, float addrspace(1)* %res, align 4 |
| ret void |
| } |
| |
| declare spir_func float @_Z21work_group_reduce_maxf(float noundef) local_unnamed_addr |
| |
| ; CHECK-SPIRV: OpFunction |
| ; CHECK-SPIRV: %[[#]] = OpGroupFMin %[[#float]] %[[#ScopeWorkgroup]] Reduce |
| ; CHECK-SPIRV: OpFunctionEnd |
| |
| ;; kernel void testWorkGroupFMin(float a, global float *res) { |
| ;; res[0] = work_group_reduce_min(a); |
| ;; } |
| |
| define dso_local spir_kernel void @testWorkGroupFMin(float noundef %a, float addrspace(1)* nocapture noundef writeonly %res) local_unnamed_addr { |
| entry: |
| %call = call spir_func float @_Z21work_group_reduce_minf(float noundef %a) |
| store float %call, float addrspace(1)* %res, align 4 |
| ret void |
| } |
| |
| declare spir_func float @_Z21work_group_reduce_minf(float noundef) local_unnamed_addr |
| |
| ; CHECK-SPIRV: OpFunction |
| ; CHECK-SPIRV: %[[#]] = OpGroupFAdd %[[#float]] %[[#ScopeWorkgroup]] Reduce |
| ; CHECK-SPIRV: OpFunctionEnd |
| |
| ;; kernel void testWorkGroupFAdd(float a, global float *res) { |
| ;; res[0] = work_group_reduce_add(a); |
| ;; } |
| |
| define dso_local spir_kernel void @testWorkGroupFAdd(float noundef %a, float addrspace(1)* nocapture noundef writeonly %res) local_unnamed_addr { |
| entry: |
| %call = call spir_func float @_Z21work_group_reduce_addf(float noundef %a) |
| store float %call, float addrspace(1)* %res, align 4 |
| ret void |
| } |
| |
| declare spir_func float @_Z21work_group_reduce_addf(float noundef) local_unnamed_addr |
| |
| ; CHECK-SPIRV: OpFunction |
| ; CHECK-SPIRV: %[[#]] = OpGroupFMax %[[#float]] %[[#ScopeWorkgroup]] InclusiveScan |
| ; CHECK-SPIRV: OpFunctionEnd |
| |
| ;; kernel void testWorkGroupScanInclusiveFMax(float a, global float *res) { |
| ;; res[0] = work_group_scan_inclusive_max(a); |
| ;; } |
| |
| define dso_local spir_kernel void @testWorkGroupScanInclusiveFMax(float noundef %a, float addrspace(1)* nocapture noundef writeonly %res) local_unnamed_addr { |
| entry: |
| %call = call spir_func float @_Z29work_group_scan_inclusive_maxf(float noundef %a) |
| store float %call, float addrspace(1)* %res, align 4 |
| ret void |
| } |
| |
| declare spir_func float @_Z29work_group_scan_inclusive_maxf(float noundef) local_unnamed_addr |
| |
| ; CHECK-SPIRV: OpFunction |
| ; CHECK-SPIRV: %[[#]] = OpGroupFMax %[[#float]] %[[#ScopeWorkgroup]] ExclusiveScan |
| ; CHECK-SPIRV: OpFunctionEnd |
| |
| ;; kernel void testWorkGroupScanExclusiveFMax(float a, global float *res) { |
| ;; res[0] = work_group_scan_exclusive_max(a); |
| ;; } |
| |
| define dso_local spir_kernel void @testWorkGroupScanExclusiveFMax(float noundef %a, float addrspace(1)* nocapture noundef writeonly %res) local_unnamed_addr { |
| entry: |
| %call = call spir_func float @_Z29work_group_scan_exclusive_maxf(float noundef %a) |
| store float %call, float addrspace(1)* %res, align 4 |
| ret void |
| } |
| |
| declare spir_func float @_Z29work_group_scan_exclusive_maxf(float noundef) local_unnamed_addr |
| |
| ; CHECK-SPIRV: OpFunction |
| ; CHECK-SPIRV: %[[#]] = OpGroupSMax %[[#int]] %[[#ScopeWorkgroup]] Reduce |
| ; CHECK-SPIRV: OpFunctionEnd |
| |
| ;; kernel void testWorkGroupSMax(int a, global int *res) { |
| ;; res[0] = work_group_reduce_max(a); |
| ;; } |
| |
| define dso_local spir_kernel void @testWorkGroupSMax(i32 noundef %a, i32 addrspace(1)* nocapture noundef writeonly %res) local_unnamed_addr { |
| entry: |
| %call = call spir_func i32 @_Z21work_group_reduce_maxi(i32 noundef %a) |
| store i32 %call, i32 addrspace(1)* %res, align 4 |
| ret void |
| } |
| |
| declare spir_func i32 @_Z21work_group_reduce_maxi(i32 noundef) local_unnamed_addr |
| |
| ; CHECK-SPIRV: OpFunction |
| ; CHECK-SPIRV: %[[#]] = OpGroupSMin %[[#int]] %[[#ScopeWorkgroup]] Reduce |
| ; CHECK-SPIRV: OpFunctionEnd |
| |
| ;; kernel void testWorkGroupSMin(int a, global int *res) { |
| ;; res[0] = work_group_reduce_min(a); |
| ;; } |
| |
| define dso_local spir_kernel void @testWorkGroupSMin(i32 noundef %a, i32 addrspace(1)* nocapture noundef writeonly %res) local_unnamed_addr { |
| entry: |
| %call = call spir_func i32 @_Z21work_group_reduce_mini(i32 noundef %a) |
| store i32 %call, i32 addrspace(1)* %res, align 4 |
| ret void |
| } |
| |
| declare spir_func i32 @_Z21work_group_reduce_mini(i32 noundef) local_unnamed_addr |
| |
| ; CHECK-SPIRV: OpFunction |
| ; CHECK-SPIRV: %[[#]] = OpGroupIAdd %[[#int]] %[[#ScopeWorkgroup]] Reduce |
| ; CHECK-SPIRV: OpFunctionEnd |
| |
| ;; kernel void testWorkGroupIAddSigned(int a, global int *res) { |
| ;; res[0] = work_group_reduce_add(a); |
| ;; } |
| |
| define dso_local spir_kernel void @testWorkGroupIAddSigned(i32 noundef %a, i32 addrspace(1)* nocapture noundef writeonly %res) local_unnamed_addr { |
| entry: |
| %call = call spir_func i32 @_Z21work_group_reduce_addi(i32 noundef %a) |
| store i32 %call, i32 addrspace(1)* %res, align 4 |
| ret void |
| } |
| |
| declare spir_func i32 @_Z21work_group_reduce_addi(i32 noundef) local_unnamed_addr |
| |
| ; CHECK-SPIRV: OpFunction |
| ; CHECK-SPIRV: %[[#]] = OpGroupIAdd %[[#int]] %[[#ScopeWorkgroup]] Reduce |
| ; CHECK-SPIRV: OpFunctionEnd |
| |
| ;; kernel void testWorkGroupIAddUnsigned(uint a, global uint *res) { |
| ;; res[0] = work_group_reduce_add(a); |
| ;; } |
| |
| define dso_local spir_kernel void @testWorkGroupIAddUnsigned(i32 noundef %a, i32 addrspace(1)* nocapture noundef writeonly %res) local_unnamed_addr { |
| entry: |
| %call = call spir_func i32 @_Z21work_group_reduce_addj(i32 noundef %a) |
| store i32 %call, i32 addrspace(1)* %res, align 4 |
| ret void |
| } |
| |
| declare spir_func i32 @_Z21work_group_reduce_addj(i32 noundef) local_unnamed_addr |
| |
| ; CHECK-SPIRV: OpFunction |
| ; CHECK-SPIRV: %[[#]] = OpGroupUMax %[[#int]] %[[#ScopeWorkgroup]] Reduce |
| ; CHECK-SPIRV: OpFunctionEnd |
| |
| ;; kernel void testWorkGroupUMax(uint a, global uint *res) { |
| ;; res[0] = work_group_reduce_max(a); |
| ;; } |
| |
| define dso_local spir_kernel void @testWorkGroupUMax(i32 noundef %a, i32 addrspace(1)* nocapture noundef writeonly %res) local_unnamed_addr { |
| entry: |
| %call = call spir_func i32 @_Z21work_group_reduce_maxj(i32 noundef %a) |
| store i32 %call, i32 addrspace(1)* %res, align 4 |
| ret void |
| } |
| |
| declare spir_func i32 @_Z21work_group_reduce_maxj(i32 noundef) local_unnamed_addr |
| |
| ; CHECK-SPIRV: OpFunction |
| ; CHECK-SPIRV: %[[#]] = OpGroupUMax %[[#int]] %[[#ScopeSubgroup]] Reduce |
| ; CHECK-SPIRV: OpFunctionEnd |
| |
| ;; #pragma OPENCL EXTENSION cl_khr_subgroups: enable |
| ;; kernel void testSubGroupUMax(uint a, global uint *res) { |
| ;; res[0] = sub_group_reduce_max(a); |
| ;; } |
| ;; #pragma OPENCL EXTENSION cl_khr_subgroups: disable |
| |
| define dso_local spir_kernel void @testSubGroupUMax(i32 noundef %a, i32 addrspace(1)* nocapture noundef writeonly %res) local_unnamed_addr { |
| entry: |
| %call = call spir_func i32 @_Z20sub_group_reduce_maxj(i32 noundef %a) |
| store i32 %call, i32 addrspace(1)* %res, align 4 |
| ret void |
| } |
| |
| declare spir_func i32 @_Z20sub_group_reduce_maxj(i32 noundef) local_unnamed_addr |
| |
| ; CHECK-SPIRV: OpFunction |
| ; CHECK-SPIRV: %[[#]] = OpGroupUMax %[[#int]] %[[#ScopeWorkgroup]] InclusiveScan |
| ; CHECK-SPIRV: OpFunctionEnd |
| |
| ;; kernel void testWorkGroupScanInclusiveUMax(uint a, global uint *res) { |
| ;; res[0] = work_group_scan_inclusive_max(a); |
| ;; } |
| |
| define dso_local spir_kernel void @testWorkGroupScanInclusiveUMax(i32 noundef %a, i32 addrspace(1)* nocapture noundef writeonly %res) local_unnamed_addr { |
| entry: |
| %call = call spir_func i32 @_Z29work_group_scan_inclusive_maxj(i32 noundef %a) |
| store i32 %call, i32 addrspace(1)* %res, align 4 |
| ret void |
| } |
| |
| declare spir_func i32 @_Z29work_group_scan_inclusive_maxj(i32 noundef) local_unnamed_addr |
| |
| ; CHECK-SPIRV: OpFunction |
| ; CHECK-SPIRV: %[[#]] = OpGroupUMax %[[#int]] %[[#ScopeWorkgroup]] ExclusiveScan |
| ; CHECK-SPIRV: OpFunctionEnd |
| |
| ;; kernel void testWorkGroupScanExclusiveUMax(uint a, global uint *res) { |
| ;; res[0] = work_group_scan_exclusive_max(a); |
| ;; } |
| |
| define dso_local spir_kernel void @testWorkGroupScanExclusiveUMax(i32 noundef %a, i32 addrspace(1)* nocapture noundef writeonly %res) local_unnamed_addr { |
| entry: |
| %call = call spir_func i32 @_Z29work_group_scan_exclusive_maxj(i32 noundef %a) |
| store i32 %call, i32 addrspace(1)* %res, align 4 |
| ret void |
| } |
| |
| declare spir_func i32 @_Z29work_group_scan_exclusive_maxj(i32 noundef) local_unnamed_addr |
| |
| ; CHECK-SPIRV: OpFunction |
| ; CHECK-SPIRV: %[[#]] = OpGroupUMin %[[#int]] %[[#ScopeWorkgroup]] Reduce |
| ; CHECK-SPIRV: OpFunctionEnd |
| |
| ;; kernel void testWorkGroupUMin(uint a, global uint *res) { |
| ;; res[0] = work_group_reduce_min(a); |
| ;; } |
| |
| define dso_local spir_kernel void @testWorkGroupUMin(i32 noundef %a, i32 addrspace(1)* nocapture noundef writeonly %res) local_unnamed_addr { |
| entry: |
| %call = call spir_func i32 @_Z21work_group_reduce_minj(i32 noundef %a) |
| store i32 %call, i32 addrspace(1)* %res, align 4 |
| ret void |
| } |
| |
| declare spir_func i32 @_Z21work_group_reduce_minj(i32 noundef) local_unnamed_addr |
| |
| ; CHECK-SPIRV: OpFunction |
| ; CHECK-SPIRV: %[[#]] = OpGroupBroadcast %[[#int]] %[[#ScopeWorkgroup]] %[[#BroadcastValue:]] %[[#BroadcastLocalId:]] |
| ; CHECK-SPIRV: %[[#BroadcastVec2:]] = OpCompositeConstruct %[[#intv2]] %[[#BroadcastLocalId]] %[[#BroadcastLocalId]] |
| ; CHECK-SPIRV: %[[#]] = OpGroupBroadcast %[[#int]] %[[#ScopeWorkgroup]] %[[#BroadcastValue]] %[[#BroadcastVec2]] |
| ; CHECK-SPIRV: %[[#BroadcastVec3:]] = OpCompositeConstruct %[[#intv3]] %[[#BroadcastLocalId]] %[[#BroadcastLocalId]] %[[#BroadcastLocalId]] |
| ; CHECK-SPIRV: %[[#]] = OpGroupBroadcast %[[#int]] %[[#ScopeWorkgroup]] %[[#BroadcastValue]] %[[#BroadcastVec3]] |
| ; CHECK-SPIRV: %[[#]] = OpGroupBroadcast %[[#int]] %[[#ScopeCrossWorkgroup]] %[[#BroadcastValue]] %[[#BroadcastLocalId]] |
| ; CHECK-SPIRV: OpFunctionEnd |
| |
| ;; kernel void testWorkGroupBroadcast(uint a, global size_t *id, global int *res) { |
| ;; res[0] = work_group_broadcast(a, *id); |
| ;; } |
| |
| define dso_local spir_kernel void @testWorkGroupBroadcast(i32 noundef %a, i32 addrspace(1)* nocapture noundef readonly %id, i32 addrspace(1)* nocapture noundef writeonly %res) local_unnamed_addr { |
| entry: |
| %0 = load i32, i32 addrspace(1)* %id, align 4 |
| %call = call spir_func i32 @_Z20work_group_broadcastjj(i32 noundef %a, i32 noundef %0) |
| %call_v2 = call spir_func i32 @_Z20work_group_broadcastjj(i32 noundef %a, i32 noundef %0, i32 noundef %0) |
| %call_v3 = call spir_func i32 @_Z20work_group_broadcastjj(i32 noundef %a, i32 noundef %0, i32 noundef %0, i32 noundef %0) |
| store i32 %call, i32 addrspace(1)* %res, align 4 |
| %call1 = call spir_func i32 @__spirv_GroupBroadcast(i32 0, i32 noundef %a, i32 noundef %0) |
| ret void |
| } |
| |
| declare spir_func i32 @_Z20work_group_broadcastjj(i32 noundef, i32 noundef) local_unnamed_addr |
| declare spir_func i32 @_Z20work_group_broadcastjjj(i32 noundef, i32 noundef, i32 noundef) local_unnamed_addr |
| declare spir_func i32 @_Z20work_group_broadcastjjjj(i32 noundef, i32 noundef, i32 noundef, i32 noundef) local_unnamed_addr |
| declare spir_func i32 @__spirv_GroupBroadcast(i32 noundef, i32 noundef, i32 noundef) local_unnamed_addr |
| |
| ; CHECK-SPIRV: OpFunction |
| ; CHECK-SPIRV: %[[#]] = OpGroupFAdd %[[#float]] %[[#ScopeCrossWorkgroup]] Reduce %[[#FValue:]] |
| ; CHECK-SPIRV: %[[#]] = OpGroupFMin %[[#float]] %[[#ScopeWorkgroup]] InclusiveScan %[[#FValue]] |
| ; CHECK-SPIRV: %[[#]] = OpGroupFMax %[[#float]] %[[#ScopeSubgroup]] ExclusiveScan %[[#FValue]] |
| ; CHECK-SPIRV: %[[#]] = OpGroupIAdd %[[#int]] %[[#ScopeCrossWorkgroup]] Reduce %[[#IValue:]] |
| ; CHECK-SPIRV: %[[#]] = OpGroupUMin %[[#int]] %[[#ScopeWorkgroup]] InclusiveScan %[[#IValue]] |
| ; CHECK-SPIRV: %[[#]] = OpGroupSMin %[[#int]] %[[#ScopeSubgroup]] ExclusiveScan %[[#IValue]] |
| ; CHECK-SPIRV: %[[#]] = OpGroupUMax %[[#int]] %[[#ScopeCrossWorkgroup]] Reduce %[[#IValue]] |
| ; CHECK-SPIRV: %[[#]] = OpGroupSMax %[[#int]] %[[#ScopeWorkgroup]] InclusiveScan %[[#IValue]] |
| ; CHECK-SPIRV: OpFunctionEnd |
| |
| define spir_kernel void @foo(float %a, i32 %b) { |
| entry: |
| %f1 = call spir_func float @__spirv_GroupFAdd(i32 0, i32 0, float %a) |
| %f2 = call spir_func float @__spirv_GroupFMin(i32 2, i32 1, float %a) |
| %f3 = call spir_func float @__spirv_GroupFMax(i32 3, i32 2, float %a) |
| %i1 = call spir_func i32 @__spirv_GroupIAdd(i32 0, i32 0, i32 %b) |
| %i2 = call spir_func i32 @__spirv_GroupUMin(i32 2, i32 1, i32 %b) |
| %i3 = call spir_func i32 @__spirv_GroupSMin(i32 3, i32 2, i32 %b) |
| %i4 = call spir_func i32 @__spirv_GroupUMax(i32 0, i32 0, i32 %b) |
| %i5 = call spir_func i32 @__spirv_GroupSMax(i32 2, i32 1, i32 %b) |
| ret void |
| } |
| |
| declare spir_func float @__spirv_GroupFAdd(i32, i32, float) |
| declare spir_func float @__spirv_GroupFMin(i32, i32, float) |
| declare spir_func float @__spirv_GroupFMax(i32, i32, float) |
| declare spir_func i32 @__spirv_GroupIAdd(i32, i32, i32) |
| declare spir_func i32 @__spirv_GroupUMin(i32, i32, i32) |
| declare spir_func i32 @__spirv_GroupSMin(i32, i32, i32) |
| declare spir_func i32 @__spirv_GroupUMax(i32, i32, i32) |
| declare spir_func i32 @__spirv_GroupSMax(i32, i32, i32) |