| // Make sure that blocks invoked from static functions with the same name in |
| // different modules are linked together correctly. |
| |
| // RUN: %clang_cc1 -O0 -cl-std=CL2.0 -triple amdgcn-amd-amdhsa -fno-ident -DKERNEL_NAME=test_kernel_first -DTYPE=float -DCONST=256.0f -emit-llvm-bc -o %t.0.bc %s |
| // RUN: %clang_cc1 -O0 -cl-std=CL2.0 -triple amdgcn-amd-amdhsa -fno-ident -DKERNEL_NAME=test_kernel_second -DTYPE=int -DCONST=128.0f -emit-llvm-bc -o %t.1.bc %s |
| |
| // Make sure nothing strange happens with the linkage choices. |
| // RUN: opt -passes=globalopt -o %t.opt.0.bc %t.0.bc |
| // RUN: opt -passes=globalopt -o %t.opt.1.bc %t.1.bc |
| |
| // Check the result of linking |
| // RUN: llvm-link -S %t.opt.0.bc %t.opt.1.bc -o - | FileCheck %s |
| |
| // Make sure that a block invoke used with the same name works in multiple |
| // translation units |
| |
| // CHECK: @llvm.used = appending addrspace(1) global [4 x ptr] [ptr @__static_invoker_block_invoke_kernel, ptr addrspacecast (ptr addrspace(1) @__static_invoker_block_invoke_kernel.runtime.handle to ptr), ptr @__static_invoker_block_invoke_kernel.2, ptr addrspacecast (ptr addrspace(1) @__static_invoker_block_invoke_kernel.runtime.handle.3 to ptr)], section "llvm.metadata" |
| |
| |
| // CHECK: @__static_invoker_block_invoke_kernel.runtime.handle = internal addrspace(1) externally_initialized constant %block.runtime.handle.t zeroinitializer, section ".amdgpu.kernel.runtime.handle" |
| // CHECK: @__static_invoker_block_invoke_kernel.runtime.handle.3 = internal addrspace(1) externally_initialized constant %block.runtime.handle.t zeroinitializer, section ".amdgpu.kernel.runtime.handle" |
| |
| // CHECK: define internal amdgpu_kernel void @__static_invoker_block_invoke_kernel(<{ i32, i32, ptr, ptr addrspace(1), ptr addrspace(1) }> %0) #{{[0-9]+}} !associated ![[ASSOC_FIRST_MD:[0-9]+]] |
| |
| |
| // CHECK-LABEL: define internal void @__static_invoker_block_invoke(ptr noundef %.block_descriptor) |
| // CHECK: call float @llvm.fmuladd.f32 |
| |
| |
| // CHECK-LABEL: define dso_local amdgpu_kernel void @test_kernel_first( |
| |
| |
| // CHECK-LABEL: define internal fastcc void @static_invoker(ptr addrspace(1) noundef %outptr, ptr addrspace(1) noundef %argptr) |
| // CHECK: call i32 @__enqueue_kernel_basic(ptr addrspace(1) %{{[0-9]+}}, i32 %{{[0-9]+}}, ptr addrspace(5) %tmp, ptr addrspacecast (ptr addrspace(1) @__static_invoker_block_invoke_kernel.runtime.handle to ptr), ptr %{{.+}}) |
| |
| // CHECK: declare i32 @__enqueue_kernel_basic(ptr addrspace(1), i32, ptr addrspace(5), ptr, ptr) local_unnamed_addr |
| |
| |
| // CHECK: define internal amdgpu_kernel void @__static_invoker_block_invoke_kernel.2(<{ i32, i32, ptr, ptr addrspace(1), ptr addrspace(1) }> %0) #{{[0-9]+}} !associated ![[ASSOC_SECOND_MD:[0-9]+]] |
| // CHECK: call void @__static_invoker_block_invoke.4(ptr % |
| |
| |
| // CHECK-LABEL: define internal void @__static_invoker_block_invoke.4(ptr noundef %.block_descriptor) |
| // CHECK: mul nsw i32 |
| // CHECK: sitofp |
| // CHECK: fadd |
| // CHECK: fptosi |
| |
| // CHECK-LABEL: define dso_local amdgpu_kernel void @test_kernel_second(ptr addrspace(1) noundef align 4 %outptr, ptr addrspace(1) noundef align 4 %argptr, ptr addrspace(1) noundef align 4 %difference) |
| |
| // CHECK-LABEL: define internal fastcc void @static_invoker.5(ptr addrspace(1) noundef %outptr, ptr addrspace(1) noundef %argptr) unnamed_addr #{{[0-9]+}} { |
| // CHECK: call i32 @__enqueue_kernel_basic(ptr addrspace(1) %{{[0-9]+}}, i32 %{{[0-9]+}}, ptr addrspace(5) %tmp, ptr addrspacecast (ptr addrspace(1) @__static_invoker_block_invoke_kernel.runtime.handle.3 to ptr), ptr %{{.+}}) |
| |
| |
| /* Local definition of ndrange_t: a struct holding a single int. It is the |
| * type of the ndrange argument passed to enqueue_kernel in static_invoker. |
| * NOTE(review): presumably defined here because the clang_cc1 invocations at |
| * the top of this file do not pull in an OpenCL builtin header -- confirm. |
| */ typedef struct {int a;} ndrange_t; |
| |
| /* Enqueues a block that stores argptr[1] * argptr[2] + CONST to outptr[0]. |
| * TYPE and CONST are macros supplied with -D on the clang_cc1 command lines |
| * at the top of this file, so each compiled module gets its own element type |
| * and constant. The function is static and has the same name in both |
| * modules, which is the situation this test links together. |
| */ static void static_invoker(global TYPE* outptr, global TYPE* argptr) { |
| queue_t default_queue; /* declared without an initializer and passed as-is */ |
| unsigned flags = 0; |
| ndrange_t ndrange; /* its member is never assigned before the call */ |
| |
| enqueue_kernel(default_queue, flags, ndrange, /* the call's result is not used */ |
| ^(void) { |
| global TYPE* f = argptr; /* the block refers to argptr and outptr of the enclosing function */ |
| outptr[0] = f[1] * f[2] + CONST; |
| }); |
| } |
| |
| /* Kernel entry point; KERNEL_NAME is a macro supplied with -D, one name per |
| * compiled module. Forwards outptr and argptr to static_invoker, then stores |
| * CONST through difference. |
| */ kernel void KERNEL_NAME(global TYPE *outptr, global TYPE *argptr, global TYPE *difference) { |
| queue_t default_queue; /* not referenced in this function */ |
| unsigned flags = 0; /* not referenced in this function */ |
| ndrange_t ndrange; /* not referenced in this function */ |
| |
| static_invoker(outptr, argptr); |
| |
| *difference = CONST; /* CONST is implicitly converted when TYPE is not its own type (e.g. TYPE=int with a float CONST) */ |
| } |
| |
| // CHECK: ![[ASSOC_FIRST_MD]] = !{ptr addrspace(1) @__static_invoker_block_invoke_kernel.runtime.handle} |
| // CHECK: ![[ASSOC_SECOND_MD]] = !{ptr addrspace(1) @__static_invoker_block_invoke_kernel.runtime.handle.3} |