blob: 0020c2272d23e9c6f75839a7ca9068e3935ea37d [file] [edit]
; RUN: llc -mtriple=amdgcn-amd-amdhsa -mcpu=gfx900 -amdgpu-enable-object-linking < %s | FileCheck -check-prefixes=ASM %s --implicit-check-not=.amdgpu_num_agpr
; RUN: llc -mtriple=amdgcn-amd-amdhsa -mcpu=gfx900 -amdgpu-enable-object-linking -filetype=obj < %s | llvm-readobj -r --syms --sections - | FileCheck -check-prefixes=ELF %s
; Test that with object linking enabled, external LDS declarations produce
; @abs32@lo relocations, SHN_AMDGPU_LDS symbols, .amdgpu_lds directives,
; and .amdgpu_use edges in the .amdgpu.info section. Covers multiple LDS
; variables with different sizes and alignments (including zero-sized dynamic
; LDS), usage from both kernels and device functions, and
; group_segment_fixed_size = 0 (linker patches via binary patching).
@lds_large = external addrspace(3) global [256 x i8], align 16
@lds_small = external addrspace(3) global [128 x i8], align 4
@lds_dynamic = external addrspace(3) global [0 x i8], align 8
; Instruction-level relocation checks.
; ASM-LABEL: {{^}}device_func:
; ASM: v_add_u32_e32 v{{[0-9]+}}, lds_large@abs32@lo, v{{[0-9]+}}
; ASM-LABEL: {{^}}test_kernel:
; ASM-DAG: s_add_i32 s{{[0-9]+}}, s{{[0-9]+}}, lds_small@abs32@lo
; ASM-DAG: s_add_i32 s{{[0-9]+}}, s{{[0-9]+}}, lds_dynamic@abs32@lo
; .amdgpu.info section with LDS use edges.
; ASM-DAG: .amdgpu_info device_func
; ASM-DAG: .amdgpu_flags {{[0-9]+}}
; ASM-DAG: .amdgpu_num_vgpr {{[0-9]+}}
; ASM-DAG: .amdgpu_num_sgpr {{[0-9]+}}
; ASM-DAG: .amdgpu_private_segment_size {{[0-9]+}}
; ASM-DAG: .amdgpu_use lds_large
; ASM-DAG: .end_amdgpu_info
; ASM-DAG: .amdgpu_info test_kernel
; ASM-DAG: .amdgpu_flags {{[0-9]+}}
; ASM-DAG: .amdgpu_num_vgpr {{[0-9]+}}
; ASM-DAG: .amdgpu_num_sgpr {{[0-9]+}}
; ASM-DAG: .amdgpu_private_segment_size {{[0-9]+}}
; ASM-DAG: .amdgpu_use lds_dynamic
; ASM-DAG: .amdgpu_use lds_small
; ASM-DAG: .amdgpu_call device_func
; ASM-DAG: .end_amdgpu_info
; SHN_AMDGPU_LDS directives.
; ASM-DAG: .amdgpu_lds lds_large, 256, 16
; ASM-DAG: .amdgpu_lds lds_small, 128, 4
; ASM-DAG: .amdgpu_lds lds_dynamic, 0, 8
; ASM: .group_segment_fixed_size: 0
; .amdgpu.info section exists.
; ELF: Section {
; ELF: Name: .amdgpu.info
; ELF: Type: SHT_PROGBITS
; ELF: Flags [
; ELF: SHF_EXCLUDE
; Relocations.
; ELF-DAG: R_AMDGPU_ABS32_LO lds_large
; ELF-DAG: R_AMDGPU_ABS32_LO lds_small
; ELF-DAG: R_AMDGPU_ABS32_LO lds_dynamic
; ELF-DAG: R_AMDGPU_ABS64 device_func
; ELF-DAG: R_AMDGPU_ABS64 test_kernel
; ELF-DAG: R_AMDGPU_ABS64 lds_large
; ELF-DAG: R_AMDGPU_ABS64 lds_small
; ELF-DAG: R_AMDGPU_ABS64 lds_dynamic
; SHN_AMDGPU_LDS symbols.
; ELF-DAG: Name: lds_large
; ELF-DAG: Name: lds_small
; ELF-DAG: Name: lds_dynamic
define void @device_func(i32 %idx) {
%gep = getelementptr [256 x i8], ptr addrspace(3) @lds_large, i32 0, i32 %idx
store i8 1, ptr addrspace(3) %gep
ret void
}
define amdgpu_kernel void @test_kernel(i32 %idx) {
%gep1 = getelementptr [128 x i8], ptr addrspace(3) @lds_small, i32 0, i32 %idx
store i8 2, ptr addrspace(3) %gep1
%gep2 = getelementptr [0 x i8], ptr addrspace(3) @lds_dynamic, i32 0, i32 %idx
store i8 3, ptr addrspace(3) %gep2
call void @device_func(i32 %idx)
ret void
}