blob: a070fa1a3ea8e3bcce5940de3bd77191f07997f0 [file] [edit]
; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py UTC_ARGS: --version 6
; RUN: llc -global-isel=0 -mtriple=amdgcn -mcpu=gfx1250 < %s | FileCheck --check-prefix=SDAG %s
; RUN: llc -global-isel=1 -new-reg-bank-select -mtriple=amdgcn -mcpu=gfx1250 < %s | FileCheck --check-prefix=GISEL %s
declare i64 @llvm.amdgcn.ds.atomic.barrier.arrive.rtn.b64(ptr addrspace(3), i64)
define void @test_ds_atomic_barrier_arrive_rtn_b64(i64 %data, ptr addrspace(3) %bar, ptr %out) {
; SDAG-LABEL: test_ds_atomic_barrier_arrive_rtn_b64:
; SDAG: ; %bb.0: ; %entry
; SDAG-NEXT: s_wait_loadcnt_dscnt 0x0
; SDAG-NEXT: s_wait_kmcnt 0x0
; SDAG-NEXT: ds_atomic_barrier_arrive_rtn_b64 v[0:1], v2, v[0:1]
; SDAG-NEXT: v_dual_mov_b32 v5, v4 :: v_dual_mov_b32 v4, v3
; SDAG-NEXT: s_wait_dscnt 0x0
; SDAG-NEXT: flat_store_b64 v[4:5], v[0:1]
; SDAG-NEXT: s_wait_dscnt 0x0
; SDAG-NEXT: s_set_pc_i64 s[30:31]
;
; GISEL-LABEL: test_ds_atomic_barrier_arrive_rtn_b64:
; GISEL: ; %bb.0: ; %entry
; GISEL-NEXT: s_wait_loadcnt_dscnt 0x0
; GISEL-NEXT: s_wait_kmcnt 0x0
; GISEL-NEXT: ds_atomic_barrier_arrive_rtn_b64 v[0:1], v2, v[0:1]
; GISEL-NEXT: v_dual_mov_b32 v6, v3 :: v_dual_mov_b32 v7, v4
; GISEL-NEXT: s_wait_dscnt 0x0
; GISEL-NEXT: flat_store_b64 v[6:7], v[0:1]
; GISEL-NEXT: s_wait_dscnt 0x0
; GISEL-NEXT: s_set_pc_i64 s[30:31]
entry:
%ret = call i64 @llvm.amdgcn.ds.atomic.barrier.arrive.rtn.b64(ptr addrspace(3) %bar, i64 %data)
store i64 %ret, ptr %out
ret void
}
define void @test_ds_atomic_barrier_arrive_rtn_b64_off(ptr addrspace(3) %in, ptr %out) {
; SDAG-LABEL: test_ds_atomic_barrier_arrive_rtn_b64_off:
; SDAG: ; %bb.0: ; %entry
; SDAG-NEXT: s_wait_loadcnt_dscnt 0x0
; SDAG-NEXT: s_wait_kmcnt 0x0
; SDAG-NEXT: v_mov_b64_e32 v[4:5], 0x200
; SDAG-NEXT: v_dual_mov_b32 v3, v2 :: v_dual_mov_b32 v2, v1
; SDAG-NEXT: ds_atomic_barrier_arrive_rtn_b64 v[0:1], v0, v[4:5] offset:8184
; SDAG-NEXT: s_wait_dscnt 0x0
; SDAG-NEXT: flat_store_b64 v[2:3], v[0:1]
; SDAG-NEXT: s_wait_dscnt 0x0
; SDAG-NEXT: s_set_pc_i64 s[30:31]
;
; GISEL-LABEL: test_ds_atomic_barrier_arrive_rtn_b64_off:
; GISEL: ; %bb.0: ; %entry
; GISEL-NEXT: s_wait_loadcnt_dscnt 0x0
; GISEL-NEXT: s_wait_kmcnt 0x0
; GISEL-NEXT: v_dual_mov_b32 v4, v1 :: v_dual_mov_b32 v5, v2
; GISEL-NEXT: v_mov_b64_e32 v[2:3], 0x200
; GISEL-NEXT: ds_atomic_barrier_arrive_rtn_b64 v[0:1], v0, v[2:3] offset:8184
; GISEL-NEXT: s_wait_dscnt 0x0
; GISEL-NEXT: flat_store_b64 v[4:5], v[0:1]
; GISEL-NEXT: s_wait_dscnt 0x0
; GISEL-NEXT: s_set_pc_i64 s[30:31]
entry:
%bar = getelementptr i64, ptr addrspace(3) %in, i32 1023
%ret = call i64 @llvm.amdgcn.ds.atomic.barrier.arrive.rtn.b64(ptr addrspace(3) %bar, i64 512)
store i64 %ret, ptr %out
ret void
}
define amdgpu_ps void @test_ds_atomic_barrier_arrive_rtn_b64_ss(ptr addrspace(3) inreg %bar, i64 inreg %data, ptr inreg %out) {
; SDAG-LABEL: test_ds_atomic_barrier_arrive_rtn_b64_ss:
; SDAG: ; %bb.0: ; %entry
; SDAG-NEXT: s_setreg_imm32_b32 hwreg(HW_REG_WAVE_MODE, 25, 1), 1 ; msbs: dst=0 src0=0 src1=0 src2=0
; SDAG-NEXT: v_dual_mov_b32 v0, s1 :: v_dual_mov_b32 v1, s2
; SDAG-NEXT: v_mov_b32_e32 v2, s0
; SDAG-NEXT: s_mov_b32 s5, s4
; SDAG-NEXT: s_mov_b32 s4, s3
; SDAG-NEXT: ds_atomic_barrier_arrive_rtn_b64 v[0:1], v2, v[0:1]
; SDAG-NEXT: v_mov_b32_e32 v2, 0
; SDAG-NEXT: s_wait_dscnt 0x0
; SDAG-NEXT: flat_store_b64 v2, v[0:1], s[4:5]
; SDAG-NEXT: s_endpgm
;
; GISEL-LABEL: test_ds_atomic_barrier_arrive_rtn_b64_ss:
; GISEL: ; %bb.0: ; %entry
; GISEL-NEXT: s_setreg_imm32_b32 hwreg(HW_REG_WAVE_MODE, 25, 1), 1 ; msbs: dst=0 src0=0 src1=0 src2=0
; GISEL-NEXT: s_mov_b32 s6, s1
; GISEL-NEXT: s_mov_b32 s7, s2
; GISEL-NEXT: v_mov_b32_e32 v2, s0
; GISEL-NEXT: v_mov_b64_e32 v[0:1], s[6:7]
; GISEL-NEXT: s_mov_b32 s2, s3
; GISEL-NEXT: s_mov_b32 s3, s4
; GISEL-NEXT: ds_atomic_barrier_arrive_rtn_b64 v[0:1], v2, v[0:1]
; GISEL-NEXT: v_mov_b32_e32 v2, 0
; GISEL-NEXT: s_wait_dscnt 0x0
; GISEL-NEXT: flat_store_b64 v2, v[0:1], s[2:3]
; GISEL-NEXT: s_endpgm
entry:
%ret = call i64 @llvm.amdgcn.ds.atomic.barrier.arrive.rtn.b64(ptr addrspace(3) %bar, i64 %data)
store i64 %ret, ptr %out
ret void
}