| ; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py |
| ; RUN: llc -global-isel -mtriple=amdgcn--amdhsa -mcpu=gfx900 < %s | FileCheck -check-prefix=GCN %s |
| |
| define amdgpu_kernel void @test_wave64(i32 %arg0, i64 %saved) { |
| ; GCN-LABEL: test_wave64: |
| ; GCN: ; %bb.0: ; %entry |
| ; GCN-NEXT: s_load_dword s0, s[8:9], 0x0 |
| ; GCN-NEXT: s_waitcnt lgkmcnt(0) |
| ; GCN-NEXT: s_cmp_lg_u32 s0, 0 |
| ; GCN-NEXT: s_cbranch_scc1 .LBB0_2 |
| ; GCN-NEXT: ; %bb.1: ; %mid |
| ; GCN-NEXT: v_mov_b32_e32 v0, 0 |
| ; GCN-NEXT: global_store_dword v[0:1], v0, off |
| ; GCN-NEXT: s_waitcnt vmcnt(0) |
| ; GCN-NEXT: .LBB0_2: ; %bb |
| ; GCN-NEXT: s_load_dwordx2 s[0:1], s[8:9], 0x8 |
| ; GCN-NEXT: s_waitcnt lgkmcnt(0) |
| ; GCN-NEXT: s_or_b64 exec, exec, s[0:1] |
| ; GCN-NEXT: v_mov_b32_e32 v0, 0 |
| ; GCN-NEXT: global_store_dword v[0:1], v0, off |
| ; GCN-NEXT: s_waitcnt vmcnt(0) |
| ; GCN-NEXT: s_endpgm |
| entry: |
| %cond = icmp eq i32 %arg0, 0 |
| br i1 %cond, label %mid, label %bb |
| |
| mid: |
| store volatile i32 0, ptr addrspace(1) poison |
| br label %bb |
| |
| bb: |
| call void @llvm.amdgcn.end.cf.i64(i64 %saved) |
| store volatile i32 0, ptr addrspace(1) poison |
| ret void |
| } |
| |
| declare void @llvm.amdgcn.end.cf.i64(i64 %val) |