| ; RUN: llc -march=amdgcn -mcpu=gfx1010 -verify-machineinstrs -amdgpu-s-branch-bits=4 < %s | FileCheck -enable-var-scope -check-prefixes=GCN,GFX10 %s |
| ; RUN: llc -march=amdgcn -mcpu=gfx900 -verify-machineinstrs -amdgpu-s-branch-bits=4 < %s | FileCheck -enable-var-scope -check-prefixes=GCN,GFX9 %s |
| ; Make sure the code size estimate for inline asm is 12-bytes per |
| ; instruction, rather than 8 in previous generations. |
| ; GCN-LABEL: {{^}}long_forward_branch_gfx10only: |
| ; GFX9-NEXT: s_cbranch_scc1 |
| ; GFX10-NEXT: s_cbranch_scc0 |
| define amdgpu_kernel void @long_forward_branch_gfx10only(i32 addrspace(1)* %arg, i32 %cnd) #0 { |
| %cmp = icmp eq i32 %cnd, 0 |
| br i1 %cmp, label %bb3, label %bb2 ; +9 dword branch |
| ; Estimated as 40-bytes on gfx10 (requiring a long branch), but |
| ; 16-bytes on gfx9 (allowing a short branch) |
| store volatile i32 %cnd, i32 addrspace(1)* %arg |