| ; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py UTC_ARGS: --version 5 |
| ; RUN: llc -mtriple=amdgcn-amd-amdhsa -mcpu=gfx1030 < %s | FileCheck %s |
| |
; Result record written by @extracted_values: two half-precision fields.
; The same identifier is also used below as the name of the function's
; pointer argument; the getelementptr instructions there use it once as the
; type operand and once as the pointer operand.
| %ret_struct = type { half, half } |
| |
; Loads a <2 x half> vector through each of the four addrspace(3) pointers,
; extracts element 1 of each, and stores two scalar results through the
; %ret_struct pointer argument:
;   field 0 = (arg1[1] - arg2[1]) + (arg0[1] - arg3[1])
;   field 1 = (arg2[1] - arg1[1]) + (arg3[1] - arg0[1])
; The expected assembly below has four ds_read_b32 loads, four
; v_sub_f16_sdwa subtractions that select WORD_1 of each source, two
; v_add_f16 additions, and a single v_pack_b32_f16 + flat_store_dword that
; writes both half fields at once.
; NOTE(review): the file does not say which regression this guards; the
; function name suggests handling of extracted vector elements - confirm
; against the commit that introduced the test.
| define void @extracted_values(ptr %ret_struct, ptr addrspace(3) %arg0, ptr addrspace(3) %arg1, ptr addrspace(3) %arg2, ptr addrspace(3) %arg3) { |
| ; CHECK-LABEL: extracted_values: |
| ; CHECK: ; %bb.0: ; %entry |
| ; CHECK-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0) |
| ; CHECK-NEXT: ds_read_b32 v3, v3 |
| ; CHECK-NEXT: ds_read_b32 v4, v4 |
| ; CHECK-NEXT: ds_read_b32 v2, v2 |
| ; CHECK-NEXT: ds_read_b32 v5, v5 |
| ; CHECK-NEXT: s_waitcnt lgkmcnt(2) |
| ; CHECK-NEXT: v_sub_f16_sdwa v6, v3, v4 dst_sel:DWORD dst_unused:UNUSED_PAD src0_sel:WORD_1 src1_sel:WORD_1 |
| ; CHECK-NEXT: v_sub_f16_sdwa v3, v4, v3 dst_sel:DWORD dst_unused:UNUSED_PAD src0_sel:WORD_1 src1_sel:WORD_1 |
| ; CHECK-NEXT: s_waitcnt lgkmcnt(0) |
| ; CHECK-NEXT: v_sub_f16_sdwa v7, v2, v5 dst_sel:DWORD dst_unused:UNUSED_PAD src0_sel:WORD_1 src1_sel:WORD_1 |
| ; CHECK-NEXT: v_sub_f16_sdwa v2, v5, v2 dst_sel:DWORD dst_unused:UNUSED_PAD src0_sel:WORD_1 src1_sel:WORD_1 |
| ; CHECK-NEXT: v_add_f16_e32 v4, v6, v7 |
| ; CHECK-NEXT: v_add_f16_e32 v2, v3, v2 |
| ; CHECK-NEXT: v_pack_b32_f16 v2, v4, v2 |
| ; CHECK-NEXT: flat_store_dword v[0:1], v2 |
| ; CHECK-NEXT: s_waitcnt lgkmcnt(0) |
| ; CHECK-NEXT: s_setpc_b64 s[30:31] |
| entry: |
; First pair: element 1 of the vectors at %arg1 and %arg2, and their
; difference (%arg1 element minus %arg2 element).
| %tmp0 = load <2 x half>, ptr addrspace(3) %arg1, align 4 |
| %tmp1 = extractelement <2 x half> %tmp0, i64 1 |
| %tmp2 = load <2 x half>, ptr addrspace(3) %arg2, align 4 |
| %tmp3 = extractelement <2 x half> %tmp2, i64 1 |
| %tmp4 = fsub contract half %tmp1, %tmp3 |
; Second pair: element 1 of the vectors at %arg0 and %arg3, and their
; difference (%arg0 element minus %arg3 element).
| %tmp5 = load <2 x half>, ptr addrspace(3) %arg0, align 4 |
| %tmp6 = extractelement <2 x half> %tmp5, i64 1 |
| %tmp7 = load <2 x half>, ptr addrspace(3) %arg3, align 4 |
| %tmp8 = extractelement <2 x half> %tmp7, i64 1 |
| %tmp9 = fsub contract half %tmp6, %tmp8 |
; Value for field 0: sum of the two differences.
| %tmp10 = fadd contract half %tmp4, %tmp9 |
; Value for field 1: the same two subtractions with their operands swapped,
; reusing the already extracted elements, then summed.
| %tmp11 = fsub contract half %tmp3, %tmp1 |
| %tmp12 = fsub contract half %tmp8, %tmp6 |
| %tmp13 = fadd contract half %tmp11, %tmp12 |
; In each getelementptr the first %ret_struct is the struct type and the
; second is the pointer argument; the last index selects field 0 or field 1.
| %field_ptr = getelementptr %ret_struct, ptr %ret_struct, i32 0, i32 0 |
| store half %tmp10, ptr %field_ptr, align 2 |
| %field_ptr1 = getelementptr %ret_struct, ptr %ret_struct, i32 0, i32 1 |
| store half %tmp13, ptr %field_ptr1, align 2 |
| ret void |
| } |