; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py UTC_ARGS: --version 5
; RUN: llc -mtriple=amdgcn-amd-amdhsa -mcpu=gfx1030 < %s | FileCheck %s
; Aggregate of two half fields. @extracted_values addresses field 0 and
; field 1 of it through getelementptr and stores one half into each.
%ret_struct = type { half, half }
; Loads one <2 x half> vector through each of the four addrspace(3) pointers,
; takes element 1 of every vector, and forms two half results:
;   field 0 = (arg1[1] - arg2[1]) + (arg0[1] - arg3[1])
;   field 1 = (arg2[1] - arg1[1]) + (arg3[1] - arg0[1])
; Each result is stored to its own half field of the struct behind %ret_struct.
;
; The expected gfx1030 output recorded below reads each vector with
; ds_read_b32, performs the four subtractions as v_sub_f16_sdwa selecting
; WORD_1 of both sources, adds the differences with v_add_f16_e32, and merges
; the two results via v_pack_b32_f16 into a single flat_store_dword.
;
; NOTE(review): the assertion lines inside this function are autogenerated
; (see the note at the top of the file); regenerate them with the update
; script instead of editing them by hand.
define void @extracted_values(ptr %ret_struct, ptr addrspace(3) %arg0, ptr addrspace(3) %arg1, ptr addrspace(3) %arg2, ptr addrspace(3) %arg3) {
; CHECK-LABEL: extracted_values:
; CHECK: ; %bb.0: ; %entry
; CHECK-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
; CHECK-NEXT: ds_read_b32 v3, v3
; CHECK-NEXT: ds_read_b32 v4, v4
; CHECK-NEXT: ds_read_b32 v2, v2
; CHECK-NEXT: ds_read_b32 v5, v5
; CHECK-NEXT: s_waitcnt lgkmcnt(2)
; CHECK-NEXT: v_sub_f16_sdwa v6, v3, v4 dst_sel:DWORD dst_unused:UNUSED_PAD src0_sel:WORD_1 src1_sel:WORD_1
; CHECK-NEXT: v_sub_f16_sdwa v3, v4, v3 dst_sel:DWORD dst_unused:UNUSED_PAD src0_sel:WORD_1 src1_sel:WORD_1
; CHECK-NEXT: s_waitcnt lgkmcnt(0)
; CHECK-NEXT: v_sub_f16_sdwa v7, v2, v5 dst_sel:DWORD dst_unused:UNUSED_PAD src0_sel:WORD_1 src1_sel:WORD_1
; CHECK-NEXT: v_sub_f16_sdwa v2, v5, v2 dst_sel:DWORD dst_unused:UNUSED_PAD src0_sel:WORD_1 src1_sel:WORD_1
; CHECK-NEXT: v_add_f16_e32 v4, v6, v7
; CHECK-NEXT: v_add_f16_e32 v2, v3, v2
; CHECK-NEXT: v_pack_b32_f16 v2, v4, v2
; CHECK-NEXT: flat_store_dword v[0:1], v2
; CHECK-NEXT: s_waitcnt lgkmcnt(0)
; CHECK-NEXT: s_setpc_b64 s[30:31]
entry:
; First difference: element 1 of the %arg1 vector minus element 1 of the
; %arg2 vector.
%tmp0 = load <2 x half>, ptr addrspace(3) %arg1, align 4
%tmp1 = extractelement <2 x half> %tmp0, i64 1
%tmp2 = load <2 x half>, ptr addrspace(3) %arg2, align 4
%tmp3 = extractelement <2 x half> %tmp2, i64 1
%tmp4 = fsub contract half %tmp1, %tmp3
; Second difference: element 1 of the %arg0 vector minus element 1 of the
; %arg3 vector.
%tmp5 = load <2 x half>, ptr addrspace(3) %arg0, align 4
%tmp6 = extractelement <2 x half> %tmp5, i64 1
%tmp7 = load <2 x half>, ptr addrspace(3) %arg3, align 4
%tmp8 = extractelement <2 x half> %tmp7, i64 1
%tmp9 = fsub contract half %tmp6, %tmp8
; Value for field 0: sum of the two differences above.
%tmp10 = fadd contract half %tmp4, %tmp9
; Value for field 1: the same extracted elements are reused, but each
; subtraction has its operands swapped relative to %tmp4 and %tmp9.
%tmp11 = fsub contract half %tmp3, %tmp1
%tmp12 = fsub contract half %tmp8, %tmp6
%tmp13 = fadd contract half %tmp11, %tmp12
; Two separate half stores, one per struct field; the expected output above
; shows them emitted as one packed dword store.
%field_ptr = getelementptr %ret_struct, ptr %ret_struct, i32 0, i32 0
store half %tmp10, ptr %field_ptr, align 2
%field_ptr1 = getelementptr %ret_struct, ptr %ret_struct, i32 0, i32 1
store half %tmp13, ptr %field_ptr1, align 2
ret void
}