; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py UTC_ARGS: --version 2
; RUN: llc -mtriple=amdgcn-amd-amdhsa -mcpu=gfx90a < %s | FileCheck %s
; Regression test for a bug in `DAGCombiner::replaceStoreOfInsertLoad` where
; Idx could be smaller than PtrVT, causing a MUL to be emitted with inconsistent
; LHS/RHS types.
define void @testcase_0(ptr addrspace(1) %in, float %arg) {
; CHECK-LABEL: testcase_0:
; CHECK: ; %bb.0:
; CHECK-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
; CHECK-NEXT: global_store_dword v[0:1], v2, off offset:12
; CHECK-NEXT: s_waitcnt vmcnt(0)
; CHECK-NEXT: s_setpc_b64 s[30:31]
%loaded = load <4 x float>, ptr addrspace(1) %in
%modified = insertelement <4 x float> %loaded, float %arg, i64 3
store <4 x float> %modified, ptr addrspace(1) %in
ret void
}
define void @testcase_1(ptr addrspace(1) %in, float %arg) {
; CHECK-LABEL: testcase_1:
; CHECK: ; %bb.0:
; CHECK-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
; CHECK-NEXT: global_store_dword v[0:1], v2, off offset:16
; CHECK-NEXT: s_waitcnt vmcnt(0)
; CHECK-NEXT: s_setpc_b64 s[30:31]
%loaded = load <6 x float>, ptr addrspace(1) %in
%modified = insertelement <6 x float> %loaded, float %arg, i64 4
store <6 x float> %modified, ptr addrspace(1) %in
ret void
}
define void @testcase_2(ptr addrspace(1) %in, double %arg) {
; CHECK-LABEL: testcase_2:
; CHECK: ; %bb.0:
; CHECK-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
; CHECK-NEXT: global_store_dwordx2 v[0:1], v[2:3], off offset:8
; CHECK-NEXT: s_waitcnt vmcnt(0)
; CHECK-NEXT: s_setpc_b64 s[30:31]
%loaded = load <4 x double>, ptr addrspace(1) %in
%modified = insertelement <4 x double> %loaded, double %arg, i64 1
store <4 x double> %modified, ptr addrspace(1) %in
ret void
}
define void @testcase_3(ptr addrspace(1) %in, double %arg) {
; CHECK-LABEL: testcase_3:
; CHECK: ; %bb.0:
; CHECK-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
; CHECK-NEXT: global_store_dwordx2 v[0:1], v[2:3], off offset:56
; CHECK-NEXT: s_waitcnt vmcnt(0)
; CHECK-NEXT: s_setpc_b64 s[30:31]
%loaded = load <8 x double>, ptr addrspace(1) %in
%modified = insertelement <8 x double> %loaded, double %arg, i64 7
store <8 x double> %modified, ptr addrspace(1) %in
ret void
}