; RUN: llc < %s -mcpu=corei7 -mtriple=x86_64-pc-win64 | FileCheck %s
; CHECK: merge_stores_can
; CHECK: callq foo
; CHECK: xorps %xmm0, %xmm0
; CHECK-NEXT: movups %xmm0
; CHECK-NEXT: movl 36(%rsp), %ebp
; CHECK: callq foo
; CHECK: ret
; External function taking a pointer and returning i32. Only the declaration
; is present in this file, so calls to it are opaque to the optimizer here.
declare i32 @foo(ptr )
; Positive case: four zero stores to consecutive i32 elements 1..4 of a local
; stack array, with a load of element 9 of the same array placed between the
; second and third store. The load reads a different element than any of the
; stores write, so the expectations listed before this function look for one
; xorps/movups pair (a single vector store of zeros) immediately followed by
; the scalar load.
define i32 @merge_stores_can() nounwind ssp {
; Local array of ten i32 values; its address is passed to @foo before and
; after the stores.
%object1 = alloca [10 x i32]
%ret0 = call i32 @foo(ptr %object1) nounwind
; Addresses of elements 1, 2, 3 and 4 (the store targets).
%O1_1 = getelementptr [10 x i32], ptr %object1, i64 0, i32 1
%O1_2 = getelementptr [10 x i32], ptr %object1, i64 0, i32 2
%O1_3 = getelementptr [10 x i32], ptr %object1, i64 0, i32 3
%O1_4 = getelementptr [10 x i32], ptr %object1, i64 0, i32 4
; Address of element 9 (the load source), outside the stored range 1..4.
%ld_ptr = getelementptr [10 x i32], ptr %object1, i64 0, i32 9
store i32 0, ptr %O1_1
store i32 0, ptr %O1_2
%ret = load i32, ptr %ld_ptr ; <--- does not alias: element 9 is not written by any of the four stores.
store i32 0, ptr %O1_3
store i32 0, ptr %O1_4
%ret1 = call i32 @foo(ptr %object1) nounwind
; The value loaded from element 9 is the function result.
ret i32 %ret
}
; CHECK: merge_stores_cant
; CHECK-NOT: xorps %xmm0, %xmm0
; CHECK-NOT: movups %xmm0
; CHECK: ret
; Negative case: the same store/load/store pattern as @merge_stores_can, but
; the stores go through %in1 and the load goes through %in0. Both are plain
; pointer arguments with no noalias attribute, so the load may read memory
; written by the stores. The expectations listed before this function require
; that no xorps/movups pair appears in the generated code.
define i32 @merge_stores_cant(ptr %in0, ptr %in1) nounwind ssp {
; Addresses of elements 1, 2, 3 and 4 relative to %in1 (the store targets).
%O1_1 = getelementptr [10 x i32], ptr %in1, i64 0, i32 1
%O1_2 = getelementptr [10 x i32], ptr %in1, i64 0, i32 2
%O1_3 = getelementptr [10 x i32], ptr %in1, i64 0, i32 3
%O1_4 = getelementptr [10 x i32], ptr %in1, i64 0, i32 4
; Address of element 2 relative to %in0 (the load source).
%ld_ptr = getelementptr [10 x i32], ptr %in0, i64 0, i32 2
store i32 0, ptr %O1_1
store i32 0, ptr %O1_2
%ret = load i32, ptr %ld_ptr ; <--- may alias: %in0 and %in1 are unrelated arguments and could point to overlapping memory.
store i32 0, ptr %O1_3
store i32 0, ptr %O1_4
; The value loaded through %in0 is the function result.
ret i32 %ret
}