; RUN: llc < %s -mtriple=thumbv7-apple-ios -relocation-model=pic -mcpu=cortex-a8 | FileCheck %s
; Do not move the umull above the preceding call: doing so would require the
; use of more callee-saved registers and introduce extra copies.
; rdar://9329627
; Named struct types. Neither is referenced by the function visible in this
; test; they appear to be leftovers from the original reduced source.
%struct.FF = type { ptr, ptr, ptr, ptr, ptr, ptr }
%struct.BD = type { ptr, i32, i32, i32, i32, i64, ptr, ptr, ptr, ptr, ptr, [16 x i8], i64, i64 }
; Destination of the pointer returned by @Get (stored in block bb1 of @test).
@FuncPtr = external hidden unnamed_addr global ptr
; Passed as the first argument to @foo in block bb1 of @test.
@.str1 = external hidden unnamed_addr constant [6 x i8], align 4
; Loaded in the entry block (as an argument to @bar) and again in block bb.
@G = external unnamed_addr global i32
; The two constants below are not referenced by the visible function.
@.str2 = external hidden unnamed_addr constant [58 x i8], align 4
@.str3 = external hidden unnamed_addr constant [58 x i8], align 4
; Scheduling regression test: the 64-bit multiply in bb1 (expected to be
; selected as a umull, per the directives in that block) must stay after the
; call to @Get. The FileCheck directive comments inside the body are part of
; the test and must not be edited.
define i32 @test() nounwind optsize ssp {
entry:
; A push must appear in the prologue, and no further push may appear before
; the next matched line (the %bb1 block).
; CHECK-LABEL: test:
; CHECK: push
; CHECK-NOT: push
; Three stack slots. Only %index_cache is written in this function; no store
; to %block_size or %block_count is visible, so the loads of them in bb1 read
; uninitialized memory.
%block_size = alloca i32, align 4
%block_count = alloca i32, align 4
%index_cache = alloca i32, align 4
store i32 0, ptr %index_cache, align 4
%tmp = load i32, ptr @G, align 4
%tmp1 = call i32 @bar(i32 0, i32 0, i32 %tmp) nounwind
; Dispatch on the result of @bar: 0 -> bb, 0x20000001 -> bb4,
; 0x20000002 -> bb6, anything else -> bb8.
switch i32 %tmp1, label %bb8 [
i32 0, label %bb
i32 536870913, label %bb4
i32 536870914, label %bb6
]
bb:
; Reload @G after the call; continue to bb1 only when it is zero.
%tmp2 = load i32, ptr @G, align 4
%tmp4 = icmp eq i32 %tmp2, 0
br i1 %tmp4, label %bb1, label %bb8
bb1:
; Expected order within this block: no umull before the call to Get, then
; the umull, then the call to foo.
; CHECK: %bb1
; CHECK-NOT: umull
; CHECK: bl _Get
; CHECK: umull
; CHECK: bl _foo
; Both operands are loaded before the call to @Get, while the multiply that
; consumes them comes after it. %tmp5 is also passed to @foo afterwards.
%tmp5 = load i32, ptr %block_size, align 4
%tmp6 = load i32, ptr %block_count, align 4
%tmp7 = call ptr @Get() nounwind
store ptr %tmp7, ptr @FuncPtr, align 4
; Zero-extend both 32-bit operands and form the 64-bit product.
%tmp10 = zext i32 %tmp6 to i64
%tmp11 = zext i32 %tmp5 to i64
%tmp12 = mul nsw i64 %tmp10, %tmp11
; The result of @foo is unused; control falls through to the -1 return.
%tmp13 = call i32 @foo(ptr @.str1, i64 %tmp12, i32 %tmp5) nounwind
br label %bb8
bb4:
ret i32 0
bb6:
ret i32 1
bb8:
; Default / fall-through exit.
ret i32 -1
}
; External functions. @printf has no caller in the visible function.
declare i32 @printf(ptr, ...)
; Called in bb1 of @test; its result is stored to @FuncPtr.
declare ptr @Get()
; Called in bb1 of @test with @.str1, the 64-bit product, and %tmp5.
declare i32 @foo(ptr, i64, i32)
; Called in the entry block of @test; its result drives the switch.
declare i32 @bar(i32, i32, i32)