llvm/llvm/test/CodeGen/ARM/aapcs-hfa-code.ll

; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py UTC_ARGS: --version 4
; RUN: llc < %s -mtriple=armv7-linux-gnueabihf -o - | FileCheck %s
; RUN: llc < %s -mtriple=thumbv7em-none-eabi -mcpu=cortex-m4 | FileCheck %s --check-prefix=CHECK-M4F

target datalayout = "e-m:e-p:32:32-i64:64-v128:64:128-n32-S64"

define arm_aapcs_vfpcc void @test_1float({ float } %a) {
; CHECK-LABEL: test_1float:
; CHECK:       @ %bb.0:
; CHECK-NEXT:    .save {r11, lr}
; CHECK-NEXT:    push {r11, lr}
; CHECK-NEXT:    vmov.f32 s0, #1.000000e+00
; CHECK-NEXT:    bl test_1float
; CHECK-NEXT:    pop {r11, pc}
;
; CHECK-M4F-LABEL: test_1float:
; CHECK-M4F:       @ %bb.0:
; CHECK-M4F-NEXT:    .save {r7, lr}
; CHECK-M4F-NEXT:    push {r7, lr}
; CHECK-M4F-NEXT:    vmov.f32 s0, #1.000000e+00
; CHECK-M4F-NEXT:    bl test_1float
; CHECK-M4F-NEXT:    pop {r7, pc}
  call arm_aapcs_vfpcc void @test_1float({ float } { float 1.0 })
  ret void
}

define arm_aapcs_vfpcc void @test_2float({ float, float } %a) {
; CHECK-LABEL: test_2float:
; CHECK:       @ %bb.0:
; CHECK-NEXT:    .save {r11, lr}
; CHECK-NEXT:    push {r11, lr}
; CHECK-NEXT:    vmov.f32 s0, #1.000000e+00
; CHECK-NEXT:    vmov.f32 s1, #2.000000e+00
; CHECK-NEXT:    bl test_2float
; CHECK-NEXT:    pop {r11, pc}
;
; CHECK-M4F-LABEL: test_2float:
; CHECK-M4F:       @ %bb.0:
; CHECK-M4F-NEXT:    .save {r7, lr}
; CHECK-M4F-NEXT:    push {r7, lr}
; CHECK-M4F-NEXT:    vmov.f32 s0, #1.000000e+00
; CHECK-M4F-NEXT:    vmov.f32 s1, #2.000000e+00
; CHECK-M4F-NEXT:    bl test_2float
; CHECK-M4F-NEXT:    pop {r7, pc}
  call arm_aapcs_vfpcc void @test_2float({ float, float } { float 1.0, float 2.0 })
  ret void
}

define arm_aapcs_vfpcc void @test_3float({ float, float, float } %a) {
; CHECK-LABEL: test_3float:
; CHECK:       @ %bb.0:
; CHECK-NEXT:    .save {r11, lr}
; CHECK-NEXT:    push {r11, lr}
; CHECK-NEXT:    vmov.f32 s0, #1.000000e+00
; CHECK-NEXT:    vmov.f32 s1, #2.000000e+00
; CHECK-NEXT:    vmov.f32 s2, #3.000000e+00
; CHECK-NEXT:    bl test_3float
; CHECK-NEXT:    pop {r11, pc}
;
; CHECK-M4F-LABEL: test_3float:
; CHECK-M4F:       @ %bb.0:
; CHECK-M4F-NEXT:    .save {r7, lr}
; CHECK-M4F-NEXT:    push {r7, lr}
; CHECK-M4F-NEXT:    vmov.f32 s0, #1.000000e+00
; CHECK-M4F-NEXT:    vmov.f32 s1, #2.000000e+00
; CHECK-M4F-NEXT:    vmov.f32 s2, #3.000000e+00
; CHECK-M4F-NEXT:    bl test_3float
; CHECK-M4F-NEXT:    pop {r7, pc}
  call arm_aapcs_vfpcc void @test_3float({ float, float, float } { float 1.0, float 2.0, float 3.0 })
  ret void
}

define arm_aapcs_vfpcc void @test_1double({ double } %a) {
; CHECK-LABEL: test_1double:
; CHECK:       @ %bb.0:
; CHECK-NEXT:    .save {r11, lr}
; CHECK-NEXT:    push {r11, lr}
; CHECK-NEXT:    vmov.f64 d0, #1.000000e+00
; CHECK-NEXT:    bl test_1double
; CHECK-NEXT:    pop {r11, pc}
;
; CHECK-M4F-LABEL: test_1double:
; CHECK-M4F:       @ %bb.0:
; CHECK-M4F-NEXT:    .save {r7, lr}
; CHECK-M4F-NEXT:    push {r7, lr}
; CHECK-M4F-NEXT:    vldr d0, .LCPI3_0
; CHECK-M4F-NEXT:    bl test_1double
; CHECK-M4F-NEXT:    pop {r7, pc}
; CHECK-M4F-NEXT:    .p2align 3
; CHECK-M4F-NEXT:  @ %bb.1:
; CHECK-M4F-NEXT:  .LCPI3_0:
; CHECK-M4F-NEXT:    .long 0 @ double 1
; CHECK-M4F-NEXT:    .long 1072693248
  call arm_aapcs_vfpcc void @test_1double({ double } { double 1.0 })
  ret void
}

; Final double argument might be put in s15 & [sp] if we're careless. It should
; go all on the stack.
define arm_aapcs_vfpcc void @test_1double_nosplit([4 x float], [4 x double], [3 x float], double %a) {
; CHECK-LABEL: test_1double_nosplit:
; CHECK:       @ %bb.0:
; CHECK-NEXT:    .save {r11, lr}
; CHECK-NEXT:    push {r11, lr}
; CHECK-NEXT:    .pad #8
; CHECK-NEXT:    sub sp, sp, #8
; CHECK-NEXT:    vmov.f64 d16, #1.000000e+00
; CHECK-NEXT:    vstr d16, [sp]
; CHECK-NEXT:    bl test_1double_nosplit
; CHECK-NEXT:    add sp, sp, #8
; CHECK-NEXT:    pop {r11, pc}
;
; CHECK-M4F-LABEL: test_1double_nosplit:
; CHECK-M4F:       @ %bb.0:
; CHECK-M4F-NEXT:    .save {r7, lr}
; CHECK-M4F-NEXT:    push {r7, lr}
; CHECK-M4F-NEXT:    .pad #8
; CHECK-M4F-NEXT:    sub sp, #8
; CHECK-M4F-NEXT:    movs r0, #0
; CHECK-M4F-NEXT:    movt r0, #16368
; CHECK-M4F-NEXT:    movs r1, #0
; CHECK-M4F-NEXT:    strd r1, r0, [sp]
; CHECK-M4F-NEXT:    bl test_1double_nosplit
; CHECK-M4F-NEXT:    add sp, #8
; CHECK-M4F-NEXT:    pop {r7, pc}
  call arm_aapcs_vfpcc void @test_1double_nosplit([4 x float] undef, [4 x double] undef, [3 x float] undef, double 1.0)
  ret void
}

; Final double argument might go at [sp, #4] if we're careless. Should go at
; [sp, #8] to preserve alignment.
define arm_aapcs_vfpcc void @test_1double_misaligned([4 x double], [4 x double], float, double) {
; CHECK-LABEL: test_1double_misaligned:
; CHECK:       @ %bb.0:
; CHECK-NEXT:    .save {r11, lr}
; CHECK-NEXT:    push {r11, lr}
; CHECK-NEXT:    .pad #16
; CHECK-NEXT:    sub sp, sp, #16
; CHECK-NEXT:    vmov.f64 d16, #1.000000e+00
; CHECK-NEXT:    vstr d16, [sp, #8]
; CHECK-NEXT:    bl test_1double_misaligned
; CHECK-NEXT:    add sp, sp, #16
; CHECK-NEXT:    pop {r11, pc}
;
; CHECK-M4F-LABEL: test_1double_misaligned:
; CHECK-M4F:       @ %bb.0:
; CHECK-M4F-NEXT:    .save {r7, lr}
; CHECK-M4F-NEXT:    push {r7, lr}
; CHECK-M4F-NEXT:    .pad #16
; CHECK-M4F-NEXT:    sub sp, #16
; CHECK-M4F-NEXT:    movs r0, #0
; CHECK-M4F-NEXT:    movt r0, #16368
; CHECK-M4F-NEXT:    movs r1, #0
; CHECK-M4F-NEXT:    strd r1, r0, [sp, #8]
; CHECK-M4F-NEXT:    bl test_1double_misaligned
; CHECK-M4F-NEXT:    add sp, #16
; CHECK-M4F-NEXT:    pop {r7, pc}
  call arm_aapcs_vfpcc void @test_1double_misaligned([4 x double] undef, [4 x double] undef, float undef, double 1.0)

  ret void
}