; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
; RUN: llc -mtriple=aarch64 -mcpu=apple-m1 -mattr=+store-pair-suppress -o - %s | FileCheck --check-prefix=SUPPRESS %s
; RUN: llc -mtriple=aarch64 -mcpu=apple-m1 -mattr=-store-pair-suppress -o - %s | FileCheck --check-prefix=NOSUPPRESS %s
define void @vector_units_critial(ptr %dst, <8 x i32> %v0) {
; SUPPRESS-LABEL: vector_units_critial:
; SUPPRESS: // %bb.0: // %entry
; SUPPRESS-NEXT: uzp1 v0.8h, v0.8h, v1.8h
; SUPPRESS-NEXT: xtn v0.8b, v0.8h
; SUPPRESS-NEXT: mul v1.8b, v0.8b, v0.8b
; SUPPRESS-NEXT: str d1, [x0, #8]
; SUPPRESS-NEXT: str d0, [x0]
; SUPPRESS-NEXT: ret
;
; NOSUPPRESS-LABEL: vector_units_critial:
; NOSUPPRESS: // %bb.0: // %entry
; NOSUPPRESS-NEXT: uzp1 v0.8h, v0.8h, v1.8h
; NOSUPPRESS-NEXT: xtn v0.8b, v0.8h
; NOSUPPRESS-NEXT: mul v1.8b, v0.8b, v0.8b
; NOSUPPRESS-NEXT: stp d0, d1, [x0]
; NOSUPPRESS-NEXT: ret
entry:
%add.ptr.1 = getelementptr i8, ptr %dst, i64 8
%t = trunc <8 x i32> %v0 to <8 x i8>
%mul = mul <8 x i8> %t, %t
store <8 x i8> %mul, ptr %add.ptr.1, align 1
store <8 x i8> %t, ptr %dst, align 1
ret void
}
%struct.widget = type { float, float }
define void @load_store_units_critical(ptr %arg, ptr noundef %arg1, i64 noundef %arg2, i64 noundef %arg3) {
; SUPPRESS-LABEL: load_store_units_critical:
; SUPPRESS: // %bb.0: // %bb
; SUPPRESS-NEXT: ldr x8, [x0, #8]
; SUPPRESS-NEXT: ldp s0, s1, [x8]
; SUPPRESS-NEXT: add x8, x1, x2, lsl #3
; SUPPRESS-NEXT: ldp s2, s3, [x8]
; SUPPRESS-NEXT: ldp s4, s5, [x8, #8]
; SUPPRESS-NEXT: fmul s6, s5, s1
; SUPPRESS-NEXT: fmul s1, s4, s1
; SUPPRESS-NEXT: fnmsub s4, s4, s0, s6
; SUPPRESS-NEXT: fmadd s0, s5, s0, s1
; SUPPRESS-NEXT: fadd s1, s4, s2
; SUPPRESS-NEXT: fadd s5, s0, s3
; SUPPRESS-NEXT: stp s1, s5, [x8]
; SUPPRESS-NEXT: fsub s2, s2, s4
; SUPPRESS-NEXT: fsub s0, s3, s0
; SUPPRESS-NEXT: stp s2, s0, [x8, #8]
; SUPPRESS-NEXT: ldr x9, [x0, #8]
; SUPPRESS-NEXT: ldp s3, s4, [x9]
; SUPPRESS-NEXT: ldp s6, s7, [x8, #16]
; SUPPRESS-NEXT: ldp s16, s17, [x8, #24]
; SUPPRESS-NEXT: fmul s18, s17, s4
; SUPPRESS-NEXT: fmul s4, s16, s4
; SUPPRESS-NEXT: fnmsub s16, s16, s3, s18
; SUPPRESS-NEXT: fmadd s3, s17, s3, s4
; SUPPRESS-NEXT: fadd s4, s16, s6
; SUPPRESS-NEXT: fadd s17, s3, s7
; SUPPRESS-NEXT: stp s4, s17, [x8, #16]
; SUPPRESS-NEXT: fsub s6, s6, s16
; SUPPRESS-NEXT: fsub s3, s7, s3
; SUPPRESS-NEXT: stp s6, s3, [x8, #24]
; SUPPRESS-NEXT: ldr x9, [x0, #8]
; SUPPRESS-NEXT: ldp s7, s16, [x9]
; SUPPRESS-NEXT: fmul s18, s16, s17
; SUPPRESS-NEXT: fmul s17, s7, s17
; SUPPRESS-NEXT: fnmsub s7, s7, s4, s18
; SUPPRESS-NEXT: fmadd s4, s16, s4, s17
; SUPPRESS-NEXT: fadd s16, s7, s1
; SUPPRESS-NEXT: fadd s17, s4, s5
; SUPPRESS-NEXT: stp s16, s17, [x8]
; SUPPRESS-NEXT: fsub s1, s1, s7
; SUPPRESS-NEXT: fsub s4, s5, s4
; SUPPRESS-NEXT: stp s1, s4, [x8, #16]
; SUPPRESS-NEXT: ldr x10, [x0, #8]
; SUPPRESS-NEXT: lsl x9, x3, #4
; SUPPRESS-NEXT: add x10, x10, x9
; SUPPRESS-NEXT: ldp s1, s4, [x10]
; SUPPRESS-NEXT: fmul s5, s4, s3
; SUPPRESS-NEXT: fmul s3, s1, s3
; SUPPRESS-NEXT: fnmsub s1, s1, s6, s5
; SUPPRESS-NEXT: fmadd s3, s4, s6, s3
; SUPPRESS-NEXT: fadd s4, s1, s2
; SUPPRESS-NEXT: fadd s5, s3, s0
; SUPPRESS-NEXT: stp s4, s5, [x8, #8]
; SUPPRESS-NEXT: fsub s1, s2, s1
; SUPPRESS-NEXT: fsub s0, s0, s3
; SUPPRESS-NEXT: stp s1, s0, [x8, #24]
; SUPPRESS-NEXT: ldr x10, [x0, #8]
; SUPPRESS-NEXT: ldp s0, s1, [x10]
; SUPPRESS-NEXT: ldp s2, s3, [x8, #32]
; SUPPRESS-NEXT: ldp s4, s5, [x8, #40]
; SUPPRESS-NEXT: fmul s6, s5, s1
; SUPPRESS-NEXT: fmul s1, s4, s1
; SUPPRESS-NEXT: fnmsub s4, s4, s0, s6
; SUPPRESS-NEXT: fmadd s0, s5, s0, s1
; SUPPRESS-NEXT: fadd s1, s4, s2
; SUPPRESS-NEXT: fadd s5, s0, s3
; SUPPRESS-NEXT: stp s1, s5, [x8, #32]
; SUPPRESS-NEXT: fsub s2, s2, s4
; SUPPRESS-NEXT: fsub s3, s3, s0
; SUPPRESS-NEXT: stp s2, s3, [x8, #40]
; SUPPRESS-NEXT: ldr x10, [x0, #8]
; SUPPRESS-NEXT: ldp s0, s4, [x10]
; SUPPRESS-NEXT: ldp s6, s7, [x8, #48]
; SUPPRESS-NEXT: ldp s16, s17, [x8, #56]
; SUPPRESS-NEXT: fmul s18, s17, s4
; SUPPRESS-NEXT: fmul s4, s16, s4
; SUPPRESS-NEXT: fnmsub s16, s16, s0, s18
; SUPPRESS-NEXT: fmadd s0, s17, s0, s4
; SUPPRESS-NEXT: fadd s4, s16, s6
; SUPPRESS-NEXT: fadd s17, s0, s7
; SUPPRESS-NEXT: stp s4, s17, [x8, #48]
; SUPPRESS-NEXT: fsub s6, s6, s16
; SUPPRESS-NEXT: fsub s0, s7, s0
; SUPPRESS-NEXT: stp s6, s0, [x8, #56]
; SUPPRESS-NEXT: ldr x10, [x0, #8]
; SUPPRESS-NEXT: ldp s7, s16, [x10]
; SUPPRESS-NEXT: fmul s18, s16, s17
; SUPPRESS-NEXT: fmul s17, s7, s17
; SUPPRESS-NEXT: fnmsub s7, s7, s4, s18
; SUPPRESS-NEXT: fmadd s4, s16, s4, s17
; SUPPRESS-NEXT: fadd s16, s7, s1
; SUPPRESS-NEXT: fadd s17, s4, s5
; SUPPRESS-NEXT: stp s16, s17, [x8, #32]
; SUPPRESS-NEXT: fsub s7, s1, s7
; SUPPRESS-NEXT: fsub s4, s5, s4
; SUPPRESS-NEXT: stp s7, s4, [x8, #48]
; SUPPRESS-NEXT: ldr x10, [x0, #8]
; SUPPRESS-NEXT: add x9, x10, x9
; SUPPRESS-NEXT: ldp s1, s5, [x9]
; SUPPRESS-NEXT: fmul s18, s5, s0
; SUPPRESS-NEXT: fmul s0, s1, s0
; SUPPRESS-NEXT: fnmsub s1, s1, s6, s18
; SUPPRESS-NEXT: fmadd s5, s5, s6, s0
; SUPPRESS-NEXT: fadd s6, s1, s2
; SUPPRESS-NEXT: fadd s18, s5, s3
; SUPPRESS-NEXT: stp s6, s18, [x8, #40]
; SUPPRESS-NEXT: fsub s0, s2, s1
; SUPPRESS-NEXT: fsub s1, s3, s5
; SUPPRESS-NEXT: stp s0, s1, [x8, #56]
; SUPPRESS-NEXT: ldr x9, [x0, #8]
; SUPPRESS-NEXT: ldp s2, s3, [x9]
; SUPPRESS-NEXT: ldp s5, s19, [x8]
; SUPPRESS-NEXT: fmul s20, s17, s3
; SUPPRESS-NEXT: fmul s3, s16, s3
; SUPPRESS-NEXT: fnmsub s16, s16, s2, s20
; SUPPRESS-NEXT: fmadd s2, s17, s2, s3
; SUPPRESS-NEXT: fadd s3, s16, s5
; SUPPRESS-NEXT: fadd s17, s2, s19
; SUPPRESS-NEXT: stp s3, s17, [x8]
; SUPPRESS-NEXT: fsub s3, s5, s16
; SUPPRESS-NEXT: fsub s2, s19, s2
; SUPPRESS-NEXT: stp s3, s2, [x8, #32]
; SUPPRESS-NEXT: ldr x9, [x0, #8]
; SUPPRESS-NEXT: add x9, x9, w3, sxtw #3
; SUPPRESS-NEXT: ldp s2, s3, [x9]
; SUPPRESS-NEXT: ldp s5, s16, [x8, #8]
; SUPPRESS-NEXT: fmul s17, s18, s3
; SUPPRESS-NEXT: fmul s3, s6, s3
; SUPPRESS-NEXT: fnmsub s6, s6, s2, s17
; SUPPRESS-NEXT: fmadd s2, s18, s2, s3
; SUPPRESS-NEXT: fadd s3, s6, s5
; SUPPRESS-NEXT: fadd s17, s2, s16
; SUPPRESS-NEXT: stp s3, s17, [x8, #8]
; SUPPRESS-NEXT: fsub s3, s5, s6
; SUPPRESS-NEXT: fsub s2, s16, s2
; SUPPRESS-NEXT: stp s3, s2, [x8, #40]
; SUPPRESS-NEXT: lsl x9, x3, #33
; SUPPRESS-NEXT: ldr x10, [x0, #8]
; SUPPRESS-NEXT: add x9, x10, x9, asr #29
; SUPPRESS-NEXT: ldp s2, s3, [x9]
; SUPPRESS-NEXT: ldp s5, s6, [x8, #16]
; SUPPRESS-NEXT: fmul s16, s4, s3
; SUPPRESS-NEXT: fmul s3, s7, s3
; SUPPRESS-NEXT: fnmsub s7, s7, s2, s16
; SUPPRESS-NEXT: fmadd s2, s4, s2, s3
; SUPPRESS-NEXT: fadd s3, s7, s5
; SUPPRESS-NEXT: fadd s4, s2, s6
; SUPPRESS-NEXT: stp s3, s4, [x8, #16]
; SUPPRESS-NEXT: fsub s3, s5, s7
; SUPPRESS-NEXT: fsub s2, s6, s2
; SUPPRESS-NEXT: stp s3, s2, [x8, #48]
; SUPPRESS-NEXT: add w9, w3, w3, lsl #1
; SUPPRESS-NEXT: ldr x10, [x0, #8]
; SUPPRESS-NEXT: add x9, x10, w9, sxtw #3
; SUPPRESS-NEXT: ldp s2, s3, [x9]
; SUPPRESS-NEXT: ldp s4, s5, [x8, #24]
; SUPPRESS-NEXT: fmul s6, s1, s3
; SUPPRESS-NEXT: fmul s3, s0, s3
; SUPPRESS-NEXT: fnmsub s0, s0, s2, s6
; SUPPRESS-NEXT: fmadd s1, s1, s2, s3
; SUPPRESS-NEXT: fadd s2, s0, s4
; SUPPRESS-NEXT: fadd s3, s1, s5
; SUPPRESS-NEXT: stp s2, s3, [x8, #24]
; SUPPRESS-NEXT: fsub s0, s4, s0
; SUPPRESS-NEXT: fsub s1, s5, s1
; SUPPRESS-NEXT: stp s0, s1, [x8, #56]
; SUPPRESS-NEXT: ret
;
; NOSUPPRESS-LABEL: load_store_units_critical:
; NOSUPPRESS: // %bb.0: // %bb
; NOSUPPRESS-NEXT: ldr x8, [x0, #8]
; NOSUPPRESS-NEXT: ldp s0, s1, [x8]
; NOSUPPRESS-NEXT: add x8, x1, x2, lsl #3
; NOSUPPRESS-NEXT: ldp s2, s3, [x8]
; NOSUPPRESS-NEXT: ldp s4, s5, [x8, #8]
; NOSUPPRESS-NEXT: fmul s6, s5, s1
; NOSUPPRESS-NEXT: fmul s1, s4, s1
; NOSUPPRESS-NEXT: fnmsub s4, s4, s0, s6
; NOSUPPRESS-NEXT: fmadd s0, s5, s0, s1
; NOSUPPRESS-NEXT: fadd s1, s4, s2
; NOSUPPRESS-NEXT: fadd s5, s0, s3
; NOSUPPRESS-NEXT: stp s1, s5, [x8]
; NOSUPPRESS-NEXT: fsub s2, s2, s4
; NOSUPPRESS-NEXT: fsub s0, s3, s0
; NOSUPPRESS-NEXT: stp s2, s0, [x8, #8]
; NOSUPPRESS-NEXT: ldr x9, [x0, #8]
; NOSUPPRESS-NEXT: ldp s3, s4, [x9]
; NOSUPPRESS-NEXT: ldp s6, s7, [x8, #16]
; NOSUPPRESS-NEXT: ldp s16, s17, [x8, #24]
; NOSUPPRESS-NEXT: fmul s18, s17, s4
; NOSUPPRESS-NEXT: fmul s4, s16, s4
; NOSUPPRESS-NEXT: fnmsub s16, s16, s3, s18
; NOSUPPRESS-NEXT: fmadd s3, s17, s3, s4
; NOSUPPRESS-NEXT: fadd s4, s16, s6
; NOSUPPRESS-NEXT: fadd s17, s3, s7
; NOSUPPRESS-NEXT: stp s4, s17, [x8, #16]
; NOSUPPRESS-NEXT: fsub s6, s6, s16
; NOSUPPRESS-NEXT: fsub s3, s7, s3
; NOSUPPRESS-NEXT: stp s6, s3, [x8, #24]
; NOSUPPRESS-NEXT: ldr x9, [x0, #8]
; NOSUPPRESS-NEXT: ldp s7, s16, [x9]
; NOSUPPRESS-NEXT: fmul s18, s16, s17
; NOSUPPRESS-NEXT: fmul s17, s7, s17
; NOSUPPRESS-NEXT: fnmsub s7, s7, s4, s18
; NOSUPPRESS-NEXT: fmadd s4, s16, s4, s17
; NOSUPPRESS-NEXT: fadd s16, s7, s1
; NOSUPPRESS-NEXT: fadd s17, s4, s5
; NOSUPPRESS-NEXT: stp s16, s17, [x8]
; NOSUPPRESS-NEXT: fsub s1, s1, s7
; NOSUPPRESS-NEXT: fsub s4, s5, s4
; NOSUPPRESS-NEXT: stp s1, s4, [x8, #16]
; NOSUPPRESS-NEXT: ldr x10, [x0, #8]
; NOSUPPRESS-NEXT: lsl x9, x3, #4
; NOSUPPRESS-NEXT: add x10, x10, x9
; NOSUPPRESS-NEXT: ldp s1, s4, [x10]
; NOSUPPRESS-NEXT: fmul s5, s4, s3
; NOSUPPRESS-NEXT: fmul s3, s1, s3
; NOSUPPRESS-NEXT: fnmsub s1, s1, s6, s5
; NOSUPPRESS-NEXT: fmadd s3, s4, s6, s3
; NOSUPPRESS-NEXT: fadd s4, s1, s2
; NOSUPPRESS-NEXT: fadd s5, s3, s0
; NOSUPPRESS-NEXT: stp s4, s5, [x8, #8]
; NOSUPPRESS-NEXT: fsub s1, s2, s1
; NOSUPPRESS-NEXT: fsub s0, s0, s3
; NOSUPPRESS-NEXT: stp s1, s0, [x8, #24]
; NOSUPPRESS-NEXT: ldr x10, [x0, #8]
; NOSUPPRESS-NEXT: ldp s0, s1, [x10]
; NOSUPPRESS-NEXT: ldp s2, s3, [x8, #32]
; NOSUPPRESS-NEXT: ldp s4, s5, [x8, #40]
; NOSUPPRESS-NEXT: fmul s6, s5, s1
; NOSUPPRESS-NEXT: fmul s1, s4, s1
; NOSUPPRESS-NEXT: fnmsub s4, s4, s0, s6
; NOSUPPRESS-NEXT: fmadd s0, s5, s0, s1
; NOSUPPRESS-NEXT: fadd s1, s4, s2
; NOSUPPRESS-NEXT: fadd s5, s0, s3
; NOSUPPRESS-NEXT: stp s1, s5, [x8, #32]
; NOSUPPRESS-NEXT: fsub s2, s2, s4
; NOSUPPRESS-NEXT: fsub s3, s3, s0
; NOSUPPRESS-NEXT: stp s2, s3, [x8, #40]
; NOSUPPRESS-NEXT: ldr x10, [x0, #8]
; NOSUPPRESS-NEXT: ldp s0, s4, [x10]
; NOSUPPRESS-NEXT: ldp s6, s7, [x8, #48]
; NOSUPPRESS-NEXT: ldp s16, s17, [x8, #56]
; NOSUPPRESS-NEXT: fmul s18, s17, s4
; NOSUPPRESS-NEXT: fmul s4, s16, s4
; NOSUPPRESS-NEXT: fnmsub s16, s16, s0, s18
; NOSUPPRESS-NEXT: fmadd s0, s17, s0, s4
; NOSUPPRESS-NEXT: fadd s4, s16, s6
; NOSUPPRESS-NEXT: fadd s17, s0, s7
; NOSUPPRESS-NEXT: stp s4, s17, [x8, #48]
; NOSUPPRESS-NEXT: fsub s6, s6, s16
; NOSUPPRESS-NEXT: fsub s0, s7, s0
; NOSUPPRESS-NEXT: stp s6, s0, [x8, #56]
; NOSUPPRESS-NEXT: ldr x10, [x0, #8]
; NOSUPPRESS-NEXT: ldp s7, s16, [x10]
; NOSUPPRESS-NEXT: fmul s18, s16, s17
; NOSUPPRESS-NEXT: fmul s17, s7, s17
; NOSUPPRESS-NEXT: fnmsub s7, s7, s4, s18
; NOSUPPRESS-NEXT: fmadd s4, s16, s4, s17
; NOSUPPRESS-NEXT: fadd s16, s7, s1
; NOSUPPRESS-NEXT: fadd s17, s4, s5
; NOSUPPRESS-NEXT: stp s16, s17, [x8, #32]
; NOSUPPRESS-NEXT: fsub s7, s1, s7
; NOSUPPRESS-NEXT: fsub s4, s5, s4
; NOSUPPRESS-NEXT: stp s7, s4, [x8, #48]
; NOSUPPRESS-NEXT: ldr x10, [x0, #8]
; NOSUPPRESS-NEXT: add x9, x10, x9
; NOSUPPRESS-NEXT: ldp s1, s5, [x9]
; NOSUPPRESS-NEXT: fmul s18, s5, s0
; NOSUPPRESS-NEXT: fmul s0, s1, s0
; NOSUPPRESS-NEXT: fnmsub s1, s1, s6, s18
; NOSUPPRESS-NEXT: fmadd s5, s5, s6, s0
; NOSUPPRESS-NEXT: fadd s6, s1, s2
; NOSUPPRESS-NEXT: fadd s18, s5, s3
; NOSUPPRESS-NEXT: stp s6, s18, [x8, #40]
; NOSUPPRESS-NEXT: fsub s0, s2, s1
; NOSUPPRESS-NEXT: fsub s1, s3, s5
; NOSUPPRESS-NEXT: stp s0, s1, [x8, #56]
; NOSUPPRESS-NEXT: ldr x9, [x0, #8]
; NOSUPPRESS-NEXT: ldp s2, s3, [x9]
; NOSUPPRESS-NEXT: ldp s5, s19, [x8]
; NOSUPPRESS-NEXT: fmul s20, s17, s3
; NOSUPPRESS-NEXT: fmul s3, s16, s3
; NOSUPPRESS-NEXT: fnmsub s16, s16, s2, s20
; NOSUPPRESS-NEXT: fmadd s2, s17, s2, s3
; NOSUPPRESS-NEXT: fadd s3, s16, s5
; NOSUPPRESS-NEXT: fadd s17, s2, s19
; NOSUPPRESS-NEXT: stp s3, s17, [x8]
; NOSUPPRESS-NEXT: fsub s3, s5, s16
; NOSUPPRESS-NEXT: fsub s2, s19, s2
; NOSUPPRESS-NEXT: stp s3, s2, [x8, #32]
; NOSUPPRESS-NEXT: ldr x9, [x0, #8]
; NOSUPPRESS-NEXT: add x9, x9, w3, sxtw #3
; NOSUPPRESS-NEXT: ldp s2, s3, [x9]
; NOSUPPRESS-NEXT: ldp s5, s16, [x8, #8]
; NOSUPPRESS-NEXT: fmul s17, s18, s3
; NOSUPPRESS-NEXT: fmul s3, s6, s3
; NOSUPPRESS-NEXT: fnmsub s6, s6, s2, s17
; NOSUPPRESS-NEXT: fmadd s2, s18, s2, s3
; NOSUPPRESS-NEXT: fadd s3, s6, s5
; NOSUPPRESS-NEXT: fadd s17, s2, s16
; NOSUPPRESS-NEXT: stp s3, s17, [x8, #8]
; NOSUPPRESS-NEXT: fsub s3, s5, s6
; NOSUPPRESS-NEXT: fsub s2, s16, s2
; NOSUPPRESS-NEXT: stp s3, s2, [x8, #40]
; NOSUPPRESS-NEXT: lsl x9, x3, #33
; NOSUPPRESS-NEXT: ldr x10, [x0, #8]
; NOSUPPRESS-NEXT: add x9, x10, x9, asr #29
; NOSUPPRESS-NEXT: ldp s2, s3, [x9]
; NOSUPPRESS-NEXT: ldp s5, s6, [x8, #16]
; NOSUPPRESS-NEXT: fmul s16, s4, s3
; NOSUPPRESS-NEXT: fmul s3, s7, s3
; NOSUPPRESS-NEXT: fnmsub s7, s7, s2, s16
; NOSUPPRESS-NEXT: fmadd s2, s4, s2, s3
; NOSUPPRESS-NEXT: fadd s3, s7, s5
; NOSUPPRESS-NEXT: fadd s4, s2, s6
; NOSUPPRESS-NEXT: stp s3, s4, [x8, #16]
; NOSUPPRESS-NEXT: fsub s3, s5, s7
; NOSUPPRESS-NEXT: fsub s2, s6, s2
; NOSUPPRESS-NEXT: stp s3, s2, [x8, #48]
; NOSUPPRESS-NEXT: add w9, w3, w3, lsl #1
; NOSUPPRESS-NEXT: ldr x10, [x0, #8]
; NOSUPPRESS-NEXT: add x9, x10, w9, sxtw #3
; NOSUPPRESS-NEXT: ldp s2, s3, [x9]
; NOSUPPRESS-NEXT: ldp s4, s5, [x8, #24]
; NOSUPPRESS-NEXT: fmul s6, s1, s3
; NOSUPPRESS-NEXT: fmul s3, s0, s3
; NOSUPPRESS-NEXT: fnmsub s0, s0, s2, s6
; NOSUPPRESS-NEXT: fmadd s1, s1, s2, s3
; NOSUPPRESS-NEXT: fadd s2, s0, s4
; NOSUPPRESS-NEXT: fadd s3, s1, s5
; NOSUPPRESS-NEXT: stp s2, s3, [x8, #24]
; NOSUPPRESS-NEXT: fsub s0, s4, s0
; NOSUPPRESS-NEXT: fsub s1, s5, s1
; NOSUPPRESS-NEXT: stp s0, s1, [x8, #56]
; NOSUPPRESS-NEXT: ret
bb:
%shl = shl i64 %arg3, 1
%getelementptr = getelementptr inbounds i8, ptr %arg, i64 8
%load = load ptr, ptr %getelementptr, align 8
%load4 = load float, ptr %load, align 4
%getelementptr5 = getelementptr inbounds i8, ptr %load, i64 4
%load6 = load float, ptr %getelementptr5, align 4
%getelementptr7 = getelementptr %struct.widget, ptr %arg1, i64 %arg2
%load8 = load float, ptr %getelementptr7, align 4
%getelementptr9 = getelementptr inbounds i8, ptr %getelementptr7, i64 4
%load10 = load float, ptr %getelementptr9, align 4
%getelementptr11 = getelementptr i8, ptr %getelementptr7, i64 8
%load12 = load float, ptr %getelementptr11, align 4
%getelementptr13 = getelementptr i8, ptr %getelementptr7, i64 12
%load14 = load float, ptr %getelementptr13, align 4
%fmul = fmul fast float %load12, %load4
%fmul15 = fmul fast float %load14, %load6
%fmul16 = fmul fast float %load14, %load4
%fmul17 = fmul fast float %load12, %load6
%fsub = fsub fast float %fmul, %fmul15
%fadd = fadd fast float %fmul16, %fmul17
%fadd18 = fadd fast float %fsub, %load8
%fadd19 = fadd fast float %fadd, %load10
store float %fadd18, ptr %getelementptr7, align 4
store float %fadd19, ptr %getelementptr9, align 4
%fsub20 = fsub fast float %load8, %fsub
%fsub21 = fsub fast float %load10, %fadd
store float %fsub20, ptr %getelementptr11, align 4
store float %fsub21, ptr %getelementptr13, align 4
%load22 = load ptr, ptr %getelementptr, align 8
%load23 = load float, ptr %load22, align 4
%getelementptr24 = getelementptr inbounds i8, ptr %load22, i64 4
%load25 = load float, ptr %getelementptr24, align 4
%getelementptr26 = getelementptr i8, ptr %getelementptr7, i64 16
%load27 = load float, ptr %getelementptr26, align 4
%getelementptr28 = getelementptr i8, ptr %getelementptr7, i64 20
%load29 = load float, ptr %getelementptr28, align 4
%getelementptr30 = getelementptr i8, ptr %getelementptr7, i64 24
%load31 = load float, ptr %getelementptr30, align 4
%getelementptr32 = getelementptr i8, ptr %getelementptr7, i64 28
%load33 = load float, ptr %getelementptr32, align 4
%fmul34 = fmul fast float %load31, %load23
%fmul35 = fmul fast float %load33, %load25
%fmul36 = fmul fast float %load33, %load23
%fmul37 = fmul fast float %load31, %load25
%fsub38 = fsub fast float %fmul34, %fmul35
%fadd39 = fadd fast float %fmul36, %fmul37
%fadd40 = fadd fast float %fsub38, %load27
%fadd41 = fadd fast float %fadd39, %load29
store float %fadd40, ptr %getelementptr26, align 4
store float %fadd41, ptr %getelementptr28, align 4
%fsub42 = fsub fast float %load27, %fsub38
%fsub43 = fsub fast float %load29, %fadd39
store float %fsub42, ptr %getelementptr30, align 4
store float %fsub43, ptr %getelementptr32, align 4
%load44 = load ptr, ptr %getelementptr, align 8
%load45 = load float, ptr %load44, align 4
%getelementptr46 = getelementptr inbounds i8, ptr %load44, i64 4
%load47 = load float, ptr %getelementptr46, align 4
%fmul48 = fmul fast float %load45, %fadd40
%fmul49 = fmul fast float %load47, %fadd41
%fmul50 = fmul fast float %load45, %fadd41
%fmul51 = fmul fast float %load47, %fadd40
%fsub52 = fsub fast float %fmul48, %fmul49
%fadd53 = fadd fast float %fmul51, %fmul50
%fadd54 = fadd fast float %fsub52, %fadd18
%fadd55 = fadd fast float %fadd53, %fadd19
store float %fadd54, ptr %getelementptr7, align 4
store float %fadd55, ptr %getelementptr9, align 4
%fsub56 = fsub fast float %fadd18, %fsub52
%fsub57 = fsub fast float %fadd19, %fadd53
store float %fsub56, ptr %getelementptr26, align 4
store float %fsub57, ptr %getelementptr28, align 4
%load58 = load ptr, ptr %getelementptr, align 8
%getelementptr59 = getelementptr inbounds %struct.widget, ptr %load58, i64 %shl
%load60 = load float, ptr %getelementptr59, align 4
%getelementptr61 = getelementptr inbounds i8, ptr %getelementptr59, i64 4
%load62 = load float, ptr %getelementptr61, align 4
%fmul63 = fmul fast float %load60, %fsub42
%fmul64 = fmul fast float %load62, %fsub43
%fmul65 = fmul fast float %load60, %fsub43
%fmul66 = fmul fast float %load62, %fsub42
%fsub67 = fsub fast float %fmul63, %fmul64
%fadd68 = fadd fast float %fmul66, %fmul65
%fadd69 = fadd fast float %fsub67, %fsub20
%fadd70 = fadd fast float %fadd68, %fsub21
store float %fadd69, ptr %getelementptr11, align 4
store float %fadd70, ptr %getelementptr13, align 4
%fsub71 = fsub fast float %fsub20, %fsub67
%fsub72 = fsub fast float %fsub21, %fadd68
store float %fsub71, ptr %getelementptr30, align 4
store float %fsub72, ptr %getelementptr32, align 4
%load73 = load ptr, ptr %getelementptr, align 8
%load74 = load float, ptr %load73, align 4
%getelementptr75 = getelementptr inbounds i8, ptr %load73, i64 4
%load76 = load float, ptr %getelementptr75, align 4
%getelementptr77 = getelementptr i8, ptr %getelementptr7, i64 32
%load78 = load float, ptr %getelementptr77, align 4
%getelementptr79 = getelementptr i8, ptr %getelementptr7, i64 36
%load80 = load float, ptr %getelementptr79, align 4
%getelementptr81 = getelementptr i8, ptr %getelementptr7, i64 40
%load82 = load float, ptr %getelementptr81, align 4
%getelementptr83 = getelementptr i8, ptr %getelementptr7, i64 44
%load84 = load float, ptr %getelementptr83, align 4
%fmul85 = fmul fast float %load82, %load74
%fmul86 = fmul fast float %load84, %load76
%fmul87 = fmul fast float %load84, %load74
%fmul88 = fmul fast float %load82, %load76
%fsub89 = fsub fast float %fmul85, %fmul86
%fadd90 = fadd fast float %fmul87, %fmul88
%fadd91 = fadd fast float %fsub89, %load78
%fadd92 = fadd fast float %fadd90, %load80
store float %fadd91, ptr %getelementptr77, align 4
store float %fadd92, ptr %getelementptr79, align 4
%fsub93 = fsub fast float %load78, %fsub89
%fsub94 = fsub fast float %load80, %fadd90
store float %fsub93, ptr %getelementptr81, align 4
store float %fsub94, ptr %getelementptr83, align 4
%load95 = load ptr, ptr %getelementptr, align 8
%load96 = load float, ptr %load95, align 4
%getelementptr97 = getelementptr inbounds i8, ptr %load95, i64 4
%load98 = load float, ptr %getelementptr97, align 4
%getelementptr99 = getelementptr i8, ptr %getelementptr7, i64 48
%load100 = load float, ptr %getelementptr99, align 4
%getelementptr101 = getelementptr i8, ptr %getelementptr7, i64 52
%load102 = load float, ptr %getelementptr101, align 4
%getelementptr103 = getelementptr i8, ptr %getelementptr7, i64 56
%load104 = load float, ptr %getelementptr103, align 4
%getelementptr105 = getelementptr i8, ptr %getelementptr7, i64 60
%load106 = load float, ptr %getelementptr105, align 4
%fmul107 = fmul fast float %load104, %load96
%fmul108 = fmul fast float %load106, %load98
%fmul109 = fmul fast float %load106, %load96
%fmul110 = fmul fast float %load104, %load98
%fsub111 = fsub fast float %fmul107, %fmul108
%fadd112 = fadd fast float %fmul109, %fmul110
%fadd113 = fadd fast float %fsub111, %load100
%fadd114 = fadd fast float %fadd112, %load102
store float %fadd113, ptr %getelementptr99, align 4
store float %fadd114, ptr %getelementptr101, align 4
%fsub115 = fsub fast float %load100, %fsub111
%fsub116 = fsub fast float %load102, %fadd112
store float %fsub115, ptr %getelementptr103, align 4
store float %fsub116, ptr %getelementptr105, align 4
%load117 = load ptr, ptr %getelementptr, align 8
%load118 = load float, ptr %load117, align 4
%getelementptr119 = getelementptr inbounds i8, ptr %load117, i64 4
%load120 = load float, ptr %getelementptr119, align 4
%fmul121 = fmul fast float %load118, %fadd113
%fmul122 = fmul fast float %load120, %fadd114
%fmul123 = fmul fast float %load118, %fadd114
%fmul124 = fmul fast float %load120, %fadd113
%fsub125 = fsub fast float %fmul121, %fmul122
%fadd126 = fadd fast float %fmul124, %fmul123
%fadd127 = fadd fast float %fsub125, %fadd91
%fadd128 = fadd fast float %fadd126, %fadd92
store float %fadd127, ptr %getelementptr77, align 4
store float %fadd128, ptr %getelementptr79, align 4
%fsub129 = fsub fast float %fadd91, %fsub125
%fsub130 = fsub fast float %fadd92, %fadd126
store float %fsub129, ptr %getelementptr99, align 4
store float %fsub130, ptr %getelementptr101, align 4
%load131 = load ptr, ptr %getelementptr, align 8
%getelementptr132 = getelementptr inbounds %struct.widget, ptr %load131, i64 %shl
%load133 = load float, ptr %getelementptr132, align 4
%getelementptr134 = getelementptr inbounds i8, ptr %getelementptr132, i64 4
%load135 = load float, ptr %getelementptr134, align 4
%fmul136 = fmul fast float %load133, %fsub115
%fmul137 = fmul fast float %load135, %fsub116
%fmul138 = fmul fast float %load133, %fsub116
%fmul139 = fmul fast float %load135, %fsub115
%fsub140 = fsub fast float %fmul136, %fmul137
%fadd141 = fadd fast float %fmul139, %fmul138
%fadd142 = fadd fast float %fsub140, %fsub93
%fadd143 = fadd fast float %fadd141, %fsub94
store float %fadd142, ptr %getelementptr81, align 4
store float %fadd143, ptr %getelementptr83, align 4
%fsub144 = fsub fast float %fsub93, %fsub140
%fsub145 = fsub fast float %fsub94, %fadd141
store float %fsub144, ptr %getelementptr103, align 4
store float %fsub145, ptr %getelementptr105, align 4
%load146 = load ptr, ptr %getelementptr, align 8
%load147 = load float, ptr %load146, align 4
%getelementptr148 = getelementptr inbounds i8, ptr %load146, i64 4
%load149 = load float, ptr %getelementptr148, align 4
%load150 = load float, ptr %getelementptr7, align 4
%load151 = load float, ptr %getelementptr9, align 4
%fmul152 = fmul fast float %fadd127, %load147
%fmul153 = fmul fast float %fadd128, %load149
%fmul154 = fmul fast float %fadd128, %load147
%fmul155 = fmul fast float %fadd127, %load149
%fsub156 = fsub fast float %fmul152, %fmul153
%fadd157 = fadd fast float %fmul154, %fmul155
%fadd158 = fadd fast float %fsub156, %load150
%fadd159 = fadd fast float %fadd157, %load151
store float %fadd158, ptr %getelementptr7, align 4
store float %fadd159, ptr %getelementptr9, align 4
%fsub160 = fsub fast float %load150, %fsub156
%fsub161 = fsub fast float %load151, %fadd157
store float %fsub160, ptr %getelementptr77, align 4
store float %fsub161, ptr %getelementptr79, align 4
%shl162 = shl i64 %arg3, 32
%ashr = ashr exact i64 %shl162, 32
%load163 = load ptr, ptr %getelementptr, align 8
%getelementptr164 = getelementptr inbounds %struct.widget, ptr %load163, i64 %ashr
%load165 = load float, ptr %getelementptr164, align 4
%getelementptr166 = getelementptr inbounds i8, ptr %getelementptr164, i64 4
%load167 = load float, ptr %getelementptr166, align 4
%load168 = load float, ptr %getelementptr11, align 4
%getelementptr169 = getelementptr i8, ptr %getelementptr7, i64 12
%load170 = load float, ptr %getelementptr169, align 4
%getelementptr171 = getelementptr i8, ptr %getelementptr7, i64 40
%getelementptr172 = getelementptr i8, ptr %getelementptr7, i64 44
%fmul173 = fmul fast float %fadd142, %load165
%fmul174 = fmul fast float %fadd143, %load167
%fmul175 = fmul fast float %fadd143, %load165
%fmul176 = fmul fast float %fadd142, %load167
%fsub177 = fsub fast float %fmul173, %fmul174
%fadd178 = fadd fast float %fmul175, %fmul176
%fadd179 = fadd fast float %fsub177, %load168
%fadd180 = fadd fast float %fadd178, %load170
store float %fadd179, ptr %getelementptr11, align 4
store float %fadd180, ptr %getelementptr169, align 4
%fsub181 = fsub fast float %load168, %fsub177
%fsub182 = fsub fast float %load170, %fadd178
store float %fsub181, ptr %getelementptr171, align 4
store float %fsub182, ptr %getelementptr172, align 4
%shl183 = shl i64 %arg3, 33
%ashr184 = ashr exact i64 %shl183, 32
%load185 = load ptr, ptr %getelementptr, align 8
%getelementptr186 = getelementptr inbounds %struct.widget, ptr %load185, i64 %ashr184
%load187 = load float, ptr %getelementptr186, align 4
%getelementptr188 = getelementptr inbounds i8, ptr %getelementptr186, i64 4
%load189 = load float, ptr %getelementptr188, align 4
%load190 = load float, ptr %getelementptr26, align 4
%getelementptr191 = getelementptr i8, ptr %getelementptr7, i64 20
%load192 = load float, ptr %getelementptr191, align 4
%getelementptr193 = getelementptr i8, ptr %getelementptr7, i64 48
%getelementptr194 = getelementptr i8, ptr %getelementptr7, i64 52
%fmul195 = fmul fast float %fsub129, %load187
%fmul196 = fmul fast float %fsub130, %load189
%fmul197 = fmul fast float %fsub130, %load187
%fmul198 = fmul fast float %fsub129, %load189
%fsub199 = fsub fast float %fmul195, %fmul196
%fadd200 = fadd fast float %fmul197, %fmul198
%fadd201 = fadd fast float %fsub199, %load190
%fadd202 = fadd fast float %fadd200, %load192
store float %fadd201, ptr %getelementptr26, align 4
store float %fadd202, ptr %getelementptr191, align 4
%fsub203 = fsub fast float %load190, %fsub199
%fsub204 = fsub fast float %load192, %fadd200
store float %fsub203, ptr %getelementptr193, align 4
store float %fsub204, ptr %getelementptr194, align 4
%add = add i64 %ashr184, %arg3
%shl205 = shl i64 %add, 32
%ashr206 = ashr exact i64 %shl205, 32
%load207 = load ptr, ptr %getelementptr, align 8
%getelementptr208 = getelementptr inbounds %struct.widget, ptr %load207, i64 %ashr206
%load209 = load float, ptr %getelementptr208, align 4
%getelementptr210 = getelementptr inbounds i8, ptr %getelementptr208, i64 4
%load211 = load float, ptr %getelementptr210, align 4
%load212 = load float, ptr %getelementptr30, align 4
%getelementptr213 = getelementptr i8, ptr %getelementptr7, i64 28
%load214 = load float, ptr %getelementptr213, align 4
%getelementptr215 = getelementptr i8, ptr %getelementptr7, i64 56
%getelementptr216 = getelementptr i8, ptr %getelementptr7, i64 60
%fmul217 = fmul fast float %fsub144, %load209
%fmul218 = fmul fast float %fsub145, %load211
%fmul219 = fmul fast float %fsub145, %load209
%fmul220 = fmul fast float %fsub144, %load211
%fsub221 = fsub fast float %fmul217, %fmul218
%fadd222 = fadd fast float %fmul219, %fmul220
%fadd223 = fadd fast float %fsub221, %load212
%fadd224 = fadd fast float %fadd222, %load214
store float %fadd223, ptr %getelementptr30, align 4
store float %fadd224, ptr %getelementptr213, align 4
%fsub225 = fsub fast float %load212, %fsub221
%fsub226 = fsub fast float %load214, %fadd222
store float %fsub225, ptr %getelementptr215, align 4
store float %fsub226, ptr %getelementptr216, align 4
ret void
}