; PR52927: Relaxed atomics can load to/store from fp regs directly
; RUN: llc < %s -mtriple=arm64-eabi -asm-verbose=false -verify-machineinstrs -mcpu=cyclone | FileCheck %s
define float @atomic_load_relaxed_f32(ptr %p, i32 %off32, i64 %off64) #0 {
; CHECK-LABEL: atomic_load_relaxed_f32:
  ; Four relaxed (monotonic/unordered) atomic float loads from %p, one per
  ; addressing form. The loaded values are summed so every load is used.

  ; Constant element index 4095 -> byte offset 16380 as an immediate.
  %addr.imm = getelementptr float, ptr %p, i32 4095
  %ld.imm = load atomic float, ptr %addr.imm monotonic, align 4
; CHECK: ldr {{s[0-9]+}}, [x0, #16380]

  ; 32-bit index register: expected to be sign-extended and scaled by 4.
  %addr.idx32 = getelementptr float, ptr %p, i32 %off32
  %ld.idx32 = load atomic float, ptr %addr.idx32 unordered, align 4
; CHECK: ldr {{s[0-9]+}}, [x0, w1, sxtw #2]
  %sum.a = fadd float %ld.imm, %ld.idx32

  ; 64-bit index register: expected to be shifted left by 2.
  %addr.idx64 = getelementptr float, ptr %p, i64 %off64
  %ld.idx64 = load atomic float, ptr %addr.idx64 monotonic, align 4
; CHECK: ldr {{s[0-9]+}}, [x0, x2, lsl #2]
  %sum.b = fadd float %sum.a, %ld.idx64

  ; Negative element index -64 -> byte offset -256 via the ldur form.
  %addr.neg = getelementptr float, ptr %p, i32 -64
  %ld.neg = load atomic float, ptr %addr.neg unordered, align 4
; CHECK: ldur {{s[0-9]+}}, [x0, #-256]
  %sum.c = fadd float %sum.b, %ld.neg

  ret float %sum.c
}
define double @atomic_load_relaxed_f64(ptr %p, i32 %off32, i64 %off64) #0 {
; CHECK-LABEL: atomic_load_relaxed_f64:
  ; Four relaxed (monotonic/unordered) atomic double loads from %p, one per
  ; addressing form. The loaded values are summed so every load is used.

  ; Constant element index 4095 -> byte offset 32760 as an immediate.
  %addr.imm = getelementptr double, ptr %p, i32 4095
  %ld.imm = load atomic double, ptr %addr.imm monotonic, align 8
; CHECK: ldr {{d[0-9]+}}, [x0, #32760]

  ; 32-bit index register: expected to be sign-extended and scaled by 8.
  %addr.idx32 = getelementptr double, ptr %p, i32 %off32
  %ld.idx32 = load atomic double, ptr %addr.idx32 unordered, align 8
; CHECK: ldr {{d[0-9]+}}, [x0, w1, sxtw #3]
  %sum.a = fadd double %ld.imm, %ld.idx32

  ; 64-bit index register: expected to be shifted left by 3.
  %addr.idx64 = getelementptr double, ptr %p, i64 %off64
  %ld.idx64 = load atomic double, ptr %addr.idx64 monotonic, align 8
; CHECK: ldr {{d[0-9]+}}, [x0, x2, lsl #3]
  %sum.b = fadd double %sum.a, %ld.idx64

  ; Negative element index -32 -> byte offset -256 via the ldur form.
  %addr.neg = getelementptr double, ptr %p, i32 -32
  %ld.neg = load atomic double, ptr %addr.neg unordered, align 8
; CHECK: ldur {{d[0-9]+}}, [x0, #-256]
  %sum.c = fadd double %sum.b, %ld.neg

  ret double %sum.c
}
define void @atomic_store_relaxed_f32(ptr %p, i32 %off32, i64 %off64, float %val) #0 {
; CHECK-LABEL: atomic_store_relaxed_f32:
  ; Stores %val four times with relaxed (monotonic/unordered) ordering, one
  ; store per addressing form; each is expected to come from an s register.

  ; Constant element index 4095 -> byte offset 16380 as an immediate.
  %addr.imm = getelementptr float, ptr %p, i32 4095
  store atomic float %val, ptr %addr.imm monotonic, align 4
; CHECK: str {{s[0-9]+}}, [x0, #16380]

  ; 32-bit index register: expected to be sign-extended and scaled by 4.
  %addr.idx32 = getelementptr float, ptr %p, i32 %off32
  store atomic float %val, ptr %addr.idx32 unordered, align 4
; CHECK: str {{s[0-9]+}}, [x0, w1, sxtw #2]

  ; 64-bit index register: expected to be shifted left by 2.
  %addr.idx64 = getelementptr float, ptr %p, i64 %off64
  store atomic float %val, ptr %addr.idx64 monotonic, align 4
; CHECK: str {{s[0-9]+}}, [x0, x2, lsl #2]

  ; Negative element index -64 -> byte offset -256 via the stur form.
  %addr.neg = getelementptr float, ptr %p, i32 -64
  store atomic float %val, ptr %addr.neg unordered, align 4
; CHECK: stur {{s[0-9]+}}, [x0, #-256]

  ret void
}
define void @atomic_store_relaxed_f64(ptr %p, i32 %off32, i64 %off64, double %val) #0 {
; CHECK-LABEL: atomic_store_relaxed_f64:
  ; Stores %val four times with relaxed (monotonic/unordered) ordering, one
  ; store per addressing form; each is expected to come from a d register.

  ; Constant element index 4095 -> byte offset 32760 as an immediate.
  %addr.imm = getelementptr double, ptr %p, i32 4095
  store atomic double %val, ptr %addr.imm monotonic, align 8
; CHECK: str {{d[0-9]+}}, [x0, #32760]

  ; 32-bit index register: expected to be sign-extended and scaled by 8.
  %addr.idx32 = getelementptr double, ptr %p, i32 %off32
  store atomic double %val, ptr %addr.idx32 unordered, align 8
; CHECK: str {{d[0-9]+}}, [x0, w1, sxtw #3]

  ; 64-bit index register: expected to be shifted left by 3.
  %addr.idx64 = getelementptr double, ptr %p, i64 %off64
  store atomic double %val, ptr %addr.idx64 unordered, align 8
; CHECK: str {{d[0-9]+}}, [x0, x2, lsl #3]

  ; Negative element index -32 -> byte offset -256 via the stur form.
  %addr.neg = getelementptr double, ptr %p, i32 -32
  store atomic double %val, ptr %addr.neg monotonic, align 8
; CHECK: stur {{d[0-9]+}}, [x0, #-256]

  ret void
}
define half @atomic_load_relaxed_f16(ptr %p, i32 %off32, i64 %off64) #0 {
; CHECK-LABEL: atomic_load_relaxed_f16:
  ; Four relaxed (monotonic/unordered) atomic half loads from %p, one per
  ; addressing form. The expected patterns below match halfword loads into
  ; w registers (ldrh/ldurh). The values are summed so every load is used.

  ; Constant element index 4095 -> byte offset 8190 as an immediate.
  %addr.imm = getelementptr half, ptr %p, i32 4095
  %ld.imm = load atomic half, ptr %addr.imm monotonic, align 4
; CHECK: ldrh {{w[0-9]+}}, [x0, #8190]

  ; 32-bit index register: expected to be sign-extended and scaled by 2.
  %addr.idx32 = getelementptr half, ptr %p, i32 %off32
  %ld.idx32 = load atomic half, ptr %addr.idx32 unordered, align 4
; CHECK: ldrh {{w[0-9]+}}, [x0, w1, sxtw #1]
  %sum.a = fadd half %ld.imm, %ld.idx32

  ; 64-bit index register: expected to be shifted left by 1.
  %addr.idx64 = getelementptr half, ptr %p, i64 %off64
  %ld.idx64 = load atomic half, ptr %addr.idx64 monotonic, align 4
; CHECK: ldrh {{w[0-9]+}}, [x0, x2, lsl #1]
  %sum.b = fadd half %sum.a, %ld.idx64

  ; Negative element index -64 -> byte offset -128 via the ldurh form.
  %addr.neg = getelementptr half, ptr %p, i32 -64
  %ld.neg = load atomic half, ptr %addr.neg unordered, align 4
; CHECK: ldurh {{w[0-9]+}}, [x0, #-128]
  %sum.c = fadd half %sum.b, %ld.neg

  ret half %sum.c
}
define bfloat @atomic_load_relaxed_bf16(ptr %p, i32 %off32, i64 %off64) #0 {
; CHECK-LABEL: atomic_load_relaxed_bf16:
  ; Four relaxed (monotonic/unordered) atomic bfloat loads from %p, one per
  ; addressing form. The expected patterns below match halfword loads into
  ; w registers (ldrh/ldurh). The values are summed so every load is used.

  ; Constant element index 4095 -> byte offset 8190 as an immediate.
  %addr.imm = getelementptr bfloat, ptr %p, i32 4095
  %ld.imm = load atomic bfloat, ptr %addr.imm monotonic, align 4
; CHECK: ldrh {{w[0-9]+}}, [x0, #8190]

  ; 32-bit index register: expected to be sign-extended and scaled by 2.
  %addr.idx32 = getelementptr bfloat, ptr %p, i32 %off32
  %ld.idx32 = load atomic bfloat, ptr %addr.idx32 unordered, align 4
; CHECK: ldrh {{w[0-9]+}}, [x0, w1, sxtw #1]
  %sum.a = fadd bfloat %ld.imm, %ld.idx32

  ; 64-bit index register: expected to be shifted left by 1.
  %addr.idx64 = getelementptr bfloat, ptr %p, i64 %off64
  %ld.idx64 = load atomic bfloat, ptr %addr.idx64 monotonic, align 4
; CHECK: ldrh {{w[0-9]+}}, [x0, x2, lsl #1]
  %sum.b = fadd bfloat %sum.a, %ld.idx64

  ; Negative element index -64 -> byte offset -128 via the ldurh form.
  %addr.neg = getelementptr bfloat, ptr %p, i32 -64
  %ld.neg = load atomic bfloat, ptr %addr.neg unordered, align 4
; CHECK: ldurh {{w[0-9]+}}, [x0, #-128]
  %sum.c = fadd bfloat %sum.b, %ld.neg

  ret bfloat %sum.c
}
define void @atomic_store_relaxed_f16(ptr %p, i32 %off32, i64 %off64, half %val) #0 {
; CHECK-LABEL: atomic_store_relaxed_f16:
  ; Stores %val four times with relaxed (monotonic/unordered) ordering, one
  ; store per addressing form. The expected patterns below match halfword
  ; stores from w registers (strh/sturh).

  ; Constant element index 4095 -> byte offset 8190 as an immediate.
  %addr.imm = getelementptr half, ptr %p, i32 4095
  store atomic half %val, ptr %addr.imm monotonic, align 4
; CHECK: strh {{w[0-9]+}}, [x0, #8190]

  ; 32-bit index register: expected to be sign-extended and scaled by 2.
  %addr.idx32 = getelementptr half, ptr %p, i32 %off32
  store atomic half %val, ptr %addr.idx32 unordered, align 4
; CHECK: strh {{w[0-9]+}}, [x0, w1, sxtw #1]

  ; 64-bit index register: expected to be shifted left by 1.
  %addr.idx64 = getelementptr half, ptr %p, i64 %off64
  store atomic half %val, ptr %addr.idx64 monotonic, align 4
; CHECK: strh {{w[0-9]+}}, [x0, x2, lsl #1]

  ; Negative element index -64 -> byte offset -128 via the sturh form.
  %addr.neg = getelementptr half, ptr %p, i32 -64
  store atomic half %val, ptr %addr.neg unordered, align 4
; CHECK: sturh {{w[0-9]+}}, [x0, #-128]

  ret void
}
define void @atomic_store_relaxed_bf16(ptr %p, i32 %off32, i64 %off64, bfloat %val) #0 {
; CHECK-LABEL: atomic_store_relaxed_bf16:
  ; Stores %val four times with relaxed (monotonic/unordered) ordering, one
  ; store per addressing form. The expected patterns below match halfword
  ; stores from w registers (strh/sturh).

  ; Constant element index 4095 -> byte offset 8190 as an immediate.
  %addr.imm = getelementptr bfloat, ptr %p, i32 4095
  store atomic bfloat %val, ptr %addr.imm monotonic, align 4
; CHECK: strh {{w[0-9]+}}, [x0, #8190]

  ; 32-bit index register: expected to be sign-extended and scaled by 2.
  %addr.idx32 = getelementptr bfloat, ptr %p, i32 %off32
  store atomic bfloat %val, ptr %addr.idx32 unordered, align 4
; CHECK: strh {{w[0-9]+}}, [x0, w1, sxtw #1]

  ; 64-bit index register: expected to be shifted left by 1.
  %addr.idx64 = getelementptr bfloat, ptr %p, i64 %off64
  store atomic bfloat %val, ptr %addr.idx64 monotonic, align 4
; CHECK: strh {{w[0-9]+}}, [x0, x2, lsl #1]

  ; Negative element index -64 -> byte offset -128 via the sturh form.
  %addr.neg = getelementptr bfloat, ptr %p, i32 -64
  store atomic bfloat %val, ptr %addr.neg unordered, align 4
; CHECK: sturh {{w[0-9]+}}, [x0, #-128]

  ret void
}
; Attribute group #0 is referenced by each test function defined in this file
; as shown here; it marks them nounwind.
attributes #0 = { nounwind }