; RUN: llc -mtriple=aarch64-none-linux-gnu -mattr=+sve -mattr=+bf16 < %s | FileCheck %s
; This file checks that unpredicated load/store instructions to locals
; use the right instructions and offsets.
; Data fills
define void @fill_nxv16i8() {
; CHECK-LABEL: fill_nxv16i8
; CHECK-DAG: ld1b { z{{[01]}}.b }, p0/z, [sp]
; CHECK-DAG: ld1b { z{{[01]}}.b }, p0/z, [sp, #1, mul vl]
%local0 = alloca <vscale x 16 x i8>
%local1 = alloca <vscale x 16 x i8>
load volatile <vscale x 16 x i8>, ptr %local0
load volatile <vscale x 16 x i8>, ptr %local1
ret void
}
define void @fill_nxv8i8() {
; CHECK-LABEL: fill_nxv8i8
; CHECK-DAG: ld1b { z{{[01]}}.h }, p0/z, [sp]
; CHECK-DAG: ld1b { z{{[01]}}.h }, p0/z, [sp, #1, mul vl]
%local0 = alloca <vscale x 8 x i8>
%local1 = alloca <vscale x 8 x i8>
load volatile <vscale x 8 x i8>, ptr %local0
load volatile <vscale x 8 x i8>, ptr %local1
ret void
}
define <vscale x 8 x i16> @fill_signed_nxv8i8() {
; CHECK-LABEL: fill_signed_nxv8i8
; CHECK-DAG: ld1sb { z{{[01]}}.h }, p0/z, [sp]
; CHECK-DAG: ld1sb { z{{[01]}}.h }, p0/z, [sp, #1, mul vl]
%local0 = alloca <vscale x 8 x i8>
%local1 = alloca <vscale x 8 x i8>
%a = load volatile <vscale x 8 x i8>, ptr %local0
%a_ext = sext <vscale x 8 x i8> %a to <vscale x 8 x i16>
%b = load volatile <vscale x 8 x i8>, ptr %local1
%b_ext = sext <vscale x 8 x i8> %b to <vscale x 8 x i16>
%sum = add <vscale x 8 x i16> %a_ext, %b_ext
ret <vscale x 8 x i16> %sum
}
define void @fill_nxv4i8() {
; CHECK-LABEL: fill_nxv4i8
; CHECK-DAG: ld1b { z{{[01]}}.s }, p0/z, [sp, #3, mul vl]
; CHECK-DAG: ld1b { z{{[01]}}.s }, p0/z, [sp, #2, mul vl]
%local0 = alloca <vscale x 4 x i8>
%local1 = alloca <vscale x 4 x i8>
load volatile <vscale x 4 x i8>, ptr %local0
load volatile <vscale x 4 x i8>, ptr %local1
ret void
}
define <vscale x 4 x i32> @fill_signed_nxv4i8() {
; CHECK-LABEL: fill_signed_nxv4i8
; CHECK-DAG: ld1sb { z{{[01]}}.s }, p0/z, [sp, #3, mul vl]
; CHECK-DAG: ld1sb { z{{[01]}}.s }, p0/z, [sp, #2, mul vl]
%local0 = alloca <vscale x 4 x i8>
%local1 = alloca <vscale x 4 x i8>
%a = load volatile <vscale x 4 x i8>, ptr %local0
%a_ext = sext <vscale x 4 x i8> %a to <vscale x 4 x i32>
%b = load volatile <vscale x 4 x i8>, ptr %local1
%b_ext = sext <vscale x 4 x i8> %b to <vscale x 4 x i32>
%sum = add <vscale x 4 x i32> %a_ext, %b_ext
ret <vscale x 4 x i32> %sum
}
define void @fill_nxv2i8() {
; CHECK-LABEL: fill_nxv2i8
; CHECK-DAG: ld1b { z{{[01]}}.d }, p0/z, [sp, #7, mul vl]
; CHECK-DAG: ld1b { z{{[01]}}.d }, p0/z, [sp, #6, mul vl]
%local0 = alloca <vscale x 2 x i8>
%local1 = alloca <vscale x 2 x i8>
load volatile <vscale x 2 x i8>, ptr %local0
load volatile <vscale x 2 x i8>, ptr %local1
ret void
}
define <vscale x 2 x i64> @fill_signed_nxv2i8() {
; CHECK-LABEL: fill_signed_nxv2i8
; CHECK-DAG: ld1sb { z{{[01]}}.d }, p0/z, [sp, #7, mul vl]
; CHECK-DAG: ld1sb { z{{[01]}}.d }, p0/z, [sp, #6, mul vl]
%local0 = alloca <vscale x 2 x i8>
%local1 = alloca <vscale x 2 x i8>
%a = load volatile <vscale x 2 x i8>, ptr %local0
%a_ext = sext <vscale x 2 x i8> %a to <vscale x 2 x i64>
%b = load volatile <vscale x 2 x i8>, ptr %local1
%b_ext = sext <vscale x 2 x i8> %b to <vscale x 2 x i64>
%sum = add <vscale x 2 x i64> %a_ext, %b_ext
ret <vscale x 2 x i64> %sum
}
define void @fill_nxv8i16() {
; CHECK-LABEL: fill_nxv8i16
; CHECK-DAG: ld1h { z{{[01]}}.h }, p0/z, [sp]
; CHECK-DAG: ld1h { z{{[01]}}.h }, p0/z, [sp, #1, mul vl]
%local0 = alloca <vscale x 8 x i16>
%local1 = alloca <vscale x 8 x i16>
load volatile <vscale x 8 x i16>, ptr %local0
load volatile <vscale x 8 x i16>, ptr %local1
ret void
}
define void @fill_nxv4i16() {
; CHECK-LABEL: fill_nxv4i16
; CHECK-DAG: ld1h { z{{[01]}}.s }, p0/z, [sp]
; CHECK-DAG: ld1h { z{{[01]}}.s }, p0/z, [sp, #1, mul vl]
%local0 = alloca <vscale x 4 x i16>
%local1 = alloca <vscale x 4 x i16>
load volatile <vscale x 4 x i16>, ptr %local0
load volatile <vscale x 4 x i16>, ptr %local1
ret void
}
define <vscale x 4 x i32> @fill_signed_nxv4i16() {
; CHECK-LABEL: fill_signed_nxv4i16
; CHECK-DAG: ld1sh { z{{[01]}}.s }, p0/z, [sp]
; CHECK-DAG: ld1sh { z{{[01]}}.s }, p0/z, [sp, #1, mul vl]
%local0 = alloca <vscale x 4 x i16>
%local1 = alloca <vscale x 4 x i16>
%a = load volatile <vscale x 4 x i16>, ptr %local0
%a_ext = sext <vscale x 4 x i16> %a to <vscale x 4 x i32>
%b = load volatile <vscale x 4 x i16>, ptr %local1
%b_ext = sext <vscale x 4 x i16> %b to <vscale x 4 x i32>
%sum = add <vscale x 4 x i32> %a_ext, %b_ext
ret <vscale x 4 x i32> %sum
}
define void @fill_nxv2i16() {
; CHECK-LABEL: fill_nxv2i16
; CHECK-DAG: ld1h { z{{[01]}}.d }, p0/z, [sp, #3, mul vl]
; CHECK-DAG: ld1h { z{{[01]}}.d }, p0/z, [sp, #2, mul vl]
%local0 = alloca <vscale x 2 x i16>
%local1 = alloca <vscale x 2 x i16>
load volatile <vscale x 2 x i16>, ptr %local0
load volatile <vscale x 2 x i16>, ptr %local1
ret void
}
define <vscale x 2 x i64> @fill_signed_nxv2i16() {
; CHECK-LABEL: fill_signed_nxv2i16
; CHECK-DAG: ld1sh { z{{[01]}}.d }, p0/z, [sp, #3, mul vl]
; CHECK-DAG: ld1sh { z{{[01]}}.d }, p0/z, [sp, #2, mul vl]
%local0 = alloca <vscale x 2 x i16>
%local1 = alloca <vscale x 2 x i16>
%a = load volatile <vscale x 2 x i16>, ptr %local0
%a_ext = sext <vscale x 2 x i16> %a to <vscale x 2 x i64>
%b = load volatile <vscale x 2 x i16>, ptr %local1
%b_ext = sext <vscale x 2 x i16> %b to <vscale x 2 x i64>
%sum = add <vscale x 2 x i64> %a_ext, %b_ext
ret <vscale x 2 x i64> %sum
}
define void @fill_nxv4i32() {
; CHECK-LABEL: fill_nxv4i32
; CHECK-DAG: ld1w { z{{[01]}}.s }, p0/z, [sp]
; CHECK-DAG: ld1w { z{{[01]}}.s }, p0/z, [sp, #1, mul vl]
%local0 = alloca <vscale x 4 x i32>
%local1 = alloca <vscale x 4 x i32>
load volatile <vscale x 4 x i32>, ptr %local0
load volatile <vscale x 4 x i32>, ptr %local1
ret void
}
define void @fill_nxv2i32() {
; CHECK-LABEL: fill_nxv2i32
; CHECK-DAG: ld1w { z{{[01]}}.d }, p0/z, [sp]
; CHECK-DAG: ld1w { z{{[01]}}.d }, p0/z, [sp, #1, mul vl]
%local0 = alloca <vscale x 2 x i32>
%local1 = alloca <vscale x 2 x i32>
load volatile <vscale x 2 x i32>, ptr %local0
load volatile <vscale x 2 x i32>, ptr %local1
ret void
}
define <vscale x 2 x i64> @fill_signed_nxv2i32() {
; CHECK-LABEL: fill_signed_nxv2i32
; CHECK-DAG: ld1sw { z{{[01]}}.d }, p0/z, [sp]
; CHECK-DAG: ld1sw { z{{[01]}}.d }, p0/z, [sp, #1, mul vl]
%local0 = alloca <vscale x 2 x i32>
%local1 = alloca <vscale x 2 x i32>
%a = load volatile <vscale x 2 x i32>, ptr %local0
%a_ext = sext <vscale x 2 x i32> %a to <vscale x 2 x i64>
%b = load volatile <vscale x 2 x i32>, ptr %local1
%b_ext = sext <vscale x 2 x i32> %b to <vscale x 2 x i64>
%sum = add <vscale x 2 x i64> %a_ext, %b_ext
ret <vscale x 2 x i64> %sum
}
define void @fill_nxv2i64() {
; CHECK-LABEL: fill_nxv2i64
; CHECK-DAG: ld1d { z{{[01]}}.d }, p0/z, [sp]
; CHECK-DAG: ld1d { z{{[01]}}.d }, p0/z, [sp, #1, mul vl]
%local0 = alloca <vscale x 2 x i64>
%local1 = alloca <vscale x 2 x i64>
load volatile <vscale x 2 x i64>, ptr %local0
load volatile <vscale x 2 x i64>, ptr %local1
ret void
}
define void @fill_nxv8bf16() {
; CHECK-LABEL: fill_nxv8bf16
; CHECK-DAG: ld1h { z{{[01]}}.h }, p0/z, [sp]
; CHECK-DAG: ld1h { z{{[01]}}.h }, p0/z, [sp, #1, mul vl]
%local0 = alloca <vscale x 8 x bfloat>
%local1 = alloca <vscale x 8 x bfloat>
load volatile <vscale x 8 x bfloat>, ptr %local0
load volatile <vscale x 8 x bfloat>, ptr %local1
ret void
}
define void @fill_nxv8f16() {
; CHECK-LABEL: fill_nxv8f16
; CHECK-DAG: ld1h { z{{[01]}}.h }, p0/z, [sp]
; CHECK-DAG: ld1h { z{{[01]}}.h }, p0/z, [sp, #1, mul vl]
%local0 = alloca <vscale x 8 x half>
%local1 = alloca <vscale x 8 x half>
load volatile <vscale x 8 x half>, ptr %local0
load volatile <vscale x 8 x half>, ptr %local1
ret void
}
define void @fill_nxv4f32() {
; CHECK-LABEL: fill_nxv4f32
; CHECK-DAG: ld1w { z{{[01]}}.s }, p0/z, [sp]
; CHECK-DAG: ld1w { z{{[01]}}.s }, p0/z, [sp, #1, mul vl]
%local0 = alloca <vscale x 4 x float>
%local1 = alloca <vscale x 4 x float>
load volatile <vscale x 4 x float>, ptr %local0
load volatile <vscale x 4 x float>, ptr %local1
ret void
}
define void @fill_nxv2f64() {
; CHECK-LABEL: fill_nxv2f64
; CHECK-DAG: ld1d { z{{[01]}}.d }, p0/z, [sp]
; CHECK-DAG: ld1d { z{{[01]}}.d }, p0/z, [sp, #1, mul vl]
%local0 = alloca <vscale x 2 x double>
%local1 = alloca <vscale x 2 x double>
load volatile <vscale x 2 x double>, ptr %local0
load volatile <vscale x 2 x double>, ptr %local1
ret void
}
; Data spills
define void @spill_nxv16i8(<vscale x 16 x i8> %v0, <vscale x 16 x i8> %v1) {
; CHECK-LABEL: spill_nxv16i8
; CHECK-DAG: st1b { z{{[01]}}.b }, p0, [sp]
; CHECK-DAG: st1b { z{{[01]}}.b }, p0, [sp, #1, mul vl]
%local0 = alloca <vscale x 16 x i8>
%local1 = alloca <vscale x 16 x i8>
store volatile <vscale x 16 x i8> %v0, ptr %local0
store volatile <vscale x 16 x i8> %v1, ptr %local1
ret void
}
define void @spill_nxv8i8(<vscale x 8 x i8> %v0, <vscale x 8 x i8> %v1) {
; CHECK-LABEL: spill_nxv8i8
; CHECK-DAG: st1b { z{{[01]}}.h }, p0, [sp]
; CHECK-DAG: st1b { z{{[01]}}.h }, p0, [sp, #1, mul vl]
%local0 = alloca <vscale x 8 x i8>
%local1 = alloca <vscale x 8 x i8>
store volatile <vscale x 8 x i8> %v0, ptr %local0
store volatile <vscale x 8 x i8> %v1, ptr %local1
ret void
}
define void @spill_nxv4i8(<vscale x 4 x i8> %v0, <vscale x 4 x i8> %v1) {
; CHECK-LABEL: spill_nxv4i8
; CHECK-DAG: st1b { z{{[01]}}.s }, p0, [sp, #3, mul vl]
; CHECK-DAG: st1b { z{{[01]}}.s }, p0, [sp, #2, mul vl]
%local0 = alloca <vscale x 4 x i8>
%local1 = alloca <vscale x 4 x i8>
store volatile <vscale x 4 x i8> %v0, ptr %local0
store volatile <vscale x 4 x i8> %v1, ptr %local1
ret void
}
define void @spill_nxv2i8(<vscale x 2 x i8> %v0, <vscale x 2 x i8> %v1) {
; CHECK-LABEL: spill_nxv2i8
; CHECK-DAG: st1b { z{{[01]}}.d }, p0, [sp, #7, mul vl]
; CHECK-DAG: st1b { z{{[01]}}.d }, p0, [sp, #6, mul vl]
%local0 = alloca <vscale x 2 x i8>
%local1 = alloca <vscale x 2 x i8>
store volatile <vscale x 2 x i8> %v0, ptr %local0
store volatile <vscale x 2 x i8> %v1, ptr %local1
ret void
}
define void @spill_nxv8i16(<vscale x 8 x i16> %v0, <vscale x 8 x i16> %v1) {
; CHECK-LABEL: spill_nxv8i16
; CHECK-DAG: st1h { z{{[01]}}.h }, p0, [sp]
; CHECK-DAG: st1h { z{{[01]}}.h }, p0, [sp, #1, mul vl]
%local0 = alloca <vscale x 8 x i16>
%local1 = alloca <vscale x 8 x i16>
store volatile <vscale x 8 x i16> %v0, ptr %local0
store volatile <vscale x 8 x i16> %v1, ptr %local1
ret void
}
define void @spill_nxv4i16(<vscale x 4 x i16> %v0, <vscale x 4 x i16> %v1) {
; CHECK-LABEL: spill_nxv4i16
; CHECK-DAG: st1h { z{{[01]}}.s }, p0, [sp]
; CHECK-DAG: st1h { z{{[01]}}.s }, p0, [sp, #1, mul vl]
%local0 = alloca <vscale x 4 x i16>
%local1 = alloca <vscale x 4 x i16>
store volatile <vscale x 4 x i16> %v0, ptr %local0
store volatile <vscale x 4 x i16> %v1, ptr %local1
ret void
}
define void @spill_nxv2i16(<vscale x 2 x i16> %v0, <vscale x 2 x i16> %v1) {
; CHECK-LABEL: spill_nxv2i16
; CHECK-DAG: st1h { z{{[01]}}.d }, p0, [sp, #3, mul vl]
; CHECK-DAG: st1h { z{{[01]}}.d }, p0, [sp, #2, mul vl]
%local0 = alloca <vscale x 2 x i16>
%local1 = alloca <vscale x 2 x i16>
store volatile <vscale x 2 x i16> %v0, ptr %local0
store volatile <vscale x 2 x i16> %v1, ptr %local1
ret void
}
define void @spill_nxv4i32(<vscale x 4 x i32> %v0, <vscale x 4 x i32> %v1) {
; CHECK-LABEL: spill_nxv4i32
; CHECK-DAG: st1w { z{{[01]}}.s }, p0, [sp]
; CHECK-DAG: st1w { z{{[01]}}.s }, p0, [sp, #1, mul vl]
%local0 = alloca <vscale x 4 x i32>
%local1 = alloca <vscale x 4 x i32>
store volatile <vscale x 4 x i32> %v0, ptr %local0
store volatile <vscale x 4 x i32> %v1, ptr %local1
ret void
}
define void @spill_nxv2i32(<vscale x 2 x i32> %v0, <vscale x 2 x i32> %v1) {
; CHECK-LABEL: spill_nxv2i32
; CHECK-DAG: st1w { z{{[01]}}.d }, p0, [sp]
; CHECK-DAG: st1w { z{{[01]}}.d }, p0, [sp, #1, mul vl]
%local0 = alloca <vscale x 2 x i32>
%local1 = alloca <vscale x 2 x i32>
store volatile <vscale x 2 x i32> %v0, ptr %local0
store volatile <vscale x 2 x i32> %v1, ptr %local1
ret void
}
define void @spill_nxv2i64(<vscale x 2 x i64> %v0, <vscale x 2 x i64> %v1) {
; CHECK-LABEL: spill_nxv2i64
; CHECK-DAG: st1d { z{{[01]}}.d }, p0, [sp]
; CHECK-DAG: st1d { z{{[01]}}.d }, p0, [sp, #1, mul vl]
%local0 = alloca <vscale x 2 x i64>
%local1 = alloca <vscale x 2 x i64>
store volatile <vscale x 2 x i64> %v0, ptr %local0
store volatile <vscale x 2 x i64> %v1, ptr %local1
ret void
}
define void @spill_nxv8f16(<vscale x 8 x half> %v0, <vscale x 8 x half> %v1) {
; CHECK-LABEL: spill_nxv8f16
; CHECK-DAG: st1h { z{{[01]}}.h }, p0, [sp]
; CHECK-DAG: st1h { z{{[01]}}.h }, p0, [sp, #1, mul vl]
%local0 = alloca <vscale x 8 x half>
%local1 = alloca <vscale x 8 x half>
store volatile <vscale x 8 x half> %v0, ptr %local0
store volatile <vscale x 8 x half> %v1, ptr %local1
ret void
}
define void @spill_nxv8bf16(<vscale x 8 x bfloat> %v0, <vscale x 8 x bfloat> %v1) {
; CHECK-LABEL: spill_nxv8bf16
; CHECK-DAG: st1h { z{{[01]}}.h }, p0, [sp]
; CHECK-DAG: st1h { z{{[01]}}.h }, p0, [sp, #1, mul vl]
%local0 = alloca <vscale x 8 x bfloat>
%local1 = alloca <vscale x 8 x bfloat>
store volatile <vscale x 8 x bfloat> %v0, ptr %local0
store volatile <vscale x 8 x bfloat> %v1, ptr %local1
ret void
}
define void @spill_nxv4f32(<vscale x 4 x float> %v0, <vscale x 4 x float> %v1) {
; CHECK-LABEL: spill_nxv4f32
; CHECK-DAG: st1w { z{{[01]}}.s }, p0, [sp]
; CHECK-DAG: st1w { z{{[01]}}.s }, p0, [sp, #1, mul vl]
%local0 = alloca <vscale x 4 x float>
%local1 = alloca <vscale x 4 x float>
store volatile <vscale x 4 x float> %v0, ptr %local0
store volatile <vscale x 4 x float> %v1, ptr %local1
ret void
}
define void @spill_nxv2f64(<vscale x 2 x double> %v0, <vscale x 2 x double> %v1) {
; CHECK-LABEL: spill_nxv2f64
; CHECK-DAG: st1d { z{{[01]}}.d }, p0, [sp]
; CHECK-DAG: st1d { z{{[01]}}.d }, p0, [sp, #1, mul vl]
%local0 = alloca <vscale x 2 x double>
%local1 = alloca <vscale x 2 x double>
store volatile <vscale x 2 x double> %v0, ptr %local0
store volatile <vscale x 2 x double> %v1, ptr %local1
ret void
}
; Predicate fills
define void @fill_nxv16i1() {
; CHECK-LABEL: fill_nxv16i1
; CHECK-DAG: ldr p{{[01]}}, [sp, #7, mul vl]
; CHECK-DAG: ldr p{{[01]}}, [sp, #6, mul vl]
%local0 = alloca <vscale x 16 x i1>
%local1 = alloca <vscale x 16 x i1>
load volatile <vscale x 16 x i1>, ptr %local0
load volatile <vscale x 16 x i1>, ptr %local1
ret void
}
; Predicate spills
define void @spill_nxv16i1(<vscale x 16 x i1> %v0, <vscale x 16 x i1> %v1) {
; CHECK-LABEL: spill_nxv16i1
; CHECK-DAG: str p{{[01]}}, [sp, #7, mul vl]
; CHECK-DAG: str p{{[01]}}, [sp, #6, mul vl]
%local0 = alloca <vscale x 16 x i1>
%local1 = alloca <vscale x 16 x i1>
store volatile <vscale x 16 x i1> %v0, ptr %local0
store volatile <vscale x 16 x i1> %v1, ptr %local1
ret void
}