llvm/llvm/test/CodeGen/AArch64/sve2-sli-sri.ll

; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py UTC_ARGS: --version 4
; RUN: llc -mtriple=aarch64 -mattr=+sve < %s -o - | FileCheck --check-prefixes=CHECK,SVE %s
; RUN: llc -mtriple=aarch64 -mattr=+sve2 < %s -o - | FileCheck --check-prefixes=CHECK,SVE2 %s

define <vscale x 16 x i8> @testLeftGood16x8(<vscale x 16 x i8> %src1, <vscale x 16 x i8> %src2) {
; SVE-LABEL: testLeftGood16x8:
; SVE:       // %bb.0:
; SVE-NEXT:    and z0.b, z0.b, #0x7
; SVE-NEXT:    lsl z1.b, z1.b, #3
; SVE-NEXT:    orr z0.d, z0.d, z1.d
; SVE-NEXT:    ret
;
; SVE2-LABEL: testLeftGood16x8:
; SVE2:       // %bb.0:
; SVE2-NEXT:    sli z0.b, z1.b, #3
; SVE2-NEXT:    ret
  %and.i = and <vscale x 16 x i8> %src1, splat(i8 7)
  %vshl_n = shl <vscale x 16 x i8> %src2, splat(i8 3)
  %result = or <vscale x 16 x i8> %and.i, %vshl_n
  ret <vscale x 16 x i8> %result
}

define <vscale x 16 x i8> @testLeftBad16x8(<vscale x 16 x i8> %src1, <vscale x 16 x i8> %src2) {
; CHECK-LABEL: testLeftBad16x8:
; CHECK:       // %bb.0:
; CHECK-NEXT:    mov z2.b, #-91 // =0xffffffffffffffa5
; CHECK-NEXT:    lsl z1.b, z1.b, #1
; CHECK-NEXT:    and z0.d, z0.d, z2.d
; CHECK-NEXT:    orr z0.d, z0.d, z1.d
; CHECK-NEXT:    ret
  %and.i = and <vscale x 16 x i8> %src1, splat(i8 165)
  %vshl_n = shl <vscale x 16 x i8> %src2, splat(i8 1)
  %result = or <vscale x 16 x i8> %and.i, %vshl_n
  ret <vscale x 16 x i8> %result
}

define <vscale x 16 x i8> @testRightGood16x8(<vscale x 16 x i8> %src1, <vscale x 16 x i8> %src2) {
; SVE-LABEL: testRightGood16x8:
; SVE:       // %bb.0:
; SVE-NEXT:    and z0.b, z0.b, #0xe0
; SVE-NEXT:    lsr z1.b, z1.b, #3
; SVE-NEXT:    orr z0.d, z0.d, z1.d
; SVE-NEXT:    ret
;
; SVE2-LABEL: testRightGood16x8:
; SVE2:       // %bb.0:
; SVE2-NEXT:    sri z0.b, z1.b, #3
; SVE2-NEXT:    ret
  %and.i = and <vscale x 16 x i8> %src1, splat(i8 224)
  %vshl_n = lshr <vscale x 16 x i8> %src2, splat(i8 3)
  %result = or <vscale x 16 x i8> %and.i, %vshl_n
  ret <vscale x 16 x i8> %result
}

define <vscale x 16 x i8> @testRightBad16x8(<vscale x 16 x i8> %src1, <vscale x 16 x i8> %src2) {
; CHECK-LABEL: testRightBad16x8:
; CHECK:       // %bb.0:
; CHECK-NEXT:    mov z2.b, #-91 // =0xffffffffffffffa5
; CHECK-NEXT:    lsr z1.b, z1.b, #1
; CHECK-NEXT:    and z0.d, z0.d, z2.d
; CHECK-NEXT:    orr z0.d, z0.d, z1.d
; CHECK-NEXT:    ret
  %and.i = and <vscale x 16 x i8> %src1, splat(i8 165)
  %vshl_n = lshr <vscale x 16 x i8> %src2, splat(i8 1)
  %result = or <vscale x 16 x i8> %and.i, %vshl_n
  ret <vscale x 16 x i8> %result
}

define <vscale x 8 x i16> @testLeftGood8x16(<vscale x 8 x i16> %src1, <vscale x 8 x i16> %src2) {
; SVE-LABEL: testLeftGood8x16:
; SVE:       // %bb.0:
; SVE-NEXT:    and z0.h, z0.h, #0x3fff
; SVE-NEXT:    lsl z1.h, z1.h, #14
; SVE-NEXT:    orr z0.d, z0.d, z1.d
; SVE-NEXT:    ret
;
; SVE2-LABEL: testLeftGood8x16:
; SVE2:       // %bb.0:
; SVE2-NEXT:    sli z0.h, z1.h, #14
; SVE2-NEXT:    ret
  %and.i = and <vscale x 8 x i16> %src1, splat(i16 16383)
  %vshl_n = shl <vscale x 8 x i16> %src2, splat(i16 14)
  %result = or <vscale x 8 x i16> %and.i, %vshl_n
  ret <vscale x 8 x i16> %result
}

define <vscale x 8 x i16> @testLeftBad8x16(<vscale x 8 x i16> %src1, <vscale x 8 x i16> %src2) {
; CHECK-LABEL: testLeftBad8x16:
; CHECK:       // %bb.0:
; CHECK-NEXT:    mov w8, #16500 // =0x4074
; CHECK-NEXT:    lsl z1.h, z1.h, #14
; CHECK-NEXT:    mov z2.h, w8
; CHECK-NEXT:    and z0.d, z0.d, z2.d
; CHECK-NEXT:    orr z0.d, z0.d, z1.d
; CHECK-NEXT:    ret
  %and.i = and <vscale x 8 x i16> %src1, splat(i16 16500)
  %vshl_n = shl <vscale x 8 x i16> %src2, splat(i16 14)
  %result = or <vscale x 8 x i16> %and.i, %vshl_n
  ret <vscale x 8 x i16> %result
}

define <vscale x 8 x i16> @testRightGood8x16(<vscale x 8 x i16> %src1, <vscale x 8 x i16> %src2) {
; SVE-LABEL: testRightGood8x16:
; SVE:       // %bb.0:
; SVE-NEXT:    and z0.h, z0.h, #0xfffc
; SVE-NEXT:    lsr z1.h, z1.h, #14
; SVE-NEXT:    orr z0.d, z0.d, z1.d
; SVE-NEXT:    ret
;
; SVE2-LABEL: testRightGood8x16:
; SVE2:       // %bb.0:
; SVE2-NEXT:    sri z0.h, z1.h, #14
; SVE2-NEXT:    ret
  %and.i = and <vscale x 8 x i16> %src1, splat(i16 65532)
  %vshl_n = lshr <vscale x 8 x i16> %src2, splat(i16 14)
  %result = or <vscale x 8 x i16> %and.i, %vshl_n
  ret <vscale x 8 x i16> %result
}

define <vscale x 8 x i16> @testRightBad8x16(<vscale x 8 x i16> %src1, <vscale x 8 x i16> %src2) {
; CHECK-LABEL: testRightBad8x16:
; CHECK:       // %bb.0:
; CHECK-NEXT:    mov w8, #16500 // =0x4074
; CHECK-NEXT:    lsr z1.h, z1.h, #14
; CHECK-NEXT:    mov z2.h, w8
; CHECK-NEXT:    and z0.d, z0.d, z2.d
; CHECK-NEXT:    orr z0.d, z0.d, z1.d
; CHECK-NEXT:    ret
  %and.i = and <vscale x 8 x i16> %src1, splat(i16 16500)
  %vshl_n = lshr <vscale x 8 x i16> %src2, splat(i16 14)
  %result = or <vscale x 8 x i16> %and.i, %vshl_n
  ret <vscale x 8 x i16> %result
}

define <vscale x 4 x i32> @testLeftGood4x32(<vscale x 4 x i32> %src1, <vscale x 4 x i32> %src2) {
; SVE-LABEL: testLeftGood4x32:
; SVE:       // %bb.0:
; SVE-NEXT:    and z0.s, z0.s, #0x3fffff
; SVE-NEXT:    lsl z1.s, z1.s, #22
; SVE-NEXT:    orr z0.d, z0.d, z1.d
; SVE-NEXT:    ret
;
; SVE2-LABEL: testLeftGood4x32:
; SVE2:       // %bb.0:
; SVE2-NEXT:    sli z0.s, z1.s, #22
; SVE2-NEXT:    ret
  %and.i = and <vscale x 4 x i32> %src1, splat(i32 4194303)
  %vshl_n = shl <vscale x 4 x i32> %src2, splat(i32 22)
  %result = or <vscale x 4 x i32> %and.i, %vshl_n
  ret <vscale x 4 x i32> %result
}

define <vscale x 4 x i32> @testLeftBad4x32(<vscale x 4 x i32> %src1, <vscale x 4 x i32> %src2) {
; CHECK-LABEL: testLeftBad4x32:
; CHECK:       // %bb.0:
; CHECK-NEXT:    and z0.s, z0.s, #0x3ffffc
; CHECK-NEXT:    lsl z1.s, z1.s, #22
; CHECK-NEXT:    orr z0.d, z0.d, z1.d
; CHECK-NEXT:    ret
  %and.i = and <vscale x 4 x i32> %src1, splat(i32 4194300)
  %vshl_n = shl <vscale x 4 x i32> %src2, splat(i32 22)
  %result = or <vscale x 4 x i32> %and.i, %vshl_n
  ret <vscale x 4 x i32> %result
}

define <vscale x 4 x i32> @testRightGood4x32(<vscale x 4 x i32> %src1, <vscale x 4 x i32> %src2) {
; SVE-LABEL: testRightGood4x32:
; SVE:       // %bb.0:
; SVE-NEXT:    and z0.s, z0.s, #0xfffffc00
; SVE-NEXT:    lsr z1.s, z1.s, #22
; SVE-NEXT:    orr z0.d, z0.d, z1.d
; SVE-NEXT:    ret
;
; SVE2-LABEL: testRightGood4x32:
; SVE2:       // %bb.0:
; SVE2-NEXT:    sri z0.s, z1.s, #22
; SVE2-NEXT:    ret
  %and.i = and <vscale x 4 x i32> %src1, splat(i32 4294966272)
  %vshl_n = lshr <vscale x 4 x i32> %src2, splat(i32 22)
  %result = or <vscale x 4 x i32> %and.i, %vshl_n
  ret <vscale x 4 x i32> %result
}

define <vscale x 4 x i32> @testRightBad4x32(<vscale x 4 x i32> %src1, <vscale x 4 x i32> %src2) {
; CHECK-LABEL: testRightBad4x32:
; CHECK:       // %bb.0:
; CHECK-NEXT:    and z0.s, z0.s, #0x3ffffc
; CHECK-NEXT:    lsr z1.s, z1.s, #22
; CHECK-NEXT:    orr z0.d, z0.d, z1.d
; CHECK-NEXT:    ret
  %and.i = and <vscale x 4 x i32> %src1, splat(i32 4194300)
  %vshl_n = lshr <vscale x 4 x i32> %src2, splat(i32 22)
  %result = or <vscale x 4 x i32> %and.i, %vshl_n
  ret <vscale x 4 x i32> %result
}

define <vscale x 2 x i64> @testLeftGood2x64(<vscale x 2 x i64> %src1, <vscale x 2 x i64> %src2) {
; SVE-LABEL: testLeftGood2x64:
; SVE:       // %bb.0:
; SVE-NEXT:    and z0.d, z0.d, #0xffffffffffff
; SVE-NEXT:    lsl z1.d, z1.d, #48
; SVE-NEXT:    orr z0.d, z0.d, z1.d
; SVE-NEXT:    ret
;
; SVE2-LABEL: testLeftGood2x64:
; SVE2:       // %bb.0:
; SVE2-NEXT:    sli z0.d, z1.d, #48
; SVE2-NEXT:    ret
  %and.i = and <vscale x 2 x i64> %src1, splat(i64 281474976710655)
  %vshl_n = shl <vscale x 2 x i64> %src2, splat(i64 48)
  %result = or <vscale x 2 x i64> %and.i, %vshl_n
  ret <vscale x 2 x i64> %result
}

define <vscale x 2 x i64> @testLeftBad2x64(<vscale x 2 x i64> %src1, <vscale x 2 x i64> %src2) {
; CHECK-LABEL: testLeftBad2x64:
; CHECK:       // %bb.0:
; CHECK-NEXT:    mov x8, #10 // =0xa
; CHECK-NEXT:    lsl z1.d, z1.d, #48
; CHECK-NEXT:    movk x8, #1, lsl #48
; CHECK-NEXT:    mov z2.d, x8
; CHECK-NEXT:    and z0.d, z0.d, z2.d
; CHECK-NEXT:    orr z0.d, z0.d, z1.d
; CHECK-NEXT:    ret
  %and.i = and <vscale x 2 x i64> %src1, splat(i64 281474976710666)
  %vshl_n = shl <vscale x 2 x i64> %src2, splat(i64 48)
  %result = or <vscale x 2 x i64> %and.i, %vshl_n
  ret <vscale x 2 x i64> %result
}

define <vscale x 2 x i64> @testRightGood2x64(<vscale x 2 x i64> %src1, <vscale x 2 x i64> %src2) {
; SVE-LABEL: testRightGood2x64:
; SVE:       // %bb.0:
; SVE-NEXT:    and z0.d, z0.d, #0xffffffffffff0000
; SVE-NEXT:    lsr z1.d, z1.d, #48
; SVE-NEXT:    orr z0.d, z0.d, z1.d
; SVE-NEXT:    ret
;
; SVE2-LABEL: testRightGood2x64:
; SVE2:       // %bb.0:
; SVE2-NEXT:    sri z0.d, z1.d, #48
; SVE2-NEXT:    ret
  %and.i = and <vscale x 2 x i64> %src1, splat(i64 18446744073709486080)
  %vshl_n = lshr <vscale x 2 x i64> %src2, splat(i64 48)
  %result = or <vscale x 2 x i64> %and.i, %vshl_n
  ret <vscale x 2 x i64> %result
}

define <vscale x 2 x i64> @testRightBad2x64(<vscale x 2 x i64> %src1, <vscale x 2 x i64> %src2) {
; CHECK-LABEL: testRightBad2x64:
; CHECK:       // %bb.0:
; CHECK-NEXT:    mov x8, #10 // =0xa
; CHECK-NEXT:    lsr z1.d, z1.d, #48
; CHECK-NEXT:    movk x8, #1, lsl #48
; CHECK-NEXT:    mov z2.d, x8
; CHECK-NEXT:    and z0.d, z0.d, z2.d
; CHECK-NEXT:    orr z0.d, z0.d, z1.d
; CHECK-NEXT:    ret
  %and.i = and <vscale x 2 x i64> %src1, splat(i64 281474976710666)
  %vshl_n = lshr <vscale x 2 x i64> %src2, splat(i64 48)
  %result = or <vscale x 2 x i64> %and.i, %vshl_n
  ret <vscale x 2 x i64> %result
}