llvm/llvm/test/CodeGen/SystemZ/bswap-09.ll

; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py UTC_ARGS: --version 2
; Test i128 byteswaps on z13 and higher.
;
; RUN: llc < %s -mtriple=s390x-linux-gnu -mcpu=z13 | FileCheck %s

declare i128 @llvm.bswap.i128(i128 %a)

; Check 128-bit register-to-register byteswaps.
define i128 @f1(i128 %a, i128 %b, i128 %c) {
; CHECK-LABEL: f1:
; CHECK:       # %bb.0:
; CHECK-NEXT:    vl %v1, 0(%r4), 3
; CHECK-NEXT:    vl %v2, 0(%r3), 3
; CHECK-NEXT:    larl %r1, .LCPI0_0
; CHECK-NEXT:    vaq %v1, %v2, %v1
; CHECK-NEXT:    vl %v2, 0(%r1), 3
; CHECK-NEXT:    vl %v0, 0(%r5), 3
; CHECK-NEXT:    vperm %v1, %v1, %v1, %v2
; CHECK-NEXT:    vaq %v0, %v1, %v0
; CHECK-NEXT:    vst %v0, 0(%r2), 3
; CHECK-NEXT:    br %r14
  %in = add i128 %a, %b
  %swapped = call i128 @llvm.bswap.i128(i128 %in)
  %out = add i128 %swapped, %c
  ret i128 %out
}

; Check 128-bit register-to-memory byteswaps.
define i128 @f2(i128 %a, i128 %b) {
; CHECK-LABEL: f2:
; CHECK:       # %bb.0:
; CHECK-NEXT:    vl %v0, 0(%r4), 3
; CHECK-NEXT:    vl %v1, 0(%r3), 3
; CHECK-NEXT:    larl %r1, .LCPI1_0
; CHECK-NEXT:    vaq %v0, %v1, %v0
; CHECK-NEXT:    vl %v1, 0(%r1), 3
; CHECK-NEXT:    vperm %v0, %v0, %v0, %v1
; CHECK-NEXT:    vst %v0, 0(%r2), 3
; CHECK-NEXT:    br %r14
  %in = add i128 %a, %b
  %swapped = call i128 @llvm.bswap.i128(i128 %in)
  ret i128 %swapped
}

; Check 128-bit memory-to-register byteswaps.
define i128 @f3(i128 %a, i128 %b) {
; CHECK-LABEL: f3:
; CHECK:       # %bb.0:
; CHECK-NEXT:    larl %r1, .LCPI2_0
; CHECK-NEXT:    vl %v1, 0(%r3), 3
; CHECK-NEXT:    vl %v2, 0(%r1), 3
; CHECK-NEXT:    vl %v0, 0(%r4), 3
; CHECK-NEXT:    vperm %v1, %v1, %v1, %v2
; CHECK-NEXT:    vaq %v0, %v1, %v0
; CHECK-NEXT:    vst %v0, 0(%r2), 3
; CHECK-NEXT:    br %r14
  %swapped = call i128 @llvm.bswap.i128(i128 %a)
  %out = add i128 %swapped, %b
  ret i128 %out
}