llvm/llvm/test/CodeGen/AArch64/neon-idiv.ll

; RUN: llc -mtriple=aarch64-none-linux-gnu < %s -mattr=+neon | FileCheck %s

define <4 x i32> @test1(<4 x i32> %a) {
  %rem = srem <4 x i32> %a, <i32 7, i32 7, i32 7, i32 7>
  ret <4 x i32> %rem
; For C constant X/C is simplified to X-X/C*C. The X/C division is lowered
; to MULHS due the simplification by multiplying by a magic number
; (TargetLowering::BuildSDIV).
; CHECK-LABEL: test1:
; CHECK: smull2 [[SMULL2:(v[0-9]+)]].2d, {{v[0-9]+}}.4s, {{v[0-9]+}}.4s
; CHECK: smull  [[SMULL:(v[0-9]+)]].2d, {{v[0-9]+}}.2s, {{v[0-9]+}}.2s
; CHECK: uzp2   [[UZP2:(v[0-9]+).4s]], [[SMULL]].4s, [[SMULL2]].4s
; CHECK: add    [[ADD:(v[0-9]+.4s)]], [[UZP2]], v0.4s
; CHECK: sshr   [[SSHR:(v[0-9]+.4s)]], [[ADD]], #2
}