; neon-idiv.ll
; 707 Bytes
; RUN: llc -mtriple=aarch64-none-linux-gnu < %s -mattr=+neon | FileCheck %s
; test1: per-lane signed remainder (srem) of a <4 x i32> vector by the
; constant splat 7; the result vector is returned unchanged.
define <4 x i32> @test1(<4 x i32> %a) {
%rem = srem <4 x i32> %a, <i32 7, i32 7, i32 7, i32 7>
ret <4 x i32> %rem
; For a constant C, X%C is simplified to X-(X/C)*C. The X/C division is lowered
; to MULHS due to the simplification by multiplying by a magic number
; (TargetLowering::BuildSDIV).
; The directives below match only the division part of that expansion, from
; the smull2/smull pair through the sshr; the remaining multiply-and-subtract
; that forms the remainder is not matched. The SSHR capture is defined but
; not referenced by any later directive.
; CHECK-LABEL: test1:
; CHECK: smull2 [[SMULL2:(v[0-9]+)]].2d, {{v[0-9]+}}.4s, {{v[0-9]+}}.4s
; CHECK: smull [[SMULL:(v[0-9]+)]].2d, {{v[0-9]+}}.2s, {{v[0-9]+}}.2s
; CHECK: uzp2 [[UZP2:(v[0-9]+).4s]], [[SMULL]].4s, [[SMULL2]].4s
; CHECK: add [[ADD:(v[0-9]+.4s)]], [[UZP2]], v0.4s
; CHECK: sshr [[SSHR:(v[0-9]+.4s)]], [[ADD]], #2
}