1
0
mirror of https://github.com/RPCS3/llvm-mirror.git synced 2024-10-23 04:52:54 +02:00
llvm-mirror/test/CodeGen/AArch64/recp-fastmath.ll
Evandro Menezes ed469b20bc [AArch64] Compute the Newton series for reciprocals natively
Implement the Newton series for the square root, the reciprocal square root,
and the reciprocal natively, using the specialized AArch64 instructions to
perform each series iteration.

Differential revision: https://reviews.llvm.org/D26518

llvm-svn: 286907
2016-11-14 23:29:01 +00:00

151 lines
3.8 KiB
LLVM

; RUN: llc < %s -mtriple=aarch64-unknown-linux-gnu -mattr=+neon | FileCheck %s
; Scalar float reciprocal (1.0 / %x) built with attribute group #0.
; The expected output right after the entry block label is an fmov
; immediately followed by an fdiv.
define float @frecp0(float %x) #0 {
; CHECK-LABEL: frecp0:
; CHECK-NEXT: BB#0
; CHECK-NEXT: fmov
; CHECK-NEXT: fdiv
  %recip = fdiv fast float 1.0, %x
  ret float %recip
}
; Scalar float reciprocal (1.0 / %x) built with attribute group #1.
; The expected output is a frecpe whose first operand is captured as R,
; and the very next line must be a frecps that ends with that same register.
define float @frecp1(float %x) #1 {
; CHECK-LABEL: frecp1:
; CHECK-NEXT: BB#0
; CHECK-NEXT: frecpe [[R:s[0-7]]]
; CHECK-NEXT: frecps {{s[0-7](, s[0-7])?}}, [[R]]
  %recip = fdiv fast float 1.0, %x
  ret float %recip
}
; <2 x float> reciprocal (splat of 1.0 divided by %x) built with attribute
; group #0. The expected output right after the entry block label is an fmov
; immediately followed by an fdiv.
define <2 x float> @f2recp0(<2 x float> %x) #0 {
; CHECK-LABEL: f2recp0:
; CHECK-NEXT: BB#0
; CHECK-NEXT: fmov
; CHECK-NEXT: fdiv
  %recip = fdiv fast <2 x float> <float 1.0, float 1.0>, %x
  ret <2 x float> %recip
}
; <2 x float> reciprocal (splat of 1.0 divided by %x) built with attribute
; group #1. The expected output is a frecpe whose first operand is captured
; as R, and the very next line must be a frecps that ends with that register.
define <2 x float> @f2recp1(<2 x float> %x) #1 {
  %div = fdiv fast <2 x float> <float 1.0, float 1.0>, %x
  ret <2 x float> %div

; Every "." in front of the ".2s" arrangement is escaped so that it matches
; only a literal dot, including the one inside the optional operand group.
; CHECK-LABEL: f2recp1:
; CHECK-NEXT: BB#0
; CHECK-NEXT: frecpe [[R:v[0-7]\.2s]]
; CHECK-NEXT: frecps {{v[0-7]\.2s(, v[0-7]\.2s)?}}, [[R]]
}
; <4 x float> reciprocal (splat of 1.0 divided by %x) built with attribute
; group #0. The expected output right after the entry block label is an fmov
; immediately followed by an fdiv.
define <4 x float> @f4recp0(<4 x float> %x) #0 {
; CHECK-LABEL: f4recp0:
; CHECK-NEXT: BB#0
; CHECK-NEXT: fmov
; CHECK-NEXT: fdiv
  %recip = fdiv fast <4 x float> <float 1.0, float 1.0, float 1.0, float 1.0>, %x
  ret <4 x float> %recip
}
; <4 x float> reciprocal (splat of 1.0 divided by %x) built with attribute
; group #1. The expected output is a frecpe whose first operand is captured
; as R, and the very next line must be a frecps that ends with that register.
define <4 x float> @f4recp1(<4 x float> %x) #1 {
  %div = fdiv fast <4 x float> <float 1.0, float 1.0, float 1.0, float 1.0>, %x
  ret <4 x float> %div

; Every "." in front of the ".4s" arrangement is escaped so that it matches
; only a literal dot, including the one inside the optional operand group.
; CHECK-LABEL: f4recp1:
; CHECK-NEXT: BB#0
; CHECK-NEXT: frecpe [[R:v[0-7]\.4s]]
; CHECK-NEXT: frecps {{v[0-7]\.4s(, v[0-7]\.4s)?}}, [[R]]
}
; <8 x float> reciprocal (splat of 1.0 divided by %x) built with attribute
; group #0. The expected output right after the entry block label is an fmov
; followed by two consecutive fdiv instructions.
define <8 x float> @f8recp0(<8 x float> %x) #0 {
; CHECK-LABEL: f8recp0:
; CHECK-NEXT: BB#0
; CHECK-NEXT: fmov
; CHECK-NEXT: fdiv
; CHECK-NEXT: fdiv
  %recip = fdiv fast <8 x float> <float 1.0, float 1.0, float 1.0, float 1.0, float 1.0, float 1.0, float 1.0, float 1.0>, %x
  ret <8 x float> %recip
}
; <8 x float> reciprocal (splat of 1.0 divided by %x) built with attribute
; group #1. The expected output is two consecutive frecpe instructions on
; ".4s" registers (captured as RA and RB), then a frecps ending with RA on
; the next line, and later a frecps ending with RB.
define <8 x float> @f8recp1(<8 x float> %x) #1 {
  %div = fdiv fast <8 x float> <float 1.0, float 1.0, float 1.0, float 1.0, float 1.0, float 1.0, float 1.0, float 1.0>, %x
  ret <8 x float> %div

; Every "." in front of the ".4s" arrangement is escaped so that it matches
; only a literal dot, including the one inside the optional operand group.
; The final directive is deliberately not the -NEXT form, so other
; instructions may sit between the two frecps lines.
; CHECK-LABEL: f8recp1:
; CHECK-NEXT: BB#0
; CHECK-NEXT: frecpe [[RA:v[0-7]\.4s]]
; CHECK-NEXT: frecpe [[RB:v[0-7]\.4s]]
; CHECK-NEXT: frecps {{v[0-7]\.4s(, v[0-7]\.4s)?}}, [[RA]]
; CHECK: frecps {{v[0-7]\.4s(, v[0-7]\.4s)?}}, [[RB]]
}
; Scalar double reciprocal (1.0 / %x) built with attribute group #0.
; The expected output right after the entry block label is an fmov
; immediately followed by an fdiv.
define double @drecp0(double %x) #0 {
; CHECK-LABEL: drecp0:
; CHECK-NEXT: BB#0
; CHECK-NEXT: fmov
; CHECK-NEXT: fdiv
  %recip = fdiv fast double 1.0, %x
  ret double %recip
}
; Scalar double reciprocal (1.0 / %x) built with attribute group #1.
; The expected output is a frecpe whose first operand is captured as R,
; and the very next line must be a frecps that ends with that same register.
define double @drecp1(double %x) #1 {
; CHECK-LABEL: drecp1:
; CHECK-NEXT: BB#0
; CHECK-NEXT: frecpe [[R:d[0-7]]]
; CHECK-NEXT: frecps {{d[0-7](, d[0-7])?}}, [[R]]
  %recip = fdiv fast double 1.0, %x
  ret double %recip
}
; <2 x double> reciprocal (splat of 1.0 divided by %x) built with attribute
; group #0. The expected output right after the entry block label is an fmov
; immediately followed by an fdiv.
define <2 x double> @d2recp0(<2 x double> %x) #0 {
; CHECK-LABEL: d2recp0:
; CHECK-NEXT: BB#0
; CHECK-NEXT: fmov
; CHECK-NEXT: fdiv
  %recip = fdiv fast <2 x double> <double 1.0, double 1.0>, %x
  ret <2 x double> %recip
}
; <2 x double> reciprocal (splat of 1.0 divided by %x) built with attribute
; group #1. The expected output is a frecpe whose first operand is captured
; as R, and the very next line must be a frecps that ends with that register.
define <2 x double> @d2recp1(<2 x double> %x) #1 {
  %div = fdiv fast <2 x double> <double 1.0, double 1.0>, %x
  ret <2 x double> %div

; Every "." in front of the ".2d" arrangement is escaped so that it matches
; only a literal dot, including the one inside the optional operand group.
; CHECK-LABEL: d2recp1:
; CHECK-NEXT: BB#0
; CHECK-NEXT: frecpe [[R:v[0-7]\.2d]]
; CHECK-NEXT: frecps {{v[0-7]\.2d(, v[0-7]\.2d)?}}, [[R]]
}
; <4 x double> reciprocal (splat of 1.0 divided by %x) built with attribute
; group #0. The expected output right after the entry block label is an fmov
; followed by two consecutive fdiv instructions.
define <4 x double> @d4recp0(<4 x double> %x) #0 {
; CHECK-LABEL: d4recp0:
; CHECK-NEXT: BB#0
; CHECK-NEXT: fmov
; CHECK-NEXT: fdiv
; CHECK-NEXT: fdiv
  %recip = fdiv fast <4 x double> <double 1.0, double 1.0, double 1.0, double 1.0>, %x
  ret <4 x double> %recip
}
; <4 x double> reciprocal (splat of 1.0 divided by %x) built with attribute
; group #1. The expected output is two consecutive frecpe instructions on
; ".2d" registers (captured as RA and RB), then a frecps ending with RA on
; the next line, and later a frecps ending with RB.
define <4 x double> @d4recp1(<4 x double> %x) #1 {
  %div = fdiv fast <4 x double> <double 1.0, double 1.0, double 1.0, double 1.0>, %x
  ret <4 x double> %div

; Every "." in front of the ".2d" arrangement is escaped so that it matches
; only a literal dot, including the one inside the optional operand group.
; The final directive is deliberately not the -NEXT form, so other
; instructions may sit between the two frecps lines.
; CHECK-LABEL: d4recp1:
; CHECK-NEXT: BB#0
; CHECK-NEXT: frecpe [[RA:v[0-7]\.2d]]
; CHECK-NEXT: frecpe [[RB:v[0-7]\.2d]]
; CHECK-NEXT: frecps {{v[0-7]\.2d(, v[0-7]\.2d)?}}, [[RA]]
; CHECK: frecps {{v[0-7]\.2d(, v[0-7]\.2d)?}}, [[RB]]
}
; Attribute group #0: used by the *recp0 functions in this file, whose
; expected output contains fdiv.
attributes #0 = { nounwind "unsafe-fp-math"="true" }
; Attribute group #1: same as #0 plus "reciprocal-estimates"="div,vec-div";
; used by the *recp1 functions, whose expected output contains frecpe/frecps.
attributes #1 = { nounwind "unsafe-fp-math"="true" "reciprocal-estimates"="div,vec-div" }