llvm-project/llvm/test/CodeGen/AArch64/sqrt-fastmath.ll

; RUN: llc < %s -mtriple=aarch64 -mattr=neon -recip=!sqrt,!vec-sqrt   | FileCheck %s --check-prefix=FAULT
; RUN: llc < %s -mtriple=aarch64 -mattr=neon,-use-reverse-square-root | FileCheck %s --check-prefix=FAULT
; RUN: llc < %s -mtriple=aarch64 -mattr=neon -recip=sqrt,vec-sqrt     | FileCheck %s
; RUN: llc < %s -mtriple=aarch64 -mattr=neon,+use-reverse-square-root | FileCheck %s

declare float @llvm.sqrt.f32(float) #1
declare <2 x float> @llvm.sqrt.v2f32(<2 x float>) #1
declare <4 x float> @llvm.sqrt.v4f32(<4 x float>) #1
declare <8 x float> @llvm.sqrt.v8f32(<8 x float>) #1
declare double @llvm.sqrt.f64(double) #1
declare <2 x double> @llvm.sqrt.v2f64(<2 x double>) #1
declare <4 x double> @llvm.sqrt.v4f64(<4 x double>) #1

define float @fsqrt(float %a) #0 {
  %1 = tail call fast float @llvm.sqrt.f32(float %a)
  ret float %1

; FAULT-LABEL: fsqrt:
; FAULT-NEXT: BB#0
; FAULT-NEXT: fsqrt

; CHECK-LABEL: fsqrt:
; CHECK-NEXT: BB#0
; CHECK-NEXT: fmov
; CHECK-NEXT: frsqrte
}

define <2 x float> @f2sqrt(<2 x float> %a) #0 {
  %1 = tail call fast <2 x float> @llvm.sqrt.v2f32(<2 x float> %a) #2
  ret <2 x float> %1

; FAULT-LABEL: f2sqrt:
; FAULT-NEXT: BB#0
; FAULT-NEXT: fsqrt

; CHECK-LABEL: f2sqrt:
; CHECK-NEXT: BB#0
; CHECK-NEXT: fmov
; CHECK-NEXT: mov
; CHECK-NEXT: frsqrte
}

define <4 x float> @f4sqrt(<4 x float> %a) #0 {
  %1 = tail call fast <4 x float> @llvm.sqrt.v4f32(<4 x float> %a) #2
  ret <4 x float> %1

; FAULT-LABEL: f4sqrt:
; FAULT-NEXT: BB#0
; FAULT-NEXT: fsqrt

; CHECK-LABEL: f4sqrt:
; CHECK-NEXT: BB#0
; CHECK-NEXT: fmov
; CHECK-NEXT: mov
; CHECK-NEXT: frsqrte
}

define <8 x float> @f8sqrt(<8 x float> %a) #0 {
  %1 = tail call fast <8 x float> @llvm.sqrt.v8f32(<8 x float> %a) #2
  ret <8 x float> %1

; FAULT-LABEL: f8sqrt:
; FAULT-NEXT: BB#0
; FAULT-NEXT: fsqrt
; FAULT-NEXT: fsqrt

; CHECK-LABEL: f8sqrt:
; CHECK-NEXT: BB#0
; CHECK-NEXT: fmov
; CHECK-NEXT: mov
; CHECK-NEXT: frsqrte
; CHECK: frsqrte
}

define double @dsqrt(double %a) #0 {
  %1 = tail call fast double @llvm.sqrt.f64(double %a)
  ret double %1

; FAULT-LABEL: dsqrt:
; FAULT-NEXT: BB#0
; FAULT-NEXT: fsqrt

; CHECK-LABEL: dsqrt:
; CHECK-NEXT: BB#0
; CHECK-NEXT: fmov
; CHECK-NEXT: frsqrte
}

define <2 x double> @d2sqrt(<2 x double> %a) #0 {
  %1 = tail call fast <2 x double> @llvm.sqrt.v2f64(<2 x double> %a) #2
  ret <2 x double> %1

; FAULT-LABEL: d2sqrt:
; FAULT-NEXT: BB#0
; FAULT-NEXT: fsqrt

; CHECK-LABEL: d2sqrt:
; CHECK-NEXT: BB#0
; CHECK-NEXT: fmov
; CHECK-NEXT: mov
; CHECK-NEXT: frsqrte
}

define <4 x double> @d4sqrt(<4 x double> %a) #0 {
  %1 = tail call fast <4 x double> @llvm.sqrt.v4f64(<4 x double> %a) #4
  ret <4 x double> %1

; FAULT-LABEL: d4sqrt:
; FAULT-NEXT: BB#0
; FAULT-NEXT: fsqrt
; FAULT-NEXT: fsqrt

; CHECK-LABEL: d4sqrt:
; CHECK-NEXT: BB#0
; CHECK-NEXT: fmov
; CHECK-NEXT: mov
; CHECK-NEXT: frsqrte
; CHECK: frsqrte
}

define float @frsqrt(float %a) #0 {
  %1 = tail call fast float @llvm.sqrt.f32(float %a)
  %2 = fdiv fast float 1.000000e+00, %1
  ret float %2

; FAULT-LABEL: frsqrt:
; FAULT-NEXT: BB#0
; FAULT-NEXT: fsqrt

; CHECK-LABEL: frsqrt:
; CHECK-NEXT: BB#0
; CHECK-NEXT: fmov
; CHECK-NEXT: frsqrte
}

define <2 x float> @f2rsqrt(<2 x float> %a) #0 {
  %1 = tail call fast <2 x float> @llvm.sqrt.v2f32(<2 x float> %a) #2
  %2 = fdiv fast <2 x float> <float 1.000000e+00, float 1.000000e+00>, %1
  ret <2 x float> %2

; FAULT-LABEL: f2rsqrt:
; FAULT-NEXT: BB#0
; FAULT-NEXT: fsqrt

; CHECK-LABEL: f2rsqrt:
; CHECK-NEXT: BB#0
; CHECK-NEXT: fmov
; CHECK-NEXT: frsqrte
}

define <4 x float> @f4rsqrt(<4 x float> %a) #0 {
  %1 = tail call fast <4 x float> @llvm.sqrt.v4f32(<4 x float> %a) #2
  %2 = fdiv fast <4 x float> <float 1.000000e+00, float 1.000000e+00, float 1.000000e+00, float 1.000000e+00>, %1
  ret <4 x float> %2

; FAULT-LABEL: f4rsqrt:
; FAULT-NEXT: BB#0
; FAULT-NEXT: fsqrt

; CHECK-LABEL: f4rsqrt:
; CHECK-NEXT: BB#0
; CHECK-NEXT: fmov
; CHECK-NEXT: frsqrte
}

define <8 x float> @f8rsqrt(<8 x float> %a) #0 {
  %1 = tail call fast <8 x float> @llvm.sqrt.v8f32(<8 x float> %a) #2
  %2 = fdiv fast <8 x float> <float 1.000000e+00, float 1.000000e+00, float 1.000000e+00, float 1.000000e+00, float 1.000000e+00, float 1.000000e+00, float 1.000000e+00, float 1.000000e+00>, %1
  ret <8 x float> %2

; FAULT-LABEL: f8rsqrt:
; FAULT-NEXT: BB#0
; FAULT-NEXT: fsqrt
; FAULT-NEXT: fsqrt

; CHECK-LABEL: f8rsqrt:
; CHECK-NEXT: BB#0
; CHECK-NEXT: fmov
; CHECK-NEXT: frsqrte
; CHECK: frsqrte
}

define double @drsqrt(double %a) #0 {
  %1 = tail call fast double @llvm.sqrt.f64(double %a)
  %2 = fdiv fast double 1.000000e+00, %1
  ret double %2

; FAULT-LABEL: drsqrt:
; FAULT-NEXT: BB#0
; FAULT-NEXT: fsqrt

; CHECK-LABEL: drsqrt:
; CHECK-NEXT: BB#0
; CHECK-NEXT: fmov
; CHECK-NEXT: frsqrte
}

define <2 x double> @d2rsqrt(<2 x double> %a) #0 {
  %1 = tail call fast <2 x double> @llvm.sqrt.v2f64(<2 x double> %a) #2
  %2 = fdiv fast <2 x double> <double 1.000000e+00, double 1.000000e+00>, %1
  ret <2 x double> %2

; FAULT-LABEL: d2rsqrt:
; FAULT-NEXT: BB#0
; FAULT-NEXT: fsqrt

; CHECK-LABEL: d2rsqrt:
; CHECK-NEXT: BB#0
; CHECK-NEXT: fmov
; CHECK-NEXT: frsqrte
}

define <4 x double> @d4rsqrt(<4 x double> %a) #0 {
  %1 = tail call fast <4 x double> @llvm.sqrt.v4f64(<4 x double> %a) #4
  %2 = fdiv fast <4 x double> <double 1.000000e+00, double 1.000000e+00, double 1.000000e+00, double 1.000000e+00>, %1
  ret <4 x double> %2

; FAULT-LABEL: d4rsqrt:
; FAULT-NEXT: BB#0
; FAULT-NEXT: fsqrt
; FAULT-NEXT: fsqrt

; CHECK-LABEL: d4rsqrt:
; CHECK-NEXT: BB#0
; CHECK-NEXT: fmov
; CHECK-NEXT: frsqrte
; CHECK: frsqrte
}

attributes #0 = { nounwind "unsafe-fp-math"="true" }
[AArch64] Properly validate the reciprocal estimation. Add check for legal data types when expanding into a Newton series. Differential Revision: https://reviews.llvm.org/D22267 llvm-svn: 276041 2016-07-20 06:31:11 +08:00			`; RUN: llc < %s -mtriple=aarch64 -mattr=neon -recip=!sqrt,!vec-sqrt \| FileCheck %s --check-prefix=FAULT`
			`; RUN: llc < %s -mtriple=aarch64 -mattr=neon,-use-reverse-square-root \| FileCheck %s --check-prefix=FAULT`
			`; RUN: llc < %s -mtriple=aarch64 -mattr=neon -recip=sqrt,vec-sqrt \| FileCheck %s`
[AArch64] Switch regression tests to test features not CPUs Summary: We have switched to using features for all heuristics, but the tests for these are still using -mcpu, which means we are not directly testing the features. This converts at least some of the existing regression tests to use the new features. This still leaves the following features untested: merge-narrow-ld predictable-select-expensive alternate-sextload-cvt-f32-pattern disable-latency-sched-heuristic Reviewers: mcrosier, t.p.northover, rengolin Subscribers: MatzeB, aemerson, llvm-commits, rengolin Differential Revision: http://reviews.llvm.org/D21288 llvm-svn: 273271 2016-06-21 23:16:34 +08:00			`; RUN: llc < %s -mtriple=aarch64 -mattr=neon,+use-reverse-square-root \| FileCheck %s`
[AArch64] Use the reciprocal estimation machinery This patch adds support for estimating the square root, its reciprocal and division or reciprocal using the combiner generic reciprocal machinery. llvm-svn: 268539 2016-05-05 04:18:27 +08:00
			`declare float @llvm.sqrt.f32(float) #1`
			`declare <2 x float> @llvm.sqrt.v2f32(<2 x float>) #1`
			`declare <4 x float> @llvm.sqrt.v4f32(<4 x float>) #1`
[AArch64] Properly validate the reciprocal estimation. Add check for legal data types when expanding into a Newton series. Differential Revision: https://reviews.llvm.org/D22267 llvm-svn: 276041 2016-07-20 06:31:11 +08:00			`declare <8 x float> @llvm.sqrt.v8f32(<8 x float>) #1`
			`declare double @llvm.sqrt.f64(double) #1`
[AArch64] Use the reciprocal estimation machinery This patch adds support for estimating the square root, its reciprocal and division or reciprocal using the combiner generic reciprocal machinery. llvm-svn: 268539 2016-05-05 04:18:27 +08:00			`declare <2 x double> @llvm.sqrt.v2f64(<2 x double>) #1`
[AArch64] Properly validate the reciprocal estimation. Add check for legal data types when expanding into a Newton series. Differential Revision: https://reviews.llvm.org/D22267 llvm-svn: 276041 2016-07-20 06:31:11 +08:00			`declare <4 x double> @llvm.sqrt.v4f64(<4 x double>) #1`
[AArch64] Use the reciprocal estimation machinery This patch adds support for estimating the square root, its reciprocal and division or reciprocal using the combiner generic reciprocal machinery. llvm-svn: 268539 2016-05-05 04:18:27 +08:00
			`define float @fsqrt(float %a) #0 {`
			`%1 = tail call fast float @llvm.sqrt.f32(float %a)`
			`ret float %1`

			`; FAULT-LABEL: fsqrt:`
			`; FAULT-NEXT: BB#0`
			`; FAULT-NEXT: fsqrt`

			`; CHECK-LABEL: fsqrt:`
			`; CHECK-NEXT: BB#0`
			`; CHECK-NEXT: fmov`
			`; CHECK-NEXT: frsqrte`
			`}`

			`define <2 x float> @f2sqrt(<2 x float> %a) #0 {`
			`%1 = tail call fast <2 x float> @llvm.sqrt.v2f32(<2 x float> %a) #2`
			`ret <2 x float> %1`

			`; FAULT-LABEL: f2sqrt:`
			`; FAULT-NEXT: BB#0`
			`; FAULT-NEXT: fsqrt`

			`; CHECK-LABEL: f2sqrt:`
			`; CHECK-NEXT: BB#0`
			`; CHECK-NEXT: fmov`
			`; CHECK-NEXT: mov`
			`; CHECK-NEXT: frsqrte`
			`}`

			`define <4 x float> @f4sqrt(<4 x float> %a) #0 {`
			`%1 = tail call fast <4 x float> @llvm.sqrt.v4f32(<4 x float> %a) #2`
			`ret <4 x float> %1`

			`; FAULT-LABEL: f4sqrt:`
			`; FAULT-NEXT: BB#0`
			`; FAULT-NEXT: fsqrt`

			`; CHECK-LABEL: f4sqrt:`
			`; CHECK-NEXT: BB#0`
			`; CHECK-NEXT: fmov`
			`; CHECK-NEXT: mov`
			`; CHECK-NEXT: frsqrte`
			`}`

[AArch64] Properly validate the reciprocal estimation. Add check for legal data types when expanding into a Newton series. Differential Revision: https://reviews.llvm.org/D22267 llvm-svn: 276041 2016-07-20 06:31:11 +08:00			`define <8 x float> @f8sqrt(<8 x float> %a) #0 {`
			`%1 = tail call fast <8 x float> @llvm.sqrt.v8f32(<8 x float> %a) #2`
			`ret <8 x float> %1`

			`; FAULT-LABEL: f8sqrt:`
			`; FAULT-NEXT: BB#0`
			`; FAULT-NEXT: fsqrt`
			`; FAULT-NEXT: fsqrt`

			`; CHECK-LABEL: f8sqrt:`
			`; CHECK-NEXT: BB#0`
			`; CHECK-NEXT: fmov`
			`; CHECK-NEXT: mov`
			`; CHECK-NEXT: frsqrte`
			`; CHECK: frsqrte`
			`}`

[AArch64] Use the reciprocal estimation machinery This patch adds support for estimating the square root, its reciprocal and division or reciprocal using the combiner generic reciprocal machinery. llvm-svn: 268539 2016-05-05 04:18:27 +08:00			`define double @dsqrt(double %a) #0 {`
			`%1 = tail call fast double @llvm.sqrt.f64(double %a)`
			`ret double %1`

			`; FAULT-LABEL: dsqrt:`
			`; FAULT-NEXT: BB#0`
			`; FAULT-NEXT: fsqrt`

			`; CHECK-LABEL: dsqrt:`
			`; CHECK-NEXT: BB#0`
			`; CHECK-NEXT: fmov`
			`; CHECK-NEXT: frsqrte`
			`}`

			`define <2 x double> @d2sqrt(<2 x double> %a) #0 {`
			`%1 = tail call fast <2 x double> @llvm.sqrt.v2f64(<2 x double> %a) #2`
			`ret <2 x double> %1`

			`; FAULT-LABEL: d2sqrt:`
			`; FAULT-NEXT: BB#0`
			`; FAULT-NEXT: fsqrt`

			`; CHECK-LABEL: d2sqrt:`
			`; CHECK-NEXT: BB#0`
			`; CHECK-NEXT: fmov`
			`; CHECK-NEXT: mov`
			`; CHECK-NEXT: frsqrte`
			`}`

[AArch64] Properly validate the reciprocal estimation. Add check for legal data types when expanding into a Newton series. Differential Revision: https://reviews.llvm.org/D22267 llvm-svn: 276041 2016-07-20 06:31:11 +08:00			`define <4 x double> @d4sqrt(<4 x double> %a) #0 {`
			`%1 = tail call fast <4 x double> @llvm.sqrt.v4f64(<4 x double> %a) #4`
			`ret <4 x double> %1`

			`; FAULT-LABEL: d4sqrt:`
			`; FAULT-NEXT: BB#0`
			`; FAULT-NEXT: fsqrt`
			`; FAULT-NEXT: fsqrt`

			`; CHECK-LABEL: d4sqrt:`
			`; CHECK-NEXT: BB#0`
			`; CHECK-NEXT: fmov`
			`; CHECK-NEXT: mov`
			`; CHECK-NEXT: frsqrte`
			`; CHECK: frsqrte`
			`}`

[AArch64] Use the reciprocal estimation machinery This patch adds support for estimating the square root, its reciprocal and division or reciprocal using the combiner generic reciprocal machinery. llvm-svn: 268539 2016-05-05 04:18:27 +08:00			`define float @frsqrt(float %a) #0 {`
			`%1 = tail call fast float @llvm.sqrt.f32(float %a)`
			`%2 = fdiv fast float 1.000000e+00, %1`
			`ret float %2`

			`; FAULT-LABEL: frsqrt:`
			`; FAULT-NEXT: BB#0`
			`; FAULT-NEXT: fsqrt`

			`; CHECK-LABEL: frsqrt:`
			`; CHECK-NEXT: BB#0`
			`; CHECK-NEXT: fmov`
			`; CHECK-NEXT: frsqrte`
			`}`

			`define <2 x float> @f2rsqrt(<2 x float> %a) #0 {`
			`%1 = tail call fast <2 x float> @llvm.sqrt.v2f32(<2 x float> %a) #2`
			`%2 = fdiv fast <2 x float> <float 1.000000e+00, float 1.000000e+00>, %1`
			`ret <2 x float> %2`

			`; FAULT-LABEL: f2rsqrt:`
			`; FAULT-NEXT: BB#0`
			`; FAULT-NEXT: fsqrt`

			`; CHECK-LABEL: f2rsqrt:`
			`; CHECK-NEXT: BB#0`
			`; CHECK-NEXT: fmov`
			`; CHECK-NEXT: frsqrte`
			`}`

			`define <4 x float> @f4rsqrt(<4 x float> %a) #0 {`
			`%1 = tail call fast <4 x float> @llvm.sqrt.v4f32(<4 x float> %a) #2`
			`%2 = fdiv fast <4 x float> <float 1.000000e+00, float 1.000000e+00, float 1.000000e+00, float 1.000000e+00>, %1`
			`ret <4 x float> %2`

			`; FAULT-LABEL: f4rsqrt:`
			`; FAULT-NEXT: BB#0`
			`; FAULT-NEXT: fsqrt`

			`; CHECK-LABEL: f4rsqrt:`
			`; CHECK-NEXT: BB#0`
			`; CHECK-NEXT: fmov`
			`; CHECK-NEXT: frsqrte`
			`}`

[AArch64] Properly validate the reciprocal estimation. Add check for legal data types when expanding into a Newton series. Differential Revision: https://reviews.llvm.org/D22267 llvm-svn: 276041 2016-07-20 06:31:11 +08:00			`define <8 x float> @f8rsqrt(<8 x float> %a) #0 {`
			`%1 = tail call fast <8 x float> @llvm.sqrt.v8f32(<8 x float> %a) #2`
			`%2 = fdiv fast <8 x float> <float 1.000000e+00, float 1.000000e+00, float 1.000000e+00, float 1.000000e+00, float 1.000000e+00, float 1.000000e+00, float 1.000000e+00, float 1.000000e+00>, %1`
			`ret <8 x float> %2`

			`; FAULT-LABEL: f8rsqrt:`
			`; FAULT-NEXT: BB#0`
			`; FAULT-NEXT: fsqrt`
			`; FAULT-NEXT: fsqrt`

			`; CHECK-LABEL: f8rsqrt:`
			`; CHECK-NEXT: BB#0`
			`; CHECK-NEXT: fmov`
			`; CHECK-NEXT: frsqrte`
			`; CHECK: frsqrte`
			`}`

[AArch64] Use the reciprocal estimation machinery This patch adds support for estimating the square root, its reciprocal and division or reciprocal using the combiner generic reciprocal machinery. llvm-svn: 268539 2016-05-05 04:18:27 +08:00			`define double @drsqrt(double %a) #0 {`
			`%1 = tail call fast double @llvm.sqrt.f64(double %a)`
			`%2 = fdiv fast double 1.000000e+00, %1`
			`ret double %2`

			`; FAULT-LABEL: drsqrt:`
			`; FAULT-NEXT: BB#0`
			`; FAULT-NEXT: fsqrt`

			`; CHECK-LABEL: drsqrt:`
			`; CHECK-NEXT: BB#0`
			`; CHECK-NEXT: fmov`
			`; CHECK-NEXT: frsqrte`
			`}`

			`define <2 x double> @d2rsqrt(<2 x double> %a) #0 {`
			`%1 = tail call fast <2 x double> @llvm.sqrt.v2f64(<2 x double> %a) #2`
			`%2 = fdiv fast <2 x double> <double 1.000000e+00, double 1.000000e+00>, %1`
			`ret <2 x double> %2`

			`; FAULT-LABEL: d2rsqrt:`
			`; FAULT-NEXT: BB#0`
			`; FAULT-NEXT: fsqrt`

			`; CHECK-LABEL: d2rsqrt:`
			`; CHECK-NEXT: BB#0`
			`; CHECK-NEXT: fmov`
			`; CHECK-NEXT: frsqrte`
			`}`

[AArch64] Properly validate the reciprocal estimation. Add check for legal data types when expanding into a Newton series. Differential Revision: https://reviews.llvm.org/D22267 llvm-svn: 276041 2016-07-20 06:31:11 +08:00			`define <4 x double> @d4rsqrt(<4 x double> %a) #0 {`
			`%1 = tail call fast <4 x double> @llvm.sqrt.v4f64(<4 x double> %a) #4`
			`%2 = fdiv fast <4 x double> <double 1.000000e+00, double 1.000000e+00, double 1.000000e+00, double 1.000000e+00>, %1`
			`ret <4 x double> %2`

			`; FAULT-LABEL: d4rsqrt:`
			`; FAULT-NEXT: BB#0`
			`; FAULT-NEXT: fsqrt`
			`; FAULT-NEXT: fsqrt`

			`; CHECK-LABEL: d4rsqrt:`
			`; CHECK-NEXT: BB#0`
			`; CHECK-NEXT: fmov`
			`; CHECK-NEXT: frsqrte`
			`; CHECK: frsqrte`
			`}`

[AArch64] Use the reciprocal estimation machinery This patch adds support for estimating the square root, its reciprocal and division or reciprocal using the combiner generic reciprocal machinery. llvm-svn: 268539 2016-05-05 04:18:27 +08:00			`attributes #0 = { nounwind "unsafe-fp-math"="true" }`