1 ; RUN: llc < %s -mtriple=powerpc64-unknown-linux-gnu -mcpu=pwr7 -enable-unsafe-fp-math -mattr=-vsx | FileCheck %s
2 ; RUN: llc < %s -mtriple=powerpc64-unknown-linux-gnu -mcpu=pwr7 -mattr=-vsx | FileCheck -check-prefix=CHECK-SAFE %s
3 target datalayout = "E-p:64:64:64-i1:8:8-i8:8:8-i16:16:16-i32:32:32-i64:64:64-f32:32:32-f64:64:64-f128:128:128-v128:128:128-n32:64" ; leading E selects big-endian; p:64 gives 64-bit pointers
4 target triple = "powerpc64-unknown-linux-gnu" ; same triple that both llc invocations at the top of the file pass via -mtriple
6 declare double @llvm.sqrt.f64(double) ; scalar double sqrt intrinsic, called by @foo, @food and @foo3
7 declare float @llvm.sqrt.f32(float) ; scalar float sqrt intrinsic, called by @foof, @goo, @rsqrt_fmul and @goo3
8 declare <4 x float> @llvm.sqrt.v4f32(<4 x float>) ; 4-lane float vector sqrt intrinsic, called by @hoo and @hoo3
10 define double @foo(double %a, double %b) nounwind { ; double-precision case: computes a / sqrt(b)
11 %x = call double @llvm.sqrt.f64(double %b) ; x = sqrt(b)
12 %r = fdiv double %a, %x ; r = a / x, i.e. a divide whose divisor is a square root
33 define double @foof(double %a, float %b) nounwind { ; mixed precision: float sqrt feeding a double divide
34 %x = call float @llvm.sqrt.f32(float %b) ; x = sqrt(b), computed in single precision
35 %y = fpext float %x to double ; widen the root so it can serve as a double divisor
36 %r = fdiv double %a, %y ; r = a / sqrt(b), divide performed in double precision
54 define float @food(float %a, double %b) nounwind { ; mixed precision: double sqrt feeding a float divide
55 %x = call double @llvm.sqrt.f64(double %b) ; x = sqrt(b), computed in double precision
56 %y = fptrunc double %x to float ; narrow the root to float before it is used as the divisor
57 %r = fdiv float %a, %y ; r = a / sqrt(b), divide performed in single precision
79 define float @goo(float %a, float %b) nounwind { ; single-precision case: computes a / sqrt(b)
80 %x = call float @llvm.sqrt.f32(float %b) ; x = sqrt(b)
81 %r = fdiv float %a, %x ; r = a / x, the float counterpart of the divide in @foo
99 ; Recognize that c / (sqrt(a) * b) is rsqrt(a) * rcp(b) * c,
100 ; not 1 / (1 / sqrt(a)) * rcp(b) * c.
101 define float @rsqrt_fmul(float %a, float %b, float %c) { ; the sqrt is only one factor of the divisor here
102 %x = call float @llvm.sqrt.f32(float %a) ; x = sqrt(a)
103 %y = fmul float %x, %b ; y = sqrt(a) * b
104 %z = fdiv float %c, %y ; z = c / (sqrt(a) * b)
108 ; CHECK-DAG: frsqrtes
120 ; CHECK-SAFE: @rsqrt_fmul
127 define <4 x float> @hoo(<4 x float> %a, <4 x float> %b) nounwind { ; vector case: a / sqrt(b) on 4 float lanes; the directive below forbids vrsqrtefp for the llc run without -enable-unsafe-fp-math
128 %x = call <4 x float> @llvm.sqrt.v4f32(<4 x float> %b) ; x = sqrt(b), lane-wise
129 %r = fdiv <4 x float> %a, %x ; r = a / x, lane-wise
136 ; CHECK-SAFE-NOT: vrsqrtefp
140 define double @foo2(double %a, double %b) nounwind { ; plain double divide, no sqrt involved
141 %r = fdiv double %a, %b ; r = a / b
158 define float @goo2(float %a, float %b) nounwind { ; plain float divide, no sqrt involved
159 %r = fdiv float %a, %b ; r = a / b
174 define <4 x float> @hoo2(<4 x float> %a, <4 x float> %b) nounwind { ; plain 4-lane float divide; the directive below forbids vrefp for the llc run without -enable-unsafe-fp-math
175 %r = fdiv <4 x float> %a, %b ; r = a / b, lane-wise
182 ; CHECK-SAFE-NOT: vrefp
186 define double @foo3(double %a) nounwind { ; bare double sqrt with no divide around it
187 %r = call double @llvm.sqrt.f64(double %a) ; r = sqrt(a)
208 define float @goo3(float %a) nounwind { ; bare float sqrt; the directive below expects frsqrtes from the llc run with -enable-unsafe-fp-math
209 %r = call float @llvm.sqrt.f32(float %a) ; r = sqrt(a)
214 ; CHECK-DAG: frsqrtes
227 define <4 x float> @hoo3(<4 x float> %a) nounwind { ; bare 4-lane float sqrt; the directives below expect vcmpeqfp with -enable-unsafe-fp-math and forbid vrsqrtefp without it
228 %r = call <4 x float> @llvm.sqrt.v4f32(<4 x float> %a) ; r = sqrt(a), lane-wise
233 ; CHECK-DAG: vcmpeqfp
236 ; CHECK-SAFE-NOT: vrsqrtefp