test/Transforms/InstCombine/fabs.ll

   1 ; RUN: opt < %s -instcombine -S | FileCheck %s
   2
   3 ; Make sure all library calls are eliminated when the input is known positive.
   4
   5 declare float @fabsf(float)
   6 declare double @fabs(double)
   7 declare fp128 @fabsl(fp128)
   8
   9 define float @square_fabs_call_f32(float %x) {
  10   %mul = fmul float %x, %x
  11   %fabsf = tail call float @fabsf(float %mul)
  12   ret float %fabsf
  13
  14 ; CHECK-LABEL: square_fabs_call_f32(
  15 ; CHECK-NEXT: %mul = fmul float %x, %x
  16 ; CHECK-NEXT: ret float %mul
  17 }
  18
  19 define double @square_fabs_call_f64(double %x) {
  20   %mul = fmul double %x, %x
  21   %fabs = tail call double @fabs(double %mul)
  22   ret double %fabs
  23
  24 ; CHECK-LABEL: square_fabs_call_f64(
  25 ; CHECK-NEXT: %mul = fmul double %x, %x
  26 ; CHECK-NEXT: ret double %mul
  27 }
  28
  29 define fp128 @square_fabs_call_f128(fp128 %x) {
  30   %mul = fmul fp128 %x, %x
  31   %fabsl = tail call fp128 @fabsl(fp128 %mul)
  32   ret fp128 %fabsl
  33
  34 ; CHECK-LABEL: square_fabs_call_f128(
  35 ; CHECK-NEXT: %mul = fmul fp128 %x, %x
  36 ; CHECK-NEXT: ret fp128 %mul
  37 }
  38
  39 ; Make sure all intrinsic calls are eliminated when the input is known positive.
  40
  41 declare float @llvm.fabs.f32(float)
  42 declare double @llvm.fabs.f64(double)
  43 declare fp128 @llvm.fabs.f128(fp128)
  44 declare <4 x float> @llvm.fabs.v4f32(<4 x float>)
  45
  46 define float @square_fabs_intrinsic_f32(float %x) {
  47   %mul = fmul float %x, %x
  48   %fabsf = tail call float @llvm.fabs.f32(float %mul)
  49   ret float %fabsf
  50
  51 ; CHECK-LABEL: square_fabs_intrinsic_f32(
  52 ; CHECK-NEXT: %mul = fmul float %x, %x
  53 ; CHECK-NEXT: ret float %mul
  54 }
  55
  56 define double @square_fabs_intrinsic_f64(double %x) {
  57   %mul = fmul double %x, %x
  58   %fabs = tail call double @llvm.fabs.f64(double %mul)
  59   ret double %fabs
  60
  61 ; CHECK-LABEL: square_fabs_intrinsic_f64(
  62 ; CHECK-NEXT: %mul = fmul double %x, %x
  63 ; CHECK-NEXT: ret double %mul
  64 }
  65
  66 define fp128 @square_fabs_intrinsic_f128(fp128 %x) {
  67   %mul = fmul fp128 %x, %x
  68   %fabsl = tail call fp128 @llvm.fabs.f128(fp128 %mul)
  69   ret fp128 %fabsl
  70
  71 ; CHECK-LABEL: square_fabs_intrinsic_f128(
  72 ; CHECK-NEXT: %mul = fmul fp128 %x, %x
  73 ; CHECK-NEXT: ret fp128 %mul
  74 }
  75
  76 ; Shrinking a library call to a smaller type should not be inhibited by nor inhibit the square optimization.
  77
  78 define float @square_fabs_shrink_call1(float %x) {
  79   %ext = fpext float %x to double
  80   %sq = fmul double %ext, %ext
  81   %fabs = call double @fabs(double %sq)
  82   %trunc = fptrunc double %fabs to float
  83   ret float %trunc
  84
  85 ; CHECK-LABEL: square_fabs_shrink_call1(
  86 ; CHECK-NEXT: %trunc = fmul float %x, %x
  87 ; CHECK-NEXT: ret float %trunc
  88 }
  89
  90 define float @square_fabs_shrink_call2(float %x) {
  91   %sq = fmul float %x, %x
  92   %ext = fpext float %sq to double
  93   %fabs = call double @fabs(double %ext)
  94   %trunc = fptrunc double %fabs to float
  95   ret float %trunc
  96
  97 ; CHECK-LABEL: square_fabs_shrink_call2(
  98 ; CHECK-NEXT: %sq = fmul float %x, %x
  99 ; CHECK-NEXT: ret float %sq
 100 }
 101
 102 ; A scalar fabs op makes the sign bit zero, so masking off all of the other bits means we can return zero.
 103
 104 define i32 @fabs_value_tracking_f32(float %x) {
 105   %call = call float @llvm.fabs.f32(float %x)
 106   %bc = bitcast float %call to i32
 107   %and = and i32 %bc, 2147483648
 108   ret i32 %and
 109
 110 ; CHECK-LABEL: fabs_value_tracking_f32(
 111 ; CHECK:       ret i32 0
 112 }
 113
 114 ; TODO: A vector fabs op makes the sign bits zero, so masking off all of the other bits means we can return zero.
 115
 116 define <4 x i32> @fabs_value_tracking_v4f32(<4 x float> %x) {
 117   %call = call <4 x float> @llvm.fabs.v4f32(<4 x float> %x)
 118   %bc = bitcast <4 x float> %call to <4 x i32>
 119   %and = and <4 x i32> %bc, <i32 2147483648, i32 2147483648, i32 2147483648, i32 2147483648>
 120   ret <4 x i32> %and
 121
 122 ; CHECK-LABEL: fabs_value_tracking_v4f32(
 123 ; CHECK:       ret <4 x i32> %and
 124 }
 125