Home | History | Annotate | Download | only in InstCombine
      1 ; RUN: opt < %s -instcombine -S | FileCheck %s
      2 
      3 ; Make sure all library calls are eliminated when the input is known positive.
      4 
      5 declare float @fabsf(float)
      6 declare double @fabs(double)
      7 declare fp128 @fabsl(fp128)
      8 
      9 define float @square_fabs_call_f32(float %x) {
     10   %mul = fmul float %x, %x
     11   %fabsf = tail call float @fabsf(float %mul)
     12   ret float %fabsf
     13 
     14 ; CHECK-LABEL: square_fabs_call_f32(
     15 ; CHECK-NEXT: %mul = fmul float %x, %x
     16 ; CHECK-NEXT: ret float %mul
     17 }
     18 
     19 define double @square_fabs_call_f64(double %x) {
     20   %mul = fmul double %x, %x
     21   %fabs = tail call double @fabs(double %mul)
     22   ret double %fabs
     23 
     24 ; CHECK-LABEL: square_fabs_call_f64(
     25 ; CHECK-NEXT: %mul = fmul double %x, %x
     26 ; CHECK-NEXT: ret double %mul
     27 }
     28 
     29 define fp128 @square_fabs_call_f128(fp128 %x) {
     30   %mul = fmul fp128 %x, %x
     31   %fabsl = tail call fp128 @fabsl(fp128 %mul)
     32   ret fp128 %fabsl
     33 
     34 ; CHECK-LABEL: square_fabs_call_f128(
     35 ; CHECK-NEXT: %mul = fmul fp128 %x, %x
     36 ; CHECK-NEXT: ret fp128 %mul
     37 }
     38 
     39 ; Make sure all intrinsic calls are eliminated when the input is known positive.
     40 
     41 declare float @llvm.fabs.f32(float)
     42 declare double @llvm.fabs.f64(double)
     43 declare fp128 @llvm.fabs.f128(fp128)
     44 declare <4 x float> @llvm.fabs.v4f32(<4 x float>)
     45 
     46 define float @square_fabs_intrinsic_f32(float %x) {
     47   %mul = fmul float %x, %x
     48   %fabsf = tail call float @llvm.fabs.f32(float %mul)
     49   ret float %fabsf
     50 
     51 ; CHECK-LABEL: square_fabs_intrinsic_f32(
     52 ; CHECK-NEXT: %mul = fmul float %x, %x
     53 ; CHECK-NEXT: ret float %mul
     54 }
     55 
     56 define double @square_fabs_intrinsic_f64(double %x) {
     57   %mul = fmul double %x, %x
     58   %fabs = tail call double @llvm.fabs.f64(double %mul)
     59   ret double %fabs
     60 
     61 ; CHECK-LABEL: square_fabs_intrinsic_f64(
     62 ; CHECK-NEXT: %mul = fmul double %x, %x
     63 ; CHECK-NEXT: ret double %mul
     64 }
     65 
     66 define fp128 @square_fabs_intrinsic_f128(fp128 %x) {
     67   %mul = fmul fp128 %x, %x
     68   %fabsl = tail call fp128 @llvm.fabs.f128(fp128 %mul)
     69   ret fp128 %fabsl
     70 
     71 ; CHECK-LABEL: square_fabs_intrinsic_f128(
     72 ; CHECK-NEXT: %mul = fmul fp128 %x, %x
     73 ; CHECK-NEXT: ret fp128 %mul
     74 }
     75 
     76 ; Shrinking a library call to a smaller type should not be inhibited by nor inhibit the square optimization.
     77 
     78 define float @square_fabs_shrink_call1(float %x) {
     79   %ext = fpext float %x to double
     80   %sq = fmul double %ext, %ext
     81   %fabs = call double @fabs(double %sq)
     82   %trunc = fptrunc double %fabs to float
     83   ret float %trunc
     84 
     85 ; CHECK-LABEL: square_fabs_shrink_call1(
     86 ; CHECK-NEXT: %trunc = fmul float %x, %x
     87 ; CHECK-NEXT: ret float %trunc
     88 }
     89 
     90 define float @square_fabs_shrink_call2(float %x) {
     91   %sq = fmul float %x, %x
     92   %ext = fpext float %sq to double
     93   %fabs = call double @fabs(double %ext)
     94   %trunc = fptrunc double %fabs to float
     95   ret float %trunc
     96 
     97 ; CHECK-LABEL: square_fabs_shrink_call2(
     98 ; CHECK-NEXT: %sq = fmul float %x, %x
     99 ; CHECK-NEXT: ret float %sq
    100 }
    101 
    102 ; A scalar fabs op makes the sign bit zero, so masking off all of the other bits means we can return zero.
    103 
    104 define i32 @fabs_value_tracking_f32(float %x) {
    105   %call = call float @llvm.fabs.f32(float %x)
    106   %bc = bitcast float %call to i32
    107   %and = and i32 %bc, 2147483648
    108   ret i32 %and
    109 
    110 ; CHECK-LABEL: fabs_value_tracking_f32(
    111 ; CHECK:       ret i32 0
    112 }
    113 
    114 ; TODO: A vector fabs op makes the sign bits zero, so masking off all of the other bits means we can return zero.
    115 
    116 define <4 x i32> @fabs_value_tracking_v4f32(<4 x float> %x) {
    117   %call = call <4 x float> @llvm.fabs.v4f32(<4 x float> %x)
    118   %bc = bitcast <4 x float> %call to <4 x i32>
    119   %and = and <4 x i32> %bc, <i32 2147483648, i32 2147483648, i32 2147483648, i32 2147483648>
    120   ret <4 x i32> %and
    121 
    122 ; CHECK-LABEL: fabs_value_tracking_v4f32(
    123 ; CHECK:       ret <4 x i32> %and
    124 }
    125 
    126