Home | History | Annotate | Download | only in SystemZ
      1 ; RUN: llc < %s -mtriple=s390x-linux-gnu | FileCheck %s
        ;
        ; Every function below calls llvm.fma.f32 with a negated third operand,
        ; i.e. it computes %f1 * %f2 - %acc, and checks the s390x assembly that
        ; llc emits for it (MSEBR for register operands, MSEB when the second
        ; multiplicand is loaded from memory).
      2 
      3 declare float @llvm.fma.f32(float %f1, float %f2, float %f3)
      4 
      5 define float @f1(float %f1, float %f2, float %acc) {
        ; Register form: fma(%f1, %f2, -%acc) computes %f1 * %f2 - %acc, and the
        ; expected output is a single MSEBR with all three operands in registers.
        ; The result is expected in %f4 and is then copied to %f0 before the
        ; return.
        ;
      6 ; CHECK-LABEL: f1:
      7 ; CHECK: msebr %f4, %f0, %f2
      8 ; CHECK: ler %f0, %f4
      9 ; CHECK: br %r14
          ; -0.0 - %acc is the negation of %acc.
     10   %negacc = fsub float -0.0, %acc
     11   %res = call float @llvm.fma.f32 (float %f1, float %f2, float %negacc)
     12   ret float %res
     13 }
     14 
     15 define float @f2(float %f1, float *%ptr, float %acc) {
        ; Memory form: the second multiplicand is loaded from %ptr, and the load
        ; is expected to be folded into MSEB as a zero displacement off %r2.
        ; The result is expected in %f2 and is then copied to %f0.
        ;
     16 ; CHECK-LABEL: f2:
     17 ; CHECK: mseb %f2, %f0, 0(%r2)
     18 ; CHECK: ler %f0, %f2
     19 ; CHECK: br %r14
     20   %f2 = load float , float *%ptr
          ; -0.0 - %acc is the negation of %acc.
     21   %negacc = fsub float -0.0, %acc
     22   %res = call float @llvm.fma.f32 (float %f1, float %f2, float %negacc)
     23   ret float %res
     24 }
     25 
     26 define float @f3(float %f1, float *%base, float %acc) {
        ; The loaded element sits 1023 floats past %base, a byte offset of 4092.
        ; The expected MSEB encodes that offset directly as its displacement,
        ; with no separate address computation.
        ;
     27 ; CHECK-LABEL: f3:
     28 ; CHECK: mseb %f2, %f0, 4092(%r2)
     29 ; CHECK: ler %f0, %f2
     30 ; CHECK: br %r14
          ; 1023 floats * 4 bytes = 4092 bytes past %base.
     31   %ptr = getelementptr float, float *%base, i64 1023
     32   %f2 = load float , float *%ptr
          ; -0.0 - %acc is the negation of %acc.
     33   %negacc = fsub float -0.0, %acc
     34   %res = call float @llvm.fma.f32 (float %f1, float %f2, float %negacc)
     35   ret float %res
     36 }
     37 
     38 define float @f4(float %f1, float *%base, float %acc) {
     39 ; The important thing here is that we don't generate an out-of-range
     40 ; displacement.  Other sequences besides this one would be OK.
     41 ;
        ; The expected sequence adds the 4096-byte offset to %r2 with AGHI and
        ; then uses MSEB with a zero displacement.
        ;
     42 ; CHECK-LABEL: f4:
     43 ; CHECK: aghi %r2, 4096
     44 ; CHECK: mseb %f2, %f0, 0(%r2)
     45 ; CHECK: ler %f0, %f2
     46 ; CHECK: br %r14
          ; 1024 floats * 4 bytes = 4096 bytes past %base.
     47   %ptr = getelementptr float, float *%base, i64 1024
     48   %f2 = load float , float *%ptr
          ; -0.0 - %acc is the negation of %acc.
     49   %negacc = fsub float -0.0, %acc
     50   %res = call float @llvm.fma.f32 (float %f1, float %f2, float %negacc)
     51   ret float %res
     52 }
     53 
     54 define float @f5(float %f1, float *%base, float %acc) {
     55 ; Here too the important thing is that we don't generate an out-of-range
     56 ; displacement.  Other sequences besides this one would be OK.
     57 ;
        ; The expected sequence adds the negative offset (-4 bytes) to %r2 with
        ; AGHI and then uses MSEB with a zero displacement.
        ;
     58 ; CHECK-LABEL: f5:
     59 ; CHECK: aghi %r2, -4
     60 ; CHECK: mseb %f2, %f0, 0(%r2)
     61 ; CHECK: ler %f0, %f2
     62 ; CHECK: br %r14
          ; One float before %base: -1 * 4 bytes = -4 bytes.
     63   %ptr = getelementptr float, float *%base, i64 -1
     64   %f2 = load float , float *%ptr
          ; -0.0 - %acc is the negation of %acc.
     65   %negacc = fsub float -0.0, %acc
     66   %res = call float @llvm.fma.f32 (float %f1, float %f2, float %negacc)
     67   ret float %res
     68 }
     69 
     70 define float @f6(float %f1, float *%base, i64 %index, float %acc) {
        ; Indexed form: the element address is %base + %index floats.  The
        ; expected output shifts the index in %r3 left by 2 (multiplying it by
        ; the 4-byte element size) into %r1, and MSEB then addresses memory
        ; with both %r1 and %r2 and a zero displacement.
        ;
     71 ; CHECK-LABEL: f6:
     72 ; CHECK: sllg %r1, %r3, 2
     73 ; CHECK: mseb %f2, %f0, 0(%r1,%r2)
     74 ; CHECK: ler %f0, %f2
     75 ; CHECK: br %r14
     76   %ptr = getelementptr float, float *%base, i64 %index
     77   %f2 = load float , float *%ptr
          ; -0.0 - %acc is the negation of %acc.
     78   %negacc = fsub float -0.0, %acc
     79   %res = call float @llvm.fma.f32 (float %f1, float %f2, float %negacc)
     80   ret float %res
     81 }
     82 
     83 define float @f7(float %f1, float *%base, i64 %index, float %acc) {
        ; Indexed form plus a constant: the element index is %index + 1023.
        ; The expected output scales %index with a shift by 2 and folds the
        ; constant part (1023 * 4 = 4092 bytes) into the MSEB displacement.
        ; Either order of %r1 and %r2 in the address operand is accepted.
        ;
     84 ; CHECK-LABEL: f7:
     85 ; CHECK: sllg %r1, %r3, 2
     86 ; CHECK: mseb %f2, %f0, 4092({{%r1,%r2|%r2,%r1}})
     87 ; CHECK: ler %f0, %f2
     88 ; CHECK: br %r14
     89   %index2 = add i64 %index, 1023
     90   %ptr = getelementptr float, float *%base, i64 %index2
     91   %f2 = load float , float *%ptr
          ; -0.0 - %acc is the negation of %acc.
     92   %negacc = fsub float -0.0, %acc
     93   %res = call float @llvm.fma.f32 (float %f1, float %f2, float %negacc)
     94   ret float %res
     95 }
     96 
     97 define float @f8(float %f1, float *%base, i64 %index, float %acc) {
        ; Indexed form plus a constant: the element index is %index + 1024, so
        ; the constant part is 1024 * 4 = 4096 bytes.  Here the expected output
        ; does not put that constant in the MSEB displacement: a LAY first
        ; forms the full address (scaled index + base + 4096) in %r1, and MSEB
        ; then uses %r1 with a zero displacement.
        ;
     98 ; CHECK-LABEL: f8:
     99 ; CHECK: sllg %r1, %r3, 2
    100 ; CHECK: lay %r1, 4096({{%r1,%r2|%r2,%r1}})
    101 ; CHECK: mseb %f2, %f0, 0(%r1)
    102 ; CHECK: ler %f0, %f2
    103 ; CHECK: br %r14
    104   %index2 = add i64 %index, 1024
    105   %ptr = getelementptr float, float *%base, i64 %index2
    106   %f2 = load float , float *%ptr
          ; -0.0 - %acc is the negation of %acc.
    107   %negacc = fsub float -0.0, %acc
    108   %res = call float @llvm.fma.f32 (float %f1, float %f2, float %negacc)
    109   ret float %res
    110 }
    111