Home | History | Annotate | Download | only in SystemZ
      1 ; Test vector subtraction.
      2 ;
      3 ; RUN: llc < %s -mtriple=s390x-linux-gnu -mcpu=z13 | FileCheck %s
      4 
      5 ; Test a v16i8 subtraction.
      6 define <16 x i8> @f1(<16 x i8> %dummy, <16 x i8> %val1, <16 x i8> %val2) {
      7 ; CHECK-LABEL: f1:
      8 ; CHECK: vsb %v24, %v26, %v28
      9 ; CHECK: br %r14
     10   %ret = sub <16 x i8> %val1, %val2
     11   ret <16 x i8> %ret
     12 }
     13 
     14 ; Test a v8i16 subtraction.
     15 define <8 x i16> @f2(<8 x i16> %dummy, <8 x i16> %val1, <8 x i16> %val2) {
     16 ; CHECK-LABEL: f2:
     17 ; CHECK: vsh %v24, %v26, %v28
     18 ; CHECK: br %r14
     19   %ret = sub <8 x i16> %val1, %val2
     20   ret <8 x i16> %ret
     21 }
     22 
     23 ; Test a v4i32 subtraction.
     24 define <4 x i32> @f3(<4 x i32> %dummy, <4 x i32> %val1, <4 x i32> %val2) {
     25 ; CHECK-LABEL: f3:
     26 ; CHECK: vsf %v24, %v26, %v28
     27 ; CHECK: br %r14
     28   %ret = sub <4 x i32> %val1, %val2
     29   ret <4 x i32> %ret
     30 }
     31 
     32 ; Test a v2i64 subtraction.
     33 define <2 x i64> @f4(<2 x i64> %dummy, <2 x i64> %val1, <2 x i64> %val2) {
     34 ; CHECK-LABEL: f4:
     35 ; CHECK: vsg %v24, %v26, %v28
     36 ; CHECK: br %r14
     37   %ret = sub <2 x i64> %val1, %val2
     38   ret <2 x i64> %ret
     39 }
     40 
     41 ; Test a v4f32 subtraction, as an example of an operation that needs to be
     42 ; scalarized and reassembled.  At present there's an unnecessary move that
     43 ; could be avoided with smarter ordering.  It also isn't important whether
     44 ; the VSLDBs use the result of the VLRs or use %v24 and %v26 directly.
     45 define <4 x float> @f5(<4 x float> %val1, <4 x float> %val2) {
     46 ; CHECK-LABEL: f5:
     47 ; CHECK-DAG: vlr %v[[A1:[0-5]]], %v24
     48 ; CHECK-DAG: vlr %v[[A2:[0-5]]], %v26
     49 ; CHECK-DAG: vrepf %v[[B1:[0-5]]], %v[[A1]], 1
     50 ; CHECK-DAG: vrepf %v[[B2:[0-5]]], %v[[A2]], 1
     51 ; CHECK-DAG: vrepf %v[[C1:[0-5]]], %v[[A1]], 2
     52 ; CHECK-DAG: vrepf %v[[C2:[0-5]]], %v[[A2]], 2
     53 ; CHECK-DAG: vrepf %v[[D1:[0-5]]], %v[[A1]], 3
     54 ; CHECK-DAG: vrepf %v[[D2:[0-5]]], %v[[A2]], 3
     55 ; CHECK-DAG: ler %f[[A1copy:[0-5]]], %f[[A1]]
     56 ; CHECK-DAG: sebr %f[[A1copy]], %f[[A2]]
     57 ; CHECK-DAG: sebr %f[[B1]], %f[[B2]]
     58 ; CHECK-DAG: sebr %f[[C1]], %f[[C2]]
     59 ; CHECK-DAG: sebr %f[[D1]], %f[[D2]]
     60 ; CHECK-DAG: vmrhf [[HIGH:%v[0-9]+]], %v[[A1copy]], %v[[B1]]
     61 ; CHECK-DAG: vmrhf [[LOW:%v[0-9]+]], %v[[C1]], %v[[D1]]
     62 ; CHECK: vmrhg %v24, [[HIGH]], [[LOW]]
     63 ; CHECK: br %r14
     64   %ret = fsub <4 x float> %val1, %val2
     65   ret <4 x float> %ret
     66 }
     67 
     68 ; Test a v2f64 subtraction.
     69 define <2 x double> @f6(<2 x double> %dummy, <2 x double> %val1,
     70                         <2 x double> %val2) {
     71 ; CHECK-LABEL: f6:
     72 ; CHECK: vfsdb %v24, %v26, %v28
     73 ; CHECK: br %r14
     74   %ret = fsub <2 x double> %val1, %val2
     75   ret <2 x double> %ret
     76 }
     77 
     78 ; Test an f64 subtraction that uses vector registers.
     79 define double @f7(<2 x double> %val1, <2 x double> %val2) {
     80 ; CHECK-LABEL: f7:
     81 ; CHECK: wfsdb %f0, %v24, %v26
     82 ; CHECK: br %r14
     83   %scalar1 = extractelement <2 x double> %val1, i32 0
     84   %scalar2 = extractelement <2 x double> %val2, i32 0
     85   %ret = fsub double %scalar1, %scalar2
     86   ret double %ret
     87 }
     88 
     89 ; Test a v2i8 subtraction, which gets promoted to v16i8.
     90 define <2 x i8> @f8(<2 x i8> %dummy, <2 x i8> %val1, <2 x i8> %val2) {
     91 ; CHECK-LABEL: f8:
     92 ; CHECK: vsb %v24, %v26, %v28
     93 ; CHECK: br %r14
     94   %ret = sub <2 x i8> %val1, %val2
     95   ret <2 x i8> %ret
     96 }
     97 
     98 ; Test a v4i8 subtraction, which gets promoted to v16i8.
     99 define <4 x i8> @f9(<4 x i8> %dummy, <4 x i8> %val1, <4 x i8> %val2) {
    100 ; CHECK-LABEL: f9:
    101 ; CHECK: vsb %v24, %v26, %v28
    102 ; CHECK: br %r14
    103   %ret = sub <4 x i8> %val1, %val2
    104   ret <4 x i8> %ret
    105 }
    106 
    107 ; Test a v8i8 subtraction, which gets promoted to v16i8.
    108 define <8 x i8> @f10(<8 x i8> %dummy, <8 x i8> %val1, <8 x i8> %val2) {
    109 ; CHECK-LABEL: f10:
    110 ; CHECK: vsb %v24, %v26, %v28
    111 ; CHECK: br %r14
    112   %ret = sub <8 x i8> %val1, %val2
    113   ret <8 x i8> %ret
    114 }
    115 
    116 ; Test a v2i16 subtraction, which gets promoted to v8i16.
    117 define <2 x i16> @f11(<2 x i16> %dummy, <2 x i16> %val1, <2 x i16> %val2) {
    118 ; CHECK-LABEL: f11:
    119 ; CHECK: vsh %v24, %v26, %v28
    120 ; CHECK: br %r14
    121   %ret = sub <2 x i16> %val1, %val2
    122   ret <2 x i16> %ret
    123 }
    124 
    125 ; Test a v4i16 subtraction, which gets promoted to v8i16.
    126 define <4 x i16> @f12(<4 x i16> %dummy, <4 x i16> %val1, <4 x i16> %val2) {
    127 ; CHECK-LABEL: f12:
    128 ; CHECK: vsh %v24, %v26, %v28
    129 ; CHECK: br %r14
    130   %ret = sub <4 x i16> %val1, %val2
    131   ret <4 x i16> %ret
    132 }
    133 
    134 ; Test a v2i32 subtraction, which gets promoted to v4i32.
    135 define <2 x i32> @f13(<2 x i32> %dummy, <2 x i32> %val1, <2 x i32> %val2) {
    136 ; CHECK-LABEL: f13:
    137 ; CHECK: vsf %v24, %v26, %v28
    138 ; CHECK: br %r14
    139   %ret = sub <2 x i32> %val1, %val2
    140   ret <2 x i32> %ret
    141 }
    142 
    143 ; Test a v2f32 subtraction, which gets promoted to v4f32.
    144 define <2 x float> @f14(<2 x float> %val1, <2 x float> %val2) {
    145 ; No particular output expected, but must compile.
    146   %ret = fsub <2 x float> %val1, %val2
    147   ret <2 x float> %ret
    148 }
    149