Home | History | Annotate | Download | only in msa
      1 ; RUN: llc -march=mips -mattr=+msa,+fp64 < %s | FileCheck %s
      2 ; RUN: llc -march=mipsel -mattr=+msa,+fp64 < %s | FileCheck %s
      3 
      4 declare <4 x float> @llvm.mips.fmax.w(<4 x float>, <4 x float>) nounwind
      5 declare <2 x double> @llvm.mips.fmax.d(<2 x double>, <2 x double>) nounwind
      6 declare <4 x float> @llvm.mips.fmin.w(<4 x float>, <4 x float>) nounwind
      7 declare <2 x double> @llvm.mips.fmin.d(<2 x double>, <2 x double>) nounwind
      8 
      9 define void @false_v4f32(<4 x i32>* %c, <4 x float>* %a, <4 x float>* %b) nounwind {
     10   ; CHECK: false_v4f32:
     11 
     12   %1 = load <4 x float>, <4 x float>* %a
     13   %2 = load <4 x float>, <4 x float>* %b
     14   %3 = fcmp false <4 x float> %1, %2
     15   %4 = sext <4 x i1> %3 to <4 x i32>
     16   store <4 x i32> %4, <4 x i32>* %c
     17   ret void
     18 
     19   ; (setcc $a, $b, SETFALSE) is always folded, so we won't get fcaf:
     20   ; CHECK-DAG: ldi.b [[R1:\$w[0-9]+]], 0
     21   ; CHECK-DAG: st.w [[R1]], 0($4)
     22   ; CHECK: .size false_v4f32
     23 }
     24 
     25 define void @false_v2f64(<2 x i64>* %c, <2 x double>* %a, <2 x double>* %b) nounwind {
     26   ; CHECK: false_v2f64:
     27 
     28   %1 = load <2 x double>, <2 x double>* %a
     29   %2 = load <2 x double>, <2 x double>* %b
     30   %3 = fcmp false <2 x double> %1, %2
     31   %4 = sext <2 x i1> %3 to <2 x i64>
     32   store <2 x i64> %4, <2 x i64>* %c
     33   ret void
     34 
     35   ; (setcc $a, $b, SETFALSE) is always folded
     36   ; CHECK-DAG: ldi.b [[R1:\$w[0-9]+]], 0
     37   ; CHECK-DAG: st.w [[R1]], 0($4)
     38   ; CHECK: .size false_v2f64
     39 }
     40 
     41 define void @oeq_v4f32(<4 x i32>* %c, <4 x float>* %a, <4 x float>* %b) nounwind {
     42   ; CHECK: oeq_v4f32:
     43 
     44   %1 = load <4 x float>, <4 x float>* %a
     45   ; CHECK-DAG: ld.w [[R1:\$w[0-9]+]], 0($5)
     46   %2 = load <4 x float>, <4 x float>* %b
     47   ; CHECK-DAG: ld.w [[R2:\$w[0-9]+]], 0($6)
     48   %3 = fcmp oeq <4 x float> %1, %2
     49   %4 = sext <4 x i1> %3 to <4 x i32>
     50   ; CHECK-DAG: fceq.w [[R3:\$w[0-9]+]], [[R1]], [[R2]]
     51   store <4 x i32> %4, <4 x i32>* %c
     52   ; CHECK-DAG: st.w [[R3]], 0($4)
     53 
     54   ret void
     55   ; CHECK: .size oeq_v4f32
     56 }
     57 
     58 define void @oeq_v2f64(<2 x i64>* %c, <2 x double>* %a, <2 x double>* %b) nounwind {
     59   ; CHECK: oeq_v2f64:
     60 
     61   %1 = load <2 x double>, <2 x double>* %a
     62   ; CHECK-DAG: ld.d [[R1:\$w[0-9]+]], 0($5)
     63   %2 = load <2 x double>, <2 x double>* %b
     64   ; CHECK-DAG: ld.d [[R2:\$w[0-9]+]], 0($6)
     65   %3 = fcmp oeq <2 x double> %1, %2
     66   %4 = sext <2 x i1> %3 to <2 x i64>
     67   ; CHECK-DAG: fceq.d [[R3:\$w[0-9]+]], [[R1]], [[R2]]
     68   store <2 x i64> %4, <2 x i64>* %c
     69   ; CHECK-DAG: st.d [[R3]], 0($4)
     70 
     71   ret void
     72   ; CHECK: .size oeq_v2f64
     73 }
     74 
     75 define void @oge_v4f32(<4 x i32>* %c, <4 x float>* %a, <4 x float>* %b) nounwind {
     76   ; CHECK: oge_v4f32:
     77 
     78   %1 = load <4 x float>, <4 x float>* %a
     79   ; CHECK-DAG: ld.w [[R1:\$w[0-9]+]], 0($5)
     80   %2 = load <4 x float>, <4 x float>* %b
     81   ; CHECK-DAG: ld.w [[R2:\$w[0-9]+]], 0($6)
     82   %3 = fcmp oge <4 x float> %1, %2
     83   %4 = sext <4 x i1> %3 to <4 x i32>
     84   ; CHECK-DAG: fcle.w [[R3:\$w[0-9]+]], [[R2]], [[R1]]
     85   store <4 x i32> %4, <4 x i32>* %c
     86   ; CHECK-DAG: st.w [[R3]], 0($4)
     87 
     88   ret void
     89   ; CHECK: .size oge_v4f32
     90 }
     91 
     92 define void @oge_v2f64(<2 x i64>* %c, <2 x double>* %a, <2 x double>* %b) nounwind {
     93   ; CHECK: oge_v2f64:
     94 
     95   %1 = load <2 x double>, <2 x double>* %a
     96   ; CHECK-DAG: ld.d [[R1:\$w[0-9]+]], 0($5)
     97   %2 = load <2 x double>, <2 x double>* %b
     98   ; CHECK-DAG: ld.d [[R2:\$w[0-9]+]], 0($6)
     99   %3 = fcmp oge <2 x double> %1, %2
    100   %4 = sext <2 x i1> %3 to <2 x i64>
    101   ; CHECK-DAG: fcle.d [[R3:\$w[0-9]+]], [[R2]], [[R1]]
    102   store <2 x i64> %4, <2 x i64>* %c
    103   ; CHECK-DAG: st.d [[R3]], 0($4)
    104 
    105   ret void
    106   ; CHECK: .size oge_v2f64
    107 }
    108 
    109 define void @ogt_v4f32(<4 x i32>* %c, <4 x float>* %a, <4 x float>* %b) nounwind {
    110   ; CHECK: ogt_v4f32:
    111 
    112   %1 = load <4 x float>, <4 x float>* %a
    113   ; CHECK-DAG: ld.w [[R1:\$w[0-9]+]], 0($5)
    114   %2 = load <4 x float>, <4 x float>* %b
    115   ; CHECK-DAG: ld.w [[R2:\$w[0-9]+]], 0($6)
    116   %3 = fcmp ogt <4 x float> %1, %2
    117   %4 = sext <4 x i1> %3 to <4 x i32>
    118   ; CHECK-DAG: fclt.w [[R3:\$w[0-9]+]], [[R2]], [[R1]]
    119   store <4 x i32> %4, <4 x i32>* %c
    120   ; CHECK-DAG: st.w [[R3]], 0($4)
    121 
    122   ret void
    123   ; CHECK: .size ogt_v4f32
    124 }
    125 
    126 define void @ogt_v2f64(<2 x i64>* %c, <2 x double>* %a, <2 x double>* %b) nounwind {
    127   ; CHECK: ogt_v2f64:
    128 
    129   %1 = load <2 x double>, <2 x double>* %a
    130   ; CHECK-DAG: ld.d [[R1:\$w[0-9]+]], 0($5)
    131   %2 = load <2 x double>, <2 x double>* %b
    132   ; CHECK-DAG: ld.d [[R2:\$w[0-9]+]], 0($6)
    133   %3 = fcmp ogt <2 x double> %1, %2
    134   %4 = sext <2 x i1> %3 to <2 x i64>
    135   ; CHECK-DAG: fclt.d [[R3:\$w[0-9]+]], [[R2]], [[R1]]
    136   store <2 x i64> %4, <2 x i64>* %c
    137   ; CHECK-DAG: st.d [[R3]], 0($4)
    138 
    139   ret void
    140   ; CHECK: .size ogt_v2f64
    141 }
    142 
    143 define void @ole_v4f32(<4 x i32>* %c, <4 x float>* %a, <4 x float>* %b) nounwind {
    144   ; CHECK: ole_v4f32:
    145 
    146   %1 = load <4 x float>, <4 x float>* %a
    147   ; CHECK-DAG: ld.w [[R1:\$w[0-9]+]], 0($5)
    148   %2 = load <4 x float>, <4 x float>* %b
    149   ; CHECK-DAG: ld.w [[R2:\$w[0-9]+]], 0($6)
    150   %3 = fcmp ole <4 x float> %1, %2
    151   %4 = sext <4 x i1> %3 to <4 x i32>
    152   ; CHECK-DAG: fcle.w [[R3:\$w[0-9]+]], [[R1]], [[R2]]
    153   store <4 x i32> %4, <4 x i32>* %c
    154   ; CHECK-DAG: st.w [[R3]], 0($4)
    155 
    156   ret void
    157   ; CHECK: .size ole_v4f32
    158 }
    159 
    160 define void @ole_v2f64(<2 x i64>* %c, <2 x double>* %a, <2 x double>* %b) nounwind {
    161   ; CHECK: ole_v2f64:
    162 
    163   %1 = load <2 x double>, <2 x double>* %a
    164   ; CHECK-DAG: ld.d [[R1:\$w[0-9]+]], 0($5)
    165   %2 = load <2 x double>, <2 x double>* %b
    166   ; CHECK-DAG: ld.d [[R2:\$w[0-9]+]], 0($6)
    167   %3 = fcmp ole <2 x double> %1, %2
    168   %4 = sext <2 x i1> %3 to <2 x i64>
    169   ; CHECK-DAG: fcle.d [[R3:\$w[0-9]+]], [[R1]], [[R2]]
    170   store <2 x i64> %4, <2 x i64>* %c
    171   ; CHECK-DAG: st.d [[R3]], 0($4)
    172 
    173   ret void
    174   ; CHECK: .size ole_v2f64
    175 }
    176 
    177 define void @olt_v4f32(<4 x i32>* %c, <4 x float>* %a, <4 x float>* %b) nounwind {
    178   ; CHECK: olt_v4f32:
    179 
    180   %1 = load <4 x float>, <4 x float>* %a
    181   ; CHECK-DAG: ld.w [[R1:\$w[0-9]+]], 0($5)
    182   %2 = load <4 x float>, <4 x float>* %b
    183   ; CHECK-DAG: ld.w [[R2:\$w[0-9]+]], 0($6)
    184   %3 = fcmp olt <4 x float> %1, %2
    185   %4 = sext <4 x i1> %3 to <4 x i32>
    186   ; CHECK-DAG: fclt.w [[R3:\$w[0-9]+]], [[R1]], [[R2]]
    187   store <4 x i32> %4, <4 x i32>* %c
    188   ; CHECK-DAG: st.w [[R3]], 0($4)
    189 
    190   ret void
    191   ; CHECK: .size olt_v4f32
    192 }
    193 
    194 define void @olt_v2f64(<2 x i64>* %c, <2 x double>* %a, <2 x double>* %b) nounwind {
    195   ; CHECK: olt_v2f64:
    196 
    197   %1 = load <2 x double>, <2 x double>* %a
    198   ; CHECK-DAG: ld.d [[R1:\$w[0-9]+]], 0($5)
    199   %2 = load <2 x double>, <2 x double>* %b
    200   ; CHECK-DAG: ld.d [[R2:\$w[0-9]+]], 0($6)
    201   %3 = fcmp olt <2 x double> %1, %2
    202   %4 = sext <2 x i1> %3 to <2 x i64>
    203   ; CHECK-DAG: fclt.d [[R3:\$w[0-9]+]], [[R1]], [[R2]]
    204   store <2 x i64> %4, <2 x i64>* %c
    205   ; CHECK-DAG: st.d [[R3]], 0($4)
    206 
    207   ret void
    208   ; CHECK: .size olt_v2f64
    209 }
    210 
    211 define void @one_v4f32(<4 x i32>* %c, <4 x float>* %a, <4 x float>* %b) nounwind {
    212   ; CHECK: one_v4f32:
    213 
    214   %1 = load <4 x float>, <4 x float>* %a
    215   ; CHECK-DAG: ld.w [[R1:\$w[0-9]+]], 0($5)
    216   %2 = load <4 x float>, <4 x float>* %b
    217   ; CHECK-DAG: ld.w [[R2:\$w[0-9]+]], 0($6)
    218   %3 = fcmp one <4 x float> %1, %2
    219   %4 = sext <4 x i1> %3 to <4 x i32>
    220   ; CHECK-DAG: fcne.w [[R3:\$w[0-9]+]], [[R1]], [[R2]]
    221   store <4 x i32> %4, <4 x i32>* %c
    222   ; CHECK-DAG: st.w [[R3]], 0($4)
    223 
    224   ret void
    225   ; CHECK: .size one_v4f32
    226 }
    227 
    228 define void @one_v2f64(<2 x i64>* %c, <2 x double>* %a, <2 x double>* %b) nounwind {
    229   ; CHECK: one_v2f64:
    230 
    231   %1 = load <2 x double>, <2 x double>* %a
    232   ; CHECK-DAG: ld.d [[R1:\$w[0-9]+]], 0($5)
    233   %2 = load <2 x double>, <2 x double>* %b
    234   ; CHECK-DAG: ld.d [[R2:\$w[0-9]+]], 0($6)
    235   %3 = fcmp one <2 x double> %1, %2
    236   %4 = sext <2 x i1> %3 to <2 x i64>
    237   ; CHECK-DAG: fcne.d [[R3:\$w[0-9]+]], [[R1]], [[R2]]
    238   store <2 x i64> %4, <2 x i64>* %c
    239   ; CHECK-DAG: st.d [[R3]], 0($4)
    240 
    241   ret void
    242   ; CHECK: .size one_v2f64
    243 }
    244 
    245 define void @ord_v4f32(<4 x i32>* %c, <4 x float>* %a, <4 x float>* %b) nounwind {
    246   ; CHECK: ord_v4f32:
    247 
    248   %1 = load <4 x float>, <4 x float>* %a
    249   ; CHECK-DAG: ld.w [[R1:\$w[0-9]+]], 0($5)
    250   %2 = load <4 x float>, <4 x float>* %b
    251   ; CHECK-DAG: ld.w [[R2:\$w[0-9]+]], 0($6)
    252   %3 = fcmp ord <4 x float> %1, %2
    253   %4 = sext <4 x i1> %3 to <4 x i32>
    254   ; CHECK-DAG: fcor.w [[R3:\$w[0-9]+]], [[R1]], [[R2]]
    255   store <4 x i32> %4, <4 x i32>* %c
    256   ; CHECK-DAG: st.w [[R3]], 0($4)
    257 
    258   ret void
    259   ; CHECK: .size ord_v4f32
    260 }
    261 
    262 define void @ord_v2f64(<2 x i64>* %c, <2 x double>* %a, <2 x double>* %b) nounwind {
    263   ; CHECK: ord_v2f64:
    264 
    265   %1 = load <2 x double>, <2 x double>* %a
    266   ; CHECK-DAG: ld.d [[R1:\$w[0-9]+]], 0($5)
    267   %2 = load <2 x double>, <2 x double>* %b
    268   ; CHECK-DAG: ld.d [[R2:\$w[0-9]+]], 0($6)
    269   %3 = fcmp ord <2 x double> %1, %2
    270   %4 = sext <2 x i1> %3 to <2 x i64>
    271   ; CHECK-DAG: fcor.d [[R3:\$w[0-9]+]], [[R1]], [[R2]]
    272   store <2 x i64> %4, <2 x i64>* %c
    273   ; CHECK-DAG: st.d [[R3]], 0($4)
    274 
    275   ret void
    276   ; CHECK: .size ord_v2f64
    277 }
    278 
    279 define void @ueq_v4f32(<4 x i32>* %c, <4 x float>* %a, <4 x float>* %b) nounwind {
    280   ; CHECK: ueq_v4f32:
    281 
    282   %1 = load <4 x float>, <4 x float>* %a
    283   ; CHECK-DAG: ld.w [[R1:\$w[0-9]+]], 0($5)
    284   %2 = load <4 x float>, <4 x float>* %b
    285   ; CHECK-DAG: ld.w [[R2:\$w[0-9]+]], 0($6)
    286   %3 = fcmp ueq <4 x float> %1, %2
    287   %4 = sext <4 x i1> %3 to <4 x i32>
    288   ; CHECK-DAG: fcueq.w [[R3:\$w[0-9]+]], [[R1]], [[R2]]
    289   store <4 x i32> %4, <4 x i32>* %c
    290   ; CHECK-DAG: st.w [[R3]], 0($4)
    291 
    292   ret void
    293   ; CHECK: .size ueq_v4f32
    294 }
    295 
    296 define void @ueq_v2f64(<2 x i64>* %c, <2 x double>* %a, <2 x double>* %b) nounwind {
    297   ; CHECK: ueq_v2f64:
    298 
    299   %1 = load <2 x double>, <2 x double>* %a
    300   ; CHECK-DAG: ld.d [[R1:\$w[0-9]+]], 0($5)
    301   %2 = load <2 x double>, <2 x double>* %b
    302   ; CHECK-DAG: ld.d [[R2:\$w[0-9]+]], 0($6)
    303   %3 = fcmp ueq <2 x double> %1, %2
    304   %4 = sext <2 x i1> %3 to <2 x i64>
    305   ; CHECK-DAG: fcueq.d [[R3:\$w[0-9]+]], [[R1]], [[R2]]
    306   store <2 x i64> %4, <2 x i64>* %c
    307   ; CHECK-DAG: st.d [[R3]], 0($4)
    308 
    309   ret void
    310   ; CHECK: .size ueq_v2f64
    311 }
    312 
    313 define void @uge_v4f32(<4 x i32>* %c, <4 x float>* %a, <4 x float>* %b) nounwind {
    314   ; CHECK: uge_v4f32:
    315 
    316   %1 = load <4 x float>, <4 x float>* %a
    317   ; CHECK-DAG: ld.w [[R1:\$w[0-9]+]], 0($5)
    318   %2 = load <4 x float>, <4 x float>* %b
    319   ; CHECK-DAG: ld.w [[R2:\$w[0-9]+]], 0($6)
    320   %3 = fcmp uge <4 x float> %1, %2
    321   %4 = sext <4 x i1> %3 to <4 x i32>
    322   ; CHECK-DAG: fcule.w [[R3:\$w[0-9]+]], [[R2]], [[R1]]
    323   store <4 x i32> %4, <4 x i32>* %c
    324   ; CHECK-DAG: st.w [[R3]], 0($4)
    325 
    326   ret void
    327   ; CHECK: .size uge_v4f32
    328 }
    329 
    330 define void @uge_v2f64(<2 x i64>* %c, <2 x double>* %a, <2 x double>* %b) nounwind {
    331   ; CHECK: uge_v2f64:
    332 
    333   %1 = load <2 x double>, <2 x double>* %a
    334   ; CHECK-DAG: ld.d [[R1:\$w[0-9]+]], 0($5)
    335   %2 = load <2 x double>, <2 x double>* %b
    336   ; CHECK-DAG: ld.d [[R2:\$w[0-9]+]], 0($6)
    337   %3 = fcmp uge <2 x double> %1, %2
    338   %4 = sext <2 x i1> %3 to <2 x i64>
    339   ; CHECK-DAG: fcule.d [[R3:\$w[0-9]+]], [[R2]], [[R1]]
    340   store <2 x i64> %4, <2 x i64>* %c
    341   ; CHECK-DAG: st.d [[R3]], 0($4)
    342 
    343   ret void
    344   ; CHECK: .size uge_v2f64
    345 }
    346 
    347 define void @ugt_v4f32(<4 x i32>* %c, <4 x float>* %a, <4 x float>* %b) nounwind {
    348   ; CHECK: ugt_v4f32:
    349 
    350   %1 = load <4 x float>, <4 x float>* %a
    351   ; CHECK-DAG: ld.w [[R1:\$w[0-9]+]], 0($5)
    352   %2 = load <4 x float>, <4 x float>* %b
    353   ; CHECK-DAG: ld.w [[R2:\$w[0-9]+]], 0($6)
    354   %3 = fcmp ugt <4 x float> %1, %2
    355   %4 = sext <4 x i1> %3 to <4 x i32>
    356   ; CHECK-DAG: fcult.w [[R3:\$w[0-9]+]], [[R2]], [[R1]]
    357   store <4 x i32> %4, <4 x i32>* %c
    358   ; CHECK-DAG: st.w [[R3]], 0($4)
    359 
    360   ret void
    361   ; CHECK: .size ugt_v4f32
    362 }
    363 
    364 define void @ugt_v2f64(<2 x i64>* %c, <2 x double>* %a, <2 x double>* %b) nounwind {
    365   ; CHECK: ugt_v2f64:
    366 
    367   %1 = load <2 x double>, <2 x double>* %a
    368   ; CHECK-DAG: ld.d [[R1:\$w[0-9]+]], 0($5)
    369   %2 = load <2 x double>, <2 x double>* %b
    370   ; CHECK-DAG: ld.d [[R2:\$w[0-9]+]], 0($6)
    371   %3 = fcmp ugt <2 x double> %1, %2
    372   %4 = sext <2 x i1> %3 to <2 x i64>
    373   ; CHECK-DAG: fcult.d [[R3:\$w[0-9]+]], [[R2]], [[R1]]
    374   store <2 x i64> %4, <2 x i64>* %c
    375   ; CHECK-DAG: st.d [[R3]], 0($4)
    376 
    377   ret void
    378   ; CHECK: .size ugt_v2f64
    379 }
    380 
    381 define void @ule_v4f32(<4 x i32>* %c, <4 x float>* %a, <4 x float>* %b) nounwind {
    382   ; CHECK: ule_v4f32:
    383 
    384   %1 = load <4 x float>, <4 x float>* %a
    385   ; CHECK-DAG: ld.w [[R1:\$w[0-9]+]], 0($5)
    386   %2 = load <4 x float>, <4 x float>* %b
    387   ; CHECK-DAG: ld.w [[R2:\$w[0-9]+]], 0($6)
    388   %3 = fcmp ule <4 x float> %1, %2
    389   %4 = sext <4 x i1> %3 to <4 x i32>
    390   ; CHECK-DAG: fcule.w [[R3:\$w[0-9]+]], [[R1]], [[R2]]
    391   store <4 x i32> %4, <4 x i32>* %c
    392   ; CHECK-DAG: st.w [[R3]], 0($4)
    393 
    394   ret void
    395   ; CHECK: .size ule_v4f32
    396 }
    397 
    398 define void @ule_v2f64(<2 x i64>* %c, <2 x double>* %a, <2 x double>* %b) nounwind {
    399   ; CHECK: ule_v2f64:
    400 
    401   %1 = load <2 x double>, <2 x double>* %a
    402   ; CHECK-DAG: ld.d [[R1:\$w[0-9]+]], 0($5)
    403   %2 = load <2 x double>, <2 x double>* %b
    404   ; CHECK-DAG: ld.d [[R2:\$w[0-9]+]], 0($6)
    405   %3 = fcmp ule <2 x double> %1, %2
    406   %4 = sext <2 x i1> %3 to <2 x i64>
    407   ; CHECK-DAG: fcule.d [[R3:\$w[0-9]+]], [[R1]], [[R2]]
    408   store <2 x i64> %4, <2 x i64>* %c
    409   ; CHECK-DAG: st.d [[R3]], 0($4)
    410 
    411   ret void
    412   ; CHECK: .size ule_v2f64
    413 }
    414 
    415 define void @ult_v4f32(<4 x i32>* %c, <4 x float>* %a, <4 x float>* %b) nounwind {
    416   ; CHECK: ult_v4f32:
    417 
    418   %1 = load <4 x float>, <4 x float>* %a
    419   ; CHECK-DAG: ld.w [[R1:\$w[0-9]+]], 0($5)
    420   %2 = load <4 x float>, <4 x float>* %b
    421   ; CHECK-DAG: ld.w [[R2:\$w[0-9]+]], 0($6)
    422   %3 = fcmp ult <4 x float> %1, %2
    423   %4 = sext <4 x i1> %3 to <4 x i32>
    424   ; CHECK-DAG: fcult.w [[R3:\$w[0-9]+]], [[R1]], [[R2]]
    425   store <4 x i32> %4, <4 x i32>* %c
    426   ; CHECK-DAG: st.w [[R3]], 0($4)
    427 
    428   ret void
    429   ; CHECK: .size ult_v4f32
    430 }
    431 
    432 define void @ult_v2f64(<2 x i64>* %c, <2 x double>* %a, <2 x double>* %b) nounwind {
    433   ; CHECK: ult_v2f64:
    434 
    435   %1 = load <2 x double>, <2 x double>* %a
    436   ; CHECK-DAG: ld.d [[R1:\$w[0-9]+]], 0($5)
    437   %2 = load <2 x double>, <2 x double>* %b
    438   ; CHECK-DAG: ld.d [[R2:\$w[0-9]+]], 0($6)
    439   %3 = fcmp ult <2 x double> %1, %2
    440   %4 = sext <2 x i1> %3 to <2 x i64>
    441   ; CHECK-DAG: fcult.d [[R3:\$w[0-9]+]], [[R1]], [[R2]]
    442   store <2 x i64> %4, <2 x i64>* %c
    443   ; CHECK-DAG: st.d [[R3]], 0($4)
    444 
    445   ret void
    446   ; CHECK: .size ult_v2f64
    447 }
    448 
    449 define void @uno_v4f32(<4 x i32>* %c, <4 x float>* %a, <4 x float>* %b) nounwind {
    450   ; CHECK: uno_v4f32:
    451 
    452   %1 = load <4 x float>, <4 x float>* %a
    453   ; CHECK-DAG: ld.w [[R1:\$w[0-9]+]], 0($5)
    454   %2 = load <4 x float>, <4 x float>* %b
    455   ; CHECK-DAG: ld.w [[R2:\$w[0-9]+]], 0($6)
    456   %3 = fcmp uno <4 x float> %1, %2
    457   %4 = sext <4 x i1> %3 to <4 x i32>
    458   ; CHECK-DAG: fcun.w [[R3:\$w[0-9]+]], [[R1]], [[R2]]
    459   store <4 x i32> %4, <4 x i32>* %c
    460   ; CHECK-DAG: st.w [[R3]], 0($4)
    461 
    462   ret void
    463   ; CHECK: .size uno_v4f32
    464 }
    465 
    466 define void @uno_v2f64(<2 x i64>* %c, <2 x double>* %a, <2 x double>* %b) nounwind {
    467   ; CHECK: uno_v2f64:
    468 
    469   %1 = load <2 x double>, <2 x double>* %a
    470   ; CHECK-DAG: ld.d [[R1:\$w[0-9]+]], 0($5)
    471   %2 = load <2 x double>, <2 x double>* %b
    472   ; CHECK-DAG: ld.d [[R2:\$w[0-9]+]], 0($6)
    473   %3 = fcmp uno <2 x double> %1, %2
    474   %4 = sext <2 x i1> %3 to <2 x i64>
    475   ; CHECK-DAG: fcun.d [[R3:\$w[0-9]+]], [[R1]], [[R2]]
    476   store <2 x i64> %4, <2 x i64>* %c
    477   ; CHECK-DAG: st.d [[R3]], 0($4)
    478 
    479   ret void
    480   ; CHECK: .size uno_v2f64
    481 }
    482 
    483 define void @true_v4f32(<4 x i32>* %c, <4 x float>* %a, <4 x float>* %b) nounwind {
    484   ; CHECK: true_v4f32:
    485 
    486   %1 = load <4 x float>, <4 x float>* %a
    487   %2 = load <4 x float>, <4 x float>* %b
    488   %3 = fcmp true <4 x float> %1, %2
    489   %4 = sext <4 x i1> %3 to <4 x i32>
    490   store <4 x i32> %4, <4 x i32>* %c
    491   ret void
    492 
    493   ; (setcc $a, $b, SETTRUE) is always folded, so we won't get fcaf:
    494   ; CHECK-DAG: ldi.b [[R1:\$w[0-9]+]], -1
    495   ; CHECK-DAG: st.w [[R1]], 0($4)
    496   ; CHECK: .size true_v4f32
    497 }
    498 
    499 define void @true_v2f64(<2 x i64>* %c, <2 x double>* %a, <2 x double>* %b) nounwind {
    500   ; CHECK: true_v2f64:
    501 
    502   %1 = load <2 x double>, <2 x double>* %a
    503   %2 = load <2 x double>, <2 x double>* %b
    504   %3 = fcmp true <2 x double> %1, %2
    505   %4 = sext <2 x i1> %3 to <2 x i64>
    506   store <2 x i64> %4, <2 x i64>* %c
    507   ret void
    508 
    509   ; (setcc $a, $b, SETTRUE) is always folded.
    510   ; CHECK-DAG: ldi.b [[R1:\$w[0-9]+]], -1
    511   ; CHECK-DAG: st.w [[R1]], 0($4)
    512   ; CHECK: .size true_v2f64
    513 }
    514 
    515 define void @bsel_v4f32(<4 x float>* %d, <4 x float>* %a, <4 x float>* %b,
    516                           <4 x float>* %c) nounwind {
    517   ; CHECK: bsel_v4f32:
    518 
    519   %1 = load <4 x float>, <4 x float>* %a
    520   ; CHECK-DAG: ld.w [[R1:\$w[0-9]+]], 0($5)
    521   %2 = load <4 x float>, <4 x float>* %b
    522   ; CHECK-DAG: ld.w [[R2:\$w[0-9]+]], 0($6)
    523   %3 = load <4 x float>, <4 x float>* %c
    524   ; CHECK-DAG: ld.w [[R3:\$w[0-9]+]], 0($7)
    525   %4 = fcmp ogt <4 x float> %1, %2
    526   ; CHECK-DAG: fclt.w [[R4:\$w[0-9]+]], [[R2]], [[R1]]
    527   %5 = select <4 x i1> %4, <4 x float> %1, <4 x float> %3
    528   ; Note that IfSet and IfClr are swapped since the condition is inverted
    529   ; CHECK-DAG: bsel.v [[R4]], [[R3]], [[R1]]
    530   store <4 x float> %5, <4 x float>* %d
    531   ; CHECK-DAG: st.w [[R4]], 0($4)
    532 
    533   ret void
    534   ; CHECK: .size bsel_v4f32
    535 }
    536 
    537 define void @bsel_v2f64(<2 x double>* %d, <2 x double>* %a, <2 x double>* %b,
    538                           <2 x double>* %c) nounwind {
    539   ; CHECK: bsel_v2f64:
    540 
    541   %1 = load <2 x double>, <2 x double>* %a
    542   ; CHECK-DAG: ld.d [[R1:\$w[0-9]+]], 0($5)
    543   %2 = load <2 x double>, <2 x double>* %b
    544   ; CHECK-DAG: ld.d [[R2:\$w[0-9]+]], 0($6)
    545   %3 = load <2 x double>, <2 x double>* %c
    546   ; CHECK-DAG: ld.d [[R3:\$w[0-9]+]], 0($7)
    547   %4 = fcmp ogt <2 x double> %1, %2
    548   ; CHECK-DAG: fclt.d [[R4:\$w[0-9]+]], [[R2]], [[R1]]
    549   %5 = select <2 x i1> %4, <2 x double> %1, <2 x double> %3
    550   ; Note that IfSet and IfClr are swapped since the condition is inverted
    551   ; CHECK-DAG: bsel.v [[R4]], [[R3]], [[R1]]
    552   store <2 x double> %5, <2 x double>* %d
    553   ; CHECK-DAG: st.d [[R4]], 0($4)
    554 
    555   ret void
    556   ; CHECK: .size bsel_v2f64
    557 }
    558 
    559 define void @bseli_v4f32(<4 x float>* %d, <4 x float>* %a, <4 x float>* %b,
    560                           <4 x float>* %c) nounwind {
    561   ; CHECK: bseli_v4f32:
    562 
    563   %1 = load <4 x float>, <4 x float>* %a
    564   ; CHECK-DAG: ld.w [[R1:\$w[0-9]+]], 0($5)
    565   %2 = load <4 x float>, <4 x float>* %b
    566   ; CHECK-DAG: ld.w [[R2:\$w[0-9]+]], 0($6)
    567   %3 = fcmp ogt <4 x float> %1, %2
    568   ; CHECK-DAG: fclt.w [[R4:\$w[0-9]+]], [[R2]], [[R1]]
    569   %4 = select <4 x i1> %3, <4 x float> %1, <4 x float> zeroinitializer
    570   ; Note that IfSet and IfClr are swapped since the condition is inverted
    571   ; CHECK-DAG: bsel.v [[R4]], [[R3:\$w[0-9]+]], [[R1]]
    572   store <4 x float> %4, <4 x float>* %d
    573   ; CHECK-DAG: st.w [[R4]], 0($4)
    574 
    575   ret void
    576   ; CHECK: .size bseli_v4f32
    577 }
    578 
    579 define void @bseli_v2f64(<2 x double>* %d, <2 x double>* %a, <2 x double>* %b,
    580                           <2 x double>* %c) nounwind {
    581   ; CHECK: bseli_v2f64:
    582 
    583   %1 = load <2 x double>, <2 x double>* %a
    584   ; CHECK-DAG: ld.d [[R1:\$w[0-9]+]], 0($5)
    585   %2 = load <2 x double>, <2 x double>* %b
    586   ; CHECK-DAG: ld.d [[R2:\$w[0-9]+]], 0($6)
    587   %3 = fcmp ogt <2 x double> %1, %2
    588   ; CHECK-DAG: fclt.d [[R4:\$w[0-9]+]], [[R2]], [[R1]]
    589   %4 = select <2 x i1> %3, <2 x double> %1, <2 x double> zeroinitializer
    590   ; Note that IfSet and IfClr are swapped since the condition is inverted
    591   ; CHECK-DAG: bsel.v [[R4]], [[R3:\$w[0-9]+]], [[R1]]
    592   store <2 x double> %4, <2 x double>* %d
    593   ; CHECK-DAG: st.d [[R4]], 0($4)
    594 
    595   ret void
    596   ; CHECK: .size bseli_v2f64
    597 }
    598 
    599 define void @max_v4f32(<4 x float>* %c, <4 x float>* %a, <4 x float>* %b) nounwind {
    600   ; CHECK: max_v4f32:
    601 
    602   %1 = load <4 x float>, <4 x float>* %a
    603   ; CHECK-DAG: ld.w [[R1:\$w[0-9]+]], 0($5)
    604   %2 = load <4 x float>, <4 x float>* %b
    605   ; CHECK-DAG: ld.w [[R2:\$w[0-9]+]], 0($6)
    606   %3 = tail call <4 x float> @llvm.mips.fmax.w(<4 x float> %1, <4 x float> %2)
    607   ; CHECK-DAG: fmax.w [[R3:\$w[0-9]+]], [[R1]], [[R2]]
    608   store <4 x float> %3, <4 x float>* %c
    609   ; CHECK-DAG: st.w [[R3]], 0($4)
    610 
    611   ret void
    612   ; CHECK: .size max_v4f32
    613 }
    614 
    615 define void @max_v2f64(<2 x double>* %c, <2 x double>* %a, <2 x double>* %b) nounwind {
    616   ; CHECK: max_v2f64:
    617 
    618   %1 = load <2 x double>, <2 x double>* %a
    619   ; CHECK-DAG: ld.d [[R1:\$w[0-9]+]], 0($5)
    620   %2 = load <2 x double>, <2 x double>* %b
    621   ; CHECK-DAG: ld.d [[R2:\$w[0-9]+]], 0($6)
    622   %3 = tail call <2 x double> @llvm.mips.fmax.d(<2 x double> %1, <2 x double> %2)
    623   ; CHECK-DAG: fmax.d [[R3:\$w[0-9]+]], [[R1]], [[R2]]
    624   store <2 x double> %3, <2 x double>* %c
    625   ; CHECK-DAG: st.d [[R3]], 0($4)
    626 
    627   ret void
    628   ; CHECK: .size max_v2f64
    629 }
    630 
    631 define void @min_v4f32(<4 x float>* %c, <4 x float>* %a, <4 x float>* %b) nounwind {
    632   ; CHECK: min_v4f32:
    633 
    634   %1 = load <4 x float>, <4 x float>* %a
    635   ; CHECK-DAG: ld.w [[R1:\$w[0-9]+]], 0($5)
    636   %2 = load <4 x float>, <4 x float>* %b
    637   ; CHECK-DAG: ld.w [[R2:\$w[0-9]+]], 0($6)
    638   %3 = tail call <4 x float> @llvm.mips.fmin.w(<4 x float> %1, <4 x float> %2)
    639   ; CHECK-DAG: fmin.w [[R3:\$w[0-9]+]], [[R1]], [[R2]]
    640   store <4 x float> %3, <4 x float>* %c
    641   ; CHECK-DAG: st.w [[R3]], 0($4)
    642 
    643   ret void
    644   ; CHECK: .size min_v4f32
    645 }
    646 
    647 define void @min_v2f64(<2 x double>* %c, <2 x double>* %a, <2 x double>* %b) nounwind {
    648   ; CHECK: min_v2f64:
    649 
    650   %1 = load <2 x double>, <2 x double>* %a
    651   ; CHECK-DAG: ld.d [[R1:\$w[0-9]+]], 0($5)
    652   %2 = load <2 x double>, <2 x double>* %b
    653   ; CHECK-DAG: ld.d [[R2:\$w[0-9]+]], 0($6)
    654   %3 = tail call <2 x double> @llvm.mips.fmin.d(<2 x double> %1, <2 x double> %2)
    655   ; CHECK-DAG: fmin.d [[R3:\$w[0-9]+]], [[R1]], [[R2]]
    656   store <2 x double> %3, <2 x double>* %c
    657   ; CHECK-DAG: st.d [[R3]], 0($4)
    658 
    659   ret void
    660   ; CHECK: .size min_v2f64
    661 }
    662