Home | History | Annotate | Download | only in SystemZ
      1 ; Test 16-bit atomic min/max operations.
      2 ;
      3 ; RUN: llc < %s -mtriple=s390x-linux-gnu | FileCheck %s -check-prefix=CHECK
      4 ; RUN: llc < %s -mtriple=s390x-linux-gnu | FileCheck %s -check-prefix=CHECK-SHIFT1
      5 ; RUN: llc < %s -mtriple=s390x-linux-gnu | FileCheck %s -check-prefix=CHECK-SHIFT2
      6 
      7 ; Check signed minimum: atomicrmw min on an i16 is expected to become a compare-and-swap (cs) retry loop.
      8 ; - CHECK is for the main loop.
      9 ; - CHECK-SHIFT1 makes sure that the negated shift count used by the second
     10 ;   RLL is set up correctly.  The negation is independent of the NILL and L
     11 ;   tested in CHECK.
     12 ; - CHECK-SHIFT2 makes sure that %b is shifted into the high part of the word
     13 ;   before being used, and that the low bits are set to 1.  This sequence is
     14 ;   independent of the other loop prologue instructions.
     15 define i16 @f1(i16 *%src, i16 %b) {
     16 ; CHECK-LABEL: f1:
     17 ; CHECK: sllg [[SHIFT:%r[1-9]+]], %r2, 3
     18 ; CHECK: nill %r2, 65532
     19 ; CHECK: l [[OLD:%r[0-9]+]], 0(%r2)
     20 ; CHECK: [[LOOP:\.[^:]*]]:
     21 ; CHECK: rll [[ROT:%r[0-9]+]], [[OLD]], 0([[SHIFT]])
     22 ; CHECK: crjle [[ROT]], %r3, [[KEEP:\..*]]
     23 ; CHECK: risbg [[ROT]], %r3, 32, 47, 0
     24 ; CHECK: [[KEEP]]:
     25 ; CHECK: rll [[NEW:%r[0-9]+]], [[ROT]], 0({{%r[1-9]+}})
     26 ; CHECK: cs [[OLD]], [[NEW]], 0(%r2)
     27 ; CHECK: jl [[LOOP]]
     28 ; CHECK: rll %r2, [[OLD]], 16([[SHIFT]])
     29 ; CHECK: br %r14
     30 ;
     31 ; CHECK-SHIFT1-LABEL: f1:
     32 ; CHECK-SHIFT1: sllg [[SHIFT:%r[1-9]+]], %r2, 3
     33 ; CHECK-SHIFT1: lcr [[NEGSHIFT:%r[1-9]+]], [[SHIFT]]
     34 ; CHECK-SHIFT1: rll
     35 ; CHECK-SHIFT1: rll {{%r[0-9]+}}, {{%r[0-9]+}}, 0([[NEGSHIFT]])
     36 ; CHECK-SHIFT1: rll
     37 ; CHECK-SHIFT1: br %r14
     38 ;
     39 ; CHECK-SHIFT2-LABEL: f1:
     40 ; CHECK-SHIFT2: sll %r3, 16
     41 ; CHECK-SHIFT2: rll
     42 ; CHECK-SHIFT2: crjle {{%r[0-9]+}}, %r3
     43 ; CHECK-SHIFT2: rll
     44 ; CHECK-SHIFT2: rll
     45 ; CHECK-SHIFT2: br %r14
     46   %res = atomicrmw min i16 *%src, i16 %b seq_cst
     47   ret i16 %res
     48 }
     49 
     50 ; Check signed maximum: same checks as f1, except the branch that keeps the old value is crjhe instead of crjle.
     51 define i16 @f2(i16 *%src, i16 %b) {
     52 ; CHECK-LABEL: f2:
     53 ; CHECK: sllg [[SHIFT:%r[1-9]+]], %r2, 3
     54 ; CHECK: nill %r2, 65532
     55 ; CHECK: l [[OLD:%r[0-9]+]], 0(%r2)
     56 ; CHECK: [[LOOP:\.[^:]*]]:
     57 ; CHECK: rll [[ROT:%r[0-9]+]], [[OLD]], 0([[SHIFT]])
     58 ; CHECK: crjhe [[ROT]], %r3, [[KEEP:\..*]]
     59 ; CHECK: risbg [[ROT]], %r3, 32, 47, 0
     60 ; CHECK: [[KEEP]]:
     61 ; CHECK: rll [[NEW:%r[0-9]+]], [[ROT]], 0({{%r[1-9]+}})
     62 ; CHECK: cs [[OLD]], [[NEW]], 0(%r2)
     63 ; CHECK: jl [[LOOP]]
     64 ; CHECK: rll %r2, [[OLD]], 16([[SHIFT]])
     65 ; CHECK: br %r14
     66 ;
     67 ; CHECK-SHIFT1-LABEL: f2:
     68 ; CHECK-SHIFT1: sllg [[SHIFT:%r[1-9]+]], %r2, 3
     69 ; CHECK-SHIFT1: lcr [[NEGSHIFT:%r[1-9]+]], [[SHIFT]]
     70 ; CHECK-SHIFT1: rll
     71 ; CHECK-SHIFT1: rll {{%r[0-9]+}}, {{%r[0-9]+}}, 0([[NEGSHIFT]])
     72 ; CHECK-SHIFT1: rll
     73 ; CHECK-SHIFT1: br %r14
     74 ;
     75 ; CHECK-SHIFT2-LABEL: f2:
     76 ; CHECK-SHIFT2: sll %r3, 16
     77 ; CHECK-SHIFT2: rll
     78 ; CHECK-SHIFT2: crjhe {{%r[0-9]+}}, %r3
     79 ; CHECK-SHIFT2: rll
     80 ; CHECK-SHIFT2: rll
     81 ; CHECK-SHIFT2: br %r14
     82   %res = atomicrmw max i16 *%src, i16 %b seq_cst
     83   ret i16 %res
     84 }
     85 
     86 ; Check unsigned minimum: the comparison is expected as a logical compare (clr) followed by jle.
     87 define i16 @f3(i16 *%src, i16 %b) {
     88 ; CHECK-LABEL: f3:
     89 ; CHECK: sllg [[SHIFT:%r[1-9]+]], %r2, 3
     90 ; CHECK: nill %r2, 65532
     91 ; CHECK: l [[OLD:%r[0-9]+]], 0(%r2)
     92 ; CHECK: [[LOOP:\.[^:]*]]:
     93 ; CHECK: rll [[ROT:%r[0-9]+]], [[OLD]], 0([[SHIFT]])
     94 ; CHECK: clr [[ROT]], %r3
     95 ; CHECK: jle [[KEEP:\..*]]
     96 ; CHECK: risbg [[ROT]], %r3, 32, 47, 0
     97 ; CHECK: [[KEEP]]:
     98 ; CHECK: rll [[NEW:%r[0-9]+]], [[ROT]], 0({{%r[1-9]+}})
     99 ; CHECK: cs [[OLD]], [[NEW]], 0(%r2)
    100 ; CHECK: jl [[LOOP]]
    101 ; CHECK: rll %r2, [[OLD]], 16([[SHIFT]])
    102 ; CHECK: br %r14
    103 ;
    104 ; CHECK-SHIFT1-LABEL: f3:
    105 ; CHECK-SHIFT1: sllg [[SHIFT:%r[1-9]+]], %r2, 3
    106 ; CHECK-SHIFT1: lcr [[NEGSHIFT:%r[1-9]+]], [[SHIFT]]
    107 ; CHECK-SHIFT1: rll
    108 ; CHECK-SHIFT1: rll {{%r[0-9]+}}, {{%r[0-9]+}}, 0([[NEGSHIFT]])
    109 ; CHECK-SHIFT1: rll
    110 ; CHECK-SHIFT1: br %r14
    111 ;
    112 ; CHECK-SHIFT2-LABEL: f3:
    113 ; CHECK-SHIFT2: sll %r3, 16
    114 ; CHECK-SHIFT2: rll
    115 ; CHECK-SHIFT2: clr {{%r[0-9]+}}, %r3
    116 ; CHECK-SHIFT2: rll
    117 ; CHECK-SHIFT2: rll
    118 ; CHECK-SHIFT2: br %r14
    119   %res = atomicrmw umin i16 *%src, i16 %b seq_cst
    120   ret i16 %res
    121 }
    122 
    123 ; Check unsigned maximum: the comparison is expected as a logical compare (clr) followed by jhe.
    124 define i16 @f4(i16 *%src, i16 %b) {
    125 ; CHECK-LABEL: f4:
    126 ; CHECK: sllg [[SHIFT:%r[1-9]+]], %r2, 3
    127 ; CHECK: nill %r2, 65532
    128 ; CHECK: l [[OLD:%r[0-9]+]], 0(%r2)
    129 ; CHECK: [[LOOP:\.[^:]*]]:
    130 ; CHECK: rll [[ROT:%r[0-9]+]], [[OLD]], 0([[SHIFT]])
    131 ; CHECK: clr [[ROT]], %r3
    132 ; CHECK: jhe [[KEEP:\..*]]
    133 ; CHECK: risbg [[ROT]], %r3, 32, 47, 0
    134 ; CHECK: [[KEEP]]:
    135 ; CHECK: rll [[NEW:%r[0-9]+]], [[ROT]], 0({{%r[1-9]+}})
    136 ; CHECK: cs [[OLD]], [[NEW]], 0(%r2)
    137 ; CHECK: jl [[LOOP]]
    138 ; CHECK: rll %r2, [[OLD]], 16([[SHIFT]])
    139 ; CHECK: br %r14
    140 ;
    141 ; CHECK-SHIFT1-LABEL: f4:
    142 ; CHECK-SHIFT1: sllg [[SHIFT:%r[1-9]+]], %r2, 3
    143 ; CHECK-SHIFT1: lcr [[NEGSHIFT:%r[1-9]+]], [[SHIFT]]
    144 ; CHECK-SHIFT1: rll
    145 ; CHECK-SHIFT1: rll {{%r[0-9]+}}, {{%r[0-9]+}}, 0([[NEGSHIFT]])
    146 ; CHECK-SHIFT1: rll
    147 ; CHECK-SHIFT1: br %r14
    148 ;
    149 ; CHECK-SHIFT2-LABEL: f4:
    150 ; CHECK-SHIFT2: sll %r3, 16
    151 ; CHECK-SHIFT2: rll
    152 ; CHECK-SHIFT2: clr {{%r[0-9]+}}, %r3
    153 ; CHECK-SHIFT2: rll
    154 ; CHECK-SHIFT2: rll
    155 ; CHECK-SHIFT2: br %r14
    156   %res = atomicrmw umax i16 *%src, i16 %b seq_cst
    157   ret i16 %res
    158 }
    159 
    160 ; Check the lowest useful signed minimum value.  We need to load 0x80010000
    161 ; into the source register (-32767 is 0x8001 as an i16, matched as llilh 32769).
    162 define i16 @f5(i16 *%src) {
    163 ; CHECK-LABEL: f5:
    164 ; CHECK: llilh [[SRC2:%r[0-9]+]], 32769
    165 ; CHECK: crjle [[ROT:%r[0-9]+]], [[SRC2]]
    166 ; CHECK: risbg [[ROT]], [[SRC2]], 32, 47, 0
    167 ; CHECK: br %r14
    168 ;
    169 ; CHECK-SHIFT1-LABEL: f5:
    170 ; CHECK-SHIFT1: br %r14
    171 ; CHECK-SHIFT2-LABEL: f5:
    172 ; CHECK-SHIFT2: br %r14
    173   %res = atomicrmw min i16 *%src, i16 -32767 seq_cst
    174   ret i16 %res
    175 }
    176 
    177 ; Check the highest useful signed maximum value.  We need to load 0x7ffe0000
    178 ; into the source register (32766 is 0x7ffe, matched as llilh 32766).
    179 define i16 @f6(i16 *%src) {
    180 ; CHECK-LABEL: f6:
    181 ; CHECK: llilh [[SRC2:%r[0-9]+]], 32766
    182 ; CHECK: crjhe [[ROT:%r[0-9]+]], [[SRC2]]
    183 ; CHECK: risbg [[ROT]], [[SRC2]], 32, 47, 0
    184 ; CHECK: br %r14
    185 ;
    186 ; CHECK-SHIFT1-LABEL: f6:
    187 ; CHECK-SHIFT1: br %r14
    188 ; CHECK-SHIFT2-LABEL: f6:
    189 ; CHECK-SHIFT2: br %r14
    190   %res = atomicrmw max i16 *%src, i16 32766 seq_cst
    191   ret i16 %res
    192 }
    193 
    194 ; Check the lowest useful unsigned minimum value.  We need to load 0x00010000
    195 ; into the source register (the umin operand 1, matched as llilh 1).
    196 define i16 @f7(i16 *%src) {
    197 ; CHECK-LABEL: f7:
    198 ; CHECK: llilh [[SRC2:%r[0-9]+]], 1
    199 ; CHECK: clr [[ROT:%r[0-9]+]], [[SRC2]]
    200 ; CHECK: risbg [[ROT]], [[SRC2]], 32, 47, 0
    201 ; CHECK: br %r14
    202 ;
    203 ; CHECK-SHIFT1-LABEL: f7:
    204 ; CHECK-SHIFT1: br %r14
    205 ; CHECK-SHIFT2-LABEL: f7:
    206 ; CHECK-SHIFT2: br %r14
    207   %res = atomicrmw umin i16 *%src, i16 1 seq_cst
    208   ret i16 %res
    209 }
    210 
    211 ; Check the highest useful unsigned maximum value.  We need to load 0xfffe0000
    212 ; into the source register (65534 is 0xfffe, matched as llilh 65534).
    213 define i16 @f8(i16 *%src) {
    214 ; CHECK-LABEL: f8:
    215 ; CHECK: llilh [[SRC2:%r[0-9]+]], 65534
    216 ; CHECK: clr [[ROT:%r[0-9]+]], [[SRC2]]
    217 ; CHECK: risbg [[ROT]], [[SRC2]], 32, 47, 0
    218 ; CHECK: br %r14
    219 ;
    220 ; CHECK-SHIFT1-LABEL: f8:
    221 ; CHECK-SHIFT1: br %r14
    222 ; CHECK-SHIFT2-LABEL: f8:
    223 ; CHECK-SHIFT2: br %r14
    224   %res = atomicrmw umax i16 *%src, i16 65534 seq_cst
    225   ret i16 %res
    226 }
    227