Home | History | Annotate | Download | only in NVPTX
      1 ; RUN: llc < %s -march=nvptx -mcpu=sm_20 | FileCheck %s
      2 ; RUN: llc < %s -march=nvptx64 -mcpu=sm_20 | FileCheck %s
      3 
      4 ;; These tests should run for all targets
      5 
      6 ;;===-- Basic instruction selection tests ---------------------------------===;;
      7 
      8 
      9 ;;; i64
     10 
     11 define i64 @icmp_eq_i64(i64 %a, i64 %b) {
     12 ; CHECK: setp.eq.s64 %p[[P0:[0-9]+]], %rd{{[0-9]+}}, %rd{{[0-9]+}}
     13 ; CHECK: selp.u64 %rd{{[0-9]+}}, 1, 0, %p[[P0]]
     14 ; CHECK: ret
     15   %cmp = icmp eq i64 %a, %b
     16   %ret = zext i1 %cmp to i64
     17   ret i64 %ret
     18 }
     19 
     20 define i64 @icmp_ne_i64(i64 %a, i64 %b) {
     21 ; CHECK: setp.ne.s64 %p[[P0:[0-9]+]], %rd{{[0-9]+}}, %rd{{[0-9]+}}
     22 ; CHECK: selp.u64 %rd{{[0-9]+}}, 1, 0, %p[[P0]]
     23 ; CHECK: ret
     24   %cmp = icmp ne i64 %a, %b
     25   %ret = zext i1 %cmp to i64
     26   ret i64 %ret
     27 }
     28 
     29 define i64 @icmp_ugt_i64(i64 %a, i64 %b) {
     30 ; CHECK: setp.gt.u64 %p[[P0:[0-9]+]], %rd{{[0-9]+}}, %rd{{[0-9]+}}
     31 ; CHECK: selp.u64 %rd{{[0-9]+}}, 1, 0, %p[[P0]]
     32 ; CHECK: ret
     33   %cmp = icmp ugt i64 %a, %b
     34   %ret = zext i1 %cmp to i64
     35   ret i64 %ret
     36 }
     37 
     38 define i64 @icmp_uge_i64(i64 %a, i64 %b) {
     39 ; CHECK: setp.ge.u64 %p[[P0:[0-9]+]], %rd{{[0-9]+}}, %rd{{[0-9]+}}
     40 ; CHECK: selp.u64 %rd{{[0-9]+}}, 1, 0, %p[[P0]]
     41 ; CHECK: ret
     42   %cmp = icmp uge i64 %a, %b
     43   %ret = zext i1 %cmp to i64
     44   ret i64 %ret
     45 }
     46 
     47 define i64 @icmp_ult_i64(i64 %a, i64 %b) {
     48 ; CHECK: setp.lt.u64 %p[[P0:[0-9]+]], %rd{{[0-9]+}}, %rd{{[0-9]+}}
     49 ; CHECK: selp.u64 %rd{{[0-9]+}}, 1, 0, %p[[P0]]
     50 ; CHECK: ret
     51   %cmp = icmp ult i64 %a, %b
     52   %ret = zext i1 %cmp to i64
     53   ret i64 %ret
     54 }
     55 
     56 define i64 @icmp_ule_i64(i64 %a, i64 %b) {
     57 ; CHECK: setp.le.u64 %p[[P0:[0-9]+]], %rd{{[0-9]+}}, %rd{{[0-9]+}}
     58 ; CHECK: selp.u64 %rd{{[0-9]+}}, 1, 0, %p[[P0]]
     59 ; CHECK: ret
     60   %cmp = icmp ule i64 %a, %b
     61   %ret = zext i1 %cmp to i64
     62   ret i64 %ret
     63 }
     64 
     65 define i64 @icmp_sgt_i64(i64 %a, i64 %b) {
     66 ; CHECK: setp.gt.s64 %p[[P0:[0-9]+]], %rd{{[0-9]+}}, %rd{{[0-9]+}}
     67 ; CHECK: selp.u64 %rd{{[0-9]+}}, 1, 0, %p[[P0]]
     68 ; CHECK: ret
     69   %cmp = icmp sgt i64 %a, %b
     70   %ret = zext i1 %cmp to i64
     71   ret i64 %ret
     72 }
     73 
     74 define i64 @icmp_sge_i64(i64 %a, i64 %b) {
     75 ; CHECK: setp.ge.s64 %p[[P0:[0-9]+]], %rd{{[0-9]+}}, %rd{{[0-9]+}}
     76 ; CHECK: selp.u64 %rd{{[0-9]+}}, 1, 0, %p[[P0]]
     77 ; CHECK: ret
     78   %cmp = icmp sge i64 %a, %b
     79   %ret = zext i1 %cmp to i64
     80   ret i64 %ret
     81 }
     82 
     83 define i64 @icmp_slt_i64(i64 %a, i64 %b) {
     84 ; CHECK: setp.lt.s64 %p[[P0:[0-9]+]], %rd{{[0-9]+}}, %rd{{[0-9]+}}
     85 ; CHECK: selp.u64 %rd{{[0-9]+}}, 1, 0, %p[[P0]]
     86 ; CHECK: ret
     87   %cmp = icmp slt i64 %a, %b
     88   %ret = zext i1 %cmp to i64
     89   ret i64 %ret
     90 }
     91 
     92 define i64 @icmp_sle_i64(i64 %a, i64 %b) {
     93 ; CHECK: setp.le.s64 %p[[P0:[0-9]+]], %rd{{[0-9]+}}, %rd{{[0-9]+}}
     94 ; CHECK: selp.u64 %rd{{[0-9]+}}, 1, 0, %p[[P0]]
     95 ; CHECK: ret
     96   %cmp = icmp sle i64 %a, %b
     97   %ret = zext i1 %cmp to i64
     98   ret i64 %ret
     99 }
    100 
    101 ;;; i32
    102 
    103 define i32 @icmp_eq_i32(i32 %a, i32 %b) {
    104 ; CHECK: setp.eq.s32 %p[[P0:[0-9]+]], %r{{[0-9]+}}, %r{{[0-9]+}}
    105 ; CHECK: selp.u32 %r{{[0-9]+}}, 1, 0, %p[[P0]]
    106 ; CHECK: ret
    107   %cmp = icmp eq i32 %a, %b
    108   %ret = zext i1 %cmp to i32
    109   ret i32 %ret
    110 }
    111 
    112 define i32 @icmp_ne_i32(i32 %a, i32 %b) {
    113 ; CHECK: setp.ne.s32 %p[[P0:[0-9]+]], %r{{[0-9]+}}, %r{{[0-9]+}}
    114 ; CHECK: selp.u32 %r{{[0-9]+}}, 1, 0, %p[[P0]]
    115 ; CHECK: ret
    116   %cmp = icmp ne i32 %a, %b
    117   %ret = zext i1 %cmp to i32
    118   ret i32 %ret
    119 }
    120 
    121 define i32 @icmp_ugt_i32(i32 %a, i32 %b) {
    122 ; CHECK: setp.gt.u32 %p[[P0:[0-9]+]], %r{{[0-9]+}}, %r{{[0-9]+}}
    123 ; CHECK: selp.u32 %r{{[0-9]+}}, 1, 0, %p[[P0]]
    124 ; CHECK: ret
    125   %cmp = icmp ugt i32 %a, %b
    126   %ret = zext i1 %cmp to i32
    127   ret i32 %ret
    128 }
    129 
    130 define i32 @icmp_uge_i32(i32 %a, i32 %b) {
    131 ; CHECK: setp.ge.u32 %p[[P0:[0-9]+]], %r{{[0-9]+}}, %r{{[0-9]+}}
    132 ; CHECK: selp.u32 %r{{[0-9]+}}, 1, 0, %p[[P0]]
    133 ; CHECK: ret
    134   %cmp = icmp uge i32 %a, %b
    135   %ret = zext i1 %cmp to i32
    136   ret i32 %ret
    137 }
    138 
    139 define i32 @icmp_ult_i32(i32 %a, i32 %b) {
    140 ; CHECK: setp.lt.u32 %p[[P0:[0-9]+]], %r{{[0-9]+}}, %r{{[0-9]+}}
    141 ; CHECK: selp.u32 %r{{[0-9]+}}, 1, 0, %p[[P0]]
    142 ; CHECK: ret
    143   %cmp = icmp ult i32 %a, %b
    144   %ret = zext i1 %cmp to i32
    145   ret i32 %ret
    146 }
    147 
    148 define i32 @icmp_ule_i32(i32 %a, i32 %b) {
    149 ; CHECK: setp.le.u32 %p[[P0:[0-9]+]], %r{{[0-9]+}}, %r{{[0-9]+}}
    150 ; CHECK: selp.u32 %r{{[0-9]+}}, 1, 0, %p[[P0]]
    151 ; CHECK: ret
    152   %cmp = icmp ule i32 %a, %b
    153   %ret = zext i1 %cmp to i32
    154   ret i32 %ret
    155 }
    156 
    157 define i32 @icmp_sgt_i32(i32 %a, i32 %b) {
    158 ; CHECK: setp.gt.s32 %p[[P0:[0-9]+]], %r{{[0-9]+}}, %r{{[0-9]+}}
    159 ; CHECK: selp.u32 %r{{[0-9]+}}, 1, 0, %p[[P0]]
    160 ; CHECK: ret
    161   %cmp = icmp sgt i32 %a, %b
    162   %ret = zext i1 %cmp to i32
    163   ret i32 %ret
    164 }
    165 
    166 define i32 @icmp_sge_i32(i32 %a, i32 %b) {
    167 ; CHECK: setp.ge.s32 %p[[P0:[0-9]+]], %r{{[0-9]+}}, %r{{[0-9]+}}
    168 ; CHECK: selp.u32 %r{{[0-9]+}}, 1, 0, %p[[P0]]
    169 ; CHECK: ret
    170   %cmp = icmp sge i32 %a, %b
    171   %ret = zext i1 %cmp to i32
    172   ret i32 %ret
    173 }
    174 
    175 define i32 @icmp_slt_i32(i32 %a, i32 %b) {
    176 ; CHECK: setp.lt.s32 %p[[P0:[0-9]+]], %r{{[0-9]+}}, %r{{[0-9]+}}
    177 ; CHECK: selp.u32 %r{{[0-9]+}}, 1, 0, %p[[P0]]
    178 ; CHECK: ret
    179   %cmp = icmp slt i32 %a, %b
    180   %ret = zext i1 %cmp to i32
    181   ret i32 %ret
    182 }
    183 
    184 define i32 @icmp_sle_i32(i32 %a, i32 %b) {
    185 ; CHECK: setp.le.s32 %p[[P0:[0-9]+]], %r{{[0-9]+}}, %r{{[0-9]+}}
    186 ; CHECK: selp.u32 %r{{[0-9]+}}, 1, 0, %p[[P0]]
    187 ; CHECK: ret
    188   %cmp = icmp sle i32 %a, %b
    189   %ret = zext i1 %cmp to i32
    190   ret i32 %ret
    191 }
    192 
    193 
    194 ;;; i16
    195 
    196 define i16 @icmp_eq_i16(i16 %a, i16 %b) {
    197 ; CHECK: setp.eq.s16 %p[[P0:[0-9]+]], %rs{{[0-9]+}}, %rs{{[0-9]+}}
    198 ; CHECK: selp.u32 %r{{[0-9]+}}, 1, 0, %p[[P0]]
    199 ; CHECK: ret
    200   %cmp = icmp eq i16 %a, %b
    201   %ret = zext i1 %cmp to i16
    202   ret i16 %ret
    203 }
    204 
    205 define i16 @icmp_ne_i16(i16 %a, i16 %b) {
    206 ; CHECK: setp.ne.s16 %p[[P0:[0-9]+]], %rs{{[0-9]+}}, %rs{{[0-9]+}}
    207 ; CHECK: selp.u32 %r{{[0-9]+}}, 1, 0, %p[[P0]]
    208 ; CHECK: ret
    209   %cmp = icmp ne i16 %a, %b
    210   %ret = zext i1 %cmp to i16
    211   ret i16 %ret
    212 }
    213 
    214 define i16 @icmp_ugt_i16(i16 %a, i16 %b) {
    215 ; CHECK: setp.gt.u16 %p[[P0:[0-9]+]], %rs{{[0-9]+}}, %rs{{[0-9]+}}
    216 ; CHECK: selp.u32 %r{{[0-9]+}}, 1, 0, %p[[P0]]
    217 ; CHECK: ret
    218   %cmp = icmp ugt i16 %a, %b
    219   %ret = zext i1 %cmp to i16
    220   ret i16 %ret
    221 }
    222 
    223 define i16 @icmp_uge_i16(i16 %a, i16 %b) {
    224 ; CHECK: setp.ge.u16 %p[[P0:[0-9]+]], %rs{{[0-9]+}}, %rs{{[0-9]+}}
    225 ; CHECK: selp.u32 %r{{[0-9]+}}, 1, 0, %p[[P0]]
    226 ; CHECK: ret
    227   %cmp = icmp uge i16 %a, %b
    228   %ret = zext i1 %cmp to i16
    229   ret i16 %ret
    230 }
    231 
    232 define i16 @icmp_ult_i16(i16 %a, i16 %b) {
    233 ; CHECK: setp.lt.u16 %p[[P0:[0-9]+]], %rs{{[0-9]+}}, %rs{{[0-9]+}}
    234 ; CHECK: selp.u32 %r{{[0-9]+}}, 1, 0, %p[[P0]]
    235 ; CHECK: ret
    236   %cmp = icmp ult i16 %a, %b
    237   %ret = zext i1 %cmp to i16
    238   ret i16 %ret
    239 }
    240 
    241 define i16 @icmp_ule_i16(i16 %a, i16 %b) {
    242 ; CHECK: setp.le.u16 %p[[P0:[0-9]+]], %rs{{[0-9]+}}, %rs{{[0-9]+}}
    243 ; CHECK: selp.u32 %r{{[0-9]+}}, 1, 0, %p[[P0]]
    244 ; CHECK: ret
    245   %cmp = icmp ule i16 %a, %b
    246   %ret = zext i1 %cmp to i16
    247   ret i16 %ret
    248 }
    249 
    250 define i16 @icmp_sgt_i16(i16 %a, i16 %b) {
    251 ; CHECK: setp.gt.s16 %p[[P0:[0-9]+]], %rs{{[0-9]+}}, %rs{{[0-9]+}}
    252 ; CHECK: selp.u32 %r{{[0-9]+}}, 1, 0, %p[[P0]]
    253 ; CHECK: ret
    254   %cmp = icmp sgt i16 %a, %b
    255   %ret = zext i1 %cmp to i16
    256   ret i16 %ret
    257 }
    258 
    259 define i16 @icmp_sge_i16(i16 %a, i16 %b) {
    260 ; CHECK: setp.ge.s16 %p[[P0:[0-9]+]], %rs{{[0-9]+}}, %rs{{[0-9]+}}
    261 ; CHECK: selp.u32 %r{{[0-9]+}}, 1, 0, %p[[P0]]
    262 ; CHECK: ret
    263   %cmp = icmp sge i16 %a, %b
    264   %ret = zext i1 %cmp to i16
    265   ret i16 %ret
    266 }
    267 
    268 define i16 @icmp_slt_i16(i16 %a, i16 %b) {
    269 ; CHECK: setp.lt.s16 %p[[P0:[0-9]+]], %rs{{[0-9]+}}, %rs{{[0-9]+}}
    270 ; CHECK: selp.u32 %r{{[0-9]+}}, 1, 0, %p[[P0]]
    271 ; CHECK: ret
    272   %cmp = icmp slt i16 %a, %b
    273   %ret = zext i1 %cmp to i16
    274   ret i16 %ret
    275 }
    276 
    277 define i16 @icmp_sle_i16(i16 %a, i16 %b) {
    278 ; CHECK: setp.le.s16 %p[[P0:[0-9]+]], %rs{{[0-9]+}}, %rs{{[0-9]+}}
    279 ; CHECK: selp.u32 %r{{[0-9]+}}, 1, 0, %p[[P0]]
    280 ; CHECK: ret
    281   %cmp = icmp sle i16 %a, %b
    282   %ret = zext i1 %cmp to i16
    283   ret i16 %ret
    284 }
    285 
    286 
    287 ;;; i8
    288 
    289 define i8 @icmp_eq_i8(i8 %a, i8 %b) {
    290 ; Comparison happens in 16-bit
    291 ; CHECK: setp.eq.s16 %p[[P0:[0-9]+]], %rs{{[0-9]+}}, %rs{{[0-9]+}}
    292 ; CHECK: selp.u32 %r{{[0-9]+}}, 1, 0, %p[[P0]]
    293 ; CHECK: ret
    294   %cmp = icmp eq i8 %a, %b
    295   %ret = zext i1 %cmp to i8
    296   ret i8 %ret
    297 }
    298 
    299 define i8 @icmp_ne_i8(i8 %a, i8 %b) {
    300 ; Comparison happens in 16-bit
    301 ; CHECK: setp.ne.s16 %p[[P0:[0-9]+]], %rs{{[0-9]+}}, %rs{{[0-9]+}}
    302 ; CHECK: selp.u32 %r{{[0-9]+}}, 1, 0, %p[[P0]]
    303 ; CHECK: ret
    304   %cmp = icmp ne i8 %a, %b
    305   %ret = zext i1 %cmp to i8
    306   ret i8 %ret
    307 }
    308 
    309 define i8 @icmp_ugt_i8(i8 %a, i8 %b) {
    310 ; Comparison happens in 16-bit
    311 ; CHECK: setp.gt.u16 %p[[P0:[0-9]+]], %rs{{[0-9]+}}, %rs{{[0-9]+}}
    312 ; CHECK: selp.u32 %r{{[0-9]+}}, 1, 0, %p[[P0]]
    313 ; CHECK: ret
    314   %cmp = icmp ugt i8 %a, %b
    315   %ret = zext i1 %cmp to i8
    316   ret i8 %ret
    317 }
    318 
    319 define i8 @icmp_uge_i8(i8 %a, i8 %b) {
    320 ; Comparison happens in 16-bit
    321 ; CHECK: setp.ge.u16 %p[[P0:[0-9]+]], %rs{{[0-9]+}}, %rs{{[0-9]+}}
    322 ; CHECK: selp.u32 %r{{[0-9]+}}, 1, 0, %p[[P0]]
    323 ; CHECK: ret
    324   %cmp = icmp uge i8 %a, %b
    325   %ret = zext i1 %cmp to i8
    326   ret i8 %ret
    327 }
    328 
    329 define i8 @icmp_ult_i8(i8 %a, i8 %b) {
    330 ; Comparison happens in 16-bit
    331 ; CHECK: setp.lt.u16 %p[[P0:[0-9]+]], %rs{{[0-9]+}}, %rs{{[0-9]+}}
    332 ; CHECK: selp.u32 %r{{[0-9]+}}, 1, 0, %p[[P0]]
    333 ; CHECK: ret
    334   %cmp = icmp ult i8 %a, %b
    335   %ret = zext i1 %cmp to i8
    336   ret i8 %ret
    337 }
    338 
    339 define i8 @icmp_ule_i8(i8 %a, i8 %b) {
    340 ; Comparison happens in 16-bit
    341 ; CHECK: setp.le.u16 %p[[P0:[0-9]+]], %rs{{[0-9]+}}, %rs{{[0-9]+}}
    342 ; CHECK: selp.u32 %r{{[0-9]+}}, 1, 0, %p[[P0]]
    343 ; CHECK: ret
    344   %cmp = icmp ule i8 %a, %b
    345   %ret = zext i1 %cmp to i8
    346   ret i8 %ret
    347 }
    348 
    349 define i8 @icmp_sgt_i8(i8 %a, i8 %b) {
    350 ; Comparison happens in 16-bit
    351 ; CHECK: setp.gt.s16 %p[[P0:[0-9]+]], %rs{{[0-9]+}}, %rs{{[0-9]+}}
    352 ; CHECK: selp.u32 %r{{[0-9]+}}, 1, 0, %p[[P0]]
    353 ; CHECK: ret
    354   %cmp = icmp sgt i8 %a, %b
    355   %ret = zext i1 %cmp to i8
    356   ret i8 %ret
    357 }
    358 
    359 define i8 @icmp_sge_i8(i8 %a, i8 %b) {
    360 ; Comparison happens in 16-bit
    361 ; CHECK: setp.ge.s16 %p[[P0:[0-9]+]], %rs{{[0-9]+}}, %rs{{[0-9]+}}
    362 ; CHECK: selp.u32 %r{{[0-9]+}}, 1, 0, %p[[P0]]
    363 ; CHECK: ret
    364   %cmp = icmp sge i8 %a, %b
    365   %ret = zext i1 %cmp to i8
    366   ret i8 %ret
    367 }
    368 
    369 define i8 @icmp_slt_i8(i8 %a, i8 %b) {
    370 ; Comparison happens in 16-bit
    371 ; CHECK: setp.lt.s16 %p[[P0:[0-9]+]], %rs{{[0-9]+}}, %rs{{[0-9]+}}
    372 ; CHECK: selp.u32 %r{{[0-9]+}}, 1, 0, %p[[P0]]
    373 ; CHECK: ret
    374   %cmp = icmp slt i8 %a, %b
    375   %ret = zext i1 %cmp to i8
    376   ret i8 %ret
    377 }
    378 
    379 define i8 @icmp_sle_i8(i8 %a, i8 %b) {
    380 ; Comparison happens in 16-bit
    381 ; CHECK: setp.le.s16 %p[[P0:[0-9]+]], %rs{{[0-9]+}}, %rs{{[0-9]+}}
    382 ; CHECK: selp.u32 %r{{[0-9]+}}, 1, 0, %p[[P0]]
    383 ; CHECK: ret
    384   %cmp = icmp sle i8 %a, %b
    385   %ret = zext i1 %cmp to i8
    386   ret i8 %ret
    387 }
    388