Home | History | Annotate | Download | only in AArch64
      1 ; RUN: llc -verify-machineinstrs < %s -mtriple=aarch64-none-linux-gnu | FileCheck %s
        ; Code-generation test: the functions below feed constant shifts into add, sub
        ; and integer compares, and the FileCheck patterns look for those shifts as
        ; shifted-register operands (lsl/lsr/asr #imm) in the llc output.
      2 
        ; Globals that the test functions access with volatile loads and stores.
      3 @var32 = global i32 0
      4 @var64 = global i64 0
      5 
      6 define void @test_lsl_arith(i32 %lhs32, i32 %rhs32, i64 %lhs64, i64 %rhs64) {
      7 ; CHECK-LABEL: test_lsl_arith:
        ; Left shift by a constant feeding add/sub, first on i32 (w registers) and then
        ; on i64 (x registers). In every section the value being shifted is freshly
        ; loaded (volatile) from @var32/@var64; %rhs32 and %rhs64 are not referenced
        ; in this function.
      8 
        ; add, shift as the second operand: expected as a folded "lsl #18" operand.
      9   %rhs1 = load volatile i32* @var32
     10   %shift1 = shl i32 %rhs1, 18
     11   %val1 = add i32 %lhs32, %shift1
     12   store volatile i32 %val1, i32* @var32
     13 ; CHECK: add {{w[0-9]+}}, {{w[0-9]+}}, {{w[0-9]+}}, lsl #18
     14 
        ; add, shift as the first operand: the folded form is still expected.
     15   %rhs2 = load volatile i32* @var32
     16   %shift2 = shl i32 %rhs2, 31
     17   %val2 = add i32 %shift2, %lhs32
     18   store volatile i32 %val2, i32* @var32
     19 ; CHECK: add {{w[0-9]+}}, {{w[0-9]+}}, {{w[0-9]+}}, lsl #31
     20 
        ; sub, shift as the subtrahend: expected as a folded "lsl #5" operand.
     21   %rhs3 = load volatile i32* @var32
     22   %shift3 = shl i32 %rhs3, 5
     23   %val3 = sub i32 %lhs32, %shift3
     24   store volatile i32 %val3, i32* @var32
     25 ; CHECK: sub {{w[0-9]+}}, {{w[0-9]+}}, {{w[0-9]+}}, lsl #5
     26 
     27 ; Subtraction is not commutative!
        ; Here the shifted value is the minuend, so the negative pattern below requires
        ; that no sub with a folded "lsl #19" operand is emitted.
     28   %rhs4 = load volatile i32* @var32
     29   %shift4 = shl i32 %rhs4, 19
     30   %val4 = sub i32 %shift4, %lhs32
     31   store volatile i32 %val4, i32* @var32
     32 ; CHECK-NOT: sub {{w[0-9]+}}, {{w[0-9]+}}, {{w[0-9]+}}, lsl #19
     33 
        ; Negation (0 - shifted value): expected as a sub from wzr with the shift folded.
     34   %lhs4a = load volatile i32* @var32
     35   %shift4a = shl i32 %lhs4a, 15
     36   %val4a = sub i32 0, %shift4a
     37   store volatile i32 %val4a, i32* @var32
     38 ; CHECK: sub {{w[0-9]+}}, wzr, {{w[0-9]+}}, lsl #15
     39 
        ; The same five cases repeated for i64 / x registers.
     40   %rhs5 = load volatile i64* @var64
     41   %shift5 = shl i64 %rhs5, 18
     42   %val5 = add i64 %lhs64, %shift5
     43   store volatile i64 %val5, i64* @var64
     44 ; CHECK: add {{x[0-9]+}}, {{x[0-9]+}}, {{x[0-9]+}}, lsl #18
     45 
     46   %rhs6 = load volatile i64* @var64
     47   %shift6 = shl i64 %rhs6, 31
     48   %val6 = add i64 %shift6, %lhs64
     49   store volatile i64 %val6, i64* @var64
     50 ; CHECK: add {{x[0-9]+}}, {{x[0-9]+}}, {{x[0-9]+}}, lsl #31
     51 
     52   %rhs7 = load volatile i64* @var64
     53   %shift7 = shl i64 %rhs7, 5
     54   %val7 = sub i64 %lhs64, %shift7
     55   store volatile i64 %val7, i64* @var64
     56 ; CHECK: sub {{x[0-9]+}}, {{x[0-9]+}}, {{x[0-9]+}}, lsl #5
     57 
     58 ; Subtraction is not commutative!
        ; Shifted value is the minuend again; a folded "lsl #19" sub must not appear.
     59   %rhs8 = load volatile i64* @var64
     60   %shift8 = shl i64 %rhs8, 19
     61   %val8 = sub i64 %shift8, %lhs64
     62   store volatile i64 %val8, i64* @var64
     63 ; CHECK-NOT: sub {{x[0-9]+}}, {{x[0-9]+}}, {{x[0-9]+}}, lsl #19
     64 
        ; 64-bit negation: expected as a sub from xzr with a folded "lsl #60".
     65   %lhs8a = load volatile i64* @var64
     66   %shift8a = shl i64 %lhs8a, 60
     67   %val8a = sub i64 0, %shift8a
     68   store volatile i64 %val8a, i64* @var64
     69 ; CHECK: sub {{x[0-9]+}}, xzr, {{x[0-9]+}}, lsl #60
     70 
     71   ret void
     72 ; CHECK: ret
     73 }
     74 
     75 define void @test_lsr_arith(i32 %lhs32, i32 %rhs32, i64 %lhs64, i64 %rhs64) {
     76 ; CHECK-LABEL: test_lsr_arith:
        ; Logical right shift by a constant feeding add/sub. Unlike the lsl test, the
        ; shifted values here are the function arguments themselves; each result is
        ; written to @var32/@var64 with a volatile store.
     77 
        ; add, shift as the second operand: expected as a folded "lsr #18" operand.
     78   %shift1 = lshr i32 %rhs32, 18
     79   %val1 = add i32 %lhs32, %shift1
     80   store volatile i32 %val1, i32* @var32
     81 ; CHECK: add {{w[0-9]+}}, {{w[0-9]+}}, {{w[0-9]+}}, lsr #18
     82 
        ; add, shift as the first operand: the folded form is still expected.
     83   %shift2 = lshr i32 %rhs32, 31
     84   %val2 = add i32 %shift2, %lhs32
     85   store volatile i32 %val2, i32* @var32
     86 ; CHECK: add {{w[0-9]+}}, {{w[0-9]+}}, {{w[0-9]+}}, lsr #31
     87 
        ; sub, shift as the subtrahend: expected as a folded "lsr #5" operand.
     88   %shift3 = lshr i32 %rhs32, 5
     89   %val3 = sub i32 %lhs32, %shift3
     90   store volatile i32 %val3, i32* @var32
     91 ; CHECK: sub {{w[0-9]+}}, {{w[0-9]+}}, {{w[0-9]+}}, lsr #5
     92 
     93 ; Subtraction is not commutative!
        ; Shifted value is the minuend, so a sub with a folded "lsr #19" must not appear.
     94   %shift4 = lshr i32 %rhs32, 19
     95   %val4 = sub i32 %shift4, %lhs32
     96   store volatile i32 %val4, i32* @var32
     97 ; CHECK-NOT: sub {{w[0-9]+}}, {{w[0-9]+}}, {{w[0-9]+}}, lsr #19
     98 
        ; Negation (0 - shifted value): expected as a sub from wzr with the shift folded.
     99   %shift4a = lshr i32 %lhs32, 15
    100   %val4a = sub i32 0, %shift4a
    101   store volatile i32 %val4a, i32* @var32
    102 ; CHECK: sub {{w[0-9]+}}, wzr, {{w[0-9]+}}, lsr #15
    103 
        ; The same five cases repeated for i64 / x registers.
    104   %shift5 = lshr i64 %rhs64, 18
    105   %val5 = add i64 %lhs64, %shift5
    106   store volatile i64 %val5, i64* @var64
    107 ; CHECK: add {{x[0-9]+}}, {{x[0-9]+}}, {{x[0-9]+}}, lsr #18
    108 
    109   %shift6 = lshr i64 %rhs64, 31
    110   %val6 = add i64 %shift6, %lhs64
    111   store volatile i64 %val6, i64* @var64
    112 ; CHECK: add {{x[0-9]+}}, {{x[0-9]+}}, {{x[0-9]+}}, lsr #31
    113 
    114   %shift7 = lshr i64 %rhs64, 5
    115   %val7 = sub i64 %lhs64, %shift7
    116   store volatile i64 %val7, i64* @var64
    117 ; CHECK: sub {{x[0-9]+}}, {{x[0-9]+}}, {{x[0-9]+}}, lsr #5
    118 
    119 ; Subtraction is not commutative!
        ; Shifted value is the minuend again; a folded "lsr #19" sub must not appear.
    120   %shift8 = lshr i64 %rhs64, 19
    121   %val8 = sub i64 %shift8, %lhs64
    122   store volatile i64 %val8, i64* @var64
    123 ; CHECK-NOT: sub {{x[0-9]+}}, {{x[0-9]+}}, {{x[0-9]+}}, lsr #19
    124 
        ; 64-bit negation: expected as a sub from xzr with a folded "lsr #45".
    125   %shift8a = lshr i64 %lhs64, 45
    126   %val8a = sub i64 0, %shift8a
    127   store volatile i64 %val8a, i64* @var64
    128 ; CHECK: sub {{x[0-9]+}}, xzr, {{x[0-9]+}}, lsr #45
    129 
    130   ret void
    131 ; CHECK: ret
    132 }
    133 
    134 define void @test_asr_arith(i32 %lhs32, i32 %rhs32, i64 %lhs64, i64 %rhs64) {
    135 ; CHECK-LABEL: test_asr_arith:
        ; Arithmetic right shift by a constant feeding add/sub. The shifted values are
        ; the function arguments; each result is written to @var32/@var64 with a
        ; volatile store.
    136 
        ; add, shift as the second operand: expected as a folded "asr #18" operand.
    137   %shift1 = ashr i32 %rhs32, 18
    138   %val1 = add i32 %lhs32, %shift1
    139   store volatile i32 %val1, i32* @var32
    140 ; CHECK: add {{w[0-9]+}}, {{w[0-9]+}}, {{w[0-9]+}}, asr #18
    141 
        ; add, shift as the first operand: the folded form is still expected.
    142   %shift2 = ashr i32 %rhs32, 31
    143   %val2 = add i32 %shift2, %lhs32
    144   store volatile i32 %val2, i32* @var32
    145 ; CHECK: add {{w[0-9]+}}, {{w[0-9]+}}, {{w[0-9]+}}, asr #31
    146 
        ; sub, shift as the subtrahend: expected as a folded "asr #5" operand.
    147   %shift3 = ashr i32 %rhs32, 5
    148   %val3 = sub i32 %lhs32, %shift3
    149   store volatile i32 %val3, i32* @var32
    150 ; CHECK: sub {{w[0-9]+}}, {{w[0-9]+}}, {{w[0-9]+}}, asr #5
    151 
    152 ; Subtraction is not commutative!
        ; Shifted value is the minuend, so a sub with a folded "asr #19" must not appear.
    153   %shift4 = ashr i32 %rhs32, 19
    154   %val4 = sub i32 %shift4, %lhs32
    155   store volatile i32 %val4, i32* @var32
    156 ; CHECK-NOT: sub {{w[0-9]+}}, {{w[0-9]+}}, {{w[0-9]+}}, asr #19
    157 
        ; Negation (0 - shifted value): expected as a sub from wzr with the shift folded.
    158   %shift4a = ashr i32 %lhs32, 15
    159   %val4a = sub i32 0, %shift4a
    160   store volatile i32 %val4a, i32* @var32
    161 ; CHECK: sub {{w[0-9]+}}, wzr, {{w[0-9]+}}, asr #15
    162 
        ; The same five cases repeated for i64 / x registers.
    163   %shift5 = ashr i64 %rhs64, 18
    164   %val5 = add i64 %lhs64, %shift5
    165   store volatile i64 %val5, i64* @var64
    166 ; CHECK: add {{x[0-9]+}}, {{x[0-9]+}}, {{x[0-9]+}}, asr #18
    167 
    168   %shift6 = ashr i64 %rhs64, 31
    169   %val6 = add i64 %shift6, %lhs64
    170   store volatile i64 %val6, i64* @var64
    171 ; CHECK: add {{x[0-9]+}}, {{x[0-9]+}}, {{x[0-9]+}}, asr #31
    172 
    173   %shift7 = ashr i64 %rhs64, 5
    174   %val7 = sub i64 %lhs64, %shift7
    175   store volatile i64 %val7, i64* @var64
    176 ; CHECK: sub {{x[0-9]+}}, {{x[0-9]+}}, {{x[0-9]+}}, asr #5
    177 
    178 ; Subtraction is not commutative!
        ; Shifted value is the minuend again; a folded "asr #19" sub must not appear.
    179   %shift8 = ashr i64 %rhs64, 19
    180   %val8 = sub i64 %shift8, %lhs64
    181   store volatile i64 %val8, i64* @var64
    182 ; CHECK-NOT: sub {{x[0-9]+}}, {{x[0-9]+}}, {{x[0-9]+}}, asr #19
    183 
        ; 64-bit negation: expected as a sub from xzr with a folded "asr #45".
    184   %shift8a = ashr i64 %lhs64, 45
    185   %val8a = sub i64 0, %shift8a
    186   store volatile i64 %val8a, i64* @var64
    187 ; CHECK: sub {{x[0-9]+}}, xzr, {{x[0-9]+}}, asr #45
    188 
    189   ret void
    190 ; CHECK: ret
    191 }
    192 
    193 define i32 @test_cmp(i32 %lhs32, i32 %rhs32, i64 %lhs64, i64 %rhs64) {
    194 ; CHECK-LABEL: test_cmp:
        ; Chain of six compare-and-branch steps. Each step compares an lhs argument
        ; with a constant-shifted rhs argument, and the matching pattern expects the
        ; shift to be folded into the cmp operand. The function returns 1 only when
        ; every branch takes its first (true) target and control reaches t7; any
        ; false edge goes to "end", which returns 0.
    195 
        ; i32, shl: expect cmp with a folded "lsl #13".
    196   %shift1 = shl i32 %rhs32, 13
    197   %tst1 = icmp uge i32 %lhs32, %shift1
    198   br i1 %tst1, label %t2, label %end
    199 ; CHECK: cmp {{w[0-9]+}}, {{w[0-9]+}}, lsl #13
    200 
        ; i32, lshr: expect cmp with a folded "lsr #20".
    201 t2:
    202   %shift2 = lshr i32 %rhs32, 20
    203   %tst2 = icmp ne i32 %lhs32, %shift2
    204   br i1 %tst2, label %t3, label %end
    205 ; CHECK: cmp {{w[0-9]+}}, {{w[0-9]+}}, lsr #20
    206 
        ; i32, ashr: expect cmp with a folded "asr #9".
    207 t3:
    208   %shift3 = ashr i32 %rhs32, 9
    209   %tst3 = icmp ne i32 %lhs32, %shift3
    210   br i1 %tst3, label %t4, label %end
    211 ; CHECK: cmp {{w[0-9]+}}, {{w[0-9]+}}, asr #9
    212 
        ; i64, shl: expect cmp with a folded "lsl #43".
    213 t4:
    214   %shift4 = shl i64 %rhs64, 43
    215   %tst4 = icmp uge i64 %lhs64, %shift4
    216   br i1 %tst4, label %t5, label %end
    217 ; CHECK: cmp {{x[0-9]+}}, {{x[0-9]+}}, lsl #43
    218 
        ; i64, lshr: expect cmp with a folded "lsr #20".
    219 t5:
    220   %shift5 = lshr i64 %rhs64, 20
    221   %tst5 = icmp ne i64 %lhs64, %shift5
    222   br i1 %tst5, label %t6, label %end
    223 ; CHECK: cmp {{x[0-9]+}}, {{x[0-9]+}}, lsr #20
    224 
        ; i64, ashr: expect cmp with a folded "asr #59".
    225 t6:
    226   %shift6 = ashr i64 %rhs64, 59
    227   %tst6 = icmp ne i64 %lhs64, %shift6
    228   br i1 %tst6, label %t7, label %end
    229 ; CHECK: cmp {{x[0-9]+}}, {{x[0-9]+}}, asr #59
    230 
    231 t7:
    232   ret i32 1
    233 end:
    234 
    235   ret i32 0
    236 ; CHECK: ret
    237 }
    238 
    239 define i32 @test_cmn(i32 %lhs32, i32 %rhs32, i64 %lhs64, i64 %rhs64) {
    240 ; CHECK-LABEL: test_cmn:
        ; Same branch chain as a shifted-compare test, but each shifted value is first
        ; negated (0 - shift) before the compare. For the ne/eq predicates the patterns
        ; expect the negation and shift folded into a single cmn; for the uge and slt
        ; predicates they expect a separate sub from the zero register followed by a
        ; plain cmp. Returns 1 only if control reaches t7, otherwise 0 via "end".
    241 
    242   %shift1 = shl i32 %rhs32, 13
    243   %val1 = sub i32 0, %shift1
    244   %tst1 = icmp uge i32 %lhs32, %val1
    245   br i1 %tst1, label %t2, label %end
    246   ; Important that this isn't lowered to a cmn instruction because if %rhs32 ==
    247   ; 0 then the results will differ.
        ; (uge is an unsigned test and therefore reads the carry flag, which a compare
        ; against a negated zero and a cmn with zero set differently.)
    248 ; CHECK: sub [[RHS:w[0-9]+]], wzr, {{w[0-9]+}}, lsl #13
    249 ; CHECK: cmp {{w[0-9]+}}, [[RHS]]
    250 
        ; ne only tests for equality, so the folded cmn form with "lsr #20" is expected.
    251 t2:
    252   %shift2 = lshr i32 %rhs32, 20
    253   %val2 = sub i32 0, %shift2
    254   %tst2 = icmp ne i32 %lhs32, %val2
    255   br i1 %tst2, label %t3, label %end
    256 ; CHECK: cmn {{w[0-9]+}}, {{w[0-9]+}}, lsr #20
    257 
        ; eq: folded cmn with "asr #9" is expected.
    258 t3:
    259   %shift3 = ashr i32 %rhs32, 9
    260   %val3 = sub i32 0, %shift3
    261   %tst3 = icmp eq i32 %lhs32, %val3
    262   br i1 %tst3, label %t4, label %end
    263 ; CHECK: cmn {{w[0-9]+}}, {{w[0-9]+}}, asr #9
    264 
    265 t4:
    266   %shift4 = shl i64 %rhs64, 43
    267   %val4 = sub i64 0, %shift4
    268   %tst4 = icmp slt i64 %lhs64, %val4
    269   br i1 %tst4, label %t5, label %end
    270   ; Again, it's important that cmn isn't used here in case %rhs64 == 0.
        ; NOTE(review): this predicate is signed (slt), which depends on the overflow
        ; flag rather than carry; the problematic input appears to be a shifted value
        ; equal to the minimum signed 64-bit integer, not zero -- confirm.
    271 ; CHECK: sub [[RHS:x[0-9]+]], xzr, {{x[0-9]+}}, lsl #43
    272 ; CHECK: cmp {{x[0-9]+}}, [[RHS]]
    273 
        ; ne on i64: folded cmn with "lsr #20" is expected.
    274 t5:
    275   %shift5 = lshr i64 %rhs64, 20
    276   %val5 = sub i64 0, %shift5
    277   %tst5 = icmp ne i64 %lhs64, %val5
    278   br i1 %tst5, label %t6, label %end
    279 ; CHECK: cmn {{x[0-9]+}}, {{x[0-9]+}}, lsr #20
    280 
        ; ne on i64: folded cmn with "asr #59" is expected.
    281 t6:
    282   %shift6 = ashr i64 %rhs64, 59
    283   %val6 = sub i64 0, %shift6
    284   %tst6 = icmp ne i64 %lhs64, %val6
    285   br i1 %tst6, label %t7, label %end
    286 ; CHECK: cmn {{x[0-9]+}}, {{x[0-9]+}}, asr #59
    287 
    288 t7:
    289   ret i32 1
    290 end:
    291 
    292   ret i32 0
    293 ; CHECK: ret
    294 }
    295 
    296