Home | History | Annotate | Download | only in Mips
      1 ; RUN: llc -march=mips -mattr=dsp < %s | FileCheck %s -check-prefix=R1
      2 ; RUN: llc -march=mips -mattr=dspr2 < %s | FileCheck %s -check-prefix=R2
      3 
      4 ; R1-LABEL: test_lbux:
      5 ; R1: lbux ${{[0-9]+}}
      6 
      7 define zeroext i8 @test_lbux(i8* nocapture %b, i32 %i) {
      8 entry:
      9   %add.ptr = getelementptr inbounds i8* %b, i32 %i
     10   %0 = load i8* %add.ptr, align 1
     11   ret i8 %0
     12 }
     13 
     14 ; R1-LABEL: test_lhx:
     15 ; R1: lhx ${{[0-9]+}}
     16 
     17 define signext i16 @test_lhx(i16* nocapture %b, i32 %i) {
     18 entry:
     19   %add.ptr = getelementptr inbounds i16* %b, i32 %i
     20   %0 = load i16* %add.ptr, align 2
     21   ret i16 %0
     22 }
     23 
     24 ; R1-LABEL: test_lwx:
     25 ; R1: lwx ${{[0-9]+}}
     26 
     27 define i32 @test_lwx(i32* nocapture %b, i32 %i) {
     28 entry:
     29   %add.ptr = getelementptr inbounds i32* %b, i32 %i
     30   %0 = load i32* %add.ptr, align 4
     31   ret i32 %0
     32 }
     33 
     34 ; R1-LABEL: test_add_v2q15_:
     35 ; R1: addq.ph ${{[0-9]+}}
     36 
     37 define { i32 } @test_add_v2q15_(i32 %a.coerce, i32 %b.coerce) {
     38 entry:
     39   %0 = bitcast i32 %a.coerce to <2 x i16>
     40   %1 = bitcast i32 %b.coerce to <2 x i16>
     41   %add = add <2 x i16> %0, %1
     42   %2 = bitcast <2 x i16> %add to i32
     43   %.fca.0.insert = insertvalue { i32 } undef, i32 %2, 0
     44   ret { i32 } %.fca.0.insert
     45 }
     46 
     47 ; R1-LABEL: test_sub_v2q15_:
     48 ; R1: subq.ph ${{[0-9]+}}
     49 
     50 define { i32 } @test_sub_v2q15_(i32 %a.coerce, i32 %b.coerce) {
     51 entry:
     52   %0 = bitcast i32 %a.coerce to <2 x i16>
     53   %1 = bitcast i32 %b.coerce to <2 x i16>
     54   %sub = sub <2 x i16> %0, %1
     55   %2 = bitcast <2 x i16> %sub to i32
     56   %.fca.0.insert = insertvalue { i32 } undef, i32 %2, 0
     57   ret { i32 } %.fca.0.insert
     58 }
     59 
     60 ; R2-LABEL: test_mul_v2q15_:
     61 ; R2: mul.ph ${{[0-9]+}}
     62 
     63 ; mul.ph is an R2 instruction. Check that multiply node gets expanded.
     64 ; R1-LABEL: test_mul_v2q15_:
     65 ; R1: mul ${{[0-9]+}}
     66 ; R1: mul ${{[0-9]+}}
     67 
     68 define { i32 } @test_mul_v2q15_(i32 %a.coerce, i32 %b.coerce) {
     69 entry:
     70   %0 = bitcast i32 %a.coerce to <2 x i16>
     71   %1 = bitcast i32 %b.coerce to <2 x i16>
     72   %mul = mul <2 x i16> %0, %1
     73   %2 = bitcast <2 x i16> %mul to i32
     74   %.fca.0.insert = insertvalue { i32 } undef, i32 %2, 0
     75   ret { i32 } %.fca.0.insert
     76 }
     77 
     78 ; R1-LABEL: test_add_v4i8_:
     79 ; R1: addu.qb ${{[0-9]+}}
     80 
     81 define { i32 } @test_add_v4i8_(i32 %a.coerce, i32 %b.coerce) {
     82 entry:
     83   %0 = bitcast i32 %a.coerce to <4 x i8>
     84   %1 = bitcast i32 %b.coerce to <4 x i8>
     85   %add = add <4 x i8> %0, %1
     86   %2 = bitcast <4 x i8> %add to i32
     87   %.fca.0.insert = insertvalue { i32 } undef, i32 %2, 0
     88   ret { i32 } %.fca.0.insert
     89 }
     90 
     91 ; R1-LABEL: test_sub_v4i8_:
     92 ; R1: subu.qb ${{[0-9]+}}
     93 
     94 define { i32 } @test_sub_v4i8_(i32 %a.coerce, i32 %b.coerce) {
     95 entry:
     96   %0 = bitcast i32 %a.coerce to <4 x i8>
     97   %1 = bitcast i32 %b.coerce to <4 x i8>
     98   %sub = sub <4 x i8> %0, %1
     99   %2 = bitcast <4 x i8> %sub to i32
    100   %.fca.0.insert = insertvalue { i32 } undef, i32 %2, 0
    101   ret { i32 } %.fca.0.insert
    102 }
    103 
    104 ; DSP-ASE doesn't have a v4i8 multiply instruction. Check that multiply node gets expanded.
    105 ; R2-LABEL: test_mul_v4i8_:
    106 ; R2: mul ${{[0-9]+}}
    107 ; R2: mul ${{[0-9]+}}
    108 ; R2: mul ${{[0-9]+}}
    109 ; R2: mul ${{[0-9]+}}
    110 
    111 define { i32 } @test_mul_v4i8_(i32 %a.coerce, i32 %b.coerce) {
    112 entry:
    113   %0 = bitcast i32 %a.coerce to <4 x i8>
    114   %1 = bitcast i32 %b.coerce to <4 x i8>
    115   %mul = mul <4 x i8> %0, %1
    116   %2 = bitcast <4 x i8> %mul to i32
    117   %.fca.0.insert = insertvalue { i32 } undef, i32 %2, 0
    118   ret { i32 } %.fca.0.insert
    119 }
    120 
    121 ; R1-LABEL: test_addsc:
    122 ; R1: addsc ${{[0-9]+}}
    123 ; R1: addwc ${{[0-9]+}}
    124 
    125 define i64 @test_addsc(i64 %a, i64 %b) {
    126 entry:
    127   %add = add nsw i64 %b, %a
    128   ret i64 %add
    129 }
    130 
    131 ; R1-LABEL: shift1_v2i16_shl_:
    132 ; R1: shll.ph ${{[0-9]+}}, ${{[0-9]+}}, 15
    133 
    134 define { i32 } @shift1_v2i16_shl_(i32 %a0.coerce) {
    135 entry:
    136   %0 = bitcast i32 %a0.coerce to <2 x i16>
    137   %shl = shl <2 x i16> %0, <i16 15, i16 15>
    138   %1 = bitcast <2 x i16> %shl to i32
    139   %.fca.0.insert = insertvalue { i32 } undef, i32 %1, 0
    140   ret { i32 } %.fca.0.insert
    141 }
    142 
    143 ; R1-LABEL: shift1_v2i16_sra_:
    144 ; R1: shra.ph ${{[0-9]+}}, ${{[0-9]+}}, 15
    145 
    146 define { i32 } @shift1_v2i16_sra_(i32 %a0.coerce) {
    147 entry:
    148   %0 = bitcast i32 %a0.coerce to <2 x i16>
    149   %shr = ashr <2 x i16> %0, <i16 15, i16 15>
    150   %1 = bitcast <2 x i16> %shr to i32
    151   %.fca.0.insert = insertvalue { i32 } undef, i32 %1, 0
    152   ret { i32 } %.fca.0.insert
    153 }
    154 
    155 ; R1-LABEL: shift1_v2ui16_srl_:
    156 ; R1-NOT: shrl.ph
    157 ; R2-LABEL: shift1_v2ui16_srl_:
    158 ; R2: shrl.ph ${{[0-9]+}}, ${{[0-9]+}}, 15
    159 
    160 define { i32 } @shift1_v2ui16_srl_(i32 %a0.coerce) {
    161 entry:
    162   %0 = bitcast i32 %a0.coerce to <2 x i16>
    163   %shr = lshr <2 x i16> %0, <i16 15, i16 15>
    164   %1 = bitcast <2 x i16> %shr to i32
    165   %.fca.0.insert = insertvalue { i32 } undef, i32 %1, 0
    166   ret { i32 } %.fca.0.insert
    167 }
    168 
    169 ; R1-LABEL: shift1_v4i8_shl_:
    170 ; R1: shll.qb ${{[0-9]+}}, ${{[0-9]+}}, 7
    171 
    172 define { i32 } @shift1_v4i8_shl_(i32 %a0.coerce) {
    173 entry:
    174   %0 = bitcast i32 %a0.coerce to <4 x i8>
    175   %shl = shl <4 x i8> %0, <i8 7, i8 7, i8 7, i8 7>
    176   %1 = bitcast <4 x i8> %shl to i32
    177   %.fca.0.insert = insertvalue { i32 } undef, i32 %1, 0
    178   ret { i32 } %.fca.0.insert
    179 }
    180 
    181 ; R1-LABEL: shift1_v4i8_sra_:
    182 ; R1-NOT: shra.qb
    183 ; R2-LABEL: shift1_v4i8_sra_:
    184 ; R2: shra.qb ${{[0-9]+}}, ${{[0-9]+}}, 7
    185 
    186 define { i32 } @shift1_v4i8_sra_(i32 %a0.coerce) {
    187 entry:
    188   %0 = bitcast i32 %a0.coerce to <4 x i8>
    189   %shr = ashr <4 x i8> %0, <i8 7, i8 7, i8 7, i8 7>
    190   %1 = bitcast <4 x i8> %shr to i32
    191   %.fca.0.insert = insertvalue { i32 } undef, i32 %1, 0
    192   ret { i32 } %.fca.0.insert
    193 }
    194 
    195 ; R1-LABEL: shift1_v4ui8_srl_:
    196 ; R1: shrl.qb ${{[0-9]+}}, ${{[0-9]+}}, 7
    197 
    198 define { i32 } @shift1_v4ui8_srl_(i32 %a0.coerce) {
    199 entry:
    200   %0 = bitcast i32 %a0.coerce to <4 x i8>
    201   %shr = lshr <4 x i8> %0, <i8 7, i8 7, i8 7, i8 7>
    202   %1 = bitcast <4 x i8> %shr to i32
    203   %.fca.0.insert = insertvalue { i32 } undef, i32 %1, 0
    204   ret { i32 } %.fca.0.insert
    205 }
    206 
    207 ; Check that shift node is expanded if splat element size is not 16-bit.
    208 ;
    209 ; R1-LABEL: test_vector_splat_imm_v2q15:
    210 ; R1-NOT: shll.ph
    211 
    212 define { i32 } @test_vector_splat_imm_v2q15(i32 %a.coerce) {
    213 entry:
    214   %0 = bitcast i32 %a.coerce to <2 x i16>
    215   %shl = shl <2 x i16> %0, <i16 0, i16 2>
    216   %1 = bitcast <2 x i16> %shl to i32
    217   %.fca.0.insert = insertvalue { i32 } undef, i32 %1, 0
    218   ret { i32 } %.fca.0.insert
    219 }
    220 
    221 ; Check that shift node is expanded if splat element size is not 8-bit.
    222 ;
    223 ; R1-LABEL: test_vector_splat_imm_v4i8:
    224 ; R1-NOT: shll.qb
    225 
    226 define { i32 } @test_vector_splat_imm_v4i8(i32 %a.coerce) {
    227 entry:
    228   %0 = bitcast i32 %a.coerce to <4 x i8>
    229   %shl = shl <4 x i8> %0, <i8 0, i8 2, i8 0, i8 2>
    230   %1 = bitcast <4 x i8> %shl to i32
    231   %.fca.0.insert = insertvalue { i32 } undef, i32 %1, 0
    232   ret { i32 } %.fca.0.insert
    233 }
    234 
    235 ; Check that shift node is expanded if shift amount doesn't fit in 4-bit sa field.
    236 ;
    237 ; R1-LABEL: test_shift_amount_v2q15:
    238 ; R1-NOT: shll.ph
    239 
    240 define { i32 } @test_shift_amount_v2q15(i32 %a.coerce) {
    241 entry:
    242   %0 = bitcast i32 %a.coerce to <2 x i16>
    243   %shl = shl <2 x i16> %0, <i16 16, i16 16>
    244   %1 = bitcast <2 x i16> %shl to i32
    245   %.fca.0.insert = insertvalue { i32 } undef, i32 %1, 0
    246   ret { i32 } %.fca.0.insert
    247 }
    248 
    249 ; Check that shift node is expanded if shift amount doesn't fit in 3-bit sa field.
    250 ;
    251 ; R1-LABEL: test_shift_amount_v4i8:
    252 ; R1-NOT: shll.qb
    253 
    254 define { i32 } @test_shift_amount_v4i8(i32 %a.coerce) {
    255 entry:
    256   %0 = bitcast i32 %a.coerce to <4 x i8>
    257   %shl = shl <4 x i8> %0, <i8 8, i8 8, i8 8, i8 8>
    258   %1 = bitcast <4 x i8> %shl to i32
    259   %.fca.0.insert = insertvalue { i32 } undef, i32 %1, 0
    260   ret { i32 } %.fca.0.insert
    261 }
    262