Home | History | Annotate | Download | only in ARM
      1 ; RUN: llc -mtriple=arm-eabi -mattr=+neon %s -o - | FileCheck %s
      2 
      3 define <8 x i16> @vshlls8(<8 x i8>* %A) nounwind {
      4 ;CHECK-LABEL: vshlls8:
      5 ;CHECK: vshll.s8
      6         %tmp1 = load <8 x i8>, <8 x i8>* %A
      7         %sext = sext <8 x i8> %tmp1 to <8 x i16>
      8         %shift = shl <8 x i16> %sext, <i16 7, i16 7, i16 7, i16 7, i16 7, i16 7, i16 7, i16 7>
      9         ret <8 x i16> %shift
     10 }
     11 
     12 define <4 x i32> @vshlls16(<4 x i16>* %A) nounwind {
     13 ;CHECK-LABEL: vshlls16:
     14 ;CHECK: vshll.s16
     15         %tmp1 = load <4 x i16>, <4 x i16>* %A
     16         %sext = sext <4 x i16> %tmp1 to <4 x i32>
     17         %shift = shl <4 x i32> %sext, <i32 15, i32 15, i32 15, i32 15>
     18         ret <4 x i32> %shift
     19 }
     20 
     21 define <2 x i64> @vshlls32(<2 x i32>* %A) nounwind {
     22 ;CHECK-LABEL: vshlls32:
     23 ;CHECK: vshll.s32
     24         %tmp1 = load <2 x i32>, <2 x i32>* %A
     25         %sext = sext <2 x i32> %tmp1 to <2 x i64>
     26         %shift = shl <2 x i64> %sext, <i64 31, i64 31>
     27         ret <2 x i64> %shift
     28 }
     29 
     30 define <8 x i16> @vshllu8(<8 x i8>* %A) nounwind {
     31 ;CHECK-LABEL: vshllu8:
     32 ;CHECK: vshll.u8
     33         %tmp1 = load <8 x i8>, <8 x i8>* %A
     34         %zext = zext <8 x i8> %tmp1 to <8 x i16>
     35         %shift = shl <8 x i16> %zext, <i16 7, i16 7, i16 7, i16 7, i16 7, i16 7, i16 7, i16 7>
     36         ret <8 x i16> %shift
     37 }
     38 
     39 define <4 x i32> @vshllu16(<4 x i16>* %A) nounwind {
     40 ;CHECK-LABEL: vshllu16:
     41 ;CHECK: vshll.u16
     42         %tmp1 = load <4 x i16>, <4 x i16>* %A
     43         %zext = zext <4 x i16> %tmp1 to <4 x i32>
     44         %shift = shl <4 x i32> %zext, <i32 15, i32 15, i32 15, i32 15>
     45         ret <4 x i32> %shift
     46 }
     47 
     48 define <2 x i64> @vshllu32(<2 x i32>* %A) nounwind {
     49 ;CHECK-LABEL: vshllu32:
     50 ;CHECK: vshll.u32
     51         %tmp1 = load <2 x i32>, <2 x i32>* %A
     52         %zext = zext <2 x i32> %tmp1 to <2 x i64>
     53         %shift = shl <2 x i64> %zext, <i64 31, i64 31>
     54         ret <2 x i64> %shift
     55 }
     56 
     57 ; The following tests use the maximum shift count, so the signedness is
     58 ; irrelevant.  Test both signed and unsigned versions.
     59 define <8 x i16> @vshlli8(<8 x i8>* %A) nounwind {
     60 ;CHECK-LABEL: vshlli8:
     61 ;CHECK: vshll.i8
     62         %tmp1 = load <8 x i8>, <8 x i8>* %A
     63         %sext = sext <8 x i8> %tmp1 to <8 x i16>
     64         %shift = shl <8 x i16> %sext, <i16 8, i16 8, i16 8, i16 8, i16 8, i16 8, i16 8, i16 8>
     65         ret <8 x i16> %shift
     66 }
     67 
     68 define <4 x i32> @vshlli16(<4 x i16>* %A) nounwind {
     69 ;CHECK-LABEL: vshlli16:
     70 ;CHECK: vshll.i16
     71         %tmp1 = load <4 x i16>, <4 x i16>* %A
     72         %zext = zext <4 x i16> %tmp1 to <4 x i32>
     73         %shift = shl <4 x i32> %zext, <i32 16, i32 16, i32 16, i32 16>
     74         ret <4 x i32> %shift
     75 }
     76 
     77 define <2 x i64> @vshlli32(<2 x i32>* %A) nounwind {
     78 ;CHECK-LABEL: vshlli32:
     79 ;CHECK: vshll.i32
     80         %tmp1 = load <2 x i32>, <2 x i32>* %A
     81         %zext = zext <2 x i32> %tmp1 to <2 x i64>
     82         %shift = shl <2 x i64> %zext, <i64 32, i64 32>
     83         ret <2 x i64> %shift
     84 }
     85 
     86 ; And these have a shift just out of range so separate vmovl and vshl
     87 ; instructions are needed.
     88 define <8 x i16> @vshllu8_bad(<8 x i8>* %A) nounwind {
     89 ; CHECK-LABEL: vshllu8_bad:
     90 ; CHECK: vmovl.u8
     91 ; CHECK: vshl.i16
     92         %tmp1 = load <8 x i8>, <8 x i8>* %A
     93         %zext = zext <8 x i8> %tmp1 to <8 x i16>
     94         %shift = shl <8 x i16> %zext, <i16 9, i16 9, i16 9, i16 9, i16 9, i16 9, i16 9, i16 9>
     95         ret <8 x i16> %shift
     96 }
     97 
     98 define <4 x i32> @vshlls16_bad(<4 x i16>* %A) nounwind {
     99 ; CHECK-LABEL: vshlls16_bad:
    100 ; CHECK: vmovl.s16
    101 ; CHECK: vshl.i32
    102         %tmp1 = load <4 x i16>, <4 x i16>* %A
    103         %sext = sext <4 x i16> %tmp1 to <4 x i32>
    104         %shift = shl <4 x i32> %sext, <i32 17, i32 17, i32 17, i32 17>
    105         ret <4 x i32> %shift
    106 }
    107 
    108 define <2 x i64> @vshllu32_bad(<2 x i32>* %A) nounwind {
    109 ; CHECK-LABEL: vshllu32_bad:
    110 ; CHECK: vmovl.u32
    111 ; CHECK: vshl.i64
    112         %tmp1 = load <2 x i32>, <2 x i32>* %A
    113         %zext = zext <2 x i32> %tmp1 to <2 x i64>
    114         %shift = shl <2 x i64> %zext, <i64 33, i64 33>
    115         ret <2 x i64> %shift
    116 }
    117