Home | History | Annotate | Download | only in ARM
      1 ; RUN: llc < %s -march=arm -mattr=+neon | FileCheck %s
      2 
      3 ; PR12281
      4 ; Test generataion of code for vmull instruction when multiplying 128-bit
      5 ; vectors that were created by sign-extending smaller vector sizes.
      6 ;
      7 ; The vmull operation requires 64-bit vectors, so we must extend the original
      8 ; vector size to 64 bits for vmull operation.
      9 ; Previously failed with an assertion because the <4 x i8> vector was too small
     10 ; for vmull.
     11 
     12 ; Vector x Constant
     13 ; v4i8
     14 ;
     15 define void @sextload_v4i8_c(<4 x i8>* %v) nounwind {
     16 ;CHECK: sextload_v4i8_c:
     17 entry:
     18   %0 = load <4 x i8>* %v, align 8
     19   %v0  = sext <4 x i8> %0 to <4 x i32>
     20 ;CHECK: vmull
     21   %v1 = mul <4 x i32>  %v0, <i32 3, i32 3, i32 3, i32 3>
     22   store <4 x i32> %v1, <4 x i32>* undef, align 8
     23   ret void;
     24 }
     25 
     26 ; v2i8
     27 ;
     28 define void @sextload_v2i8_c(<2 x i8>* %v) nounwind {
     29 ;CHECK: sextload_v2i8_c:
     30 entry:
     31   %0   = load <2 x i8>* %v, align 8
     32   %v0  = sext <2 x i8>  %0 to <2 x i64>
     33 ;CHECK: vmull
     34   %v1  = mul <2 x i64>  %v0, <i64 3, i64 3>
     35   store <2 x i64> %v1, <2 x i64>* undef, align 8
     36   ret void;
     37 }
     38 
     39 ; v2i16
     40 ;
     41 define void @sextload_v2i16_c(<2 x i16>* %v) nounwind {
     42 ;CHECK: sextload_v2i16_c:
     43 entry:
     44   %0   = load <2 x i16>* %v, align 8
     45   %v0  = sext <2 x i16>  %0 to <2 x i64>
     46 ;CHECK: vmull
     47   %v1  = mul <2 x i64>  %v0, <i64 3, i64 3>
     48   store <2 x i64> %v1, <2 x i64>* undef, align 8
     49   ret void;
     50 }
     51 
     52 
     53 ; Vector x Vector
     54 ; v4i8
     55 ;
     56 define void @sextload_v4i8_v(<4 x i8>* %v, <4 x i8>* %p) nounwind {
     57 ;CHECK: sextload_v4i8_v:
     58 entry:
     59   %0 = load <4 x i8>* %v, align 8
     60   %v0  = sext <4 x i8> %0 to <4 x i32>
     61 
     62   %1  = load <4 x i8>* %p, align 8
     63   %v2 = sext <4 x i8> %1 to <4 x i32>
     64 ;CHECK: vmull
     65   %v1 = mul <4 x i32>  %v0, %v2
     66   store <4 x i32> %v1, <4 x i32>* undef, align 8
     67   ret void;
     68 }
     69 
     70 ; v2i8
     71 ;
     72 define void @sextload_v2i8_v(<2 x i8>* %v, <2 x i8>* %p) nounwind {
     73 ;CHECK: sextload_v2i8_v:
     74 entry:
     75   %0 = load <2 x i8>* %v, align 8
     76   %v0  = sext <2 x i8> %0 to <2 x i64>
     77 
     78   %1  = load <2 x i8>* %p, align 8
     79   %v2 = sext <2 x i8> %1 to <2 x i64>
     80 ;CHECK: vmull
     81   %v1 = mul <2 x i64>  %v0, %v2
     82   store <2 x i64> %v1, <2 x i64>* undef, align 8
     83   ret void;
     84 }
     85 
     86 ; v2i16
     87 ;
     88 define void @sextload_v2i16_v(<2 x i16>* %v, <2 x i16>* %p) nounwind {
     89 ;CHECK: sextload_v2i16_v:
     90 entry:
     91   %0 = load <2 x i16>* %v, align 8
     92   %v0  = sext <2 x i16> %0 to <2 x i64>
     93 
     94   %1  = load <2 x i16>* %p, align 8
     95   %v2 = sext <2 x i16> %1 to <2 x i64>
     96 ;CHECK: vmull
     97   %v1 = mul <2 x i64>  %v0, %v2
     98   store <2 x i64> %v1, <2 x i64>* undef, align 8
     99   ret void;
    100 }
    101 
    102 
    103 ; Vector(small) x Vector(big)
    104 ; v4i8 x v4i16
    105 ;
    106 define void @sextload_v4i8_vs(<4 x i8>* %v, <4 x i16>* %p) nounwind {
    107 ;CHECK: sextload_v4i8_vs:
    108 entry:
    109   %0 = load <4 x i8>* %v, align 8
    110   %v0  = sext <4 x i8> %0 to <4 x i32>
    111 
    112   %1  = load <4 x i16>* %p, align 8
    113   %v2 = sext <4 x i16> %1 to <4 x i32>
    114 ;CHECK: vmull
    115   %v1 = mul <4 x i32>  %v0, %v2
    116   store <4 x i32> %v1, <4 x i32>* undef, align 8
    117   ret void;
    118 }
    119 
    120 ; v2i8
    121 ; v2i8 x v2i16
    122 define void @sextload_v2i8_vs(<2 x i8>* %v, <2 x i16>* %p) nounwind {
    123 ;CHECK: sextload_v2i8_vs:
    124 entry:
    125   %0 = load <2 x i8>* %v, align 8
    126   %v0  = sext <2 x i8> %0 to <2 x i64>
    127 
    128   %1  = load <2 x i16>* %p, align 8
    129   %v2 = sext <2 x i16> %1 to <2 x i64>
    130 ;CHECK: vmull
    131   %v1 = mul <2 x i64>  %v0, %v2
    132   store <2 x i64> %v1, <2 x i64>* undef, align 8
    133   ret void;
    134 }
    135 
    136 ; v2i16
    137 ; v2i16 x v2i32
    138 define void @sextload_v2i16_vs(<2 x i16>* %v, <2 x i32>* %p) nounwind {
    139 ;CHECK: sextload_v2i16_vs:
    140 entry:
    141   %0 = load <2 x i16>* %v, align 8
    142   %v0  = sext <2 x i16> %0 to <2 x i64>
    143 
    144   %1  = load <2 x i32>* %p, align 8
    145   %v2 = sext <2 x i32> %1 to <2 x i64>
    146 ;CHECK: vmull
    147   %v1 = mul <2 x i64>  %v0, %v2
    148   store <2 x i64> %v1, <2 x i64>* undef, align 8
    149   ret void;
    150 }
    151