Home | History | Annotate | Download | only in ARM
      1 ; RUN: llc -mtriple=armv7-none-eabi -mattr=+neon < %s -o - | FileCheck %s
      2 
      3 ; The following functions test the use case where an X constraint is used to
      4 ; add a dependency between an assembly instruction (vmsr in this case) and
      5 ; another instruction. In each function, we use a different type for the
      6 ; X constraint argument.
      7 ;
      8 ; We can something similar from the following C code:
      9 ; double f1(double f, int pscr_value) {
     10 ;   asm volatile("vmsr fpscr,%0" : "=X" ((f)): "r" (pscr_value));
     11 ;   return f+f;
     12 ; }
     13 
     14 ; CHECK-LABEL: f1
     15 ; CHECK: vmsr fpscr
     16 ; CHECK: vadd.f64
     17 
     18 define arm_aapcs_vfpcc double @f1(double %f, i32 %pscr_value) {
     19 entry:
     20   %f.addr = alloca double, align 8
     21   store double %f, double* %f.addr, align 8
     22   call void asm sideeffect "vmsr fpscr,$1", "=*X,r"(double* nonnull %f.addr, i32 %pscr_value) nounwind
     23   %0 = load double, double* %f.addr, align 8
     24   %add = fadd double %0, %0
     25   ret double %add
     26 }
     27 
     28 ; int f2(int f, int pscr_value) {
     29 ;   asm volatile("vmsr fpscr,%0" : "=X" ((f)): "r" (pscr_value));
     30 ;   return f+f;
     31 ; }
     32 
     33 ; CHECK-LABEL: f2
     34 ; CHECK: vmsr fpscr
     35 ; CHECK: mul
     36 define arm_aapcs_vfpcc i32 @f2(i32 %f, i32 %pscr_value) {
     37 entry:
     38   %f.addr = alloca i32, align 4
     39   store i32 %f, i32* %f.addr, align 4
     40   call void asm sideeffect "vmsr fpscr,$1", "=*X,r"(i32* nonnull %f.addr, i32 %pscr_value) nounwind
     41   %0 = load i32, i32* %f.addr, align 4
     42   %mul = mul i32 %0, %0
     43   ret i32 %mul
     44 }
     45 
     46 
     47 ; int f3(int f, int pscr_value) {
     48 ;   asm volatile("vmsr fpscr,%0" : "=X" ((f)): "r" (pscr_value));
     49 ;   return f+f;
     50 ; }
     51 
     52 ; typedef signed char int8_t;
     53 ; typedef __attribute__((neon_vector_type(8))) int8_t int8x8_t;
     54 ; void f3 (void)
     55 ; {
     56 ;   int8x8_t vector_res_int8x8;
     57 ;   unsigned int fpscr;
     58 ;   asm volatile ("vmsr fpscr,%1" : "=X" ((vector_res_int8x8)) : "r" (fpscr));
     59 ;   return vector_res_int8x8 * vector_res_int8x8;
     60 ; }
     61 
     62 ; CHECK-LABEL: f3
     63 ; CHECK: vmsr fpscr
     64 ; CHECK: vmul.i8
     65 define arm_aapcs_vfpcc <8 x i8> @f3() {
     66 entry:
     67   %vector_res_int8x8 = alloca <8 x i8>, align 8
     68   %0 = getelementptr inbounds <8 x i8>, <8 x i8>* %vector_res_int8x8, i32 0, i32 0
     69   call void asm sideeffect "vmsr fpscr,$1", "=*X,r"(<8 x i8>* nonnull %vector_res_int8x8, i32 undef) nounwind
     70   %1 = load <8 x i8>, <8 x i8>* %vector_res_int8x8, align 8
     71   %mul = mul <8 x i8> %1, %1
     72   ret <8 x i8> %mul
     73 }
     74 
     75 ; We can emit integer constants.
     76 ; We can get this from:
     77 ; void f() {
     78 ;   int x = 2;
     79 ;   asm volatile ("add r0, r0, %0" : : "X" (x));
     80 ; }
     81 ;
     82 ; CHECK-LABEL: f4
     83 ; CHECK: add r0, r0, #2
     84 define void @f4() {
     85 entry:
     86   tail call void asm sideeffect "add r0, r0, $0", "X"(i32 2)
     87   ret void
     88 }
     89 
     90 ; We can emit function labels. This is equivalent to the following C code:
     91 ; void f(void) {
     92 ;   void (*x)(void) = &foo;
     93 ;   asm volatile ("bl %0" : : "X" (x));
     94 ; }
     95 ; CHECK-LABEL: f5
     96 ; CHECK: bl f4
     97 define void @f5() {
     98 entry:
     99   tail call void asm sideeffect "bl $0", "X"(void ()* nonnull @f4)
    100   ret void
    101 }
    102 
    103 declare void @foo(...)
    104 
    105 ; This tests the behavior of the X constraint when used on functions pointers,
    106 ; or functions with a cast. In the first asm call we figure out that this
    107 ; is a function pointer and emit the label. However, in the second asm call
    108 ; we can't see through the bitcast and we end up having to lower this constraint
    109 ; to something else. This is not ideal, but it is a correct behaviour according
    110 ; to the definition of the X constraint.
    111 ;
    112 ; In this case (and other cases where we could have emitted something else),
    113 ; what we're doing with the X constraint is not particularly useful either,
    114 ; since the user could have used "r" in this situation for the same effect.
    115 
    116 ; CHECK-LABEL: f6
    117 ; CHECK: bl foo
    118 ; CHECK: bl r
    119 
    120 define void @f6() nounwind {
    121 entry:
    122   tail call void asm sideeffect "bl $0", "X"(void (...)* @foo) nounwind
    123   tail call void asm sideeffect "bl $0", "X"(void (...)* bitcast (void ()* @f4 to void (...)*)) nounwind
    124   ret void
    125 }
    126 
    127 ; The following IR can be generated from C code with a function like:
    128 ; void a() {
    129 ;   void* a = &&A;
    130 ;   asm volatile ("bl %0" : : "X" (a));
    131 ;  A:
    132 ;   return;
    133 ; }
    134 ;
    135 ; Ideally this would give the block address of bb, but it requires us to see
    136 ; through blockaddress, which we can't do at the moment. This might break some
    137 ; existing use cases where a user would expect to get a block label and instead
    138 ; gets the block address in a register. However, note that according to the
    139 ; "no constraints" definition this behaviour is correct (although not very nice).
    140 
    141 ; CHECK-LABEL: f7
    142 ; CHECK: bl
    143 define void @f7() {
    144   call void asm sideeffect "bl $0", "X"( i8* blockaddress(@f7, %bb) )
    145   br label %bb
    146 bb:
    147   ret void
    148 }
    149 
    150 ; If we use a constraint "=*X", we should get a store back to *%x (in r0).
    151 ; CHECK-LABEL: f8
    152 ; CHECK: str	r{{.*}}, [r0]
    153 define void @f8(i32 *%x) {
    154 entry:
    155   tail call void asm sideeffect "add $0, r0, r0", "=*X"(i32 *%x)
    156   ret void
    157 }
    158