Home | History | Annotate | Download | only in ARM
      1 ; Disable shrink-wrapping on the first run; otherwise we wouldn't
      2 ; exercise the path for PR18136.
      3 ; RUN: llc -mtriple=thumbv7-apple-none-macho < %s -enable-shrink-wrap=false | FileCheck %s
      4 ; RUN: llc -mtriple=thumbv6m-apple-none-macho -disable-fp-elim < %s | FileCheck %s --check-prefix=CHECK-T1
      5 ; RUN: llc -mtriple=thumbv7-apple-darwin-ios -disable-fp-elim < %s | FileCheck %s --check-prefix=CHECK-IOS
      6 ; RUN: llc -mtriple=thumbv7--linux-gnueabi -disable-fp-elim < %s | FileCheck %s --check-prefix=CHECK-LINUX
      7 
      8 
      9 declare void @bar(i8*)  ; external callee; most tests below pass their alloca to it
     10 
          ; Two-double aggregate used as the type of @var.
     11 %bigVec = type [2 x double]
     12 
          ; Loaded before and stored after the call in check_vfp_no_return_clobber.
     13 @var = global %bigVec zeroinitializer
     14 
     15 define void @check_simple() minsize {
          ; 16 bytes of locals under minsize: every run expects the sp adjustment to be
          ; folded into the push/pop register lists, with no separate sub/add on sp.
     16 ; CHECK-LABEL: check_simple:
     17 ; CHECK: push {r3, r4, r5, r6, r7, lr}
     18 ; CHECK-NOT: sub sp,
     19 ; ...
     20 ; CHECK-NOT: add sp,
     21 ; CHECK: pop {r0, r1, r2, r3, r7, pc}
     22 
     23 ; CHECK-T1-LABEL: check_simple:
     24 ; CHECK-T1: push {r3, r4, r5, r6, r7, lr}
     25 ; CHECK-T1: add r7, sp, #16
     26 ; CHECK-T1-NOT: sub sp,
     27 ; ...
     28 ; CHECK-T1-NOT: add sp,
     29 ; CHECK-T1: pop {r0, r1, r2, r3, r7, pc}
     30 
     31   ; iOS always has a frame pointer and messing with the push affects
     32   ; how it's set in the prologue. Make sure we get that right.
          ; As in the other runs, the pop is expected to reload the padding slots into
          ; r0-r3 rather than back into r4-r6.
     33 ; CHECK-IOS-LABEL: check_simple:
     34 ; CHECK-IOS: push {r3, r4, r5, r6, r7, lr}
     35 ; CHECK-IOS-NOT: sub sp,
     36 ; CHECK-IOS: add r7, sp, #16
     37 ; CHECK-IOS-NOT: sub sp,
     38 ; ...
     39 ; CHECK-IOS-NOT: add sp,
     40 ; CHECK-IOS: pop {r0, r1, r2, r3, r7, pc}
     41 
     42   %var = alloca i8, i32 16
     43   call void @bar(i8* %var)
     44   ret void
     45 }
     46 
     47 define void @check_simple_too_big() minsize {
          ; 64 bytes of locals: the checks expect a plain {r7, lr} push/pop with an
          ; explicit sub/add on sp instead of a folded adjustment.
     48 ; CHECK-LABEL: check_simple_too_big:
     49 ; CHECK: push {r7, lr}
     50 ; CHECK: sub sp,
     51 ; ... (call to bar; not checked)
     52 ; CHECK: add sp,
     53 ; CHECK: pop {r7, pc}
     54   %scratch = alloca i8, i32 64
     55   call void @bar(i8* %scratch)
     56   ret void
     57 }
     58 
     59 define void @check_vfp_fold() minsize {
          ; The inline asm clobbers d8/d9, so a VFP save/restore sits next to the
          ; 16-byte alloca; the default run expects the adjustment folded into vpush/vpop.
     60 ; CHECK-LABEL: check_vfp_fold:
     61 ; CHECK: push {r[[GLOBREG:[0-9]+]], lr}
     62 ; CHECK: vpush {d6, d7, d8, d9}
     63 ; CHECK-NOT: sub sp,
     64 ; ... (asm and call to bar; not checked)
     65 ; CHECK-NOT: add sp,
     66 ; CHECK: vpop {d6, d7, d8, d9}
     67 ; CHECK: pop {r[[GLOBREG]], pc}
     68 
     69   ; The iOS run saves d8/d9 with aligned NEON stores rather than a vpush,
     70   ; which conveniently lets this test cover that path as well.
     71 ; CHECK-IOS-LABEL: check_vfp_fold:
     72 ; CHECK-IOS: push {r4, r7, lr}
     73 ; CHECK-IOS: sub.w r4, sp, #16
     74 ; CHECK-IOS: bfc r4, #0, #4
     75 ; CHECK-IOS: mov sp, r4
     76 ; CHECK-IOS: vst1.64 {d8, d9}, [r4:128]
     77 ; CHECK-IOS: sub sp, #16
     78 ; ... (asm and call to bar; not checked)
     79 ; CHECK-IOS: add r4, sp, #16
     80 ; CHECK-IOS: vld1.64 {d8, d9}, [r4:128]
     81 ; CHECK-IOS: mov sp, r4
     82 ; CHECK-IOS: pop {r4, r7, pc}
     83 
     84   %slot = alloca i8, i32 16
     85 
     86   call void asm "", "r,~{d8},~{d9}"(i8* %slot)
     87   call void @bar(i8* %slot)
     88 
     89   ret void
     90 }
     91 
     92 ; The frame here is exactly big enough that "add sp, sp, ..." could be folded
     93 ; into the pop, except that doing so would overwrite the i64 being returned.
     94 define i64 @check_no_return_clobber() minsize {
     95 ; CHECK-LABEL: check_no_return_clobber:
     96 ; CHECK: push {r1, r2, r3, r4, r5, r6, r7, lr}
     97 ; CHECK-NOT: sub sp,
     98 ; ... (call to bar; not checked)
     99 ; CHECK: add sp, #24
    100 ; CHECK: pop {r7, pc}
    101 
    102   ; Anchor for the iOS run so the previous function's checks stay inside it:
    103 ; CHECK-IOS-LABEL: check_no_return_clobber:
    104 
    105   %buf = alloca i8, i32 20
    106   call void @bar(i8* %buf)
    107   ret i64 0
    108 }
    109 
    110 define arm_aapcs_vfpcc double @check_vfp_no_return_clobber() minsize {
          ; Returns a double under arm_aapcs_vfpcc: the prologue is expected to fold the
          ; 64-byte frame into the vpush, while the epilogue adjusts sp explicitly and
          ; restores only d8/d9.
    111 ; CHECK-LABEL: check_vfp_no_return_clobber:
    112 ; CHECK: push {r[[GLOBREG:[0-9]+]], lr}
    113 ; CHECK: vpush {d0, d1, d2, d3, d4, d5, d6, d7, d8, d9}
    114 ; CHECK-NOT: sub sp,
    115 ; ... (load, call to bar, store; not checked)
    116 ; CHECK: add sp, #64
    117 ; CHECK: vpop {d8, d9}
    118 ; CHECK: pop {r[[GLOBREG]], pc}
    119 
    120   %buf = alloca i8, i32 64
    121 
    122   %saved = load %bigVec, %bigVec* @var
    123   call void @bar(i8* %buf)
    124   store %bigVec %saved, %bigVec* @var
    125 
    126   ret double 1.0
    127 }
    128 
    129 @dbl = global double 0.0  ; loaded on entry and stored back on the %true path of test_fold_point
    130 
    131 ; PR18136: there was a bug determining where the first eligible pop in a
    132 ; basic-block was when the entire block was epilogue code.
    133 define void @test_fold_point(i1 %tst) minsize {
    134 ; CHECK-LABEL: test_fold_point:
    135 
    136   ; Important to check for beginning of basic block, because if it gets
    137   ; if-converted the test is probably no longer checking what it should.
          ; The two directives after the block-name match require the vpop and the pop
          ; to be the very next lines of output.
    138 ; CHECK: %end
    139 ; CHECK-NEXT: vpop {d7, d8}
    140 ; CHECK-NEXT: pop {r4, pc}
    141 
    142   ; With a guaranteed frame-pointer, we want to make sure that its offset in the
    143   ; push block is correct, even if a few registers have been tacked onto a later
    144   ; vpush (PR18160).
    145 ; CHECK-IOS-LABEL: test_fold_point:
    146 ; CHECK-IOS: push {r4, r7, lr}
    147 ; CHECK-IOS-NEXT: add r7, sp, #4
    148 ; CHECK-IOS-NEXT: vpush {d7, d8}
    149 
    150   ; We want some memory so there's a stack adjustment to fold...
    151   %var = alloca i8, i32 8
    152 
    153   ; We want a long-lived floating register so that a callee-saved dN is used and
    154   ; there's both a vpop and a pop.
    155   %live_val = load double, double* @dbl
    156   br i1 %tst, label %true, label %end
    157 true:
          ; The call sits between the load and the store, keeping %live_val live across it.
    158   call void @bar(i8* %var)
    159   store double %live_val, double* @dbl
    160   br label %end
    161 end:
    162   ; We want the epilogue to be the only thing in a basic block so that we hit
    163   ; the correct edge-case (first inst in block is correct one to adjust).
    164   ret void
    165 }
    166 
    167 define void @test_varsize(...) minsize {
          ; Variadic function: both runs expect a 16-byte sp adjustment ahead of the
          ; push and a matching "add sp, #16" after the pop, followed by a bx return.
    168 ; CHECK-T1-LABEL: test_varsize:
    169 ; CHECK-T1: sub	sp, #16
    170 ; CHECK-T1: push	{r5, r6, r7, lr}
    171 ; ... (va_start and call to bar; not checked)
    172 ; CHECK-T1: pop	{r2, r3, r7}
    173 ; CHECK-T1: pop {[[POP_REG:r[0-3]]]}
    174 ; CHECK-T1: add	sp, #16
    175 ; CHECK-T1: bx	[[POP_REG]]
    176 
    177 ; CHECK-LABEL: test_varsize:
    178 ; CHECK: sub	sp, #16
    179 ; CHECK: push	{r5, r6, r7, lr}
    180 ; ... (va_start and call to bar; not checked)
    181 ; CHECK: pop.w	{r2, r3, r7, lr}
    182 ; CHECK: add	sp, #16
    183 ; CHECK: bx	lr
    184 
    185   %ap = alloca i8, i32 8
    186   call void @llvm.va_start(i8* %ap)
    187   call void @bar(i8* %ap)
    188   ret void
    189 }
    190 
    191 %"MyClass" = type { i8*, i32, i32, float, float, float, [2 x i8], i32, i32* }  ; type of the alloca in check_vfp_no_return_clobber2
    192 
    193 declare float @foo()  ; its result is the value check_vfp_no_return_clobber2 returns
    194 
    195 declare void @bar3()  ; called only on the if.then path of check_vfp_no_return_clobber2
    196 
    197 declare %"MyClass"* @bar2(%"MyClass"* returned, i16*, i32, float, float, i32, i32, i1 zeroext, i1 zeroext, i32)  ; ten-argument callee that receives the alloca
    198 
    199 define fastcc float @check_vfp_no_return_clobber2(i16* %r, i16* %chars, i32 %length, i1 zeroext %flag) minsize {
    200 entry:
          ; Linux-only checks: the frame is expected to be folded into the vpush on
          ; entry (so no sub of sp), while the epilogue keeps an explicit add on sp and
          ; restores only d8 -- presumably so the float result from @foo is not
          ; overwritten by a wider vpop (TODO confirm against the calling convention).
    201 ; CHECK-LINUX-LABEL: check_vfp_no_return_clobber2:
    202 ; CHECK-LINUX: vpush	{d0, d1, d2, d3, d4, d5, d6, d7, d8}
    203 ; CHECK-LINUX-NOT: sub sp,
    204 ; ...
    205 ; CHECK-LINUX: add sp
    206 ; CHECK-LINUX: vpop {d8}
    207   %run = alloca %"MyClass", align 4
    208   %call = call %"MyClass"* @bar2(%"MyClass"* %run, i16* %chars, i32 %length, float 0.000000e+00, float 0.000000e+00, i32 1, i32 1, i1 zeroext false, i1 zeroext true, i32 3)
    209   %call1 = call float @foo()
    210   %cmp = icmp eq %"MyClass"* %run, null
    211   br i1 %cmp, label %exit, label %if.then
    212 
    213 if.then:                                          ; preds = %entry
    214   call void @bar3()
    215   br label %exit
    216 
    217 exit:                                             ; preds = %if.then, %entry
    218   ret float %call1
    219 }
    220 
    221 declare void @use_arr(i32*)
    222 define void @test_fold_reuse() minsize {
          ; The asm clobbers r4 and r8, so both appear in the push/pop lists; the
          ; 24-byte frame is expected to remain an explicit sub/add on sp.
    223 ; CHECK-LABEL: test_fold_reuse:
    224 ; CHECK: push.w {r4, r7, r8, lr}
    225 ; CHECK: sub sp, #24
    226 ; ... (asm and call to bar; not checked)
    227 ; CHECK: add sp, #24
    228 ; CHECK: pop.w {r4, r7, r8, pc}
    229   %buf = alloca i8, i32 24
    230   call void asm sideeffect "", "~{r8},~{r4}"()
    231   call void @bar(i8* %buf)
    232   ret void
    233 }
    234 
    235 declare void @llvm.va_start(i8*) nounwind  ; intrinsic called by test_varsize
    236