Home | History | Annotate | Download | only in ARM
      1 ; RUN: llc < %s -mtriple=armv7k-apple-watchos2.0 | FileCheck %s
      2 ; RUN: llc < %s -mtriple=armv7k-apple-watchos2.0 -enable-shrink-wrap=true | FileCheck %s
      3 ; RUN: llc < %s -mtriple=armv7-apple-ios8.0 | FileCheck %s
      4 ; RUN: llc < %s -mtriple=armv7-apple-ios8.0 -enable-shrink-wrap=true | FileCheck %s
      5 
      6 ; RUN: llc < %s -mtriple=armv7k-apple-watchos2.0 -O0 | FileCheck --check-prefix=CHECK-O0 --check-prefix=WATCH-O0 %s
      7 ; RUN: llc < %s -mtriple=armv7-apple-ios8.0 -O0 | FileCheck --check-prefix=CHECK-O0 --check-prefix=IOS-O0 %s
      8 
      9 ; RUN: llc < %s -mtriple=thumbv7-apple-ios8.0 | FileCheck --check-prefix=THUMB %s
     10 
     11 %struct.S = type { i8 }
     12 
        ; Thread-local state used by the wrapper functions below.
        ; @sg is the %struct.S instance that @_ZTW2sg constructs on first use and returns.
     13 @sg = internal thread_local global %struct.S zeroinitializer, align 1
        ; Passed as the third argument of every @_tlv_atexit call in this file.
     14 @__dso_handle = external global i8
        ; i1 flag that @_ZTW2sg loads on entry and sets to true before calling the
        ; constructor.
     15 @__tls_guard = internal thread_local unnamed_addr global i1 false
        ; Returned by address from @_ZTW4sum1.
     16 @sum1 = internal thread_local global i32 0, align 4
     17 
     18 %class.C = type { i32 }
        ; Returned by address from @tls_test2; its i32 field is zeroed by @__tls_test.
     19 @tC = internal thread_local global %class.C zeroinitializer, align 4
     20 
        ; External callees. Under Itanium name mangling, _ZN1SC1Ev is S::S() and
        ; _ZN1SD1Ev is S::~S(); both return their argument (the "returned" attribute).
     21 declare %struct.S* @_ZN1SC1Ev(%struct.S* returned)
     22 declare %struct.S* @_ZN1SD1Ev(%struct.S* returned)
        ; NOTE(review): presumably the Darwin hook that registers a thread-local
        ; destructor (function, object, dso handle) -- confirm against the runtime docs.
     23 declare i32 @_tlv_atexit(void (i8*)*, i8*, i8*)
     24 
     25 ; Verify that the epilogue does not clobber a CSR that CXX_FAST_TLS handles explicitly.
        ; The Thumb patterns require lr to be pushed on entry, three blx instructions
        ; (a bne jumps past the second one and the tlv_atexit reference), and a use of
        ; r4 before the final pop that restores it.
     26 ; THUMB-LABEL: _ZTW2sg
     27 ; THUMB: push {{.*}}lr
     28 ; THUMB: blx
     29 ; THUMB: bne [[TH_end:.?LBB0_[0-9]+]]
     30 ; THUMB: blx
     31 ; THUMB: tlv_atexit
     32 ; THUMB: [[TH_end]]:
     33 ; THUMB: blx
     34 ; THUMB: r4
     35 ; THUMB: pop {{.*}}r4
        ; Wrapper for @sg: if @__tls_guard is still false, set it, run the constructor
        ; on @sg and hand the destructor to @_tlv_atexit. Always returns @sg.
     36 define cxx_fast_tlscc nonnull %struct.S* @_ZTW2sg() nounwind {
     37   %guard.set = load i1, i1* @__tls_guard, align 1
     38   br i1 %guard.set, label %return.sg, label %first.use
     39 
     40 first.use:
     41   store i1 true, i1* @__tls_guard, align 1
     42   %ctor.self = tail call %struct.S* @_ZN1SC1Ev(%struct.S* nonnull @sg)
     43   %atexit.status = tail call i32 @_tlv_atexit(void (i8*)* nonnull bitcast (%struct.S* (%struct.S*)* @_ZN1SD1Ev to void (i8*)*), i8* nonnull getelementptr inbounds (%struct.S, %struct.S* @sg, i64 0, i32 0), i8* nonnull @__dso_handle)
     44   br label %return.sg
     45 
     46 return.sg:
     47   ret %struct.S* @sg
     48 }
     49 
     50 ; CHECK-LABEL: _ZTW2sg
        ; Optimized ARM-mode expectations for the wrapper of @sg: only core registers
        ; are pushed and popped around the three calls. The d-register vpush/vpop
        ; pairs and the wider core-register pop lists listed as negative patterns
        ; must not appear.
     51 ; CHECK: push {r4, r5, r7, lr}
     52 ; CHECK: push {r11, r12}
     53 ; CHECK-NOT: vpush {d16, d17, d18, d19, d20, d21, d22, d23, d24, d25, d26, d27, d28, d29, d30, d31}
     54 ; CHECK-NOT: vpush {d0, d1, d2, d3, d4, d5, d6, d7}
     55 ; CHECK: blx
     56 ; CHECK: bne [[BB_end:.?LBB0_[0-9]+]]
     57 ; CHECK: blx
     58 ; CHECK: tlv_atexit
     59 ; CHECK: [[BB_end]]:
     60 ; CHECK: blx
     61 ; CHECK-NOT: vpop {d0, d1, d2, d3, d4, d5, d6, d7}
     62 ; CHECK-NOT: vpop {d16, d17, d18, d19, d20, d21, d22, d23, d24, d25, d26, d27, d28, d29, d30, d31}
     63 ; CHECK-NOT: pop {r9, r12}
     64 ; CHECK-NOT: pop {r1, r2, r3, r4, r7, pc}
     65 ; CHECK: pop {r4, r5, r7, pc}
     66 
        ; Expectations for the -O0 runs of the same function: d16-d31 and d0-d7 are
        ; saved with vpush before the calls and restored with vpop afterwards, in
        ; reverse order. The outer core-register push/pop lists differ between the
        ; watchOS and iOS runs (watchOS additionally lists r6).
     67 ; CHECK-O0-LABEL: _ZTW2sg
     68 ; WATCH-O0: push {r1, r2, r3, r6, r7, lr}
     69 ; IOS-O0: push {r1, r2, r3, r7, lr}
     70 ; CHECK-O0: push {r9, r12}
     71 ; CHECK-O0: vpush {d16, d17, d18, d19, d20, d21, d22, d23, d24, d25, d26, d27, d28, d29, d30, d31}
     72 ; CHECK-O0: vpush {d0, d1, d2, d3, d4, d5, d6, d7}
     73 ; CHECK-O0: blx
     74 ; CHECK-O0: bne [[BB_end:.?LBB0_[0-9]+]]
     75 ; CHECK-O0: blx
     76 ; CHECK-O0: tlv_atexit
     77 ; CHECK-O0: [[BB_end]]:
     78 ; CHECK-O0: blx
     79 ; CHECK-O0: vpop {d0, d1, d2, d3, d4, d5, d6, d7}
     80 ; CHECK-O0: vpop {d16, d17, d18, d19, d20, d21, d22, d23, d24, d25, d26, d27, d28, d29, d30, d31}
     81 ; CHECK-O0: pop {r9, r12}
     82 ; WATCH-O0: pop {r1, r2, r3, r6, r7, pc}
     83 ; IOS-O0: pop {r1, r2, r3, r7, pc}
     84 
     85 ; CHECK-LABEL: _ZTW4sum1
        ; Optimized runs: none of the listed core-register or d-register saves may
        ; appear before the first blx of this function.
     86 ; CHECK-NOT: push {r1, r2, r3, r4, r7, lr}
     87 ; CHECK-NOT: push {r9, r12}
     88 ; CHECK-NOT: vpush {d16, d17, d18, d19, d20, d21, d22, d23, d24, d25, d26, d27, d28, d29, d30, d31}
     89 ; CHECK-NOT: vpush {d0, d1, d2, d3, d4, d5, d6, d7}
     90 ; CHECK: blx
     91 
        ; -O0 runs: no vpush/vstr/vpop/vldr may appear between the function label
        ; and the pop that the last pattern matches.
     92 ; CHECK-O0-LABEL: _ZTW4sum1
     93 ; CHECK-O0-NOT: vpush
     94 ; CHECK-O0-NOT: vstr
     95 ; CHECK-O0-NOT: vpop
     96 ; CHECK-O0-NOT: vldr
     97 ; CHECK-O0: pop
        ; Wrapper for @sum1: no guard and no initialization, it only returns the
        ; address of the thread-local i32.
     98 define cxx_fast_tlscc nonnull i32* @_ZTW4sum1() nounwind {
     99   ret i32* @sum1
    100 }
    101 
    102 ; Make sure that at O0 we do not spill or reload the CSRs around a call to
        ; another cxx_fast_tlscc function: a push and a pop are expected, but no
        ; vpush/vstr before the tls_helper call and no vpop/vldr after it.
    103 ; CHECK-O0-LABEL: tls_test2
    104 ; CHECK-O0: push
    105 ; CHECK-O0-NOT: vpush
    106 ; CHECK-O0-NOT: vstr
    107 ; CHECK-O0: tls_helper
    108 ; CHECK-O0-NOT: vpop
    109 ; CHECK-O0-NOT: vldr
    110 ; CHECK-O0: pop
    111 declare cxx_fast_tlscc void @tls_helper()
        ; Caller and callee both use cxx_fast_tlscc; the function calls the helper
        ; and then returns the address of the thread-local @tC.
    112 define cxx_fast_tlscc %class.C* @tls_test2() #1 {
    113   call cxx_fast_tlscc void @tls_helper()
    114   ret %class.C* @tC
    115 }
    116 
    117 ; Make sure we do not allow a tail call when caller and callee have different
    118 ; calling conventions: the caller is cxx_fast_tlscc, while _tlv_atexit uses the
        ; default convention, so the call must be emitted as bl and never as a plain
        ; branch.
    119 declare %class.C* @_ZN1CD1Ev(%class.C* readnone returned %this)
        ; The label pattern spells out the symbol with its trailing colon. A bare
        ; "tls_test" is a substring of the earlier tls_test2 symbol and would anchor
        ; this group of patterns on the wrong function.
    120 ; CHECK-LABEL: __tls_test:
        ; CHECK-NOT: b __tlv_atexit
    121 ; CHECK: bl __tlv_atexit
        ; Zeroes the i32 field of the thread-local @tC, then registers @_ZN1CD1Ev
        ; (C::~C() under Itanium mangling) for @tC through @_tlv_atexit.
    122 define cxx_fast_tlscc void @__tls_test() {
    123 entry:
    124   store i32 0, i32* getelementptr inbounds (%class.C, %class.C* @tC, i64 0, i32 0), align 4
    125   %0 = tail call i32 @_tlv_atexit(void (i8*)* bitcast (%class.C* (%class.C*)* @_ZN1CD1Ev to void (i8*)*), i8* bitcast (%class.C* @tC to i8*), i8* nonnull @__dso_handle) #1
    126   ret void
    127 }
    128 
    129 declare void @somefunc()
        ; The caller is cxx_fast_tlscc; the callee @somefunc is declared without an
        ; explicit calling convention. The IR marks the call "tail", yet the patterns
        ; require a bl and forbid a plain b to the callee.
    130 define cxx_fast_tlscc void @test_ccmismatch_notail() {
    131 ; A tail call is not possible here because somefunc does not preserve enough
    132 ; registers.
    133 ; CHECK-LABEL: test_ccmismatch_notail:
    134 ; CHECK-NOT: b _somefunc
    135 ; CHECK: bl _somefunc
    136   tail call void @somefunc()
    137   ret void
    138 }
    139 
    140 declare cxx_fast_tlscc void @some_fast_tls_func()
        ; Mirror image of test_ccmismatch_notail: the caller has no explicit calling
        ; convention and the callee is cxx_fast_tlscc. Here the patterns require a
        ; plain b to the callee and forbid a bl.
    141 define void @test_ccmismatch_tail() {
    142 ; We can perform a tail call here because some_fast_tls_func preserves all
    143 ; necessary registers (and more).
    144 ; CHECK-LABEL: test_ccmismatch_tail:
    145 ; CHECK-NOT: bl _some_fast_tls_func
    146 ; CHECK: b _some_fast_tls_func
    147   tail call cxx_fast_tlscc void @some_fast_tls_func()
    148   ret void
    149 }
    150 
        ; Attribute groups. NOTE(review): #0 is not referenced by any function or call
        ; in the portion of the file under review; #1 is used by @tls_test2 and by the
        ; @_tlv_atexit call inside @__tls_test.
    151 attributes #0 = { nounwind "no-frame-pointer-elim"="true" }
    152 attributes #1 = { nounwind }
    153