Home | History | Annotate | Download | only in XCore
      1 ; RUN: llc < %s -march=xcore | FileCheck %s
      2 ; RUN: llc < %s -march=xcore -disable-fp-elim | FileCheck %s -check-prefix=CHECKFP
      3 
      4 ; When using SP for small frames, we don't need any scratch registers (SR).
      5 ; When using SP for large frames, we may need two scratch registers.
      6 ; When using FP, for large or small frames, we may need one scratch register.
      7 
      8 ; FP + small frame: spill FP+SR = entsp 2
      9 ; CHECKFP-LABEL: f1
     10 ; CHECKFP: entsp 2
     11 ; CHECKFP-NEXT: stw r10, sp[1]
     12 ; CHECKFP-NEXT: ldaw r10, sp[0]
     13 ; CHECKFP: set sp, r10
     14 ; CHECKFP-NEXT: ldw r10, sp[1]
     15 ; CHECKFP-NEXT: retsp 2
     16 ;
     17 ; !FP + small frame: no spills = no stack adjustment needed
     18 ; CHECK-LABEL: f1
     19 ; CHECK: stw lr, sp[0]
     20 ; CHECK: ldw lr, sp[0]
     21 ; CHECK-NEXT: retsp 0
     22 define void @f1() nounwind {
     23 entry:
     24   tail call void asm sideeffect "", "~{lr}"() nounwind
     25   ret void
     26 }
     27 
     28 
     29 ; FP + small frame: spill FP+SR+R0+LR = entsp 3 + extsp 1
     30 ; CHECKFP-LABEL:f3
     31 ; CHECKFP: entsp 3
     32 ; CHECKFP-NEXT: stw r10, sp[1]
     33 ; CHECKFP-NEXT: ldaw r10, sp[0]
     34 ; CHECKFP-NEXT: stw [[REG:r[4-9]+]], r10[2]
     35 ; CHECKFP-NEXT: mov [[REG]], r0
     36 ; CHECKFP-NEXT: extsp 1
     37 ; CHECKFP-NEXT: bl f2
     38 ; CHECKFP-NEXT: ldaw sp, sp[1]
     39 ; CHECKFP-NEXT: mov r0, [[REG]]
     40 ; CHECKFP-NEXT: ldw [[REG]], r10[2]
     41 ; CHECKFP-NEXT: set sp, r10
     42 ; CHECKFP-NEXT: ldw r10, sp[1]
     43 ; CHECKFP-NEXT: retsp 3
     44 ;
     45 ; !FP + small frame: spill R0+LR = entsp 2
     46 ; CHECK-LABEL: f3
     47 ; CHECK: entsp 2
     48 ; CHECK-NEXT: stw [[REG:r[4-9]+]], sp[1]
     49 ; CHECK-NEXT: mov [[REG]], r0
     50 ; CHECK-NEXT: bl f2
     51 ; CHECK-NEXT: mov r0, [[REG]]
     52 ; CHECK-NEXT: ldw [[REG]], sp[1]
     53 ; CHECK-NEXT: retsp 2
     54 declare void @f2()
     55 define i32 @f3(i32 %i) nounwind {
     56 entry:
     57   call void @f2()
     58   ret i32 %i
     59 }
     60 
     61 
     62 ; FP + large frame: spill FP+SR = entsp 2 + 100000
     63 ; CHECKFP-LABEL: f4
     64 ; CHECKFP: entsp 65535
     65 ; CHECKFP-NEXT: .Ltmp{{[0-9]+}}
     66 ; CHECKFP-NEXT: .cfi_def_cfa_offset 262140
     67 ; CHECKFP-NEXT: .Ltmp{{[0-9]+}}
     68 ; CHECKFP-NEXT: .cfi_offset 15, 0
     69 ; CHECKFP-NEXT: extsp 34467
     70 ; CHECKFP-NEXT: .Ltmp{{[0-9]+}}
     71 ; CHECKFP-NEXT: .cfi_def_cfa_offset 400008
     72 ; CHECKFP-NEXT: stw r10, sp[1]
     73 ; CHECKFP-NEXT: .Ltmp{{[0-9]+}}
     74 ; CHECKFP-NEXT: .cfi_offset 10, -400004
     75 ; CHECKFP-NEXT: ldaw r10, sp[0]
     76 ; CHECKFP-NEXT: .Ltmp{{[0-9]+}}
     77 ; CHECKFP-NEXT: .cfi_def_cfa_register 10
     78 ; CHECKFP-NEXT: set sp, r10
     79 ; CHECKFP-NEXT: ldw r10, sp[1]
     80 ; CHECKFP-NEXT: ldaw sp, sp[65535]
     81 ; CHECKFP-NEXT: retsp 34467
     82 ;
     83 ; !FP + large frame: spill SR+SR = entsp 2 + 100000
     84 ; CHECK-LABEL: f4
     85 ; CHECK: entsp 65535
     86 ; CHECK-NEXT: .Ltmp{{[0-9]+}}
     87 ; CHECK-NEXT: .cfi_def_cfa_offset 262140
     88 ; CHECK-NEXT: .Ltmp{{[0-9]+}}
     89 ; CHECK-NEXT: .cfi_offset 15, 0
     90 ; CHECK-NEXT: extsp 34467
     91 ; CHECK-NEXT: .Ltmp{{[0-9]+}}
     92 ; CHECK-NEXT: .cfi_def_cfa_offset 400008
     93 ; CHECK-NEXT: ldaw sp, sp[65535]
     94 ; CHECK-NEXT: retsp 34467
     95 define void @f4() {
     96 entry:
     97   %0 = alloca [100000 x i32]
     98   ret void
     99 }
    100 
    101 
    102 ; FP + large frame: spill FP+SR+R4+LR = entsp 3 + 200000  + extsp 1
    103 ; CHECKFP: .section .cp.rodata.cst4,"aMc",@progbits,4
    104 ; CHECKFP-NEXT: .align 4
    105 ; CHECKFP-NEXT: .LCPI[[CNST0:[0-9_]+]]:
    106 ; CHECKFP-NEXT: .long 200002
    107 ; CHECKFP-NEXT: .LCPI[[CNST1:[0-9_]+]]:
    108 ; CHECKFP-NEXT: .long 200001
    109 ; CHECKFP-NEXT: .text
    110 ; CHECKFP-LABEL: f6
    111 ; CHECKFP: entsp 65535
    112 ; CHECKFP-NEXT: .Ltmp{{[0-9]+}}
    113 ; CHECKFP-NEXT: .cfi_def_cfa_offset 262140
    114 ; CHECKFP-NEXT: .Ltmp{{[0-9]+}}
    115 ; CHECKFP-NEXT: .cfi_offset 15, 0
    116 ; CHECKFP-NEXT: extsp 65535
    117 ; CHECKFP-NEXT: .Ltmp{{[0-9]+}}
    118 ; CHECKFP-NEXT: .cfi_def_cfa_offset 524280
    119 ; CHECKFP-NEXT: extsp 65535
    120 ; CHECKFP-NEXT: .Ltmp{{[0-9]+}}
    121 ; CHECKFP-NEXT: .cfi_def_cfa_offset 786420
    122 ; CHECKFP-NEXT: extsp 3398
    123 ; CHECKFP-NEXT: .Ltmp{{[0-9]+}}
    124 ; CHECKFP-NEXT: .cfi_def_cfa_offset 800012
    125 ; CHECKFP-NEXT: stw r10, sp[1]
    126 ; CHECKFP-NEXT: .Ltmp{{[0-9]+}}
    127 ; CHECKFP-NEXT: .cfi_offset 10, -800008
    128 ; CHECKFP-NEXT: ldaw r10, sp[0]
    129 ; CHECKFP-NEXT: .Ltmp{{[0-9]+}}
    130 ; CHECKFP-NEXT: .cfi_def_cfa_register 10
    131 ; CHECKFP-NEXT: ldw r1, cp[.LCPI[[CNST0]]]
    132 ; CHECKFP-NEXT: stw [[REG:r[4-9]+]], r10[r1]
    133 ; CHECKFP-NEXT: .Ltmp{{[0-9]+}}
    134 ; CHECKFP-NEXT: .cfi_offset 4, -4
    135 ; CHECKFP-NEXT: mov [[REG]], r0
    136 ; CHECKFP-NEXT: extsp 1
    137 ; CHECKFP-NEXT: ldaw r0, r10[2]
    138 ; CHECKFP-NEXT: bl f5
    139 ; CHECKFP-NEXT: ldaw sp, sp[1]
    140 ; CHECKFP-NEXT: ldw r1, cp[.LCPI3_1]
    141 ; CHECKFP-NEXT: ldaw r0, r10[r1]
    142 ; CHECKFP-NEXT: extsp 1
    143 ; CHECKFP-NEXT: bl f5
    144 ; CHECKFP-NEXT: ldaw sp, sp[1]
    145 ; CHECKFP-NEXT: mov r0, [[REG]]
    146 ; CHECKFP-NEXT: ldw r1, cp[.LCPI[[CNST0]]]
    147 ; CHECKFP-NEXT: ldw [[REG]], r10[r1]
    148 ; CHECKFP-NEXT: set sp, r10
    149 ; CHECKFP-NEXT: ldw r10, sp[1]
    150 ; CHECKFP-NEXT: ldaw sp, sp[65535]
    151 ; CHECKFP-NEXT: ldaw sp, sp[65535]
    152 ; CHECKFP-NEXT: ldaw sp, sp[65535]
    153 ; CHECKFP-NEXT: retsp 3398
    154 ;
    155 ; !FP + large frame: spill SR+SR+R4+LR = entsp 4 + 200000
    156 ; CHECK: .section .cp.rodata.cst4,"aMc",@progbits,4
    157 ; CHECK-NEXT: .align 4
    158 ; CHECK-NEXT: .LCPI[[CNST0:[0-9_]+]]:
    159 ; CHECK-NEXT: .long 200003
    160 ; CHECK-NEXT: .LCPI[[CNST1:[0-9_]+]]:
    161 ; CHECK-NEXT: .long 200002
    162 ; CHECK-NEXT: .text
    163 ; CHECK-LABEL: f6
    164 ; CHECK: entsp 65535
    165 ; CHECK-NEXT: .Ltmp{{[0-9]+}}
    166 ; CHECK-NEXT: .cfi_def_cfa_offset 262140
    167 ; CHECK-NEXT: .Ltmp{{[0-9]+}}
    168 ; CHECK-NEXT: .cfi_offset 15, 0
    169 ; CHECK-NEXT: extsp 65535
    170 ; CHECK-NEXT: .Ltmp{{[0-9]+}}
    171 ; CHECK-NEXT: .cfi_def_cfa_offset 524280
    172 ; CHECK-NEXT: extsp 65535
    173 ; CHECK-NEXT: .Ltmp{{[0-9]+}}
    174 ; CHECK-NEXT: .cfi_def_cfa_offset 786420
    175 ; CHECK-NEXT: extsp 3399
    176 ; CHECK-NEXT: .Ltmp{{[0-9]+}}
    177 ; CHECK-NEXT: .cfi_def_cfa_offset 800016
    178 ; CHECK-NEXT: ldaw r1, sp[0]
    179 ; CHECK-NEXT: ldw r2, cp[.LCPI[[CNST0]]]
    180 ; CHECK-NEXT: stw [[REG:r[4-9]+]], r1[r2]
    181 ; CHECK-NEXT: .Ltmp{{[0-9]+}}
    182 ; CHECK-NEXT: .cfi_offset 4, -4
    183 ; CHECK-NEXT: mov [[REG]], r0
    184 ; CHECK-NEXT: ldaw r0, sp[3]
    185 ; CHECK-NEXT: bl f5
    186 ; CHECK-NEXT: ldaw r0, sp[0]
    187 ; CHECK-NEXT: ldw r1, cp[.LCPI[[CNST1]]]
    188 ; CHECK-NEXT: ldaw r0, r0[r1]
    189 ; CHECK-NEXT: bl f5
    190 ; CHECK-NEXT: mov r0, [[REG]]
    191 ; CHECK-NEXT: ldaw [[REG]], sp[0]
    192 ; CHECK-NEXT: ldw r1, cp[.LCPI[[CNST0]]]
    193 ; CHECK-NEXT: ldw [[REG]], [[REG]][r1]
    194 ; CHECK-NEXT: ldaw sp, sp[65535]
    195 ; CHECK-NEXT: ldaw sp, sp[65535]
    196 ; CHECK-NEXT: ldaw sp, sp[65535]
    197 ; CHECK-NEXT: retsp 3399
    198 declare void @f5(i32*)
    199 define i32 @f6(i32 %i) {
    200 entry:
    201   %0 = alloca [200000 x i32]
    202   %1 = getelementptr inbounds [200000 x i32], [200000 x i32]* %0, i32 0, i32 0
    203   call void @f5(i32* %1)
    204   %2 = getelementptr inbounds [200000 x i32], [200000 x i32]* %0, i32 0, i32 199999
    205   call void @f5(i32* %2)
    206   ret i32 %i
    207 }
    208 
    209 ; FP + large frame: spill FP+SR+LR = entsp 2 + 256  + extsp 1
    210 ; CHECKFP-LABEL:f8
    211 ; CHECKFP: entsp 258
    212 ; CHECKFP-NEXT: stw r10, sp[1]
    213 ; CHECKFP-NEXT: ldaw r10, sp[0]
    214 ; CHECKFP-NEXT: mkmsk [[REG:r[0-9]+]], 8
    215 ; CHECKFP-NEXT: ldaw r0, r10{{\[}}[[REG]]{{\]}}
    216 ; CHECKFP-NEXT: extsp 1
    217 ; CHECKFP-NEXT: bl f5
    218 ; CHECKFP-NEXT: ldaw sp, sp[1]
    219 ; CHECKFP-NEXT: set sp, r10
    220 ; CHECKFP-NEXT: ldw r10, sp[1]
    221 ; CHECKFP-NEXT: retsp 258
    222 ;
    223 ; !FP + large frame: spill SR+SR+LR = entsp 3 + 256
    224 ; CHECK-LABEL:f8
    225 ; CHECK: entsp 257
    226 ; CHECK-NEXT: ldaw r0, sp[254]
    227 ; CHECK-NEXT: bl f5
    228 ; CHECK-NEXT: retsp 257
    229 define void @f8() nounwind {
    230 entry:
    231   %0 = alloca [256 x i32]
    232   %1 = getelementptr inbounds [256 x i32], [256 x i32]* %0, i32 0, i32 253
    233   call void @f5(i32* %1)
    234   ret void
    235 }
    236 
    237 ; FP + large frame: spill FP+SR+LR = entsp 2 + 32768  + extsp 1
    238 ; CHECKFP-LABEL:f9
    239 ; CHECKFP: entsp 32770
    240 ; CHECKFP-NEXT: stw r10, sp[1]
    241 ; CHECKFP-NEXT: ldaw r10, sp[0]
    242 ; CHECKFP-NEXT: ldc [[REG:r[0-9]+]], 32767
    243 ; CHECKFP-NEXT: ldaw r0, r10{{\[}}[[REG]]{{\]}}
    244 ; CHECKFP-NEXT: extsp 1
    245 ; CHECKFP-NEXT: bl f5
    246 ; CHECKFP-NEXT: ldaw sp, sp[1]
    247 ; CHECKFP-NEXT: set sp, r10
    248 ; CHECKFP-NEXT: ldw r10, sp[1]
    249 ; CHECKFP-NEXT: retsp 32770
    250 ;
    251 ; !FP + large frame: spill SR+SR+LR = entsp 3 + 32768
    252 ; CHECK-LABEL:f9
    253 ; CHECK: entsp 32771
    254 ; CHECK-NEXT: ldaw r0, sp[32768]
    255 ; CHECK-NEXT: bl f5
    256 ; CHECK-NEXT: retsp 32771
    257 define void @f9() nounwind {
    258 entry:
    259   %0 = alloca [32768 x i32]
    260   %1 = getelementptr inbounds [32768 x i32], [32768 x i32]* %0, i32 0, i32 32765
    261   call void @f5(i32* %1)
    262   ret void
    263 }
    264