Home | History | Annotate | Download | only in PowerPC
      1 ; RUN: llc -mtriple=powerpc64-unknown-linux-gnu -mcpu=pwr7 < %s | FileCheck %s
      2 ; RUN: llc -mtriple=powerpc64-unknown-linux-gnu -mcpu=pwr7 -disable-fp-elim < %s | FileCheck -check-prefix=CHECK-FP %s
      3 ; RUN: llc -mtriple=powerpc-unknown-linux-gnu -disable-fp-elim < %s | FileCheck -check-prefix=CHECK-32 %s
      4 ; RUN: llc -mtriple=powerpc-unknown-linux-gnu -disable-fp-elim -relocation-model=pic < %s | FileCheck -check-prefix=CHECK-32-PIC %s
      5 target datalayout = "E-p:64:64:64-i1:8:8-i8:8:8-i16:16:16-i32:32:32-i64:64:64-f32:32:32-f64:64:64-f128:128:128-v128:128:128-n32:64"
      6 target triple = "powerpc64-unknown-linux-gnu"
      7 
      8 %struct.s = type { i32, i32 }
      9 
     10 declare void @bar(i32*)
     11 
     12 @barbaz = external global i32
     13 
     14 define void @goo(%struct.s* byval nocapture readonly %a) {
     15 entry:
     16   %x = alloca [2 x i32], align 32
     17   %a1 = getelementptr inbounds %struct.s, %struct.s* %a, i64 0, i32 0
     18   %0 = load i32, i32* %a1, align 4
     19   %arrayidx = getelementptr inbounds [2 x i32], [2 x i32]* %x, i64 0, i64 0
     20   store i32 %0, i32* %arrayidx, align 32
     21   %b = getelementptr inbounds %struct.s, %struct.s* %a, i64 0, i32 1
     22   %1 = load i32, i32* %b, align 4
     23   %2 = load i32, i32* @barbaz, align 4
     24   %arrayidx2 = getelementptr inbounds [2 x i32], [2 x i32]* %x, i64 0, i64 1
     25   store i32 %2, i32* %arrayidx2, align 4
     26   call void @bar(i32* %arrayidx)
     27   ret void
     28 }
     29 
     30 ; CHECK-LABEL: @goo
     31 
     32 ; CHECK-DAG: mflr {{[0-9]+}}
     33 ; CHECK-DAG: clrldi [[REG:[0-9]+]], 1, 59
     34 ; CHECK-DAG: std 30, -16(1)
     35 ; CHECK-DAG: mr 30, 1
     36 ; CHECK-DAG: std 0, 16(1)
     37 ; CHECK-DAG: subfic 0, [[REG]], -160
     38 ; CHECK: stdux 1, 1, 0
     39 
     40 ; CHECK: .cfi_def_cfa_register r30
     41 ; CHECK: .cfi_offset r30, -16
     42 ; CHECK: .cfi_offset lr, 16
     43 
     44 ; CHECK: std 3, 48(30)
     45 
     46 ; CHECK: ld 1, 0(1)
     47 ; CHECK-DAG: ld [[SR:[0-9]+]], 16(1)
     48 ; CHECK-DAG: ld 30, -16(1)
     49 ; CHECK-DAG: mtlr [[SR]]
     50 ; CHECK: blr
     51 
     52 ; CHECK-FP-LABEL: @goo
     53 
     54 ; CHECK-FP-DAG: mflr {{[0-9]+}}
     55 ; CHECK-FP-DAG: clrldi [[REG:[0-9]+]], 1, 59
     56 ; CHECK-FP-DAG: std 31, -8(1)
     57 ; CHECK-FP-DAG: std 30, -16(1)
     58 ; CHECK-FP-DAG: mr 30, 1
     59 ; CHECK-FP-DAG: std 0, 16(1)
     60 ; CHECK-FP-DAG: subfic 0, [[REG]], -160
     61 ; CHECK-FP: stdux 1, 1, 0
     62 
     63 ; CHECK-FP: .cfi_def_cfa_register r30
     64 ; CHECK-FP: .cfi_offset r31, -8
     65 ; CHECK-FP: .cfi_offset r30, -16
     66 ; CHECK-FP: .cfi_offset lr, 16
     67 
     68 ; CHECK-FP: mr 31, 1
     69 
     70 ; CHECK-FP: std 3, 48(30)
     71 
     72 ; CHECK-FP: ld 1, 0(1)
     73 ; CHECK-FP-DAG: ld [[SR:[0-9]+]], 16(1)
     74 ; CHECK-FP-DAG: ld 31, -8(1)
     75 ; CHECK-FP-DAG: ld 30, -16(1)
     76 ; CHECK-FP-DAG: mtlr [[SR]]
     77 ; CHECK-FP: blr
     78 
     79 ; CHECK-32-LABEL: @goo
     80 ; CHECK-32-DAG: mflr [[LR:[0-9]+]]
     81 ; CHECK-32-DAG: clrlwi [[REG:[0-9]+]], 1, 27
     82 ; CHECK-32-DAG: stw [[LR]], 4(1)
     83 ; CHECK-32-DAG: subfic 0, [[REG]], -64
     84 ; CHECK-32: stwux 1, 1, 0
     85 ; CHECK-32: subf 0, 0, 1
     86 ; CHECK-32: addic 0, 0, -4
     87 ; CHECK-32: stwx 31, 0, 0
     88 ; CHECK-32: addic 0, 0, -4
     89 ; CHECK-32: stwx 30, 0, 0
     90 ; CHECK-32: addic 30, 0, 8
     91 
     92 ; CHECK-32-PIC-LABEL: @goo
     93 ; CHECK-32-PIC-DAG: mflr [[LR:[0-9]+]]
     94 ; CHECK-32-PIC-DAG: clrlwi [[REG:[0-9]+]], 1, 27
     95 ; CHECK-32-PIC-DAG: stw [[LR]], 4(1)
     96 ; CHECK-32-PIC-DAG: subfic 0, [[REG]], -64
     97 ; CHECK-32-PIC:     stwux 1, 1, 0
     98 ; CHECK-32-PIC:     subf 0, 0, 1
     99 ; CHECK-32-PIC:     addic 0, 0, -4
    100 ; CHECK-32-PIC:     stwx 31, 0, 0
    101 ; CHECK-32-PIC:     addic 0, 0, -4
    102 ; CHECK-32-PIC:     stwx 30, 0, 0
    103 ; CHECK-32-PIC:     addic 0, 0, -4
    104 ; CHECK-32-PIC:     stwx 29, 0, 0
    105 ; CHECK-32-PIC:     addic 29, 0, 12
    106 
    107 ; The large-frame-size case.
    108 define void @hoo(%struct.s* byval nocapture readonly %a) {
    109 entry:
    110   %x = alloca [200000 x i32], align 32
    111   %a1 = getelementptr inbounds %struct.s, %struct.s* %a, i64 0, i32 0
    112   %0 = load i32, i32* %a1, align 4
    113   %arrayidx = getelementptr inbounds [200000 x i32], [200000 x i32]* %x, i64 0, i64 0
    114   store i32 %0, i32* %arrayidx, align 32
    115   %b = getelementptr inbounds %struct.s, %struct.s* %a, i64 0, i32 1
    116   %1 = load i32, i32* %b, align 4
    117   %arrayidx2 = getelementptr inbounds [200000 x i32], [200000 x i32]* %x, i64 0, i64 1
    118   store i32 %1, i32* %arrayidx2, align 4
    119   call void @bar(i32* %arrayidx)
    120   ret void
    121 }
    122 
    123 ; CHECK-LABEL: @hoo
    124 
    125 ; CHECK-DAG: lis [[REG1:[0-9]+]], -13
    126 ; CHECK-DAG: clrldi [[REG3:[0-9]+]], 1, 59
    127 ; CHECK-DAG: mflr {{[0-9]+}}
    128 ; CHECK-DAG: ori [[REG2:[0-9]+]], [[REG1]], 51808
    129 ; CHECK-DAG: std 30, -16(1)
    130 ; CHECK-DAG: mr 30, 1
    131 ; CHECK-DAG: std 0, 16(1)
    132 ; CHECK-DAG: subfc 0, [[REG3]], [[REG2]]
    133 ; CHECK: stdux 1, 1, 0
    134 
    135 ; CHECK: .cfi_def_cfa_register r30
    136 
    137 ; CHECK: blr
    138 
    139 ; CHECK-32-LABEL: @hoo
    140 
    141 ; CHECK-32-DAG: lis [[REG1:[0-9]+]], -13
    142 ; CHECK-32-DAG: clrlwi [[REG3:[0-9]+]], 1, 27
    143 ; CHECK-32-DAG: mflr [[LR:[0-9]+]]
    144 ; CHECK-32-DAG: ori [[REG2:[0-9]+]], [[REG1]], 51904
    145 ; CHECK-32-DAG: stw [[LR]], 4(1)
    146 ; CHECK-32-DAG: subfc 0, [[REG3]], [[REG2]]
    147 ; CHECK-32:     stwux 1, 1, 0
    148 ; CHECK-32:     subf 0, 0, 1
    149 ; CHECK-32:     addic 0, 0, -4
    150 ; CHECK-32:     stwx 31, 0, 0
    151 ; CHECK-32:     addic 0, 0, -4
    152 ; CHECK-32:     stwx 30, 0, 0
    153 ; CHECK-32:     addic 30, 0, 8
    154 
    155 ; CHECK-32: blr
    156 
    157 ; CHECK-32-PIC-LABEL: @hoo
    158 
    159 ; CHECK-32-PIC-DAG: lis [[REG1:[0-9]+]], -13
    160 ; CHECK-32-PIC-DAG: clrlwi [[REG3:[0-9]+]], 1, 27
    161 ; CHECK-32-PIC-DAG: mflr {{[0-9]+}}
    162 ; CHECK-32-PIC-DAG: ori [[REG2:[0-9]+]], [[REG1]], 51904
    163 ; CHECK-32-PIC-DAG: stw 0, 4(1)
    164 ; CHECK-32-PIC-DAG: subfc 0, [[REG3]], [[REG2]]
    165 ; CHECK-32-PIC:     stwux 1, 1, 0
    166 ; CHECK-32-PIC:     subf 0, 0, 1
    167 ; CHECK-32-PIC:     addic 0, 0, -4
    168 ; CHECK-32-PIC:     stwx 31, 0, 0
    169 ; CHECK-32-PIC:     addic 0, 0, -8
    170 ; CHECK-32-PIC:     stwx 29, 0, 0
    171 ; CHECK-32-PIC:     addic 29, 0, 12
    172 
    173 ; CHECK-32: blr
    174 
    175 ; Make sure that the FP save area is still allocated correctly relative to
    176 ; where r30 is saved.
    177 define void @loo(%struct.s* byval nocapture readonly %a) {
    178 entry:
    179   %x = alloca [2 x i32], align 32
    180   %a1 = getelementptr inbounds %struct.s, %struct.s* %a, i64 0, i32 0
    181   %0 = load i32, i32* %a1, align 4
    182   %arrayidx = getelementptr inbounds [2 x i32], [2 x i32]* %x, i64 0, i64 0
    183   store i32 %0, i32* %arrayidx, align 32
    184   %b = getelementptr inbounds %struct.s, %struct.s* %a, i64 0, i32 1
    185   %1 = load i32, i32* %b, align 4
    186   %arrayidx2 = getelementptr inbounds [2 x i32], [2 x i32]* %x, i64 0, i64 1
    187   store i32 %1, i32* %arrayidx2, align 4
    188   call void @bar(i32* %arrayidx)
    189   call void asm sideeffect "", "~{f30}"() nounwind
    190   ret void
    191 }
    192 
    193 ; CHECK-LABEL: @loo
    194 
    195 ; CHECK-DAG: mflr {{[0-9]+}}
    196 ; CHECK-DAG: clrldi [[REG:[0-9]+]], 1, 59
    197 ; CHECK-DAG: std 30, -32(1)
    198 ; CHECK-DAG: mr 30, 1
    199 ; CHECK-DAG: std 0, 16(1)
    200 ; CHECK-DAG: subfic 0, [[REG]], -192
    201 ; CHECK: stdux 1, 1, 0
    202 
    203 ; CHECK: .cfi_def_cfa_register r30
    204 
    205 ; CHECK: stfd 30, -16(30)
    206 
    207 ; CHECK: blr
    208 
    209 ; CHECK-FP-LABEL: @loo
    210 
    211 ; CHECK-FP-DAG: mflr {{[0-9]+}}
    212 ; CHECK-FP-DAG: clrldi [[REG:[0-9]+]], 1, 59
    213 ; CHECK-FP-DAG: std 31, -24(1)
    214 ; CHECK-FP-DAG: std 30, -32(1)
    215 ; CHECK-FP-DAG: mr 30, 1
    216 ; CHECK-FP-DAG: std 0, 16(1)
    217 ; CHECK-FP-DAG: subfic 0, [[REG]], -192
    218 ; CHECK-FP: stdux 1, 1, 0
    219 
    220 ; CHECK-FP: .cfi_def_cfa_register r30
    221 
    222 ; CHECK-FP: stfd 30, -16(30)
    223 
    224 ; CHECK-FP: blr
    225