; Like frame-02.ll, but with long doubles rather than floats. Some of the
; cases are slightly different because we need to allocate pairs of FPRs.
;
; RUN: llc < %s -mtriple=s390x-linux-gnu | FileCheck %s

; This function should require all FPRs, but no other spill slots.
; We need to save and restore 8 of the 16 FPRs, so the frame size
; should be exactly 160 + 8 * 8 = 224. The CFA offset is 160
; (the caller-allocated part of the frame) + 224.
define void @f1(fp128 *%ptr) {
; CHECK-LABEL: f1:
; CHECK: aghi %r15, -224
; CHECK: .cfi_def_cfa_offset 384
; CHECK: std %f8, 216(%r15)
; CHECK: std %f9, 208(%r15)
; CHECK: std %f10, 200(%r15)
; CHECK: std %f11, 192(%r15)
; CHECK: std %f12, 184(%r15)
; CHECK: std %f13, 176(%r15)
; CHECK: std %f14, 168(%r15)
; CHECK: std %f15, 160(%r15)
; CHECK: .cfi_offset %f8, -168
; CHECK: .cfi_offset %f9, -176
; CHECK: .cfi_offset %f10, -184
; CHECK: .cfi_offset %f11, -192
; CHECK: .cfi_offset %f12, -200
; CHECK: .cfi_offset %f13, -208
; CHECK: .cfi_offset %f14, -216
; CHECK: .cfi_offset %f15, -224
; ...main function body...
; CHECK: ld %f8, 216(%r15)
; CHECK: ld %f9, 208(%r15)
; CHECK: ld %f10, 200(%r15)
; CHECK: ld %f11, 192(%r15)
; CHECK: ld %f12, 184(%r15)
; CHECK: ld %f13, 176(%r15)
; CHECK: ld %f14, 168(%r15)
; CHECK: ld %f15, 160(%r15)
; CHECK: aghi %r15, 224
; CHECK: br %r14
  %l0 = load volatile fp128, fp128 *%ptr
  %l1 = load volatile fp128, fp128 *%ptr
  %l4 = load volatile fp128, fp128 *%ptr
  %l5 = load volatile fp128, fp128 *%ptr
  %l8 = load volatile fp128, fp128 *%ptr
  %l9 = load volatile fp128, fp128 *%ptr
  %l12 = load volatile fp128, fp128 *%ptr
  %l13 = load volatile fp128, fp128 *%ptr
  %add0 = fadd fp128 %l0, %l0
  %add1 = fadd fp128 %l1, %add0
  %add4 = fadd fp128 %l4, %add1
  %add5 = fadd fp128 %l5, %add4
  %add8 = fadd fp128 %l8, %add5
  %add9 = fadd fp128 %l9, %add8
  %add12 = fadd fp128 %l12, %add9
  %add13 = fadd fp128 %l13, %add12
  store volatile fp128 %add0, fp128 *%ptr
  store volatile fp128 %add1, fp128 *%ptr
  store volatile fp128 %add4, fp128 *%ptr
  store volatile fp128 %add5, fp128 *%ptr
  store volatile fp128 %add8, fp128 *%ptr
  store volatile fp128 %add9, fp128 *%ptr
  store volatile fp128 %add12, fp128 *%ptr
  store volatile fp128 %add13, fp128 *%ptr
  ret void
}

; Like f1, but requires one fewer FPR pair. We allocate in numerical order,
; so %f13+%f15 is the pair that gets dropped.
define void @f2(fp128 *%ptr) {
; CHECK-LABEL: f2:
; CHECK: aghi %r15, -208
; CHECK: .cfi_def_cfa_offset 368
; CHECK: std %f8, 200(%r15)
; CHECK: std %f9, 192(%r15)
; CHECK: std %f10, 184(%r15)
; CHECK: std %f11, 176(%r15)
; CHECK: std %f12, 168(%r15)
; CHECK: std %f14, 160(%r15)
; CHECK: .cfi_offset %f8, -168
; CHECK: .cfi_offset %f9, -176
; CHECK: .cfi_offset %f10, -184
; CHECK: .cfi_offset %f11, -192
; CHECK: .cfi_offset %f12, -200
; CHECK: .cfi_offset %f14, -208
; CHECK-NOT: %f13
; CHECK-NOT: %f15
; ...main function body...
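; With six call-saved FPRs, the frame size is 160 + 6 * 8 = 208 and the
; CFA offset is 160 + 208 = 368, matching the prologue above; the epilogue
; below reloads from the same slots.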
; CHECK: ld %f8, 200(%r15)
; CHECK: ld %f9, 192(%r15)
; CHECK: ld %f10, 184(%r15)
; CHECK: ld %f11, 176(%r15)
; CHECK: ld %f12, 168(%r15)
; CHECK: ld %f14, 160(%r15)
; CHECK: aghi %r15, 208
; CHECK: br %r14
  %l0 = load volatile fp128, fp128 *%ptr
  %l1 = load volatile fp128, fp128 *%ptr
  %l4 = load volatile fp128, fp128 *%ptr
  %l5 = load volatile fp128, fp128 *%ptr
  %l8 = load volatile fp128, fp128 *%ptr
  %l9 = load volatile fp128, fp128 *%ptr
  %l12 = load volatile fp128, fp128 *%ptr
  %add0 = fadd fp128 %l0, %l0
  %add1 = fadd fp128 %l1, %add0
  %add4 = fadd fp128 %l4, %add1
  %add5 = fadd fp128 %l5, %add4
  %add8 = fadd fp128 %l8, %add5
  %add9 = fadd fp128 %l9, %add8
  %add12 = fadd fp128 %l12, %add9
  store volatile fp128 %add0, fp128 *%ptr
  store volatile fp128 %add1, fp128 *%ptr
  store volatile fp128 %add4, fp128 *%ptr
  store volatile fp128 %add5, fp128 *%ptr
  store volatile fp128 %add8, fp128 *%ptr
  store volatile fp128 %add9, fp128 *%ptr
  store volatile fp128 %add12, fp128 *%ptr
  ret void
}

; Like f1, but requires only one call-saved FPR pair. We allocate in
; numerical order, so the pair should be %f8+%f10.
define void @f3(fp128 *%ptr) {
; CHECK-LABEL: f3:
; CHECK: aghi %r15, -176
; CHECK: .cfi_def_cfa_offset 336
; CHECK: std %f8, 168(%r15)
; CHECK: std %f10, 160(%r15)
; CHECK: .cfi_offset %f8, -168
; CHECK: .cfi_offset %f10, -176
; CHECK-NOT: %f9
; CHECK-NOT: %f11
; CHECK-NOT: %f12
; CHECK-NOT: %f13
; CHECK-NOT: %f14
; CHECK-NOT: %f15
; ...main function body...
; CHECK: ld %f8, 168(%r15)
; CHECK: ld %f10, 160(%r15)
; CHECK: aghi %r15, 176
; CHECK: br %r14
  %l0 = load volatile fp128, fp128 *%ptr
  %l1 = load volatile fp128, fp128 *%ptr
  %l4 = load volatile fp128, fp128 *%ptr
  %l5 = load volatile fp128, fp128 *%ptr
  %l8 = load volatile fp128, fp128 *%ptr
  %add0 = fadd fp128 %l0, %l0
  %add1 = fadd fp128 %l1, %add0
  %add4 = fadd fp128 %l4, %add1
  %add5 = fadd fp128 %l5, %add4
  %add8 = fadd fp128 %l8, %add5
  store volatile fp128 %add0, fp128 *%ptr
  store volatile fp128 %add1, fp128 *%ptr
  store volatile fp128 %add4, fp128 *%ptr
  store volatile fp128 %add5, fp128 *%ptr
  store volatile fp128 %add8, fp128 *%ptr
  ret void
}

; This function should use all call-clobbered FPRs but no call-saved ones.
; It shouldn't need to create a frame.
define void @f4(fp128 *%ptr) {
; CHECK-LABEL: f4:
; CHECK-NOT: %r15
; CHECK-NOT: %f8
; CHECK-NOT: %f9
; CHECK-NOT: %f10
; CHECK-NOT: %f11
; CHECK-NOT: %f12
; CHECK-NOT: %f13
; CHECK-NOT: %f14
; CHECK-NOT: %f15
; CHECK: br %r14
  %l0 = load volatile fp128, fp128 *%ptr
  %l1 = load volatile fp128, fp128 *%ptr
  %l4 = load volatile fp128, fp128 *%ptr
  %l5 = load volatile fp128, fp128 *%ptr
  %add0 = fadd fp128 %l0, %l0
  %add1 = fadd fp128 %l1, %add0
  %add4 = fadd fp128 %l4, %add1
  %add5 = fadd fp128 %l5, %add4
  store volatile fp128 %add0, fp128 *%ptr
  store volatile fp128 %add1, fp128 *%ptr
  store volatile fp128 %add4, fp128 *%ptr
  store volatile fp128 %add5, fp128 *%ptr
  ret void
}