; RUN: llc < %s -mtriple=i386-apple-darwin -relocation-model=pic -disable-fp-elim | FileCheck %s -check-prefix=X86-32
; RUN: llc < %s -mtriple=x86_64-apple-darwin -relocation-model=pic -disable-fp-elim | FileCheck %s -check-prefix=X86-64

; MachineLICM should be able to hoist loop invariant reload out of the loop.
; Only linear scan needs this, -regalloc=greedy sinks the spill instead.
; rdar://7233099
;
; Layout of this test:
;   * The same IR is compiled twice (32-bit and 64-bit Darwin, PIC, frame
;     pointer elimination disabled); each run is verified with its own
;     FileCheck prefix.
;   * @t1 is only checked by the 32-bit run, @t2 only by the 64-bit run.
;   * Both functions are reduced reproducers: most branch conditions and
;     operands are 'undef' and many blocks end in 'unreachable'. Block names
;     and instruction order are significant because the check patterns refer
;     to the generated assembly.

; Type declarations needed by the libc prototypes and the GEPs in @t1.
%struct.FILE = type { i8*, i32, i32, i16, i16, %struct.__sbuf, i32, i8*, i32 (i8*)*, i32 (i8*, i8*, i32)*, i64 (i8*, i64, i32)*, i32 (i8*, i8*, i32)*, %struct.__sbuf, %struct.__sFILEX*, i32, [3 x i8], [1 x i8], %struct.__sbuf, i32, i64 }
%struct.__sFILEX = type opaque
%struct.__sbuf = type { i8*, i32 }
%struct.epoch_t = type { %struct.trans_t*, %struct.trans_t*, i32, i32, i32, i32, i32 }
%struct.trans_t = type { i32, i32, i32, i8* }

; External string constants passed to fopen/strcmp in @t1.
@.str12 = external constant [2 x i8], align 1 ; <[2 x i8]*> [#uses=1]
@.str19 = external constant [7 x i8], align 1 ; <[7 x i8]*> [#uses=1]
@.str24 = external constant [4 x i8], align 1 ; <[4 x i8]*> [#uses=1]

; @t1: the FILE* returned by fopen (%0) is defined once in %bb.nph41 and then
; used by the fgets and feof calls inside the self-looping block %bb28, and by
; rewind in %bb83. The 32-bit checks placed before %bb28 require that the
; loop body contains no operand of the form "(%esp)," or "(%ebp)," before the
; back-edge jmp, i.e. no reload of a stack slot inside the loop.
define i32 @t1(i32 %c, i8** nocapture %v) nounwind ssp {
; X86-32-LABEL: t1:
entry:
  br i1 undef, label %bb, label %bb3

bb: ; preds = %entry
  unreachable

bb3: ; preds = %entry
  br i1 undef, label %bb.i, label %bb.nph41

bb.i: ; preds = %bb3
  unreachable

bb.nph41: ; preds = %bb3
  ; %0 is the value whose live range spans the calls in the %bb28 loop.
  %0 = call %struct.FILE* @"\01_fopen$UNIX2003"(i8* undef, i8* getelementptr inbounds ([2 x i8], [2 x i8]* @.str12, i32 0, i32 0)) nounwind ; <%struct.FILE*> [#uses=3]
  br i1 undef, label %bb4, label %bb5.preheader

bb5.preheader: ; preds = %bb.nph41
  br label %bb5

bb4: ; preds = %bb.nph41
  unreachable

bb5: ; preds = %bb5, %bb5.preheader
  br i1 undef, label %bb7, label %bb5

bb7: ; preds = %bb5
  br i1 undef, label %bb9, label %bb12

bb9: ; preds = %bb7
  unreachable

bb12: ; preds = %bb7
  br i1 undef, label %bb16, label %bb22

bb16: ; preds = %bb12
  unreachable

bb22: ; preds = %bb12
  br label %bb.i1

bb.i1: ; preds = %bb.i1, %bb22
  %1 = icmp eq i8 undef, 69 ; <i1> [#uses=1]
  br i1 %1, label %imix_test.exit, label %bb.i1

imix_test.exit: ; preds = %bb.i1
  br i1 undef, label %bb23, label %bb26.preheader

bb26.preheader: ; preds = %imix_test.exit
  br i1 undef, label %bb28, label %bb30

bb23: ; preds = %imix_test.exit
  unreachable
; Verify that there are no loads inside the loop.
; X86-32: .align 4
; X86-32: %bb28
; X86-32-NOT: (%esp),
; X86-32-NOT: (%ebp),
; X86-32: jmp

; Loop under test: branches unconditionally back to itself, and both calls
; take %0 as their FILE* argument.
bb28: ; preds = %bb28, %bb26.preheader
  %counter.035 = phi i32 [ %3, %bb28 ], [ 0, %bb26.preheader ] ; <i32> [#uses=2]
  %tmp56 = shl i32 %counter.035, 2 ; <i32> [#uses=0]
  %2 = call i8* @fgets(i8* undef, i32 50, %struct.FILE* %0) nounwind ; <i8*> [#uses=0]
  %3 = add nsw i32 %counter.035, 1 ; <i32> [#uses=1]
  %4 = call i32 @feof(%struct.FILE* %0) nounwind ; <i32> [#uses=0]
  br label %bb28

bb30: ; preds = %bb26.preheader
  %5 = call i32 @strcmp(i8* undef, i8* getelementptr inbounds ([7 x i8], [7 x i8]* @.str19, i32 0, i32 0)) nounwind readonly ; <i32> [#uses=0]
  br i1 undef, label %bb34, label %bb70

bb32.loopexit: ; preds = %bb45
  %6 = icmp eq i32 undef, 0 ; <i1> [#uses=1]
  %indvar.next55 = add i32 %indvar54, 1 ; <i32> [#uses=1]
  br i1 %6, label %bb34, label %bb70

; Header of a second loop (%bb34 -> %bb39.preheader -> %bb45 ->
; %bb32.loopexit -> %bb34) driven by the induction variable %indvar54.
bb34: ; preds = %bb32.loopexit, %bb30
  %indvar54 = phi i32 [ %indvar.next55, %bb32.loopexit ], [ 0, %bb30 ] ; <i32> [#uses=3]
  br i1 false, label %bb35, label %bb39.preheader

bb35: ; preds = %bb34
  unreachable

bb39.preheader: ; preds = %bb34
  %7 = getelementptr inbounds %struct.epoch_t, %struct.epoch_t* undef, i32 %indvar54, i32 3 ; <i32*> [#uses=1]
  %8 = getelementptr inbounds %struct.epoch_t, %struct.epoch_t* undef, i32 %indvar54, i32 2 ; <i32*> [#uses=0]
  br i1 false, label %bb42, label %bb45

bb42: ; preds = %bb39.preheader
  unreachable

bb45: ; preds = %bb39.preheader
  %9 = call i32 @strcmp(i8* undef, i8* getelementptr inbounds ([4 x i8], [4 x i8]* @.str24, i32 0, i32 0)) nounwind readonly ; <i32> [#uses=0]
  br i1 false, label %bb47, label %bb32.loopexit

bb47: ; preds = %bb45
  %10 = load i32, i32* %7, align 4 ; <i32> [#uses=0]
  unreachable

bb70: ; preds = %bb32.loopexit, %bb30
  br i1 undef, label %bb78, label %bb76

bb76: ; preds = %bb70
  unreachable

bb78: ; preds = %bb70
  br i1 undef, label %bb83, label %bb79

bb79: ; preds = %bb78
  unreachable

bb83: ; preds = %bb78
  ; Third and last use of %0, outside the %bb28 loop.
  call void @rewind(%struct.FILE* %0) nounwind
  unreachable
}

; External functions called by @t1.
declare %struct.FILE* @"\01_fopen$UNIX2003"(i8*, i8*)

declare i8* @fgets(i8*, i32, %struct.FILE* nocapture) nounwind

declare void @rewind(%struct.FILE* nocapture) nounwind

declare i32 @feof(%struct.FILE* nocapture) nounwind

declare i32 @strcmp(i8* nocapture, i8* nocapture) nounwind readonly

; External lookup table indexed inside the loop of @t2.
@map_4_to_16 = external constant [16 x i16], align 32 ; <[16 x i16]*> [#uses=2]

; @t2: the loop in %bb reads @map_4_to_16 twice (element 0 and element %6).
; The 64-bit checks require the GOT-relative load of the table's address
; (movq _map_4_to_16@GOTPCREL(%rip)) to appear in the output before the
; ".align 4" directive.
; NOTE(review): the ".align 4" is presumably the alignment emitted for the
; loop block, which would make this a "hoisted out of the loop" check --
; confirm against the generated assembly.
define void @t2(i8* nocapture %bufp, i8* nocapture %data, i32 %dsize) nounwind ssp {
; X86-64-LABEL: t2:
entry:
  br i1 undef, label %return, label %bb.nph

bb.nph: ; preds = %entry
; X86-64: movq _map_4_to_16@GOTPCREL(%rip)
; X86-64: .align 4
  %tmp5 = zext i32 undef to i64 ; <i64> [#uses=1]
  %tmp6 = add i64 %tmp5, 1 ; <i64> [#uses=1]
  %tmp11 = shl i64 undef, 1 ; <i64> [#uses=1]
  %tmp14 = mul i64 undef, 3 ; <i64> [#uses=1]
  br label %bb

bb: ; preds = %bb, %bb.nph
  %tmp9 = mul i64 undef, undef ; <i64> [#uses=2]
  %tmp12 = add i64 %tmp11, %tmp9 ; <i64> [#uses=1]
  %scevgep13 = getelementptr i8, i8* %bufp, i64 %tmp12 ; <i8*> [#uses=1]
  %tmp15 = add i64 %tmp14, %tmp9 ; <i64> [#uses=1]
  %scevgep16 = getelementptr i8, i8* %bufp, i64 %tmp15 ; <i8*> [#uses=1]
  %0 = load i8, i8* undef, align 1 ; <i8> [#uses=1]
  %1 = zext i8 %0 to i32 ; <i32> [#uses=1]
  ; First table access: element 0, truncated to its low byte and stored.
  %2 = getelementptr inbounds [16 x i16], [16 x i16]* @map_4_to_16, i64 0, i64 0 ; <i16*> [#uses=1]
  %3 = load i16, i16* %2, align 2 ; <i16> [#uses=1]
  %4 = trunc i16 %3 to i8 ; <i8> [#uses=1]
  store i8 %4, i8* undef, align 1
  ; Second table access: index is the low 4 bits of the loaded byte; the
  ; high and low bytes of the 16-bit entry are stored separately.
  %5 = and i32 %1, 15 ; <i32> [#uses=1]
  %6 = zext i32 %5 to i64 ; <i64> [#uses=1]
  %7 = getelementptr inbounds [16 x i16], [16 x i16]* @map_4_to_16, i64 0, i64 %6 ; <i16*> [#uses=1]
  %8 = load i16, i16* %7, align 2 ; <i16> [#uses=2]
  %9 = lshr i16 %8, 8 ; <i16> [#uses=1]
  %10 = trunc i16 %9 to i8 ; <i8> [#uses=1]
  store i8 %10, i8* %scevgep13, align 1
  %11 = trunc i16 %8 to i8 ; <i8> [#uses=1]
  store i8 %11, i8* %scevgep16, align 1
  %exitcond = icmp eq i64 undef, %tmp6 ; <i1> [#uses=1]
  br i1 %exitcond, label %return, label %bb

return: ; preds = %bb, %entry
  ret void
}