; RUN: opt -S -loop-reroll %s | FileCheck %s
; Regression input for the loop-reroll pass (run through opt as shown on the
; first line). Every function below contains a single loop whose body handles
; two adjacent elements per iteration. The FileCheck directives placed at the
; top of each loop block describe the loop body expected in opt's output.
target triple = "aarch64--linux-gnu"

; @test: for each pair of indices (i, i + 1) stores
;   arrayidx200[k] = arrayidx164[k] * t22 + arrayidx200[k]
; where t22 is loaded once from %arrayidx172 in the entry block.
; The loop is skipped entirely when %n == 0. Inside the loop the 64-bit index
; advances by 2 while a separate i32 counter (starting at %n srem 4, also
; advancing by 2) decides when to leave the loop.
define void @test(i32 %n, float* %arrayidx200, float* %arrayidx164, float* %arrayidx172) {
entry:
  %rem.i = srem i32 %n, 4
  %t22 = load float, float* %arrayidx172, align 4
  %cmp.9 = icmp eq i32 %n, 0
  %t7 = sext i32 %n to i64
  br i1 %cmp.9, label %while.end, label %while.body.preheader

while.body.preheader:
  br label %while.body

while.body:
; Expected output: one phi, one load/fmul/fadd/store group, an index step of 1,
; and an equality-based exit test on a sign-extended truncation of the index.
;CHECK-LABEL: while.body:
;CHECK-NEXT: %indvars.iv.i423 = phi i64 [ %indvars.iv.next.i424, %while.body ], [ 0, %while.body.preheader ]
;CHECK-NEXT: [[T1:%[0-9]+]] = trunc i64 %indvars.iv.i423 to i32
;CHECK-NEXT: %arrayidx62.i = getelementptr inbounds float, float* %arrayidx200, i64 %indvars.iv.i423
;CHECK-NEXT: %t1 = load float, float* %arrayidx62.i, align 4
;CHECK-NEXT: %arrayidx64.i = getelementptr inbounds float, float* %arrayidx164, i64 %indvars.iv.i423
;CHECK-NEXT: %t2 = load float, float* %arrayidx64.i, align 4
;CHECK-NEXT: %mul65.i = fmul fast float %t2, %t22
;CHECK-NEXT: %add66.i = fadd fast float %mul65.i, %t1
;CHECK-NEXT: store float %add66.i, float* %arrayidx62.i, align 4
;CHECK-NEXT: %indvars.iv.next.i424 = add i64 %indvars.iv.i423, 1
;CHECK-NEXT: [[T2:%[0-9]+]] = sext i32 [[T1]] to i64
;CHECK-NEXT: %exitcond = icmp eq i64 [[T2]], %{{[0-9]+}}
;CHECK-NEXT: br i1 %exitcond, label %while.end.loopexit, label %while.body

  ; 64-bit element index and the i32 counter that controls the exit.
  %indvars.iv.i423 = phi i64 [ %indvars.iv.next.i424, %while.body ], [ 0, %while.body.preheader ]
  %i.22.i = phi i32 [ %add103.i, %while.body ], [ %rem.i, %while.body.preheader ]
  ; First element of the pair: index i.
  %arrayidx62.i = getelementptr inbounds float, float* %arrayidx200, i64 %indvars.iv.i423
  %t1 = load float, float* %arrayidx62.i, align 4
  %arrayidx64.i = getelementptr inbounds float, float* %arrayidx164, i64 %indvars.iv.i423
  %t2 = load float, float* %arrayidx64.i, align 4
  %mul65.i = fmul fast float %t2, %t22
  %add66.i = fadd fast float %mul65.i, %t1
  store float %add66.i, float* %arrayidx62.i, align 4
  ; Second element of the pair: index i + 1, same operation.
  %t3 = add nsw i64 %indvars.iv.i423, 1
  %arrayidx71.i = getelementptr inbounds float, float* %arrayidx200, i64 %t3
  %t4 = load float, float* %arrayidx71.i, align 4
  %arrayidx74.i = getelementptr inbounds float, float* %arrayidx164, i64 %t3
  %t5 = load float, float* %arrayidx74.i, align 4
  %mul75.i = fmul fast float %t5, %t22
  %add76.i = fadd fast float %mul75.i, %t4
  store float %add76.i, float* %arrayidx71.i, align 4
  ; Advance the i32 counter by 2 and keep looping while its sign-extended
  ; value is (signed) less than the sign-extended %n.
  %add103.i = add nsw i32 %i.22.i, 2
  %t6 = sext i32 %add103.i to i64
  %cmp58.i = icmp slt i64 %t6, %t7
  %indvars.iv.next.i424 = add i64 %indvars.iv.i423, 2
  br i1 %cmp58.i, label %while.body, label %while.end.loopexit

while.end.loopexit:
  br label %while.end

while.end:
  ret void
}

; @test2: copies y[i] to x[i] for indices i and (i | 1), stepping the i64
; index by 2 from 0. The loop is entered only when %n > 0 (signed) and
; continues while the next index is (signed) less than %n. Always returns 0.
; Function Attrs: noinline norecurse nounwind
define i32 @test2(i64 %n, i32* nocapture %x, i32* nocapture readonly %y) {
entry:
  %cmp18 = icmp sgt i64 %n, 0
  br i1 %cmp18, label %for.body.preheader, label %for.end

for.body.preheader:                               ; preds = %entry
  br label %for.body

for.body:                                         ; preds = %for.body.preheader, %for.body

; Expected output: a single load/store pair indexed by a new %indvar that
; steps by 1, with an equality-based exit test.
;CHECK: for.body:
;CHECK-NEXT: %indvar = phi i64 [ %indvar.next, %for.body ], [ 0, %for.body.preheader ]
;CHECK-NEXT: %arrayidx = getelementptr inbounds i32, i32* %y, i64 %indvar
;CHECK-NEXT: [[T1:%[0-9]+]] = load i32, i32* %arrayidx, align 4
;CHECK-NEXT: %arrayidx3 = getelementptr inbounds i32, i32* %x, i64 %indvar
;CHECK-NEXT: store i32 [[T1]], i32* %arrayidx3, align 4
;CHECK-NEXT: %indvar.next = add i64 %indvar, 1
;CHECK-NEXT: %exitcond = icmp eq i64 %indvar, %{{[0-9]+}}
;CHECK-NEXT: br i1 %exitcond, label %for.end.loopexit, label %for.body

  %indvars.iv = phi i64 [ %indvars.iv.next, %for.body ], [ 0, %for.body.preheader ]
  ; First element: x[i] = y[i].
  %arrayidx = getelementptr inbounds i32, i32* %y, i64 %indvars.iv
  %0 = load i32, i32* %arrayidx, align 4
  %arrayidx3 = getelementptr inbounds i32, i32* %x, i64 %indvars.iv
  store i32 %0, i32* %arrayidx3, align 4
  ; Second element: the index is formed with `or 1` rather than `add 1`.
  %1 = or i64 %indvars.iv, 1
  %arrayidx5 = getelementptr inbounds i32, i32* %y, i64 %1
  %2 = load i32, i32* %arrayidx5, align 4
  %arrayidx8 = getelementptr inbounds i32, i32* %x, i64 %1
  store i32 %2, i32* %arrayidx8, align 4
  %indvars.iv.next = add nuw nsw i64 %indvars.iv, 2
  %cmp = icmp slt i64 %indvars.iv.next, %n
  br i1 %cmp, label %for.body, label %for.end.loopexit

for.end.loopexit:                                 ; preds = %for.body
  br label %for.end

for.end:                                          ; preds = %for.end.loopexit, %entry
  ret i32 0
}

; @test3: same copy pattern as @test2, but the loop counter is an i8
; (%i.022) and a second i32 phi (%conv23) carries its sign-extended value.
; The first element is indexed by sext(%i.022), the second by
; sext(%conv23 | 1). Entered only when %n > 0 (signed). Always returns 0.
; Function Attrs: noinline norecurse nounwind
define i32 @test3(i32 %n, i32* nocapture %x, i32* nocapture readonly %y) {
entry:
  %cmp21 = icmp sgt i32 %n, 0
  br i1 %cmp21, label %for.body.preheader, label %for.end

for.body.preheader:                               ; preds = %entry
  br label %for.body

for.body:                                         ; preds = %for.body.preheader, %for.body

; Expected output: only the loop tail is pinned, and it still contains the
; i8 increment by 2 followed by the original sext / signed compare / branch.
; NOTE(review): presumably this asserts that the pass leaves this loop
; un-rerolled because of the narrow i8 counter - confirm against the pass.
;CHECK: for.body:
;CHECK: %add12 = add i8 %i.022, 2
;CHECK-NEXT: %conv = sext i8 %add12 to i32
;CHECK-NEXT: %cmp = icmp slt i32 %conv, %n
;CHECK-NEXT: br i1 %cmp, label %for.body, label %for.end.loopexit

  %conv23 = phi i32 [ %conv, %for.body ], [ 0, %for.body.preheader ]
  %i.022 = phi i8 [ %add12, %for.body ], [ 0, %for.body.preheader ]
  ; First element: index derived from the i8 counter.
  %idxprom = sext i8 %i.022 to i64
  %arrayidx = getelementptr inbounds i32, i32* %y, i64 %idxprom
  %0 = load i32, i32* %arrayidx, align 4
  %arrayidx3 = getelementptr inbounds i32, i32* %x, i64 %idxprom
  store i32 %0, i32* %arrayidx3, align 4
  ; Second element: index derived from the i32 copy of the counter, or'ed with 1.
  %add = or i32 %conv23, 1
  %idxprom5 = sext i32 %add to i64
  %arrayidx6 = getelementptr inbounds i32, i32* %y, i64 %idxprom5
  %1 = load i32, i32* %arrayidx6, align 4
  %arrayidx10 = getelementptr inbounds i32, i32* %x, i64 %idxprom5
  store i32 %1, i32* %arrayidx10, align 4
  ; The i8 add carries no nsw/nuw flags.
  %add12 = add i8 %i.022, 2
  %conv = sext i8 %add12 to i32
  %cmp = icmp slt i32 %conv, %n
  br i1 %cmp, label %for.body, label %for.end.loopexit

for.end.loopexit:                                 ; preds = %for.body
  br label %for.end

for.end:                                          ; preds = %for.end.loopexit, %entry
  ret i32 0
}

; @test4: identical loop body to @test2; the differences are the guard
; (loop skipped when %n == 0) and the exit test, which uses an unsigned
; compare (ult) of the next index against %n. Always returns 0.
; Function Attrs: noinline norecurse nounwind
define i32 @test4(i64 %n, i32* nocapture %x, i32* nocapture readonly %y) {
entry:
  %cmp18 = icmp eq i64 %n, 0
  br i1 %cmp18, label %for.end, label %for.body.preheader

for.body.preheader:                               ; preds = %entry
  br label %for.body

for.body:                                         ; preds = %for.body.preheader, %for.body

; Expected output: same single-element body as in @test2, with %indvar
; stepping by 1 and an equality-based exit test.
;CHECK: for.body:
;CHECK-NEXT: %indvar = phi i64 [ %indvar.next, %for.body ], [ 0, %for.body.preheader ]
;CHECK-NEXT: %arrayidx = getelementptr inbounds i32, i32* %y, i64 %indvar
;CHECK-NEXT: [[T1:%[0-9]+]] = load i32, i32* %arrayidx, align 4
;CHECK-NEXT: %arrayidx3 = getelementptr inbounds i32, i32* %x, i64 %indvar
;CHECK-NEXT: store i32 [[T1]], i32* %arrayidx3, align 4
;CHECK-NEXT: %indvar.next = add i64 %indvar, 1
;CHECK-NEXT: %exitcond = icmp eq i64 %indvar, %{{[0-9]+}}
;CHECK-NEXT: br i1 %exitcond, label %for.end.loopexit, label %for.body

  %indvars.iv = phi i64 [ %indvars.iv.next, %for.body ], [ 0, %for.body.preheader ]
  ; First element: x[i] = y[i].
  %arrayidx = getelementptr inbounds i32, i32* %y, i64 %indvars.iv
  %0 = load i32, i32* %arrayidx, align 4
  %arrayidx3 = getelementptr inbounds i32, i32* %x, i64 %indvars.iv
  store i32 %0, i32* %arrayidx3, align 4
  ; Second element: index formed with `or 1`.
  %1 = or i64 %indvars.iv, 1
  %arrayidx5 = getelementptr inbounds i32, i32* %y, i64 %1
  %2 = load i32, i32* %arrayidx5, align 4
  %arrayidx8 = getelementptr inbounds i32, i32* %x, i64 %1
  store i32 %2, i32* %arrayidx8, align 4
  %indvars.iv.next = add nuw nsw i64 %indvars.iv, 2
  %cmp = icmp ult i64 %indvars.iv.next, %n
  br i1 %cmp, label %for.body, label %for.end.loopexit

for.end.loopexit:                                 ; preds = %for.body
  br label %for.end

for.end:                                          ; preds = %for.end.loopexit, %entry
  ret i32 0
}