Home | History | Annotate | Download | only in InstCombine
      1 ; This test makes sure that these instructions are properly eliminated.
      2 ;
      3 ; RUN: opt < %s -instcombine -S | FileCheck %s
      4 
      5 target datalayout = "e-p:64:64:64-i1:8:8-i8:8:8-i16:16:16-i32:32:32-i64:64:64-f32:32:32-f64:64:64-v64:64:64-v128:128:128-a0:0:64-s0:64:64-f80:128:128:n8:16:32:64"
      6 
      7 define i32 @test1(i32 %A, i1 %b) {
        ; test1: %B is a phi with a single incoming value (%A from %BB0).
        ; Expected output: BB1 returns %A directly, so the phi is gone.
      8 BB0:
      9         br i1 %b, label %BB1, label %BB2
     10 
     11 BB1:
     12         ; Combine away one argument PHI nodes
     13         %B = phi i32 [ %A, %BB0 ]               
     14         ret i32 %B
     15 
     16 BB2:
     17         ret i32 %A
     18 ; CHECK: @test1
     19 ; CHECK: BB1:
     20 ; CHECK-NEXT: ret i32 %A
     21 }
     22 
     23 define i32 @test2(i32 %A, i1 %b) {
        ; test2: both incoming values of %B are %A (from %BB0 and %BB1).
        ; Expected output: BB2 returns %A directly.
     24 BB0:
     25         br i1 %b, label %BB1, label %BB2
     26 
     27 BB1:
     28         br label %BB2
     29 
     30 BB2:
     31         ; Combine away PHI nodes with same values
     32         %B = phi i32 [ %A, %BB0 ], [ %A, %BB1 ]         
     33         ret i32 %B
     34 ; CHECK: @test2
     35 ; CHECK: BB2:
     36 ; CHECK-NEXT: ret i32 %A
     37 }
     38 
     39 define i32 @test3(i32 %A, i1 %b) {
        ; test3: %B receives %A on loop entry and itself on the back edge,
        ; so it can only ever be %A. Expected output: Exit returns %A.
     40 BB0:
     41         br label %Loop
     42 
     43 Loop:
     44         ; PHI has same value always.
     45         %B = phi i32 [ %A, %BB0 ], [ %B, %Loop ]
     46         br i1 %b, label %Loop, label %Exit
     47 
     48 Exit:
     49         ret i32 %B
     50 ; CHECK: @test3
     51 ; CHECK: Exit:
     52 ; CHECK-NEXT: ret i32 %A
     53 }
     54 
     55 define i32 @test4(i1 %b) {
        ; test4: BB0 returns immediately and never branches to Loop or L2.
        ; %B's only incoming values are %B itself. Expected output: the Loop
        ; block starts directly with its conditional branch (no phi left).
     56 BB0:
     57         ; Loop is unreachable
     58         ret i32 7
     59 
     60 Loop:           ; preds = %L2, %Loop
     61         ; PHI has same value always.
     62         %B = phi i32 [ %B, %L2 ], [ %B, %Loop ]         
     63         br i1 %b, label %L2, label %Loop
     64 
     65 L2:             ; preds = %Loop
     66         br label %Loop
     67 ; CHECK: @test4
     68 ; CHECK: Loop:
     69 ; CHECK-NEXT: br i1 %b
     70 }
     71 
     72 define i32 @test5(i32 %A, i1 %b) {
        ; test5: %B receives %A on entry and undef on the back edge.
        ; Expected output: Loop starts with its branch (phi removed) and
        ; Exit returns %A.
     73 BB0:
     74         br label %Loop
     75 
     76 Loop:           ; preds = %Loop, %BB0
     77         ; PHI has same value always.
     78         %B = phi i32 [ %A, %BB0 ], [ undef, %Loop ]             
     79         br i1 %b, label %Loop, label %Exit
     80 
     81 Exit:           ; preds = %Loop
     82         ret i32 %B
     83 ; CHECK: @test5
     84 ; CHECK: Loop:
     85 ; CHECK-NEXT: br i1 %b
     86 ; CHECK: Exit:
     87 ; CHECK-NEXT: ret i32 %A
     88 }
     89 
     90 define i32 @test6(i16 %A, i1 %b) {
        ; test6: %X and %Y are the same zext of %A computed in two blocks and
        ; merged by a phi. Expected output: after the BB2 label there is a
        ; single zext of %A, immediately followed by the return.
     91 BB0:
     92         %X = zext i16 %A to i32              
     93         br i1 %b, label %BB1, label %BB2
     94 
     95 BB1:           
     96         %Y = zext i16 %A to i32              
     97         br label %BB2
     98 
     99 BB2:           
    100         ;; Suck casts into phi
    101         %B = phi i32 [ %X, %BB0 ], [ %Y, %BB1 ]         
    102         ret i32 %B
    103 ; CHECK: @test6
    104 ; CHECK: BB2:
    105 ; CHECK: zext i16 %A to i32
    106 ; CHECK-NEXT: ret i32
    107 }
    108 
    109 define i32 @test7(i32 %A, i1 %b) {
        ; test7: %B and %C are used only by each other; the function returns
        ; the constant 0. Expected output: Loop starts directly with its
        ; branch, so both the phi and the add are gone.
    110 BB0:
    111         br label %Loop
    112 
    113 Loop:           ; preds = %Loop, %BB0
    114         ; PHI is dead.
    115         %B = phi i32 [ %A, %BB0 ], [ %C, %Loop ]                
    116         %C = add i32 %B, 123            
    117         br i1 %b, label %Loop, label %Exit
    118 
    119 Exit:           ; preds = %Loop
    120         ret i32 0
    121 ; CHECK: @test7
    122 ; CHECK: Loop:
    123 ; CHECK-NEXT: br i1 %b
    124 }
    125 
    126 define i32* @test8({ i32, i32 } *%A, i1 %b) {
        ; test8: %X and %Y are GEPs with identical operands; only %X carries
        ; the inbounds flag. Expected output: no phi before BB2, and BB2 holds
        ; one GEP named %B, written without inbounds, followed by the return.
    127 BB0:
    128         %X = getelementptr inbounds { i32, i32 } *%A, i32 0, i32 1
    129         br i1 %b, label %BB1, label %BB2
    130 
    131 BB1:
    132         %Y = getelementptr { i32, i32 } *%A, i32 0, i32 1
    133         br label %BB2
    134 
    135 BB2:
    136         ;; Suck GEPs into phi
    137         %B = phi i32* [ %X, %BB0 ], [ %Y, %BB1 ]
    138         ret i32* %B
    139 ; CHECK: @test8
    140 ; CHECK-NOT: phi
    141 ; CHECK: BB2:
    142 ; CHECK-NEXT: %B = getelementptr { i32, i32 }* %A 
    143 ; CHECK-NEXT: ret i32* %B
    144 }
    145 
    146 define i32 @test9(i32* %A, i32* %B) {
        ; test9: each predecessor of bb2 loads an i32 (align 1) from a
        ; different pointer and the results meet in a phi. Expected output:
        ; bb2 holds a phi over the two pointers, then a single align-1 load
        ; named %E, then the return.
    147 entry:
    148   %c = icmp eq i32* %A, null
    149   br i1 %c, label %bb1, label %bb
    150 
    151 bb:
    152   %C = load i32* %B, align 1
    153   br label %bb2
    154 
    155 bb1:
    156   %D = load i32* %A, align 1
    157   br label %bb2
    158 
    159 bb2:
    160   %E = phi i32 [ %C, %bb ], [ %D, %bb1 ]
    161   ret i32 %E
    162 ; CHECK: @test9
    163 ; CHECK:       bb2:
    164 ; CHECK-NEXT:        phi i32* [ %B, %bb ], [ %A, %bb1 ]
    165 ; CHECK-NEXT:   %E = load i32* %{{[^,]*}}, align 1
    166 ; CHECK-NEXT:   ret i32 %E
    167 
    168 }
    169 
    169 define i32 @test10(i32* %A, i32* %B) {
        ; test10: same shape as test9, but the two loads have different
        ; alignments (16 and 32). Expected output: the merged load in bb2
        ; uses align 16, the smaller of the two.
    170 entry:
    171   %c = icmp eq i32* %A, null
    172   br i1 %c, label %bb1, label %bb
    173 
    174 bb:
    175   %C = load i32* %B, align 16
    176   br label %bb2
    177 
    178 bb1:
    179   %D = load i32* %A, align 32
    180   br label %bb2
    181 
    182 bb2:
    183   %E = phi i32 [ %C, %bb ], [ %D, %bb1 ]
    184   ret i32 %E
    185 ; CHECK: @test10
    186 ; CHECK:       bb2:
    187 ; CHECK-NEXT:        phi i32* [ %B, %bb ], [ %A, %bb1 ]
    188 ; CHECK-NEXT:   %E = load i32* %{{[^,]*}}, align 16
    189 ; CHECK-NEXT:   ret i32 %E
    190 }
    192 
    193 
    194 ; PR1777
        ; test11: %x, %y and %f are i64 phis that feed each other; the only
        ; non-phi incoming value anywhere in the cycle is %i, so each of them
        ; can only ever be %i. The test expects no phi to remain.
    195 declare i1 @test11a()
    196 
    197 define i1 @test11() {
    198 entry:
    199   %a = alloca i32
    200   %i = ptrtoint i32* %a to i64
    201   %b = call i1 @test11a()
    202   br i1 %b, label %one, label %two
    203 
    204 one:
    205   %x = phi i64 [%i, %entry], [%y, %two]
    206   %c = call i1 @test11a()
    207   br i1 %c, label %two, label %end
    208 
    209 two:
    210   %y = phi i64 [%i, %entry], [%x, %one]
    211   %d = call i1 @test11a()
    212   br i1 %d, label %one, label %end
    213 
    214 end:
    215   %f = phi i64 [ %x, %one], [%y, %two]
    216   ; Change the %f to %i, and the optimizer suddenly becomes a lot smarter
    217   ; even though %f must equal %i at this point
    218   %g = inttoptr i64 %f to i32*
    219   store i32 10, i32* %g
    220   %z = call i1 @test11a()
    221   ret i1 %z
    222 ; CHECK: @test11
        ; The negative pattern is a bare "phi" so that a leftover phi of any
        ; type fails the test. The earlier pattern "phi i32" could not match
        ; the i64 phis of this function.
    223 ; CHECK-NOT: phi
    224 ; CHECK: ret i1 %z
    225 }
    226 
    227 
    228 define i64 @test12(i1 %cond, i8* %Ptr, i64 %Val) {
        ; test12: an i128 is built from the zero-extended pointer bits and, on
        ; the %two path, %Val shifted into the upper 64 bits. The end block
        ; reads the low and the high 64-bit halves back out of the i128 phi.
        ; Expected output: no zext before the end label, one i64 phi of
        ; [0, %entry] and [%Val, %two] at the top of end, and no further phi.
    229 entry:
    230   %tmp41 = ptrtoint i8* %Ptr to i64
    231   %tmp42 = zext i64 %tmp41 to i128
    232   br i1 %cond, label %end, label %two
    233 
    234 two:
    235   %tmp36 = zext i64 %Val to i128            ; <i128> [#uses=1]
    236   %tmp37 = shl i128 %tmp36, 64                    ; <i128> [#uses=1]
    237   %ins39 = or i128 %tmp42, %tmp37                 ; <i128> [#uses=1]
    238   br label %end
    239 
    240 end:
    241   %tmp869.0 = phi i128 [ %tmp42, %entry ], [ %ins39, %two ]
    242   %tmp32 = trunc i128 %tmp869.0 to i64            ; <i64> [#uses=1]
    243   %tmp29 = lshr i128 %tmp869.0, 64                ; <i128> [#uses=1]
    244   %tmp30 = trunc i128 %tmp29 to i64               ; <i64> [#uses=1]
    245 
    246   %tmp2 = add i64 %tmp32, %tmp30
    247   ret i64 %tmp2
    248 ; CHECK: @test12
    249 ; CHECK-NOT: zext
    250 ; CHECK: end:
    251 ; CHECK-NEXT: phi i64 [ 0, %entry ], [ %Val, %two ]
    252 ; CHECK-NOT: phi
    253 ; CHECK: ret i64
    254 }
    255 
    256 declare void @test13f(double, i32)
    257 
    258 define void @test13(i1 %cond, i32 %V1, double %Vald) {
        ; test13: like test12, but the low part is an i32 (%V1) and the high
        ; 64 bits hold the bit pattern of a double (%Vald, via bitcast).
        ; Expected output: no zext before the end label, a phi of type double
        ; over [0.0, %entry] and [%Vald, %two], and a call that receives
        ; %V1 directly as its i32 argument.
    259 entry:
    260   %tmp42 = zext i32 %V1 to i128
    261   br i1 %cond, label %end, label %two
    262 
    263 two:
    264   %Val = bitcast double %Vald to i64
    265   %tmp36 = zext i64 %Val to i128            ; <i128> [#uses=1]
    266   %tmp37 = shl i128 %tmp36, 64                    ; <i128> [#uses=1]
    267   %ins39 = or i128 %tmp42, %tmp37                 ; <i128> [#uses=1]
    268   br label %end
    269 
    270 end:
    271   %tmp869.0 = phi i128 [ %tmp42, %entry ], [ %ins39, %two ]
    272   %tmp32 = trunc i128 %tmp869.0 to i32
    273   %tmp29 = lshr i128 %tmp869.0, 64                ; <i128> [#uses=1]
    274   %tmp30 = trunc i128 %tmp29 to i64               ; <i64> [#uses=1]
    275   %tmp31 = bitcast i64 %tmp30 to double
    276   
    277   call void @test13f(double %tmp31, i32 %tmp32)
    278   ret void
    279 ; CHECK: @test13
    280 ; CHECK-NOT: zext
    281 ; CHECK: end:
    282 ; CHECK-NEXT: phi double [ 0.000000e+00, %entry ], [ %Vald, %two ]
    283 ; CHECK-NEXT: call void @test13f(double {{[^,]*}}, i32 %V1)
    284 ; CHECK: ret void
    285 }
    286 
    287 define i640 @test14a(i320 %A, i320 %B, i1 %b1) {
        ; test14a: the phi merges two values that are both zext i320 -> i640.
        ; Expected output: the first instruction of Loop is a phi of type
        ; i320, i.e. the phi operates on the narrower source type.
    288 BB0:
    289         %a = zext i320 %A to i640
    290         %b = zext i320 %B to i640
    291         br label %Loop
    292 
    293 Loop:
    294         %C = phi i640 [ %a, %BB0 ], [ %b, %Loop ]             
    295         br i1 %b1, label %Loop, label %Exit
    296 
    297 Exit:           ; preds = %Loop
    298         ret i640 %C
    299 ; CHECK: @test14a
    300 ; CHECK: Loop:
    301 ; CHECK-NEXT: phi i320
    302 }
    303 
    304 define i160 @test14b(i320 %A, i320 %B, i1 %b1) {
        ; test14b: counterpart of test14a with trunc i320 -> i160 operands.
        ; Expected output: the first instruction of Loop is still a phi of
        ; type i160, i.e. the phi is not widened to the i320 source type.
    305 BB0:
    306         %a = trunc i320 %A to i160
    307         %b = trunc i320 %B to i160
    308         br label %Loop
    309 
    310 Loop:
    311         %C = phi i160 [ %a, %BB0 ], [ %b, %Loop ]             
    312         br i1 %b1, label %Loop, label %Exit
    313 
    314 Exit:           ; preds = %Loop
    315         ret i160 %C
    316 ; CHECK: @test14b
    317 ; CHECK: Loop:
    318 ; CHECK-NEXT: phi i160
    319 }
    320 
    320 declare i64 @test15a(i64)
    321 
    322 define i64 @test15b(i64 %A, i1 %b) {
        ; test15b: %i is an i128 holding %A in both its low and high 64 bits.
        ; The i128 phis %x and %y are only ever read through 64-bit slices
        ; (lshr 64 + trunc, or a plain trunc in the end block).
        ; Expected output: entry contains nothing but the branch, block one
        ; has a single i64 phi before its call, block two has two i64 phis
        ; before its call, and end returns an i64 immediately.
    323 ; CHECK: @test15b
    324 entry:
    325   %i0 = zext i64 %A to i128
    326   %i1 = shl i128 %i0, 64
    327   %i = or i128 %i1, %i0
    328   br i1 %b, label %one, label %two
    329 ; CHECK: entry:
    330 ; CHECK-NEXT: br i1 %b
    331 
    332 one:
    333   %x = phi i128 [%i, %entry], [%y, %two]
    334   %x1 = lshr i128 %x, 64
    335   %x2 = trunc i128 %x1 to i64
    336   %c = call i64 @test15a(i64 %x2)
    337   %c1 = zext i64 %c to i128
    338   br label %two
    339 
    340 ; CHECK: one:
    341 ; CHECK-NEXT: phi i64
    342 ; CHECK-NEXT: %c = call i64 @test15a
    343 
    344 two:
    345   %y = phi i128 [%i, %entry], [%c1, %one]
    346   %y1 = lshr i128 %y, 64
    347   %y2 = trunc i128 %y1 to i64
    348   %d = call i64 @test15a(i64 %y2)
    349   %d1 = trunc i64 %d to i1
    350   br i1 %d1, label %one, label %end
    351 
    352 ; CHECK: two:
    353 ; CHECK-NEXT: phi i64
    354 ; CHECK-NEXT: phi i64
    355 ; CHECK-NEXT: %d = call i64 @test15a
    356 
    357 end:
    358   %g = trunc i128 %y to i64
    359   ret i64 %g
    360 ; CHECK: end: 
    361 ; CHECK-NEXT: ret i64
    362 }
    364 
    365 ; PR6512 - Shouldn't merge loads from different addr spaces.
        ; test16: if.then loads an i32 through an addrspace(1) pointer, if.else
        ; loads an i32 through a default-address-space pointer; both results
        ; are stored to %res and read back in if.end.
        ; NOTE(review): this function carries no FileCheck directives of its
        ; own, so as written it only exercises the pass on this input without
        ; pinning the resulting IR.
    366 define i32 @test16(i32 addrspace(1)* %pointer1, i32 %flag, i32* %pointer2)
    367 nounwind {
    368 entry:
    369   %retval = alloca i32, align 4                   ; <i32*> [#uses=2]
    370   %pointer1.addr = alloca i32 addrspace(1)*, align 4 ; <i32 addrspace(1)**>
    371   %flag.addr = alloca i32, align 4                ; <i32*> [#uses=2]
    372   %pointer2.addr = alloca i32*, align 4           ; <i32**> [#uses=2]
    373   %res = alloca i32, align 4                      ; <i32*> [#uses=4]
    374   store i32 addrspace(1)* %pointer1, i32 addrspace(1)** %pointer1.addr
    375   store i32 %flag, i32* %flag.addr
    376   store i32* %pointer2, i32** %pointer2.addr
    377   store i32 10, i32* %res
    378   %tmp = load i32* %flag.addr                     ; <i32> [#uses=1]
    379   %tobool = icmp ne i32 %tmp, 0                   ; <i1> [#uses=1]
    380   br i1 %tobool, label %if.then, label %if.else
    381 
    382 return:                                           ; preds = %if.end
    383   %tmp7 = load i32* %retval                       ; <i32> [#uses=1]
    384   ret i32 %tmp7
    385 
    386 if.end:                                           ; preds = %if.else, %if.then
    387   %tmp6 = load i32* %res                          ; <i32> [#uses=1]
    388   store i32 %tmp6, i32* %retval
    389   br label %return
    390 
    391 if.then:                                          ; preds = %entry
    392   %tmp1 = load i32 addrspace(1)** %pointer1.addr  ; <i32 addrspace(1)*>
    393   %arrayidx = getelementptr i32 addrspace(1)* %tmp1, i32 0 ; <i32 addrspace(1)*> [#uses=1]
    394   %tmp2 = load i32 addrspace(1)* %arrayidx        ; <i32> [#uses=1]
    395   store i32 %tmp2, i32* %res
    396   br label %if.end
    397 
    398 if.else:                                          ; preds = %entry
    399   %tmp3 = load i32** %pointer2.addr               ; <i32*> [#uses=1]
    400   %arrayidx4 = getelementptr i32* %tmp3, i32 0    ; <i32*> [#uses=1]
    401   %tmp5 = load i32* %arrayidx4                    ; <i32> [#uses=1]
    402   store i32 %tmp5, i32* %res
    403   br label %if.end
    404 }
    405 
    406 ; PR4413
        ; test17: %res selects between %val and 0 using %cond, where %cond and
        ; %val are phis over the same two predecessors. On the %entry edge
        ; both select arms are 0; on the %bb1 edge the select yields %0.
        ; Expected output: the original "%val = phi ..." line does not appear
        ; and the function returns an i32 value named %cond.
        ; NOTE(review): %cond is an i1 in the input; presumably the surviving
        ; i32 phi inherits that name - confirm against actual opt output.
    407 declare i32 @ext()
    408 ; CHECK: @test17
    409 define i32 @test17(i1 %a) {
    410 entry:
    411     br i1 %a, label %bb1, label %bb2
    412 
    413 bb1:        ; preds = %entry
    414     %0 = tail call i32 @ext()        ; <i32> [#uses=1]
    415     br label %bb2
    416 
    417 bb2:        ; preds = %bb1, %entry
    418     %cond = phi i1 [ true, %bb1 ], [ false, %entry ]        ; <i1> [#uses=1]
    419 ; CHECK-NOT: %val = phi i32 [ %0, %bb1 ], [ 0, %entry ]
    420     %val = phi i32 [ %0, %bb1 ], [ 0, %entry ]        ; <i32> [#uses=1]
    421     %res = select i1 %cond, i32 %val, i32 0        ; <i32> [#uses=1]
    422 ; CHECK: ret i32 %cond
    423     ret i32 %res
    424 }
    425 
    425 define i1 @test18(i1 %cond) {
        ; test18: %ptr is a phi of two allocas and is compared against null.
        ; Expected output: the function returns the constant false.
    426   %zero = alloca i32
    427   %one = alloca i32
    428   br i1 %cond, label %true, label %false
    429 true:
    430   br label %ret
    431 false:
    432   br label %ret
    433 ret:
    434   %ptr = phi i32* [ %zero, %true ] , [ %one, %false ]
    435   %isnull = icmp eq i32* %ptr, null
    436   ret i1 %isnull
    437 ; CHECK: @test18
    438 ; CHECK: ret i1 false
    439 }
    441 
    441 define i1 @test19(i1 %cond, double %x) {
        ; test19: %p is either %x itself or +infinity, and the result is
        ; "fcmp ule %x, %p". Expected output: the function returns the
        ; constant true.
    442   br i1 %cond, label %true, label %false
    443 true:
    444   br label %ret
    445 false:
    446   br label %ret
    447 ret:
    448   %p = phi double [ %x, %true ], [ 0x7FF0000000000000, %false ]; RHS = +infty
    449   %cmp = fcmp ule double %x, %p
    450   ret i1 %cmp
    451 ; CHECK: @test19
    452 ; CHECK: ret i1 true
    453 }
    455 
    455 define i1 @test20(i1 %cond) {
        ; test20: %p is a phi of the allocas %a and %b and is compared for
        ; equality against a third alloca %c. Expected output: the function
        ; returns the constant false.
    456   %a = alloca i32
    457   %b = alloca i32
    458   %c = alloca i32
    459   br i1 %cond, label %true, label %false
    460 true:
    461   br label %ret
    462 false:
    463   br label %ret
    464 ret:
    465   %p = phi i32* [ %a, %true ], [ %b, %false ]
    466   %r = icmp eq i32* %p, %c
    467   ret i1 %r
    468 ; CHECK: @test20
    469 ; CHECK: ret i1 false
    470 }
    472 
    472 define i1 @test21(i1 %c1, i1 %c2) {
        ; test21: same comparison as test20, but the phi sits in a loop and
        ; additionally receives itself on the back edge. Expected output:
        ; the function returns the constant false.
    473   %a = alloca i32
    474   %b = alloca i32
    475   %c = alloca i32
    476   br i1 %c1, label %true, label %false
    477 true:
    478   br label %loop
    479 false:
    480   br label %loop
    481 loop:
    482   %p = phi i32* [ %a, %true ], [ %b, %false ], [ %p, %loop ]
    483   %r = icmp eq i32* %p, %c
    484   br i1 %c2, label %ret, label %loop
    485 ret:
    486   ret i1 %r
    487 ; CHECK: @test21
    488 ; CHECK: ret i1 false
    489 }
    491 
    491 define void @test22() {
        ; test22: %phi starts at 0 and is incremented by 1 each iteration;
        ; the loop continues while (%y | %phi) == %y. The only expectation is
        ; that a conditional branch on %e is still present in the output,
        ; i.e. the comparison is not folded to a constant.
    492 ; CHECK: @test22
    493 entry:
    494   br label %loop
    495 loop:
    496   %phi = phi i32 [ 0, %entry ], [ %y, %loop ]
    497   %y = add i32 %phi, 1
    498   %o = or i32 %y, %phi
    499   %e = icmp eq i32 %o, %y
    500   br i1 %e, label %loop, label %ret
    501 ; CHECK: br i1 %e
    502 ret:
    503   ret void
    504 }
    506 
    506 define i32 @test23(i32 %A, i1 %b, i32 * %P) {
        ; test23: every use of the phi %B adds 19 to it (once inside the loop,
        ; once in Exit). Expected output: the add is applied to the incoming
        ; values instead - "%phitmp = add i32 %A, 19" appears before Loop, the
        ; phi merges %phitmp with the constant 61 (42 + 19), and Exit returns
        ; the phi directly.
    507 BB0:
    508         br label %Loop
    509 
    510 Loop:           ; preds = %Loop, %BB0
    511         ; PHI of %A (on entry) and the constant 42 (on the back edge).
    512         %B = phi i32 [ %A, %BB0 ], [ 42, %Loop ]
    513         %D = add i32 %B, 19
    514         store i32 %D, i32* %P
    515         br i1 %b, label %Loop, label %Exit
    516 
    517 Exit:           ; preds = %Loop
    518         %E = add i32 %B, 19
    519         ret i32 %E
    520 ; CHECK: @test23
    521 ; CHECK: %phitmp = add i32 %A, 19
    522 ; CHECK: Loop:
    523 ; CHECK-NEXT: %B = phi i32 [ %phitmp, %BB0 ], [ 61, %Loop ]
    524 ; CHECK: Exit:
    525 ; CHECK-NEXT: ret i32 %B
    526 }
    528 
    529 define i32 @test24(i32 %A, i1 %cond) {
        ; test24: %X and %Y are the same add of %A and 1, but %X carries
        ; "nuw nsw" while %Y carries only "nuw". Expected output: no phi
        ; before BB2, and BB2 holds one add named %C with only the nuw flag
        ; (the flag common to both originals), followed by the return.
    530 BB0:
    531         %X = add nuw nsw i32 %A, 1
    532         br i1 %cond, label %BB1, label %BB2
    533 
    534 BB1:
    535         %Y = add nuw i32 %A, 1
    536         br label %BB2
    537 
    538 BB2:
    539         %C = phi i32 [ %X, %BB0 ], [ %Y, %BB1 ]
    540         ret i32 %C
    541 ; CHECK: @test24
    542 ; CHECK-NOT: phi
    543 ; CHECK: BB2:
    544 ; CHECK-NEXT: %C = add nuw i32 %A, 1
    545 ; CHECK-NEXT: ret i32 %C
    546 }
    547 
    548 ; Same as test11, but used to be missed due to a bug.
        ; test25: identical to test11 except that the incoming-value pairs of
        ; %x and %y are listed in the opposite order. All three phis are i64
        ; and can only ever hold %i; the test expects no phi to remain.
    549 declare i1 @test25a()
    550 
    551 define i1 @test25() {
    552 entry:
    553   %a = alloca i32
    554   %i = ptrtoint i32* %a to i64
    555   %b = call i1 @test25a()
    556   br i1 %b, label %one, label %two
    557 
    558 one:
    559   %x = phi i64 [%y, %two], [%i, %entry]
    560   %c = call i1 @test25a()
    561   br i1 %c, label %two, label %end
    562 
    563 two:
    564   %y = phi i64 [%x, %one], [%i, %entry]
    565   %d = call i1 @test25a()
    566   br i1 %d, label %one, label %end
    567 
    568 end:
    569   %f = phi i64 [ %x, %one], [%y, %two]
    570   ; Change the %f to %i, and the optimizer suddenly becomes a lot smarter
    571   ; even though %f must equal %i at this point
    572   %g = inttoptr i64 %f to i32*
    573   store i32 10, i32* %g
    574   %z = call i1 @test25a()
    575   ret i1 %z
    576 ; CHECK: @test25
        ; The negative pattern is a bare "phi" so that a leftover phi of any
        ; type fails the test. The earlier pattern "phi i32" could not match
        ; the i64 phis of this function, so a missed elimination would have
        ; passed silently.
    577 ; CHECK-NOT: phi
    578 ; CHECK: ret i1 %z
    579 }
    580 
    580 declare i1 @test26a()
    581 
    582 define i1 @test26(i32 %n) {
        ; test26: a larger variant of test11/test25 with three mutually
        ; dependent i64 phis (%x, %y, %w) spread over blocks connected by
        ; switches, plus %f in the end block. The only non-phi incoming value
        ; in the whole cycle is %i (into %x from %entry), so every phi can
        ; only ever hold %i; the test expects no phi to remain.
    583 entry:
    584   %a = alloca i32
    585   %i = ptrtoint i32* %a to i64
    586   %b = call i1 @test26a()
    587   br label %one
    588 
    589 one:
    590   %x = phi i64 [%y, %two], [%w, %three], [%i, %entry]
    591   %c = call i1 @test26a()
    592   switch i32 %n, label %end [
    593           i32 2, label %two
    594           i32 3, label %three
    595   ]
    596 
    597 two:
    598   %y = phi i64 [%x, %one], [%w, %three]
    599   %d = call i1 @test26a()
    600   switch i32 %n, label %end [
    601           i32 10, label %one
    602           i32 30, label %three
    603   ]
    604 
    605 three:
    606   %w = phi i64 [%y, %two], [%x, %one]
    607   %e = call i1 @test26a()
    608   br i1 %e, label %one, label %two
    609 
    610 end:
    611   %f = phi i64 [ %x, %one], [%y, %two]
    612   ; Change the %f to %i, and the optimizer suddenly becomes a lot smarter
    613   ; even though %f must equal %i at this point
    614   %g = inttoptr i64 %f to i32*
    615   store i32 10, i32* %g
    616   %z = call i1 @test26a()
    617   ret i1 %z
    618 ; CHECK: @test26
        ; The negative pattern is a bare "phi" so that a leftover phi of any
        ; type fails the test. The earlier pattern "phi i32" could not match
        ; the i64 phis of this function.
    619 ; CHECK-NOT: phi
    620 ; CHECK: ret i1 %z
    621 }
    622 }
    623