1 ; NOTE: Assertions have been autogenerated by utils/update_test_checks.py 2 ; This test makes sure that div instructions are properly eliminated. 3 4 ; RUN: opt < %s -instcombine -S | FileCheck %s 5 6 define i32 @test1(i32 %A) { 7 ; CHECK-LABEL: @test1( 8 ; CHECK-NEXT: ret i32 %A 9 ; 10 %B = sdiv i32 %A, 1 ; <i32> [#uses=1] 11 ret i32 %B 12 } 13 14 define i32 @test2(i32 %A) { 15 ; => Shift 16 ; CHECK-LABEL: @test2( 17 ; CHECK-NEXT: [[B:%.*]] = lshr i32 %A, 3 18 ; CHECK-NEXT: ret i32 [[B]] 19 ; 20 %B = udiv i32 %A, 8 ; <i32> [#uses=1] 21 ret i32 %B 22 } 23 24 define i32 @test3(i32 %A) { 25 ; => 0, don't need to keep traps 26 ; CHECK-LABEL: @test3( 27 ; CHECK-NEXT: ret i32 0 28 ; 29 %B = sdiv i32 0, %A ; <i32> [#uses=1] 30 ret i32 %B 31 } 32 33 define i32 @test4(i32 %A) { 34 ; 0-A 35 ; CHECK-LABEL: @test4( 36 ; CHECK-NEXT: [[B:%.*]] = sub i32 0, %A 37 ; CHECK-NEXT: ret i32 [[B]] 38 ; 39 %B = sdiv i32 %A, -1 ; <i32> [#uses=1] 40 ret i32 %B 41 } 42 43 define i32 @test5(i32 %A) { 44 ; CHECK-LABEL: @test5( 45 ; CHECK-NEXT: ret i32 0 46 ; 47 %B = udiv i32 %A, -16 ; <i32> [#uses=1] 48 %C = udiv i32 %B, -4 ; <i32> [#uses=1] 49 ret i32 %C 50 } 51 52 define i1 @test6(i32 %A) { 53 ; CHECK-LABEL: @test6( 54 ; CHECK-NEXT: [[TMP1:%.*]] = icmp ult i32 %A, 123 55 ; CHECK-NEXT: ret i1 [[TMP1]] 56 ; 57 %B = udiv i32 %A, 123 ; <i32> [#uses=1] 58 ; A < 123 59 %C = icmp eq i32 %B, 0 ; <i1> [#uses=1] 60 ret i1 %C 61 } 62 63 define i1 @test7(i32 %A) { 64 ; CHECK-LABEL: @test7( 65 ; CHECK-NEXT: [[A_OFF:%.*]] = add i32 %A, -20 66 ; CHECK-NEXT: [[TMP1:%.*]] = icmp ult i32 [[A_OFF]], 10 67 ; CHECK-NEXT: ret i1 [[TMP1]] 68 ; 69 %B = udiv i32 %A, 10 ; <i32> [#uses=1] 70 ; A >= 20 && A < 30 71 %C = icmp eq i32 %B, 2 ; <i1> [#uses=1] 72 ret i1 %C 73 } 74 75 define i1 @test8(i8 %A) { 76 ; CHECK-LABEL: @test8( 77 ; CHECK-NEXT: [[C:%.*]] = icmp ugt i8 %A, -11 78 ; CHECK-NEXT: ret i1 [[C]] 79 ; 80 %B = udiv i8 %A, 123 ; <i8> [#uses=1] 81 ; A >= 246 82 %C = icmp eq i8 %B, 2 ; <i1> [#uses=1] 83 ret i1 %C 84 } 85 86 define i1 @test9(i8 %A) { 87 ; CHECK-LABEL: @test9( 88 ; CHECK-NEXT: [[C:%.*]] = icmp ult i8 %A, -10 89 ; CHECK-NEXT: ret i1 [[C]] 90 ; 91 %B = udiv i8 %A, 123 ; <i8> [#uses=1] 92 ; A < 246 93 %C = icmp ne i8 %B, 2 ; <i1> [#uses=1] 94 ret i1 %C 95 } 96 97 define i32 @test10(i32 %X, i1 %C) { 98 ; CHECK-LABEL: @test10( 99 ; CHECK-NEXT: [[R_V:%.*]] = select i1 %C, i32 6, i32 3 100 ; CHECK-NEXT: [[R:%.*]] = lshr i32 %X, [[R:%.*]].v 101 ; CHECK-NEXT: ret i32 [[R]] 102 ; 103 %V = select i1 %C, i32 64, i32 8 ; <i32> [#uses=1] 104 %R = udiv i32 %X, %V ; <i32> [#uses=1] 105 ret i32 %R 106 } 107 108 define i32 @test11(i32 %X, i1 %C) { 109 ; CHECK-LABEL: @test11( 110 ; CHECK-NEXT: [[B_V:%.*]] = select i1 %C, i32 10, i32 5 111 ; CHECK-NEXT: [[B:%.*]] = lshr i32 %X, [[B:%.*]].v 112 ; CHECK-NEXT: ret i32 [[B]] 113 ; 114 %A = select i1 %C, i32 1024, i32 32 ; <i32> [#uses=1] 115 %B = udiv i32 %X, %A ; <i32> [#uses=1] 116 ret i32 %B 117 } 118 119 ; PR2328 120 define i32 @test12(i32 %x) nounwind { 121 ; CHECK-LABEL: @test12( 122 ; CHECK-NEXT: ret i32 1 123 ; 124 %tmp3 = udiv i32 %x, %x ; 1 125 ret i32 %tmp3 126 } 127 128 define i32 @test13(i32 %x) nounwind { 129 ; CHECK-LABEL: @test13( 130 ; CHECK-NEXT: ret i32 1 131 ; 132 %tmp3 = sdiv i32 %x, %x ; 1 133 ret i32 %tmp3 134 } 135 136 define i32 @test14(i8 %x) nounwind { 137 ; CHECK-LABEL: @test14( 138 ; CHECK-NEXT: ret i32 0 139 ; 140 %zext = zext i8 %x to i32 141 %div = udiv i32 %zext, 257 ; 0 142 ret i32 %div 143 } 144 145 ; PR9814 146 define i32 @test15(i32 %a, i32 %b) nounwind { 147 ; CHECK-LABEL: @test15( 148 ; CHECK-NEXT: [[TMP1:%.*]] = add i32 %b, -2 149 ; CHECK-NEXT: [[DIV2:%.*]] = lshr i32 %a, [[TMP1]] 150 ; CHECK-NEXT: ret i32 [[DIV2]] 151 ; 152 %shl = shl i32 1, %b 153 %div = lshr i32 %shl, 2 154 %div2 = udiv i32 %a, %div 155 ret i32 %div2 156 } 157 158 define <2 x i64> @test16(<2 x i64> %x) nounwind { 159 ; CHECK-LABEL: @test16( 160 ; CHECK-NEXT: [[DIV:%.*]] = udiv <2 x i64> %x, <i64 192, i64 192> 161 ; CHECK-NEXT: ret <2 x i64> [[DIV]] 162 ; 163 %shr = lshr <2 x i64> %x, <i64 5, i64 5> 164 %div = udiv <2 x i64> %shr, <i64 6, i64 6> 165 ret <2 x i64> %div 166 } 167 168 define <2 x i64> @test17(<2 x i64> %x) nounwind { 169 ; CHECK-LABEL: @test17( 170 ; CHECK-NEXT: [[DIV:%.*]] = sdiv <2 x i64> %x, <i64 -3, i64 -4> 171 ; CHECK-NEXT: ret <2 x i64> [[DIV]] 172 ; 173 %neg = sub nsw <2 x i64> zeroinitializer, %x 174 %div = sdiv <2 x i64> %neg, <i64 3, i64 4> 175 ret <2 x i64> %div 176 } 177 178 define <2 x i64> @test18(<2 x i64> %x) nounwind { 179 ; CHECK-LABEL: @test18( 180 ; CHECK-NEXT: [[DIV:%.*]] = sub <2 x i64> zeroinitializer, %x 181 ; CHECK-NEXT: ret <2 x i64> [[DIV]] 182 ; 183 %div = sdiv <2 x i64> %x, <i64 -1, i64 -1> 184 ret <2 x i64> %div 185 } 186 187 define i32 @test19(i32 %x) { 188 ; CHECK-LABEL: @test19( 189 ; CHECK-NEXT: [[TMP1:%.*]] = icmp eq i32 %x, 1 190 ; CHECK-NEXT: [[A:%.*]] = zext i1 [[TMP1]] to i32 191 ; CHECK-NEXT: ret i32 [[A]] 192 ; 193 %A = udiv i32 1, %x 194 ret i32 %A 195 } 196 197 define i32 @test20(i32 %x) { 198 ; CHECK-LABEL: @test20( 199 ; CHECK-NEXT: [[TMP1:%.*]] = add i32 %x, 1 200 ; CHECK-NEXT: [[TMP2:%.*]] = icmp ult i32 [[TMP1]], 3 201 ; CHECK-NEXT: [[A:%.*]] = select i1 [[TMP2]], i32 %x, i32 0 202 ; CHECK-NEXT: ret i32 [[A]] 203 ; 204 %A = sdiv i32 1, %x 205 ret i32 %A 206 } 207 208 define i32 @test21(i32 %a) { 209 ; CHECK-LABEL: @test21( 210 ; CHECK-NEXT: [[DIV:%.*]] = sdiv i32 %a, 3 211 ; CHECK-NEXT: ret i32 [[DIV]] 212 ; 213 %shl = shl nsw i32 %a, 2 214 %div = sdiv i32 %shl, 12 215 ret i32 %div 216 } 217 218 define i32 @test22(i32 %a) { 219 ; CHECK-LABEL: @test22( 220 ; CHECK-NEXT: [[DIV:%.*]] = sdiv i32 %a, 4 221 ; CHECK-NEXT: ret i32 [[DIV]] 222 ; 223 %mul = mul nsw i32 %a, 3 224 %div = sdiv i32 %mul, 12 225 ret i32 %div 226 } 227 228 define i32 @test23(i32 %a) { 229 ; CHECK-LABEL: @test23( 230 ; CHECK-NEXT: [[DIV:%.*]] = udiv i32 %a, 3 231 ; CHECK-NEXT: ret i32 [[DIV]] 232 ; 233 %shl = shl nuw i32 %a, 2 234 %div = udiv i32 %shl, 12 235 ret i32 %div 236 } 237 238 define i32 @test24(i32 %a) { 239 ; CHECK-LABEL: @test24( 240 ; CHECK-NEXT: [[DIV:%.*]] = lshr i32 %a, 2 241 ; CHECK-NEXT: ret i32 [[DIV]] 242 ; 243 %mul = mul nuw i32 %a, 3 244 %div = udiv i32 %mul, 12 245 ret i32 %div 246 } 247 248 define i32 @test25(i32 %a) { 249 ; CHECK-LABEL: @test25( 250 ; CHECK-NEXT: [[DIV:%.*]] = shl nsw i32 %a, 1 251 ; CHECK-NEXT: ret i32 [[DIV]] 252 ; 253 %shl = shl nsw i32 %a, 2 254 %div = sdiv i32 %shl, 2 255 ret i32 %div 256 } 257 258 define i32 @test26(i32 %a) { 259 ; CHECK-LABEL: @test26( 260 ; CHECK-NEXT: [[DIV:%.*]] = shl nsw i32 %a, 2 261 ; CHECK-NEXT: ret i32 [[DIV]] 262 ; 263 %mul = mul nsw i32 %a, 12 264 %div = sdiv i32 %mul, 3 265 ret i32 %div 266 } 267 268 define i32 @test27(i32 %a) { 269 ; CHECK-LABEL: @test27( 270 ; CHECK-NEXT: [[DIV:%.*]] = shl nuw i32 %a, 1 271 ; CHECK-NEXT: ret i32 [[DIV]] 272 ; 273 %shl = shl nuw i32 %a, 2 274 %div = udiv i32 %shl, 2 275 ret i32 %div 276 } 277 278 define i32 @test28(i32 %a) { 279 ; CHECK-LABEL: @test28( 280 ; CHECK-NEXT: [[DIV:%.*]] = mul nuw i32 %a, 12 281 ; CHECK-NEXT: ret i32 [[DIV]] 282 ; 283 %mul = mul nuw i32 %a, 36 284 %div = udiv i32 %mul, 3 285 ret i32 %div 286 } 287 288 define i32 @test29(i32 %a) { 289 ; CHECK-LABEL: @test29( 290 ; CHECK-NEXT: [[MUL_LOBIT:%.*]] = and i32 %a, 1 291 ; CHECK-NEXT: ret i32 [[MUL_LOBIT]] 292 ; 293 %mul = shl nsw i32 %a, 31 294 %div = sdiv i32 %mul, -2147483648 295 ret i32 %div 296 } 297 298 define i32 @test30(i32 %a) { 299 ; CHECK-LABEL: @test30( 300 ; CHECK-NEXT: ret i32 %a 301 ; 302 %mul = shl nuw i32 %a, 31 303 %div = udiv i32 %mul, -2147483648 304 ret i32 %div 305 } 306 307 define <2 x i32> @test31(<2 x i32> %x) { 308 ; CHECK-LABEL: @test31( 309 ; CHECK-NEXT: ret <2 x i32> zeroinitializer 310 ; 311 %shr = lshr <2 x i32> %x, <i32 31, i32 31> 312 %div = udiv <2 x i32> %shr, <i32 2147483647, i32 2147483647> 313 ret <2 x i32> %div 314 } 315 316 define i32 @test32(i32 %a, i32 %b) { 317 ; CHECK-LABEL: @test32( 318 ; CHECK-NEXT: [[SHL:%.*]] = shl i32 2, %b 319 ; CHECK-NEXT: [[DIV:%.*]] = lshr i32 [[SHL]], 2 320 ; CHECK-NEXT: [[DIV2:%.*]] = udiv i32 %a, [[DIV]] 321 ; CHECK-NEXT: ret i32 [[DIV2]] 322 ; 323 %shl = shl i32 2, %b 324 %div = lshr i32 %shl, 2 325 %div2 = udiv i32 %a, %div 326 ret i32 %div2 327 } 328 329 define <2 x i64> @test33(<2 x i64> %x) nounwind { 330 ; CHECK-LABEL: @test33( 331 ; CHECK-NEXT: [[DIV:%.*]] = udiv exact <2 x i64> %x, <i64 192, i64 192> 332 ; CHECK-NEXT: ret <2 x i64> [[DIV]] 333 ; 334 %shr = lshr exact <2 x i64> %x, <i64 5, i64 5> 335 %div = udiv exact <2 x i64> %shr, <i64 6, i64 6> 336 ret <2 x i64> %div 337 } 338 339 define <2 x i64> @test34(<2 x i64> %x) nounwind { 340 ; CHECK-LABEL: @test34( 341 ; CHECK-NEXT: [[DIV:%.*]] = sdiv exact <2 x i64> %x, <i64 -3, i64 -4> 342 ; CHECK-NEXT: ret <2 x i64> [[DIV]] 343 ; 344 %neg = sub nsw <2 x i64> zeroinitializer, %x 345 %div = sdiv exact <2 x i64> %neg, <i64 3, i64 4> 346 ret <2 x i64> %div 347 } 348 349 define i32 @test35(i32 %A) { 350 ; CHECK-LABEL: @test35( 351 ; CHECK-NEXT: [[AND:%.*]] = and i32 %A, 2147483647 352 ; CHECK-NEXT: [[MUL:%.*]] = udiv exact i32 [[AND]], 2147483647 353 ; CHECK-NEXT: ret i32 [[MUL]] 354 ; 355 %and = and i32 %A, 2147483647 356 %mul = sdiv exact i32 %and, 2147483647 357 ret i32 %mul 358 } 359 360 define i32 @test36(i32 %A) { 361 ; CHECK-LABEL: @test36( 362 ; CHECK-NEXT: [[AND:%.*]] = and i32 %A, 2147483647 363 ; CHECK-NEXT: [[MUL:%.*]] = lshr exact i32 [[AND]], %A 364 ; CHECK-NEXT: ret i32 [[MUL]] 365 ; 366 %and = and i32 %A, 2147483647 367 %shl = shl nsw i32 1, %A 368 %mul = sdiv exact i32 %and, %shl 369 ret i32 %mul 370 } 371 372 ; FIXME: Vector should get same transform as scalar. 373 374 define <2 x i32> @test36vec(<2 x i32> %A) { 375 ; CHECK-LABEL: @test36vec( 376 ; CHECK-NEXT: [[AND:%.*]] = and <2 x i32> %A, <i32 2147483647, i32 2147483647> 377 ; CHECK-NEXT: [[SHL:%.*]] = shl nuw nsw <2 x i32> <i32 1, i32 1>, %A 378 ; CHECK-NEXT: [[MUL:%.*]] = sdiv exact <2 x i32> [[AND]], [[SHL]] 379 ; CHECK-NEXT: ret <2 x i32> [[MUL]] 380 ; 381 %and = and <2 x i32> %A, <i32 2147483647, i32 2147483647> 382 %shl = shl nsw <2 x i32> <i32 1, i32 1>, %A 383 %mul = sdiv exact <2 x i32> %and, %shl 384 ret <2 x i32> %mul 385 } 386 387 define i32 @test37(i32* %b) { 388 ; CHECK-LABEL: @test37( 389 ; CHECK-NEXT: entry: 390 ; CHECK-NEXT: store i32 0, i32* %b, align 4 391 ; CHECK-NEXT: br i1 undef, label %lor.rhs, label %lor.end 392 ; CHECK: lor.rhs: 393 ; CHECK-NEXT: br label %lor.end 394 ; CHECK: lor.end: 395 ; CHECK-NEXT: ret i32 0 396 ; 397 entry: 398 store i32 0, i32* %b, align 4 399 %0 = load i32, i32* %b, align 4 400 br i1 undef, label %lor.rhs, label %lor.end 401 402 lor.rhs: ; preds = %entry 403 %mul = mul nsw i32 undef, %0 404 br label %lor.end 405 406 lor.end: ; preds = %lor.rhs, %entry 407 %t.0 = phi i32 [ %0, %entry ], [ %mul, %lor.rhs ] 408 %div = sdiv i32 %t.0, 2 409 ret i32 %div 410 } 411 412 ; We can perform the division in the smaller type. 413 414 define i32 @shrink(i8 %x) { 415 ; CHECK-LABEL: @shrink( 416 ; CHECK-NEXT: [[TMP1:%.*]] = sdiv i8 %x, 127 417 ; CHECK-NEXT: [[DIV:%.*]] = sext i8 [[TMP1]] to i32 418 ; CHECK-NEXT: ret i32 [[DIV]] 419 ; 420 %conv = sext i8 %x to i32 421 %div = sdiv i32 %conv, 127 422 ret i32 %div 423 } 424 425 ; Division in the smaller type can lead to more optimizations. 426 427 define i32 @zap(i8 %x) { 428 ; CHECK-LABEL: @zap( 429 ; CHECK-NEXT: [[TMP1:%.*]] = icmp eq i8 %x, -128 430 ; CHECK-NEXT: [[DIV:%.*]] = zext i1 [[TMP1]] to i32 431 ; CHECK-NEXT: ret i32 [[DIV]] 432 ; 433 %conv = sext i8 %x to i32 434 %div = sdiv i32 %conv, -128 435 ret i32 %div 436 } 437 438 ; Splat constant divisors should get the same folds. 439 440 define <3 x i32> @shrink_vec(<3 x i8> %x) { 441 ; CHECK-LABEL: @shrink_vec( 442 ; CHECK-NEXT: [[TMP1:%.*]] = sdiv <3 x i8> %x, <i8 127, i8 127, i8 127> 443 ; CHECK-NEXT: [[DIV:%.*]] = sext <3 x i8> [[TMP1]] to <3 x i32> 444 ; CHECK-NEXT: ret <3 x i32> [[DIV]] 445 ; 446 %conv = sext <3 x i8> %x to <3 x i32> 447 %div = sdiv <3 x i32> %conv, <i32 127, i32 127, i32 127> 448 ret <3 x i32> %div 449 } 450 451 define <2 x i32> @zap_vec(<2 x i8> %x) { 452 ; CHECK-LABEL: @zap_vec( 453 ; CHECK-NEXT: [[TMP1:%.*]] = icmp eq <2 x i8> %x, <i8 -128, i8 -128> 454 ; CHECK-NEXT: [[DIV:%.*]] = zext <2 x i1> [[TMP1]] to <2 x i32> 455 ; CHECK-NEXT: ret <2 x i32> [[DIV]] 456 ; 457 %conv = sext <2 x i8> %x to <2 x i32> 458 %div = sdiv <2 x i32> %conv, <i32 -128, i32 -128> 459 ret <2 x i32> %div 460 } 461 462 ; But we can't do this if the signed constant won't fit in the original type. 463 464 define i32 @shrink_no(i8 %x) { 465 ; CHECK-LABEL: @shrink_no( 466 ; CHECK-NEXT: [[CONV:%.*]] = sext i8 %x to i32 467 ; CHECK-NEXT: [[DIV:%.*]] = sdiv i32 [[CONV]], 128 468 ; CHECK-NEXT: ret i32 [[DIV]] 469 ; 470 %conv = sext i8 %x to i32 471 %div = sdiv i32 %conv, 128 472 ret i32 %div 473 } 474 475 define i32 @shrink_no2(i8 %x) { 476 ; CHECK-LABEL: @shrink_no2( 477 ; CHECK-NEXT: [[CONV:%.*]] = sext i8 %x to i32 478 ; CHECK-NEXT: [[DIV:%.*]] = sdiv i32 [[CONV]], -129 479 ; CHECK-NEXT: ret i32 [[DIV]] 480 ; 481 %conv = sext i8 %x to i32 482 %div = sdiv i32 %conv, -129 483 ret i32 %div 484 } 485 486 ; 17 bits are needed to represent 65535 as a signed value, so this shouldn't fold. 487 488 define i32 @shrink_no3(i16 %x) { 489 ; CHECK-LABEL: @shrink_no3( 490 ; CHECK-NEXT: [[CONV:%.*]] = sext i16 %x to i32 491 ; CHECK-NEXT: [[DIV:%.*]] = sdiv i32 [[CONV]], 65535 492 ; CHECK-NEXT: ret i32 [[DIV]] 493 ; 494 %conv = sext i16 %x to i32 495 %div = sdiv i32 %conv, 65535 496 ret i32 %div 497 } 498 499