; Check that slow integer division is bypassed only when appropriate.
; RUN: llc -mtriple=x86_64-unknown-linux-gnu -mcpu=atom < %s | FileCheck -check-prefixes=ATOM,CHECK %s
; RUN: llc -mtriple=x86_64-unknown-linux-gnu -mcpu=silvermont < %s | FileCheck -check-prefixes=REST,CHECK %s
; RUN: llc -mtriple=x86_64-unknown-linux-gnu -mcpu=skylake < %s | FileCheck -check-prefixes=REST,CHECK %s
; RUN: llc -profile-summary-huge-working-set-size-threshold=1 -mtriple=x86_64-unknown-linux-gnu -mcpu=skylake < %s | FileCheck -check-prefixes=HUGEWS %s

; 32-bit signed division. Only the Atom invocation expects the 8-bit divb
; fast path (guarded by an or + test of the upper bits); the Silvermont and
; Skylake invocations must not contain a divb at all.
define i32 @div32(i32 %dividend, i32 %divisor) {
entry:
; ATOM-LABEL: div32:
; ATOM: orl %{{.*}}, [[REG:%[a-z]+]]
; ATOM: testl $-256, [[REG]]
; ATOM: divb
;
; REST-LABEL: div32:
; REST-NOT: divb
;
  %quot = sdiv i32 %dividend, %divisor
  ret i32 %quot
}

; 64-bit signed division. All three CPU invocations that share the common
; prefix expect the 32-bit divl fast path, guarded by an or + shift of the
; upper 32 bits.
define i64 @div64(i64 %dividend, i64 %divisor) {
entry:
; CHECK-LABEL: div64:
; CHECK: orq %{{.*}}, [[REG:%[a-z]+]]
; CHECK: shrq $32, [[REG]]
; CHECK: divl
;
  %quot = sdiv i64 %dividend, %divisor
  ret i64 %quot
}


; Verify that no extra code is generated when optimizing for size.

; 64-bit division in an optsize function: no divl bypass may appear before
; the return.
define i64 @div64_optsize(i64 %dividend, i64 %divisor) optsize {
; CHECK-LABEL: div64_optsize:
; CHECK-NOT: divl
; CHECK: ret
  %quot = sdiv i64 %dividend, %divisor
  ret i64 %quot
}

; 64-bit division without size attributes. It is only checked by the
; invocation that passes -profile-summary-huge-working-set-size-threshold=1,
; where no divl bypass may appear before the return.
define i64 @div64_hugews(i64 %dividend, i64 %divisor) {
; HUGEWS-LABEL: div64_hugews:
; HUGEWS-NOT: divl
; HUGEWS: ret
  %quot = sdiv i64 %dividend, %divisor
  ret i64 %quot
}

; 32-bit division in an optsize function: no divb bypass on any of the
; three CPU invocations.
define i32 @div32_optsize(i32 %dividend, i32 %divisor) optsize {
; CHECK-LABEL: div32_optsize:
; CHECK-NOT: divb
; CHECK: ret
  %quot = sdiv i32 %dividend, %divisor
  ret i32 %quot
}

; 32-bit division in a minsize function: no divb bypass on any of the
; three CPU invocations.
define i32 @div32_minsize(i32 %dividend, i32 %divisor) minsize {
; CHECK-LABEL: div32_minsize:
; CHECK-NOT: divb
; CHECK: ret
  %quot = sdiv i32 %dividend, %divisor
  ret i32 %quot
}

; Module-level ProfileSummary attached through the module flags.
; NOTE(review): presumably this summary is what the huge-working-set
; threshold option of the last llc invocation is evaluated against --
; confirm against the ProfileSummaryInfo implementation.
!llvm.module.flags = !{!1}
!1 = !{i32 1, !"ProfileSummary", !2}
!2 = !{!3, !4, !5, !6, !7, !8, !9, !10}
!3 = !{!"ProfileFormat", !"InstrProf"}
!4 = !{!"TotalCount", i64 10000}
!5 = !{!"MaxCount", i64 1000}
!6 = !{!"MaxInternalCount", i64 1}
!7 = !{!"MaxFunctionCount", i64 1000}
!8 = !{!"NumCounts", i64 3}
!9 = !{!"NumFunctions", i64 3}
!10 = !{!"DetailedSummary", !11}
!11 = !{!12, !13, !14}
!12 = !{i32 10000, i64 1000, i32 1}
!13 = !{i32 999000, i64 1000, i32 3}
!14 = !{i32 999999, i64 5, i32 3}