Home | History | Annotate | Download | only in SampleProfile
      1 ; RUN: opt < %s -sample-profile -sample-profile-file=%S/Inputs/propagate.prof | opt -analyze -branch-prob | FileCheck %s
      2 ; RUN: opt < %s -passes=sample-profile -sample-profile-file=%S/Inputs/propagate.prof | opt -analyze -branch-prob | FileCheck %s
      3 
      4 ; Original C++ code for this test case:
      5 ;
      6 ; #include <stdio.h>
      7 ;
      8 ; long foo(int x, int y, long N) {
      9 ;   if (x < y) {
     10 ;     return y - x;
     11 ;   } else {
     12 ;     for (long i = 0; i < N; i++) {
     13 ;       if (i > N / 3)
     14 ;         x--;
     15 ;       if (i > N / 4) {
     16 ;         y++;
     17 ;         x += 3;
     18 ;       } else {
     19 ;         for (long long j = 0; j < 100; j++) {
     20 ;           x += j;
     21 ;           y -= 3;
     22 ;         }
     23 ;       }
     24 ;     }
     25 ;   }
     26 ;   return y * x;
     27 ; }
     28 ;
     29 ; int main() {
     30 ;   int x = 5678;
     31 ;   int y = 1234;
     32 ;   long N = 9999999;
     33 ;   printf("foo(%d, %d, %ld) = %ld\n", x, y, N, foo(x, y, N));
     34 ;   return 0;
     35 ; }
     36 
     37 ; ModuleID = 'propagate.cc'
     38 target datalayout = "e-m:e-i64:64-f80:128-n8:16:32:64-S128"
     39 target triple = "x86_64-unknown-linux-gnu"
     40 
     41 @.str = private unnamed_addr constant [24 x i8] c"foo(%d, %d, %ld) = %ld\0A\00", align 1
     42 
     43 ; Function Attrs: nounwind uwtable
     44 define i64 @_Z3fooiil(i32 %x, i32 %y, i64 %N) #0 !dbg !6 {
     45 entry:
     46   %retval = alloca i64, align 8
     47   %x.addr = alloca i32, align 4
     48   %y.addr = alloca i32, align 4
     49   %N.addr = alloca i64, align 8
     50   %i = alloca i64, align 8
     51   %j = alloca i64, align 8
     52   store i32 %x, i32* %x.addr, align 4
     53   call void @llvm.dbg.declare(metadata i32* %x.addr, metadata !11, metadata !12), !dbg !13
     54   store i32 %y, i32* %y.addr, align 4
     55   call void @llvm.dbg.declare(metadata i32* %y.addr, metadata !14, metadata !12), !dbg !15
     56   store i64 %N, i64* %N.addr, align 8
     57   call void @llvm.dbg.declare(metadata i64* %N.addr, metadata !16, metadata !12), !dbg !17
     58   %0 = load i32, i32* %x.addr, align 4, !dbg !18
     59   %1 = load i32, i32* %y.addr, align 4, !dbg !20
     60   %cmp = icmp slt i32 %0, %1, !dbg !21
     61   br i1 %cmp, label %if.then, label %if.else, !dbg !22
     62 
     63 if.then:                                          ; preds = %entry
     64   %2 = load i32, i32* %y.addr, align 4, !dbg !23
     65   %3 = load i32, i32* %x.addr, align 4, !dbg !25
     66   %sub = sub nsw i32 %2, %3, !dbg !26
     67   %conv = sext i32 %sub to i64, !dbg !23
     68   store i64 %conv, i64* %retval, align 8, !dbg !27
     69   br label %return, !dbg !27
     70 
     71 if.else:                                          ; preds = %entry
     72   call void @llvm.dbg.declare(metadata i64* %i, metadata !28, metadata !12), !dbg !31
     73   store i64 0, i64* %i, align 8, !dbg !31
     74   br label %for.cond, !dbg !32
     75 
     76 for.cond:                                         ; preds = %for.inc17, %if.else
     77   %4 = load i64, i64* %i, align 8, !dbg !33
     78   %5 = load i64, i64* %N.addr, align 8, !dbg !36
     79   %cmp1 = icmp slt i64 %4, %5, !dbg !37
     80   br i1 %cmp1, label %for.body, label %for.end19, !dbg !38
     81 
     82 for.body:                                         ; preds = %for.cond
     83   %6 = load i64, i64* %i, align 8, !dbg !39
     84   %7 = load i64, i64* %N.addr, align 8, !dbg !42
     85   %div = sdiv i64 %7, 3, !dbg !43
     86   %cmp2 = icmp sgt i64 %6, %div, !dbg !44
     87   br i1 %cmp2, label %if.then3, label %if.end, !dbg !45
     88 ; CHECK:  edge for.body -> if.then3 probability is 0x51451451 / 0x80000000 = 63.49%
     89 ; CHECK:  edge for.body -> if.end probability is 0x2ebaebaf / 0x80000000 = 36.51%
     90 
     91 if.then3:                                         ; preds = %for.body
     92   %8 = load i32, i32* %x.addr, align 4, !dbg !46
     93   %dec = add nsw i32 %8, -1, !dbg !46
     94   store i32 %dec, i32* %x.addr, align 4, !dbg !46
     95   br label %if.end, !dbg !47
     96 
     97 if.end:                                           ; preds = %if.then3, %for.body
     98   %9 = load i64, i64* %i, align 8, !dbg !48
     99   %10 = load i64, i64* %N.addr, align 8, !dbg !50
    100   %div4 = sdiv i64 %10, 4, !dbg !51
    101   %cmp5 = icmp sgt i64 %9, %div4, !dbg !52
    102   br i1 %cmp5, label %if.then6, label %if.else7, !dbg !53
    103 ; CHECK:  edge if.end -> if.then6 probability is 0x5dbaa1dc / 0x80000000 = 73.23%
    104 ; CHECK:  edge if.end -> if.else7 probability is 0x22455e24 / 0x80000000 = 26.77%
    105 
    106 if.then6:                                         ; preds = %if.end
    107   %11 = load i32, i32* %y.addr, align 4, !dbg !54
    108   %inc = add nsw i32 %11, 1, !dbg !54
    109   store i32 %inc, i32* %y.addr, align 4, !dbg !54
    110   %12 = load i32, i32* %x.addr, align 4, !dbg !56
    111   %add = add nsw i32 %12, 3, !dbg !56
    112   store i32 %add, i32* %x.addr, align 4, !dbg !56
    113   br label %if.end16, !dbg !57
    114 
    115 if.else7:                                         ; preds = %if.end
    116   call void @llvm.dbg.declare(metadata i64* %j, metadata !58, metadata !12), !dbg !62
    117   store i64 0, i64* %j, align 8, !dbg !62
    118   br label %for.cond8, !dbg !63
    119 
    120 for.cond8:                                        ; preds = %for.inc, %if.else7
    121   %13 = load i64, i64* %j, align 8, !dbg !64
    122   %cmp9 = icmp slt i64 %13, 100, !dbg !67
    123   br i1 %cmp9, label %for.body10, label %for.end, !dbg !68
    124 ; CHECK: edge for.cond8 -> for.body10 probability is 0x7e985735 / 0x80000000 = 98.90% [HOT edge]
    125 ; CHECK: edge for.cond8 -> for.end probability is 0x0167a8cb / 0x80000000 = 1.10%
    126 
    127 
    128 for.body10:                                       ; preds = %for.cond8
    129   %14 = load i64, i64* %j, align 8, !dbg !69
    130   %15 = load i32, i32* %x.addr, align 4, !dbg !71
    131   %conv11 = sext i32 %15 to i64, !dbg !71
    132   %add12 = add nsw i64 %conv11, %14, !dbg !71
    133   %conv13 = trunc i64 %add12 to i32, !dbg !71
    134   store i32 %conv13, i32* %x.addr, align 4, !dbg !71
    135   %16 = load i32, i32* %y.addr, align 4, !dbg !72
    136   %sub14 = sub nsw i32 %16, 3, !dbg !72
    137   store i32 %sub14, i32* %y.addr, align 4, !dbg !72
    138   br label %for.inc, !dbg !73
    139 
    140 for.inc:                                          ; preds = %for.body10
    141   %17 = load i64, i64* %j, align 8, !dbg !74
    142   %inc15 = add nsw i64 %17, 1, !dbg !74
    143   store i64 %inc15, i64* %j, align 8, !dbg !74
    144   br label %for.cond8, !dbg !76
    145 
    146 for.end:                                          ; preds = %for.cond8
    147   br label %if.end16
    148 
    149 if.end16:                                         ; preds = %for.end, %if.then6
    150   br label %for.inc17, !dbg !77
    151 
    152 for.inc17:                                        ; preds = %if.end16
    153   %18 = load i64, i64* %i, align 8, !dbg !78
    154   %inc18 = add nsw i64 %18, 1, !dbg !78
    155   store i64 %inc18, i64* %i, align 8, !dbg !78
    156   br label %for.cond, !dbg !80
    157 
    158 for.end19:                                        ; preds = %for.cond
    159   br label %if.end20
    160 
    161 if.end20:                                         ; preds = %for.end19
    162   %19 = load i32, i32* %y.addr, align 4, !dbg !81
    163   %20 = load i32, i32* %x.addr, align 4, !dbg !82
    164   %mul = mul nsw i32 %19, %20, !dbg !83
    165   %conv21 = sext i32 %mul to i64, !dbg !81
    166   store i64 %conv21, i64* %retval, align 8, !dbg !84
    167   br label %return, !dbg !84
    168 
    169 return:                                           ; preds = %if.end20, %if.then
    170   %21 = load i64, i64* %retval, align 8, !dbg !85
    171   ret i64 %21, !dbg !85
    172 }
    173 
    174 ; Function Attrs: nounwind readnone
    175 declare void @llvm.dbg.declare(metadata, metadata, metadata) #1
    176 
    177 ; Function Attrs: norecurse uwtable
    178 define i32 @main() #2 !dbg !86 {
    179 entry:
    180   %retval = alloca i32, align 4
    181   %x = alloca i32, align 4
    182   %y = alloca i32, align 4
    183   %N = alloca i64, align 8
    184   store i32 0, i32* %retval, align 4
    185   call void @llvm.dbg.declare(metadata i32* %x, metadata !89, metadata !12), !dbg !90
    186   store i32 5678, i32* %x, align 4, !dbg !90
    187   call void @llvm.dbg.declare(metadata i32* %y, metadata !91, metadata !12), !dbg !92
    188   store i32 1234, i32* %y, align 4, !dbg !92
    189   call void @llvm.dbg.declare(metadata i64* %N, metadata !93, metadata !12), !dbg !94
    190   store i64 9999999, i64* %N, align 8, !dbg !94
    191   %0 = load i32, i32* %x, align 4, !dbg !95
    192   %1 = load i32, i32* %y, align 4, !dbg !96
    193   %2 = load i64, i64* %N, align 8, !dbg !97
    194   %3 = load i32, i32* %x, align 4, !dbg !98
    195   %4 = load i32, i32* %y, align 4, !dbg !99
    196   %5 = load i64, i64* %N, align 8, !dbg !100
    197   %call = call i64 @_Z3fooiil(i32 %3, i32 %4, i64 %5), !dbg !101
    198   %call1 = call i32 (i8*, ...) @printf(i8* getelementptr inbounds ([24 x i8], [24 x i8]* @.str, i32 0, i32 0), i32 %0, i32 %1, i64 %2, i64 %call), !dbg !102
    199   ret i32 0, !dbg !104
    200 }
    201 
    202 declare i32 @printf(i8*, ...) #3
    203 
    204 attributes #0 = { nounwind uwtable "disable-tail-calls"="false" "less-precise-fpmad"="false" "no-frame-pointer-elim"="true" "no-frame-pointer-elim-non-leaf" "no-infs-fp-math"="false" "no-jump-tables"="false" "no-nans-fp-math"="false" "stack-protector-buffer-size"="8" "target-cpu"="x86-64" "target-features"="+fxsr,+mmx,+sse,+sse2,+x87" "unsafe-fp-math"="false" "use-soft-float"="false" }
    205 attributes #1 = { nounwind readnone }
    206 attributes #2 = { norecurse uwtable "disable-tail-calls"="false" "less-precise-fpmad"="false" "no-frame-pointer-elim"="true" "no-frame-pointer-elim-non-leaf" "no-infs-fp-math"="false" "no-jump-tables"="false" "no-nans-fp-math"="false" "stack-protector-buffer-size"="8" "target-cpu"="x86-64" "target-features"="+fxsr,+mmx,+sse,+sse2,+x87" "unsafe-fp-math"="false" "use-soft-float"="false" }
    207 attributes #3 = { "disable-tail-calls"="false" "less-precise-fpmad"="false" "no-frame-pointer-elim"="true" "no-frame-pointer-elim-non-leaf" "no-infs-fp-math"="false" "no-nans-fp-math"="false" "stack-protector-buffer-size"="8" "target-cpu"="x86-64" "target-features"="+fxsr,+mmx,+sse,+sse2,+x87" "unsafe-fp-math"="false" "use-soft-float"="false" }
    208 
    209 !llvm.dbg.cu = !{!0}
    210 !llvm.module.flags = !{!3, !4}
    211 !llvm.ident = !{!5}
    212 
    213 !0 = distinct !DICompileUnit(language: DW_LANG_C_plus_plus, file: !1, producer: "clang version 3.9.0 (trunk 266819)", isOptimized: false, runtimeVersion: 0, emissionKind: FullDebug, enums: !2)
    214 !1 = !DIFile(filename: "propagate.cc", directory: ".")
    215 !2 = !{}
    216 !3 = !{i32 2, !"Dwarf Version", i32 4}
    217 !4 = !{i32 2, !"Debug Info Version", i32 3}
    218 !5 = !{!"clang version 3.9.0 (trunk 266819)"}
    219 !6 = distinct !DISubprogram(name: "foo", linkageName: "_Z3fooiil", scope: !1, file: !1, line: 3, type: !7, isLocal: false, isDefinition: true, scopeLine: 3, flags: DIFlagPrototyped, isOptimized: false, unit: !0, variables: !2)
    220 !7 = !DISubroutineType(types: !8)
    221 !8 = !{!9, !10, !10, !9}
    222 !9 = !DIBasicType(name: "long int", size: 64, align: 64, encoding: DW_ATE_signed)
    223 !10 = !DIBasicType(name: "int", size: 32, align: 32, encoding: DW_ATE_signed)
    224 !11 = !DILocalVariable(name: "x", arg: 1, scope: !6, file: !1, line: 3, type: !10)
    225 !12 = !DIExpression()
    226 !13 = !DILocation(line: 3, column: 14, scope: !6)
    227 !14 = !DILocalVariable(name: "y", arg: 2, scope: !6, file: !1, line: 3, type: !10)
    228 !15 = !DILocation(line: 3, column: 21, scope: !6)
    229 !16 = !DILocalVariable(name: "N", arg: 3, scope: !6, file: !1, line: 3, type: !9)
    230 !17 = !DILocation(line: 3, column: 29, scope: !6)
    231 !18 = !DILocation(line: 4, column: 7, scope: !19)
    232 !19 = distinct !DILexicalBlock(scope: !6, file: !1, line: 4, column: 7)
    233 !20 = !DILocation(line: 4, column: 11, scope: !19)
    234 !21 = !DILocation(line: 4, column: 9, scope: !19)
    235 !22 = !DILocation(line: 4, column: 7, scope: !6)
    236 !23 = !DILocation(line: 5, column: 12, scope: !24)
    237 !24 = distinct !DILexicalBlock(scope: !19, file: !1, line: 4, column: 14)
    238 !25 = !DILocation(line: 5, column: 16, scope: !24)
    239 !26 = !DILocation(line: 5, column: 14, scope: !24)
    240 !27 = !DILocation(line: 5, column: 5, scope: !24)
    241 !28 = !DILocalVariable(name: "i", scope: !29, file: !1, line: 7, type: !9)
    242 !29 = distinct !DILexicalBlock(scope: !30, file: !1, line: 7, column: 5)
    243 !30 = distinct !DILexicalBlock(scope: !19, file: !1, line: 6, column: 10)
    244 !31 = !DILocation(line: 7, column: 15, scope: !29)
    245 !32 = !DILocation(line: 7, column: 10, scope: !29)
    246 !33 = !DILocation(line: 7, column: 22, scope: !34)
    247 !34 = !DILexicalBlockFile(scope: !35, file: !1, discriminator: 1)
    248 !35 = distinct !DILexicalBlock(scope: !29, file: !1, line: 7, column: 5)
    249 !36 = !DILocation(line: 7, column: 26, scope: !34)
    250 !37 = !DILocation(line: 7, column: 24, scope: !34)
    251 !38 = !DILocation(line: 7, column: 5, scope: !34)
    252 !39 = !DILocation(line: 8, column: 11, scope: !40)
    253 !40 = distinct !DILexicalBlock(scope: !41, file: !1, line: 8, column: 11)
    254 !41 = distinct !DILexicalBlock(scope: !35, file: !1, line: 7, column: 34)
    255 !42 = !DILocation(line: 8, column: 15, scope: !40)
    256 !43 = !DILocation(line: 8, column: 17, scope: !40)
    257 !44 = !DILocation(line: 8, column: 13, scope: !40)
    258 !45 = !DILocation(line: 8, column: 11, scope: !41)
    259 !46 = !DILocation(line: 9, column: 10, scope: !40)
    260 !47 = !DILocation(line: 9, column: 9, scope: !40)
    261 !48 = !DILocation(line: 10, column: 11, scope: !49)
    262 !49 = distinct !DILexicalBlock(scope: !41, file: !1, line: 10, column: 11)
    263 !50 = !DILocation(line: 10, column: 15, scope: !49)
    264 !51 = !DILocation(line: 10, column: 17, scope: !49)
    265 !52 = !DILocation(line: 10, column: 13, scope: !49)
    266 !53 = !DILocation(line: 10, column: 11, scope: !41)
    267 !54 = !DILocation(line: 11, column: 10, scope: !55)
    268 !55 = distinct !DILexicalBlock(scope: !49, file: !1, line: 10, column: 22)
    269 !56 = !DILocation(line: 12, column: 11, scope: !55)
    270 !57 = !DILocation(line: 13, column: 7, scope: !55)
    271 !58 = !DILocalVariable(name: "j", scope: !59, file: !1, line: 14, type: !61)
    272 !59 = distinct !DILexicalBlock(scope: !60, file: !1, line: 14, column: 9)
    273 !60 = distinct !DILexicalBlock(scope: !49, file: !1, line: 13, column: 14)
    274 !61 = !DIBasicType(name: "long long int", size: 64, align: 64, encoding: DW_ATE_signed)
    275 !62 = !DILocation(line: 14, column: 24, scope: !59)
    276 !63 = !DILocation(line: 14, column: 14, scope: !59)
    277 !64 = !DILocation(line: 14, column: 31, scope: !65)
    278 !65 = !DILexicalBlockFile(scope: !66, file: !1, discriminator: 1)
    279 !66 = distinct !DILexicalBlock(scope: !59, file: !1, line: 14, column: 9)
    280 !67 = !DILocation(line: 14, column: 33, scope: !65)
    281 !68 = !DILocation(line: 14, column: 9, scope: !65)
    282 !69 = !DILocation(line: 15, column: 16, scope: !70)
    283 !70 = distinct !DILexicalBlock(scope: !66, file: !1, line: 14, column: 45)
    284 !71 = !DILocation(line: 15, column: 13, scope: !70)
    285 !72 = !DILocation(line: 16, column: 13, scope: !70)
    286 !73 = !DILocation(line: 17, column: 9, scope: !70)
    287 !74 = !DILocation(line: 14, column: 41, scope: !75)
    288 !75 = !DILexicalBlockFile(scope: !66, file: !1, discriminator: 2)
    289 !76 = !DILocation(line: 14, column: 9, scope: !75)
    290 !77 = !DILocation(line: 19, column: 5, scope: !41)
    291 !78 = !DILocation(line: 7, column: 30, scope: !79)
    292 !79 = !DILexicalBlockFile(scope: !35, file: !1, discriminator: 2)
    293 !80 = !DILocation(line: 7, column: 5, scope: !79)
    294 !81 = !DILocation(line: 21, column: 10, scope: !6)
    295 !82 = !DILocation(line: 21, column: 14, scope: !6)
    296 !83 = !DILocation(line: 21, column: 12, scope: !6)
    297 !84 = !DILocation(line: 21, column: 3, scope: !6)
    298 !85 = !DILocation(line: 22, column: 1, scope: !6)
    299 !86 = distinct !DISubprogram(name: "main", scope: !1, file: !1, line: 24, type: !87, isLocal: false, isDefinition: true, scopeLine: 24, flags: DIFlagPrototyped, isOptimized: false, unit: !0, variables: !2)
    300 !87 = !DISubroutineType(types: !88)
    301 !88 = !{!10}
    302 !89 = !DILocalVariable(name: "x", scope: !86, file: !1, line: 25, type: !10)
    303 !90 = !DILocation(line: 25, column: 7, scope: !86)
    304 !91 = !DILocalVariable(name: "y", scope: !86, file: !1, line: 26, type: !10)
    305 !92 = !DILocation(line: 26, column: 7, scope: !86)
    306 !93 = !DILocalVariable(name: "N", scope: !86, file: !1, line: 27, type: !9)
    307 !94 = !DILocation(line: 27, column: 8, scope: !86)
    308 !95 = !DILocation(line: 28, column: 38, scope: !86)
    309 !96 = !DILocation(line: 28, column: 41, scope: !86)
    310 !97 = !DILocation(line: 28, column: 44, scope: !86)
    311 !98 = !DILocation(line: 28, column: 51, scope: !86)
    312 !99 = !DILocation(line: 28, column: 54, scope: !86)
    313 !100 = !DILocation(line: 28, column: 57, scope: !86)
    314 !101 = !DILocation(line: 28, column: 47, scope: !86)
    315 !102 = !DILocation(line: 28, column: 3, scope: !103)
    316 !103 = !DILexicalBlockFile(scope: !86, file: !1, discriminator: 1)
    317 !104 = !DILocation(line: 29, column: 3, scope: !86)
    318