1 /* 2 * Copyright (c) 1983, 1993, 2001 3 * The Regents of the University of California. All rights reserved. 4 * 5 * Redistribution and use in source and binary forms, with or without 6 * modification, are permitted provided that the following conditions 7 * are met: 8 * 1. Redistributions of source code must retain the above copyright 9 * notice, this list of conditions and the following disclaimer. 10 * 2. Redistributions in binary form must reproduce the above copyright 11 * notice, this list of conditions and the following disclaimer in the 12 * documentation and/or other materials provided with the distribution. 13 * 3. Neither the name of the University nor the names of its contributors 14 * may be used to endorse or promote products derived from this software 15 * without specific prior written permission. 16 * 17 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND 18 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 19 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 20 * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE 21 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 22 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 23 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 24 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 25 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 26 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 27 * SUCH DAMAGE. 28 */ 29 #include "gprof.h" 30 #include "libiberty.h" 31 #include "search_list.h" 32 #include "source.h" 33 #include "symtab.h" 34 #include "call_graph.h" 35 #include "cg_arcs.h" 36 #include "cg_dfn.h" 37 #include "cg_print.h" 38 #include "utils.h" 39 #include "sym_ids.h" 40 41 static int cmp_topo (const PTR, const PTR); 42 static void propagate_time (Sym *); 43 static void cycle_time (void); 44 static void cycle_link (void); 45 static void inherit_flags (Sym *); 46 static void propagate_flags (Sym **); 47 static int cmp_total (const PTR, const PTR); 48 49 Sym *cycle_header; 50 unsigned int num_cycles; 51 Arc **arcs; 52 unsigned int numarcs; 53 54 /* 55 * Return TRUE iff PARENT has an arc to covers the address 56 * range covered by CHILD. 57 */ 58 Arc * 59 arc_lookup (Sym *parent, Sym *child) 60 { 61 Arc *arc; 62 63 if (!parent || !child) 64 { 65 printf ("[arc_lookup] parent == 0 || child == 0\n"); 66 return 0; 67 } 68 DBG (LOOKUPDEBUG, printf ("[arc_lookup] parent %s child %s\n", 69 parent->name, child->name)); 70 for (arc = parent->cg.children; arc; arc = arc->next_child) 71 { 72 DBG (LOOKUPDEBUG, printf ("[arc_lookup]\t parent %s child %s\n", 73 arc->parent->name, arc->child->name)); 74 if (child->addr >= arc->child->addr 75 && child->end_addr <= arc->child->end_addr) 76 { 77 return arc; 78 } 79 } 80 return 0; 81 } 82 83 84 /* 85 * Add (or just increment) an arc: 86 */ 87 void 88 arc_add (Sym *parent, Sym *child, unsigned long count) 89 { 90 static unsigned int maxarcs = 0; 91 Arc *arc, **newarcs; 92 93 DBG (TALLYDEBUG, printf ("[arc_add] %lu arcs from %s to %s\n", 94 count, parent->name, child->name)); 95 arc = arc_lookup (parent, child); 96 if (arc) 97 { 98 /* 99 * A hit: just increment the count. 100 */ 101 DBG (TALLYDEBUG, printf ("[tally] hit %lu += %lu\n", 102 arc->count, count)); 103 arc->count += count; 104 return; 105 } 106 arc = (Arc *) xmalloc (sizeof (*arc)); 107 memset (arc, 0, sizeof (*arc)); 108 arc->parent = parent; 109 arc->child = child; 110 arc->count = count; 111 112 /* If this isn't an arc for a recursive call to parent, then add it 113 to the array of arcs. */ 114 if (parent != child) 115 { 116 /* If we've exhausted space in our current array, get a new one 117 and copy the contents. We might want to throttle the doubling 118 factor one day. */ 119 if (numarcs == maxarcs) 120 { 121 /* Determine how much space we want to allocate. */ 122 if (maxarcs == 0) 123 maxarcs = 1; 124 maxarcs *= 2; 125 126 /* Allocate the new array. */ 127 newarcs = (Arc **)xmalloc(sizeof (Arc *) * maxarcs); 128 129 /* Copy the old array's contents into the new array. */ 130 memcpy (newarcs, arcs, numarcs * sizeof (Arc *)); 131 132 /* Free up the old array. */ 133 free (arcs); 134 135 /* And make the new array be the current array. */ 136 arcs = newarcs; 137 } 138 139 /* Place this arc in the arc array. */ 140 arcs[numarcs++] = arc; 141 } 142 143 /* prepend this child to the children of this parent: */ 144 arc->next_child = parent->cg.children; 145 parent->cg.children = arc; 146 147 /* prepend this parent to the parents of this child: */ 148 arc->next_parent = child->cg.parents; 149 child->cg.parents = arc; 150 } 151 152 153 static int 154 cmp_topo (const PTR lp, const PTR rp) 155 { 156 const Sym *left = *(const Sym **) lp; 157 const Sym *right = *(const Sym **) rp; 158 159 return left->cg.top_order - right->cg.top_order; 160 } 161 162 163 static void 164 propagate_time (Sym *parent) 165 { 166 Arc *arc; 167 Sym *child; 168 double share, prop_share; 169 170 if (parent->cg.prop.fract == 0.0) 171 { 172 return; 173 } 174 175 /* gather time from children of this parent: */ 176 177 for (arc = parent->cg.children; arc; arc = arc->next_child) 178 { 179 child = arc->child; 180 if (arc->count == 0 || child == parent || child->cg.prop.fract == 0) 181 { 182 continue; 183 } 184 if (child->cg.cyc.head != child) 185 { 186 if (parent->cg.cyc.num == child->cg.cyc.num) 187 { 188 continue; 189 } 190 if (parent->cg.top_order <= child->cg.top_order) 191 { 192 fprintf (stderr, "[propagate] toporder botches\n"); 193 } 194 child = child->cg.cyc.head; 195 } 196 else 197 { 198 if (parent->cg.top_order <= child->cg.top_order) 199 { 200 fprintf (stderr, "[propagate] toporder botches\n"); 201 continue; 202 } 203 } 204 if (child->ncalls == 0) 205 { 206 continue; 207 } 208 209 /* distribute time for this arc: */ 210 arc->time = child->hist.time * (((double) arc->count) 211 / ((double) child->ncalls)); 212 arc->child_time = child->cg.child_time 213 * (((double) arc->count) / ((double) child->ncalls)); 214 share = arc->time + arc->child_time; 215 parent->cg.child_time += share; 216 217 /* (1 - cg.prop.fract) gets lost along the way: */ 218 prop_share = parent->cg.prop.fract * share; 219 220 /* fix things for printing: */ 221 parent->cg.prop.child += prop_share; 222 arc->time *= parent->cg.prop.fract; 223 arc->child_time *= parent->cg.prop.fract; 224 225 /* add this share to the parent's cycle header, if any: */ 226 if (parent->cg.cyc.head != parent) 227 { 228 parent->cg.cyc.head->cg.child_time += share; 229 parent->cg.cyc.head->cg.prop.child += prop_share; 230 } 231 DBG (PROPDEBUG, 232 printf ("[prop_time] child \t"); 233 print_name (child); 234 printf (" with %f %f %lu/%lu\n", child->hist.time, 235 child->cg.child_time, arc->count, child->ncalls); 236 printf ("[prop_time] parent\t"); 237 print_name (parent); 238 printf ("\n[prop_time] share %f\n", share)); 239 } 240 } 241 242 243 /* 244 * Compute the time of a cycle as the sum of the times of all 245 * its members. 246 */ 247 static void 248 cycle_time () 249 { 250 Sym *member, *cyc; 251 252 for (cyc = &cycle_header[1]; cyc <= &cycle_header[num_cycles]; ++cyc) 253 { 254 for (member = cyc->cg.cyc.next; member; member = member->cg.cyc.next) 255 { 256 if (member->cg.prop.fract == 0.0) 257 { 258 /* 259 * All members have the same propfraction except those 260 * that were excluded with -E. 261 */ 262 continue; 263 } 264 cyc->hist.time += member->hist.time; 265 } 266 cyc->cg.prop.self = cyc->cg.prop.fract * cyc->hist.time; 267 } 268 } 269 270 271 static void 272 cycle_link () 273 { 274 Sym *sym, *cyc, *member; 275 Arc *arc; 276 int num; 277 278 /* count the number of cycles, and initialize the cycle lists: */ 279 280 num_cycles = 0; 281 for (sym = symtab.base; sym < symtab.limit; ++sym) 282 { 283 /* this is how you find unattached cycles: */ 284 if (sym->cg.cyc.head == sym && sym->cg.cyc.next) 285 { 286 ++num_cycles; 287 } 288 } 289 290 /* 291 * cycle_header is indexed by cycle number: i.e. it is origin 1, 292 * not origin 0. 293 */ 294 cycle_header = (Sym *) xmalloc ((num_cycles + 1) * sizeof (Sym)); 295 296 /* 297 * Now link cycles to true cycle-heads, number them, accumulate 298 * the data for the cycle. 299 */ 300 num = 0; 301 cyc = cycle_header; 302 for (sym = symtab.base; sym < symtab.limit; ++sym) 303 { 304 if (!(sym->cg.cyc.head == sym && sym->cg.cyc.next != 0)) 305 { 306 continue; 307 } 308 ++num; 309 ++cyc; 310 sym_init (cyc); 311 cyc->cg.print_flag = TRUE; /* should this be printed? */ 312 cyc->cg.top_order = DFN_NAN; /* graph call chain top-sort order */ 313 cyc->cg.cyc.num = num; /* internal number of cycle on */ 314 cyc->cg.cyc.head = cyc; /* pointer to head of cycle */ 315 cyc->cg.cyc.next = sym; /* pointer to next member of cycle */ 316 DBG (CYCLEDEBUG, printf ("[cycle_link] "); 317 print_name (sym); 318 printf (" is the head of cycle %d\n", num)); 319 320 /* link members to cycle header: */ 321 for (member = sym; member; member = member->cg.cyc.next) 322 { 323 member->cg.cyc.num = num; 324 member->cg.cyc.head = cyc; 325 } 326 327 /* 328 * Count calls from outside the cycle and those among cycle 329 * members: 330 */ 331 for (member = sym; member; member = member->cg.cyc.next) 332 { 333 for (arc = member->cg.parents; arc; arc = arc->next_parent) 334 { 335 if (arc->parent == member) 336 { 337 continue; 338 } 339 if (arc->parent->cg.cyc.num == num) 340 { 341 cyc->cg.self_calls += arc->count; 342 } 343 else 344 { 345 cyc->ncalls += arc->count; 346 } 347 } 348 } 349 } 350 } 351 352 353 /* 354 * Check if any parent of this child (or outside parents of this 355 * cycle) have their print flags on and set the print flag of the 356 * child (cycle) appropriately. Similarly, deal with propagation 357 * fractions from parents. 358 */ 359 static void 360 inherit_flags (Sym *child) 361 { 362 Sym *head, *parent, *member; 363 Arc *arc; 364 365 head = child->cg.cyc.head; 366 if (child == head) 367 { 368 /* just a regular child, check its parents: */ 369 child->cg.print_flag = FALSE; 370 child->cg.prop.fract = 0.0; 371 for (arc = child->cg.parents; arc; arc = arc->next_parent) 372 { 373 parent = arc->parent; 374 if (child == parent) 375 { 376 continue; 377 } 378 child->cg.print_flag |= parent->cg.print_flag; 379 /* 380 * If the child was never actually called (e.g., this arc 381 * is static (and all others are, too)) no time propagates 382 * along this arc. 383 */ 384 if (child->ncalls != 0) 385 { 386 child->cg.prop.fract += parent->cg.prop.fract 387 * (((double) arc->count) / ((double) child->ncalls)); 388 } 389 } 390 } 391 else 392 { 393 /* 394 * Its a member of a cycle, look at all parents from outside 395 * the cycle. 396 */ 397 head->cg.print_flag = FALSE; 398 head->cg.prop.fract = 0.0; 399 for (member = head->cg.cyc.next; member; member = member->cg.cyc.next) 400 { 401 for (arc = member->cg.parents; arc; arc = arc->next_parent) 402 { 403 if (arc->parent->cg.cyc.head == head) 404 { 405 continue; 406 } 407 parent = arc->parent; 408 head->cg.print_flag |= parent->cg.print_flag; 409 /* 410 * If the cycle was never actually called (e.g. this 411 * arc is static (and all others are, too)) no time 412 * propagates along this arc. 413 */ 414 if (head->ncalls != 0) 415 { 416 head->cg.prop.fract += parent->cg.prop.fract 417 * (((double) arc->count) / ((double) head->ncalls)); 418 } 419 } 420 } 421 for (member = head; member; member = member->cg.cyc.next) 422 { 423 member->cg.print_flag = head->cg.print_flag; 424 member->cg.prop.fract = head->cg.prop.fract; 425 } 426 } 427 } 428 429 430 /* 431 * In one top-to-bottom pass over the topologically sorted symbols 432 * propagate: 433 * cg.print_flag as the union of parents' print_flags 434 * propfraction as the sum of fractional parents' propfractions 435 * and while we're here, sum time for functions. 436 */ 437 static void 438 propagate_flags (Sym **symbols) 439 { 440 int sym_index; 441 Sym *old_head, *child; 442 443 old_head = 0; 444 for (sym_index = symtab.len - 1; sym_index >= 0; --sym_index) 445 { 446 child = symbols[sym_index]; 447 /* 448 * If we haven't done this function or cycle, inherit things 449 * from parent. This way, we are linear in the number of arcs 450 * since we do all members of a cycle (and the cycle itself) 451 * as we hit the first member of the cycle. 452 */ 453 if (child->cg.cyc.head != old_head) 454 { 455 old_head = child->cg.cyc.head; 456 inherit_flags (child); 457 } 458 DBG (PROPDEBUG, 459 printf ("[prop_flags] "); 460 print_name (child); 461 printf ("inherits print-flag %d and prop-fract %f\n", 462 child->cg.print_flag, child->cg.prop.fract)); 463 if (!child->cg.print_flag) 464 { 465 /* 466 * Printflag is off. It gets turned on by being in the 467 * INCL_GRAPH table, or there being an empty INCL_GRAPH 468 * table and not being in the EXCL_GRAPH table. 469 */ 470 if (sym_lookup (&syms[INCL_GRAPH], child->addr) 471 || (syms[INCL_GRAPH].len == 0 472 && !sym_lookup (&syms[EXCL_GRAPH], child->addr))) 473 { 474 child->cg.print_flag = TRUE; 475 } 476 } 477 else 478 { 479 /* 480 * This function has printing parents: maybe someone wants 481 * to shut it up by putting it in the EXCL_GRAPH table. 482 * (But favor INCL_GRAPH over EXCL_GRAPH.) 483 */ 484 if (!sym_lookup (&syms[INCL_GRAPH], child->addr) 485 && sym_lookup (&syms[EXCL_GRAPH], child->addr)) 486 { 487 child->cg.print_flag = FALSE; 488 } 489 } 490 if (child->cg.prop.fract == 0.0) 491 { 492 /* 493 * No parents to pass time to. Collect time from children 494 * if its in the INCL_TIME table, or there is an empty 495 * INCL_TIME table and its not in the EXCL_TIME table. 496 */ 497 if (sym_lookup (&syms[INCL_TIME], child->addr) 498 || (syms[INCL_TIME].len == 0 499 && !sym_lookup (&syms[EXCL_TIME], child->addr))) 500 { 501 child->cg.prop.fract = 1.0; 502 } 503 } 504 else 505 { 506 /* 507 * It has parents to pass time to, but maybe someone wants 508 * to shut it up by puttting it in the EXCL_TIME table. 509 * (But favor being in INCL_TIME tabe over being in 510 * EXCL_TIME table.) 511 */ 512 if (!sym_lookup (&syms[INCL_TIME], child->addr) 513 && sym_lookup (&syms[EXCL_TIME], child->addr)) 514 { 515 child->cg.prop.fract = 0.0; 516 } 517 } 518 child->cg.prop.self = child->hist.time * child->cg.prop.fract; 519 print_time += child->cg.prop.self; 520 DBG (PROPDEBUG, 521 printf ("[prop_flags] "); 522 print_name (child); 523 printf (" ends up with printflag %d and prop-fract %f\n", 524 child->cg.print_flag, child->cg.prop.fract); 525 printf ("[prop_flags] time %f propself %f print_time %f\n", 526 child->hist.time, child->cg.prop.self, print_time)); 527 } 528 } 529 530 531 /* 532 * Compare by decreasing propagated time. If times are equal, but one 533 * is a cycle header, say that's first (e.g. less, i.e. -1). If one's 534 * name doesn't have an underscore and the other does, say that one is 535 * first. All else being equal, compare by names. 536 */ 537 static int 538 cmp_total (const PTR lp, const PTR rp) 539 { 540 const Sym *left = *(const Sym **) lp; 541 const Sym *right = *(const Sym **) rp; 542 double diff; 543 544 diff = (left->cg.prop.self + left->cg.prop.child) 545 - (right->cg.prop.self + right->cg.prop.child); 546 if (diff < 0.0) 547 { 548 return 1; 549 } 550 if (diff > 0.0) 551 { 552 return -1; 553 } 554 if (!left->name && left->cg.cyc.num != 0) 555 { 556 return -1; 557 } 558 if (!right->name && right->cg.cyc.num != 0) 559 { 560 return 1; 561 } 562 if (!left->name) 563 { 564 return -1; 565 } 566 if (!right->name) 567 { 568 return 1; 569 } 570 if (left->name[0] != '_' && right->name[0] == '_') 571 { 572 return -1; 573 } 574 if (left->name[0] == '_' && right->name[0] != '_') 575 { 576 return 1; 577 } 578 if (left->ncalls > right->ncalls) 579 { 580 return -1; 581 } 582 if (left->ncalls < right->ncalls) 583 { 584 return 1; 585 } 586 return strcmp (left->name, right->name); 587 } 588 589 590 /* Topologically sort the graph (collapsing cycles), and propagates 591 time bottom up and flags top down. */ 592 593 Sym ** 594 cg_assemble (void) 595 { 596 Sym *parent, **time_sorted_syms, **top_sorted_syms; 597 unsigned int sym_index; 598 Arc *arc; 599 600 /* Initialize various things: 601 Zero out child times. 602 Count self-recursive calls. 603 Indicate that nothing is on cycles. */ 604 for (parent = symtab.base; parent < symtab.limit; parent++) 605 { 606 parent->cg.child_time = 0.0; 607 arc = arc_lookup (parent, parent); 608 if (arc && parent == arc->child) 609 { 610 parent->ncalls -= arc->count; 611 parent->cg.self_calls = arc->count; 612 } 613 else 614 { 615 parent->cg.self_calls = 0; 616 } 617 parent->cg.prop.fract = 0.0; 618 parent->cg.prop.self = 0.0; 619 parent->cg.prop.child = 0.0; 620 parent->cg.print_flag = FALSE; 621 parent->cg.top_order = DFN_NAN; 622 parent->cg.cyc.num = 0; 623 parent->cg.cyc.head = parent; 624 parent->cg.cyc.next = 0; 625 if (ignore_direct_calls) 626 find_call (parent, parent->addr, (parent + 1)->addr); 627 } 628 629 /* Topologically order things. If any node is unnumbered, number 630 it and any of its descendents. */ 631 for (parent = symtab.base; parent < symtab.limit; parent++) 632 { 633 if (parent->cg.top_order == DFN_NAN) 634 cg_dfn (parent); 635 } 636 637 /* Link together nodes on the same cycle. */ 638 cycle_link (); 639 640 /* Sort the symbol table in reverse topological order. */ 641 top_sorted_syms = (Sym **) xmalloc (symtab.len * sizeof (Sym *)); 642 for (sym_index = 0; sym_index < symtab.len; ++sym_index) 643 top_sorted_syms[sym_index] = &symtab.base[sym_index]; 644 645 qsort (top_sorted_syms, symtab.len, sizeof (Sym *), cmp_topo); 646 DBG (DFNDEBUG, 647 printf ("[cg_assemble] topological sort listing\n"); 648 for (sym_index = 0; sym_index < symtab.len; ++sym_index) 649 { 650 printf ("[cg_assemble] "); 651 printf ("%d:", top_sorted_syms[sym_index]->cg.top_order); 652 print_name (top_sorted_syms[sym_index]); 653 printf ("\n"); 654 } 655 ); 656 657 /* Starting from the topological top, propagate print flags to 658 children. also, calculate propagation fractions. this happens 659 before time propagation since time propagation uses the 660 fractions. */ 661 propagate_flags (top_sorted_syms); 662 663 /* Starting from the topological bottom, propogate children times 664 up to parents. */ 665 cycle_time (); 666 for (sym_index = 0; sym_index < symtab.len; ++sym_index) 667 propagate_time (top_sorted_syms[sym_index]); 668 669 free (top_sorted_syms); 670 671 /* Now, sort by CG.PROP.SELF + CG.PROP.CHILD. Sorting both the regular 672 function names and cycle headers. */ 673 time_sorted_syms = (Sym **) xmalloc ((symtab.len + num_cycles) * sizeof (Sym *)); 674 for (sym_index = 0; sym_index < symtab.len; sym_index++) 675 time_sorted_syms[sym_index] = &symtab.base[sym_index]; 676 677 for (sym_index = 1; sym_index <= num_cycles; sym_index++) 678 time_sorted_syms[symtab.len + sym_index - 1] = &cycle_header[sym_index]; 679 680 qsort (time_sorted_syms, symtab.len + num_cycles, sizeof (Sym *), 681 cmp_total); 682 683 for (sym_index = 0; sym_index < symtab.len + num_cycles; sym_index++) 684 time_sorted_syms[sym_index]->cg.index = sym_index + 1; 685 686 return time_sorted_syms; 687 } 688