2 * Copyright (c) 1983, 2001 Regents of the University of California.
5 * Redistribution and use in source and binary forms are permitted
6 * provided that: (1) source distributions retain this entire copyright
7 * notice and comment, and (2) distributions including binaries display
8 * the following acknowledgement: ``This product includes software
9 * developed by the University of California, Berkeley and its contributors''
10 * in the documentation or other materials provided with the distribution
11 * and in all advertising materials mentioning features or use of this
12 * software. Neither the name of the University nor the names of its
13 * contributors may be used to endorse or promote products derived
14 * from this software without specific prior written permission.
15 * THIS SOFTWARE IS PROVIDED ``AS IS'' AND WITHOUT ANY EXPRESS OR
16 * IMPLIED WARRANTIES, INCLUDING, WITHOUT LIMITATION, THE IMPLIED
17 * WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE.
19 #include "libiberty.h"
21 #include "call_graph.h"
/* Number of cycles found in the call graph.  cycle_header is allocated
   with num_cycles + 1 entries and is walked from index 1 through
   num_cycles inclusive.  */
unsigned int num_cycles;
34 * Return TRUE iff PARENT has an arc to covers the address
35 * range covered by CHILD.
38 DEFUN (arc_lookup
, (parent
, child
), Sym
* parent AND Sym
* child
)
42 if (!parent
|| !child
)
44 printf ("[arc_lookup] parent == 0 || child == 0\n");
47 DBG (LOOKUPDEBUG
, printf ("[arc_lookup] parent %s child %s\n",
48 parent
->name
, child
->name
));
49 for (arc
= parent
->cg
.children
; arc
; arc
= arc
->next_child
)
51 DBG (LOOKUPDEBUG
, printf ("[arc_lookup]\t parent %s child %s\n",
52 arc
->parent
->name
, arc
->child
->name
));
53 if (child
->addr
>= arc
->child
->addr
54 && child
->end_addr
<= arc
->child
->end_addr
)
64 * Add (or just increment) an arc:
67 DEFUN (arc_add
, (parent
, child
, count
),
68 Sym
* parent AND Sym
* child AND
unsigned long count
)
70 static unsigned int maxarcs
= 0;
73 DBG (TALLYDEBUG
, printf ("[arc_add] %lu arcs from %s to %s\n",
74 count
, parent
->name
, child
->name
));
75 arc
= arc_lookup (parent
, child
);
79 * A hit: just increment the count.
81 DBG (TALLYDEBUG
, printf ("[tally] hit %lu += %lu\n",
86 arc
= (Arc
*) xmalloc (sizeof (*arc
));
87 memset (arc
, 0, sizeof (*arc
));
92 /* If this isn't an arc for a recursive call to parent, then add it
93 to the array of arcs. */
96 /* If we've exhausted space in our current array, get a new one
97 and copy the contents. We might want to throttle the doubling
99 if (numarcs
== maxarcs
)
101 /* Determine how much space we want to allocate. */
106 /* Allocate the new array. */
107 newarcs
= (Arc
**)xmalloc(sizeof (Arc
*) * maxarcs
);
109 /* Copy the old array's contents into the new array. */
110 memcpy (newarcs
, arcs
, numarcs
* sizeof (Arc
*));
112 /* Free up the old array. */
115 /* And make the new array be the current array. */
119 /* Place this arc in the arc array. */
120 arcs
[numarcs
++] = arc
;
123 /* prepend this child to the children of this parent: */
124 arc
->next_child
= parent
->cg
.children
;
125 parent
->cg
.children
= arc
;
127 /* prepend this parent to the parents of this child: */
128 arc
->next_parent
= child
->cg
.parents
;
129 child
->cg
.parents
= arc
;
134 DEFUN (cmp_topo
, (lp
, rp
), const PTR lp AND
const PTR rp
)
136 const Sym
*left
= *(const Sym
**) lp
;
137 const Sym
*right
= *(const Sym
**) rp
;
139 return left
->cg
.top_order
- right
->cg
.top_order
;
144 DEFUN (propagate_time
, (parent
), Sym
* parent
)
148 double share
, prop_share
;
150 if (parent
->cg
.prop
.fract
== 0.0)
155 /* gather time from children of this parent: */
157 for (arc
= parent
->cg
.children
; arc
; arc
= arc
->next_child
)
160 if (arc
->count
== 0 || child
== parent
|| child
->cg
.prop
.fract
== 0)
164 if (child
->cg
.cyc
.head
!= child
)
166 if (parent
->cg
.cyc
.num
== child
->cg
.cyc
.num
)
170 if (parent
->cg
.top_order
<= child
->cg
.top_order
)
172 fprintf (stderr
, "[propagate] toporder botches\n");
174 child
= child
->cg
.cyc
.head
;
178 if (parent
->cg
.top_order
<= child
->cg
.top_order
)
180 fprintf (stderr
, "[propagate] toporder botches\n");
184 if (child
->ncalls
== 0)
189 /* distribute time for this arc: */
190 arc
->time
= child
->hist
.time
* (((double) arc
->count
)
191 / ((double) child
->ncalls
));
192 arc
->child_time
= child
->cg
.child_time
193 * (((double) arc
->count
) / ((double) child
->ncalls
));
194 share
= arc
->time
+ arc
->child_time
;
195 parent
->cg
.child_time
+= share
;
197 /* (1 - cg.prop.fract) gets lost along the way: */
198 prop_share
= parent
->cg
.prop
.fract
* share
;
200 /* fix things for printing: */
201 parent
->cg
.prop
.child
+= prop_share
;
202 arc
->time
*= parent
->cg
.prop
.fract
;
203 arc
->child_time
*= parent
->cg
.prop
.fract
;
205 /* add this share to the parent's cycle header, if any: */
206 if (parent
->cg
.cyc
.head
!= parent
)
208 parent
->cg
.cyc
.head
->cg
.child_time
+= share
;
209 parent
->cg
.cyc
.head
->cg
.prop
.child
+= prop_share
;
212 printf ("[prop_time] child \t");
214 printf (" with %f %f %lu/%lu\n", child
->hist
.time
,
215 child
->cg
.child_time
, arc
->count
, child
->ncalls
);
216 printf ("[prop_time] parent\t");
218 printf ("\n[prop_time] share %f\n", share
));
224 * Compute the time of a cycle as the sum of the times of all
228 DEFUN_VOID (cycle_time
)
232 for (cyc
= &cycle_header
[1]; cyc
<= &cycle_header
[num_cycles
]; ++cyc
)
234 for (member
= cyc
->cg
.cyc
.next
; member
; member
= member
->cg
.cyc
.next
)
236 if (member
->cg
.prop
.fract
== 0.0)
239 * All members have the same propfraction except those
240 * that were excluded with -E.
244 cyc
->hist
.time
+= member
->hist
.time
;
246 cyc
->cg
.prop
.self
= cyc
->cg
.prop
.fract
* cyc
->hist
.time
;
252 DEFUN_VOID (cycle_link
)
254 Sym
*sym
, *cyc
, *member
;
258 /* count the number of cycles, and initialize the cycle lists: */
261 for (sym
= symtab
.base
; sym
< symtab
.limit
; ++sym
)
263 /* this is how you find unattached cycles: */
264 if (sym
->cg
.cyc
.head
== sym
&& sym
->cg
.cyc
.next
)
271 * cycle_header is indexed by cycle number: i.e. it is origin 1,
274 cycle_header
= (Sym
*) xmalloc ((num_cycles
+ 1) * sizeof (Sym
));
277 * Now link cycles to true cycle-heads, number them, accumulate
278 * the data for the cycle.
282 for (sym
= symtab
.base
; sym
< symtab
.limit
; ++sym
)
284 if (!(sym
->cg
.cyc
.head
== sym
&& sym
->cg
.cyc
.next
!= 0))
291 cyc
->cg
.print_flag
= TRUE
; /* should this be printed? */
292 cyc
->cg
.top_order
= DFN_NAN
; /* graph call chain top-sort order */
293 cyc
->cg
.cyc
.num
= num
; /* internal number of cycle on */
294 cyc
->cg
.cyc
.head
= cyc
; /* pointer to head of cycle */
295 cyc
->cg
.cyc
.next
= sym
; /* pointer to next member of cycle */
296 DBG (CYCLEDEBUG
, printf ("[cycle_link] ");
298 printf (" is the head of cycle %d\n", num
));
300 /* link members to cycle header: */
301 for (member
= sym
; member
; member
= member
->cg
.cyc
.next
)
303 member
->cg
.cyc
.num
= num
;
304 member
->cg
.cyc
.head
= cyc
;
308 * Count calls from outside the cycle and those among cycle
311 for (member
= sym
; member
; member
= member
->cg
.cyc
.next
)
313 for (arc
= member
->cg
.parents
; arc
; arc
= arc
->next_parent
)
315 if (arc
->parent
== member
)
319 if (arc
->parent
->cg
.cyc
.num
== num
)
321 cyc
->cg
.self_calls
+= arc
->count
;
325 cyc
->ncalls
+= arc
->count
;
334 * Check if any parent of this child (or outside parents of this
335 * cycle) have their print flags on and set the print flag of the
336 * child (cycle) appropriately. Similarly, deal with propagation
337 * fractions from parents.
340 DEFUN (inherit_flags
, (child
), Sym
* child
)
342 Sym
*head
, *parent
, *member
;
345 head
= child
->cg
.cyc
.head
;
348 /* just a regular child, check its parents: */
349 child
->cg
.print_flag
= FALSE
;
350 child
->cg
.prop
.fract
= 0.0;
351 for (arc
= child
->cg
.parents
; arc
; arc
= arc
->next_parent
)
353 parent
= arc
->parent
;
358 child
->cg
.print_flag
|= parent
->cg
.print_flag
;
360 * If the child was never actually called (e.g., this arc
361 * is static (and all others are, too)) no time propagates
364 if (child
->ncalls
!= 0)
366 child
->cg
.prop
.fract
+= parent
->cg
.prop
.fract
367 * (((double) arc
->count
) / ((double) child
->ncalls
));
374 * Its a member of a cycle, look at all parents from outside
377 head
->cg
.print_flag
= FALSE
;
378 head
->cg
.prop
.fract
= 0.0;
379 for (member
= head
->cg
.cyc
.next
; member
; member
= member
->cg
.cyc
.next
)
381 for (arc
= member
->cg
.parents
; arc
; arc
= arc
->next_parent
)
383 if (arc
->parent
->cg
.cyc
.head
== head
)
387 parent
= arc
->parent
;
388 head
->cg
.print_flag
|= parent
->cg
.print_flag
;
390 * If the cycle was never actually called (e.g. this
391 * arc is static (and all others are, too)) no time
392 * propagates along this arc.
394 if (head
->ncalls
!= 0)
396 head
->cg
.prop
.fract
+= parent
->cg
.prop
.fract
397 * (((double) arc
->count
) / ((double) head
->ncalls
));
401 for (member
= head
; member
; member
= member
->cg
.cyc
.next
)
403 member
->cg
.print_flag
= head
->cg
.print_flag
;
404 member
->cg
.prop
.fract
= head
->cg
.prop
.fract
;
411 * In one top-to-bottom pass over the topologically sorted symbols
413 * cg.print_flag as the union of parents' print_flags
414 * propfraction as the sum of fractional parents' propfractions
415 * and while we're here, sum time for functions.
418 DEFUN (propagate_flags
, (symbols
), Sym
** symbols
)
421 Sym
*old_head
, *child
;
424 for (index
= symtab
.len
- 1; index
>= 0; --index
)
426 child
= symbols
[index
];
428 * If we haven't done this function or cycle, inherit things
429 * from parent. This way, we are linear in the number of arcs
430 * since we do all members of a cycle (and the cycle itself)
431 * as we hit the first member of the cycle.
433 if (child
->cg
.cyc
.head
!= old_head
)
435 old_head
= child
->cg
.cyc
.head
;
436 inherit_flags (child
);
439 printf ("[prop_flags] ");
441 printf ("inherits print-flag %d and prop-fract %f\n",
442 child
->cg
.print_flag
, child
->cg
.prop
.fract
));
443 if (!child
->cg
.print_flag
)
446 * Printflag is off. It gets turned on by being in the
447 * INCL_GRAPH table, or there being an empty INCL_GRAPH
448 * table and not being in the EXCL_GRAPH table.
450 if (sym_lookup (&syms
[INCL_GRAPH
], child
->addr
)
451 || (syms
[INCL_GRAPH
].len
== 0
452 && !sym_lookup (&syms
[EXCL_GRAPH
], child
->addr
)))
454 child
->cg
.print_flag
= TRUE
;
460 * This function has printing parents: maybe someone wants
461 * to shut it up by putting it in the EXCL_GRAPH table.
462 * (But favor INCL_GRAPH over EXCL_GRAPH.)
464 if (!sym_lookup (&syms
[INCL_GRAPH
], child
->addr
)
465 && sym_lookup (&syms
[EXCL_GRAPH
], child
->addr
))
467 child
->cg
.print_flag
= FALSE
;
470 if (child
->cg
.prop
.fract
== 0.0)
473 * No parents to pass time to. Collect time from children
474 * if its in the INCL_TIME table, or there is an empty
475 * INCL_TIME table and its not in the EXCL_TIME table.
477 if (sym_lookup (&syms
[INCL_TIME
], child
->addr
)
478 || (syms
[INCL_TIME
].len
== 0
479 && !sym_lookup (&syms
[EXCL_TIME
], child
->addr
)))
481 child
->cg
.prop
.fract
= 1.0;
487 * It has parents to pass time to, but maybe someone wants
488 * to shut it up by puttting it in the EXCL_TIME table.
489 * (But favor being in INCL_TIME tabe over being in
492 if (!sym_lookup (&syms
[INCL_TIME
], child
->addr
)
493 && sym_lookup (&syms
[EXCL_TIME
], child
->addr
))
495 child
->cg
.prop
.fract
= 0.0;
498 child
->cg
.prop
.self
= child
->hist
.time
* child
->cg
.prop
.fract
;
499 print_time
+= child
->cg
.prop
.self
;
501 printf ("[prop_flags] ");
503 printf (" ends up with printflag %d and prop-fract %f\n",
504 child
->cg
.print_flag
, child
->cg
.prop
.fract
);
505 printf ("[prop_flags] time %f propself %f print_time %f\n",
506 child
->hist
.time
, child
->cg
.prop
.self
, print_time
));
512 * Compare by decreasing propagated time. If times are equal, but one
513 * is a cycle header, say that's first (e.g. less, i.e. -1). If one's
514 * name doesn't have an underscore and the other does, say that one is
515 * first. All else being equal, compare by names.
518 DEFUN (cmp_total
, (lp
, rp
), const PTR lp AND
const PTR rp
)
520 const Sym
*left
= *(const Sym
**) lp
;
521 const Sym
*right
= *(const Sym
**) rp
;
524 diff
= (left
->cg
.prop
.self
+ left
->cg
.prop
.child
)
525 - (right
->cg
.prop
.self
+ right
->cg
.prop
.child
);
534 if (!left
->name
&& left
->cg
.cyc
.num
!= 0)
538 if (!right
->name
&& right
->cg
.cyc
.num
!= 0)
550 if (left
->name
[0] != '_' && right
->name
[0] == '_')
554 if (left
->name
[0] == '_' && right
->name
[0] != '_')
558 if (left
->ncalls
> right
->ncalls
)
562 if (left
->ncalls
< right
->ncalls
)
566 return strcmp (left
->name
, right
->name
);
571 * Topologically sort the graph (collapsing cycles), and propagates
572 * time bottom up and flags top down.
575 DEFUN_VOID (cg_assemble
)
577 Sym
*parent
, **time_sorted_syms
, **top_sorted_syms
;
582 * initialize various things:
583 * zero out child times.
584 * count self-recursive calls.
585 * indicate that nothing is on cycles.
587 for (parent
= symtab
.base
; parent
< symtab
.limit
; parent
++)
589 parent
->cg
.child_time
= 0.0;
590 arc
= arc_lookup (parent
, parent
);
591 if (arc
&& parent
== arc
->child
)
593 parent
->ncalls
-= arc
->count
;
594 parent
->cg
.self_calls
= arc
->count
;
598 parent
->cg
.self_calls
= 0;
600 parent
->cg
.prop
.fract
= 0.0;
601 parent
->cg
.prop
.self
= 0.0;
602 parent
->cg
.prop
.child
= 0.0;
603 parent
->cg
.print_flag
= FALSE
;
604 parent
->cg
.top_order
= DFN_NAN
;
605 parent
->cg
.cyc
.num
= 0;
606 parent
->cg
.cyc
.head
= parent
;
607 parent
->cg
.cyc
.next
= 0;
608 if (ignore_direct_calls
)
610 find_call (parent
, parent
->addr
, (parent
+ 1)->addr
);
614 * Topologically order things. If any node is unnumbered, number
615 * it and any of its descendents.
617 for (parent
= symtab
.base
; parent
< symtab
.limit
; parent
++)
619 if (parent
->cg
.top_order
== DFN_NAN
)
625 /* link together nodes on the same cycle: */
628 /* sort the symbol table in reverse topological order: */
629 top_sorted_syms
= (Sym
**) xmalloc (symtab
.len
* sizeof (Sym
*));
630 for (index
= 0; index
< symtab
.len
; ++index
)
632 top_sorted_syms
[index
] = &symtab
.base
[index
];
634 qsort (top_sorted_syms
, symtab
.len
, sizeof (Sym
*), cmp_topo
);
636 printf ("[cg_assemble] topological sort listing\n");
637 for (index
= 0; index
< symtab
.len
; ++index
)
639 printf ("[cg_assemble] ");
640 printf ("%d:", top_sorted_syms
[index
]->cg
.top_order
);
641 print_name (top_sorted_syms
[index
]);
646 * Starting from the topological top, propagate print flags to
647 * children. also, calculate propagation fractions. this happens
648 * before time propagation since time propagation uses the
651 propagate_flags (top_sorted_syms
);
654 * Starting from the topological bottom, propogate children times
658 for (index
= 0; index
< symtab
.len
; ++index
)
660 propagate_time (top_sorted_syms
[index
]);
663 free (top_sorted_syms
);
666 * Now, sort by CG.PROP.SELF + CG.PROP.CHILD. Sorting both the regular
667 * function names and cycle headers.
669 time_sorted_syms
= (Sym
**) xmalloc ((symtab
.len
+ num_cycles
) * sizeof (Sym
*));
670 for (index
= 0; index
< symtab
.len
; index
++)
672 time_sorted_syms
[index
] = &symtab
.base
[index
];
674 for (index
= 1; index
<= num_cycles
; index
++)
676 time_sorted_syms
[symtab
.len
+ index
- 1] = &cycle_header
[index
];
678 qsort (time_sorted_syms
, symtab
.len
+ num_cycles
, sizeof (Sym
*),
680 for (index
= 0; index
< symtab
.len
+ num_cycles
; index
++)
682 time_sorted_syms
[index
]->cg
.index
= index
+ 1;
684 return time_sorted_syms
;