1 """Class for printing reports on profiled python code."""
3 # Class for printing reports on profiled python code. rev 1.0 4/1/94
5 # Based on prior profile module by Sjoerd Mullender...
6 # which was hacked somewhat by: Guido van Rossum
8 # see profile.doc and profile.py for more info.
10 # Copyright 1994, by InfoSeek Corporation, all rights reserved.
11 # Written by James Roskind
13 # Permission to use, copy, modify, and distribute this Python software
14 # and its associated documentation for any purpose (subject to the
15 # restriction in the following sentence) without fee is hereby granted,
16 # provided that the above copyright notice appears in all copies, and
17 # that both that copyright notice and this permission notice appear in
18 # supporting documentation, and that the name of InfoSeek not be used in
19 # advertising or publicity pertaining to distribution of the software
20 # without specific, written prior permission. This permission is
21 # explicitly restricted to the copying and modification of the software
22 # to remain in Python, compiled Python, or other languages (such as C)
23 # wherein the modified or derived code is exclusively imported into a
26 # INFOSEEK CORPORATION DISCLAIMS ALL WARRANTIES WITH REGARD TO THIS
27 # SOFTWARE, INCLUDING ALL IMPLIED WARRANTIES OF MERCHANTABILITY AND
28 # FITNESS. IN NO EVENT SHALL INFOSEEK CORPORATION BE LIABLE FOR ANY
29 # SPECIAL, INDIRECT OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES WHATSOEVER
30 # RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN ACTION OF
31 # CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF OR IN
32 # CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE.
43 """This class is used for creating reports from data generated by the
44 Profile class. It is a "friend" of that class, and imports data either
45 by direct access to members of Profile class, or by reading in a dictionary
46 that was emitted (via marshal) from the Profile class.
48 The big change from the previous Profiler (in terms of raw functionality)
49 is that an "add()" method has been provided to combine Stats from
50 several distinct profile runs. Both the constructor and the add()
51 method now take arbitrarily many file names as arguments.
53 All the print methods now take an argument that indicates how many lines
54 to print. If the arg is a floating point number between 0 and 1.0, then
55 it is taken as a decimal percentage of the available lines to be printed
56 (e.g., .1 means print 10% of all available lines). If it is an integer,
it is taken to mean the number of lines of data that you wish to have
printed.
60 The sort_stats() method now processes some additional options (i.e., in
61 addition to the old -1, 0, 1, or 2). It takes an arbitrary number of quoted
62 strings to select the sort order. For example sort_stats('time', 'name')
63 sorts on the major key of "internal function time", and on the minor
64 key of 'the name of the function'. Look at the two tables in sort_stats()
65 and get_sort_arg_defs(self) for more examples.
67 All methods now return "self", so you can string together commands like:
68 Stats('foo', 'goo').strip_dirs().sort_stats('calls').\
69 print_stats(5).print_callers(5)
72 def __init__(self
, *args
):
82 self
.all_callees
= None # calc only if needed
91 self
.sort_arg_dict
= {}
95 self
.get_top_level_stats()
99 print "Invalid timing data",
100 if self
.files
: print self
.files
[-1],
103 def load_stats(self
, arg
):
104 if not arg
: self
.stats
= {}
105 elif type(arg
) == type(""):
107 self
.stats
= marshal
.load(f
)
110 file_stats
= os
.stat(arg
)
111 arg
= time
.ctime(file_stats
.st_mtime
) + " " + arg
112 except: # in case this is not unix
115 elif hasattr(arg
, 'create_stats'):
117 self
.stats
= arg
.stats
120 raise TypeError, "Cannot create or construct a %r object from '%r''" % (
124 def get_top_level_stats(self
):
125 for func
, (cc
, nc
, tt
, ct
, callers
) in self
.stats
.items():
126 self
.total_calls
+= nc
127 self
.prim_calls
+= cc
129 if callers
.has_key(("jprofile", 0, "profiler")):
130 self
.top_level
[func
] = None
131 if len(func_std_string(func
)) > self
.max_name_len
:
132 self
.max_name_len
= len(func_std_string(func
))
134 def add(self
, *arg_list
):
135 if not arg_list
: return self
136 if len(arg_list
) > 1: self
.add(*arg_list
[1:])
138 if type(self
) != type(other
) or self
.__class
__ != other
.__class
__:
140 self
.files
+= other
.files
141 self
.total_calls
+= other
.total_calls
142 self
.prim_calls
+= other
.prim_calls
143 self
.total_tt
+= other
.total_tt
144 for func
in other
.top_level
:
145 self
.top_level
[func
] = None
147 if self
.max_name_len
< other
.max_name_len
:
148 self
.max_name_len
= other
.max_name_len
152 for func
, stat
in other
.stats
.iteritems():
153 if func
in self
.stats
:
154 old_func_stat
= self
.stats
[func
]
156 old_func_stat
= (0, 0, 0, 0, {},)
157 self
.stats
[func
] = add_func_stats(old_func_stat
, stat
)
160 def dump_stats(self
, filename
):
161 """Write the profile data to a file we know how to load back."""
162 f
= file(filename
, 'wb')
164 marshal
.dump(self
.stats
, f
)
168 # list the tuple indices and directions for sorting,
169 # along with some printable description
170 sort_arg_dict_default
= {
171 "calls" : (((1,-1), ), "call count"),
172 "cumulative": (((3,-1), ), "cumulative time"),
173 "file" : (((4, 1), ), "file name"),
174 "line" : (((5, 1), ), "line number"),
175 "module" : (((4, 1), ), "file name"),
176 "name" : (((6, 1), ), "function name"),
177 "nfl" : (((6, 1),(4, 1),(5, 1),), "name/file/line"),
178 "pcalls" : (((0,-1), ), "call count"),
179 "stdname" : (((7, 1), ), "standard name"),
180 "time" : (((2,-1), ), "internal time"),
183 def get_sort_arg_defs(self
):
184 """Expand all abbreviations that are unique."""
185 if not self
.sort_arg_dict
:
186 self
.sort_arg_dict
= dict = {}
188 for word
, tup
in self
.sort_arg_dict_default
.iteritems():
194 bad_list
[fragment
] = 0
197 fragment
= fragment
[:-1]
198 for word
in bad_list
:
200 return self
.sort_arg_dict
202 def sort_stats(self
, *field
):
206 if len(field
) == 1 and type(field
[0]) == type(1):
207 # Be compatible with old profiler
208 field
= [ {-1: "stdname",
211 2: "cumulative" } [ field
[0] ] ]
213 sort_arg_defs
= self
.get_sort_arg_defs()
218 sort_tuple
= sort_tuple
+ sort_arg_defs
[word
][0]
219 self
.sort_type
+= connector
+ sort_arg_defs
[word
][1]
223 for func
, (cc
, nc
, tt
, ct
, callers
) in self
.stats
.iteritems():
224 stats_list
.append((cc
, nc
, tt
, ct
) + func
+
225 (func_std_string(func
), func
))
227 stats_list
.sort(TupleComp(sort_tuple
).compare
)
229 self
.fcn_list
= fcn_list
= []
230 for tuple in stats_list
:
231 fcn_list
.append(tuple[-1])
234 def reverse_order(self
):
236 self
.fcn_list
.reverse()
239 def strip_dirs(self
):
240 oldstats
= self
.stats
241 self
.stats
= newstats
= {}
243 for func
, (cc
, nc
, tt
, ct
, callers
) in oldstats
.iteritems():
244 newfunc
= func_strip_path(func
)
245 if len(func_std_string(newfunc
)) > max_name_len
:
246 max_name_len
= len(func_std_string(newfunc
))
248 for func2
, caller
in callers
.iteritems():
249 newcallers
[func_strip_path(func2
)] = caller
251 if newfunc
in newstats
:
252 newstats
[newfunc
] = add_func_stats(
254 (cc
, nc
, tt
, ct
, newcallers
))
256 newstats
[newfunc
] = (cc
, nc
, tt
, ct
, newcallers
)
257 old_top
= self
.top_level
258 self
.top_level
= new_top
= {}
260 new_top
[func_strip_path(func
)] = None
262 self
.max_name_len
= max_name_len
265 self
.all_callees
= None
def calc_callees(self):
    """Build self.all_callees, the inverse of the per-function caller tables.

    self.stats maps each function to (cc, nc, tt, ct, callers), where
    callers maps a calling function to its recorded value.  The result maps
    every function seen (as an entry or as a caller) to a dictionary of
    the functions it called, carrying the same recorded values.

    Does nothing when self.all_callees already holds a non-empty table.
    """
    if self.all_callees:
        return
    callee_map = {}
    self.all_callees = callee_map
    for callee, entry in self.stats.iteritems():
        _cc, _nc, _tt, _ct, callers = entry
        # Every profiled function gets an entry, even if it calls nothing.
        callee_map.setdefault(callee, {})
        for caller_func, recorded in callers.iteritems():
            callee_map.setdefault(caller_func, {})[callee] = recorded
280 #******************************************************************
281 # The following functions support actual printing of reports
282 #******************************************************************
284 # Optional "amount" is either a line count, or a percentage of lines.
286 def eval_print_amount(self
, sel
, list, msg
):
288 if type(sel
) == type(""):
291 if re
.search(sel
, func_std_string(func
)):
292 new_list
.append(func
)
295 if type(sel
) == type(1.0) and 0.0 <= sel
< 1.0:
296 count
= int(count
* sel
+ .5)
297 new_list
= list[:count
]
298 elif type(sel
) == type(1) and 0 <= sel
< count
:
300 new_list
= list[:count
]
301 if len(list) != len(new_list
):
302 msg
= msg
+ " List reduced from %r to %r due to restriction <%r>\n" % (
303 len(list), len(new_list
), sel
)
307 def get_print_list(self
, sel_list
):
308 width
= self
.max_name_len
310 list = self
.fcn_list
[:]
311 msg
= " Ordered by: " + self
.sort_type
+ '\n'
313 list = self
.stats
.keys()
314 msg
= " Random listing order was used\n"
316 for selection
in sel_list
:
317 list, msg
= self
.eval_print_amount(selection
, list, msg
)
324 if count
< len(self
.stats
):
327 if len(func_std_string(func
)) > width
:
328 width
= len(func_std_string(func
))
331 def print_stats(self
, *amount
):
332 for filename
in self
.files
:
336 for func
in self
.top_level
:
337 print indent
, func_get_function_name(func
)
339 print indent
, self
.total_calls
, "function calls",
340 if self
.total_calls
!= self
.prim_calls
:
341 print "(%d primitive calls)" % self
.prim_calls
,
342 print "in %.3f CPU seconds" % self
.total_tt
344 width
, list = self
.get_print_list(amount
)
348 self
.print_line(func
)
353 def print_callees(self
, *amount
):
354 width
, list = self
.get_print_list(amount
)
358 self
.print_call_heading(width
, "called...")
360 if func
in self
.all_callees
:
361 self
.print_call_line(width
, func
, self
.all_callees
[func
])
363 self
.print_call_line(width
, func
, {})
368 def print_callers(self
, *amount
):
369 width
, list = self
.get_print_list(amount
)
371 self
.print_call_heading(width
, "was called by...")
373 cc
, nc
, tt
, ct
, callers
= self
.stats
[func
]
374 self
.print_call_line(width
, func
, callers
)
379 def print_call_heading(self
, name_size
, column_title
):
380 print "Function ".ljust(name_size
) + column_title
382 def print_call_line(self
, name_size
, source
, call_dict
):
383 print func_std_string(source
).ljust(name_size
),
387 clist
= call_dict
.keys()
389 name_size
= name_size
+ 1
392 name
= func_std_string(func
)
393 print indent
*name_size
+ name
+ '(%r)' % (call_dict
[func
],), \
394 f8(self
.stats
[func
][3])
397 def print_title(self
):
398 print ' ncalls tottime percall cumtime percall', \
399 'filename:lineno(function)'
401 def print_line(self
, func
): # hack : should print percentages
402 cc
, nc
, tt
, ct
, callers
= self
.stats
[func
]
405 c
= c
+ '/' + str(cc
)
417 print func_std_string(func
)
420 """This class provides a generic function for comparing any two tuples.
421 Each instance records a list of tuple-indices (from most significant
to least significant), and sort direction (ascending or descending) for
each tuple-index. The compare functions can then be used as the function
argument to the system sort() function when a list of tuples needs to be
sorted in the instance's order."""
427 def __init__(self
, comp_select_list
):
428 self
.comp_select_list
= comp_select_list
430 def compare (self
, left
, right
):
431 for index
, direction
in self
.comp_select_list
:
440 #**************************************************************************
441 # func_name is a triple (file:string, line:int, name:string)
def func_strip_path(func_name):
    """Return func_name with the directory part of its file name removed.

    func_name is a (file, line, name) triple; the line and name are passed
    through unchanged and the file is reduced with os.path.basename().
    """
    path, lineno, funcname = func_name
    short_path = os.path.basename(path)
    return short_path, lineno, funcname
447 def func_get_function_name(func
):
def func_std_string(func_name):
    """Format a (file, line, name) triple as "file:line(name)".

    The layout matches what the old profile module produced.
    """
    layout = "%s:%d(%s)"
    return layout % func_name
453 #**************************************************************************
# The following functions combine statistics for pairs of functions.
455 # The bulk of the processing involves correctly handling "call" lists,
456 # such as callers and callees.
457 #**************************************************************************
def add_func_stats(target, source):
    """Return the element-wise sum of two profile entries.

    Each entry is a (cc, nc, tt, ct, callers) tuple.  The four leading
    fields are added pairwise and the two caller tables are merged with
    add_callers(); neither argument is modified here.
    """
    src_cc, src_nc, src_tt, src_ct, src_callers = source
    tgt_cc, tgt_nc, tgt_tt, tgt_ct, tgt_callers = target
    totals = (
        src_cc + tgt_cc,
        src_nc + tgt_nc,
        src_tt + tgt_tt,
        src_ct + tgt_ct,
    )
    return totals + (add_callers(tgt_callers, src_callers),)
466 def add_callers(target
, source
):
467 """Combine two caller lists in a single list."""
469 for func
, caller
in target
.iteritems():
470 new_callers
[func
] = caller
471 for func
, caller
in source
.iteritems():
472 if func
in new_callers
:
473 new_callers
[func
] = caller
+ new_callers
[func
]
475 new_callers
[func
] = caller
478 def count_calls(callers
):
479 """Sum the caller statistics to get total number of calls received."""
481 for calls
in callers
.itervalues():
485 #**************************************************************************
486 # The following functions support printing of reports
487 #**************************************************************************
492 #**************************************************************************
493 # Statistics browser added by ESR, April 2001
494 #**************************************************************************
496 if __name__
== '__main__':
503 class ProfileBrowser(cmd
.Cmd
):
504 def __init__(self
, profile
=None):
505 cmd
.Cmd
.__init
__(self
)
507 if profile
is not None:
508 self
.stats
= Stats(profile
)
512 def generic(self
, fn
, line
):
517 processed
.append(int(term
))
523 if frac
> 1 or frac
< 0:
524 print "Fraction argument mus be in [0, 1]"
526 processed
.append(frac
)
530 processed
.append(term
)
532 getattr(self
.stats
, fn
)(*processed
)
534 print "No statistics object is loaded."
536 def generic_help(self
):
537 print "Arguments may be:"
538 print "* An integer maximum number of entries to print."
539 print "* A decimal fractional number between 0 and 1, controlling"
540 print " what fraction of selected entries to print."
541 print "* A regular expression; only entries with function names"
542 print " that match it are printed."
544 def do_add(self
, line
):
548 print "Add profile info from given file to current statistics object."
def do_callees(self, line):
    """Handle the `callees` command by delegating to self.generic()."""
    run_report = self.generic
    return run_report('print_callees', line)
552 def help_callees(self
):
553 print "Print callees statistics from the current stat object."
def do_callers(self, line):
    """Handle the `callers` command by delegating to self.generic()."""
    run_report = self.generic
    return run_report('print_callers', line)
558 def help_callers(self
):
559 print "Print callers statistics from the current stat object."
562 def do_EOF(self
, line
):
566 print "Leave the profile brower."
568 def do_quit(self
, line
):
571 print "Leave the profile brower."
573 def do_read(self
, line
):
576 self
.stats
= Stats(line
)
577 except IOError, args
:
580 self
.prompt
= line
+ "% "
581 elif len(self
.prompt
) > 2:
582 line
= self
.prompt
[-2:]
584 print "No statistics object is current -- cannot reload."
587 print "Read in profile data from a specified file."
589 def do_reverse(self
, line
):
590 self
.stats
.reverse_order()
592 def help_reverse(self
):
593 print "Reverse the sort order of the profiling report."
595 def do_sort(self
, line
):
596 abbrevs
= self
.stats
.get_sort_arg_defs()
597 if line
and not filter(lambda x
,a
=abbrevs
: x
not in a
,line
.split()):
598 self
.stats
.sort_stats(*line
.split())
600 print "Valid sort keys (unique prefixes are accepted):"
601 for (key
, value
) in Stats
.sort_arg_dict_default
.iteritems():
602 print "%s -- %s" % (key
, value
[1])
605 print "Sort profile data according to specified keys."
606 print "(Typing `sort' without arguments lists valid keys.)"
def complete_sort(self, text, *args):
    """Return the keys of Stats.sort_arg_dict_default that start with text."""
    matches = []
    for key in Stats.sort_arg_dict_default:
        if key.startswith(text):
            matches.append(key)
    return matches
def do_stats(self, line):
    """Handle the `stats` command by delegating to self.generic()."""
    run_report = self.generic
    return run_report('print_stats', line)
612 def help_stats(self
):
613 print "Print statistics from the current stat object."
616 def do_strip(self
, line
):
617 self
.stats
.strip_dirs()
619 def help_strip(self
):
620 print "Strip leading path information from filenames in the report."
622 def postcmd(self
, stop
, line
):
628 print "Welcome to the profile statistics browser."
629 if len(sys
.argv
) > 1:
630 initprofile
= sys
.argv
[1]
634 ProfileBrowser(initprofile
).cmdloop()
636 except KeyboardInterrupt: