perf tools: Rewrite and improve support for kernel modules
[linux-2.6/btrfs-unstable.git] / tools / perf / builtin-report.c
blob3ed3baf96ffba62dbbc8a7f06f090a2be7d9651f
1 /*
2 * builtin-report.c
4 * Builtin report command: Analyze the perf.data input file,
5 * look up and read DSOs and symbol information and display
6 * a histogram of results, along various sorting keys.
7 */
8 #include "builtin.h"
10 #include "util/util.h"
12 #include "util/color.h"
13 #include <linux/list.h>
14 #include "util/cache.h"
15 #include <linux/rbtree.h>
16 #include "util/symbol.h"
17 #include "util/string.h"
18 #include "util/callchain.h"
19 #include "util/strlist.h"
20 #include "util/values.h"
22 #include "perf.h"
23 #include "util/debug.h"
24 #include "util/header.h"
26 #include "util/parse-options.h"
27 #include "util/parse-events.h"
29 #include "util/thread.h"
30 #include "util/sort.h"
31 #include "util/hist.h"
/* File-scope state of the report command. */
/* Input file to analyze; overridable with -i/--input. */
33 static char const *input_name = "perf.data";
/* Raw comma separated option strings for --dsos, --comms, --symbols and --column-widths. */
35 static char *dso_list_str, *comm_list_str, *sym_list_str,
36 *col_width_list_str;
/* Filter lists built by setup_list() from the option strings above. */
37 static struct strlist *dso_list, *comm_list, *sym_list;
/* -f/--force: skip the ownership check on the input file. */
39 static int force;
/* File descriptor of the opened input file. */
40 static int input;
/* Sample classes (kernel/user/hypervisor) that get accounted in the histogram. */
41 static int show_mask = SHOW_KERNEL | SHOW_USER | SHOW_HV;
/* -P/--full-paths: when set, no cwd is handed to map__new(). */
43 static int full_paths;
/* -n/--show-nr-samples: add a column holding the entry count. */
44 static int show_nr_samples;
/* -T/--threads: collect the values of PERF_RECORD_READ events and display them. */
46 static int show_threads;
47 static struct perf_read_values show_threads_values;
/* --pretty: only the value "raw" is tested for (see output__fprintf). */
49 static char default_pretty_printing_style[] = "normal";
50 static char *pretty_printing_style = default_pretty_printing_style;
/* The input is mapped page_size * mmap_window bytes at a time. */
52 static unsigned long page_size;
53 static unsigned long mmap_window = 32;
/* -x/--exclude-other: hide entries that have no matching parent symbol. */
55 static int exclude_other = 1;
/* Default argument of -g/--call-graph; a writable array because the parser tokenizes it in place. */
57 static char callchain_default_opt[] = "fractal,0.5";
/* Current directory and its length, passed to map__new(); cwd is NULL with --full-paths. */
59 static char __cwd[PATH_MAX];
60 static char *cwd = __cwd;
61 static int cwdlen;
/* Known threads and the lookup cache handed to threads__findnew(). */
63 static struct rb_root threads;
64 static struct thread *last_match;
/* Header of the input file, read in __cmd_report(). */
66 static struct perf_header *header;
/* Sample type bits taken from the header (PERF_SAMPLE_*). */
68 static u64 sample_type;
/*
 * Print the separator line drawn above a callchain branch.
 *
 * After the leading margin, every level below @depth contributes either a
 * pipe cell (its bit is set in @depth_mask) or a blank cell, and the line is
 * terminated by a newline.
 *
 * Returns the number of characters written.
 */
static size_t ipchain__fprintf_graph_line(FILE *fp, int depth, int depth_mask)
{
	size_t printed = fprintf(fp, "%s", " ");
	int level = 0;

	while (level < depth) {
		const char *cell = (depth_mask & (1 << level)) ? "| " : " ";

		printed += fprintf(fp, "%s", cell);
		level++;
	}

	printed += fprintf(fp, "\n");

	return printed;
}
87 static size_t
88 ipchain__fprintf_graph(FILE *fp, struct callchain_list *chain, int depth,
89 int depth_mask, int count, u64 total_samples,
90 int hits)
92 int i;
93 size_t ret = 0;
95 ret += fprintf(fp, "%s", " ");
96 for (i = 0; i < depth; i++) {
97 if (depth_mask & (1 << i))
98 ret += fprintf(fp, "|");
99 else
100 ret += fprintf(fp, " ");
101 if (!count && i == depth - 1) {
102 double percent;
104 percent = hits * 100.0 / total_samples;
105 ret += percent_color_fprintf(fp, "--%2.2f%%-- ", percent);
106 } else
107 ret += fprintf(fp, "%s", " ");
109 if (chain->sym)
110 ret += fprintf(fp, "%s\n", chain->sym->name);
111 else
112 ret += fprintf(fp, "%p\n", (void *)(long)chain->ip);
114 return ret;
117 static struct symbol *rem_sq_bracket;
118 static struct callchain_list rem_hits;
120 static void init_rem_hits(void)
122 rem_sq_bracket = malloc(sizeof(*rem_sq_bracket) + 6);
123 if (!rem_sq_bracket) {
124 fprintf(stderr, "Not enough memory to display remaining hits\n");
125 return;
128 strcpy(rem_sq_bracket->name, "[...]");
129 rem_hits.sym = rem_sq_bracket;
/*
 * Recursively print the children of callchain node "self" as a graph.
 *
 * total_samples is the base for percentages at this level, depth is the
 * current nesting level and depth_mask has one bit per level telling whether
 * a pipe must still be drawn for it.  Returns the number of characters
 * written by the helpers whose results are accumulated in ret.
 */
132 static size_t
133 callchain__fprintf_graph(FILE *fp, struct callchain_node *self,
134 u64 total_samples, int depth, int depth_mask)
136 struct rb_node *node, *next;
137 struct callchain_node *child;
138 struct callchain_list *chain;
139 int new_depth_mask = depth_mask;
140 u64 new_total;
141 u64 remaining;
142 size_t ret = 0;
143 int i;
/* In relative mode percentages are computed against the hits of the children of this node. */
145 if (callchain_param.mode == CHAIN_GRAPH_REL)
146 new_total = self->children_hit;
147 else
148 new_total = total_samples;
/* Starts at the full total; the cumulated hits of every child are subtracted below. */
150 remaining = new_total;
152 node = rb_first(&self->rb_root);
153 while (node) {
154 u64 cumul;
156 child = rb_entry(node, struct callchain_node, rb_node);
157 cumul = cumul_hits(child);
158 remaining -= cumul;
161 * The depth mask manages the output of pipes that show
162 * the depth. We don't want to keep the pipes of the current
163 * level for the last child of this depth.
164 * Except if we have remaining filtered hits. They will
165 * supersede the last child
167 next = rb_next(node);
168 if (!next && (callchain_param.mode != CHAIN_GRAPH_REL || !remaining))
169 new_depth_mask &= ~(1 << (depth - 1));
172 * But we keep the older depth mask for the line seperator
173 * to keep the level link until we reach the last child
175 ret += ipchain__fprintf_graph_line(fp, depth, depth_mask);
/* i counts the printed entries of this child; only the first one (i == 0) carries the percentage. */
176 i = 0;
177 list_for_each_entry(chain, &child->val, list) {
/* Values at or above PERF_CONTEXT_MAX are context markers, not addresses. */
178 if (chain->ip >= PERF_CONTEXT_MAX)
179 continue;
180 ret += ipchain__fprintf_graph(fp, chain, depth,
181 new_depth_mask, i++,
182 new_total,
183 cumul);
/* Descend into the child, enabling the pipe of the current level for it. */
185 ret += callchain__fprintf_graph(fp, child, new_total,
186 depth + 1,
187 new_depth_mask | (1 << depth));
188 node = next;
/* Relative mode only: show what is left over as a "[...]" entry, unless nothing or everything is left. */
191 if (callchain_param.mode == CHAIN_GRAPH_REL &&
192 remaining && remaining != new_total) {
/* The placeholder symbol could not be allocated, so the entry is skipped. */
194 if (!rem_sq_bracket)
195 return ret;
197 new_depth_mask &= ~(1 << (depth - 1));
199 ret += ipchain__fprintf_graph(fp, &rem_hits, depth,
200 new_depth_mask, 0, new_total,
201 remaining);
204 return ret;
207 static size_t
208 callchain__fprintf_flat(FILE *fp, struct callchain_node *self,
209 u64 total_samples)
211 struct callchain_list *chain;
212 size_t ret = 0;
214 if (!self)
215 return 0;
217 ret += callchain__fprintf_flat(fp, self->parent, total_samples);
220 list_for_each_entry(chain, &self->val, list) {
221 if (chain->ip >= PERF_CONTEXT_MAX)
222 continue;
223 if (chain->sym)
224 ret += fprintf(fp, " %s\n", chain->sym->name);
225 else
226 ret += fprintf(fp, " %p\n",
227 (void *)(long)chain->ip);
230 return ret;
233 static size_t
234 hist_entry_callchain__fprintf(FILE *fp, struct hist_entry *self,
235 u64 total_samples)
237 struct rb_node *rb_node;
238 struct callchain_node *chain;
239 size_t ret = 0;
241 rb_node = rb_first(&self->sorted_chain);
242 while (rb_node) {
243 double percent;
245 chain = rb_entry(rb_node, struct callchain_node, rb_node);
246 percent = chain->hit * 100.0 / total_samples;
247 switch (callchain_param.mode) {
248 case CHAIN_FLAT:
249 ret += percent_color_fprintf(fp, " %6.2f%%\n",
250 percent);
251 ret += callchain__fprintf_flat(fp, chain, total_samples);
252 break;
253 case CHAIN_GRAPH_ABS: /* Falldown */
254 case CHAIN_GRAPH_REL:
255 ret += callchain__fprintf_graph(fp, chain,
256 total_samples, 1, 1);
257 case CHAIN_NONE:
258 default:
259 break;
261 ret += fprintf(fp, "\n");
262 rb_node = rb_next(rb_node);
265 return ret;
268 static size_t
269 hist_entry__fprintf(FILE *fp, struct hist_entry *self, u64 total_samples)
271 struct sort_entry *se;
272 size_t ret;
274 if (exclude_other && !self->parent)
275 return 0;
277 if (total_samples)
278 ret = percent_color_fprintf(fp,
279 field_sep ? "%.2f" : " %6.2f%%",
280 (self->count * 100.0) / total_samples);
281 else
282 ret = fprintf(fp, field_sep ? "%lld" : "%12lld ", self->count);
284 if (show_nr_samples) {
285 if (field_sep)
286 fprintf(fp, "%c%lld", *field_sep, self->count);
287 else
288 fprintf(fp, "%11lld", self->count);
291 list_for_each_entry(se, &hist_entry__sort_list, list) {
292 if (se->elide)
293 continue;
295 fprintf(fp, "%s", field_sep ?: " ");
296 ret += se->print(fp, self, se->width ? *se->width : 0);
299 ret += fprintf(fp, "\n");
301 if (callchain)
302 hist_entry_callchain__fprintf(fp, self, total_samples);
304 return ret;
311 static void dso__calc_col_width(struct dso *self)
313 if (!col_width_list_str && !field_sep &&
314 (!dso_list || strlist__has_entry(dso_list, self->name))) {
315 unsigned int slen = strlen(self->name);
316 if (slen > dsos__col_width)
317 dsos__col_width = slen;
320 self->slen_calculated = 1;
323 static void thread__comm_adjust(struct thread *self)
325 char *comm = self->comm;
327 if (!col_width_list_str && !field_sep &&
328 (!comm_list || strlist__has_entry(comm_list, comm))) {
329 unsigned int slen = strlen(comm);
331 if (slen > comms__col_width) {
332 comms__col_width = slen;
333 threads__col_width = slen + 6;
/*
 * Set the command name of @self and, on success, adjust the column widths
 * to it.
 *
 * Returns 0 on success, otherwise the non-zero result of thread__set_comm().
 */
static int thread__set_comm_adjust(struct thread *self, const char *comm)
{
	int err = thread__set_comm(self, comm);

	if (err == 0)
		thread__comm_adjust(self);

	return err;
}
/*
 * Resolve the address *ipp to a symbol.
 *
 * When the caller supplies a map through mapp it is used directly, otherwise
 * the map is looked up in the thread and stored back through mapp.  The
 * address translated by the map is written back to *ipp.  Returns the symbol
 * found in the dso of the map, or NULL when there is no thread, no map or no
 * symbol.
 */
351 static struct symbol *
352 resolve_symbol(struct thread *thread, struct map **mapp, u64 *ipp)
354 struct map *map = mapp ? *mapp : NULL;
355 u64 ip = *ipp;
/* A caller-provided map skips the lookup; note that got_map sits inside the if-body below. */
357 if (map)
358 goto got_map;
360 if (!thread)
361 return NULL;
363 map = thread__find_map(thread, ip);
364 if (map != NULL) {
366 * We have to do this here as we may have a dso
367 * with no symbol hit that has a name longer than
368 * the ones with symbols sampled.
370 if (!sort_dso.elide && !map->dso->slen_calculated)
371 dso__calc_col_width(map->dso);
373 if (mapp)
374 *mapp = map;
375 got_map:
/* Translate the sampled address with the map's own conversion hook. */
376 ip = map->map_ip(map, ip);
377 } else {
379 * If this is outside of all known maps,
380 * and is a negative address, try to look it
381 * up in the kernel dso, as it might be a
382 * vsyscall or vdso (which executes in user-mode).
384 * XXX This is nasty, we should have a symbol list in
385 * the "[vdso]" dso, but for now lets use the old
386 * trick of looking in the whole kernel symbol list.
388 if ((long long)ip < 0) {
389 map = kernel_map;
390 if (mapp)
391 *mapp = map;
394 dump_printf(" ...... dso: %s\n",
395 map ? map->dso->long_name : "<not found>");
396 dump_printf(" ...... map: %Lx -> %Lx\n", *ipp, ip);
/* Hand the (possibly translated) address back to the caller. */
397 *ipp = ip;
399 return map ? map->dso->find_symbol(map->dso, ip) : NULL;
402 static int call__match(struct symbol *sym)
404 if (sym->name && !regexec(&parent_regex, sym->name, 0, NULL, 0))
405 return 1;
407 return 0;
410 static struct symbol **
411 resolve_callchain(struct thread *thread, struct map *map,
412 struct ip_callchain *chain, struct hist_entry *entry)
414 u64 context = PERF_CONTEXT_MAX;
415 struct symbol **syms = NULL;
416 unsigned int i;
418 if (callchain) {
419 syms = calloc(chain->nr, sizeof(*syms));
420 if (!syms) {
421 fprintf(stderr, "Can't allocate memory for symbols\n");
422 exit(-1);
426 for (i = 0; i < chain->nr; i++) {
427 u64 ip = chain->ips[i];
428 struct symbol *sym = NULL;
430 if (ip >= PERF_CONTEXT_MAX) {
431 context = ip;
432 continue;
435 switch (context) {
436 case PERF_CONTEXT_HV:
437 break;
438 case PERF_CONTEXT_KERNEL:
439 sym = kernel_maps__find_symbol(ip, &map);
440 break;
441 default:
442 sym = resolve_symbol(thread, &map, &ip);
443 break;
446 if (sym) {
447 if (sort__has_parent && call__match(sym) &&
448 !entry->parent)
449 entry->parent = sym;
450 if (!callchain)
451 break;
452 syms[i] = sym;
456 return syms;
460 * collect histogram counts
463 static int
464 hist_entry__add(struct thread *thread, struct map *map,
465 struct symbol *sym, u64 ip, struct ip_callchain *chain,
466 char level, u64 count)
468 struct rb_node **p = &hist.rb_node;
469 struct rb_node *parent = NULL;
470 struct hist_entry *he;
471 struct symbol **syms = NULL;
472 struct hist_entry entry = {
473 .thread = thread,
474 .map = map,
475 .sym = sym,
476 .ip = ip,
477 .level = level,
478 .count = count,
479 .parent = NULL,
480 .sorted_chain = RB_ROOT
482 int cmp;
484 if ((sort__has_parent || callchain) && chain)
485 syms = resolve_callchain(thread, map, chain, &entry);
487 while (*p != NULL) {
488 parent = *p;
489 he = rb_entry(parent, struct hist_entry, rb_node);
491 cmp = hist_entry__cmp(&entry, he);
493 if (!cmp) {
494 he->count += count;
495 if (callchain) {
496 append_chain(&he->callchain, chain, syms);
497 free(syms);
499 return 0;
502 if (cmp < 0)
503 p = &(*p)->rb_left;
504 else
505 p = &(*p)->rb_right;
508 he = malloc(sizeof(*he));
509 if (!he)
510 return -ENOMEM;
511 *he = entry;
512 if (callchain) {
513 callchain_init(&he->callchain);
514 append_chain(&he->callchain, chain, syms);
515 free(syms);
517 rb_link_node(&he->rb_node, parent, p);
518 rb_insert_color(&he->rb_node, &hist);
520 return 0;
/*
 * Print the whole report to fp: the header lines, the column titles, one
 * line per histogram entry of output_hists and, when requested, the
 * per-thread counter values.
 *
 * Returns the sum of the values returned by hist_entry__fprintf(); the
 * header and footer lines are not counted.
 */
523 static size_t output__fprintf(FILE *fp, u64 total_samples)
525 struct hist_entry *pos;
526 struct sort_entry *se;
527 struct rb_node *nd;
528 size_t ret = 0;
529 unsigned int width;
530 char *col_width = col_width_list_str;
531 int raw_printing_style;
533 raw_printing_style = !strcmp(pretty_printing_style, "raw");
/* Prepare the "[...]" placeholder used by the callchain graph output. */
535 init_rem_hits();
537 fprintf(fp, "# Samples: %Ld\n", (u64)total_samples);
538 fprintf(fp, "#\n");
540 fprintf(fp, "# Overhead");
541 if (show_nr_samples) {
542 if (field_sep)
543 fprintf(fp, "%cSamples", *field_sep);
544 else
545 fputs(" Samples ", fp);
/* Column titles; with a field separator no padding is applied. */
547 list_for_each_entry(se, &hist_entry__sort_list, list) {
548 if (se->elide)
549 continue;
550 if (field_sep) {
551 fprintf(fp, "%c%s", *field_sep, se->header);
552 continue;
554 width = strlen(se->header);
555 if (se->width) {
/* Consume the user supplied width list one comma separated value per column. */
556 if (col_width_list_str) {
557 if (col_width) {
558 *se->width = atoi(col_width);
559 col_width = strchr(col_width, ',');
560 if (col_width)
561 ++col_width;
/* A column is never narrower than its title. */
564 width = *se->width = max(*se->width, width);
566 fprintf(fp, " %*s", width, se->header);
568 fprintf(fp, "\n");
/* The dotted underline is only drawn for the aligned layout. */
570 if (field_sep)
571 goto print_entries;
573 fprintf(fp, "# ........");
574 if (show_nr_samples)
575 fprintf(fp, " ..........");
576 list_for_each_entry(se, &hist_entry__sort_list, list) {
577 unsigned int i;
579 if (se->elide)
580 continue;
582 fprintf(fp, " ");
583 if (se->width)
584 width = *se->width;
585 else
586 width = strlen(se->header);
587 for (i = 0; i < width; i++)
588 fprintf(fp, ".");
590 fprintf(fp, "\n");
592 fprintf(fp, "#\n");
594 print_entries:
595 for (nd = rb_first(&output_hists); nd; nd = rb_next(nd)) {
596 pos = rb_entry(nd, struct hist_entry, rb_node);
597 ret += hist_entry__fprintf(fp, pos, total_samples);
/* The hint is only shown when neither the sort order nor the parent pattern was changed. */
600 if (sort_order == default_sort_order &&
601 parent_pattern == default_parent_pattern) {
602 fprintf(fp, "#\n");
603 fprintf(fp, "# (For a higher level overview, try: perf report --sort comm,dso)\n");
604 fprintf(fp, "#\n");
606 fprintf(fp, "\n");
/* NOTE(review): rem_sq_bracket and rem_hits.sym keep pointing at the freed symbol afterwards. */
608 free(rem_sq_bracket);
610 if (show_threads)
611 perf_read_values_display(fp, &show_threads_values,
612 raw_printing_style);
614 return ret;
617 static int validate_chain(struct ip_callchain *chain, event_t *event)
619 unsigned int chain_size;
621 chain_size = event->header.size;
622 chain_size -= (unsigned long)&event->ip.__more_data - (unsigned long)event;
624 if (chain->nr*sizeof(u64) > chain_size)
625 return -1;
627 return 0;
630 static int
631 process_sample_event(event_t *event, unsigned long offset, unsigned long head)
633 char level;
634 int show = 0;
635 struct symbol *sym = NULL;
636 struct thread *thread;
637 u64 ip = event->ip.ip;
638 u64 period = 1;
639 struct map *map = NULL;
640 void *more_data = event->ip.__more_data;
641 struct ip_callchain *chain = NULL;
642 int cpumode;
644 thread = threads__findnew(event->ip.pid, &threads, &last_match);
646 if (sample_type & PERF_SAMPLE_PERIOD) {
647 period = *(u64 *)more_data;
648 more_data += sizeof(u64);
651 dump_printf("%p [%p]: PERF_RECORD_SAMPLE (IP, %d): %d/%d: %p period: %Ld\n",
652 (void *)(offset + head),
653 (void *)(long)(event->header.size),
654 event->header.misc,
655 event->ip.pid, event->ip.tid,
656 (void *)(long)ip,
657 (long long)period);
659 if (sample_type & PERF_SAMPLE_CALLCHAIN) {
660 unsigned int i;
662 chain = (void *)more_data;
664 dump_printf("... chain: nr:%Lu\n", chain->nr);
666 if (validate_chain(chain, event) < 0) {
667 eprintf("call-chain problem with event, skipping it.\n");
668 return 0;
671 if (dump_trace) {
672 for (i = 0; i < chain->nr; i++)
673 dump_printf("..... %2d: %016Lx\n", i, chain->ips[i]);
677 dump_printf(" ... thread: %s:%d\n", thread->comm, thread->pid);
679 if (thread == NULL) {
680 eprintf("problem processing %d event, skipping it.\n",
681 event->header.type);
682 return -1;
685 if (comm_list && !strlist__has_entry(comm_list, thread->comm))
686 return 0;
688 cpumode = event->header.misc & PERF_RECORD_MISC_CPUMODE_MASK;
690 if (cpumode == PERF_RECORD_MISC_KERNEL) {
691 show = SHOW_KERNEL;
692 level = 'k';
694 sym = kernel_maps__find_symbol(ip, &map);
695 dump_printf(" ...... dso: %s\n",
696 map ? map->dso->long_name : "<not found>");
697 } else if (cpumode == PERF_RECORD_MISC_USER) {
699 show = SHOW_USER;
700 level = '.';
701 sym = resolve_symbol(thread, &map, &ip);
703 } else {
704 show = SHOW_HV;
705 level = 'H';
707 dump_printf(" ...... dso: [hypervisor]\n");
710 if (show & show_mask) {
711 if (dso_list &&
712 (!map || !map->dso ||
713 !(strlist__has_entry(dso_list, map->dso->short_name) ||
714 (map->dso->short_name != map->dso->long_name &&
715 strlist__has_entry(dso_list, map->dso->long_name)))))
716 return 0;
718 if (sym_list && sym && !strlist__has_entry(sym_list, sym->name))
719 return 0;
721 if (hist_entry__add(thread, map, sym, ip,
722 chain, level, period)) {
723 eprintf("problem incrementing symbol count, skipping event\n");
724 return -1;
727 total += period;
729 return 0;
732 static int
733 process_mmap_event(event_t *event, unsigned long offset, unsigned long head)
735 struct thread *thread;
736 struct map *map = map__new(&event->mmap, cwd, cwdlen);
738 thread = threads__findnew(event->mmap.pid, &threads, &last_match);
740 dump_printf("%p [%p]: PERF_RECORD_MMAP %d/%d: [%p(%p) @ %p]: %s\n",
741 (void *)(offset + head),
742 (void *)(long)(event->header.size),
743 event->mmap.pid,
744 event->mmap.tid,
745 (void *)(long)event->mmap.start,
746 (void *)(long)event->mmap.len,
747 (void *)(long)event->mmap.pgoff,
748 event->mmap.filename);
750 if (thread == NULL || map == NULL) {
751 dump_printf("problem processing PERF_RECORD_MMAP, skipping event.\n");
752 return 0;
755 thread__insert_map(thread, map);
756 total_mmap++;
758 return 0;
761 static int
762 process_comm_event(event_t *event, unsigned long offset, unsigned long head)
764 struct thread *thread;
766 thread = threads__findnew(event->comm.pid, &threads, &last_match);
768 dump_printf("%p [%p]: PERF_RECORD_COMM: %s:%d\n",
769 (void *)(offset + head),
770 (void *)(long)(event->header.size),
771 event->comm.comm, event->comm.pid);
773 if (thread == NULL ||
774 thread__set_comm_adjust(thread, event->comm.comm)) {
775 dump_printf("problem processing PERF_RECORD_COMM, skipping event.\n");
776 return -1;
778 total_comm++;
780 return 0;
783 static int
784 process_task_event(event_t *event, unsigned long offset, unsigned long head)
786 struct thread *thread;
787 struct thread *parent;
789 thread = threads__findnew(event->fork.pid, &threads, &last_match);
790 parent = threads__findnew(event->fork.ppid, &threads, &last_match);
792 dump_printf("%p [%p]: PERF_RECORD_%s: (%d:%d):(%d:%d)\n",
793 (void *)(offset + head),
794 (void *)(long)(event->header.size),
795 event->header.type == PERF_RECORD_FORK ? "FORK" : "EXIT",
796 event->fork.pid, event->fork.tid,
797 event->fork.ppid, event->fork.ptid);
800 * A thread clone will have the same PID for both
801 * parent and child.
803 if (thread == parent)
804 return 0;
806 if (event->header.type == PERF_RECORD_EXIT)
807 return 0;
809 if (!thread || !parent || thread__fork(thread, parent)) {
810 dump_printf("problem processing PERF_RECORD_FORK, skipping event.\n");
811 return -1;
813 total_fork++;
815 return 0;
818 static int
819 process_lost_event(event_t *event, unsigned long offset, unsigned long head)
821 dump_printf("%p [%p]: PERF_RECORD_LOST: id:%Ld: lost:%Ld\n",
822 (void *)(offset + head),
823 (void *)(long)(event->header.size),
824 event->lost.id,
825 event->lost.lost);
827 total_lost += event->lost.lost;
829 return 0;
832 static int
833 process_read_event(event_t *event, unsigned long offset, unsigned long head)
835 struct perf_event_attr *attr;
837 attr = perf_header__find_attr(event->read.id, header);
839 if (show_threads) {
840 const char *name = attr ? __event_name(attr->type, attr->config)
841 : "unknown";
842 perf_read_values_add_value(&show_threads_values,
843 event->read.pid, event->read.tid,
844 event->read.id,
845 name,
846 event->read.value);
849 dump_printf("%p [%p]: PERF_RECORD_READ: %d %d %s %Lu\n",
850 (void *)(offset + head),
851 (void *)(long)(event->header.size),
852 event->read.pid,
853 event->read.tid,
854 attr ? __event_name(attr->type, attr->config)
855 : "FAIL",
856 event->read.value);
858 return 0;
861 static int
862 process_event(event_t *event, unsigned long offset, unsigned long head)
864 trace_event(event);
866 switch (event->header.type) {
867 case PERF_RECORD_SAMPLE:
868 return process_sample_event(event, offset, head);
870 case PERF_RECORD_MMAP:
871 return process_mmap_event(event, offset, head);
873 case PERF_RECORD_COMM:
874 return process_comm_event(event, offset, head);
876 case PERF_RECORD_FORK:
877 case PERF_RECORD_EXIT:
878 return process_task_event(event, offset, head);
880 case PERF_RECORD_LOST:
881 return process_lost_event(event, offset, head);
883 case PERF_RECORD_READ:
884 return process_read_event(event, offset, head);
887 * We dont process them right now but they are fine:
890 case PERF_RECORD_THROTTLE:
891 case PERF_RECORD_UNTHROTTLE:
892 return 0;
894 default:
895 return -1;
898 return 0;
/*
 * Core of the report command: open and check the input file, read its
 * header, walk all events through a sliding mmap window and finally sort and
 * print the histogram.
 *
 * Most setup failures terminate the program through exit(); failing to load
 * the kernel symbols or to get the current directory returns EXIT_FAILURE.
 * Returns 0 after a raw dump (dump_trace) and EXIT_SUCCESS after a report.
 */
901 static int __cmd_report(void)
903 int ret, rc = EXIT_FAILURE;
904 unsigned long offset = 0;
905 unsigned long head, shift;
906 struct stat input_stat;
907 struct thread *idle;
908 event_t *event;
909 uint32_t size;
910 char *buf;
/* The idle thread is registered up front so that its comm is part of the column width computation. */
912 idle = register_idle_thread(&threads, &last_match);
913 thread__comm_adjust(idle);
915 if (show_threads)
916 perf_read_values_init(&show_threads_values);
918 input = open(input_name, O_RDONLY);
919 if (input < 0) {
920 fprintf(stderr, " failed to open file: %s", input_name);
921 if (!strcmp(input_name, "perf.data"))
922 fprintf(stderr, " (try 'perf record' first)");
923 fprintf(stderr, "\n");
924 exit(-1);
927 ret = fstat(input, &input_stat);
928 if (ret < 0) {
929 perror("failed to stat file");
930 exit(-1);
/* Unless forced, only files owned by root or by the effective user are accepted. */
933 if (!force && input_stat.st_uid && (input_stat.st_uid != geteuid())) {
934 fprintf(stderr, "file: %s not owned by current user or root\n", input_name);
935 exit(-1);
938 if (!input_stat.st_size) {
939 fprintf(stderr, "zero-sized file, nothing to do!\n");
940 exit(0);
/* NOTE(review): the result of perf_header__read() is dereferenced without a NULL check — confirm it cannot fail by returning NULL. */
943 header = perf_header__read(input);
944 head = header->data_offset;
946 sample_type = perf_header__sample_type(header);
/* Callchain related options need callchain data in the file; conversely such data enables callchain output unless the mode is "none". */
948 if (!(sample_type & PERF_SAMPLE_CALLCHAIN)) {
949 if (sort__has_parent) {
950 fprintf(stderr, "selected --sort parent, but no"
951 " callchain data. Did you call"
952 " perf record without -g?\n");
953 exit(-1);
955 if (callchain) {
956 fprintf(stderr, "selected -g but no callchain data."
957 " Did you call perf record without"
958 " -g?\n");
959 exit(-1);
961 } else if (callchain_param.mode != CHAIN_NONE && !callchain) {
962 callchain = 1;
963 if (register_callchain_param(&callchain_param) < 0) {
964 fprintf(stderr, "Can't register callchain"
965 " params\n");
966 exit(-1);
970 if (load_kernel() < 0) {
971 perror("failed to load kernel symbols");
972 return EXIT_FAILURE;
975 if (!full_paths) {
976 if (getcwd(__cwd, sizeof(__cwd)) == NULL) {
977 perror("failed to get the current directory");
978 return EXIT_FAILURE;
980 cwdlen = strlen(cwd);
981 } else {
982 cwd = NULL;
983 cwdlen = 0;
/* Split the data offset into a page aligned file offset and the position inside the window. */
986 shift = page_size * (head / page_size);
987 offset += shift;
988 head -= shift;
990 remap:
991 buf = (char *)mmap(NULL, page_size * mmap_window, PROT_READ,
992 MAP_SHARED, input, offset);
993 if (buf == MAP_FAILED) {
994 perror("failed to mmap file");
995 exit(-1);
998 more:
999 event = (event_t *)(buf + head);
/* NOTE(review): this value of size is overwritten at the assignment below before it is ever read. */
1001 size = event->header.size;
1002 if (!size)
1003 size = 8;
/* The event would cross the end of the window: slide the window forward to the page holding its start. */
1005 if (head + event->header.size >= page_size * mmap_window) {
1006 int munmap_ret;
1008 shift = page_size * (head / page_size);
1010 munmap_ret = munmap(buf, page_size * mmap_window);
1011 assert(munmap_ret == 0);
1013 offset += shift;
1014 head -= shift;
1015 goto remap;
1018 size = event->header.size;
1020 dump_printf("\n%p [%p]: event: %d\n",
1021 (void *)(offset + head),
1022 (void *)(long)event->header.size,
1023 event->header.type);
/* Zero sized events and events rejected by their handler are counted as unknown. */
1025 if (!size || process_event(event, offset, head) < 0) {
1027 dump_printf("%p [%p]: skipping unknown header type: %d\n",
1028 (void *)(offset + head),
1029 (void *)(long)(event->header.size),
1030 event->header.type);
1032 total_unknown++;
1035 * assume we lost track of the stream, check alignment, and
1036 * increment a single u64 in the hope to catch on again 'soon'.
1039 if (unlikely(head & 7))
1040 head &= ~7ULL;
1042 size = 8;
1045 head += size;
/* Stop at the end of the data section, or at the end of the file. */
1047 if (offset + head >= header->data_offset + header->data_size)
1048 goto done;
1050 if (offset + head < (unsigned long)input_stat.st_size)
1051 goto more;
1053 done:
1054 rc = EXIT_SUCCESS;
1055 close(input);
1057 dump_printf(" IP events: %10ld\n", total);
1058 dump_printf(" mmap events: %10ld\n", total_mmap);
1059 dump_printf(" comm events: %10ld\n", total_comm);
1060 dump_printf(" fork events: %10ld\n", total_fork);
1061 dump_printf(" lost events: %10ld\n", total_lost);
1062 dump_printf(" unknown events: %10ld\n", total_unknown);
/* A raw dump was requested: no report is printed. */
1064 if (dump_trace)
1065 return 0;
1067 if (verbose >= 3)
1068 threads__fprintf(stdout, &threads);
1070 if (verbose >= 2)
1071 dsos__fprintf(stdout);
1073 collapse__resort();
1074 output__resort(total);
1075 output__fprintf(stdout, total);
1077 if (show_threads)
1078 perf_read_values_destroy(&show_threads_values);
1080 return rc;
1083 static int
1084 parse_callchain_opt(const struct option *opt __used, const char *arg,
1085 int unset __used)
1087 char *tok;
1088 char *endptr;
1090 callchain = 1;
1092 if (!arg)
1093 return 0;
1095 tok = strtok((char *)arg, ",");
1096 if (!tok)
1097 return -1;
1099 /* get the output mode */
1100 if (!strncmp(tok, "graph", strlen(arg)))
1101 callchain_param.mode = CHAIN_GRAPH_ABS;
1103 else if (!strncmp(tok, "flat", strlen(arg)))
1104 callchain_param.mode = CHAIN_FLAT;
1106 else if (!strncmp(tok, "fractal", strlen(arg)))
1107 callchain_param.mode = CHAIN_GRAPH_REL;
1109 else if (!strncmp(tok, "none", strlen(arg))) {
1110 callchain_param.mode = CHAIN_NONE;
1111 callchain = 0;
1113 return 0;
1116 else
1117 return -1;
1119 /* get the min percentage */
1120 tok = strtok(NULL, ",");
1121 if (!tok)
1122 goto setup;
1124 callchain_param.min_percent = strtod(tok, &endptr);
1125 if (tok == endptr)
1126 return -1;
1128 setup:
1129 if (register_callchain_param(&callchain_param) < 0) {
1130 fprintf(stderr, "Can't register callchain params\n");
1131 return -1;
1133 return 0;
/* NULL-terminated usage strings handed to parse_options() and usage_with_options(). */
1136 //static const char * const report_usage[] = {
1137 const char * const report_usage[] = {
1138 "perf report [<options>] <command>",
1139 NULL
/*
 * Command line options of perf report.  Each entry binds a short/long option
 * to the variable it sets; -g is the only one handled through a callback
 * (parse_callchain_opt), with callchain_default_opt as its default argument.
 */
1142 static const struct option options[] = {
1143 OPT_STRING('i', "input", &input_name, "file",
1144 "input file name"),
1145 OPT_BOOLEAN('v', "verbose", &verbose,
1146 "be more verbose (show symbol address, etc)"),
1147 OPT_BOOLEAN('D', "dump-raw-trace", &dump_trace,
1148 "dump raw trace in ASCII"),
1149 OPT_STRING('k', "vmlinux", &vmlinux_name, "file", "vmlinux pathname"),
1150 OPT_BOOLEAN('f', "force", &force, "don't complain, do it"),
1151 OPT_BOOLEAN('m', "modules", &modules,
1152 "load module symbols - WARNING: use only with -k and LIVE kernel"),
1153 OPT_BOOLEAN('n', "show-nr-samples", &show_nr_samples,
1154 "Show a column with the number of samples"),
1155 OPT_BOOLEAN('T', "threads", &show_threads,
1156 "Show per-thread event counters"),
1157 OPT_STRING(0, "pretty", &pretty_printing_style, "key",
1158 "pretty printing style key: normal raw"),
1159 OPT_STRING('s', "sort", &sort_order, "key[,key2...]",
1160 "sort by key(s): pid, comm, dso, symbol, parent"),
1161 OPT_BOOLEAN('P', "full-paths", &full_paths,
1162 "Don't shorten the pathnames taking into account the cwd"),
1163 OPT_STRING('p', "parent", &parent_pattern, "regex",
1164 "regex filter to identify parent, see: '--sort parent'"),
1165 OPT_BOOLEAN('x', "exclude-other", &exclude_other,
1166 "Only display entries with parent-match"),
1167 OPT_CALLBACK_DEFAULT('g', "call-graph", NULL, "output_type,min_percent",
1168 "Display callchains using output_type and min percent threshold. "
1169 "Default: fractal,0.5", &parse_callchain_opt, callchain_default_opt),
1170 OPT_STRING('d', "dsos", &dso_list_str, "dso[,dso...]",
1171 "only consider symbols in these dsos"),
1172 OPT_STRING('C', "comms", &comm_list_str, "comm[,comm...]",
1173 "only consider symbols in these comms"),
1174 OPT_STRING('S', "symbols", &sym_list_str, "symbol[,symbol...]",
1175 "only consider these symbols"),
1176 OPT_STRING('w', "column-widths", &col_width_list_str,
1177 "width[,width...]",
1178 "don't try to adjust column width, use these fixed values"),
1179 OPT_STRING('t', "field-separator", &field_sep, "separator",
1180 "separator for columns, no spaces will be added between "
1181 "columns '.' is reserved."),
1182 OPT_END()
1185 static void setup_sorting(void)
1187 char *tmp, *tok, *str = strdup(sort_order);
1189 for (tok = strtok_r(str, ", ", &tmp);
1190 tok; tok = strtok_r(NULL, ", ", &tmp)) {
1191 if (sort_dimension__add(tok) < 0) {
1192 error("Unknown --sort key: `%s'", tok);
1193 usage_with_options(report_usage, options);
1197 free(str);
1200 static void setup_list(struct strlist **list, const char *list_str,
1201 struct sort_entry *se, const char *list_name,
1202 FILE *fp)
1204 if (list_str) {
1205 *list = strlist__new(true, list_str);
1206 if (!*list) {
1207 fprintf(stderr, "problems parsing %s list\n",
1208 list_name);
1209 exit(129);
1211 if (strlist__nr_entries(*list) == 1) {
1212 fprintf(fp, "# %s: %s\n", list_name,
1213 strlist__entry(*list, 0)->s);
1214 se->elide = true;
1219 int cmd_report(int argc, const char **argv, const char *prefix __used)
1221 symbol__init();
1223 page_size = getpagesize();
1225 argc = parse_options(argc, argv, options, report_usage, 0);
1227 setup_sorting();
1229 if (parent_pattern != default_parent_pattern) {
1230 sort_dimension__add("parent");
1231 sort_parent.elide = 1;
1232 } else
1233 exclude_other = 0;
1236 * Any (unrecognized) arguments left?
1238 if (argc)
1239 usage_with_options(report_usage, options);
1241 setup_pager();
1243 setup_list(&dso_list, dso_list_str, &sort_dso, "dso", stdout);
1244 setup_list(&comm_list, comm_list_str, &sort_comm, "comm", stdout);
1245 setup_list(&sym_list, sym_list_str, &sort_sym, "symbol", stdout);
1247 if (field_sep && *field_sep == '.') {
1248 fputs("'.' is the only non valid --field-separator argument\n",
1249 stderr);
1250 exit(129);
1253 return __cmd_report();