perf tools: Encode kernel module mappings in perf.data
[linux-2.6/btrfs-unstable.git] / tools / perf / util / event.c
blob4f3e7ef33b834da3b2067e7abdca1fba0ed08480
1 #include <linux/types.h>
2 #include "event.h"
3 #include "debug.h"
4 #include "session.h"
5 #include "sort.h"
6 #include "string.h"
7 #include "strlist.h"
8 #include "thread.h"
10 static pid_t event__synthesize_comm(pid_t pid, int full,
11 event__handler_t process,
12 struct perf_session *session)
14 event_t ev;
15 char filename[PATH_MAX];
16 char bf[BUFSIZ];
17 FILE *fp;
18 size_t size = 0;
19 DIR *tasks;
20 struct dirent dirent, *next;
21 pid_t tgid = 0;
23 snprintf(filename, sizeof(filename), "/proc/%d/status", pid);
25 fp = fopen(filename, "r");
26 if (fp == NULL) {
27 out_race:
29 * We raced with a task exiting - just return:
31 pr_debug("couldn't open %s\n", filename);
32 return 0;
35 memset(&ev.comm, 0, sizeof(ev.comm));
36 while (!ev.comm.comm[0] || !ev.comm.pid) {
37 if (fgets(bf, sizeof(bf), fp) == NULL)
38 goto out_failure;
40 if (memcmp(bf, "Name:", 5) == 0) {
41 char *name = bf + 5;
42 while (*name && isspace(*name))
43 ++name;
44 size = strlen(name) - 1;
45 memcpy(ev.comm.comm, name, size++);
46 } else if (memcmp(bf, "Tgid:", 5) == 0) {
47 char *tgids = bf + 5;
48 while (*tgids && isspace(*tgids))
49 ++tgids;
50 tgid = ev.comm.pid = atoi(tgids);
54 ev.comm.header.type = PERF_RECORD_COMM;
55 size = ALIGN(size, sizeof(u64));
56 ev.comm.header.size = sizeof(ev.comm) - (sizeof(ev.comm.comm) - size);
58 if (!full) {
59 ev.comm.tid = pid;
61 process(&ev, session);
62 goto out_fclose;
65 snprintf(filename, sizeof(filename), "/proc/%d/task", pid);
67 tasks = opendir(filename);
68 if (tasks == NULL)
69 goto out_race;
71 while (!readdir_r(tasks, &dirent, &next) && next) {
72 char *end;
73 pid = strtol(dirent.d_name, &end, 10);
74 if (*end)
75 continue;
77 ev.comm.tid = pid;
79 process(&ev, session);
81 closedir(tasks);
83 out_fclose:
84 fclose(fp);
85 return tgid;
87 out_failure:
88 pr_warning("couldn't get COMM and pgid, malformed %s\n", filename);
89 return -1;
92 static int event__synthesize_mmap_events(pid_t pid, pid_t tgid,
93 event__handler_t process,
94 struct perf_session *session)
96 char filename[PATH_MAX];
97 FILE *fp;
99 snprintf(filename, sizeof(filename), "/proc/%d/maps", pid);
101 fp = fopen(filename, "r");
102 if (fp == NULL) {
104 * We raced with a task exiting - just return:
106 pr_debug("couldn't open %s\n", filename);
107 return -1;
110 while (1) {
111 char bf[BUFSIZ], *pbf = bf;
112 event_t ev = {
113 .header = { .type = PERF_RECORD_MMAP },
115 int n;
116 size_t size;
117 if (fgets(bf, sizeof(bf), fp) == NULL)
118 break;
120 /* 00400000-0040c000 r-xp 00000000 fd:01 41038 /bin/cat */
121 n = hex2u64(pbf, &ev.mmap.start);
122 if (n < 0)
123 continue;
124 pbf += n + 1;
125 n = hex2u64(pbf, &ev.mmap.len);
126 if (n < 0)
127 continue;
128 pbf += n + 3;
129 if (*pbf == 'x') { /* vm_exec */
130 char *execname = strchr(bf, '/');
132 /* Catch VDSO */
133 if (execname == NULL)
134 execname = strstr(bf, "[vdso]");
136 if (execname == NULL)
137 continue;
139 size = strlen(execname);
140 execname[size - 1] = '\0'; /* Remove \n */
141 memcpy(ev.mmap.filename, execname, size);
142 size = ALIGN(size, sizeof(u64));
143 ev.mmap.len -= ev.mmap.start;
144 ev.mmap.header.size = (sizeof(ev.mmap) -
145 (sizeof(ev.mmap.filename) - size));
146 ev.mmap.pid = tgid;
147 ev.mmap.tid = pid;
149 process(&ev, session);
153 fclose(fp);
154 return 0;
157 int event__synthesize_modules(event__handler_t process,
158 struct perf_session *session)
160 struct rb_node *nd;
162 for (nd = rb_first(&session->kmaps.maps[MAP__FUNCTION]);
163 nd; nd = rb_next(nd)) {
164 event_t ev;
165 size_t size;
166 struct map *pos = rb_entry(nd, struct map, rb_node);
168 if (pos->dso->kernel)
169 continue;
171 size = ALIGN(pos->dso->long_name_len + 1, sizeof(u64));
172 memset(&ev, 0, sizeof(ev));
173 ev.mmap.header.type = PERF_RECORD_MMAP;
174 ev.mmap.header.size = (sizeof(ev.mmap) -
175 (sizeof(ev.mmap.filename) - size));
176 ev.mmap.start = pos->start;
177 ev.mmap.len = pos->end - pos->start;
179 memcpy(ev.mmap.filename, pos->dso->long_name,
180 pos->dso->long_name_len + 1);
181 process(&ev, session);
184 return 0;
187 int event__synthesize_thread(pid_t pid, event__handler_t process,
188 struct perf_session *session)
190 pid_t tgid = event__synthesize_comm(pid, 1, process, session);
191 if (tgid == -1)
192 return -1;
193 return event__synthesize_mmap_events(pid, tgid, process, session);
196 void event__synthesize_threads(event__handler_t process,
197 struct perf_session *session)
199 DIR *proc;
200 struct dirent dirent, *next;
202 proc = opendir("/proc");
204 while (!readdir_r(proc, &dirent, &next) && next) {
205 char *end;
206 pid_t pid = strtol(dirent.d_name, &end, 10);
208 if (*end) /* only interested in proper numerical dirents */
209 continue;
211 event__synthesize_thread(pid, process, session);
214 closedir(proc);
217 struct process_symbol_args {
218 const char *name;
219 u64 start;
222 static int find_symbol_cb(void *arg, const char *name, char type, u64 start)
224 struct process_symbol_args *args = arg;
226 if (!symbol_type__is_a(type, MAP__FUNCTION) || strcmp(name, args->name))
227 return 0;
229 args->start = start;
230 return 1;
233 int event__synthesize_kernel_mmap(event__handler_t process,
234 struct perf_session *session,
235 const char *symbol_name)
237 size_t size;
238 event_t ev = {
239 .header = { .type = PERF_RECORD_MMAP },
242 * We should get this from /sys/kernel/sections/.text, but till that is
243 * available use this, and after it is use this as a fallback for older
244 * kernels.
246 struct process_symbol_args args = { .name = symbol_name, };
248 if (kallsyms__parse(&args, find_symbol_cb) <= 0)
249 return -ENOENT;
251 size = snprintf(ev.mmap.filename, sizeof(ev.mmap.filename),
252 "[kernel.kallsyms.%s]", symbol_name) + 1;
253 size = ALIGN(size, sizeof(u64));
254 ev.mmap.header.size = (sizeof(ev.mmap) - (sizeof(ev.mmap.filename) - size));
255 ev.mmap.pgoff = args.start;
256 ev.mmap.start = session->vmlinux_maps[MAP__FUNCTION]->start;
257 ev.mmap.len = session->vmlinux_maps[MAP__FUNCTION]->end - ev.mmap.start ;
259 return process(&ev, session);
262 static void thread__comm_adjust(struct thread *self)
264 char *comm = self->comm;
266 if (!symbol_conf.col_width_list_str && !symbol_conf.field_sep &&
267 (!symbol_conf.comm_list ||
268 strlist__has_entry(symbol_conf.comm_list, comm))) {
269 unsigned int slen = strlen(comm);
271 if (slen > comms__col_width) {
272 comms__col_width = slen;
273 threads__col_width = slen + 6;
/*
 * Set the thread's comm and, if that succeeded, update the column widths.
 *
 * Returns 0 on success or the non-zero value returned by thread__set_comm().
 */
static int thread__set_comm_adjust(struct thread *self, const char *comm)
{
	int err = thread__set_comm(self, comm);

	if (err == 0)
		thread__comm_adjust(self);

	return err;
}
290 int event__process_comm(event_t *self, struct perf_session *session)
292 struct thread *thread = perf_session__findnew(session, self->comm.pid);
294 dump_printf(": %s:%d\n", self->comm.comm, self->comm.pid);
296 if (thread == NULL || thread__set_comm_adjust(thread, self->comm.comm)) {
297 dump_printf("problem processing PERF_RECORD_COMM, skipping event.\n");
298 return -1;
301 return 0;
304 int event__process_lost(event_t *self, struct perf_session *session)
306 dump_printf(": id:%Ld: lost:%Ld\n", self->lost.id, self->lost.lost);
307 session->events_stats.lost += self->lost.lost;
308 return 0;
311 int event__process_mmap(event_t *self, struct perf_session *session)
313 struct thread *thread;
314 struct map *map;
316 dump_printf(" %d/%d: [%p(%p) @ %p]: %s\n",
317 self->mmap.pid, self->mmap.tid,
318 (void *)(long)self->mmap.start,
319 (void *)(long)self->mmap.len,
320 (void *)(long)self->mmap.pgoff,
321 self->mmap.filename);
323 if (self->mmap.pid == 0) {
324 static const char kmmap_prefix[] = "[kernel.kallsyms.";
326 if (self->mmap.filename[0] == '/') {
327 char short_module_name[1024];
328 char *name = strrchr(self->mmap.filename, '/'), *dot;
330 if (name == NULL)
331 goto out_problem;
333 ++name; /* skip / */
334 dot = strrchr(name, '.');
335 if (dot == NULL)
336 goto out_problem;
338 snprintf(short_module_name, sizeof(short_module_name),
339 "[%.*s]", (int)(dot - name), name);
340 strxfrchar(short_module_name, '-', '_');
342 map = perf_session__new_module_map(session,
343 self->mmap.start,
344 short_module_name);
345 if (map == NULL)
346 goto out_problem;
348 name = strdup(self->mmap.filename);
349 if (name == NULL)
350 goto out_problem;
352 dso__set_long_name(map->dso, name);
353 map->end = map->start + self->mmap.len;
354 } else if (memcmp(self->mmap.filename, kmmap_prefix,
355 sizeof(kmmap_prefix) - 1) == 0) {
356 const char *symbol_name = (self->mmap.filename +
357 sizeof(kmmap_prefix) - 1);
359 * Should be there already, from the build-id table in
360 * the header.
362 struct dso *kernel = __dsos__findnew(&dsos__kernel,
363 "[kernel.kallsyms]");
364 if (kernel == NULL)
365 goto out_problem;
367 if (__map_groups__create_kernel_maps(&session->kmaps,
368 session->vmlinux_maps,
369 kernel) < 0)
370 goto out_problem;
372 session->vmlinux_maps[MAP__FUNCTION]->start = self->mmap.start;
373 session->vmlinux_maps[MAP__FUNCTION]->end = self->mmap.start + self->mmap.len;
375 perf_session__set_kallsyms_ref_reloc_sym(session, symbol_name,
376 self->mmap.pgoff);
378 return 0;
381 thread = perf_session__findnew(session, self->mmap.pid);
382 map = map__new(&self->mmap, MAP__FUNCTION,
383 session->cwd, session->cwdlen);
385 if (thread == NULL || map == NULL)
386 goto out_problem;
388 thread__insert_map(thread, map);
389 return 0;
391 out_problem:
392 dump_printf("problem processing PERF_RECORD_MMAP, skipping event.\n");
393 return 0;
396 int event__process_task(event_t *self, struct perf_session *session)
398 struct thread *thread = perf_session__findnew(session, self->fork.pid);
399 struct thread *parent = perf_session__findnew(session, self->fork.ppid);
401 dump_printf("(%d:%d):(%d:%d)\n", self->fork.pid, self->fork.tid,
402 self->fork.ppid, self->fork.ptid);
404 * A thread clone will have the same PID for both parent and child.
406 if (thread == parent)
407 return 0;
409 if (self->header.type == PERF_RECORD_EXIT)
410 return 0;
412 if (thread == NULL || parent == NULL ||
413 thread__fork(thread, parent) < 0) {
414 dump_printf("problem processing PERF_RECORD_FORK, skipping event.\n");
415 return -1;
418 return 0;
421 void thread__find_addr_location(struct thread *self,
422 struct perf_session *session, u8 cpumode,
423 enum map_type type, u64 addr,
424 struct addr_location *al,
425 symbol_filter_t filter)
427 struct map_groups *mg = &self->mg;
429 al->thread = self;
430 al->addr = addr;
432 if (cpumode & PERF_RECORD_MISC_KERNEL) {
433 al->level = 'k';
434 mg = &session->kmaps;
435 } else if (cpumode & PERF_RECORD_MISC_USER)
436 al->level = '.';
437 else {
438 al->level = 'H';
439 al->map = NULL;
440 al->sym = NULL;
441 return;
443 try_again:
444 al->map = map_groups__find(mg, type, al->addr);
445 if (al->map == NULL) {
447 * If this is outside of all known maps, and is a negative
448 * address, try to look it up in the kernel dso, as it might be
449 * a vsyscall or vdso (which executes in user-mode).
451 * XXX This is nasty, we should have a symbol list in the
452 * "[vdso]" dso, but for now lets use the old trick of looking
453 * in the whole kernel symbol list.
455 if ((long long)al->addr < 0 && mg != &session->kmaps) {
456 mg = &session->kmaps;
457 goto try_again;
459 al->sym = NULL;
460 } else {
461 al->addr = al->map->map_ip(al->map, al->addr);
462 al->sym = map__find_symbol(al->map, session, al->addr, filter);
466 static void dso__calc_col_width(struct dso *self)
468 if (!symbol_conf.col_width_list_str && !symbol_conf.field_sep &&
469 (!symbol_conf.dso_list ||
470 strlist__has_entry(symbol_conf.dso_list, self->name))) {
471 unsigned int slen = strlen(self->name);
472 if (slen > dsos__col_width)
473 dsos__col_width = slen;
476 self->slen_calculated = 1;
479 int event__preprocess_sample(const event_t *self, struct perf_session *session,
480 struct addr_location *al, symbol_filter_t filter)
482 u8 cpumode = self->header.misc & PERF_RECORD_MISC_CPUMODE_MASK;
483 struct thread *thread = perf_session__findnew(session, self->ip.pid);
485 if (thread == NULL)
486 return -1;
488 if (symbol_conf.comm_list &&
489 !strlist__has_entry(symbol_conf.comm_list, thread->comm))
490 goto out_filtered;
492 dump_printf(" ... thread: %s:%d\n", thread->comm, thread->pid);
494 thread__find_addr_location(thread, session, cpumode, MAP__FUNCTION,
495 self->ip.ip, al, filter);
496 dump_printf(" ...... dso: %s\n",
497 al->map ? al->map->dso->long_name :
498 al->level == 'H' ? "[hypervisor]" : "<not found>");
500 * We have to do this here as we may have a dso with no symbol hit that
501 * has a name longer than the ones with symbols sampled.
503 if (al->map && !sort_dso.elide && !al->map->dso->slen_calculated)
504 dso__calc_col_width(al->map->dso);
506 if (symbol_conf.dso_list &&
507 (!al->map || !al->map->dso ||
508 !(strlist__has_entry(symbol_conf.dso_list, al->map->dso->short_name) ||
509 (al->map->dso->short_name != al->map->dso->long_name &&
510 strlist__has_entry(symbol_conf.dso_list, al->map->dso->long_name)))))
511 goto out_filtered;
513 if (symbol_conf.sym_list && al->sym &&
514 !strlist__has_entry(symbol_conf.sym_list, al->sym->name))
515 goto out_filtered;
517 al->filtered = false;
518 return 0;
520 out_filtered:
521 al->filtered = true;
522 return 0;
525 int event__parse_sample(event_t *event, u64 type, struct sample_data *data)
527 u64 *array = event->sample.array;
529 if (type & PERF_SAMPLE_IP) {
530 data->ip = event->ip.ip;
531 array++;
534 if (type & PERF_SAMPLE_TID) {
535 u32 *p = (u32 *)array;
536 data->pid = p[0];
537 data->tid = p[1];
538 array++;
541 if (type & PERF_SAMPLE_TIME) {
542 data->time = *array;
543 array++;
546 if (type & PERF_SAMPLE_ADDR) {
547 data->addr = *array;
548 array++;
551 if (type & PERF_SAMPLE_ID) {
552 data->id = *array;
553 array++;
556 if (type & PERF_SAMPLE_STREAM_ID) {
557 data->stream_id = *array;
558 array++;
561 if (type & PERF_SAMPLE_CPU) {
562 u32 *p = (u32 *)array;
563 data->cpu = *p;
564 array++;
567 if (type & PERF_SAMPLE_PERIOD) {
568 data->period = *array;
569 array++;
572 if (type & PERF_SAMPLE_READ) {
573 pr_debug("PERF_SAMPLE_READ is unsuported for now\n");
574 return -1;
577 if (type & PERF_SAMPLE_CALLCHAIN) {
578 data->callchain = (struct ip_callchain *)array;
579 array += 1 + data->callchain->nr;
582 if (type & PERF_SAMPLE_RAW) {
583 u32 *p = (u32 *)array;
584 data->raw_size = *p;
585 p++;
586 data->raw_data = p;
589 return 0;