x86, numa: Fake node-to-cpumask for NUMA emulation
[linux-2.6/libata-dev.git] / kernel / trace / trace_events.c
blob0725eeab1937ef24a301f2c0b0404f64ce95e026
1 /*
2 * event tracer
4 * Copyright (C) 2008 Red Hat Inc, Steven Rostedt <srostedt@redhat.com>
6 * - Added format output of fields of the trace point.
7 * This was based off of work by Tom Zanussi <tzanussi@gmail.com>.
9 */
11 #include <linux/workqueue.h>
12 #include <linux/spinlock.h>
13 #include <linux/kthread.h>
14 #include <linux/debugfs.h>
15 #include <linux/uaccess.h>
16 #include <linux/module.h>
17 #include <linux/ctype.h>
18 #include <linux/slab.h>
19 #include <linux/delay.h>
21 #include <asm/setup.h>
23 #include "trace_output.h"
25 #undef TRACE_SYSTEM
26 #define TRACE_SYSTEM "TRACE_SYSTEM"
28 DEFINE_MUTEX(event_mutex);
30 LIST_HEAD(ftrace_events);
31 LIST_HEAD(ftrace_common_fields);
33 struct list_head *
34 trace_get_fields(struct ftrace_event_call *event_call)
36 if (!event_call->class->get_fields)
37 return &event_call->class->fields;
38 return event_call->class->get_fields(event_call);
41 static int __trace_define_field(struct list_head *head, const char *type,
42 const char *name, int offset, int size,
43 int is_signed, int filter_type)
45 struct ftrace_event_field *field;
47 field = kzalloc(sizeof(*field), GFP_KERNEL);
48 if (!field)
49 goto err;
51 field->name = kstrdup(name, GFP_KERNEL);
52 if (!field->name)
53 goto err;
55 field->type = kstrdup(type, GFP_KERNEL);
56 if (!field->type)
57 goto err;
59 if (filter_type == FILTER_OTHER)
60 field->filter_type = filter_assign_type(type);
61 else
62 field->filter_type = filter_type;
64 field->offset = offset;
65 field->size = size;
66 field->is_signed = is_signed;
68 list_add(&field->link, head);
70 return 0;
72 err:
73 if (field)
74 kfree(field->name);
75 kfree(field);
77 return -ENOMEM;
80 int trace_define_field(struct ftrace_event_call *call, const char *type,
81 const char *name, int offset, int size, int is_signed,
82 int filter_type)
84 struct list_head *head;
86 if (WARN_ON(!call->class))
87 return 0;
89 head = trace_get_fields(call);
90 return __trace_define_field(head, type, name, offset, size,
91 is_signed, filter_type);
93 EXPORT_SYMBOL_GPL(trace_define_field);
95 #define __common_field(type, item) \
96 ret = __trace_define_field(&ftrace_common_fields, #type, \
97 "common_" #item, \
98 offsetof(typeof(ent), item), \
99 sizeof(ent.item), \
100 is_signed_type(type), FILTER_OTHER); \
101 if (ret) \
102 return ret;
104 static int trace_define_common_fields(void)
106 int ret;
107 struct trace_entry ent;
109 __common_field(unsigned short, type);
110 __common_field(unsigned char, flags);
111 __common_field(unsigned char, preempt_count);
112 __common_field(int, pid);
113 __common_field(int, lock_depth);
115 return ret;
118 void trace_destroy_fields(struct ftrace_event_call *call)
120 struct ftrace_event_field *field, *next;
121 struct list_head *head;
123 head = trace_get_fields(call);
124 list_for_each_entry_safe(field, next, head, link) {
125 list_del(&field->link);
126 kfree(field->type);
127 kfree(field->name);
128 kfree(field);
132 int trace_event_raw_init(struct ftrace_event_call *call)
134 int id;
136 id = register_ftrace_event(&call->event);
137 if (!id)
138 return -ENODEV;
140 return 0;
142 EXPORT_SYMBOL_GPL(trace_event_raw_init);
144 int ftrace_event_reg(struct ftrace_event_call *call, enum trace_reg type)
146 switch (type) {
147 case TRACE_REG_REGISTER:
148 return tracepoint_probe_register(call->name,
149 call->class->probe,
150 call);
151 case TRACE_REG_UNREGISTER:
152 tracepoint_probe_unregister(call->name,
153 call->class->probe,
154 call);
155 return 0;
157 #ifdef CONFIG_PERF_EVENTS
158 case TRACE_REG_PERF_REGISTER:
159 return tracepoint_probe_register(call->name,
160 call->class->perf_probe,
161 call);
162 case TRACE_REG_PERF_UNREGISTER:
163 tracepoint_probe_unregister(call->name,
164 call->class->perf_probe,
165 call);
166 return 0;
167 #endif
169 return 0;
171 EXPORT_SYMBOL_GPL(ftrace_event_reg);
173 void trace_event_enable_cmd_record(bool enable)
175 struct ftrace_event_call *call;
177 mutex_lock(&event_mutex);
178 list_for_each_entry(call, &ftrace_events, list) {
179 if (!(call->flags & TRACE_EVENT_FL_ENABLED))
180 continue;
182 if (enable) {
183 tracing_start_cmdline_record();
184 call->flags |= TRACE_EVENT_FL_RECORDED_CMD;
185 } else {
186 tracing_stop_cmdline_record();
187 call->flags &= ~TRACE_EVENT_FL_RECORDED_CMD;
190 mutex_unlock(&event_mutex);
193 static int ftrace_event_enable_disable(struct ftrace_event_call *call,
194 int enable)
196 int ret = 0;
198 switch (enable) {
199 case 0:
200 if (call->flags & TRACE_EVENT_FL_ENABLED) {
201 call->flags &= ~TRACE_EVENT_FL_ENABLED;
202 if (call->flags & TRACE_EVENT_FL_RECORDED_CMD) {
203 tracing_stop_cmdline_record();
204 call->flags &= ~TRACE_EVENT_FL_RECORDED_CMD;
206 call->class->reg(call, TRACE_REG_UNREGISTER);
208 break;
209 case 1:
210 if (!(call->flags & TRACE_EVENT_FL_ENABLED)) {
211 if (trace_flags & TRACE_ITER_RECORD_CMD) {
212 tracing_start_cmdline_record();
213 call->flags |= TRACE_EVENT_FL_RECORDED_CMD;
215 ret = call->class->reg(call, TRACE_REG_REGISTER);
216 if (ret) {
217 tracing_stop_cmdline_record();
218 pr_info("event trace: Could not enable event "
219 "%s\n", call->name);
220 break;
222 call->flags |= TRACE_EVENT_FL_ENABLED;
224 break;
227 return ret;
230 static void ftrace_clear_events(void)
232 struct ftrace_event_call *call;
234 mutex_lock(&event_mutex);
235 list_for_each_entry(call, &ftrace_events, list) {
236 ftrace_event_enable_disable(call, 0);
238 mutex_unlock(&event_mutex);
242 * __ftrace_set_clr_event(NULL, NULL, NULL, set) will set/unset all events.
244 static int __ftrace_set_clr_event(const char *match, const char *sub,
245 const char *event, int set)
247 struct ftrace_event_call *call;
248 int ret = -EINVAL;
250 mutex_lock(&event_mutex);
251 list_for_each_entry(call, &ftrace_events, list) {
253 if (!call->name || !call->class || !call->class->reg)
254 continue;
256 if (match &&
257 strcmp(match, call->name) != 0 &&
258 strcmp(match, call->class->system) != 0)
259 continue;
261 if (sub && strcmp(sub, call->class->system) != 0)
262 continue;
264 if (event && strcmp(event, call->name) != 0)
265 continue;
267 ftrace_event_enable_disable(call, set);
269 ret = 0;
271 mutex_unlock(&event_mutex);
273 return ret;
276 static int ftrace_set_clr_event(char *buf, int set)
278 char *event = NULL, *sub = NULL, *match;
281 * The buf format can be <subsystem>:<event-name>
282 * *:<event-name> means any event by that name.
283 * :<event-name> is the same.
285 * <subsystem>:* means all events in that subsystem
286 * <subsystem>: means the same.
288 * <name> (no ':') means all events in a subsystem with
289 * the name <name> or any event that matches <name>
292 match = strsep(&buf, ":");
293 if (buf) {
294 sub = match;
295 event = buf;
296 match = NULL;
298 if (!strlen(sub) || strcmp(sub, "*") == 0)
299 sub = NULL;
300 if (!strlen(event) || strcmp(event, "*") == 0)
301 event = NULL;
304 return __ftrace_set_clr_event(match, sub, event, set);
308 * trace_set_clr_event - enable or disable an event
309 * @system: system name to match (NULL for any system)
310 * @event: event name to match (NULL for all events, within system)
311 * @set: 1 to enable, 0 to disable
313 * This is a way for other parts of the kernel to enable or disable
314 * event recording.
316 * Returns 0 on success, -EINVAL if the parameters do not match any
317 * registered events.
319 int trace_set_clr_event(const char *system, const char *event, int set)
321 return __ftrace_set_clr_event(NULL, system, event, set);
324 /* 128 should be much more than enough */
325 #define EVENT_BUF_SIZE 127
327 static ssize_t
328 ftrace_event_write(struct file *file, const char __user *ubuf,
329 size_t cnt, loff_t *ppos)
331 struct trace_parser parser;
332 ssize_t read, ret;
334 if (!cnt)
335 return 0;
337 ret = tracing_update_buffers();
338 if (ret < 0)
339 return ret;
341 if (trace_parser_get_init(&parser, EVENT_BUF_SIZE + 1))
342 return -ENOMEM;
344 read = trace_get_user(&parser, ubuf, cnt, ppos);
346 if (read >= 0 && trace_parser_loaded((&parser))) {
347 int set = 1;
349 if (*parser.buffer == '!')
350 set = 0;
352 parser.buffer[parser.idx] = 0;
354 ret = ftrace_set_clr_event(parser.buffer + !set, set);
355 if (ret)
356 goto out_put;
359 ret = read;
361 out_put:
362 trace_parser_put(&parser);
364 return ret;
367 static void *
368 t_next(struct seq_file *m, void *v, loff_t *pos)
370 struct ftrace_event_call *call = v;
372 (*pos)++;
374 list_for_each_entry_continue(call, &ftrace_events, list) {
376 * The ftrace subsystem is for showing formats only.
377 * They can not be enabled or disabled via the event files.
379 if (call->class && call->class->reg)
380 return call;
383 return NULL;
386 static void *t_start(struct seq_file *m, loff_t *pos)
388 struct ftrace_event_call *call;
389 loff_t l;
391 mutex_lock(&event_mutex);
393 call = list_entry(&ftrace_events, struct ftrace_event_call, list);
394 for (l = 0; l <= *pos; ) {
395 call = t_next(m, call, &l);
396 if (!call)
397 break;
399 return call;
402 static void *
403 s_next(struct seq_file *m, void *v, loff_t *pos)
405 struct ftrace_event_call *call = v;
407 (*pos)++;
409 list_for_each_entry_continue(call, &ftrace_events, list) {
410 if (call->flags & TRACE_EVENT_FL_ENABLED)
411 return call;
414 return NULL;
417 static void *s_start(struct seq_file *m, loff_t *pos)
419 struct ftrace_event_call *call;
420 loff_t l;
422 mutex_lock(&event_mutex);
424 call = list_entry(&ftrace_events, struct ftrace_event_call, list);
425 for (l = 0; l <= *pos; ) {
426 call = s_next(m, call, &l);
427 if (!call)
428 break;
430 return call;
433 static int t_show(struct seq_file *m, void *v)
435 struct ftrace_event_call *call = v;
437 if (strcmp(call->class->system, TRACE_SYSTEM) != 0)
438 seq_printf(m, "%s:", call->class->system);
439 seq_printf(m, "%s\n", call->name);
441 return 0;
444 static void t_stop(struct seq_file *m, void *p)
446 mutex_unlock(&event_mutex);
449 static int
450 ftrace_event_seq_open(struct inode *inode, struct file *file)
452 const struct seq_operations *seq_ops;
454 if ((file->f_mode & FMODE_WRITE) &&
455 (file->f_flags & O_TRUNC))
456 ftrace_clear_events();
458 seq_ops = inode->i_private;
459 return seq_open(file, seq_ops);
462 static ssize_t
463 event_enable_read(struct file *filp, char __user *ubuf, size_t cnt,
464 loff_t *ppos)
466 struct ftrace_event_call *call = filp->private_data;
467 char *buf;
469 if (call->flags & TRACE_EVENT_FL_ENABLED)
470 buf = "1\n";
471 else
472 buf = "0\n";
474 return simple_read_from_buffer(ubuf, cnt, ppos, buf, 2);
477 static ssize_t
478 event_enable_write(struct file *filp, const char __user *ubuf, size_t cnt,
479 loff_t *ppos)
481 struct ftrace_event_call *call = filp->private_data;
482 char buf[64];
483 unsigned long val;
484 int ret;
486 if (cnt >= sizeof(buf))
487 return -EINVAL;
489 if (copy_from_user(&buf, ubuf, cnt))
490 return -EFAULT;
492 buf[cnt] = 0;
494 ret = strict_strtoul(buf, 10, &val);
495 if (ret < 0)
496 return ret;
498 ret = tracing_update_buffers();
499 if (ret < 0)
500 return ret;
502 switch (val) {
503 case 0:
504 case 1:
505 mutex_lock(&event_mutex);
506 ret = ftrace_event_enable_disable(call, val);
507 mutex_unlock(&event_mutex);
508 break;
510 default:
511 return -EINVAL;
514 *ppos += cnt;
516 return ret ? ret : cnt;
519 static ssize_t
520 system_enable_read(struct file *filp, char __user *ubuf, size_t cnt,
521 loff_t *ppos)
523 const char set_to_char[4] = { '?', '0', '1', 'X' };
524 const char *system = filp->private_data;
525 struct ftrace_event_call *call;
526 char buf[2];
527 int set = 0;
528 int ret;
530 mutex_lock(&event_mutex);
531 list_for_each_entry(call, &ftrace_events, list) {
532 if (!call->name || !call->class || !call->class->reg)
533 continue;
535 if (system && strcmp(call->class->system, system) != 0)
536 continue;
539 * We need to find out if all the events are set
540 * or if all events or cleared, or if we have
541 * a mixture.
543 set |= (1 << !!(call->flags & TRACE_EVENT_FL_ENABLED));
546 * If we have a mixture, no need to look further.
548 if (set == 3)
549 break;
551 mutex_unlock(&event_mutex);
553 buf[0] = set_to_char[set];
554 buf[1] = '\n';
556 ret = simple_read_from_buffer(ubuf, cnt, ppos, buf, 2);
558 return ret;
561 static ssize_t
562 system_enable_write(struct file *filp, const char __user *ubuf, size_t cnt,
563 loff_t *ppos)
565 const char *system = filp->private_data;
566 unsigned long val;
567 char buf[64];
568 ssize_t ret;
570 if (cnt >= sizeof(buf))
571 return -EINVAL;
573 if (copy_from_user(&buf, ubuf, cnt))
574 return -EFAULT;
576 buf[cnt] = 0;
578 ret = strict_strtoul(buf, 10, &val);
579 if (ret < 0)
580 return ret;
582 ret = tracing_update_buffers();
583 if (ret < 0)
584 return ret;
586 if (val != 0 && val != 1)
587 return -EINVAL;
589 ret = __ftrace_set_clr_event(NULL, system, NULL, val);
590 if (ret)
591 goto out;
593 ret = cnt;
595 out:
596 *ppos += cnt;
598 return ret;
601 enum {
602 FORMAT_HEADER = 1,
603 FORMAT_FIELD_SEPERATOR = 2,
604 FORMAT_PRINTFMT = 3,
607 static void *f_next(struct seq_file *m, void *v, loff_t *pos)
609 struct ftrace_event_call *call = m->private;
610 struct ftrace_event_field *field;
611 struct list_head *common_head = &ftrace_common_fields;
612 struct list_head *head = trace_get_fields(call);
614 (*pos)++;
616 switch ((unsigned long)v) {
617 case FORMAT_HEADER:
618 if (unlikely(list_empty(common_head)))
619 return NULL;
621 field = list_entry(common_head->prev,
622 struct ftrace_event_field, link);
623 return field;
625 case FORMAT_FIELD_SEPERATOR:
626 if (unlikely(list_empty(head)))
627 return NULL;
629 field = list_entry(head->prev, struct ftrace_event_field, link);
630 return field;
632 case FORMAT_PRINTFMT:
633 /* all done */
634 return NULL;
637 field = v;
638 if (field->link.prev == common_head)
639 return (void *)FORMAT_FIELD_SEPERATOR;
640 else if (field->link.prev == head)
641 return (void *)FORMAT_PRINTFMT;
643 field = list_entry(field->link.prev, struct ftrace_event_field, link);
645 return field;
648 static void *f_start(struct seq_file *m, loff_t *pos)
650 loff_t l = 0;
651 void *p;
653 /* Start by showing the header */
654 if (!*pos)
655 return (void *)FORMAT_HEADER;
657 p = (void *)FORMAT_HEADER;
658 do {
659 p = f_next(m, p, &l);
660 } while (p && l < *pos);
662 return p;
665 static int f_show(struct seq_file *m, void *v)
667 struct ftrace_event_call *call = m->private;
668 struct ftrace_event_field *field;
669 const char *array_descriptor;
671 switch ((unsigned long)v) {
672 case FORMAT_HEADER:
673 seq_printf(m, "name: %s\n", call->name);
674 seq_printf(m, "ID: %d\n", call->event.type);
675 seq_printf(m, "format:\n");
676 return 0;
678 case FORMAT_FIELD_SEPERATOR:
679 seq_putc(m, '\n');
680 return 0;
682 case FORMAT_PRINTFMT:
683 seq_printf(m, "\nprint fmt: %s\n",
684 call->print_fmt);
685 return 0;
688 field = v;
691 * Smartly shows the array type(except dynamic array).
692 * Normal:
693 * field:TYPE VAR
694 * If TYPE := TYPE[LEN], it is shown:
695 * field:TYPE VAR[LEN]
697 array_descriptor = strchr(field->type, '[');
699 if (!strncmp(field->type, "__data_loc", 10))
700 array_descriptor = NULL;
702 if (!array_descriptor)
703 seq_printf(m, "\tfield:%s %s;\toffset:%u;\tsize:%u;\tsigned:%d;\n",
704 field->type, field->name, field->offset,
705 field->size, !!field->is_signed);
706 else
707 seq_printf(m, "\tfield:%.*s %s%s;\toffset:%u;\tsize:%u;\tsigned:%d;\n",
708 (int)(array_descriptor - field->type),
709 field->type, field->name,
710 array_descriptor, field->offset,
711 field->size, !!field->is_signed);
713 return 0;
716 static void f_stop(struct seq_file *m, void *p)
720 static const struct seq_operations trace_format_seq_ops = {
721 .start = f_start,
722 .next = f_next,
723 .stop = f_stop,
724 .show = f_show,
727 static int trace_format_open(struct inode *inode, struct file *file)
729 struct ftrace_event_call *call = inode->i_private;
730 struct seq_file *m;
731 int ret;
733 ret = seq_open(file, &trace_format_seq_ops);
734 if (ret < 0)
735 return ret;
737 m = file->private_data;
738 m->private = call;
740 return 0;
743 static ssize_t
744 event_id_read(struct file *filp, char __user *ubuf, size_t cnt, loff_t *ppos)
746 struct ftrace_event_call *call = filp->private_data;
747 struct trace_seq *s;
748 int r;
750 if (*ppos)
751 return 0;
753 s = kmalloc(sizeof(*s), GFP_KERNEL);
754 if (!s)
755 return -ENOMEM;
757 trace_seq_init(s);
758 trace_seq_printf(s, "%d\n", call->event.type);
760 r = simple_read_from_buffer(ubuf, cnt, ppos,
761 s->buffer, s->len);
762 kfree(s);
763 return r;
766 static ssize_t
767 event_filter_read(struct file *filp, char __user *ubuf, size_t cnt,
768 loff_t *ppos)
770 struct ftrace_event_call *call = filp->private_data;
771 struct trace_seq *s;
772 int r;
774 if (*ppos)
775 return 0;
777 s = kmalloc(sizeof(*s), GFP_KERNEL);
778 if (!s)
779 return -ENOMEM;
781 trace_seq_init(s);
783 print_event_filter(call, s);
784 r = simple_read_from_buffer(ubuf, cnt, ppos, s->buffer, s->len);
786 kfree(s);
788 return r;
791 static ssize_t
792 event_filter_write(struct file *filp, const char __user *ubuf, size_t cnt,
793 loff_t *ppos)
795 struct ftrace_event_call *call = filp->private_data;
796 char *buf;
797 int err;
799 if (cnt >= PAGE_SIZE)
800 return -EINVAL;
802 buf = (char *)__get_free_page(GFP_TEMPORARY);
803 if (!buf)
804 return -ENOMEM;
806 if (copy_from_user(buf, ubuf, cnt)) {
807 free_page((unsigned long) buf);
808 return -EFAULT;
810 buf[cnt] = '\0';
812 err = apply_event_filter(call, buf);
813 free_page((unsigned long) buf);
814 if (err < 0)
815 return err;
817 *ppos += cnt;
819 return cnt;
822 static ssize_t
823 subsystem_filter_read(struct file *filp, char __user *ubuf, size_t cnt,
824 loff_t *ppos)
826 struct event_subsystem *system = filp->private_data;
827 struct trace_seq *s;
828 int r;
830 if (*ppos)
831 return 0;
833 s = kmalloc(sizeof(*s), GFP_KERNEL);
834 if (!s)
835 return -ENOMEM;
837 trace_seq_init(s);
839 print_subsystem_event_filter(system, s);
840 r = simple_read_from_buffer(ubuf, cnt, ppos, s->buffer, s->len);
842 kfree(s);
844 return r;
847 static ssize_t
848 subsystem_filter_write(struct file *filp, const char __user *ubuf, size_t cnt,
849 loff_t *ppos)
851 struct event_subsystem *system = filp->private_data;
852 char *buf;
853 int err;
855 if (cnt >= PAGE_SIZE)
856 return -EINVAL;
858 buf = (char *)__get_free_page(GFP_TEMPORARY);
859 if (!buf)
860 return -ENOMEM;
862 if (copy_from_user(buf, ubuf, cnt)) {
863 free_page((unsigned long) buf);
864 return -EFAULT;
866 buf[cnt] = '\0';
868 err = apply_subsystem_event_filter(system, buf);
869 free_page((unsigned long) buf);
870 if (err < 0)
871 return err;
873 *ppos += cnt;
875 return cnt;
878 static ssize_t
879 show_header(struct file *filp, char __user *ubuf, size_t cnt, loff_t *ppos)
881 int (*func)(struct trace_seq *s) = filp->private_data;
882 struct trace_seq *s;
883 int r;
885 if (*ppos)
886 return 0;
888 s = kmalloc(sizeof(*s), GFP_KERNEL);
889 if (!s)
890 return -ENOMEM;
892 trace_seq_init(s);
894 func(s);
895 r = simple_read_from_buffer(ubuf, cnt, ppos, s->buffer, s->len);
897 kfree(s);
899 return r;
902 static const struct seq_operations show_event_seq_ops = {
903 .start = t_start,
904 .next = t_next,
905 .show = t_show,
906 .stop = t_stop,
909 static const struct seq_operations show_set_event_seq_ops = {
910 .start = s_start,
911 .next = s_next,
912 .show = t_show,
913 .stop = t_stop,
916 static const struct file_operations ftrace_avail_fops = {
917 .open = ftrace_event_seq_open,
918 .read = seq_read,
919 .llseek = seq_lseek,
920 .release = seq_release,
923 static const struct file_operations ftrace_set_event_fops = {
924 .open = ftrace_event_seq_open,
925 .read = seq_read,
926 .write = ftrace_event_write,
927 .llseek = seq_lseek,
928 .release = seq_release,
931 static const struct file_operations ftrace_enable_fops = {
932 .open = tracing_open_generic,
933 .read = event_enable_read,
934 .write = event_enable_write,
935 .llseek = default_llseek,
938 static const struct file_operations ftrace_event_format_fops = {
939 .open = trace_format_open,
940 .read = seq_read,
941 .llseek = seq_lseek,
942 .release = seq_release,
945 static const struct file_operations ftrace_event_id_fops = {
946 .open = tracing_open_generic,
947 .read = event_id_read,
948 .llseek = default_llseek,
951 static const struct file_operations ftrace_event_filter_fops = {
952 .open = tracing_open_generic,
953 .read = event_filter_read,
954 .write = event_filter_write,
955 .llseek = default_llseek,
958 static const struct file_operations ftrace_subsystem_filter_fops = {
959 .open = tracing_open_generic,
960 .read = subsystem_filter_read,
961 .write = subsystem_filter_write,
962 .llseek = default_llseek,
965 static const struct file_operations ftrace_system_enable_fops = {
966 .open = tracing_open_generic,
967 .read = system_enable_read,
968 .write = system_enable_write,
969 .llseek = default_llseek,
972 static const struct file_operations ftrace_show_header_fops = {
973 .open = tracing_open_generic,
974 .read = show_header,
975 .llseek = default_llseek,
978 static struct dentry *event_trace_events_dir(void)
980 static struct dentry *d_tracer;
981 static struct dentry *d_events;
983 if (d_events)
984 return d_events;
986 d_tracer = tracing_init_dentry();
987 if (!d_tracer)
988 return NULL;
990 d_events = debugfs_create_dir("events", d_tracer);
991 if (!d_events)
992 pr_warning("Could not create debugfs "
993 "'events' directory\n");
995 return d_events;
998 static LIST_HEAD(event_subsystems);
1000 static struct dentry *
1001 event_subsystem_dir(const char *name, struct dentry *d_events)
1003 struct event_subsystem *system;
1004 struct dentry *entry;
1006 /* First see if we did not already create this dir */
1007 list_for_each_entry(system, &event_subsystems, list) {
1008 if (strcmp(system->name, name) == 0) {
1009 system->nr_events++;
1010 return system->entry;
1014 /* need to create new entry */
1015 system = kmalloc(sizeof(*system), GFP_KERNEL);
1016 if (!system) {
1017 pr_warning("No memory to create event subsystem %s\n",
1018 name);
1019 return d_events;
1022 system->entry = debugfs_create_dir(name, d_events);
1023 if (!system->entry) {
1024 pr_warning("Could not create event subsystem %s\n",
1025 name);
1026 kfree(system);
1027 return d_events;
1030 system->nr_events = 1;
1031 system->name = kstrdup(name, GFP_KERNEL);
1032 if (!system->name) {
1033 debugfs_remove(system->entry);
1034 kfree(system);
1035 return d_events;
1038 list_add(&system->list, &event_subsystems);
1040 system->filter = NULL;
1042 system->filter = kzalloc(sizeof(struct event_filter), GFP_KERNEL);
1043 if (!system->filter) {
1044 pr_warning("Could not allocate filter for subsystem "
1045 "'%s'\n", name);
1046 return system->entry;
1049 entry = debugfs_create_file("filter", 0644, system->entry, system,
1050 &ftrace_subsystem_filter_fops);
1051 if (!entry) {
1052 kfree(system->filter);
1053 system->filter = NULL;
1054 pr_warning("Could not create debugfs "
1055 "'%s/filter' entry\n", name);
1058 trace_create_file("enable", 0644, system->entry,
1059 (void *)system->name,
1060 &ftrace_system_enable_fops);
1062 return system->entry;
1065 static int
1066 event_create_dir(struct ftrace_event_call *call, struct dentry *d_events,
1067 const struct file_operations *id,
1068 const struct file_operations *enable,
1069 const struct file_operations *filter,
1070 const struct file_operations *format)
1072 struct list_head *head;
1073 int ret;
1076 * If the trace point header did not define TRACE_SYSTEM
1077 * then the system would be called "TRACE_SYSTEM".
1079 if (strcmp(call->class->system, TRACE_SYSTEM) != 0)
1080 d_events = event_subsystem_dir(call->class->system, d_events);
1082 call->dir = debugfs_create_dir(call->name, d_events);
1083 if (!call->dir) {
1084 pr_warning("Could not create debugfs "
1085 "'%s' directory\n", call->name);
1086 return -1;
1089 if (call->class->reg)
1090 trace_create_file("enable", 0644, call->dir, call,
1091 enable);
1093 #ifdef CONFIG_PERF_EVENTS
1094 if (call->event.type && call->class->reg)
1095 trace_create_file("id", 0444, call->dir, call,
1096 id);
1097 #endif
1100 * Other events may have the same class. Only update
1101 * the fields if they are not already defined.
1103 head = trace_get_fields(call);
1104 if (list_empty(head)) {
1105 ret = call->class->define_fields(call);
1106 if (ret < 0) {
1107 pr_warning("Could not initialize trace point"
1108 " events/%s\n", call->name);
1109 return ret;
1112 trace_create_file("filter", 0644, call->dir, call,
1113 filter);
1115 trace_create_file("format", 0444, call->dir, call,
1116 format);
1118 return 0;
1121 static int
1122 __trace_add_event_call(struct ftrace_event_call *call, struct module *mod,
1123 const struct file_operations *id,
1124 const struct file_operations *enable,
1125 const struct file_operations *filter,
1126 const struct file_operations *format)
1128 struct dentry *d_events;
1129 int ret;
1131 /* The linker may leave blanks */
1132 if (!call->name)
1133 return -EINVAL;
1135 if (call->class->raw_init) {
1136 ret = call->class->raw_init(call);
1137 if (ret < 0) {
1138 if (ret != -ENOSYS)
1139 pr_warning("Could not initialize trace events/%s\n",
1140 call->name);
1141 return ret;
1145 d_events = event_trace_events_dir();
1146 if (!d_events)
1147 return -ENOENT;
1149 ret = event_create_dir(call, d_events, id, enable, filter, format);
1150 if (!ret)
1151 list_add(&call->list, &ftrace_events);
1152 call->mod = mod;
1154 return ret;
1157 /* Add an additional event_call dynamically */
1158 int trace_add_event_call(struct ftrace_event_call *call)
1160 int ret;
1161 mutex_lock(&event_mutex);
1162 ret = __trace_add_event_call(call, NULL, &ftrace_event_id_fops,
1163 &ftrace_enable_fops,
1164 &ftrace_event_filter_fops,
1165 &ftrace_event_format_fops);
1166 mutex_unlock(&event_mutex);
1167 return ret;
1170 static void remove_subsystem_dir(const char *name)
1172 struct event_subsystem *system;
1174 if (strcmp(name, TRACE_SYSTEM) == 0)
1175 return;
1177 list_for_each_entry(system, &event_subsystems, list) {
1178 if (strcmp(system->name, name) == 0) {
1179 if (!--system->nr_events) {
1180 struct event_filter *filter = system->filter;
1182 debugfs_remove_recursive(system->entry);
1183 list_del(&system->list);
1184 if (filter) {
1185 kfree(filter->filter_string);
1186 kfree(filter);
1188 kfree(system->name);
1189 kfree(system);
1191 break;
1197 * Must be called under locking both of event_mutex and trace_event_mutex.
1199 static void __trace_remove_event_call(struct ftrace_event_call *call)
1201 ftrace_event_enable_disable(call, 0);
1202 if (call->event.funcs)
1203 __unregister_ftrace_event(&call->event);
1204 debugfs_remove_recursive(call->dir);
1205 list_del(&call->list);
1206 trace_destroy_fields(call);
1207 destroy_preds(call);
1208 remove_subsystem_dir(call->class->system);
1211 /* Remove an event_call */
1212 void trace_remove_event_call(struct ftrace_event_call *call)
1214 mutex_lock(&event_mutex);
1215 down_write(&trace_event_mutex);
1216 __trace_remove_event_call(call);
1217 up_write(&trace_event_mutex);
1218 mutex_unlock(&event_mutex);
1221 #define for_each_event(event, start, end) \
1222 for (event = start; \
1223 (unsigned long)event < (unsigned long)end; \
1224 event++)
1226 #ifdef CONFIG_MODULES
1228 static LIST_HEAD(ftrace_module_file_list);
1231 * Modules must own their file_operations to keep up with
1232 * reference counting.
1234 struct ftrace_module_file_ops {
1235 struct list_head list;
1236 struct module *mod;
1237 struct file_operations id;
1238 struct file_operations enable;
1239 struct file_operations format;
1240 struct file_operations filter;
1243 static struct ftrace_module_file_ops *
1244 trace_create_file_ops(struct module *mod)
1246 struct ftrace_module_file_ops *file_ops;
1249 * This is a bit of a PITA. To allow for correct reference
1250 * counting, modules must "own" their file_operations.
1251 * To do this, we allocate the file operations that will be
1252 * used in the event directory.
1255 file_ops = kmalloc(sizeof(*file_ops), GFP_KERNEL);
1256 if (!file_ops)
1257 return NULL;
1259 file_ops->mod = mod;
1261 file_ops->id = ftrace_event_id_fops;
1262 file_ops->id.owner = mod;
1264 file_ops->enable = ftrace_enable_fops;
1265 file_ops->enable.owner = mod;
1267 file_ops->filter = ftrace_event_filter_fops;
1268 file_ops->filter.owner = mod;
1270 file_ops->format = ftrace_event_format_fops;
1271 file_ops->format.owner = mod;
1273 list_add(&file_ops->list, &ftrace_module_file_list);
1275 return file_ops;
1278 static void trace_module_add_events(struct module *mod)
1280 struct ftrace_module_file_ops *file_ops = NULL;
1281 struct ftrace_event_call *call, *start, *end;
1283 start = mod->trace_events;
1284 end = mod->trace_events + mod->num_trace_events;
1286 if (start == end)
1287 return;
1289 file_ops = trace_create_file_ops(mod);
1290 if (!file_ops)
1291 return;
1293 for_each_event(call, start, end) {
1294 __trace_add_event_call(call, mod,
1295 &file_ops->id, &file_ops->enable,
1296 &file_ops->filter, &file_ops->format);
1300 static void trace_module_remove_events(struct module *mod)
1302 struct ftrace_module_file_ops *file_ops;
1303 struct ftrace_event_call *call, *p;
1304 bool found = false;
1306 down_write(&trace_event_mutex);
1307 list_for_each_entry_safe(call, p, &ftrace_events, list) {
1308 if (call->mod == mod) {
1309 found = true;
1310 __trace_remove_event_call(call);
1314 /* Now free the file_operations */
1315 list_for_each_entry(file_ops, &ftrace_module_file_list, list) {
1316 if (file_ops->mod == mod)
1317 break;
1319 if (&file_ops->list != &ftrace_module_file_list) {
1320 list_del(&file_ops->list);
1321 kfree(file_ops);
1325 * It is safest to reset the ring buffer if the module being unloaded
1326 * registered any events.
1328 if (found)
1329 tracing_reset_current_online_cpus();
1330 up_write(&trace_event_mutex);
1333 static int trace_module_notify(struct notifier_block *self,
1334 unsigned long val, void *data)
1336 struct module *mod = data;
1338 mutex_lock(&event_mutex);
1339 switch (val) {
1340 case MODULE_STATE_COMING:
1341 trace_module_add_events(mod);
1342 break;
1343 case MODULE_STATE_GOING:
1344 trace_module_remove_events(mod);
1345 break;
1347 mutex_unlock(&event_mutex);
1349 return 0;
1351 #else
1352 static int trace_module_notify(struct notifier_block *self,
1353 unsigned long val, void *data)
1355 return 0;
1357 #endif /* CONFIG_MODULES */
1359 static struct notifier_block trace_module_nb = {
1360 .notifier_call = trace_module_notify,
1361 .priority = 0,
1364 extern struct ftrace_event_call __start_ftrace_events[];
1365 extern struct ftrace_event_call __stop_ftrace_events[];
1367 static char bootup_event_buf[COMMAND_LINE_SIZE] __initdata;
1369 static __init int setup_trace_event(char *str)
1371 strlcpy(bootup_event_buf, str, COMMAND_LINE_SIZE);
1372 ring_buffer_expanded = 1;
1373 tracing_selftest_disabled = 1;
1375 return 1;
1377 __setup("trace_event=", setup_trace_event);
1379 static __init int event_trace_init(void)
1381 struct ftrace_event_call *call;
1382 struct dentry *d_tracer;
1383 struct dentry *entry;
1384 struct dentry *d_events;
1385 int ret;
1386 char *buf = bootup_event_buf;
1387 char *token;
1389 d_tracer = tracing_init_dentry();
1390 if (!d_tracer)
1391 return 0;
1393 entry = debugfs_create_file("available_events", 0444, d_tracer,
1394 (void *)&show_event_seq_ops,
1395 &ftrace_avail_fops);
1396 if (!entry)
1397 pr_warning("Could not create debugfs "
1398 "'available_events' entry\n");
1400 entry = debugfs_create_file("set_event", 0644, d_tracer,
1401 (void *)&show_set_event_seq_ops,
1402 &ftrace_set_event_fops);
1403 if (!entry)
1404 pr_warning("Could not create debugfs "
1405 "'set_event' entry\n");
1407 d_events = event_trace_events_dir();
1408 if (!d_events)
1409 return 0;
1411 /* ring buffer internal formats */
1412 trace_create_file("header_page", 0444, d_events,
1413 ring_buffer_print_page_header,
1414 &ftrace_show_header_fops);
1416 trace_create_file("header_event", 0444, d_events,
1417 ring_buffer_print_entry_header,
1418 &ftrace_show_header_fops);
1420 trace_create_file("enable", 0644, d_events,
1421 NULL, &ftrace_system_enable_fops);
1423 if (trace_define_common_fields())
1424 pr_warning("tracing: Failed to allocate common fields");
1426 for_each_event(call, __start_ftrace_events, __stop_ftrace_events) {
1427 __trace_add_event_call(call, NULL, &ftrace_event_id_fops,
1428 &ftrace_enable_fops,
1429 &ftrace_event_filter_fops,
1430 &ftrace_event_format_fops);
1433 while (true) {
1434 token = strsep(&buf, ",");
1436 if (!token)
1437 break;
1438 if (!*token)
1439 continue;
1441 ret = ftrace_set_clr_event(token, 1);
1442 if (ret)
1443 pr_warning("Failed to enable trace event: %s\n", token);
1446 ret = register_module_notifier(&trace_module_nb);
1447 if (ret)
1448 pr_warning("Failed to register trace events module notifier\n");
1450 return 0;
1452 fs_initcall(event_trace_init);
1454 #ifdef CONFIG_FTRACE_STARTUP_TEST
1456 static DEFINE_SPINLOCK(test_spinlock);
1457 static DEFINE_SPINLOCK(test_spinlock_irq);
1458 static DEFINE_MUTEX(test_mutex);
1460 static __init void test_work(struct work_struct *dummy)
1462 spin_lock(&test_spinlock);
1463 spin_lock_irq(&test_spinlock_irq);
1464 udelay(1);
1465 spin_unlock_irq(&test_spinlock_irq);
1466 spin_unlock(&test_spinlock);
1468 mutex_lock(&test_mutex);
1469 msleep(1);
1470 mutex_unlock(&test_mutex);
1473 static __init int event_test_thread(void *unused)
1475 void *test_malloc;
1477 test_malloc = kmalloc(1234, GFP_KERNEL);
1478 if (!test_malloc)
1479 pr_info("failed to kmalloc\n");
1481 schedule_on_each_cpu(test_work);
1483 kfree(test_malloc);
1485 set_current_state(TASK_INTERRUPTIBLE);
1486 while (!kthread_should_stop())
1487 schedule();
1489 return 0;
1493 * Do various things that may trigger events.
1495 static __init void event_test_stuff(void)
1497 struct task_struct *test_thread;
1499 test_thread = kthread_run(event_test_thread, NULL, "test-events");
1500 msleep(1);
1501 kthread_stop(test_thread);
1505 * For every trace event defined, we will test each trace point separately,
1506 * and then by groups, and finally all trace points.
1508 static __init void event_trace_self_tests(void)
1510 struct ftrace_event_call *call;
1511 struct event_subsystem *system;
1512 int ret;
1514 pr_info("Running tests on trace events:\n");
1516 list_for_each_entry(call, &ftrace_events, list) {
1518 /* Only test those that have a probe */
1519 if (!call->class || !call->class->probe)
1520 continue;
1523 * Testing syscall events here is pretty useless, but
1524 * we still do it if configured. But this is time consuming.
1525 * What we really need is a user thread to perform the
1526 * syscalls as we test.
1528 #ifndef CONFIG_EVENT_TRACE_TEST_SYSCALLS
1529 if (call->class->system &&
1530 strcmp(call->class->system, "syscalls") == 0)
1531 continue;
1532 #endif
1534 pr_info("Testing event %s: ", call->name);
1537 * If an event is already enabled, someone is using
1538 * it and the self test should not be on.
1540 if (call->flags & TRACE_EVENT_FL_ENABLED) {
1541 pr_warning("Enabled event during self test!\n");
1542 WARN_ON_ONCE(1);
1543 continue;
1546 ftrace_event_enable_disable(call, 1);
1547 event_test_stuff();
1548 ftrace_event_enable_disable(call, 0);
1550 pr_cont("OK\n");
1553 /* Now test at the sub system level */
1555 pr_info("Running tests on trace event systems:\n");
1557 list_for_each_entry(system, &event_subsystems, list) {
1559 /* the ftrace system is special, skip it */
1560 if (strcmp(system->name, "ftrace") == 0)
1561 continue;
1563 pr_info("Testing event system %s: ", system->name);
1565 ret = __ftrace_set_clr_event(NULL, system->name, NULL, 1);
1566 if (WARN_ON_ONCE(ret)) {
1567 pr_warning("error enabling system %s\n",
1568 system->name);
1569 continue;
1572 event_test_stuff();
1574 ret = __ftrace_set_clr_event(NULL, system->name, NULL, 0);
1575 if (WARN_ON_ONCE(ret))
1576 pr_warning("error disabling system %s\n",
1577 system->name);
1579 pr_cont("OK\n");
1582 /* Test with all events enabled */
1584 pr_info("Running tests on all trace events:\n");
1585 pr_info("Testing all events: ");
1587 ret = __ftrace_set_clr_event(NULL, NULL, NULL, 1);
1588 if (WARN_ON_ONCE(ret)) {
1589 pr_warning("error enabling all events\n");
1590 return;
1593 event_test_stuff();
1595 /* reset sysname */
1596 ret = __ftrace_set_clr_event(NULL, NULL, NULL, 0);
1597 if (WARN_ON_ONCE(ret)) {
1598 pr_warning("error disabling all events\n");
1599 return;
1602 pr_cont("OK\n");
1605 #ifdef CONFIG_FUNCTION_TRACER
1607 static DEFINE_PER_CPU(atomic_t, ftrace_test_event_disable);
1609 static void
1610 function_test_events_call(unsigned long ip, unsigned long parent_ip)
1612 struct ring_buffer_event *event;
1613 struct ring_buffer *buffer;
1614 struct ftrace_entry *entry;
1615 unsigned long flags;
1616 long disabled;
1617 int cpu;
1618 int pc;
1620 pc = preempt_count();
1621 preempt_disable_notrace();
1622 cpu = raw_smp_processor_id();
1623 disabled = atomic_inc_return(&per_cpu(ftrace_test_event_disable, cpu));
1625 if (disabled != 1)
1626 goto out;
1628 local_save_flags(flags);
1630 event = trace_current_buffer_lock_reserve(&buffer,
1631 TRACE_FN, sizeof(*entry),
1632 flags, pc);
1633 if (!event)
1634 goto out;
1635 entry = ring_buffer_event_data(event);
1636 entry->ip = ip;
1637 entry->parent_ip = parent_ip;
1639 trace_nowake_buffer_unlock_commit(buffer, event, flags, pc);
1641 out:
1642 atomic_dec(&per_cpu(ftrace_test_event_disable, cpu));
1643 preempt_enable_notrace();
1646 static struct ftrace_ops trace_ops __initdata =
1648 .func = function_test_events_call,
1651 static __init void event_trace_self_test_with_function(void)
1653 register_ftrace_function(&trace_ops);
1654 pr_info("Running tests again, along with the function tracer\n");
1655 event_trace_self_tests();
1656 unregister_ftrace_function(&trace_ops);
1658 #else
1659 static __init void event_trace_self_test_with_function(void)
1662 #endif
1664 static __init int event_trace_self_tests_init(void)
1666 if (!tracing_selftest_disabled) {
1667 event_trace_self_tests();
1668 event_trace_self_test_with_function();
1671 return 0;
1674 late_initcall(event_trace_self_tests_init);
1676 #endif