Merge branch 'cfq-2.6.33' into for-2.6.33
[linux-2.6/next.git] / include / linux / tracepoint.h
blob2aac8a83e89b9a7994b7570ffb3ea879d763ee23
1 #ifndef _LINUX_TRACEPOINT_H
2 #define _LINUX_TRACEPOINT_H
4 /*
5 * Kernel Tracepoint API.
7 * See Documentation/trace/tracepoints.txt.
9 * (C) Copyright 2008 Mathieu Desnoyers <mathieu.desnoyers@polymtl.ca>
11 * Heavily inspired from the Linux Kernel Markers.
13 * This file is released under the GPLv2.
14 * See the file COPYING for more details.
17 #include <linux/types.h>
18 #include <linux/rcupdate.h>
20 struct module;
21 struct tracepoint;
23 struct tracepoint {
24 const char *name; /* Tracepoint name */
25 int state; /* State. */
26 void (*regfunc)(void);
27 void (*unregfunc)(void);
28 void **funcs;
29 } __attribute__((aligned(32))); /*
30 * Aligned on 32 bytes because it is
31 * globally visible and gcc happily
32 * align these on the structure size.
33 * Keep in sync with vmlinux.lds.h.
36 #ifndef DECLARE_TRACE
38 #define TP_PROTO(args...) args
39 #define TP_ARGS(args...) args
41 #ifdef CONFIG_TRACEPOINTS
44 * it_func[0] is never NULL because there is at least one element in the array
45 * when the array itself is non NULL.
47 #define __DO_TRACE(tp, proto, args) \
48 do { \
49 void **it_func; \
51 rcu_read_lock_sched_notrace(); \
52 it_func = rcu_dereference((tp)->funcs); \
53 if (it_func) { \
54 do { \
55 ((void(*)(proto))(*it_func))(args); \
56 } while (*(++it_func)); \
57 } \
58 rcu_read_unlock_sched_notrace(); \
59 } while (0)
62 * Make sure the alignment of the structure in the __tracepoints section will
63 * not add unwanted padding between the beginning of the section and the
64 * structure. Force alignment to the same alignment as the section start.
66 #define DECLARE_TRACE(name, proto, args) \
67 extern struct tracepoint __tracepoint_##name; \
68 static inline void trace_##name(proto) \
69 { \
70 if (unlikely(__tracepoint_##name.state)) \
71 __DO_TRACE(&__tracepoint_##name, \
72 TP_PROTO(proto), TP_ARGS(args)); \
73 } \
74 static inline int register_trace_##name(void (*probe)(proto)) \
75 { \
76 return tracepoint_probe_register(#name, (void *)probe); \
77 } \
78 static inline int unregister_trace_##name(void (*probe)(proto)) \
79 { \
80 return tracepoint_probe_unregister(#name, (void *)probe);\
84 #define DEFINE_TRACE_FN(name, reg, unreg) \
85 static const char __tpstrtab_##name[] \
86 __attribute__((section("__tracepoints_strings"))) = #name; \
87 struct tracepoint __tracepoint_##name \
88 __attribute__((section("__tracepoints"), aligned(32))) = \
89 { __tpstrtab_##name, 0, reg, unreg, NULL }
91 #define DEFINE_TRACE(name) \
92 DEFINE_TRACE_FN(name, NULL, NULL);
94 #define EXPORT_TRACEPOINT_SYMBOL_GPL(name) \
95 EXPORT_SYMBOL_GPL(__tracepoint_##name)
96 #define EXPORT_TRACEPOINT_SYMBOL(name) \
97 EXPORT_SYMBOL(__tracepoint_##name)
99 extern void tracepoint_update_probe_range(struct tracepoint *begin,
100 struct tracepoint *end);
102 #else /* !CONFIG_TRACEPOINTS */
103 #define DECLARE_TRACE(name, proto, args) \
104 static inline void _do_trace_##name(struct tracepoint *tp, proto) \
105 { } \
106 static inline void trace_##name(proto) \
107 { } \
108 static inline int register_trace_##name(void (*probe)(proto)) \
110 return -ENOSYS; \
112 static inline int unregister_trace_##name(void (*probe)(proto)) \
114 return -ENOSYS; \
117 #define DEFINE_TRACE_FN(name, reg, unreg)
118 #define DEFINE_TRACE(name)
119 #define EXPORT_TRACEPOINT_SYMBOL_GPL(name)
120 #define EXPORT_TRACEPOINT_SYMBOL(name)
122 static inline void tracepoint_update_probe_range(struct tracepoint *begin,
123 struct tracepoint *end)
125 #endif /* CONFIG_TRACEPOINTS */
126 #endif /* DECLARE_TRACE */
129 * Connect a probe to a tracepoint.
130 * Internal API, should not be used directly.
132 extern int tracepoint_probe_register(const char *name, void *probe);
135 * Disconnect a probe from a tracepoint.
136 * Internal API, should not be used directly.
138 extern int tracepoint_probe_unregister(const char *name, void *probe);
140 extern int tracepoint_probe_register_noupdate(const char *name, void *probe);
141 extern int tracepoint_probe_unregister_noupdate(const char *name, void *probe);
142 extern void tracepoint_probe_update_all(void);
144 struct tracepoint_iter {
145 struct module *module;
146 struct tracepoint *tracepoint;
149 extern void tracepoint_iter_start(struct tracepoint_iter *iter);
150 extern void tracepoint_iter_next(struct tracepoint_iter *iter);
151 extern void tracepoint_iter_stop(struct tracepoint_iter *iter);
152 extern void tracepoint_iter_reset(struct tracepoint_iter *iter);
153 extern int tracepoint_get_iter_range(struct tracepoint **tracepoint,
154 struct tracepoint *begin, struct tracepoint *end);
157 * tracepoint_synchronize_unregister must be called between the last tracepoint
158 * probe unregistration and the end of module exit to make sure there is no
159 * caller executing a probe when it is freed.
161 static inline void tracepoint_synchronize_unregister(void)
163 synchronize_sched();
166 #define PARAMS(args...) args
168 #endif /* _LINUX_TRACEPOINT_H */
171 * Note: we keep the TRACE_EVENT outside the include file ifdef protection.
172 * This is due to the way trace events work. If a file includes two
173 * trace event headers under one "CREATE_TRACE_POINTS" the first include
174 * will override the TRACE_EVENT and break the second include.
177 #ifndef TRACE_EVENT
179 * For use with the TRACE_EVENT macro:
181 * We define a tracepoint, its arguments, its printk format
182 * and its 'fast binay record' layout.
184 * Firstly, name your tracepoint via TRACE_EVENT(name : the
185 * 'subsystem_event' notation is fine.
187 * Think about this whole construct as the
188 * 'trace_sched_switch() function' from now on.
191 * TRACE_EVENT(sched_switch,
194 * * A function has a regular function arguments
195 * * prototype, declare it via TP_PROTO():
198 * TP_PROTO(struct rq *rq, struct task_struct *prev,
199 * struct task_struct *next),
202 * * Define the call signature of the 'function'.
203 * * (Design sidenote: we use this instead of a
204 * * TP_PROTO1/TP_PROTO2/TP_PROTO3 ugliness.)
207 * TP_ARGS(rq, prev, next),
210 * * Fast binary tracing: define the trace record via
211 * * TP_STRUCT__entry(). You can think about it like a
212 * * regular C structure local variable definition.
214 * * This is how the trace record is structured and will
215 * * be saved into the ring buffer. These are the fields
216 * * that will be exposed to user-space in
217 * * /sys/kernel/debug/tracing/events/<*>/format.
219 * * The declared 'local variable' is called '__entry'
221 * * __field(pid_t, prev_prid) is equivalent to a standard declariton:
223 * * pid_t prev_pid;
225 * * __array(char, prev_comm, TASK_COMM_LEN) is equivalent to:
227 * * char prev_comm[TASK_COMM_LEN];
230 * TP_STRUCT__entry(
231 * __array( char, prev_comm, TASK_COMM_LEN )
232 * __field( pid_t, prev_pid )
233 * __field( int, prev_prio )
234 * __array( char, next_comm, TASK_COMM_LEN )
235 * __field( pid_t, next_pid )
236 * __field( int, next_prio )
237 * ),
240 * * Assign the entry into the trace record, by embedding
241 * * a full C statement block into TP_fast_assign(). You
242 * * can refer to the trace record as '__entry' -
243 * * otherwise you can put arbitrary C code in here.
245 * * Note: this C code will execute every time a trace event
246 * * happens, on an active tracepoint.
249 * TP_fast_assign(
250 * memcpy(__entry->next_comm, next->comm, TASK_COMM_LEN);
251 * __entry->prev_pid = prev->pid;
252 * __entry->prev_prio = prev->prio;
253 * memcpy(__entry->prev_comm, prev->comm, TASK_COMM_LEN);
254 * __entry->next_pid = next->pid;
255 * __entry->next_prio = next->prio;
259 * * Formatted output of a trace record via TP_printk().
260 * * This is how the tracepoint will appear under ftrace
261 * * plugins that make use of this tracepoint.
263 * * (raw-binary tracing wont actually perform this step.)
266 * TP_printk("task %s:%d [%d] ==> %s:%d [%d]",
267 * __entry->prev_comm, __entry->prev_pid, __entry->prev_prio,
268 * __entry->next_comm, __entry->next_pid, __entry->next_prio),
270 * );
272 * This macro construct is thus used for the regular printk format
273 * tracing setup, it is used to construct a function pointer based
274 * tracepoint callback (this is used by programmatic plugins and
275 * can also by used by generic instrumentation like SystemTap), and
276 * it is also used to expose a structured trace record in
277 * /sys/kernel/debug/tracing/events/.
279 * A set of (un)registration functions can be passed to the variant
280 * TRACE_EVENT_FN to perform any (un)registration work.
283 #define TRACE_EVENT(name, proto, args, struct, assign, print) \
284 DECLARE_TRACE(name, PARAMS(proto), PARAMS(args))
285 #define TRACE_EVENT_FN(name, proto, args, struct, \
286 assign, print, reg, unreg) \
287 DECLARE_TRACE(name, PARAMS(proto), PARAMS(args))
289 #endif /* ifdef TRACE_EVENT (see note above) */