1 /* SPDX-License-Identifier: GPL-2.0 */
3 #define TRACE_SYSTEM sched
5 #if !defined(LTTNG_TRACE_SCHED_H) || defined(TRACE_HEADER_MULTI_READ)
6 #define LTTNG_TRACE_SCHED_H
8 #include <probes/lttng-tracepoint-event.h>
9 #include <linux/sched.h>
10 #include <linux/pid_namespace.h>
11 #include <linux/binfmts.h>
12 #include <linux/version.h>
13 #if (LINUX_VERSION_CODE >= KERNEL_VERSION(3,9,0))
14 #include <linux/sched/rt.h>
17 #if (LINUX_VERSION_CODE >= KERNEL_VERSION(3,19,0))
18 #define lttng_proc_inum ns.inum
20 #define lttng_proc_inum proc_inum
23 #define LTTNG_MAX_PID_NS_LEVEL 32
25 #ifndef _TRACE_SCHED_DEF_
26 #define _TRACE_SCHED_DEF_
28 #if (LINUX_VERSION_CODE >= KERNEL_VERSION(4,4,0))
30 static inline long __trace_sched_switch_state(bool preempt
, struct task_struct
*p
)
32 #ifdef CONFIG_SCHED_DEBUG
34 #endif /* CONFIG_SCHED_DEBUG */
36 * Preemption ignores task state, therefore preempted tasks are always RUNNING
37 * (we will not have dequeued if state != RUNNING).
39 return preempt
? TASK_RUNNING
| TASK_STATE_MAX
: p
->state
;
42 #elif (LINUX_VERSION_CODE >= KERNEL_VERSION(3,19,0))
44 static inline long __trace_sched_switch_state(struct task_struct
*p
)
46 long state
= p
->state
;
49 #ifdef CONFIG_SCHED_DEBUG
51 #endif /* CONFIG_SCHED_DEBUG */
53 * For all intents and purposes a preempted task is a running task.
55 if (preempt_count() & PREEMPT_ACTIVE
)
56 state
= TASK_RUNNING
| TASK_STATE_MAX
;
57 #endif /* CONFIG_PREEMPT */
62 #elif (LINUX_VERSION_CODE >= KERNEL_VERSION(3,13,0))
64 static inline long __trace_sched_switch_state(struct task_struct
*p
)
66 long state
= p
->state
;
70 * For all intents and purposes a preempted task is a running task.
72 if (task_preempt_count(p
) & PREEMPT_ACTIVE
)
73 state
= TASK_RUNNING
| TASK_STATE_MAX
;
79 #elif (LINUX_VERSION_CODE >= KERNEL_VERSION(3,2,0))
81 static inline long __trace_sched_switch_state(struct task_struct
*p
)
83 long state
= p
->state
;
87 * For all intents and purposes a preempted task is a running task.
89 if (task_thread_info(p
)->preempt_count
& PREEMPT_ACTIVE
)
90 state
= TASK_RUNNING
| TASK_STATE_MAX
;
98 static inline long __trace_sched_switch_state(struct task_struct
*p
)
100 long state
= p
->state
;
102 #ifdef CONFIG_PREEMPT
104 * For all intents and purposes a preempted task is a running task.
106 if (task_thread_info(p
)->preempt_count
& PREEMPT_ACTIVE
)
107 state
= TASK_RUNNING
;
115 #endif /* _TRACE_SCHED_DEF_ */
118 * Tracepoint for calling kthread_stop, performed to end a kthread:
120 LTTNG_TRACEPOINT_EVENT(sched_kthread_stop
,
122 TP_PROTO(struct task_struct
*t
),
127 ctf_array_text(char, comm
, t
->comm
, TASK_COMM_LEN
)
128 ctf_integer(pid_t
, tid
, t
->pid
)
133 * Tracepoint for the return value of the kthread stopping:
135 LTTNG_TRACEPOINT_EVENT(sched_kthread_stop_ret
,
142 ctf_integer(int, ret
, ret
)
147 * Tracepoint for waking up a task:
149 #if (LINUX_VERSION_CODE >= KERNEL_VERSION(4,3,0) || \
150 LTTNG_RT_KERNEL_RANGE(4,1,10,11, 4,2,0,0) || \
151 LTTNG_RT_KERNEL_RANGE(3,18,27,26, 3,19,0,0) || \
152 LTTNG_RT_KERNEL_RANGE(3,14,61,63, 3,15,0,0) || \
153 LTTNG_RT_KERNEL_RANGE(3,12,54,73, 3,13,0,0) || \
154 LTTNG_RT_KERNEL_RANGE(3,10,97,106, 3,11,0,0) || \
155 LTTNG_RT_KERNEL_RANGE(3,4,110,139, 3,5,0,0) || \
156 LTTNG_RT_KERNEL_RANGE(3,2,77,111, 3,3,0,0))
157 LTTNG_TRACEPOINT_EVENT_CLASS(sched_wakeup_template
,
159 TP_PROTO(struct task_struct
*p
),
164 ctf_array_text(char, comm
, p
->comm
, TASK_COMM_LEN
)
165 ctf_integer(pid_t
, tid
, p
->pid
)
166 ctf_integer(int, prio
, p
->prio
- MAX_RT_PRIO
)
167 ctf_integer(int, target_cpu
, task_cpu(p
))
170 #else /* #if (LINUX_VERSION_CODE >= KERNEL_VERSION(4,3,0)) */
171 LTTNG_TRACEPOINT_EVENT_CLASS(sched_wakeup_template
,
173 TP_PROTO(struct task_struct
*p
, int success
),
178 ctf_array_text(char, comm
, p
->comm
, TASK_COMM_LEN
)
179 ctf_integer(pid_t
, tid
, p
->pid
)
180 ctf_integer(int, prio
, p
->prio
- MAX_RT_PRIO
)
181 ctf_integer(int, success
, success
)
182 ctf_integer(int, target_cpu
, task_cpu(p
))
185 #endif /* #else #if (LINUX_VERSION_CODE >= KERNEL_VERSION(4,3,0)) */
187 #if (LINUX_VERSION_CODE >= KERNEL_VERSION(4,3,0) || \
188 LTTNG_RT_KERNEL_RANGE(4,1,10,11, 4,2,0,0) || \
189 LTTNG_RT_KERNEL_RANGE(3,18,27,26, 3,19,0,0) || \
190 LTTNG_RT_KERNEL_RANGE(3,14,61,63, 3,15,0,0) || \
191 LTTNG_RT_KERNEL_RANGE(3,12,54,73, 3,13,0,0) || \
192 LTTNG_RT_KERNEL_RANGE(3,10,97,106, 3,11,0,0) || \
193 LTTNG_RT_KERNEL_RANGE(3,4,110,139, 3,5,0,0) || \
194 LTTNG_RT_KERNEL_RANGE(3,2,77,111, 3,3,0,0))
197 * Tracepoint called when waking a task; this tracepoint is guaranteed to be
198 * called from the waking context.
200 LTTNG_TRACEPOINT_EVENT_INSTANCE(sched_wakeup_template
, sched_waking
,
201 TP_PROTO(struct task_struct
*p
),
205 * Tracepoint called when the task is actually woken; p->state == TASK_RUNNING.
206 * It is not always called from the waking context.
208 LTTNG_TRACEPOINT_EVENT_INSTANCE(sched_wakeup_template
, sched_wakeup
,
209 TP_PROTO(struct task_struct
*p
),
213 * Tracepoint for waking up a new task:
215 LTTNG_TRACEPOINT_EVENT_INSTANCE(sched_wakeup_template
, sched_wakeup_new
,
216 TP_PROTO(struct task_struct
*p
),
221 LTTNG_TRACEPOINT_EVENT_INSTANCE(sched_wakeup_template
, sched_wakeup
,
222 TP_PROTO(struct task_struct
*p
, int success
),
226 * Tracepoint for waking up a new task:
228 LTTNG_TRACEPOINT_EVENT_INSTANCE(sched_wakeup_template
, sched_wakeup_new
,
229 TP_PROTO(struct task_struct
*p
, int success
),
232 #endif /* #if (LINUX_VERSION_CODE >= KERNEL_VERSION(4,3,0)) */
235 * Tracepoint for task switches, performed by the scheduler:
237 LTTNG_TRACEPOINT_EVENT(sched_switch
,
239 #if (LINUX_VERSION_CODE >= KERNEL_VERSION(4,4,0))
240 TP_PROTO(bool preempt
,
241 struct task_struct
*prev
,
242 struct task_struct
*next
),
244 TP_ARGS(preempt
, prev
, next
),
246 TP_PROTO(struct task_struct
*prev
,
247 struct task_struct
*next
),
250 #endif /* #if (LINUX_VERSION_CODE >= KERNEL_VERSION(4,4,0)) */
253 ctf_array_text(char, prev_comm
, prev
->comm
, TASK_COMM_LEN
)
254 ctf_integer(pid_t
, prev_tid
, prev
->pid
)
255 ctf_integer(int, prev_prio
, prev
->prio
- MAX_RT_PRIO
)
256 #if (LINUX_VERSION_CODE >= KERNEL_VERSION(4,4,0))
257 ctf_integer(long, prev_state
, __trace_sched_switch_state(preempt
, prev
))
259 ctf_integer(long, prev_state
, __trace_sched_switch_state(prev
))
261 ctf_array_text(char, next_comm
, next
->comm
, TASK_COMM_LEN
)
262 ctf_integer(pid_t
, next_tid
, next
->pid
)
263 ctf_integer(int, next_prio
, next
->prio
- MAX_RT_PRIO
)
268 * Tracepoint for a task being migrated:
270 LTTNG_TRACEPOINT_EVENT(sched_migrate_task
,
272 TP_PROTO(struct task_struct
*p
, int dest_cpu
),
274 TP_ARGS(p
, dest_cpu
),
277 ctf_array_text(char, comm
, p
->comm
, TASK_COMM_LEN
)
278 ctf_integer(pid_t
, tid
, p
->pid
)
279 ctf_integer(int, prio
, p
->prio
- MAX_RT_PRIO
)
280 ctf_integer(int, orig_cpu
, task_cpu(p
))
281 ctf_integer(int, dest_cpu
, dest_cpu
)
285 LTTNG_TRACEPOINT_EVENT_CLASS(sched_process_template
,
287 TP_PROTO(struct task_struct
*p
),
292 ctf_array_text(char, comm
, p
->comm
, TASK_COMM_LEN
)
293 ctf_integer(pid_t
, tid
, p
->pid
)
294 ctf_integer(int, prio
, p
->prio
- MAX_RT_PRIO
)
299 * Tracepoint for freeing a task:
301 LTTNG_TRACEPOINT_EVENT_INSTANCE(sched_process_template
, sched_process_free
,
302 TP_PROTO(struct task_struct
*p
),
307 * Tracepoint for a task exiting:
309 LTTNG_TRACEPOINT_EVENT_INSTANCE(sched_process_template
, sched_process_exit
,
310 TP_PROTO(struct task_struct
*p
),
314 * Tracepoint for waiting on task to unschedule:
316 LTTNG_TRACEPOINT_EVENT_INSTANCE(sched_process_template
, sched_wait_task
,
317 TP_PROTO(struct task_struct
*p
),
321 * Tracepoint for a waiting task:
323 LTTNG_TRACEPOINT_EVENT(sched_process_wait
,
325 TP_PROTO(struct pid
*pid
),
330 ctf_array_text(char, comm
, current
->comm
, TASK_COMM_LEN
)
331 ctf_integer(pid_t
, tid
, pid_nr(pid
))
332 ctf_integer(int, prio
, current
->prio
- MAX_RT_PRIO
)
337 * Tracepoint for do_fork.
338 * Saving both TID and PID information, especially for the child, allows
339 * trace analyzers to distinguish between creation of a new process and
340 * creation of a new thread. Newly created processes will have child_tid
341 * == child_pid, while creation of a thread yields child_tid != child_pid.
344 LTTNG_TRACEPOINT_EVENT_CODE(sched_process_fork
,
346 TP_PROTO(struct task_struct
*parent
, struct task_struct
*child
),
348 TP_ARGS(parent
, child
),
351 pid_t vtids
[LTTNG_MAX_PID_NS_LEVEL
];
352 unsigned int ns_level
;
357 struct pid
*child_pid
;
360 child_pid
= task_pid(child
);
361 tp_locvar
->ns_level
=
362 min_t(unsigned int, child_pid
->level
+ 1,
363 LTTNG_MAX_PID_NS_LEVEL
);
364 for (i
= 0; i
< tp_locvar
->ns_level
; i
++)
365 tp_locvar
->vtids
[i
] = child_pid
->numbers
[i
].nr
;
370 ctf_array_text(char, parent_comm
, parent
->comm
, TASK_COMM_LEN
)
371 ctf_integer(pid_t
, parent_tid
, parent
->pid
)
372 ctf_integer(pid_t
, parent_pid
, parent
->tgid
)
373 #if (LINUX_VERSION_CODE >= KERNEL_VERSION(3,8,0))
374 ctf_integer(unsigned int, parent_ns_inum
,
376 unsigned int parent_ns_inum
= 0;
379 struct pid_namespace
*pid_ns
;
381 pid_ns
= task_active_pid_ns(parent
);
384 pid_ns
->lttng_proc_inum
;
389 ctf_array_text(char, child_comm
, child
->comm
, TASK_COMM_LEN
)
390 ctf_integer(pid_t
, child_tid
, child
->pid
)
391 ctf_sequence(pid_t
, vtids
, tp_locvar
->vtids
, u8
, tp_locvar
->ns_level
)
392 ctf_integer(pid_t
, child_pid
, child
->tgid
)
393 #if (LINUX_VERSION_CODE >= KERNEL_VERSION(3,8,0))
394 ctf_integer(unsigned int, child_ns_inum
,
396 unsigned int child_ns_inum
= 0;
399 struct pid_namespace
*pid_ns
;
401 pid_ns
= task_active_pid_ns(child
);
404 pid_ns
->lttng_proc_inum
;
414 #if (LINUX_VERSION_CODE >= KERNEL_VERSION(3,4,0))
416 * Tracepoint for exec:
418 LTTNG_TRACEPOINT_EVENT(sched_process_exec
,
420 TP_PROTO(struct task_struct
*p
, pid_t old_pid
,
421 struct linux_binprm
*bprm
),
423 TP_ARGS(p
, old_pid
, bprm
),
426 ctf_string(filename
, bprm
->filename
)
427 ctf_integer(pid_t
, tid
, p
->pid
)
428 ctf_integer(pid_t
, old_tid
, old_pid
)
434 * XXX the below sched_stat tracepoints only apply to SCHED_OTHER/BATCH/IDLE
435 * adding sched_stat support to SCHED_FIFO/RR would be welcome.
437 LTTNG_TRACEPOINT_EVENT_CLASS(sched_stat_template
,
439 TP_PROTO(struct task_struct
*tsk
, u64 delay
),
444 ctf_array_text(char, comm
, tsk
->comm
, TASK_COMM_LEN
)
445 ctf_integer(pid_t
, tid
, tsk
->pid
)
446 ctf_integer(u64
, delay
, delay
)
452 * Tracepoint for accounting wait time (time the task is runnable
453 * but not actually running due to scheduler contention).
455 LTTNG_TRACEPOINT_EVENT_INSTANCE(sched_stat_template
, sched_stat_wait
,
456 TP_PROTO(struct task_struct
*tsk
, u64 delay
),
460 * Tracepoint for accounting sleep time (time the task is not runnable,
461 * including iowait, see below).
463 LTTNG_TRACEPOINT_EVENT_INSTANCE(sched_stat_template
, sched_stat_sleep
,
464 TP_PROTO(struct task_struct
*tsk
, u64 delay
),
468 * Tracepoint for accounting iowait time (time the task is not runnable
469 * due to waiting on IO to complete).
471 LTTNG_TRACEPOINT_EVENT_INSTANCE(sched_stat_template
, sched_stat_iowait
,
472 TP_PROTO(struct task_struct
*tsk
, u64 delay
),
475 #if (LINUX_VERSION_CODE >= KERNEL_VERSION(3,3,0))
477 * Tracepoint for accounting blocked time (time the task is in the uninterruptible state).
479 LTTNG_TRACEPOINT_EVENT_INSTANCE(sched_stat_template
, sched_stat_blocked
,
480 TP_PROTO(struct task_struct
*tsk
, u64 delay
),
485 * Tracepoint for accounting runtime (time the task is executing).
488 LTTNG_TRACEPOINT_EVENT(sched_stat_runtime
,
490 TP_PROTO(struct task_struct
*tsk
, u64 runtime
, u64 vruntime
),
492 TP_ARGS(tsk
, runtime
, vruntime
),
495 ctf_array_text(char, comm
, tsk
->comm
, TASK_COMM_LEN
)
496 ctf_integer(pid_t
, tid
, tsk
->pid
)
497 ctf_integer(u64
, runtime
, runtime
)
498 ctf_integer(u64
, vruntime
, vruntime
)
502 #if (LINUX_VERSION_CODE >= KERNEL_VERSION(4,12,0) || \
503 LTTNG_RT_KERNEL_RANGE(4,9,27,18, 4,10,0,0) || \
504 LTTNG_RT_KERNEL_RANGE(4,11,5,1, 4,12,0,0))
506 * Tracepoint for showing priority inheritance modifying a task's priority.
509 LTTNG_TRACEPOINT_EVENT(sched_pi_setprio
,
511 TP_PROTO(struct task_struct
*tsk
, struct task_struct
*pi_task
),
513 TP_ARGS(tsk
, pi_task
),
516 ctf_array_text(char, comm
, tsk
->comm
, TASK_COMM_LEN
)
517 ctf_integer(pid_t
, tid
, tsk
->pid
)
518 ctf_integer(int, oldprio
, tsk
->prio
- MAX_RT_PRIO
)
519 ctf_integer(int, newprio
, pi_task
? pi_task
->prio
- MAX_RT_PRIO
: tsk
->prio
- MAX_RT_PRIO
)
524 * Tracepoint for showing priority inheritance modifying a task's priority.
527 LTTNG_TRACEPOINT_EVENT(sched_pi_setprio
,
529 TP_PROTO(struct task_struct
*tsk
, int newprio
),
531 TP_ARGS(tsk
, newprio
),
534 ctf_array_text(char, comm
, tsk
->comm
, TASK_COMM_LEN
)
535 ctf_integer(pid_t
, tid
, tsk
->pid
)
536 ctf_integer(int, oldprio
, tsk
->prio
- MAX_RT_PRIO
)
537 ctf_integer(int, newprio
, newprio
- MAX_RT_PRIO
)
542 #endif /* LTTNG_TRACE_SCHED_H */
544 /* This part must be outside protection */
545 #include <probes/define_trace.h>
This page took 0.041836 seconds and 5 git commands to generate.