/* sched.h - scheduler tracepoint event definitions (TRACE_SYSTEM "sched") */
/* All events declared in this header are grouped under the "sched" system. */
#undef TRACE_SYSTEM
#define TRACE_SYSTEM sched

/*
 * Include guard. The body is read again whenever TRACE_HEADER_MULTI_READ
 * is defined, even if _TRACE_SCHED_H has already been set.
 */
#if !defined(_TRACE_SCHED_H) || defined(TRACE_HEADER_MULTI_READ)
#define _TRACE_SCHED_H

#include <linux/sched.h>
#include <linux/tracepoint.h>
#include <linux/binfmts.h>

/*
 * Tracepoint for calling kthread_stop, performed to end a kthread.
 *
 * @t: task whose comm and pid are copied into the trace record.
 *
 * Printed as "comm=<comm> pid=<pid>".
 */
TRACE_EVENT(sched_kthread_stop,

	TP_PROTO(struct task_struct *t),

	TP_ARGS(t),

	TP_STRUCT__entry(
		__array(	char,	comm,	TASK_COMM_LEN	)
		__field(	pid_t,	pid			)
	),

	TP_fast_assign(
		memcpy(__entry->comm, t->comm, TASK_COMM_LEN);
		__entry->pid	= t->pid;
	),

	TP_printk("comm=%s pid=%d", __entry->comm, __entry->pid)
);

/*
 * Tracepoint for the return value of the kthread stopping.
 *
 * @ret: value stored verbatim in the record and printed as "ret=<ret>".
 */
TRACE_EVENT(sched_kthread_stop_ret,

	TP_PROTO(int ret),

	TP_ARGS(ret),

	TP_STRUCT__entry(
		__field(	int,	ret	)
	),

	TP_fast_assign(
		__entry->ret	= ret;
	),

	TP_printk("ret=%d", __entry->ret)
);

/*
 * Tracepoint for waking up a task:
 */
56
DECLARE_EVENT_CLASS(sched_wakeup_template,
57

58
	TP_PROTO(struct task_struct *p, int success),
59

60
	TP_ARGS(__perf_task(p), success),
61 62 63 64 65 66

	TP_STRUCT__entry(
		__array(	char,	comm,	TASK_COMM_LEN	)
		__field(	pid_t,	pid			)
		__field(	int,	prio			)
		__field(	int,	success			)
67
		__field(	int,	target_cpu		)
68 69 70 71 72 73 74
	),

	TP_fast_assign(
		memcpy(__entry->comm, p->comm, TASK_COMM_LEN);
		__entry->pid		= p->pid;
		__entry->prio		= p->prio;
		__entry->success	= success;
75
		__entry->target_cpu	= task_cpu(p);
76 77
	),

78
	TP_printk("comm=%s pid=%d prio=%d success=%d target_cpu=%03d",
79
		  __entry->comm, __entry->pid, __entry->prio,
80
		  __entry->success, __entry->target_cpu)
81 82
);

83
DEFINE_EVENT(sched_wakeup_template, sched_wakeup,
84 85
	     TP_PROTO(struct task_struct *p, int success),
	     TP_ARGS(p, success));
86

87 88 89
/*
 * Tracepoint for waking up a new task:
 */
90
DEFINE_EVENT(sched_wakeup_template, sched_wakeup_new,
91 92
	     TP_PROTO(struct task_struct *p, int success),
	     TP_ARGS(p, success));
93

94 95 96 97 98 99 100 101 102
#ifdef CREATE_TRACE_POINTS
/*
 * Compute the prev_state value recorded by the sched_switch tracepoint.
 *
 * Returns p->state. With CONFIG_PREEMPT, a task whose preempt count has
 * PREEMPT_ACTIVE set is instead reported as TASK_RUNNING with the
 * TASK_STATE_MAX bit or'ed in; sched_switch prints that extra bit as "+".
 */
static inline long __trace_sched_switch_state(struct task_struct *p)
{
	long state = p->state;

#ifdef CONFIG_PREEMPT
	/*
	 * For all intents and purposes a preempted task is a running task.
	 */
	if (task_preempt_count(p) & PREEMPT_ACTIVE)
		state = TASK_RUNNING | TASK_STATE_MAX;
#endif

	return state;
}
#endif

/*
 * Tracepoint for task switches, performed by the scheduler:
 */
TRACE_EVENT(sched_switch,

116
	TP_PROTO(struct task_struct *prev,
117 118
		 struct task_struct *next),

119
	TP_ARGS(prev, next),
120 121 122 123 124

	TP_STRUCT__entry(
		__array(	char,	prev_comm,	TASK_COMM_LEN	)
		__field(	pid_t,	prev_pid			)
		__field(	int,	prev_prio			)
125
		__field(	long,	prev_state			)
126 127 128 129 130 131 132 133 134
		__array(	char,	next_comm,	TASK_COMM_LEN	)
		__field(	pid_t,	next_pid			)
		__field(	int,	next_prio			)
	),

	TP_fast_assign(
		memcpy(__entry->next_comm, next->comm, TASK_COMM_LEN);
		__entry->prev_pid	= prev->pid;
		__entry->prev_prio	= prev->prio;
135
		__entry->prev_state	= __trace_sched_switch_state(prev);
136 137 138 139 140
		memcpy(__entry->prev_comm, prev->comm, TASK_COMM_LEN);
		__entry->next_pid	= next->pid;
		__entry->next_prio	= next->prio;
	),

141
	TP_printk("prev_comm=%s prev_pid=%d prev_prio=%d prev_state=%s%s ==> next_comm=%s next_pid=%d next_prio=%d",
142
		__entry->prev_comm, __entry->prev_pid, __entry->prev_prio,
143 144
		__entry->prev_state & (TASK_STATE_MAX-1) ?
		  __print_flags(__entry->prev_state & (TASK_STATE_MAX-1), "|",
145 146
				{ 1, "S"} , { 2, "D" }, { 4, "T" }, { 8, "t" },
				{ 16, "Z" }, { 32, "X" }, { 64, "x" },
147
				{ 128, "K" }, { 256, "W" }, { 512, "P" }) : "R",
148
		__entry->prev_state & TASK_STATE_MAX ? "+" : "",
149 150 151 152 153 154 155 156
		__entry->next_comm, __entry->next_pid, __entry->next_prio)
);

/*
 * Tracepoint for a task being migrated:
 */
TRACE_EVENT(sched_migrate_task,

157
	TP_PROTO(struct task_struct *p, int dest_cpu),
158

159
	TP_ARGS(p, dest_cpu),
160 161 162 163 164 165 166 167 168 169 170 171 172

	TP_STRUCT__entry(
		__array(	char,	comm,	TASK_COMM_LEN	)
		__field(	pid_t,	pid			)
		__field(	int,	prio			)
		__field(	int,	orig_cpu		)
		__field(	int,	dest_cpu		)
	),

	TP_fast_assign(
		memcpy(__entry->comm, p->comm, TASK_COMM_LEN);
		__entry->pid		= p->pid;
		__entry->prio		= p->prio;
173
		__entry->orig_cpu	= task_cpu(p);
174 175 176
		__entry->dest_cpu	= dest_cpu;
	),

177
	TP_printk("comm=%s pid=%d prio=%d orig_cpu=%d dest_cpu=%d",
178 179 180 181
		  __entry->comm, __entry->pid, __entry->prio,
		  __entry->orig_cpu, __entry->dest_cpu)
);

182
DECLARE_EVENT_CLASS(sched_process_template,
183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 199

	TP_PROTO(struct task_struct *p),

	TP_ARGS(p),

	TP_STRUCT__entry(
		__array(	char,	comm,	TASK_COMM_LEN	)
		__field(	pid_t,	pid			)
		__field(	int,	prio			)
	),

	TP_fast_assign(
		memcpy(__entry->comm, p->comm, TASK_COMM_LEN);
		__entry->pid		= p->pid;
		__entry->prio		= p->prio;
	),

200
	TP_printk("comm=%s pid=%d prio=%d",
201 202 203 204
		  __entry->comm, __entry->pid, __entry->prio)
);

/*
205
 * Tracepoint for freeing a task:
206
 */
207 208 209 210
DEFINE_EVENT(sched_process_template, sched_process_free,
	     TP_PROTO(struct task_struct *p),
	     TP_ARGS(p));
	     
211

212 213 214 215 216 217
/*
 * Tracepoint for a task exiting.
 *
 * Instance of the sched_process_template event class, so the record holds
 * the comm, pid and prio of @p.
 */
DEFINE_EVENT(sched_process_template, sched_process_exit,
	     TP_PROTO(struct task_struct *p),
	     TP_ARGS(p));
/*
 * Tracepoint for waiting on a task to unschedule.
 *
 * Instance of the sched_process_template event class, so the record holds
 * the comm, pid and prio of @p.
 */
DEFINE_EVENT(sched_process_template, sched_wait_task,
	TP_PROTO(struct task_struct *p),
	TP_ARGS(p));

/*
 * Tracepoint for a waiting task.
 *
 * @pid: struct pid being waited on; recorded as pid_nr(pid).
 *
 * The comm and prio fields come from "current" (the task emitting the
 * event), not from the task identified by @pid.
 */
TRACE_EVENT(sched_process_wait,

	TP_PROTO(struct pid *pid),

	TP_ARGS(pid),

	TP_STRUCT__entry(
		__array(	char,	comm,	TASK_COMM_LEN	)
		__field(	pid_t,	pid			)
		__field(	int,	prio			)
	),

	TP_fast_assign(
		memcpy(__entry->comm, current->comm, TASK_COMM_LEN);
		__entry->pid		= pid_nr(pid);
		__entry->prio		= current->prio;
	),

	TP_printk("comm=%s pid=%d prio=%d",
		  __entry->comm, __entry->pid, __entry->prio)
);

/*
 * Tracepoint for do_fork.
 *
 * @parent: forking task; comm and pid are recorded as parent_comm and
 *          parent_pid.
 * @child:  newly created task; comm and pid are recorded as child_comm
 *          and child_pid.
 *
 * In the printed output the parent fields carry the bare "comm=" and
 * "pid=" labels, while the child fields are prefixed with "child_".
 */
TRACE_EVENT(sched_process_fork,

	TP_PROTO(struct task_struct *parent, struct task_struct *child),

	TP_ARGS(parent, child),

	TP_STRUCT__entry(
		__array(	char,	parent_comm,	TASK_COMM_LEN	)
		__field(	pid_t,	parent_pid			)
		__array(	char,	child_comm,	TASK_COMM_LEN	)
		__field(	pid_t,	child_pid			)
	),

	TP_fast_assign(
		memcpy(__entry->parent_comm, parent->comm, TASK_COMM_LEN);
		__entry->parent_pid	= parent->pid;
		memcpy(__entry->child_comm, child->comm, TASK_COMM_LEN);
		__entry->child_pid	= child->pid;
	),

	TP_printk("comm=%s pid=%d child_comm=%s child_pid=%d",
		__entry->parent_comm, __entry->parent_pid,
		__entry->child_comm, __entry->child_pid)
);

/*
 * Tracepoint for exec.
 *
 * @p:       task performing the exec; p->pid is recorded as pid.
 * @old_pid: caller-supplied pid value, stored verbatim.
 * @bprm:    binary parameters; bprm->filename is copied into the record
 *           as a string.
 */
TRACE_EVENT(sched_process_exec,

	TP_PROTO(struct task_struct *p, pid_t old_pid,
		 struct linux_binprm *bprm),

	TP_ARGS(p, old_pid, bprm),

	TP_STRUCT__entry(
		__string(	filename,	bprm->filename	)
		__field(	pid_t,		pid		)
		__field(	pid_t,		old_pid		)
	),

	TP_fast_assign(
		__assign_str(filename, bprm->filename);
		__entry->pid		= p->pid;
		__entry->old_pid	= old_pid;
	),

	TP_printk("filename=%s pid=%d old_pid=%d", __get_str(filename),
		  __entry->pid, __entry->old_pid)
);

/*
 * XXX the below sched_stat tracepoints only apply to SCHED_OTHER/BATCH/IDLE
 *     adding sched_stat support to SCHED_FIFO/RR would be welcome.
 */
309
DECLARE_EVENT_CLASS(sched_stat_template,
310 311 312

	TP_PROTO(struct task_struct *tsk, u64 delay),

313
	TP_ARGS(__perf_task(tsk), __perf_count(delay)),
314 315 316 317 318 319 320 321 322 323 324 325 326

	TP_STRUCT__entry(
		__array( char,	comm,	TASK_COMM_LEN	)
		__field( pid_t,	pid			)
		__field( u64,	delay			)
	),

	TP_fast_assign(
		memcpy(__entry->comm, tsk->comm, TASK_COMM_LEN);
		__entry->pid	= tsk->pid;
		__entry->delay	= delay;
	),

327
	TP_printk("comm=%s pid=%d delay=%Lu [ns]",
328 329 330 331
			__entry->comm, __entry->pid,
			(unsigned long long)__entry->delay)
);

332 333 334 335 336 337 338 339 340 341 342 343 344

/*
 * Tracepoint for accounting wait time (time the task is runnable
 * but not actually running due to scheduler contention).
 *
 * Instance of the sched_stat_template event class: the record holds the
 * comm and pid of @tsk plus @delay.
 */
DEFINE_EVENT(sched_stat_template, sched_stat_wait,
	     TP_PROTO(struct task_struct *tsk, u64 delay),
	     TP_ARGS(tsk, delay));

/*
 * Tracepoint for accounting sleep time (time the task is not runnable,
 * including iowait, see below).
 */
345 346 347
DEFINE_EVENT(sched_stat_template, sched_stat_sleep,
	     TP_PROTO(struct task_struct *tsk, u64 delay),
	     TP_ARGS(tsk, delay));
348 349 350 351 352

/*
 * Tracepoint for accounting iowait time (time the task is not runnable
 * due to waiting on IO to complete).
 */
353 354 355
DEFINE_EVENT(sched_stat_template, sched_stat_iowait,
	     TP_PROTO(struct task_struct *tsk, u64 delay),
	     TP_ARGS(tsk, delay));
356

357 358 359 360 361 362 363
/*
 * Tracepoint for accounting blocked time (time the task is in
 * uninterruptible sleep).
 *
 * Instance of the sched_stat_template event class: the record holds the
 * comm and pid of @tsk plus @delay.
 */
DEFINE_EVENT(sched_stat_template, sched_stat_blocked,
	     TP_PROTO(struct task_struct *tsk, u64 delay),
	     TP_ARGS(tsk, delay));

/*
 * Tracepoint for accounting runtime (time the task is executing
 * on a CPU).
 */
368
DECLARE_EVENT_CLASS(sched_stat_runtime,
369 370 371

	TP_PROTO(struct task_struct *tsk, u64 runtime, u64 vruntime),

372
	TP_ARGS(tsk, __perf_count(runtime), vruntime),
373 374 375 376 377 378 379 380 381 382 383 384 385 386 387

	TP_STRUCT__entry(
		__array( char,	comm,	TASK_COMM_LEN	)
		__field( pid_t,	pid			)
		__field( u64,	runtime			)
		__field( u64,	vruntime			)
	),

	TP_fast_assign(
		memcpy(__entry->comm, tsk->comm, TASK_COMM_LEN);
		__entry->pid		= tsk->pid;
		__entry->runtime	= runtime;
		__entry->vruntime	= vruntime;
	),

388
	TP_printk("comm=%s pid=%d runtime=%Lu [ns] vruntime=%Lu [ns]",
389 390 391 392 393
			__entry->comm, __entry->pid,
			(unsigned long long)__entry->runtime,
			(unsigned long long)__entry->vruntime)
);

394 395 396 397
/*
 * sched_stat_runtime: the single event instantiated from the event class
 * of the same name; record layout and output format come from that class.
 */
DEFINE_EVENT(sched_stat_runtime, sched_stat_runtime,
	     TP_PROTO(struct task_struct *tsk, u64 runtime, u64 vruntime),
	     TP_ARGS(tsk, runtime, vruntime));

/*
 * Tracepoint emitted when priority inheritance modifies a task's
 * priority.
 *
 * @tsk:     task being changed; comm and pid are recorded, and tsk->prio
 *           at the time of the event is stored as oldprio.
 * @newprio: caller-supplied priority, stored verbatim.
 */
TRACE_EVENT(sched_pi_setprio,

	TP_PROTO(struct task_struct *tsk, int newprio),

	TP_ARGS(tsk, newprio),

	TP_STRUCT__entry(
		__array(	char,	comm,	TASK_COMM_LEN	)
		__field(	pid_t,	pid			)
		__field(	int,	oldprio			)
		__field(	int,	newprio			)
	),

	TP_fast_assign(
		__entry->pid = tsk->pid;
		__entry->oldprio = tsk->prio;
		__entry->newprio = newprio;
		memcpy(__entry->comm, tsk->comm, TASK_COMM_LEN);
	),

	TP_printk("comm=%s pid=%d oldprio=%d newprio=%d",
		  __entry->comm,
		  __entry->pid,
		  __entry->oldprio,
		  __entry->newprio)
);

#ifdef CONFIG_DETECT_HUNG_TASK
/*
 * Tracepoint carrying the comm and pid of @tsk; only built when
 * CONFIG_DETECT_HUNG_TASK is set.
 */
TRACE_EVENT(sched_process_hang,

	TP_PROTO(struct task_struct *tsk),

	TP_ARGS(tsk),

	TP_STRUCT__entry(
		__array(	char,	comm,	TASK_COMM_LEN	)
		__field(	pid_t,	pid			)
	),

	TP_fast_assign(
		__entry->pid	= tsk->pid;
		memcpy(__entry->comm, tsk->comm, TASK_COMM_LEN);
	),

	TP_printk("comm=%s pid=%d",
		  __entry->comm,
		  __entry->pid)
);
#endif /* CONFIG_DETECT_HUNG_TASK */

#endif /* _TRACE_SCHED_H */

/* This part must be outside protection */
#include <trace/define_trace.h>