/*
 * kernel/time/sched_debug.c
 *
 * Print the CFS rbtree
 *
 * Copyright(C) 2007, Red Hat, Inc., Ingo Molnar
 *
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License version 2 as
 * published by the Free Software Foundation.
 */

#include <linux/proc_fs.h>
#include <linux/sched.h>
#include <linux/seq_file.h>
#include <linux/kallsyms.h>
#include <linux/utsname.h>

/*
 * Single print helper for both output paths: with a non-NULL seq_file
 * @m the text is emitted through seq_printf() (the /proc/sched_debug
 * case); with a NULL @m it is sent to the console through printk().
 */
#define SEQ_printf(m, ...)				\
 do {							\
	if (!(m))					\
		printk(__VA_ARGS__);			\
	else						\
		seq_printf(m, __VA_ARGS__);		\
 } while (0)

/*
 * Ease the printing of nsec fields:
 */
/*
 * Return the integral part of @nsec after scaling by 1000000, i.e.
 * nsec / 1000000 truncated towards zero, carrying the sign of @nsec.
 * It supplies the "%Ld" half of a "%Ld.%06ld" format pair.
 *
 * do_div() expects an unsigned 64-bit lvalue, so the division is done on
 * the magnitude held in an unsigned temporary rather than on the signed
 * parameter; the sign is re-applied to the quotient afterwards. Negating
 * in the unsigned domain also keeps the most negative input well defined.
 */
static long long nsec_high(long long nsec)
{
	unsigned long long magnitude = nsec;

	if (nsec < 0)
		magnitude = -magnitude;

	do_div(magnitude, 1000000);

	return nsec < 0 ? -(long long)magnitude : (long long)magnitude;
}

/*
 * Return the fractional part of @nsec after scaling by 1000000, i.e.
 * |nsec| % 1000000. The result is always non-negative and supplies the
 * "%06ld" half of a "%Ld.%06ld" format pair.
 *
 * do_div() expects an unsigned 64-bit lvalue, so the remainder is taken
 * from the magnitude held in an unsigned temporary rather than from the
 * signed parameter itself.
 */
static unsigned long nsec_low(long long nsec)
{
	unsigned long long magnitude = nsec;

	if (nsec < 0)
		magnitude = -magnitude;

	return do_div(magnitude, 1000000);
}

/*
 * Expand a nanosecond value into the two arguments consumed by a
 * "%Ld.%06ld" format pair. Note that @x is evaluated twice, so it must
 * not have side effects.
 */
#define SPLIT_NS(x) nsec_high(x), nsec_low(x)

static void
57
print_task(struct seq_file *m, struct rq *rq, struct task_struct *p)
I
Ingo Molnar 已提交
58 59 60 61 62 63
{
	if (rq->curr == p)
		SEQ_printf(m, "R");
	else
		SEQ_printf(m, " ");

I
Ingo Molnar 已提交
64
	SEQ_printf(m, "%15s %5d %9Ld.%06ld %9Ld %5d ",
I
Ingo Molnar 已提交
65
		p->comm, p->pid,
I
Ingo Molnar 已提交
66
		SPLIT_NS(p->se.vruntime),
I
Ingo Molnar 已提交
67
		(long long)(p->nvcsw + p->nivcsw),
68
		p->prio);
I
Ingo Molnar 已提交
69
#ifdef CONFIG_SCHEDSTATS
70
	SEQ_printf(m, "%9Ld.%06ld %9Ld.%06ld %9Ld.%06ld\n",
I
Ingo Molnar 已提交
71 72 73
		SPLIT_NS(p->se.vruntime),
		SPLIT_NS(p->se.sum_exec_runtime),
		SPLIT_NS(p->se.sum_sleep_runtime));
I
Ingo Molnar 已提交
74
#else
I
Ingo Molnar 已提交
75 76
	SEQ_printf(m, "%15Ld %15Ld %15Ld.%06ld %15Ld.%06ld %15Ld.%06ld\n",
		0LL, 0LL, 0LL, 0L, 0LL, 0L, 0LL, 0L);
I
Ingo Molnar 已提交
77
#endif
I
Ingo Molnar 已提交
78 79
}

static void print_rq(struct seq_file *m, struct rq *rq, int rq_cpu)
I
Ingo Molnar 已提交
81 82 83 84 85
{
	struct task_struct *g, *p;

	SEQ_printf(m,
	"\nrunnable tasks:\n"
86 87
	"            task   PID         tree-key  switches  prio"
	"     exec-runtime         sum-exec        sum-sleep\n"
88
	"------------------------------------------------------"
89
	"----------------------------------------------------\n");
I
Ingo Molnar 已提交
90 91 92 93 94 95 96

	read_lock_irq(&tasklist_lock);

	do_each_thread(g, p) {
		if (!p->se.on_rq || task_cpu(p) != rq_cpu)
			continue;

97
		print_task(m, rq, p);
I
Ingo Molnar 已提交
98 99 100 101 102
	} while_each_thread(g, p);

	read_unlock_irq(&tasklist_lock);
}

void print_cfs_rq(struct seq_file *m, int cpu, struct cfs_rq *cfs_rq)
I
Ingo Molnar 已提交
104
{
I
Ingo Molnar 已提交
105 106
	s64 MIN_vruntime = -1, min_vruntime, max_vruntime = -1,
		spread, rq0_min_vruntime, spread0;
I
Ingo Molnar 已提交
107 108 109 110
	struct rq *rq = &per_cpu(runqueues, cpu);
	struct sched_entity *last;
	unsigned long flags;

111
	SEQ_printf(m, "\ncfs_rq\n");
I
Ingo Molnar 已提交
112

I
Ingo Molnar 已提交
113 114
	SEQ_printf(m, "  .%-30s: %Ld.%06ld\n", "exec_clock",
			SPLIT_NS(cfs_rq->exec_clock));
I
Ingo Molnar 已提交
115 116 117 118 119 120 121

	spin_lock_irqsave(&rq->lock, flags);
	if (cfs_rq->rb_leftmost)
		MIN_vruntime = (__pick_next_entity(cfs_rq))->vruntime;
	last = __pick_last_entity(cfs_rq);
	if (last)
		max_vruntime = last->vruntime;
I
Ingo Molnar 已提交
122 123
	min_vruntime = rq->cfs.min_vruntime;
	rq0_min_vruntime = per_cpu(runqueues, 0).cfs.min_vruntime;
I
Ingo Molnar 已提交
124
	spin_unlock_irqrestore(&rq->lock, flags);
I
Ingo Molnar 已提交
125 126 127 128 129 130
	SEQ_printf(m, "  .%-30s: %Ld.%06ld\n", "MIN_vruntime",
			SPLIT_NS(MIN_vruntime));
	SEQ_printf(m, "  .%-30s: %Ld.%06ld\n", "min_vruntime",
			SPLIT_NS(min_vruntime));
	SEQ_printf(m, "  .%-30s: %Ld.%06ld\n", "max_vruntime",
			SPLIT_NS(max_vruntime));
I
Ingo Molnar 已提交
131
	spread = max_vruntime - MIN_vruntime;
I
Ingo Molnar 已提交
132 133
	SEQ_printf(m, "  .%-30s: %Ld.%06ld\n", "spread",
			SPLIT_NS(spread));
I
Ingo Molnar 已提交
134
	spread0 = min_vruntime - rq0_min_vruntime;
I
Ingo Molnar 已提交
135 136
	SEQ_printf(m, "  .%-30s: %Ld.%06ld\n", "spread0",
			SPLIT_NS(spread0));
137 138
	SEQ_printf(m, "  .%-30s: %ld\n", "nr_running", cfs_rq->nr_running);
	SEQ_printf(m, "  .%-30s: %ld\n", "load", cfs_rq->load.weight);
139
#ifdef CONFIG_SCHEDSTATS
I
Ingo Molnar 已提交
140 141
	SEQ_printf(m, "  .%-30s: %ld\n", "bkl_cnt",
			rq->bkl_cnt);
142
#endif
P
Peter Zijlstra 已提交
143 144
	SEQ_printf(m, "  .%-30s: %ld\n", "nr_spread_over",
			cfs_rq->nr_spread_over);
I
Ingo Molnar 已提交
145 146
}

static void print_cpu(struct seq_file *m, int cpu)
I
Ingo Molnar 已提交
148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163
{
	struct rq *rq = &per_cpu(runqueues, cpu);

#ifdef CONFIG_X86
	{
		unsigned int freq = cpu_khz ? : 1;

		SEQ_printf(m, "\ncpu#%d, %u.%03u MHz\n",
			   cpu, freq / 1000, (freq % 1000));
	}
#else
	SEQ_printf(m, "\ncpu#%d\n", cpu);
#endif

#define P(x) \
	SEQ_printf(m, "  .%-30s: %Ld\n", #x, (long long)(rq->x))
I
Ingo Molnar 已提交
164 165
#define PN(x) \
	SEQ_printf(m, "  .%-30s: %Ld.%06ld\n", #x, SPLIT_NS(rq->x))
I
Ingo Molnar 已提交
166 167 168

	P(nr_running);
	SEQ_printf(m, "  .%-30s: %lu\n", "load",
169
		   rq->load.weight);
I
Ingo Molnar 已提交
170 171 172 173
	P(nr_switches);
	P(nr_load_updates);
	P(nr_uninterruptible);
	SEQ_printf(m, "  .%-30s: %lu\n", "jiffies", jiffies);
I
Ingo Molnar 已提交
174
	PN(next_balance);
I
Ingo Molnar 已提交
175
	P(curr->pid);
I
Ingo Molnar 已提交
176 177 178
	PN(clock);
	PN(idle_clock);
	PN(prev_clock_raw);
I
Ingo Molnar 已提交
179 180
	P(clock_warps);
	P(clock_overflows);
181
	P(clock_deep_idle_events);
I
Ingo Molnar 已提交
182
	PN(clock_max_delta);
I
Ingo Molnar 已提交
183 184 185 186 187 188
	P(cpu_load[0]);
	P(cpu_load[1]);
	P(cpu_load[2]);
	P(cpu_load[3]);
	P(cpu_load[4]);
#undef P
I
Ingo Molnar 已提交
189
#undef PN
I
Ingo Molnar 已提交
190

191
	print_cfs_stats(m, cpu);
I
Ingo Molnar 已提交
192

193
	print_rq(m, rq, cpu);
I
Ingo Molnar 已提交
194 195 196 197 198 199 200
}

static int sched_debug_show(struct seq_file *m, void *v)
{
	u64 now = ktime_to_ns(ktime_get());
	int cpu;

I
Ingo Molnar 已提交
201
	SEQ_printf(m, "Sched Debug Version: v0.05-v20, %s %.*s\n",
I
Ingo Molnar 已提交
202 203 204 205
		init_utsname()->release,
		(int)strcspn(init_utsname()->version, " "),
		init_utsname()->version);

I
Ingo Molnar 已提交
206
	SEQ_printf(m, "now at %Lu.%06ld msecs\n", SPLIT_NS(now));
I
Ingo Molnar 已提交
207

I
Ingo Molnar 已提交
208
#define P(x) \
209
	SEQ_printf(m, "  .%-40s: %Ld\n", #x, (long long)(x))
I
Ingo Molnar 已提交
210
#define PN(x) \
211
	SEQ_printf(m, "  .%-40s: %Ld.%06ld\n", #x, SPLIT_NS(x))
I
Ingo Molnar 已提交
212 213 214 215 216 217 218 219 220
	PN(sysctl_sched_latency);
	PN(sysctl_sched_min_granularity);
	PN(sysctl_sched_wakeup_granularity);
	PN(sysctl_sched_batch_wakeup_granularity);
	PN(sysctl_sched_child_runs_first);
	P(sysctl_sched_features);
#undef PN
#undef P

I
Ingo Molnar 已提交
221
	for_each_online_cpu(cpu)
222
		print_cpu(m, cpu);
I
Ingo Molnar 已提交
223 224 225 226 227 228

	SEQ_printf(m, "\n");

	return 0;
}

static void sysrq_sched_debug_show(void)
I
Ingo Molnar 已提交
230 231 232 233
{
	sched_debug_show(NULL, NULL);
}

#ifdef CONFIG_FAIR_USER_SCHED

/*
 * Held by root_user_share_write_proc() while it stores the new value in
 * init_task_grp_load and applies it with sched_group_set_shares().
 */
static DEFINE_MUTEX(root_user_share_mutex);

/*
 * procfs read_proc handler for "root_user_share": formats
 * init_task_grp_load as a decimal number followed by a newline into
 * @page and returns the number of characters written.
 *
 * @start, @off, @count, @eof and @data are not used.
 */
static int
root_user_share_read_proc(char *page, char **start, off_t off, int count,
				 int *eof, void *data)
{
	return sprintf(page, "%d\n", init_task_grp_load);
}

/*
 * procfs write_proc handler for "root_user_share": parses an unsigned
 * number from the user buffer and installs it as the share value of
 * init_task_grp.
 *
 * @buffer: user-space text to parse (base auto-detected by
 *          simple_strtoul() with base 0).
 * @count:  number of bytes the caller supplied in @buffer.
 * @file, @data: unused.
 *
 * A parsed value of 0 selects NICE_0_LOAD. Returns @count on success,
 * -EFAULT if the user buffer cannot be read, or the negative error from
 * sched_group_set_shares().
 */
static int
root_user_share_write_proc(struct file *file, const char __user *buffer,
				 unsigned long count, void *data)
{
	unsigned long shares;
	unsigned long len = count;
	/*
	 * Large enough for any unsigned long written in decimal, hex or
	 * octal (at most 23 characters for 64 bits) plus the terminator.
	 */
	char kbuf[24];
	int rc = 0;

	/*
	 * Copy no more than the caller actually wrote, and always leave
	 * room for the terminating NUL that simple_strtoul() relies on.
	 */
	if (len > sizeof(kbuf) - 1)
		len = sizeof(kbuf) - 1;

	if (copy_from_user(kbuf, buffer, len))
		return -EFAULT;
	kbuf[len] = '\0';

	shares = simple_strtoul(kbuf, NULL, 0);

	if (!shares)
		shares = NICE_0_LOAD;

	mutex_lock(&root_user_share_mutex);

	init_task_grp_load = shares;
	rc = sched_group_set_shares(&init_task_grp, shares);

	mutex_unlock(&root_user_share_mutex);

	return (rc < 0 ? rc : count);
}

#endif	/* CONFIG_FAIR_USER_SCHED */

/*
 * open() handler for the sched_debug file: sets up a single-shot
 * seq_file on @filp whose show callback is sched_debug_show(), with no
 * private data. @inode is unused. Returns the result of single_open().
 */
static int sched_debug_open(struct inode *inode, struct file *filp)
{
	return single_open(filp, sched_debug_show, NULL);
}

static struct file_operations sched_debug_fops = {
	.open		= sched_debug_open,
	.read		= seq_read,
	.llseek		= seq_lseek,
286
	.release	= single_release,
I
Ingo Molnar 已提交
287 288 289 290 291 292 293 294 295 296 297 298
};

/*
 * Register the scheduler debug proc entries.
 *
 * Creates "sched_debug" and attaches sched_debug_fops to it; with
 * CONFIG_FAIR_USER_SCHED also creates "root_user_share" with its
 * read/write handlers. Returns 0 on success or -ENOMEM if an entry
 * cannot be created.
 */
static int __init init_sched_debug_procfs(void)
{
	struct proc_dir_entry *pe;

	/*
	 * sched_debug_fops provides no write handler, so the entry is
	 * created read-only instead of advertising write permission.
	 */
	pe = create_proc_entry("sched_debug", 0444, NULL);
	if (!pe)
		return -ENOMEM;

	pe->proc_fops = &sched_debug_fops;

#ifdef CONFIG_FAIR_USER_SCHED
	/* This entry is writable: it has a write_proc handler. */
	pe = create_proc_entry("root_user_share", 0644, NULL);
	if (!pe)
		return -ENOMEM;

	pe->read_proc = root_user_share_read_proc;
	pe->write_proc = root_user_share_write_proc;
#endif

	return 0;
}

__initcall(init_sched_debug_procfs);

void proc_sched_show_task(struct task_struct *p, struct seq_file *m)
{
	unsigned long flags;
	int num_threads = 1;

	rcu_read_lock();
	if (lock_task_sighand(p, &flags)) {
		num_threads = atomic_read(&p->signal->count);
		unlock_task_sighand(p, &flags);
	}
	rcu_read_unlock();

	SEQ_printf(m, "%s (%d, #threads: %d)\n", p->comm, p->pid, num_threads);
	SEQ_printf(m, "----------------------------------------------\n");
#define P(F) \
	SEQ_printf(m, "%-25s:%20Ld\n", #F, (long long)p->F)
I
Ingo Molnar 已提交
329 330
#define PN(F) \
	SEQ_printf(m, "%-25s:%14Ld.%06ld\n", #F, SPLIT_NS((long long)p->F))
I
Ingo Molnar 已提交
331

I
Ingo Molnar 已提交
332 333 334
	PN(se.exec_start);
	PN(se.vruntime);
	PN(se.sum_exec_runtime);
I
Ingo Molnar 已提交
335 336

#ifdef CONFIG_SCHEDSTATS
I
Ingo Molnar 已提交
337 338 339 340 341 342 343 344
	PN(se.wait_start);
	PN(se.sleep_start);
	PN(se.block_start);
	PN(se.sleep_max);
	PN(se.block_max);
	PN(se.exec_max);
	PN(se.slice_max);
	PN(se.wait_max);
I
Ingo Molnar 已提交
345
	P(sched_info.bkl_cnt);
I
Ingo Molnar 已提交
346
#endif
I
Ingo Molnar 已提交
347 348 349 350 351 352
	SEQ_printf(m, "%-25s:%20Ld\n",
		   "nr_switches", (long long)(p->nvcsw + p->nivcsw));
	P(se.load.weight);
	P(policy);
	P(prio);
#undef P
I
Ingo Molnar 已提交
353
#undef PN
I
Ingo Molnar 已提交
354 355 356 357 358 359 360 361 362 363 364 365 366

	{
		u64 t0, t1;

		t0 = sched_clock();
		t1 = sched_clock();
		SEQ_printf(m, "%-25s:%20Ld\n",
			   "clock-delta", (long long)(t1-t0));
	}
}

void proc_sched_set_task(struct task_struct *p)
{
I
Ingo Molnar 已提交
367
#ifdef CONFIG_SCHEDSTATS
I
Ingo Molnar 已提交
368 369 370
	p->se.sleep_max			= 0;
	p->se.block_max			= 0;
	p->se.exec_max			= 0;
I
Ingo Molnar 已提交
371
	p->se.slice_max			= 0;
I
Ingo Molnar 已提交
372
	p->se.wait_max			= 0;
I
Ingo Molnar 已提交
373
	p->sched_info.bkl_cnt		= 0;
I
Ingo Molnar 已提交
374
#endif
I
Ingo Molnar 已提交
375
	p->se.sum_exec_runtime		= 0;
376
	p->se.prev_sum_exec_runtime	= 0;
I
Ingo Molnar 已提交
377
}