array.c 17.6 KB
Newer Older
L
Linus Torvalds 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42
/*
 *  linux/fs/proc/array.c
 *
 *  Copyright (C) 1992  by Linus Torvalds
 *  based on ideas by Darren Senn
 *
 * Fixes:
 * Michael. K. Johnson: stat,statm extensions.
 *                      <johnsonm@stolaf.edu>
 *
 * Pauline Middelink :  Made cmdline,envline only break at '\0's, to
 *                      make sure SET_PROCTITLE works. Also removed
 *                      bad '!' which forced address recalculation for
 *                      EVERY character on the current page.
 *                      <middelin@polyware.iaf.nl>
 *
 * Danny ter Haar    :	added cpuinfo
 *			<dth@cistron.nl>
 *
 * Alessandro Rubini :  profile extension.
 *                      <rubini@ipvvis.unipv.it>
 *
 * Jeff Tranter      :  added BogoMips field to cpuinfo
 *                      <Jeff_Tranter@Mitel.COM>
 *
 * Bruno Haible      :  remove 4K limit for the maps file
 *			<haible@ma2s2.mathematik.uni-karlsruhe.de>
 *
 * Yves Arrouye      :  remove removal of trailing spaces in get_array.
 *			<Yves.Arrouye@marin.fdn.fr>
 *
 * Jerome Forissier  :  added per-CPU time information to /proc/stat
 *                      and /proc/<pid>/cpu extension
 *                      <forissier@isia.cma.fr>
 *			- Incorporation and non-SMP safe operation
 *			of forissier patch in 2.1.78 by
 *			Hans Marcus <crowbar@concepts.nl>
 *
 * aeb@cwi.nl        :  /proc/partitions
 *
 *
 * Alan Cox	     :  security fixes.
 *			<alan@lxorguk.ukuu.org.uk>
 *
 * Al Viro           :  safe handling of mm_struct
 *
 * Gerhard Wichert   :  added BIGMEM support
 * Siemens AG           <Gerhard.Wichert@pdb.siemens.de>
 *
 * Al Viro & Jeff Garzik :  moved most of the thing into base.c and
 *			 :  proc_misc.c. The rest may eventually go into
 *			 :  base.c too.
 */

#include <linux/types.h>
#include <linux/errno.h>
#include <linux/time.h>
#include <linux/kernel.h>
#include <linux/kernel_stat.h>
#include <linux/tty.h>
#include <linux/string.h>
#include <linux/mman.h>
#include <linux/proc_fs.h>
#include <linux/ioport.h>
65 66
#include <linux/uaccess.h>
#include <linux/io.h>
L
Linus Torvalds 已提交
67 68 69 70 71 72 73 74
#include <linux/mm.h>
#include <linux/hugetlb.h>
#include <linux/pagemap.h>
#include <linux/swap.h>
#include <linux/smp.h>
#include <linux/signal.h>
#include <linux/highmem.h>
#include <linux/file.h>
A
Al Viro 已提交
75
#include <linux/fdtable.h>
L
Linus Torvalds 已提交
76 77
#include <linux/times.h>
#include <linux/cpuset.h>
78
#include <linux/rcupdate.h>
79
#include <linux/delayacct.h>
80
#include <linux/seq_file.h>
81
#include <linux/pid_namespace.h>
82
#include <linux/ptrace.h>
83
#include <linux/tracehook.h>
84
#include <linux/string_helpers.h>
85
#include <linux/user_namespace.h>
L
Linus Torvalds 已提交
86 87 88 89 90

#include <asm/pgtable.h>
#include <asm/processor.h>
#include "internal.h"

91
static inline void task_name(struct seq_file *m, struct task_struct *p)
L
Linus Torvalds 已提交
92
{
93
	char *buf;
L
Linus Torvalds 已提交
94 95 96 97
	char tcomm[sizeof(p->comm)];

	get_task_comm(tcomm, p);

98
	seq_puts(m, "Name:\t");
99
	buf = m->buf + m->count;
100 101 102 103 104

	/* Ignore error for now */
	string_escape_str(tcomm, &buf, m->size - m->count,
			  ESCAPE_SPACE | ESCAPE_SPECIAL, "\n\\");

105
	m->count = buf - m->buf;
106
	seq_putc(m, '\n');
L
Linus Torvalds 已提交
107 108 109 110 111 112 113 114
}

/*
 * The task state array is a strange "bitmap" of
 * reasons to sleep. Thus "running" is zero, and
 * you can test for combinations of others with
 * simple bit tests.
 */
M
Mike Frysinger 已提交
115
static const char * const task_state_array[] = {
	/*
	 * Looked up with fls() of the reportable state bits; the number
	 * in each trailing comment is the state bit value for that entry.
	 */
	"R (running)",		/*   0 */
	"S (sleeping)",		/*   1 */
	"D (disk sleep)",	/*   2 */
	"T (stopped)",		/*   4 */
	"t (tracing stop)",	/*   8 */
	"X (dead)",		/*  16 */
	"Z (zombie)",		/*  32 */
};

125
static inline const char *get_task_state(struct task_struct *tsk)
L
Linus Torvalds 已提交
126
{
127
	unsigned int state = (tsk->state | tsk->exit_state) & TASK_REPORT;
L
Linus Torvalds 已提交
128

129
	BUILD_BUG_ON(1 + ilog2(TASK_REPORT) != ARRAY_SIZE(task_state_array)-1);
130

131
	return task_state_array[fls(state)];
L
Linus Torvalds 已提交
132 133
}

134 135
static inline void task_state(struct seq_file *m, struct pid_namespace *ns,
				struct pid *pid, struct task_struct *p)
L
Linus Torvalds 已提交
136
{
137
	struct user_namespace *user_ns = seq_user_ns(m);
L
Linus Torvalds 已提交
138 139
	struct group_info *group_info;
	int g;
140
	struct task_struct *tracer;
141
	const struct cred *cred;
142
	pid_t ppid, tpid = 0, tgid, ngid;
143
	unsigned int max_fds = 0;
L
Linus Torvalds 已提交
144

145
	rcu_read_lock();
146 147
	ppid = pid_alive(p) ?
		task_tgid_nr_ns(rcu_dereference(p->real_parent), ns) : 0;
148 149 150 151

	tracer = ptrace_parent(p);
	if (tracer)
		tpid = task_pid_nr_ns(tracer, ns);
152 153 154

	tgid = task_tgid_nr_ns(p, ns);
	ngid = task_numa_group_id(p);
155
	cred = get_task_cred(p);
156 157 158 159 160

	task_lock(p);
	if (p->files)
		max_fds = files_fdtable(p->files)->max_fds;
	task_unlock(p);
161
	rcu_read_unlock();
162

163
	seq_printf(m,
L
Linus Torvalds 已提交
164 165
		"State:\t%s\n"
		"Tgid:\t%d\n"
166
		"Ngid:\t%d\n"
L
Linus Torvalds 已提交
167 168 169 170
		"Pid:\t%d\n"
		"PPid:\t%d\n"
		"TracerPid:\t%d\n"
		"Uid:\t%d\t%d\t%d\t%d\n"
171 172
		"Gid:\t%d\t%d\t%d\t%d\n"
		"FDSize:\t%d\nGroups:\t",
L
Linus Torvalds 已提交
173
		get_task_state(p),
174
		tgid, ngid, pid_nr_ns(pid, ns), ppid, tpid,
175 176 177 178 179 180 181
		from_kuid_munged(user_ns, cred->uid),
		from_kuid_munged(user_ns, cred->euid),
		from_kuid_munged(user_ns, cred->suid),
		from_kuid_munged(user_ns, cred->fsuid),
		from_kgid_munged(user_ns, cred->gid),
		from_kgid_munged(user_ns, cred->egid),
		from_kgid_munged(user_ns, cred->sgid),
182 183
		from_kgid_munged(user_ns, cred->fsgid),
		max_fds);
L
Linus Torvalds 已提交
184

185
	group_info = cred->group_info;
186
	for (g = 0; g < group_info->ngroups; g++)
187 188
		seq_printf(m, "%d ",
			   from_kgid_munged(user_ns, GROUP_AT(group_info, g)));
189
	put_cred(cred);
L
Linus Torvalds 已提交
190

191
	seq_putc(m, '\n');
L
Linus Torvalds 已提交
192 193
}

194
void render_sigset_t(struct seq_file *m, const char *header,
195
				sigset_t *set)
L
Linus Torvalds 已提交
196
{
197
	int i;
L
Linus Torvalds 已提交
198

199
	seq_puts(m, header);
L
Linus Torvalds 已提交
200 201 202 203 204 205 206 207 208 209

	i = _NSIG;
	do {
		int x = 0;

		i -= 4;
		if (sigismember(set, i+1)) x |= 1;
		if (sigismember(set, i+2)) x |= 2;
		if (sigismember(set, i+3)) x |= 4;
		if (sigismember(set, i+4)) x |= 8;
210
		seq_printf(m, "%x", x);
L
Linus Torvalds 已提交
211 212
	} while (i >= 4);

213
	seq_putc(m, '\n');
L
Linus Torvalds 已提交
214 215 216 217 218 219 220 221 222 223 224 225 226 227 228 229 230
}

/*
 * Sort every signal of @p by its installed handler: signals whose
 * handler is SIG_IGN are added to @ign, signals with any handler other
 * than SIG_DFL are added to @catch.  Signals left at SIG_DFL are added
 * to neither set.  The sets are only added to, never cleared here.
 */
static void collect_sigign_sigcatch(struct task_struct *p, sigset_t *ign,
				    sigset_t *catch)
{
	struct k_sigaction *actions = p->sighand->action;
	int signr;

	/* Signal numbers are 1-based, the action table is 0-based. */
	for (signr = 1; signr <= _NSIG; signr++) {
		struct k_sigaction *ka = &actions[signr - 1];

		if (ka->sa.sa_handler == SIG_IGN) {
			sigaddset(ign, signr);
			continue;
		}
		if (ka->sa.sa_handler != SIG_DFL)
			sigaddset(catch, signr);
	}
}

231
static inline void task_sig(struct seq_file *m, struct task_struct *p)
L
Linus Torvalds 已提交
232
{
233
	unsigned long flags;
L
Linus Torvalds 已提交
234 235 236 237 238 239 240 241 242 243 244
	sigset_t pending, shpending, blocked, ignored, caught;
	int num_threads = 0;
	unsigned long qsize = 0;
	unsigned long qlim = 0;

	sigemptyset(&pending);
	sigemptyset(&shpending);
	sigemptyset(&blocked);
	sigemptyset(&ignored);
	sigemptyset(&caught);

245
	if (lock_task_sighand(p, &flags)) {
L
Linus Torvalds 已提交
246 247 248 249
		pending = p->pending.signal;
		shpending = p->signal->shared_pending.signal;
		blocked = p->blocked;
		collect_sigign_sigcatch(p, &ignored, &caught);
250
		num_threads = get_nr_threads(p);
251
		rcu_read_lock();  /* FIXME: is this correct? */
252
		qsize = atomic_read(&__task_cred(p)->user->sigpending);
253
		rcu_read_unlock();
J
Jiri Slaby 已提交
254
		qlim = task_rlimit(p, RLIMIT_SIGPENDING);
255
		unlock_task_sighand(p, &flags);
L
Linus Torvalds 已提交
256 257
	}

258 259
	seq_printf(m, "Threads:\t%d\n", num_threads);
	seq_printf(m, "SigQ:\t%lu/%lu\n", qsize, qlim);
L
Linus Torvalds 已提交
260 261

	/* render them all */
262 263 264 265 266
	render_sigset_t(m, "SigPnd:\t", &pending);
	render_sigset_t(m, "ShdPnd:\t", &shpending);
	render_sigset_t(m, "SigBlk:\t", &blocked);
	render_sigset_t(m, "SigIgn:\t", &ignored);
	render_sigset_t(m, "SigCgt:\t", &caught);
L
Linus Torvalds 已提交
267 268
}

269 270
/*
 * Print @header followed by capability set @a as zero-padded 8-digit
 * hex words and a newline.  The words are emitted starting from index
 * CAP_LAST_U32 and counting down.
 */
static void render_cap_t(struct seq_file *m, const char *header,
			kernel_cap_t *a)
{
	unsigned __capi;

	seq_puts(m, header);
	CAP_FOR_EACH_U32(__capi) {
		seq_printf(m, "%08x",
			   a->cap[CAP_LAST_U32 - __capi]);
	}
	seq_putc(m, '\n');
}

282
static inline void task_cap(struct seq_file *m, struct task_struct *p)
L
Linus Torvalds 已提交
283
{
284 285
	const struct cred *cred;
	kernel_cap_t cap_inheritable, cap_permitted, cap_effective, cap_bset;
286

287 288 289 290 291 292 293 294 295 296 297 298
	rcu_read_lock();
	cred = __task_cred(p);
	cap_inheritable	= cred->cap_inheritable;
	cap_permitted	= cred->cap_permitted;
	cap_effective	= cred->cap_effective;
	cap_bset	= cred->cap_bset;
	rcu_read_unlock();

	render_cap_t(m, "CapInh:\t", &cap_inheritable);
	render_cap_t(m, "CapPrm:\t", &cap_permitted);
	render_cap_t(m, "CapEff:\t", &cap_effective);
	render_cap_t(m, "CapBnd:\t", &cap_bset);
L
Linus Torvalds 已提交
299 300
}

K
Kees Cook 已提交
301 302 303 304 305 306 307
/*
 * Emit the "Seccomp:" line with the task's seccomp mode.
 * Prints nothing when the kernel is built without CONFIG_SECCOMP.
 */
static inline void task_seccomp(struct seq_file *m, struct task_struct *p)
{
#ifdef CONFIG_SECCOMP
	seq_printf(m, "Seccomp:\t%d\n", p->seccomp.mode);
#endif
}

308 309
static inline void task_context_switch_counts(struct seq_file *m,
						struct task_struct *p)
310
{
311 312 313 314
	seq_printf(m,	"voluntary_ctxt_switches:\t%lu\n"
			"nonvoluntary_ctxt_switches:\t%lu\n",
			p->nvcsw,
			p->nivcsw);
315 316
}

317 318
/*
 * Emit the task's allowed-CPU mask twice: as a bitmap (Cpus_allowed,
 * "%*pb") and as a list (Cpus_allowed_list, "%*pbl").
 */
static void task_cpus_allowed(struct seq_file *m, struct task_struct *task)
{
	seq_printf(m, "Cpus_allowed:\t%*pb\n",
		   cpumask_pr_args(&task->cpus_allowed));
	seq_printf(m, "Cpus_allowed_list:\t%*pbl\n",
		   cpumask_pr_args(&task->cpus_allowed));
}

325 326
/*
 * Produce the whole status record for @task by calling the per-section
 * helpers in a fixed order: name, state/ids, memory (only when the task
 * has an mm), signals, capabilities, seccomp, allowed CPUs, cpuset
 * status and context switch counts.
 *
 * The mm reference taken with get_task_mm() is dropped with mmput() as
 * soon as the memory section has been printed.  Always returns 0.
 */
int proc_pid_status(struct seq_file *m, struct pid_namespace *ns,
			struct pid *pid, struct task_struct *task)
{
	struct mm_struct *mm = get_task_mm(task);

	task_name(m, task);
	task_state(m, ns, pid, task);

	if (mm) {
		task_mem(m, mm);
		mmput(mm);
	}
	task_sig(m, task);
	task_cap(m, task);
	task_seccomp(m, task);
	task_cpus_allowed(m, task);
	cpuset_task_status_allowed(m, task);
	task_context_switch_counts(m, task);
	return 0;
}

346 347
static int do_task_stat(struct seq_file *m, struct pid_namespace *ns,
			struct pid *pid, struct task_struct *task, int whole)
L
Linus Torvalds 已提交
348 349
{
	unsigned long vsize, eip, esp, wchan = ~0UL;
350
	int priority, nice;
L
Linus Torvalds 已提交
351 352 353
	int tty_pgrp = -1, tty_nr = 0;
	sigset_t sigign, sigcatch;
	char state;
354
	pid_t ppid = 0, pgid = -1, sid = -1;
L
Linus Torvalds 已提交
355
	int num_threads = 0;
356
	int permitted;
L
Linus Torvalds 已提交
357 358 359 360
	struct mm_struct *mm;
	unsigned long long start_time;
	unsigned long cmin_flt = 0, cmaj_flt = 0;
	unsigned long  min_flt = 0,  maj_flt = 0;
361
	cputime_t cutime, cstime, utime, stime;
362
	cputime_t cgtime, gtime;
L
Linus Torvalds 已提交
363 364
	unsigned long rsslim = 0;
	char tcomm[sizeof(task->comm)];
365
	unsigned long flags;
L
Linus Torvalds 已提交
366 367 368

	state = *get_task_state(task);
	vsize = eip = esp = 0;
369
	permitted = ptrace_may_access(task, PTRACE_MODE_READ | PTRACE_MODE_NOAUDIT);
L
Linus Torvalds 已提交
370 371 372
	mm = get_task_mm(task);
	if (mm) {
		vsize = task_vsize(mm);
373 374 375 376
		if (permitted) {
			eip = KSTK_EIP(task);
			esp = KSTK_ESP(task);
		}
L
Linus Torvalds 已提交
377 378 379 380 381 382
	}

	get_task_comm(tcomm, task);

	sigemptyset(&sigign);
	sigemptyset(&sigcatch);
383 384
	cutime = cstime = utime = stime = 0;
	cgtime = gtime = 0;
385

386 387
	if (lock_task_sighand(task, &flags)) {
		struct signal_struct *sig = task->signal;
388 389

		if (sig->tty) {
390 391 392
			struct pid *pgrp = tty_get_pgrp(sig->tty);
			tty_pgrp = pid_nr_ns(pgrp, ns);
			put_pid(pgrp);
393
			tty_nr = new_encode_dev(tty_devnum(sig->tty));
394 395
		}

396
		num_threads = get_nr_threads(task);
L
Linus Torvalds 已提交
397 398
		collect_sigign_sigcatch(task, &sigign, &sigcatch);

399 400 401 402
		cmin_flt = sig->cmin_flt;
		cmaj_flt = sig->cmaj_flt;
		cutime = sig->cutime;
		cstime = sig->cstime;
403
		cgtime = sig->cgtime;
J
Jiri Slaby 已提交
404
		rsslim = ACCESS_ONCE(sig->rlim[RLIMIT_RSS].rlim_cur);
405

L
Linus Torvalds 已提交
406 407
		/* add up live thread stats at the group level */
		if (whole) {
408
			struct task_struct *t = task;
L
Linus Torvalds 已提交
409 410 411
			do {
				min_flt += t->min_flt;
				maj_flt += t->maj_flt;
412
				gtime += task_gtime(t);
413
			} while_each_thread(task, t);
L
Linus Torvalds 已提交
414

415 416
			min_flt += sig->min_flt;
			maj_flt += sig->maj_flt;
417
			thread_group_cputime_adjusted(task, &utime, &stime);
418
			gtime += sig->gtime;
L
Linus Torvalds 已提交
419
		}
420

421
		sid = task_session_nr_ns(task, ns);
422
		ppid = task_tgid_nr_ns(task->real_parent, ns);
423
		pgid = task_pgrp_nr_ns(task, ns);
424 425

		unlock_task_sighand(task, &flags);
L
Linus Torvalds 已提交
426 427
	}

428
	if (permitted && (!whole || num_threads < 2))
L
Linus Torvalds 已提交
429 430 431 432
		wchan = get_wchan(task);
	if (!whole) {
		min_flt = task->min_flt;
		maj_flt = task->maj_flt;
433
		task_cputime_adjusted(task, &utime, &stime);
434
		gtime = task_gtime(task);
L
Linus Torvalds 已提交
435 436 437 438 439 440 441 442
	}

	/* scale priority and nice values from timeslices to -20..20 */
	/* to make it look like a "normal" Unix priority/nice value  */
	priority = task_prio(task);
	nice = task_nice(task);

	/* convert nsec -> ticks */
443
	start_time = nsec_to_clock_t(task->real_start_time);
L
Linus Torvalds 已提交
444

445 446 447 448 449 450 451 452 453 454 455 456 457 458 459 460 461 462 463 464 465
	seq_printf(m, "%d (%s) %c", pid_nr_ns(pid, ns), tcomm, state);
	seq_put_decimal_ll(m, ' ', ppid);
	seq_put_decimal_ll(m, ' ', pgid);
	seq_put_decimal_ll(m, ' ', sid);
	seq_put_decimal_ll(m, ' ', tty_nr);
	seq_put_decimal_ll(m, ' ', tty_pgrp);
	seq_put_decimal_ull(m, ' ', task->flags);
	seq_put_decimal_ull(m, ' ', min_flt);
	seq_put_decimal_ull(m, ' ', cmin_flt);
	seq_put_decimal_ull(m, ' ', maj_flt);
	seq_put_decimal_ull(m, ' ', cmaj_flt);
	seq_put_decimal_ull(m, ' ', cputime_to_clock_t(utime));
	seq_put_decimal_ull(m, ' ', cputime_to_clock_t(stime));
	seq_put_decimal_ll(m, ' ', cputime_to_clock_t(cutime));
	seq_put_decimal_ll(m, ' ', cputime_to_clock_t(cstime));
	seq_put_decimal_ll(m, ' ', priority);
	seq_put_decimal_ll(m, ' ', nice);
	seq_put_decimal_ll(m, ' ', num_threads);
	seq_put_decimal_ull(m, ' ', 0);
	seq_put_decimal_ull(m, ' ', start_time);
	seq_put_decimal_ull(m, ' ', vsize);
466
	seq_put_decimal_ull(m, ' ', mm ? get_mm_rss(mm) : 0);
467 468 469 470 471 472 473 474 475 476 477 478 479 480 481 482 483 484 485 486 487 488 489 490
	seq_put_decimal_ull(m, ' ', rsslim);
	seq_put_decimal_ull(m, ' ', mm ? (permitted ? mm->start_code : 1) : 0);
	seq_put_decimal_ull(m, ' ', mm ? (permitted ? mm->end_code : 1) : 0);
	seq_put_decimal_ull(m, ' ', (permitted && mm) ? mm->start_stack : 0);
	seq_put_decimal_ull(m, ' ', esp);
	seq_put_decimal_ull(m, ' ', eip);
	/* The signal information here is obsolete.
	 * It must be decimal for Linux 2.0 compatibility.
	 * Use /proc/#/status for real-time signals.
	 */
	seq_put_decimal_ull(m, ' ', task->pending.signal.sig[0] & 0x7fffffffUL);
	seq_put_decimal_ull(m, ' ', task->blocked.sig[0] & 0x7fffffffUL);
	seq_put_decimal_ull(m, ' ', sigign.sig[0] & 0x7fffffffUL);
	seq_put_decimal_ull(m, ' ', sigcatch.sig[0] & 0x7fffffffUL);
	seq_put_decimal_ull(m, ' ', wchan);
	seq_put_decimal_ull(m, ' ', 0);
	seq_put_decimal_ull(m, ' ', 0);
	seq_put_decimal_ll(m, ' ', task->exit_signal);
	seq_put_decimal_ll(m, ' ', task_cpu(task));
	seq_put_decimal_ull(m, ' ', task->rt_priority);
	seq_put_decimal_ull(m, ' ', task->policy);
	seq_put_decimal_ull(m, ' ', delayacct_blkio_ticks(task));
	seq_put_decimal_ull(m, ' ', cputime_to_clock_t(gtime));
	seq_put_decimal_ll(m, ' ', cputime_to_clock_t(cgtime));
491 492 493 494 495 496 497 498 499 500 501 502 503 504 505 506 507

	if (mm && permitted) {
		seq_put_decimal_ull(m, ' ', mm->start_data);
		seq_put_decimal_ull(m, ' ', mm->end_data);
		seq_put_decimal_ull(m, ' ', mm->start_brk);
		seq_put_decimal_ull(m, ' ', mm->arg_start);
		seq_put_decimal_ull(m, ' ', mm->arg_end);
		seq_put_decimal_ull(m, ' ', mm->env_start);
		seq_put_decimal_ull(m, ' ', mm->env_end);
	} else
		seq_printf(m, " 0 0 0 0 0 0 0");

	if (permitted)
		seq_put_decimal_ll(m, ' ', task->exit_code);
	else
		seq_put_decimal_ll(m, ' ', 0);

508
	seq_putc(m, '\n');
509
	if (mm)
L
Linus Torvalds 已提交
510
		mmput(mm);
511
	return 0;
L
Linus Torvalds 已提交
512 513
}

514 515
/*
 * Per-thread stat record: do_task_stat() with whole == 0, so the
 * figures describe @task alone.
 */
int proc_tid_stat(struct seq_file *m, struct pid_namespace *ns,
			struct pid *pid, struct task_struct *task)
{
	return do_task_stat(m, ns, pid, task, 0);
}

520 521
/*
 * Thread-group stat record: do_task_stat() with whole == 1, so the
 * figures are summed over the thread group.
 */
int proc_tgid_stat(struct seq_file *m, struct pid_namespace *ns,
			struct pid *pid, struct task_struct *task)
{
	return do_task_stat(m, ns, pid, task, 1);
}

526 527
/*
 * Emit the statm record for @task: seven space-separated decimal
 * numbers on one line.  All five computed values are 0 when the task
 * has no mm.  Always returns 0.
 */
int proc_pid_statm(struct seq_file *m, struct pid_namespace *ns,
			struct pid *pid, struct task_struct *task)
{
	unsigned long size = 0, resident = 0, shared = 0, text = 0, data = 0;
	struct mm_struct *mm = get_task_mm(task);

	if (mm) {
		size = task_statm(mm, &shared, &text, &data, &resident);
		mmput(mm);
	}
	/*
	 * For quick read, open code by putting numbers directly
	 * expected format is
	 * seq_printf(m, "%lu %lu %lu %lu 0 %lu 0\n",
	 *               size, resident, shared, text, data);
	 */
	seq_put_decimal_ull(m, 0, size);
	seq_put_decimal_ull(m, ' ', resident);
	seq_put_decimal_ull(m, ' ', shared);
	seq_put_decimal_ull(m, ' ', text);
	seq_put_decimal_ull(m, ' ', 0);
	seq_put_decimal_ull(m, ' ', data);
	seq_put_decimal_ull(m, ' ', 0);
	seq_putc(m, '\n');

	return 0;
}
553 554 555 556 557 558 559 560 561 562 563 564 565 566 567 568 569 570 571 572 573 574 575 576 577 578 579 580 581 582 583 584 585 586 587 588 589 590 591 592 593 594 595 596 597 598 599 600 601 602 603 604 605 606 607 608 609 610 611 612 613 614 615 616 617 618 619 620 621 622 623 624 625 626 627 628 629 630 631 632 633 634 635 636 637 638 639 640 641 642 643 644 645 646 647 648 649 650 651 652 653 654 655 656 657 658 659 660 661 662 663 664 665 666 667 668 669 670 671 672 673 674 675

#ifdef CONFIG_CHECKPOINT_RESTORE
/*
 * Find one child of the task behind @inode and return its struct pid
 * with a reference taken via get_pid(), or NULL when there is nothing
 * (more) to return.  The whole lookup runs under a read lock on
 * tasklist_lock.
 *
 * @pid_prev: pid returned by the previous call, or NULL.
 * @pos:      zero-based position of the wanted child in the children
 *            list; only used by the slow path.
 */
static struct pid *
get_children_pid(struct inode *inode, struct pid *pid_prev, loff_t pos)
{
	struct task_struct *parent, *child;
	struct pid *found = NULL;

	read_lock(&tasklist_lock);

	parent = pid_task(proc_pid(inode), PIDTYPE_PID);
	if (!parent)
		goto unlock;

	/*
	 * Fast path: if the previously returned child is still linked
	 * under the same parent, just step to its successor.  This is a
	 * significant speedup for processes with many children.
	 */
	if (pid_prev) {
		child = pid_task(pid_prev, PIDTYPE_PID);
		if (child && child->real_parent == parent &&
		    !(list_empty(&child->sibling))) {
			/* The last child has no successor: leave found NULL. */
			if (!list_is_last(&child->sibling, &parent->children)) {
				child = list_first_entry(&child->sibling,
							 struct task_struct,
							 sibling);
				found = get_pid(task_pid(child));
			}
			goto unlock;
		}
	}

	/*
	 * Slow path: count @pos entries into the children list.
	 *
	 * Children that exited while the lock was not held shift the
	 * list, so entries can be skipped; exactness was never promised.
	 * If the parent sleeps and N children exit after their tids were
	 * printed, this walk skips N further children.  A precise result
	 * requires stopping or freezing the leader and all its children.
	 */
	list_for_each_entry(child, &parent->children, sibling) {
		if (pos-- == 0) {
			found = get_pid(task_pid(child));
			break;
		}
	}

unlock:
	read_unlock(&tasklist_lock);
	return found;
}

/*
 * Print one child: the pid number of @v, translated into the pid
 * namespace stored in the superblock's s_fs_info, followed by a space.
 *
 * Returns 0 unconditionally.  The result of seq_printf() is not used
 * as the status of this callback; a full buffer is left for the
 * seq_file core to detect.
 */
static int children_seq_show(struct seq_file *seq, void *v)
{
	struct inode *inode = seq->private;
	pid_t pid;

	pid = pid_nr_ns(v, inode->i_sb->s_fs_info);
	seq_printf(seq, "%d ", pid);

	return 0;
}

/*
 * Iterator start: look up the child at position *pos with no previous
 * pid to continue from.
 */
static void *children_seq_start(struct seq_file *seq, loff_t *pos)
{
	struct inode *inode = seq->private;
	loff_t offset = *pos;

	return get_children_pid(inode, NULL, offset);
}

/*
 * Iterator step: fetch the child after @v, drop the reference held on
 * @v, and advance *pos by one.  Returns the next pid or NULL.
 */
static void *children_seq_next(struct seq_file *seq, void *v, loff_t *pos)
{
	loff_t next_pos = *pos + 1;
	struct pid *next;

	/* @v must still be referenced while it is used as the hint. */
	next = get_children_pid(seq->private, v, next_pos);
	put_pid(v);

	*pos = next_pos;
	return next;
}

/* Iterator stop: drop the reference on the pid the iteration ended at. */
static void children_seq_stop(struct seq_file *seq, void *v)
{
	struct pid *last = v;

	put_pid(last);
}

/* seq_file iterator callbacks for the children listing. */
static const struct seq_operations children_seq_ops = {
	.start	= children_seq_start,
	.stop	= children_seq_stop,
	.next	= children_seq_next,
	.show	= children_seq_show,
};

/*
 * Open handler: set up a seq_file using children_seq_ops and store
 * @inode in its private pointer for the iterator callbacks.  Returns
 * the result of seq_open().
 */
static int children_seq_open(struct inode *inode, struct file *file)
{
	int err = seq_open(file, &children_seq_ops);

	if (!err) {
		struct seq_file *seq = file->private_data;

		seq->private = inode;
	}

	return err;
}

/*
 * Release handler: tear down the seq_file set up by children_seq_open()
 * and pass on seq_release()'s result instead of discarding it.
 */
int children_seq_release(struct inode *inode, struct file *file)
{
	return seq_release(inode, file);
}

/* File operations for the children listing, backed by seq_file. */
const struct file_operations proc_tid_children_operations = {
	.open    = children_seq_open,
	.release = children_seq_release,
	.read    = seq_read,
	.llseek  = seq_lseek,
};
#endif /* CONFIG_CHECKPOINT_RESTORE */