/*
 *  linux/fs/proc/array.c
 *
 *  Copyright (C) 1992  by Linus Torvalds
 *  based on ideas by Darren Senn
 *
 * Fixes:
 * Michael. K. Johnson: stat,statm extensions.
 *                      <johnsonm@stolaf.edu>
 *
 * Pauline Middelink :  Made cmdline,envline only break at '\0's, to
 *                      make sure SET_PROCTITLE works. Also removed
 *                      bad '!' which forced address recalculation for
 *                      EVERY character on the current page.
 *                      <middelin@polyware.iaf.nl>
 *
 * Danny ter Haar    :	added cpuinfo
 *			<dth@cistron.nl>
 *
 * Alessandro Rubini :  profile extension.
 *                      <rubini@ipvvis.unipv.it>
 *
 * Jeff Tranter      :  added BogoMips field to cpuinfo
 *                      <Jeff_Tranter@Mitel.COM>
 *
 * Bruno Haible      :  remove 4K limit for the maps file
 *			<haible@ma2s2.mathematik.uni-karlsruhe.de>
 *
 * Yves Arrouye      :  remove removal of trailing spaces in get_array.
 *			<Yves.Arrouye@marin.fdn.fr>
 *
 * Jerome Forissier  :  added per-CPU time information to /proc/stat
 *                      and /proc/<pid>/cpu extension
 *                      <forissier@isia.cma.fr>
 *			- Incorporation and non-SMP safe operation
 *			of forissier patch in 2.1.78 by
 *			Hans Marcus <crowbar@concepts.nl>
 *
 * aeb@cwi.nl        :  /proc/partitions
 *
 *
 * Alan Cox	     :  security fixes.
 *			<alan@lxorguk.ukuu.org.uk>
 *
 * Al Viro           :  safe handling of mm_struct
 *
 * Gerhard Wichert   :  added BIGMEM support
 * Siemens AG           <Gerhard.Wichert@pdb.siemens.de>
 *
 * Al Viro & Jeff Garzik :  moved most of the thing into base.c and
 *			 :  proc_misc.c. The rest may eventually go into
 *			 :  base.c too.
 */

#include <linux/types.h>
#include <linux/errno.h>
#include <linux/time.h>
#include <linux/kernel.h>
#include <linux/kernel_stat.h>
#include <linux/tty.h>
#include <linux/string.h>
#include <linux/mman.h>
#include <linux/proc_fs.h>
#include <linux/ioport.h>
65 66
#include <linux/uaccess.h>
#include <linux/io.h>
L
Linus Torvalds 已提交
67 68 69 70 71 72 73 74
#include <linux/mm.h>
#include <linux/hugetlb.h>
#include <linux/pagemap.h>
#include <linux/swap.h>
#include <linux/smp.h>
#include <linux/signal.h>
#include <linux/highmem.h>
#include <linux/file.h>
A
Al Viro 已提交
75
#include <linux/fdtable.h>
L
Linus Torvalds 已提交
76 77
#include <linux/times.h>
#include <linux/cpuset.h>
78
#include <linux/rcupdate.h>
79
#include <linux/delayacct.h>
80
#include <linux/seq_file.h>
81
#include <linux/pid_namespace.h>
82
#include <linux/ptrace.h>
83
#include <linux/tracehook.h>
84
#include <linux/user_namespace.h>
L
Linus Torvalds 已提交
85 86 87 88 89

#include <asm/pgtable.h>
#include <asm/processor.h>
#include "internal.h"

90
static inline void task_name(struct seq_file *m, struct task_struct *p)
L
Linus Torvalds 已提交
91 92
{
	int i;
93
	char *buf, *end;
94
	char *name;
L
Linus Torvalds 已提交
95 96 97 98
	char tcomm[sizeof(p->comm)];

	get_task_comm(tcomm, p);

99
	seq_puts(m, "Name:\t");
100 101
	end = m->buf + m->size;
	buf = m->buf + m->count;
L
Linus Torvalds 已提交
102 103
	name = tcomm;
	i = sizeof(tcomm);
104
	while (i && (buf < end)) {
L
Linus Torvalds 已提交
105 106 107 108 109 110 111
		unsigned char c = *name;
		name++;
		i--;
		*buf = c;
		if (!c)
			break;
		if (c == '\\') {
112 113 114
			buf++;
			if (buf < end)
				*buf++ = c;
L
Linus Torvalds 已提交
115 116 117
			continue;
		}
		if (c == '\n') {
118 119 120
			*buf++ = '\\';
			if (buf < end)
				*buf++ = 'n';
L
Linus Torvalds 已提交
121 122 123
			continue;
		}
		buf++;
124 125
	}
	m->count = buf - m->buf;
126
	seq_putc(m, '\n');
L
Linus Torvalds 已提交
127 128 129 130 131 132 133 134
}

/*
 * Human-readable names for the task state "bitmap" of reasons to sleep.
 * "Running" is zero, every other state is a single bit, so combinations
 * can be tested with simple bit tests.  The table is indexed by fls() of
 * the reported state bits; the value each slot stands for is noted in the
 * trailing comment.
 */
static const char * const task_state_array[] = {
	[0] = "R (running)",		/* state  0 */
	[1] = "S (sleeping)",		/* state  1 */
	[2] = "D (disk sleep)",		/* state  2 */
	[3] = "T (stopped)",		/* state  4 */
	[4] = "t (tracing stop)",	/* state  8 */
	[5] = "X (dead)",		/* state 16 */
	[6] = "Z (zombie)",		/* state 32 */
};

145
static inline const char *get_task_state(struct task_struct *tsk)
L
Linus Torvalds 已提交
146
{
147
	unsigned int state = (tsk->state | tsk->exit_state) & TASK_REPORT;
L
Linus Torvalds 已提交
148

149
	BUILD_BUG_ON(1 + ilog2(TASK_REPORT) != ARRAY_SIZE(task_state_array)-1);
150

151
	return task_state_array[fls(state)];
L
Linus Torvalds 已提交
152 153
}

154 155
static inline void task_state(struct seq_file *m, struct pid_namespace *ns,
				struct pid *pid, struct task_struct *p)
L
Linus Torvalds 已提交
156
{
157
	struct user_namespace *user_ns = seq_user_ns(m);
L
Linus Torvalds 已提交
158 159
	struct group_info *group_info;
	int g;
160
	struct fdtable *fdt = NULL;
161
	const struct cred *cred;
162
	pid_t ppid, tpid;
L
Linus Torvalds 已提交
163

164
	rcu_read_lock();
165 166
	ppid = pid_alive(p) ?
		task_tgid_nr_ns(rcu_dereference(p->real_parent), ns) : 0;
167 168
	tpid = 0;
	if (pid_alive(p)) {
169
		struct task_struct *tracer = ptrace_parent(p);
170 171 172
		if (tracer)
			tpid = task_pid_nr_ns(tracer, ns);
	}
173
	cred = get_task_cred(p);
174
	seq_printf(m,
L
Linus Torvalds 已提交
175 176
		"State:\t%s\n"
		"Tgid:\t%d\n"
177
		"Ngid:\t%d\n"
L
Linus Torvalds 已提交
178 179 180 181 182 183
		"Pid:\t%d\n"
		"PPid:\t%d\n"
		"TracerPid:\t%d\n"
		"Uid:\t%d\t%d\t%d\t%d\n"
		"Gid:\t%d\t%d\t%d\t%d\n",
		get_task_state(p),
184
		task_tgid_nr_ns(p, ns),
185
		task_numa_group_id(p),
186
		pid_nr_ns(pid, ns),
187
		ppid, tpid,
188 189 190 191 192 193 194 195
		from_kuid_munged(user_ns, cred->uid),
		from_kuid_munged(user_ns, cred->euid),
		from_kuid_munged(user_ns, cred->suid),
		from_kuid_munged(user_ns, cred->fsuid),
		from_kgid_munged(user_ns, cred->gid),
		from_kgid_munged(user_ns, cred->egid),
		from_kgid_munged(user_ns, cred->sgid),
		from_kgid_munged(user_ns, cred->fsgid));
196

L
Linus Torvalds 已提交
197
	task_lock(p);
198 199
	if (p->files)
		fdt = files_fdtable(p->files);
200
	seq_printf(m,
L
Linus Torvalds 已提交
201 202
		"FDSize:\t%d\n"
		"Groups:\t",
203
		fdt ? fdt->max_fds : 0);
204
	rcu_read_unlock();
L
Linus Torvalds 已提交
205

206
	group_info = cred->group_info;
L
Linus Torvalds 已提交
207 208
	task_unlock(p);

209
	for (g = 0; g < group_info->ngroups; g++)
210 211
		seq_printf(m, "%d ",
			   from_kgid_munged(user_ns, GROUP_AT(group_info, g)));
212
	put_cred(cred);
L
Linus Torvalds 已提交
213

214
	seq_putc(m, '\n');
L
Linus Torvalds 已提交
215 216
}

217
void render_sigset_t(struct seq_file *m, const char *header,
218
				sigset_t *set)
L
Linus Torvalds 已提交
219
{
220
	int i;
L
Linus Torvalds 已提交
221

222
	seq_puts(m, header);
L
Linus Torvalds 已提交
223 224 225 226 227 228 229 230 231 232

	i = _NSIG;
	do {
		int x = 0;

		i -= 4;
		if (sigismember(set, i+1)) x |= 1;
		if (sigismember(set, i+2)) x |= 2;
		if (sigismember(set, i+3)) x |= 4;
		if (sigismember(set, i+4)) x |= 8;
233
		seq_printf(m, "%x", x);
L
Linus Torvalds 已提交
234 235
	} while (i >= 4);

236
	seq_putc(m, '\n');
L
Linus Torvalds 已提交
237 238 239 240 241 242 243 244 245 246 247 248 249 250 251 252 253
}

/*
 * Walk the signal action table of @p and sort every signal whose handler
 * is not the default one into @ign (handler is SIG_IGN) or @catch (any
 * other handler).  Signals left at SIG_DFL are added to neither set.
 *
 * The sets are only added to, never cleared here.
 */
static void collect_sigign_sigcatch(struct task_struct *p, sigset_t *ign,
				    sigset_t *catch)
{
	int sig;

	for (sig = 1; sig <= _NSIG; sig++) {
		/* action[] is zero-based, signal numbers start at 1 */
		const struct k_sigaction *act = &p->sighand->action[sig - 1];

		if (act->sa.sa_handler == SIG_IGN)
			sigaddset(ign, sig);
		else if (act->sa.sa_handler != SIG_DFL)
			sigaddset(catch, sig);
	}
}

254
static inline void task_sig(struct seq_file *m, struct task_struct *p)
L
Linus Torvalds 已提交
255
{
256
	unsigned long flags;
L
Linus Torvalds 已提交
257 258 259 260 261 262 263 264 265 266 267
	sigset_t pending, shpending, blocked, ignored, caught;
	int num_threads = 0;
	unsigned long qsize = 0;
	unsigned long qlim = 0;

	sigemptyset(&pending);
	sigemptyset(&shpending);
	sigemptyset(&blocked);
	sigemptyset(&ignored);
	sigemptyset(&caught);

268
	if (lock_task_sighand(p, &flags)) {
L
Linus Torvalds 已提交
269 270 271 272
		pending = p->pending.signal;
		shpending = p->signal->shared_pending.signal;
		blocked = p->blocked;
		collect_sigign_sigcatch(p, &ignored, &caught);
273
		num_threads = get_nr_threads(p);
274
		rcu_read_lock();  /* FIXME: is this correct? */
275
		qsize = atomic_read(&__task_cred(p)->user->sigpending);
276
		rcu_read_unlock();
J
Jiri Slaby 已提交
277
		qlim = task_rlimit(p, RLIMIT_SIGPENDING);
278
		unlock_task_sighand(p, &flags);
L
Linus Torvalds 已提交
279 280
	}

281 282
	seq_printf(m, "Threads:\t%d\n", num_threads);
	seq_printf(m, "SigQ:\t%lu/%lu\n", qsize, qlim);
L
Linus Torvalds 已提交
283 284

	/* render them all */
285 286 287 288 289
	render_sigset_t(m, "SigPnd:\t", &pending);
	render_sigset_t(m, "ShdPnd:\t", &shpending);
	render_sigset_t(m, "SigBlk:\t", &blocked);
	render_sigset_t(m, "SigIgn:\t", &ignored);
	render_sigset_t(m, "SigCgt:\t", &caught);
L
Linus Torvalds 已提交
290 291
}

292 293
/*
 * Print @header followed by the capability set @a as zero-padded 8-digit
 * hex words and a newline.  The highest-indexed word of a->cap[] is
 * printed first.
 */
static void render_cap_t(struct seq_file *m, const char *header,
			kernel_cap_t *a)
{
	unsigned word;

	seq_puts(m, header);
	CAP_FOR_EACH_U32(word) {
		/* mirror the iteration index so the last word comes out first */
		unsigned idx = (_KERNEL_CAPABILITY_U32S-1) - word;

		seq_printf(m, "%08x", a->cap[idx]);
	}
	seq_putc(m, '\n');
}

305 306 307 308
/*
 * Remove non-existent capabilities: in the word that holds CAP_LAST_CAP,
 * keep only the bits below CAP_TO_MASK(CAP_LAST_CAP + 1).
 * The argument is modified in place and must be a kernel_cap_t lvalue.
 */
#define NORM_CAPS(v) ((v).cap[CAP_TO_INDEX(CAP_LAST_CAP)] &= \
				CAP_TO_MASK(CAP_LAST_CAP + 1) - 1)

309
static inline void task_cap(struct seq_file *m, struct task_struct *p)
L
Linus Torvalds 已提交
310
{
311 312
	const struct cred *cred;
	kernel_cap_t cap_inheritable, cap_permitted, cap_effective, cap_bset;
313

314 315 316 317 318 319 320 321
	rcu_read_lock();
	cred = __task_cred(p);
	cap_inheritable	= cred->cap_inheritable;
	cap_permitted	= cred->cap_permitted;
	cap_effective	= cred->cap_effective;
	cap_bset	= cred->cap_bset;
	rcu_read_unlock();

322 323 324 325 326
	NORM_CAPS(cap_inheritable);
	NORM_CAPS(cap_permitted);
	NORM_CAPS(cap_effective);
	NORM_CAPS(cap_bset);

327 328 329 330
	render_cap_t(m, "CapInh:\t", &cap_inheritable);
	render_cap_t(m, "CapPrm:\t", &cap_permitted);
	render_cap_t(m, "CapEff:\t", &cap_effective);
	render_cap_t(m, "CapBnd:\t", &cap_bset);
L
Linus Torvalds 已提交
331 332
}

K
Kees Cook 已提交
333 334 335 336 337 338 339
/*
 * Emit the "Seccomp:" line with the task's seccomp mode.
 * Prints nothing when CONFIG_SECCOMP is not set.
 */
static inline void task_seccomp(struct seq_file *m, struct task_struct *p)
{
#ifdef CONFIG_SECCOMP
	int mode = p->seccomp.mode;

	seq_printf(m, "Seccomp:\t%d\n", mode);
#endif
}

340 341
static inline void task_context_switch_counts(struct seq_file *m,
						struct task_struct *p)
342
{
343 344 345 346
	seq_printf(m,	"voluntary_ctxt_switches:\t%lu\n"
			"nonvoluntary_ctxt_switches:\t%lu\n",
			p->nvcsw,
			p->nivcsw);
347 348
}

349 350
static void task_cpus_allowed(struct seq_file *m, struct task_struct *task)
{
351
	seq_puts(m, "Cpus_allowed:\t");
352
	seq_cpumask(m, &task->cpus_allowed);
353 354
	seq_putc(m, '\n');
	seq_puts(m, "Cpus_allowed_list:\t");
355
	seq_cpumask_list(m, &task->cpus_allowed);
356
	seq_putc(m, '\n');
357 358
}

359 360
/*
 * Produce the per-task status report by calling the individual section
 * writers in a fixed order: name, state, memory (only if the task has an
 * mm), signals, capabilities, seccomp, allowed CPUs, cpuset info and
 * context switch counts.
 *
 * Always returns 0.
 */
int proc_pid_status(struct seq_file *m, struct pid_namespace *ns,
			struct pid *pid, struct task_struct *task)
{
	struct mm_struct *mm;

	/* Reference is dropped right after the memory section is written. */
	mm = get_task_mm(task);

	task_name(m, task);
	task_state(m, ns, pid, task);

	if (mm) {
		task_mem(m, mm);
		mmput(mm);
	}

	task_sig(m, task);
	task_cap(m, task);
	task_seccomp(m, task);
	task_cpus_allowed(m, task);
	cpuset_task_status_allowed(m, task);
	task_context_switch_counts(m, task);

	return 0;
}

380 381
static int do_task_stat(struct seq_file *m, struct pid_namespace *ns,
			struct pid *pid, struct task_struct *task, int whole)
L
Linus Torvalds 已提交
382 383
{
	unsigned long vsize, eip, esp, wchan = ~0UL;
384
	int priority, nice;
L
Linus Torvalds 已提交
385 386 387
	int tty_pgrp = -1, tty_nr = 0;
	sigset_t sigign, sigcatch;
	char state;
388
	pid_t ppid = 0, pgid = -1, sid = -1;
L
Linus Torvalds 已提交
389
	int num_threads = 0;
390
	int permitted;
L
Linus Torvalds 已提交
391 392 393 394
	struct mm_struct *mm;
	unsigned long long start_time;
	unsigned long cmin_flt = 0, cmaj_flt = 0;
	unsigned long  min_flt = 0,  maj_flt = 0;
395
	cputime_t cutime, cstime, utime, stime;
396
	cputime_t cgtime, gtime;
L
Linus Torvalds 已提交
397 398
	unsigned long rsslim = 0;
	char tcomm[sizeof(task->comm)];
399
	unsigned long flags;
L
Linus Torvalds 已提交
400 401 402

	state = *get_task_state(task);
	vsize = eip = esp = 0;
403
	permitted = ptrace_may_access(task, PTRACE_MODE_READ | PTRACE_MODE_NOAUDIT);
L
Linus Torvalds 已提交
404 405 406
	mm = get_task_mm(task);
	if (mm) {
		vsize = task_vsize(mm);
407 408 409 410
		if (permitted) {
			eip = KSTK_EIP(task);
			esp = KSTK_ESP(task);
		}
L
Linus Torvalds 已提交
411 412 413 414 415 416
	}

	get_task_comm(tcomm, task);

	sigemptyset(&sigign);
	sigemptyset(&sigcatch);
417 418
	cutime = cstime = utime = stime = 0;
	cgtime = gtime = 0;
419

420 421
	if (lock_task_sighand(task, &flags)) {
		struct signal_struct *sig = task->signal;
422 423

		if (sig->tty) {
424 425 426
			struct pid *pgrp = tty_get_pgrp(sig->tty);
			tty_pgrp = pid_nr_ns(pgrp, ns);
			put_pid(pgrp);
427
			tty_nr = new_encode_dev(tty_devnum(sig->tty));
428 429
		}

430
		num_threads = get_nr_threads(task);
L
Linus Torvalds 已提交
431 432
		collect_sigign_sigcatch(task, &sigign, &sigcatch);

433 434 435 436
		cmin_flt = sig->cmin_flt;
		cmaj_flt = sig->cmaj_flt;
		cutime = sig->cutime;
		cstime = sig->cstime;
437
		cgtime = sig->cgtime;
J
Jiri Slaby 已提交
438
		rsslim = ACCESS_ONCE(sig->rlim[RLIMIT_RSS].rlim_cur);
439

L
Linus Torvalds 已提交
440 441
		/* add up live thread stats at the group level */
		if (whole) {
442
			struct task_struct *t = task;
L
Linus Torvalds 已提交
443 444 445
			do {
				min_flt += t->min_flt;
				maj_flt += t->maj_flt;
446
				gtime += task_gtime(t);
447
			} while_each_thread(task, t);
L
Linus Torvalds 已提交
448

449 450
			min_flt += sig->min_flt;
			maj_flt += sig->maj_flt;
451
			thread_group_cputime_adjusted(task, &utime, &stime);
452
			gtime += sig->gtime;
L
Linus Torvalds 已提交
453
		}
454

455
		sid = task_session_nr_ns(task, ns);
456
		ppid = task_tgid_nr_ns(task->real_parent, ns);
457
		pgid = task_pgrp_nr_ns(task, ns);
458 459

		unlock_task_sighand(task, &flags);
L
Linus Torvalds 已提交
460 461
	}

462
	if (permitted && (!whole || num_threads < 2))
L
Linus Torvalds 已提交
463 464 465 466
		wchan = get_wchan(task);
	if (!whole) {
		min_flt = task->min_flt;
		maj_flt = task->maj_flt;
467
		task_cputime_adjusted(task, &utime, &stime);
468
		gtime = task_gtime(task);
L
Linus Torvalds 已提交
469 470 471 472 473 474 475 476 477
	}

	/* scale priority and nice values from timeslices to -20..20 */
	/* to make it look like a "normal" Unix priority/nice value  */
	priority = task_prio(task);
	nice = task_nice(task);

	/* Temporary variable needed for gcc-2.96 */
	/* convert timespec -> nsec*/
478 479 480
	start_time =
		(unsigned long long)task->real_start_time.tv_sec * NSEC_PER_SEC
				+ task->real_start_time.tv_nsec;
L
Linus Torvalds 已提交
481 482 483
	/* convert nsec -> ticks */
	start_time = nsec_to_clock_t(start_time);

484 485 486 487 488 489 490 491 492 493 494 495 496 497 498 499 500 501 502 503 504
	seq_printf(m, "%d (%s) %c", pid_nr_ns(pid, ns), tcomm, state);
	seq_put_decimal_ll(m, ' ', ppid);
	seq_put_decimal_ll(m, ' ', pgid);
	seq_put_decimal_ll(m, ' ', sid);
	seq_put_decimal_ll(m, ' ', tty_nr);
	seq_put_decimal_ll(m, ' ', tty_pgrp);
	seq_put_decimal_ull(m, ' ', task->flags);
	seq_put_decimal_ull(m, ' ', min_flt);
	seq_put_decimal_ull(m, ' ', cmin_flt);
	seq_put_decimal_ull(m, ' ', maj_flt);
	seq_put_decimal_ull(m, ' ', cmaj_flt);
	seq_put_decimal_ull(m, ' ', cputime_to_clock_t(utime));
	seq_put_decimal_ull(m, ' ', cputime_to_clock_t(stime));
	seq_put_decimal_ll(m, ' ', cputime_to_clock_t(cutime));
	seq_put_decimal_ll(m, ' ', cputime_to_clock_t(cstime));
	seq_put_decimal_ll(m, ' ', priority);
	seq_put_decimal_ll(m, ' ', nice);
	seq_put_decimal_ll(m, ' ', num_threads);
	seq_put_decimal_ull(m, ' ', 0);
	seq_put_decimal_ull(m, ' ', start_time);
	seq_put_decimal_ull(m, ' ', vsize);
505
	seq_put_decimal_ull(m, ' ', mm ? get_mm_rss(mm) : 0);
506 507 508 509 510 511 512 513 514 515 516 517 518 519 520 521 522 523 524 525 526 527 528 529
	seq_put_decimal_ull(m, ' ', rsslim);
	seq_put_decimal_ull(m, ' ', mm ? (permitted ? mm->start_code : 1) : 0);
	seq_put_decimal_ull(m, ' ', mm ? (permitted ? mm->end_code : 1) : 0);
	seq_put_decimal_ull(m, ' ', (permitted && mm) ? mm->start_stack : 0);
	seq_put_decimal_ull(m, ' ', esp);
	seq_put_decimal_ull(m, ' ', eip);
	/* The signal information here is obsolete.
	 * It must be decimal for Linux 2.0 compatibility.
	 * Use /proc/#/status for real-time signals.
	 */
	seq_put_decimal_ull(m, ' ', task->pending.signal.sig[0] & 0x7fffffffUL);
	seq_put_decimal_ull(m, ' ', task->blocked.sig[0] & 0x7fffffffUL);
	seq_put_decimal_ull(m, ' ', sigign.sig[0] & 0x7fffffffUL);
	seq_put_decimal_ull(m, ' ', sigcatch.sig[0] & 0x7fffffffUL);
	seq_put_decimal_ull(m, ' ', wchan);
	seq_put_decimal_ull(m, ' ', 0);
	seq_put_decimal_ull(m, ' ', 0);
	seq_put_decimal_ll(m, ' ', task->exit_signal);
	seq_put_decimal_ll(m, ' ', task_cpu(task));
	seq_put_decimal_ull(m, ' ', task->rt_priority);
	seq_put_decimal_ull(m, ' ', task->policy);
	seq_put_decimal_ull(m, ' ', delayacct_blkio_ticks(task));
	seq_put_decimal_ull(m, ' ', cputime_to_clock_t(gtime));
	seq_put_decimal_ll(m, ' ', cputime_to_clock_t(cgtime));
530 531 532 533 534 535 536 537 538 539 540 541 542 543 544 545 546

	if (mm && permitted) {
		seq_put_decimal_ull(m, ' ', mm->start_data);
		seq_put_decimal_ull(m, ' ', mm->end_data);
		seq_put_decimal_ull(m, ' ', mm->start_brk);
		seq_put_decimal_ull(m, ' ', mm->arg_start);
		seq_put_decimal_ull(m, ' ', mm->arg_end);
		seq_put_decimal_ull(m, ' ', mm->env_start);
		seq_put_decimal_ull(m, ' ', mm->env_end);
	} else
		seq_printf(m, " 0 0 0 0 0 0 0");

	if (permitted)
		seq_put_decimal_ll(m, ' ', task->exit_code);
	else
		seq_put_decimal_ll(m, ' ', 0);

547
	seq_putc(m, '\n');
548
	if (mm)
L
Linus Torvalds 已提交
549
		mmput(mm);
550
	return 0;
L
Linus Torvalds 已提交
551 552
}

553 554
/*
 * Per-thread stat record: do_task_stat() without thread-group
 * aggregation.
 */
int proc_tid_stat(struct seq_file *m, struct pid_namespace *ns,
			struct pid *pid, struct task_struct *task)
{
	const int whole = 0;

	return do_task_stat(m, ns, pid, task, whole);
}

559 560
/*
 * Per-thread-group stat record: do_task_stat() with thread-group
 * aggregation enabled.
 */
int proc_tgid_stat(struct seq_file *m, struct pid_namespace *ns,
			struct pid *pid, struct task_struct *task)
{
	const int whole = 1;

	return do_task_stat(m, ns, pid, task, whole);
}

565 566
/*
 * Write the statm record: seven space-separated numbers on one line.
 * All values are zero when the task has no mm.
 *
 * Always returns 0.
 */
int proc_pid_statm(struct seq_file *m, struct pid_namespace *ns,
			struct pid *pid, struct task_struct *task)
{
	unsigned long size = 0;
	unsigned long resident = 0;
	unsigned long shared = 0;
	unsigned long text = 0;
	unsigned long data = 0;
	struct mm_struct *mm;

	mm = get_task_mm(task);
	if (mm) {
		size = task_statm(mm, &shared, &text, &data, &resident);
		mmput(mm);
	}

	/*
	 * The numbers are emitted one by one for speed.  The result is
	 * the same as
	 * seq_printf(m, "%lu %lu %lu %lu 0 %lu 0\n",
	 *               size, resident, shared, text, data);
	 */
	seq_put_decimal_ull(m, 0, size);
	seq_put_decimal_ull(m, ' ', resident);
	seq_put_decimal_ull(m, ' ', shared);
	seq_put_decimal_ull(m, ' ', text);
	seq_put_decimal_ull(m, ' ', 0);
	seq_put_decimal_ull(m, ' ', data);
	seq_put_decimal_ull(m, ' ', 0);
	seq_putc(m, '\n');

	return 0;
}
592 593 594 595 596 597 598 599 600 601 602 603 604 605 606 607 608 609 610 611 612 613 614 615 616 617 618 619 620 621 622 623 624 625 626 627 628 629 630 631 632 633 634 635 636 637 638 639 640 641 642 643 644 645 646 647 648 649 650 651 652 653 654 655 656 657 658 659 660 661 662 663 664 665 666 667 668 669 670 671 672 673 674 675 676 677 678 679 680 681 682 683 684 685 686 687 688 689 690 691 692 693 694 695 696 697 698 699 700 701 702 703 704 705 706 707 708 709 710 711 712 713 714

#ifdef CONFIG_CHECKPOINT_RESTORE
/*
 * Find the child of the task behind @inode that should be reported next.
 *
 * @inode:    proc inode identifying the parent task
 * @pid_prev: pid returned by the previous step, or NULL
 * @pos:      zero-based index of the wanted child, used by the slow path
 *
 * Returns a referenced struct pid (the caller must put_pid() it), or NULL
 * when the parent is gone or there are no more children.  The whole
 * lookup runs under read_lock(&tasklist_lock).
 */
static struct pid *
get_children_pid(struct inode *inode, struct pid *pid_prev, loff_t pos)
{
	struct task_struct *parent, *child;
	struct pid *found = NULL;

	read_lock(&tasklist_lock);

	parent = pid_task(proc_pid(inode), PIDTYPE_PID);
	if (!parent)
		goto unlock;

	/*
	 * Fast path: if the previous child is still linked under the same
	 * parent, simply step to its next sibling.  This gives a
	 * significant speedup on children-rich processes.
	 */
	if (pid_prev) {
		child = pid_task(pid_prev, PIDTYPE_PID);
		if (child && child->real_parent == parent &&
		    !(list_empty(&child->sibling))) {
			if (!list_is_last(&child->sibling, &parent->children)) {
				child = list_first_entry(&child->sibling,
							 struct task_struct,
							 sibling);
				found = get_pid(task_pid(child));
			}
			goto unlock;
		}
	}

	/*
	 * Slow search case.
	 *
	 * We might miss some children here if children
	 * are exited while we were not holding the lock,
	 * but it was never promised to be accurate that
	 * much.
	 *
	 * "Just suppose that the parent sleeps, but N children
	 *  exit after we printed their tids. Now the slow paths
	 *  skips N extra children, we miss N tasks." (c)
	 *
	 * So one needs to stop or freeze the leader and all
	 * its children to get a precise result.
	 */
	list_for_each_entry(child, &parent->children, sibling) {
		if (pos-- == 0) {
			found = get_pid(task_pid(child));
			break;
		}
	}

unlock:
	read_unlock(&tasklist_lock);
	return found;
}

/*
 * seq_file ->show(): print the pid number of the child @v, as seen from
 * the pid namespace stored in the superblock's s_fs_info, followed by a
 * space.
 *
 * Returns 0 unconditionally.  The result of seq_printf() is deliberately
 * not forwarded: a full buffer is detected by the seq_file core itself,
 * and a negative return from ->show() would be treated as an error.
 */
static int children_seq_show(struct seq_file *seq, void *v)
{
	struct inode *inode = seq->private;
	pid_t pid;

	pid = pid_nr_ns(v, inode->i_sb->s_fs_info);
	seq_printf(seq, "%d ", pid);

	return 0;
}

/*
 * seq_file ->start(): look up the child at index *pos.  There is no
 * previous pid to continue from, so NULL is passed for it.
 */
static void *children_seq_start(struct seq_file *seq, loff_t *pos)
{
	struct inode *inode = seq->private;

	return get_children_pid(inode, NULL, *pos);
}

/*
 * seq_file ->next(): fetch the child following @v, drop the reference
 * held on @v and advance *pos by one.
 */
static void *children_seq_next(struct seq_file *seq, void *v, loff_t *pos)
{
	struct pid *next;

	/* @v must still be referenced while it is used as the search hint */
	next = get_children_pid(seq->private, v, *pos + 1);
	put_pid(v);

	(*pos)++;
	return next;
}

/*
 * seq_file ->stop(): drop the pid reference held on the current
 * iterator value @v.
 */
static void children_seq_stop(struct seq_file *seq, void *v)
{
	struct pid *current_pid = v;

	put_pid(current_pid);
}

/* Iterator callbacks used to list the children of a task. */
static const struct seq_operations children_seq_ops = {
	.start = children_seq_start,
	.show  = children_seq_show,
	.next  = children_seq_next,
	.stop  = children_seq_stop,
};

/*
 * ->open(): set up a seq_file using children_seq_ops and remember the
 * inode in its private pointer for the iterator callbacks.
 *
 * Returns 0 on success or the error reported by seq_open().
 */
static int children_seq_open(struct inode *inode, struct file *file)
{
	int err = seq_open(file, &children_seq_ops);

	if (!err) {
		struct seq_file *m = file->private_data;

		m->private = inode;
	}

	return err;
}

/*
 * ->release(): tear down the seq_file set up by children_seq_open().
 *
 * Returns whatever seq_release() reports instead of discarding it.
 */
int children_seq_release(struct inode *inode, struct file *file)
{
	return seq_release(inode, file);
}

/* File operations for the children listing, backed by seq_file. */
const struct file_operations proc_tid_children_operations = {
	.open		= children_seq_open,
	.read		= seq_read,
	.llseek		= seq_lseek,
	.release	= children_seq_release,
};
#endif /* CONFIG_CHECKPOINT_RESTORE */