/*
 *  linux/fs/proc/array.c
 *
 *  Copyright (C) 1992  by Linus Torvalds
 *  based on ideas by Darren Senn
 *
 * Fixes:
 * Michael. K. Johnson: stat,statm extensions.
 *                      <johnsonm@stolaf.edu>
 *
 * Pauline Middelink :  Made cmdline,envline only break at '\0's, to
 *                      make sure SET_PROCTITLE works. Also removed
 *                      bad '!' which forced address recalculation for
 *                      EVERY character on the current page.
 *                      <middelin@polyware.iaf.nl>
 *
 * Danny ter Haar    :	added cpuinfo
 *			<dth@cistron.nl>
 *
 * Alessandro Rubini :  profile extension.
 *                      <rubini@ipvvis.unipv.it>
 *
 * Jeff Tranter      :  added BogoMips field to cpuinfo
 *                      <Jeff_Tranter@Mitel.COM>
 *
 * Bruno Haible      :  remove 4K limit for the maps file
 *			<haible@ma2s2.mathematik.uni-karlsruhe.de>
 *
 * Yves Arrouye      :  remove removal of trailing spaces in get_array.
 *			<Yves.Arrouye@marin.fdn.fr>
 *
 * Jerome Forissier  :  added per-CPU time information to /proc/stat
 *                      and /proc/<pid>/cpu extension
 *                      <forissier@isia.cma.fr>
 *			- Incorporation and non-SMP safe operation
 *			of forissier patch in 2.1.78 by
 *			Hans Marcus <crowbar@concepts.nl>
 *
 * aeb@cwi.nl        :  /proc/partitions
 *
 *
 * Alan Cox	     :  security fixes.
 *			<alan@lxorguk.ukuu.org.uk>
 *
 * Al Viro           :  safe handling of mm_struct
 *
 * Gerhard Wichert   :  added BIGMEM support
 * Siemens AG           <Gerhard.Wichert@pdb.siemens.de>
 *
 * Al Viro & Jeff Garzik :  moved most of the thing into base.c and
 *			 :  proc_misc.c. The rest may eventually go into
 *			 :  base.c too.
 */

#include <linux/types.h>
#include <linux/errno.h>
#include <linux/time.h>
#include <linux/kernel.h>
#include <linux/kernel_stat.h>
#include <linux/tty.h>
#include <linux/string.h>
#include <linux/mman.h>
#include <linux/proc_fs.h>
#include <linux/ioport.h>
65 66
#include <linux/uaccess.h>
#include <linux/io.h>
L
Linus Torvalds 已提交
67 68 69 70 71 72 73 74
#include <linux/mm.h>
#include <linux/hugetlb.h>
#include <linux/pagemap.h>
#include <linux/swap.h>
#include <linux/smp.h>
#include <linux/signal.h>
#include <linux/highmem.h>
#include <linux/file.h>
A
Al Viro 已提交
75
#include <linux/fdtable.h>
L
Linus Torvalds 已提交
76 77
#include <linux/times.h>
#include <linux/cpuset.h>
78
#include <linux/rcupdate.h>
79
#include <linux/delayacct.h>
80
#include <linux/seq_file.h>
81
#include <linux/pid_namespace.h>
82
#include <linux/ptrace.h>
83
#include <linux/tracehook.h>
84
#include <linux/user_namespace.h>
L
Linus Torvalds 已提交
85 86 87 88 89

#include <asm/pgtable.h>
#include <asm/processor.h>
#include "internal.h"

90
static inline void task_name(struct seq_file *m, struct task_struct *p)
L
Linus Torvalds 已提交
91 92
{
	int i;
93
	char *buf, *end;
94
	char *name;
L
Linus Torvalds 已提交
95 96 97 98
	char tcomm[sizeof(p->comm)];

	get_task_comm(tcomm, p);

99
	seq_puts(m, "Name:\t");
100 101
	end = m->buf + m->size;
	buf = m->buf + m->count;
L
Linus Torvalds 已提交
102 103
	name = tcomm;
	i = sizeof(tcomm);
104
	while (i && (buf < end)) {
L
Linus Torvalds 已提交
105 106 107 108 109 110 111
		unsigned char c = *name;
		name++;
		i--;
		*buf = c;
		if (!c)
			break;
		if (c == '\\') {
112 113 114
			buf++;
			if (buf < end)
				*buf++ = c;
L
Linus Torvalds 已提交
115 116 117
			continue;
		}
		if (c == '\n') {
118 119 120
			*buf++ = '\\';
			if (buf < end)
				*buf++ = 'n';
L
Linus Torvalds 已提交
121 122 123
			continue;
		}
		buf++;
124 125
	}
	m->count = buf - m->buf;
126
	seq_putc(m, '\n');
L
Linus Torvalds 已提交
127 128 129 130 131 132 133 134
}

/*
 * The task state array is a strange "bitmap" of
 * reasons to sleep. Thus "running" is zero, and
 * you can test for combinations of others with
 * simple bit tests.
 */
M
Mike Frysinger 已提交
135
/*
 * Human-readable task states.  Entry 0 is "running"; entry k (k >= 1)
 * corresponds to state bit value 1 << (k - 1), as noted on each line.
 * get_task_state() checks at build time that the number of entries
 * matches 1 + ilog2(TASK_STATE_MAX).
 */
static const char * const task_state_array[] = {
	"R (running)",		/*   0 */
	"S (sleeping)",		/*   1 */
	"D (disk sleep)",	/*   2 */
	"T (stopped)",		/*   4 */
	"t (tracing stop)",	/*   8 */
	"Z (zombie)",		/*  16 */
	"X (dead)",		/*  32 */
	"x (dead)",		/*  64 */
	"K (wakekill)",		/* 128 */
	"W (waking)",		/* 256 */
};

148
static inline const char *get_task_state(struct task_struct *tsk)
L
Linus Torvalds 已提交
149
{
M
Matthew Wilcox 已提交
150
	unsigned int state = (tsk->state & TASK_REPORT) | tsk->exit_state;
M
Mike Frysinger 已提交
151
	const char * const *p = &task_state_array[0];
L
Linus Torvalds 已提交
152

153 154
	BUILD_BUG_ON(1 + ilog2(TASK_STATE_MAX) != ARRAY_SIZE(task_state_array));

L
Linus Torvalds 已提交
155 156 157 158 159 160 161
	while (state) {
		p++;
		state >>= 1;
	}
	return *p;
}

162 163
static inline void task_state(struct seq_file *m, struct pid_namespace *ns,
				struct pid *pid, struct task_struct *p)
L
Linus Torvalds 已提交
164
{
165
	struct user_namespace *user_ns = current_user_ns();
L
Linus Torvalds 已提交
166 167
	struct group_info *group_info;
	int g;
168
	struct fdtable *fdt = NULL;
169
	const struct cred *cred;
170
	pid_t ppid, tpid;
L
Linus Torvalds 已提交
171

172
	rcu_read_lock();
173 174
	ppid = pid_alive(p) ?
		task_tgid_nr_ns(rcu_dereference(p->real_parent), ns) : 0;
175 176
	tpid = 0;
	if (pid_alive(p)) {
177
		struct task_struct *tracer = ptrace_parent(p);
178 179 180
		if (tracer)
			tpid = task_pid_nr_ns(tracer, ns);
	}
181
	cred = get_task_cred(p);
182
	seq_printf(m,
L
Linus Torvalds 已提交
183 184 185 186 187 188 189 190
		"State:\t%s\n"
		"Tgid:\t%d\n"
		"Pid:\t%d\n"
		"PPid:\t%d\n"
		"TracerPid:\t%d\n"
		"Uid:\t%d\t%d\t%d\t%d\n"
		"Gid:\t%d\t%d\t%d\t%d\n",
		get_task_state(p),
191
		task_tgid_nr_ns(p, ns),
192
		pid_nr_ns(pid, ns),
193
		ppid, tpid,
194 195 196 197 198 199 200 201
		from_kuid_munged(user_ns, cred->uid),
		from_kuid_munged(user_ns, cred->euid),
		from_kuid_munged(user_ns, cred->suid),
		from_kuid_munged(user_ns, cred->fsuid),
		from_kgid_munged(user_ns, cred->gid),
		from_kgid_munged(user_ns, cred->egid),
		from_kgid_munged(user_ns, cred->sgid),
		from_kgid_munged(user_ns, cred->fsgid));
202

L
Linus Torvalds 已提交
203
	task_lock(p);
204 205
	if (p->files)
		fdt = files_fdtable(p->files);
206
	seq_printf(m,
L
Linus Torvalds 已提交
207 208
		"FDSize:\t%d\n"
		"Groups:\t",
209
		fdt ? fdt->max_fds : 0);
210
	rcu_read_unlock();
L
Linus Torvalds 已提交
211

212
	group_info = cred->group_info;
L
Linus Torvalds 已提交
213 214
	task_unlock(p);

215
	for (g = 0; g < min(group_info->ngroups, NGROUPS_SMALL); g++)
216 217
		seq_printf(m, "%d ",
			   from_kgid_munged(user_ns, GROUP_AT(group_info, g)));
218
	put_cred(cred);
L
Linus Torvalds 已提交
219

220
	seq_putc(m, '\n');
L
Linus Torvalds 已提交
221 222
}

223 224
/*
 * Print @header followed by the signal set @set as hexadecimal digits
 * and a newline.
 *
 * Signals are consumed four at a time starting from the top (_NSIG)
 * and working down to signal 1, so the most significant digit comes
 * first.  Within each digit, bit 0 is the lowest-numbered signal of the
 * group.
 * NOTE(review): the loop shape assumes _NSIG is a multiple of 4 — confirm.
 */
static void render_sigset_t(struct seq_file *m, const char *header,
				sigset_t *set)
{
	int i;

	seq_puts(m, header);

	i = _NSIG;
	do {
		int x = 0;

		i -= 4;
		if (sigismember(set, i+1))
			x |= 1;
		if (sigismember(set, i+2))
			x |= 2;
		if (sigismember(set, i+3))
			x |= 4;
		if (sigismember(set, i+4))
			x |= 8;
		seq_printf(m, "%x", x);
	} while (i >= 4);

	seq_putc(m, '\n');
}

/*
 * Classify every signal 1.._NSIG of task @p by its installed handler:
 * signals whose handler is SIG_IGN are added to @ign, signals with any
 * handler other than SIG_DFL are added to @catch.  Signals left at
 * SIG_DFL are added to neither set.  The sets are only added to, never
 * cleared, so callers pass them in already initialised.
 */
static void collect_sigign_sigcatch(struct task_struct *p, sigset_t *ign,
				    sigset_t *catch)
{
	struct k_sigaction *actions = p->sighand->action;
	int sig;

	for (sig = 1; sig <= _NSIG; sig++) {
		/* action[] is 0-based while signal numbers start at 1. */
		const struct k_sigaction *ka = &actions[sig - 1];

		if (ka->sa.sa_handler == SIG_IGN) {
			sigaddset(ign, sig);
			continue;
		}
		if (ka->sa.sa_handler != SIG_DFL)
			sigaddset(catch, sig);
	}
}

260
static inline void task_sig(struct seq_file *m, struct task_struct *p)
L
Linus Torvalds 已提交
261
{
262
	unsigned long flags;
L
Linus Torvalds 已提交
263 264 265 266 267 268 269 270 271 272 273
	sigset_t pending, shpending, blocked, ignored, caught;
	int num_threads = 0;
	unsigned long qsize = 0;
	unsigned long qlim = 0;

	sigemptyset(&pending);
	sigemptyset(&shpending);
	sigemptyset(&blocked);
	sigemptyset(&ignored);
	sigemptyset(&caught);

274
	if (lock_task_sighand(p, &flags)) {
L
Linus Torvalds 已提交
275 276 277 278
		pending = p->pending.signal;
		shpending = p->signal->shared_pending.signal;
		blocked = p->blocked;
		collect_sigign_sigcatch(p, &ignored, &caught);
279
		num_threads = get_nr_threads(p);
280
		rcu_read_lock();  /* FIXME: is this correct? */
281
		qsize = atomic_read(&__task_cred(p)->user->sigpending);
282
		rcu_read_unlock();
J
Jiri Slaby 已提交
283
		qlim = task_rlimit(p, RLIMIT_SIGPENDING);
284
		unlock_task_sighand(p, &flags);
L
Linus Torvalds 已提交
285 286
	}

287 288
	seq_printf(m, "Threads:\t%d\n", num_threads);
	seq_printf(m, "SigQ:\t%lu/%lu\n", qsize, qlim);
L
Linus Torvalds 已提交
289 290

	/* render them all */
291 292 293 294 295
	render_sigset_t(m, "SigPnd:\t", &pending);
	render_sigset_t(m, "ShdPnd:\t", &shpending);
	render_sigset_t(m, "SigBlk:\t", &blocked);
	render_sigset_t(m, "SigIgn:\t", &ignored);
	render_sigset_t(m, "SigCgt:\t", &caught);
L
Linus Torvalds 已提交
296 297
}

298 299
/*
 * Print @header followed by capability set @a as zero-padded 8-digit
 * hex words and a newline.  Words are emitted from the highest index
 * (_KERNEL_CAPABILITY_U32S - 1) down to index 0.
 */
static void render_cap_t(struct seq_file *m, const char *header,
			kernel_cap_t *a)
{
	unsigned __capi;

	seq_puts(m, header);
	CAP_FOR_EACH_U32(__capi) {
		seq_printf(m, "%08x",
			   a->cap[(_KERNEL_CAPABILITY_U32S-1) - __capi]);
	}
	seq_putc(m, '\n');
}

311 312 313 314
/*
 * Remove non-existent capabilities: in the word of @v that holds
 * CAP_LAST_CAP, keep only the bits below CAP_TO_MASK(CAP_LAST_CAP + 1).
 * @v is modified in place and must be an lvalue of a type with a .cap[]
 * member.
 * NOTE(review): presumably misbehaves if CAP_LAST_CAP + 1 lands on a
 * word boundary — confirm against the CAP_TO_MASK definition.
 */
#define NORM_CAPS(v) ((v).cap[CAP_TO_INDEX(CAP_LAST_CAP)] &= \
				CAP_TO_MASK(CAP_LAST_CAP + 1) - 1)

315
static inline void task_cap(struct seq_file *m, struct task_struct *p)
L
Linus Torvalds 已提交
316
{
317 318
	const struct cred *cred;
	kernel_cap_t cap_inheritable, cap_permitted, cap_effective, cap_bset;
319

320 321 322 323 324 325 326 327
	rcu_read_lock();
	cred = __task_cred(p);
	cap_inheritable	= cred->cap_inheritable;
	cap_permitted	= cred->cap_permitted;
	cap_effective	= cred->cap_effective;
	cap_bset	= cred->cap_bset;
	rcu_read_unlock();

328 329 330 331 332
	NORM_CAPS(cap_inheritable);
	NORM_CAPS(cap_permitted);
	NORM_CAPS(cap_effective);
	NORM_CAPS(cap_bset);

333 334 335 336
	render_cap_t(m, "CapInh:\t", &cap_inheritable);
	render_cap_t(m, "CapPrm:\t", &cap_permitted);
	render_cap_t(m, "CapEff:\t", &cap_effective);
	render_cap_t(m, "CapBnd:\t", &cap_bset);
L
Linus Torvalds 已提交
337 338
}

339 340
static inline void task_context_switch_counts(struct seq_file *m,
						struct task_struct *p)
341
{
342 343 344 345
	seq_printf(m,	"voluntary_ctxt_switches:\t%lu\n"
			"nonvoluntary_ctxt_switches:\t%lu\n",
			p->nvcsw,
			p->nivcsw);
346 347
}

348 349
static void task_cpus_allowed(struct seq_file *m, struct task_struct *task)
{
350
	seq_puts(m, "Cpus_allowed:\t");
351
	seq_cpumask(m, &task->cpus_allowed);
352 353
	seq_putc(m, '\n');
	seq_puts(m, "Cpus_allowed_list:\t");
354
	seq_cpumask_list(m, &task->cpus_allowed);
355
	seq_putc(m, '\n');
356 357
}

358 359
/*
 * Produce the multi-line status report for @task into @m by calling the
 * section helpers in a fixed order: name, state, memory (only when the
 * task still has an mm), signals, capabilities, allowed CPUs, cpuset
 * status and context switch counts.
 *
 * The mm reference taken with get_task_mm() is dropped with mmput() as
 * soon as task_mem() has run.  Always returns 0.
 */
int proc_pid_status(struct seq_file *m, struct pid_namespace *ns,
			struct pid *pid, struct task_struct *task)
{
	struct mm_struct *mm = get_task_mm(task);

	task_name(m, task);
	task_state(m, ns, pid, task);

	if (mm) {
		task_mem(m, mm);
		mmput(mm);
	}
	task_sig(m, task);
	task_cap(m, task);
	task_cpus_allowed(m, task);
	cpuset_task_status_allowed(m, task);
	task_context_switch_counts(m, task);
	return 0;
}

378 379
static int do_task_stat(struct seq_file *m, struct pid_namespace *ns,
			struct pid *pid, struct task_struct *task, int whole)
L
Linus Torvalds 已提交
380 381
{
	unsigned long vsize, eip, esp, wchan = ~0UL;
382
	int priority, nice;
L
Linus Torvalds 已提交
383 384 385
	int tty_pgrp = -1, tty_nr = 0;
	sigset_t sigign, sigcatch;
	char state;
386
	pid_t ppid = 0, pgid = -1, sid = -1;
L
Linus Torvalds 已提交
387
	int num_threads = 0;
388
	int permitted;
L
Linus Torvalds 已提交
389 390 391 392
	struct mm_struct *mm;
	unsigned long long start_time;
	unsigned long cmin_flt = 0, cmaj_flt = 0;
	unsigned long  min_flt = 0,  maj_flt = 0;
393
	cputime_t cutime, cstime, utime, stime;
394
	cputime_t cgtime, gtime;
L
Linus Torvalds 已提交
395 396
	unsigned long rsslim = 0;
	char tcomm[sizeof(task->comm)];
397
	unsigned long flags;
L
Linus Torvalds 已提交
398 399 400

	state = *get_task_state(task);
	vsize = eip = esp = 0;
401
	permitted = ptrace_may_access(task, PTRACE_MODE_READ | PTRACE_MODE_NOAUDIT);
L
Linus Torvalds 已提交
402 403 404
	mm = get_task_mm(task);
	if (mm) {
		vsize = task_vsize(mm);
405 406 407 408
		if (permitted) {
			eip = KSTK_EIP(task);
			esp = KSTK_ESP(task);
		}
L
Linus Torvalds 已提交
409 410 411 412 413 414
	}

	get_task_comm(tcomm, task);

	sigemptyset(&sigign);
	sigemptyset(&sigcatch);
415 416
	cutime = cstime = utime = stime = 0;
	cgtime = gtime = 0;
417

418 419
	if (lock_task_sighand(task, &flags)) {
		struct signal_struct *sig = task->signal;
420 421

		if (sig->tty) {
422 423 424
			struct pid *pgrp = tty_get_pgrp(sig->tty);
			tty_pgrp = pid_nr_ns(pgrp, ns);
			put_pid(pgrp);
425
			tty_nr = new_encode_dev(tty_devnum(sig->tty));
426 427
		}

428
		num_threads = get_nr_threads(task);
L
Linus Torvalds 已提交
429 430
		collect_sigign_sigcatch(task, &sigign, &sigcatch);

431 432 433 434
		cmin_flt = sig->cmin_flt;
		cmaj_flt = sig->cmaj_flt;
		cutime = sig->cutime;
		cstime = sig->cstime;
435
		cgtime = sig->cgtime;
J
Jiri Slaby 已提交
436
		rsslim = ACCESS_ONCE(sig->rlim[RLIMIT_RSS].rlim_cur);
437

L
Linus Torvalds 已提交
438 439
		/* add up live thread stats at the group level */
		if (whole) {
440
			struct task_struct *t = task;
L
Linus Torvalds 已提交
441 442 443
			do {
				min_flt += t->min_flt;
				maj_flt += t->maj_flt;
444
				gtime += t->gtime;
L
Linus Torvalds 已提交
445 446 447
				t = next_thread(t);
			} while (t != task);

448 449
			min_flt += sig->min_flt;
			maj_flt += sig->maj_flt;
450
			thread_group_cputime_adjusted(task, &utime, &stime);
451
			gtime += sig->gtime;
L
Linus Torvalds 已提交
452
		}
453

454
		sid = task_session_nr_ns(task, ns);
455
		ppid = task_tgid_nr_ns(task->real_parent, ns);
456
		pgid = task_pgrp_nr_ns(task, ns);
457 458

		unlock_task_sighand(task, &flags);
L
Linus Torvalds 已提交
459 460
	}

461
	if (permitted && (!whole || num_threads < 2))
L
Linus Torvalds 已提交
462 463 464 465
		wchan = get_wchan(task);
	if (!whole) {
		min_flt = task->min_flt;
		maj_flt = task->maj_flt;
466
		task_cputime_adjusted(task, &utime, &stime);
H
Hidetoshi Seto 已提交
467
		gtime = task->gtime;
L
Linus Torvalds 已提交
468 469 470 471 472 473 474 475 476
	}

	/* scale priority and nice values from timeslices to -20..20 */
	/* to make it look like a "normal" Unix priority/nice value  */
	priority = task_prio(task);
	nice = task_nice(task);

	/* Temporary variable needed for gcc-2.96 */
	/* convert timespec -> nsec*/
477 478 479
	start_time =
		(unsigned long long)task->real_start_time.tv_sec * NSEC_PER_SEC
				+ task->real_start_time.tv_nsec;
L
Linus Torvalds 已提交
480 481 482
	/* convert nsec -> ticks */
	start_time = nsec_to_clock_t(start_time);

483 484 485 486 487 488 489 490 491 492 493 494 495 496 497 498 499 500 501 502 503
	seq_printf(m, "%d (%s) %c", pid_nr_ns(pid, ns), tcomm, state);
	seq_put_decimal_ll(m, ' ', ppid);
	seq_put_decimal_ll(m, ' ', pgid);
	seq_put_decimal_ll(m, ' ', sid);
	seq_put_decimal_ll(m, ' ', tty_nr);
	seq_put_decimal_ll(m, ' ', tty_pgrp);
	seq_put_decimal_ull(m, ' ', task->flags);
	seq_put_decimal_ull(m, ' ', min_flt);
	seq_put_decimal_ull(m, ' ', cmin_flt);
	seq_put_decimal_ull(m, ' ', maj_flt);
	seq_put_decimal_ull(m, ' ', cmaj_flt);
	seq_put_decimal_ull(m, ' ', cputime_to_clock_t(utime));
	seq_put_decimal_ull(m, ' ', cputime_to_clock_t(stime));
	seq_put_decimal_ll(m, ' ', cputime_to_clock_t(cutime));
	seq_put_decimal_ll(m, ' ', cputime_to_clock_t(cstime));
	seq_put_decimal_ll(m, ' ', priority);
	seq_put_decimal_ll(m, ' ', nice);
	seq_put_decimal_ll(m, ' ', num_threads);
	seq_put_decimal_ull(m, ' ', 0);
	seq_put_decimal_ull(m, ' ', start_time);
	seq_put_decimal_ull(m, ' ', vsize);
504
	seq_put_decimal_ull(m, ' ', mm ? get_mm_rss(mm) : 0);
505 506 507 508 509 510 511 512 513 514 515 516 517 518 519 520 521 522 523 524 525 526 527 528
	seq_put_decimal_ull(m, ' ', rsslim);
	seq_put_decimal_ull(m, ' ', mm ? (permitted ? mm->start_code : 1) : 0);
	seq_put_decimal_ull(m, ' ', mm ? (permitted ? mm->end_code : 1) : 0);
	seq_put_decimal_ull(m, ' ', (permitted && mm) ? mm->start_stack : 0);
	seq_put_decimal_ull(m, ' ', esp);
	seq_put_decimal_ull(m, ' ', eip);
	/* The signal information here is obsolete.
	 * It must be decimal for Linux 2.0 compatibility.
	 * Use /proc/#/status for real-time signals.
	 */
	seq_put_decimal_ull(m, ' ', task->pending.signal.sig[0] & 0x7fffffffUL);
	seq_put_decimal_ull(m, ' ', task->blocked.sig[0] & 0x7fffffffUL);
	seq_put_decimal_ull(m, ' ', sigign.sig[0] & 0x7fffffffUL);
	seq_put_decimal_ull(m, ' ', sigcatch.sig[0] & 0x7fffffffUL);
	seq_put_decimal_ull(m, ' ', wchan);
	seq_put_decimal_ull(m, ' ', 0);
	seq_put_decimal_ull(m, ' ', 0);
	seq_put_decimal_ll(m, ' ', task->exit_signal);
	seq_put_decimal_ll(m, ' ', task_cpu(task));
	seq_put_decimal_ull(m, ' ', task->rt_priority);
	seq_put_decimal_ull(m, ' ', task->policy);
	seq_put_decimal_ull(m, ' ', delayacct_blkio_ticks(task));
	seq_put_decimal_ull(m, ' ', cputime_to_clock_t(gtime));
	seq_put_decimal_ll(m, ' ', cputime_to_clock_t(cgtime));
529 530 531 532 533 534 535 536 537 538 539 540 541 542 543 544 545

	if (mm && permitted) {
		seq_put_decimal_ull(m, ' ', mm->start_data);
		seq_put_decimal_ull(m, ' ', mm->end_data);
		seq_put_decimal_ull(m, ' ', mm->start_brk);
		seq_put_decimal_ull(m, ' ', mm->arg_start);
		seq_put_decimal_ull(m, ' ', mm->arg_end);
		seq_put_decimal_ull(m, ' ', mm->env_start);
		seq_put_decimal_ull(m, ' ', mm->env_end);
	} else
		seq_printf(m, " 0 0 0 0 0 0 0");

	if (permitted)
		seq_put_decimal_ll(m, ' ', task->exit_code);
	else
		seq_put_decimal_ll(m, ' ', 0);

546
	seq_putc(m, '\n');
547
	if (mm)
L
Linus Torvalds 已提交
548
		mmput(mm);
549
	return 0;
L
Linus Torvalds 已提交
550 551
}

552 553
/*
 * Per-thread stat record: do_task_stat() with whole == 0, so only
 * @task's own counters are reported.
 */
int proc_tid_stat(struct seq_file *m, struct pid_namespace *ns,
			struct pid *pid, struct task_struct *task)
{
	return do_task_stat(m, ns, pid, task, 0);
}

558 559
/*
 * Thread-group stat record: do_task_stat() with whole == 1, so counters
 * are summed across the whole thread group.
 */
int proc_tgid_stat(struct seq_file *m, struct pid_namespace *ns,
			struct pid *pid, struct task_struct *task)
{
	return do_task_stat(m, ns, pid, task, 1);
}

564 565
/*
 * Emit the one-line statm record for @task: seven space-separated
 * numbers "size resident shared text 0 data 0".
 *
 * The values come from task_statm(); all of them are 0 when the task
 * has no mm.  The mm reference is dropped before anything is printed.
 * Always returns 0.
 */
int proc_pid_statm(struct seq_file *m, struct pid_namespace *ns,
			struct pid *pid, struct task_struct *task)
{
	unsigned long size = 0, resident = 0, shared = 0, text = 0, data = 0;
	struct mm_struct *mm = get_task_mm(task);

	if (mm) {
		size = task_statm(mm, &shared, &text, &data, &resident);
		mmput(mm);
	}
	/*
	 * For quick read, open code by putting numbers directly
	 * expected format is
	 * seq_printf(m, "%lu %lu %lu %lu 0 %lu 0\n",
	 *               size, resident, shared, text, data);
	 */
	seq_put_decimal_ull(m, 0, size);
	seq_put_decimal_ull(m, ' ', resident);
	seq_put_decimal_ull(m, ' ', shared);
	seq_put_decimal_ull(m, ' ', text);
	seq_put_decimal_ull(m, ' ', 0);
	seq_put_decimal_ull(m, ' ', data);
	seq_put_decimal_ull(m, ' ', 0);
	seq_putc(m, '\n');

	return 0;
}
591 592 593 594 595 596 597 598 599 600 601 602 603 604 605 606 607 608 609 610 611 612 613 614 615 616 617 618 619 620 621 622 623 624 625 626 627 628 629 630 631 632 633 634 635 636 637 638 639 640 641 642 643 644 645 646 647 648 649 650 651 652 653 654 655 656 657 658 659 660 661 662 663 664 665 666 667 668 669 670 671 672 673 674 675 676 677 678 679 680 681 682 683 684 685 686 687 688 689 690 691 692 693 694 695 696 697 698 699 700 701 702 703 704 705 706 707 708 709 710 711 712 713

#ifdef CONFIG_CHECKPOINT_RESTORE
/*
 * Find one child of the task behind @inode, under tasklist_lock.
 *
 * @pid_prev: pid returned by the previous step, or NULL
 * @pos:      zero-based index of the wanted child, used by the slow path
 *
 * Returns the child's struct pid with a reference taken via get_pid(),
 * or NULL when the parent task is gone or there is no such child.
 */
static struct pid *
get_children_pid(struct inode *inode, struct pid *pid_prev, loff_t pos)
{
	struct task_struct *parent, *child;
	struct pid *found = NULL;

	read_lock(&tasklist_lock);

	parent = pid_task(proc_pid(inode), PIDTYPE_PID);
	if (!parent)
		goto unlock;

	/*
	 * Fast path: if the previously returned task is still a linked
	 * child of the same parent, simply step to its next sibling.
	 * This is a significant speedup on children-rich processes.
	 */
	if (pid_prev) {
		struct task_struct *prev = pid_task(pid_prev, PIDTYPE_PID);

		if (prev && prev->real_parent == parent &&
		    !list_empty(&prev->sibling)) {
			/* The last child has no successor: report the end. */
			if (!list_is_last(&prev->sibling, &parent->children)) {
				child = list_first_entry(&prev->sibling,
							 struct task_struct,
							 sibling);
				found = get_pid(task_pid(child));
			}
			goto unlock;
		}
	}

	/*
	 * Slow path: walk the children list and pick the entry at index
	 * @pos.
	 *
	 * Children that exited while the lock was not held shift the
	 * remaining entries, so some children may be skipped; the result
	 * was never promised to be that accurate.
	 *
	 * "Just suppose that the parent sleeps, but N children
	 *  exit after we printed their tids. Now the slow paths
	 *  skips N extra children, we miss N tasks." (c)
	 *
	 * To get a precise result one needs to stop or freeze the leader
	 * and all of its children.
	 */
	list_for_each_entry(child, &parent->children, sibling) {
		if (pos-- != 0)
			continue;
		found = get_pid(task_pid(child));
		break;
	}

unlock:
	read_unlock(&tasklist_lock);
	return found;
}

/*
 * seq_file ->show: print the number of the pid in @v followed by a
 * space.  The number is resolved in the namespace stored in the
 * superblock's s_fs_info of the inode kept in seq->private.
 * Returns whatever seq_printf() returns.
 */
static int children_seq_show(struct seq_file *seq, void *v)
{
	struct inode *inode = seq->private;
	struct pid_namespace *ns = inode->i_sb->s_fs_info;

	return seq_printf(seq, "%d ", pid_nr_ns(v, ns));
}

/*
 * seq_file ->start: look up the child at index *pos with no previous
 * pid to continue from.  Returns the referenced struct pid, or NULL
 * when there is no child at that index.
 */
static void *children_seq_start(struct seq_file *seq, loff_t *pos)
{
	struct inode *inode = seq->private;

	return get_children_pid(inode, NULL, *pos);
}

/*
 * seq_file ->next: fetch the child that follows @v (index *pos + 1),
 * drop the reference held on @v, and advance *pos by one.
 * Returns the next referenced struct pid or NULL at the end.
 */
static void *children_seq_next(struct seq_file *seq, void *v, loff_t *pos)
{
	/* Look up the successor while @v is still referenced. */
	struct pid *next = get_children_pid(seq->private, v, *pos + 1);

	put_pid(v);
	(*pos)++;

	return next;
}

/*
 * seq_file ->stop: release the pid reference still held in @v.
 * NOTE(review): @v can be NULL when start/next found nothing;
 * presumably put_pid() tolerates that — confirm.
 */
static void children_seq_stop(struct seq_file *seq, void *v)
{
	struct pid *last = v;

	put_pid(last);
}

/* Iterator callbacks used by children_seq_open() for the children listing. */
static const struct seq_operations children_seq_ops = {
	.start = children_seq_start,
	.stop  = children_seq_stop,
	.next  = children_seq_next,
	.show  = children_seq_show,
};

/*
 * ->open: set up a seq_file using children_seq_ops and stash @inode in
 * its private pointer so the iterator callbacks can find the task.
 * Returns 0 on success or the error reported by seq_open().
 */
static int children_seq_open(struct inode *inode, struct file *file)
{
	int err = seq_open(file, &children_seq_ops);

	if (!err) {
		/* seq_open() left the new seq_file in file->private_data. */
		struct seq_file *sf = file->private_data;

		sf->private = inode;
	}

	return err;
}

/*
 * ->release: tear down the seq_file with seq_release().  The result of
 * seq_release() is not propagated; this hook always returns 0.
 */
int children_seq_release(struct inode *inode, struct file *file)
{
	(void)seq_release(inode, file);

	return 0;
}

/*
 * File operations for the per-thread children listing: a seq_file
 * opened by children_seq_open() and read/seeked with the generic
 * seq_file helpers.
 */
const struct file_operations proc_tid_children_operations = {
	.open    = children_seq_open,
	.release = children_seq_release,
	.read    = seq_read,
	.llseek  = seq_lseek,
};
#endif /* CONFIG_CHECKPOINT_RESTORE */