array.c 20.0 KB
Newer Older
L
Linus Torvalds 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42
/*
 *  linux/fs/proc/array.c
 *
 *  Copyright (C) 1992  by Linus Torvalds
 *  based on ideas by Darren Senn
 *
 * Fixes:
 * Michael. K. Johnson: stat,statm extensions.
 *                      <johnsonm@stolaf.edu>
 *
 * Pauline Middelink :  Made cmdline,envline only break at '\0's, to
 *                      make sure SET_PROCTITLE works. Also removed
 *                      bad '!' which forced address recalculation for
 *                      EVERY character on the current page.
 *                      <middelin@polyware.iaf.nl>
 *
 * Danny ter Haar    :	added cpuinfo
 *			<dth@cistron.nl>
 *
 * Alessandro Rubini :  profile extension.
 *                      <rubini@ipvvis.unipv.it>
 *
 * Jeff Tranter      :  added BogoMips field to cpuinfo
 *                      <Jeff_Tranter@Mitel.COM>
 *
 * Bruno Haible      :  remove 4K limit for the maps file
 *			<haible@ma2s2.mathematik.uni-karlsruhe.de>
 *
 * Yves Arrouye      :  remove removal of trailing spaces in get_array.
 *			<Yves.Arrouye@marin.fdn.fr>
 *
 * Jerome Forissier  :  added per-CPU time information to /proc/stat
 *                      and /proc/<pid>/cpu extension
 *                      <forissier@isia.cma.fr>
 *			- Incorporation and non-SMP safe operation
 *			of forissier patch in 2.1.78 by
 *			Hans Marcus <crowbar@concepts.nl>
 *
 * aeb@cwi.nl        :  /proc/partitions
 *
 *
 * Alan Cox	     :  security fixes.
 *			<alan@lxorguk.ukuu.org.uk>
 *
 * Al Viro           :  safe handling of mm_struct
 *
 * Gerhard Wichert   :  added BIGMEM support
 * Siemens AG           <Gerhard.Wichert@pdb.siemens.de>
 *
 * Al Viro & Jeff Garzik :  moved most of the thing into base.c and
 *			 :  proc_misc.c. The rest may eventually go into
 *			 :  base.c too.
 */

#include <linux/types.h>
#include <linux/errno.h>
#include <linux/time.h>
#include <linux/kernel.h>
#include <linux/kernel_stat.h>
#include <linux/tty.h>
#include <linux/string.h>
#include <linux/mman.h>
63
#include <linux/sched/mm.h>
64
#include <linux/sched/numa_balancing.h>
65
#include <linux/sched/task_stack.h>
66
#include <linux/sched/task.h>
67
#include <linux/sched/cputime.h>
L
Linus Torvalds 已提交
68 69
#include <linux/proc_fs.h>
#include <linux/ioport.h>
70 71
#include <linux/uaccess.h>
#include <linux/io.h>
L
Linus Torvalds 已提交
72 73 74 75 76 77 78 79
#include <linux/mm.h>
#include <linux/hugetlb.h>
#include <linux/pagemap.h>
#include <linux/swap.h>
#include <linux/smp.h>
#include <linux/signal.h>
#include <linux/highmem.h>
#include <linux/file.h>
A
Al Viro 已提交
80
#include <linux/fdtable.h>
L
Linus Torvalds 已提交
81 82
#include <linux/times.h>
#include <linux/cpuset.h>
83
#include <linux/rcupdate.h>
84
#include <linux/delayacct.h>
85
#include <linux/seq_file.h>
86
#include <linux/pid_namespace.h>
87
#include <linux/ptrace.h>
88
#include <linux/tracehook.h>
89
#include <linux/string_helpers.h>
90
#include <linux/user_namespace.h>
91
#include <linux/fs_struct.h>
L
Linus Torvalds 已提交
92 93 94 95 96

#include <asm/pgtable.h>
#include <asm/processor.h>
#include "internal.h"

97
static inline void task_name(struct seq_file *m, struct task_struct *p)
L
Linus Torvalds 已提交
98
{
99
	char *buf;
100
	size_t size;
L
Linus Torvalds 已提交
101
	char tcomm[sizeof(p->comm)];
102
	int ret;
L
Linus Torvalds 已提交
103 104 105

	get_task_comm(tcomm, p);

106
	seq_puts(m, "Name:\t");
107

108 109 110
	size = seq_get_buf(m, &buf);
	ret = string_escape_str(tcomm, buf, size, ESCAPE_SPACE | ESCAPE_SPECIAL, "\n\\");
	seq_commit(m, ret < size ? ret : -1);
111

112
	seq_putc(m, '\n');
L
Linus Torvalds 已提交
113 114 115 116 117 118 119 120
}

/*
 * The task state array is a strange "bitmap" of
 * reasons to sleep. Thus "running" is zero, and
 * you can test for combinations of others with
 * simple bit tests.
 */
M
Mike Frysinger 已提交
121
/*
 * State labels printed by this file.  get_task_state() indexes this table
 * with the value returned by __get_task_state(); the number in the comment
 * after each entry is the state bit value that entry stands for.
 */
static const char * const task_state_array[] = {
	"R (running)",		/*   0 */
	"S (sleeping)",		/*   1 */
	"D (disk sleep)",	/*   2 */
	"T (stopped)",		/*   4 */
	"t (tracing stop)",	/*   8 */
	"X (dead)",		/*  16 */
	"Z (zombie)",		/*  32 */
};

131
static inline const char *get_task_state(struct task_struct *tsk)
L
Linus Torvalds 已提交
132
{
133 134
	BUILD_BUG_ON(1 + ilog2(TASK_REPORT) != ARRAY_SIZE(task_state_array) - 1);
	return task_state_array[__get_task_state(tsk)];
L
Linus Torvalds 已提交
135 136
}

137 138 139 140 141 142 143 144 145 146 147 148 149
/*
 * Read the umask of @tsk under task_lock().
 *
 * Returns the umask, or -ENOENT when the task has no fs_struct.
 */
static inline int get_task_umask(struct task_struct *tsk)
{
	struct fs_struct *fs;
	int mask;

	task_lock(tsk);
	fs = tsk->fs;
	mask = fs ? fs->umask : -ENOENT;
	task_unlock(tsk);

	return mask;
}

150 151
static inline void task_state(struct seq_file *m, struct pid_namespace *ns,
				struct pid *pid, struct task_struct *p)
L
Linus Torvalds 已提交
152
{
153
	struct user_namespace *user_ns = seq_user_ns(m);
L
Linus Torvalds 已提交
154
	struct group_info *group_info;
155
	int g, umask;
156
	struct task_struct *tracer;
157
	const struct cred *cred;
158
	pid_t ppid, tpid = 0, tgid, ngid;
159
	unsigned int max_fds = 0;
L
Linus Torvalds 已提交
160

161
	rcu_read_lock();
162 163
	ppid = pid_alive(p) ?
		task_tgid_nr_ns(rcu_dereference(p->real_parent), ns) : 0;
164 165 166 167

	tracer = ptrace_parent(p);
	if (tracer)
		tpid = task_pid_nr_ns(tracer, ns);
168 169 170

	tgid = task_tgid_nr_ns(p, ns);
	ngid = task_numa_group_id(p);
171
	cred = get_task_cred(p);
172

173 174 175 176
	umask = get_task_umask(p);
	if (umask >= 0)
		seq_printf(m, "Umask:\t%#04o\n", umask);

177 178 179 180
	task_lock(p);
	if (p->files)
		max_fds = files_fdtable(p->files)->max_fds;
	task_unlock(p);
181
	rcu_read_unlock();
182

A
Alexey Dobriyan 已提交
183 184
	seq_printf(m, "State:\t%s", get_task_state(p));

185 186 187 188 189 190 191 192 193 194 195 196 197 198
	seq_put_decimal_ull(m, "\nTgid:\t", tgid);
	seq_put_decimal_ull(m, "\nNgid:\t", ngid);
	seq_put_decimal_ull(m, "\nPid:\t", pid_nr_ns(pid, ns));
	seq_put_decimal_ull(m, "\nPPid:\t", ppid);
	seq_put_decimal_ull(m, "\nTracerPid:\t", tpid);
	seq_put_decimal_ull(m, "\nUid:\t", from_kuid_munged(user_ns, cred->uid));
	seq_put_decimal_ull(m, "\t", from_kuid_munged(user_ns, cred->euid));
	seq_put_decimal_ull(m, "\t", from_kuid_munged(user_ns, cred->suid));
	seq_put_decimal_ull(m, "\t", from_kuid_munged(user_ns, cred->fsuid));
	seq_put_decimal_ull(m, "\nGid:\t", from_kgid_munged(user_ns, cred->gid));
	seq_put_decimal_ull(m, "\t", from_kgid_munged(user_ns, cred->egid));
	seq_put_decimal_ull(m, "\t", from_kgid_munged(user_ns, cred->sgid));
	seq_put_decimal_ull(m, "\t", from_kgid_munged(user_ns, cred->fsgid));
	seq_put_decimal_ull(m, "\nFDSize:\t", max_fds);
A
Alexey Dobriyan 已提交
199 200

	seq_puts(m, "\nGroups:\t");
201
	group_info = cred->group_info;
202
	for (g = 0; g < group_info->ngroups; g++)
203
		seq_put_decimal_ull(m, g ? " " : "",
204
				from_kgid_munged(user_ns, group_info->gid[g]));
205
	put_cred(cred);
A
Alexey Dobriyan 已提交
206 207
	/* Trailing space shouldn't have been added in the first place. */
	seq_putc(m, ' ');
L
Linus Torvalds 已提交
208

209 210 211
#ifdef CONFIG_PID_NS
	seq_puts(m, "\nNStgid:");
	for (g = ns->level; g <= pid->level; g++)
212
		seq_put_decimal_ull(m, "\t", task_tgid_nr_ns(p, pid->numbers[g].ns));
213 214
	seq_puts(m, "\nNSpid:");
	for (g = ns->level; g <= pid->level; g++)
215
		seq_put_decimal_ull(m, "\t", task_pid_nr_ns(p, pid->numbers[g].ns));
216 217
	seq_puts(m, "\nNSpgid:");
	for (g = ns->level; g <= pid->level; g++)
218
		seq_put_decimal_ull(m, "\t", task_pgrp_nr_ns(p, pid->numbers[g].ns));
219 220
	seq_puts(m, "\nNSsid:");
	for (g = ns->level; g <= pid->level; g++)
221
		seq_put_decimal_ull(m, "\t", task_session_nr_ns(p, pid->numbers[g].ns));
222
#endif
223
	seq_putc(m, '\n');
L
Linus Torvalds 已提交
224 225
}

226
void render_sigset_t(struct seq_file *m, const char *header,
227
				sigset_t *set)
L
Linus Torvalds 已提交
228
{
229
	int i;
L
Linus Torvalds 已提交
230

231
	seq_puts(m, header);
L
Linus Torvalds 已提交
232 233 234 235 236 237 238 239 240 241

	i = _NSIG;
	do {
		int x = 0;

		i -= 4;
		if (sigismember(set, i+1)) x |= 1;
		if (sigismember(set, i+2)) x |= 2;
		if (sigismember(set, i+3)) x |= 4;
		if (sigismember(set, i+4)) x |= 8;
242
		seq_putc(m, hex_asc[x]);
L
Linus Torvalds 已提交
243 244
	} while (i >= 4);

245
	seq_putc(m, '\n');
L
Linus Torvalds 已提交
246 247 248 249 250 251 252 253 254 255 256 257 258 259 260 261 262
}

/*
 * Walk the signal action table of @p and sort every signal 1.._NSIG into
 * @ign (handler is SIG_IGN) or @catch (handler is neither SIG_IGN nor
 * SIG_DFL).  Signals left at SIG_DFL are added to neither set.
 *
 * The sets are only added to, never cleared, so callers pass in emptied
 * sets.
 */
static void collect_sigign_sigcatch(struct task_struct *p, sigset_t *ign,
				    sigset_t *catch)
{
	struct k_sigaction *actions = p->sighand->action;
	int sig;

	for (sig = 1; sig <= _NSIG; sig++) {
		/* Table is 0-based, signal numbers are 1-based. */
		struct k_sigaction *ka = &actions[sig - 1];

		if (ka->sa.sa_handler == SIG_IGN) {
			sigaddset(ign, sig);
			continue;
		}
		if (ka->sa.sa_handler != SIG_DFL)
			sigaddset(catch, sig);
	}
}

263
static inline void task_sig(struct seq_file *m, struct task_struct *p)
L
Linus Torvalds 已提交
264
{
265
	unsigned long flags;
L
Linus Torvalds 已提交
266 267 268 269 270 271 272 273 274 275 276
	sigset_t pending, shpending, blocked, ignored, caught;
	int num_threads = 0;
	unsigned long qsize = 0;
	unsigned long qlim = 0;

	sigemptyset(&pending);
	sigemptyset(&shpending);
	sigemptyset(&blocked);
	sigemptyset(&ignored);
	sigemptyset(&caught);

277
	if (lock_task_sighand(p, &flags)) {
L
Linus Torvalds 已提交
278 279 280 281
		pending = p->pending.signal;
		shpending = p->signal->shared_pending.signal;
		blocked = p->blocked;
		collect_sigign_sigcatch(p, &ignored, &caught);
282
		num_threads = get_nr_threads(p);
283
		rcu_read_lock();  /* FIXME: is this correct? */
284
		qsize = atomic_read(&__task_cred(p)->user->sigpending);
285
		rcu_read_unlock();
J
Jiri Slaby 已提交
286
		qlim = task_rlimit(p, RLIMIT_SIGPENDING);
287
		unlock_task_sighand(p, &flags);
L
Linus Torvalds 已提交
288 289
	}

290 291 292
	seq_put_decimal_ull(m, "Threads:\t", num_threads);
	seq_put_decimal_ull(m, "\nSigQ:\t", qsize);
	seq_put_decimal_ull(m, "/", qlim);
L
Linus Torvalds 已提交
293 294

	/* render them all */
A
Alexey Dobriyan 已提交
295
	render_sigset_t(m, "\nSigPnd:\t", &pending);
296 297 298 299
	render_sigset_t(m, "ShdPnd:\t", &shpending);
	render_sigset_t(m, "SigBlk:\t", &blocked);
	render_sigset_t(m, "SigIgn:\t", &ignored);
	render_sigset_t(m, "SigCgt:\t", &caught);
L
Linus Torvalds 已提交
300 301
}

302 303
/*
 * Print @header followed by capability set @a as zero-padded 8-digit hex
 * words and a newline.  Words are emitted using the index
 * CAP_LAST_U32 - word for each word visited by CAP_FOR_EACH_U32().
 */
static void render_cap_t(struct seq_file *m, const char *header,
			kernel_cap_t *a)
{
	unsigned int word;

	seq_puts(m, header);

	CAP_FOR_EACH_U32(word)
		seq_printf(m, "%08x", a->cap[CAP_LAST_U32 - word]);

	seq_putc(m, '\n');
}

315
static inline void task_cap(struct seq_file *m, struct task_struct *p)
L
Linus Torvalds 已提交
316
{
317
	const struct cred *cred;
318 319
	kernel_cap_t cap_inheritable, cap_permitted, cap_effective,
			cap_bset, cap_ambient;
320

321 322 323 324 325 326
	rcu_read_lock();
	cred = __task_cred(p);
	cap_inheritable	= cred->cap_inheritable;
	cap_permitted	= cred->cap_permitted;
	cap_effective	= cred->cap_effective;
	cap_bset	= cred->cap_bset;
327
	cap_ambient	= cred->cap_ambient;
328 329 330 331 332 333
	rcu_read_unlock();

	render_cap_t(m, "CapInh:\t", &cap_inheritable);
	render_cap_t(m, "CapPrm:\t", &cap_permitted);
	render_cap_t(m, "CapEff:\t", &cap_effective);
	render_cap_t(m, "CapBnd:\t", &cap_bset);
334
	render_cap_t(m, "CapAmb:\t", &cap_ambient);
L
Linus Torvalds 已提交
335 336
}

K
Kees Cook 已提交
337 338
/*
 * Emit the NoNewPrivs line and, when CONFIG_SECCOMP is enabled, the
 * Seccomp mode line for task @p.
 */
static inline void task_seccomp(struct seq_file *m, struct task_struct *p)
{
	unsigned long long no_new_privs = task_no_new_privs(p);

	seq_put_decimal_ull(m, "NoNewPrivs:\t", no_new_privs);
#ifdef CONFIG_SECCOMP
	/* The leading newline finishes the NoNewPrivs line. */
	seq_put_decimal_ull(m, "\nSeccomp:\t", p->seccomp.mode);
#endif
	seq_putc(m, '\n');
}

346 347
static inline void task_context_switch_counts(struct seq_file *m,
						struct task_struct *p)
348
{
349 350
	seq_put_decimal_ull(m, "voluntary_ctxt_switches:\t", p->nvcsw);
	seq_put_decimal_ull(m, "\nnonvoluntary_ctxt_switches:\t", p->nivcsw);
A
Alexey Dobriyan 已提交
351
	seq_putc(m, '\n');
352 353
}

354 355
/*
 * Emit the CPU affinity mask of @task twice: once with the %*pb format
 * (Cpus_allowed) and once with the %*pbl format (Cpus_allowed_list).
 */
static void task_cpus_allowed(struct seq_file *m, struct task_struct *task)
{
	const struct cpumask *allowed = &task->cpus_allowed;

	seq_printf(m, "Cpus_allowed:\t%*pb\n", cpumask_pr_args(allowed));
	seq_printf(m, "Cpus_allowed_list:\t%*pbl\n", cpumask_pr_args(allowed));
}

362 363
/*
 * Produce the full status output for @task by calling each section
 * helper in turn: name, state/ids, memory (only when the task has an mm),
 * signals, capabilities, seccomp, allowed CPUs, cpuset status and context
 * switch counts.
 *
 * Always returns 0.
 */
int proc_pid_status(struct seq_file *m, struct pid_namespace *ns,
			struct pid *pid, struct task_struct *task)
{
	struct mm_struct *mm;

	/* Reference taken up front, released right after the memory section. */
	mm = get_task_mm(task);

	task_name(m, task);
	task_state(m, ns, pid, task);

	if (mm) {
		task_mem(m, mm);
		mmput(mm);
	}

	task_sig(m, task);
	task_cap(m, task);
	task_seccomp(m, task);
	task_cpus_allowed(m, task);
	cpuset_task_status_allowed(m, task);
	task_context_switch_counts(m, task);

	return 0;
}

383 384
static int do_task_stat(struct seq_file *m, struct pid_namespace *ns,
			struct pid *pid, struct task_struct *task, int whole)
L
Linus Torvalds 已提交
385
{
386
	unsigned long vsize, eip, esp, wchan = 0;
387
	int priority, nice;
L
Linus Torvalds 已提交
388 389 390
	int tty_pgrp = -1, tty_nr = 0;
	sigset_t sigign, sigcatch;
	char state;
391
	pid_t ppid = 0, pgid = -1, sid = -1;
L
Linus Torvalds 已提交
392
	int num_threads = 0;
393
	int permitted;
L
Linus Torvalds 已提交
394 395 396 397
	struct mm_struct *mm;
	unsigned long long start_time;
	unsigned long cmin_flt = 0, cmaj_flt = 0;
	unsigned long  min_flt = 0,  maj_flt = 0;
398
	u64 cutime, cstime, utime, stime;
399
	u64 cgtime, gtime;
L
Linus Torvalds 已提交
400 401
	unsigned long rsslim = 0;
	char tcomm[sizeof(task->comm)];
402
	unsigned long flags;
L
Linus Torvalds 已提交
403 404 405

	state = *get_task_state(task);
	vsize = eip = esp = 0;
406
	permitted = ptrace_may_access(task, PTRACE_MODE_READ_FSCREDS | PTRACE_MODE_NOAUDIT);
L
Linus Torvalds 已提交
407 408 409
	mm = get_task_mm(task);
	if (mm) {
		vsize = task_vsize(mm);
410 411 412 413
		/*
		 * esp and eip are intentionally zeroed out.  There is no
		 * non-racy way to read them without freezing the task.
		 * Programs that need reliable values can use ptrace(2).
414 415 416 417
		 *
		 * The only exception is if the task is core dumping because
		 * a program is not able to use ptrace(2) in that case. It is
		 * safe because the task has stopped executing permanently.
418
		 */
419 420 421 422
		if (permitted && (task->flags & PF_DUMPCORE)) {
			eip = KSTK_EIP(task);
			esp = KSTK_ESP(task);
		}
L
Linus Torvalds 已提交
423 424 425 426 427 428
	}

	get_task_comm(tcomm, task);

	sigemptyset(&sigign);
	sigemptyset(&sigcatch);
429 430
	cutime = cstime = utime = stime = 0;
	cgtime = gtime = 0;
431

432 433
	if (lock_task_sighand(task, &flags)) {
		struct signal_struct *sig = task->signal;
434 435

		if (sig->tty) {
436 437 438
			struct pid *pgrp = tty_get_pgrp(sig->tty);
			tty_pgrp = pid_nr_ns(pgrp, ns);
			put_pid(pgrp);
439
			tty_nr = new_encode_dev(tty_devnum(sig->tty));
440 441
		}

442
		num_threads = get_nr_threads(task);
L
Linus Torvalds 已提交
443 444
		collect_sigign_sigcatch(task, &sigign, &sigcatch);

445 446 447 448
		cmin_flt = sig->cmin_flt;
		cmaj_flt = sig->cmaj_flt;
		cutime = sig->cutime;
		cstime = sig->cstime;
449
		cgtime = sig->cgtime;
J
Jiri Slaby 已提交
450
		rsslim = ACCESS_ONCE(sig->rlim[RLIMIT_RSS].rlim_cur);
451

L
Linus Torvalds 已提交
452 453
		/* add up live thread stats at the group level */
		if (whole) {
454
			struct task_struct *t = task;
L
Linus Torvalds 已提交
455 456 457
			do {
				min_flt += t->min_flt;
				maj_flt += t->maj_flt;
458
				gtime += task_gtime(t);
459
			} while_each_thread(task, t);
L
Linus Torvalds 已提交
460

461 462
			min_flt += sig->min_flt;
			maj_flt += sig->maj_flt;
463
			thread_group_cputime_adjusted(task, &utime, &stime);
464
			gtime += sig->gtime;
L
Linus Torvalds 已提交
465
		}
466

467
		sid = task_session_nr_ns(task, ns);
468
		ppid = task_tgid_nr_ns(task->real_parent, ns);
469
		pgid = task_pgrp_nr_ns(task, ns);
470 471

		unlock_task_sighand(task, &flags);
L
Linus Torvalds 已提交
472 473
	}

474
	if (permitted && (!whole || num_threads < 2))
L
Linus Torvalds 已提交
475 476 477 478
		wchan = get_wchan(task);
	if (!whole) {
		min_flt = task->min_flt;
		maj_flt = task->maj_flt;
479
		task_cputime_adjusted(task, &utime, &stime);
480
		gtime = task_gtime(task);
L
Linus Torvalds 已提交
481 482 483 484 485 486 487 488
	}

	/* scale priority and nice values from timeslices to -20..20 */
	/* to make it look like a "normal" Unix priority/nice value  */
	priority = task_prio(task);
	nice = task_nice(task);

	/* convert nsec -> ticks */
489
	start_time = nsec_to_clock_t(task->real_start_time);
L
Linus Torvalds 已提交
490

491
	seq_printf(m, "%d (%s) %c", pid_nr_ns(pid, ns), tcomm, state);
492 493 494 495 496 497 498 499 500 501
	seq_put_decimal_ll(m, " ", ppid);
	seq_put_decimal_ll(m, " ", pgid);
	seq_put_decimal_ll(m, " ", sid);
	seq_put_decimal_ll(m, " ", tty_nr);
	seq_put_decimal_ll(m, " ", tty_pgrp);
	seq_put_decimal_ull(m, " ", task->flags);
	seq_put_decimal_ull(m, " ", min_flt);
	seq_put_decimal_ull(m, " ", cmin_flt);
	seq_put_decimal_ull(m, " ", maj_flt);
	seq_put_decimal_ull(m, " ", cmaj_flt);
502 503 504 505
	seq_put_decimal_ull(m, " ", nsec_to_clock_t(utime));
	seq_put_decimal_ull(m, " ", nsec_to_clock_t(stime));
	seq_put_decimal_ll(m, " ", nsec_to_clock_t(cutime));
	seq_put_decimal_ll(m, " ", nsec_to_clock_t(cstime));
506 507 508 509 510 511 512 513 514 515 516 517 518
	seq_put_decimal_ll(m, " ", priority);
	seq_put_decimal_ll(m, " ", nice);
	seq_put_decimal_ll(m, " ", num_threads);
	seq_put_decimal_ull(m, " ", 0);
	seq_put_decimal_ull(m, " ", start_time);
	seq_put_decimal_ull(m, " ", vsize);
	seq_put_decimal_ull(m, " ", mm ? get_mm_rss(mm) : 0);
	seq_put_decimal_ull(m, " ", rsslim);
	seq_put_decimal_ull(m, " ", mm ? (permitted ? mm->start_code : 1) : 0);
	seq_put_decimal_ull(m, " ", mm ? (permitted ? mm->end_code : 1) : 0);
	seq_put_decimal_ull(m, " ", (permitted && mm) ? mm->start_stack : 0);
	seq_put_decimal_ull(m, " ", esp);
	seq_put_decimal_ull(m, " ", eip);
519 520 521 522
	/* The signal information here is obsolete.
	 * It must be decimal for Linux 2.0 compatibility.
	 * Use /proc/#/status for real-time signals.
	 */
523 524 525 526
	seq_put_decimal_ull(m, " ", task->pending.signal.sig[0] & 0x7fffffffUL);
	seq_put_decimal_ull(m, " ", task->blocked.sig[0] & 0x7fffffffUL);
	seq_put_decimal_ull(m, " ", sigign.sig[0] & 0x7fffffffUL);
	seq_put_decimal_ull(m, " ", sigcatch.sig[0] & 0x7fffffffUL);
527 528 529 530 531 532 533 534 535 536 537 538 539

	/*
	 * We used to output the absolute kernel address, but that's an
	 * information leak - so instead we show a 0/1 flag here, to signal
	 * to user-space whether there's a wchan field in /proc/PID/wchan.
	 *
	 * This works with older implementations of procps as well.
	 */
	if (wchan)
		seq_puts(m, " 1");
	else
		seq_puts(m, " 0");

540 541 542 543 544 545 546
	seq_put_decimal_ull(m, " ", 0);
	seq_put_decimal_ull(m, " ", 0);
	seq_put_decimal_ll(m, " ", task->exit_signal);
	seq_put_decimal_ll(m, " ", task_cpu(task));
	seq_put_decimal_ull(m, " ", task->rt_priority);
	seq_put_decimal_ull(m, " ", task->policy);
	seq_put_decimal_ull(m, " ", delayacct_blkio_ticks(task));
547 548
	seq_put_decimal_ull(m, " ", nsec_to_clock_t(gtime));
	seq_put_decimal_ll(m, " ", nsec_to_clock_t(cgtime));
549 550

	if (mm && permitted) {
551 552 553 554 555 556 557
		seq_put_decimal_ull(m, " ", mm->start_data);
		seq_put_decimal_ull(m, " ", mm->end_data);
		seq_put_decimal_ull(m, " ", mm->start_brk);
		seq_put_decimal_ull(m, " ", mm->arg_start);
		seq_put_decimal_ull(m, " ", mm->arg_end);
		seq_put_decimal_ull(m, " ", mm->env_start);
		seq_put_decimal_ull(m, " ", mm->env_end);
558
	} else
559
		seq_puts(m, " 0 0 0 0 0 0 0");
560 561

	if (permitted)
562
		seq_put_decimal_ll(m, " ", task->exit_code);
563
	else
564
		seq_puts(m, " 0");
565

566
	seq_putc(m, '\n');
567
	if (mm)
L
Linus Torvalds 已提交
568
		mmput(mm);
569
	return 0;
L
Linus Torvalds 已提交
570 571
}

572 573
/*
 * Per-thread stat: do_task_stat() with whole == 0, i.e. figures for
 * @task alone.
 */
int proc_tid_stat(struct seq_file *m, struct pid_namespace *ns,
			struct pid *pid, struct task_struct *task)
{
	const int whole = 0;

	return do_task_stat(m, ns, pid, task, whole);
}

578 579
/*
 * Thread-group stat: do_task_stat() with whole == 1, i.e. figures
 * accumulated over the thread group of @task.
 */
int proc_tgid_stat(struct seq_file *m, struct pid_namespace *ns,
			struct pid *pid, struct task_struct *task)
{
	const int whole = 1;

	return do_task_stat(m, ns, pid, task, whole);
}

584 585
/*
 * Emit the statm line for @task: seven space-separated numbers
 * "size resident shared text 0 data 0".
 *
 * All five measured values are 0 when the task has no mm.
 * Always returns 0.
 */
int proc_pid_statm(struct seq_file *m, struct pid_namespace *ns,
			struct pid *pid, struct task_struct *task)
{
	unsigned long total = 0, rss = 0, shr = 0, code = 0, dat = 0;
	struct mm_struct *mm;

	mm = get_task_mm(task);
	if (mm) {
		total = task_statm(mm, &shr, &code, &dat, &rss);
		mmput(mm);
	}

	/*
	 * For quick read, open code by putting numbers directly
	 * expected format is
	 * seq_printf(m, "%lu %lu %lu %lu 0 %lu 0\n",
	 *               size, resident, shared, text, data);
	 */
	seq_put_decimal_ull(m, "", total);
	seq_put_decimal_ull(m, " ", rss);
	seq_put_decimal_ull(m, " ", shr);
	seq_put_decimal_ull(m, " ", code);
	seq_put_decimal_ull(m, " ", 0);
	seq_put_decimal_ull(m, " ", dat);
	seq_put_decimal_ull(m, " ", 0);
	seq_putc(m, '\n');

	return 0;
}
611

612
#ifdef CONFIG_PROC_CHILDREN
613 614 615 616 617 618 619 620 621 622 623 624 625 626 627 628 629 630 631 632 633 634 635 636 637 638 639 640 641 642 643 644 645 646 647 648 649 650 651 652 653 654 655 656 657 658 659 660 661 662 663 664 665 666 667 668 669 670 671 672 673 674
/*
 * Find the child of the task behind @inode that an iteration should
 * visit next, under tasklist_lock held for reading.
 *
 * @inode:    proc inode identifying the parent task
 * @pid_prev: pid returned by the previous step, or NULL
 * @pos:      zero-based index of the wanted child, used by the slow path
 *
 * Returns a referenced struct pid (taken with get_pid()), or NULL when
 * the parent is gone or there is no further child.
 */
static struct pid *
get_children_pid(struct inode *inode, struct pid *pid_prev, loff_t pos)
{
	struct task_struct *parent, *child;
	struct pid *found = NULL;

	read_lock(&tasklist_lock);

	parent = pid_task(proc_pid(inode), PIDTYPE_PID);
	if (!parent)
		goto unlock;

	/*
	 * Lets try to continue searching first, this gives
	 * us significant speedup on children-rich processes.
	 *
	 * Only usable when the previous task still exists, is still a
	 * child of this parent and is still linked on a sibling list.
	 */
	child = pid_prev ? pid_task(pid_prev, PIDTYPE_PID) : NULL;
	if (child && child->real_parent == parent &&
	    !list_empty(&child->sibling)) {
		/* Previous child was the last one: nothing more to return. */
		if (!list_is_last(&child->sibling, &parent->children)) {
			child = list_first_entry(&child->sibling,
						 struct task_struct, sibling);
			found = get_pid(task_pid(child));
		}
		goto unlock;
	}

	/*
	 * Slow search case.
	 *
	 * We might miss some children here if children
	 * are exited while we were not holding the lock,
	 * but it was never promised to be accurate that
	 * much.
	 *
	 * "Just suppose that the parent sleeps, but N children
	 *  exit after we printed their tids. Now the slow paths
	 *  skips N extra children, we miss N tasks." (c)
	 *
	 * So one need to stop or freeze the leader and all
	 * its children to get a precise result.
	 */
	list_for_each_entry(child, &parent->children, sibling) {
		if (pos != 0) {
			pos--;
			continue;
		}
		found = get_pid(task_pid(child));
		break;
	}

unlock:
	read_unlock(&tasklist_lock);
	return found;
}

/*
 * seq_file ->show: print the pid held in @v, translated through the
 * namespace stored in the superblock's s_fs_info, followed by a space.
 */
static int children_seq_show(struct seq_file *seq, void *v)
{
	struct inode *inode = seq->private;
	struct pid_namespace *ns = inode->i_sb->s_fs_info;
	struct pid *child = v;

	seq_printf(seq, "%d ", pid_nr_ns(child, ns));

	return 0;
}

/*
 * seq_file ->start: look up the child at index *pos with no previous pid
 * to continue from.
 */
static void *children_seq_start(struct seq_file *seq, loff_t *pos)
{
	struct inode *inode = seq->private;

	return get_children_pid(inode, NULL, *pos);
}

/*
 * seq_file ->next: fetch the child following @v, drop the reference held
 * on @v and advance *pos by one.
 */
static void *children_seq_next(struct seq_file *seq, void *v, loff_t *pos)
{
	struct pid *next;

	/* @v must still be referenced while it is used as the hint. */
	next = get_children_pid(seq->private, v, *pos + 1);
	put_pid(v);

	*pos += 1;
	return next;
}

/*
 * seq_file ->stop: release the pid reference the iteration was holding
 * in @v.
 */
static void children_seq_stop(struct seq_file *seq, void *v)
{
	struct pid *held = v;

	put_pid(held);
}

/* seq_file iterator callbacks for the children listing. */
static const struct seq_operations children_seq_ops = {
	.start	= children_seq_start,
	.show	= children_seq_show,
	.next	= children_seq_next,
	.stop	= children_seq_stop,
};

/*
 * ->open: set up a seq_file with children_seq_ops and remember @inode in
 * its private pointer for the iterator callbacks.
 *
 * Returns 0 on success or the error returned by seq_open().
 */
static int children_seq_open(struct inode *inode, struct file *file)
{
	int err = seq_open(file, &children_seq_ops);

	if (!err) {
		struct seq_file *m = file->private_data;

		m->private = inode;
	}

	return err;
}

/*
 * ->release: tear down the seq_file via seq_release().  The result of
 * seq_release() is not propagated; this always returns 0.
 */
int children_seq_release(struct inode *inode, struct file *file)
{
	(void)seq_release(inode, file);

	return 0;
}

/* File operations for the children listing, backed by seq_file. */
const struct file_operations proc_tid_children_operations = {
	.open    = children_seq_open,
	.release = children_seq_release,
	.read    = seq_read,
	.llseek  = seq_lseek,
};
735
#endif /* CONFIG_PROC_CHILDREN */