/*
 *  linux/fs/proc/array.c
 *
 *  Copyright (C) 1992  by Linus Torvalds
 *  based on ideas by Darren Senn
 *
 * Fixes:
 * Michael. K. Johnson: stat,statm extensions.
 *                      <johnsonm@stolaf.edu>
 *
 * Pauline Middelink :  Made cmdline,envline only break at '\0's, to
 *                      make sure SET_PROCTITLE works. Also removed
 *                      bad '!' which forced address recalculation for
 *                      EVERY character on the current page.
 *                      <middelin@polyware.iaf.nl>
 *
 * Danny ter Haar    :	added cpuinfo
 *			<dth@cistron.nl>
 *
 * Alessandro Rubini :  profile extension.
 *                      <rubini@ipvvis.unipv.it>
 *
 * Jeff Tranter      :  added BogoMips field to cpuinfo
 *                      <Jeff_Tranter@Mitel.COM>
 *
 * Bruno Haible      :  remove 4K limit for the maps file
 *			<haible@ma2s2.mathematik.uni-karlsruhe.de>
 *
 * Yves Arrouye      :  remove removal of trailing spaces in get_array.
 *			<Yves.Arrouye@marin.fdn.fr>
 *
 * Jerome Forissier  :  added per-CPU time information to /proc/stat
 *                      and /proc/<pid>/cpu extension
 *                      <forissier@isia.cma.fr>
 *			- Incorporation and non-SMP safe operation
 *			of forissier patch in 2.1.78 by
 *			Hans Marcus <crowbar@concepts.nl>
 *
 * aeb@cwi.nl        :  /proc/partitions
 *
 *
 * Alan Cox	     :  security fixes.
 *			<alan@lxorguk.ukuu.org.uk>
 *
 * Al Viro           :  safe handling of mm_struct
 *
 * Gerhard Wichert   :  added BIGMEM support
 * Siemens AG           <Gerhard.Wichert@pdb.siemens.de>
 *
 * Al Viro & Jeff Garzik :  moved most of the thing into base.c and
 *			 :  proc_misc.c. The rest may eventually go into
 *			 :  base.c too.
 */

#include <linux/types.h>
#include <linux/errno.h>
#include <linux/time.h>
#include <linux/kernel.h>
#include <linux/kernel_stat.h>
#include <linux/tty.h>
#include <linux/string.h>
#include <linux/mman.h>
63
#include <linux/sched/mm.h>
64
#include <linux/sched/numa_balancing.h>
65
#include <linux/sched/task_stack.h>
66
#include <linux/sched/task.h>
67
#include <linux/sched/cputime.h>
L
Linus Torvalds 已提交
68 69
#include <linux/proc_fs.h>
#include <linux/ioport.h>
70 71
#include <linux/uaccess.h>
#include <linux/io.h>
L
Linus Torvalds 已提交
72 73 74 75 76 77 78 79
#include <linux/mm.h>
#include <linux/hugetlb.h>
#include <linux/pagemap.h>
#include <linux/swap.h>
#include <linux/smp.h>
#include <linux/signal.h>
#include <linux/highmem.h>
#include <linux/file.h>
A
Al Viro 已提交
80
#include <linux/fdtable.h>
L
Linus Torvalds 已提交
81 82
#include <linux/times.h>
#include <linux/cpuset.h>
83
#include <linux/rcupdate.h>
84
#include <linux/delayacct.h>
85
#include <linux/seq_file.h>
86
#include <linux/pid_namespace.h>
87
#include <linux/ptrace.h>
88
#include <linux/tracehook.h>
89
#include <linux/string_helpers.h>
90
#include <linux/user_namespace.h>
91
#include <linux/fs_struct.h>
L
Linus Torvalds 已提交
92 93 94 95 96

#include <asm/pgtable.h>
#include <asm/processor.h>
#include "internal.h"

97
static inline void task_name(struct seq_file *m, struct task_struct *p)
L
Linus Torvalds 已提交
98
{
99
	char *buf;
100
	size_t size;
L
Linus Torvalds 已提交
101
	char tcomm[sizeof(p->comm)];
102
	int ret;
L
Linus Torvalds 已提交
103 104 105

	get_task_comm(tcomm, p);

106
	seq_puts(m, "Name:\t");
107

108 109 110
	size = seq_get_buf(m, &buf);
	ret = string_escape_str(tcomm, buf, size, ESCAPE_SPACE | ESCAPE_SPECIAL, "\n\\");
	seq_commit(m, ret < size ? ret : -1);
111

112
	seq_putc(m, '\n');
L
Linus Torvalds 已提交
113 114 115 116 117 118 119 120
}

/*
 * The task state array is a strange "bitmap" of
 * reasons to sleep. Thus "running" is zero, and
 * you can test for combinations of others with
 * simple bit tests.
 */
M
Mike Frysinger 已提交
121
/*
 * Human-readable task state strings, indexed by the value returned from
 * __get_task_state(). The hex value next to each entry is the state bit
 * the slot corresponds to.
 */
static const char * const task_state_array[] = {
	/* states in TASK_REPORT: */
	[0] = "R (running)",		/* 0x00 */
	[1] = "S (sleeping)",		/* 0x01 */
	[2] = "D (disk sleep)",		/* 0x02 */
	[3] = "T (stopped)",		/* 0x04 */
	[4] = "t (tracing stop)",	/* 0x08 */
	[5] = "X (dead)",		/* 0x10 */
	[6] = "Z (zombie)",		/* 0x20 */
	[7] = "P (parked)",		/* 0x40 */

	/* states beyond TASK_REPORT: */
	[8] = "I (idle)",		/* 0x80 */
};

137
static inline const char *get_task_state(struct task_struct *tsk)
L
Linus Torvalds 已提交
138
{
139
	BUILD_BUG_ON(1 + ilog2(TASK_REPORT_MAX) != ARRAY_SIZE(task_state_array));
140
	return task_state_array[__get_task_state(tsk)];
L
Linus Torvalds 已提交
141 142
}

143 144 145 146 147 148 149 150 151 152 153 154 155
/*
 * Read @tsk's umask under task_lock().
 *
 * Returns the umask, or -ENOENT when the task has no fs_struct attached.
 */
static inline int get_task_umask(struct task_struct *tsk)
{
	struct fs_struct *fs_ctx;
	int mask;

	task_lock(tsk);
	fs_ctx = tsk->fs;
	mask = fs_ctx ? fs_ctx->umask : -ENOENT;
	task_unlock(tsk);

	return mask;
}

156 157
static inline void task_state(struct seq_file *m, struct pid_namespace *ns,
				struct pid *pid, struct task_struct *p)
L
Linus Torvalds 已提交
158
{
159
	struct user_namespace *user_ns = seq_user_ns(m);
L
Linus Torvalds 已提交
160
	struct group_info *group_info;
161
	int g, umask;
162
	struct task_struct *tracer;
163
	const struct cred *cred;
164
	pid_t ppid, tpid = 0, tgid, ngid;
165
	unsigned int max_fds = 0;
L
Linus Torvalds 已提交
166

167
	rcu_read_lock();
168 169
	ppid = pid_alive(p) ?
		task_tgid_nr_ns(rcu_dereference(p->real_parent), ns) : 0;
170 171 172 173

	tracer = ptrace_parent(p);
	if (tracer)
		tpid = task_pid_nr_ns(tracer, ns);
174 175 176

	tgid = task_tgid_nr_ns(p, ns);
	ngid = task_numa_group_id(p);
177
	cred = get_task_cred(p);
178

179 180 181 182
	umask = get_task_umask(p);
	if (umask >= 0)
		seq_printf(m, "Umask:\t%#04o\n", umask);

183 184 185 186
	task_lock(p);
	if (p->files)
		max_fds = files_fdtable(p->files)->max_fds;
	task_unlock(p);
187
	rcu_read_unlock();
188

A
Alexey Dobriyan 已提交
189 190
	seq_printf(m, "State:\t%s", get_task_state(p));

191 192 193 194 195 196 197 198 199 200 201 202 203 204
	seq_put_decimal_ull(m, "\nTgid:\t", tgid);
	seq_put_decimal_ull(m, "\nNgid:\t", ngid);
	seq_put_decimal_ull(m, "\nPid:\t", pid_nr_ns(pid, ns));
	seq_put_decimal_ull(m, "\nPPid:\t", ppid);
	seq_put_decimal_ull(m, "\nTracerPid:\t", tpid);
	seq_put_decimal_ull(m, "\nUid:\t", from_kuid_munged(user_ns, cred->uid));
	seq_put_decimal_ull(m, "\t", from_kuid_munged(user_ns, cred->euid));
	seq_put_decimal_ull(m, "\t", from_kuid_munged(user_ns, cred->suid));
	seq_put_decimal_ull(m, "\t", from_kuid_munged(user_ns, cred->fsuid));
	seq_put_decimal_ull(m, "\nGid:\t", from_kgid_munged(user_ns, cred->gid));
	seq_put_decimal_ull(m, "\t", from_kgid_munged(user_ns, cred->egid));
	seq_put_decimal_ull(m, "\t", from_kgid_munged(user_ns, cred->sgid));
	seq_put_decimal_ull(m, "\t", from_kgid_munged(user_ns, cred->fsgid));
	seq_put_decimal_ull(m, "\nFDSize:\t", max_fds);
A
Alexey Dobriyan 已提交
205 206

	seq_puts(m, "\nGroups:\t");
207
	group_info = cred->group_info;
208
	for (g = 0; g < group_info->ngroups; g++)
209
		seq_put_decimal_ull(m, g ? " " : "",
210
				from_kgid_munged(user_ns, group_info->gid[g]));
211
	put_cred(cred);
A
Alexey Dobriyan 已提交
212 213
	/* Trailing space shouldn't have been added in the first place. */
	seq_putc(m, ' ');
L
Linus Torvalds 已提交
214

215 216 217
#ifdef CONFIG_PID_NS
	seq_puts(m, "\nNStgid:");
	for (g = ns->level; g <= pid->level; g++)
218
		seq_put_decimal_ull(m, "\t", task_tgid_nr_ns(p, pid->numbers[g].ns));
219 220
	seq_puts(m, "\nNSpid:");
	for (g = ns->level; g <= pid->level; g++)
221
		seq_put_decimal_ull(m, "\t", task_pid_nr_ns(p, pid->numbers[g].ns));
222 223
	seq_puts(m, "\nNSpgid:");
	for (g = ns->level; g <= pid->level; g++)
224
		seq_put_decimal_ull(m, "\t", task_pgrp_nr_ns(p, pid->numbers[g].ns));
225 226
	seq_puts(m, "\nNSsid:");
	for (g = ns->level; g <= pid->level; g++)
227
		seq_put_decimal_ull(m, "\t", task_session_nr_ns(p, pid->numbers[g].ns));
228
#endif
229
	seq_putc(m, '\n');
L
Linus Torvalds 已提交
230 231
}

232
void render_sigset_t(struct seq_file *m, const char *header,
233
				sigset_t *set)
L
Linus Torvalds 已提交
234
{
235
	int i;
L
Linus Torvalds 已提交
236

237
	seq_puts(m, header);
L
Linus Torvalds 已提交
238 239 240 241 242 243 244 245 246 247

	i = _NSIG;
	do {
		int x = 0;

		i -= 4;
		if (sigismember(set, i+1)) x |= 1;
		if (sigismember(set, i+2)) x |= 2;
		if (sigismember(set, i+3)) x |= 4;
		if (sigismember(set, i+4)) x |= 8;
248
		seq_putc(m, hex_asc[x]);
L
Linus Torvalds 已提交
249 250
	} while (i >= 4);

251
	seq_putc(m, '\n');
L
Linus Torvalds 已提交
252 253 254 255 256 257 258 259 260 261 262 263 264 265 266 267 268
}

/*
 * Walk @p's signal action table and sort every signal number into @ign
 * (handler is SIG_IGN) or @catch (handler is anything other than SIG_DFL).
 * Signals left at SIG_DFL are added to neither set.
 *
 * The sets are only added to, never cleared; callers pass in empty sets.
 */
static void collect_sigign_sigcatch(struct task_struct *p, sigset_t *ign,
				    sigset_t *catch)
{
	int signo;

	for (signo = 1; signo <= _NSIG; signo++) {
		/* the action table is zero-based, signal numbers start at 1 */
		const struct k_sigaction *act = &p->sighand->action[signo - 1];

		if (act->sa.sa_handler == SIG_IGN) {
			sigaddset(ign, signo);
			continue;
		}
		if (act->sa.sa_handler != SIG_DFL)
			sigaddset(catch, signo);
	}
}

269
static inline void task_sig(struct seq_file *m, struct task_struct *p)
L
Linus Torvalds 已提交
270
{
271
	unsigned long flags;
L
Linus Torvalds 已提交
272 273 274 275 276 277 278 279 280 281 282
	sigset_t pending, shpending, blocked, ignored, caught;
	int num_threads = 0;
	unsigned long qsize = 0;
	unsigned long qlim = 0;

	sigemptyset(&pending);
	sigemptyset(&shpending);
	sigemptyset(&blocked);
	sigemptyset(&ignored);
	sigemptyset(&caught);

283
	if (lock_task_sighand(p, &flags)) {
L
Linus Torvalds 已提交
284 285 286 287
		pending = p->pending.signal;
		shpending = p->signal->shared_pending.signal;
		blocked = p->blocked;
		collect_sigign_sigcatch(p, &ignored, &caught);
288
		num_threads = get_nr_threads(p);
289
		rcu_read_lock();  /* FIXME: is this correct? */
290
		qsize = atomic_read(&__task_cred(p)->user->sigpending);
291
		rcu_read_unlock();
J
Jiri Slaby 已提交
292
		qlim = task_rlimit(p, RLIMIT_SIGPENDING);
293
		unlock_task_sighand(p, &flags);
L
Linus Torvalds 已提交
294 295
	}

296 297 298
	seq_put_decimal_ull(m, "Threads:\t", num_threads);
	seq_put_decimal_ull(m, "\nSigQ:\t", qsize);
	seq_put_decimal_ull(m, "/", qlim);
L
Linus Torvalds 已提交
299 300

	/* render them all */
A
Alexey Dobriyan 已提交
301
	render_sigset_t(m, "\nSigPnd:\t", &pending);
302 303 304 305
	render_sigset_t(m, "ShdPnd:\t", &shpending);
	render_sigset_t(m, "SigBlk:\t", &blocked);
	render_sigset_t(m, "SigIgn:\t", &ignored);
	render_sigset_t(m, "SigCgt:\t", &caught);
L
Linus Torvalds 已提交
306 307
}

308 309
/*
 * Print @header followed by capability set @a as zero-padded 8-digit hex
 * words and a newline. Words are emitted starting from index
 * CAP_LAST_U32 and working down.
 */
static void render_cap_t(struct seq_file *m, const char *header,
			kernel_cap_t *a)
{
	unsigned word;

	seq_puts(m, header);
	CAP_FOR_EACH_U32(word)
		seq_printf(m, "%08x", a->cap[CAP_LAST_U32 - word]);
	seq_putc(m, '\n');
}

321
static inline void task_cap(struct seq_file *m, struct task_struct *p)
L
Linus Torvalds 已提交
322
{
323
	const struct cred *cred;
324 325
	kernel_cap_t cap_inheritable, cap_permitted, cap_effective,
			cap_bset, cap_ambient;
326

327 328 329 330 331 332
	rcu_read_lock();
	cred = __task_cred(p);
	cap_inheritable	= cred->cap_inheritable;
	cap_permitted	= cred->cap_permitted;
	cap_effective	= cred->cap_effective;
	cap_bset	= cred->cap_bset;
333
	cap_ambient	= cred->cap_ambient;
334 335 336 337 338 339
	rcu_read_unlock();

	render_cap_t(m, "CapInh:\t", &cap_inheritable);
	render_cap_t(m, "CapPrm:\t", &cap_permitted);
	render_cap_t(m, "CapEff:\t", &cap_effective);
	render_cap_t(m, "CapBnd:\t", &cap_bset);
340
	render_cap_t(m, "CapAmb:\t", &cap_ambient);
L
Linus Torvalds 已提交
341 342
}

K
Kees Cook 已提交
343 344
/*
 * Emit the NoNewPrivs line for @p and, when CONFIG_SECCOMP is enabled,
 * the Seccomp mode line as well.
 */
static inline void task_seccomp(struct seq_file *m, struct task_struct *p)
{
	seq_put_decimal_ull(m, "NoNewPrivs:\t", task_no_new_privs(p));

#ifdef CONFIG_SECCOMP
	/* the leading "\n" closes the NoNewPrivs line */
	seq_put_decimal_ull(m, "\nSeccomp:\t", p->seccomp.mode);
#endif

	seq_putc(m, '\n');
}

352 353
static inline void task_context_switch_counts(struct seq_file *m,
						struct task_struct *p)
354
{
355 356
	seq_put_decimal_ull(m, "voluntary_ctxt_switches:\t", p->nvcsw);
	seq_put_decimal_ull(m, "\nnonvoluntary_ctxt_switches:\t", p->nivcsw);
A
Alexey Dobriyan 已提交
357
	seq_putc(m, '\n');
358 359
}

360 361
/*
 * Emit @task's allowed-CPU mask twice: once in bitmap form (%*pb) and
 * once in list form (%*pbl).
 */
static void task_cpus_allowed(struct seq_file *m, struct task_struct *task)
{
	/* bitmap form */
	seq_printf(m, "Cpus_allowed:\t%*pb\n", cpumask_pr_args(&task->cpus_allowed));

	/* list form */
	seq_printf(m, "Cpus_allowed_list:\t%*pbl\n", cpumask_pr_args(&task->cpus_allowed));
}

368 369
/*
 * Produce the full status output for @task by calling each section
 * helper in turn: name, state, memory (only when the task has an mm),
 * signals, capabilities, seccomp, allowed CPUs, cpuset and context
 * switch counts.
 *
 * Always returns 0.
 */
int proc_pid_status(struct seq_file *m, struct pid_namespace *ns,
			struct pid *pid, struct task_struct *task)
{
	struct mm_struct *mm;

	/* take the mm reference before any output, as the original does */
	mm = get_task_mm(task);

	task_name(m, task);
	task_state(m, ns, pid, task);

	if (mm) {
		task_mem(m, mm);
		mmput(mm);
	}

	task_sig(m, task);
	task_cap(m, task);
	task_seccomp(m, task);
	task_cpus_allowed(m, task);
	cpuset_task_status_allowed(m, task);
	task_context_switch_counts(m, task);

	return 0;
}

389 390
static int do_task_stat(struct seq_file *m, struct pid_namespace *ns,
			struct pid *pid, struct task_struct *task, int whole)
L
Linus Torvalds 已提交
391
{
392
	unsigned long vsize, eip, esp, wchan = 0;
393
	int priority, nice;
L
Linus Torvalds 已提交
394 395 396
	int tty_pgrp = -1, tty_nr = 0;
	sigset_t sigign, sigcatch;
	char state;
397
	pid_t ppid = 0, pgid = -1, sid = -1;
L
Linus Torvalds 已提交
398
	int num_threads = 0;
399
	int permitted;
L
Linus Torvalds 已提交
400 401 402 403
	struct mm_struct *mm;
	unsigned long long start_time;
	unsigned long cmin_flt = 0, cmaj_flt = 0;
	unsigned long  min_flt = 0,  maj_flt = 0;
404
	u64 cutime, cstime, utime, stime;
405
	u64 cgtime, gtime;
L
Linus Torvalds 已提交
406 407
	unsigned long rsslim = 0;
	char tcomm[sizeof(task->comm)];
408
	unsigned long flags;
L
Linus Torvalds 已提交
409 410 411

	state = *get_task_state(task);
	vsize = eip = esp = 0;
412
	permitted = ptrace_may_access(task, PTRACE_MODE_READ_FSCREDS | PTRACE_MODE_NOAUDIT);
L
Linus Torvalds 已提交
413 414 415
	mm = get_task_mm(task);
	if (mm) {
		vsize = task_vsize(mm);
416 417 418 419
		/*
		 * esp and eip are intentionally zeroed out.  There is no
		 * non-racy way to read them without freezing the task.
		 * Programs that need reliable values can use ptrace(2).
420 421 422 423
		 *
		 * The only exception is if the task is core dumping because
		 * a program is not able to use ptrace(2) in that case. It is
		 * safe because the task has stopped executing permanently.
424
		 */
425 426 427 428
		if (permitted && (task->flags & PF_DUMPCORE)) {
			eip = KSTK_EIP(task);
			esp = KSTK_ESP(task);
		}
L
Linus Torvalds 已提交
429 430 431 432 433 434
	}

	get_task_comm(tcomm, task);

	sigemptyset(&sigign);
	sigemptyset(&sigcatch);
435 436
	cutime = cstime = utime = stime = 0;
	cgtime = gtime = 0;
437

438 439
	if (lock_task_sighand(task, &flags)) {
		struct signal_struct *sig = task->signal;
440 441

		if (sig->tty) {
442 443 444
			struct pid *pgrp = tty_get_pgrp(sig->tty);
			tty_pgrp = pid_nr_ns(pgrp, ns);
			put_pid(pgrp);
445
			tty_nr = new_encode_dev(tty_devnum(sig->tty));
446 447
		}

448
		num_threads = get_nr_threads(task);
L
Linus Torvalds 已提交
449 450
		collect_sigign_sigcatch(task, &sigign, &sigcatch);

451 452 453 454
		cmin_flt = sig->cmin_flt;
		cmaj_flt = sig->cmaj_flt;
		cutime = sig->cutime;
		cstime = sig->cstime;
455
		cgtime = sig->cgtime;
J
Jiri Slaby 已提交
456
		rsslim = ACCESS_ONCE(sig->rlim[RLIMIT_RSS].rlim_cur);
457

L
Linus Torvalds 已提交
458 459
		/* add up live thread stats at the group level */
		if (whole) {
460
			struct task_struct *t = task;
L
Linus Torvalds 已提交
461 462 463
			do {
				min_flt += t->min_flt;
				maj_flt += t->maj_flt;
464
				gtime += task_gtime(t);
465
			} while_each_thread(task, t);
L
Linus Torvalds 已提交
466

467 468
			min_flt += sig->min_flt;
			maj_flt += sig->maj_flt;
469
			thread_group_cputime_adjusted(task, &utime, &stime);
470
			gtime += sig->gtime;
L
Linus Torvalds 已提交
471
		}
472

473
		sid = task_session_nr_ns(task, ns);
474
		ppid = task_tgid_nr_ns(task->real_parent, ns);
475
		pgid = task_pgrp_nr_ns(task, ns);
476 477

		unlock_task_sighand(task, &flags);
L
Linus Torvalds 已提交
478 479
	}

480
	if (permitted && (!whole || num_threads < 2))
L
Linus Torvalds 已提交
481 482 483 484
		wchan = get_wchan(task);
	if (!whole) {
		min_flt = task->min_flt;
		maj_flt = task->maj_flt;
485
		task_cputime_adjusted(task, &utime, &stime);
486
		gtime = task_gtime(task);
L
Linus Torvalds 已提交
487 488 489 490 491 492 493 494
	}

	/* scale priority and nice values from timeslices to -20..20 */
	/* to make it look like a "normal" Unix priority/nice value  */
	priority = task_prio(task);
	nice = task_nice(task);

	/* convert nsec -> ticks */
495
	start_time = nsec_to_clock_t(task->real_start_time);
L
Linus Torvalds 已提交
496

497
	seq_printf(m, "%d (%s) %c", pid_nr_ns(pid, ns), tcomm, state);
498 499 500 501 502 503 504 505 506 507
	seq_put_decimal_ll(m, " ", ppid);
	seq_put_decimal_ll(m, " ", pgid);
	seq_put_decimal_ll(m, " ", sid);
	seq_put_decimal_ll(m, " ", tty_nr);
	seq_put_decimal_ll(m, " ", tty_pgrp);
	seq_put_decimal_ull(m, " ", task->flags);
	seq_put_decimal_ull(m, " ", min_flt);
	seq_put_decimal_ull(m, " ", cmin_flt);
	seq_put_decimal_ull(m, " ", maj_flt);
	seq_put_decimal_ull(m, " ", cmaj_flt);
508 509 510 511
	seq_put_decimal_ull(m, " ", nsec_to_clock_t(utime));
	seq_put_decimal_ull(m, " ", nsec_to_clock_t(stime));
	seq_put_decimal_ll(m, " ", nsec_to_clock_t(cutime));
	seq_put_decimal_ll(m, " ", nsec_to_clock_t(cstime));
512 513 514 515 516 517 518 519 520 521 522 523 524
	seq_put_decimal_ll(m, " ", priority);
	seq_put_decimal_ll(m, " ", nice);
	seq_put_decimal_ll(m, " ", num_threads);
	seq_put_decimal_ull(m, " ", 0);
	seq_put_decimal_ull(m, " ", start_time);
	seq_put_decimal_ull(m, " ", vsize);
	seq_put_decimal_ull(m, " ", mm ? get_mm_rss(mm) : 0);
	seq_put_decimal_ull(m, " ", rsslim);
	seq_put_decimal_ull(m, " ", mm ? (permitted ? mm->start_code : 1) : 0);
	seq_put_decimal_ull(m, " ", mm ? (permitted ? mm->end_code : 1) : 0);
	seq_put_decimal_ull(m, " ", (permitted && mm) ? mm->start_stack : 0);
	seq_put_decimal_ull(m, " ", esp);
	seq_put_decimal_ull(m, " ", eip);
525 526 527 528
	/* The signal information here is obsolete.
	 * It must be decimal for Linux 2.0 compatibility.
	 * Use /proc/#/status for real-time signals.
	 */
529 530 531 532
	seq_put_decimal_ull(m, " ", task->pending.signal.sig[0] & 0x7fffffffUL);
	seq_put_decimal_ull(m, " ", task->blocked.sig[0] & 0x7fffffffUL);
	seq_put_decimal_ull(m, " ", sigign.sig[0] & 0x7fffffffUL);
	seq_put_decimal_ull(m, " ", sigcatch.sig[0] & 0x7fffffffUL);
533 534 535 536 537 538 539 540 541 542 543 544 545

	/*
	 * We used to output the absolute kernel address, but that's an
	 * information leak - so instead we show a 0/1 flag here, to signal
	 * to user-space whether there's a wchan field in /proc/PID/wchan.
	 *
	 * This works with older implementations of procps as well.
	 */
	if (wchan)
		seq_puts(m, " 1");
	else
		seq_puts(m, " 0");

546 547 548 549 550 551 552
	seq_put_decimal_ull(m, " ", 0);
	seq_put_decimal_ull(m, " ", 0);
	seq_put_decimal_ll(m, " ", task->exit_signal);
	seq_put_decimal_ll(m, " ", task_cpu(task));
	seq_put_decimal_ull(m, " ", task->rt_priority);
	seq_put_decimal_ull(m, " ", task->policy);
	seq_put_decimal_ull(m, " ", delayacct_blkio_ticks(task));
553 554
	seq_put_decimal_ull(m, " ", nsec_to_clock_t(gtime));
	seq_put_decimal_ll(m, " ", nsec_to_clock_t(cgtime));
555 556

	if (mm && permitted) {
557 558 559 560 561 562 563
		seq_put_decimal_ull(m, " ", mm->start_data);
		seq_put_decimal_ull(m, " ", mm->end_data);
		seq_put_decimal_ull(m, " ", mm->start_brk);
		seq_put_decimal_ull(m, " ", mm->arg_start);
		seq_put_decimal_ull(m, " ", mm->arg_end);
		seq_put_decimal_ull(m, " ", mm->env_start);
		seq_put_decimal_ull(m, " ", mm->env_end);
564
	} else
565
		seq_puts(m, " 0 0 0 0 0 0 0");
566 567

	if (permitted)
568
		seq_put_decimal_ll(m, " ", task->exit_code);
569
	else
570
		seq_puts(m, " 0");
571

572
	seq_putc(m, '\n');
573
	if (mm)
L
Linus Torvalds 已提交
574
		mmput(mm);
575
	return 0;
L
Linus Torvalds 已提交
576 577
}

578 579
/*
 * Per-thread stat entry point: forwards to do_task_stat() with the
 * "whole" flag cleared, so only @task itself is accounted.
 */
int proc_tid_stat(struct seq_file *m, struct pid_namespace *ns,
			struct pid *pid, struct task_struct *task)
{
	const int whole = 0;

	return do_task_stat(m, ns, pid, task, whole);
}

584 585
/*
 * Thread-group stat entry point: forwards to do_task_stat() with the
 * "whole" flag set, so statistics are summed over the thread group.
 */
int proc_tgid_stat(struct seq_file *m, struct pid_namespace *ns,
			struct pid *pid, struct task_struct *task)
{
	const int whole = 1;

	return do_task_stat(m, ns, pid, task, whole);
}

590 591
/*
 * Emit the seven-column statm line for @task:
 *
 *	size resident shared text 0 data 0
 *
 * All five measured values are zero when the task has no mm.
 * Always returns 0.
 */
int proc_pid_statm(struct seq_file *m, struct pid_namespace *ns,
			struct pid *pid, struct task_struct *task)
{
	unsigned long total = 0;
	unsigned long resident = 0;
	unsigned long shared = 0;
	unsigned long text = 0;
	unsigned long data = 0;
	struct mm_struct *mm;

	mm = get_task_mm(task);
	if (mm) {
		total = task_statm(mm, &shared, &text, &data, &resident);
		mmput(mm);
	}

	/*
	 * Open-coded for speed; the output is equivalent to
	 * seq_printf(m, "%lu %lu %lu %lu 0 %lu 0\n",
	 *               size, resident, shared, text, data);
	 */
	seq_put_decimal_ull(m, "", total);
	seq_put_decimal_ull(m, " ", resident);
	seq_put_decimal_ull(m, " ", shared);
	seq_put_decimal_ull(m, " ", text);
	seq_put_decimal_ull(m, " ", 0);
	seq_put_decimal_ull(m, " ", data);
	seq_put_decimal_ull(m, " ", 0);
	seq_putc(m, '\n');

	return 0;
}
617

618
#ifdef CONFIG_PROC_CHILDREN
619 620 621 622 623 624 625 626 627 628 629 630 631 632 633 634 635 636 637 638 639 640 641 642 643 644 645 646 647 648 649 650 651 652 653 654 655 656 657 658 659 660 661 662 663 664 665 666 667 668 669 670 671 672 673 674 675 676 677 678 679 680
/*
 * Find the child of the task behind @inode that should be shown next.
 *
 * @pid_prev: pid returned by the previous step, or NULL on a fresh start
 * @pos:      zero-based index of the wanted child, used by the slow path
 *
 * Returns a referenced struct pid (taken with get_pid()), or NULL when
 * there is no such child or the parent task is gone. The whole lookup
 * runs under read_lock(&tasklist_lock).
 */
static struct pid *
get_children_pid(struct inode *inode, struct pid *pid_prev, loff_t pos)
{
	struct task_struct *parent, *child;
	struct pid *found = NULL;

	read_lock(&tasklist_lock);

	parent = pid_task(proc_pid(inode), PIDTYPE_PID);
	if (!parent)
		goto unlock;

	/*
	 * Fast path: if the previously returned child is still linked
	 * under the same parent, simply step to its next sibling. This
	 * gives a significant speedup on children-rich processes.
	 */
	if (pid_prev) {
		child = pid_task(pid_prev, PIDTYPE_PID);
		if (child && child->real_parent == parent &&
		    !list_empty(&child->sibling)) {
			if (!list_is_last(&child->sibling, &parent->children)) {
				child = list_first_entry(&child->sibling,
							 struct task_struct,
							 sibling);
				found = get_pid(task_pid(child));
			}
			goto unlock;
		}
	}

	/*
	 * Slow search case.
	 *
	 * We might miss some children here if children
	 * are exited while we were not holding the lock,
	 * but it was never promised to be accurate that
	 * much.
	 *
	 * "Just suppose that the parent sleeps, but N children
	 *  exit after we printed their tids. Now the slow paths
	 *  skips N extra children, we miss N tasks." (c)
	 *
	 * So one needs to stop or freeze the leader and all
	 * its children to get a precise result.
	 */
	list_for_each_entry(child, &parent->children, sibling) {
		if (pos-- == 0) {
			found = get_pid(task_pid(child));
			break;
		}
	}

unlock:
	read_unlock(&tasklist_lock);
	return found;
}

/*
 * seq_file ->show: print the pid number of the child @v, translated via
 * the pid namespace stored in the superblock's s_fs_info, followed by a
 * single space. Always returns 0.
 */
static int children_seq_show(struct seq_file *seq, void *v)
{
	struct inode *inode = seq->private;

	seq_printf(seq, "%d ", pid_nr_ns(v, inode->i_sb->s_fs_info));
	return 0;
}

/*
 * seq_file ->start: look up the child at index *@pos from scratch
 * (no previous pid to continue from).
 */
static void *children_seq_start(struct seq_file *seq, loff_t *pos)
{
	struct inode *inode = seq->private;

	return get_children_pid(inode, NULL, *pos);
}

/*
 * seq_file ->next: fetch the child following @v, drop the reference
 * held on @v, and advance *@pos by one.
 */
static void *children_seq_next(struct seq_file *seq, void *v, loff_t *pos)
{
	struct pid *next = get_children_pid(seq->private, v, *pos + 1);

	/* @v is only released after it has been used as the search hint */
	put_pid(v);
	(*pos)++;

	return next;
}

/* seq_file ->stop: drop the reference on the pid the iteration ended on. */
static void children_seq_stop(struct seq_file *seq, void *v)
{
	struct pid *last = v;

	put_pid(last);
}

/* Iterator callbacks used by the children seq_file. */
static const struct seq_operations children_seq_ops = {
	.start	= children_seq_start,
	.stop	= children_seq_stop,
	.next	= children_seq_next,
	.show	= children_seq_show,
};

/*
 * ->open: set up a seq_file using children_seq_ops and stash @inode in
 * its private pointer for the iterator callbacks.
 *
 * Returns the seq_open() result.
 */
static int children_seq_open(struct inode *inode, struct file *file)
{
	int err = seq_open(file, &children_seq_ops);

	if (!err) {
		struct seq_file *m = file->private_data;

		m->private = inode;
	}

	return err;
}

/*
 * ->release: tear down the seq_file. The seq_release() result is
 * discarded and 0 is always returned.
 */
int children_seq_release(struct inode *inode, struct file *file)
{
	(void)seq_release(inode, file);

	return 0;
}

/* File operations for the children file: a read-only seq_file. */
const struct file_operations proc_tid_children_operations = {
	.open    = children_seq_open,
	.release = children_seq_release,
	.read    = seq_read,
	.llseek  = seq_lseek,
};
741
#endif /* CONFIG_PROC_CHILDREN */