array.c 19.8 KB
Newer Older
L
Linus Torvalds 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42
/*
 *  linux/fs/proc/array.c
 *
 *  Copyright (C) 1992  by Linus Torvalds
 *  based on ideas by Darren Senn
 *
 * Fixes:
 * Michael. K. Johnson: stat,statm extensions.
 *                      <johnsonm@stolaf.edu>
 *
 * Pauline Middelink :  Made cmdline,envline only break at '\0's, to
 *                      make sure SET_PROCTITLE works. Also removed
 *                      bad '!' which forced address recalculation for
 *                      EVERY character on the current page.
 *                      <middelin@polyware.iaf.nl>
 *
 * Danny ter Haar    :	added cpuinfo
 *			<dth@cistron.nl>
 *
 * Alessandro Rubini :  profile extension.
 *                      <rubini@ipvvis.unipv.it>
 *
 * Jeff Tranter      :  added BogoMips field to cpuinfo
 *                      <Jeff_Tranter@Mitel.COM>
 *
 * Bruno Haible      :  remove 4K limit for the maps file
 *			<haible@ma2s2.mathematik.uni-karlsruhe.de>
 *
 * Yves Arrouye      :  remove removal of trailing spaces in get_array.
 *			<Yves.Arrouye@marin.fdn.fr>
 *
 * Jerome Forissier  :  added per-CPU time information to /proc/stat
 *                      and /proc/<pid>/cpu extension
 *                      <forissier@isia.cma.fr>
 *			- Incorporation and non-SMP safe operation
 *			of forissier patch in 2.1.78 by
 *			Hans Marcus <crowbar@concepts.nl>
 *
 * aeb@cwi.nl        :  /proc/partitions
 *
 *
 * Alan Cox	     :  security fixes.
 *			<alan@lxorguk.ukuu.org.uk>
 *
 * Al Viro           :  safe handling of mm_struct
 *
 * Gerhard Wichert   :  added BIGMEM support
 * Siemens AG           <Gerhard.Wichert@pdb.siemens.de>
 *
 * Al Viro & Jeff Garzik :  moved most of the thing into base.c and
 *			 :  proc_misc.c. The rest may eventually go into
 *			 :  base.c too.
 */

#include <linux/types.h>
#include <linux/errno.h>
#include <linux/time.h>
#include <linux/kernel.h>
#include <linux/kernel_stat.h>
#include <linux/tty.h>
#include <linux/string.h>
#include <linux/mman.h>
#include <linux/proc_fs.h>
#include <linux/ioport.h>
65 66
#include <linux/uaccess.h>
#include <linux/io.h>
L
Linus Torvalds 已提交
67 68 69 70 71 72 73 74
#include <linux/mm.h>
#include <linux/hugetlb.h>
#include <linux/pagemap.h>
#include <linux/swap.h>
#include <linux/smp.h>
#include <linux/signal.h>
#include <linux/highmem.h>
#include <linux/file.h>
A
Al Viro 已提交
75
#include <linux/fdtable.h>
L
Linus Torvalds 已提交
76 77
#include <linux/times.h>
#include <linux/cpuset.h>
78
#include <linux/rcupdate.h>
79
#include <linux/delayacct.h>
80
#include <linux/seq_file.h>
81
#include <linux/pid_namespace.h>
82
#include <linux/ptrace.h>
83
#include <linux/tracehook.h>
84
#include <linux/string_helpers.h>
85
#include <linux/user_namespace.h>
86
#include <linux/fs_struct.h>
L
Linus Torvalds 已提交
87 88 89 90 91

#include <asm/pgtable.h>
#include <asm/processor.h>
#include "internal.h"

92
static inline void task_name(struct seq_file *m, struct task_struct *p)
L
Linus Torvalds 已提交
93
{
94
	char *buf;
95
	size_t size;
L
Linus Torvalds 已提交
96
	char tcomm[sizeof(p->comm)];
97
	int ret;
L
Linus Torvalds 已提交
98 99 100

	get_task_comm(tcomm, p);

101
	seq_puts(m, "Name:\t");
102

103 104 105
	size = seq_get_buf(m, &buf);
	ret = string_escape_str(tcomm, buf, size, ESCAPE_SPACE | ESCAPE_SPECIAL, "\n\\");
	seq_commit(m, ret < size ? ret : -1);
106

107
	seq_putc(m, '\n');
L
Linus Torvalds 已提交
108 109 110 111 112 113 114 115
}

/*
 * The task state array is a strange "bitmap" of
 * reasons to sleep. Thus "running" is zero, and
 * you can test for combinations of others with
 * simple bit tests.
 */
M
Mike Frysinger 已提交
116
/*
 * Human-readable task states.  The trailing comment on each entry is the
 * value noted for that state in the original table; get_task_state()
 * indexes this array with fls() of the masked state.
 */
static const char * const task_state_array[] = {
	"R (running)",		/*   0 */
	"S (sleeping)",		/*   1 */
	"D (disk sleep)",	/*   2 */
	"T (stopped)",		/*   4 */
	"t (tracing stop)",	/*   8 */
	"X (dead)",		/*  16 */
	"Z (zombie)",		/*  32 */
};

126
static inline const char *get_task_state(struct task_struct *tsk)
L
Linus Torvalds 已提交
127
{
128
	unsigned int state = (tsk->state | tsk->exit_state) & TASK_REPORT;
L
Linus Torvalds 已提交
129

130 131 132 133 134 135 136 137
	/*
	 * Parked tasks do not run; they sit in __kthread_parkme().
	 * Without this check, we would report them as running, which is
	 * clearly wrong, so we report them as sleeping instead.
	 */
	if (tsk->state == TASK_PARKED)
		state = TASK_INTERRUPTIBLE;

138
	BUILD_BUG_ON(1 + ilog2(TASK_REPORT) != ARRAY_SIZE(task_state_array)-1);
139

140
	return task_state_array[fls(state)];
L
Linus Torvalds 已提交
141 142
}

143 144 145 146 147 148 149 150 151 152 153 154 155
/*
 * Read the umask of @tsk while holding task_lock().
 *
 * Returns the umask from tsk->fs, or -ENOENT when the task has no
 * fs_struct attached.
 */
static inline int get_task_umask(struct task_struct *tsk)
{
	struct fs_struct *task_fs;
	int mask;

	task_lock(tsk);
	task_fs = tsk->fs;
	mask = task_fs ? task_fs->umask : -ENOENT;
	task_unlock(tsk);

	return mask;
}

156 157
static inline void task_state(struct seq_file *m, struct pid_namespace *ns,
				struct pid *pid, struct task_struct *p)
L
Linus Torvalds 已提交
158
{
159
	struct user_namespace *user_ns = seq_user_ns(m);
L
Linus Torvalds 已提交
160
	struct group_info *group_info;
161
	int g, umask;
162
	struct task_struct *tracer;
163
	const struct cred *cred;
164
	pid_t ppid, tpid = 0, tgid, ngid;
165
	unsigned int max_fds = 0;
L
Linus Torvalds 已提交
166

167
	rcu_read_lock();
168 169
	ppid = pid_alive(p) ?
		task_tgid_nr_ns(rcu_dereference(p->real_parent), ns) : 0;
170 171 172 173

	tracer = ptrace_parent(p);
	if (tracer)
		tpid = task_pid_nr_ns(tracer, ns);
174 175 176

	tgid = task_tgid_nr_ns(p, ns);
	ngid = task_numa_group_id(p);
177
	cred = get_task_cred(p);
178

179 180 181 182
	umask = get_task_umask(p);
	if (umask >= 0)
		seq_printf(m, "Umask:\t%#04o\n", umask);

183 184 185 186
	task_lock(p);
	if (p->files)
		max_fds = files_fdtable(p->files)->max_fds;
	task_unlock(p);
187
	rcu_read_unlock();
188

A
Alexey Dobriyan 已提交
189 190
	seq_printf(m, "State:\t%s", get_task_state(p));

191 192 193 194 195 196 197 198 199 200 201 202 203 204
	seq_put_decimal_ull(m, "\nTgid:\t", tgid);
	seq_put_decimal_ull(m, "\nNgid:\t", ngid);
	seq_put_decimal_ull(m, "\nPid:\t", pid_nr_ns(pid, ns));
	seq_put_decimal_ull(m, "\nPPid:\t", ppid);
	seq_put_decimal_ull(m, "\nTracerPid:\t", tpid);
	seq_put_decimal_ull(m, "\nUid:\t", from_kuid_munged(user_ns, cred->uid));
	seq_put_decimal_ull(m, "\t", from_kuid_munged(user_ns, cred->euid));
	seq_put_decimal_ull(m, "\t", from_kuid_munged(user_ns, cred->suid));
	seq_put_decimal_ull(m, "\t", from_kuid_munged(user_ns, cred->fsuid));
	seq_put_decimal_ull(m, "\nGid:\t", from_kgid_munged(user_ns, cred->gid));
	seq_put_decimal_ull(m, "\t", from_kgid_munged(user_ns, cred->egid));
	seq_put_decimal_ull(m, "\t", from_kgid_munged(user_ns, cred->sgid));
	seq_put_decimal_ull(m, "\t", from_kgid_munged(user_ns, cred->fsgid));
	seq_put_decimal_ull(m, "\nFDSize:\t", max_fds);
A
Alexey Dobriyan 已提交
205 206

	seq_puts(m, "\nGroups:\t");
207
	group_info = cred->group_info;
208
	for (g = 0; g < group_info->ngroups; g++)
209
		seq_put_decimal_ull(m, g ? " " : "",
210
				from_kgid_munged(user_ns, group_info->gid[g]));
211
	put_cred(cred);
A
Alexey Dobriyan 已提交
212 213
	/* Trailing space shouldn't have been added in the first place. */
	seq_putc(m, ' ');
L
Linus Torvalds 已提交
214

215 216 217
#ifdef CONFIG_PID_NS
	seq_puts(m, "\nNStgid:");
	for (g = ns->level; g <= pid->level; g++)
218
		seq_put_decimal_ull(m, "\t", task_tgid_nr_ns(p, pid->numbers[g].ns));
219 220
	seq_puts(m, "\nNSpid:");
	for (g = ns->level; g <= pid->level; g++)
221
		seq_put_decimal_ull(m, "\t", task_pid_nr_ns(p, pid->numbers[g].ns));
222 223
	seq_puts(m, "\nNSpgid:");
	for (g = ns->level; g <= pid->level; g++)
224
		seq_put_decimal_ull(m, "\t", task_pgrp_nr_ns(p, pid->numbers[g].ns));
225 226
	seq_puts(m, "\nNSsid:");
	for (g = ns->level; g <= pid->level; g++)
227
		seq_put_decimal_ull(m, "\t", task_session_nr_ns(p, pid->numbers[g].ns));
228
#endif
229
	seq_putc(m, '\n');
L
Linus Torvalds 已提交
230 231
}

232
void render_sigset_t(struct seq_file *m, const char *header,
233
				sigset_t *set)
L
Linus Torvalds 已提交
234
{
235
	int i;
L
Linus Torvalds 已提交
236

237
	seq_puts(m, header);
L
Linus Torvalds 已提交
238 239 240 241 242 243 244 245 246 247

	i = _NSIG;
	do {
		int x = 0;

		i -= 4;
		if (sigismember(set, i+1)) x |= 1;
		if (sigismember(set, i+2)) x |= 2;
		if (sigismember(set, i+3)) x |= 4;
		if (sigismember(set, i+4)) x |= 8;
248
		seq_printf(m, "%x", x);
L
Linus Torvalds 已提交
249 250
	} while (i >= 4);

251
	seq_putc(m, '\n');
L
Linus Torvalds 已提交
252 253 254 255 256 257 258 259 260 261 262 263 264 265 266 267 268
}

/*
 * Classify every signal handler of @p: signals whose handler is SIG_IGN
 * are added to @ign, signals with any handler other than SIG_DFL are
 * added to @catch.  The sets are only added to, never cleared here.
 */
static void collect_sigign_sigcatch(struct task_struct *p, sigset_t *ign,
				    sigset_t *catch)
{
	struct k_sigaction *actions = p->sighand->action;
	int signo;

	/* signal numbers are 1-based, the action table is 0-based */
	for (signo = 1; signo <= _NSIG; signo++) {
		const struct k_sigaction *ka = &actions[signo - 1];

		if (ka->sa.sa_handler == SIG_IGN) {
			sigaddset(ign, signo);
			continue;
		}
		if (ka->sa.sa_handler != SIG_DFL)
			sigaddset(catch, signo);
	}
}

269
static inline void task_sig(struct seq_file *m, struct task_struct *p)
L
Linus Torvalds 已提交
270
{
271
	unsigned long flags;
L
Linus Torvalds 已提交
272 273 274 275 276 277 278 279 280 281 282
	sigset_t pending, shpending, blocked, ignored, caught;
	int num_threads = 0;
	unsigned long qsize = 0;
	unsigned long qlim = 0;

	sigemptyset(&pending);
	sigemptyset(&shpending);
	sigemptyset(&blocked);
	sigemptyset(&ignored);
	sigemptyset(&caught);

283
	if (lock_task_sighand(p, &flags)) {
L
Linus Torvalds 已提交
284 285 286 287
		pending = p->pending.signal;
		shpending = p->signal->shared_pending.signal;
		blocked = p->blocked;
		collect_sigign_sigcatch(p, &ignored, &caught);
288
		num_threads = get_nr_threads(p);
289
		rcu_read_lock();  /* FIXME: is this correct? */
290
		qsize = atomic_read(&__task_cred(p)->user->sigpending);
291
		rcu_read_unlock();
J
Jiri Slaby 已提交
292
		qlim = task_rlimit(p, RLIMIT_SIGPENDING);
293
		unlock_task_sighand(p, &flags);
L
Linus Torvalds 已提交
294 295
	}

296 297 298
	seq_put_decimal_ull(m, "Threads:\t", num_threads);
	seq_put_decimal_ull(m, "\nSigQ:\t", qsize);
	seq_put_decimal_ull(m, "/", qlim);
L
Linus Torvalds 已提交
299 300

	/* render them all */
A
Alexey Dobriyan 已提交
301
	render_sigset_t(m, "\nSigPnd:\t", &pending);
302 303 304 305
	render_sigset_t(m, "ShdPnd:\t", &shpending);
	render_sigset_t(m, "SigBlk:\t", &blocked);
	render_sigset_t(m, "SigIgn:\t", &ignored);
	render_sigset_t(m, "SigCgt:\t", &caught);
L
Linus Torvalds 已提交
306 307
}

308 309
/*
 * Print @header followed by capability set @a as a run of 8-digit hex
 * words and a newline.
 *
 * The word printed on each iteration is a->cap[CAP_LAST_U32 - __capi],
 * i.e. the array is walked in the opposite direction to the loop index.
 * NOTE(review): presumably CAP_FOR_EACH_U32 counts upward so the highest
 * word comes first; the macro is not visible here - confirm.
 */
static void render_cap_t(struct seq_file *m, const char *header,
			kernel_cap_t *a)
{
	unsigned __capi;

	seq_puts(m, header);
	CAP_FOR_EACH_U32(__capi) {
		seq_printf(m, "%08x",
			   a->cap[CAP_LAST_U32 - __capi]);
	}
	seq_putc(m, '\n');
}

321
static inline void task_cap(struct seq_file *m, struct task_struct *p)
L
Linus Torvalds 已提交
322
{
323
	const struct cred *cred;
324 325
	kernel_cap_t cap_inheritable, cap_permitted, cap_effective,
			cap_bset, cap_ambient;
326

327 328 329 330 331 332
	rcu_read_lock();
	cred = __task_cred(p);
	cap_inheritable	= cred->cap_inheritable;
	cap_permitted	= cred->cap_permitted;
	cap_effective	= cred->cap_effective;
	cap_bset	= cred->cap_bset;
333
	cap_ambient	= cred->cap_ambient;
334 335 336 337 338 339
	rcu_read_unlock();

	render_cap_t(m, "CapInh:\t", &cap_inheritable);
	render_cap_t(m, "CapPrm:\t", &cap_permitted);
	render_cap_t(m, "CapEff:\t", &cap_effective);
	render_cap_t(m, "CapBnd:\t", &cap_bset);
340
	render_cap_t(m, "CapAmb:\t", &cap_ambient);
L
Linus Torvalds 已提交
341 342
}

K
Kees Cook 已提交
343 344 345
/*
 * Emit the "Seccomp:" line with the value of p->seccomp.mode.
 * Produces no output when CONFIG_SECCOMP is not set.
 */
static inline void task_seccomp(struct seq_file *m, struct task_struct *p)
{
#ifdef CONFIG_SECCOMP
	seq_put_decimal_ull(m, "Seccomp:\t", p->seccomp.mode);
	seq_putc(m, '\n');
#endif
}

351 352
static inline void task_context_switch_counts(struct seq_file *m,
						struct task_struct *p)
353
{
354 355
	seq_put_decimal_ull(m, "voluntary_ctxt_switches:\t", p->nvcsw);
	seq_put_decimal_ull(m, "\nnonvoluntary_ctxt_switches:\t", p->nivcsw);
A
Alexey Dobriyan 已提交
356
	seq_putc(m, '\n');
357 358
}

359 360
/*
 * Emit task->cpus_allowed twice: once with the %*pb format
 * ("Cpus_allowed:") and once with the %*pbl format
 * ("Cpus_allowed_list:").
 */
static void task_cpus_allowed(struct seq_file *m, struct task_struct *task)
{
	seq_printf(m, "Cpus_allowed:\t%*pb\n",
		   cpumask_pr_args(&task->cpus_allowed));
	seq_printf(m, "Cpus_allowed_list:\t%*pbl\n",
		   cpumask_pr_args(&task->cpus_allowed));
}

367 368
/*
 * Fill @m with the status report for @task by calling the individual
 * section writers in a fixed order: name, state, memory (only when the
 * task has an mm), signals, capabilities, seccomp, allowed CPUs, cpuset
 * information and context-switch counts.
 *
 * The mm reference taken with get_task_mm() is released with mmput()
 * right after task_mem().  Always returns 0.
 */
int proc_pid_status(struct seq_file *m, struct pid_namespace *ns,
			struct pid *pid, struct task_struct *task)
{
	struct mm_struct *mm = get_task_mm(task);

	task_name(m, task);
	task_state(m, ns, pid, task);

	if (mm) {
		task_mem(m, mm);
		mmput(mm);
	}
	task_sig(m, task);
	task_cap(m, task);
	task_seccomp(m, task);
	task_cpus_allowed(m, task);
	cpuset_task_status_allowed(m, task);
	task_context_switch_counts(m, task);
	return 0;
}

388 389
static int do_task_stat(struct seq_file *m, struct pid_namespace *ns,
			struct pid *pid, struct task_struct *task, int whole)
L
Linus Torvalds 已提交
390
{
391
	unsigned long vsize, eip, esp, wchan = 0;
392
	int priority, nice;
L
Linus Torvalds 已提交
393 394 395
	int tty_pgrp = -1, tty_nr = 0;
	sigset_t sigign, sigcatch;
	char state;
396
	pid_t ppid = 0, pgid = -1, sid = -1;
L
Linus Torvalds 已提交
397
	int num_threads = 0;
398
	int permitted;
L
Linus Torvalds 已提交
399 400 401 402
	struct mm_struct *mm;
	unsigned long long start_time;
	unsigned long cmin_flt = 0, cmaj_flt = 0;
	unsigned long  min_flt = 0,  maj_flt = 0;
403
	cputime_t cutime, cstime, utime, stime;
404
	cputime_t cgtime, gtime;
L
Linus Torvalds 已提交
405 406
	unsigned long rsslim = 0;
	char tcomm[sizeof(task->comm)];
407
	unsigned long flags;
L
Linus Torvalds 已提交
408 409 410

	state = *get_task_state(task);
	vsize = eip = esp = 0;
411
	permitted = ptrace_may_access(task, PTRACE_MODE_READ_FSCREDS | PTRACE_MODE_NOAUDIT);
L
Linus Torvalds 已提交
412 413 414
	mm = get_task_mm(task);
	if (mm) {
		vsize = task_vsize(mm);
415 416 417 418 419
		/*
		 * esp and eip are intentionally zeroed out.  There is no
		 * non-racy way to read them without freezing the task.
		 * Programs that need reliable values can use ptrace(2).
		 */
L
Linus Torvalds 已提交
420 421 422 423 424 425
	}

	get_task_comm(tcomm, task);

	sigemptyset(&sigign);
	sigemptyset(&sigcatch);
426 427
	cutime = cstime = utime = stime = 0;
	cgtime = gtime = 0;
428

429 430
	if (lock_task_sighand(task, &flags)) {
		struct signal_struct *sig = task->signal;
431 432

		if (sig->tty) {
433 434 435
			struct pid *pgrp = tty_get_pgrp(sig->tty);
			tty_pgrp = pid_nr_ns(pgrp, ns);
			put_pid(pgrp);
436
			tty_nr = new_encode_dev(tty_devnum(sig->tty));
437 438
		}

439
		num_threads = get_nr_threads(task);
L
Linus Torvalds 已提交
440 441
		collect_sigign_sigcatch(task, &sigign, &sigcatch);

442 443 444 445
		cmin_flt = sig->cmin_flt;
		cmaj_flt = sig->cmaj_flt;
		cutime = sig->cutime;
		cstime = sig->cstime;
446
		cgtime = sig->cgtime;
J
Jiri Slaby 已提交
447
		rsslim = ACCESS_ONCE(sig->rlim[RLIMIT_RSS].rlim_cur);
448

L
Linus Torvalds 已提交
449 450
		/* add up live thread stats at the group level */
		if (whole) {
451
			struct task_struct *t = task;
L
Linus Torvalds 已提交
452 453 454
			do {
				min_flt += t->min_flt;
				maj_flt += t->maj_flt;
455
				gtime += task_gtime(t);
456
			} while_each_thread(task, t);
L
Linus Torvalds 已提交
457

458 459
			min_flt += sig->min_flt;
			maj_flt += sig->maj_flt;
460
			thread_group_cputime_adjusted(task, &utime, &stime);
461
			gtime += sig->gtime;
L
Linus Torvalds 已提交
462
		}
463

464
		sid = task_session_nr_ns(task, ns);
465
		ppid = task_tgid_nr_ns(task->real_parent, ns);
466
		pgid = task_pgrp_nr_ns(task, ns);
467 468

		unlock_task_sighand(task, &flags);
L
Linus Torvalds 已提交
469 470
	}

471
	if (permitted && (!whole || num_threads < 2))
L
Linus Torvalds 已提交
472 473 474 475
		wchan = get_wchan(task);
	if (!whole) {
		min_flt = task->min_flt;
		maj_flt = task->maj_flt;
476
		task_cputime_adjusted(task, &utime, &stime);
477
		gtime = task_gtime(task);
L
Linus Torvalds 已提交
478 479 480 481 482 483 484 485
	}

	/* scale priority and nice values from timeslices to -20..20 */
	/* to make it look like a "normal" Unix priority/nice value  */
	priority = task_prio(task);
	nice = task_nice(task);

	/* convert nsec -> ticks */
486
	start_time = nsec_to_clock_t(task->real_start_time);
L
Linus Torvalds 已提交
487

488
	seq_printf(m, "%d (%s) %c", pid_nr_ns(pid, ns), tcomm, state);
489 490 491 492 493 494 495 496 497 498 499 500 501 502 503 504 505 506 507 508 509 510 511 512 513 514 515
	seq_put_decimal_ll(m, " ", ppid);
	seq_put_decimal_ll(m, " ", pgid);
	seq_put_decimal_ll(m, " ", sid);
	seq_put_decimal_ll(m, " ", tty_nr);
	seq_put_decimal_ll(m, " ", tty_pgrp);
	seq_put_decimal_ull(m, " ", task->flags);
	seq_put_decimal_ull(m, " ", min_flt);
	seq_put_decimal_ull(m, " ", cmin_flt);
	seq_put_decimal_ull(m, " ", maj_flt);
	seq_put_decimal_ull(m, " ", cmaj_flt);
	seq_put_decimal_ull(m, " ", cputime_to_clock_t(utime));
	seq_put_decimal_ull(m, " ", cputime_to_clock_t(stime));
	seq_put_decimal_ll(m, " ", cputime_to_clock_t(cutime));
	seq_put_decimal_ll(m, " ", cputime_to_clock_t(cstime));
	seq_put_decimal_ll(m, " ", priority);
	seq_put_decimal_ll(m, " ", nice);
	seq_put_decimal_ll(m, " ", num_threads);
	seq_put_decimal_ull(m, " ", 0);
	seq_put_decimal_ull(m, " ", start_time);
	seq_put_decimal_ull(m, " ", vsize);
	seq_put_decimal_ull(m, " ", mm ? get_mm_rss(mm) : 0);
	seq_put_decimal_ull(m, " ", rsslim);
	seq_put_decimal_ull(m, " ", mm ? (permitted ? mm->start_code : 1) : 0);
	seq_put_decimal_ull(m, " ", mm ? (permitted ? mm->end_code : 1) : 0);
	seq_put_decimal_ull(m, " ", (permitted && mm) ? mm->start_stack : 0);
	seq_put_decimal_ull(m, " ", esp);
	seq_put_decimal_ull(m, " ", eip);
516 517 518 519
	/* The signal information here is obsolete.
	 * It must be decimal for Linux 2.0 compatibility.
	 * Use /proc/#/status for real-time signals.
	 */
520 521 522 523
	seq_put_decimal_ull(m, " ", task->pending.signal.sig[0] & 0x7fffffffUL);
	seq_put_decimal_ull(m, " ", task->blocked.sig[0] & 0x7fffffffUL);
	seq_put_decimal_ull(m, " ", sigign.sig[0] & 0x7fffffffUL);
	seq_put_decimal_ull(m, " ", sigcatch.sig[0] & 0x7fffffffUL);
524 525 526 527 528 529 530 531 532 533 534 535 536

	/*
	 * We used to output the absolute kernel address, but that's an
	 * information leak - so instead we show a 0/1 flag here, to signal
	 * to user-space whether there's a wchan field in /proc/PID/wchan.
	 *
	 * This works with older implementations of procps as well.
	 */
	if (wchan)
		seq_puts(m, " 1");
	else
		seq_puts(m, " 0");

537 538 539 540 541 542 543 544 545
	seq_put_decimal_ull(m, " ", 0);
	seq_put_decimal_ull(m, " ", 0);
	seq_put_decimal_ll(m, " ", task->exit_signal);
	seq_put_decimal_ll(m, " ", task_cpu(task));
	seq_put_decimal_ull(m, " ", task->rt_priority);
	seq_put_decimal_ull(m, " ", task->policy);
	seq_put_decimal_ull(m, " ", delayacct_blkio_ticks(task));
	seq_put_decimal_ull(m, " ", cputime_to_clock_t(gtime));
	seq_put_decimal_ll(m, " ", cputime_to_clock_t(cgtime));
546 547

	if (mm && permitted) {
548 549 550 551 552 553 554
		seq_put_decimal_ull(m, " ", mm->start_data);
		seq_put_decimal_ull(m, " ", mm->end_data);
		seq_put_decimal_ull(m, " ", mm->start_brk);
		seq_put_decimal_ull(m, " ", mm->arg_start);
		seq_put_decimal_ull(m, " ", mm->arg_end);
		seq_put_decimal_ull(m, " ", mm->env_start);
		seq_put_decimal_ull(m, " ", mm->env_end);
555
	} else
556
		seq_puts(m, " 0 0 0 0 0 0 0");
557 558

	if (permitted)
559
		seq_put_decimal_ll(m, " ", task->exit_code);
560
	else
561
		seq_puts(m, " 0");
562

563
	seq_putc(m, '\n');
564
	if (mm)
L
Linus Torvalds 已提交
565
		mmput(mm);
566
	return 0;
L
Linus Torvalds 已提交
567 568
}

569 570
/*
 * Per-thread stat record: do_task_stat() with whole == 0.
 * Returns whatever do_task_stat() returns.
 */
int proc_tid_stat(struct seq_file *m, struct pid_namespace *ns,
			struct pid *pid, struct task_struct *task)
{
	return do_task_stat(m, ns, pid, task, 0);
}

575 576
/*
 * Thread-group stat record: do_task_stat() with whole == 1.
 * Returns whatever do_task_stat() returns.
 */
int proc_tgid_stat(struct seq_file *m, struct pid_namespace *ns,
			struct pid *pid, struct task_struct *task)
{
	return do_task_stat(m, ns, pid, task, 1);
}

581 582
/*
 * Write the "statm" record for @task: seven space-separated numbers
 * (size, resident, shared, text, 0, data, 0) followed by a newline.
 *
 * The values come from task_statm() when the task has an mm; otherwise
 * every number is 0.  @ns and @pid are not used.  Always returns 0.
 */
int proc_pid_statm(struct seq_file *m, struct pid_namespace *ns,
			struct pid *pid, struct task_struct *task)
{
	unsigned long size = 0, resident = 0, shared = 0, text = 0, data = 0;
	struct mm_struct *mm = get_task_mm(task);

	if (mm) {
		size = task_statm(mm, &shared, &text, &data, &resident);
		mmput(mm);
	}
	/*
	 * For quick read, open code by putting numbers directly
	 * expected format is
	 * seq_printf(m, "%lu %lu %lu %lu 0 %lu 0\n",
	 *               size, resident, shared, text, data);
	 */
	seq_put_decimal_ull(m, "", size);
	seq_put_decimal_ull(m, " ", resident);
	seq_put_decimal_ull(m, " ", shared);
	seq_put_decimal_ull(m, " ", text);
	seq_put_decimal_ull(m, " ", 0);
	seq_put_decimal_ull(m, " ", data);
	seq_put_decimal_ull(m, " ", 0);
	seq_putc(m, '\n');

	return 0;
}
608

609
#ifdef CONFIG_PROC_CHILDREN
610 611 612 613 614 615 616 617 618 619 620 621 622 623 624 625 626 627 628 629 630 631 632 633 634 635 636 637 638 639 640 641 642 643 644 645 646 647 648 649 650 651 652 653 654 655 656 657 658 659 660 661 662 663 664 665 666 667 668 669 670 671
/*
 * Find the child at position @pos among the children of the task that
 * @inode refers to, and return its struct pid with a reference taken
 * (get_pid()), or NULL when there is no such child or the task is gone.
 *
 * @pid_prev, when non-NULL, is the pid handed out by the previous call
 * and is used to continue from that child instead of rescanning.
 * The whole lookup runs under read_lock(&tasklist_lock).
 */
static struct pid *
get_children_pid(struct inode *inode, struct pid *pid_prev, loff_t pos)
{
	struct task_struct *parent, *child;
	struct pid *found = NULL;

	read_lock(&tasklist_lock);

	parent = pid_task(proc_pid(inode), PIDTYPE_PID);
	if (!parent)
		goto unlock;

	/*
	 * Fast path: resume right after the previously returned child.
	 * This is a significant speedup for processes with many children.
	 * It is only taken while that child still belongs to this parent
	 * and is still linked on a sibling list.
	 */
	if (pid_prev) {
		child = pid_task(pid_prev, PIDTYPE_PID);
		if (child && child->real_parent == parent &&
		    !list_empty(&child->sibling)) {
			/* previous child was the last one: nothing more */
			if (!list_is_last(&child->sibling, &parent->children)) {
				child = list_first_entry(&child->sibling,
							 struct task_struct,
							 sibling);
				found = get_pid(task_pid(child));
			}
			goto unlock;
		}
	}

	/*
	 * Slow path: count @pos entries into the children list.
	 *
	 * Children that exited while the lock was not held shift the
	 * positions, so some children may be missed; precise output was
	 * never promised.  For example, if the parent sleeps and N
	 * children exit after their tids were printed, this scan skips
	 * N extra children and N tasks are missed.
	 *
	 * A precise result requires stopping or freezing the leader and
	 * all of its children.
	 */
	list_for_each_entry(child, &parent->children, sibling) {
		if (pos-- == 0) {
			found = get_pid(task_pid(child));
			break;
		}
	}

unlock:
	read_unlock(&tasklist_lock);
	return found;
}

/*
 * seq_file ->show: print one child pid followed by a space.
 *
 * @v is the iterator element (the struct pid returned by the start/next
 * callbacks); it is converted to a number with pid_nr_ns(), using
 * inode->i_sb->s_fs_info as the namespace argument.  Always returns 0.
 */
static int children_seq_show(struct seq_file *seq, void *v)
{
	struct inode *inode = seq->private;
	pid_t pid;

	pid = pid_nr_ns(v, inode->i_sb->s_fs_info);
	seq_printf(seq, "%d ", pid);

	return 0;
}

/*
 * seq_file ->start: look up the child at position *@pos with no previous
 * pid to continue from.  Returns the result of get_children_pid().
 */
static void *children_seq_start(struct seq_file *seq, loff_t *pos)
{
	struct inode *inode = seq->private;
	loff_t index = *pos;

	return get_children_pid(inode, NULL, index);
}

/*
 * seq_file ->next: fetch the child following @v (position *@pos + 1),
 * drop the reference held on @v, advance *@pos by one and return the
 * new pid as produced by get_children_pid().
 */
static void *children_seq_next(struct seq_file *seq, void *v, loff_t *pos)
{
	struct pid *prev = v;
	struct pid *next;

	/* look up the successor before releasing the previous element */
	next = get_children_pid(seq->private, prev, *pos + 1);
	put_pid(prev);
	*pos += 1;

	return next;
}

/*
 * seq_file ->stop: release the reference on the element the iteration
 * stopped at by passing @v to put_pid().
 */
static void children_seq_stop(struct seq_file *seq, void *v)
{
	struct pid *last = v;

	put_pid(last);
}

/* seq_file iterator callbacks used by children_seq_open(). */
static const struct seq_operations children_seq_ops = {
	.start	= children_seq_start,
	.show	= children_seq_show,
	.next	= children_seq_next,
	.stop	= children_seq_stop,
};

/*
 * ->open: set up a seq_file using children_seq_ops and, on success,
 * store @inode in its private pointer for the iterator callbacks.
 * Returns the result of seq_open().
 */
static int children_seq_open(struct inode *inode, struct file *file)
{
	int err = seq_open(file, &children_seq_ops);

	if (!err) {
		struct seq_file *sf = file->private_data;

		sf->private = inode;
	}

	return err;
}

/*
 * ->release: hand the file to seq_release().  The result of
 * seq_release() is discarded and 0 is always returned.
 */
int children_seq_release(struct inode *inode, struct file *file)
{
	(void)seq_release(inode, file);

	return 0;
}

/*
 * File operations for the children listing: open/release are the local
 * seq_file wrappers, read and llseek use the generic seq_file helpers.
 */
const struct file_operations proc_tid_children_operations = {
	.open    = children_seq_open,
	.release = children_seq_release,
	.read    = seq_read,
	.llseek  = seq_lseek,
};
732
#endif /* CONFIG_PROC_CHILDREN */