array.c 14.0 KB
Newer Older
L
Linus Torvalds 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64
/*
 *  linux/fs/proc/array.c
 *
 *  Copyright (C) 1992  by Linus Torvalds
 *  based on ideas by Darren Senn
 *
 * Fixes:
 * Michael. K. Johnson: stat,statm extensions.
 *                      <johnsonm@stolaf.edu>
 *
 * Pauline Middelink :  Made cmdline,envline only break at '\0's, to
 *                      make sure SET_PROCTITLE works. Also removed
 *                      bad '!' which forced address recalculation for
 *                      EVERY character on the current page.
 *                      <middelin@polyware.iaf.nl>
 *
 * Danny ter Haar    :	added cpuinfo
 *			<dth@cistron.nl>
 *
 * Alessandro Rubini :  profile extension.
 *                      <rubini@ipvvis.unipv.it>
 *
 * Jeff Tranter      :  added BogoMips field to cpuinfo
 *                      <Jeff_Tranter@Mitel.COM>
 *
 * Bruno Haible      :  remove 4K limit for the maps file
 *			<haible@ma2s2.mathematik.uni-karlsruhe.de>
 *
 * Yves Arrouye      :  remove removal of trailing spaces in get_array.
 *			<Yves.Arrouye@marin.fdn.fr>
 *
 * Jerome Forissier  :  added per-CPU time information to /proc/stat
 *                      and /proc/<pid>/cpu extension
 *                      <forissier@isia.cma.fr>
 *			- Incorporation and non-SMP safe operation
 *			of forissier patch in 2.1.78 by
 *			Hans Marcus <crowbar@concepts.nl>
 *
 * aeb@cwi.nl        :  /proc/partitions
 *
 *
 * Alan Cox	     :  security fixes.
 *			<Alan.Cox@linux.org>
 *
 * Al Viro           :  safe handling of mm_struct
 *
 * Gerhard Wichert   :  added BIGMEM support
 * Siemens AG           <Gerhard.Wichert@pdb.siemens.de>
 *
 * Al Viro & Jeff Garzik :  moved most of the thing into base.c and
 *			 :  proc_misc.c. The rest may eventually go into
 *			 :  base.c too.
 */

#include <linux/types.h>
#include <linux/errno.h>
#include <linux/time.h>
#include <linux/kernel.h>
#include <linux/kernel_stat.h>
#include <linux/tty.h>
#include <linux/string.h>
#include <linux/mman.h>
#include <linux/proc_fs.h>
#include <linux/ioport.h>
65 66
#include <linux/uaccess.h>
#include <linux/io.h>
L
Linus Torvalds 已提交
67 68 69 70 71 72 73 74 75 76 77
#include <linux/mm.h>
#include <linux/hugetlb.h>
#include <linux/pagemap.h>
#include <linux/swap.h>
#include <linux/slab.h>
#include <linux/smp.h>
#include <linux/signal.h>
#include <linux/highmem.h>
#include <linux/file.h>
#include <linux/times.h>
#include <linux/cpuset.h>
78
#include <linux/rcupdate.h>
79
#include <linux/delayacct.h>
80
#include <linux/seq_file.h>
81
#include <linux/pid_namespace.h>
L
Linus Torvalds 已提交
82 83 84 85 86 87 88 89 90 91

#include <asm/pgtable.h>
#include <asm/processor.h>
#include "internal.h"

/*
 * Append the NUL-terminated @string (without its terminator) at @buffer
 * and advance @buffer past the bytes that were copied.
 *
 * @buffer must be a modifiable char pointer lvalue.
 * @string is evaluated exactly once, so an argument with side effects
 * (e.g. "names[i++]") is safe to pass.
 *
 * Gcc optimizes away "strlen(x)" for constant x.
 */
#define ADDBUF(buffer, string) \
do { \
	const char *addbuf_src_ = (string); \
	size_t addbuf_len_ = strlen(addbuf_src_); \
	memcpy((buffer), addbuf_src_, addbuf_len_); \
	(buffer) += addbuf_len_; \
} while (0)

92
static inline char *task_name(struct task_struct *p, char *buf)
L
Linus Torvalds 已提交
93 94
{
	int i;
95
	char *name;
L
Linus Torvalds 已提交
96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142
	char tcomm[sizeof(p->comm)];

	get_task_comm(tcomm, p);

	ADDBUF(buf, "Name:\t");
	name = tcomm;
	i = sizeof(tcomm);
	do {
		unsigned char c = *name;
		name++;
		i--;
		*buf = c;
		if (!c)
			break;
		if (c == '\\') {
			buf[1] = c;
			buf += 2;
			continue;
		}
		if (c == '\n') {
			buf[0] = '\\';
			buf[1] = 'n';
			buf += 2;
			continue;
		}
		buf++;
	} while (i);
	*buf = '\n';
	return buf+1;
}

/*
 * The task state array is a strange "bitmap" of
 * reasons to sleep. Thus "running" is zero, and
 * you can test for combinations of others with
 * simple bit tests.
 *
 * Entry 0 is used when no state bit is set.  get_task_state() advances
 * one entry for every right shift needed to clear the state word, so
 * the entry chosen is the one for the highest bit that is set.  The
 * number in the comment beside each entry is the value of that bit.
 */
static const char *task_state_array[] = {
	"R (running)",		/*  0 */
	"S (sleeping)",		/*  1 */
	"D (disk sleep)",	/*  2 */
	"T (stopped)",		/*  4 */
	"T (tracing stop)",	/*  8 */
	"Z (zombie)",		/* 16 */
	"X (dead)"		/* 32 */
};

143
static inline const char *get_task_state(struct task_struct *tsk)
L
Linus Torvalds 已提交
144
{
M
Matthew Wilcox 已提交
145
	unsigned int state = (tsk->state & TASK_REPORT) | tsk->exit_state;
L
Linus Torvalds 已提交
146 147 148 149 150 151 152 153 154
	const char **p = &task_state_array[0];

	while (state) {
		p++;
		state >>= 1;
	}
	return *p;
}

155
static inline char *task_state(struct task_struct *p, char *buffer)
L
Linus Torvalds 已提交
156 157 158
{
	struct group_info *group_info;
	int g;
159
	struct fdtable *fdt = NULL;
160 161
	struct pid_namespace *ns;
	pid_t ppid, tpid;
L
Linus Torvalds 已提交
162

163
	ns = current->nsproxy->pid_ns;
164
	rcu_read_lock();
165 166 167
	ppid = pid_alive(p) ?
		task_tgid_nr_ns(rcu_dereference(p->real_parent), ns) : 0;
	tpid = pid_alive(p) && p->ptrace ?
R
Roland McGrath 已提交
168
		task_pid_nr_ns(rcu_dereference(p->parent), ns) : 0;
L
Linus Torvalds 已提交
169 170 171 172 173 174 175 176 177
	buffer += sprintf(buffer,
		"State:\t%s\n"
		"Tgid:\t%d\n"
		"Pid:\t%d\n"
		"PPid:\t%d\n"
		"TracerPid:\t%d\n"
		"Uid:\t%d\t%d\t%d\t%d\n"
		"Gid:\t%d\t%d\t%d\t%d\n",
		get_task_state(p),
178 179 180
		task_tgid_nr_ns(p, ns),
		task_pid_nr_ns(p, ns),
		ppid, tpid,
L
Linus Torvalds 已提交
181 182
		p->uid, p->euid, p->suid, p->fsuid,
		p->gid, p->egid, p->sgid, p->fsgid);
183

L
Linus Torvalds 已提交
184
	task_lock(p);
185 186
	if (p->files)
		fdt = files_fdtable(p->files);
L
Linus Torvalds 已提交
187 188 189
	buffer += sprintf(buffer,
		"FDSize:\t%d\n"
		"Groups:\t",
190
		fdt ? fdt->max_fds : 0);
191
	rcu_read_unlock();
L
Linus Torvalds 已提交
192 193 194 195 196

	group_info = p->group_info;
	get_group_info(group_info);
	task_unlock(p);

197 198
	for (g = 0; g < min(group_info->ngroups, NGROUPS_SMALL); g++)
		buffer += sprintf(buffer, "%d ", GROUP_AT(group_info, g));
L
Linus Torvalds 已提交
199 200 201 202 203 204
	put_group_info(group_info);

	buffer += sprintf(buffer, "\n");
	return buffer;
}

205
/*
 * Write @header followed by the signal set @set as lowercase hex digits
 * and a newline into @buffer.
 *
 * One digit is produced per group of four signals, starting with the
 * group that ends at signal _NSIG and working down; within a digit,
 * signal base+1 is bit 0 and signal base+4 is bit 3.
 *
 * A NUL is stored after the newline.  The returned pointer addresses
 * that NUL, so the next writer overwrites it.
 */
static char *render_sigset_t(const char *header, sigset_t *set, char *buffer)
{
	static const char hex[] = "0123456789abcdef";
	int len = strlen(header);
	int base = _NSIG;

	memcpy(buffer, header, len);
	buffer += len;

	do {
		int nibble = 0;
		int bit;

		base -= 4;
		for (bit = 0; bit < 4; bit++) {
			if (sigismember(set, base + bit + 1))
				nibble |= 1 << bit;
		}
		*buffer++ = hex[nibble];
	} while (base >= 4);

	*buffer++ = '\n';
	*buffer = 0;
	return buffer;
}

/*
 * Classify every signal 1.._NSIG of task @p by its installed handler:
 * signals whose handler is SIG_IGN are added to @ign, signals with any
 * handler other than SIG_IGN or SIG_DFL are added to @catch.  Signals
 * left at SIG_DFL are added to neither set.
 *
 * The sets are only added to, never cleared, so the caller supplies
 * them already initialised.  p->sighand is dereferenced without any
 * locking in this function.
 */
static void collect_sigign_sigcatch(struct task_struct *p, sigset_t *ign,
				    sigset_t *catch)
{
	struct k_sigaction *actions = p->sighand->action;
	int sig;

	for (sig = 1; sig <= _NSIG; sig++) {
		/* action[] is zero-based, signal numbers start at 1 */
		const struct k_sigaction *ka = &actions[sig - 1];

		if (ka->sa.sa_handler == SIG_IGN) {
			sigaddset(ign, sig);
			continue;
		}
		if (ka->sa.sa_handler != SIG_DFL)
			sigaddset(catch, sig);
	}
}

245
static inline char *task_sig(struct task_struct *p, char *buffer)
L
Linus Torvalds 已提交
246
{
247
	unsigned long flags;
L
Linus Torvalds 已提交
248 249 250 251 252 253 254 255 256 257 258
	sigset_t pending, shpending, blocked, ignored, caught;
	int num_threads = 0;
	unsigned long qsize = 0;
	unsigned long qlim = 0;

	sigemptyset(&pending);
	sigemptyset(&shpending);
	sigemptyset(&blocked);
	sigemptyset(&ignored);
	sigemptyset(&caught);

259 260
	rcu_read_lock();
	if (lock_task_sighand(p, &flags)) {
L
Linus Torvalds 已提交
261 262 263 264 265 266 267
		pending = p->pending.signal;
		shpending = p->signal->shared_pending.signal;
		blocked = p->blocked;
		collect_sigign_sigcatch(p, &ignored, &caught);
		num_threads = atomic_read(&p->signal->count);
		qsize = atomic_read(&p->user->sigpending);
		qlim = p->signal->rlim[RLIMIT_SIGPENDING].rlim_cur;
268
		unlock_task_sighand(p, &flags);
L
Linus Torvalds 已提交
269
	}
270
	rcu_read_unlock();
L
Linus Torvalds 已提交
271 272 273 274 275 276 277 278 279 280 281 282 283 284

	buffer += sprintf(buffer, "Threads:\t%d\n", num_threads);
	buffer += sprintf(buffer, "SigQ:\t%lu/%lu\n", qsize, qlim);

	/* render them all */
	buffer = render_sigset_t("SigPnd:\t", &pending, buffer);
	buffer = render_sigset_t("ShdPnd:\t", &shpending, buffer);
	buffer = render_sigset_t("SigBlk:\t", &blocked, buffer);
	buffer = render_sigset_t("SigIgn:\t", &ignored, buffer);
	buffer = render_sigset_t("SigCgt:\t", &caught, buffer);

	return buffer;
}

285 286 287 288 289 290 291 292 293 294 295 296
/*
 * Write @header followed by the capability set @a as zero-padded
 * 8-digit hex words and a newline into @buffer.
 *
 * The words of a->cap[] are emitted from the highest index
 * (_LINUX_CAPABILITY_U32S - 1) down to index 0.
 *
 * Returns the new end of the output.
 */
static char *render_cap_t(const char *header, kernel_cap_t *a, char *buffer)
{
	unsigned word;

	buffer += sprintf(buffer, "%s", header);
	CAP_FOR_EACH_U32(word) {
		unsigned idx = (_LINUX_CAPABILITY_U32S - 1) - word;

		buffer += sprintf(buffer, "%08x", a->cap[idx]);
	}
	buffer += sprintf(buffer, "\n");
	return buffer;
}

L
Linus Torvalds 已提交
297 298
/*
 * Format the CapInh, CapPrm and CapEff lines (inheritable, permitted and
 * effective capability sets of @p, in that order) into @buffer and
 * return the new end of the output.
 */
static inline char *task_cap(struct task_struct *p, char *buffer)
{
	char *out = buffer;

	out = render_cap_t("CapInh:\t", &p->cap_inheritable, out);
	out = render_cap_t("CapPrm:\t", &p->cap_permitted, out);
	out = render_cap_t("CapEff:\t", &p->cap_effective, out);

	return out;
}

304 305 306 307 308 309 310 311 312
/*
 * Format the voluntary_ctxt_switches and nonvoluntary_ctxt_switches
 * lines from p->nvcsw and p->nivcsw into @buffer and return the new end
 * of the output.
 */
static inline char *task_context_switch_counts(struct task_struct *p,
						char *buffer)
{
	int written;

	written = sprintf(buffer,
			  "voluntary_ctxt_switches:\t%lu\n"
			  "nonvoluntary_ctxt_switches:\t%lu\n",
			  p->nvcsw, p->nivcsw);

	return buffer + written;
}

313
/*
 * Build the complete status text for @task in @buffer.
 *
 * The sections are emitted in a fixed order: name, state/ids, memory
 * (only when the task has an mm), signals, capabilities, the cpuset
 * section, architecture registers (CONFIG_S390 only) and the context
 * switch counters.
 *
 * Returns the number of bytes written to @buffer.
 */
int proc_pid_status(struct task_struct *task, char *buffer)
{
	char *const start = buffer;
	struct mm_struct *mm;

	/* The mm reference is taken first and dropped right after use. */
	mm = get_task_mm(task);

	buffer = task_name(task, buffer);
	buffer = task_state(task, buffer);

	if (mm) {
		buffer = task_mem(mm, buffer);
		mmput(mm);
	}

	buffer = task_sig(task, buffer);
	buffer = task_cap(task, buffer);
	buffer = cpuset_task_status_allowed(task, buffer);
#if defined(CONFIG_S390)
	buffer = task_show_regs(task, buffer);
#endif
	buffer = task_context_switch_counts(task, buffer);

	return buffer - start;
}

335 336 337 338 339 340 341 342 343 344 345 346 347 348 349
/*
 * Use precise platform statistics if available:
 */
#ifdef CONFIG_VIRT_CPU_ACCOUNTING
static cputime_t task_utime(struct task_struct *p)
{
	return p->utime;
}

static cputime_t task_stime(struct task_struct *p)
{
	return p->stime;
}
#else
static cputime_t task_utime(struct task_struct *p)
350 351 352 353 354 355 356 357 358 359 360 361 362 363 364 365
{
	clock_t utime = cputime_to_clock_t(p->utime),
		total = utime + cputime_to_clock_t(p->stime);
	u64 temp;

	/*
	 * Use CFS's precise accounting:
	 */
	temp = (u64)nsec_to_clock_t(p->se.sum_exec_runtime);

	if (total) {
		temp *= utime;
		do_div(temp, total);
	}
	utime = (clock_t)temp;

P
Peter Zijlstra 已提交
366 367
	p->prev_utime = max(p->prev_utime, clock_t_to_cputime(utime));
	return p->prev_utime;
368 369
}

370
static cputime_t task_stime(struct task_struct *p)
371
{
372
	clock_t stime;
373 374 375 376 377 378

	/*
	 * Use CFS's precise accounting. (we subtract utime from
	 * the total, to make sure the total observed by userspace
	 * grows monotonically - apps rely on that):
	 */
379 380
	stime = nsec_to_clock_t(p->se.sum_exec_runtime) -
			cputime_to_clock_t(task_utime(p));
381

I
Ingo Molnar 已提交
382 383 384
	if (stime >= 0)
		p->prev_stime = max(p->prev_stime, clock_t_to_cputime(stime));

385
	return p->prev_stime;
386
}
387
#endif
388

389 390 391 392 393
/*
 * Return the gtime counter stored in @p, unmodified.
 * NOTE(review): presumably "guest time"; confirm against the
 * task_struct definition.
 */
static cputime_t task_gtime(struct task_struct *p)
{
	return p->gtime;
}

394 395
static int do_task_stat(struct seq_file *m, struct pid_namespace *ns,
			struct pid *pid, struct task_struct *task, int whole)
L
Linus Torvalds 已提交
396 397 398 399 400 401
{
	unsigned long vsize, eip, esp, wchan = ~0UL;
	long priority, nice;
	int tty_pgrp = -1, tty_nr = 0;
	sigset_t sigign, sigcatch;
	char state;
402
	pid_t ppid = 0, pgid = -1, sid = -1;
L
Linus Torvalds 已提交
403 404 405 406 407
	int num_threads = 0;
	struct mm_struct *mm;
	unsigned long long start_time;
	unsigned long cmin_flt = 0, cmaj_flt = 0;
	unsigned long  min_flt = 0,  maj_flt = 0;
408
	cputime_t cutime, cstime, utime, stime;
409
	cputime_t cgtime, gtime;
L
Linus Torvalds 已提交
410 411
	unsigned long rsslim = 0;
	char tcomm[sizeof(task->comm)];
412
	unsigned long flags;
L
Linus Torvalds 已提交
413 414 415 416 417 418 419 420 421 422 423 424 425 426

	state = *get_task_state(task);
	vsize = eip = esp = 0;
	mm = get_task_mm(task);
	if (mm) {
		vsize = task_vsize(mm);
		eip = KSTK_EIP(task);
		esp = KSTK_ESP(task);
	}

	get_task_comm(tcomm, task);

	sigemptyset(&sigign);
	sigemptyset(&sigcatch);
427
	cutime = cstime = utime = stime = cputime_zero;
428
	cgtime = gtime = cputime_zero;
429

430 431 432
	rcu_read_lock();
	if (lock_task_sighand(task, &flags)) {
		struct signal_struct *sig = task->signal;
433 434

		if (sig->tty) {
435
			tty_pgrp = pid_nr_ns(sig->tty->pgrp, ns);
436
			tty_nr = new_encode_dev(tty_devnum(sig->tty));
437 438 439
		}

		num_threads = atomic_read(&sig->count);
L
Linus Torvalds 已提交
440 441
		collect_sigign_sigcatch(task, &sigign, &sigcatch);

442 443 444 445
		cmin_flt = sig->cmin_flt;
		cmaj_flt = sig->cmaj_flt;
		cutime = sig->cutime;
		cstime = sig->cstime;
446
		cgtime = sig->cgtime;
447 448
		rsslim = sig->rlim[RLIMIT_RSS].rlim_cur;

L
Linus Torvalds 已提交
449 450
		/* add up live thread stats at the group level */
		if (whole) {
451
			struct task_struct *t = task;
L
Linus Torvalds 已提交
452 453 454
			do {
				min_flt += t->min_flt;
				maj_flt += t->maj_flt;
455 456
				utime = cputime_add(utime, task_utime(t));
				stime = cputime_add(stime, task_stime(t));
457
				gtime = cputime_add(gtime, task_gtime(t));
L
Linus Torvalds 已提交
458 459 460
				t = next_thread(t);
			} while (t != task);

461 462
			min_flt += sig->min_flt;
			maj_flt += sig->maj_flt;
463 464
			utime = cputime_add(utime, sig->utime);
			stime = cputime_add(stime, sig->stime);
465
			gtime = cputime_add(gtime, sig->gtime);
L
Linus Torvalds 已提交
466
		}
467

468
		sid = task_session_nr_ns(task, ns);
469
		ppid = task_tgid_nr_ns(task->real_parent, ns);
470
		pgid = task_pgrp_nr_ns(task, ns);
471 472

		unlock_task_sighand(task, &flags);
L
Linus Torvalds 已提交
473
	}
474
	rcu_read_unlock();
L
Linus Torvalds 已提交
475

476
	if (!whole || num_threads < 2)
L
Linus Torvalds 已提交
477 478 479 480
		wchan = get_wchan(task);
	if (!whole) {
		min_flt = task->min_flt;
		maj_flt = task->maj_flt;
481 482
		utime = task_utime(task);
		stime = task_stime(task);
483
		gtime = task_gtime(task);
L
Linus Torvalds 已提交
484 485 486 487 488 489 490 491 492
	}

	/* scale priority and nice values from timeslices to -20..20 */
	/* to make it look like a "normal" Unix priority/nice value  */
	priority = task_prio(task);
	nice = task_nice(task);

	/* Temporary variable needed for gcc-2.96 */
	/* convert timespec -> nsec*/
493 494 495
	start_time =
		(unsigned long long)task->real_start_time.tv_sec * NSEC_PER_SEC
				+ task->real_start_time.tv_nsec;
L
Linus Torvalds 已提交
496 497 498
	/* convert nsec -> ticks */
	start_time = nsec_to_clock_t(start_time);

499
	seq_printf(m, "%d (%s) %c %d %d %d %d %d %u %lu \
500
%lu %lu %lu %lu %lu %ld %ld %ld %ld %d 0 %llu %lu %ld %lu %lu %lu %lu %lu \
501
%lu %lu %lu %lu %lu %lu %lu %lu %d %d %u %u %llu %lu %ld\n",
502
		pid_nr_ns(pid, ns),
L
Linus Torvalds 已提交
503 504 505 506 507 508 509 510 511 512 513 514
		tcomm,
		state,
		ppid,
		pgid,
		sid,
		tty_nr,
		tty_pgrp,
		task->flags,
		min_flt,
		cmin_flt,
		maj_flt,
		cmaj_flt,
515 516
		cputime_to_clock_t(utime),
		cputime_to_clock_t(stime),
L
Linus Torvalds 已提交
517 518 519 520 521 522 523
		cputime_to_clock_t(cutime),
		cputime_to_clock_t(cstime),
		priority,
		nice,
		num_threads,
		start_time,
		vsize,
524
		mm ? get_mm_rss(mm) : 0,
525
		rsslim,
L
Linus Torvalds 已提交
526 527 528 529 530 531 532 533 534 535 536 537 538 539 540 541 542 543 544
		mm ? mm->start_code : 0,
		mm ? mm->end_code : 0,
		mm ? mm->start_stack : 0,
		esp,
		eip,
		/* The signal information here is obsolete.
		 * It must be decimal for Linux 2.0 compatibility.
		 * Use /proc/#/status for real-time signals.
		 */
		task->pending.signal.sig[0] & 0x7fffffffUL,
		task->blocked.sig[0] & 0x7fffffffUL,
		sigign      .sig[0] & 0x7fffffffUL,
		sigcatch    .sig[0] & 0x7fffffffUL,
		wchan,
		0UL,
		0UL,
		task->exit_signal,
		task_cpu(task),
		task->rt_priority,
545
		task->policy,
546 547 548
		(unsigned long long)delayacct_blkio_ticks(task),
		cputime_to_clock_t(gtime),
		cputime_to_clock_t(cgtime));
549
	if (mm)
L
Linus Torvalds 已提交
550
		mmput(mm);
551
	return 0;
L
Linus Torvalds 已提交
552 553
}

554 555
/*
 * Emit the stat record for a single thread: do_task_stat() is called
 * with whole == 0, so only @task's own counters are reported.
 * Returns do_task_stat()'s result.
 */
int proc_tid_stat(struct seq_file *m, struct pid_namespace *ns,
			struct pid *pid, struct task_struct *task)
{
	const int whole = 0;	/* this thread only */

	return do_task_stat(m, ns, pid, task, whole);
}

560 561
/*
 * Emit the stat record for a whole thread group: do_task_stat() is
 * called with whole == 1, so counters are summed across the group.
 * Returns do_task_stat()'s result.
 */
int proc_tgid_stat(struct seq_file *m, struct pid_namespace *ns,
			struct pid *pid, struct task_struct *task)
{
	const int whole = 1;	/* aggregate over the thread group */

	return do_task_stat(m, ns, pid, task, whole);
}

566 567
/*
 * Emit the seven-field "statm" line for @task into seq_file @m:
 * size, resident, shared, text, lib, data and a trailing 0.
 *
 * The values come from task_statm() when the task has an mm; without
 * one every field is 0.  "lib" is never assigned here and is therefore
 * always printed as 0.  @ns and @pid are not used.
 *
 * Always returns 0.
 */
int proc_pid_statm(struct seq_file *m, struct pid_namespace *ns,
			struct pid *pid, struct task_struct *task)
{
	struct mm_struct *mm;
	int size = 0, resident = 0, shared = 0;
	int text = 0, lib = 0, data = 0;

	mm = get_task_mm(task);
	if (mm) {
		size = task_statm(mm, &shared, &text, &data, &resident);
		mmput(mm);
	}

	seq_printf(m, "%d %d %d %d %d %d %d\n",
			size, resident, shared, text, lib, data, 0);

	return 0;
}