generic.c 19.3 KB
Newer Older
L
Linus Torvalds 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14
/*
 * proc/fs/generic.c --- generic routines for the proc-fs
 *
 * This file contains generic proc-fs routines for handling
 * directories and files.
 * 
 * Copyright (C) 1991, 1992 Linus Torvalds.
 * Copyright (C) 1997 Theodore Ts'o
 */

#include <linux/errno.h>
#include <linux/time.h>
#include <linux/proc_fs.h>
#include <linux/stat.h>
C
Christoph Hellwig 已提交
15
#include <linux/mm.h>
L
Linus Torvalds 已提交
16
#include <linux/module.h>
17
#include <linux/slab.h>
A
Andrew Morton 已提交
18
#include <linux/printk.h>
L
Linus Torvalds 已提交
19 20 21 22 23
#include <linux/mount.h>
#include <linux/init.h>
#include <linux/idr.h>
#include <linux/namei.h>
#include <linux/bitops.h>
24
#include <linux/spinlock.h>
25
#include <linux/completion.h>
L
Linus Torvalds 已提交
26 27
#include <asm/uaccess.h>

28 29
#include "internal.h"

30 31
DEFINE_SPINLOCK(proc_subdir_lock);

32
static int proc_match(unsigned int len, const char *name, struct proc_dir_entry *de)
L
Linus Torvalds 已提交
33 34 35 36 37 38 39 40 41 42
{
	if (de->namelen != len)
		return 0;
	return !memcmp(name, de->name, len);
}

/* buffer size is one page but our output routines use some slack for overruns */
#define PROC_BLOCK_SIZE	(PAGE_SIZE - 1024)

static ssize_t
43
__proc_file_read(struct file *file, char __user *buf, size_t nbytes,
L
Linus Torvalds 已提交
44 45
	       loff_t *ppos)
{
A
Al Viro 已提交
46
	struct inode * inode = file_inode(file);
L
Linus Torvalds 已提交
47 48 49 50 51 52
	char 	*page;
	ssize_t	retval=0;
	int	eof=0;
	ssize_t	n, count;
	char	*start;
	struct proc_dir_entry * dp;
L
Linus Torvalds 已提交
53 54 55 56 57 58 59 60 61 62 63 64
	unsigned long long pos;

	/*
	 * Gaah, please just use "seq_file" instead. The legacy /proc
	 * interfaces cut loff_t down to off_t for reads, and ignore
	 * the offset entirely for writes..
	 */
	pos = *ppos;
	if (pos > MAX_NON_LFS)
		return 0;
	if (nbytes > MAX_NON_LFS - pos)
		nbytes = MAX_NON_LFS - pos;
L
Linus Torvalds 已提交
65 66

	dp = PDE(inode);
67
	if (!(page = (char*) __get_free_page(GFP_TEMPORARY)))
L
Linus Torvalds 已提交
68 69 70 71 72 73
		return -ENOMEM;

	while ((nbytes > 0) && !eof) {
		count = min_t(size_t, PROC_BLOCK_SIZE, nbytes);

		start = NULL;
74
		if (!dp->read_proc)
L
Linus Torvalds 已提交
75 76
			break;

77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122
		/* How to be a proc read function
		 * ------------------------------
		 * Prototype:
		 *    int f(char *buffer, char **start, off_t offset,
		 *          int count, int *peof, void *dat)
		 *
		 * Assume that the buffer is "count" bytes in size.
		 *
		 * If you know you have supplied all the data you have, set
		 * *peof.
		 *
		 * You have three ways to return data:
		 *
		 * 0) Leave *start = NULL.  (This is the default.)  Put the
		 *    data of the requested offset at that offset within the
		 *    buffer.  Return the number (n) of bytes there are from
		 *    the beginning of the buffer up to the last byte of data.
		 *    If the number of supplied bytes (= n - offset) is greater
		 *    than zero and you didn't signal eof and the reader is
		 *    prepared to take more data you will be called again with
		 *    the requested offset advanced by the number of bytes
		 *    absorbed.  This interface is useful for files no larger
		 *    than the buffer.
		 *
		 * 1) Set *start = an unsigned long value less than the buffer
		 *    address but greater than zero.  Put the data of the
		 *    requested offset at the beginning of the buffer.  Return
		 *    the number of bytes of data placed there.  If this number
		 *    is greater than zero and you didn't signal eof and the
		 *    reader is prepared to take more data you will be called
		 *    again with the requested offset advanced by *start.  This
		 *    interface is useful when you have a large file consisting
		 *    of a series of blocks which you want to count and return
		 *    as wholes.
		 *    (Hack by Paul.Russell@rustcorp.com.au)
		 *
		 * 2) Set *start = an address within the buffer.  Put the data
		 *    of the requested offset at *start.  Return the number of
		 *    bytes of data placed there.  If this number is greater
		 *    than zero and you didn't signal eof and the reader is
		 *    prepared to take more data you will be called again with
		 *    the requested offset advanced by the number of bytes
		 *    absorbed.
		 */
		n = dp->read_proc(page, &start, *ppos, count, &eof, dp->data);

L
Linus Torvalds 已提交
123 124 125 126 127 128 129 130 131
		if (n == 0)   /* end of file */
			break;
		if (n < 0) {  /* error */
			if (retval == 0)
				retval = n;
			break;
		}

		if (start == NULL) {
A
Andrew Morton 已提交
132
			if (n > PAGE_SIZE)	/* Apparent buffer overflow */
L
Linus Torvalds 已提交
133 134 135 136 137 138 139 140
				n = PAGE_SIZE;
			n -= *ppos;
			if (n <= 0)
				break;
			if (n > count)
				n = count;
			start = page + *ppos;
		} else if (start < page) {
A
Andrew Morton 已提交
141
			if (n > PAGE_SIZE)	/* Apparent buffer overflow */
L
Linus Torvalds 已提交
142 143 144 145 146 147
				n = PAGE_SIZE;
			if (n > count) {
				/*
				 * Don't reduce n because doing so might
				 * cut off part of a data block.
				 */
A
Andrew Morton 已提交
148
				pr_warn("proc_file_read: count exceeded\n");
L
Linus Torvalds 已提交
149 150 151
			}
		} else /* start >= page */ {
			unsigned long startoff = (unsigned long)(start - page);
A
Andrew Morton 已提交
152
			if (n > (PAGE_SIZE - startoff))	/* buffer overflow? */
L
Linus Torvalds 已提交
153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173
				n = PAGE_SIZE - startoff;
			if (n > count)
				n = count;
		}
		
 		n -= copy_to_user(buf, start < page ? page : start, n);
		if (n == 0) {
			if (retval == 0)
				retval = -EFAULT;
			break;
		}

		*ppos += start < page ? (unsigned long)start : n;
		nbytes -= n;
		buf += n;
		retval += n;
	}
	free_page((unsigned long) page);
	return retval;
}

174 175 176 177
static ssize_t
proc_file_read(struct file *file, char __user *buf, size_t nbytes,
	       loff_t *ppos)
{
A
Al Viro 已提交
178
	struct proc_dir_entry *pde = PDE(file_inode(file));
179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194
	ssize_t rv = -EIO;

	spin_lock(&pde->pde_unload_lock);
	if (!pde->proc_fops) {
		spin_unlock(&pde->pde_unload_lock);
		return rv;
	}
	pde->pde_users++;
	spin_unlock(&pde->pde_unload_lock);

	rv = __proc_file_read(file, buf, nbytes, ppos);

	pde_users_dec(pde);
	return rv;
}

L
Linus Torvalds 已提交
195 196 197
static loff_t
proc_file_lseek(struct file *file, loff_t offset, int orig)
{
L
Linus Torvalds 已提交
198 199 200 201 202 203 204 205 206 207 208
	loff_t retval = -EINVAL;
	switch (orig) {
	case 1:
		offset += file->f_pos;
	/* fallthrough */
	case 0:
		if (offset < 0 || offset > MAX_NON_LFS)
			break;
		file->f_pos = retval = offset;
	}
	return retval;
L
Linus Torvalds 已提交
209 210
}

211 212 213 214 215
static const struct file_operations proc_file_operations = {
	.llseek		= proc_file_lseek,
	.read		= proc_file_read,
};

L
Linus Torvalds 已提交
216 217 218 219 220 221 222 223
static int proc_notify_change(struct dentry *dentry, struct iattr *iattr)
{
	struct inode *inode = dentry->d_inode;
	struct proc_dir_entry *de = PDE(inode);
	int error;

	error = inode_change_ok(inode, iattr);
	if (error)
C
Christoph Hellwig 已提交
224
		return error;
L
Linus Torvalds 已提交
225

C
Christoph Hellwig 已提交
226 227
	setattr_copy(inode, iattr);
	mark_inode_dirty(inode);
M
Marco Stornelli 已提交
228

L
Linus Torvalds 已提交
229 230 231
	de->uid = inode->i_uid;
	de->gid = inode->i_gid;
	de->mode = inode->i_mode;
C
Christoph Hellwig 已提交
232
	return 0;
L
Linus Torvalds 已提交
233 234
}

M
Miklos Szeredi 已提交
235 236 237 238 239 240
static int proc_getattr(struct vfsmount *mnt, struct dentry *dentry,
			struct kstat *stat)
{
	struct inode *inode = dentry->d_inode;
	struct proc_dir_entry *de = PROC_I(inode)->pde;
	if (de && de->nlink)
M
Miklos Szeredi 已提交
241
		set_nlink(inode, de->nlink);
M
Miklos Szeredi 已提交
242 243 244 245 246

	generic_fillattr(inode, stat);
	return 0;
}

247
static const struct inode_operations proc_file_inode_operations = {
L
Linus Torvalds 已提交
248 249 250 251 252 253 254 255
	.setattr	= proc_notify_change,
};

/*
 * This function parses a name such as "tty/driver/serial", and
 * returns the struct proc_dir_entry for "/proc/tty/driver", and
 * returns "serial" in residual.
 */
256 257
static int __xlate_proc_name(const char *name, struct proc_dir_entry **ret,
			     const char **residual)
L
Linus Torvalds 已提交
258 259 260
{
	const char     		*cp = name, *next;
	struct proc_dir_entry	*de;
261
	unsigned int		len;
L
Linus Torvalds 已提交
262

263 264 265 266
	de = *ret;
	if (!de)
		de = &proc_root;

L
Linus Torvalds 已提交
267 268 269 270 271 272 273 274 275 276
	while (1) {
		next = strchr(cp, '/');
		if (!next)
			break;

		len = next - cp;
		for (de = de->subdir; de ; de = de->next) {
			if (proc_match(len, cp, de))
				break;
		}
277 278
		if (!de) {
			WARN(1, "name '%s'\n", name);
279
			return -ENOENT;
280
		}
L
Linus Torvalds 已提交
281 282 283 284
		cp += len + 1;
	}
	*residual = cp;
	*ret = de;
285 286 287 288 289 290 291 292 293 294
	return 0;
}

static int xlate_proc_name(const char *name, struct proc_dir_entry **ret,
			   const char **residual)
{
	int rv;

	spin_lock(&proc_subdir_lock);
	rv = __xlate_proc_name(name, ret, residual);
295
	spin_unlock(&proc_subdir_lock);
296
	return rv;
L
Linus Torvalds 已提交
297 298
}

299
static DEFINE_IDA(proc_inum_ida);
L
Linus Torvalds 已提交
300 301
static DEFINE_SPINLOCK(proc_inum_lock); /* protects the above */

302
#define PROC_DYNAMIC_FIRST 0xF0000000U
L
Linus Torvalds 已提交
303 304 305 306 307

/*
 * Return an inode number between PROC_DYNAMIC_FIRST and
 * 0xffffffff, or zero on failure.
 */
308
int proc_alloc_inum(unsigned int *inum)
L
Linus Torvalds 已提交
309
{
310
	unsigned int i;
L
Linus Torvalds 已提交
311 312 313
	int error;

retry:
314 315
	if (!ida_pre_get(&proc_inum_ida, GFP_KERNEL))
		return -ENOMEM;
L
Linus Torvalds 已提交
316

317
	spin_lock_irq(&proc_inum_lock);
318
	error = ida_get_new(&proc_inum_ida, &i);
319
	spin_unlock_irq(&proc_inum_lock);
L
Linus Torvalds 已提交
320 321 322
	if (error == -EAGAIN)
		goto retry;
	else if (error)
323
		return error;
L
Linus Torvalds 已提交
324

325
	if (i > UINT_MAX - PROC_DYNAMIC_FIRST) {
326
		spin_lock_irq(&proc_inum_lock);
327
		ida_remove(&proc_inum_ida, i);
328
		spin_unlock_irq(&proc_inum_lock);
329
		return -ENOSPC;
330
	}
331 332
	*inum = PROC_DYNAMIC_FIRST + i;
	return 0;
L
Linus Torvalds 已提交
333 334
}

335
void proc_free_inum(unsigned int inum)
L
Linus Torvalds 已提交
336
{
337 338
	unsigned long flags;
	spin_lock_irqsave(&proc_inum_lock, flags);
339
	ida_remove(&proc_inum_ida, inum - PROC_DYNAMIC_FIRST);
340
	spin_unlock_irqrestore(&proc_inum_lock, flags);
L
Linus Torvalds 已提交
341 342
}

343
static void *proc_follow_link(struct dentry *dentry, struct nameidata *nd)
L
Linus Torvalds 已提交
344
{
A
Al Viro 已提交
345
	nd_set_link(nd, PDE_DATA(dentry->d_inode));
346
	return NULL;
L
Linus Torvalds 已提交
347 348
}

349
static const struct inode_operations proc_link_inode_operations = {
L
Linus Torvalds 已提交
350 351 352 353 354 355 356 357 358 359
	.readlink	= generic_readlink,
	.follow_link	= proc_follow_link,
};

/*
 * As some entries in /proc are volatile, we want to 
 * get rid of unused dentries.  This could be made 
 * smarter: we could keep a "volatile" flag in the 
 * inode to indicate which ones to keep.
 */
N
Nick Piggin 已提交
360
static int proc_delete_dentry(const struct dentry * dentry)
L
Linus Torvalds 已提交
361 362 363 364
{
	return 1;
}

A
Al Viro 已提交
365
static const struct dentry_operations proc_dentry_operations =
L
Linus Torvalds 已提交
366 367 368 369 370 371 372 373
{
	.d_delete	= proc_delete_dentry,
};

/*
 * Don't create negative dentries here, return -ENOENT by hand
 * instead.
 */
374 375
struct dentry *proc_lookup_de(struct proc_dir_entry *de, struct inode *dir,
		struct dentry *dentry)
L
Linus Torvalds 已提交
376
{
377
	struct inode *inode;
L
Linus Torvalds 已提交
378

379
	spin_lock(&proc_subdir_lock);
380 381 382 383
	for (de = de->subdir; de ; de = de->next) {
		if (de->namelen != dentry->d_name.len)
			continue;
		if (!memcmp(dentry->d_name.name, de->name, de->namelen)) {
384
			pde_get(de);
385
			spin_unlock(&proc_subdir_lock);
A
Alexey Dobriyan 已提交
386
			inode = proc_get_inode(dir->i_sb, de);
387 388 389 390 391
			if (!inode)
				return ERR_PTR(-ENOMEM);
			d_set_d_op(dentry, &proc_dentry_operations);
			d_add(dentry, inode);
			return NULL;
L
Linus Torvalds 已提交
392 393
		}
	}
394
	spin_unlock(&proc_subdir_lock);
395
	return ERR_PTR(-ENOENT);
L
Linus Torvalds 已提交
396 397
}

398
struct dentry *proc_lookup(struct inode *dir, struct dentry *dentry,
A
Al Viro 已提交
399
		unsigned int flags)
400 401 402 403
{
	return proc_lookup_de(PDE(dir), dir, dentry);
}

L
Linus Torvalds 已提交
404 405 406 407 408 409 410 411 412
/*
 * This returns non-zero if at EOF, so that the /proc
 * root directory can use this and check if it should
 * continue with the <pid> entries..
 *
 * Note that the VFS-layer doesn't care about the return
 * value of the readdir() call, as long as it's non-negative
 * for success..
 */
413 414
int proc_readdir_de(struct proc_dir_entry *de, struct file *filp, void *dirent,
		filldir_t filldir)
L
Linus Torvalds 已提交
415 416 417
{
	unsigned int ino;
	int i;
A
Al Viro 已提交
418
	struct inode *inode = file_inode(filp);
L
Linus Torvalds 已提交
419 420 421 422 423 424 425 426 427 428 429 430 431
	int ret = 0;

	ino = inode->i_ino;
	i = filp->f_pos;
	switch (i) {
		case 0:
			if (filldir(dirent, ".", 1, i, ino, DT_DIR) < 0)
				goto out;
			i++;
			filp->f_pos++;
			/* fall through */
		case 1:
			if (filldir(dirent, "..", 2, i,
432
				    parent_ino(filp->f_path.dentry),
L
Linus Torvalds 已提交
433 434 435 436 437 438
				    DT_DIR) < 0)
				goto out;
			i++;
			filp->f_pos++;
			/* fall through */
		default:
439
			spin_lock(&proc_subdir_lock);
L
Linus Torvalds 已提交
440 441 442 443 444
			de = de->subdir;
			i -= 2;
			for (;;) {
				if (!de) {
					ret = 1;
445
					spin_unlock(&proc_subdir_lock);
L
Linus Torvalds 已提交
446 447 448 449 450 451 452 453 454
					goto out;
				}
				if (!i)
					break;
				de = de->next;
				i--;
			}

			do {
455 456
				struct proc_dir_entry *next;

457
				/* filldir passes info to user space */
458
				pde_get(de);
459
				spin_unlock(&proc_subdir_lock);
L
Linus Torvalds 已提交
460
				if (filldir(dirent, de->name, de->namelen, filp->f_pos,
461
					    de->low_ino, de->mode >> 12) < 0) {
462
					pde_put(de);
L
Linus Torvalds 已提交
463
					goto out;
464
				}
465
				spin_lock(&proc_subdir_lock);
L
Linus Torvalds 已提交
466
				filp->f_pos++;
467
				next = de->next;
468
				pde_put(de);
469
				de = next;
L
Linus Torvalds 已提交
470
			} while (de);
471
			spin_unlock(&proc_subdir_lock);
L
Linus Torvalds 已提交
472 473
	}
	ret = 1;
A
Alexey Dobriyan 已提交
474
out:
L
Linus Torvalds 已提交
475 476 477
	return ret;	
}

478 479
int proc_readdir(struct file *filp, void *dirent, filldir_t filldir)
{
A
Al Viro 已提交
480
	struct inode *inode = file_inode(filp);
481 482 483 484

	return proc_readdir_de(PDE(inode), filp, dirent, filldir);
}

L
Linus Torvalds 已提交
485 486 487 488 489
/*
 * These are the generic /proc directory operations. They
 * use the in-memory "struct proc_dir_entry" tree to parse
 * the /proc directory.
 */
490
static const struct file_operations proc_dir_operations = {
A
Alexey Dobriyan 已提交
491
	.llseek			= generic_file_llseek,
L
Linus Torvalds 已提交
492 493 494 495 496 497 498
	.read			= generic_read_dir,
	.readdir		= proc_readdir,
};

/*
 * proc directories can do almost nothing..
 */
499
static const struct inode_operations proc_dir_inode_operations = {
L
Linus Torvalds 已提交
500
	.lookup		= proc_lookup,
M
Miklos Szeredi 已提交
501
	.getattr	= proc_getattr,
L
Linus Torvalds 已提交
502 503 504 505 506
	.setattr	= proc_notify_change,
};

static int proc_register(struct proc_dir_entry * dir, struct proc_dir_entry * dp)
{
507
	struct proc_dir_entry *tmp;
508
	int ret;
L
Linus Torvalds 已提交
509
	
510 511 512
	ret = proc_alloc_inum(&dp->low_ino);
	if (ret)
		return ret;
513

L
Linus Torvalds 已提交
514
	if (S_ISDIR(dp->mode)) {
515 516
		dp->proc_fops = &proc_dir_operations;
		dp->proc_iops = &proc_dir_inode_operations;
L
Linus Torvalds 已提交
517 518
		dir->nlink++;
	} else if (S_ISLNK(dp->mode)) {
519
		dp->proc_iops = &proc_link_inode_operations;
L
Linus Torvalds 已提交
520 521 522
	} else if (S_ISREG(dp->mode)) {
		if (dp->proc_fops == NULL)
			dp->proc_fops = &proc_file_operations;
523 524 525 526
		dp->proc_iops = &proc_file_inode_operations;
	} else {
		WARN_ON(1);
		return -EINVAL;
L
Linus Torvalds 已提交
527
	}
C
Changli Gao 已提交
528 529

	spin_lock(&proc_subdir_lock);
530 531 532

	for (tmp = dir->subdir; tmp; tmp = tmp->next)
		if (strcmp(tmp->name, dp->name) == 0) {
A
Andrew Morton 已提交
533
			WARN(1, "proc_dir_entry '%s/%s' already registered\n",
534
				dir->name, dp->name);
535 536 537
			break;
		}

C
Changli Gao 已提交
538 539 540 541 542
	dp->next = dir->subdir;
	dp->parent = dir;
	dir->subdir = dp;
	spin_unlock(&proc_subdir_lock);

L
Linus Torvalds 已提交
543 544 545
	return 0;
}

546
static struct proc_dir_entry *__proc_create(struct proc_dir_entry **parent,
L
Linus Torvalds 已提交
547
					  const char *name,
A
Al Viro 已提交
548
					  umode_t mode,
L
Linus Torvalds 已提交
549 550 551 552
					  nlink_t nlink)
{
	struct proc_dir_entry *ent = NULL;
	const char *fn = name;
553
	unsigned int len;
L
Linus Torvalds 已提交
554 555

	/* make sure name is valid */
556 557
	if (!name || !strlen(name))
		goto out;
L
Linus Torvalds 已提交
558

559
	if (xlate_proc_name(name, parent, &fn) != 0)
L
Linus Torvalds 已提交
560 561 562 563 564 565 566 567
		goto out;

	/* At this point there must not be any '/' characters beyond *fn */
	if (strchr(fn, '/'))
		goto out;

	len = strlen(fn);

568 569 570
	ent = kzalloc(sizeof(struct proc_dir_entry) + len + 1, GFP_KERNEL);
	if (!ent)
		goto out;
L
Linus Torvalds 已提交
571

572
	memcpy(ent->name, fn, len + 1);
L
Linus Torvalds 已提交
573 574 575
	ent->namelen = len;
	ent->mode = mode;
	ent->nlink = nlink;
576
	atomic_set(&ent->count, 1);
577
	spin_lock_init(&ent->pde_unload_lock);
A
Alexey Dobriyan 已提交
578
	INIT_LIST_HEAD(&ent->pde_openers);
579
out:
L
Linus Torvalds 已提交
580 581 582 583 584 585 586 587
	return ent;
}

struct proc_dir_entry *proc_symlink(const char *name,
		struct proc_dir_entry *parent, const char *dest)
{
	struct proc_dir_entry *ent;

588
	ent = __proc_create(&parent, name,
L
Linus Torvalds 已提交
589 590 591 592 593 594 595 596 597 598 599 600 601 602 603 604 605 606
			  (S_IFLNK | S_IRUGO | S_IWUGO | S_IXUGO),1);

	if (ent) {
		ent->data = kmalloc((ent->size=strlen(dest))+1, GFP_KERNEL);
		if (ent->data) {
			strcpy((char*)ent->data,dest);
			if (proc_register(parent, ent) < 0) {
				kfree(ent->data);
				kfree(ent);
				ent = NULL;
			}
		} else {
			kfree(ent);
			ent = NULL;
		}
	}
	return ent;
}
H
Helight.Xu 已提交
607
EXPORT_SYMBOL(proc_symlink);
L
Linus Torvalds 已提交
608

A
Al Viro 已提交
609
struct proc_dir_entry *proc_mkdir_mode(const char *name, umode_t mode,
L
Linus Torvalds 已提交
610 611 612 613
		struct proc_dir_entry *parent)
{
	struct proc_dir_entry *ent;

614
	ent = __proc_create(&parent, name, S_IFDIR | mode, 2);
L
Linus Torvalds 已提交
615 616 617 618 619 620 621 622
	if (ent) {
		if (proc_register(parent, ent) < 0) {
			kfree(ent);
			ent = NULL;
		}
	}
	return ent;
}
623
EXPORT_SYMBOL(proc_mkdir_mode);
L
Linus Torvalds 已提交
624

625 626 627 628 629 630 631 632 633 634 635 636 637 638 639 640 641
struct proc_dir_entry *proc_net_mkdir(struct net *net, const char *name,
		struct proc_dir_entry *parent)
{
	struct proc_dir_entry *ent;

	ent = __proc_create(&parent, name, S_IFDIR | S_IRUGO | S_IXUGO, 2);
	if (ent) {
		ent->data = net;
		if (proc_register(parent, ent) < 0) {
			kfree(ent);
			ent = NULL;
		}
	}
	return ent;
}
EXPORT_SYMBOL_GPL(proc_net_mkdir);

L
Linus Torvalds 已提交
642 643 644 645 646
struct proc_dir_entry *proc_mkdir(const char *name,
		struct proc_dir_entry *parent)
{
	return proc_mkdir_mode(name, S_IRUGO | S_IXUGO, parent);
}
H
Helight.Xu 已提交
647
EXPORT_SYMBOL(proc_mkdir);
L
Linus Torvalds 已提交
648

D
David Howells 已提交
649 650 651
struct proc_dir_entry *create_proc_read_entry(
	const char *name, umode_t mode, struct proc_dir_entry *parent, 
	read_proc_t *read_proc, void *data)
L
Linus Torvalds 已提交
652 653 654
{
	struct proc_dir_entry *ent;

655 656 657 658 659 660
	if ((mode & S_IFMT) == 0)
		mode |= S_IFREG;

	if (!S_ISREG(mode)) {
		WARN_ON(1);	/* use proc_mkdir(), damnit */
		return NULL;
L
Linus Torvalds 已提交
661 662
	}

663 664 665 666
	if ((mode & S_IALLUGO) == 0)
		mode |= S_IRUGO;

	ent = __proc_create(&parent, name, mode, 1);
L
Linus Torvalds 已提交
667
	if (ent) {
D
David Howells 已提交
668 669
		ent->read_proc = read_proc;
		ent->data = data;
L
Linus Torvalds 已提交
670 671 672 673 674 675 676
		if (proc_register(parent, ent) < 0) {
			kfree(ent);
			ent = NULL;
		}
	}
	return ent;
}
D
David Howells 已提交
677
EXPORT_SYMBOL(create_proc_read_entry);
L
Linus Torvalds 已提交
678

A
Al Viro 已提交
679
struct proc_dir_entry *proc_create_data(const char *name, umode_t mode,
680 681 682
					struct proc_dir_entry *parent,
					const struct file_operations *proc_fops,
					void *data)
683 684
{
	struct proc_dir_entry *pde;
685 686
	if ((mode & S_IFMT) == 0)
		mode |= S_IFREG;
687

688 689 690
	if (!S_ISREG(mode)) {
		WARN_ON(1);	/* use proc_mkdir() */
		return NULL;
691 692
	}

693 694 695
	if ((mode & S_IALLUGO) == 0)
		mode |= S_IRUGO;
	pde = __proc_create(&parent, name, mode, 1);
696 697 698
	if (!pde)
		goto out;
	pde->proc_fops = proc_fops;
699
	pde->data = data;
700 701 702 703 704 705 706 707
	if (proc_register(parent, pde) < 0)
		goto out_free;
	return pde;
out_free:
	kfree(pde);
out:
	return NULL;
}
H
Helight.Xu 已提交
708
EXPORT_SYMBOL(proc_create_data);
709

710
static void free_proc_entry(struct proc_dir_entry *de)
L
Linus Torvalds 已提交
711
{
712
	proc_free_inum(de->low_ino);
L
Linus Torvalds 已提交
713

714
	if (S_ISLNK(de->mode))
L
Linus Torvalds 已提交
715 716 717 718
		kfree(de->data);
	kfree(de);
}

719 720 721 722 723 724
void pde_put(struct proc_dir_entry *pde)
{
	if (atomic_dec_and_test(&pde->count))
		free_proc_entry(pde);
}

A
Al Viro 已提交
725
static void entry_rundown(struct proc_dir_entry *de)
L
Linus Torvalds 已提交
726
{
727 728 729 730 731 732 733 734 735 736 737 738
	spin_lock(&de->pde_unload_lock);
	/*
	 * Stop accepting new callers into module. If you're
	 * dynamically allocating ->proc_fops, save a pointer somewhere.
	 */
	de->proc_fops = NULL;
	/* Wait until all existing callers into module are done. */
	if (de->pde_users > 0) {
		DECLARE_COMPLETION_ONSTACK(c);

		if (!de->pde_unload_completion)
			de->pde_unload_completion = &c;
739 740 741

		spin_unlock(&de->pde_unload_lock);

742 743
		wait_for_completion(de->pde_unload_completion);

744
		spin_lock(&de->pde_unload_lock);
745 746
	}

A
Alexey Dobriyan 已提交
747 748 749 750 751 752 753 754 755 756 757
	while (!list_empty(&de->pde_openers)) {
		struct pde_opener *pdeo;

		pdeo = list_first_entry(&de->pde_openers, struct pde_opener, lh);
		list_del(&pdeo->lh);
		spin_unlock(&de->pde_unload_lock);
		pdeo->release(pdeo->inode, pdeo->file);
		kfree(pdeo);
		spin_lock(&de->pde_unload_lock);
	}
	spin_unlock(&de->pde_unload_lock);
A
Al Viro 已提交
758 759 760 761 762 763 764 765 766 767 768 769 770 771 772 773 774 775 776 777 778 779 780 781 782 783 784 785 786 787 788 789 790 791
}

/*
 * Remove a /proc entry and free it if it's not currently in use.
 */
void remove_proc_entry(const char *name, struct proc_dir_entry *parent)
{
	struct proc_dir_entry **p;
	struct proc_dir_entry *de = NULL;
	const char *fn = name;
	unsigned int len;

	spin_lock(&proc_subdir_lock);
	if (__xlate_proc_name(name, &parent, &fn) != 0) {
		spin_unlock(&proc_subdir_lock);
		return;
	}
	len = strlen(fn);

	for (p = &parent->subdir; *p; p=&(*p)->next ) {
		if (proc_match(len, fn, *p)) {
			de = *p;
			*p = de->next;
			de->next = NULL;
			break;
		}
	}
	spin_unlock(&proc_subdir_lock);
	if (!de) {
		WARN(1, "name '%s'\n", name);
		return;
	}

	entry_rundown(de);
A
Alexey Dobriyan 已提交
792

793 794 795
	if (S_ISDIR(de->mode))
		parent->nlink--;
	de->nlink = 0;
A
Andrew Morton 已提交
796 797 798
	WARN(de->subdir, "%s: removing non-empty directory "
			 "'%s/%s', leaking at least '%s'\n", __func__,
			 de->parent->name, de->name, de->subdir->name);
799
	pde_put(de);
L
Linus Torvalds 已提交
800
}
H
Helight.Xu 已提交
801
EXPORT_SYMBOL(remove_proc_entry);
A
Al Viro 已提交
802 803 804 805 806 807 808 809 810 811 812 813 814 815 816 817 818 819 820 821 822 823 824 825 826 827 828 829 830 831 832 833 834 835 836 837 838 839 840 841 842 843 844 845 846 847 848 849 850 851 852 853 854 855

int remove_proc_subtree(const char *name, struct proc_dir_entry *parent)
{
	struct proc_dir_entry **p;
	struct proc_dir_entry *root = NULL, *de, *next;
	const char *fn = name;
	unsigned int len;

	spin_lock(&proc_subdir_lock);
	if (__xlate_proc_name(name, &parent, &fn) != 0) {
		spin_unlock(&proc_subdir_lock);
		return -ENOENT;
	}
	len = strlen(fn);

	for (p = &parent->subdir; *p; p=&(*p)->next ) {
		if (proc_match(len, fn, *p)) {
			root = *p;
			*p = root->next;
			root->next = NULL;
			break;
		}
	}
	if (!root) {
		spin_unlock(&proc_subdir_lock);
		return -ENOENT;
	}
	de = root;
	while (1) {
		next = de->subdir;
		if (next) {
			de->subdir = next->next;
			next->next = NULL;
			de = next;
			continue;
		}
		spin_unlock(&proc_subdir_lock);

		entry_rundown(de);
		next = de->parent;
		if (S_ISDIR(de->mode))
			next->nlink--;
		de->nlink = 0;
		if (de == root)
			break;
		pde_put(de);

		spin_lock(&proc_subdir_lock);
		de = next;
	}
	pde_put(root);
	return 0;
}
EXPORT_SYMBOL(remove_proc_subtree);