nfsctl.c 39.0 KB
Newer Older
1
// SPDX-License-Identifier: GPL-2.0-only
L
Linus Torvalds 已提交
2 3 4 5 6 7
/*
 * Syscall interface to knfsd.
 *
 * Copyright (C) 1995, 1996 Olaf Kirch <okir@monad.swb.de>
 */

8
#include <linux/slab.h>
9
#include <linux/namei.h>
10
#include <linux/ctype.h>
11
#include <linux/fs_context.h>
L
Linus Torvalds 已提交
12

13
#include <linux/sunrpc/svcsock.h>
14
#include <linux/lockd/lockd.h>
15
#include <linux/sunrpc/addr.h>
16
#include <linux/sunrpc/gss_api.h>
17
#include <linux/sunrpc/gss_krb5_enctypes.h>
18
#include <linux/sunrpc/rpc_pipe_fs.h>
19
#include <linux/module.h>
20
#include <linux/fsnotify.h>
L
Linus Torvalds 已提交
21

22
#include "idmap.h"
23 24
#include "nfsd.h"
#include "cache.h"
25
#include "state.h"
26
#include "netns.h"
27
#include "pnfs.h"
28

L
Linus Torvalds 已提交
29
/*
 *	We have a single directory with several nodes in it.
 *
 *	Each constant below identifies one control file.  The write path
 *	looks a file's handler up in write_op[] by its inode number, so the
 *	values double as indices into that table.
 */
enum {
	NFSD_Root = 1,
	NFSD_List,
	NFSD_Export_features,
	NFSD_Fh,
	NFSD_FO_UnlockIP,
	NFSD_FO_UnlockFS,
	NFSD_Threads,
	NFSD_Pool_Threads,
	NFSD_Pool_Stats,
	NFSD_Reply_Cache_Stats,
	NFSD_Versions,
	NFSD_Ports,
	NFSD_MaxBlkSize,
	NFSD_MaxConnections,
	NFSD_SupportedEnctypes,
	/*
	 * The below MUST come last.  Otherwise we leave a hole in nfsd_files[]
	 * with !CONFIG_NFSD_V4 and simple_fill_super() goes oops
	 */
#ifdef CONFIG_NFSD_V4
	NFSD_Leasetime,
	NFSD_Gracetime,
	NFSD_RecoveryDir,
	NFSD_V4EndGrace,
#endif
	NFSD_MaxReserved
};

/*
 * write() for these nodes.
 *
 * Every handler receives the transaction buffer in @buf and the number
 * of bytes written by the caller in @size; they are dispatched through
 * the write_op[] table.
 */
static ssize_t write_filehandle(struct file *file, char *buf, size_t size);
static ssize_t write_unlock_ip(struct file *file, char *buf, size_t size);
static ssize_t write_unlock_fs(struct file *file, char *buf, size_t size);
static ssize_t write_threads(struct file *file, char *buf, size_t size);
static ssize_t write_pool_threads(struct file *file, char *buf, size_t size);
static ssize_t write_versions(struct file *file, char *buf, size_t size);
static ssize_t write_ports(struct file *file, char *buf, size_t size);
static ssize_t write_maxblksize(struct file *file, char *buf, size_t size);
static ssize_t write_maxconn(struct file *file, char *buf, size_t size);
#ifdef CONFIG_NFSD_V4
static ssize_t write_leasetime(struct file *file, char *buf, size_t size);
static ssize_t write_gracetime(struct file *file, char *buf, size_t size);
static ssize_t write_recoverydir(struct file *file, char *buf, size_t size);
static ssize_t write_v4_end_grace(struct file *file, char *buf, size_t size);
#endif
L
Linus Torvalds 已提交
79

E
Eric Biggers 已提交
80
static ssize_t (*const write_op[])(struct file *, char *, size_t) = {
L
Linus Torvalds 已提交
81
	[NFSD_Fh] = write_filehandle,
82 83
	[NFSD_FO_UnlockIP] = write_unlock_ip,
	[NFSD_FO_UnlockFS] = write_unlock_fs,
L
Linus Torvalds 已提交
84
	[NFSD_Threads] = write_threads,
85
	[NFSD_Pool_Threads] = write_pool_threads,
86
	[NFSD_Versions] = write_versions,
87
	[NFSD_Ports] = write_ports,
88
	[NFSD_MaxBlkSize] = write_maxblksize,
89
	[NFSD_MaxConnections] = write_maxconn,
90
#ifdef CONFIG_NFSD_V4
L
Linus Torvalds 已提交
91
	[NFSD_Leasetime] = write_leasetime,
92
	[NFSD_Gracetime] = write_gracetime,
93
	[NFSD_RecoveryDir] = write_recoverydir,
94
	[NFSD_V4EndGrace] = write_v4_end_grace,
95
#endif
L
Linus Torvalds 已提交
96 97 98 99
};

/*
 * write() for the transaction files.
 *
 * The handler is selected from write_op[] by the file's inode number;
 * -EINVAL is returned when the inode has no handler.  The request is
 * fetched with simple_transaction_get() and passed to the handler.  A
 * non-negative handler result is recorded with simple_transaction_set()
 * and the write then reports @size bytes consumed; a negative result is
 * returned to the caller unchanged.
 */
static ssize_t nfsctl_transaction_write(struct file *file, const char __user *buf, size_t size, loff_t *pos)
{
	ino_t ino = file_inode(file)->i_ino;
	char *data;
	ssize_t rv;

	if (ino >= ARRAY_SIZE(write_op) || !write_op[ino])
		return -EINVAL;

	data = simple_transaction_get(file, buf, size);
	if (IS_ERR(data))
		return PTR_ERR(data);

	rv = write_op[ino](file, data, size);
	if (rv >= 0) {
		simple_transaction_set(file, rv);
		rv = size;
	}
	return rv;
}

119 120 121 122 123 124 125 126 127 128 129 130 131 132
/*
 * read() for the transaction files.  When the file has no private_data
 * yet, a zero-length write is issued first so that the file can return
 * state information; the reply is then delivered by
 * simple_transaction_read().
 */
static ssize_t nfsctl_transaction_read(struct file *file, char __user *buf, size_t size, loff_t *pos)
{
	ssize_t status;

	if (file->private_data)
		return simple_transaction_read(file, buf, size, pos);

	/* Nothing written so far: run the handler with an empty request. */
	status = nfsctl_transaction_write(file, buf, 0, pos);
	if (status < 0)
		return status;

	return simple_transaction_read(file, buf, size, pos);
}

133
static const struct file_operations transaction_ops = {
L
Linus Torvalds 已提交
134
	.write		= nfsctl_transaction_write,
135
	.read		= nfsctl_transaction_read,
L
Linus Torvalds 已提交
136
	.release	= simple_transaction_release,
137
	.llseek		= default_llseek,
L
Linus Torvalds 已提交
138 139
};

140
static int exports_net_open(struct net *net, struct file *file)
L
Linus Torvalds 已提交
141
{
142 143
	int err;
	struct seq_file *seq;
144
	struct nfsd_net *nn = net_generic(net, nfsd_net_id);
145 146 147 148 149 150

	err = seq_open(file, &nfs_exports_op);
	if (err)
		return err;

	seq = file->private_data;
151
	seq->private = nn->svc_export_cache;
152
	return 0;
L
Linus Torvalds 已提交
153 154
}

155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173
/* open(): list the exports of the calling task's network namespace. */
static int exports_proc_open(struct inode *inode, struct file *file)
{
	struct net *net = current->nsproxy->net_ns;

	return exports_net_open(net, file);
}

/* seq_file based operations whose open() is exports_proc_open(). */
static const struct file_operations exports_proc_operations = {
	.release	= seq_release,
	.llseek		= seq_lseek,
	.read		= seq_read,
	.open		= exports_proc_open,
};

/* open(): list the exports of the namespace stored in the superblock. */
static int exports_nfsd_open(struct inode *inode, struct file *file)
{
	struct net *net = inode->i_sb->s_fs_info;

	return exports_net_open(net, file);
}

static const struct file_operations exports_nfsd_operations = {
	.open		= exports_nfsd_open,
L
Linus Torvalds 已提交
174 175 176 177 178
	.read		= seq_read,
	.llseek		= seq_lseek,
	.release	= seq_release,
};

179 180 181 182 183 184 185 186 187 188 189
/* Print NFSEXP_ALLFLAGS and NFSEXP_SECINFO_FLAGS as two hex words. */
static int export_features_show(struct seq_file *m, void *v)
{
	seq_printf(m, "0x%x 0x%x\n",
		   NFSEXP_ALLFLAGS,
		   NFSEXP_SECINFO_FLAGS);

	return 0;
}

/* open(): single-record seq_file rendered by export_features_show(). */
static int export_features_open(struct inode *inode, struct file *file)
{
	int status = single_open(file, export_features_show, NULL);

	return status;
}

190
static const struct file_operations export_features_operations = {
191 192 193 194 195 196
	.open		= export_features_open,
	.read		= seq_read,
	.llseek		= seq_lseek,
	.release	= single_release,
};

197
#if defined(CONFIG_SUNRPC_GSS) || defined(CONFIG_SUNRPC_GSS_MODULE)
198 199
static int supported_enctypes_show(struct seq_file *m, void *v)
{
200
	seq_printf(m, KRB5_SUPPORTED_ENCTYPES);
201 202 203 204 205 206 207 208
	return 0;
}

/* open(): single-record seq_file rendered by supported_enctypes_show(). */
static int supported_enctypes_open(struct inode *inode, struct file *file)
{
	int status = single_open(file, supported_enctypes_show, NULL);

	return status;
}

209
static const struct file_operations supported_enctypes_ops = {
210 211 212 213 214
	.open		= supported_enctypes_open,
	.read		= seq_read,
	.llseek		= seq_lseek,
	.release	= single_release,
};
215
#endif /* CONFIG_SUNRPC_GSS or CONFIG_SUNRPC_GSS_MODULE */
216

217
static const struct file_operations pool_stats_operations = {
218 219 220
	.open		= nfsd_pool_stats_open,
	.read		= seq_read,
	.llseek		= seq_lseek,
221
	.release	= nfsd_pool_stats_release,
222 223
};

224
static const struct file_operations reply_cache_stats_operations = {
225 226 227 228 229 230
	.open		= nfsd_reply_cache_stats_open,
	.read		= seq_read,
	.llseek		= seq_lseek,
	.release	= single_release,
};

L
Linus Torvalds 已提交
231 232 233 234 235
/*----------------------------------------------------------------------------*/
/*
 * payload - write methods
 */

A
Al Viro 已提交
236 237 238 239
static inline struct net *netns(struct file *file)
{
	return file_inode(file)->i_sb->s_fs_info;
}
L
Linus Torvalds 已提交
240

241 242 243 244 245 246 247
/**
 * write_unlock_ip - Release all locks used by a client
 *
 * Experimental.
 *
 * Input:
 *			buf:	'\n'-terminated C string containing a
248
 *				presentation format IP address
249 250 251 252 253 254
 *			size:	length of C string in @buf
 * Output:
 *	On success:	returns zero if all specified locks were released;
 *			returns one if one or more locks were not released
 *	On error:	return code is negative errno value
 */
255
static ssize_t write_unlock_ip(struct file *file, char *buf, size_t size)
256
{
257 258 259
	struct sockaddr_storage address;
	struct sockaddr *sap = (struct sockaddr *)&address;
	size_t salen = sizeof(address);
260
	char *fo_path;
A
Al Viro 已提交
261
	struct net *net = netns(file);
262 263 264 265 266 267 268 269 270 271 272 273

	/* sanity check */
	if (size == 0)
		return -EINVAL;

	if (buf[size-1] != '\n')
		return -EINVAL;

	fo_path = buf;
	if (qword_get(&buf, fo_path, size) < 0)
		return -EINVAL;

274
	if (rpc_pton(net, fo_path, size, sap, salen) == 0)
275 276
		return -EINVAL;

277
	return nlmsvc_unlock_all_by_ip(sap);
278 279
}

280 281 282 283 284 285 286 287 288 289 290 291 292 293
/**
 * write_unlock_fs - Release all locks on a local file system
 *
 * Experimental.
 *
 * Input:
 *			buf:	'\n'-terminated C string containing the
 *				absolute pathname of a local file system
 *			size:	length of C string in @buf
 * Output:
 *	On success:	returns zero if all specified locks were released;
 *			returns one if one or more locks were not released
 *	On error:	return code is negative errno value
 */
294
static ssize_t write_unlock_fs(struct file *file, char *buf, size_t size)
295
{
A
Al Viro 已提交
296
	struct path path;
297 298 299 300 301 302 303 304 305 306 307 308 309 310
	char *fo_path;
	int error;

	/* sanity check */
	if (size == 0)
		return -EINVAL;

	if (buf[size-1] != '\n')
		return -EINVAL;

	fo_path = buf;
	if (qword_get(&buf, fo_path, size) < 0)
		return -EINVAL;

A
Al Viro 已提交
311
	error = kern_path(fo_path, 0, &path);
312 313 314
	if (error)
		return error;

315 316 317 318 319 320 321 322 323
	/*
	 * XXX: Needs better sanity checking.  Otherwise we could end up
	 * releasing locks on the wrong file system.
	 *
	 * For example:
	 * 1.  Does the path refer to a directory?
	 * 2.  Is that directory a mount point, or
	 * 3.  Is that directory the root of an exported file system?
	 */
324
	error = nlmsvc_unlock_all_by_sb(path.dentry->d_sb);
325

A
Al Viro 已提交
326
	path_put(&path);
327 328 329
	return error;
}

330 331 332 333 334 335 336 337 338 339 340 341 342 343 344 345 346 347 348 349 350
/**
 * write_filehandle - Get a variable-length NFS file handle by path
 *
 * On input, the buffer contains a '\n'-terminated C string comprised of
 * three alphanumeric words separated by whitespace.  The string may
 * contain escape sequences.
 *
 * Input:
 *			buf:
 *				domain:		client domain name
 *				path:		export pathname
 *				maxsize:	numeric maximum size of
 *						@buf
 *			size:	length of C string in @buf
 * Output:
 *	On success:	passed-in buffer filled with '\n'-terminated C
 *			string containing a ASCII hex text version
 *			of the NFS file handle;
 *			return code is the size in bytes of the string
 *	On error:	return code is negative errno value
 */
L
Linus Torvalds 已提交
351 352 353
static ssize_t write_filehandle(struct file *file, char *buf, size_t size)
{
	char *dname, *path;
A
Andrew Morton 已提交
354
	int uninitialized_var(maxsize);
L
Linus Torvalds 已提交
355 356 357 358 359
	char *mesg = buf;
	int len;
	struct auth_domain *dom;
	struct knfsd_fh fh;

360 361 362
	if (size == 0)
		return -EINVAL;

L
Linus Torvalds 已提交
363 364 365 366 367 368
	if (buf[size-1] != '\n')
		return -EINVAL;
	buf[size-1] = 0;

	dname = mesg;
	len = qword_get(&mesg, dname, size);
369 370
	if (len <= 0)
		return -EINVAL;
L
Linus Torvalds 已提交
371 372 373
	
	path = dname+len+1;
	len = qword_get(&mesg, path, size);
374 375
	if (len <= 0)
		return -EINVAL;
L
Linus Torvalds 已提交
376 377 378 379 380 381 382

	len = get_int(&mesg, &maxsize);
	if (len)
		return len;

	if (maxsize < NFS_FHSIZE)
		return -EINVAL;
383
	maxsize = min(maxsize, NFS3_FHSIZE);
L
Linus Torvalds 已提交
384 385 386 387 388 389 390 391 392

	if (qword_get(&mesg, mesg, size)>0)
		return -EINVAL;

	/* we have all the words, they are in buf.. */
	dom = unix_domain_find(dname);
	if (!dom)
		return -ENOMEM;

A
Al Viro 已提交
393
	len = exp_rootfh(netns(file), dom, path, &fh,  maxsize);
L
Linus Torvalds 已提交
394 395 396 397
	auth_domain_put(dom);
	if (len)
		return len;
	
398 399
	mesg = buf;
	len = SIMPLE_TRANSACTION_LIMIT;
L
Linus Torvalds 已提交
400 401 402 403 404
	qword_addhex(&mesg, &len, (char*)&fh.fh_base, fh.fh_size);
	mesg[-1] = '\n';
	return mesg - buf;	
}

405 406 407 408 409 410 411 412 413 414 415 416 417 418 419 420 421 422 423 424 425 426 427 428 429 430 431 432
/**
 * write_threads - Start NFSD, or report the current number of running threads
 *
 * Input:
 *			buf:		ignored
 *			size:		zero
 * Output:
 *	On success:	passed-in buffer filled with '\n'-terminated C
 *			string numeric value representing the number of
 *			running NFSD threads;
 *			return code is the size in bytes of the string
 *	On error:	return code is zero
 *
 * OR
 *
 * Input:
 *			buf:		C string containing an unsigned
 *					integer value representing the
 *					number of NFSD threads to start
 *			size:		non-zero length of C string in @buf
 * Output:
 *	On success:	NFS service is started;
 *			passed-in buffer filled with '\n'-terminated C
 *			string numeric value representing the number of
 *			running NFSD threads;
 *			return code is the size in bytes of the string
 *	On error:	return code is zero or a negative errno value
 */
L
Linus Torvalds 已提交
433 434 435 436
static ssize_t write_threads(struct file *file, char *buf, size_t size)
{
	char *mesg = buf;
	int rv;
A
Al Viro 已提交
437
	struct net *net = netns(file);
438

L
Linus Torvalds 已提交
439 440 441 442 443
	if (size > 0) {
		int newthreads;
		rv = get_int(&mesg, &newthreads);
		if (rv)
			return rv;
444
		if (newthreads < 0)
L
Linus Torvalds 已提交
445
			return -EINVAL;
446
		rv = nfsd_svc(newthreads, net, file->f_cred);
447
		if (rv < 0)
L
Linus Torvalds 已提交
448
			return rv;
449
	} else
450
		rv = nfsd_nrthreads(net);
451

452
	return scnprintf(buf, SIMPLE_TRANSACTION_LIMIT, "%d\n", rv);
L
Linus Torvalds 已提交
453 454
}

455 456 457 458 459 460 461 462 463 464 465 466 467 468 469 470 471 472 473 474 475 476
/**
 * write_pool_threads - Set or report the current number of threads per pool
 *
 * Input:
 *			buf:		ignored
 *			size:		zero
 *
 * OR
 *
 * Input:
 * 			buf:		C string containing whitespace-
 * 					separated unsigned integer values
 *					representing the number of NFSD
 *					threads to start in each pool
 *			size:		non-zero length of C string in @buf
 * Output:
 *	On success:	passed-in buffer filled with '\n'-terminated C
 *			string containing integer values representing the
 *			number of NFSD threads in each pool;
 *			return code is the size in bytes of the string
 *	On error:	return code is zero or a negative errno value
 */
477 478 479 480 481 482 483 484 485
static ssize_t write_pool_threads(struct file *file, char *buf, size_t size)
{
	/* if size > 0, look for an array of number of threads per node
	 * and apply them  then write out number of threads per node as reply
	 */
	char *mesg = buf;
	int i;
	int rv;
	int len;
486
	int npools;
487
	int *nthreads;
A
Al Viro 已提交
488
	struct net *net = netns(file);
489

490
	mutex_lock(&nfsd_mutex);
491
	npools = nfsd_nrpools(net);
492 493 494 495 496 497
	if (npools == 0) {
		/*
		 * NFS is shut down.  The admin can start it by
		 * writing to the threads file but NOT the pool_threads
		 * file, sorry.  Report zero threads.
		 */
498
		mutex_unlock(&nfsd_mutex);
499 500 501 502 503
		strcpy(buf, "0\n");
		return strlen(buf);
	}

	nthreads = kcalloc(npools, sizeof(int), GFP_KERNEL);
504
	rv = -ENOMEM;
505
	if (nthreads == NULL)
506
		goto out_free;
507 508 509 510 511 512 513 514 515 516 517 518

	if (size > 0) {
		for (i = 0; i < npools; i++) {
			rv = get_int(&mesg, &nthreads[i]);
			if (rv == -ENOENT)
				break;		/* fewer numbers than pools */
			if (rv)
				goto out_free;	/* syntax error */
			rv = -EINVAL;
			if (nthreads[i] < 0)
				goto out_free;
		}
519
		rv = nfsd_set_nrthreads(i, nthreads, net);
520 521 522 523
		if (rv)
			goto out_free;
	}

524
	rv = nfsd_get_nrthreads(npools, nthreads, net);
525 526 527 528 529 530 531 532 533 534 535
	if (rv)
		goto out_free;

	mesg = buf;
	size = SIMPLE_TRANSACTION_LIMIT;
	for (i = 0; i < npools && size > 0; i++) {
		snprintf(mesg, size, "%d%c", nthreads[i], (i == npools-1 ? '\n' : ' '));
		len = strlen(mesg);
		size -= len;
		mesg += len;
	}
536
	rv = mesg - buf;
537 538
out_free:
	kfree(nthreads);
539
	mutex_unlock(&nfsd_mutex);
540 541 542
	return rv;
}

543
static ssize_t
544 545
nfsd_print_version_support(struct nfsd_net *nn, char *buf, int remaining,
		const char *sep, unsigned vers, int minor)
546
{
547
	const char *format = minor < 0 ? "%s%c%u" : "%s%c%u.%u";
548
	bool supported = !!nfsd_vers(nn, vers, NFSD_TEST);
549

550
	if (vers == 4 && minor >= 0 &&
551
	    !nfsd_minorversion(nn, minor, NFSD_TEST))
552
		supported = false;
553 554 555 556 557 558 559
	if (minor == 0 && supported)
		/*
		 * special case for backward compatability.
		 * +4.0 is never reported, it is implied by
		 * +4, unless -4.0 is present.
		 */
		return 0;
560 561 562 563
	return snprintf(buf, remaining, format, sep,
			supported ? '+' : '-', vers, minor);
}

564
/*
 * Worker for write_versions().  With a non-empty request, parse the
 * whitespace-separated "[+-]N[.M]" words in @buf and enable or disable
 * the named versions; this is refused with -EBUSY while nn->nfsd_serv
 * is set.  In all cases the current version state is then formatted
 * into @buf and its length returned.
 */
static ssize_t __write_versions(struct file *file, char *buf, size_t size)
{
	char *mesg = buf;
	char *vers, *minorp, sign;
	int len, num, remaining;
	ssize_t tlen = 0;
	char *sep;
	struct nfsd_net *nn = net_generic(netns(file), nfsd_net_id);

	if (size>0) {
		if (nn->nfsd_serv)
			/* Cannot change versions without updating
			 * nn->nfsd_serv->sv_xdrsize, and reallocing
			 * rq_argp and rq_resp
			 */
			return -EBUSY;
		if (buf[size-1] != '\n')
			return -EINVAL;
		buf[size-1] = 0;

		vers = mesg;
		len = qword_get(&mesg, vers, size);
		if (len <= 0) return -EINVAL;
		do {
			enum vers_op cmd;
			unsigned minor;
			sign = *vers;
			if (sign == '+' || sign == '-')
				num = simple_strtol((vers+1), &minorp, 0);
			else
				num = simple_strtol(vers, &minorp, 0);
			if (*minorp == '.') {
				/* Minor versions are only accepted for version 4. */
				if (num != 4)
					return -EINVAL;
				if (kstrtouint(minorp+1, 0, &minor) < 0)
					return -EINVAL;
			}

			cmd = sign == '-' ? NFSD_CLEAR : NFSD_SET;
			switch(num) {
			case 2:
			case 3:
				nfsd_vers(nn, num, cmd);
				break;
			case 4:
				if (*minorp == '.') {
					if (nfsd_minorversion(nn, minor, cmd) < 0)
						return -EINVAL;
				} else if ((cmd == NFSD_SET) != nfsd_vers(nn, num, NFSD_TEST)) {
					/*
					 * Either we have +4 and no minors are enabled,
					 * or we have -4 and at least one minor is enabled.
					 * In either case, propagate 'cmd' to all minors.
					 */
					minor = 0;
					while (nfsd_minorversion(nn, minor, cmd) >= 0)
						minor++;
				}
				break;
			default:
				return -EINVAL;
			}
			vers += len + 1;
		} while ((len = qword_get(&mesg, vers, size)) > 0);
		/* If all get turned off, turn them back on, as
		 * having no versions is BAD
		 */
		nfsd_reset_versions(nn);
	}

	/* Now write current state into reply buffer */
	len = 0;
	sep = "";
	remaining = SIMPLE_TRANSACTION_LIMIT;
	for (num=2 ; num <= 4 ; num++) {
		int minor;
		if (!nfsd_vers(nn, num, NFSD_AVAIL))
			continue;

		/* -1 prints the bare major version; minors follow for v4. */
		minor = -1;
		do {
			len = nfsd_print_version_support(nn, buf, remaining,
					sep, num, minor);
			if (len >= remaining)
				goto out;
			remaining -= len;
			buf += len;
			tlen += len;
			minor++;
			if (len)
				sep = " ";
		} while (num == 4 && minor <= NFSD_SUPPORTED_MINOR_VERSION);
	}
out:
	len = snprintf(buf, remaining, "\n");
	if (len >= remaining)
		return -EINVAL;
	return tlen + len;
}

664 665 666 667 668 669 670 671 672 673 674 675 676 677 678 679 680 681 682 683 684 685 686 687 688 689 690 691 692 693 694 695
/**
 * write_versions - Set or report the available NFS protocol versions
 *
 * Input:
 *			buf:		ignored
 *			size:		zero
 * Output:
 *	On success:	passed-in buffer filled with '\n'-terminated C
 *			string containing positive or negative integer
 *			values representing the current status of each
 *			protocol version;
 *			return code is the size in bytes of the string
 *	On error:	return code is zero or a negative errno value
 *
 * OR
 *
 * Input:
 * 			buf:		C string containing whitespace-
 * 					separated positive or negative
 * 					integer values representing NFS
 * 					protocol versions to enable ("+n")
 * 					or disable ("-n")
 *			size:		non-zero length of C string in @buf
 * Output:
 *	On success:	status of zero or more protocol versions has
 *			been updated; passed-in buffer filled with
 *			'\n'-terminated C string containing positive
 *			or negative integer values representing the
 *			current status of each protocol version;
 *			return code is the size in bytes of the string
 *	On error:	return code is zero or a negative errno value
 */
696 697 698 699 700 701 702 703 704 705
static ssize_t write_versions(struct file *file, char *buf, size_t size)
{
	ssize_t rv;

	mutex_lock(&nfsd_mutex);
	rv = __write_versions(file, buf, size);
	mutex_unlock(&nfsd_mutex);
	return rv;
}

706 707 708 709
/*
 * Zero-length write.  Return a list of NFSD's current listener
 * transports.
 */
710
static ssize_t __write_ports_names(char *buf, struct net *net)
711
{
712 713 714
	struct nfsd_net *nn = net_generic(net, nfsd_net_id);

	if (nn->nfsd_serv == NULL)
715
		return 0;
716
	return svc_xprt_names(nn->nfsd_serv, buf, SIMPLE_TRANSACTION_LIMIT);
717 718
}

719 720 721 722 723
/*
 * A single 'fd' number was written, in which case it must be for
 * a socket of a supported family/protocol, and we use it as an
 * nfsd listener.
 */
724
static ssize_t __write_ports_addfd(char *buf, struct net *net, const struct cred *cred)
725 726 727
{
	char *mesg = buf;
	int fd, err;
728
	struct nfsd_net *nn = net_generic(net, nfsd_net_id);
729 730 731 732 733

	err = get_int(&mesg, &fd);
	if (err != 0 || fd < 0)
		return -EINVAL;

734 735 736 737 738
	if (svc_alien_sock(net, fd)) {
		printk(KERN_ERR "%s: socket net is different to NFSd's one\n", __func__);
		return -EINVAL;
	}

739
	err = nfsd_create_serv(net);
740 741 742
	if (err != 0)
		return err;

743
	err = svc_addsock(nn->nfsd_serv, fd, buf, SIMPLE_TRANSACTION_LIMIT, cred);
744
	if (err < 0) {
745
		nfsd_destroy(net);
746 747
		return err;
	}
748

749
	/* Decrease the count, but don't shut down the service */
750
	nn->nfsd_serv->sv_nrthreads--;
751
	return err;
752 753
}

754 755 756 757
/*
 * A transport listener is added by writing it's transport name and
 * a port number.
 */
758
static ssize_t __write_ports_addxprt(char *buf, struct net *net, const struct cred *cred)
759 760
{
	char transport[16];
761
	struct svc_xprt *xprt;
762
	int port, err;
763
	struct nfsd_net *nn = net_generic(net, nfsd_net_id);
764

765
	if (sscanf(buf, "%15s %5u", transport, &port) != 2)
766 767
		return -EINVAL;

768
	if (port < 1 || port > USHRT_MAX)
769 770
		return -EINVAL;

771
	err = nfsd_create_serv(net);
772 773 774
	if (err != 0)
		return err;

775
	err = svc_create_xprt(nn->nfsd_serv, transport, net,
776
				PF_INET, port, SVC_SOCK_ANONYMOUS, cred);
777
	if (err < 0)
778 779
		goto out_err;

780
	err = svc_create_xprt(nn->nfsd_serv, transport, net,
781
				PF_INET6, port, SVC_SOCK_ANONYMOUS, cred);
782 783
	if (err < 0 && err != -EAFNOSUPPORT)
		goto out_close;
784 785

	/* Decrease the count, but don't shut down the service */
786
	nn->nfsd_serv->sv_nrthreads--;
787
	return 0;
788
out_close:
789
	xprt = svc_find_xprt(nn->nfsd_serv, transport, net, PF_INET, port);
790 791 792 793 794
	if (xprt != NULL) {
		svc_close_xprt(xprt);
		svc_xprt_put(xprt);
	}
out_err:
795
	nfsd_destroy(net);
796
	return err;
797 798
}

799 800
/*
 * Worker for write_ports().  An empty request lists the listeners, a
 * request starting with a digit adds a socket by file descriptor, and a
 * request starting with a letter adds a listener by transport name and
 * port.  Anything else is rejected with -EINVAL.
 */
static ssize_t __write_ports(struct file *file, char *buf, size_t size,
			     struct net *net)
{
	if (size == 0)
		return __write_ports_names(buf, net);

	if (isdigit(buf[0]))
		return __write_ports_addfd(buf, net, file->f_cred);

	if (isalpha(buf[0]))
		return __write_ports_addxprt(buf, net, file->f_cred);

	return -EINVAL;
}

814 815 816 817 818 819 820 821 822 823 824 825 826 827 828 829 830 831 832
/**
 * write_ports - Pass a socket file descriptor or transport name to listen on
 *
 * Input:
 *			buf:		ignored
 *			size:		zero
 * Output:
 *	On success:	passed-in buffer filled with a '\n'-terminated C
 *			string containing a whitespace-separated list of
 *			named NFSD listeners;
 *			return code is the size in bytes of the string
 *	On error:	return code is zero or a negative errno value
 *
 * OR
 *
 * Input:
 *			buf:		C string containing an unsigned
 *					integer value representing a bound
 *					but unconnected socket that is to be
833 834 835
 *					used as an NFSD listener; listen(3)
 *					must be called for a SOCK_STREAM
 *					socket, otherwise it is ignored
836 837 838 839 840 841 842 843 844 845 846 847 848 849 850 851 852 853 854 855 856
 *			size:		non-zero length of C string in @buf
 * Output:
 *	On success:	NFS service is started;
 *			passed-in buffer filled with a '\n'-terminated C
 *			string containing a unique alphanumeric name of
 *			the listener;
 *			return code is the size in bytes of the string
 *	On error:	return code is a negative errno value
 *
 * OR
 *
 * Input:
 *			buf:		C string containing a transport
 *					name and an unsigned integer value
 *					representing the port to listen on,
 *					separated by whitespace
 *			size:		non-zero length of C string in @buf
 * Output:
 *	On success:	returns zero; NFS service is started
 *	On error:	return code is a negative errno value
 */
857 858 859
static ssize_t write_ports(struct file *file, char *buf, size_t size)
{
	ssize_t rv;
860

861
	mutex_lock(&nfsd_mutex);
A
Al Viro 已提交
862
	rv = __write_ports(file, buf, size, netns(file));
863 864 865 866 867
	mutex_unlock(&nfsd_mutex);
	return rv;
}


868 869
/* Current NFS block size setting; reported and updated by write_maxblksize(). */
int nfsd_max_blksize;

870 871 872 873 874 875 876 877 878 879 880 881 882 883 884 885 886 887 888 889 890
/**
 * write_maxblksize - Set or report the current NFS blksize
 *
 * Input:
 *			buf:		ignored
 *			size:		zero
 *
 * OR
 *
 * Input:
 * 			buf:		C string containing an unsigned
 * 					integer value representing the new
 * 					NFS blksize
 *			size:		non-zero length of C string in @buf
 * Output:
 *	On success:	passed-in buffer filled with '\n'-terminated C string
 *			containing numeric value of the current NFS blksize
 *			setting;
 *			return code is the size in bytes of the string
 *	On error:	return code is zero or a negative errno value
 */
891 892 893
static ssize_t write_maxblksize(struct file *file, char *buf, size_t size)
{
	char *mesg = buf;
A
Al Viro 已提交
894
	struct nfsd_net *nn = net_generic(netns(file), nfsd_net_id);
895

896 897 898 899 900 901 902 903
	if (size > 0) {
		int bsize;
		int rv = get_int(&mesg, &bsize);
		if (rv)
			return rv;
		/* force bsize into allowed range and
		 * required alignment.
		 */
904 905
		bsize = max_t(int, bsize, 1024);
		bsize = min_t(int, bsize, NFSSVC_MAXBLKSIZE);
906
		bsize &= ~(1024-1);
907
		mutex_lock(&nfsd_mutex);
908
		if (nn->nfsd_serv) {
909
			mutex_unlock(&nfsd_mutex);
910 911 912
			return -EBUSY;
		}
		nfsd_max_blksize = bsize;
913
		mutex_unlock(&nfsd_mutex);
914
	}
915 916 917

	return scnprintf(buf, SIMPLE_TRANSACTION_LIMIT, "%d\n",
							nfsd_max_blksize);
918 919
}

920 921 922 923 924 925 926 927 928 929 930 931 932 933 934 935 936 937 938 939 940 941 942
/**
 * write_maxconn - Set or report the current max number of connections
 *
 * Input:
 *			buf:		ignored
 *			size:		zero
 * OR
 *
 * Input:
 *			buf:		C string containing an unsigned
 *					integer value representing the new
 *					number of max connections
 *			size:		non-zero length of C string in @buf
 * Output:
 *	On success:	passed-in buffer filled with '\n'-terminated C string
 *			containing numeric value of max_connections setting
 *			for this net namespace;
 *			return code is the size in bytes of the string
 *	On error:	return code is zero or a negative errno value
 */
static ssize_t write_maxconn(struct file *file, char *buf, size_t size)
{
	char *mesg = buf;
	struct nfsd_net *nn = net_generic(netns(file), nfsd_net_id);
	unsigned int maxconn = nn->max_connections;

	if (size > 0) {
		int rv = get_uint(&mesg, &maxconn);

		if (rv)
			return rv;
		nn->max_connections = maxconn;
	}

	return scnprintf(buf, SIMPLE_TRANSACTION_LIMIT, "%u\n", maxconn);
}

957
#ifdef CONFIG_NFSD_V4
958 959
/*
 * Set or report the time value at @time.  A non-empty request stores a
 * new value; it is refused with -EBUSY while nn->nfsd_serv is set and
 * with -EINVAL when the value lies outside 10..3600.  The current value
 * is then formatted into @buf and its length returned.
 */
static ssize_t __nfsd4_write_time(struct file *file, char *buf, size_t size,
				  time_t *time, struct nfsd_net *nn)
{
	char *mesg = buf;
	int rv, i;

	if (size > 0) {
		if (nn->nfsd_serv)
			return -EBUSY;
		rv = get_int(&mesg, &i);
		if (rv)
			return rv;
		/*
		 * Some sanity checking.  We don't have a reason for
		 * these particular numbers, but problems with the
		 * extremes are:
		 *	- Too short: the briefest network outage may
		 *	  cause clients to lose all their locks.  Also,
		 *	  the frequent polling may be wasteful.
		 *	- Too long: do you really want reboot recovery
		 *	  to take more than an hour?  Or to make other
		 *	  clients wait an hour before being able to
		 *	  revoke a dead client's locks?
		 */
		if (i < 10 || i > 3600)
			return -EINVAL;
		*time = i;
	}

	return scnprintf(buf, SIMPLE_TRANSACTION_LIMIT, "%ld\n", *time);
}

990 991
/* Run __nfsd4_write_time() with nfsd_mutex held. */
static ssize_t nfsd4_write_time(struct file *file, char *buf, size_t size,
				time_t *time, struct nfsd_net *nn)
{
	ssize_t rv;

	mutex_lock(&nfsd_mutex);
	rv = __nfsd4_write_time(file, buf, size, time, nn);
	mutex_unlock(&nfsd_mutex);
	return rv;
}

1001 1002 1003 1004 1005 1006 1007 1008 1009 1010 1011 1012 1013 1014 1015 1016 1017 1018 1019 1020 1021
/**
 * write_leasetime - Set or report the current NFSv4 lease time
 *
 * Input:
 *			buf:		ignored
 *			size:		zero
 *
 * OR
 *
 * Input:
 *			buf:		C string containing an unsigned
 *					integer value representing the new
 *					NFSv4 lease expiry time
 *			size:		non-zero length of C string in @buf
 * Output:
 *	On success:	passed-in buffer filled with '\n'-terminated C
 *			string containing unsigned integer value of the
 *			current lease expiry time;
 *			return code is the size in bytes of the string
 *	On error:	return code is zero or a negative errno value
 */
1022 1023
static ssize_t write_leasetime(struct file *file, char *buf, size_t size)
{
A
Al Viro 已提交
1024
	struct nfsd_net *nn = net_generic(netns(file), nfsd_net_id);
1025
	return nfsd4_write_time(file, buf, size, &nn->nfsd4_lease, nn);
1026 1027
}

1028 1029 1030 1031 1032 1033 1034 1035 1036 1037 1038 1039
/**
 * write_gracetime - Set or report current NFSv4 grace period time
 *
 * As above, but sets the time of the NFSv4 grace period.
 *
 * Note this should never be set to less than the *previous*
 * lease-period time, but we don't try to enforce this.  (In the common
 * case (a new boot), we don't know what the previous lease time was
 * anyway.)
 */
static ssize_t write_gracetime(struct file *file, char *buf, size_t size)
{
	struct nfsd_net *nn = net_generic(netns(file), nfsd_net_id);
	return nfsd4_write_time(file, buf, size, &nn->nfsd4_grace, nn);
}

1044 1045
/*
 * Worker for write_recoverydir(), which calls it with nfsd_mutex held.
 *
 * With a non-zero @size the first word of @buf becomes the new recovery
 * directory; in every successful case the current setting is then printed
 * back into @buf.
 */
static ssize_t __write_recoverydir(struct file *file, char *buf, size_t size,
				   struct nfsd_net *nn)
{
	char *cursor = buf;
	char *path;
	int n, err;

	if (size == 0)
		goto report;

	/* Refuse to change the directory while nn->nfsd_serv is set. */
	if (nn->nfsd_serv)
		return -EBUSY;
	if (size > PATH_MAX)
		return -EINVAL;
	if (buf[size-1] != '\n')
		return -EINVAL;
	buf[size-1] = 0;

	/* The decoded word is written over the start of the input buffer. */
	path = cursor;
	n = qword_get(&cursor, path, size);
	if (n <= 0)
		return -EINVAL;

	err = nfs4_reset_recoverydir(path);
	if (err)
		return err;

report:
	return scnprintf(buf, SIMPLE_TRANSACTION_LIMIT, "%s\n",
							nfs4_recoverydir());
}
1071

1072 1073 1074 1075 1076 1077 1078 1079 1080 1081 1082 1083 1084 1085 1086 1087 1088 1089 1090 1091 1092
/**
 * write_recoverydir - Set or report the pathname of the recovery directory
 *
 * Input:
 *			buf:		ignored
 *			size:		zero
 *
 * OR
 *
 * Input:
 *			buf:		C string containing the pathname
 *					of the directory on a local file
 *					system containing permanent NFSv4
 *					recovery data
 *			size:		non-zero length of C string in @buf
 * Output:
 *	On success:	passed-in buffer filled with '\n'-terminated C string
 *			containing the current recovery pathname setting;
 *			return code is the size in bytes of the string
 *	On error:	return code is zero or a negative errno value
 */
1093 1094 1095
static ssize_t write_recoverydir(struct file *file, char *buf, size_t size)
{
	ssize_t rv;
A
Al Viro 已提交
1096
	struct nfsd_net *nn = net_generic(netns(file), nfsd_net_id);
1097 1098

	mutex_lock(&nfsd_mutex);
1099
	rv = __write_recoverydir(file, buf, size, nn);
1100 1101 1102 1103
	mutex_unlock(&nfsd_mutex);
	return rv;
}

1104 1105 1106 1107 1108 1109 1110 1111 1112 1113 1114 1115 1116 1117 1118 1119 1120 1121 1122 1123 1124 1125
/**
 * write_v4_end_grace - release grace period for nfsd's v4.x lock manager
 *
 * Input (report only):
 *			buf:		ignored
 *			size:		zero
 *
 * Input (end grace, then report):
 *			buf:		C string whose first character is
 *					'Y', 'y' or '1'; any other first
 *					character is rejected with -EINVAL
 *			size:		non-zero length of C string in @buf
 * Output:
 *	On success:	passed-in buffer filled with "Y" or "N" followed by
 *			a newline, as a NUL-terminated C string, telling
 *			whether the grace period has ended in the current
 *			net namespace; return code is the size in bytes of
 *			the string
 *	On error:	-EINVAL for an unrecognised request, -EBUSY when
 *			nn->nfsd_serv is not set
 */
static ssize_t write_v4_end_grace(struct file *file, char *buf, size_t size)
{
	struct nfsd_net *nn = net_generic(netns(file), nfsd_net_id);

	if (size > 0) {
		char request = buf[0];

		if (request != 'Y' && request != 'y' && request != '1')
			return -EINVAL;
		if (!nn->nfsd_serv)
			return -EBUSY;
		nfsd4_end_grace(nn);
	}

	return scnprintf(buf, SIMPLE_TRANSACTION_LIMIT, "%c\n",
			 nn->grace_ended ? 'Y' : 'N');
}

1146
#endif
1147

L
Linus Torvalds 已提交
1148 1149 1150 1151 1152
/*----------------------------------------------------------------------------*/
/*
 *	populating the filesystem.
 */

1153 1154 1155 1156 1157 1158 1159 1160 1161 1162 1163 1164 1165 1166 1167 1168 1169 1170 1171 1172 1173 1174 1175 1176 1177 1178 1179 1180 1181 1182 1183 1184 1185 1186 1187 1188 1189 1190 1191 1192 1193 1194 1195 1196 1197 1198 1199 1200 1201 1202 1203 1204 1205 1206 1207 1208 1209 1210 1211
/*
 * Basically copying rpc_get_inode.
 *
 * Allocates a fresh inode on @sb with the given @mode; returns NULL if
 * new_inode() fails.
 */
static struct inode *nfsd_get_inode(struct super_block *sb, umode_t mode)
{
	struct inode *inode;

	inode = new_inode(sb);
	if (!inode)
		return NULL;

	/* Following advice from simple_fill_super documentation: */
	inode->i_ino = iunique(sb, NFSD_MaxReserved);
	inode->i_mode = mode;
	inode->i_atime = inode->i_mtime = inode->i_ctime = current_time(inode);

	/* Directories get the simple dir operations and an extra link. */
	if ((mode & S_IFMT) == S_IFDIR) {
		inode->i_fop = &simple_dir_operations;
		inode->i_op = &simple_dir_inode_operations;
		inc_nlink(inode);
	}

	return inode;
}

/*
 * Back @dentry with a newly allocated inode of the given @mode, bump the
 * link count of the parent @dir and send the mkdir notification.
 * Returns 0, or -ENOMEM when no inode could be allocated.
 */
static int __nfsd_mkdir(struct inode *dir, struct dentry *dentry, umode_t mode)
{
	struct inode *child = nfsd_get_inode(dir->i_sb, mode);

	if (!child)
		return -ENOMEM;

	d_add(dentry, child);
	inc_nlink(dir);
	fsnotify_mkdir(dir, dentry);

	return 0;
}

/*
 * Create directory @name (mode 0600) under @parent.
 *
 * When @ncl is non-NULL it is stored in the new directory inode's
 * i_private and an extra reference is taken on ncl->cl_ref.
 *
 * Runs with the parent inode locked.  Returns the new dentry, or an
 * ERR_PTR() on failure.
 */
static struct dentry *nfsd_mkdir(struct dentry *parent, struct nfsdfs_client *ncl, char *name)
{
	struct inode *dir = parent->d_inode;
	struct dentry *dentry;
	int ret = -ENOMEM;

	inode_lock(dir);
	dentry = d_alloc_name(parent, name);
	if (!dentry)
		goto out_err;
	ret = __nfsd_mkdir(dir, dentry, S_IFDIR | 0600);
	if (ret)
		goto out_put;
	if (ncl) {
		d_inode(dentry)->i_private = ncl;
		kref_get(&ncl->cl_ref);
	}
out:
	inode_unlock(dir);
	return dentry;
out_put:
	/* The dentry was allocated but never instantiated: drop it. */
	dput(dentry);
out_err:
	dentry = ERR_PTR(ret);
	goto out;
}

J
J. Bruce Fields 已提交
1212 1213 1214 1215 1216 1217 1218 1219 1220 1221
/*
 * Detach the nfsdfs_client stored in @inode->i_private and drop the
 * reference the inode held on it.  The pointer is cleared first and an
 * RCU grace period is waited out before the reference is put.
 */
static void clear_ncl(struct inode *inode)
{
	struct nfsdfs_client *client = inode->i_private;

	inode->i_private = NULL;
	synchronize_rcu();
	kref_put(&client->cl_ref, client->cl_release);
}


1222
static struct nfsdfs_client *__get_nfsdfs_client(struct inode *inode)
J
J. Bruce Fields 已提交
1223 1224 1225 1226 1227 1228 1229 1230 1231 1232 1233 1234 1235 1236 1237 1238 1239 1240 1241 1242 1243 1244 1245 1246 1247 1248 1249 1250 1251 1252 1253 1254 1255 1256 1257 1258 1259 1260 1261 1262 1263 1264 1265 1266 1267 1268 1269 1270 1271 1272 1273 1274 1275 1276 1277 1278 1279 1280 1281 1282 1283 1284 1285 1286 1287 1288 1289 1290 1291 1292 1293 1294 1295 1296 1297 1298 1299 1300 1301
{
	struct nfsdfs_client *nc = inode->i_private;

	if (nc)
		kref_get(&nc->cl_ref);
	return nc;
}

/*
 * Look up and reference the client attached to @inode inside an RCU
 * read-side critical section.  Returns NULL if no client is attached.
 */
struct nfsdfs_client *get_nfsdfs_client(struct inode *inode)
{
	struct nfsdfs_client *client;

	rcu_read_lock();
	client = __get_nfsdfs_client(inode);
	rcu_read_unlock();

	return client;
}
/*
 * from __rpc_unlink
 *
 * Detach the client from the file's inode, then unlink @dentry from @dir.
 * A temporary reference is held across the unlink and d_delete().
 */
static void nfsdfs_remove_file(struct inode *dir, struct dentry *dentry)
{
	int err;

	clear_ncl(d_inode(dentry));

	dget(dentry);
	err = simple_unlink(dir, dentry);
	d_delete(dentry);
	dput(dentry);

	WARN_ON_ONCE(err);
}

static void nfsdfs_remove_files(struct dentry *root)
{
	struct dentry *dentry, *tmp;

	list_for_each_entry_safe(dentry, tmp, &root->d_subdirs, d_child) {
		if (!simple_positive(dentry)) {
			WARN_ON_ONCE(1); /* I think this can't happen? */
			continue;
		}
		nfsdfs_remove_file(d_inode(root), dentry);
	}
}

/* XXX: cut'n'paste from simple_fill_super; figure out if we could share
 * code instead.
 *
 * Create one regular file under @root for each entry of @files, stopping
 * at the first entry whose name is NULL or empty.  Each new inode takes
 * its own reference on the client attached to the directory inode.
 *
 * Runs with the directory inode locked.  Returns 0 on success; on
 * allocation failure every child of @root is removed again and -ENOMEM
 * is returned.
 */
static  int nfsdfs_create_files(struct dentry *root,
					const struct tree_descr *files)
{
	struct inode *dir = d_inode(root);
	struct inode *inode;
	struct dentry *dentry;

	inode_lock(dir);
	/* The loop condition already guarantees a non-NULL, non-empty name. */
	for (; files->name && files->name[0]; files++) {
		dentry = d_alloc_name(root, files->name);
		if (!dentry)
			goto out;
		inode = nfsd_get_inode(dir->i_sb, S_IFREG | files->mode);
		if (!inode) {
			dput(dentry);
			goto out;
		}
		inode->i_fop = files->ops;
		inode->i_private = __get_nfsdfs_client(dir);
		d_add(dentry, inode);
		fsnotify_create(dir, dentry);
	}
	inode_unlock(dir);
	return 0;
out:
	nfsdfs_remove_files(root);
	inode_unlock(dir);
	return -ENOMEM;
}

1302
/* on success, returns positive number unique to that client. */
J
J. Bruce Fields 已提交
1303 1304 1305
struct dentry *nfsd_client_mkdir(struct nfsd_net *nn,
		struct nfsdfs_client *ncl, u32 id,
		const struct tree_descr *files)
1306
{
J
J. Bruce Fields 已提交
1307
	struct dentry *dentry;
1308
	char name[11];
J
J. Bruce Fields 已提交
1309
	int ret;
1310

1311
	sprintf(name, "%u", id);
1312

J
J. Bruce Fields 已提交
1313 1314 1315 1316 1317 1318 1319 1320 1321
	dentry = nfsd_mkdir(nn->nfsd_client_dir, ncl, name);
	if (IS_ERR(dentry)) /* XXX: tossing errors? */
		return NULL;
	ret = nfsdfs_create_files(dentry, files);
	if (ret) {
		nfsd_client_rmdir(dentry);
		return NULL;
	}
	return dentry;
1322 1323 1324 1325 1326 1327 1328 1329 1330
}

/*
 * Taken from __rpc_rmdir:
 *
 * Remove a client directory: delete the files inside it, detach the
 * client from the directory inode, then remove the directory itself.
 * Runs with the parent directory inode locked.
 */
void nfsd_client_rmdir(struct dentry *dentry)
{
	struct inode *dir = d_inode(dentry->d_parent);
	struct inode *inode = d_inode(dentry);
	int ret;

	inode_lock(dir);
	nfsdfs_remove_files(dentry);
	clear_ncl(inode);
	dget(dentry);
	ret = simple_rmdir(dir, dentry);
	WARN_ON_ONCE(ret);
	d_delete(dentry);
	/* Balance the dget() above, as nfsdfs_remove_file() does. */
	dput(dentry);
	inode_unlock(dir);
}

1341
static int nfsd_fill_super(struct super_block *sb, struct fs_context *fc)
L
Linus Torvalds 已提交
1342
{
1343 1344 1345 1346 1347
	struct nfsd_net *nn = net_generic(current->nsproxy->net_ns,
							nfsd_net_id);
	struct dentry *dentry;
	int ret;

1348
	static const struct tree_descr nfsd_files[] = {
1349
		[NFSD_List] = {"exports", &exports_nfsd_operations, S_IRUGO},
1350 1351
		[NFSD_Export_features] = {"export_features",
					&export_features_operations, S_IRUGO},
1352 1353
		[NFSD_FO_UnlockIP] = {"unlock_ip",
					&transaction_ops, S_IWUSR|S_IRUSR},
1354 1355
		[NFSD_FO_UnlockFS] = {"unlock_filesystem",
					&transaction_ops, S_IWUSR|S_IRUSR},
L
Linus Torvalds 已提交
1356 1357
		[NFSD_Fh] = {"filehandle", &transaction_ops, S_IWUSR|S_IRUSR},
		[NFSD_Threads] = {"threads", &transaction_ops, S_IWUSR|S_IRUSR},
1358
		[NFSD_Pool_Threads] = {"pool_threads", &transaction_ops, S_IWUSR|S_IRUSR},
1359
		[NFSD_Pool_Stats] = {"pool_stats", &pool_stats_operations, S_IRUGO},
1360
		[NFSD_Reply_Cache_Stats] = {"reply_cache_stats", &reply_cache_stats_operations, S_IRUGO},
1361
		[NFSD_Versions] = {"versions", &transaction_ops, S_IWUSR|S_IRUSR},
1362
		[NFSD_Ports] = {"portlist", &transaction_ops, S_IWUSR|S_IRUGO},
1363
		[NFSD_MaxBlkSize] = {"max_block_size", &transaction_ops, S_IWUSR|S_IRUGO},
1364
		[NFSD_MaxConnections] = {"max_connections", &transaction_ops, S_IWUSR|S_IRUGO},
1365
#if defined(CONFIG_SUNRPC_GSS) || defined(CONFIG_SUNRPC_GSS_MODULE)
1366
		[NFSD_SupportedEnctypes] = {"supported_krb5_enctypes", &supported_enctypes_ops, S_IRUGO},
1367
#endif /* CONFIG_SUNRPC_GSS or CONFIG_SUNRPC_GSS_MODULE */
L
Linus Torvalds 已提交
1368 1369
#ifdef CONFIG_NFSD_V4
		[NFSD_Leasetime] = {"nfsv4leasetime", &transaction_ops, S_IWUSR|S_IRUSR},
1370
		[NFSD_Gracetime] = {"nfsv4gracetime", &transaction_ops, S_IWUSR|S_IRUSR},
1371
		[NFSD_RecoveryDir] = {"nfsv4recoverydir", &transaction_ops, S_IWUSR|S_IRUSR},
1372
		[NFSD_V4EndGrace] = {"v4_end_grace", &transaction_ops, S_IWUSR|S_IRUGO},
L
Linus Torvalds 已提交
1373 1374 1375
#endif
		/* last one */ {""}
	};
1376

1377 1378 1379 1380 1381 1382 1383 1384
	ret = simple_fill_super(sb, 0x6e667364, nfsd_files);
	if (ret)
		return ret;
	dentry = nfsd_mkdir(sb->s_root, NULL, "clients");
	if (IS_ERR(dentry))
		return PTR_ERR(dentry);
	nn->nfsd_client_dir = dentry;
	return 0;
L
Linus Torvalds 已提交
1385
}
1386

1387 1388 1389 1390
/*
 * get_tree callback: take a reference on the context's network namespace,
 * store it in fc->s_fs_info, and obtain the superblock keyed on it.
 */
static int nfsd_fs_get_tree(struct fs_context *fc)
{
	struct net *net = get_net(fc->net_ns);

	fc->s_fs_info = net;
	return vfs_get_super(fc, vfs_get_keyed_super, nfsd_fill_super);
}

1393
static void nfsd_fs_free_fc(struct fs_context *fc)
L
Linus Torvalds 已提交
1394
{
1395 1396 1397 1398 1399 1400 1401 1402 1403 1404
	if (fc->s_fs_info)
		put_net(fc->s_fs_info);
}

/*
 * fs_context callbacks for the nfsd filesystem, installed by
 * nfsd_init_fs_context().
 */
static const struct fs_context_operations nfsd_fs_context_ops = {
	.free		= nfsd_fs_free_fc,
	.get_tree	= nfsd_fs_get_tree,
};

static int nfsd_init_fs_context(struct fs_context *fc)
L
Linus Torvalds 已提交
1405
{
1406 1407 1408 1409
	put_user_ns(fc->user_ns);
	fc->user_ns = get_user_ns(fc->net_ns->user_ns);
	fc->ops = &nfsd_fs_context_ops;
	return 0;
1410 1411 1412 1413 1414 1415 1416 1417
}

/*
 * kill_sb callback: tear down the superblock, then drop the network
 * namespace reference that was stored in sb->s_fs_info.
 */
static void nfsd_umount(struct super_block *sb)
{
	/* Read the pointer before the superblock is destroyed. */
	struct net *ns = sb->s_fs_info;

	kill_litter_super(sb);
	put_net(ns);
}

static struct file_system_type nfsd_fs_type = {
	.owner		= THIS_MODULE,
	.name		= "nfsd",
1423
	.init_fs_context = nfsd_init_fs_context,
1424
	.kill_sb	= nfsd_umount,
L
Linus Torvalds 已提交
1425
};
1426
MODULE_ALIAS_FS("nfsd");
L
Linus Torvalds 已提交
1427

1428 1429 1430 1431 1432 1433 1434 1435
#ifdef CONFIG_PROC_FS
/*
 * Create the "fs/nfs" proc directory and its "exports" entry.
 * Returns 0 on success or -ENOMEM; on failure nothing is left behind.
 */
static int create_proc_exports_entry(void)
{
	struct proc_dir_entry *dir, *exports;

	dir = proc_mkdir("fs/nfs", NULL);
	if (!dir)
		return -ENOMEM;

	exports = proc_create("exports", 0, dir, &exports_proc_operations);
	if (exports)
		return 0;

	/* Undo the directory creation when the entry cannot be made. */
	remove_proc_entry("fs/nfs", NULL);
	return -ENOMEM;
}
#else /* CONFIG_PROC_FS */
/* Without CONFIG_PROC_FS there is nothing to create. */
static int create_proc_exports_entry(void)
{
	return 0;
}
#endif

1451
/* Per-net id handed to net_generic(); registered through nfsd_net_ops.id. */
unsigned int nfsd_net_id;
1452 1453 1454 1455

static __net_init int nfsd_init_net(struct net *net)
{
	int retval;
1456
	struct vfsmount *mnt;
1457
	struct nfsd_net *nn = net_generic(net, nfsd_net_id);
1458 1459 1460 1461

	retval = nfsd_export_init(net);
	if (retval)
		goto out_export_error;
1462 1463 1464
	retval = nfsd_idmap_init(net);
	if (retval)
		goto out_idmap_error;
1465 1466
	nn->nfsd_versions = NULL;
	nn->nfsd4_minorversions = NULL;
J
J. Bruce Fields 已提交
1467 1468 1469
	retval = nfsd_reply_cache_init(nn);
	if (retval)
		goto out_drc_error;
1470 1471
	nn->nfsd4_lease = 90;	/* default lease time */
	nn->nfsd4_grace = 90;
1472
	nn->somebody_reclaimed = false;
1473
	nn->track_reclaim_completes = false;
1474
	nn->clverifier_counter = prandom_u32();
1475 1476
	nn->clientid_base = prandom_u32();
	nn->clientid_counter = nn->clientid_base + 1;
1477
	nn->s2s_cp_cl_id = nn->clientid_counter++;
1478 1479 1480

	atomic_set(&nn->ntf_refcnt, 0);
	init_waitqueue_head(&nn->ntf_wq);
1481 1482 1483 1484 1485 1486 1487

	mnt =  vfs_kern_mount(&nfsd_fs_type, SB_KERNMOUNT, "nfsd", NULL);
	if (IS_ERR(mnt)) {
		retval = PTR_ERR(mnt);
		goto out_mount_err;
	}
	nn->nfsd_mnt = mnt;
1488 1489
	return 0;

1490 1491
out_mount_err:
	nfsd_reply_cache_shutdown(nn);
J
J. Bruce Fields 已提交
1492 1493
out_drc_error:
	nfsd_idmap_shutdown(net);
1494 1495
out_idmap_error:
	nfsd_export_shutdown(net);
1496 1497 1498 1499 1500 1501
out_export_error:
	return retval;
}

static __net_exit void nfsd_exit_net(struct net *net)
{
J
J. Bruce Fields 已提交
1502 1503
	struct nfsd_net *nn = net_generic(net, nfsd_net_id);

1504
	mntput(nn->nfsd_mnt);
J
J. Bruce Fields 已提交
1505
	nfsd_reply_cache_shutdown(nn);
1506
	nfsd_idmap_shutdown(net);
1507
	nfsd_export_shutdown(net);
1508
	nfsd_netns_free_versions(net_generic(net, nfsd_net_id));
1509 1510
}

1511
static struct pernet_operations nfsd_net_ops = {
1512 1513
	.init = nfsd_init_net,
	.exit = nfsd_exit_net,
1514 1515 1516 1517
	.id   = &nfsd_net_id,
	.size = sizeof(struct nfsd_net),
};

L
Linus Torvalds 已提交
1518 1519 1520 1521 1522
/*
 * Module initialisation.  Each step that can fail jumps to the label that
 * unwinds exactly the steps completed before it, in reverse order.
 */
static int __init init_nfsd(void)
{
	int err;

	printk(KERN_INFO "Installing knfsd (copyright (C) 1996 okir@monad.swb.de).\n");

	err = register_pernet_subsys(&nfsd_net_ops);
	if (err < 0)
		return err;

	err = register_cld_notifier();
	if (err)
		goto out_unregister_pernet;

	err = nfsd4_init_slabs();
	if (err)
		goto out_unregister_notifier;

	err = nfsd4_init_pnfs();
	if (err)
		goto out_free_slabs;

	nfsd_fault_inject_init(); /* nfsd fault injection controls */
	nfsd_stat_init();	/* Statistics */
	nfsd_lockd_init();	/* lockd->nfsd callbacks */

	err = create_proc_exports_entry();
	if (err)
		goto out_free_lockd;

	err = register_filesystem(&nfsd_fs_type);
	if (err)
		goto out_free_all;

	return 0;

out_free_all:
	remove_proc_entry("fs/nfs/exports", NULL);
	remove_proc_entry("fs/nfs", NULL);
out_free_lockd:
	nfsd_lockd_shutdown();
	nfsd_stat_shutdown();
	nfsd_fault_inject_cleanup();
	nfsd4_exit_pnfs();
out_free_slabs:
	nfsd4_free_slabs();
out_unregister_notifier:
	unregister_cld_notifier();
out_unregister_pernet:
	unregister_pernet_subsys(&nfsd_net_ops);
	return err;
}

/*
 * Module exit: undo what init_nfsd() set up.  The proc entries go first;
 * the per-net operations are unregistered last.
 */
static void __exit exit_nfsd(void)
{
	/* /proc entries made by create_proc_exports_entry() */
	remove_proc_entry("fs/nfs/exports", NULL);
	remove_proc_entry("fs/nfs", NULL);

	nfsd_stat_shutdown();
	nfsd_lockd_shutdown();

	nfsd4_free_slabs();
	nfsd4_exit_pnfs();
	nfsd_fault_inject_cleanup();

	unregister_filesystem(&nfsd_fs_type);
	unregister_cld_notifier();
	unregister_pernet_subsys(&nfsd_net_ops);
}

/* Module metadata, plus the init and exit entry points defined above. */
MODULE_AUTHOR("Olaf Kirch <okir@monad.swb.de>");
MODULE_LICENSE("GPL");
module_init(init_nfsd)
module_exit(exit_nfsd)