// SPDX-License-Identifier: GPL-2.0-only
/*
 * Syscall interface to knfsd.
 *
 * Copyright (C) 1995, 1996 Olaf Kirch <okir@monad.swb.de>
 */

8
#include <linux/slab.h>
9
#include <linux/namei.h>
10
#include <linux/ctype.h>
11
#include <linux/fs_context.h>
L
Linus Torvalds 已提交
12

13
#include <linux/sunrpc/svcsock.h>
14
#include <linux/lockd/lockd.h>
15
#include <linux/sunrpc/addr.h>
16
#include <linux/sunrpc/gss_api.h>
17
#include <linux/sunrpc/gss_krb5_enctypes.h>
18
#include <linux/sunrpc/rpc_pipe_fs.h>
19
#include <linux/module.h>
20
#include <linux/fsnotify.h>
L
Linus Torvalds 已提交
21

22
#include "idmap.h"
23 24
#include "nfsd.h"
#include "cache.h"
25
#include "state.h"
26
#include "netns.h"
27
#include "pnfs.h"
28

L
Linus Torvalds 已提交
29
/*
 *	We have a single directory with several nodes in it.
 *
 *	Each value below is also the inode number of its node:
 *	nfsctl_transaction_write() indexes write_op[] by i_ino.
 */
enum {
	NFSD_Root = 1,
	NFSD_List,
	NFSD_Export_Stats,
	NFSD_Export_features,
	NFSD_Fh,
	NFSD_FO_UnlockIP,
	NFSD_FO_UnlockFS,
	NFSD_Threads,
	NFSD_Pool_Threads,
	NFSD_Pool_Stats,
	NFSD_Reply_Cache_Stats,
	NFSD_Versions,
	NFSD_Ports,
	NFSD_MaxBlkSize,
	NFSD_MaxConnections,
	NFSD_SupportedEnctypes,
	/*
	 * The below MUST come last.  Otherwise we leave a hole in nfsd_files[]
	 * with !CONFIG_NFSD_V4 and simple_fill_super() goes oops
	 */
#ifdef CONFIG_NFSD_V4
	NFSD_Leasetime,
	NFSD_Gracetime,
	NFSD_RecoveryDir,
	NFSD_V4EndGrace,
#endif
	NFSD_MaxReserved
};

/*
 * write() for these nodes.
 *
 * Every handler receives the transaction buffer in @buf together with
 * the number of bytes the caller wrote in @size, and returns either a
 * negative errno or the length of the reply it left in @buf.
 */
static ssize_t write_filehandle(struct file *file, char *buf, size_t size);
static ssize_t write_unlock_ip(struct file *file, char *buf, size_t size);
static ssize_t write_unlock_fs(struct file *file, char *buf, size_t size);
static ssize_t write_threads(struct file *file, char *buf, size_t size);
static ssize_t write_pool_threads(struct file *file, char *buf, size_t size);
static ssize_t write_versions(struct file *file, char *buf, size_t size);
static ssize_t write_ports(struct file *file, char *buf, size_t size);
static ssize_t write_maxblksize(struct file *file, char *buf, size_t size);
static ssize_t write_maxconn(struct file *file, char *buf, size_t size);
#ifdef CONFIG_NFSD_V4
static ssize_t write_leasetime(struct file *file, char *buf, size_t size);
static ssize_t write_gracetime(struct file *file, char *buf, size_t size);
static ssize_t write_recoverydir(struct file *file, char *buf, size_t size);
static ssize_t write_v4_end_grace(struct file *file, char *buf, size_t size);
#endif
L
Linus Torvalds 已提交
80

E
Eric Biggers 已提交
81
/*
 * Write handlers, indexed by node id (which is the node's inode number).
 * Slots without an initializer stay NULL; nfsctl_transaction_write()
 * rejects those with -EINVAL.
 */
static ssize_t (*const write_op[])(struct file *, char *, size_t) = {
	[NFSD_Fh] = write_filehandle,
	[NFSD_FO_UnlockIP] = write_unlock_ip,
	[NFSD_FO_UnlockFS] = write_unlock_fs,
	[NFSD_Threads] = write_threads,
	[NFSD_Pool_Threads] = write_pool_threads,
	[NFSD_Versions] = write_versions,
	[NFSD_Ports] = write_ports,
	[NFSD_MaxBlkSize] = write_maxblksize,
	[NFSD_MaxConnections] = write_maxconn,
#ifdef CONFIG_NFSD_V4
	[NFSD_Leasetime] = write_leasetime,
	[NFSD_Gracetime] = write_gracetime,
	[NFSD_RecoveryDir] = write_recoverydir,
	[NFSD_V4EndGrace] = write_v4_end_grace,
#endif
};

/*
 * nfsctl_transaction_write - dispatch a write to the per-node handler
 *
 * The handler is selected by the inode number of @file.  The user data
 * is copied into the transaction buffer with simple_transaction_get()
 * and handed to the handler, whose non-negative return value is recorded
 * with simple_transaction_set() as the length of the reply.
 *
 * Returns @size on success (the whole write is reported as consumed),
 * -EINVAL if the node has no write handler, or the negative errno
 * produced by simple_transaction_get() or by the handler.
 */
static ssize_t nfsctl_transaction_write(struct file *file, const char __user *buf, size_t size, loff_t *pos)
{
	ino_t ino =  file_inode(file)->i_ino;
	char *data;
	ssize_t rv;

	if (ino >= ARRAY_SIZE(write_op) || !write_op[ino])
		return -EINVAL;

	data = simple_transaction_get(file, buf, size);
	if (IS_ERR(data))
		return PTR_ERR(data);

	rv =  write_op[ino](file, data, size);
	if (rv >= 0) {
		/* rv is the reply length; the caller still sees a full write */
		simple_transaction_set(file, rv);
		rv = size;
	}
	return rv;
}

120 121 122 123 124 125 126 127 128 129 130 131 132 133
/*
 * nfsctl_transaction_read - read the reply of a transaction file
 *
 * If nothing has been written to @file yet (no private_data), a
 * zero-length write is issued first so that the node's handler fills in
 * its current state; the reply is then returned through
 * simple_transaction_read().
 */
static ssize_t nfsctl_transaction_read(struct file *file, char __user *buf, size_t size, loff_t *pos)
{
	ssize_t primed;

	if (file->private_data)
		return simple_transaction_read(file, buf, size, pos);

	/*
	 * Reading without a preceding write: perform a 0-byte write so
	 * the file can report state information.
	 */
	primed = nfsctl_transaction_write(file, buf, 0, pos);
	if (primed < 0)
		return primed;

	return simple_transaction_read(file, buf, size, pos);
}

134
static const struct file_operations transaction_ops = {
L
Linus Torvalds 已提交
135
	.write		= nfsctl_transaction_write,
136
	.read		= nfsctl_transaction_read,
L
Linus Torvalds 已提交
137
	.release	= simple_transaction_release,
138
	.llseek		= default_llseek,
L
Linus Torvalds 已提交
139 140
};

141
static int exports_net_open(struct net *net, struct file *file)
L
Linus Torvalds 已提交
142
{
143 144
	int err;
	struct seq_file *seq;
145
	struct nfsd_net *nn = net_generic(net, nfsd_net_id);
146 147 148 149 150 151

	err = seq_open(file, &nfs_exports_op);
	if (err)
		return err;

	seq = file->private_data;
152
	seq->private = nn->svc_export_cache;
153
	return 0;
L
Linus Torvalds 已提交
154 155
}

156 157 158 159 160
/* procfs open: list the exports of the calling task's network namespace. */
static int exports_proc_open(struct inode *inode, struct file *file)
{
	struct net *net = current->nsproxy->net_ns;

	return exports_net_open(net, file);
}

161 162 163 164 165
/* procfs operations for the exports listing (seq_file based). */
static const struct proc_ops exports_proc_ops = {
	.proc_open	= exports_proc_open,
	.proc_read	= seq_read,
	.proc_lseek	= seq_lseek,
	.proc_release	= seq_release,
};

/*
 * nfsd filesystem open: list the exports of the network namespace stored
 * in the superblock's s_fs_info.
 */
static int exports_nfsd_open(struct inode *inode, struct file *file)
{
	struct net *net = inode->i_sb->s_fs_info;

	return exports_net_open(net, file);
}

static const struct file_operations exports_nfsd_operations = {
	.open		= exports_nfsd_open,
L
Linus Torvalds 已提交
175 176 177 178 179
	.read		= seq_read,
	.llseek		= seq_lseek,
	.release	= seq_release,
};

180 181 182 183 184 185 186 187 188 189 190
/*
 * Emit one line with two hex words: NFSEXP_ALLFLAGS followed by
 * NFSEXP_SECINFO_FLAGS.
 */
static int export_features_show(struct seq_file *m, void *v)
{
	seq_printf(m, "0x%x 0x%x\n",
		   NFSEXP_ALLFLAGS,
		   NFSEXP_SECINFO_FLAGS);

	return 0;
}

/* Open the export_features node as a single-record seq_file. */
static int export_features_open(struct inode *inode, struct file *file)
{
	int err;

	/* The show routine needs no private data, hence NULL. */
	err = single_open(file, export_features_show, NULL);
	return err;
}

191
static const struct file_operations export_features_operations = {
192 193 194 195 196 197
	.open		= export_features_open,
	.read		= seq_read,
	.llseek		= seq_lseek,
	.release	= single_release,
};

198
#if defined(CONFIG_SUNRPC_GSS) || defined(CONFIG_SUNRPC_GSS_MODULE)
199 200
static int supported_enctypes_show(struct seq_file *m, void *v)
{
201
	seq_printf(m, KRB5_SUPPORTED_ENCTYPES);
202 203 204 205 206 207 208 209
	return 0;
}

/* Open the supported-enctypes node as a single-record seq_file. */
static int supported_enctypes_open(struct inode *inode, struct file *file)
{
	int err;

	/* The show routine needs no private data, hence NULL. */
	err = single_open(file, supported_enctypes_show, NULL);
	return err;
}

210
static const struct file_operations supported_enctypes_ops = {
211 212 213 214 215
	.open		= supported_enctypes_open,
	.read		= seq_read,
	.llseek		= seq_lseek,
	.release	= single_release,
};
216
#endif /* CONFIG_SUNRPC_GSS or CONFIG_SUNRPC_GSS_MODULE */
217

218
static const struct file_operations pool_stats_operations = {
219 220 221
	.open		= nfsd_pool_stats_open,
	.read		= seq_read,
	.llseek		= seq_lseek,
222
	.release	= nfsd_pool_stats_release,
223 224
};

225
static const struct file_operations reply_cache_stats_operations = {
226 227 228 229 230 231
	.open		= nfsd_reply_cache_stats_open,
	.read		= seq_read,
	.llseek		= seq_lseek,
	.release	= single_release,
};

L
Linus Torvalds 已提交
232 233 234 235 236
/*----------------------------------------------------------------------------*/
/*
 * payload - write methods
 */

A
Al Viro 已提交
237 238 239 240
static inline struct net *netns(struct file *file)
{
	return file_inode(file)->i_sb->s_fs_info;
}
L
Linus Torvalds 已提交
241

242
/*
243 244 245 246 247 248
 * write_unlock_ip - Release all locks used by a client
 *
 * Experimental.
 *
 * Input:
 *			buf:	'\n'-terminated C string containing a
249
 *				presentation format IP address
250 251 252 253 254 255
 *			size:	length of C string in @buf
 * Output:
 *	On success:	returns zero if all specified locks were released;
 *			returns one if one or more locks were not released
 *	On error:	return code is negative errno value
 */
256
static ssize_t write_unlock_ip(struct file *file, char *buf, size_t size)
257
{
258 259 260
	struct sockaddr_storage address;
	struct sockaddr *sap = (struct sockaddr *)&address;
	size_t salen = sizeof(address);
261
	char *fo_path;
A
Al Viro 已提交
262
	struct net *net = netns(file);
263 264 265 266 267 268 269 270 271 272 273 274

	/* sanity check */
	if (size == 0)
		return -EINVAL;

	if (buf[size-1] != '\n')
		return -EINVAL;

	fo_path = buf;
	if (qword_get(&buf, fo_path, size) < 0)
		return -EINVAL;

275
	if (rpc_pton(net, fo_path, size, sap, salen) == 0)
276 277
		return -EINVAL;

278
	return nlmsvc_unlock_all_by_ip(sap);
279 280
}

281
/*
282 283 284 285 286 287 288 289 290 291 292 293 294
 * write_unlock_fs - Release all locks on a local file system
 *
 * Experimental.
 *
 * Input:
 *			buf:	'\n'-terminated C string containing the
 *				absolute pathname of a local file system
 *			size:	length of C string in @buf
 * Output:
 *	On success:	returns zero if all specified locks were released;
 *			returns one if one or more locks were not released
 *	On error:	return code is negative errno value
 */
295
static ssize_t write_unlock_fs(struct file *file, char *buf, size_t size)
296
{
A
Al Viro 已提交
297
	struct path path;
298 299 300 301 302 303 304 305 306 307 308 309 310 311
	char *fo_path;
	int error;

	/* sanity check */
	if (size == 0)
		return -EINVAL;

	if (buf[size-1] != '\n')
		return -EINVAL;

	fo_path = buf;
	if (qword_get(&buf, fo_path, size) < 0)
		return -EINVAL;

A
Al Viro 已提交
312
	error = kern_path(fo_path, 0, &path);
313 314 315
	if (error)
		return error;

316 317 318 319 320 321 322 323 324
	/*
	 * XXX: Needs better sanity checking.  Otherwise we could end up
	 * releasing locks on the wrong file system.
	 *
	 * For example:
	 * 1.  Does the path refer to a directory?
	 * 2.  Is that directory a mount point, or
	 * 3.  Is that directory the root of an exported file system?
	 */
325
	error = nlmsvc_unlock_all_by_sb(path.dentry->d_sb);
326

A
Al Viro 已提交
327
	path_put(&path);
328 329 330
	return error;
}

331
/*
332 333 334 335 336 337 338 339 340 341 342 343 344 345 346 347 348 349 350 351
 * write_filehandle - Get a variable-length NFS file handle by path
 *
 * On input, the buffer contains a '\n'-terminated C string comprised of
 * three alphanumeric words separated by whitespace.  The string may
 * contain escape sequences.
 *
 * Input:
 *			buf:
 *				domain:		client domain name
 *				path:		export pathname
 *				maxsize:	numeric maximum size of
 *						@buf
 *			size:	length of C string in @buf
 * Output:
 *	On success:	passed-in buffer filled with '\n'-terminated C
 *			string containing a ASCII hex text version
 *			of the NFS file handle;
 *			return code is the size in bytes of the string
 *	On error:	return code is negative errno value
 */
L
Linus Torvalds 已提交
352 353 354
static ssize_t write_filehandle(struct file *file, char *buf, size_t size)
{
	char *dname, *path;
355
	int maxsize;
L
Linus Torvalds 已提交
356 357 358 359 360
	char *mesg = buf;
	int len;
	struct auth_domain *dom;
	struct knfsd_fh fh;

361 362 363
	if (size == 0)
		return -EINVAL;

L
Linus Torvalds 已提交
364 365 366 367 368 369
	if (buf[size-1] != '\n')
		return -EINVAL;
	buf[size-1] = 0;

	dname = mesg;
	len = qword_get(&mesg, dname, size);
370 371
	if (len <= 0)
		return -EINVAL;
L
Linus Torvalds 已提交
372 373 374
	
	path = dname+len+1;
	len = qword_get(&mesg, path, size);
375 376
	if (len <= 0)
		return -EINVAL;
L
Linus Torvalds 已提交
377 378 379 380 381 382 383

	len = get_int(&mesg, &maxsize);
	if (len)
		return len;

	if (maxsize < NFS_FHSIZE)
		return -EINVAL;
384
	maxsize = min(maxsize, NFS3_FHSIZE);
L
Linus Torvalds 已提交
385 386 387 388 389 390 391 392 393

	if (qword_get(&mesg, mesg, size)>0)
		return -EINVAL;

	/* we have all the words, they are in buf.. */
	dom = unix_domain_find(dname);
	if (!dom)
		return -ENOMEM;

A
Al Viro 已提交
394
	len = exp_rootfh(netns(file), dom, path, &fh,  maxsize);
L
Linus Torvalds 已提交
395 396 397 398
	auth_domain_put(dom);
	if (len)
		return len;
	
399 400
	mesg = buf;
	len = SIMPLE_TRANSACTION_LIMIT;
L
Linus Torvalds 已提交
401 402 403 404 405
	qword_addhex(&mesg, &len, (char*)&fh.fh_base, fh.fh_size);
	mesg[-1] = '\n';
	return mesg - buf;	
}

406
/*
407 408 409 410 411 412 413 414 415 416 417 418 419 420 421 422 423 424 425 426 427 428 429 430 431 432 433
 * write_threads - Start NFSD, or report the current number of running threads
 *
 * Input:
 *			buf:		ignored
 *			size:		zero
 * Output:
 *	On success:	passed-in buffer filled with '\n'-terminated C
 *			string numeric value representing the number of
 *			running NFSD threads;
 *			return code is the size in bytes of the string
 *	On error:	return code is zero
 *
 * OR
 *
 * Input:
 *			buf:		C string containing an unsigned
 *					integer value representing the
 *					number of NFSD threads to start
 *			size:		non-zero length of C string in @buf
 * Output:
 *	On success:	NFS service is started;
 *			passed-in buffer filled with '\n'-terminated C
 *			string numeric value representing the number of
 *			running NFSD threads;
 *			return code is the size in bytes of the string
 *	On error:	return code is zero or a negative errno value
 */
L
Linus Torvalds 已提交
434 435 436 437
static ssize_t write_threads(struct file *file, char *buf, size_t size)
{
	char *mesg = buf;
	int rv;
A
Al Viro 已提交
438
	struct net *net = netns(file);
439

L
Linus Torvalds 已提交
440 441 442 443 444
	if (size > 0) {
		int newthreads;
		rv = get_int(&mesg, &newthreads);
		if (rv)
			return rv;
445
		if (newthreads < 0)
L
Linus Torvalds 已提交
446
			return -EINVAL;
447
		rv = nfsd_svc(newthreads, net, file->f_cred);
448
		if (rv < 0)
L
Linus Torvalds 已提交
449
			return rv;
450
	} else
451
		rv = nfsd_nrthreads(net);
452

453
	return scnprintf(buf, SIMPLE_TRANSACTION_LIMIT, "%d\n", rv);
L
Linus Torvalds 已提交
454 455
}

456
/*
457 458 459 460 461 462 463 464 465 466 467 468 469 470 471 472 473 474 475 476 477
 * write_pool_threads - Set or report the current number of threads per pool
 *
 * Input:
 *			buf:		ignored
 *			size:		zero
 *
 * OR
 *
 * Input:
 * 			buf:		C string containing whitespace-
 * 					separated unsigned integer values
 *					representing the number of NFSD
 *					threads to start in each pool
 *			size:		non-zero length of C string in @buf
 * Output:
 *	On success:	passed-in buffer filled with '\n'-terminated C
 *			string containing integer values representing the
 *			number of NFSD threads in each pool;
 *			return code is the size in bytes of the string
 *	On error:	return code is zero or a negative errno value
 */
478 479 480 481 482 483 484 485 486
static ssize_t write_pool_threads(struct file *file, char *buf, size_t size)
{
	/* if size > 0, look for an array of number of threads per node
	 * and apply them  then write out number of threads per node as reply
	 */
	char *mesg = buf;
	int i;
	int rv;
	int len;
487
	int npools;
488
	int *nthreads;
A
Al Viro 已提交
489
	struct net *net = netns(file);
490

491
	mutex_lock(&nfsd_mutex);
492
	npools = nfsd_nrpools(net);
493 494 495 496 497 498
	if (npools == 0) {
		/*
		 * NFS is shut down.  The admin can start it by
		 * writing to the threads file but NOT the pool_threads
		 * file, sorry.  Report zero threads.
		 */
499
		mutex_unlock(&nfsd_mutex);
500 501 502 503 504
		strcpy(buf, "0\n");
		return strlen(buf);
	}

	nthreads = kcalloc(npools, sizeof(int), GFP_KERNEL);
505
	rv = -ENOMEM;
506
	if (nthreads == NULL)
507
		goto out_free;
508 509 510 511 512 513 514 515 516 517 518 519

	if (size > 0) {
		for (i = 0; i < npools; i++) {
			rv = get_int(&mesg, &nthreads[i]);
			if (rv == -ENOENT)
				break;		/* fewer numbers than pools */
			if (rv)
				goto out_free;	/* syntax error */
			rv = -EINVAL;
			if (nthreads[i] < 0)
				goto out_free;
		}
520
		rv = nfsd_set_nrthreads(i, nthreads, net);
521 522 523 524
		if (rv)
			goto out_free;
	}

525
	rv = nfsd_get_nrthreads(npools, nthreads, net);
526 527 528 529 530 531 532 533 534 535 536
	if (rv)
		goto out_free;

	mesg = buf;
	size = SIMPLE_TRANSACTION_LIMIT;
	for (i = 0; i < npools && size > 0; i++) {
		snprintf(mesg, size, "%d%c", nthreads[i], (i == npools-1 ? '\n' : ' '));
		len = strlen(mesg);
		size -= len;
		mesg += len;
	}
537
	rv = mesg - buf;
538 539
out_free:
	kfree(nthreads);
540
	mutex_unlock(&nfsd_mutex);
541 542 543
	return rv;
}

544
static ssize_t
545 546
nfsd_print_version_support(struct nfsd_net *nn, char *buf, int remaining,
		const char *sep, unsigned vers, int minor)
547
{
548
	const char *format = minor < 0 ? "%s%c%u" : "%s%c%u.%u";
549
	bool supported = !!nfsd_vers(nn, vers, NFSD_TEST);
550

551
	if (vers == 4 && minor >= 0 &&
552
	    !nfsd_minorversion(nn, minor, NFSD_TEST))
553
		supported = false;
554 555 556 557 558 559 560
	if (minor == 0 && supported)
		/*
		 * special case for backward compatability.
		 * +4.0 is never reported, it is implied by
		 * +4, unless -4.0 is present.
		 */
		return 0;
561 562 563 564
	return snprintf(buf, remaining, format, sep,
			supported ? '+' : '-', vers, minor);
}

565
/*
 * __write_versions - worker for write_versions()
 *
 * With @size > 0, parses whitespace-separated tokens of the form
 * [+|-]N or [+|-]4.M and enables or disables the named versions; this is
 * refused with -EBUSY while nn->nfsd_serv is set.  In all cases the
 * current state is then formatted into @buf.
 *
 * Returns the length of the reply or a negative errno value.
 */
static ssize_t __write_versions(struct file *file, char *buf, size_t size)
{
	char *mesg = buf;
	char *vers, *minorp, sign;
	int len, num, remaining;
	ssize_t tlen = 0;
	char *sep;
	struct nfsd_net *nn = net_generic(netns(file), nfsd_net_id);

	if (size>0) {
		if (nn->nfsd_serv)
			/* Cannot change versions without updating
			 * nn->nfsd_serv->sv_xdrsize, and reallocing
			 * rq_argp and rq_resp
			 */
			return -EBUSY;
		if (buf[size-1] != '\n')
			return -EINVAL;
		buf[size-1] = 0;

		vers = mesg;
		len = qword_get(&mesg, vers, size);
		if (len <= 0) return -EINVAL;
		do {
			enum vers_op cmd;
			unsigned minor;
			sign = *vers;
			if (sign == '+' || sign == '-')
				num = simple_strtol((vers+1), &minorp, 0);
			else
				num = simple_strtol(vers, &minorp, 0);
			/* minor is only assigned, and only read, for "N.M" tokens */
			if (*minorp == '.') {
				if (num != 4)
					return -EINVAL;
				if (kstrtouint(minorp+1, 0, &minor) < 0)
					return -EINVAL;
			}

			/* an unsigned token is treated like '+' */
			cmd = sign == '-' ? NFSD_CLEAR : NFSD_SET;
			switch(num) {
			case 2:
			case 3:
				nfsd_vers(nn, num, cmd);
				break;
			case 4:
				if (*minorp == '.') {
					if (nfsd_minorversion(nn, minor, cmd) < 0)
						return -EINVAL;
				} else if ((cmd == NFSD_SET) != nfsd_vers(nn, num, NFSD_TEST)) {
					/*
					 * Either we have +4 and no minors are enabled,
					 * or we have -4 and at least one minor is enabled.
					 * In either case, propagate 'cmd' to all minors.
					 */
					minor = 0;
					while (nfsd_minorversion(nn, minor, cmd) >= 0)
						minor++;
				}
				break;
			default:
				return -EINVAL;
			}
			vers += len + 1;
		} while ((len = qword_get(&mesg, vers, size)) > 0);
		/* If all get turned off, turn them back on, as
		 * having no versions is BAD
		 */
		nfsd_reset_versions(nn);
	}

	/* Now write current state into reply buffer */
	len = 0;
	sep = "";
	remaining = SIMPLE_TRANSACTION_LIMIT;
	for (num=2 ; num <= 4 ; num++) {
		int minor;
		if (!nfsd_vers(nn, num, NFSD_AVAIL))
			continue;

		/* -1 prints the major-only token; minors follow for v4 only */
		minor = -1;
		do {
			len = nfsd_print_version_support(nn, buf, remaining,
					sep, num, minor);
			if (len >= remaining)
				goto out;
			remaining -= len;
			buf += len;
			tlen += len;
			minor++;
			if (len)
				sep = " ";
		} while (num == 4 && minor <= NFSD_SUPPORTED_MINOR_VERSION);
	}
out:
	len = snprintf(buf, remaining, "\n");
	if (len >= remaining)
		return -EINVAL;
	return tlen + len;
}

665
/*
666 667 668 669 670 671 672 673 674 675 676 677 678 679 680 681 682 683 684 685 686 687 688 689 690 691 692 693 694 695 696
 * write_versions - Set or report the available NFS protocol versions
 *
 * Input:
 *			buf:		ignored
 *			size:		zero
 * Output:
 *	On success:	passed-in buffer filled with '\n'-terminated C
 *			string containing positive or negative integer
 *			values representing the current status of each
 *			protocol version;
 *			return code is the size in bytes of the string
 *	On error:	return code is zero or a negative errno value
 *
 * OR
 *
 * Input:
 * 			buf:		C string containing whitespace-
 * 					separated positive or negative
 * 					integer values representing NFS
 * 					protocol versions to enable ("+n")
 * 					or disable ("-n")
 *			size:		non-zero length of C string in @buf
 * Output:
 *	On success:	status of zero or more protocol versions has
 *			been updated; passed-in buffer filled with
 *			'\n'-terminated C string containing positive
 *			or negative integer values representing the
 *			current status of each protocol version;
 *			return code is the size in bytes of the string
 *	On error:	return code is zero or a negative errno value
 */
697 698 699 700 701 702 703 704 705 706
static ssize_t write_versions(struct file *file, char *buf, size_t size)
{
	ssize_t rv;

	mutex_lock(&nfsd_mutex);
	rv = __write_versions(file, buf, size);
	mutex_unlock(&nfsd_mutex);
	return rv;
}

707 708 709 710
/*
 * Zero-length write.  Return a list of NFSD's current listener
 * transports.
 */
711
static ssize_t __write_ports_names(char *buf, struct net *net)
712
{
713 714 715
	struct nfsd_net *nn = net_generic(net, nfsd_net_id);

	if (nn->nfsd_serv == NULL)
716
		return 0;
717
	return svc_xprt_names(nn->nfsd_serv, buf, SIMPLE_TRANSACTION_LIMIT);
718 719
}

720 721 722 723 724
/*
 * A single 'fd' number was written, in which case it must be for
 * a socket of a supported family/protocol, and we use it as an
 * nfsd listener.
 */
725
static ssize_t __write_ports_addfd(char *buf, struct net *net, const struct cred *cred)
726 727 728
{
	char *mesg = buf;
	int fd, err;
729
	struct nfsd_net *nn = net_generic(net, nfsd_net_id);
730 731 732 733 734

	err = get_int(&mesg, &fd);
	if (err != 0 || fd < 0)
		return -EINVAL;

735 736 737 738 739
	if (svc_alien_sock(net, fd)) {
		printk(KERN_ERR "%s: socket net is different to NFSd's one\n", __func__);
		return -EINVAL;
	}

740
	err = nfsd_create_serv(net);
741 742 743
	if (err != 0)
		return err;

744
	err = svc_addsock(nn->nfsd_serv, fd, buf, SIMPLE_TRANSACTION_LIMIT, cred);
745
	if (err < 0) {
746
		nfsd_destroy(net);
747 748
		return err;
	}
749

750
	/* Decrease the count, but don't shut down the service */
751
	nn->nfsd_serv->sv_nrthreads--;
752
	return err;
753 754
}

755 756 757 758
/*
 * A transport listener is added by writing it's transport name and
 * a port number.
 */
759
static ssize_t __write_ports_addxprt(char *buf, struct net *net, const struct cred *cred)
760 761
{
	char transport[16];
762
	struct svc_xprt *xprt;
763
	int port, err;
764
	struct nfsd_net *nn = net_generic(net, nfsd_net_id);
765

766
	if (sscanf(buf, "%15s %5u", transport, &port) != 2)
767 768
		return -EINVAL;

769
	if (port < 1 || port > USHRT_MAX)
770 771
		return -EINVAL;

772
	err = nfsd_create_serv(net);
773 774 775
	if (err != 0)
		return err;

776
	err = svc_create_xprt(nn->nfsd_serv, transport, net,
777
				PF_INET, port, SVC_SOCK_ANONYMOUS, cred);
778
	if (err < 0)
779 780
		goto out_err;

781
	err = svc_create_xprt(nn->nfsd_serv, transport, net,
782
				PF_INET6, port, SVC_SOCK_ANONYMOUS, cred);
783 784
	if (err < 0 && err != -EAFNOSUPPORT)
		goto out_close;
785 786

	/* Decrease the count, but don't shut down the service */
787
	nn->nfsd_serv->sv_nrthreads--;
788
	return 0;
789
out_close:
790
	xprt = svc_find_xprt(nn->nfsd_serv, transport, net, PF_INET, port);
791 792 793 794 795
	if (xprt != NULL) {
		svc_close_xprt(xprt);
		svc_xprt_put(xprt);
	}
out_err:
796
	nfsd_destroy(net);
797
	return err;
798 799
}

800 801
/*
 * __write_ports - worker for write_ports()
 *
 * Chooses the action from the input: a zero-length write lists the
 * listeners, a leading digit adds a socket by file descriptor, and a
 * leading letter adds a listener by transport name and port.  Anything
 * else yields -EINVAL.
 */
static ssize_t __write_ports(struct file *file, char *buf, size_t size,
			     struct net *net)
{
	if (size == 0)
		return __write_ports_names(buf, net);

	if (isdigit(buf[0]))
		return __write_ports_addfd(buf, net, file->f_cred);

	if (isalpha(buf[0]))
		return __write_ports_addxprt(buf, net, file->f_cred);

	return -EINVAL;
}

815
/*
816 817 818 819 820 821 822 823 824 825 826 827 828 829 830 831 832 833
 * write_ports - Pass a socket file descriptor or transport name to listen on
 *
 * Input:
 *			buf:		ignored
 *			size:		zero
 * Output:
 *	On success:	passed-in buffer filled with a '\n'-terminated C
 *			string containing a whitespace-separated list of
 *			named NFSD listeners;
 *			return code is the size in bytes of the string
 *	On error:	return code is zero or a negative errno value
 *
 * OR
 *
 * Input:
 *			buf:		C string containing an unsigned
 *					integer value representing a bound
 *					but unconnected socket that is to be
834 835 836
 *					used as an NFSD listener; listen(3)
 *					must be called for a SOCK_STREAM
 *					socket, otherwise it is ignored
837 838 839 840 841 842 843 844 845 846 847 848 849 850 851 852 853 854 855 856 857
 *			size:		non-zero length of C string in @buf
 * Output:
 *	On success:	NFS service is started;
 *			passed-in buffer filled with a '\n'-terminated C
 *			string containing a unique alphanumeric name of
 *			the listener;
 *			return code is the size in bytes of the string
 *	On error:	return code is a negative errno value
 *
 * OR
 *
 * Input:
 *			buf:		C string containing a transport
 *					name and an unsigned integer value
 *					representing the port to listen on,
 *					separated by whitespace
 *			size:		non-zero length of C string in @buf
 * Output:
 *	On success:	returns zero; NFS service is started
 *	On error:	return code is a negative errno value
 */
858 859 860
static ssize_t write_ports(struct file *file, char *buf, size_t size)
{
	ssize_t rv;
861

862
	mutex_lock(&nfsd_mutex);
A
Al Viro 已提交
863
	rv = __write_ports(file, buf, size, netns(file));
864 865 866 867 868
	mutex_unlock(&nfsd_mutex);
	return rv;
}


869 870
/*
 * Current NFS block size setting.  write_maxblksize() assigns it while
 * holding nfsd_mutex and reports it back through the same node.
 */
int nfsd_max_blksize;

871
/*
872 873 874 875 876 877 878 879 880 881 882 883 884 885 886 887 888 889 890 891
 * write_maxblksize - Set or report the current NFS blksize
 *
 * Input:
 *			buf:		ignored
 *			size:		zero
 *
 * OR
 *
 * Input:
 * 			buf:		C string containing an unsigned
 * 					integer value representing the new
 * 					NFS blksize
 *			size:		non-zero length of C string in @buf
 * Output:
 *	On success:	passed-in buffer filled with '\n'-terminated C string
 *			containing numeric value of the current NFS blksize
 *			setting;
 *			return code is the size in bytes of the string
 *	On error:	return code is zero or a negative errno value
 */
892 893 894
static ssize_t write_maxblksize(struct file *file, char *buf, size_t size)
{
	char *mesg = buf;
A
Al Viro 已提交
895
	struct nfsd_net *nn = net_generic(netns(file), nfsd_net_id);
896

897 898 899 900 901 902 903 904
	if (size > 0) {
		int bsize;
		int rv = get_int(&mesg, &bsize);
		if (rv)
			return rv;
		/* force bsize into allowed range and
		 * required alignment.
		 */
905 906
		bsize = max_t(int, bsize, 1024);
		bsize = min_t(int, bsize, NFSSVC_MAXBLKSIZE);
907
		bsize &= ~(1024-1);
908
		mutex_lock(&nfsd_mutex);
909
		if (nn->nfsd_serv) {
910
			mutex_unlock(&nfsd_mutex);
911 912 913
			return -EBUSY;
		}
		nfsd_max_blksize = bsize;
914
		mutex_unlock(&nfsd_mutex);
915
	}
916 917 918

	return scnprintf(buf, SIMPLE_TRANSACTION_LIMIT, "%d\n",
							nfsd_max_blksize);
919 920
}

921
/*
 * write_maxconn - Set or report the current max number of connections
 *
 * Input:
 *			buf:		ignored
 *			size:		zero
 * OR
 *
 * Input:
 * 			buf:		C string containing an unsigned
 * 					integer value representing the new
 * 					number of max connections
 *			size:		non-zero length of C string in @buf
 * Output:
 *	On success:	passed-in buffer filled with '\n'-terminated C string
 *			containing numeric value of max_connections setting
 *			for this net namespace;
 *			return code is the size in bytes of the string
 *	On error:	return code is zero or a negative errno value
 */
static ssize_t write_maxconn(struct file *file, char *buf, size_t size)
{
	char *mesg = buf;
	struct nfsd_net *nn = net_generic(netns(file), nfsd_net_id);
	/* starts as the current setting so a zero-length write reports it */
	unsigned int maxconn = nn->max_connections;

	if (size > 0) {
		int rv = get_uint(&mesg, &maxconn);

		if (rv)
			return rv;
		nn->max_connections = maxconn;
	}

	return scnprintf(buf, SIMPLE_TRANSACTION_LIMIT, "%u\n", maxconn);
}

958
#ifdef CONFIG_NFSD_V4
959
static ssize_t __nfsd4_write_time(struct file *file, char *buf, size_t size,
960
				  time64_t *time, struct nfsd_net *nn)
L
Linus Torvalds 已提交
961 962
{
	char *mesg = buf;
963
	int rv, i;
L
Linus Torvalds 已提交
964 965

	if (size > 0) {
966
		if (nn->nfsd_serv)
967
			return -EBUSY;
968
		rv = get_int(&mesg, &i);
L
Linus Torvalds 已提交
969 970
		if (rv)
			return rv;
971 972 973 974 975 976 977 978 979 980 981 982
		/*
		 * Some sanity checking.  We don't have a reason for
		 * these particular numbers, but problems with the
		 * extremes are:
		 *	- Too short: the briefest network outage may
		 *	  cause clients to lose all their locks.  Also,
		 *	  the frequent polling may be wasteful.
		 *	- Too long: do you really want reboot recovery
		 *	  to take more than an hour?  Or to make other
		 *	  clients wait an hour before being able to
		 *	  revoke a dead client's locks?
		 */
983
		if (i < 10 || i > 3600)
L
Linus Torvalds 已提交
984
			return -EINVAL;
985
		*time = i;
L
Linus Torvalds 已提交
986
	}
987

988
	return scnprintf(buf, SIMPLE_TRANSACTION_LIMIT, "%lld\n", *time);
989 990
}

991
static ssize_t nfsd4_write_time(struct file *file, char *buf, size_t size,
992
				time64_t *time, struct nfsd_net *nn)
993 994 995 996
{
	ssize_t rv;

	mutex_lock(&nfsd_mutex);
997
	rv = __nfsd4_write_time(file, buf, size, time, nn);
998 999
	mutex_unlock(&nfsd_mutex);
	return rv;
L
Linus Torvalds 已提交
1000 1001
}

1002
/*
1003 1004 1005 1006 1007 1008 1009 1010 1011 1012 1013 1014 1015 1016 1017 1018 1019 1020 1021 1022
 * write_leasetime - Set or report the current NFSv4 lease time
 *
 * Input:
 *			buf:		ignored
 *			size:		zero
 *
 * OR
 *
 * Input:
 *			buf:		C string containing an unsigned
 *					integer value representing the new
 *					NFSv4 lease expiry time
 *			size:		non-zero length of C string in @buf
 * Output:
 *	On success:	passed-in buffer filled with '\n'-terminated C
 *			string containing unsigned integer value of the
 *			current lease expiry time;
 *			return code is the size in bytes of the string
 *	On error:	return code is zero or a negative errno value
 */
1023 1024
static ssize_t write_leasetime(struct file *file, char *buf, size_t size)
{
A
Al Viro 已提交
1025
	struct nfsd_net *nn = net_generic(netns(file), nfsd_net_id);
1026
	return nfsd4_write_time(file, buf, size, &nn->nfsd4_lease, nn);
1027 1028
}

1029
/*
 * write_gracetime - Set or report current NFSv4 grace period time
 *
 * As above, but sets the time of the NFSv4 grace period.
 *
 * Note this should never be set to less than the *previous*
 * lease-period time, but we don't try to enforce this.  (In the common
 * case (a new boot), we don't know what the previous lease time was
 * anyway.)
 */
static ssize_t write_gracetime(struct file *file, char *buf, size_t size)
{
	struct nfsd_net *nn = net_generic(netns(file), nfsd_net_id);
	return nfsd4_write_time(file, buf, size, &nn->nfsd4_grace, nn);
}

1045 1046
/*
 * Worker for write_recoverydir(), which calls it with nfsd_mutex held.
 *
 * With @size == 0 only the current recovery directory is reported.
 * Otherwise @buf must hold a '\n'-terminated string of at most PATH_MAX
 * bytes; its first qword_get() token becomes the new recovery directory.
 * Changing the directory is refused with -EBUSY while nn->nfsd_serv is set.
 */
static ssize_t __write_recoverydir(struct file *file, char *buf, size_t size,
				   struct nfsd_net *nn)
{
	char *cursor = buf;
	char *path;
	int path_len, err;

	if (size == 0)
		goto report;

	if (nn->nfsd_serv)
		return -EBUSY;
	if (size > PATH_MAX)
		return -EINVAL;
	if (buf[size - 1] != '\n')
		return -EINVAL;
	/* Replace the trailing newline with a terminator before parsing */
	buf[size - 1] = 0;

	/* The token is decoded in place, at the start of the buffer */
	path = cursor;
	path_len = qword_get(&cursor, path, size);
	if (path_len <= 0)
		return -EINVAL;

	err = nfs4_reset_recoverydir(path);
	if (err)
		return err;

report:
	return scnprintf(buf, SIMPLE_TRANSACTION_LIMIT, "%s\n",
			 nfs4_recoverydir());
}
1072

1073
/*
1074 1075 1076 1077 1078 1079 1080 1081 1082 1083 1084 1085 1086 1087 1088 1089 1090 1091 1092 1093
 * write_recoverydir - Set or report the pathname of the recovery directory
 *
 * Input:
 *			buf:		ignored
 *			size:		zero
 *
 * OR
 *
 * Input:
 *			buf:		C string containing the pathname
 *					of the directory on a local file
 *					system containing permanent NFSv4
 *					recovery data
 *			size:		non-zero length of C string in @buf
 * Output:
 *	On success:	passed-in buffer filled with '\n'-terminated C string
 *			containing the current recovery pathname setting;
 *			return code is the size in bytes of the string
 *	On error:	return code is zero or a negative errno value
 */
1094 1095 1096
static ssize_t write_recoverydir(struct file *file, char *buf, size_t size)
{
	ssize_t rv;
A
Al Viro 已提交
1097
	struct nfsd_net *nn = net_generic(netns(file), nfsd_net_id);
1098 1099

	mutex_lock(&nfsd_mutex);
1100
	rv = __write_recoverydir(file, buf, size, nn);
1101 1102 1103 1104
	mutex_unlock(&nfsd_mutex);
	return rv;
}

1105
/*
 * write_v4_end_grace - release grace period for nfsd's v4.x lock manager
 *
 * Input (report only):
 *			buf:		ignored
 *			size:		zero
 *
 * Input (end grace, then report):
 *			buf:		string whose first character is
 *					'Y', 'y' or '1'
 *			size:		non-zero length of C string in @buf
 * Output:
 *	On success:	passed-in buffer filled with "Y\n" or "N\n",
 *			reflecting nn->grace_ended for the file's net
 *			namespace; return code is the size in bytes of
 *			the string
 *	On error:	-EINVAL if the first character written is not one
 *			of the accepted values; -EBUSY if nn->nfsd_serv is
 *			not set
 */
static ssize_t write_v4_end_grace(struct file *file, char *buf, size_t size)
{
	struct nfsd_net *nn = net_generic(netns(file), nfsd_net_id);

	if (size > 0) {
		char first = buf[0];

		if (first != 'Y' && first != 'y' && first != '1')
			return -EINVAL;
		if (!nn->nfsd_serv)
			return -EBUSY;
		nfsd4_end_grace(nn);
	}

	return scnprintf(buf, SIMPLE_TRANSACTION_LIMIT, "%c\n",
			 nn->grace_ended ? 'Y' : 'N');
}

1147
#endif
1148

L
Linus Torvalds 已提交
1149 1150 1151 1152 1153
/*----------------------------------------------------------------------------*/
/*
 *	populating the filesystem.
 */

1154 1155 1156 1157 1158 1159 1160 1161 1162 1163 1164 1165 1166 1167 1168 1169 1170 1171 1172 1173 1174
/*
 * Allocate and set up a new inode on @sb with the given @mode (basically
 * a copy of rpc_get_inode).  Directory inodes additionally get the simple
 * directory operations and an extra link.  Returns NULL if new_inode()
 * fails.
 */
static struct inode *nfsd_get_inode(struct super_block *sb, umode_t mode)
{
	struct inode *inode;

	inode = new_inode(sb);
	if (!inode)
		return NULL;

	/* Following advice from simple_fill_super documentation: */
	inode->i_ino = iunique(sb, NFSD_MaxReserved);
	inode->i_mode = mode;
	inode->i_atime = inode->i_mtime = inode->i_ctime = current_time(inode);

	/* Only directories need anything beyond the common setup */
	if ((mode & S_IFMT) == S_IFDIR) {
		inode->i_fop = &simple_dir_operations;
		inode->i_op = &simple_dir_inode_operations;
		inc_nlink(inode);
	}

	return inode;
}

1175
/*
 * Create an inode of the given @mode for @dentry and attach it under @dir.
 * When @ncl is non-NULL it is stored in the new inode's i_private and a
 * reference is taken on it.  Returns 0, or -ENOMEM if no inode could be
 * allocated.
 */
static int __nfsd_mkdir(struct inode *dir, struct dentry *dentry, umode_t mode, struct nfsdfs_client *ncl)
{
	struct inode *new_inode = nfsd_get_inode(dir->i_sb, mode);

	if (!new_inode)
		return -ENOMEM;

	if (ncl) {
		new_inode->i_private = ncl;
		kref_get(&ncl->cl_ref);
	}

	d_add(dentry, new_inode);
	inc_nlink(dir);
	fsnotify_mkdir(dir, dentry);

	return 0;
}

static struct dentry *nfsd_mkdir(struct dentry *parent, struct nfsdfs_client *ncl, char *name)
{
	struct inode *dir = parent->d_inode;
	struct dentry *dentry;
	int ret = -ENOMEM;

	inode_lock(dir);
	dentry = d_alloc_name(parent, name);
	if (!dentry)
		goto out_err;
1202
	ret = __nfsd_mkdir(d_inode(parent), dentry, S_IFDIR | 0600, ncl);
1203 1204 1205 1206 1207 1208
	if (ret)
		goto out_err;
out:
	inode_unlock(dir);
	return dentry;
out_err:
1209
	dput(dentry);
1210 1211 1212 1213
	dentry = ERR_PTR(ret);
	goto out;
}

J
J. Bruce Fields 已提交
1214 1215 1216 1217 1218 1219 1220 1221
/*
 * Detach the nfsdfs_client stored in @inode->i_private and drop one
 * reference on it, using the client's own cl_release callback.
 */
static void clear_ncl(struct inode *inode)
{
	struct nfsdfs_client *client = inode->i_private;

	inode->i_private = NULL;
	kref_put(&client->cl_ref, client->cl_release);
}

1222
static struct nfsdfs_client *__get_nfsdfs_client(struct inode *inode)
J
J. Bruce Fields 已提交
1223 1224 1225 1226 1227 1228 1229 1230 1231 1232 1233 1234
{
	struct nfsdfs_client *nc = inode->i_private;

	if (nc)
		kref_get(&nc->cl_ref);
	return nc;
}

/*
 * Look up the client attached to @inode while holding the inode lock in
 * shared mode.  Returns the client with an extra reference, or NULL.
 */
struct nfsdfs_client *get_nfsdfs_client(struct inode *inode)
{
	struct nfsdfs_client *client;

	inode_lock_shared(inode);
	client = __get_nfsdfs_client(inode);
	inode_unlock_shared(inode);

	return client;
}
/*
 * Remove one file (@dentry) from directory @dir.  Modelled on __rpc_unlink.
 *
 * The client reference held through the file inode's i_private is dropped
 * first; an extra dentry reference is held across the unlink and
 * d_delete() calls.  A failing simple_unlink() only triggers a one-time
 * warning.
 */
static void nfsdfs_remove_file(struct inode *dir, struct dentry *dentry)
{
	int ret;

	/* Drop the nfsdfs_client reference attached to the file's inode */
	clear_ncl(d_inode(dentry));
	/* Hold the dentry until the removal sequence is finished */
	dget(dentry);
	ret = simple_unlink(dir, dentry);
	d_delete(dentry);
	dput(dentry);
	WARN_ON_ONCE(ret);
}

static void nfsdfs_remove_files(struct dentry *root)
{
	struct dentry *dentry, *tmp;

	list_for_each_entry_safe(dentry, tmp, &root->d_subdirs, d_child) {
		if (!simple_positive(dentry)) {
			WARN_ON_ONCE(1); /* I think this can't happen? */
			continue;
		}
		nfsdfs_remove_file(d_inode(root), dentry);
	}
}

/*
 * Populate directory @root with one regular file per entry of @files.
 *
 * @files is walked until an entry with a NULL or empty name is found.
 * Each new inode uses the entry's file operations and mode, and gets its
 * own reference on the nfsdfs_client attached to the directory inode (if
 * any).  The directory's inode lock is held throughout.
 *
 * Returns 0 on success.  On allocation failure every file in @root is
 * removed again and -ENOMEM is returned.
 *
 * XXX: cut'n'paste from simple_fill_super; figure out if we could share
 * code instead.
 */
static  int nfsdfs_create_files(struct dentry *root,
					const struct tree_descr *files)
{
	struct inode *dir = d_inode(root);
	struct inode *inode;
	struct dentry *dentry;

	inode_lock(dir);
	/* The loop condition guarantees a non-NULL, non-empty name */
	for (; files->name && files->name[0]; files++) {
		dentry = d_alloc_name(root, files->name);
		if (!dentry)
			goto out;
		inode = nfsd_get_inode(dir->i_sb, S_IFREG | files->mode);
		if (!inode) {
			dput(dentry);
			goto out;
		}
		inode->i_fop = files->ops;
		/* Each file pins the directory's client separately */
		inode->i_private = __get_nfsdfs_client(dir);
		d_add(dentry, inode);
		fsnotify_create(dir, dentry);
	}
	inode_unlock(dir);
	return 0;
out:
	/* Undo the files created so far */
	nfsdfs_remove_files(root);
	inode_unlock(dir);
	return -ENOMEM;
}

1302
/* on success, returns positive number unique to that client. */
J
J. Bruce Fields 已提交
1303 1304 1305
struct dentry *nfsd_client_mkdir(struct nfsd_net *nn,
		struct nfsdfs_client *ncl, u32 id,
		const struct tree_descr *files)
1306
{
J
J. Bruce Fields 已提交
1307
	struct dentry *dentry;
1308
	char name[11];
J
J. Bruce Fields 已提交
1309
	int ret;
1310

1311
	sprintf(name, "%u", id);
1312

J
J. Bruce Fields 已提交
1313 1314 1315 1316 1317 1318 1319 1320 1321
	dentry = nfsd_mkdir(nn->nfsd_client_dir, ncl, name);
	if (IS_ERR(dentry)) /* XXX: tossing errors? */
		return NULL;
	ret = nfsdfs_create_files(dentry, files);
	if (ret) {
		nfsd_client_rmdir(dentry);
		return NULL;
	}
	return dentry;
1322 1323 1324 1325 1326 1327 1328 1329 1330
}

/*
 * Remove a client directory together with all files in it.  Taken from
 * __rpc_rmdir.  The parent directory's inode lock is held throughout;
 * a failing simple_rmdir() only triggers a one-time warning.
 */
void nfsd_client_rmdir(struct dentry *dentry)
{
	struct inode *parent_inode = d_inode(dentry->d_parent);
	struct inode *client_inode = d_inode(dentry);
	int err;

	inode_lock(parent_inode);

	/* Empty the directory, then drop its own client reference */
	nfsdfs_remove_files(dentry);
	clear_ncl(client_inode);

	/* Keep the dentry alive across the removal sequence */
	dget(dentry);
	err = simple_rmdir(parent_inode, dentry);
	WARN_ON_ONCE(err);
	fsnotify_rmdir(parent_inode, dentry);
	d_delete(dentry);
	dput(dentry);

	inode_unlock(parent_inode);
}

1343
static int nfsd_fill_super(struct super_block *sb, struct fs_context *fc)
L
Linus Torvalds 已提交
1344
{
1345 1346 1347 1348 1349
	struct nfsd_net *nn = net_generic(current->nsproxy->net_ns,
							nfsd_net_id);
	struct dentry *dentry;
	int ret;

1350
	static const struct tree_descr nfsd_files[] = {
1351
		[NFSD_List] = {"exports", &exports_nfsd_operations, S_IRUGO},
A
Amir Goldstein 已提交
1352 1353
		/* Per-export io stats use same ops as exports file */
		[NFSD_Export_Stats] = {"export_stats", &exports_nfsd_operations, S_IRUGO},
1354 1355
		[NFSD_Export_features] = {"export_features",
					&export_features_operations, S_IRUGO},
1356 1357
		[NFSD_FO_UnlockIP] = {"unlock_ip",
					&transaction_ops, S_IWUSR|S_IRUSR},
1358 1359
		[NFSD_FO_UnlockFS] = {"unlock_filesystem",
					&transaction_ops, S_IWUSR|S_IRUSR},
L
Linus Torvalds 已提交
1360 1361
		[NFSD_Fh] = {"filehandle", &transaction_ops, S_IWUSR|S_IRUSR},
		[NFSD_Threads] = {"threads", &transaction_ops, S_IWUSR|S_IRUSR},
1362
		[NFSD_Pool_Threads] = {"pool_threads", &transaction_ops, S_IWUSR|S_IRUSR},
1363
		[NFSD_Pool_Stats] = {"pool_stats", &pool_stats_operations, S_IRUGO},
1364
		[NFSD_Reply_Cache_Stats] = {"reply_cache_stats", &reply_cache_stats_operations, S_IRUGO},
1365
		[NFSD_Versions] = {"versions", &transaction_ops, S_IWUSR|S_IRUSR},
1366
		[NFSD_Ports] = {"portlist", &transaction_ops, S_IWUSR|S_IRUGO},
1367
		[NFSD_MaxBlkSize] = {"max_block_size", &transaction_ops, S_IWUSR|S_IRUGO},
1368
		[NFSD_MaxConnections] = {"max_connections", &transaction_ops, S_IWUSR|S_IRUGO},
1369
#if defined(CONFIG_SUNRPC_GSS) || defined(CONFIG_SUNRPC_GSS_MODULE)
1370
		[NFSD_SupportedEnctypes] = {"supported_krb5_enctypes", &supported_enctypes_ops, S_IRUGO},
1371
#endif /* CONFIG_SUNRPC_GSS or CONFIG_SUNRPC_GSS_MODULE */
L
Linus Torvalds 已提交
1372 1373
#ifdef CONFIG_NFSD_V4
		[NFSD_Leasetime] = {"nfsv4leasetime", &transaction_ops, S_IWUSR|S_IRUSR},
1374
		[NFSD_Gracetime] = {"nfsv4gracetime", &transaction_ops, S_IWUSR|S_IRUSR},
1375
		[NFSD_RecoveryDir] = {"nfsv4recoverydir", &transaction_ops, S_IWUSR|S_IRUSR},
1376
		[NFSD_V4EndGrace] = {"v4_end_grace", &transaction_ops, S_IWUSR|S_IRUGO},
L
Linus Torvalds 已提交
1377 1378 1379
#endif
		/* last one */ {""}
	};
1380

1381 1382 1383 1384 1385 1386 1387 1388
	ret = simple_fill_super(sb, 0x6e667364, nfsd_files);
	if (ret)
		return ret;
	dentry = nfsd_mkdir(sb->s_root, NULL, "clients");
	if (IS_ERR(dentry))
		return PTR_ERR(dentry);
	nn->nfsd_client_dir = dentry;
	return 0;
L
Linus Torvalds 已提交
1389
}
1390

1391 1392
static int nfsd_fs_get_tree(struct fs_context *fc)
{
A
Al Viro 已提交
1393
	return get_tree_keyed(fc, nfsd_fill_super, get_net(fc->net_ns));
L
Linus Torvalds 已提交
1394 1395
}

1396
static void nfsd_fs_free_fc(struct fs_context *fc)
L
Linus Torvalds 已提交
1397
{
1398 1399 1400 1401 1402 1403 1404 1405 1406 1407
	if (fc->s_fs_info)
		put_net(fc->s_fs_info);
}

/* fs_context callbacks installed by nfsd_init_fs_context(). */
static const struct fs_context_operations nfsd_fs_context_ops = {
	.free		= nfsd_fs_free_fc,
	.get_tree	= nfsd_fs_get_tree,
};

static int nfsd_init_fs_context(struct fs_context *fc)
L
Linus Torvalds 已提交
1408
{
1409 1410 1411 1412
	put_user_ns(fc->user_ns);
	fc->user_ns = get_user_ns(fc->net_ns->user_ns);
	fc->ops = &nfsd_fs_context_ops;
	return 0;
1413 1414 1415 1416 1417 1418 1419 1420
}

/*
 * ->kill_sb for the nfsd filesystem: tear the superblock down, then drop
 * the reference on the net stored in its s_fs_info.
 */
static void nfsd_umount(struct super_block *sb)
{
	/* Read the pointer before the superblock is killed */
	struct net *owner = sb->s_fs_info;

	kill_litter_super(sb);
	put_net(owner);
}

static struct file_system_type nfsd_fs_type = {
	.owner		= THIS_MODULE,
	.name		= "nfsd",
1426
	.init_fs_context = nfsd_init_fs_context,
1427
	.kill_sb	= nfsd_umount,
L
Linus Torvalds 已提交
1428
};
1429
MODULE_ALIAS_FS("nfsd");
L
Linus Torvalds 已提交
1430

1431 1432 1433 1434 1435 1436 1437 1438 1439 1440 1441 1442
/*
 * Create a kernel-internal mount of the nfsd filesystem and store it in
 * the nfsd_mnt field of @net's nfsd_net.  Returns 0 on success or the
 * error reported by vfs_kern_mount().
 */
int get_nfsdfs(struct net *net)
{
	struct nfsd_net *nn = net_generic(net, nfsd_net_id);
	struct vfsmount *mount;

	mount = vfs_kern_mount(&nfsd_fs_type, SB_KERNMOUNT, "nfsd", NULL);
	if (!IS_ERR(mount)) {
		nn->nfsd_mnt = mount;
		return 0;
	}

	return PTR_ERR(mount);
}

1443 1444 1445 1446 1447 1448 1449 1450
#ifdef CONFIG_PROC_FS
/*
 * Create the "fs/nfs" proc directory and an "exports" entry inside it.
 * Returns 0 on success or -ENOMEM; the directory is removed again if the
 * entry cannot be created.
 */
static int create_proc_exports_entry(void)
{
	struct proc_dir_entry *nfs_dir;
	struct proc_dir_entry *exports;

	nfs_dir = proc_mkdir("fs/nfs", NULL);
	if (!nfs_dir)
		return -ENOMEM;

	exports = proc_create("exports", 0, nfs_dir, &exports_proc_ops);
	if (exports)
		return 0;

	remove_proc_entry("fs/nfs", NULL);
	return -ENOMEM;
}
#else /* CONFIG_PROC_FS */
/* Without procfs there is nothing to create. */
static int create_proc_exports_entry(void)
{
	return 0;
}
#endif

1465
/*
 * Per-net id of nfsd: registered through nfsd_net_ops.id and passed to
 * net_generic() to look up a namespace's struct nfsd_net.
 */
unsigned int nfsd_net_id;
1466 1467 1468 1469

static __net_init int nfsd_init_net(struct net *net)
{
	int retval;
1470
	struct nfsd_net *nn = net_generic(net, nfsd_net_id);
1471 1472 1473 1474

	retval = nfsd_export_init(net);
	if (retval)
		goto out_export_error;
1475 1476 1477
	retval = nfsd_idmap_init(net);
	if (retval)
		goto out_idmap_error;
1478 1479
	nn->nfsd_versions = NULL;
	nn->nfsd4_minorversions = NULL;
J
J. Bruce Fields 已提交
1480 1481 1482
	retval = nfsd_reply_cache_init(nn);
	if (retval)
		goto out_drc_error;
1483 1484
	nn->nfsd4_lease = 90;	/* default lease time */
	nn->nfsd4_grace = 90;
1485
	nn->somebody_reclaimed = false;
1486
	nn->track_reclaim_completes = false;
1487
	nn->clverifier_counter = prandom_u32();
1488 1489
	nn->clientid_base = prandom_u32();
	nn->clientid_counter = nn->clientid_base + 1;
1490
	nn->s2s_cp_cl_id = nn->clientid_counter++;
1491 1492 1493

	atomic_set(&nn->ntf_refcnt, 0);
	init_waitqueue_head(&nn->ntf_wq);
1494
	seqlock_init(&nn->boot_lock);
1495

1496 1497
	return 0;

J
J. Bruce Fields 已提交
1498 1499
out_drc_error:
	nfsd_idmap_shutdown(net);
1500 1501
out_idmap_error:
	nfsd_export_shutdown(net);
1502 1503 1504 1505 1506 1507
out_export_error:
	return retval;
}

static __net_exit void nfsd_exit_net(struct net *net)
{
J
J. Bruce Fields 已提交
1508 1509 1510
	struct nfsd_net *nn = net_generic(net, nfsd_net_id);

	nfsd_reply_cache_shutdown(nn);
1511
	nfsd_idmap_shutdown(net);
1512
	nfsd_export_shutdown(net);
1513
	nfsd_netns_free_versions(net_generic(net, nfsd_net_id));
1514 1515
}

1516
static struct pernet_operations nfsd_net_ops = {
1517 1518
	.init = nfsd_init_net,
	.exit = nfsd_exit_net,
1519 1520 1521 1522
	.id   = &nfsd_net_id,
	.size = sizeof(struct nfsd_net),
};

L
Linus Torvalds 已提交
1523 1524 1525 1526 1527
/*
 * Module init: bring up the nfsd subsystems one by one and register the
 * nfsd filesystem and the per-net operations.
 *
 * Returns 0 on success.  On failure, everything that was already set up
 * is undone in reverse order and the error of the failing step is
 * returned.  In particular, a failing register_pernet_subsys() must
 * unregister the filesystem (registered just before it) and must not
 * unregister the pernet operations, which were never registered.
 */
static int __init init_nfsd(void)
{
	int retval;
	printk(KERN_INFO "Installing knfsd (copyright (C) 1996 okir@monad.swb.de).\n");

	retval = register_cld_notifier();
	if (retval)
		return retval;
	retval = nfsd4_init_slabs();
	if (retval)
		goto out_unregister_notifier;
	retval = nfsd4_init_pnfs();
	if (retval)
		goto out_free_slabs;
	retval = nfsd_stat_init();	/* Statistics */
	if (retval)
		goto out_free_pnfs;
	retval = nfsd_drc_slab_create();
	if (retval)
		goto out_free_stat;
	nfsd_lockd_init();	/* lockd->nfsd callbacks */
	retval = create_proc_exports_entry();
	if (retval)
		goto out_free_lockd;
	retval = register_filesystem(&nfsd_fs_type);
	if (retval)
		goto out_free_exports;
	retval = register_pernet_subsys(&nfsd_net_ops);
	if (retval < 0)
		goto out_free_filesystem;
	return 0;
out_free_filesystem:
	unregister_filesystem(&nfsd_fs_type);
out_free_exports:
	remove_proc_entry("fs/nfs/exports", NULL);
	remove_proc_entry("fs/nfs", NULL);
out_free_lockd:
	nfsd_lockd_shutdown();
	nfsd_drc_slab_free();
out_free_stat:
	nfsd_stat_shutdown();
out_free_pnfs:
	nfsd4_exit_pnfs();
out_free_slabs:
	nfsd4_free_slabs();
out_unregister_notifier:
	unregister_cld_notifier();
	return retval;
}

/*
 * Module exit: undo everything init_nfsd() set up, starting with the
 * per-net operations.
 */
static void __exit exit_nfsd(void)
{
	unregister_pernet_subsys(&nfsd_net_ops);

	nfsd_drc_slab_free();

	/* The proc entry goes before the directory that contains it */
	remove_proc_entry("fs/nfs/exports", NULL);
	remove_proc_entry("fs/nfs", NULL);

	nfsd_stat_shutdown();
	nfsd_lockd_shutdown();
	nfsd4_free_slabs();
	nfsd4_exit_pnfs();

	unregister_filesystem(&nfsd_fs_type);
	unregister_cld_notifier();
}

/* Module metadata, and the init/exit entry points defined above. */
MODULE_AUTHOR("Olaf Kirch <okir@monad.swb.de>");
MODULE_LICENSE("GPL");
module_init(init_nfsd)
module_exit(exit_nfsd)