nfsctl.c 39.2 KB
Newer Older
1
// SPDX-License-Identifier: GPL-2.0-only
L
Linus Torvalds 已提交
2 3 4 5 6 7
/*
 * Syscall interface to knfsd.
 *
 * Copyright (C) 1995, 1996 Olaf Kirch <okir@monad.swb.de>
 */

8
#include <linux/slab.h>
9
#include <linux/namei.h>
10
#include <linux/ctype.h>
11
#include <linux/fs_context.h>
L
Linus Torvalds 已提交
12

13
#include <linux/sunrpc/svcsock.h>
14
#include <linux/lockd/lockd.h>
15
#include <linux/sunrpc/addr.h>
16
#include <linux/sunrpc/gss_api.h>
17
#include <linux/sunrpc/gss_krb5_enctypes.h>
18
#include <linux/sunrpc/rpc_pipe_fs.h>
19
#include <linux/module.h>
20
#include <linux/fsnotify.h>
L
Linus Torvalds 已提交
21

22
#include "idmap.h"
23 24
#include "nfsd.h"
#include "cache.h"
25
#include "state.h"
26
#include "netns.h"
27
#include "pnfs.h"
28

L
Linus Torvalds 已提交
29
/*
 *	We have a single directory with several nodes in it.  Each value
 *	below names one of those nodes; write_op[] is indexed by them.
 */
enum {
	NFSD_Root = 1,
	NFSD_List,
	NFSD_Export_Stats,
	NFSD_Export_features,
	NFSD_Fh,
	NFSD_FO_UnlockIP,
	NFSD_FO_UnlockFS,
	NFSD_Threads,
	NFSD_Pool_Threads,
	NFSD_Pool_Stats,
	NFSD_Reply_Cache_Stats,
	NFSD_Versions,
	NFSD_Ports,
	NFSD_MaxBlkSize,
	NFSD_MaxConnections,
	NFSD_SupportedEnctypes,
	/*
	 * The NFSv4-only entries MUST come last.  Otherwise we leave a hole
	 * in nfsd_files[] with !CONFIG_NFSD_V4 and simple_fill_super() goes
	 * oops.
	 */
#ifdef CONFIG_NFSD_V4
	NFSD_Leasetime,
	NFSD_Gracetime,
	NFSD_RecoveryDir,
	NFSD_V4EndGrace,
#endif
	NFSD_MaxReserved
};

/*
 * write() handlers for these nodes.  Every handler takes the file being
 * written, the transaction buffer and the number of bytes written.
 */
static ssize_t write_filehandle(struct file *file, char *buf, size_t size);
static ssize_t write_unlock_ip(struct file *file, char *buf, size_t size);
static ssize_t write_unlock_fs(struct file *file, char *buf, size_t size);
static ssize_t write_threads(struct file *file, char *buf, size_t size);
static ssize_t write_pool_threads(struct file *file, char *buf, size_t size);
static ssize_t write_versions(struct file *file, char *buf, size_t size);
static ssize_t write_ports(struct file *file, char *buf, size_t size);
static ssize_t write_maxblksize(struct file *file, char *buf, size_t size);
static ssize_t write_maxconn(struct file *file, char *buf, size_t size);
#ifdef CONFIG_NFSD_V4
static ssize_t write_leasetime(struct file *file, char *buf, size_t size);
static ssize_t write_gracetime(struct file *file, char *buf, size_t size);
static ssize_t write_recoverydir(struct file *file, char *buf, size_t size);
static ssize_t write_v4_end_grace(struct file *file, char *buf, size_t size);
#endif
L
Linus Torvalds 已提交
80

E
Eric Biggers 已提交
81
/*
 * Write handler for each node, indexed by the node's NFSD_* value.
 * Nodes without a handler are left as NULL entries, which
 * nfsctl_transaction_write() rejects with -EINVAL.
 */
static ssize_t (*const write_op[])(struct file *, char *, size_t) = {
	[NFSD_Fh]		= write_filehandle,
	[NFSD_FO_UnlockIP]	= write_unlock_ip,
	[NFSD_FO_UnlockFS]	= write_unlock_fs,
	[NFSD_Threads]		= write_threads,
	[NFSD_Pool_Threads]	= write_pool_threads,
	[NFSD_Versions]		= write_versions,
	[NFSD_Ports]		= write_ports,
	[NFSD_MaxBlkSize]	= write_maxblksize,
	[NFSD_MaxConnections]	= write_maxconn,
#ifdef CONFIG_NFSD_V4
	[NFSD_Leasetime]	= write_leasetime,
	[NFSD_Gracetime]	= write_gracetime,
	[NFSD_RecoveryDir]	= write_recoverydir,
	[NFSD_V4EndGrace]	= write_v4_end_grace,
#endif
};

/*
 * nfsctl_transaction_write - dispatch a write to the node's handler
 *
 * The inode number of @file selects the entry in write_op[].  The
 * handler's non-negative return value is recorded with
 * simple_transaction_set(); the caller then sees @size as the result.
 *
 * Returns @size on success, -EINVAL if the node has no write handler,
 * or the negative errno from simple_transaction_get() or the handler.
 */
static ssize_t nfsctl_transaction_write(struct file *file, const char __user *buf, size_t size, loff_t *pos)
{
	const ino_t node = file_inode(file)->i_ino;
	ssize_t (*handler)(struct file *, char *, size_t);
	char *payload;
	ssize_t reply_len;

	if (node >= ARRAY_SIZE(write_op))
		return -EINVAL;
	handler = write_op[node];
	if (!handler)
		return -EINVAL;

	payload = simple_transaction_get(file, buf, size);
	if (IS_ERR(payload))
		return PTR_ERR(payload);

	reply_len = handler(file, payload, size);
	if (reply_len < 0)
		return reply_len;

	simple_transaction_set(file, reply_len);
	return size;
}

120 121 122 123 124 125 126 127 128 129 130 131 132 133
/*
 * nfsctl_transaction_read - read the reply of a transaction file
 *
 * An attempt to read a transaction file without writing first causes
 * a 0-byte write, so that the file can return state information.
 */
static ssize_t nfsctl_transaction_read(struct file *file, char __user *buf, size_t size, loff_t *pos)
{
	if (file->private_data == NULL) {
		ssize_t err = nfsctl_transaction_write(file, buf, 0, pos);

		if (err < 0)
			return err;
	}

	return simple_transaction_read(file, buf, size, pos);
}

134
static const struct file_operations transaction_ops = {
L
Linus Torvalds 已提交
135
	.write		= nfsctl_transaction_write,
136
	.read		= nfsctl_transaction_read,
L
Linus Torvalds 已提交
137
	.release	= simple_transaction_release,
138
	.llseek		= default_llseek,
L
Linus Torvalds 已提交
139 140
};

141
static int exports_net_open(struct net *net, struct file *file)
L
Linus Torvalds 已提交
142
{
143 144
	int err;
	struct seq_file *seq;
145
	struct nfsd_net *nn = net_generic(net, nfsd_net_id);
146 147 148 149 150 151

	err = seq_open(file, &nfs_exports_op);
	if (err)
		return err;

	seq = file->private_data;
152
	seq->private = nn->svc_export_cache;
153
	return 0;
L
Linus Torvalds 已提交
154 155
}

156 157 158 159 160
/* Open the exports list for the network namespace of the current task. */
static int exports_proc_open(struct inode *inode, struct file *file)
{
	struct net *net = current->nsproxy->net_ns;

	return exports_net_open(net, file);
}

161 162 163 164 165
/* proc_ops for the exports listing opened via exports_proc_open(). */
static const struct proc_ops exports_proc_ops = {
	.proc_open	= exports_proc_open,
	.proc_read	= seq_read,
	.proc_lseek	= seq_lseek,
	.proc_release	= seq_release,
};

/* Open the exports list for the namespace stored in the superblock. */
static int exports_nfsd_open(struct inode *inode, struct file *file)
{
	struct net *net = inode->i_sb->s_fs_info;

	return exports_net_open(net, file);
}

static const struct file_operations exports_nfsd_operations = {
	.open		= exports_nfsd_open,
L
Linus Torvalds 已提交
175 176 177 178 179
	.read		= seq_read,
	.llseek		= seq_lseek,
	.release	= seq_release,
};

180 181 182 183 184 185 186 187 188 189 190
/*
 * Emit one line with two hex masks: NFSEXP_ALLFLAGS followed by
 * NFSEXP_SECINFO_FLAGS.
 */
static int export_features_show(struct seq_file *m, void *v)
{
	seq_printf(m, "0x%x 0x%x\n",
		   NFSEXP_ALLFLAGS,
		   NFSEXP_SECINFO_FLAGS);

	return 0;
}

/* Open @file as a single-record seq_file shown by export_features_show(). */
static int export_features_open(struct inode *inode, struct file *file)
{
	int status = single_open(file, export_features_show, NULL);

	return status;
}

191
static const struct file_operations export_features_operations = {
192 193 194 195 196 197
	.open		= export_features_open,
	.read		= seq_read,
	.llseek		= seq_lseek,
	.release	= single_release,
};

198
#if defined(CONFIG_SUNRPC_GSS) || defined(CONFIG_SUNRPC_GSS_MODULE)
199 200
static int supported_enctypes_show(struct seq_file *m, void *v)
{
201
	seq_printf(m, KRB5_SUPPORTED_ENCTYPES);
202 203 204 205 206 207 208 209
	return 0;
}

/* Open @file as a single-record seq_file shown by supported_enctypes_show(). */
static int supported_enctypes_open(struct inode *inode, struct file *file)
{
	int status = single_open(file, supported_enctypes_show, NULL);

	return status;
}

210
static const struct file_operations supported_enctypes_ops = {
211 212 213 214 215
	.open		= supported_enctypes_open,
	.read		= seq_read,
	.llseek		= seq_lseek,
	.release	= single_release,
};
216
#endif /* CONFIG_SUNRPC_GSS or CONFIG_SUNRPC_GSS_MODULE */
217

218
static const struct file_operations pool_stats_operations = {
219 220 221
	.open		= nfsd_pool_stats_open,
	.read		= seq_read,
	.llseek		= seq_lseek,
222
	.release	= nfsd_pool_stats_release,
223 224
};

225
static const struct file_operations reply_cache_stats_operations = {
226 227 228 229 230 231
	.open		= nfsd_reply_cache_stats_open,
	.read		= seq_read,
	.llseek		= seq_lseek,
	.release	= single_release,
};

L
Linus Torvalds 已提交
232 233 234 235 236
/*----------------------------------------------------------------------------*/
/*
 * payload - write methods
 */

A
Al Viro 已提交
237 238 239 240
static inline struct net *netns(struct file *file)
{
	return file_inode(file)->i_sb->s_fs_info;
}
L
Linus Torvalds 已提交
241

242
/*
243 244 245 246 247 248
 * write_unlock_ip - Release all locks used by a client
 *
 * Experimental.
 *
 * Input:
 *			buf:	'\n'-terminated C string containing a
249
 *				presentation format IP address
250 251 252 253 254 255
 *			size:	length of C string in @buf
 * Output:
 *	On success:	returns zero if all specified locks were released;
 *			returns one if one or more locks were not released
 *	On error:	return code is negative errno value
 */
256
static ssize_t write_unlock_ip(struct file *file, char *buf, size_t size)
257
{
258 259 260
	struct sockaddr_storage address;
	struct sockaddr *sap = (struct sockaddr *)&address;
	size_t salen = sizeof(address);
261
	char *fo_path;
A
Al Viro 已提交
262
	struct net *net = netns(file);
263 264 265 266 267 268 269 270 271 272 273 274

	/* sanity check */
	if (size == 0)
		return -EINVAL;

	if (buf[size-1] != '\n')
		return -EINVAL;

	fo_path = buf;
	if (qword_get(&buf, fo_path, size) < 0)
		return -EINVAL;

275
	if (rpc_pton(net, fo_path, size, sap, salen) == 0)
276 277
		return -EINVAL;

278
	return nlmsvc_unlock_all_by_ip(sap);
279 280
}

281
/*
282 283 284 285 286 287 288 289 290 291 292 293 294
 * write_unlock_fs - Release all locks on a local file system
 *
 * Experimental.
 *
 * Input:
 *			buf:	'\n'-terminated C string containing the
 *				absolute pathname of a local file system
 *			size:	length of C string in @buf
 * Output:
 *	On success:	returns zero if all specified locks were released;
 *			returns one if one or more locks were not released
 *	On error:	return code is negative errno value
 */
295
static ssize_t write_unlock_fs(struct file *file, char *buf, size_t size)
296
{
A
Al Viro 已提交
297
	struct path path;
298 299 300 301 302 303 304 305 306 307 308 309 310 311
	char *fo_path;
	int error;

	/* sanity check */
	if (size == 0)
		return -EINVAL;

	if (buf[size-1] != '\n')
		return -EINVAL;

	fo_path = buf;
	if (qword_get(&buf, fo_path, size) < 0)
		return -EINVAL;

A
Al Viro 已提交
312
	error = kern_path(fo_path, 0, &path);
313 314 315
	if (error)
		return error;

316 317 318 319 320 321 322 323 324
	/*
	 * XXX: Needs better sanity checking.  Otherwise we could end up
	 * releasing locks on the wrong file system.
	 *
	 * For example:
	 * 1.  Does the path refer to a directory?
	 * 2.  Is that directory a mount point, or
	 * 3.  Is that directory the root of an exported file system?
	 */
325
	error = nlmsvc_unlock_all_by_sb(path.dentry->d_sb);
326

A
Al Viro 已提交
327
	path_put(&path);
328 329 330
	return error;
}

331
/*
332 333 334 335 336 337 338 339 340 341 342 343 344 345 346 347 348 349 350 351
 * write_filehandle - Get a variable-length NFS file handle by path
 *
 * On input, the buffer contains a '\n'-terminated C string comprised of
 * three alphanumeric words separated by whitespace.  The string may
 * contain escape sequences.
 *
 * Input:
 *			buf:
 *				domain:		client domain name
 *				path:		export pathname
 *				maxsize:	numeric maximum size of
 *						@buf
 *			size:	length of C string in @buf
 * Output:
 *	On success:	passed-in buffer filled with '\n'-terminated C
 *			string containing a ASCII hex text version
 *			of the NFS file handle;
 *			return code is the size in bytes of the string
 *	On error:	return code is negative errno value
 */
L
Linus Torvalds 已提交
352 353 354
static ssize_t write_filehandle(struct file *file, char *buf, size_t size)
{
	char *dname, *path;
355
	int maxsize;
L
Linus Torvalds 已提交
356 357 358 359 360
	char *mesg = buf;
	int len;
	struct auth_domain *dom;
	struct knfsd_fh fh;

361 362 363
	if (size == 0)
		return -EINVAL;

L
Linus Torvalds 已提交
364 365 366 367 368 369
	if (buf[size-1] != '\n')
		return -EINVAL;
	buf[size-1] = 0;

	dname = mesg;
	len = qword_get(&mesg, dname, size);
370 371
	if (len <= 0)
		return -EINVAL;
L
Linus Torvalds 已提交
372 373 374
	
	path = dname+len+1;
	len = qword_get(&mesg, path, size);
375 376
	if (len <= 0)
		return -EINVAL;
L
Linus Torvalds 已提交
377 378 379 380 381 382 383

	len = get_int(&mesg, &maxsize);
	if (len)
		return len;

	if (maxsize < NFS_FHSIZE)
		return -EINVAL;
384
	maxsize = min(maxsize, NFS3_FHSIZE);
L
Linus Torvalds 已提交
385 386 387 388 389 390 391 392 393

	if (qword_get(&mesg, mesg, size)>0)
		return -EINVAL;

	/* we have all the words, they are in buf.. */
	dom = unix_domain_find(dname);
	if (!dom)
		return -ENOMEM;

A
Al Viro 已提交
394
	len = exp_rootfh(netns(file), dom, path, &fh,  maxsize);
L
Linus Torvalds 已提交
395 396 397 398
	auth_domain_put(dom);
	if (len)
		return len;
	
399 400
	mesg = buf;
	len = SIMPLE_TRANSACTION_LIMIT;
L
Linus Torvalds 已提交
401 402 403 404 405
	qword_addhex(&mesg, &len, (char*)&fh.fh_base, fh.fh_size);
	mesg[-1] = '\n';
	return mesg - buf;	
}

406
/*
407 408 409 410 411 412 413 414 415 416 417 418 419 420 421 422 423 424 425 426 427 428 429 430 431 432 433
 * write_threads - Start NFSD, or report the current number of running threads
 *
 * Input:
 *			buf:		ignored
 *			size:		zero
 * Output:
 *	On success:	passed-in buffer filled with '\n'-terminated C
 *			string numeric value representing the number of
 *			running NFSD threads;
 *			return code is the size in bytes of the string
 *	On error:	return code is zero
 *
 * OR
 *
 * Input:
 *			buf:		C string containing an unsigned
 *					integer value representing the
 *					number of NFSD threads to start
 *			size:		non-zero length of C string in @buf
 * Output:
 *	On success:	NFS service is started;
 *			passed-in buffer filled with '\n'-terminated C
 *			string numeric value representing the number of
 *			running NFSD threads;
 *			return code is the size in bytes of the string
 *	On error:	return code is zero or a negative errno value
 */
L
Linus Torvalds 已提交
434 435 436 437
static ssize_t write_threads(struct file *file, char *buf, size_t size)
{
	char *mesg = buf;
	int rv;
A
Al Viro 已提交
438
	struct net *net = netns(file);
439

L
Linus Torvalds 已提交
440 441 442 443 444
	if (size > 0) {
		int newthreads;
		rv = get_int(&mesg, &newthreads);
		if (rv)
			return rv;
445
		if (newthreads < 0)
L
Linus Torvalds 已提交
446
			return -EINVAL;
447
		rv = nfsd_svc(newthreads, net, file->f_cred);
448
		if (rv < 0)
L
Linus Torvalds 已提交
449
			return rv;
450
	} else
451
		rv = nfsd_nrthreads(net);
452

453
	return scnprintf(buf, SIMPLE_TRANSACTION_LIMIT, "%d\n", rv);
L
Linus Torvalds 已提交
454 455
}

456
/*
457 458 459 460 461 462 463 464 465 466 467 468 469 470 471 472 473 474 475 476 477
 * write_pool_threads - Set or report the current number of threads per pool
 *
 * Input:
 *			buf:		ignored
 *			size:		zero
 *
 * OR
 *
 * Input:
 * 			buf:		C string containing whitespace-
 * 					separated unsigned integer values
 *					representing the number of NFSD
 *					threads to start in each pool
 *			size:		non-zero length of C string in @buf
 * Output:
 *	On success:	passed-in buffer filled with '\n'-terminated C
 *			string containing integer values representing the
 *			number of NFSD threads in each pool;
 *			return code is the size in bytes of the string
 *	On error:	return code is zero or a negative errno value
 */
478 479 480 481 482 483 484 485 486
static ssize_t write_pool_threads(struct file *file, char *buf, size_t size)
{
	/* if size > 0, look for an array of number of threads per node
	 * and apply them  then write out number of threads per node as reply
	 */
	char *mesg = buf;
	int i;
	int rv;
	int len;
487
	int npools;
488
	int *nthreads;
A
Al Viro 已提交
489
	struct net *net = netns(file);
490

491
	mutex_lock(&nfsd_mutex);
492
	npools = nfsd_nrpools(net);
493 494 495 496 497 498
	if (npools == 0) {
		/*
		 * NFS is shut down.  The admin can start it by
		 * writing to the threads file but NOT the pool_threads
		 * file, sorry.  Report zero threads.
		 */
499
		mutex_unlock(&nfsd_mutex);
500 501 502 503 504
		strcpy(buf, "0\n");
		return strlen(buf);
	}

	nthreads = kcalloc(npools, sizeof(int), GFP_KERNEL);
505
	rv = -ENOMEM;
506
	if (nthreads == NULL)
507
		goto out_free;
508 509 510 511 512 513 514 515 516 517 518 519

	if (size > 0) {
		for (i = 0; i < npools; i++) {
			rv = get_int(&mesg, &nthreads[i]);
			if (rv == -ENOENT)
				break;		/* fewer numbers than pools */
			if (rv)
				goto out_free;	/* syntax error */
			rv = -EINVAL;
			if (nthreads[i] < 0)
				goto out_free;
		}
520
		rv = nfsd_set_nrthreads(i, nthreads, net);
521 522 523 524
		if (rv)
			goto out_free;
	}

525
	rv = nfsd_get_nrthreads(npools, nthreads, net);
526 527 528 529 530 531 532 533 534 535 536
	if (rv)
		goto out_free;

	mesg = buf;
	size = SIMPLE_TRANSACTION_LIMIT;
	for (i = 0; i < npools && size > 0; i++) {
		snprintf(mesg, size, "%d%c", nthreads[i], (i == npools-1 ? '\n' : ' '));
		len = strlen(mesg);
		size -= len;
		mesg += len;
	}
537
	rv = mesg - buf;
538 539
out_free:
	kfree(nthreads);
540
	mutex_unlock(&nfsd_mutex);
541 542 543
	return rv;
}

544
static ssize_t
545 546
nfsd_print_version_support(struct nfsd_net *nn, char *buf, int remaining,
		const char *sep, unsigned vers, int minor)
547
{
548
	const char *format = minor < 0 ? "%s%c%u" : "%s%c%u.%u";
549
	bool supported = !!nfsd_vers(nn, vers, NFSD_TEST);
550

551
	if (vers == 4 && minor >= 0 &&
552
	    !nfsd_minorversion(nn, minor, NFSD_TEST))
553
		supported = false;
554 555 556 557 558 559 560
	if (minor == 0 && supported)
		/*
		 * special case for backward compatability.
		 * +4.0 is never reported, it is implied by
		 * +4, unless -4.0 is present.
		 */
		return 0;
561 562 563 564
	return snprintf(buf, remaining, format, sep,
			supported ? '+' : '-', vers, minor);
}

565
/*
 * Parse an optional list of "+n", "-n", "+4.m" or "-4.m" words from @buf
 * and apply them, then write the current state of every available
 * version back into @buf.
 *
 * Returns the length of the reply, -EBUSY if a change is requested while
 * nn->nfsd_serv is set, or -EINVAL on malformed input or if the reply
 * does not fit.  Called from write_versions() with nfsd_mutex held.
 */
static ssize_t __write_versions(struct file *file, char *buf, size_t size)
{
	struct nfsd_net *nn = net_generic(netns(file), nfsd_net_id);
	char *cursor = buf;
	char *word, *after_num, sign;
	const char *sep;
	int len, num, remaining;
	ssize_t total = 0;

	if (size > 0) {
		/*
		 * Cannot change versions without updating
		 * nn->nfsd_serv->sv_xdrsize, and reallocing
		 * rq_argp and rq_resp
		 */
		if (nn->nfsd_serv)
			return -EBUSY;
		if (buf[size - 1] != '\n')
			return -EINVAL;
		buf[size - 1] = 0;

		word = cursor;
		len = qword_get(&cursor, word, size);
		if (len <= 0)
			return -EINVAL;
		do {
			enum vers_op cmd;
			unsigned minor;
			bool has_minor;

			/* an optional leading sign is skipped for the number */
			sign = *word;
			if (sign == '+' || sign == '-')
				num = simple_strtol(word + 1, &after_num, 0);
			else
				num = simple_strtol(word, &after_num, 0);

			/* only version 4 may carry a ".minor" suffix */
			has_minor = (*after_num == '.');
			if (has_minor) {
				if (num != 4)
					return -EINVAL;
				if (kstrtouint(after_num + 1, 0, &minor) < 0)
					return -EINVAL;
			}

			cmd = (sign == '-') ? NFSD_CLEAR : NFSD_SET;
			switch (num) {
			case 2:
			case 3:
				nfsd_vers(nn, num, cmd);
				break;
			case 4:
				if (has_minor) {
					if (nfsd_minorversion(nn, minor, cmd) < 0)
						return -EINVAL;
				} else if ((cmd == NFSD_SET) != nfsd_vers(nn, num, NFSD_TEST)) {
					/*
					 * Either we have +4 and no minors are enabled,
					 * or we have -4 and at least one minor is enabled.
					 * In either case, propagate 'cmd' to all minors.
					 */
					minor = 0;
					while (nfsd_minorversion(nn, minor, cmd) >= 0)
						minor++;
				}
				break;
			default:
				return -EINVAL;
			}
			word += len + 1;
		} while ((len = qword_get(&cursor, word, size)) > 0);
		/*
		 * If all get turned off, turn them back on, as
		 * having no versions is BAD
		 */
		nfsd_reset_versions(nn);
	}

	/* Now write current state into reply buffer */
	sep = "";
	remaining = SIMPLE_TRANSACTION_LIMIT;
	for (num = 2; num <= 4; num++) {
		int minor;

		if (!nfsd_vers(nn, num, NFSD_AVAIL))
			continue;

		/* -1 prints the bare version; v4 then walks its minors */
		minor = -1;
		do {
			len = nfsd_print_version_support(nn, buf, remaining,
							 sep, num, minor);
			if (len >= remaining)
				goto out;
			remaining -= len;
			buf += len;
			total += len;
			minor++;
			/* separate entries once something has been printed */
			if (len)
				sep = " ";
		} while (num == 4 && minor <= NFSD_SUPPORTED_MINOR_VERSION);
	}
out:
	len = snprintf(buf, remaining, "\n");
	if (len >= remaining)
		return -EINVAL;
	return total + len;
}

665
/*
666 667 668 669 670 671 672 673 674 675 676 677 678 679 680 681 682 683 684 685 686 687 688 689 690 691 692 693 694 695 696
 * write_versions - Set or report the available NFS protocol versions
 *
 * Input:
 *			buf:		ignored
 *			size:		zero
 * Output:
 *	On success:	passed-in buffer filled with '\n'-terminated C
 *			string containing positive or negative integer
 *			values representing the current status of each
 *			protocol version;
 *			return code is the size in bytes of the string
 *	On error:	return code is zero or a negative errno value
 *
 * OR
 *
 * Input:
 * 			buf:		C string containing whitespace-
 * 					separated positive or negative
 * 					integer values representing NFS
 * 					protocol versions to enable ("+n")
 * 					or disable ("-n")
 *			size:		non-zero length of C string in @buf
 * Output:
 *	On success:	status of zero or more protocol versions has
 *			been updated; passed-in buffer filled with
 *			'\n'-terminated C string containing positive
 *			or negative integer values representing the
 *			current status of each protocol version;
 *			return code is the size in bytes of the string
 *	On error:	return code is zero or a negative errno value
 */
697 698 699 700 701 702 703 704 705 706
static ssize_t write_versions(struct file *file, char *buf, size_t size)
{
	ssize_t rv;

	mutex_lock(&nfsd_mutex);
	rv = __write_versions(file, buf, size);
	mutex_unlock(&nfsd_mutex);
	return rv;
}

707 708 709 710
/*
 * Zero-length write.  Return a list of NFSD's current listener
 * transports.
 */
711
static ssize_t __write_ports_names(char *buf, struct net *net)
712
{
713 714 715
	struct nfsd_net *nn = net_generic(net, nfsd_net_id);

	if (nn->nfsd_serv == NULL)
716
		return 0;
717
	return svc_xprt_names(nn->nfsd_serv, buf, SIMPLE_TRANSACTION_LIMIT);
718 719
}

720 721 722 723 724
/*
 * A single 'fd' number was written, in which case it must be for
 * a socket of a supported family/protocol, and we use it as an
 * nfsd listener.
 */
725
static ssize_t __write_ports_addfd(char *buf, struct net *net, const struct cred *cred)
726 727 728
{
	char *mesg = buf;
	int fd, err;
729
	struct nfsd_net *nn = net_generic(net, nfsd_net_id);
730 731 732 733 734

	err = get_int(&mesg, &fd);
	if (err != 0 || fd < 0)
		return -EINVAL;

735 736 737 738 739
	if (svc_alien_sock(net, fd)) {
		printk(KERN_ERR "%s: socket net is different to NFSd's one\n", __func__);
		return -EINVAL;
	}

740
	err = nfsd_create_serv(net);
741 742 743
	if (err != 0)
		return err;

744
	err = svc_addsock(nn->nfsd_serv, fd, buf, SIMPLE_TRANSACTION_LIMIT, cred);
745
	if (err < 0) {
746
		nfsd_destroy(net);
747 748
		return err;
	}
749

750
	/* Decrease the count, but don't shut down the service */
751
	nn->nfsd_serv->sv_nrthreads--;
752
	return err;
753 754
}

755 756 757 758
/*
 * A transport listener is added by writing it's transport name and
 * a port number.
 */
759
static ssize_t __write_ports_addxprt(char *buf, struct net *net, const struct cred *cred)
760 761
{
	char transport[16];
762
	struct svc_xprt *xprt;
763
	int port, err;
764
	struct nfsd_net *nn = net_generic(net, nfsd_net_id);
765

766
	if (sscanf(buf, "%15s %5u", transport, &port) != 2)
767 768
		return -EINVAL;

769
	if (port < 1 || port > USHRT_MAX)
770 771
		return -EINVAL;

772
	err = nfsd_create_serv(net);
773 774 775
	if (err != 0)
		return err;

776
	err = svc_create_xprt(nn->nfsd_serv, transport, net,
777
				PF_INET, port, SVC_SOCK_ANONYMOUS, cred);
778
	if (err < 0)
779 780
		goto out_err;

781
	err = svc_create_xprt(nn->nfsd_serv, transport, net,
782
				PF_INET6, port, SVC_SOCK_ANONYMOUS, cred);
783 784
	if (err < 0 && err != -EAFNOSUPPORT)
		goto out_close;
785 786

	/* Decrease the count, but don't shut down the service */
787
	nn->nfsd_serv->sv_nrthreads--;
788
	return 0;
789
out_close:
790
	xprt = svc_find_xprt(nn->nfsd_serv, transport, net, PF_INET, port);
791 792 793 794 795
	if (xprt != NULL) {
		svc_close_xprt(xprt);
		svc_xprt_put(xprt);
	}
out_err:
796 797 798 799
	if (!list_empty(&nn->nfsd_serv->sv_permsocks))
		nn->nfsd_serv->sv_nrthreads--;
	 else
		nfsd_destroy(net);
800
	return err;
801 802
}

803 804
/*
 * Dispatch a write to the ports file on the shape of its input:
 * empty input lists the listeners, a leading digit adds a socket by
 * file descriptor, a leading letter adds a transport by name and port.
 * Anything else is -EINVAL.
 */
static ssize_t __write_ports(struct file *file, char *buf, size_t size,
			     struct net *net)
{
	const struct cred *cred;

	if (size == 0)
		return __write_ports_names(buf, net);

	cred = file->f_cred;
	if (isdigit(buf[0]))
		return __write_ports_addfd(buf, net, cred);
	if (isalpha(buf[0]))
		return __write_ports_addxprt(buf, net, cred);

	return -EINVAL;
}

818
/*
819 820 821 822 823 824 825 826 827 828 829 830 831 832 833 834 835 836
 * write_ports - Pass a socket file descriptor or transport name to listen on
 *
 * Input:
 *			buf:		ignored
 *			size:		zero
 * Output:
 *	On success:	passed-in buffer filled with a '\n'-terminated C
 *			string containing a whitespace-separated list of
 *			named NFSD listeners;
 *			return code is the size in bytes of the string
 *	On error:	return code is zero or a negative errno value
 *
 * OR
 *
 * Input:
 *			buf:		C string containing an unsigned
 *					integer value representing a bound
 *					but unconnected socket that is to be
837 838 839
 *					used as an NFSD listener; listen(3)
 *					must be called for a SOCK_STREAM
 *					socket, otherwise it is ignored
840 841 842 843 844 845 846 847 848 849 850 851 852 853 854 855 856 857 858 859 860
 *			size:		non-zero length of C string in @buf
 * Output:
 *	On success:	NFS service is started;
 *			passed-in buffer filled with a '\n'-terminated C
 *			string containing a unique alphanumeric name of
 *			the listener;
 *			return code is the size in bytes of the string
 *	On error:	return code is a negative errno value
 *
 * OR
 *
 * Input:
 *			buf:		C string containing a transport
 *					name and an unsigned integer value
 *					representing the port to listen on,
 *					separated by whitespace
 *			size:		non-zero length of C string in @buf
 * Output:
 *	On success:	returns zero; NFS service is started
 *	On error:	return code is a negative errno value
 */
861 862 863
static ssize_t write_ports(struct file *file, char *buf, size_t size)
{
	ssize_t rv;
864

865
	mutex_lock(&nfsd_mutex);
A
Al Viro 已提交
866
	rv = __write_ports(file, buf, size, netns(file));
867 868 869 870 871
	mutex_unlock(&nfsd_mutex);
	return rv;
}


872 873
/* Current NFS blksize setting; reported and updated by write_maxblksize(). */
int nfsd_max_blksize;

874
/*
875 876 877 878 879 880 881 882 883 884 885 886 887 888 889 890 891 892 893 894
 * write_maxblksize - Set or report the current NFS blksize
 *
 * Input:
 *			buf:		ignored
 *			size:		zero
 *
 * OR
 *
 * Input:
 * 			buf:		C string containing an unsigned
 * 					integer value representing the new
 * 					NFS blksize
 *			size:		non-zero length of C string in @buf
 * Output:
 *	On success:	passed-in buffer filled with '\n'-terminated C string
 *			containing numeric value of the current NFS blksize
 *			setting;
 *			return code is the size in bytes of the string
 *	On error:	return code is zero or a negative errno value
 */
895 896 897
static ssize_t write_maxblksize(struct file *file, char *buf, size_t size)
{
	char *mesg = buf;
A
Al Viro 已提交
898
	struct nfsd_net *nn = net_generic(netns(file), nfsd_net_id);
899

900 901 902 903 904 905 906 907
	if (size > 0) {
		int bsize;
		int rv = get_int(&mesg, &bsize);
		if (rv)
			return rv;
		/* force bsize into allowed range and
		 * required alignment.
		 */
908 909
		bsize = max_t(int, bsize, 1024);
		bsize = min_t(int, bsize, NFSSVC_MAXBLKSIZE);
910
		bsize &= ~(1024-1);
911
		mutex_lock(&nfsd_mutex);
912
		if (nn->nfsd_serv) {
913
			mutex_unlock(&nfsd_mutex);
914 915 916
			return -EBUSY;
		}
		nfsd_max_blksize = bsize;
917
		mutex_unlock(&nfsd_mutex);
918
	}
919 920 921

	return scnprintf(buf, SIMPLE_TRANSACTION_LIMIT, "%d\n",
							nfsd_max_blksize);
922 923
}

924
/*
 * write_maxconn - Set or report the current max number of connections
 *
 * Input:
 *			buf:		ignored
 *			size:		zero
 * OR
 *
 * Input:
 *			buf:		C string containing an unsigned
 *					integer value representing the new
 *					number of max connections
 *			size:		non-zero length of C string in @buf
 * Output:
 *	On success:	passed-in buffer filled with '\n'-terminated C string
 *			containing numeric value of max_connections setting
 *			for this net namespace;
 *			return code is the size in bytes of the string
 *	On error:	return code is zero or a negative errno value
 */
static ssize_t write_maxconn(struct file *file, char *buf, size_t size)
{
	struct nfsd_net *nn = net_generic(netns(file), nfsd_net_id);
	unsigned int limit = nn->max_connections;
	char *cursor = buf;

	if (size > 0) {
		int err = get_uint(&cursor, &limit);

		if (err)
			return err;
		nn->max_connections = limit;
	}

	return scnprintf(buf, SIMPLE_TRANSACTION_LIMIT, "%u\n", limit);
}

961
#ifdef CONFIG_NFSD_V4
962
static ssize_t __nfsd4_write_time(struct file *file, char *buf, size_t size,
963
				  time64_t *time, struct nfsd_net *nn)
L
Linus Torvalds 已提交
964 965
{
	char *mesg = buf;
966
	int rv, i;
L
Linus Torvalds 已提交
967 968

	if (size > 0) {
969
		if (nn->nfsd_serv)
970
			return -EBUSY;
971
		rv = get_int(&mesg, &i);
L
Linus Torvalds 已提交
972 973
		if (rv)
			return rv;
974 975 976 977 978 979 980 981 982 983 984 985
		/*
		 * Some sanity checking.  We don't have a reason for
		 * these particular numbers, but problems with the
		 * extremes are:
		 *	- Too short: the briefest network outage may
		 *	  cause clients to lose all their locks.  Also,
		 *	  the frequent polling may be wasteful.
		 *	- Too long: do you really want reboot recovery
		 *	  to take more than an hour?  Or to make other
		 *	  clients wait an hour before being able to
		 *	  revoke a dead client's locks?
		 */
986
		if (i < 10 || i > 3600)
L
Linus Torvalds 已提交
987
			return -EINVAL;
988
		*time = i;
L
Linus Torvalds 已提交
989
	}
990

991
	return scnprintf(buf, SIMPLE_TRANSACTION_LIMIT, "%lld\n", *time);
992 993
}

994
static ssize_t nfsd4_write_time(struct file *file, char *buf, size_t size,
995
				time64_t *time, struct nfsd_net *nn)
996 997 998 999
{
	ssize_t rv;

	mutex_lock(&nfsd_mutex);
1000
	rv = __nfsd4_write_time(file, buf, size, time, nn);
1001 1002
	mutex_unlock(&nfsd_mutex);
	return rv;
L
Linus Torvalds 已提交
1003 1004
}

1005
/*
1006 1007 1008 1009 1010 1011 1012 1013 1014 1015 1016 1017 1018 1019 1020 1021 1022 1023 1024 1025
 * write_leasetime - Set or report the current NFSv4 lease time
 *
 * Input:
 *			buf:		ignored
 *			size:		zero
 *
 * OR
 *
 * Input:
 *			buf:		C string containing an unsigned
 *					integer value representing the new
 *					NFSv4 lease expiry time
 *			size:		non-zero length of C string in @buf
 * Output:
 *	On success:	passed-in buffer filled with '\n'-terminated C
 *			string containing unsigned integer value of the
 *			current lease expiry time;
 *			return code is the size in bytes of the string
 *	On error:	return code is zero or a negative errno value
 */
1026 1027
static ssize_t write_leasetime(struct file *file, char *buf, size_t size)
{
A
Al Viro 已提交
1028
	struct nfsd_net *nn = net_generic(netns(file), nfsd_net_id);
1029
	return nfsd4_write_time(file, buf, size, &nn->nfsd4_lease, nn);
1030 1031
}

1032
/*
1033 1034 1035 1036 1037 1038 1039 1040 1041 1042 1043
 * write_gracetime - Set or report current NFSv4 grace period time
 *
 * As above, but sets the time of the NFSv4 grace period.
 *
 * Note this should never be set to less than the *previous*
 * lease-period time, but we don't try to enforce this.  (In the common
 * case (a new boot), we don't know what the previous lease time was
 * anyway.)
 */
static ssize_t write_gracetime(struct file *file, char *buf, size_t size)
{
	struct nfsd_net *nn = net_generic(netns(file), nfsd_net_id);
	time64_t *grace = &nn->nfsd4_grace;

	/* Same path as the lease time, but operating on the grace period. */
	return nfsd4_write_time(file, buf, size, grace, nn);
}

1048 1049
/*
 * Unlocked worker for write_recoverydir().
 *
 * With @size == 0 only the current recovery directory is reported.
 * Otherwise @buf must hold at most PATH_MAX bytes ending in '\n'; the first
 * word in it is passed to nfs4_reset_recoverydir().  Changing the directory
 * is refused with -EBUSY while nn->nfsd_serv is set.
 *
 * Returns the length of the reply written into @buf, or a negative errno.
 */
static ssize_t __write_recoverydir(struct file *file, char *buf, size_t size,
				   struct nfsd_net *nn)
{
	char *cursor = buf;
	char *path = buf;
	int err;

	if (size == 0)
		goto report;

	if (nn->nfsd_serv)
		return -EBUSY;
	if (size > PATH_MAX)
		return -EINVAL;
	if (buf[size - 1] != '\n')
		return -EINVAL;
	/* Replace the trailing newline with a string terminator. */
	buf[size - 1] = '\0';

	/* qword_get() extracts the first word in place, over the input. */
	if (qword_get(&cursor, path, size) <= 0)
		return -EINVAL;

	err = nfs4_reset_recoverydir(path);
	if (err)
		return err;

report:
	return scnprintf(buf, SIMPLE_TRANSACTION_LIMIT, "%s\n",
			 nfs4_recoverydir());
}
1075

1076
/*
1077 1078 1079 1080 1081 1082 1083 1084 1085 1086 1087 1088 1089 1090 1091 1092 1093 1094 1095 1096
 * write_recoverydir - Set or report the pathname of the recovery directory
 *
 * Input:
 *			buf:		ignored
 *			size:		zero
 *
 * OR
 *
 * Input:
 *			buf:		C string containing the pathname
 *					of the directory on a local file
 *					system containing permanent NFSv4
 *					recovery data
 *			size:		non-zero length of C string in @buf
 * Output:
 *	On success:	passed-in buffer filled with '\n'-terminated C string
 *			containing the current recovery pathname setting;
 *			return code is the size in bytes of the string
 *	On error:	return code is zero or a negative errno value
 */
1097 1098 1099
static ssize_t write_recoverydir(struct file *file, char *buf, size_t size)
{
	struct nfsd_net *nn = net_generic(netns(file), nfsd_net_id);
	ssize_t result;

	/* The worker runs entirely under nfsd_mutex. */
	mutex_lock(&nfsd_mutex);
	result = __write_recoverydir(file, buf, size, nn);
	mutex_unlock(&nfsd_mutex);

	return result;
}

1108
/*
1109 1110 1111 1112 1113 1114 1115 1116 1117 1118 1119 1120 1121 1122 1123 1124 1125 1126 1127 1128 1129
 * write_v4_end_grace - release grace period for nfsd's v4.x lock manager
 *
 * Input:
 *			buf:		ignored
 *			size:		zero
 * OR
 *
 * Input:
 * 			buf:		any value
 *			size:		non-zero length of C string in @buf
 * Output:
 *			passed-in buffer filled with "Y" or "N" with a newline
 *			and NUL-terminated C string. This indicates whether
 *			the grace period has ended in the current net
 *			namespace. Return code is the size in bytes of the
 *			string. Writing a string that starts with 'Y', 'y', or
 *			'1' to the file will end the grace period for nfsd's v4
 *			lock manager.
 */
static ssize_t write_v4_end_grace(struct file *file, char *buf, size_t size)
{
	struct nfsd_net *nn = net_generic(netns(file), nfsd_net_id);
	char state;

	if (size > 0) {
		char request = buf[0];

		/* Only 'Y', 'y' or '1' is accepted as a request. */
		if (request != 'Y' && request != 'y' && request != '1')
			return -EINVAL;
		/* Refused unless nn->nfsd_serv is set. */
		if (!nn->nfsd_serv)
			return -EBUSY;
		nfsd4_end_grace(nn);
	}

	/* Reads and writes both answer with the current grace state. */
	state = nn->grace_ended ? 'Y' : 'N';
	return scnprintf(buf, SIMPLE_TRANSACTION_LIMIT, "%c\n", state);
}

1150
#endif
1151

L
Linus Torvalds 已提交
1152 1153 1154 1155 1156
/*----------------------------------------------------------------------------*/
/*
 *	populating the filesystem.
 */

1157 1158 1159 1160 1161 1162 1163 1164 1165 1166 1167 1168 1169 1170 1171
/*
 * Allocate and initialise a new inode on @sb with the given @mode
 * (basically a copy of rpc_get_inode).
 *
 * Directories additionally get the simple_dir operations and one extra
 * link.  Returns NULL if the inode cannot be allocated.
 */
static struct inode *nfsd_get_inode(struct super_block *sb, umode_t mode)
{
	struct inode *node;

	node = new_inode(sb);
	if (!node)
		return NULL;

	/* Following advice from simple_fill_super documentation: */
	node->i_ino = iunique(sb, NFSD_MaxReserved);
	node->i_mode = mode;

	/* All three timestamps receive the same "now" value. */
	node->i_ctime = current_time(node);
	node->i_mtime = node->i_ctime;
	node->i_atime = node->i_mtime;

	if ((mode & S_IFMT) == S_IFDIR) {
		node->i_fop = &simple_dir_operations;
		node->i_op = &simple_dir_inode_operations;
		inc_nlink(node);
	}

	return node;
}

1179
/*
 * Attach a freshly created inode of type @mode to @dentry inside @dir.
 *
 * When @ncl is non-NULL the new inode keeps a counted reference to it in
 * i_private.  Returns 0 on success or -ENOMEM if no inode could be
 * allocated.
 */
static int __nfsd_mkdir(struct inode *dir, struct dentry *dentry, umode_t mode, struct nfsdfs_client *ncl)
{
	struct inode *child = nfsd_get_inode(dir->i_sb, mode);

	if (!child)
		return -ENOMEM;

	if (ncl) {
		/* The inode's i_private pointer owns this reference. */
		kref_get(&ncl->cl_ref);
		child->i_private = ncl;
	}

	d_add(dentry, child);
	inc_nlink(dir);
	fsnotify_mkdir(dir, dentry);

	return 0;
}

static struct dentry *nfsd_mkdir(struct dentry *parent, struct nfsdfs_client *ncl, char *name)
{
	struct inode *dir = parent->d_inode;
	struct dentry *dentry;
	int ret = -ENOMEM;

	inode_lock(dir);
	dentry = d_alloc_name(parent, name);
	if (!dentry)
		goto out_err;
1206
	ret = __nfsd_mkdir(d_inode(parent), dentry, S_IFDIR | 0600, ncl);
1207 1208 1209 1210 1211 1212
	if (ret)
		goto out_err;
out:
	inode_unlock(dir);
	return dentry;
out_err:
1213
	dput(dentry);
1214 1215 1216 1217
	dentry = ERR_PTR(ret);
	goto out;
}

J
J. Bruce Fields 已提交
1218 1219 1220 1221 1222 1223 1224 1225
/*
 * Detach the nfsdfs_client stored in @inode's i_private and drop the
 * reference that pointer represented.
 */
static void clear_ncl(struct inode *inode)
{
	struct nfsdfs_client *client;

	client = inode->i_private;
	inode->i_private = NULL;

	kref_put(&client->cl_ref, client->cl_release);
}

1226
static struct nfsdfs_client *__get_nfsdfs_client(struct inode *inode)
J
J. Bruce Fields 已提交
1227 1228 1229 1230 1231 1232 1233 1234 1235 1236 1237 1238
{
	struct nfsdfs_client *nc = inode->i_private;

	if (nc)
		kref_get(&nc->cl_ref);
	return nc;
}

/*
 * Variant of __get_nfsdfs_client() that holds @inode's lock in shared mode
 * around the lookup.
 */
struct nfsdfs_client *get_nfsdfs_client(struct inode *inode)
{
	struct nfsdfs_client *client;

	inode_lock_shared(inode);
	client = __get_nfsdfs_client(inode);
	inode_unlock_shared(inode);

	return client;
}
/* from __rpc_unlink */
/*
 * Remove one entry @dentry from directory inode @dir.
 *
 * The client reference stored in the entry's inode is dropped first, then
 * the entry is unlinked and deleted.  A failing simple_unlink() is only
 * reported through a one-time warning.
 */
static void nfsdfs_remove_file(struct inode *dir, struct dentry *dentry)
{
	int ret;

	/* Drop the nfsdfs_client reference kept in the inode's i_private. */
	clear_ncl(d_inode(dentry));
	/* Extra dentry reference held across the unlink/delete pair below. */
	dget(dentry);
	ret = simple_unlink(dir, dentry);
	d_delete(dentry);
	dput(dentry);
	WARN_ON_ONCE(ret);
}

static void nfsdfs_remove_files(struct dentry *root)
{
	struct dentry *dentry, *tmp;

	list_for_each_entry_safe(dentry, tmp, &root->d_subdirs, d_child) {
		if (!simple_positive(dentry)) {
			WARN_ON_ONCE(1); /* I think this can't happen? */
			continue;
		}
		nfsdfs_remove_file(d_inode(root), dentry);
	}
}

/* XXX: cut'n'paste from simple_fill_super; figure out if we could share
 * code instead. */
static  int nfsdfs_create_files(struct dentry *root,
1273 1274
				const struct tree_descr *files,
				struct dentry **fdentries)
J
J. Bruce Fields 已提交
1275 1276 1277 1278 1279 1280 1281 1282 1283 1284 1285 1286 1287 1288 1289 1290 1291 1292 1293 1294 1295
{
	struct inode *dir = d_inode(root);
	struct inode *inode;
	struct dentry *dentry;
	int i;

	inode_lock(dir);
	for (i = 0; files->name && files->name[0]; i++, files++) {
		dentry = d_alloc_name(root, files->name);
		if (!dentry)
			goto out;
		inode = nfsd_get_inode(d_inode(root)->i_sb,
					S_IFREG | files->mode);
		if (!inode) {
			dput(dentry);
			goto out;
		}
		inode->i_fop = files->ops;
		inode->i_private = __get_nfsdfs_client(dir);
		d_add(dentry, inode);
		fsnotify_create(dir, dentry);
1296 1297
		if (fdentries)
			fdentries[i] = dentry;
J
J. Bruce Fields 已提交
1298 1299 1300 1301 1302 1303 1304 1305 1306
	}
	inode_unlock(dir);
	return 0;
out:
	nfsdfs_remove_files(root);
	inode_unlock(dir);
	return -ENOMEM;
}

1307
/* on success, returns positive number unique to that client. */
J
J. Bruce Fields 已提交
1308
struct dentry *nfsd_client_mkdir(struct nfsd_net *nn,
1309 1310 1311
				 struct nfsdfs_client *ncl, u32 id,
				 const struct tree_descr *files,
				 struct dentry **fdentries)
1312
{
J
J. Bruce Fields 已提交
1313
	struct dentry *dentry;
1314
	char name[11];
J
J. Bruce Fields 已提交
1315
	int ret;
1316

1317
	sprintf(name, "%u", id);
1318

J
J. Bruce Fields 已提交
1319 1320 1321
	dentry = nfsd_mkdir(nn->nfsd_client_dir, ncl, name);
	if (IS_ERR(dentry)) /* XXX: tossing errors? */
		return NULL;
1322
	ret = nfsdfs_create_files(dentry, files, fdentries);
J
J. Bruce Fields 已提交
1323 1324 1325 1326 1327
	if (ret) {
		nfsd_client_rmdir(dentry);
		return NULL;
	}
	return dentry;
1328 1329 1330 1331 1332 1333 1334 1335 1336
}

/* Taken from __rpc_rmdir: */
/*
 * Tear down a client directory: remove its files, drop the directory's own
 * client reference, then remove the directory itself.  Everything happens
 * under the parent directory's inode lock.
 */
void nfsd_client_rmdir(struct dentry *dentry)
{
	struct inode *parent_inode = d_inode(dentry->d_parent);
	struct inode *client_inode = d_inode(dentry);
	int err;

	inode_lock(parent_inode);

	nfsdfs_remove_files(dentry);
	clear_ncl(client_inode);

	/* Extra reference held until after d_delete(). */
	dget(dentry);
	err = simple_rmdir(parent_inode, dentry);
	WARN_ON_ONCE(err);
	fsnotify_rmdir(parent_inode, dentry);
	d_delete(dentry);
	dput(dentry);

	inode_unlock(parent_inode);
}

1349
static int nfsd_fill_super(struct super_block *sb, struct fs_context *fc)
L
Linus Torvalds 已提交
1350
{
1351 1352 1353 1354 1355
	struct nfsd_net *nn = net_generic(current->nsproxy->net_ns,
							nfsd_net_id);
	struct dentry *dentry;
	int ret;

1356
	static const struct tree_descr nfsd_files[] = {
1357
		[NFSD_List] = {"exports", &exports_nfsd_operations, S_IRUGO},
A
Amir Goldstein 已提交
1358 1359
		/* Per-export io stats use same ops as exports file */
		[NFSD_Export_Stats] = {"export_stats", &exports_nfsd_operations, S_IRUGO},
1360 1361
		[NFSD_Export_features] = {"export_features",
					&export_features_operations, S_IRUGO},
1362 1363
		[NFSD_FO_UnlockIP] = {"unlock_ip",
					&transaction_ops, S_IWUSR|S_IRUSR},
1364 1365
		[NFSD_FO_UnlockFS] = {"unlock_filesystem",
					&transaction_ops, S_IWUSR|S_IRUSR},
L
Linus Torvalds 已提交
1366 1367
		[NFSD_Fh] = {"filehandle", &transaction_ops, S_IWUSR|S_IRUSR},
		[NFSD_Threads] = {"threads", &transaction_ops, S_IWUSR|S_IRUSR},
1368
		[NFSD_Pool_Threads] = {"pool_threads", &transaction_ops, S_IWUSR|S_IRUSR},
1369
		[NFSD_Pool_Stats] = {"pool_stats", &pool_stats_operations, S_IRUGO},
1370
		[NFSD_Reply_Cache_Stats] = {"reply_cache_stats", &reply_cache_stats_operations, S_IRUGO},
1371
		[NFSD_Versions] = {"versions", &transaction_ops, S_IWUSR|S_IRUSR},
1372
		[NFSD_Ports] = {"portlist", &transaction_ops, S_IWUSR|S_IRUGO},
1373
		[NFSD_MaxBlkSize] = {"max_block_size", &transaction_ops, S_IWUSR|S_IRUGO},
1374
		[NFSD_MaxConnections] = {"max_connections", &transaction_ops, S_IWUSR|S_IRUGO},
1375
#if defined(CONFIG_SUNRPC_GSS) || defined(CONFIG_SUNRPC_GSS_MODULE)
1376
		[NFSD_SupportedEnctypes] = {"supported_krb5_enctypes", &supported_enctypes_ops, S_IRUGO},
1377
#endif /* CONFIG_SUNRPC_GSS or CONFIG_SUNRPC_GSS_MODULE */
L
Linus Torvalds 已提交
1378 1379
#ifdef CONFIG_NFSD_V4
		[NFSD_Leasetime] = {"nfsv4leasetime", &transaction_ops, S_IWUSR|S_IRUSR},
1380
		[NFSD_Gracetime] = {"nfsv4gracetime", &transaction_ops, S_IWUSR|S_IRUSR},
1381
		[NFSD_RecoveryDir] = {"nfsv4recoverydir", &transaction_ops, S_IWUSR|S_IRUSR},
1382
		[NFSD_V4EndGrace] = {"v4_end_grace", &transaction_ops, S_IWUSR|S_IRUGO},
L
Linus Torvalds 已提交
1383 1384 1385
#endif
		/* last one */ {""}
	};
1386

1387 1388 1389 1390 1391 1392 1393 1394
	ret = simple_fill_super(sb, 0x6e667364, nfsd_files);
	if (ret)
		return ret;
	dentry = nfsd_mkdir(sb->s_root, NULL, "clients");
	if (IS_ERR(dentry))
		return PTR_ERR(dentry);
	nn->nfsd_client_dir = dentry;
	return 0;
L
Linus Torvalds 已提交
1395
}
1396

1397 1398
static int nfsd_fs_get_tree(struct fs_context *fc)
{
A
Al Viro 已提交
1399
	return get_tree_keyed(fc, nfsd_fill_super, get_net(fc->net_ns));
L
Linus Torvalds 已提交
1400 1401
}

1402
static void nfsd_fs_free_fc(struct fs_context *fc)
L
Linus Torvalds 已提交
1403
{
1404 1405 1406 1407 1408 1409 1410 1411 1412 1413
	if (fc->s_fs_info)
		put_net(fc->s_fs_info);
}

/*
 * fs_context operations for the nfsd filesystem; installed into fc->ops by
 * nfsd_init_fs_context().
 */
static const struct fs_context_operations nfsd_fs_context_ops = {
	.free		= nfsd_fs_free_fc,
	.get_tree	= nfsd_fs_get_tree,
};

static int nfsd_init_fs_context(struct fs_context *fc)
L
Linus Torvalds 已提交
1414
{
1415 1416 1417 1418
	put_user_ns(fc->user_ns);
	fc->user_ns = get_user_ns(fc->net_ns->user_ns);
	fc->ops = &nfsd_fs_context_ops;
	return 0;
1419 1420 1421 1422 1423 1424
}

/*
 * kill_sb hook: shut down the nfsd threads of the namespace stored in the
 * superblock, destroy the superblock, then drop the namespace reference.
 */
static void nfsd_umount(struct super_block *sb)
{
	/* Fetched up front: the pointer is still needed after the sb is killed. */
	struct net *ns = sb->s_fs_info;

	nfsd_shutdown_threads(ns);

	kill_litter_super(sb);
	put_net(ns);
}

static struct file_system_type nfsd_fs_type = {
	.owner		= THIS_MODULE,
	.name		= "nfsd",
1434
	.init_fs_context = nfsd_init_fs_context,
1435
	.kill_sb	= nfsd_umount,
L
Linus Torvalds 已提交
1436
};
1437
MODULE_ALIAS_FS("nfsd");
L
Linus Torvalds 已提交
1438

1439 1440 1441 1442 1443 1444 1445 1446
#ifdef CONFIG_PROC_FS
/*
 * Create the proc directory "fs/nfs" and an "exports" entry inside it.
 * Returns 0 on success, or -ENOMEM if either step fails (the directory is
 * removed again when only the second step failed).
 */
static int create_proc_exports_entry(void)
{
	struct proc_dir_entry *nfs_dir;
	struct proc_dir_entry *exports;

	nfs_dir = proc_mkdir("fs/nfs", NULL);
	if (!nfs_dir)
		return -ENOMEM;

	exports = proc_create("exports", 0, nfs_dir, &exports_proc_ops);
	if (exports)
		return 0;

	remove_proc_entry("fs/nfs", NULL);
	return -ENOMEM;
}
#else /* CONFIG_PROC_FS */
/* Without CONFIG_PROC_FS there is nothing to create. */
static int create_proc_exports_entry(void)
{
	return 0;
}
#endif

1461
/*
 * Per-net identifier for nfsd: referenced by nfsd_net_ops.id and passed to
 * net_generic() to look up a namespace's struct nfsd_net.
 */
unsigned int nfsd_net_id;
1462 1463 1464 1465

static __net_init int nfsd_init_net(struct net *net)
{
	int retval;
1466
	struct nfsd_net *nn = net_generic(net, nfsd_net_id);
1467 1468 1469 1470

	retval = nfsd_export_init(net);
	if (retval)
		goto out_export_error;
1471 1472 1473
	retval = nfsd_idmap_init(net);
	if (retval)
		goto out_idmap_error;
1474 1475
	nn->nfsd_versions = NULL;
	nn->nfsd4_minorversions = NULL;
J
J. Bruce Fields 已提交
1476 1477 1478
	retval = nfsd_reply_cache_init(nn);
	if (retval)
		goto out_drc_error;
1479 1480
	nn->nfsd4_lease = 90;	/* default lease time */
	nn->nfsd4_grace = 90;
1481
	nn->somebody_reclaimed = false;
1482
	nn->track_reclaim_completes = false;
1483
	nn->clverifier_counter = prandom_u32();
1484 1485
	nn->clientid_base = prandom_u32();
	nn->clientid_counter = nn->clientid_base + 1;
1486
	nn->s2s_cp_cl_id = nn->clientid_counter++;
1487 1488 1489

	atomic_set(&nn->ntf_refcnt, 0);
	init_waitqueue_head(&nn->ntf_wq);
1490
	seqlock_init(&nn->boot_lock);
1491

1492 1493
	return 0;

J
J. Bruce Fields 已提交
1494 1495
out_drc_error:
	nfsd_idmap_shutdown(net);
1496 1497
out_idmap_error:
	nfsd_export_shutdown(net);
1498 1499 1500 1501 1502 1503
out_export_error:
	return retval;
}

static __net_exit void nfsd_exit_net(struct net *net)
{
J
J. Bruce Fields 已提交
1504 1505 1506
	struct nfsd_net *nn = net_generic(net, nfsd_net_id);

	nfsd_reply_cache_shutdown(nn);
1507
	nfsd_idmap_shutdown(net);
1508
	nfsd_export_shutdown(net);
1509
	nfsd_netns_free_versions(net_generic(net, nfsd_net_id));
1510 1511
}

1512
static struct pernet_operations nfsd_net_ops = {
1513 1514
	.init = nfsd_init_net,
	.exit = nfsd_exit_net,
1515 1516 1517 1518
	.id   = &nfsd_net_id,
	.size = sizeof(struct nfsd_net),
};

L
Linus Torvalds 已提交
1519 1520 1521 1522 1523
/*
 * Module initialisation.  Each step that fails jumps to the label that
 * undoes the steps completed before it, in reverse order.
 *
 * Returns 0 on success or the error code of the failing step.
 */
static int __init init_nfsd(void)
{
	int err;

	printk(KERN_INFO "Installing knfsd (copyright (C) 1996 okir@monad.swb.de).\n");

	err = register_cld_notifier();
	if (err)
		return err;

	err = nfsd4_init_slabs();
	if (err)
		goto undo_notifier;

	err = nfsd4_init_pnfs();
	if (err)
		goto undo_slabs;

	err = nfsd_stat_init();	/* Statistics */
	if (err)
		goto undo_pnfs;

	err = nfsd_drc_slab_create();
	if (err)
		goto undo_stat;

	nfsd_lockd_init();	/* lockd->nfsd callbacks */

	err = create_proc_exports_entry();
	if (err)
		goto undo_lockd;

	err = register_filesystem(&nfsd_fs_type);
	if (err)
		goto undo_exports;

	err = register_pernet_subsys(&nfsd_net_ops);
	if (err < 0)
		goto undo_filesystem;

	return 0;

undo_filesystem:
	unregister_filesystem(&nfsd_fs_type);
undo_exports:
	remove_proc_entry("fs/nfs/exports", NULL);
	remove_proc_entry("fs/nfs", NULL);
undo_lockd:
	nfsd_lockd_shutdown();
	nfsd_drc_slab_free();
undo_stat:
	nfsd_stat_shutdown();
undo_pnfs:
	nfsd4_exit_pnfs();
undo_slabs:
	nfsd4_free_slabs();
undo_notifier:
	unregister_cld_notifier();
	return err;
}

/*
 * Module teardown: releases everything init_nfsd() set up.
 */
static void __exit exit_nfsd(void)
{
	/* Per-namespace state goes first. */
	unregister_pernet_subsys(&nfsd_net_ops);
	nfsd_drc_slab_free();

	/* /proc entries: the file before its directory. */
	remove_proc_entry("fs/nfs/exports", NULL);
	remove_proc_entry("fs/nfs", NULL);

	nfsd_stat_shutdown();
	nfsd_lockd_shutdown();

	nfsd4_free_slabs();
	nfsd4_exit_pnfs();

	unregister_filesystem(&nfsd_fs_type);
	unregister_cld_notifier();
}

/*
 * Module metadata, and registration of init_nfsd()/exit_nfsd() as the
 * module's init and exit routines.
 */
MODULE_AUTHOR("Olaf Kirch <okir@monad.swb.de>");
MODULE_LICENSE("GPL");
module_init(init_nfsd)
module_exit(exit_nfsd)