nfs4proc.c 189.6 KB
Newer Older
L
Linus Torvalds 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41
/*
 *  fs/nfs/nfs4proc.c
 *
 *  Client-side procedure declarations for NFSv4.
 *
 *  Copyright (c) 2002 The Regents of the University of Michigan.
 *  All rights reserved.
 *
 *  Kendrick Smith <kmsmith@umich.edu>
 *  Andy Adamson   <andros@umich.edu>
 *
 *  Redistribution and use in source and binary forms, with or without
 *  modification, are permitted provided that the following conditions
 *  are met:
 *
 *  1. Redistributions of source code must retain the above copyright
 *     notice, this list of conditions and the following disclaimer.
 *  2. Redistributions in binary form must reproduce the above copyright
 *     notice, this list of conditions and the following disclaimer in the
 *     documentation and/or other materials provided with the distribution.
 *  3. Neither the name of the University nor the names of its
 *     contributors may be used to endorse or promote products derived
 *     from this software without specific prior written permission.
 *
 *  THIS SOFTWARE IS PROVIDED ``AS IS'' AND ANY EXPRESS OR IMPLIED
 *  WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
 *  MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
 *  DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
 *  FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
 *  CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
 *  SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
 *  BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
 *  LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
 *  NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
 *  SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 */

#include <linux/mm.h>
#include <linux/delay.h>
#include <linux/errno.h>
#include <linux/string.h>
42 43
#include <linux/ratelimit.h>
#include <linux/printk.h>
44
#include <linux/slab.h>
L
Linus Torvalds 已提交
45 46 47 48 49
#include <linux/sunrpc/clnt.h>
#include <linux/nfs.h>
#include <linux/nfs4.h>
#include <linux/nfs_fs.h>
#include <linux/nfs_page.h>
50
#include <linux/nfs_mount.h>
L
Linus Torvalds 已提交
51
#include <linux/namei.h>
52
#include <linux/mount.h>
B
Benny Halevy 已提交
53
#include <linux/module.h>
54
#include <linux/nfs_idmap.h>
55
#include <linux/xattr.h>
56
#include <linux/utsname.h>
57
#include <linux/freezer.h>
L
Linus Torvalds 已提交
58

59
#include "nfs4_fs.h"
L
Linus Torvalds 已提交
60
#include "delegation.h"
61
#include "internal.h"
62
#include "iostat.h"
A
Andy Adamson 已提交
63
#include "callback.h"
64
#include "pnfs.h"
65
#include "netns.h"
66
#include "nfs4session.h"
D
David Howells 已提交
67
#include "fscache.h"
L
Linus Torvalds 已提交
68 69 70

#define NFSDBG_FACILITY		NFSDBG_PROC

71
#define NFS4_POLL_RETRY_MIN	(HZ/10)
L
Linus Torvalds 已提交
72 73
#define NFS4_POLL_RETRY_MAX	(15*HZ)

74
struct nfs4_opendata;
75
static int _nfs4_proc_open(struct nfs4_opendata *data);
76
static int _nfs4_recover_proc_open(struct nfs4_opendata *data);
L
Linus Torvalds 已提交
77
static int nfs4_do_fsinfo(struct nfs_server *, struct nfs_fh *, struct nfs_fsinfo *);
78
static int nfs4_async_handle_error(struct rpc_task *, const struct nfs_server *, struct nfs4_state *);
79
static void nfs_fixup_referral_attributes(struct nfs_fattr *fattr);
80
static int nfs4_proc_getattr(struct nfs_server *, struct nfs_fh *, struct nfs_fattr *);
81
static int _nfs4_proc_getattr(struct nfs_server *server, struct nfs_fh *fhandle, struct nfs_fattr *fattr);
82 83 84
static int nfs4_do_setattr(struct inode *inode, struct rpc_cred *cred,
			    struct nfs_fattr *fattr, struct iattr *sattr,
			    struct nfs4_state *state);
85
#ifdef CONFIG_NFS_V4_1
86 87
static int nfs41_test_stateid(struct nfs_server *, nfs4_stateid *);
static int nfs41_free_stateid(struct nfs_server *, nfs4_stateid *);
88
#endif
L
Linus Torvalds 已提交
89
/* Prevent leaks of NFSv4 errors into userland */
90
static int nfs4_map_errors(int err)
L
Linus Torvalds 已提交
91
{
92 93 94 95
	if (err >= -1000)
		return err;
	switch (err) {
	case -NFS4ERR_RESOURCE:
96 97
	case -NFS4ERR_LAYOUTTRYLATER:
	case -NFS4ERR_RECALLCONFLICT:
98
		return -EREMOTEIO;
99 100
	case -NFS4ERR_WRONGSEC:
		return -EPERM;
101 102 103
	case -NFS4ERR_BADOWNER:
	case -NFS4ERR_BADNAME:
		return -EINVAL;
104 105
	case -NFS4ERR_SHARE_DENIED:
		return -EACCES;
106 107
	case -NFS4ERR_MINOR_VERS_MISMATCH:
		return -EPROTONOSUPPORT;
108 109
	case -NFS4ERR_ACCESS:
		return -EACCES;
110 111
	case -NFS4ERR_FILE_OPEN:
		return -EBUSY;
112
	default:
L
Linus Torvalds 已提交
113
		dprintk("%s could not handle NFSv4 error %d\n",
114
				__func__, -err);
115
		break;
L
Linus Torvalds 已提交
116
	}
117
	return -EIO;
L
Linus Torvalds 已提交
118 119 120 121 122
}

/*
 * This is our standard bitmap for GETATTR requests.
 */
123
const u32 nfs4_fattr_bitmap[3] = {
L
Linus Torvalds 已提交
124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139
	FATTR4_WORD0_TYPE
	| FATTR4_WORD0_CHANGE
	| FATTR4_WORD0_SIZE
	| FATTR4_WORD0_FSID
	| FATTR4_WORD0_FILEID,
	FATTR4_WORD1_MODE
	| FATTR4_WORD1_NUMLINKS
	| FATTR4_WORD1_OWNER
	| FATTR4_WORD1_OWNER_GROUP
	| FATTR4_WORD1_RAWDEV
	| FATTR4_WORD1_SPACE_USED
	| FATTR4_WORD1_TIME_ACCESS
	| FATTR4_WORD1_TIME_METADATA
	| FATTR4_WORD1_TIME_MODIFY
};

140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157
/*
 * Attribute bitmap with the same word 0 / word 1 bits as the standard
 * GETATTR bitmap, plus FATTR4_WORD2_MDSTHRESHOLD in word 2.
 */
static const u32 nfs4_pnfs_open_bitmap[3] = {
	[0] = FATTR4_WORD0_TYPE
	    | FATTR4_WORD0_CHANGE
	    | FATTR4_WORD0_SIZE
	    | FATTR4_WORD0_FSID
	    | FATTR4_WORD0_FILEID,
	[1] = FATTR4_WORD1_MODE
	    | FATTR4_WORD1_NUMLINKS
	    | FATTR4_WORD1_OWNER
	    | FATTR4_WORD1_OWNER_GROUP
	    | FATTR4_WORD1_RAWDEV
	    | FATTR4_WORD1_SPACE_USED
	    | FATTR4_WORD1_TIME_ACCESS
	    | FATTR4_WORD1_TIME_METADATA
	    | FATTR4_WORD1_TIME_MODIFY,
	[2] = FATTR4_WORD2_MDSTHRESHOLD,
};

158 159 160 161 162 163
/*
 * Reduced attribute bitmap: only TYPE, CHANGE and FILEID are requested
 * in word 0; words 1 and 2 stay zero.
 */
static const u32 nfs4_open_noattr_bitmap[3] = {
	[0] = FATTR4_WORD0_TYPE
	    | FATTR4_WORD0_CHANGE
	    | FATTR4_WORD0_FILEID,
};

L
Linus Torvalds 已提交
164 165 166 167 168 169 170 171 172
/*
 * Attribute bitmap selecting the file-count attributes (word 0) and
 * the space attributes (word 1).
 */
const u32 nfs4_statfs_bitmap[2] = {
	[0] = FATTR4_WORD0_FILES_AVAIL
	    | FATTR4_WORD0_FILES_FREE
	    | FATTR4_WORD0_FILES_TOTAL,
	[1] = FATTR4_WORD1_SPACE_AVAIL
	    | FATTR4_WORD1_SPACE_FREE
	    | FATTR4_WORD1_SPACE_TOTAL,
};

173
const u32 nfs4_pathconf_bitmap[2] = {
L
Linus Torvalds 已提交
174 175 176 177 178
	FATTR4_WORD0_MAXLINK
	| FATTR4_WORD0_MAXNAME,
	0
};

179
const u32 nfs4_fsinfo_bitmap[3] = { FATTR4_WORD0_MAXFILESIZE
L
Linus Torvalds 已提交
180 181 182
			| FATTR4_WORD0_MAXREAD
			| FATTR4_WORD0_MAXWRITE
			| FATTR4_WORD0_LEASE_TIME,
183
			FATTR4_WORD1_TIME_DELTA
184 185
			| FATTR4_WORD1_FS_LAYOUT_TYPES,
			FATTR4_WORD2_LAYOUT_BLKSIZE
L
Linus Torvalds 已提交
186 187
};

188 189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206
/*
 * Attribute bitmap with the standard GETATTR bits plus FS_LOCATIONS in
 * word 0 and MOUNTED_ON_FILEID in word 1.
 */
const u32 nfs4_fs_locations_bitmap[2] = {
	[0] = FATTR4_WORD0_TYPE
	    | FATTR4_WORD0_CHANGE
	    | FATTR4_WORD0_SIZE
	    | FATTR4_WORD0_FSID
	    | FATTR4_WORD0_FILEID
	    | FATTR4_WORD0_FS_LOCATIONS,
	[1] = FATTR4_WORD1_MODE
	    | FATTR4_WORD1_NUMLINKS
	    | FATTR4_WORD1_OWNER
	    | FATTR4_WORD1_OWNER_GROUP
	    | FATTR4_WORD1_RAWDEV
	    | FATTR4_WORD1_SPACE_USED
	    | FATTR4_WORD1_TIME_ACCESS
	    | FATTR4_WORD1_TIME_METADATA
	    | FATTR4_WORD1_TIME_MODIFY
	    | FATTR4_WORD1_MOUNTED_ON_FILEID,
};

A
Al Viro 已提交
207
/*
 * Fill in the cookie, verifier and (for the first calls) the synthetic
 * "." and ".." entries of a readdir request.
 *
 * @cookie:   position requested by the caller
 * @verifier: verifier to send when @cookie > 2
 * @dentry:   directory being read; supplies the file ids of "." and ".."
 * @readdir:  argument structure to fill in
 *
 * For @cookie > 2 the cookie and verifier are passed through untouched.
 * For @cookie <= 2 the request uses cookie 0 and a zeroed verifier; for
 * @cookie 0 or 1 the fake entries are additionally written to the first
 * page and pgbase/count are adjusted to skip over them.
 */
static void nfs4_setup_readdir(u64 cookie, __be32 *verifier, struct dentry *dentry,
		struct nfs4_readdir_arg *readdir)
{
	__be32 *start, *p;

	if (cookie > 2) {
		readdir->cookie = cookie;
		memcpy(&readdir->verifier, verifier, sizeof(readdir->verifier));
		return;
	}

	readdir->cookie = 0;
	memset(&readdir->verifier, 0, sizeof(readdir->verifier));
	if (cookie == 2)
		return;

	/*
	 * NFSv4 servers do not return entries for '.' and '..'
	 * Therefore, we fake these entries here.  The fake '.' entry
	 * is encoded with cookie 1 and the fake '..' entry with
	 * cookie 2.  Note that when talking to the server, we always
	 * send cookie 0 instead of 1 or 2.
	 */
	start = p = kmap_atomic(*readdir->pages);

	if (cookie == 0) {
		*p++ = xdr_one;                                  /* next */
		*p++ = xdr_zero;                   /* cookie, first word */
		*p++ = xdr_one;                   /* cookie, second word */
		*p++ = xdr_one;                             /* entry len */
		memcpy(p, ".\0\0\0", 4);                        /* entry */
		p++;
		*p++ = xdr_one;                         /* bitmap length */
		*p++ = htonl(FATTR4_WORD0_FILEID);             /* bitmap */
		*p++ = htonl(8);              /* attribute buffer length */
		p = xdr_encode_hyper(p, NFS_FILEID(dentry->d_inode));
	}

	*p++ = xdr_one;                                  /* next */
	*p++ = xdr_zero;                   /* cookie, first word */
	*p++ = xdr_two;                   /* cookie, second word */
	*p++ = xdr_two;                             /* entry len */
	memcpy(p, "..\0\0", 4);                         /* entry */
	p++;
	*p++ = xdr_one;                         /* bitmap length */
	*p++ = htonl(FATTR4_WORD0_FILEID);             /* bitmap */
	*p++ = htonl(8);              /* attribute buffer length */
	p = xdr_encode_hyper(p, NFS_FILEID(dentry->d_parent->d_inode));

	/* The server's reply is to land after the entries written above */
	readdir->pgbase = (char *)p - (char *)start;
	readdir->count -= readdir->pgbase;
	kunmap_atomic(start);
}

261 262 263 264 265 266 267 268 269 270
static int nfs4_delay(struct rpc_clnt *clnt, long *timeout)
{
	int res = 0;

	might_sleep();

	if (*timeout <= 0)
		*timeout = NFS4_POLL_RETRY_MIN;
	if (*timeout > NFS4_POLL_RETRY_MAX)
		*timeout = NFS4_POLL_RETRY_MAX;
271
	freezable_schedule_timeout_killable(*timeout);
272 273 274 275 276 277 278 279 280
	if (fatal_signal_pending(current))
		res = -ERESTARTSYS;
	*timeout <<= 1;
	return res;
}

/* This is the error handling routine for processes that are allowed
 * to sleep.
 */
281
static int nfs4_handle_exception(struct nfs_server *server, int errorcode, struct nfs4_exception *exception)
282 283
{
	struct nfs_client *clp = server->nfs_client;
284
	struct nfs4_state *state = exception->state;
285
	struct inode *inode = exception->inode;
286 287 288 289 290 291
	int ret = errorcode;

	exception->retry = 0;
	switch(errorcode) {
		case 0:
			return 0;
292
		case -NFS4ERR_OPENMODE:
293
			if (inode && nfs4_have_delegation(inode, FMODE_READ)) {
294
				nfs4_inode_return_delegation(inode);
295 296 297 298 299
				exception->retry = 1;
				return 0;
			}
			if (state == NULL)
				break;
300 301 302
			ret = nfs4_schedule_stateid_recovery(server, state);
			if (ret < 0)
				break;
303
			goto wait_on_recovery;
304
		case -NFS4ERR_DELEG_REVOKED:
305 306
		case -NFS4ERR_ADMIN_REVOKED:
		case -NFS4ERR_BAD_STATEID:
307 308 309 310 311
			if (inode != NULL && nfs4_have_delegation(inode, FMODE_READ)) {
				nfs_remove_bad_delegation(inode);
				exception->retry = 1;
				break;
			}
312 313
			if (state == NULL)
				break;
314 315 316
			ret = nfs4_schedule_stateid_recovery(server, state);
			if (ret < 0)
				break;
317
			goto wait_on_recovery;
318
		case -NFS4ERR_EXPIRED:
319 320 321 322 323
			if (state != NULL) {
				ret = nfs4_schedule_stateid_recovery(server, state);
				if (ret < 0)
					break;
			}
324
		case -NFS4ERR_STALE_STATEID:
325
		case -NFS4ERR_STALE_CLIENTID:
326 327
			nfs4_schedule_lease_recovery(clp);
			goto wait_on_recovery;
328
#if defined(CONFIG_NFS_V4_1)
329 330 331 332 333 334 335 336 337
		case -NFS4ERR_BADSESSION:
		case -NFS4ERR_BADSLOT:
		case -NFS4ERR_BAD_HIGH_SLOT:
		case -NFS4ERR_CONN_NOT_BOUND_TO_SESSION:
		case -NFS4ERR_DEADSESSION:
		case -NFS4ERR_SEQ_FALSE_RETRY:
		case -NFS4ERR_SEQ_MISORDERED:
			dprintk("%s ERROR: %d Reset session\n", __func__,
				errorcode);
338
			nfs4_schedule_session_recovery(clp->cl_session, errorcode);
339
			goto wait_on_recovery;
340
#endif /* defined(CONFIG_NFS_V4_1) */
341
		case -NFS4ERR_FILE_OPEN:
342 343 344 345 346 347 348
			if (exception->timeout > HZ) {
				/* We have retried a decent amount, time to
				 * fail
				 */
				ret = -EBUSY;
				break;
			}
349 350 351 352 353
		case -NFS4ERR_GRACE:
		case -NFS4ERR_DELAY:
			ret = nfs4_delay(server->client, &exception->timeout);
			if (ret != 0)
				break;
354
		case -NFS4ERR_RETRY_UNCACHED_REP:
355 356
		case -NFS4ERR_OLD_STATEID:
			exception->retry = 1;
357 358 359 360 361 362 363 364 365 366 367 368 369
			break;
		case -NFS4ERR_BADOWNER:
			/* The following works around a Linux server bug! */
		case -NFS4ERR_BADNAME:
			if (server->caps & NFS_CAP_UIDGID_NOMAP) {
				server->caps &= ~NFS_CAP_UIDGID_NOMAP;
				exception->retry = 1;
				printk(KERN_WARNING "NFS: v4 server %s "
						"does not accept raw "
						"uid/gids. "
						"Reenabling the idmapper.\n",
						server->nfs_client->cl_hostname);
			}
370 371 372
	}
	/* We failed to handle the error */
	return nfs4_map_errors(ret);
373
wait_on_recovery:
374 375 376 377
	ret = nfs4_wait_clnt_recover(clp);
	if (ret == 0)
		exception->retry = 1;
	return ret;
378 379 380
}


381
static void do_renew_lease(struct nfs_client *clp, unsigned long timestamp)
L
Linus Torvalds 已提交
382 383 384 385 386 387 388
{
	spin_lock(&clp->cl_lock);
	if (time_before(clp->cl_last_renewal,timestamp))
		clp->cl_last_renewal = timestamp;
	spin_unlock(&clp->cl_lock);
}

389 390 391 392 393
/* Convenience wrapper: renew the lease of the client that owns @server. */
static void renew_lease(const struct nfs_server *server, unsigned long timestamp)
{
	struct nfs_client *clp = server->nfs_client;

	do_renew_lease(clp, timestamp);
}

A
Andy Adamson 已提交
394 395
#if defined(CONFIG_NFS_V4_1)

396
static void nfs41_sequence_free_slot(struct nfs4_sequence_res *res)
A
Andy Adamson 已提交
397
{
398
	struct nfs4_session *session;
A
Andy Adamson 已提交
399
	struct nfs4_slot_table *tbl;
400
	bool send_new_highest_used_slotid = false;
A
Andy Adamson 已提交
401

402
	if (!res->sr_slot) {
A
Andy Adamson 已提交
403 404
		/* just wake up the next guy waiting since
		 * we may have not consumed a slot after all */
A
Andy Adamson 已提交
405
		dprintk("%s: No slot\n", __func__);
406
		return;
A
Andy Adamson 已提交
407
	}
408 409
	tbl = res->sr_slot->table;
	session = tbl->session;
410

411
	spin_lock(&tbl->slot_tbl_lock);
412 413 414 415 416 417
	/* Be nice to the server: try to ensure that the last transmitted
	 * value for highest_user_slotid <= target_highest_slotid
	 */
	if (tbl->highest_used_slotid > tbl->target_highest_slotid)
		send_new_highest_used_slotid = true;

418 419 420 421
	if (nfs41_wake_and_assign_slot(tbl, res->sr_slot)) {
		send_new_highest_used_slotid = false;
		goto out_unlock;
	}
T
Trond Myklebust 已提交
422
	nfs4_free_slot(tbl, res->sr_slot);
423 424 425

	if (tbl->highest_used_slotid != NFS4_NO_SLOT)
		send_new_highest_used_slotid = false;
426
out_unlock:
427
	spin_unlock(&tbl->slot_tbl_lock);
428
	res->sr_slot = NULL;
429 430
	if (send_new_highest_used_slotid)
		nfs41_server_notify_highest_slotid_update(session->clp);
A
Andy Adamson 已提交
431 432
}

433
static int nfs41_sequence_done(struct rpc_task *task, struct nfs4_sequence_res *res)
A
Andy Adamson 已提交
434
{
435
	struct nfs4_session *session;
436
	struct nfs4_slot *slot;
437
	struct nfs_client *clp;
438
	bool interrupted = false;
439
	int ret = 1;
A
Andy Adamson 已提交
440

441 442
	/* don't increment the sequence number if the task wasn't sent */
	if (!RPC_WAS_SENT(task))
A
Andy Adamson 已提交
443 444
		goto out;

445
	slot = res->sr_slot;
446
	session = slot->table->session;
447

448 449 450 451 452
	if (slot->interrupted) {
		slot->interrupted = 0;
		interrupted = true;
	}

A
Andy Adamson 已提交
453
	/* Check the SEQUENCE operation status */
454 455
	switch (res->sr_status) {
	case 0:
A
Andy Adamson 已提交
456
		/* Update the slot's sequence and clientid lease timer */
457
		++slot->seq_nr;
458
		clp = session->clp;
459
		do_renew_lease(clp, res->sr_timestamp);
460
		/* Check sequence flags */
461 462
		if (res->sr_status_flags != 0)
			nfs4_schedule_lease_recovery(clp);
463
		nfs41_update_target_slotid(slot->table, slot, res);
464
		break;
465 466 467 468 469 470 471 472 473
	case 1:
		/*
		 * sr_status remains 1 if an RPC level error occurred.
		 * The server may or may not have processed the sequence
		 * operation..
		 * Mark the slot as having hosted an interrupted RPC call.
		 */
		slot->interrupted = 1;
		goto out;
474 475 476 477 478
	case -NFS4ERR_DELAY:
		/* The server detected a resend of the RPC call and
		 * returned NFS4ERR_DELAY as per Section 2.10.6.2
		 * of RFC5661.
		 */
479
		dprintk("%s: slot=%u seq=%u: Operation in progress\n",
480
			__func__,
481
			slot->slot_nr,
482
			slot->seq_nr);
483
		goto out_retry;
484 485 486 487 488
	case -NFS4ERR_BADSLOT:
		/*
		 * The slot id we used was probably retired. Try again
		 * using a different slot id.
		 */
489 490
		goto retry_nowait;
	case -NFS4ERR_SEQ_MISORDERED:
491 492 493 494 495 496 497 498
		/*
		 * Was the last operation on this sequence interrupted?
		 * If so, retry after bumping the sequence number.
		 */
		if (interrupted) {
			++slot->seq_nr;
			goto retry_nowait;
		}
499 500 501 502
		/*
		 * Could this slot have been previously retired?
		 * If so, then the server may be expecting seq_nr = 1!
		 */
503 504 505 506 507
		if (slot->seq_nr != 1) {
			slot->seq_nr = 1;
			goto retry_nowait;
		}
		break;
508 509 510
	case -NFS4ERR_SEQ_FALSE_RETRY:
		++slot->seq_nr;
		goto retry_nowait;
511 512
	default:
		/* Just update the slot sequence no. */
513
		++slot->seq_nr;
A
Andy Adamson 已提交
514 515 516 517
	}
out:
	/* The session may be reset by one of the error handlers. */
	dprintk("%s: Error %d free the slot \n", __func__, res->sr_status);
518
	nfs41_sequence_free_slot(res);
519
	return ret;
520 521 522 523 524 525
retry_nowait:
	if (rpc_restart_call_prepare(task)) {
		task->tk_status = 0;
		ret = 0;
	}
	goto out;
526
out_retry:
527
	if (!rpc_restart_call(task))
528 529 530
		goto out;
	rpc_delay(task, NFS4_POLL_RETRY_MAX);
	return 0;
A
Andy Adamson 已提交
531 532
}

533 534
static int nfs4_sequence_done(struct rpc_task *task,
			       struct nfs4_sequence_res *res)
535
{
536
	if (res->sr_slot == NULL)
537 538
		return 1;
	return nfs41_sequence_done(task, res);
539 540
}

541 542 543
static void nfs41_init_sequence(struct nfs4_sequence_args *args,
		struct nfs4_sequence_res *res, int cache_reply)
{
544
	args->sa_slot = NULL;
545
	args->sa_cache_this = 0;
546
	args->sa_privileged = 0;
547 548 549 550 551
	if (cache_reply)
		args->sa_cache_this = 1;
	res->sr_slot = NULL;
}

552 553 554 555 556
/*
 * Flag the sequence arguments as privileged.  nfs41_setup_sequence()
 * lets privileged calls through while the slot table is draining and
 * queues them with RPC_PRIORITY_PRIVILEGED when they have to wait.
 */
static void nfs4_set_sequence_privileged(struct nfs4_sequence_args *args)
{
	args->sa_privileged = 1;
}

A
Andy Adamson 已提交
557
int nfs41_setup_sequence(struct nfs4_session *session,
A
Andy Adamson 已提交
558 559 560 561
				struct nfs4_sequence_args *args,
				struct nfs4_sequence_res *res,
				struct rpc_task *task)
{
A
Andy Adamson 已提交
562 563 564 565
	struct nfs4_slot *slot;
	struct nfs4_slot_table *tbl;

	dprintk("--> %s\n", __func__);
A
Andy Adamson 已提交
566
	/* slot already allocated? */
567
	if (res->sr_slot != NULL)
568
		goto out_success;
A
Andy Adamson 已提交
569

A
Andy Adamson 已提交
570 571
	tbl = &session->fc_slot_table;

572 573
	task->tk_timeout = 0;

A
Andy Adamson 已提交
574
	spin_lock(&tbl->slot_tbl_lock);
575
	if (test_bit(NFS4_SLOT_TBL_DRAINING, &tbl->slot_tbl_state) &&
576
	    !args->sa_privileged) {
577 578
		/* The state manager will wait until the slot table is empty */
		dprintk("%s session is draining\n", __func__);
579
		goto out_sleep;
580 581
	}

582
	slot = nfs4_alloc_slot(tbl);
583 584 585 586
	if (IS_ERR(slot)) {
		/* If out of memory, try again in 1/4 second */
		if (slot == ERR_PTR(-ENOMEM))
			task->tk_timeout = HZ >> 2;
A
Andy Adamson 已提交
587
		dprintk("<-- %s: no free slots\n", __func__);
588
		goto out_sleep;
A
Andy Adamson 已提交
589 590 591
	}
	spin_unlock(&tbl->slot_tbl_lock);

592
	args->sa_slot = slot;
A
Andy Adamson 已提交
593

594 595
	dprintk("<-- %s slotid=%d seqid=%d\n", __func__,
			slot->slot_nr, slot->seq_nr);
A
Andy Adamson 已提交
596

597
	res->sr_slot = slot;
598
	res->sr_timestamp = jiffies;
599
	res->sr_status_flags = 0;
A
Andy Adamson 已提交
600 601 602 603 604
	/*
	 * sr_status is only set in decode_sequence, and so will remain
	 * set to 1 if an rpc level failure occurs.
	 */
	res->sr_status = 1;
605 606
out_success:
	rpc_call_start(task);
A
Andy Adamson 已提交
607
	return 0;
608
out_sleep:
609 610
	/* Privileged tasks are queued with top priority */
	if (args->sa_privileged)
611 612 613 614
		rpc_sleep_on_priority(&tbl->slot_tbl_waitq, task,
				NULL, RPC_PRIORITY_PRIVILEGED);
	else
		rpc_sleep_on(&tbl->slot_tbl_waitq, task, NULL);
615 616
	spin_unlock(&tbl->slot_tbl_lock);
	return -EAGAIN;
A
Andy Adamson 已提交
617
}
A
Andy Adamson 已提交
618
EXPORT_SYMBOL_GPL(nfs41_setup_sequence);
A
Andy Adamson 已提交
619

620
int nfs4_setup_sequence(const struct nfs_server *server,
A
Andy Adamson 已提交
621 622 623 624
			struct nfs4_sequence_args *args,
			struct nfs4_sequence_res *res,
			struct rpc_task *task)
{
625
	struct nfs4_session *session = nfs4_get_session(server);
A
Andy Adamson 已提交
626 627
	int ret = 0;

628 629
	if (session == NULL) {
		rpc_call_start(task);
630
		goto out;
631
	}
632

633
	dprintk("--> %s clp %p session %p sr_slot %d\n",
634
		__func__, session->clp, session, res->sr_slot ?
635
			res->sr_slot->slot_nr : -1);
A
Andy Adamson 已提交
636

637
	ret = nfs41_setup_sequence(session, args, res, task);
A
Andy Adamson 已提交
638 639 640 641 642 643
out:
	dprintk("<-- %s status=%d\n", __func__, ret);
	return ret;
}

/* Callback data handed to the nfs41_call_sync_ops RPC callbacks. */
struct nfs41_call_sync_data {
	const struct nfs_server *seq_server;	/* server the call is sent to */
	struct nfs4_sequence_args *seq_args;	/* SEQUENCE arguments of the call */
	struct nfs4_sequence_res *seq_res;	/* SEQUENCE result of the call */
};

static void nfs41_call_sync_prepare(struct rpc_task *task, void *calldata)
{
	struct nfs41_call_sync_data *data = calldata;
652
	struct nfs4_session *session = nfs4_get_session(data->seq_server);
A
Andy Adamson 已提交
653

654 655
	dprintk("--> %s data->seq_server %p\n", __func__, data->seq_server);

656
	nfs41_setup_sequence(session, data->seq_args, data->seq_res, task);
A
Andy Adamson 已提交
657 658
}

A
Andy Adamson 已提交
659 660 661 662
static void nfs41_call_sync_done(struct rpc_task *task, void *calldata)
{
	struct nfs41_call_sync_data *data = calldata;

663
	nfs41_sequence_done(task, data->seq_res);
A
Andy Adamson 已提交
664 665
}

666
static const struct rpc_call_ops nfs41_call_sync_ops = {
A
Andy Adamson 已提交
667
	.rpc_call_prepare = nfs41_call_sync_prepare,
A
Andy Adamson 已提交
668
	.rpc_call_done = nfs41_call_sync_done,
A
Andy Adamson 已提交
669 670
};

671 672
static int nfs4_call_sync_sequence(struct rpc_clnt *clnt,
				   struct nfs_server *server,
A
Andy Adamson 已提交
673 674
				   struct rpc_message *msg,
				   struct nfs4_sequence_args *args,
675
				   struct nfs4_sequence_res *res)
A
Andy Adamson 已提交
676 677 678 679
{
	int ret;
	struct rpc_task *task;
	struct nfs41_call_sync_data data = {
680
		.seq_server = server,
A
Andy Adamson 已提交
681 682 683 684
		.seq_args = args,
		.seq_res = res,
	};
	struct rpc_task_setup task_setup = {
685
		.rpc_client = clnt,
A
Andy Adamson 已提交
686 687 688 689 690 691 692 693 694 695 696 697 698 699 700
		.rpc_message = msg,
		.callback_ops = &nfs41_call_sync_ops,
		.callback_data = &data
	};

	task = rpc_run_task(&task_setup);
	if (IS_ERR(task))
		ret = PTR_ERR(task);
	else {
		ret = task->tk_status;
		rpc_put_task(task);
	}
	return ret;
}

701
#else
702
/* Built without CONFIG_NFS_V4_1: there is no sequence state to set up. */
static
void nfs41_init_sequence(struct nfs4_sequence_args *args,
		struct nfs4_sequence_res *res, int cache_reply)
{
}

708 709 710 711 712
/* Built without CONFIG_NFS_V4_1: nothing to mark, intentionally empty. */
static void nfs4_set_sequence_privileged(struct nfs4_sequence_args *args)
{
}


713 714
/*
 * Built without CONFIG_NFS_V4_1: there is no SEQUENCE result to check,
 * so always return 1.
 */
static int nfs4_sequence_done(struct rpc_task *task,
			       struct nfs4_sequence_res *res)
{
	return 1;
}
A
Andy Adamson 已提交
718 719
#endif /* CONFIG_NFS_V4_1 */

720
/*
 * Issue @msg synchronously on @clnt with plain rpc_call_sync().
 * @server, @args and @res are not used by this variant.
 */
static
int _nfs4_call_sync(struct rpc_clnt *clnt,
		    struct nfs_server *server,
		    struct rpc_message *msg,
		    struct nfs4_sequence_args *args,
		    struct nfs4_sequence_res *res)
{
	return rpc_call_sync(clnt, msg, 0);
}

730
static
731 732
int nfs4_call_sync(struct rpc_clnt *clnt,
		   struct nfs_server *server,
733 734 735 736 737
		   struct rpc_message *msg,
		   struct nfs4_sequence_args *args,
		   struct nfs4_sequence_res *res,
		   int cache_reply)
{
738
	nfs41_init_sequence(args, res, cache_reply);
739
	return server->nfs_client->cl_mvops->call_sync(clnt, server, msg,
740
						args, res);
741
}
A
Andy Adamson 已提交
742

743
static void update_changeattr(struct inode *dir, struct nfs4_change_info *cinfo)
L
Linus Torvalds 已提交
744
{
745
	struct nfs_inode *nfsi = NFS_I(dir);
L
Linus Torvalds 已提交
746

747
	spin_lock(&dir->i_lock);
748
	nfsi->cache_validity |= NFS_INO_INVALID_ATTR|NFS_INO_INVALID_DATA;
749
	if (!cinfo->atomic || cinfo->before != dir->i_version)
750
		nfs_force_lookup_revalidate(dir);
751
	dir->i_version = cinfo->after;
D
David Howells 已提交
752
	nfs_fscache_invalidate(dir);
753
	spin_unlock(&dir->i_lock);
L
Linus Torvalds 已提交
754 755
}

756
struct nfs4_opendata {
757
	struct kref kref;
758 759
	struct nfs_openargs o_arg;
	struct nfs_openres o_res;
760 761
	struct nfs_open_confirmargs c_arg;
	struct nfs_open_confirmres c_res;
762 763
	struct nfs4_string owner_name;
	struct nfs4_string group_name;
764 765
	struct nfs_fattr f_attr;
	struct dentry *dir;
766
	struct dentry *dentry;
767
	struct nfs4_state_owner *owner;
768
	struct nfs4_state *state;
769
	struct iattr attrs;
770
	unsigned long timestamp;
771
	unsigned int rpc_done : 1;
772
	unsigned int is_recover : 1;
773 774
	int rpc_status;
	int cancelled;
775 776
};

777 778 779 780 781 782 783 784 785 786 787 788 789 790 791 792 793 794 795 796 797 798 799 800 801 802 803 804 805
/*
 * If @err is -EINVAL and the server still advertises
 * NFS_CAP_ATOMIC_OPEN_V1, drop that capability and ask for a retry.
 *
 * Returns true when the capability was cleared (exception->retry is then
 * set to 1), false when nothing was changed.
 */
static bool nfs4_clear_cap_atomic_open_v1(struct nfs_server *server,
		int err, struct nfs4_exception *exception)
{
	if (err != -EINVAL || !(server->caps & NFS_CAP_ATOMIC_OPEN_V1))
		return false;

	server->caps &= ~NFS_CAP_ATOMIC_OPEN_V1;
	exception->retry = 1;
	return true;
}

/*
 * Translate an open claim type for servers that lack
 * NFS_CAP_ATOMIC_OPEN_V1: the *_FH claim types are replaced by their
 * non-FH counterparts.  With the capability set, or for any other claim
 * type, @claim is returned unchanged.
 */
static enum open_claim_type4
nfs4_map_atomic_open_claim(struct nfs_server *server,
		enum open_claim_type4 claim)
{
	if (!(server->caps & NFS_CAP_ATOMIC_OPEN_V1)) {
		switch (claim) {
		case NFS4_OPEN_CLAIM_FH:
			return NFS4_OPEN_CLAIM_NULL;
		case NFS4_OPEN_CLAIM_DELEG_CUR_FH:
			return NFS4_OPEN_CLAIM_DELEGATE_CUR;
		case NFS4_OPEN_CLAIM_DELEG_PREV_FH:
			return NFS4_OPEN_CLAIM_DELEGATE_PREV;
		default:
			break;
		}
	}
	return claim;
}
806 807 808 809

/*
 * (Re)initialize the result side of @p from its argument side: wire up
 * the attribute buffer, copy seqid/server/access from the arguments and
 * reset the attribute structure and its name strings.
 */
static void nfs4_init_opendata_res(struct nfs4_opendata *p)
{
	p->o_res.f_attr = &p->f_attr;
	p->o_res.seqid = p->o_arg.seqid;
	p->c_res.seqid = p->c_arg.seqid;
	p->o_res.server = p->o_arg.server;
	p->o_res.access_request = p->o_arg.access;
	nfs_fattr_init(&p->f_attr);
	nfs_fattr_init_names(&p->f_attr, &p->owner_name, &p->group_name);
}

818
static struct nfs4_opendata *nfs4_opendata_alloc(struct dentry *dentry,
819
		struct nfs4_state_owner *sp, fmode_t fmode, int flags,
820
		const struct iattr *attrs,
821
		enum open_claim_type4 claim,
822
		gfp_t gfp_mask)
823
{
824
	struct dentry *parent = dget_parent(dentry);
825 826 827 828
	struct inode *dir = parent->d_inode;
	struct nfs_server *server = NFS_SERVER(dir);
	struct nfs4_opendata *p;

829
	p = kzalloc(sizeof(*p), gfp_mask);
830 831
	if (p == NULL)
		goto err;
832
	p->o_arg.seqid = nfs_alloc_seqid(&sp->so_seqid, gfp_mask);
833 834
	if (p->o_arg.seqid == NULL)
		goto err_free;
835 836
	nfs_sb_active(dentry->d_sb);
	p->dentry = dget(dentry);
837 838 839
	p->dir = parent;
	p->owner = sp;
	atomic_inc(&sp->so_count);
840 841
	p->o_arg.open_flags = flags;
	p->o_arg.fmode = fmode & (FMODE_READ|FMODE_WRITE);
842 843 844 845 846 847 848 849
	/* don't put an ACCESS op in OPEN compound if O_EXCL, because ACCESS
	 * will return permission denied for all bits until close */
	if (!(flags & O_EXCL)) {
		/* ask server to check for all possible rights as results
		 * are cached */
		p->o_arg.access = NFS4_ACCESS_READ | NFS4_ACCESS_MODIFY |
				  NFS4_ACCESS_EXTEND | NFS4_ACCESS_EXECUTE;
	}
850
	p->o_arg.clientid = server->nfs_client->cl_clientid;
851 852
	p->o_arg.id.create_time = ktime_to_ns(sp->so_seqid.create_time);
	p->o_arg.id.uniquifier = sp->so_seqid.owner_id;
853
	p->o_arg.name = &dentry->d_name;
854 855
	p->o_arg.server = server;
	p->o_arg.bitmask = server->attr_bitmask;
856
	p->o_arg.open_bitmap = &nfs4_fattr_bitmap[0];
857 858
	p->o_arg.claim = nfs4_map_atomic_open_claim(server, claim);
	switch (p->o_arg.claim) {
859 860 861 862 863 864 865 866 867 868 869
	case NFS4_OPEN_CLAIM_NULL:
	case NFS4_OPEN_CLAIM_DELEGATE_CUR:
	case NFS4_OPEN_CLAIM_DELEGATE_PREV:
		p->o_arg.fh = NFS_FH(dir);
		break;
	case NFS4_OPEN_CLAIM_PREVIOUS:
	case NFS4_OPEN_CLAIM_FH:
	case NFS4_OPEN_CLAIM_DELEG_CUR_FH:
	case NFS4_OPEN_CLAIM_DELEG_PREV_FH:
		p->o_arg.fh = NFS_FH(dentry->d_inode);
	}
870
	if (attrs != NULL && attrs->ia_valid != 0) {
871
		__be32 verf[2];
872

873 874
		p->o_arg.u.attrs = &p->attrs;
		memcpy(&p->attrs, attrs, sizeof(p->attrs));
875 876 877 878 879

		verf[0] = jiffies;
		verf[1] = current->pid;
		memcpy(p->o_arg.u.verifier.data, verf,
				sizeof(p->o_arg.u.verifier.data));
880
	}
881 882 883
	p->c_arg.fh = &p->o_res.fh;
	p->c_arg.stateid = &p->o_res.stateid;
	p->c_arg.seqid = p->o_arg.seqid;
884
	nfs4_init_opendata_res(p);
885
	kref_init(&p->kref);
886 887 888 889 890 891 892 893
	return p;
err_free:
	kfree(p);
err:
	dput(parent);
	return NULL;
}

894
static void nfs4_opendata_free(struct kref *kref)
895
{
896 897
	struct nfs4_opendata *p = container_of(kref,
			struct nfs4_opendata, kref);
898
	struct super_block *sb = p->dentry->d_sb;
899 900

	nfs_free_seqid(p->o_arg.seqid);
901 902
	if (p->state != NULL)
		nfs4_put_open_state(p->state);
903 904
	nfs4_put_state_owner(p->owner);
	dput(p->dir);
905 906
	dput(p->dentry);
	nfs_sb_deactive(sb);
907
	nfs_fattr_free_names(&p->f_attr);
908 909 910 911 912 913 914
	kfree(p);
}

/* Drop one reference on @p; a NULL @p is ignored. */
static void nfs4_opendata_put(struct nfs4_opendata *p)
{
	if (p != NULL)
		kref_put(&p->kref, nfs4_opendata_free);
}

917 918 919 920 921 922 923 924
/* Wait for @task to complete; returns rpc_wait_for_completion_task()'s result. */
static int nfs4_wait_for_completion_rpc_task(struct rpc_task *task)
{
	return rpc_wait_for_completion_task(task);
}

925
/*
 * Can an open for @mode be satisfied from the state we already hold?
 *
 * Returns non-zero when the state flag matching @mode is set and the
 * corresponding open count is non-zero.  Always returns 0 when
 * @open_mode contains O_EXCL or O_TRUNC.
 */
static int can_open_cached(struct nfs4_state *state, fmode_t mode, int open_mode)
{
	int ret = 0;

	if (open_mode & (O_EXCL|O_TRUNC))
		goto out;
	switch (mode & (FMODE_READ|FMODE_WRITE)) {
		case FMODE_READ:
			ret |= test_bit(NFS_O_RDONLY_STATE, &state->flags) != 0
				&& state->n_rdonly != 0;
			break;
		case FMODE_WRITE:
			ret |= test_bit(NFS_O_WRONLY_STATE, &state->flags) != 0
				&& state->n_wronly != 0;
			break;
		case FMODE_READ|FMODE_WRITE:
			ret |= test_bit(NFS_O_RDWR_STATE, &state->flags) != 0
				&& state->n_rdwr != 0;
			break;
	}
out:
	return ret;
}

948
/*
 * Can an open for @fmode be satisfied by @delegation?
 *
 * Returns 0 when there is no delegation, when its type does not cover
 * @fmode, or when it is flagged as needing reclaim or as being
 * returned.  Otherwise marks the delegation referenced and returns 1.
 */
static int can_open_delegated(struct nfs_delegation *delegation, fmode_t fmode)
{
	if (delegation == NULL)
		return 0;
	if ((delegation->type & fmode) != fmode)
		return 0;
	if (test_bit(NFS_DELEGATION_NEED_RECLAIM, &delegation->flags))
		return 0;
	if (test_bit(NFS_DELEGATION_RETURNING, &delegation->flags))
		return 0;
	nfs_mark_delegation_referenced(delegation);
	return 1;
}

962
/*
 * Account for one more open of @state in mode @fmode: bump the matching
 * open counter and merge @fmode into the state's mode.
 *
 * NOTE(review): the only caller visible here holds state->owner->so_lock
 * around this call - confirm that other callers do the same.
 */
static void update_open_stateflags(struct nfs4_state *state, fmode_t fmode)
{
	switch (fmode) {
		case FMODE_WRITE:
			state->n_wronly++;
			break;
		case FMODE_READ:
			state->n_rdonly++;
			break;
		case FMODE_READ|FMODE_WRITE:
			state->n_rdwr++;
			break;
	}
	nfs4_state_set_mode_locked(state, state->state | fmode);
}

977
/*
 * Record @stateid as the open stateid of @state.
 *
 * state->stateid is only overwritten when NFS_DELEGATED_STATE is clear;
 * state->open_stateid is always overwritten. NFS_OPEN_STATE is set, as is
 * the NFS_O_*_STATE flag that matches @fmode exactly. Callers in this file
 * invoke it with state->seqlock write-held.
 */
static void nfs_set_open_stateid_locked(struct nfs4_state *state, nfs4_stateid *stateid, fmode_t fmode)
{
	if (!test_bit(NFS_DELEGATED_STATE, &state->flags))
		nfs4_stateid_copy(&state->stateid, stateid);
	nfs4_stateid_copy(&state->open_stateid, stateid);
	set_bit(NFS_OPEN_STATE, &state->flags);

	if (fmode == FMODE_READ)
		set_bit(NFS_O_RDONLY_STATE, &state->flags);
	else if (fmode == FMODE_WRITE)
		set_bit(NFS_O_WRONLY_STATE, &state->flags);
	else if (fmode == (FMODE_READ|FMODE_WRITE))
		set_bit(NFS_O_RDWR_STATE, &state->flags);
}

995
/*
 * Locked wrapper around nfs_set_open_stateid_locked(): takes the write side
 * of state->seqlock for the duration of the update.
 */
static void nfs_set_open_stateid(struct nfs4_state *state, nfs4_stateid *stateid, fmode_t fmode)
{
	seqlock_t *lock = &state->seqlock;

	write_seqlock(lock);
	nfs_set_open_stateid_locked(state, stateid, fmode);
	write_sequnlock(lock);
}

1002
/*
 * Install new stateids into @state and account for the open.
 *
 * @open_stateid:  new open stateid, or NULL to leave it untouched
 * @deleg_stateid: delegation stateid to install as the current stateid
 *                 (also sets NFS_DELEGATED_STATE), or NULL
 * @fmode:         share mode whose open counter is incremented
 */
static void __update_open_stateid(struct nfs4_state *state, nfs4_stateid *open_stateid, const nfs4_stateid *deleg_stateid, fmode_t fmode)
{
	/* The seqlock serialises the stateid update. */
	write_seqlock(&state->seqlock);
	if (deleg_stateid) {
		nfs4_stateid_copy(&state->stateid, deleg_stateid);
		set_bit(NFS_DELEGATED_STATE, &state->flags);
	}
	if (open_stateid)
		nfs_set_open_stateid_locked(state, open_stateid, fmode);
	write_sequnlock(&state->seqlock);

	/* so_lock protects the call to nfs4_state_set_mode_locked. */
	spin_lock(&state->owner->so_lock);
	update_open_stateflags(state, fmode);
	spin_unlock(&state->owner->so_lock);
}

1021
/*
 * Update @state after an open, preferring the inode's current delegation.
 *
 * The delegation is used only if, under its lock, it is still the inode's
 * delegation, is not flagged NFS_DELEGATION_RETURNING, covers @fmode, and
 * (when @delegation is non-NULL) its stateid matches @delegation. If it is
 * not used and @open_stateid is non-NULL, the state is updated from the
 * open stateid alone.
 *
 * Returns 1 if the state was updated, 0 otherwise.
 */
static int update_open_stateid(struct nfs4_state *state, nfs4_stateid *open_stateid, nfs4_stateid *delegation, fmode_t fmode)
{
	struct nfs_inode *nfsi = NFS_I(state->inode);
	struct nfs_delegation *deleg_cur;
	int updated = 0;

	fmode &= (FMODE_READ|FMODE_WRITE);

	rcu_read_lock();
	deleg_cur = rcu_dereference(nfsi->delegation);
	if (deleg_cur == NULL)
		goto no_delegation;

	spin_lock(&deleg_cur->lock);
	if (nfsi->delegation != deleg_cur ||
	    test_bit(NFS_DELEGATION_RETURNING, &deleg_cur->flags) ||
	    (deleg_cur->type & fmode) != fmode)
		goto no_delegation_unlock;

	/* A caller-supplied delegation stateid must match the current one. */
	if (delegation != NULL &&
	    !nfs4_stateid_match(&deleg_cur->stateid, delegation))
		goto no_delegation_unlock;

	nfs_mark_delegation_referenced(deleg_cur);
	__update_open_stateid(state, open_stateid, &deleg_cur->stateid, fmode);
	updated = 1;
no_delegation_unlock:
	spin_unlock(&deleg_cur->lock);
no_delegation:
	rcu_read_unlock();

	if (updated)
		return 1;
	if (open_stateid == NULL)
		return 0;

	__update_open_stateid(state, open_stateid, NULL, fmode);
	return 1;
}


1062
/*
 * Return the inode's delegation if one exists and its type does not cover
 * every bit of @fmode. Does nothing when there is no delegation or when
 * the delegation already covers @fmode.
 */
static void nfs4_return_incompatible_delegation(struct inode *inode, fmode_t fmode)
{
	struct nfs_delegation *delegation;
	int incompatible;

	rcu_read_lock();
	delegation = rcu_dereference(NFS_I(inode)->delegation);
	incompatible = delegation != NULL &&
		(delegation->type & fmode) != fmode;
	rcu_read_unlock();

	if (incompatible)
		nfs4_inode_return_delegation(inode);
}

1076
static struct nfs4_state *nfs4_try_open_cached(struct nfs4_opendata *opendata)
1077 1078 1079 1080
{
	struct nfs4_state *state = opendata->state;
	struct nfs_inode *nfsi = NFS_I(state->inode);
	struct nfs_delegation *delegation;
1081
	int open_mode = opendata->o_arg.open_flags;
1082
	fmode_t fmode = opendata->o_arg.fmode;
1083 1084 1085 1086
	nfs4_stateid stateid;
	int ret = -EAGAIN;

	for (;;) {
1087
		if (can_open_cached(state, fmode, open_mode)) {
1088
			spin_lock(&state->owner->so_lock);
1089 1090
			if (can_open_cached(state, fmode, open_mode)) {
				update_open_stateflags(state, fmode);
1091 1092 1093 1094 1095
				spin_unlock(&state->owner->so_lock);
				goto out_return_state;
			}
			spin_unlock(&state->owner->so_lock);
		}
1096 1097
		rcu_read_lock();
		delegation = rcu_dereference(nfsi->delegation);
1098
		if (!can_open_delegated(delegation, fmode)) {
1099
			rcu_read_unlock();
1100
			break;
1101
		}
1102
		/* Save the delegation */
1103
		nfs4_stateid_copy(&stateid, &delegation->stateid);
1104
		rcu_read_unlock();
1105
		nfs_release_seqid(opendata->o_arg.seqid);
1106 1107 1108 1109 1110
		if (!opendata->is_recover) {
			ret = nfs_may_open(state->inode, state->owner->so_cred, open_mode);
			if (ret != 0)
				goto out;
		}
1111
		ret = -EAGAIN;
1112 1113

		/* Try to update the stateid using the delegation */
1114
		if (update_open_stateid(state, NULL, &stateid, fmode))
1115
			goto out_return_state;
1116 1117 1118 1119 1120 1121 1122 1123
	}
out:
	return ERR_PTR(ret);
out_return_state:
	atomic_inc(&state->count);
	return state;
}

1124 1125 1126 1127 1128 1129 1130 1131 1132 1133 1134 1135 1136 1137 1138 1139 1140 1141 1142 1143 1144 1145 1146 1147 1148 1149 1150 1151 1152 1153 1154 1155 1156 1157 1158 1159 1160 1161 1162 1163 1164 1165 1166 1167 1168 1169 1170 1171 1172 1173 1174 1175 1176 1177 1178 1179 1180 1181 1182 1183 1184 1185 1186 1187 1188 1189 1190 1191 1192 1193 1194
/*
 * Handle a delegation returned in data->o_res (callers in this file only
 * call this when o_res.delegation_type is non-zero).
 *
 * A delegation in reply to an OPEN with claim NFS4_OPEN_CLAIM_DELEGATE_CUR
 * is only logged. Otherwise it is installed with nfs_inode_set_delegation(),
 * or with nfs_inode_reclaim_delegation() when the inode's current
 * delegation has NFS_DELEGATION_NEED_RECLAIM set.
 */
static void
nfs4_opendata_check_deleg(struct nfs4_opendata *data, struct nfs4_state *state)
{
	struct nfs_client *clp = NFS_SERVER(state->inode)->nfs_client;
	struct nfs_delegation *delegation;
	int delegation_flags = 0;

	/* Snapshot the current delegation's flags under RCU. */
	rcu_read_lock();
	delegation = rcu_dereference(NFS_I(state->inode)->delegation);
	if (delegation)
		delegation_flags = delegation->flags;
	rcu_read_unlock();

	if (data->o_arg.claim == NFS4_OPEN_CLAIM_DELEGATE_CUR) {
		pr_err_ratelimited("NFS: Broken NFSv4 server %s is "
				   "returning a delegation for "
				   "OPEN(CLAIM_DELEGATE_CUR)\n",
				   clp->cl_hostname);
		return;
	}

	if (delegation_flags & 1UL<<NFS_DELEGATION_NEED_RECLAIM)
		nfs_inode_reclaim_delegation(state->inode,
					     data->owner->so_cred,
					     &data->o_res);
	else
		nfs_inode_set_delegation(state->inode,
					 data->owner->so_cred,
					 &data->o_res);
}

/*
 * Check the inode attributes against the CLAIM_PREVIOUS returned attributes
 * and update the nfs4_state.
 *
 * Returns the nfs4_state obtained from nfs4_get_open_state() on success.
 * On failure returns ERR_PTR() of:
 *   data->rpc_status  if the RPC did not complete (rpc_done is clear),
 *   -ESTALE           if the reply lacks type, fileid or change attributes,
 *   -ENOMEM           if nfs4_get_open_state() returns NULL,
 *   or the error returned by nfs_refresh_inode().
 */
static struct nfs4_state *
_nfs4_opendata_reclaim_to_nfs4_state(struct nfs4_opendata *data)
{
	struct inode *inode = data->state->inode;
	struct nfs4_state *state;
	int ret;

	if (!data->rpc_done) {
		ret = data->rpc_status;
		goto err;
	}

	ret = -ESTALE;
	if (!(data->f_attr.valid & NFS_ATTR_FATTR_TYPE) ||
	    !(data->f_attr.valid & NFS_ATTR_FATTR_FILEID) ||
	    !(data->f_attr.valid & NFS_ATTR_FATTR_CHANGE))
		goto err;

	ret = -ENOMEM;
	state = nfs4_get_open_state(inode, data->owner);
	if (state == NULL)
		goto err;

	ret = nfs_refresh_inode(inode, &data->f_attr);
	if (ret)
		goto err_put_state;

	if (data->o_res.delegation_type != 0)
		nfs4_opendata_check_deleg(data, state);
	update_open_stateid(state, &data->o_res.stateid, NULL,
			    data->o_arg.fmode);

	return state;
err_put_state:
	/* Drop the reference taken by nfs4_get_open_state() above. */
	nfs4_put_open_state(state);
err:
	return ERR_PTR(ret);
}

static struct nfs4_state *
_nfs4_opendata_to_nfs4_state(struct nfs4_opendata *data)
1195 1196 1197
{
	struct inode *inode;
	struct nfs4_state *state = NULL;
1198
	int ret;
1199

1200
	if (!data->rpc_done) {
1201
		state = nfs4_try_open_cached(data);
1202 1203 1204
		goto out;
	}

1205
	ret = -EAGAIN;
1206
	if (!(data->f_attr.valid & NFS_ATTR_FATTR))
1207
		goto err;
1208
	inode = nfs_fhget(data->dir->d_sb, &data->o_res.fh, &data->f_attr);
1209
	ret = PTR_ERR(inode);
1210
	if (IS_ERR(inode))
1211 1212
		goto err;
	ret = -ENOMEM;
1213 1214
	state = nfs4_get_open_state(inode, data->owner);
	if (state == NULL)
1215
		goto err_put_inode;
1216 1217
	if (data->o_res.delegation_type != 0)
		nfs4_opendata_check_deleg(data, state);
1218
	update_open_stateid(state, &data->o_res.stateid, NULL,
1219
			data->o_arg.fmode);
1220
	iput(inode);
1221
out:
1222
	nfs_release_seqid(data->o_arg.seqid);
1223
	return state;
1224 1225 1226 1227
err_put_inode:
	iput(inode);
err:
	return ERR_PTR(ret);
1228 1229
}

1230 1231 1232 1233 1234 1235 1236 1237
/*
 * Dispatch on the open claim type: NFS4_OPEN_CLAIM_PREVIOUS goes through
 * the reclaim variant, everything else through the regular one.
 */
static struct nfs4_state *
nfs4_opendata_to_nfs4_state(struct nfs4_opendata *data)
{
	if (data->o_arg.claim != NFS4_OPEN_CLAIM_PREVIOUS)
		return _nfs4_opendata_to_nfs4_state(data);
	return _nfs4_opendata_reclaim_to_nfs4_state(data);
}

1238 1239 1240 1241 1242 1243 1244 1245 1246 1247 1248 1249 1250 1251 1252 1253 1254
/*
 * Find the first open context on the inode's open_files list whose state
 * is @state. The list is walked under the inode's i_lock.
 *
 * Returns the context with a reference taken via get_nfs_open_context(),
 * or ERR_PTR(-ENOENT) if none matches.
 */
static struct nfs_open_context *nfs4_state_find_open_context(struct nfs4_state *state)
{
	struct nfs_inode *nfsi = NFS_I(state->inode);
	struct nfs_open_context *found = ERR_PTR(-ENOENT);
	struct nfs_open_context *ctx;

	spin_lock(&state->inode->i_lock);
	list_for_each_entry(ctx, &nfsi->open_files, list) {
		if (ctx->state == state) {
			get_nfs_open_context(ctx);
			found = ctx;
			break;
		}
	}
	spin_unlock(&state->inode->i_lock);
	return found;
}

1255 1256
static struct nfs4_opendata *nfs4_open_recoverdata_alloc(struct nfs_open_context *ctx,
		struct nfs4_state *state, enum open_claim_type4 claim)
T
Trond Myklebust 已提交
1257 1258 1259
{
	struct nfs4_opendata *opendata;

1260 1261
	opendata = nfs4_opendata_alloc(ctx->dentry, state->owner, 0, 0,
			NULL, claim, GFP_NOFS);
T
Trond Myklebust 已提交
1262 1263 1264 1265 1266 1267 1268
	if (opendata == NULL)
		return ERR_PTR(-ENOMEM);
	opendata->state = state;
	atomic_inc(&state->count);
	return opendata;
}

1269
/*
 * Re-issue an open for share mode @fmode as part of state recovery.
 *
 * Resets the open arguments and results in @opendata, runs the recovery
 * open, and converts the result to an nfs4_state. nfs4_close_state() is
 * called on that state for @fmode before the pointer is stored in *@res.
 *
 * Returns 0 on success, otherwise the error from the open or from the
 * state conversion (*@res is then left untouched).
 */
static int nfs4_open_recover_helper(struct nfs4_opendata *opendata, fmode_t fmode, struct nfs4_state **res)
{
	struct nfs4_state *recovered;
	int status;

	opendata->o_arg.open_flags = 0;
	opendata->o_arg.fmode = fmode;
	memset(&opendata->o_res, 0, sizeof(opendata->o_res));
	memset(&opendata->c_res, 0, sizeof(opendata->c_res));
	nfs4_init_opendata_res(opendata);

	status = _nfs4_recover_proc_open(opendata);
	if (status != 0)
		return status;

	recovered = nfs4_opendata_to_nfs4_state(opendata);
	if (IS_ERR(recovered))
		return PTR_ERR(recovered);

	nfs4_close_state(recovered, fmode);
	*res = recovered;
	return 0;
}

static int nfs4_open_recover(struct nfs4_opendata *opendata, struct nfs4_state *state)
{
	struct nfs4_state *newstate;
	int ret;

	/* memory barrier prior to reading state->n_* */
1296
	clear_bit(NFS_DELEGATED_STATE, &state->flags);
1297
	clear_bit(NFS_OPEN_STATE, &state->flags);
1298 1299
	smp_rmb();
	if (state->n_rdwr != 0) {
T
Trond Myklebust 已提交
1300
		clear_bit(NFS_O_RDWR_STATE, &state->flags);
1301
		ret = nfs4_open_recover_helper(opendata, FMODE_READ|FMODE_WRITE, &newstate);
1302 1303
		if (ret != 0)
			return ret;
1304 1305
		if (newstate != state)
			return -ESTALE;
1306 1307
	}
	if (state->n_wronly != 0) {
T
Trond Myklebust 已提交
1308
		clear_bit(NFS_O_WRONLY_STATE, &state->flags);
1309
		ret = nfs4_open_recover_helper(opendata, FMODE_WRITE, &newstate);
1310 1311
		if (ret != 0)
			return ret;
1312 1313
		if (newstate != state)
			return -ESTALE;
1314 1315
	}
	if (state->n_rdonly != 0) {
T
Trond Myklebust 已提交
1316
		clear_bit(NFS_O_RDONLY_STATE, &state->flags);
1317
		ret = nfs4_open_recover_helper(opendata, FMODE_READ, &newstate);
1318 1319
		if (ret != 0)
			return ret;
1320 1321
		if (newstate != state)
			return -ESTALE;
1322
	}
1323 1324 1325 1326 1327
	/*
	 * We may have performed cached opens for all three recoveries.
	 * Check if we need to update the current stateid.
	 */
	if (test_bit(NFS_DELEGATED_STATE, &state->flags) == 0 &&
1328
	    !nfs4_stateid_match(&state->stateid, &state->open_stateid)) {
1329
		write_seqlock(&state->seqlock);
1330
		if (test_bit(NFS_DELEGATED_STATE, &state->flags) == 0)
1331
			nfs4_stateid_copy(&state->stateid, &state->open_stateid);
1332
		write_sequnlock(&state->seqlock);
1333
	}
1334 1335 1336
	return 0;
}

L
Linus Torvalds 已提交
1337 1338 1339 1340
/*
 * OPEN_RECLAIM:
 * 	reclaim state on the server after a reboot.
 */
1341
static int _nfs4_do_open_reclaim(struct nfs_open_context *ctx, struct nfs4_state *state)
L
Linus Torvalds 已提交
1342
{
1343
	struct nfs_delegation *delegation;
1344
	struct nfs4_opendata *opendata;
1345
	fmode_t delegation_type = 0;
L
Linus Torvalds 已提交
1346 1347
	int status;

1348 1349
	opendata = nfs4_open_recoverdata_alloc(ctx, state,
			NFS4_OPEN_CLAIM_PREVIOUS);
T
Trond Myklebust 已提交
1350 1351
	if (IS_ERR(opendata))
		return PTR_ERR(opendata);
1352 1353
	rcu_read_lock();
	delegation = rcu_dereference(NFS_I(state->inode)->delegation);
1354
	if (delegation != NULL && test_bit(NFS_DELEGATION_NEED_RECLAIM, &delegation->flags) != 0)
1355
		delegation_type = delegation->type;
1356
	rcu_read_unlock();
1357 1358
	opendata->o_arg.u.delegation_type = delegation_type;
	status = nfs4_open_recover(opendata, state);
1359
	nfs4_opendata_put(opendata);
L
Linus Torvalds 已提交
1360 1361 1362
	return status;
}

1363
static int nfs4_do_open_reclaim(struct nfs_open_context *ctx, struct nfs4_state *state)
L
Linus Torvalds 已提交
1364 1365 1366 1367 1368
{
	struct nfs_server *server = NFS_SERVER(state->inode);
	struct nfs4_exception exception = { };
	int err;
	do {
1369
		err = _nfs4_do_open_reclaim(ctx, state);
1370 1371
		if (nfs4_clear_cap_atomic_open_v1(server, err, &exception))
			continue;
1372
		if (err != -NFS4ERR_DELAY)
1373 1374
			break;
		nfs4_handle_exception(server, err, &exception);
L
Linus Torvalds 已提交
1375 1376 1377 1378
	} while (exception.retry);
	return err;
}

1379 1380 1381 1382 1383 1384 1385
static int nfs4_open_reclaim(struct nfs4_state_owner *sp, struct nfs4_state *state)
{
	struct nfs_open_context *ctx;
	int ret;

	ctx = nfs4_state_find_open_context(state);
	if (IS_ERR(ctx))
1386
		return -EAGAIN;
1387
	ret = nfs4_do_open_reclaim(ctx, state);
1388 1389 1390 1391
	put_nfs_open_context(ctx);
	return ret;
}

1392
static int nfs4_handle_delegation_recall_error(struct nfs_server *server, struct nfs4_state *state, const nfs4_stateid *stateid, int err)
L
Linus Torvalds 已提交
1393
{
1394 1395 1396 1397 1398 1399 1400 1401 1402 1403 1404 1405 1406 1407 1408 1409 1410 1411 1412 1413 1414 1415 1416 1417 1418 1419
	switch (err) {
		default:
			printk(KERN_ERR "NFS: %s: unhandled error "
					"%d.\n", __func__, err);
		case 0:
		case -ENOENT:
		case -ESTALE:
			break;
		case -NFS4ERR_BADSESSION:
		case -NFS4ERR_BADSLOT:
		case -NFS4ERR_BAD_HIGH_SLOT:
		case -NFS4ERR_CONN_NOT_BOUND_TO_SESSION:
		case -NFS4ERR_DEADSESSION:
			set_bit(NFS_DELEGATED_STATE, &state->flags);
			nfs4_schedule_session_recovery(server->nfs_client->cl_session, err);
			return -EAGAIN;
		case -NFS4ERR_STALE_CLIENTID:
		case -NFS4ERR_STALE_STATEID:
			set_bit(NFS_DELEGATED_STATE, &state->flags);
		case -NFS4ERR_EXPIRED:
			/* Don't recall a delegation if it was lost */
			nfs4_schedule_lease_recovery(server->nfs_client);
			return -EAGAIN;
		case -NFS4ERR_DELEG_REVOKED:
		case -NFS4ERR_ADMIN_REVOKED:
		case -NFS4ERR_BAD_STATEID:
1420
		case -NFS4ERR_OPENMODE:
1421 1422 1423 1424 1425 1426 1427 1428 1429
			nfs_inode_find_state_and_recover(state->inode,
					stateid);
			nfs4_schedule_stateid_recovery(server, state);
			return 0;
		case -NFS4ERR_DELAY:
		case -NFS4ERR_GRACE:
			set_bit(NFS_DELEGATED_STATE, &state->flags);
			ssleep(1);
			return -EAGAIN;
1430 1431 1432 1433
		case -ENOMEM:
		case -NFS4ERR_DENIED:
			/* kill_proc(fl->fl_pid, SIGLOST, 1); */
			return 0;
1434
	}
L
Linus Torvalds 已提交
1435 1436 1437
	return err;
}

1438 1439 1440 1441 1442 1443 1444 1445 1446 1447 1448 1449 1450 1451 1452 1453
/*
 * Recover the opens of @state using claim NFS4_OPEN_CLAIM_DELEG_CUR_FH
 * with delegation stateid @stateid.
 *
 * Returns the allocation error if the opendata cannot be allocated,
 * otherwise the recovery result as translated by
 * nfs4_handle_delegation_recall_error().
 */
int nfs4_open_delegation_recall(struct nfs_open_context *ctx, struct nfs4_state *state, const nfs4_stateid *stateid)
{
	struct nfs_server *server = NFS_SERVER(state->inode);
	struct nfs4_opendata *opendata;
	int status;

	opendata = nfs4_open_recoverdata_alloc(ctx, state,
			NFS4_OPEN_CLAIM_DELEG_CUR_FH);
	if (IS_ERR(opendata))
		return PTR_ERR(opendata);

	nfs4_stateid_copy(&opendata->o_arg.u.delegation, stateid);
	status = nfs4_open_recover(opendata, state);
	nfs4_opendata_put(opendata);

	return nfs4_handle_delegation_recall_error(server, state, stateid, status);
}

1454 1455 1456 1457 1458
/*
 * rpc_call_done callback for OPEN_CONFIRM.
 *
 * Records the task status in data->rpc_status. On success it also copies
 * the confirmed stateid into the open result, confirms the owner's seqid,
 * renews the lease from data->timestamp and sets data->rpc_done.
 */
static void nfs4_open_confirm_done(struct rpc_task *task, void *calldata)
{
	struct nfs4_opendata *data = calldata;

	data->rpc_status = task->tk_status;
	if (data->rpc_status != 0)
		return;

	nfs4_stateid_copy(&data->o_res.stateid, &data->c_res.stateid);
	nfs_confirm_seqid(&data->owner->so_seqid, 0);
	renew_lease(data->o_res.server, data->timestamp);
	data->rpc_done = 1;
}

/*
 * rpc_release callback for OPEN_CONFIRM.
 *
 * Cleanup is only needed when the request was cancelled and the RPC
 * nevertheless completed (rpc_done set): the resulting state is then
 * obtained and closed again. The opendata reference is always dropped.
 */
static void nfs4_open_confirm_release(void *calldata)
{
	struct nfs4_opendata *data = calldata;
	struct nfs4_state *state;

	if (data->cancelled != 0 && data->rpc_done) {
		state = nfs4_opendata_to_nfs4_state(data);
		if (!IS_ERR(state))
			nfs4_close_state(state, data->o_arg.fmode);
	}
	nfs4_opendata_put(data);
}

/*
 * RPC callbacks for the OPEN_CONFIRM task started by
 * _nfs4_proc_open_confirm(); no rpc_call_prepare hook is set.
 */
static const struct rpc_call_ops nfs4_open_confirm_ops = {
	.rpc_call_done = nfs4_open_confirm_done,
	.rpc_release = nfs4_open_confirm_release,
};

/*
 * Note: On error, nfs4_proc_open_confirm will free the struct nfs4_opendata
 */
static int _nfs4_proc_open_confirm(struct nfs4_opendata *data)
{
	struct nfs_server *server = NFS_SERVER(data->dir->d_inode);
	struct rpc_task *task;
1497 1498 1499 1500 1501 1502
	struct  rpc_message msg = {
		.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_OPEN_CONFIRM],
		.rpc_argp = &data->c_arg,
		.rpc_resp = &data->c_res,
		.rpc_cred = data->owner->so_cred,
	};
T
Trond Myklebust 已提交
1503 1504
	struct rpc_task_setup task_setup_data = {
		.rpc_client = server->client,
1505
		.rpc_message = &msg,
T
Trond Myklebust 已提交
1506 1507
		.callback_ops = &nfs4_open_confirm_ops,
		.callback_data = data,
1508
		.workqueue = nfsiod_workqueue,
T
Trond Myklebust 已提交
1509 1510
		.flags = RPC_TASK_ASYNC,
	};
L
Linus Torvalds 已提交
1511 1512
	int status;

1513
	kref_get(&data->kref);
1514 1515
	data->rpc_done = 0;
	data->rpc_status = 0;
1516
	data->timestamp = jiffies;
T
Trond Myklebust 已提交
1517
	task = rpc_run_task(&task_setup_data);
1518
	if (IS_ERR(task))
1519 1520 1521 1522 1523 1524 1525
		return PTR_ERR(task);
	status = nfs4_wait_for_completion_rpc_task(task);
	if (status != 0) {
		data->cancelled = 1;
		smp_wmb();
	} else
		status = data->rpc_status;
1526
	rpc_put_task(task);
L
Linus Torvalds 已提交
1527 1528 1529
	return status;
}

1530
static void nfs4_open_prepare(struct rpc_task *task, void *calldata)
L
Linus Torvalds 已提交
1531
{
1532 1533
	struct nfs4_opendata *data = calldata;
	struct nfs4_state_owner *sp = data->owner;
1534
	struct nfs_client *clp = sp->so_server->nfs_client;
1535

1536
	if (nfs_wait_on_sequence(data->o_arg.seqid, task) != 0)
1537
		goto out_wait;
1538 1539 1540 1541 1542 1543 1544
	/*
	 * Check if we still need to send an OPEN call, or if we can use
	 * a delegation instead.
	 */
	if (data->state != NULL) {
		struct nfs_delegation *delegation;

1545
		if (can_open_cached(data->state, data->o_arg.fmode, data->o_arg.open_flags))
1546
			goto out_no_action;
1547 1548
		rcu_read_lock();
		delegation = rcu_dereference(NFS_I(data->state->inode)->delegation);
1549
		if (data->o_arg.claim != NFS4_OPEN_CLAIM_DELEGATE_CUR &&
1550
		    data->o_arg.claim != NFS4_OPEN_CLAIM_DELEG_CUR_FH &&
1551 1552
		    can_open_delegated(delegation, data->o_arg.fmode))
			goto unlock_no_action;
1553 1554
		rcu_read_unlock();
	}
1555
	/* Update client id. */
1556
	data->o_arg.clientid = clp->cl_clientid;
1557 1558 1559 1560
	switch (data->o_arg.claim) {
	case NFS4_OPEN_CLAIM_PREVIOUS:
	case NFS4_OPEN_CLAIM_DELEG_CUR_FH:
	case NFS4_OPEN_CLAIM_DELEG_PREV_FH:
1561
		data->o_arg.open_bitmap = &nfs4_open_noattr_bitmap[0];
1562 1563
	case NFS4_OPEN_CLAIM_FH:
		task->tk_msg.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_OPEN_NOATTR];
T
Trond Myklebust 已提交
1564 1565
		nfs_copy_fh(&data->o_res.fh, data->o_arg.fh);
	}
1566
	data->timestamp = jiffies;
1567
	if (nfs4_setup_sequence(data->o_arg.server,
1568
				&data->o_arg.seq_args,
1569 1570 1571
				&data->o_res.seq_res,
				task) != 0)
		nfs_release_seqid(data->o_arg.seqid);
1572 1573 1574 1575 1576 1577 1578 1579 1580 1581

	/* Set the create mode (note dependency on the session type) */
	data->o_arg.createmode = NFS4_CREATE_UNCHECKED;
	if (data->o_arg.open_flags & O_EXCL) {
		data->o_arg.createmode = NFS4_CREATE_EXCLUSIVE;
		if (nfs4_has_persistent_session(clp))
			data->o_arg.createmode = NFS4_CREATE_GUARDED;
		else if (clp->cl_mvops->minor_version > 0)
			data->o_arg.createmode = NFS4_CREATE_EXCLUSIVE4_1;
	}
1582
	return;
1583 1584
unlock_no_action:
	rcu_read_unlock();
1585 1586
out_no_action:
	task->tk_action = NULL;
1587
out_wait:
1588
	nfs4_sequence_done(task, &data->o_res.seq_res);
1589 1590
}

1591 1592 1593
static void nfs4_open_done(struct rpc_task *task, void *calldata)
{
	struct nfs4_opendata *data = calldata;
L
Linus Torvalds 已提交
1594

1595
	data->rpc_status = task->tk_status;
1596

1597 1598
	if (!nfs4_sequence_done(task, &data->o_res.seq_res))
		return;
1599

1600
	if (task->tk_status == 0) {
1601 1602
		if (data->o_res.f_attr->valid & NFS_ATTR_FATTR_TYPE) {
			switch (data->o_res.f_attr->mode & S_IFMT) {
1603 1604 1605
			case S_IFREG:
				break;
			case S_IFLNK:
1606
				data->rpc_status = -ELOOP;
1607 1608
				break;
			case S_IFDIR:
1609
				data->rpc_status = -EISDIR;
1610 1611
				break;
			default:
1612
				data->rpc_status = -ENOTDIR;
1613
			}
1614
		}
1615
		renew_lease(data->o_res.server, data->timestamp);
1616 1617
		if (!(data->o_res.rflags & NFS4_OPEN_RESULT_CONFIRM))
			nfs_confirm_seqid(&data->owner->so_seqid, 0);
1618
	}
1619
	data->rpc_done = 1;
1620
}
1621

1622 1623 1624 1625 1626 1627 1628 1629 1630
/*
 * rpc_release callback for OPEN.
 *
 * The open is undone (state obtained and closed again) only when the
 * request was cancelled, the RPC completed without error, and the server
 * did not ask for an OPEN_CONFIRM. The opendata reference is always
 * dropped.
 */
static void nfs4_open_release(void *calldata)
{
	struct nfs4_opendata *data = calldata;
	struct nfs4_state *state;

	if (data->cancelled != 0 &&
	    data->rpc_status == 0 && data->rpc_done &&
	    !(data->o_res.rflags & NFS4_OPEN_RESULT_CONFIRM)) {
		state = nfs4_opendata_to_nfs4_state(data);
		if (!IS_ERR(state))
			nfs4_close_state(state, data->o_arg.fmode);
	}
	nfs4_opendata_put(data);
}

/* RPC callbacks for the OPEN task started by nfs4_run_open_task(). */
static const struct rpc_call_ops nfs4_open_ops = {
	.rpc_call_prepare = nfs4_open_prepare,
	.rpc_call_done = nfs4_open_done,
	.rpc_release = nfs4_open_release,
};

1649
static int nfs4_run_open_task(struct nfs4_opendata *data, int isrecover)
1650 1651 1652 1653 1654 1655
{
	struct inode *dir = data->dir->d_inode;
	struct nfs_server *server = NFS_SERVER(dir);
	struct nfs_openargs *o_arg = &data->o_arg;
	struct nfs_openres *o_res = &data->o_res;
	struct rpc_task *task;
1656 1657 1658 1659 1660 1661
	struct rpc_message msg = {
		.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_OPEN],
		.rpc_argp = o_arg,
		.rpc_resp = o_res,
		.rpc_cred = data->owner->so_cred,
	};
T
Trond Myklebust 已提交
1662 1663
	struct rpc_task_setup task_setup_data = {
		.rpc_client = server->client,
1664
		.rpc_message = &msg,
T
Trond Myklebust 已提交
1665 1666
		.callback_ops = &nfs4_open_ops,
		.callback_data = data,
1667
		.workqueue = nfsiod_workqueue,
T
Trond Myklebust 已提交
1668 1669
		.flags = RPC_TASK_ASYNC,
	};
1670 1671
	int status;

1672
	nfs41_init_sequence(&o_arg->seq_args, &o_res->seq_res, 1);
1673
	kref_get(&data->kref);
1674 1675
	data->rpc_done = 0;
	data->rpc_status = 0;
1676
	data->cancelled = 0;
1677 1678
	data->is_recover = 0;
	if (isrecover) {
1679
		nfs4_set_sequence_privileged(&o_arg->seq_args);
1680 1681
		data->is_recover = 1;
	}
T
Trond Myklebust 已提交
1682
	task = rpc_run_task(&task_setup_data);
1683 1684 1685 1686 1687 1688 1689 1690 1691 1692 1693 1694 1695 1696 1697 1698 1699 1700 1701 1702 1703 1704 1705
        if (IS_ERR(task))
                return PTR_ERR(task);
        status = nfs4_wait_for_completion_rpc_task(task);
        if (status != 0) {
                data->cancelled = 1;
                smp_wmb();
        } else
                status = data->rpc_status;
        rpc_put_task(task);

	return status;
}

static int _nfs4_recover_proc_open(struct nfs4_opendata *data)
{
	struct inode *dir = data->dir->d_inode;
	struct nfs_openres *o_res = &data->o_res;
        int status;

	status = nfs4_run_open_task(data, 1);
	if (status != 0 || !data->rpc_done)
		return status;

1706 1707
	nfs_fattr_map_and_free_names(NFS_SERVER(dir), &data->f_attr);

1708 1709 1710 1711 1712 1713 1714 1715 1716
	if (o_res->rflags & NFS4_OPEN_RESULT_CONFIRM) {
		status = _nfs4_proc_open_confirm(data);
		if (status != 0)
			return status;
	}

	return status;
}

1717 1718
/*
 * Check the access result returned with an OPEN against the access the
 * caller actually needs, and cache that result for @cred.
 *
 * Returns 0 if the server reported no supported access modes (the check
 * is deferred) or if the required access is granted. Otherwise the state
 * is closed for @fmode and -EACCES is returned.
 */
static int nfs4_opendata_access(struct rpc_cred *cred,
				struct nfs4_opendata *opendata,
				struct nfs4_state *state, fmode_t fmode,
				int openflags)
{
	struct nfs_access_entry cache;
	u32 mask = 0;

	/* access call failed or for some reason the server doesn't
	 * support any access modes -- defer access call until later */
	if (opendata->o_res.access_supported == 0)
		return 0;

	/* don't check MAY_WRITE - a newly created file may not have
	 * write mode bits, but POSIX allows the creating process to write.
	 * use openflags to check for exec, because fmode won't
	 * always have FMODE_EXEC set when file open for exec. */
	if (openflags & __FMODE_EXEC)
		mask = MAY_EXEC;	/* ONLY check for exec rights */
	else if (fmode & FMODE_READ)
		mask = MAY_READ;

	cache.cred = cred;
	cache.jiffies = jiffies;
	nfs_access_set_mask(&cache, opendata->o_res.access_result);
	nfs_access_add_cache(state->inode, &cache);

	if ((mask & ~cache.mask & (MAY_READ | MAY_EXEC)) != 0) {
		/* even though OPEN succeeded, access is denied. Close the file */
		nfs4_close_state(state, fmode);
		return -EACCES;
	}
	return 0;
}

1754 1755 1756 1757 1758 1759 1760 1761 1762 1763 1764 1765
/*
 * Note: On error, nfs4_proc_open will free the struct nfs4_opendata
 */
static int _nfs4_proc_open(struct nfs4_opendata *data)
{
	struct inode *dir = data->dir->d_inode;
	struct nfs_server *server = NFS_SERVER(dir);
	struct nfs_openargs *o_arg = &data->o_arg;
	struct nfs_openres *o_res = &data->o_res;
	int status;

	status = nfs4_run_open_task(data, 0);
1766 1767 1768 1769 1770 1771
	if (!data->rpc_done)
		return status;
	if (status != 0) {
		if (status == -NFS4ERR_BADNAME &&
				!(o_arg->open_flags & O_CREAT))
			return -ENOENT;
1772
		return status;
1773
	}
1774

1775 1776
	nfs_fattr_map_and_free_names(server, &data->f_attr);

1777
	if (o_arg->open_flags & O_CREAT)
1778
		update_changeattr(dir, &o_res->cinfo);
T
Trond Myklebust 已提交
1779 1780
	if ((o_res->rflags & NFS4_OPEN_RESULT_LOCKTYPE_POSIX) == 0)
		server->caps &= ~NFS_CAP_POSIX_LOCK;
L
Linus Torvalds 已提交
1781
	if(o_res->rflags & NFS4_OPEN_RESULT_CONFIRM) {
1782
		status = _nfs4_proc_open_confirm(data);
L
Linus Torvalds 已提交
1783
		if (status != 0)
1784
			return status;
L
Linus Torvalds 已提交
1785 1786
	}
	if (!(o_res->f_attr->valid & NFS_ATTR_FATTR))
1787
		_nfs4_proc_getattr(server, &o_res->fh, o_res->f_attr);
1788
	return 0;
L
Linus Torvalds 已提交
1789 1790
}

A
Andy Adamson 已提交
1791 1792 1793 1794 1795
/*
 * Per-server convenience wrapper: forwards to
 * nfs4_client_recover_expired_lease() for the server's nfs_client.
 */
static int nfs4_recover_expired_lease(struct nfs_server *server)
{
	struct nfs_client *clp = server->nfs_client;

	return nfs4_client_recover_expired_lease(clp);
}

L
Linus Torvalds 已提交
1796 1797 1798 1799 1800
/*
 * OPEN_EXPIRED:
 * 	reclaim state on the server after a network partition.
 * 	Assumes caller holds the appropriate lock
 */
1801
static int _nfs4_open_expired(struct nfs_open_context *ctx, struct nfs4_state *state)
L
Linus Torvalds 已提交
1802
{
1803
	struct nfs4_opendata *opendata;
1804
	int ret;
L
Linus Torvalds 已提交
1805

1806
	opendata = nfs4_open_recoverdata_alloc(ctx, state,
1807
			NFS4_OPEN_CLAIM_FH);
T
Trond Myklebust 已提交
1808 1809
	if (IS_ERR(opendata))
		return PTR_ERR(opendata);
1810
	ret = nfs4_open_recover(opendata, state);
1811
	if (ret == -ESTALE)
1812
		d_drop(ctx->dentry);
1813
	nfs4_opendata_put(opendata);
1814
	return ret;
L
Linus Torvalds 已提交
1815 1816
}

1817
static int nfs4_do_open_expired(struct nfs_open_context *ctx, struct nfs4_state *state)
1818
{
1819
	struct nfs_server *server = NFS_SERVER(state->inode);
1820 1821 1822 1823
	struct nfs4_exception exception = { };
	int err;

	do {
1824
		err = _nfs4_open_expired(ctx, state);
1825 1826
		if (nfs4_clear_cap_atomic_open_v1(server, err, &exception))
			continue;
1827 1828 1829 1830 1831 1832 1833 1834
		switch (err) {
		default:
			goto out;
		case -NFS4ERR_GRACE:
		case -NFS4ERR_DELAY:
			nfs4_handle_exception(server, err, &exception);
			err = 0;
		}
1835
	} while (exception.retry);
1836
out:
1837 1838 1839
	return err;
}

L
Linus Torvalds 已提交
1840 1841 1842
static int nfs4_open_expired(struct nfs4_state_owner *sp, struct nfs4_state *state)
{
	struct nfs_open_context *ctx;
1843
	int ret;
L
Linus Torvalds 已提交
1844

1845 1846
	ctx = nfs4_state_find_open_context(state);
	if (IS_ERR(ctx))
1847
		return -EAGAIN;
1848
	ret = nfs4_do_open_expired(ctx, state);
1849 1850
	put_nfs_open_context(ctx);
	return ret;
L
Linus Torvalds 已提交
1851 1852
}

1853
#if defined(CONFIG_NFS_V4_1)
1854
static void nfs41_clear_delegation_stateid(struct nfs4_state *state)
1855 1856
{
	struct nfs_server *server = NFS_SERVER(state->inode);
1857 1858 1859 1860 1861 1862 1863 1864 1865 1866 1867 1868 1869
	nfs4_stateid *stateid = &state->stateid;
	int status;

	/* If a state reset has been done, test_stateid is unneeded */
	if (test_bit(NFS_DELEGATED_STATE, &state->flags) == 0)
		return;

	status = nfs41_test_stateid(server, stateid);
	if (status != NFS_OK) {
		/* Free the stateid unless the server explicitly
		 * informs us the stateid is unrecognized. */
		if (status != -NFS4ERR_BAD_STATEID)
			nfs41_free_stateid(server, stateid);
1870
		nfs_remove_bad_delegation(state->inode);
1871

1872 1873 1874
		write_seqlock(&state->seqlock);
		nfs4_stateid_copy(&state->stateid, &state->open_stateid);
		write_sequnlock(&state->seqlock);
1875 1876 1877 1878 1879 1880 1881 1882 1883 1884 1885 1886 1887 1888 1889
		clear_bit(NFS_DELEGATED_STATE, &state->flags);
	}
}

/**
 * nfs41_check_open_stateid - possibly free an open stateid
 *
 * @state: NFSv4 state for an inode
 *
 * Returns NFS_OK if recovery for this stateid is now finished.
 * Otherwise a negative NFS4ERR value is returned.
 */
static int nfs41_check_open_stateid(struct nfs4_state *state)
{
	struct nfs_server *server = NFS_SERVER(state->inode);
1890
	nfs4_stateid *stateid = &state->open_stateid;
1891 1892 1893 1894 1895 1896 1897 1898 1899 1900 1901 1902 1903 1904 1905 1906 1907 1908
	int status;

	/* If a state reset has been done, test_stateid is unneeded */
	if ((test_bit(NFS_O_RDONLY_STATE, &state->flags) == 0) &&
	    (test_bit(NFS_O_WRONLY_STATE, &state->flags) == 0) &&
	    (test_bit(NFS_O_RDWR_STATE, &state->flags) == 0))
		return -NFS4ERR_BAD_STATEID;

	status = nfs41_test_stateid(server, stateid);
	if (status != NFS_OK) {
		/* Free the stateid unless the server explicitly
		 * informs us the stateid is unrecognized. */
		if (status != -NFS4ERR_BAD_STATEID)
			nfs41_free_stateid(server, stateid);

		clear_bit(NFS_O_RDONLY_STATE, &state->flags);
		clear_bit(NFS_O_WRONLY_STATE, &state->flags);
		clear_bit(NFS_O_RDWR_STATE, &state->flags);
1909
		clear_bit(NFS_OPEN_STATE, &state->flags);
1910 1911 1912 1913 1914 1915
	}
	return status;
}

static int nfs41_open_expired(struct nfs4_state_owner *sp, struct nfs4_state *state)
{
1916
	int status;
1917

1918 1919
	nfs41_clear_delegation_stateid(state);
	status = nfs41_check_open_stateid(state);
1920 1921 1922
	if (status != NFS_OK)
		status = nfs4_open_expired(sp, state);
	return status;
1923 1924 1925
}
#endif

1926 1927 1928 1929 1930 1931 1932 1933 1934 1935 1936 1937 1938 1939 1940 1941
/*
 * On an EXCLUSIVE create, the server should send back a bitmask with the
 * FATTR4-* fields corresponding to attributes that were used to store the
 * verifier.  Make sure those fields get clobbered by the later setattr
 * call: request ATTR_ATIME / ATTR_MTIME unless the caller already asked
 * for an explicit time via ATTR_ATIME_SET / ATTR_MTIME_SET.
 */
static inline void nfs4_exclusive_attrset(struct nfs4_opendata *opendata, struct iattr *sattr)
{
	if (opendata->o_res.attrset[1] & FATTR4_WORD1_TIME_ACCESS) {
		if (!(sattr->ia_valid & ATTR_ATIME_SET))
			sattr->ia_valid |= ATTR_ATIME;
	}

	if (opendata->o_res.attrset[1] & FATTR4_WORD1_TIME_MODIFY) {
		if (!(sattr->ia_valid & ATTR_MTIME_SET))
			sattr->ia_valid |= ATTR_MTIME;
	}
}

1942 1943 1944 1945 1946 1947 1948 1949 1950 1951 1952 1953 1954 1955 1956 1957 1958 1959 1960 1961 1962 1963 1964 1965 1966 1967 1968 1969
/*
 * Issue the OPEN described by @opendata and convert the reply into an
 * nfs4_state.
 *
 * The owner's so_reclaim_seqcount is sampled before the OPEN is sent; if
 * it has changed by the time the state has been set up, stateid recovery
 * is scheduled for the new state.
 *
 * Returns 0 and stores the state in *res on success.  On failure a
 * non-zero status is returned and *res is left untouched.
 */
static int _nfs4_open_and_get_state(struct nfs4_opendata *opendata,
		fmode_t fmode,
		int flags,
		struct nfs4_state **res)
{
	struct nfs4_state_owner *sp = opendata->owner;
	struct nfs_server *server = sp->so_server;
	struct nfs4_state *state;
	unsigned int seq;
	int ret;

	seq = raw_seqcount_begin(&sp->so_reclaim_seqcount);

	ret = _nfs4_proc_open(opendata);
	if (ret != 0)
		return ret;

	state = nfs4_opendata_to_nfs4_state(opendata);
	if (IS_ERR(state))
		return PTR_ERR(state);
	if (server->caps & NFS_CAP_POSIX_LOCK)
		set_bit(NFS_STATE_POSIX_LOCKS, &state->flags);

	ret = nfs4_opendata_access(sp->so_cred, opendata, state, fmode, flags);
	if (ret != 0)
		return ret;

	/* The reclaim sequence moved while the OPEN was in flight */
	if (read_seqcount_retry(&sp->so_reclaim_seqcount, seq))
		nfs4_schedule_stateid_recovery(server, state);
	*res = state;
	return ret;
}

L
Linus Torvalds 已提交
1977
/*
1978
 * Returns a referenced nfs4_state
L
Linus Torvalds 已提交
1979
 */
1980 1981 1982 1983 1984 1985 1986 1987
static int _nfs4_do_open(struct inode *dir,
			struct dentry *dentry,
			fmode_t fmode,
			int flags,
			struct iattr *sattr,
			struct rpc_cred *cred,
			struct nfs4_state **res,
			struct nfs4_threshold **ctx_th)
L
Linus Torvalds 已提交
1988 1989 1990 1991
{
	struct nfs4_state_owner  *sp;
	struct nfs4_state     *state = NULL;
	struct nfs_server       *server = NFS_SERVER(dir);
1992
	struct nfs4_opendata *opendata;
1993
	enum open_claim_type4 claim = NFS4_OPEN_CLAIM_NULL;
1994
	int status;
L
Linus Torvalds 已提交
1995 1996 1997

	/* Protect against reboot recovery conflicts */
	status = -ENOMEM;
1998 1999
	sp = nfs4_get_state_owner(server, cred, GFP_KERNEL);
	if (sp == NULL) {
L
Linus Torvalds 已提交
2000 2001 2002
		dprintk("nfs4_do_open: nfs4_get_state_owner failed!\n");
		goto out_err;
	}
2003 2004
	status = nfs4_recover_expired_lease(server);
	if (status != 0)
2005
		goto err_put_state_owner;
2006 2007
	if (dentry->d_inode != NULL)
		nfs4_return_incompatible_delegation(dentry->d_inode, fmode);
2008
	status = -ENOMEM;
2009 2010
	if (dentry->d_inode)
		claim = NFS4_OPEN_CLAIM_FH;
2011
	opendata = nfs4_opendata_alloc(dentry, sp, fmode, flags, sattr,
2012
			claim, GFP_KERNEL);
2013
	if (opendata == NULL)
T
Trond Myklebust 已提交
2014
		goto err_put_state_owner;
L
Linus Torvalds 已提交
2015

2016 2017 2018 2019
	if (ctx_th && server->attr_bitmask[2] & FATTR4_WORD2_MDSTHRESHOLD) {
		opendata->f_attr.mdsthreshold = pnfs_mdsthreshold_alloc();
		if (!opendata->f_attr.mdsthreshold)
			goto err_opendata_put;
2020
		opendata->o_arg.open_bitmap = &nfs4_pnfs_open_bitmap[0];
2021
	}
2022 2023
	if (dentry->d_inode != NULL)
		opendata->state = nfs4_get_open_state(dentry->d_inode, sp);
2024

2025
	status = _nfs4_open_and_get_state(opendata, fmode, flags, &state);
2026 2027 2028
	if (status != 0)
		goto err_opendata_put;

2029 2030
	if ((opendata->o_arg.open_flags & O_EXCL) &&
	    (opendata->o_arg.createmode != NFS4_CREATE_GUARDED)) {
2031 2032 2033 2034 2035 2036 2037 2038 2039 2040
		nfs4_exclusive_attrset(opendata, sattr);

		nfs_fattr_init(opendata->o_res.f_attr);
		status = nfs4_do_setattr(state->inode, cred,
				opendata->o_res.f_attr, sattr,
				state);
		if (status == 0)
			nfs_setattr_update_inode(state->inode, sattr);
		nfs_post_op_update_inode(state->inode, opendata->o_res.f_attr);
	}
2041 2042 2043 2044 2045 2046 2047

	if (pnfs_use_threshold(ctx_th, opendata->f_attr.mdsthreshold, server))
		*ctx_th = opendata->f_attr.mdsthreshold;
	else
		kfree(opendata->f_attr.mdsthreshold);
	opendata->f_attr.mdsthreshold = NULL;

2048
	nfs4_opendata_put(opendata);
L
Linus Torvalds 已提交
2049 2050 2051
	nfs4_put_state_owner(sp);
	*res = state;
	return 0;
2052
err_opendata_put:
2053
	kfree(opendata->f_attr.mdsthreshold);
2054
	nfs4_opendata_put(opendata);
2055 2056
err_put_state_owner:
	nfs4_put_state_owner(sp);
L
Linus Torvalds 已提交
2057 2058 2059 2060 2061 2062
out_err:
	*res = NULL;
	return status;
}


2063 2064 2065 2066 2067 2068 2069
/*
 * Open @dentry in @dir, retrying _nfs4_do_open() for as long as the
 * exception state asks for a retry.
 *
 * Only the READ/WRITE/EXEC bits of @fmode are passed on.
 *
 * Returns the nfs4_state produced by _nfs4_do_open() on success, or an
 * ERR_PTR() built from the result of nfs4_handle_exception().
 */
static struct nfs4_state *nfs4_do_open(struct inode *dir,
					struct dentry *dentry,
					fmode_t fmode,
					int flags,
					struct iattr *sattr,
					struct rpc_cred *cred,
					struct nfs4_threshold **ctx_th)
{
	struct nfs_server *server = NFS_SERVER(dir);
	struct nfs4_exception exception = { };
	struct nfs4_state *res;
	int status;

	fmode &= FMODE_READ|FMODE_WRITE|FMODE_EXEC;
	do {
		status = _nfs4_do_open(dir, dentry, fmode, flags, sattr, cred,
				       &res, ctx_th);
		if (status == 0)
			break;
		/* NOTE: BAD_SEQID means the server and client disagree about the
		 * book-keeping w.r.t. state-changing operations
		 * (OPEN/CLOSE/LOCK/LOCKU...)
		 * It is actually a sign of a bug on the client or on the server.
		 *
		 * If we receive a BAD_SEQID error in the particular case of
		 * doing an OPEN, we assume that nfs_increment_open_seqid() will
		 * have unhashed the old state_owner for us, and that we can
		 * therefore safely retry using a new one. We should still warn
		 * the user though...
		 */
		if (status == -NFS4ERR_BAD_SEQID) {
			pr_warn_ratelimited("NFS: v4 server %s returned a bad sequence-id error!\n",
					server->nfs_client->cl_hostname);
			exception.retry = 1;
			continue;
		}
		/*
		 * BAD_STATEID on OPEN means that the server cancelled our
		 * state before it received the OPEN_CONFIRM.
		 * Recover by retrying the request as per the discussion
		 * on Page 181 of RFC3530.
		 */
		if (status == -NFS4ERR_BAD_STATEID) {
			exception.retry = 1;
			continue;
		}
		if (status == -EAGAIN) {
			/* We must have found a delegation */
			exception.retry = 1;
			continue;
		}
		if (nfs4_clear_cap_atomic_open_v1(server, status, &exception))
			continue;
		res = ERR_PTR(nfs4_handle_exception(server,
					status, &exception));
	} while (exception.retry);
	return res;
}

2123 2124 2125
static int _nfs4_do_setattr(struct inode *inode, struct rpc_cred *cred,
			    struct nfs_fattr *fattr, struct iattr *sattr,
			    struct nfs4_state *state)
L
Linus Torvalds 已提交
2126
{
2127
	struct nfs_server *server = NFS_SERVER(inode);
L
Linus Torvalds 已提交
2128
        struct nfs_setattrargs  arg = {
2129
                .fh             = NFS_FH(inode),
L
Linus Torvalds 已提交
2130 2131 2132 2133 2134 2135 2136 2137 2138
                .iap            = sattr,
		.server		= server,
		.bitmask = server->attr_bitmask,
        };
        struct nfs_setattrres  res = {
		.fattr		= fattr,
		.server		= server,
        };
        struct rpc_message msg = {
2139 2140 2141 2142
		.rpc_proc	= &nfs4_procedures[NFSPROC4_CLNT_SETATTR],
		.rpc_argp	= &arg,
		.rpc_resp	= &res,
		.rpc_cred	= cred,
L
Linus Torvalds 已提交
2143
        };
2144
	unsigned long timestamp = jiffies;
2145 2146
	fmode_t fmode;
	bool truncate;
2147
	int status;
L
Linus Torvalds 已提交
2148

2149
	nfs_fattr_init(fattr);
L
Linus Torvalds 已提交
2150

2151 2152 2153 2154 2155 2156 2157
	/* Servers should only apply open mode checks for file size changes */
	truncate = (sattr->ia_valid & ATTR_SIZE) ? true : false;
	fmode = truncate ? FMODE_WRITE : FMODE_READ;

	if (nfs4_copy_delegation_stateid(&arg.stateid, inode, fmode)) {
		/* Use that stateid */
	} else if (truncate && state != NULL && nfs4_valid_open_stateid(state)) {
2158 2159 2160 2161
		struct nfs_lockowner lockowner = {
			.l_owner = current->files,
			.l_pid = current->tgid,
		};
2162
		nfs4_select_rw_stateid(&arg.stateid, state, FMODE_WRITE,
2163
				&lockowner);
2164
	} else
2165
		nfs4_stateid_copy(&arg.stateid, &zero_stateid);
L
Linus Torvalds 已提交
2166

2167
	status = nfs4_call_sync(server->client, server, &msg, &arg.seq_args, &res.seq_res, 1);
2168 2169
	if (status == 0 && state != NULL)
		renew_lease(server, timestamp);
2170
	return status;
L
Linus Torvalds 已提交
2171 2172
}

2173 2174 2175
static int nfs4_do_setattr(struct inode *inode, struct rpc_cred *cred,
			   struct nfs_fattr *fattr, struct iattr *sattr,
			   struct nfs4_state *state)
L
Linus Torvalds 已提交
2176
{
2177
	struct nfs_server *server = NFS_SERVER(inode);
2178 2179
	struct nfs4_exception exception = {
		.state = state,
2180
		.inode = inode,
2181
	};
L
Linus Torvalds 已提交
2182 2183
	int err;
	do {
2184 2185 2186
		err = _nfs4_do_setattr(inode, cred, fattr, sattr, state);
		switch (err) {
		case -NFS4ERR_OPENMODE:
2187 2188 2189 2190 2191 2192 2193
			if (!(sattr->ia_valid & ATTR_SIZE)) {
				pr_warn_once("NFSv4: server %s is incorrectly "
						"applying open mode checks to "
						"a SETATTR that is not "
						"changing file size.\n",
						server->nfs_client->cl_hostname);
			}
2194 2195 2196 2197 2198 2199 2200 2201
			if (state && !(state->state & FMODE_WRITE)) {
				err = -EBADF;
				if (sattr->ia_valid & ATTR_OPEN)
					err = -EACCES;
				goto out;
			}
		}
		err = nfs4_handle_exception(server, err, &exception);
L
Linus Torvalds 已提交
2202
	} while (exception.retry);
2203
out:
L
Linus Torvalds 已提交
2204 2205 2206 2207 2208 2209 2210 2211
	return err;
}

struct nfs4_closedata {
	struct inode *inode;
	struct nfs4_state *state;
	struct nfs_closeargs arg;
	struct nfs_closeres res;
2212
	struct nfs_fattr fattr;
2213
	unsigned long timestamp;
F
Fred Isaman 已提交
2214 2215
	bool roc;
	u32 roc_barrier;
L
Linus Torvalds 已提交
2216 2217
};

2218
static void nfs4_free_closedata(void *data)
2219
{
2220 2221
	struct nfs4_closedata *calldata = data;
	struct nfs4_state_owner *sp = calldata->state->owner;
2222
	struct super_block *sb = calldata->state->inode->i_sb;
2223

F
Fred Isaman 已提交
2224 2225
	if (calldata->roc)
		pnfs_roc_release(calldata->state->inode);
2226 2227 2228
	nfs4_put_open_state(calldata->state);
	nfs_free_seqid(calldata->arg.seqid);
	nfs4_put_state_owner(sp);
2229
	nfs_sb_deactive(sb);
2230 2231 2232
	kfree(calldata);
}

2233 2234 2235 2236
/*
 * Update the open-mode flags of @state after a successful CLOSE or
 * OPEN_DOWNGRADE, where @fmode is the access mode that remains open.
 *
 * NFS_O_RDWR_STATE is always cleared.  If only write remains, the
 * read-only flag is cleared; if only read remains, the write-only flag is
 * cleared; if nothing remains, both are cleared together with
 * NFS_OPEN_STATE.  Runs under the state owner's so_lock.
 */
static void nfs4_close_clear_stateid_flags(struct nfs4_state *state,
		fmode_t fmode)
{
	spin_lock(&state->owner->so_lock);
	clear_bit(NFS_O_RDWR_STATE, &state->flags);
	switch (fmode & (FMODE_READ|FMODE_WRITE)) {
	case FMODE_WRITE:
		clear_bit(NFS_O_RDONLY_STATE, &state->flags);
		break;
	case FMODE_READ:
		clear_bit(NFS_O_WRONLY_STATE, &state->flags);
		break;
	case 0:
		clear_bit(NFS_O_RDONLY_STATE, &state->flags);
		clear_bit(NFS_O_WRONLY_STATE, &state->flags);
		clear_bit(NFS_OPEN_STATE, &state->flags);
		break;
	}
	spin_unlock(&state->owner->so_lock);
}

2253
static void nfs4_close_done(struct rpc_task *task, void *data)
L
Linus Torvalds 已提交
2254
{
2255
	struct nfs4_closedata *calldata = data;
L
Linus Torvalds 已提交
2256 2257 2258
	struct nfs4_state *state = calldata->state;
	struct nfs_server *server = NFS_SERVER(calldata->inode);

2259
	dprintk("%s: begin!\n", __func__);
2260 2261
	if (!nfs4_sequence_done(task, &calldata->res.seq_res))
		return;
L
Linus Torvalds 已提交
2262 2263 2264 2265 2266
        /* hmm. we are done with the inode, and in the process of freeing
	 * the state_owner. we keep this around to process errors
	 */
	switch (task->tk_status) {
		case 0:
F
Fred Isaman 已提交
2267 2268 2269
			if (calldata->roc)
				pnfs_roc_set_barrier(state->inode,
						     calldata->roc_barrier);
2270
			nfs_set_open_stateid(state, &calldata->res.stateid, 0);
2271
			renew_lease(server, calldata->timestamp);
2272 2273
			nfs4_close_clear_stateid_flags(state,
					calldata->arg.fmode);
L
Linus Torvalds 已提交
2274 2275
			break;
		case -NFS4ERR_STALE_STATEID:
2276 2277
		case -NFS4ERR_OLD_STATEID:
		case -NFS4ERR_BAD_STATEID:
L
Linus Torvalds 已提交
2278
		case -NFS4ERR_EXPIRED:
2279
			if (calldata->arg.fmode == 0)
2280
				break;
L
Linus Torvalds 已提交
2281
		default:
2282 2283
			if (nfs4_async_handle_error(task, server, state) == -EAGAIN)
				rpc_restart_call_prepare(task);
L
Linus Torvalds 已提交
2284
	}
2285
	nfs_release_seqid(calldata->arg.seqid);
2286
	nfs_refresh_inode(calldata->inode, calldata->res.fattr);
2287
	dprintk("%s: done, ret = %d!\n", __func__, task->tk_status);
L
Linus Torvalds 已提交
2288 2289
}

T
Trond Myklebust 已提交
2290
static void nfs4_close_prepare(struct rpc_task *task, void *data)
L
Linus Torvalds 已提交
2291
{
T
Trond Myklebust 已提交
2292
	struct nfs4_closedata *calldata = data;
2293
	struct nfs4_state *state = calldata->state;
2294
	struct inode *inode = calldata->inode;
2295
	int call_close = 0;
2296

2297
	dprintk("%s: begin!\n", __func__);
2298
	if (nfs_wait_on_sequence(calldata->arg.seqid, task) != 0)
2299
		goto out_wait;
2300

2301 2302
	task->tk_msg.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_OPEN_DOWNGRADE];
	calldata->arg.fmode = FMODE_READ|FMODE_WRITE;
2303
	spin_lock(&state->owner->so_lock);
2304
	/* Calculate the change in open mode */
2305
	if (state->n_rdwr == 0) {
2306
		if (state->n_rdonly == 0) {
2307 2308 2309
			call_close |= test_bit(NFS_O_RDONLY_STATE, &state->flags);
			call_close |= test_bit(NFS_O_RDWR_STATE, &state->flags);
			calldata->arg.fmode &= ~FMODE_READ;
2310 2311
		}
		if (state->n_wronly == 0) {
2312 2313 2314
			call_close |= test_bit(NFS_O_WRONLY_STATE, &state->flags);
			call_close |= test_bit(NFS_O_RDWR_STATE, &state->flags);
			calldata->arg.fmode &= ~FMODE_WRITE;
2315
		}
2316
	}
2317 2318
	if (!nfs4_valid_open_stateid(state))
		call_close = 0;
2319
	spin_unlock(&state->owner->so_lock);
2320 2321

	if (!call_close) {
2322
		/* Note: exit _without_ calling nfs4_close_done */
2323
		goto out_no_action;
2324
	}
2325

F
Fred Isaman 已提交
2326
	if (calldata->arg.fmode == 0) {
2327
		task->tk_msg.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_CLOSE];
F
Fred Isaman 已提交
2328
		if (calldata->roc &&
2329 2330
		    pnfs_roc_drain(inode, &calldata->roc_barrier, task)) {
			nfs_release_seqid(calldata->arg.seqid);
2331
			goto out_wait;
2332
		    }
F
Fred Isaman 已提交
2333
	}
2334

2335
	nfs_fattr_init(calldata->res.fattr);
2336
	calldata->timestamp = jiffies;
2337
	if (nfs4_setup_sequence(NFS_SERVER(inode),
2338 2339
				&calldata->arg.seq_args,
				&calldata->res.seq_res,
2340 2341
				task) != 0)
		nfs_release_seqid(calldata->arg.seqid);
2342
	dprintk("%s: done!\n", __func__);
2343 2344 2345 2346 2347
	return;
out_no_action:
	task->tk_action = NULL;
out_wait:
	nfs4_sequence_done(task, &calldata->res.seq_res);
L
Linus Torvalds 已提交
2348 2349
}

2350
static const struct rpc_call_ops nfs4_close_ops = {
T
Trond Myklebust 已提交
2351
	.rpc_call_prepare = nfs4_close_prepare,
2352 2353 2354 2355
	.rpc_call_done = nfs4_close_done,
	.rpc_release = nfs4_free_closedata,
};

L
Linus Torvalds 已提交
2356 2357 2358 2359 2360 2361 2362 2363 2364 2365 2366
/* 
 * It is possible for data to be read/written from a mem-mapped file 
 * after the sys_close call (which hits the vfs layer as a flush).
 * This means that we can't safely call nfsv4 close on a file until 
 * the inode is cleared. This in turn means that we are not good
 * NFSv4 citizens - we do not indicate to the server to update the file's 
 * share state even when we are done with one of the three share 
 * stateid's in the inode.
 *
 * NOTE: Caller must be holding the sp->so_owner semaphore!
 */
2367
int nfs4_do_close(struct nfs4_state *state, gfp_t gfp_mask, int wait)
L
Linus Torvalds 已提交
2368
{
2369
	struct nfs_server *server = NFS_SERVER(state->inode);
L
Linus Torvalds 已提交
2370
	struct nfs4_closedata *calldata;
2371 2372
	struct nfs4_state_owner *sp = state->owner;
	struct rpc_task *task;
2373 2374 2375 2376
	struct rpc_message msg = {
		.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_CLOSE],
		.rpc_cred = state->owner->so_cred,
	};
T
Trond Myklebust 已提交
2377 2378
	struct rpc_task_setup task_setup_data = {
		.rpc_client = server->client,
2379
		.rpc_message = &msg,
T
Trond Myklebust 已提交
2380
		.callback_ops = &nfs4_close_ops,
2381
		.workqueue = nfsiod_workqueue,
T
Trond Myklebust 已提交
2382 2383
		.flags = RPC_TASK_ASYNC,
	};
2384
	int status = -ENOMEM;
L
Linus Torvalds 已提交
2385

2386
	calldata = kzalloc(sizeof(*calldata), gfp_mask);
L
Linus Torvalds 已提交
2387
	if (calldata == NULL)
2388
		goto out;
2389
	nfs41_init_sequence(&calldata->arg.seq_args, &calldata->res.seq_res, 1);
2390
	calldata->inode = state->inode;
L
Linus Torvalds 已提交
2391
	calldata->state = state;
2392
	calldata->arg.fh = NFS_FH(state->inode);
2393
	calldata->arg.stateid = &state->open_stateid;
L
Linus Torvalds 已提交
2394
	/* Serialization for the sequence id */
2395
	calldata->arg.seqid = nfs_alloc_seqid(&state->owner->so_seqid, gfp_mask);
2396 2397
	if (calldata->arg.seqid == NULL)
		goto out_free_calldata;
2398
	calldata->arg.fmode = 0;
2399
	calldata->arg.bitmask = server->cache_consistency_bitmask;
2400
	calldata->res.fattr = &calldata->fattr;
2401
	calldata->res.seqid = calldata->arg.seqid;
2402
	calldata->res.server = server;
2403
	calldata->roc = pnfs_roc(state->inode);
2404
	nfs_sb_active(calldata->inode->i_sb);
2405

2406 2407
	msg.rpc_argp = &calldata->arg;
	msg.rpc_resp = &calldata->res;
T
Trond Myklebust 已提交
2408 2409
	task_setup_data.callback_data = calldata;
	task = rpc_run_task(&task_setup_data);
2410 2411
	if (IS_ERR(task))
		return PTR_ERR(task);
2412 2413 2414
	status = 0;
	if (wait)
		status = rpc_wait_for_completion_task(task);
2415
	rpc_put_task(task);
2416
	return status;
2417 2418 2419
out_free_calldata:
	kfree(calldata);
out:
2420 2421
	nfs4_put_open_state(state);
	nfs4_put_state_owner(sp);
2422
	return status;
L
Linus Torvalds 已提交
2423 2424
}

2425
static struct inode *
2426
nfs4_atomic_open(struct inode *dir, struct nfs_open_context *ctx, int open_flags, struct iattr *attr)
L
Linus Torvalds 已提交
2427 2428 2429
{
	struct nfs4_state *state;

T
Trond Myklebust 已提交
2430
	/* Protect against concurrent sillydeletes */
2431 2432
	state = nfs4_do_open(dir, ctx->dentry, ctx->mode, open_flags, attr,
			     ctx->cred, &ctx->mdsthreshold);
2433 2434
	if (IS_ERR(state))
		return ERR_CAST(state);
2435
	ctx->state = state;
2436
	return igrab(state->inode);
L
Linus Torvalds 已提交
2437 2438
}

2439
static void nfs4_close_context(struct nfs_open_context *ctx, int is_sync)
T
Trond Myklebust 已提交
2440 2441 2442 2443
{
	if (ctx->state == NULL)
		return;
	if (is_sync)
2444
		nfs4_close_sync(ctx->state, ctx->mode);
T
Trond Myklebust 已提交
2445
	else
2446
		nfs4_close_state(ctx->state, ctx->mode);
T
Trond Myklebust 已提交
2447
}
L
Linus Torvalds 已提交
2448 2449 2450

static int _nfs4_server_capabilities(struct nfs_server *server, struct nfs_fh *fhandle)
{
B
Benny Halevy 已提交
2451 2452 2453
	struct nfs4_server_caps_arg args = {
		.fhandle = fhandle,
	};
L
Linus Torvalds 已提交
2454 2455 2456
	struct nfs4_server_caps_res res = {};
	struct rpc_message msg = {
		.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_SERVER_CAPS],
B
Benny Halevy 已提交
2457
		.rpc_argp = &args,
L
Linus Torvalds 已提交
2458 2459 2460 2461
		.rpc_resp = &res,
	};
	int status;

2462
	status = nfs4_call_sync(server->client, server, &msg, &args.seq_args, &res.seq_res, 0);
L
Linus Torvalds 已提交
2463 2464
	if (status == 0) {
		memcpy(server->attr_bitmask, res.attr_bitmask, sizeof(server->attr_bitmask));
2465 2466 2467 2468 2469
		server->caps &= ~(NFS_CAP_ACLS|NFS_CAP_HARDLINKS|
				NFS_CAP_SYMLINKS|NFS_CAP_FILEID|
				NFS_CAP_MODE|NFS_CAP_NLINK|NFS_CAP_OWNER|
				NFS_CAP_OWNER_GROUP|NFS_CAP_ATIME|
				NFS_CAP_CTIME|NFS_CAP_MTIME);
L
Linus Torvalds 已提交
2470 2471 2472 2473 2474 2475
		if (res.attr_bitmask[0] & FATTR4_WORD0_ACL)
			server->caps |= NFS_CAP_ACLS;
		if (res.has_links != 0)
			server->caps |= NFS_CAP_HARDLINKS;
		if (res.has_symlinks != 0)
			server->caps |= NFS_CAP_SYMLINKS;
2476 2477 2478 2479 2480 2481 2482 2483 2484 2485 2486 2487 2488 2489 2490 2491 2492
		if (res.attr_bitmask[0] & FATTR4_WORD0_FILEID)
			server->caps |= NFS_CAP_FILEID;
		if (res.attr_bitmask[1] & FATTR4_WORD1_MODE)
			server->caps |= NFS_CAP_MODE;
		if (res.attr_bitmask[1] & FATTR4_WORD1_NUMLINKS)
			server->caps |= NFS_CAP_NLINK;
		if (res.attr_bitmask[1] & FATTR4_WORD1_OWNER)
			server->caps |= NFS_CAP_OWNER;
		if (res.attr_bitmask[1] & FATTR4_WORD1_OWNER_GROUP)
			server->caps |= NFS_CAP_OWNER_GROUP;
		if (res.attr_bitmask[1] & FATTR4_WORD1_TIME_ACCESS)
			server->caps |= NFS_CAP_ATIME;
		if (res.attr_bitmask[1] & FATTR4_WORD1_TIME_METADATA)
			server->caps |= NFS_CAP_CTIME;
		if (res.attr_bitmask[1] & FATTR4_WORD1_TIME_MODIFY)
			server->caps |= NFS_CAP_MTIME;

2493 2494 2495
		memcpy(server->cache_consistency_bitmask, res.attr_bitmask, sizeof(server->cache_consistency_bitmask));
		server->cache_consistency_bitmask[0] &= FATTR4_WORD0_CHANGE|FATTR4_WORD0_SIZE;
		server->cache_consistency_bitmask[1] &= FATTR4_WORD1_TIME_METADATA|FATTR4_WORD1_TIME_MODIFY;
L
Linus Torvalds 已提交
2496
		server->acl_bitmask = res.acl_bitmask;
2497
		server->fh_expire_type = res.fh_expire_type;
L
Linus Torvalds 已提交
2498
	}
A
Andy Adamson 已提交
2499

L
Linus Torvalds 已提交
2500 2501 2502
	return status;
}

2503
int nfs4_server_capabilities(struct nfs_server *server, struct nfs_fh *fhandle)
L
Linus Torvalds 已提交
2504 2505 2506 2507 2508 2509 2510 2511 2512 2513 2514 2515 2516 2517 2518 2519 2520 2521 2522
{
	struct nfs4_exception exception = { };
	int err;
	do {
		err = nfs4_handle_exception(server,
				_nfs4_server_capabilities(server, fhandle),
				&exception);
	} while (exception.retry);
	return err;
}

static int _nfs4_lookup_root(struct nfs_server *server, struct nfs_fh *fhandle,
		struct nfs_fsinfo *info)
{
	struct nfs4_lookup_root_arg args = {
		.bitmask = nfs4_fattr_bitmap,
	};
	struct nfs4_lookup_res res = {
		.server = server,
2523
		.fattr = info->fattr,
L
Linus Torvalds 已提交
2524 2525 2526 2527 2528 2529 2530
		.fh = fhandle,
	};
	struct rpc_message msg = {
		.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_LOOKUP_ROOT],
		.rpc_argp = &args,
		.rpc_resp = &res,
	};
2531

2532
	nfs_fattr_init(info->fattr);
2533
	return nfs4_call_sync(server->client, server, &msg, &args.seq_args, &res.seq_res, 0);
L
Linus Torvalds 已提交
2534 2535 2536 2537 2538 2539 2540 2541
}

/*
 * LOOKUP_ROOT with retry handling.  Success and -NFS4ERR_WRONGSEC are
 * returned to the caller as-is; every other status goes through
 * nfs4_handle_exception().
 */
static int nfs4_lookup_root(struct nfs_server *server, struct nfs_fh *fhandle,
		struct nfs_fsinfo *info)
{
	struct nfs4_exception exception = { };
	int err;

	do {
		err = _nfs4_lookup_root(server, fhandle, info);
		if (err == 0 || err == -NFS4ERR_WRONGSEC)
			break;
		err = nfs4_handle_exception(server, err, &exception);
	} while (exception.retry);
	return err;
}

2555 2556 2557 2558 2559 2560 2561
/*
 * Try the pseudoroot lookup with security flavor @flavor.
 *
 * Returns -EACCES if the auth handle for @flavor cannot be created,
 * otherwise the result of nfs4_lookup_root().
 */
static int nfs4_lookup_root_sec(struct nfs_server *server, struct nfs_fh *fhandle,
				struct nfs_fsinfo *info, rpc_authflavor_t flavor)
{
	struct rpc_auth *auth;

	auth = rpcauth_create(flavor, server->client);
	if (IS_ERR(auth))
		return -EACCES;
	return nfs4_lookup_root(server, fhandle, info);
}

2571 2572 2573 2574 2575 2576 2577 2578 2579
/*
 * Retry pseudoroot lookup with various security flavors.  We do this when:
 *
 *   NFSv4.0: the PUTROOTFH operation returns NFS4ERR_WRONGSEC
 *   NFSv4.1: the server does not support the SECINFO_NO_NAME operation
 *
 * Returns zero on success, or a negative NFS4ERR value, or a
 * negative errno value.
 */
2580
static int nfs4_find_root_sec(struct nfs_server *server, struct nfs_fh *fhandle,
2581
			      struct nfs_fsinfo *info)
L
Linus Torvalds 已提交
2582
{
2583 2584 2585 2586 2587
	/* Per 3530bis 15.33.5 */
	static const rpc_authflavor_t flav_array[] = {
		RPC_AUTH_GSS_KRB5P,
		RPC_AUTH_GSS_KRB5I,
		RPC_AUTH_GSS_KRB5,
2588
		RPC_AUTH_UNIX,			/* courtesy */
2589 2590 2591 2592
		RPC_AUTH_NULL,
	};
	int status = -EPERM;
	size_t i;
C
Chuck Lever 已提交
2593

2594
	for (i = 0; i < ARRAY_SIZE(flav_array); i++) {
2595
		status = nfs4_lookup_root_sec(server, fhandle, info, flav_array[i]);
2596
		if (status == -NFS4ERR_WRONGSEC || status == -EACCES)
2597 2598
			continue;
		break;
2599
	}
2600

2601 2602 2603 2604 2605 2606 2607 2608 2609
	/*
	 * -EACCESS could mean that the user doesn't have correct permissions
	 * to access the mount.  It could also mean that we tried to mount
	 * with a gss auth flavor, but rpc.gssd isn't running.  Either way,
	 * existing mount programs don't handle -EACCES very well so it should
	 * be mapped to -EPERM instead.
	 */
	if (status == -EACCES)
		status = -EPERM;
2610 2611 2612
	return status;
}

C
Chuck Lever 已提交
2613 2614 2615 2616 2617 2618 2619 2620 2621 2622 2623 2624 2625 2626
/*
 * Dispatch the security-flavor search to the find_root_sec method of the
 * minor-version operations selected by the client's cl_minorversion.
 */
static int nfs4_do_find_root_sec(struct nfs_server *server,
		struct nfs_fh *fhandle, struct nfs_fsinfo *info)
{
	int minor = server->nfs_client->cl_minorversion;

	return nfs_v4_minor_ops[minor]->find_root_sec(server, fhandle, info);
}

/**
 * nfs4_proc_get_rootfh - get file handle for server's pseudoroot
 * @server: initialized nfs_server handle
 * @fhandle: we fill in the pseudo-fs root file handle
 * @info: we fill in an FSINFO struct
 *
 * Returns zero on success, or a negative errno.
2627
 */
2628 2629
int nfs4_proc_get_rootfh(struct nfs_server *server, struct nfs_fh *fhandle,
			 struct nfs_fsinfo *info)
2630
{
C
Chuck Lever 已提交
2631 2632 2633 2634 2635 2636 2637
	int status;

	status = nfs4_lookup_root(server, fhandle, info);
	if ((status == -NFS4ERR_WRONGSEC) &&
	    !(server->flags & NFS_MOUNT_SECFLAVOUR))
		status = nfs4_do_find_root_sec(server, fhandle, info);

L
Linus Torvalds 已提交
2638 2639 2640 2641
	if (status == 0)
		status = nfs4_server_capabilities(server, fhandle);
	if (status == 0)
		status = nfs4_do_fsinfo(server, fhandle, info);
C
Chuck Lever 已提交
2642

2643
	return nfs4_map_errors(status);
L
Linus Torvalds 已提交
2644 2645
}

2646 2647 2648 2649 2650 2651 2652 2653 2654 2655 2656 2657 2658 2659 2660 2661 2662 2663 2664 2665 2666 2667 2668 2669 2670
/*
 * Fetch the server capabilities and the attributes of @mntfh, then adopt
 * the returned fsid as the server's fsid if it is valid and differs from
 * the current one.
 *
 * Returns a negative error from either call, otherwise the (non-negative)
 * result of the getattr.
 */
static int nfs4_proc_get_root(struct nfs_server *server, struct nfs_fh *mntfh,
			      struct nfs_fsinfo *info)
{
	struct nfs_fattr *fattr = info->fattr;
	int error;

	error = nfs4_server_capabilities(server, mntfh);
	if (error < 0) {
		dprintk("nfs4_get_root: getcaps error = %d\n", -error);
		goto out;
	}

	error = nfs4_proc_getattr(server, mntfh, fattr);
	if (error < 0) {
		dprintk("nfs4_get_root: getattr error = %d\n", -error);
		goto out;
	}

	if ((fattr->valid & NFS_ATTR_FATTR_FSID) &&
	    !nfs_fsid_equal(&server->fsid, &fattr->fsid))
		memcpy(&server->fsid, &fattr->fsid, sizeof(server->fsid));
out:
	return error;
}

M
Manoj Naik 已提交
2671 2672 2673 2674 2675
/*
 * Get locations and (maybe) other attributes of a referral.
 * Note that we'll actually follow the referral later when
 * we detect fsid mismatch in inode revalidation
 */
2676 2677 2678
static int nfs4_get_referral(struct rpc_clnt *client, struct inode *dir,
			     const struct qstr *name, struct nfs_fattr *fattr,
			     struct nfs_fh *fhandle)
M
Manoj Naik 已提交
2679 2680 2681 2682 2683 2684 2685 2686 2687 2688 2689 2690
{
	int status = -ENOMEM;
	struct page *page = NULL;
	struct nfs4_fs_locations *locations = NULL;

	page = alloc_page(GFP_KERNEL);
	if (page == NULL)
		goto out;
	locations = kmalloc(sizeof(struct nfs4_fs_locations), GFP_KERNEL);
	if (locations == NULL)
		goto out;

2691
	status = nfs4_proc_fs_locations(client, dir, name, locations, page);
M
Manoj Naik 已提交
2692 2693 2694 2695
	if (status != 0)
		goto out;
	/* Make sure server returned a different fsid for the referral */
	if (nfs_fsid_equal(&NFS_SERVER(dir)->fsid, &locations->fattr.fsid)) {
2696 2697
		dprintk("%s: server did not return a different fsid for"
			" a referral at %s\n", __func__, name->name);
M
Manoj Naik 已提交
2698 2699 2700
		status = -EIO;
		goto out;
	}
2701 2702
	/* Fixup attributes for the nfs_lookup() call to nfs_fhget() */
	nfs_fixup_referral_attributes(&locations->fattr);
M
Manoj Naik 已提交
2703

2704
	/* replace the lookup nfs_fattr with the locations nfs_fattr */
M
Manoj Naik 已提交
2705 2706 2707 2708 2709
	memcpy(fattr, &locations->fattr, sizeof(struct nfs_fattr));
	memset(fhandle, 0, sizeof(struct nfs_fh));
out:
	if (page)
		__free_page(page);
2710
	kfree(locations);
M
Manoj Naik 已提交
2711 2712 2713
	return status;
}

L
Linus Torvalds 已提交
2714 2715 2716 2717 2718 2719 2720 2721 2722 2723 2724 2725 2726 2727 2728 2729
/*
 * Issue a single GETATTR for @fhandle, requesting the server's supported
 * attribute bitmask.  @fattr is reinitialised before the call.
 */
static int _nfs4_proc_getattr(struct nfs_server *server, struct nfs_fh *fhandle, struct nfs_fattr *fattr)
{
	struct nfs4_getattr_arg args = {
		.fh = fhandle,
		.bitmask = server->attr_bitmask,
	};
	struct nfs4_getattr_res res = {
		.fattr = fattr,
		.server = server,
	};
	struct rpc_message msg = {
		.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_GETATTR],
		.rpc_argp = &args,
		.rpc_resp = &res,
	};

	nfs_fattr_init(fattr);
	return nfs4_call_sync(server->client, server, &msg, &args.seq_args, &res.seq_res, 0);
}

/*
 * Retrying wrapper around _nfs4_proc_getattr().  Returns the result of
 * nfs4_handle_exception() for the last attempt.
 */
static int nfs4_proc_getattr(struct nfs_server *server, struct nfs_fh *fhandle, struct nfs_fattr *fattr)
{
	struct nfs4_exception exception = { };
	int err;

	do {
		err = _nfs4_proc_getattr(server, fhandle, fattr);
		err = nfs4_handle_exception(server, err, &exception);
	} while (exception.retry);
	return err;
}

/* 
 * The file is not closed if it is opened due to the a request to change
 * the size of the file. The open call will not be needed once the
 * VFS layer lookup-intents are implemented.
 *
 * Close is called when the inode is destroyed.
 * If we haven't opened the file for O_WRONLY, we
 * need to in the size_change case to obtain a stateid.
 *
 * Got race?
 * Because OPEN is always done by name in nfsv4, it is
 * possible that we opened a different file by the same
 * name.  We can recognize this race condition, but we
 * can't do anything about it besides returning an error.
 *
 * This will be fixed with VFS changes (lookup-intent).
 */
static int
nfs4_proc_setattr(struct dentry *dentry, struct nfs_fattr *fattr,
		  struct iattr *sattr)
{
2767
	struct inode *inode = dentry->d_inode;
2768
	struct rpc_cred *cred = NULL;
2769
	struct nfs4_state *state = NULL;
L
Linus Torvalds 已提交
2770 2771
	int status;

B
Benny Halevy 已提交
2772
	if (pnfs_ld_layoutret_on_setattr(inode))
2773
		pnfs_commit_and_return_layout(inode);
B
Benny Halevy 已提交
2774

2775
	nfs_fattr_init(fattr);
L
Linus Torvalds 已提交
2776
	
2777 2778 2779 2780 2781 2782 2783 2784
	/* Deal with open(O_TRUNC) */
	if (sattr->ia_valid & ATTR_OPEN)
		sattr->ia_valid &= ~(ATTR_MTIME|ATTR_CTIME|ATTR_OPEN);

	/* Optimization: if the end result is no change, don't RPC */
	if ((sattr->ia_valid & ~(ATTR_FILE)) == 0)
		return 0;

2785
	/* Search for an existing open(O_WRITE) file */
2786 2787 2788 2789
	if (sattr->ia_valid & ATTR_FILE) {
		struct nfs_open_context *ctx;

		ctx = nfs_file_open_context(sattr->ia_file);
N
Neil Brown 已提交
2790 2791 2792 2793
		if (ctx) {
			cred = ctx->cred;
			state = ctx->state;
		}
2794
	}
2795

2796
	status = nfs4_do_setattr(inode, cred, fattr, sattr, state);
2797 2798
	if (status == 0)
		nfs_setattr_update_inode(inode, sattr);
L
Linus Torvalds 已提交
2799 2800 2801
	return status;
}

2802 2803 2804
static int _nfs4_proc_lookup(struct rpc_clnt *clnt, struct inode *dir,
		const struct qstr *name, struct nfs_fh *fhandle,
		struct nfs_fattr *fattr)
D
David Howells 已提交
2805
{
2806
	struct nfs_server *server = NFS_SERVER(dir);
D
David Howells 已提交
2807 2808 2809
	int		       status;
	struct nfs4_lookup_arg args = {
		.bitmask = server->attr_bitmask,
2810
		.dir_fh = NFS_FH(dir),
D
David Howells 已提交
2811 2812 2813 2814 2815 2816 2817 2818 2819 2820 2821 2822 2823 2824 2825
		.name = name,
	};
	struct nfs4_lookup_res res = {
		.server = server,
		.fattr = fattr,
		.fh = fhandle,
	};
	struct rpc_message msg = {
		.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_LOOKUP],
		.rpc_argp = &args,
		.rpc_resp = &res,
	};

	nfs_fattr_init(fattr);

L
Linus Torvalds 已提交
2826
	dprintk("NFS call  lookup %s\n", name->name);
2827
	status = nfs4_call_sync(clnt, server, &msg, &args.seq_args, &res.seq_res, 0);
L
Linus Torvalds 已提交
2828 2829 2830 2831
	dprintk("NFS reply lookup: %d\n", status);
	return status;
}

2832
static void nfs_fixup_secinfo_attributes(struct nfs_fattr *fattr)
2833 2834
{
	fattr->valid |= NFS_ATTR_FATTR_TYPE | NFS_ATTR_FATTR_MODE |
2835
		NFS_ATTR_FATTR_NLINK | NFS_ATTR_FATTR_MOUNTPOINT;
2836 2837 2838 2839
	fattr->mode = S_IFDIR | S_IRUGO | S_IXUGO;
	fattr->nlink = 2;
}

2840 2841 2842
static int nfs4_proc_lookup_common(struct rpc_clnt **clnt, struct inode *dir,
				   struct qstr *name, struct nfs_fh *fhandle,
				   struct nfs_fattr *fattr)
L
Linus Torvalds 已提交
2843 2844
{
	struct nfs4_exception exception = { };
2845
	struct rpc_clnt *client = *clnt;
L
Linus Torvalds 已提交
2846 2847
	int err;
	do {
2848 2849
		err = _nfs4_proc_lookup(client, dir, name, fhandle, fattr);
		switch (err) {
2850
		case -NFS4ERR_BADNAME:
2851 2852
			err = -ENOENT;
			goto out;
2853
		case -NFS4ERR_MOVED:
2854
			err = nfs4_get_referral(client, dir, name, fattr, fhandle);
2855
			goto out;
2856
		case -NFS4ERR_WRONGSEC:
2857 2858 2859 2860 2861 2862 2863 2864 2865 2866 2867 2868
			err = -EPERM;
			if (client != *clnt)
				goto out;

			client = nfs4_create_sec_client(client, dir, name);
			if (IS_ERR(client))
				return PTR_ERR(client);

			exception.retry = 1;
			break;
		default:
			err = nfs4_handle_exception(NFS_SERVER(dir), err, &exception);
2869
		}
L
Linus Torvalds 已提交
2870
	} while (exception.retry);
2871 2872 2873 2874 2875 2876 2877

out:
	if (err == 0)
		*clnt = client;
	else if (client != *clnt)
		rpc_shutdown_client(client);

L
Linus Torvalds 已提交
2878 2879 2880
	return err;
}

2881
/*
 * Look up @name in @dir, filling in @fhandle and @fattr.
 *
 * If nfs4_proc_lookup_common() ended up on a client other than
 * NFS_CLIENT(dir), that client is shut down here and @fattr is patched
 * by nfs_fixup_secinfo_attributes().  Returns the status of
 * nfs4_proc_lookup_common().
 */
static int nfs4_proc_lookup(struct inode *dir, struct qstr *name,
			    struct nfs_fh *fhandle, struct nfs_fattr *fattr)
{
	int status;
	struct rpc_clnt *client = NFS_CLIENT(dir);

	status = nfs4_proc_lookup_common(&client, dir, name, fhandle, fattr);
	if (client != NFS_CLIENT(dir)) {
		rpc_shutdown_client(client);
		nfs_fixup_secinfo_attributes(fattr);
	}
	return status;
}

2895 2896 2897 2898 2899 2900 2901 2902 2903 2904 2905 2906 2907 2908 2909
/*
 * Look up @name in @dir and return an RPC client for the caller to use
 * with the result.
 *
 * The lookup runs on NFS_CLIENT(dir).  If nfs4_proc_lookup_common()
 * replaced that client with one it created, the replacement is returned.
 * Otherwise a clone of NFS_CLIENT(dir) is returned.
 *
 * The clone is made only after the lookup has finished.  Cloning first
 * had two defects: the result of rpc_clone_client() was used without
 * being checked, and the clone was leaked whenever the lookup succeeded
 * on a replacement client, because the only pointer to it was
 * overwritten.
 *
 * Returns the client on success, or an ERR_PTR() value if the lookup or
 * the clone fails.
 */
struct rpc_clnt *
nfs4_proc_lookup_mountpoint(struct inode *dir, struct qstr *name,
			    struct nfs_fh *fhandle, struct nfs_fattr *fattr)
{
	struct rpc_clnt *client = NFS_CLIENT(dir);
	int status;

	/* On failure the helper has already released any client it created */
	status = nfs4_proc_lookup_common(&client, dir, name, fhandle, fattr);
	if (status < 0)
		return ERR_PTR(status);

	/* A replacement client is handed to the caller as is */
	if (client != NFS_CLIENT(dir))
		return client;

	return rpc_clone_client(client);
}

L
Linus Torvalds 已提交
2910 2911
static int _nfs4_proc_access(struct inode *inode, struct nfs_access_entry *entry)
{
2912
	struct nfs_server *server = NFS_SERVER(inode);
L
Linus Torvalds 已提交
2913 2914
	struct nfs4_accessargs args = {
		.fh = NFS_FH(inode),
2915
		.bitmask = server->cache_consistency_bitmask,
2916 2917 2918
	};
	struct nfs4_accessres res = {
		.server = server,
L
Linus Torvalds 已提交
2919 2920 2921 2922 2923 2924 2925 2926 2927 2928 2929 2930 2931 2932 2933 2934 2935 2936 2937 2938 2939 2940 2941 2942 2943 2944
	};
	struct rpc_message msg = {
		.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_ACCESS],
		.rpc_argp = &args,
		.rpc_resp = &res,
		.rpc_cred = entry->cred,
	};
	int mode = entry->mask;
	int status;

	/*
	 * Determine which access bits we want to ask for...
	 */
	if (mode & MAY_READ)
		args.access |= NFS4_ACCESS_READ;
	if (S_ISDIR(inode->i_mode)) {
		if (mode & MAY_WRITE)
			args.access |= NFS4_ACCESS_MODIFY | NFS4_ACCESS_EXTEND | NFS4_ACCESS_DELETE;
		if (mode & MAY_EXEC)
			args.access |= NFS4_ACCESS_LOOKUP;
	} else {
		if (mode & MAY_WRITE)
			args.access |= NFS4_ACCESS_MODIFY | NFS4_ACCESS_EXTEND;
		if (mode & MAY_EXEC)
			args.access |= NFS4_ACCESS_EXECUTE;
	}
2945 2946 2947 2948 2949

	res.fattr = nfs_alloc_fattr();
	if (res.fattr == NULL)
		return -ENOMEM;

2950
	status = nfs4_call_sync(server->client, server, &msg, &args.seq_args, &res.seq_res, 0);
L
Linus Torvalds 已提交
2951
	if (!status) {
2952
		nfs_access_set_mask(entry, res.access);
2953
		nfs_refresh_inode(inode, res.fattr);
L
Linus Torvalds 已提交
2954
	}
2955
	nfs_free_fattr(res.fattr);
L
Linus Torvalds 已提交
2956 2957 2958 2959 2960 2961 2962 2963 2964 2965 2966 2967 2968 2969 2970 2971 2972 2973 2974 2975 2976 2977 2978 2979 2980 2981 2982 2983 2984 2985 2986 2987
	return status;
}

static int nfs4_proc_access(struct inode *inode, struct nfs_access_entry *entry)
{
	struct nfs4_exception exception = { };
	int err;
	do {
		err = nfs4_handle_exception(NFS_SERVER(inode),
				_nfs4_proc_access(inode, entry),
				&exception);
	} while (exception.retry);
	return err;
}

/*
 * TODO: For the time being, we don't try to get any attributes
 * along with any of the zero-copy operations READ, READDIR,
 * READLINK, WRITE.
 *
 * In the case of the first three, we want to put the GETATTR
 * after the read-type operation -- this is because it is hard
 * to predict the length of a GETATTR response in v4, and thus
 * align the READ data correctly.  This means that the GETATTR
 * may end up partially falling into the page cache, and we should
 * shift it into the 'tail' of the xdr_buf before processing.
 * To do this efficiently, we need to know the total length
 * of data received, which doesn't seem to be available outside
 * of the RPC layer.
 *
 * In the case of WRITE, we also want to put the GETATTR after
 * the operation -- in this case because we want to make sure
 * we get the post-operation mtime and size.
 *
 * Both of these changes to the XDR layer would in fact be quite
 * minor, but I decided to leave them for a subsequent patch.
 */
static int _nfs4_proc_readlink(struct inode *inode, struct page *page,
		unsigned int pgbase, unsigned int pglen)
{
	struct nfs4_readlink args = {
		.fh       = NFS_FH(inode),
		.pgbase	  = pgbase,
		.pglen    = pglen,
		.pages    = &page,
	};
B
Benny Halevy 已提交
3002
	struct nfs4_readlink_res res;
L
Linus Torvalds 已提交
3003 3004 3005
	struct rpc_message msg = {
		.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_READLINK],
		.rpc_argp = &args,
B
Benny Halevy 已提交
3006
		.rpc_resp = &res,
L
Linus Torvalds 已提交
3007 3008
	};

3009
	return nfs4_call_sync(NFS_SERVER(inode)->client, NFS_SERVER(inode), &msg, &args.seq_args, &res.seq_res, 0);
L
Linus Torvalds 已提交
3010 3011 3012 3013 3014 3015 3016 3017 3018 3019 3020 3021 3022 3023 3024 3025
}

static int nfs4_proc_readlink(struct inode *inode, struct page *page,
		unsigned int pgbase, unsigned int pglen)
{
	struct nfs4_exception exception = { };
	int err;
	do {
		err = nfs4_handle_exception(NFS_SERVER(inode),
				_nfs4_proc_readlink(inode, page, pgbase, pglen),
				&exception);
	} while (exception.retry);
	return err;
}

/*
 * This is just for mknod.  open(O_CREAT) will always do ->open_context().
 */
static int
nfs4_proc_create(struct inode *dir, struct dentry *dentry, struct iattr *sattr,
3030
		 int flags)
L
Linus Torvalds 已提交
3031
{
3032
	struct nfs_open_context *ctx;
L
Linus Torvalds 已提交
3033 3034 3035
	struct nfs4_state *state;
	int status = 0;

3036 3037 3038 3039
	ctx = alloc_nfs_open_context(dentry, FMODE_READ);
	if (IS_ERR(ctx))
		return PTR_ERR(ctx);

A
Aneesh Kumar K.V 已提交
3040
	sattr->ia_mode &= ~current_umask();
3041 3042 3043
	state = nfs4_do_open(dir, dentry, ctx->mode,
			flags, sattr, ctx->cred,
			&ctx->mdsthreshold);
3044
	d_drop(dentry);
L
Linus Torvalds 已提交
3045 3046
	if (IS_ERR(state)) {
		status = PTR_ERR(state);
3047
		goto out;
L
Linus Torvalds 已提交
3048
	}
3049
	d_add(dentry, igrab(state->inode));
3050
	nfs_set_verifier(dentry, nfs_save_change_attribute(dir));
3051
	ctx->state = state;
L
Linus Torvalds 已提交
3052
out:
3053
	put_nfs_open_context(ctx);
L
Linus Torvalds 已提交
3054 3055 3056 3057 3058
	return status;
}

static int _nfs4_proc_remove(struct inode *dir, struct qstr *name)
{
3059
	struct nfs_server *server = NFS_SERVER(dir);
3060
	struct nfs_removeargs args = {
L
Linus Torvalds 已提交
3061
		.fh = NFS_FH(dir),
3062
		.name = *name,
3063
	};
3064
	struct nfs_removeres res = {
3065
		.server = server,
L
Linus Torvalds 已提交
3066 3067
	};
	struct rpc_message msg = {
3068 3069 3070
		.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_REMOVE],
		.rpc_argp = &args,
		.rpc_resp = &res,
L
Linus Torvalds 已提交
3071
	};
3072
	int status;
L
Linus Torvalds 已提交
3073

3074
	status = nfs4_call_sync(server->client, server, &msg, &args.seq_args, &res.seq_res, 1);
3075
	if (status == 0)
3076
		update_changeattr(dir, &res.cinfo);
L
Linus Torvalds 已提交
3077 3078 3079 3080 3081 3082 3083 3084 3085 3086 3087 3088 3089 3090 3091
	return status;
}

static int nfs4_proc_remove(struct inode *dir, struct qstr *name)
{
	struct nfs4_exception exception = { };
	int err;
	do {
		err = nfs4_handle_exception(NFS_SERVER(dir),
				_nfs4_proc_remove(dir, name),
				&exception);
	} while (exception.retry);
	return err;
}

3092
static void nfs4_proc_unlink_setup(struct rpc_message *msg, struct inode *dir)
L
Linus Torvalds 已提交
3093
{
3094 3095 3096
	struct nfs_server *server = NFS_SERVER(dir);
	struct nfs_removeargs *args = msg->rpc_argp;
	struct nfs_removeres *res = msg->rpc_resp;
L
Linus Torvalds 已提交
3097

3098
	res->server = server;
L
Linus Torvalds 已提交
3099
	msg->rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_REMOVE];
3100
	nfs41_init_sequence(&args->seq_args, &res->seq_res, 1);
L
Linus Torvalds 已提交
3101 3102
}

3103 3104
static void nfs4_proc_unlink_rpc_prepare(struct rpc_task *task, struct nfs_unlinkdata *data)
{
3105 3106 3107 3108
	nfs4_setup_sequence(NFS_SERVER(data->dir),
			&data->args.seq_args,
			&data->res.seq_res,
			task);
L
Linus Torvalds 已提交
3109 3110
}

3111
static int nfs4_proc_unlink_done(struct rpc_task *task, struct inode *dir)
L
Linus Torvalds 已提交
3112
{
3113 3114
	struct nfs_removeres *res = task->tk_msg.rpc_resp;

3115 3116
	if (!nfs4_sequence_done(task, &res->seq_res))
		return 0;
3117
	if (nfs4_async_handle_error(task, res->server, NULL) == -EAGAIN)
3118 3119 3120
		return 0;
	update_changeattr(dir, &res->cinfo);
	return 1;
L
Linus Torvalds 已提交
3121 3122
}

3123 3124 3125 3126 3127 3128 3129 3130
static void nfs4_proc_rename_setup(struct rpc_message *msg, struct inode *dir)
{
	struct nfs_server *server = NFS_SERVER(dir);
	struct nfs_renameargs *arg = msg->rpc_argp;
	struct nfs_renameres *res = msg->rpc_resp;

	msg->rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_RENAME];
	res->server = server;
3131
	nfs41_init_sequence(&arg->seq_args, &res->seq_res, 1);
3132 3133
}

3134 3135
static void nfs4_proc_rename_rpc_prepare(struct rpc_task *task, struct nfs_renamedata *data)
{
3136 3137 3138 3139
	nfs4_setup_sequence(NFS_SERVER(data->old_dir),
			&data->args.seq_args,
			&data->res.seq_res,
			task);
3140 3141 3142 3143 3144 3145 3146 3147 3148 3149 3150 3151 3152 3153 3154 3155 3156
}

/*
 * Completion handler for an asynchronous RENAME.
 *
 * Returns 0 when nfs4_sequence_done() reports the task is not finished
 * or when nfs4_async_handle_error() returns -EAGAIN.  Otherwise applies
 * the returned change information to both directories and returns 1.
 */
static int nfs4_proc_rename_done(struct rpc_task *task, struct inode *old_dir,
				 struct inode *new_dir)
{
	struct nfs_renameres *result = task->tk_msg.rpc_resp;

	/* The error handler is consulted only once the sequence is done */
	if (!nfs4_sequence_done(task, &result->seq_res) ||
	    nfs4_async_handle_error(task, result->server, NULL) == -EAGAIN)
		return 0;

	update_changeattr(old_dir, &result->old_cinfo);
	update_changeattr(new_dir, &result->new_cinfo);
	return 1;
}

L
Linus Torvalds 已提交
3157 3158 3159
static int _nfs4_proc_rename(struct inode *old_dir, struct qstr *old_name,
		struct inode *new_dir, struct qstr *new_name)
{
3160
	struct nfs_server *server = NFS_SERVER(old_dir);
3161
	struct nfs_renameargs arg = {
L
Linus Torvalds 已提交
3162 3163 3164 3165
		.old_dir = NFS_FH(old_dir),
		.new_dir = NFS_FH(new_dir),
		.old_name = old_name,
		.new_name = new_name,
3166
	};
3167
	struct nfs_renameres res = {
3168
		.server = server,
L
Linus Torvalds 已提交
3169 3170 3171 3172 3173 3174
	};
	struct rpc_message msg = {
		.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_RENAME],
		.rpc_argp = &arg,
		.rpc_resp = &res,
	};
3175
	int status = -ENOMEM;
L
Linus Torvalds 已提交
3176
	
3177
	status = nfs4_call_sync(server->client, server, &msg, &arg.seq_args, &res.seq_res, 1);
L
Linus Torvalds 已提交
3178 3179 3180 3181 3182 3183 3184 3185 3186 3187 3188 3189 3190 3191 3192 3193 3194 3195 3196 3197 3198 3199 3200
	if (!status) {
		update_changeattr(old_dir, &res.old_cinfo);
		update_changeattr(new_dir, &res.new_cinfo);
	}
	return status;
}

static int nfs4_proc_rename(struct inode *old_dir, struct qstr *old_name,
		struct inode *new_dir, struct qstr *new_name)
{
	struct nfs4_exception exception = { };
	int err;
	do {
		err = nfs4_handle_exception(NFS_SERVER(old_dir),
				_nfs4_proc_rename(old_dir, old_name,
					new_dir, new_name),
				&exception);
	} while (exception.retry);
	return err;
}

static int _nfs4_proc_link(struct inode *inode, struct inode *dir, struct qstr *name)
{
3201
	struct nfs_server *server = NFS_SERVER(inode);
L
Linus Torvalds 已提交
3202 3203 3204 3205
	struct nfs4_link_arg arg = {
		.fh     = NFS_FH(inode),
		.dir_fh = NFS_FH(dir),
		.name   = name,
3206 3207 3208 3209
		.bitmask = server->attr_bitmask,
	};
	struct nfs4_link_res res = {
		.server = server,
L
Linus Torvalds 已提交
3210 3211 3212 3213
	};
	struct rpc_message msg = {
		.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_LINK],
		.rpc_argp = &arg,
3214
		.rpc_resp = &res,
L
Linus Torvalds 已提交
3215
	};
3216 3217 3218
	int status = -ENOMEM;

	res.fattr = nfs_alloc_fattr();
3219
	if (res.fattr == NULL)
3220
		goto out;
L
Linus Torvalds 已提交
3221

3222
	status = nfs4_call_sync(server->client, server, &msg, &arg.seq_args, &res.seq_res, 1);
3223 3224
	if (!status) {
		update_changeattr(dir, &res.cinfo);
3225
		nfs_post_op_update_inode(inode, res.fattr);
3226
	}
3227 3228
out:
	nfs_free_fattr(res.fattr);
L
Linus Torvalds 已提交
3229 3230 3231 3232 3233 3234 3235 3236 3237 3238 3239 3240 3241 3242 3243
	return status;
}

static int nfs4_proc_link(struct inode *inode, struct inode *dir, struct qstr *name)
{
	struct nfs4_exception exception = { };
	int err;
	do {
		err = nfs4_handle_exception(NFS_SERVER(inode),
				_nfs4_proc_link(inode, dir, name),
				&exception);
	} while (exception.retry);
	return err;
}

3244 3245 3246 3247 3248 3249 3250 3251 3252 3253 3254 3255 3256 3257 3258 3259 3260 3261 3262 3263 3264 3265 3266 3267 3268 3269 3270 3271 3272 3273 3274 3275 3276 3277 3278 3279
/*
 * Everything needed for one CREATE-style call, kept in a single
 * allocation: the RPC message, its argument and result structures, and
 * the file handle and attribute buffers the result points at.
 */
struct nfs4_createdata {
	struct rpc_message msg;		/* rpc_argp/rpc_resp point at arg/res below */
	struct nfs4_create_arg arg;
	struct nfs4_create_res res;	/* res.fh/res.fattr point at fh/fattr below */
	struct nfs_fh fh;
	struct nfs_fattr fattr;
};

/*
 * Allocate a zeroed nfs4_createdata and wire it up for an
 * NFSPROC4_CLNT_CREATE call of type @ftype for @name in @dir with the
 * attributes in @sattr.  The embedded attribute buffer is initialised.
 *
 * Returns the new structure, or NULL if the allocation fails.
 */
static struct nfs4_createdata *nfs4_alloc_createdata(struct inode *dir,
		struct qstr *name, struct iattr *sattr, u32 ftype)
{
	struct nfs4_createdata *cd;
	struct nfs_server *server;

	cd = kzalloc(sizeof(*cd), GFP_KERNEL);
	if (cd == NULL)
		return NULL;

	server = NFS_SERVER(dir);

	/* RPC message */
	cd->msg.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_CREATE];
	cd->msg.rpc_argp = &cd->arg;
	cd->msg.rpc_resp = &cd->res;

	/* Request arguments */
	cd->arg.dir_fh = NFS_FH(dir);
	cd->arg.server = server;
	cd->arg.name = name;
	cd->arg.attrs = sattr;
	cd->arg.ftype = ftype;
	cd->arg.bitmask = server->attr_bitmask;

	/* Result buffers live inside the same allocation */
	cd->res.server = server;
	cd->res.fh = &cd->fh;
	cd->res.fattr = &cd->fattr;
	nfs_fattr_init(cd->res.fattr);

	return cd;
}

static int nfs4_do_create(struct inode *dir, struct dentry *dentry, struct nfs4_createdata *data)
{
3280
	int status = nfs4_call_sync(NFS_SERVER(dir)->client, NFS_SERVER(dir), &data->msg,
3281
				    &data->arg.seq_args, &data->res.seq_res, 1);
3282 3283 3284 3285 3286 3287 3288 3289 3290 3291 3292 3293
	if (status == 0) {
		update_changeattr(dir, &data->res.dir_cinfo);
		status = nfs_instantiate(dentry, data->res.fh, data->res.fattr);
	}
	return status;
}

/* Release a structure obtained from nfs4_alloc_createdata(). */
static void nfs4_free_createdata(struct nfs4_createdata *data)
{
	kfree(data);
}

3294
static int _nfs4_proc_symlink(struct inode *dir, struct dentry *dentry,
3295
		struct page *page, unsigned int len, struct iattr *sattr)
L
Linus Torvalds 已提交
3296
{
3297 3298
	struct nfs4_createdata *data;
	int status = -ENAMETOOLONG;
L
Linus Torvalds 已提交
3299

3300
	if (len > NFS4_MAXPATHLEN)
3301
		goto out;
3302

3303 3304 3305 3306 3307 3308 3309 3310
	status = -ENOMEM;
	data = nfs4_alloc_createdata(dir, &dentry->d_name, sattr, NF4LNK);
	if (data == NULL)
		goto out;

	data->msg.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_SYMLINK];
	data->arg.u.symlink.pages = &page;
	data->arg.u.symlink.len = len;
L
Linus Torvalds 已提交
3311
	
3312 3313 3314 3315
	status = nfs4_do_create(dir, dentry, data);

	nfs4_free_createdata(data);
out:
L
Linus Torvalds 已提交
3316 3317 3318
	return status;
}

3319
static int nfs4_proc_symlink(struct inode *dir, struct dentry *dentry,
3320
		struct page *page, unsigned int len, struct iattr *sattr)
L
Linus Torvalds 已提交
3321 3322 3323 3324 3325
{
	struct nfs4_exception exception = { };
	int err;
	do {
		err = nfs4_handle_exception(NFS_SERVER(dir),
3326 3327
				_nfs4_proc_symlink(dir, dentry, page,
							len, sattr),
L
Linus Torvalds 已提交
3328 3329 3330 3331 3332 3333 3334 3335
				&exception);
	} while (exception.retry);
	return err;
}

static int _nfs4_proc_mkdir(struct inode *dir, struct dentry *dentry,
		struct iattr *sattr)
{
3336 3337
	struct nfs4_createdata *data;
	int status = -ENOMEM;
L
Linus Torvalds 已提交
3338

3339 3340 3341 3342 3343 3344 3345 3346
	data = nfs4_alloc_createdata(dir, &dentry->d_name, sattr, NF4DIR);
	if (data == NULL)
		goto out;

	status = nfs4_do_create(dir, dentry, data);

	nfs4_free_createdata(data);
out:
L
Linus Torvalds 已提交
3347 3348 3349 3350 3351 3352 3353 3354
	return status;
}

static int nfs4_proc_mkdir(struct inode *dir, struct dentry *dentry,
		struct iattr *sattr)
{
	struct nfs4_exception exception = { };
	int err;
A
Aneesh Kumar K.V 已提交
3355 3356

	sattr->ia_mode &= ~current_umask();
L
Linus Torvalds 已提交
3357 3358 3359 3360 3361 3362 3363 3364 3365
	do {
		err = nfs4_handle_exception(NFS_SERVER(dir),
				_nfs4_proc_mkdir(dir, dentry, sattr),
				&exception);
	} while (exception.retry);
	return err;
}

static int _nfs4_proc_readdir(struct dentry *dentry, struct rpc_cred *cred,
B
Bryan Schumaker 已提交
3366
		u64 cookie, struct page **pages, unsigned int count, int plus)
L
Linus Torvalds 已提交
3367 3368 3369 3370
{
	struct inode		*dir = dentry->d_inode;
	struct nfs4_readdir_arg args = {
		.fh = NFS_FH(dir),
B
Bryan Schumaker 已提交
3371
		.pages = pages,
L
Linus Torvalds 已提交
3372 3373
		.pgbase = 0,
		.count = count,
3374
		.bitmask = NFS_SERVER(dentry->d_inode)->attr_bitmask,
B
Bryan Schumaker 已提交
3375
		.plus = plus,
L
Linus Torvalds 已提交
3376 3377 3378 3379 3380 3381 3382 3383 3384 3385
	};
	struct nfs4_readdir_res res;
	struct rpc_message msg = {
		.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_READDIR],
		.rpc_argp = &args,
		.rpc_resp = &res,
		.rpc_cred = cred,
	};
	int			status;

3386
	dprintk("%s: dentry = %s/%s, cookie = %Lu\n", __func__,
3387 3388 3389
			dentry->d_parent->d_name.name,
			dentry->d_name.name,
			(unsigned long long)cookie);
3390
	nfs4_setup_readdir(cookie, NFS_I(dir)->cookieverf, dentry, &args);
L
Linus Torvalds 已提交
3391
	res.pgbase = args.pgbase;
3392
	status = nfs4_call_sync(NFS_SERVER(dir)->client, NFS_SERVER(dir), &msg, &args.seq_args, &res.seq_res, 0);
3393
	if (status >= 0) {
3394
		memcpy(NFS_I(dir)->cookieverf, res.verifier.data, NFS4_VERIFIER_SIZE);
3395 3396
		status += args.pgbase;
	}
3397 3398 3399

	nfs_invalidate_atime(dir);

3400
	dprintk("%s: returns %d\n", __func__, status);
L
Linus Torvalds 已提交
3401 3402 3403 3404
	return status;
}

static int nfs4_proc_readdir(struct dentry *dentry, struct rpc_cred *cred,
B
Bryan Schumaker 已提交
3405
		u64 cookie, struct page **pages, unsigned int count, int plus)
L
Linus Torvalds 已提交
3406 3407 3408 3409 3410 3411
{
	struct nfs4_exception exception = { };
	int err;
	do {
		err = nfs4_handle_exception(NFS_SERVER(dentry->d_inode),
				_nfs4_proc_readdir(dentry, cred, cookie,
B
Bryan Schumaker 已提交
3412
					pages, count, plus),
L
Linus Torvalds 已提交
3413 3414 3415 3416 3417 3418 3419 3420
				&exception);
	} while (exception.retry);
	return err;
}

/*
 * Create the special file @dentry in @dir.
 *
 * The NFSv4 file type is chosen from @sattr->ia_mode: FIFO, block
 * device, character device or socket.  For block and character devices
 * the major/minor numbers of @rdev are sent as specdata1/specdata2.
 *
 * Returns -ENOMEM if the request data cannot be allocated, -EINVAL if
 * the mode is none of the four supported types, otherwise the status of
 * nfs4_do_create().
 */
static int _nfs4_proc_mknod(struct inode *dir, struct dentry *dentry,
		struct iattr *sattr, dev_t rdev)
{
	struct nfs4_createdata *data;
	int mode = sattr->ia_mode;
	int status = -ENOMEM;

	/* Start out as a socket; the type is corrected below if needed */
	data = nfs4_alloc_createdata(dir, &dentry->d_name, sattr, NF4SOCK);
	if (data == NULL)
		goto out;

	if (S_ISFIFO(mode))
		data->arg.ftype = NF4FIFO;
	else if (S_ISBLK(mode)) {
		data->arg.ftype = NF4BLK;
		data->arg.u.device.specdata1 = MAJOR(rdev);
		data->arg.u.device.specdata2 = MINOR(rdev);
	}
	else if (S_ISCHR(mode)) {
		data->arg.ftype = NF4CHR;
		data->arg.u.device.specdata1 = MAJOR(rdev);
		data->arg.u.device.specdata2 = MINOR(rdev);
	} else if (!S_ISSOCK(mode)) {
		status = -EINVAL;
		goto out_free;
	}

	status = nfs4_do_create(dir, dentry, data);
out_free:
	nfs4_free_createdata(data);
out:
	return status;
}

/*
 * Mask @sattr->ia_mode with the current umask (in place), then run
 * _nfs4_proc_mknod() and feed its result to nfs4_handle_exception(),
 * repeating for as long as the handler asks for a retry.  Returns the
 * value of the last nfs4_handle_exception() call.
 */
static int nfs4_proc_mknod(struct inode *dir, struct dentry *dentry,
		struct iattr *sattr, dev_t rdev)
{
	struct nfs4_exception exception = { };
	int err;

	sattr->ia_mode &= ~current_umask();
	do {
		err = nfs4_handle_exception(NFS_SERVER(dir),
				_nfs4_proc_mknod(dir, dentry, sattr, rdev),
				&exception);
	} while (exception.retry);
	return err;
}

static int _nfs4_proc_statfs(struct nfs_server *server, struct nfs_fh *fhandle,
		 struct nfs_fsstat *fsstat)
{
	struct nfs4_statfs_arg args = {
		.fh = fhandle,
		.bitmask = server->attr_bitmask,
	};
B
Benny Halevy 已提交
3474 3475 3476
	struct nfs4_statfs_res res = {
		.fsstat = fsstat,
	};
L
Linus Torvalds 已提交
3477 3478 3479
	struct rpc_message msg = {
		.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_STATFS],
		.rpc_argp = &args,
B
Benny Halevy 已提交
3480
		.rpc_resp = &res,
L
Linus Torvalds 已提交
3481 3482
	};

3483
	nfs_fattr_init(fsstat->fattr);
3484
	return  nfs4_call_sync(server->client, server, &msg, &args.seq_args, &res.seq_res, 0);
L
Linus Torvalds 已提交
3485 3486 3487 3488 3489 3490 3491 3492 3493 3494 3495 3496 3497 3498 3499 3500 3501 3502 3503 3504 3505
}

static int nfs4_proc_statfs(struct nfs_server *server, struct nfs_fh *fhandle, struct nfs_fsstat *fsstat)
{
	struct nfs4_exception exception = { };
	int err;
	do {
		err = nfs4_handle_exception(server,
				_nfs4_proc_statfs(server, fhandle, fsstat),
				&exception);
	} while (exception.retry);
	return err;
}

static int _nfs4_do_fsinfo(struct nfs_server *server, struct nfs_fh *fhandle,
		struct nfs_fsinfo *fsinfo)
{
	struct nfs4_fsinfo_arg args = {
		.fh = fhandle,
		.bitmask = server->attr_bitmask,
	};
B
Benny Halevy 已提交
3506 3507 3508
	struct nfs4_fsinfo_res res = {
		.fsinfo = fsinfo,
	};
L
Linus Torvalds 已提交
3509 3510 3511
	struct rpc_message msg = {
		.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_FSINFO],
		.rpc_argp = &args,
B
Benny Halevy 已提交
3512
		.rpc_resp = &res,
L
Linus Torvalds 已提交
3513 3514
	};

3515
	return nfs4_call_sync(server->client, server, &msg, &args.seq_args, &res.seq_res, 0);
L
Linus Torvalds 已提交
3516 3517 3518 3519 3520
}

static int nfs4_do_fsinfo(struct nfs_server *server, struct nfs_fh *fhandle, struct nfs_fsinfo *fsinfo)
{
	struct nfs4_exception exception = { };
3521
	unsigned long now = jiffies;
L
Linus Torvalds 已提交
3522 3523 3524
	int err;

	do {
3525 3526 3527 3528 3529 3530 3531 3532 3533 3534 3535
		err = _nfs4_do_fsinfo(server, fhandle, fsinfo);
		if (err == 0) {
			struct nfs_client *clp = server->nfs_client;

			spin_lock(&clp->cl_lock);
			clp->cl_lease_time = fsinfo->lease_time * HZ;
			clp->cl_last_renewal = now;
			spin_unlock(&clp->cl_lock);
			break;
		}
		err = nfs4_handle_exception(server, err, &exception);
L
Linus Torvalds 已提交
3536 3537 3538 3539 3540 3541
	} while (exception.retry);
	return err;
}

static int nfs4_proc_fsinfo(struct nfs_server *server, struct nfs_fh *fhandle, struct nfs_fsinfo *fsinfo)
{
3542 3543
	int error;

3544
	nfs_fattr_init(fsinfo->fattr);
3545
	error = nfs4_do_fsinfo(server, fhandle, fsinfo);
3546 3547 3548
	if (error == 0) {
		/* block layout checks this! */
		server->pnfs_blksize = fsinfo->blksize;
3549
		set_pnfs_layoutdriver(server, fhandle, fsinfo->layouttype);
3550
	}
3551 3552

	return error;
L
Linus Torvalds 已提交
3553 3554 3555 3556 3557 3558 3559 3560 3561
}

static int _nfs4_proc_pathconf(struct nfs_server *server, struct nfs_fh *fhandle,
		struct nfs_pathconf *pathconf)
{
	struct nfs4_pathconf_arg args = {
		.fh = fhandle,
		.bitmask = server->attr_bitmask,
	};
B
Benny Halevy 已提交
3562 3563 3564
	struct nfs4_pathconf_res res = {
		.pathconf = pathconf,
	};
L
Linus Torvalds 已提交
3565 3566 3567
	struct rpc_message msg = {
		.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_PATHCONF],
		.rpc_argp = &args,
B
Benny Halevy 已提交
3568
		.rpc_resp = &res,
L
Linus Torvalds 已提交
3569 3570 3571 3572 3573 3574 3575 3576
	};

	/* None of the pathconf attributes are mandatory to implement */
	if ((args.bitmask[0] & nfs4_pathconf_bitmap[0]) == 0) {
		memset(pathconf, 0, sizeof(*pathconf));
		return 0;
	}

3577
	nfs_fattr_init(pathconf->fattr);
3578
	return nfs4_call_sync(server->client, server, &msg, &args.seq_args, &res.seq_res, 0);
L
Linus Torvalds 已提交
3579 3580 3581 3582 3583 3584 3585 3586 3587 3588 3589 3590 3591 3592 3593 3594
}

static int nfs4_proc_pathconf(struct nfs_server *server, struct nfs_fh *fhandle,
		struct nfs_pathconf *pathconf)
{
	struct nfs4_exception exception = { };
	int err;

	do {
		err = nfs4_handle_exception(server,
				_nfs4_proc_pathconf(server, fhandle, pathconf),
				&exception);
	} while (exception.retry);
	return err;
}

3595
/*
 * Fill @stateid with the stateid to use for I/O of mode @fmode on the
 * open context @ctx.
 *
 * If @l_ctx is non-NULL its lock owner is passed along; otherwise a NULL
 * lock owner is used.  Returns the result of nfs4_select_rw_stateid().
 */
int nfs4_set_rw_stateid(nfs4_stateid *stateid,
		const struct nfs_open_context *ctx,
		const struct nfs_lock_context *l_ctx,
		fmode_t fmode)
{
	const struct nfs_lockowner *lockowner = NULL;

	if (l_ctx != NULL)
		lockowner = &l_ctx->lockowner;
	return nfs4_select_rw_stateid(stateid, ctx->state, fmode, lockowner);
}
EXPORT_SYMBOL_GPL(nfs4_set_rw_stateid);

3608 3609 3610 3611 3612 3613 3614 3615 3616 3617 3618 3619 3620 3621 3622 3623 3624 3625 3626 3627 3628 3629 3630 3631 3632 3633 3634
/*
 * Report whether @stateid matches the stateid that
 * nfs4_set_rw_stateid() selects right now for @ctx, @l_ctx and @fmode.
 * Returns false if that selection itself returns non-zero.
 */
static bool nfs4_stateid_is_current(nfs4_stateid *stateid,
		const struct nfs_open_context *ctx,
		const struct nfs_lock_context *l_ctx,
		fmode_t fmode)
{
	nfs4_stateid latest;
	int err;

	err = nfs4_set_rw_stateid(&latest, ctx, l_ctx, fmode);
	if (err != 0)
		return false;

	return nfs4_stateid_match(stateid, &latest);
}

/*
 * Return true if @err is one of the listed stateid-related NFSv4 errors,
 * false for any other value.
 */
static bool nfs4_error_stateid_expired(int err)
{
	bool expired;

	switch (err) {
	case -NFS4ERR_DELEG_REVOKED:
	case -NFS4ERR_ADMIN_REVOKED:
	case -NFS4ERR_BAD_STATEID:
	case -NFS4ERR_STALE_STATEID:
	case -NFS4ERR_OLD_STATEID:
	case -NFS4ERR_OPENMODE:
	case -NFS4ERR_EXPIRED:
		expired = true;
		break;
	default:
		expired = false;
		break;
	}

	return expired;
}

3635 3636
void __nfs4_read_done_cb(struct nfs_read_data *data)
{
3637
	nfs_invalidate_atime(data->header->inode);
3638 3639
}

3640
static int nfs4_read_done_cb(struct rpc_task *task, struct nfs_read_data *data)
L
Linus Torvalds 已提交
3641
{
3642
	struct nfs_server *server = NFS_SERVER(data->header->inode);
L
Linus Torvalds 已提交
3643

3644
	if (nfs4_async_handle_error(task, server, data->args.context->state) == -EAGAIN) {
3645
		rpc_restart_call_prepare(task);
T
Trond Myklebust 已提交
3646
		return -EAGAIN;
L
Linus Torvalds 已提交
3647
	}
3648

3649
	__nfs4_read_done_cb(data);
L
Linus Torvalds 已提交
3650
	if (task->tk_status > 0)
T
Trond Myklebust 已提交
3651 3652
		renew_lease(server, data->timestamp);
	return 0;
L
Linus Torvalds 已提交
3653 3654
}

3655 3656 3657 3658 3659 3660 3661 3662 3663 3664 3665 3666 3667 3668
/*
 * Decide whether a failed READ should be restarted because the stateid
 * it used is no longer the current one.
 *
 * Returns false when the task status is not a stateid-expiry error, or
 * when the stateid in @args still matches the current one.  Otherwise
 * restarts the call and returns true.
 */
static bool nfs4_read_stateid_changed(struct rpc_task *task,
		struct nfs_readargs *args)
{
	if (!nfs4_error_stateid_expired(task->tk_status))
		return false;

	if (nfs4_stateid_is_current(&args->stateid, args->context,
				    args->lock_context, FMODE_READ))
		return false;

	rpc_restart_call_prepare(task);
	return true;
}

3669 3670 3671 3672 3673 3674 3675
/*
 * Completion entry point for a READ.
 *
 * Returns -EAGAIN when nfs4_sequence_done() reports the task is not
 * finished, or when the call was restarted because its stateid changed.
 * Otherwise dispatches to data->read_done_cb if one is set, or to
 * nfs4_read_done_cb() if not, and returns that callback's result.
 */
static int nfs4_read_done(struct rpc_task *task, struct nfs_read_data *data)
{

	dprintk("--> %s\n", __func__);

	if (!nfs4_sequence_done(task, &data->res.seq_res))
		return -EAGAIN;
	if (nfs4_read_stateid_changed(task, &data->args))
		return -EAGAIN;
	return data->read_done_cb ? data->read_done_cb(task, data) :
				    nfs4_read_done_cb(task, data);
}

3682
static void nfs4_proc_read_setup(struct nfs_read_data *data, struct rpc_message *msg)
L
Linus Torvalds 已提交
3683 3684
{
	data->timestamp   = jiffies;
3685
	data->read_done_cb = nfs4_read_done_cb;
3686
	msg->rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_READ];
3687
	nfs41_init_sequence(&data->args.seq_args, &data->res.seq_res, 0);
L
Linus Torvalds 已提交
3688 3689
}

3690 3691
/*
 * RPC prepare step for a READ.  The stateid is selected only when
 * nfs4_setup_sequence() returns 0; on a non-zero return nothing more is
 * done here.  The result of nfs4_set_rw_stateid() is not examined.
 */
static void nfs4_proc_read_rpc_prepare(struct rpc_task *task, struct nfs_read_data *data)
{
	if (nfs4_setup_sequence(NFS_SERVER(data->header->inode),
			&data->args.seq_args,
			&data->res.seq_res,
			task))
		return;
	nfs4_set_rw_stateid(&data->args.stateid, data->args.context,
			data->args.lock_context, FMODE_READ);
}

3701
static int nfs4_write_done_cb(struct rpc_task *task, struct nfs_write_data *data)
L
Linus Torvalds 已提交
3702
{
3703
	struct inode *inode = data->header->inode;
L
Linus Torvalds 已提交
3704
	
3705
	if (nfs4_async_handle_error(task, NFS_SERVER(inode), data->args.context->state) == -EAGAIN) {
3706
		rpc_restart_call_prepare(task);
3707
		return -EAGAIN;
L
Linus Torvalds 已提交
3708
	}
3709
	if (task->tk_status >= 0) {
L
Linus Torvalds 已提交
3710
		renew_lease(NFS_SERVER(inode), data->timestamp);
3711
		nfs_post_op_update_inode_force_wcc(inode, &data->fattr);
3712
	}
3713
	return 0;
L
Linus Torvalds 已提交
3714 3715
}

3716 3717 3718 3719 3720 3721 3722 3723 3724 3725 3726 3727 3728 3729
/*
 * Decide whether a failed WRITE should be restarted because the stateid
 * it used is no longer the current one.
 *
 * Returns false when the task status is not a stateid-expiry error, or
 * when the stateid in @args still matches the current one.  Otherwise
 * restarts the call and returns true.
 */
static bool nfs4_write_stateid_changed(struct rpc_task *task,
		struct nfs_writeargs *args)
{
	if (!nfs4_error_stateid_expired(task->tk_status))
		return false;

	if (nfs4_stateid_is_current(&args->stateid, args->context,
				    args->lock_context, FMODE_WRITE))
		return false;

	rpc_restart_call_prepare(task);
	return true;
}

3730 3731 3732 3733
/*
 * Completion entry point for a WRITE.
 *
 * Returns -EAGAIN when nfs4_sequence_done() reports the task is not
 * finished, or when the call was restarted because its stateid changed.
 * Otherwise dispatches to data->write_done_cb if one is set, or to
 * nfs4_write_done_cb() if not, and returns that callback's result.
 */
static int nfs4_write_done(struct rpc_task *task, struct nfs_write_data *data)
{
	if (!nfs4_sequence_done(task, &data->res.seq_res))
		return -EAGAIN;
	if (nfs4_write_stateid_changed(task, &data->args))
		return -EAGAIN;
	return data->write_done_cb ? data->write_done_cb(task, data) :
		nfs4_write_done_cb(task, data);
}

3740 3741
static
bool nfs4_write_need_cache_consistency_data(const struct nfs_write_data *data)
3742
{
3743 3744 3745 3746 3747 3748 3749 3750
	const struct nfs_pgio_header *hdr = data->header;

	/* Don't request attributes for pNFS or O_DIRECT writes */
	if (data->ds_clp != NULL || hdr->dreq != NULL)
		return false;
	/* Otherwise, request attributes if and only if we don't hold
	 * a delegation
	 */
3751
	return nfs4_have_delegation(hdr->inode, FMODE_READ) == 0;
3752 3753
}

3754
static void nfs4_proc_write_setup(struct nfs_write_data *data, struct rpc_message *msg)
L
Linus Torvalds 已提交
3755
{
3756
	struct nfs_server *server = NFS_SERVER(data->header->inode);
3757

3758
	if (!nfs4_write_need_cache_consistency_data(data)) {
3759 3760 3761 3762
		data->args.bitmask = NULL;
		data->res.fattr = NULL;
	} else
		data->args.bitmask = server->cache_consistency_bitmask;
3763

3764 3765
	if (!data->write_done_cb)
		data->write_done_cb = nfs4_write_done_cb;
3766
	data->res.server = server;
L
Linus Torvalds 已提交
3767 3768
	data->timestamp   = jiffies;

3769
	msg->rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_WRITE];
3770
	nfs41_init_sequence(&data->args.seq_args, &data->res.seq_res, 1);
L
Linus Torvalds 已提交
3771 3772
}

3773 3774
/*
 * rpc "prepare" step for WRITE: set up the sequence and, only if
 * nfs4_setup_sequence() returns zero, select the stateid to send for
 * FMODE_WRITE.
 */
static void nfs4_proc_write_rpc_prepare(struct rpc_task *task, struct nfs_write_data *data)
{
	if (nfs4_setup_sequence(NFS_SERVER(data->header->inode),
			&data->args.seq_args,
			&data->res.seq_res,
			task))
		return;
	nfs4_set_rw_stateid(&data->args.stateid, data->args.context,
			data->args.lock_context, FMODE_WRITE);
}

3784
static void nfs4_proc_commit_rpc_prepare(struct rpc_task *task, struct nfs_commit_data *data)
3785
{
3786 3787 3788 3789
	nfs4_setup_sequence(NFS_SERVER(data->inode),
			&data->args.seq_args,
			&data->res.seq_res,
			task);
L
Linus Torvalds 已提交
3790 3791
}

3792
static int nfs4_commit_done_cb(struct rpc_task *task, struct nfs_commit_data *data)
L
Linus Torvalds 已提交
3793 3794
{
	struct inode *inode = data->inode;
3795

3796
	if (nfs4_async_handle_error(task, NFS_SERVER(inode), NULL) == -EAGAIN) {
3797
		rpc_restart_call_prepare(task);
3798
		return -EAGAIN;
L
Linus Torvalds 已提交
3799
	}
3800
	return 0;
L
Linus Torvalds 已提交
3801 3802
}

3803
static int nfs4_commit_done(struct rpc_task *task, struct nfs_commit_data *data)
3804 3805 3806
{
	if (!nfs4_sequence_done(task, &data->res.seq_res))
		return -EAGAIN;
3807
	return data->commit_done_cb(task, data);
3808 3809
}

3810
static void nfs4_proc_commit_setup(struct nfs_commit_data *data, struct rpc_message *msg)
L
Linus Torvalds 已提交
3811
{
3812
	struct nfs_server *server = NFS_SERVER(data->inode);
3813

3814 3815
	if (data->commit_done_cb == NULL)
		data->commit_done_cb = nfs4_commit_done_cb;
3816
	data->res.server = server;
3817
	msg->rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_COMMIT];
3818
	nfs41_init_sequence(&data->args.seq_args, &data->res.seq_res, 1);
L
Linus Torvalds 已提交
3819 3820
}

3821 3822 3823 3824 3825
/* Per-call state handed to the asynchronous RENEW callbacks. */
struct nfs4_renewdata {
	struct nfs_client	*client;	/* client being renewed; put in nfs4_renew_release() */
	unsigned long		timestamp;	/* jiffies when the RENEW was queued */
};

L
Linus Torvalds 已提交
3826 3827 3828 3829
/*
 * nfs4_proc_async_renew(): This is not one of the nfs_rpc_ops; it is a special
 * standalone procedure for queueing an asynchronous RENEW.
 */
3830
static void nfs4_renew_release(void *calldata)
3831
{
3832 3833
	struct nfs4_renewdata *data = calldata;
	struct nfs_client *clp = data->client;
3834

3835 3836 3837
	if (atomic_read(&clp->cl_count) > 1)
		nfs4_schedule_state_renewal(clp);
	nfs_put_client(clp);
3838
	kfree(data);
3839 3840
}

3841
static void nfs4_renew_done(struct rpc_task *task, void *calldata)
L
Linus Torvalds 已提交
3842
{
3843 3844 3845
	struct nfs4_renewdata *data = calldata;
	struct nfs_client *clp = data->client;
	unsigned long timestamp = data->timestamp;
L
Linus Torvalds 已提交
3846 3847

	if (task->tk_status < 0) {
3848
		/* Unless we're shutting down, schedule state recovery! */
3849 3850 3851
		if (test_bit(NFS_CS_RENEWD, &clp->cl_res_state) == 0)
			return;
		if (task->tk_status != NFS4ERR_CB_PATH_DOWN) {
3852
			nfs4_schedule_lease_recovery(clp);
3853 3854 3855
			return;
		}
		nfs4_schedule_path_down_recovery(clp);
L
Linus Torvalds 已提交
3856
	}
3857
	do_renew_lease(clp, timestamp);
L
Linus Torvalds 已提交
3858 3859
}

3860 3861
static const struct rpc_call_ops nfs4_renew_ops = {
	.rpc_call_done = nfs4_renew_done,
3862
	.rpc_release = nfs4_renew_release,
3863 3864
};

3865
static int nfs4_proc_async_renew(struct nfs_client *clp, struct rpc_cred *cred, unsigned renew_flags)
L
Linus Torvalds 已提交
3866 3867 3868 3869
{
	struct rpc_message msg = {
		.rpc_proc	= &nfs4_procedures[NFSPROC4_CLNT_RENEW],
		.rpc_argp	= clp,
3870
		.rpc_cred	= cred,
L
Linus Torvalds 已提交
3871
	};
3872
	struct nfs4_renewdata *data;
L
Linus Torvalds 已提交
3873

3874 3875
	if (renew_flags == 0)
		return 0;
3876 3877
	if (!atomic_inc_not_zero(&clp->cl_count))
		return -EIO;
3878
	data = kmalloc(sizeof(*data), GFP_NOFS);
3879 3880 3881 3882
	if (data == NULL)
		return -ENOMEM;
	data->client = clp;
	data->timestamp = jiffies;
3883
	return rpc_call_async(clp->cl_rpcclient, &msg, RPC_TASK_TIMEOUT,
3884
			&nfs4_renew_ops, data);
L
Linus Torvalds 已提交
3885 3886
}

3887
static int nfs4_proc_renew(struct nfs_client *clp, struct rpc_cred *cred)
L
Linus Torvalds 已提交
3888 3889 3890 3891
{
	struct rpc_message msg = {
		.rpc_proc	= &nfs4_procedures[NFSPROC4_CLNT_RENEW],
		.rpc_argp	= clp,
3892
		.rpc_cred	= cred,
L
Linus Torvalds 已提交
3893 3894 3895 3896
	};
	unsigned long now = jiffies;
	int status;

3897
	status = rpc_call_sync(clp->cl_rpcclient, &msg, RPC_TASK_TIMEOUT);
L
Linus Torvalds 已提交
3898 3899
	if (status < 0)
		return status;
3900
	do_renew_lease(clp, now);
L
Linus Torvalds 已提交
3901 3902 3903
	return 0;
}

3904 3905 3906 3907 3908 3909 3910
/*
 * Returns 1 when @server advertises NFS_CAP_ACLS and its acl_bitmask has
 * both the ALLOW and the DENY support bits set, 0 otherwise.
 */
static inline int nfs4_server_supports_acls(struct nfs_server *server)
{
	if (!(server->caps & NFS_CAP_ACLS))
		return 0;
	if (!(server->acl_bitmask & ACL4_SUPPORT_ALLOW_ACL))
		return 0;
	return (server->acl_bitmask & ACL4_SUPPORT_DENY_ACL) != 0;
}

3911 3912
/* Assuming that XATTR_SIZE_MAX is a multiple of PAGE_SIZE, and that
 * it's OK to put sizeof(void *) * (XATTR_SIZE_MAX/PAGE_SIZE) bytes on
 * the stack.
 */
3915
#define NFS4ACL_MAXPAGES DIV_ROUND_UP(XATTR_SIZE_MAX, PAGE_SIZE)
3916

3917 3918 3919 3920 3921 3922 3923 3924 3925
/*
 * Copy @buflen bytes from @buf into freshly allocated pages, storing the
 * page pointers in @pages.
 *
 * Returns the number of pages allocated (at least one, even when @buflen
 * is 0, because the loop body runs before the length is tested), or -ENOMEM
 * after freeing every page allocated so far.  @pgbase is not written by
 * this function.
 */
static int buf_to_pages_noslab(const void *buf, size_t buflen,
		struct page **pages, unsigned int *pgbase)
{
	struct page *newpage, **spages;
	int rc = 0;
	size_t len;
	spages = pages;

	do {
		len = min_t(size_t, PAGE_SIZE, buflen);
		newpage = alloc_page(GFP_KERNEL);

		if (newpage == NULL)
			goto unwind;
		memcpy(page_address(newpage), buf, len);
		buf += len;
		buflen -= len;
		*pages++ = newpage;
		rc++;
	} while (buflen != 0);

	return rc;

unwind:
	/* Release the rc pages already stored, newest first */
	for(; rc > 0; rc--)
		__free_page(spages[rc-1]);
	return -ENOMEM;
}

3946 3947 3948
/* ACL cache entry hung off the NFS inode (nfs_inode->nfs4_acl). */
struct nfs4_cached_acl {
	int cached;	/* non-zero when data[] holds the ACL bytes, 0 when only len is known */
	size_t len;	/* length of the ACL in bytes */
	char data[];	/* ACL bytes; present only when cached != 0 */
};

static void nfs4_set_cached_acl(struct inode *inode, struct nfs4_cached_acl *acl)
{
	struct nfs_inode *nfsi = NFS_I(inode);

	spin_lock(&inode->i_lock);
	kfree(nfsi->nfs4_acl);
	nfsi->nfs4_acl = acl;
	spin_unlock(&inode->i_lock);
}

/* Drop the inode's cached ACL entry by installing NULL in its place. */
static void nfs4_zap_acl_attr(struct inode *inode)
{
	nfs4_set_cached_acl(inode, NULL);
}

/*
 * Serve an ACL read from the inode's cache entry, under inode->i_lock.
 *
 * Returns:
 *   -ENOENT  no cache entry, or an entry that holds only the length while
 *            the caller supplied a buffer;
 *   -ERANGE  the cached ACL does not fit in @buflen (see getxattr(2));
 *   length   when @buf is NULL (length query) or after copying the ACL
 *            into @buf.
 */
static inline ssize_t nfs4_read_cached_acl(struct inode *inode, char *buf, size_t buflen)
{
	struct nfs4_cached_acl *entry;
	int ret;

	spin_lock(&inode->i_lock);
	entry = NFS_I(inode)->nfs4_acl;
	if (entry == NULL) {
		ret = -ENOENT;
	} else if (buf == NULL) {
		/* user is just asking for length */
		ret = entry->len;
	} else if (entry->cached == 0) {
		ret = -ENOENT;
	} else if (entry->len > buflen) {
		/* see getxattr(2) man page */
		ret = -ERANGE;
	} else {
		memcpy(buf, entry->data, entry->len);
		ret = entry->len;
	}
	spin_unlock(&inode->i_lock);
	return ret;
}

3992
/*
 * Install a new ACL cache entry for @inode.
 *
 * When header plus @acl_len fits in a page, the ACL bytes are copied out of
 * @pages (starting at @pgbase) and cached; otherwise only the length is
 * recorded (cached == 0).  If allocation fails, acl is NULL at "out" and
 * the existing entry is simply cleared.
 */
static void nfs4_write_cached_acl(struct inode *inode, struct page **pages, size_t pgbase, size_t acl_len)
{
	struct nfs4_cached_acl *acl;
	size_t buflen = sizeof(*acl) + acl_len;

	if (buflen <= PAGE_SIZE) {
		acl = kmalloc(buflen, GFP_KERNEL);
		if (acl == NULL)
			goto out;
		acl->cached = 1;
		_copy_from_pages(acl->data, pages, pgbase, acl_len);
	} else {
		acl = kmalloc(sizeof(*acl), GFP_KERNEL);
		if (acl == NULL)
			goto out;
		acl->cached = 0;
	}
	acl->len = acl_len;
out:
	nfs4_set_cached_acl(inode, acl);
}

4014 4015 4016 4017 4018 4019 4020 4021 4022 4023
/*
 * The getxattr API returns the required buffer length when called with a
 * NULL buf. The NFSv4 acl tool then calls getxattr again after allocating
 * the required buf.  On a NULL buf, we send a page of data to the server
 * guessing that the ACL request can be serviced by a page. If so, we cache
 * up to the page of ACL data, and the 2nd call to getxattr is serviced by
 * the cache. If not so, we throw away the page, and cache the required
 * length. The next getxattr call will then produce another round trip to
 * the server, this time with the input buf of the required size.
 */
4024
/*
 * One GETACL round trip, bypassing the cache.
 *
 * Allocates enough pages for @buflen (at least one) plus a scratch page,
 * issues the call, caches the result and, when @buf is non-NULL, copies the
 * ACL into it.
 *
 * Returns the ACL length on success; -ERANGE when @buflen needs more than
 * NFS4ACL_MAXPAGES pages, when the reply was truncated and a buffer was
 * supplied, or when the ACL is longer than @buflen; -ENOMEM on page
 * allocation failure; or the status of nfs4_call_sync().
 */
static ssize_t __nfs4_get_acl_uncached(struct inode *inode, void *buf, size_t buflen)
{
	struct page *pages[NFS4ACL_MAXPAGES] = {NULL, };
	struct nfs_getaclargs args = {
		.fh = NFS_FH(inode),
		.acl_pages = pages,
		.acl_len = buflen,
	};
	struct nfs_getaclres res = {
		.acl_len = buflen,
	};
	struct rpc_message msg = {
		.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_GETACL],
		.rpc_argp = &args,
		.rpc_resp = &res,
	};
	unsigned int npages = DIV_ROUND_UP(buflen, PAGE_SIZE);
	int ret = -ENOMEM, i;

	/* As long as we're doing a round trip to the server anyway,
	 * let's be prepared for a page of acl data. */
	if (npages == 0)
		npages = 1;
	if (npages > ARRAY_SIZE(pages))
		return -ERANGE;

	for (i = 0; i < npages; i++) {
		pages[i] = alloc_page(GFP_KERNEL);
		if (!pages[i])
			goto out_free;
	}

	/* for decoding across pages */
	res.acl_scratch = alloc_page(GFP_KERNEL);
	if (!res.acl_scratch)
		goto out_free;

	args.acl_len = npages * PAGE_SIZE;
	args.acl_pgbase = 0;

	dprintk("%s  buf %p buflen %zu npages %d args.acl_len %zu\n",
		__func__, buf, buflen, npages, args.acl_len);
	ret = nfs4_call_sync(NFS_SERVER(inode)->client, NFS_SERVER(inode),
			     &msg, &args.seq_args, &res.seq_res, 0);
	if (ret)
		goto out_free;

	/* Handle the case where the passed-in buffer is too short */
	if (res.acl_flags & NFS4_ACL_TRUNC) {
		/* Did the user only issue a request for the acl length? */
		if (buf == NULL)
			goto out_ok;
		ret = -ERANGE;
		goto out_free;
	}
	nfs4_write_cached_acl(inode, pages, res.acl_data_offset, res.acl_len);
	if (buf) {
		if (res.acl_len > buflen) {
			ret = -ERANGE;
			goto out_free;
		}
		_copy_from_pages(buf, pages, res.acl_data_offset, res.acl_len);
	}
out_ok:
	ret = res.acl_len;
out_free:
	/* pages[] was zero-initialised, so unallocated slots are skipped */
	for (i = 0; i < npages; i++)
		if (pages[i])
			__free_page(pages[i]);
	if (res.acl_scratch)
		__free_page(res.acl_scratch);
	return ret;
}

4098 4099 4100 4101 4102 4103 4104 4105 4106 4107 4108 4109 4110
/*
 * Fetch the ACL from the server, retrying for as long as
 * nfs4_handle_exception() sets exception.retry.  A non-negative result
 * (the ACL length) ends the loop immediately.
 */
static ssize_t nfs4_get_acl_uncached(struct inode *inode, void *buf, size_t buflen)
{
	struct nfs4_exception exception = { };
	ssize_t ret;

	for (;;) {
		ret = __nfs4_get_acl_uncached(inode, buf, buflen);
		if (ret >= 0)
			break;
		ret = nfs4_handle_exception(NFS_SERVER(inode), ret, &exception);
		if (!exception.retry)
			break;
	}
	return ret;
}

4111 4112 4113 4114 4115 4116 4117 4118 4119 4120
/*
 * Read the NFSv4 ACL of @inode into @buf (or just report its length when
 * @buf is NULL).
 *
 * Returns -EOPNOTSUPP when the server lacks ACL support, a negative error
 * from inode revalidation, the cached answer when the cache can provide
 * one, and otherwise the result of a server round trip.
 */
static ssize_t nfs4_proc_get_acl(struct inode *inode, void *buf, size_t buflen)
{
	struct nfs_server *server = NFS_SERVER(inode);
	int ret;

	if (!nfs4_server_supports_acls(server))
		return -EOPNOTSUPP;
	ret = nfs_revalidate_inode(server, inode);
	if (ret < 0)
		return ret;
	if (NFS_I(inode)->cache_validity & NFS_INO_INVALID_ACL)
		nfs_zap_acl_cache(inode);
	ret = nfs4_read_cached_acl(inode, buf, buflen);
	if (ret != -ENOENT)
		/* -ENOENT is returned if there is no ACL or if there is an ACL
		 * but no cached acl data, just the acl length */
		return ret;
	return nfs4_get_acl_uncached(inode, buf, buflen);
}

4131
/*
 * One SETACL round trip.
 *
 * Returns -EOPNOTSUPP when the server lacks ACL support, -ERANGE when
 * @buflen needs more than NFS4ACL_MAXPAGES pages, a negative value from
 * buf_to_pages_noslab(), or the status of the RPC.  After the call the
 * attribute, access and ACL caches of @inode are invalidated regardless of
 * the RPC status.
 */
static int __nfs4_proc_set_acl(struct inode *inode, const void *buf, size_t buflen)
{
	struct nfs_server *server = NFS_SERVER(inode);
	struct page *pages[NFS4ACL_MAXPAGES];
	struct nfs_setaclargs arg = {
		.fh		= NFS_FH(inode),
		.acl_pages	= pages,
		.acl_len	= buflen,
	};
	struct nfs_setaclres res;
	struct rpc_message msg = {
		.rpc_proc	= &nfs4_procedures[NFSPROC4_CLNT_SETACL],
		.rpc_argp	= &arg,
		.rpc_resp	= &res,
	};
	unsigned int npages = DIV_ROUND_UP(buflen, PAGE_SIZE);
	int ret, i;

	if (!nfs4_server_supports_acls(server))
		return -EOPNOTSUPP;
	if (npages > ARRAY_SIZE(pages))
		return -ERANGE;
	/* i becomes the number of pages now holding a copy of buf */
	i = buf_to_pages_noslab(buf, buflen, arg.acl_pages, &arg.acl_pgbase);
	if (i < 0)
		return i;
	nfs4_inode_return_delegation(inode);
	ret = nfs4_call_sync(server->client, server, &msg, &arg.seq_args, &res.seq_res, 1);

	/*
	 * Free each page after tx, so the only ref left is
	 * held by the network stack
	 */
	for (; i > 0; i--)
		put_page(pages[i-1]);

	/*
	 * Acl update can result in inode attribute update.
	 * so mark the attribute cache invalid.
	 */
	spin_lock(&inode->i_lock);
	NFS_I(inode)->cache_validity |= NFS_INO_INVALID_ATTR;
	spin_unlock(&inode->i_lock);
	nfs_access_zap_cache(inode);
	nfs_zap_acl_cache(inode);
	return ret;
}

4178 4179 4180 4181 4182 4183 4184 4185 4186 4187 4188 4189
/*
 * Set the NFSv4 ACL of @inode from @buf, repeating the SETACL call for as
 * long as nfs4_handle_exception() requests a retry.  Returns the value
 * produced by nfs4_handle_exception() for the final attempt.
 */
static int nfs4_proc_set_acl(struct inode *inode, const void *buf, size_t buflen)
{
	struct nfs4_exception exception = { };
	int err;

	do {
		int status = __nfs4_proc_set_acl(inode, buf, buflen);

		err = nfs4_handle_exception(NFS_SERVER(inode), status,
				&exception);
	} while (exception.retry);
	return err;
}

L
Linus Torvalds 已提交
4190
static int
4191
nfs4_async_handle_error(struct rpc_task *task, const struct nfs_server *server, struct nfs4_state *state)
L
Linus Torvalds 已提交
4192
{
4193 4194 4195
	struct nfs_client *clp = server->nfs_client;

	if (task->tk_status >= 0)
L
Linus Torvalds 已提交
4196 4197
		return 0;
	switch(task->tk_status) {
4198
		case -NFS4ERR_DELEG_REVOKED:
4199 4200
		case -NFS4ERR_ADMIN_REVOKED:
		case -NFS4ERR_BAD_STATEID:
4201 4202 4203
			if (state == NULL)
				break;
			nfs_remove_bad_delegation(state->inode);
4204 4205 4206
		case -NFS4ERR_OPENMODE:
			if (state == NULL)
				break;
4207 4208
			if (nfs4_schedule_stateid_recovery(server, state) < 0)
				goto stateid_invalid;
4209
			goto wait_on_recovery;
4210
		case -NFS4ERR_EXPIRED:
4211 4212 4213 4214
			if (state != NULL) {
				if (nfs4_schedule_stateid_recovery(server, state) < 0)
					goto stateid_invalid;
			}
L
Linus Torvalds 已提交
4215
		case -NFS4ERR_STALE_STATEID:
4216
		case -NFS4ERR_STALE_CLIENTID:
4217 4218
			nfs4_schedule_lease_recovery(clp);
			goto wait_on_recovery;
4219 4220 4221 4222 4223 4224 4225 4226 4227 4228
#if defined(CONFIG_NFS_V4_1)
		case -NFS4ERR_BADSESSION:
		case -NFS4ERR_BADSLOT:
		case -NFS4ERR_BAD_HIGH_SLOT:
		case -NFS4ERR_DEADSESSION:
		case -NFS4ERR_CONN_NOT_BOUND_TO_SESSION:
		case -NFS4ERR_SEQ_FALSE_RETRY:
		case -NFS4ERR_SEQ_MISORDERED:
			dprintk("%s ERROR %d, Reset session\n", __func__,
				task->tk_status);
4229
			nfs4_schedule_session_recovery(clp->cl_session, task->tk_status);
4230 4231 4232
			task->tk_status = 0;
			return -EAGAIN;
#endif /* CONFIG_NFS_V4_1 */
L
Linus Torvalds 已提交
4233
		case -NFS4ERR_DELAY:
4234
			nfs_inc_server_stats(server, NFSIOS_DELAY);
4235
		case -NFS4ERR_GRACE:
L
Linus Torvalds 已提交
4236 4237 4238
			rpc_delay(task, NFS4_POLL_RETRY_MAX);
			task->tk_status = 0;
			return -EAGAIN;
4239
		case -NFS4ERR_RETRY_UNCACHED_REP:
L
Linus Torvalds 已提交
4240 4241 4242 4243 4244 4245
		case -NFS4ERR_OLD_STATEID:
			task->tk_status = 0;
			return -EAGAIN;
	}
	task->tk_status = nfs4_map_errors(task->tk_status);
	return 0;
4246 4247 4248
stateid_invalid:
	task->tk_status = -EIO;
	return 0;
4249
wait_on_recovery:
4250 4251 4252 4253 4254
	rpc_sleep_on(&clp->cl_rpcwaitq, task, NULL);
	if (test_bit(NFS4CLNT_MANAGER_RUNNING, &clp->cl_state) == 0)
		rpc_wake_up_queued_task(&clp->cl_rpcwaitq, task);
	task->tk_status = 0;
	return -EAGAIN;
L
Linus Torvalds 已提交
4255 4256
}

4257 4258
/*
 * Fill @bootverf with the client's boot verifier: normally the per-net
 * boot time (seconds, nanoseconds), or a deliberately impossible value
 * when NFS4CLNT_PURGE_STATE is set on @clp.
 */
static void nfs4_init_boot_verifier(const struct nfs_client *clp,
				    nfs4_verifier *bootverf)
{
	__be32 verf[2];

	if (test_bit(NFS4CLNT_PURGE_STATE, &clp->cl_state)) {
		/* An impossible timestamp guarantees this value
		 * will never match a generated boot time. */
		verf[0] = 0;
		verf[1] = (__be32)(NSEC_PER_SEC + 1);
	} else {
		struct nfs_net *nn = net_generic(clp->cl_net, nfs_net_id);
		verf[0] = (__be32)nn->boot_time.tv_sec;
		verf[1] = (__be32)nn->boot_time.tv_nsec;
	}
	memcpy(bootverf->data, verf, sizeof(bootverf->data));
}

4275 4276 4277 4278 4279 4280 4281 4282 4283 4284 4285 4286 4287 4288 4289 4290 4291 4292 4293 4294 4295
/*
 * Build the non-uniform client identifier string in @buf: the client IP
 * address, the peer address and the peer protocol.  The peer strings are
 * looked up and formatted inside one RCU read-side section.
 * Returns the number of characters written, as reported by scnprintf().
 */
static unsigned int
nfs4_init_nonuniform_client_string(const struct nfs_client *clp,
				   char *buf, size_t len)
{
	const char *peer_addr, *peer_proto;
	unsigned int written;

	rcu_read_lock();
	peer_addr = rpc_peeraddr2str(clp->cl_rpcclient, RPC_DISPLAY_ADDR);
	peer_proto = rpc_peeraddr2str(clp->cl_rpcclient, RPC_DISPLAY_PROTO);
	written = scnprintf(buf, len, "Linux NFSv4.0 %s/%s %s",
			    clp->cl_ipaddr, peer_addr, peer_proto);
	rcu_read_unlock();
	return written;
}

/*
 * Build the uniform client identifier string in @buf from the NFS version,
 * minor version and a node name.  The node name is the RPC client's
 * cl_nodename unless nfs4_client_id_uniquifier is non-empty, in which case
 * the uniquifier is used instead.
 * Returns the number of characters written, as reported by scnprintf().
 */
static unsigned int
nfs4_init_uniform_client_string(const struct nfs_client *clp,
				char *buf, size_t len)
{
	char *nodename = clp->cl_rpcclient->cl_nodename;

	if (nfs4_client_id_uniquifier[0] != '\0')
		nodename = nfs4_client_id_uniquifier;
	return scnprintf(buf, len, "Linux NFSv%u.%u %s",
				clp->rpc_ops->version, clp->cl_minorversion,
				nodename);
}

4305 4306 4307 4308 4309 4310 4311 4312 4313 4314
/**
 * nfs4_proc_setclientid - Negotiate client ID
 * @clp: state data structure
 * @program: RPC program for NFSv4 callback service
 * @port: IP port number for NFS4 callback service
 * @cred: RPC credential to use for this call
 * @res: where to place the result
 *
 * Returns zero, a negative errno, or a negative NFS4ERR status code.
 */
4315 4316 4317
int nfs4_proc_setclientid(struct nfs_client *clp, u32 program,
		unsigned short port, struct rpc_cred *cred,
		struct nfs4_setclientid_res *res)
{
	nfs4_verifier sc_verifier;
	struct nfs4_setclientid setclientid = {
		.sc_verifier = &sc_verifier,
		.sc_prog = program,
		.sc_cb_ident = clp->cl_cb_ident,
	};
	struct rpc_message msg = {
		.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_SETCLIENTID],
		.rpc_argp = &setclientid,
		.rpc_resp = res,
		.rpc_cred = cred,
	};
	int status;

	/* nfs_client_id4 */
	nfs4_init_boot_verifier(clp, &sc_verifier);
	/* The identifier format depends on whether migration support is enabled */
	if (test_bit(NFS_CS_MIGRATION, &clp->cl_flags))
		setclientid.sc_name_len =
				nfs4_init_uniform_client_string(clp,
						setclientid.sc_name,
						sizeof(setclientid.sc_name));
	else
		setclientid.sc_name_len =
				nfs4_init_nonuniform_client_string(clp,
						setclientid.sc_name,
						sizeof(setclientid.sc_name));
	/* cb_client4 */
	rcu_read_lock();
	/*
	 * Always format through "%s": the netid string must be treated as
	 * data, never as a format string.
	 */
	setclientid.sc_netid_len = scnprintf(setclientid.sc_netid,
				sizeof(setclientid.sc_netid), "%s",
				rpc_peeraddr2str(clp->cl_rpcclient,
							RPC_DISPLAY_NETID));
	rcu_read_unlock();
	/* Universal address: IP address followed by the two port octets */
	setclientid.sc_uaddr_len = scnprintf(setclientid.sc_uaddr,
				sizeof(setclientid.sc_uaddr), "%s.%u.%u",
				clp->cl_ipaddr, port >> 8, port & 255);

	dprintk("NFS call  setclientid auth=%s, '%.*s'\n",
		clp->cl_rpcclient->cl_auth->au_ops->au_name,
		setclientid.sc_name_len, setclientid.sc_name);
	status = rpc_call_sync(clp->cl_rpcclient, &msg, RPC_TASK_TIMEOUT);
	dprintk("NFS reply setclientid: %d\n", status);
	return status;
}

4364 4365 4366 4367 4368 4369 4370 4371
/**
 * nfs4_proc_setclientid_confirm - Confirm client ID
 * @clp: state data structure
 * @arg: result of a previous SETCLIENTID
 * @cred: RPC credential to use for this call
 *
 * Returns zero, a negative errno, or a negative NFS4ERR status code.
 */
4372
int nfs4_proc_setclientid_confirm(struct nfs_client *clp,
4373 4374
		struct nfs4_setclientid_res *arg,
		struct rpc_cred *cred)
L
Linus Torvalds 已提交
4375 4376 4377
{
	struct rpc_message msg = {
		.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_SETCLIENTID_CONFIRM],
4378
		.rpc_argp = arg,
4379
		.rpc_cred = cred,
L
Linus Torvalds 已提交
4380 4381 4382
	};
	int status;

4383 4384 4385
	dprintk("NFS call  setclientid_confirm auth=%s, (client ID %llx)\n",
		clp->cl_rpcclient->cl_auth->au_ops->au_name,
		clp->cl_clientid);
4386
	status = rpc_call_sync(clp->cl_rpcclient, &msg, RPC_TASK_TIMEOUT);
4387
	dprintk("NFS reply setclientid_confirm: %d\n", status);
L
Linus Torvalds 已提交
4388 4389 4390
	return status;
}

4391 4392
struct nfs4_delegreturndata {
	struct nfs4_delegreturnargs args;
4393
	struct nfs4_delegreturnres res;
4394 4395
	struct nfs_fh fh;
	nfs4_stateid stateid;
4396
	unsigned long timestamp;
4397
	struct nfs_fattr fattr;
4398 4399 4400 4401 4402 4403
	int rpc_status;
};

static void nfs4_delegreturn_done(struct rpc_task *task, void *calldata)
{
	struct nfs4_delegreturndata *data = calldata;
4404

4405 4406
	if (!nfs4_sequence_done(task, &data->res.seq_res))
		return;
4407

4408 4409 4410 4411
	switch (task->tk_status) {
	case -NFS4ERR_STALE_STATEID:
	case -NFS4ERR_EXPIRED:
	case 0:
4412
		renew_lease(data->res.server, data->timestamp);
4413 4414 4415 4416
		break;
	default:
		if (nfs4_async_handle_error(task, data->res.server, NULL) ==
				-EAGAIN) {
4417
			rpc_restart_call_prepare(task);
4418 4419 4420 4421
			return;
		}
	}
	data->rpc_status = task->tk_status;
4422 4423 4424 4425 4426 4427 4428
}

/* Release callback for DELEGRETURN: frees the call data. */
static void nfs4_delegreturn_release(void *calldata)
{
	kfree(calldata);
}

4429 4430 4431 4432 4433 4434 4435
#if defined(CONFIG_NFS_V4_1)
static void nfs4_delegreturn_prepare(struct rpc_task *task, void *data)
{
	struct nfs4_delegreturndata *d_data;

	d_data = (struct nfs4_delegreturndata *)data;

4436 4437 4438 4439
	nfs4_setup_sequence(d_data->res.server,
			&d_data->args.seq_args,
			&d_data->res.seq_res,
			task);
4440 4441 4442
}
#endif /* CONFIG_NFS_V4_1 */

4443
static const struct rpc_call_ops nfs4_delegreturn_ops = {
4444 4445 4446
#if defined(CONFIG_NFS_V4_1)
	.rpc_call_prepare = nfs4_delegreturn_prepare,
#endif /* CONFIG_NFS_V4_1 */
4447 4448 4449 4450
	.rpc_call_done = nfs4_delegreturn_done,
	.rpc_release = nfs4_delegreturn_release,
};

4451
static int _nfs4_proc_delegreturn(struct inode *inode, struct rpc_cred *cred, const nfs4_stateid *stateid, int issync)
4452 4453
{
	struct nfs4_delegreturndata *data;
4454
	struct nfs_server *server = NFS_SERVER(inode);
4455
	struct rpc_task *task;
4456 4457 4458 4459
	struct rpc_message msg = {
		.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_DELEGRETURN],
		.rpc_cred = cred,
	};
T
Trond Myklebust 已提交
4460 4461
	struct rpc_task_setup task_setup_data = {
		.rpc_client = server->client,
4462
		.rpc_message = &msg,
T
Trond Myklebust 已提交
4463 4464 4465
		.callback_ops = &nfs4_delegreturn_ops,
		.flags = RPC_TASK_ASYNC,
	};
4466
	int status = 0;
4467

4468
	data = kzalloc(sizeof(*data), GFP_NOFS);
4469 4470
	if (data == NULL)
		return -ENOMEM;
4471
	nfs41_init_sequence(&data->args.seq_args, &data->res.seq_res, 1);
4472 4473
	data->args.fhandle = &data->fh;
	data->args.stateid = &data->stateid;
4474
	data->args.bitmask = server->cache_consistency_bitmask;
4475
	nfs_copy_fh(&data->fh, NFS_FH(inode));
4476
	nfs4_stateid_copy(&data->stateid, stateid);
4477 4478
	data->res.fattr = &data->fattr;
	data->res.server = server;
4479
	nfs_fattr_init(data->res.fattr);
4480
	data->timestamp = jiffies;
4481 4482
	data->rpc_status = 0;

T
Trond Myklebust 已提交
4483
	task_setup_data.callback_data = data;
4484 4485
	msg.rpc_argp = &data->args;
	msg.rpc_resp = &data->res;
T
Trond Myklebust 已提交
4486
	task = rpc_run_task(&task_setup_data);
4487
	if (IS_ERR(task))
4488
		return PTR_ERR(task);
4489 4490
	if (!issync)
		goto out;
4491
	status = nfs4_wait_for_completion_rpc_task(task);
4492 4493 4494
	if (status != 0)
		goto out;
	status = data->rpc_status;
4495 4496 4497 4498
	if (status == 0)
		nfs_post_op_update_inode_force_wcc(inode, &data->fattr);
	else
		nfs_refresh_inode(inode, &data->fattr);
4499
out:
4500
	rpc_put_task(task);
4501
	return status;
L
Linus Torvalds 已提交
4502 4503
}

4504
int nfs4_proc_delegreturn(struct inode *inode, struct rpc_cred *cred, const nfs4_stateid *stateid, int issync)
L
Linus Torvalds 已提交
4505 4506 4507 4508 4509
{
	struct nfs_server *server = NFS_SERVER(inode);
	struct nfs4_exception exception = { };
	int err;
	do {
4510
		err = _nfs4_proc_delegreturn(inode, cred, stateid, issync);
L
Linus Torvalds 已提交
4511 4512 4513 4514 4515 4516 4517 4518 4519 4520 4521 4522 4523 4524 4525 4526 4527 4528 4529 4530
		switch (err) {
			case -NFS4ERR_STALE_STATEID:
			case -NFS4ERR_EXPIRED:
			case 0:
				return 0;
		}
		err = nfs4_handle_exception(server, err, &exception);
	} while (exception.retry);
	return err;
}

#define NFS4_LOCK_MINTIMEOUT (1 * HZ)
#define NFS4_LOCK_MAXTIMEOUT (30 * HZ)

/* 
 * sleep, with exponential backoff, and retry the LOCK operation. 
 */
static unsigned long
nfs4_set_lock_task_retry(unsigned long timeout)
{
	/* Sleep for the current timeout (killable, freezer-aware) ... */
	freezable_schedule_timeout_killable(timeout);
	/* ... then hand back the doubled value, capped at the maximum */
	timeout <<= 1;
	if (timeout > NFS4_LOCK_MAXTIMEOUT)
		return NFS4_LOCK_MAXTIMEOUT;
	return timeout;
}

static int _nfs4_proc_getlk(struct nfs4_state *state, int cmd, struct file_lock *request)
{
	struct inode *inode = state->inode;
	struct nfs_server *server = NFS_SERVER(inode);
4542
	struct nfs_client *clp = server->nfs_client;
T
Trond Myklebust 已提交
4543
	struct nfs_lockt_args arg = {
L
Linus Torvalds 已提交
4544
		.fh = NFS_FH(inode),
T
Trond Myklebust 已提交
4545
		.fl = request,
L
Linus Torvalds 已提交
4546
	};
T
Trond Myklebust 已提交
4547 4548
	struct nfs_lockt_res res = {
		.denied = request,
L
Linus Torvalds 已提交
4549 4550 4551 4552 4553 4554 4555 4556 4557 4558
	};
	struct rpc_message msg = {
		.rpc_proc	= &nfs4_procedures[NFSPROC4_CLNT_LOCKT],
		.rpc_argp       = &arg,
		.rpc_resp       = &res,
		.rpc_cred	= state->owner->so_cred,
	};
	struct nfs4_lock_state *lsp;
	int status;

T
Trond Myklebust 已提交
4559
	arg.lock_owner.clientid = clp->cl_clientid;
4560 4561 4562 4563
	status = nfs4_set_lock_state(state, request);
	if (status != 0)
		goto out;
	lsp = request->fl_u.nfs4_fl.owner;
4564
	arg.lock_owner.id = lsp->ls_seqid.owner_id;
4565
	arg.lock_owner.s_dev = server->s_dev;
4566
	status = nfs4_call_sync(server->client, server, &msg, &arg.seq_args, &res.seq_res, 1);
T
Trond Myklebust 已提交
4567 4568 4569 4570 4571 4572
	switch (status) {
		case 0:
			request->fl_type = F_UNLCK;
			break;
		case -NFS4ERR_DENIED:
			status = 0;
L
Linus Torvalds 已提交
4573
	}
4574
	request->fl_ops->fl_release_private(request);
4575
out:
L
Linus Torvalds 已提交
4576 4577 4578 4579 4580 4581 4582 4583 4584 4585 4586 4587 4588 4589 4590 4591 4592 4593 4594 4595 4596 4597 4598 4599 4600 4601 4602 4603 4604 4605 4606 4607
	return status;
}

/*
 * Test for a conflicting lock, repeating the LOCKT call for as long as
 * nfs4_handle_exception() requests a retry.  Returns the value produced by
 * nfs4_handle_exception() for the final attempt.
 */
static int nfs4_proc_getlk(struct nfs4_state *state, int cmd, struct file_lock *request)
{
	struct nfs4_exception exception = { };
	int err;

	do {
		int status = _nfs4_proc_getlk(state, cmd, request);

		err = nfs4_handle_exception(NFS_SERVER(state->inode), status,
				&exception);
	} while (exception.retry);
	return err;
}

/*
 * Apply @fl to @file through the VFS, choosing the POSIX or flock helper
 * according to fl_flags.  Any other flag combination is a BUG().
 * Returns the helper's result.
 */
static int do_vfs_lock(struct file *file, struct file_lock *fl)
{
	switch (fl->fl_flags & (FL_POSIX|FL_FLOCK)) {
	case FL_POSIX:
		return posix_lock_file_wait(file, fl);
	case FL_FLOCK:
		return flock_lock_file_wait(file, fl);
	default:
		BUG();
	}
	return 0;
}

4608
struct nfs4_unlockdata {
T
Trond Myklebust 已提交
4609 4610
	struct nfs_locku_args arg;
	struct nfs_locku_res res;
4611 4612
	struct nfs4_lock_state *lsp;
	struct nfs_open_context *ctx;
T
Trond Myklebust 已提交
4613 4614
	struct file_lock fl;
	const struct nfs_server *server;
4615
	unsigned long timestamp;
4616 4617
};

T
Trond Myklebust 已提交
4618 4619 4620 4621 4622 4623 4624 4625
static struct nfs4_unlockdata *nfs4_alloc_unlockdata(struct file_lock *fl,
		struct nfs_open_context *ctx,
		struct nfs4_lock_state *lsp,
		struct nfs_seqid *seqid)
{
	struct nfs4_unlockdata *p;
	struct inode *inode = lsp->ls_state->inode;

4626
	p = kzalloc(sizeof(*p), GFP_NOFS);
T
Trond Myklebust 已提交
4627 4628 4629 4630 4631
	if (p == NULL)
		return NULL;
	p->arg.fh = NFS_FH(inode);
	p->arg.fl = &p->fl;
	p->arg.seqid = seqid;
4632
	p->res.seqid = seqid;
T
Trond Myklebust 已提交
4633 4634 4635 4636 4637 4638 4639 4640 4641 4642
	p->arg.stateid = &lsp->ls_stateid;
	p->lsp = lsp;
	atomic_inc(&lsp->ls_count);
	/* Ensure we don't close file until we're done freeing locks! */
	p->ctx = get_nfs_open_context(ctx);
	memcpy(&p->fl, fl, sizeof(p->fl));
	p->server = NFS_SERVER(inode);
	return p;
}

4643
static void nfs4_locku_release_calldata(void *data)
4644
{
4645
	struct nfs4_unlockdata *calldata = data;
T
Trond Myklebust 已提交
4646
	nfs_free_seqid(calldata->arg.seqid);
4647 4648 4649
	nfs4_put_lock_state(calldata->lsp);
	put_nfs_open_context(calldata->ctx);
	kfree(calldata);
4650 4651
}

4652
static void nfs4_locku_done(struct rpc_task *task, void *data)
4653
{
4654
	struct nfs4_unlockdata *calldata = data;
4655

4656 4657
	if (!nfs4_sequence_done(task, &calldata->res.seq_res))
		return;
4658 4659
	switch (task->tk_status) {
		case 0:
4660 4661
			nfs4_stateid_copy(&calldata->lsp->ls_stateid,
					&calldata->res.stateid);
4662
			renew_lease(calldata->server, calldata->timestamp);
4663
			break;
4664 4665
		case -NFS4ERR_BAD_STATEID:
		case -NFS4ERR_OLD_STATEID:
4666 4667 4668 4669
		case -NFS4ERR_STALE_STATEID:
		case -NFS4ERR_EXPIRED:
			break;
		default:
4670
			if (nfs4_async_handle_error(task, calldata->server, NULL) == -EAGAIN)
4671
				rpc_restart_call_prepare(task);
4672
	}
4673
	nfs_release_seqid(calldata->arg.seqid);
4674 4675
}

T
Trond Myklebust 已提交
4676
static void nfs4_locku_prepare(struct rpc_task *task, void *data)
4677
{
T
Trond Myklebust 已提交
4678
	struct nfs4_unlockdata *calldata = data;
4679

T
Trond Myklebust 已提交
4680
	if (nfs_wait_on_sequence(calldata->arg.seqid, task) != 0)
4681
		goto out_wait;
4682
	if (test_bit(NFS_LOCK_INITIALIZED, &calldata->lsp->ls_flags) == 0) {
4683
		/* Note: exit _without_ running nfs4_locku_done */
4684
		goto out_no_action;
4685
	}
4686
	calldata->timestamp = jiffies;
4687
	if (nfs4_setup_sequence(calldata->server,
4688
				&calldata->arg.seq_args,
4689 4690 4691
				&calldata->res.seq_res,
				task) != 0)
		nfs_release_seqid(calldata->arg.seqid);
4692 4693 4694 4695 4696
	return;
out_no_action:
	task->tk_action = NULL;
out_wait:
	nfs4_sequence_done(task, &calldata->res.seq_res);
4697 4698
}

4699
static const struct rpc_call_ops nfs4_locku_ops = {
T
Trond Myklebust 已提交
4700
	.rpc_call_prepare = nfs4_locku_prepare,
4701
	.rpc_call_done = nfs4_locku_done,
4702
	.rpc_release = nfs4_locku_release_calldata,
4703 4704
};

4705 4706 4707 4708 4709 4710
static struct rpc_task *nfs4_do_unlck(struct file_lock *fl,
		struct nfs_open_context *ctx,
		struct nfs4_lock_state *lsp,
		struct nfs_seqid *seqid)
{
	struct nfs4_unlockdata *data;
4711 4712 4713 4714
	struct rpc_message msg = {
		.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_LOCKU],
		.rpc_cred = ctx->cred,
	};
T
Trond Myklebust 已提交
4715 4716
	struct rpc_task_setup task_setup_data = {
		.rpc_client = NFS_CLIENT(lsp->ls_state->inode),
4717
		.rpc_message = &msg,
T
Trond Myklebust 已提交
4718
		.callback_ops = &nfs4_locku_ops,
4719
		.workqueue = nfsiod_workqueue,
T
Trond Myklebust 已提交
4720 4721
		.flags = RPC_TASK_ASYNC,
	};
4722

4723 4724 4725 4726 4727
	/* Ensure this is an unlock - when canceling a lock, the
	 * canceled lock is passed in, and it won't be an unlock.
	 */
	fl->fl_type = F_UNLCK;

4728 4729 4730 4731 4732 4733
	data = nfs4_alloc_unlockdata(fl, ctx, lsp, seqid);
	if (data == NULL) {
		nfs_free_seqid(seqid);
		return ERR_PTR(-ENOMEM);
	}

4734
	nfs41_init_sequence(&data->arg.seq_args, &data->res.seq_res, 1);
4735 4736
	msg.rpc_argp = &data->arg;
	msg.rpc_resp = &data->res;
T
Trond Myklebust 已提交
4737 4738
	task_setup_data.callback_data = data;
	return rpc_run_task(&task_setup_data);
4739 4740
}

4741 4742
static int nfs4_proc_unlck(struct nfs4_state *state, int cmd, struct file_lock *request)
{
4743 4744 4745
	struct inode *inode = state->inode;
	struct nfs4_state_owner *sp = state->owner;
	struct nfs_inode *nfsi = NFS_I(inode);
T
Trond Myklebust 已提交
4746
	struct nfs_seqid *seqid;
L
Linus Torvalds 已提交
4747
	struct nfs4_lock_state *lsp;
4748 4749
	struct rpc_task *task;
	int status = 0;
4750
	unsigned char fl_flags = request->fl_flags;
4751

4752
	status = nfs4_set_lock_state(state, request);
4753 4754
	/* Unlock _before_ we do the RPC call */
	request->fl_flags |= FL_EXISTS;
4755 4756 4757
	/* Exclude nfs_delegation_claim_locks() */
	mutex_lock(&sp->so_delegreturn_mutex);
	/* Exclude nfs4_reclaim_open_stateid() - note nesting! */
4758 4759 4760
	down_read(&nfsi->rwsem);
	if (do_vfs_lock(request->fl_file, request) == -ENOENT) {
		up_read(&nfsi->rwsem);
4761
		mutex_unlock(&sp->so_delegreturn_mutex);
4762
		goto out;
4763 4764
	}
	up_read(&nfsi->rwsem);
4765
	mutex_unlock(&sp->so_delegreturn_mutex);
4766
	if (status != 0)
4767 4768
		goto out;
	/* Is this a delegated lock? */
4769
	lsp = request->fl_u.nfs4_fl.owner;
4770 4771
	if (test_bit(NFS_LOCK_INITIALIZED, &lsp->ls_flags) == 0)
		goto out;
4772
	seqid = nfs_alloc_seqid(&lsp->ls_seqid, GFP_KERNEL);
4773
	status = -ENOMEM;
T
Trond Myklebust 已提交
4774
	if (seqid == NULL)
4775
		goto out;
4776
	task = nfs4_do_unlck(request, nfs_file_open_context(request->fl_file), lsp, seqid);
4777 4778
	status = PTR_ERR(task);
	if (IS_ERR(task))
4779
		goto out;
4780
	status = nfs4_wait_for_completion_rpc_task(task);
4781
	rpc_put_task(task);
4782
out:
4783
	request->fl_flags = fl_flags;
L
Linus Torvalds 已提交
4784 4785 4786
	return status;
}

4787 4788 4789 4790 4791 4792
/* Per-call state for an asynchronous LOCK RPC (see nfs4_lock_ops). */
struct nfs4_lockdata {
	struct nfs_lock_args arg;	/* passed as rpc_argp */
	struct nfs_lock_res res;	/* passed as rpc_resp */
	struct nfs4_lock_state *lsp;	/* ls_count is incremented on allocation */
	struct nfs_open_context *ctx;	/* reference from get_nfs_open_context() */
	struct file_lock fl;		/* private copy of the caller's lock */
	unsigned long timestamp;	/* jiffies recorded in nfs4_lock_prepare() */
	int rpc_status;			/* task status stored by nfs4_lock_done() */
	int cancelled;			/* set when the wait for the task fails */
	struct nfs_server *server;
};

/*
 * Allocate and fill in the calldata for a LOCK RPC.
 *
 * Allocates an open seqid and a lock seqid, copies @fl into the calldata,
 * increments lsp->ls_count and takes an open-context reference via
 * get_nfs_open_context().
 *
 * Returns the new calldata, or NULL if any allocation fails (everything
 * allocated so far is freed in that case).
 */
static struct nfs4_lockdata *nfs4_alloc_lockdata(struct file_lock *fl,
		struct nfs_open_context *ctx, struct nfs4_lock_state *lsp,
		gfp_t gfp_mask)
{
	struct inode *inode = lsp->ls_state->inode;
	struct nfs_server *server = NFS_SERVER(inode);
	struct nfs4_lockdata *data;

	data = kzalloc(sizeof(*data), gfp_mask);
	if (!data)
		return NULL;

	data->arg.fh = NFS_FH(inode);
	data->arg.fl = &data->fl;

	data->arg.open_seqid = nfs_alloc_seqid(&lsp->ls_state->owner->so_seqid,
					       gfp_mask);
	if (!data->arg.open_seqid)
		goto err_free_data;

	data->arg.lock_seqid = nfs_alloc_seqid(&lsp->ls_seqid, gfp_mask);
	if (!data->arg.lock_seqid)
		goto err_free_open_seqid;

	data->arg.lock_stateid = &lsp->ls_stateid;
	data->arg.lock_owner.clientid = server->nfs_client->cl_clientid;
	data->arg.lock_owner.id = lsp->ls_seqid.owner_id;
	data->arg.lock_owner.s_dev = server->s_dev;
	data->res.lock_seqid = data->arg.lock_seqid;
	data->lsp = lsp;
	data->server = server;
	atomic_inc(&lsp->ls_count);
	data->ctx = get_nfs_open_context(ctx);
	memcpy(&data->fl, fl, sizeof(data->fl));
	return data;

err_free_open_seqid:
	nfs_free_seqid(data->arg.open_seqid);
err_free_data:
	kfree(data);
	return NULL;
}

static void nfs4_lock_prepare(struct rpc_task *task, void *calldata)
{
	struct nfs4_lockdata *data = calldata;
	struct nfs4_state *state = data->lsp->ls_state;
4841

4842
	dprintk("%s: begin!\n", __func__);
4843
	if (nfs_wait_on_sequence(data->arg.lock_seqid, task) != 0)
4844
		goto out_wait;
4845 4846
	/* Do we need to do an open_to_lock_owner? */
	if (!(data->arg.lock_seqid->sequence->flags & NFS_SEQID_CONFIRMED)) {
4847
		if (nfs_wait_on_sequence(data->arg.open_seqid, task) != 0) {
4848
			goto out_release_lock_seqid;
4849
		}
4850
		data->arg.open_stateid = &state->open_stateid;
4851
		data->arg.new_lock_owner = 1;
4852
		data->res.open_seqid = data->arg.open_seqid;
4853 4854
	} else
		data->arg.new_lock_owner = 0;
4855 4856 4857 4858 4859
	if (!nfs4_valid_open_stateid(state)) {
		data->rpc_status = -EBADF;
		task->tk_action = NULL;
		goto out_release_open_seqid;
	}
4860
	data->timestamp = jiffies;
4861 4862
	if (nfs4_setup_sequence(data->server,
				&data->arg.seq_args,
4863
				&data->res.seq_res,
4864
				task) == 0)
4865
		return;
4866
out_release_open_seqid:
4867 4868 4869
	nfs_release_seqid(data->arg.open_seqid);
out_release_lock_seqid:
	nfs_release_seqid(data->arg.lock_seqid);
4870 4871
out_wait:
	nfs4_sequence_done(task, &data->res.seq_res);
4872
	dprintk("%s: done!, ret = %d\n", __func__, data->rpc_status);
4873 4874
}

4875 4876 4877 4878
static void nfs4_lock_done(struct rpc_task *task, void *calldata)
{
	struct nfs4_lockdata *data = calldata;

4879
	dprintk("%s: begin!\n", __func__);
4880

4881 4882
	if (!nfs4_sequence_done(task, &data->res.seq_res))
		return;
4883

4884 4885 4886 4887 4888 4889 4890 4891
	data->rpc_status = task->tk_status;
	if (data->arg.new_lock_owner != 0) {
		if (data->rpc_status == 0)
			nfs_confirm_seqid(&data->lsp->ls_seqid, 0);
		else
			goto out;
	}
	if (data->rpc_status == 0) {
4892
		nfs4_stateid_copy(&data->lsp->ls_stateid, &data->res.stateid);
4893
		set_bit(NFS_LOCK_INITIALIZED, &data->lsp->ls_flags);
4894
		renew_lease(NFS_SERVER(data->ctx->dentry->d_inode), data->timestamp);
4895 4896
	}
out:
4897
	dprintk("%s: done, ret = %d!\n", __func__, data->rpc_status);
4898 4899 4900 4901 4902 4903
}

/*
 * rpc_release callback for LOCK: tear down the calldata.
 *
 * When the call was marked cancelled, an unlock is issued through
 * nfs4_do_unlck(), which takes over the lock seqid; otherwise the lock
 * seqid is freed here.  The open seqid, the lock-state reference, the
 * open-context reference and the calldata itself are always released.
 */
static void nfs4_lock_release(void *calldata)
{
	struct nfs4_lockdata *lock = calldata;

	dprintk("%s: begin!\n", __func__);
	nfs_free_seqid(lock->arg.open_seqid);

	if (lock->cancelled == 0) {
		nfs_free_seqid(lock->arg.lock_seqid);
	} else {
		struct rpc_task *unlock_task;

		unlock_task = nfs4_do_unlck(&lock->fl, lock->ctx, lock->lsp,
					    lock->arg.lock_seqid);
		if (!IS_ERR(unlock_task))
			rpc_put_task_async(unlock_task);
		dprintk("%s: cancelling lock!\n", __func__);
	}

	nfs4_put_lock_state(lock->lsp);
	put_nfs_open_context(lock->ctx);
	kfree(lock);
	dprintk("%s: done!\n", __func__);
}

/* RPC callbacks used by _nfs4_do_setlk() for the asynchronous LOCK task. */
static const struct rpc_call_ops nfs4_lock_ops = {
	.rpc_call_prepare = nfs4_lock_prepare,
	.rpc_call_done = nfs4_lock_done,
	.rpc_release = nfs4_lock_release,
};

4927 4928 4929 4930 4931
static void nfs4_handle_setlk_error(struct nfs_server *server, struct nfs4_lock_state *lsp, int new_lock_owner, int error)
{
	switch (error) {
	case -NFS4ERR_ADMIN_REVOKED:
	case -NFS4ERR_BAD_STATEID:
4932
		lsp->ls_seqid.flags &= ~NFS_SEQID_CONFIRMED;
4933
		if (new_lock_owner != 0 ||
4934
		   test_bit(NFS_LOCK_INITIALIZED, &lsp->ls_flags) != 0)
4935
			nfs4_schedule_stateid_recovery(server, lsp->ls_state);
4936 4937 4938
		break;
	case -NFS4ERR_STALE_STATEID:
		lsp->ls_seqid.flags &= ~NFS_SEQID_CONFIRMED;
4939 4940
	case -NFS4ERR_EXPIRED:
		nfs4_schedule_lease_recovery(server->nfs_client);
4941 4942 4943
	};
}

4944
static int _nfs4_do_setlk(struct nfs4_state *state, int cmd, struct file_lock *fl, int recovery_type)
4945 4946 4947
{
	struct nfs4_lockdata *data;
	struct rpc_task *task;
4948 4949 4950 4951
	struct rpc_message msg = {
		.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_LOCK],
		.rpc_cred = state->owner->so_cred,
	};
T
Trond Myklebust 已提交
4952 4953
	struct rpc_task_setup task_setup_data = {
		.rpc_client = NFS_CLIENT(state->inode),
4954
		.rpc_message = &msg,
T
Trond Myklebust 已提交
4955
		.callback_ops = &nfs4_lock_ops,
4956
		.workqueue = nfsiod_workqueue,
T
Trond Myklebust 已提交
4957 4958
		.flags = RPC_TASK_ASYNC,
	};
4959 4960
	int ret;

4961
	dprintk("%s: begin!\n", __func__);
4962
	data = nfs4_alloc_lockdata(fl, nfs_file_open_context(fl->fl_file),
4963 4964
			fl->fl_u.nfs4_fl.owner,
			recovery_type == NFS_LOCK_NEW ? GFP_KERNEL : GFP_NOFS);
4965 4966 4967 4968
	if (data == NULL)
		return -ENOMEM;
	if (IS_SETLKW(cmd))
		data->arg.block = 1;
4969
	nfs41_init_sequence(&data->arg.seq_args, &data->res.seq_res, 1);
4970 4971
	msg.rpc_argp = &data->arg;
	msg.rpc_resp = &data->res;
T
Trond Myklebust 已提交
4972
	task_setup_data.callback_data = data;
4973 4974 4975 4976 4977
	if (recovery_type > NFS_LOCK_NEW) {
		if (recovery_type == NFS_LOCK_RECLAIM)
			data->arg.reclaim = NFS_LOCK_RECLAIM;
		nfs4_set_sequence_privileged(&data->arg.seq_args);
	}
T
Trond Myklebust 已提交
4978
	task = rpc_run_task(&task_setup_data);
4979
	if (IS_ERR(task))
4980 4981 4982 4983
		return PTR_ERR(task);
	ret = nfs4_wait_for_completion_rpc_task(task);
	if (ret == 0) {
		ret = data->rpc_status;
4984 4985 4986
		if (ret)
			nfs4_handle_setlk_error(data->server, data->lsp,
					data->arg.new_lock_owner, ret);
4987 4988
	} else
		data->cancelled = 1;
4989
	rpc_put_task(task);
4990
	dprintk("%s: done, ret = %d!\n", __func__, ret);
4991
	return ret;
L
Linus Torvalds 已提交
4992 4993 4994 4995
}

static int nfs4_lock_reclaim(struct nfs4_state *state, struct file_lock *request)
{
4996
	struct nfs_server *server = NFS_SERVER(state->inode);
4997 4998 4999
	struct nfs4_exception exception = {
		.inode = state->inode,
	};
5000 5001 5002
	int err;

	do {
5003 5004 5005
		/* Cache the lock if possible... */
		if (test_bit(NFS_DELEGATED_STATE, &state->flags) != 0)
			return 0;
5006
		err = _nfs4_do_setlk(state, F_SETLK, request, NFS_LOCK_RECLAIM);
5007
		if (err != -NFS4ERR_DELAY)
5008 5009 5010 5011
			break;
		nfs4_handle_exception(server, err, &exception);
	} while (exception.retry);
	return err;
L
Linus Torvalds 已提交
5012 5013 5014 5015
}

static int nfs4_lock_expired(struct nfs4_state *state, struct file_lock *request)
{
5016
	struct nfs_server *server = NFS_SERVER(state->inode);
5017 5018 5019
	struct nfs4_exception exception = {
		.inode = state->inode,
	};
5020 5021
	int err;

5022 5023 5024
	err = nfs4_set_lock_state(state, request);
	if (err != 0)
		return err;
5025
	do {
5026 5027
		if (test_bit(NFS_DELEGATED_STATE, &state->flags) != 0)
			return 0;
5028
		err = _nfs4_do_setlk(state, F_SETLK, request, NFS_LOCK_EXPIRED);
5029 5030 5031 5032 5033 5034 5035 5036
		switch (err) {
		default:
			goto out;
		case -NFS4ERR_GRACE:
		case -NFS4ERR_DELAY:
			nfs4_handle_exception(server, err, &exception);
			err = 0;
		}
5037
	} while (exception.retry);
5038
out:
5039
	return err;
L
Linus Torvalds 已提交
5040 5041
}

5042
#if defined(CONFIG_NFS_V4_1)
5043 5044 5045 5046 5047 5048 5049 5050
/**
 * nfs41_check_expired_locks - possibly free a lock stateid
 *
 * @state: NFSv4 state for an inode
 *
 * Returns NFS_OK if recovery for this stateid is now finished.
 * Otherwise a negative NFS4ERR value is returned.
 */
5051
static int nfs41_check_expired_locks(struct nfs4_state *state)
5052
{
5053
	int status, ret = -NFS4ERR_BAD_STATEID;
5054
	struct nfs4_lock_state *lsp;
5055 5056
	struct nfs_server *server = NFS_SERVER(state->inode);

5057
	list_for_each_entry(lsp, &state->lock_states, ls_locks) {
5058
		if (test_bit(NFS_LOCK_INITIALIZED, &lsp->ls_flags)) {
5059 5060
			status = nfs41_test_stateid(server, &lsp->ls_stateid);
			if (status != NFS_OK) {
5061 5062
				/* Free the stateid unless the server
				 * informs us the stateid is unrecognized. */
5063 5064 5065
				if (status != -NFS4ERR_BAD_STATEID)
					nfs41_free_stateid(server,
							&lsp->ls_stateid);
5066
				clear_bit(NFS_LOCK_INITIALIZED, &lsp->ls_flags);
5067 5068 5069 5070 5071 5072 5073 5074 5075 5076 5077 5078 5079 5080
				ret = status;
			}
		}
	};

	return ret;
}

/*
 * NFSv4.1 variant of lock-expiry recovery.
 *
 * Returns NFS_OK when LK_STATE_IN_USE is not set on @state or when
 * nfs41_check_expired_locks() returns NFS_OK; otherwise returns the
 * result of nfs4_lock_expired().
 */
static int nfs41_lock_expired(struct nfs4_state *state, struct file_lock *request)
{
	int status;

	if (!test_bit(LK_STATE_IN_USE, &state->flags))
		return NFS_OK;

	status = nfs41_check_expired_locks(state);
	if (status == NFS_OK)
		return status;

	return nfs4_lock_expired(state, request);
}
#endif

L
Linus Torvalds 已提交
5087 5088
static int _nfs4_proc_setlk(struct nfs4_state *state, int cmd, struct file_lock *request)
{
5089
	struct nfs4_state_owner *sp = state->owner;
5090
	struct nfs_inode *nfsi = NFS_I(state->inode);
5091
	unsigned char fl_flags = request->fl_flags;
5092
	unsigned int seq;
5093
	int status = -ENOLCK;
L
Linus Torvalds 已提交
5094

5095 5096 5097
	if ((fl_flags & FL_POSIX) &&
			!test_bit(NFS_STATE_POSIX_LOCKS, &state->flags))
		goto out;
5098 5099 5100 5101
	/* Is this a delegated open? */
	status = nfs4_set_lock_state(state, request);
	if (status != 0)
		goto out;
5102 5103 5104 5105
	request->fl_flags |= FL_ACCESS;
	status = do_vfs_lock(request->fl_file, request);
	if (status < 0)
		goto out;
5106
	down_read(&nfsi->rwsem);
5107 5108 5109
	if (test_bit(NFS_DELEGATED_STATE, &state->flags)) {
		/* Yes: cache locks! */
		/* ...but avoid races with delegation recall... */
5110 5111 5112
		request->fl_flags = fl_flags & ~FL_SLEEP;
		status = do_vfs_lock(request->fl_file, request);
		goto out_unlock;
5113
	}
5114 5115
	seq = raw_seqcount_begin(&sp->so_reclaim_seqcount);
	up_read(&nfsi->rwsem);
5116
	status = _nfs4_do_setlk(state, cmd, request, NFS_LOCK_NEW);
5117
	if (status != 0)
5118 5119 5120 5121
		goto out;
	down_read(&nfsi->rwsem);
	if (read_seqcount_retry(&sp->so_reclaim_seqcount, seq)) {
		status = -NFS4ERR_DELAY;
5122
		goto out_unlock;
5123
	}
5124
	/* Note: we always want to sleep here! */
5125
	request->fl_flags = fl_flags | FL_SLEEP;
5126
	if (do_vfs_lock(request->fl_file, request) < 0)
5127 5128
		printk(KERN_WARNING "NFS: %s: VFS is out of sync with lock "
			"manager!\n", __func__);
5129
out_unlock:
5130
	up_read(&nfsi->rwsem);
5131 5132
out:
	request->fl_flags = fl_flags;
L
Linus Torvalds 已提交
5133 5134 5135 5136 5137
	return status;
}

static int nfs4_proc_setlk(struct nfs4_state *state, int cmd, struct file_lock *request)
{
5138 5139
	struct nfs4_exception exception = {
		.state = state,
5140
		.inode = state->inode,
5141
	};
L
Linus Torvalds 已提交
5142 5143 5144
	int err;

	do {
5145 5146 5147
		err = _nfs4_proc_setlk(state, cmd, request);
		if (err == -NFS4ERR_DENIED)
			err = -EAGAIN;
L
Linus Torvalds 已提交
5148
		err = nfs4_handle_exception(NFS_SERVER(state->inode),
5149
				err, &exception);
L
Linus Torvalds 已提交
5150 5151 5152 5153 5154 5155 5156 5157 5158 5159 5160 5161 5162
	} while (exception.retry);
	return err;
}

static int
nfs4_proc_lock(struct file *filp, int cmd, struct file_lock *request)
{
	struct nfs_open_context *ctx;
	struct nfs4_state *state;
	unsigned long timeout = NFS4_LOCK_MINTIMEOUT;
	int status;

	/* verify open state */
5163
	ctx = nfs_file_open_context(filp);
L
Linus Torvalds 已提交
5164 5165 5166 5167 5168
	state = ctx->state;

	if (request->fl_start < 0 || request->fl_end < 0)
		return -EINVAL;

5169 5170 5171 5172 5173
	if (IS_GETLK(cmd)) {
		if (state != NULL)
			return nfs4_proc_getlk(state, F_GETLK, request);
		return 0;
	}
L
Linus Torvalds 已提交
5174 5175 5176 5177

	if (!(IS_SETLK(cmd) || IS_SETLKW(cmd)))
		return -EINVAL;

5178 5179 5180 5181 5182
	if (request->fl_type == F_UNLCK) {
		if (state != NULL)
			return nfs4_proc_unlck(state, cmd, request);
		return 0;
	}
L
Linus Torvalds 已提交
5183

5184 5185
	if (state == NULL)
		return -ENOLCK;
5186 5187 5188 5189
	/*
	 * Don't rely on the VFS having checked the file open mode,
	 * since it won't do this for flock() locks.
	 */
5190
	switch (request->fl_type) {
5191 5192 5193 5194 5195 5196 5197 5198 5199
	case F_RDLCK:
		if (!(filp->f_mode & FMODE_READ))
			return -EBADF;
		break;
	case F_WRLCK:
		if (!(filp->f_mode & FMODE_WRITE))
			return -EBADF;
	}

L
Linus Torvalds 已提交
5200 5201 5202 5203 5204 5205 5206 5207 5208 5209 5210 5211
	do {
		status = nfs4_proc_setlk(state, cmd, request);
		if ((status != -EAGAIN) || IS_SETLK(cmd))
			break;
		timeout = nfs4_set_lock_task_retry(timeout);
		status = -ERESTARTSYS;
		if (signalled())
			break;
	} while(status < 0);
	return status;
}

5212
int nfs4_lock_delegation_recall(struct file_lock *fl, struct nfs4_state *state, const nfs4_stateid *stateid)
5213 5214 5215 5216 5217 5218
{
	struct nfs_server *server = NFS_SERVER(state->inode);
	int err;

	err = nfs4_set_lock_state(state, fl);
	if (err != 0)
5219
		return err;
5220
	err = _nfs4_do_setlk(state, F_SETLK, fl, NFS_LOCK_NEW);
5221
	return nfs4_handle_delegation_recall_error(server, state, stateid, err);
5222
}
5223

5224 5225
struct nfs_release_lockowner_data {
	struct nfs4_lock_state *lsp;
5226
	struct nfs_server *server;
5227 5228 5229
	struct nfs_release_lockowner_args args;
};

5230 5231
static void nfs4_release_lockowner_release(void *calldata)
{
5232
	struct nfs_release_lockowner_data *data = calldata;
5233
	nfs4_free_lock_state(data->server, data->lsp);
5234 5235 5236
	kfree(calldata);
}

5237
static const struct rpc_call_ops nfs4_release_lockowner_ops = {
5238 5239 5240
	.rpc_release = nfs4_release_lockowner_release,
};

5241
static int nfs4_release_lockowner(struct nfs_server *server, struct nfs4_lock_state *lsp)
5242
{
5243
	struct nfs_release_lockowner_data *data;
5244 5245 5246 5247 5248
	struct rpc_message msg = {
		.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_RELEASE_LOCKOWNER],
	};

	if (server->nfs_client->cl_mvops->minor_version != 0)
5249 5250 5251 5252 5253
		return -EINVAL;
	data = kmalloc(sizeof(*data), GFP_NOFS);
	if (!data)
		return -ENOMEM;
	data->lsp = lsp;
5254
	data->server = server;
5255 5256 5257 5258 5259 5260
	data->args.lock_owner.clientid = server->nfs_client->cl_clientid;
	data->args.lock_owner.id = lsp->ls_seqid.owner_id;
	data->args.lock_owner.s_dev = server->s_dev;
	msg.rpc_argp = &data->args;
	rpc_call_async(server->client, &msg, 0, &nfs4_release_lockowner_ops, data);
	return 0;
5261 5262
}

5263 5264
#define XATTR_NAME_NFSV4_ACL "system.nfs4_acl"

5265 5266 5267
static int nfs4_xattr_set_nfs4_acl(struct dentry *dentry, const char *key,
				   const void *buf, size_t buflen,
				   int flags, int type)
5268
{
5269 5270
	if (strcmp(key, "") != 0)
		return -EINVAL;
5271

5272
	return nfs4_proc_set_acl(dentry->d_inode, buf, buflen);
5273 5274
}

5275 5276
static int nfs4_xattr_get_nfs4_acl(struct dentry *dentry, const char *key,
				   void *buf, size_t buflen, int type)
5277
{
5278 5279
	if (strcmp(key, "") != 0)
		return -EINVAL;
5280

5281
	return nfs4_proc_get_acl(dentry->d_inode, buf, buflen);
5282 5283
}

5284 5285 5286
static size_t nfs4_xattr_list_nfs4_acl(struct dentry *dentry, char *list,
				       size_t list_len, const char *name,
				       size_t name_len, int type)
5287
{
5288
	size_t len = sizeof(XATTR_NAME_NFSV4_ACL);
5289

5290 5291
	if (!nfs4_server_supports_acls(NFS_SERVER(dentry->d_inode)))
		return 0;
5292 5293 5294

	if (list && len <= list_len)
		memcpy(list, XATTR_NAME_NFSV4_ACL, len);
5295
	return len;
5296 5297
}

5298 5299 5300
/*
 * nfs_fhget will use either the mounted_on_fileid or the fileid
 */
5301 5302
static void nfs_fixup_referral_attributes(struct nfs_fattr *fattr)
{
5303 5304 5305
	if (!(((fattr->valid & NFS_ATTR_FATTR_MOUNTED_ON_FILEID) ||
	       (fattr->valid & NFS_ATTR_FATTR_FILEID)) &&
	      (fattr->valid & NFS_ATTR_FATTR_FSID) &&
5306
	      (fattr->valid & NFS_ATTR_FATTR_V4_LOCATIONS)))
5307 5308 5309
		return;

	fattr->valid |= NFS_ATTR_FATTR_TYPE | NFS_ATTR_FATTR_MODE |
5310
		NFS_ATTR_FATTR_NLINK | NFS_ATTR_FATTR_V4_REFERRAL;
5311 5312 5313 5314
	fattr->mode = S_IFDIR | S_IRUGO | S_IXUGO;
	fattr->nlink = 2;
}

5315 5316 5317 5318
static int _nfs4_proc_fs_locations(struct rpc_clnt *client, struct inode *dir,
				   const struct qstr *name,
				   struct nfs4_fs_locations *fs_locations,
				   struct page *page)
5319 5320 5321
{
	struct nfs_server *server = NFS_SERVER(dir);
	u32 bitmask[2] = {
5322
		[0] = FATTR4_WORD0_FSID | FATTR4_WORD0_FS_LOCATIONS,
5323 5324 5325
	};
	struct nfs4_fs_locations_arg args = {
		.dir_fh = NFS_FH(dir),
5326
		.name = name,
5327 5328 5329
		.page = page,
		.bitmask = bitmask,
	};
B
Benny Halevy 已提交
5330 5331 5332
	struct nfs4_fs_locations_res res = {
		.fs_locations = fs_locations,
	};
5333 5334 5335
	struct rpc_message msg = {
		.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_FS_LOCATIONS],
		.rpc_argp = &args,
B
Benny Halevy 已提交
5336
		.rpc_resp = &res,
5337 5338 5339
	};
	int status;

5340
	dprintk("%s: start\n", __func__);
5341 5342 5343 5344 5345 5346 5347 5348

	/* Ask for the fileid of the absent filesystem if mounted_on_fileid
	 * is not supported */
	if (NFS_SERVER(dir)->attr_bitmask[1] & FATTR4_WORD1_MOUNTED_ON_FILEID)
		bitmask[1] |= FATTR4_WORD1_MOUNTED_ON_FILEID;
	else
		bitmask[0] |= FATTR4_WORD0_FILEID;

5349
	nfs_fattr_init(&fs_locations->fattr);
5350
	fs_locations->server = server;
5351
	fs_locations->nlocations = 0;
5352
	status = nfs4_call_sync(client, server, &msg, &args.seq_args, &res.seq_res, 0);
5353
	dprintk("%s: returned status = %d\n", __func__, status);
5354 5355 5356
	return status;
}

5357 5358 5359 5360
int nfs4_proc_fs_locations(struct rpc_clnt *client, struct inode *dir,
			   const struct qstr *name,
			   struct nfs4_fs_locations *fs_locations,
			   struct page *page)
5361 5362 5363 5364 5365
{
	struct nfs4_exception exception = { };
	int err;
	do {
		err = nfs4_handle_exception(NFS_SERVER(dir),
5366
				_nfs4_proc_fs_locations(client, dir, name, fs_locations, page),
5367 5368 5369 5370 5371
				&exception);
	} while (exception.retry);
	return err;
}

B
Bryan Schumaker 已提交
5372 5373 5374 5375 5376 5377 5378 5379 5380 5381 5382 5383 5384 5385 5386 5387 5388 5389 5390 5391 5392 5393
static int _nfs4_proc_secinfo(struct inode *dir, const struct qstr *name, struct nfs4_secinfo_flavors *flavors)
{
	int status;
	struct nfs4_secinfo_arg args = {
		.dir_fh = NFS_FH(dir),
		.name   = name,
	};
	struct nfs4_secinfo_res res = {
		.flavors     = flavors,
	};
	struct rpc_message msg = {
		.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_SECINFO],
		.rpc_argp = &args,
		.rpc_resp = &res,
	};

	dprintk("NFS call  secinfo %s\n", name->name);
	status = nfs4_call_sync(NFS_SERVER(dir)->client, NFS_SERVER(dir), &msg, &args.seq_args, &res.seq_res, 0);
	dprintk("NFS reply  secinfo: %d\n", status);
	return status;
}

5394 5395
int nfs4_proc_secinfo(struct inode *dir, const struct qstr *name,
		      struct nfs4_secinfo_flavors *flavors)
B
Bryan Schumaker 已提交
5396 5397 5398 5399 5400 5401 5402 5403 5404 5405 5406
{
	struct nfs4_exception exception = { };
	int err;
	do {
		err = nfs4_handle_exception(NFS_SERVER(dir),
				_nfs4_proc_secinfo(dir, name, flavors),
				&exception);
	} while (exception.retry);
	return err;
}

5407
#ifdef CONFIG_NFS_V4_1
5408 5409 5410 5411 5412 5413 5414 5415 5416 5417 5418 5419 5420 5421 5422 5423 5424 5425 5426
/*
 * Check the exchange flags returned by the server for invalid flags, having
 * both PNFS and NON_PNFS flags set, and not having one of NON_PNFS, PNFS, or
 * DS flags set.
 *
 * Returns NFS_OK when @flags passes all three checks, -NFS4ERR_INVAL
 * otherwise.
 */
static int nfs4_check_cl_exchange_flags(u32 flags)
{
	/* Bits outside the reply mask. */
	if (flags & ~EXCHGID4_FLAG_MASK_R)
		return -NFS4ERR_INVAL;

	/* USE_PNFS_MDS and USE_NON_PNFS must not both be set. */
	if ((flags & EXCHGID4_FLAG_USE_PNFS_MDS) &&
	    (flags & EXCHGID4_FLAG_USE_NON_PNFS))
		return -NFS4ERR_INVAL;

	/* At least one bit of the pNFS mask must be set. */
	if (!(flags & (EXCHGID4_FLAG_MASK_PNFS)))
		return -NFS4ERR_INVAL;

	return NFS_OK;
}

5427
static bool
5428 5429
nfs41_same_server_scope(struct nfs41_server_scope *a,
			struct nfs41_server_scope *b)
5430 5431 5432 5433 5434 5435 5436 5437
{
	if (a->server_scope_sz == b->server_scope_sz &&
	    memcmp(a->server_scope, b->server_scope, a->server_scope_sz) == 0)
		return true;

	return false;
}

5438 5439 5440 5441 5442 5443
/*
 * nfs4_proc_bind_conn_to_session()
 *
 * The 4.1 client currently uses the same TCP connection for the
 * fore and backchannel.
 */
5444
int nfs4_proc_bind_conn_to_session(struct nfs_client *clp, struct rpc_cred *cred)
5445 5446 5447 5448 5449 5450 5451 5452
{
	int status;
	struct nfs41_bind_conn_to_session_res res;
	struct rpc_message msg = {
		.rpc_proc =
			&nfs4_procedures[NFSPROC4_CLNT_BIND_CONN_TO_SESSION],
		.rpc_argp = clp,
		.rpc_resp = &res,
5453
		.rpc_cred = cred,
5454 5455 5456 5457 5458 5459 5460 5461 5462 5463 5464 5465 5466 5467 5468 5469 5470 5471 5472 5473 5474 5475 5476 5477 5478 5479 5480 5481 5482 5483 5484 5485 5486 5487 5488 5489 5490 5491
	};

	dprintk("--> %s\n", __func__);

	res.session = kzalloc(sizeof(struct nfs4_session), GFP_NOFS);
	if (unlikely(res.session == NULL)) {
		status = -ENOMEM;
		goto out;
	}

	status = rpc_call_sync(clp->cl_rpcclient, &msg, RPC_TASK_TIMEOUT);
	if (status == 0) {
		if (memcmp(res.session->sess_id.data,
		    clp->cl_session->sess_id.data, NFS4_MAX_SESSIONID_LEN)) {
			dprintk("NFS: %s: Session ID mismatch\n", __func__);
			status = -EIO;
			goto out_session;
		}
		if (res.dir != NFS4_CDFS4_BOTH) {
			dprintk("NFS: %s: Unexpected direction from server\n",
				__func__);
			status = -EIO;
			goto out_session;
		}
		if (res.use_conn_in_rdma_mode) {
			dprintk("NFS: %s: Server returned RDMA mode = true\n",
				__func__);
			status = -EIO;
			goto out_session;
		}
	}
out_session:
	kfree(res.session);
out:
	dprintk("<-- %s status= %d\n", __func__, status);
	return status;
}

B
Benny Halevy 已提交
5492 5493 5494
/*
 * nfs4_proc_exchange_id()
 *
5495 5496
 * Returns zero, a negative errno, or a negative NFS4ERR status code.
 *
B
Benny Halevy 已提交
5497 5498 5499 5500 5501
 * Since the clientid has expired, all compounds using sessions
 * associated with the stale clientid will be returning
 * NFS4ERR_BADSESSION in the sequence operation, and will therefore
 * be in some phase of session reset.
 */
5502
int nfs4_proc_exchange_id(struct nfs_client *clp, struct rpc_cred *cred)
B
Benny Halevy 已提交
5503 5504 5505
{
	nfs4_verifier verifier;
	struct nfs41_exchange_id_args args = {
5506
		.verifier = &verifier,
B
Benny Halevy 已提交
5507
		.client = clp,
5508
		.flags = EXCHGID4_FLAG_SUPP_MOVED_REFER,
B
Benny Halevy 已提交
5509 5510
	};
	struct nfs41_exchange_id_res res = {
5511
		0
B
Benny Halevy 已提交
5512 5513 5514 5515 5516 5517 5518 5519 5520
	};
	int status;
	struct rpc_message msg = {
		.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_EXCHANGE_ID],
		.rpc_argp = &args,
		.rpc_resp = &res,
		.rpc_cred = cred,
	};

5521
	nfs4_init_boot_verifier(clp, &verifier);
5522 5523
	args.id_len = nfs4_init_uniform_client_string(clp, args.id,
							sizeof(args.id));
5524 5525 5526
	dprintk("NFS call  exchange_id auth=%s, '%.*s'\n",
		clp->cl_rpcclient->cl_auth->au_ops->au_name,
		args.id_len, args.id);
B
Benny Halevy 已提交
5527

5528
	res.server_owner = kzalloc(sizeof(struct nfs41_server_owner),
5529
					GFP_NOFS);
5530
	if (unlikely(res.server_owner == NULL)) {
5531 5532 5533
		status = -ENOMEM;
		goto out;
	}
5534

5535
	res.server_scope = kzalloc(sizeof(struct nfs41_server_scope),
5536
					GFP_NOFS);
5537
	if (unlikely(res.server_scope == NULL)) {
5538
		status = -ENOMEM;
5539
		goto out_server_owner;
5540
	}
5541

5542
	res.impl_id = kzalloc(sizeof(struct nfs41_impl_id), GFP_NOFS);
5543
	if (unlikely(res.impl_id == NULL)) {
5544 5545 5546 5547
		status = -ENOMEM;
		goto out_server_scope;
	}

5548
	status = rpc_call_sync(clp->cl_rpcclient, &msg, RPC_TASK_TIMEOUT);
5549
	if (status == 0)
5550
		status = nfs4_check_cl_exchange_flags(res.flags);
5551

5552
	if (status == 0) {
5553 5554 5555 5556 5557
		clp->cl_clientid = res.clientid;
		clp->cl_exchange_flags = (res.flags & ~EXCHGID4_FLAG_CONFIRMED_R);
		if (!(res.flags & EXCHGID4_FLAG_CONFIRMED_R))
			clp->cl_seqid = res.seqid;

5558 5559 5560
		kfree(clp->cl_serverowner);
		clp->cl_serverowner = res.server_owner;
		res.server_owner = NULL;
5561

5562
		/* use the most recent implementation id */
5563 5564
		kfree(clp->cl_implid);
		clp->cl_implid = res.impl_id;
5565

5566
		if (clp->cl_serverscope != NULL &&
5567
		    !nfs41_same_server_scope(clp->cl_serverscope,
5568 5569 5570 5571
					     res.server_scope)) {
			dprintk("%s: server_scope mismatch detected\n",
				__func__);
			set_bit(NFS4CLNT_SERVER_SCOPE_MISMATCH, &clp->cl_state);
5572 5573
			kfree(clp->cl_serverscope);
			clp->cl_serverscope = NULL;
5574 5575
		}

5576
		if (clp->cl_serverscope == NULL) {
5577
			clp->cl_serverscope = res.server_scope;
5578 5579
			goto out;
		}
5580 5581
	} else
		kfree(res.impl_id);
5582

5583 5584
out_server_owner:
	kfree(res.server_owner);
5585
out_server_scope:
5586 5587
	kfree(res.server_scope);
out:
5588
	if (clp->cl_implid != NULL)
5589
		dprintk("NFS reply exchange_id: Server Implementation ID: "
5590
			"domain: %s, name: %s, date: %llu,%u\n",
5591
			clp->cl_implid->domain, clp->cl_implid->name,
5592 5593
			clp->cl_implid->date.seconds,
			clp->cl_implid->date.nseconds);
5594
	dprintk("NFS reply exchange_id: %d\n", status);
B
Benny Halevy 已提交
5595 5596 5597
	return status;
}

T
Trond Myklebust 已提交
5598 5599 5600 5601 5602 5603 5604 5605 5606 5607 5608 5609
/*
 * Perform one synchronous DESTROY_CLIENTID call for @clp using @cred.
 *
 * Returns the status from rpc_call_sync(); a non-zero status is also
 * reported through dprintk().
 */
static int _nfs4_proc_destroy_clientid(struct nfs_client *clp,
		struct rpc_cred *cred)
{
	struct rpc_message msg = {
		.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_DESTROY_CLIENTID],
		.rpc_argp = clp,
		.rpc_cred = cred,
	};
	int status;

	status = rpc_call_sync(clp->cl_rpcclient, &msg, RPC_TASK_TIMEOUT);
	if (status)
		/* Terminate the record so the next message starts a new line. */
		dprintk("NFS: Got error %d from the server %s on "
			"DESTROY_CLIENTID.\n", status, clp->cl_hostname);
	return status;
}

/*
 * Call DESTROY_CLIENTID up to NFS4_MAX_LOOP_ON_RECOVER times.
 *
 * -NFS4ERR_DELAY and -NFS4ERR_CLIENTID_BUSY cause a one-second sleep and
 * another attempt; any other result is returned immediately.  Returns 0
 * once the attempts are exhausted.
 */
static int nfs4_proc_destroy_clientid(struct nfs_client *clp,
		struct rpc_cred *cred)
{
	unsigned int attempts_left;
	int ret;

	for (attempts_left = NFS4_MAX_LOOP_ON_RECOVER; attempts_left != 0;
	     attempts_left--) {
		ret = _nfs4_proc_destroy_clientid(clp, cred);
		if (ret != -NFS4ERR_DELAY && ret != -NFS4ERR_CLIENTID_BUSY)
			return ret;
		ssleep(1);
	}
	return 0;
}

/*
 * Destroy the client ID held by @clp on the server.
 *
 * Does nothing and returns 0 when the minor version is below 1, when
 * cl_exchange_flags is zero, or when cl_preserve_clid is set.  Otherwise
 * DESTROY_CLIENTID is sent with the exchange-id credential, and
 * cl_exchange_flags is cleared when the result is 0 or
 * -NFS4ERR_STALE_CLIENTID.
 *
 * Returns 0 or the result of nfs4_proc_destroy_clientid().
 */
int nfs4_destroy_clientid(struct nfs_client *clp)
{
	struct rpc_cred *cred;
	int ret;

	if (clp->cl_mvops->minor_version < 1 ||
	    clp->cl_exchange_flags == 0 ||
	    clp->cl_preserve_clid)
		return 0;

	cred = nfs4_get_exchange_id_cred(clp);
	ret = nfs4_proc_destroy_clientid(clp, cred);
	if (cred)
		put_rpccred(cred);

	if (ret == 0 || ret == -NFS4ERR_STALE_CLIENTID)
		clp->cl_exchange_flags = 0;

	return ret;
}

A
Andy Adamson 已提交
5659 5660 5661 5662 5663 5664 5665 5666 5667 5668 5669 5670 5671 5672 5673
/* Calldata handed to the GET_LEASE_TIME prepare/done callbacks. */
struct nfs4_get_lease_time_data {
	struct nfs4_get_lease_time_args *args;	/* supplies la_seq_args */
	struct nfs4_get_lease_time_res *res;	/* supplies lr_seq_res */
	struct nfs_client *clp;			/* its cl_session is used for the sequence */
};

static void nfs4_get_lease_time_prepare(struct rpc_task *task,
					void *calldata)
{
	struct nfs4_get_lease_time_data *data =
			(struct nfs4_get_lease_time_data *)calldata;

	dprintk("--> %s\n", __func__);
	/* just setup sequence, do not trigger session recovery
	   since we're invoked within one */
5674 5675 5676 5677
	nfs41_setup_sequence(data->clp->cl_session,
			&data->args->la_seq_args,
			&data->res->lr_seq_res,
			task);
A
Andy Adamson 已提交
5678 5679 5680 5681 5682 5683 5684 5685 5686 5687 5688 5689 5690
	dprintk("<-- %s\n", __func__);
}

/*
 * Called from nfs4_state_manager thread for session setup, so don't recover
 * from sequence operation or clientid errors.
 */
static void nfs4_get_lease_time_done(struct rpc_task *task, void *calldata)
{
	struct nfs4_get_lease_time_data *data =
			(struct nfs4_get_lease_time_data *)calldata;

	dprintk("--> %s\n", __func__);
5691 5692
	if (!nfs41_sequence_done(task, &data->res->lr_seq_res))
		return;
A
Andy Adamson 已提交
5693 5694 5695 5696 5697 5698
	switch (task->tk_status) {
	case -NFS4ERR_DELAY:
	case -NFS4ERR_GRACE:
		dprintk("%s Retry: tk_status %d\n", __func__, task->tk_status);
		rpc_delay(task, NFS4_POLL_RETRY_MIN);
		task->tk_status = 0;
5699 5700
		/* fall through */
	case -NFS4ERR_RETRY_UNCACHED_REP:
5701
		rpc_restart_call_prepare(task);
A
Andy Adamson 已提交
5702 5703 5704 5705 5706
		return;
	}
	dprintk("<-- %s\n", __func__);
}

5707
static const struct rpc_call_ops nfs4_get_lease_time_ops = {
A
Andy Adamson 已提交
5708 5709 5710 5711 5712 5713 5714 5715 5716 5717 5718 5719 5720 5721 5722 5723 5724 5725 5726 5727 5728 5729 5730 5731 5732
	.rpc_call_prepare = nfs4_get_lease_time_prepare,
	.rpc_call_done = nfs4_get_lease_time_done,
};

int nfs4_proc_get_lease_time(struct nfs_client *clp, struct nfs_fsinfo *fsinfo)
{
	struct rpc_task *task;
	struct nfs4_get_lease_time_args args;
	struct nfs4_get_lease_time_res res = {
		.lr_fsinfo = fsinfo,
	};
	struct nfs4_get_lease_time_data data = {
		.args = &args,
		.res = &res,
		.clp = clp,
	};
	struct rpc_message msg = {
		.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_GET_LEASE_TIME],
		.rpc_argp = &args,
		.rpc_resp = &res,
	};
	struct rpc_task_setup task_setup = {
		.rpc_client = clp->cl_rpcclient,
		.rpc_message = &msg,
		.callback_ops = &nfs4_get_lease_time_ops,
5733 5734
		.callback_data = &data,
		.flags = RPC_TASK_TIMEOUT,
A
Andy Adamson 已提交
5735 5736 5737
	};
	int status;

5738
	nfs41_init_sequence(&args.la_seq_args, &res.lr_seq_res, 0);
5739
	nfs4_set_sequence_privileged(&args.la_seq_args);
A
Andy Adamson 已提交
5740 5741 5742 5743 5744 5745 5746 5747 5748 5749 5750 5751 5752 5753
	dprintk("--> %s\n", __func__);
	task = rpc_run_task(&task_setup);

	if (IS_ERR(task))
		status = PTR_ERR(task);
	else {
		status = task->tk_status;
		rpc_put_task(task);
	}
	dprintk("<-- %s return %d\n", __func__, status);

	return status;
}

A
Andy Adamson 已提交
5754 5755 5756 5757 5758 5759 5760 5761 5762 5763 5764 5765
/*
 * Initialize the values to be used by the client in CREATE_SESSION
 * If nfs4_init_session set the fore channel request and response sizes,
 * use them.
 *
 * Set the back channel max_resp_sz_cached to zero to force the client to
 * always set csa_cachethis to FALSE because the current implementation
 * of the back channel DRC only supports caching the CB_SEQUENCE operation.
 */
static void nfs4_init_channel_attrs(struct nfs41_create_session_args *args)
{
	struct nfs4_session *session = args->client->cl_session;
5766 5767
	unsigned int mxrqst_sz = session->fc_target_max_rqst_sz,
		     mxresp_sz = session->fc_target_max_resp_sz;
A
Andy Adamson 已提交
5768 5769 5770 5771 5772 5773 5774 5775 5776

	if (mxrqst_sz == 0)
		mxrqst_sz = NFS_MAX_FILE_IO_SIZE;
	if (mxresp_sz == 0)
		mxresp_sz = NFS_MAX_FILE_IO_SIZE;
	/* Fore channel attributes */
	args->fc_attrs.max_rqst_sz = mxrqst_sz;
	args->fc_attrs.max_resp_sz = mxresp_sz;
	args->fc_attrs.max_ops = NFS4_MAX_OPS;
5777
	args->fc_attrs.max_reqs = max_session_slots;
A
Andy Adamson 已提交
5778 5779

	dprintk("%s: Fore Channel : max_rqst_sz=%u max_resp_sz=%u "
5780
		"max_ops=%u max_reqs=%u\n",
A
Andy Adamson 已提交
5781 5782
		__func__,
		args->fc_attrs.max_rqst_sz, args->fc_attrs.max_resp_sz,
5783
		args->fc_attrs.max_ops, args->fc_attrs.max_reqs);
A
Andy Adamson 已提交
5784 5785 5786 5787 5788 5789 5790 5791 5792 5793 5794 5795 5796 5797 5798 5799

	/* Back channel attributes */
	args->bc_attrs.max_rqst_sz = PAGE_SIZE;
	args->bc_attrs.max_resp_sz = PAGE_SIZE;
	args->bc_attrs.max_resp_sz_cached = 0;
	args->bc_attrs.max_ops = NFS4_MAX_BACK_CHANNEL_OPS;
	args->bc_attrs.max_reqs = 1;

	dprintk("%s: Back Channel : max_rqst_sz=%u max_resp_sz=%u "
		"max_resp_sz_cached=%u max_ops=%u max_reqs=%u\n",
		__func__,
		args->bc_attrs.max_rqst_sz, args->bc_attrs.max_resp_sz,
		args->bc_attrs.max_resp_sz_cached, args->bc_attrs.max_ops,
		args->bc_attrs.max_reqs);
}

5800
static int nfs4_verify_fore_channel_attrs(struct nfs41_create_session_args *args, struct nfs4_session *session)
5801
{
5802 5803 5804 5805 5806 5807 5808 5809 5810 5811 5812 5813 5814 5815 5816
	struct nfs4_channel_attrs *sent = &args->fc_attrs;
	struct nfs4_channel_attrs *rcvd = &session->fc_attrs;

	if (rcvd->max_resp_sz > sent->max_resp_sz)
		return -EINVAL;
	/*
	 * Our requested max_ops is the minimum we need; we're not
	 * prepared to break up compounds into smaller pieces than that.
	 * So, no point even trying to continue if the server won't
	 * cooperate:
	 */
	if (rcvd->max_ops < sent->max_ops)
		return -EINVAL;
	if (rcvd->max_reqs == 0)
		return -EINVAL;
5817 5818
	if (rcvd->max_reqs > NFS4_MAX_SLOT_TABLE)
		rcvd->max_reqs = NFS4_MAX_SLOT_TABLE;
5819
	return 0;
5820 5821
}

5822 5823 5824 5825
/*
 * Compare the back channel attributes stored in @session against the ones
 * we sent in @args.
 *
 * Returns -EINVAL if the received max_rqst_sz or max_resp_sz_cached
 * exceeds what we sent, if the received max_resp_sz is below what we sent,
 * or if max_ops or max_reqs differ from what we sent.  Returns 0 otherwise.
 */
static int nfs4_verify_back_channel_attrs(struct nfs41_create_session_args *args, struct nfs4_session *session)
{
	struct nfs4_channel_attrs *sent = &args->bc_attrs;
	struct nfs4_channel_attrs *rcvd = &session->bc_attrs;

	if (rcvd->max_rqst_sz > sent->max_rqst_sz)
		return -EINVAL;
	if (rcvd->max_resp_sz < sent->max_resp_sz)
		return -EINVAL;
	if (rcvd->max_resp_sz_cached > sent->max_resp_sz_cached)
		return -EINVAL;
	/* These would render the backchannel useless: */
	if (rcvd->max_ops != sent->max_ops)
		return -EINVAL;
	if (rcvd->max_reqs != sent->max_reqs)
		return -EINVAL;
	return 0;
}
5840 5841 5842 5843

/*
 * Verify the fore channel attributes first, then the back channel ones.
 * Returns the first non-zero result, or 0 if both checks pass.
 */
static int nfs4_verify_channel_attrs(struct nfs41_create_session_args *args,
				     struct nfs4_session *session)
{
	int ret;

	ret = nfs4_verify_fore_channel_attrs(args, session);
	if (ret)
		return ret;
	return nfs4_verify_back_channel_attrs(args, session);
}

5852 5853
static int _nfs4_proc_create_session(struct nfs_client *clp,
		struct rpc_cred *cred)
A
Andy Adamson 已提交
5854 5855 5856 5857 5858 5859 5860 5861 5862 5863 5864 5865 5866
{
	struct nfs4_session *session = clp->cl_session;
	struct nfs41_create_session_args args = {
		.client = clp,
		.cb_program = NFS4_CALLBACK,
	};
	struct nfs41_create_session_res res = {
		.client = clp,
	};
	struct rpc_message msg = {
		.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_CREATE_SESSION],
		.rpc_argp = &args,
		.rpc_resp = &res,
5867
		.rpc_cred = cred,
A
Andy Adamson 已提交
5868 5869 5870 5871
	};
	int status;

	nfs4_init_channel_attrs(&args);
5872
	args.flags = (SESSION4_PERSIST | SESSION4_BACK_CHAN);
A
Andy Adamson 已提交
5873

5874
	status = rpc_call_sync(session->clp->cl_rpcclient, &msg, RPC_TASK_TIMEOUT);
A
Andy Adamson 已提交
5875

5876
	if (!status) {
5877 5878
		/* Verify the session's negotiated channel_attrs values */
		status = nfs4_verify_channel_attrs(&args, session);
A
Andy Adamson 已提交
5879 5880 5881 5882 5883 5884 5885 5886 5887 5888 5889 5890
		/* Increment the clientid slot sequence id */
		clp->cl_seqid++;
	}

	return status;
}

/*
 * Issues a CREATE_SESSION operation to the server.
 * It is the responsibility of the caller to verify the session is
 * expired before calling this routine.
 */
5891
int nfs4_proc_create_session(struct nfs_client *clp, struct rpc_cred *cred)
A
Andy Adamson 已提交
5892 5893 5894 5895 5896 5897 5898
{
	int status;
	unsigned *ptr;
	struct nfs4_session *session = clp->cl_session;

	dprintk("--> %s clp=%p session=%p\n", __func__, clp, session);

5899
	status = _nfs4_proc_create_session(clp, cred);
A
Andy Adamson 已提交
5900 5901 5902
	if (status)
		goto out;

5903 5904 5905
	/* Init or reset the session slot tables */
	status = nfs4_setup_session_slot_tables(session);
	dprintk("slot table setup returned %d\n", status);
A
Andy Adamson 已提交
5906 5907 5908 5909 5910 5911 5912 5913 5914 5915 5916
	if (status)
		goto out;

	ptr = (unsigned *)&session->sess_id.data[0];
	dprintk("%s client>seqid %d sessionid %u:%u:%u:%u\n", __func__,
		clp->cl_seqid, ptr[0], ptr[1], ptr[2], ptr[3]);
out:
	dprintk("<-- %s\n", __func__);
	return status;
}

A
Andy Adamson 已提交
5917 5918 5919 5920
/*
 * Issue the over-the-wire RPC DESTROY_SESSION.
 * The caller must serialize access to this routine.
 */
5921 5922
int nfs4_proc_destroy_session(struct nfs4_session *session,
		struct rpc_cred *cred)
A
Andy Adamson 已提交
5923
{
5924 5925 5926 5927 5928
	struct rpc_message msg = {
		.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_DESTROY_SESSION],
		.rpc_argp = session,
		.rpc_cred = cred,
	};
A
Andy Adamson 已提交
5929 5930 5931 5932 5933 5934 5935 5936
	int status = 0;

	dprintk("--> nfs4_proc_destroy_session\n");

	/* session is still being setup */
	if (session->clp->cl_cons_state != NFS_CS_READY)
		return status;

5937
	status = rpc_call_sync(session->clp->cl_rpcclient, &msg, RPC_TASK_TIMEOUT);
A
Andy Adamson 已提交
5938 5939

	if (status)
5940
		dprintk("NFS: Got error %d from the server on DESTROY_SESSION. "
A
Andy Adamson 已提交
5941 5942 5943 5944 5945 5946
			"Session has been destroyed regardless...\n", status);

	dprintk("<-- nfs4_proc_destroy_session\n");
	return status;
}

A
Andy Adamson 已提交
5947 5948 5949
/*
 * Renew the cl_session lease.
 */
5950 5951 5952 5953 5954 5955
/* Heap-allocated callback data for a standalone SEQUENCE call. */
struct nfs4_sequence_data {
	struct nfs_client *clp;		/* client; a reference is held while in flight */
	struct nfs4_sequence_args args;	/* SEQUENCE arguments */
	struct nfs4_sequence_res res;	/* SEQUENCE result */
};

5956 5957
static void nfs41_sequence_release(void *data)
{
5958 5959
	struct nfs4_sequence_data *calldata = data;
	struct nfs_client *clp = calldata->clp;
5960

5961 5962 5963
	if (atomic_read(&clp->cl_count) > 1)
		nfs4_schedule_state_renewal(clp);
	nfs_put_client(clp);
5964
	kfree(calldata);
5965 5966
}

5967 5968 5969 5970 5971 5972 5973
/*
 * Handle a failed SEQUENCE call.  -NFS4ERR_DELAY delays the task by
 * NFS4_POLL_RETRY_MAX and returns -EAGAIN so the caller restarts it; any
 * other status schedules lease recovery and returns 0.
 */
static int nfs41_sequence_handle_errors(struct rpc_task *task, struct nfs_client *clp)
{
	switch(task->tk_status) {
	case -NFS4ERR_DELAY:
		rpc_delay(task, NFS4_POLL_RETRY_MAX);
		return -EAGAIN;
	default:
		nfs4_schedule_lease_recovery(clp);
	}
	return 0;
}

5979
static void nfs41_sequence_call_done(struct rpc_task *task, void *data)
A
Andy Adamson 已提交
5980
{
5981 5982
	struct nfs4_sequence_data *calldata = data;
	struct nfs_client *clp = calldata->clp;
A
Andy Adamson 已提交
5983

5984 5985
	if (!nfs41_sequence_done(task, task->tk_msg.rpc_resp))
		return;
A
Andy Adamson 已提交
5986 5987 5988

	if (task->tk_status < 0) {
		dprintk("%s ERROR %d\n", __func__, task->tk_status);
5989 5990
		if (atomic_read(&clp->cl_count) == 1)
			goto out;
A
Andy Adamson 已提交
5991

5992 5993
		if (nfs41_sequence_handle_errors(task, clp) == -EAGAIN) {
			rpc_restart_call_prepare(task);
A
Andy Adamson 已提交
5994 5995 5996 5997
			return;
		}
	}
	dprintk("%s rpc_cred %p\n", __func__, task->tk_msg.rpc_cred);
5998
out:
A
Andy Adamson 已提交
5999 6000 6001 6002 6003
	dprintk("<-- %s\n", __func__);
}

static void nfs41_sequence_prepare(struct rpc_task *task, void *data)
{
6004 6005
	struct nfs4_sequence_data *calldata = data;
	struct nfs_client *clp = calldata->clp;
A
Andy Adamson 已提交
6006 6007 6008 6009 6010 6011
	struct nfs4_sequence_args *args;
	struct nfs4_sequence_res *res;

	args = task->tk_msg.rpc_argp;
	res = task->tk_msg.rpc_resp;

6012
	nfs41_setup_sequence(clp->cl_session, args, res, task);
A
Andy Adamson 已提交
6013 6014 6015 6016 6017
}

static const struct rpc_call_ops nfs41_sequence_ops = {
	.rpc_call_done = nfs41_sequence_call_done,
	.rpc_call_prepare = nfs41_sequence_prepare,
6018
	.rpc_release = nfs41_sequence_release,
A
Andy Adamson 已提交
6019 6020
};

6021 6022 6023
/*
 * Start an asynchronous SEQUENCE call on clp's RPC client.
 *
 * Takes a reference on @clp (dropped by nfs41_sequence_release()) and
 * allocates the callback data.  When @is_privileged is true the sequence
 * arguments are marked privileged.
 *
 * Returns the task from rpc_run_task(), ERR_PTR(-EIO) if the client
 * reference could not be taken, or ERR_PTR(-ENOMEM) on allocation failure.
 */
static struct rpc_task *_nfs41_proc_sequence(struct nfs_client *clp,
		struct rpc_cred *cred,
		bool is_privileged)
{
	struct nfs4_sequence_data *calldata;
	struct rpc_message msg = {
		.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_SEQUENCE],
		.rpc_cred = cred,
	};
	struct rpc_task_setup task_setup_data = {
		.rpc_client = clp->cl_rpcclient,
		.rpc_message = &msg,
		.callback_ops = &nfs41_sequence_ops,
		.flags = RPC_TASK_ASYNC | RPC_TASK_TIMEOUT,
	};

	if (!atomic_inc_not_zero(&clp->cl_count))
		return ERR_PTR(-EIO);
	calldata = kzalloc(sizeof(*calldata), GFP_NOFS);
	if (calldata == NULL) {
		/* undo the reference taken above */
		nfs_put_client(clp);
		return ERR_PTR(-ENOMEM);
	}
	nfs41_init_sequence(&calldata->args, &calldata->res, 0);
	if (is_privileged)
		nfs4_set_sequence_privileged(&calldata->args);
	msg.rpc_argp = &calldata->args;
	msg.rpc_resp = &calldata->res;
	calldata->clp = clp;
	task_setup_data.callback_data = calldata;

	return rpc_run_task(&task_setup_data);
}

6055
static int nfs41_proc_async_sequence(struct nfs_client *clp, struct rpc_cred *cred, unsigned renew_flags)
6056 6057 6058 6059
{
	struct rpc_task *task;
	int ret = 0;

6060 6061
	if ((renew_flags & NFS4_RENEW_TIMEOUT) == 0)
		return 0;
6062
	task = _nfs41_proc_sequence(clp, cred, false);
6063 6064 6065
	if (IS_ERR(task))
		ret = PTR_ERR(task);
	else
6066
		rpc_put_task_async(task);
6067 6068 6069 6070 6071 6072 6073 6074 6075
	dprintk("<-- %s status=%d\n", __func__, ret);
	return ret;
}

static int nfs4_proc_sequence(struct nfs_client *clp, struct rpc_cred *cred)
{
	struct rpc_task *task;
	int ret;

6076
	task = _nfs41_proc_sequence(clp, cred, true);
6077 6078 6079 6080 6081
	if (IS_ERR(task)) {
		ret = PTR_ERR(task);
		goto out;
	}
	ret = rpc_wait_for_completion_task(task);
6082 6083 6084 6085 6086
	if (!ret) {
		struct nfs4_sequence_res *res = task->tk_msg.rpc_resp;

		if (task->tk_status == 0)
			nfs41_handle_sequence_flag_errors(clp, res->sr_status_flags);
6087
		ret = task->tk_status;
6088
	}
6089 6090 6091 6092
	rpc_put_task(task);
out:
	dprintk("<-- %s status=%d\n", __func__, ret);
	return ret;
A
Andy Adamson 已提交
6093 6094
}

6095 6096 6097 6098 6099 6100 6101 6102 6103 6104
/* Heap-allocated callback data for a RECLAIM_COMPLETE call. */
struct nfs4_reclaim_complete_data {
	struct nfs_client *clp;			/* client the call is issued for */
	struct nfs41_reclaim_complete_args arg;	/* request arguments */
	struct nfs41_reclaim_complete_res res;	/* decoded reply */
};

static void nfs4_reclaim_complete_prepare(struct rpc_task *task, void *data)
{
	struct nfs4_reclaim_complete_data *calldata = data;

6105 6106 6107 6108
	nfs41_setup_sequence(calldata->clp->cl_session,
			&calldata->arg.seq_args,
			&calldata->res.seq_res,
			task);
6109 6110
}

6111 6112 6113 6114 6115 6116 6117 6118 6119
static int nfs41_reclaim_complete_handle_errors(struct rpc_task *task, struct nfs_client *clp)
{
	switch(task->tk_status) {
	case 0:
	case -NFS4ERR_COMPLETE_ALREADY:
	case -NFS4ERR_WRONG_CRED: /* What to do here? */
		break;
	case -NFS4ERR_DELAY:
		rpc_delay(task, NFS4_POLL_RETRY_MAX);
6120 6121
		/* fall through */
	case -NFS4ERR_RETRY_UNCACHED_REP:
6122 6123
		return -EAGAIN;
	default:
6124
		nfs4_schedule_lease_recovery(clp);
6125 6126 6127 6128
	}
	return 0;
}

6129 6130 6131 6132 6133 6134 6135
static void nfs4_reclaim_complete_done(struct rpc_task *task, void *data)
{
	struct nfs4_reclaim_complete_data *calldata = data;
	struct nfs_client *clp = calldata->clp;
	struct nfs4_sequence_res *res = &calldata->res.seq_res;

	dprintk("--> %s\n", __func__);
6136 6137
	if (!nfs41_sequence_done(task, res))
		return;
6138

6139 6140 6141 6142
	if (nfs41_reclaim_complete_handle_errors(task, clp) == -EAGAIN) {
		rpc_restart_call_prepare(task);
		return;
	}
6143 6144 6145 6146 6147 6148 6149 6150 6151 6152 6153 6154 6155 6156 6157 6158 6159 6160 6161
	dprintk("<-- %s\n", __func__);
}

/* rpc_release callback for RECLAIM_COMPLETE: free the callback data. */
static void nfs4_free_reclaim_complete_data(void *data)
{
	kfree(data);
}

/* RPC callbacks used by nfs41_proc_reclaim_complete(). */
static const struct rpc_call_ops nfs4_reclaim_complete_call_ops = {
	.rpc_release		= nfs4_free_reclaim_complete_data,
	.rpc_call_done		= nfs4_reclaim_complete_done,
	.rpc_call_prepare	= nfs4_reclaim_complete_prepare,
};

/*
 * Issue a global reclaim complete.
 */
6162 6163
static int nfs41_proc_reclaim_complete(struct nfs_client *clp,
		struct rpc_cred *cred)
6164 6165 6166 6167 6168
{
	struct nfs4_reclaim_complete_data *calldata;
	struct rpc_task *task;
	struct rpc_message msg = {
		.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_RECLAIM_COMPLETE],
6169
		.rpc_cred = cred,
6170 6171 6172 6173 6174 6175 6176 6177 6178 6179
	};
	struct rpc_task_setup task_setup_data = {
		.rpc_client = clp->cl_rpcclient,
		.rpc_message = &msg,
		.callback_ops = &nfs4_reclaim_complete_call_ops,
		.flags = RPC_TASK_ASYNC,
	};
	int status = -ENOMEM;

	dprintk("--> %s\n", __func__);
6180
	calldata = kzalloc(sizeof(*calldata), GFP_NOFS);
6181 6182 6183 6184 6185
	if (calldata == NULL)
		goto out;
	calldata->clp = clp;
	calldata->arg.one_fs = 0;

6186
	nfs41_init_sequence(&calldata->arg.seq_args, &calldata->res.seq_res, 0);
6187
	nfs4_set_sequence_privileged(&calldata->arg.seq_args);
6188 6189 6190 6191
	msg.rpc_argp = &calldata->arg;
	msg.rpc_resp = &calldata->res;
	task_setup_data.callback_data = calldata;
	task = rpc_run_task(&task_setup_data);
6192
	if (IS_ERR(task)) {
6193
		status = PTR_ERR(task);
6194 6195
		goto out;
	}
6196 6197 6198
	status = nfs4_wait_for_completion_rpc_task(task);
	if (status == 0)
		status = task->tk_status;
6199
	rpc_put_task(task);
6200
	return 0;
6201 6202 6203 6204
out:
	dprintk("<-- %s status=%d\n", __func__, status);
	return status;
}
6205 6206 6207 6208 6209

static void
nfs4_layoutget_prepare(struct rpc_task *task, void *calldata)
{
	struct nfs4_layoutget *lgp = calldata;
F
Fred Isaman 已提交
6210
	struct nfs_server *server = NFS_SERVER(lgp->args.inode);
6211
	struct nfs4_session *session = nfs4_get_session(server);
6212 6213

	dprintk("--> %s\n", __func__);
F
Fred Isaman 已提交
6214 6215 6216 6217 6218
	/* Note the is a race here, where a CB_LAYOUTRECALL can come in
	 * right now covering the LAYOUTGET we are about to send.
	 * However, that is not so catastrophic, and there seems
	 * to be no way to prevent it completely.
	 */
6219
	if (nfs41_setup_sequence(session, &lgp->args.seq_args,
6220
				&lgp->res.seq_res, task))
6221
		return;
6222 6223 6224 6225 6226
	if (pnfs_choose_layoutget_stateid(&lgp->args.stateid,
					  NFS_I(lgp->args.inode)->layout,
					  lgp->args.ctx->state)) {
		rpc_exit(task, NFS4_OK);
	}
6227 6228 6229 6230 6231
}

static void nfs4_layoutget_done(struct rpc_task *task, void *calldata)
{
	struct nfs4_layoutget *lgp = calldata;
6232 6233 6234 6235
	struct inode *inode = lgp->args.inode;
	struct nfs_server *server = NFS_SERVER(inode);
	struct pnfs_layout_hdr *lo;
	struct nfs4_state *state = NULL;
6236
	unsigned long timeo, giveup;
6237 6238 6239

	dprintk("--> %s\n", __func__);

6240
	if (!nfs41_sequence_done(task, &lgp->res.seq_res))
6241
		goto out;
6242 6243 6244

	switch (task->tk_status) {
	case 0:
6245
		goto out;
6246 6247
	case -NFS4ERR_LAYOUTTRYLATER:
	case -NFS4ERR_RECALLCONFLICT:
6248 6249 6250 6251
		timeo = rpc_get_timeout(task->tk_client);
		giveup = lgp->args.timestamp + timeo;
		if (time_after(giveup, jiffies))
			task->tk_status = -NFS4ERR_DELAY;
6252 6253 6254 6255 6256 6257 6258 6259 6260 6261 6262 6263 6264 6265 6266 6267 6268
		break;
	case -NFS4ERR_EXPIRED:
	case -NFS4ERR_BAD_STATEID:
		spin_lock(&inode->i_lock);
		lo = NFS_I(inode)->layout;
		if (!lo || list_empty(&lo->plh_segs)) {
			spin_unlock(&inode->i_lock);
			/* If the open stateid was bad, then recover it. */
			state = lgp->args.ctx->state;
		} else {
			LIST_HEAD(head);

			pnfs_mark_matching_lsegs_invalid(lo, &head, NULL);
			spin_unlock(&inode->i_lock);
			/* Mark the bad layout state as invalid, then
			 * retry using the open stateid. */
			pnfs_free_lseg_list(&head);
6269 6270
		}
	}
6271 6272 6273
	if (nfs4_async_handle_error(task, server, state) == -EAGAIN)
		rpc_restart_call_prepare(task);
out:
6274 6275 6276
	dprintk("<-- %s\n", __func__);
}

6277 6278 6279 6280 6281 6282 6283 6284 6285 6286 6287 6288 6289 6290 6291 6292 6293 6294 6295 6296 6297 6298 6299 6300 6301 6302 6303 6304 6305 6306 6307 6308 6309 6310 6311 6312 6313 6314 6315 6316 6317 6318 6319 6320
static size_t max_response_pages(struct nfs_server *server)
{
	u32 max_resp_sz = server->nfs_client->cl_session->fc_attrs.max_resp_sz;
	return nfs_page_array_len(0, max_resp_sz);
}

/*
 * Free a page array built by nfs4_alloc_pages().
 *
 * @pages may be NULL.  Pages are released in order until @size entries
 * have been freed or the first NULL entry is found, so a partially
 * populated (zero-initialised) array is handled.  The array itself is
 * freed as well.
 */
static void nfs4_free_pages(struct page **pages, size_t size)
{
	size_t i;	/* same type as @size: no signed/unsigned comparison */

	if (!pages)
		return;

	for (i = 0; i < size; i++) {
		if (!pages[i])
			break;
		__free_page(pages[i]);
	}
	kfree(pages);
}

/*
 * Allocate an array of @size pages using @gfp_flags.
 *
 * Returns the array, or NULL if either the array or any page could not be
 * allocated; pages allocated before the failure are released again.
 */
static struct page **nfs4_alloc_pages(size_t size, gfp_t gfp_flags)
{
	struct page **pages;
	size_t i;	/* same type as @size: no signed/unsigned comparison */

	pages = kcalloc(size, sizeof(struct page *), gfp_flags);
	if (!pages) {
		dprintk("%s: can't alloc array of %zu pages\n", __func__, size);
		return NULL;
	}

	for (i = 0; i < size; i++) {
		pages[i] = alloc_page(gfp_flags);
		if (!pages[i]) {
			dprintk("%s: failed to allocate page\n", __func__);
			/* array is zeroed, so the free stops at this slot */
			nfs4_free_pages(pages, size);
			return NULL;
		}
	}

	return pages;
}

6321 6322 6323
static void nfs4_layoutget_release(void *calldata)
{
	struct nfs4_layoutget *lgp = calldata;
6324 6325
	struct inode *inode = lgp->args.inode;
	struct nfs_server *server = NFS_SERVER(inode);
6326
	size_t max_pages = max_response_pages(server);
6327 6328

	dprintk("--> %s\n", __func__);
6329
	nfs4_free_pages(lgp->args.layout.pages, max_pages);
6330
	pnfs_put_layout_hdr(NFS_I(inode)->layout);
6331 6332 6333 6334 6335 6336 6337 6338 6339 6340 6341
	put_nfs_open_context(lgp->args.ctx);
	kfree(calldata);
	dprintk("<-- %s\n", __func__);
}

/* RPC callbacks used by nfs4_proc_layoutget(). */
static const struct rpc_call_ops nfs4_layoutget_call_ops = {
	.rpc_release		= nfs4_layoutget_release,
	.rpc_call_done		= nfs4_layoutget_done,
	.rpc_call_prepare	= nfs4_layoutget_prepare,
};

6342 6343
/*
 * Send a LAYOUTGET and wait for the reply.
 *
 * @lgp is consumed: it is released through nfs4_layoutget_release() on
 * the allocation-failure path here and otherwise via the task's
 * rpc_release callback.
 *
 * Returns the layout segment from pnfs_layout_process(), NULL when the
 * call completed with status 0 but no layout data was returned, or an
 * ERR_PTR on failure.
 */
struct pnfs_layout_segment *
nfs4_proc_layoutget(struct nfs4_layoutget *lgp, gfp_t gfp_flags)
{
	struct inode *inode = lgp->args.inode;
	struct nfs_server *server = NFS_SERVER(inode);
	size_t max_pages = max_response_pages(server);
	struct rpc_task *task;
	struct rpc_message msg = {
		.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_LAYOUTGET],
		.rpc_argp = &lgp->args,
		.rpc_resp = &lgp->res,
		.rpc_cred = lgp->cred,
	};
	struct rpc_task_setup task_setup_data = {
		.rpc_client = server->client,
		.rpc_message = &msg,
		.callback_ops = &nfs4_layoutget_call_ops,
		.callback_data = lgp,
		.flags = RPC_TASK_ASYNC,
	};
	struct pnfs_layout_segment *lseg = NULL;
	int status = 0;

	dprintk("--> %s\n", __func__);

	/*
	 * nfs4_layoutget_release calls pnfs_put_layout_hdr, so take the
	 * matching reference before anything that can fail and release lgp;
	 * otherwise the allocation-failure path below would drop a
	 * reference that was never taken.
	 */
	pnfs_get_layout_hdr(NFS_I(inode)->layout);

	lgp->args.layout.pages = nfs4_alloc_pages(max_pages, gfp_flags);
	if (!lgp->args.layout.pages) {
		nfs4_layoutget_release(lgp);
		return ERR_PTR(-ENOMEM);
	}
	lgp->args.layout.pglen = max_pages * PAGE_SIZE;
	lgp->args.timestamp = jiffies;

	lgp->res.layoutp = &lgp->args.layout;
	lgp->res.seq_res.sr_slot = NULL;
	nfs41_init_sequence(&lgp->args.seq_args, &lgp->res.seq_res, 0);

	task = rpc_run_task(&task_setup_data);
	if (IS_ERR(task))
		return ERR_CAST(task);
	status = nfs4_wait_for_completion_rpc_task(task);
	if (status == 0)
		status = task->tk_status;
	/* if layoutp->len is 0, nfs4_layoutget_prepare called rpc_exit */
	if (status == 0 && lgp->res.layoutp->len)
		lseg = pnfs_layout_process(lgp);
	rpc_put_task(task);
	dprintk("<-- %s status=%d\n", __func__, status);
	if (status)
		return ERR_PTR(status);
	return lseg;
}

B
Benny Halevy 已提交
6398 6399 6400 6401 6402 6403
static void
nfs4_layoutreturn_prepare(struct rpc_task *task, void *calldata)
{
	struct nfs4_layoutreturn *lrp = calldata;

	dprintk("--> %s\n", __func__);
6404 6405 6406 6407
	nfs41_setup_sequence(lrp->clp->cl_session,
			&lrp->args.seq_args,
			&lrp->res.seq_res,
			task);
B
Benny Halevy 已提交
6408 6409 6410 6411 6412 6413 6414 6415 6416
}

/*
 * rpc_call_done callback for LAYOUTRETURN: finish the sequence and
 * restart the call when nfs4_async_handle_error() returns -EAGAIN.
 */
static void nfs4_layoutreturn_done(struct rpc_task *task, void *calldata)
{
	struct nfs4_layoutreturn *lrp = calldata;
	struct nfs_server *server;

	dprintk("--> %s\n", __func__);

	if (!nfs41_sequence_done(task, &lrp->res.seq_res))
		return;

	server = NFS_SERVER(lrp->args.inode);
	if (nfs4_async_handle_error(task, server, NULL) == -EAGAIN) {
		rpc_restart_call_prepare(task);
		return;
	}
	dprintk("<-- %s\n", __func__);
}

static void nfs4_layoutreturn_release(void *calldata)
{
	struct nfs4_layoutreturn *lrp = calldata;
6431
	struct pnfs_layout_hdr *lo = lrp->args.layout;
B
Benny Halevy 已提交
6432 6433

	dprintk("--> %s\n", __func__);
6434 6435 6436 6437 6438
	spin_lock(&lo->plh_inode->i_lock);
	if (lrp->res.lrs_present)
		pnfs_set_layout_stateid(lo, &lrp->res.stateid, true);
	lo->plh_block_lgets--;
	spin_unlock(&lo->plh_inode->i_lock);
6439
	pnfs_put_layout_hdr(lrp->args.layout);
B
Benny Halevy 已提交
6440 6441 6442 6443 6444 6445 6446 6447 6448 6449 6450 6451 6452 6453 6454 6455 6456
	kfree(calldata);
	dprintk("<-- %s\n", __func__);
}

/* RPC callbacks used by nfs4_proc_layoutreturn(). */
static const struct rpc_call_ops nfs4_layoutreturn_call_ops = {
	.rpc_release		= nfs4_layoutreturn_release,
	.rpc_call_done		= nfs4_layoutreturn_done,
	.rpc_call_prepare	= nfs4_layoutreturn_prepare,
};

int nfs4_proc_layoutreturn(struct nfs4_layoutreturn *lrp)
{
	struct rpc_task *task;
	struct rpc_message msg = {
		.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_LAYOUTRETURN],
		.rpc_argp = &lrp->args,
		.rpc_resp = &lrp->res,
6457
		.rpc_cred = lrp->cred,
B
Benny Halevy 已提交
6458 6459 6460 6461 6462 6463 6464 6465 6466 6467
	};
	struct rpc_task_setup task_setup_data = {
		.rpc_client = lrp->clp->cl_rpcclient,
		.rpc_message = &msg,
		.callback_ops = &nfs4_layoutreturn_call_ops,
		.callback_data = lrp,
	};
	int status;

	dprintk("--> %s\n", __func__);
6468
	nfs41_init_sequence(&lrp->args.seq_args, &lrp->res.seq_res, 1);
B
Benny Halevy 已提交
6469 6470 6471 6472 6473 6474 6475 6476 6477
	task = rpc_run_task(&task_setup_data);
	if (IS_ERR(task))
		return PTR_ERR(task);
	status = task->tk_status;
	dprintk("<-- %s status=%d\n", __func__, status);
	rpc_put_task(task);
	return status;
}

A
Andy Adamson 已提交
6478 6479 6480 6481 6482 6483 6484 6485 6486 6487 6488 6489 6490 6491 6492 6493 6494 6495 6496 6497 6498 6499 6500 6501 6502 6503 6504 6505 6506 6507 6508 6509 6510 6511 6512 6513 6514 6515 6516 6517 6518 6519 6520 6521 6522 6523 6524 6525
/*
 * Retrieve the list of Data Server devices from the MDS.
 *
 * One synchronous GETDEVICELIST call for the server's current layout
 * driver class; the result of nfs4_call_sync() is returned unchanged.
 */
static int _nfs4_getdevicelist(struct nfs_server *server,
				    const struct nfs_fh *fh,
				    struct pnfs_devicelist *devlist)
{
	struct nfs4_getdevicelist_res res = {
		.devlist = devlist,
	};
	struct nfs4_getdevicelist_args args = {
		.layoutclass = server->pnfs_curr_ld->id,
		.fh = fh,
	};
	struct rpc_message msg = {
		.rpc_resp = &res,
		.rpc_argp = &args,
		.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_GETDEVICELIST],
	};
	int err;

	dprintk("--> %s\n", __func__);
	err = nfs4_call_sync(server->client, server, &msg,
			     &args.seq_args, &res.seq_res, 0);
	dprintk("<-- %s status=%d\n", __func__, err);
	return err;
}

/*
 * GETDEVICELIST with the standard NFSv4 exception handling: the call is
 * repeated for as long as nfs4_handle_exception() asks for a retry.
 * Returns the last value produced by nfs4_handle_exception().
 */
int nfs4_proc_getdevicelist(struct nfs_server *server,
			    const struct nfs_fh *fh,
			    struct pnfs_devicelist *devlist)
{
	struct nfs4_exception exception = { };
	int err;

	for (;;) {
		int status = _nfs4_getdevicelist(server, fh, devlist);

		err = nfs4_handle_exception(server, status, &exception);
		if (!exception.retry)
			break;
	}

	dprintk("%s: err=%d, num_devs=%u\n", __func__,
		err, devlist->num_devs);

	return err;
}
EXPORT_SYMBOL_GPL(nfs4_proc_getdevicelist);

6526 6527 6528 6529 6530 6531 6532 6533 6534 6535 6536 6537 6538 6539 6540 6541 6542
static int
_nfs4_proc_getdeviceinfo(struct nfs_server *server, struct pnfs_device *pdev)
{
	struct nfs4_getdeviceinfo_args args = {
		.pdev = pdev,
	};
	struct nfs4_getdeviceinfo_res res = {
		.pdev = pdev,
	};
	struct rpc_message msg = {
		.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_GETDEVICEINFO],
		.rpc_argp = &args,
		.rpc_resp = &res,
	};
	int status;

	dprintk("--> %s\n", __func__);
6543
	status = nfs4_call_sync(server->client, server, &msg, &args.seq_args, &res.seq_res, 0);
6544 6545 6546 6547 6548 6549 6550 6551 6552 6553 6554 6555 6556 6557 6558 6559 6560 6561 6562
	dprintk("<-- %s status=%d\n", __func__, status);

	return status;
}

/*
 * GETDEVICEINFO with the standard NFSv4 exception handling: the call is
 * repeated for as long as nfs4_handle_exception() asks for a retry.
 * Returns the last value produced by nfs4_handle_exception().
 */
int nfs4_proc_getdeviceinfo(struct nfs_server *server, struct pnfs_device *pdev)
{
	struct nfs4_exception exception = { };
	int err;

	for (;;) {
		int status = _nfs4_proc_getdeviceinfo(server, pdev);

		err = nfs4_handle_exception(server, status, &exception);
		if (!exception.retry)
			break;
	}
	return err;
}
EXPORT_SYMBOL_GPL(nfs4_proc_getdeviceinfo);

A
Andy Adamson 已提交
6563 6564 6565 6566
/*
 * rpc_call_prepare callback for LAYOUTCOMMIT: set up the SEQUENCE
 * operation on the session of the inode's server.
 */
static void nfs4_layoutcommit_prepare(struct rpc_task *task, void *calldata)
{
	struct nfs4_layoutcommit_data *data = calldata;
	struct nfs_server *server = NFS_SERVER(data->args.inode);
	struct nfs4_session *session = nfs4_get_session(server);

	nfs41_setup_sequence(session,
			&data->args.seq_args,
			&data->res.seq_res,
			task);
}

static void
nfs4_layoutcommit_done(struct rpc_task *task, void *calldata)
{
	struct nfs4_layoutcommit_data *data = calldata;
	struct nfs_server *server = NFS_SERVER(data->args.inode);

6581
	if (!nfs41_sequence_done(task, &data->res.seq_res))
A
Andy Adamson 已提交
6582 6583 6584
		return;

	switch (task->tk_status) { /* Just ignore these failures */
6585 6586 6587 6588
	case -NFS4ERR_DELEG_REVOKED: /* layout was recalled */
	case -NFS4ERR_BADIOMODE:     /* no IOMODE_RW layout for range */
	case -NFS4ERR_BADLAYOUT:     /* no layout */
	case -NFS4ERR_GRACE:	    /* loca_recalim always false */
A
Andy Adamson 已提交
6589
		task->tk_status = 0;
6590 6591
		break;
	case 0:
A
Andy Adamson 已提交
6592 6593
		nfs_post_op_update_inode_force_wcc(data->args.inode,
						   data->res.fattr);
6594 6595 6596 6597 6598 6599 6600
		break;
	default:
		if (nfs4_async_handle_error(task, server, NULL) == -EAGAIN) {
			rpc_restart_call_prepare(task);
			return;
		}
	}
A
Andy Adamson 已提交
6601 6602 6603 6604 6605 6606
}

static void nfs4_layoutcommit_release(void *calldata)
{
	struct nfs4_layoutcommit_data *data = calldata;

A
Andy Adamson 已提交
6607
	pnfs_cleanup_layoutcommit(data);
A
Andy Adamson 已提交
6608 6609 6610 6611 6612 6613 6614 6615 6616 6617 6618
	put_rpccred(data->cred);
	kfree(data);
}

/* RPC callbacks used by nfs4_proc_layoutcommit(). */
static const struct rpc_call_ops nfs4_layoutcommit_ops = {
	.rpc_release		= nfs4_layoutcommit_release,
	.rpc_call_done		= nfs4_layoutcommit_done,
	.rpc_call_prepare	= nfs4_layoutcommit_prepare,
};

int
6619
nfs4_proc_layoutcommit(struct nfs4_layoutcommit_data *data, bool sync)
A
Andy Adamson 已提交
6620 6621 6622 6623 6624 6625 6626 6627 6628 6629 6630 6631 6632 6633 6634 6635 6636 6637 6638 6639 6640 6641 6642 6643
{
	struct rpc_message msg = {
		.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_LAYOUTCOMMIT],
		.rpc_argp = &data->args,
		.rpc_resp = &data->res,
		.rpc_cred = data->cred,
	};
	struct rpc_task_setup task_setup_data = {
		.task = &data->task,
		.rpc_client = NFS_CLIENT(data->args.inode),
		.rpc_message = &msg,
		.callback_ops = &nfs4_layoutcommit_ops,
		.callback_data = data,
		.flags = RPC_TASK_ASYNC,
	};
	struct rpc_task *task;
	int status = 0;

	dprintk("NFS: %4d initiating layoutcommit call. sync %d "
		"lbw: %llu inode %lu\n",
		data->task.tk_pid, sync,
		data->args.lastbytewritten,
		data->args.inode->i_ino);

6644
	nfs41_init_sequence(&data->args.seq_args, &data->res.seq_res, 1);
A
Andy Adamson 已提交
6645 6646 6647
	task = rpc_run_task(&task_setup_data);
	if (IS_ERR(task))
		return PTR_ERR(task);
6648
	if (sync == false)
A
Andy Adamson 已提交
6649 6650 6651 6652 6653 6654 6655 6656 6657 6658
		goto out;
	status = nfs4_wait_for_completion_rpc_task(task);
	if (status != 0)
		goto out;
	status = task->tk_status;
out:
	dprintk("%s: status %d\n", __func__, status);
	rpc_put_task(task);
	return status;
}
6659 6660 6661 6662 6663 6664 6665 6666 6667 6668 6669 6670 6671 6672 6673 6674 6675 6676 6677 6678 6679 6680 6681 6682 6683 6684 6685 6686 6687 6688 6689

/*
 * Issue a single synchronous SECINFO_NO_NAME call using the
 * SECINFO_STYLE_CURRENT_FH style and store the reply in @flavors.
 *
 * @fhandle and @info are accepted but not used by this function.
 *
 * Returns whatever nfs4_call_sync() returns.
 */
static int
_nfs41_proc_secinfo_no_name(struct nfs_server *server, struct nfs_fh *fhandle,
		    struct nfs_fsinfo *info, struct nfs4_secinfo_flavors *flavors)
{
	struct nfs41_secinfo_no_name_args args = { .style = SECINFO_STYLE_CURRENT_FH };
	struct nfs4_secinfo_res res = { .flavors = flavors };
	struct rpc_message msg = {
		.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_SECINFO_NO_NAME],
		.rpc_argp = &args,
		.rpc_resp = &res,
	};
	int status;

	status = nfs4_call_sync(server->client, server, &msg,
				&args.seq_args, &res.seq_res, 0);
	return status;
}

/*
 * SECINFO_NO_NAME with exception handling.
 *
 * Calls _nfs41_proc_secinfo_no_name() and returns immediately on
 * success, -NFS4ERR_WRONGSEC or -NFS4ERR_NOTSUPP so that the caller can
 * see those codes unmodified.  Any other result is passed through
 * nfs4_handle_exception(), and the call is repeated for as long as that
 * helper sets exception.retry.
 *
 * Returns 0, -NFS4ERR_WRONGSEC, -NFS4ERR_NOTSUPP, or the value produced
 * by the last nfs4_handle_exception() call.
 */
static int
nfs41_proc_secinfo_no_name(struct nfs_server *server, struct nfs_fh *fhandle,
			   struct nfs_fsinfo *info, struct nfs4_secinfo_flavors *flavors)
{
	struct nfs4_exception exception = { };
	int err;

	do {
		err = _nfs41_proc_secinfo_no_name(server, fhandle, info, flavors);
		switch (err) {
		case 0:
		case -NFS4ERR_WRONGSEC:
		case -NFS4ERR_NOTSUPP:
			return err;
		default:
			err = nfs4_handle_exception(server, err, &exception);
		}
	} while (exception.retry);

	return err;
}

/*
 * Determine the security flavor for the root filehandle.
 *
 * A temporary page is allocated to receive the flavor list from
 * nfs41_proc_secinfo_no_name():
 *  - on -NFS4ERR_WRONGSEC or -NFS4ERR_NOTSUPP, fall back to the
 *    "guess and check" method, nfs4_find_root_sec();
 *  - on success, pick a flavor with nfs_find_best_sec() and try it
 *    with nfs4_lookup_root_sec();
 *  - any other error is passed through.
 *
 * Returns -ENOMEM if the page cannot be allocated.  Otherwise returns
 * the resulting status, with -EACCES reported as -EPERM.
 */
static int
nfs41_find_root_sec(struct nfs_server *server, struct nfs_fh *fhandle,
		    struct nfs_fsinfo *info)
{
	struct nfs4_secinfo_flavors *flavors;
	struct page *page;
	int err;

	page = alloc_page(GFP_KERNEL);
	if (!page)
		return -ENOMEM;

	flavors = page_address(page);
	err = nfs41_proc_secinfo_no_name(server, fhandle, info, flavors);

	switch (err) {
	case -NFS4ERR_WRONGSEC:
	case -NFS4ERR_NOTSUPP:
		/* Server doesn't support SECINFO_NO_NAME: guess and check. */
		err = nfs4_find_root_sec(server, fhandle, info);
		break;
	case 0:
		err = nfs4_lookup_root_sec(server, fhandle, info,
					   nfs_find_best_sec(flavors));
		break;
	default:
		break;
	}

	put_page(page);
	return (err == -EACCES) ? -EPERM : err;
}
6739 6740

/*
 * Issue one synchronous TEST_STATEID call for @stateid.  The sequence
 * arguments are marked privileged before the call is made.
 *
 * Returns the status of nfs4_call_sync_sequence() when that is not
 * NFS_OK; otherwise returns the negated res.status field of the reply.
 */
static int _nfs41_test_stateid(struct nfs_server *server, nfs4_stateid *stateid)
{
	int status;
	struct nfs41_test_stateid_args args = {
		.stateid = stateid,
	};
	struct nfs41_test_stateid_res res;
	struct rpc_message msg = {
		.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_TEST_STATEID],
		.rpc_argp = &args,
		.rpc_resp = &res,
	};

	dprintk("NFS call  test_stateid %p\n", stateid);
	nfs41_init_sequence(&args.seq_args, &res.seq_res, 0);
	nfs4_set_sequence_privileged(&args.seq_args);
	status = nfs4_call_sync_sequence(server->client, server, &msg,
			&args.seq_args, &res.seq_res);
	if (status != NFS_OK) {
		dprintk("NFS reply test_stateid: failed, %d\n", status);
		return status;
	}
	dprintk("NFS reply test_stateid: succeeded, %d\n", -res.status);
	return -res.status;
}

6766 6767 6768 6769 6770 6771 6772 6773 6774 6775
/**
 * nfs41_test_stateid - perform a TEST_STATEID operation
 *
 * @server: server / transport on which to perform the operation
 * @stateid: state ID to test
 *
 * Returns NFS_OK if the server recognizes that "stateid" is valid.
 * Otherwise a negative NFS4ERR value is returned if the operation
 * failed or the state ID is not currently valid.
 */
6776
static int nfs41_test_stateid(struct nfs_server *server, nfs4_stateid *stateid)
B
Bryan Schumaker 已提交
6777 6778 6779 6780
{
	struct nfs4_exception exception = { };
	int err;
	do {
6781 6782 6783 6784
		err = _nfs41_test_stateid(server, stateid);
		if (err != -NFS4ERR_DELAY)
			break;
		nfs4_handle_exception(server, err, &exception);
B
Bryan Schumaker 已提交
6785 6786 6787
	} while (exception.retry);
	return err;
}
B
Bryan Schumaker 已提交
6788

6789 6790 6791
struct nfs_free_stateid_data {
	struct nfs_server *server;
	struct nfs41_free_stateid_args args;
B
Bryan Schumaker 已提交
6792
	struct nfs41_free_stateid_res res;
6793 6794 6795 6796 6797 6798 6799 6800 6801 6802 6803 6804 6805 6806 6807 6808 6809 6810 6811 6812 6813 6814 6815 6816 6817 6818 6819 6820 6821 6822 6823 6824 6825 6826 6827 6828 6829 6830 6831
};

/*
 * rpc_call_prepare callback for FREE_STATEID: sets up the sequence for
 * @task on the session obtained from the call data's server.
 */
static void nfs41_free_stateid_prepare(struct rpc_task *task, void *calldata)
{
	struct nfs_free_stateid_data *fsdata = calldata;

	nfs41_setup_sequence(nfs4_get_session(fsdata->server),
			     &fsdata->args.seq_args, &fsdata->res.seq_res,
			     task);
}

/*
 * rpc_call_done callback for FREE_STATEID.
 *
 * After processing the sequence result, the call is restarted only when
 * the task finished with -NFS4ERR_DELAY and nfs4_async_handle_error()
 * answers -EAGAIN.  Every other status is left as is.
 */
static void nfs41_free_stateid_done(struct rpc_task *task, void *calldata)
{
	struct nfs_free_stateid_data *fsdata = calldata;

	nfs41_sequence_done(task, &fsdata->res.seq_res);

	if (task->tk_status != -NFS4ERR_DELAY)
		return;

	if (nfs4_async_handle_error(task, fsdata->server, NULL) == -EAGAIN)
		rpc_restart_call_prepare(task);
}

/*
 * rpc_release callback for FREE_STATEID: frees the call data that
 * _nfs41_free_stateid() allocated.
 */
static void nfs41_free_stateid_release(void *calldata)
{
	struct nfs_free_stateid_data *fsdata = calldata;

	kfree(fsdata);
}

/*
 * RPC callbacks for the FREE_STATEID task started by
 * _nfs41_free_stateid().
 *
 * NOTE(review): this table has external linkage; if nothing outside this
 * file refers to it, it could be made static - confirm before changing.
 */
const struct rpc_call_ops nfs41_free_stateid_ops = {
	.rpc_call_prepare	= nfs41_free_stateid_prepare,
	.rpc_call_done		= nfs41_free_stateid_done,
	.rpc_release		= nfs41_free_stateid_release,
};

/*
 * Start an asynchronous FREE_STATEID task.
 *
 * @server:     server to send the operation to
 * @stateid:    state ID to free; it is copied into the call data, so the
 *              caller's copy is not referenced after this returns
 * @privileged: when true, mark the sequence arguments as privileged
 *
 * The call data is allocated with GFP_NOFS and is released by
 * nfs41_free_stateid_release() through nfs41_free_stateid_ops.
 *
 * Returns ERR_PTR(-ENOMEM) if the call data cannot be allocated,
 * otherwise whatever rpc_run_task() returns.
 */
static struct rpc_task *_nfs41_free_stateid(struct nfs_server *server,
		nfs4_stateid *stateid,
		bool privileged)
{
	struct rpc_message msg = {
		.rpc_proc = &nfs4_procedures[NFSPROC4_CLNT_FREE_STATEID],
	};
	struct rpc_task_setup task_setup = {
		.rpc_client = server->client,
		.rpc_message = &msg,
		.callback_ops = &nfs41_free_stateid_ops,
		.flags = RPC_TASK_ASYNC,
	};
	struct nfs_free_stateid_data *data;

	dprintk("NFS call  free_stateid %p\n", stateid);
	data = kmalloc(sizeof(*data), GFP_NOFS);
	if (!data)
		return ERR_PTR(-ENOMEM);
	data->server = server;
	nfs4_stateid_copy(&data->args.stateid, stateid);

	task_setup.callback_data = data;

	msg.rpc_argp = &data->args;
	msg.rpc_resp = &data->res;
	nfs41_init_sequence(&data->args.seq_args, &data->res.seq_res, 0);
	if (privileged)
		nfs4_set_sequence_privileged(&data->args.seq_args);

	return rpc_run_task(&task_setup);
}

6861 6862 6863 6864 6865 6866 6867 6868 6869
/**
 * nfs41_free_stateid - perform a FREE_STATEID operation
 *
 * @server: server / transport on which to perform the operation
 * @stateid: state ID to release
 *
 * Returns NFS_OK if the server freed "stateid".  Otherwise a
 * negative NFS4ERR value is returned.
 */
6870
static int nfs41_free_stateid(struct nfs_server *server, nfs4_stateid *stateid)
B
Bryan Schumaker 已提交
6871
{
6872 6873 6874 6875 6876 6877 6878 6879 6880 6881 6882
	struct rpc_task *task;
	int ret;

	task = _nfs41_free_stateid(server, stateid, true);
	if (IS_ERR(task))
		return PTR_ERR(task);
	ret = rpc_wait_for_completion_task(task);
	if (!ret)
		ret = task->tk_status;
	rpc_put_task(task);
	return ret;
B
Bryan Schumaker 已提交
6883
}
6884

6885 6886 6887 6888 6889 6890 6891 6892 6893 6894 6895 6896
/*
 * Release a lock state: start a non-privileged FREE_STATEID for
 * lsp->ls_stateid, then free @lsp with nfs4_free_lock_state().
 *
 * @lsp is freed whether or not the task could be started, and the task
 * is not waited for.
 *
 * Returns 0 if the task was started, otherwise the error encoded in the
 * pointer returned by _nfs41_free_stateid().
 */
static int nfs41_free_lock_state(struct nfs_server *server, struct nfs4_lock_state *lsp)
{
	struct rpc_task *task = _nfs41_free_stateid(server, &lsp->ls_stateid, false);

	nfs4_free_lock_state(server, lsp);
	if (!IS_ERR(task)) {
		rpc_put_task(task);
		return 0;
	}
	return PTR_ERR(task);
}

6897 6898 6899
static bool nfs41_match_stateid(const nfs4_stateid *s1,
		const nfs4_stateid *s2)
{
6900
	if (memcmp(s1->other, s2->other, sizeof(s1->other)) != 0)
6901 6902
		return false;

6903
	if (s1->seqid == s2->seqid)
6904
		return true;
6905
	if (s1->seqid == 0 || s2->seqid == 0)
6906 6907 6908 6909 6910
		return true;

	return false;
}

6911 6912
#endif /* CONFIG_NFS_V4_1 */

6913 6914 6915
/*
 * Compare two state IDs (installed as nfs_v4_0_minor_ops.match_stateid).
 * Thin wrapper that returns the result of nfs4_stateid_match().
 */
static bool nfs4_match_stateid(const nfs4_stateid *s1,
		const nfs4_stateid *s2)
{
	return nfs4_stateid_match(s1, s2);
}


6920
static const struct nfs4_state_recovery_ops nfs40_reboot_recovery_ops = {
6921
	.owner_flag_bit = NFS_OWNER_RECLAIM_REBOOT,
6922
	.state_flag_bit	= NFS_STATE_RECLAIM_REBOOT,
L
Linus Torvalds 已提交
6923 6924
	.recover_open	= nfs4_open_reclaim,
	.recover_lock	= nfs4_lock_reclaim,
6925
	.establish_clid = nfs4_init_clientid,
6926
	.get_clid_cred	= nfs4_get_setclientid_cred,
6927
	.detect_trunking = nfs40_discover_server_trunking,
L
Linus Torvalds 已提交
6928 6929
};

6930
#if defined(CONFIG_NFS_V4_1)
6931
static const struct nfs4_state_recovery_ops nfs41_reboot_recovery_ops = {
6932 6933 6934 6935
	.owner_flag_bit = NFS_OWNER_RECLAIM_REBOOT,
	.state_flag_bit	= NFS_STATE_RECLAIM_REBOOT,
	.recover_open	= nfs4_open_reclaim,
	.recover_lock	= nfs4_lock_reclaim,
6936
	.establish_clid = nfs41_init_clientid,
6937
	.get_clid_cred	= nfs4_get_exchange_id_cred,
6938
	.reclaim_complete = nfs41_proc_reclaim_complete,
6939
	.detect_trunking = nfs41_discover_server_trunking,
6940 6941 6942
};
#endif /* CONFIG_NFS_V4_1 */

6943
static const struct nfs4_state_recovery_ops nfs40_nograce_recovery_ops = {
6944 6945 6946 6947 6948
	.owner_flag_bit = NFS_OWNER_RECLAIM_NOGRACE,
	.state_flag_bit	= NFS_STATE_RECLAIM_NOGRACE,
	.recover_open	= nfs4_open_expired,
	.recover_lock	= nfs4_lock_expired,
	.establish_clid = nfs4_init_clientid,
6949
	.get_clid_cred	= nfs4_get_setclientid_cred,
6950 6951 6952
};

#if defined(CONFIG_NFS_V4_1)
6953
static const struct nfs4_state_recovery_ops nfs41_nograce_recovery_ops = {
6954
	.owner_flag_bit = NFS_OWNER_RECLAIM_NOGRACE,
6955
	.state_flag_bit	= NFS_STATE_RECLAIM_NOGRACE,
6956 6957
	.recover_open	= nfs41_open_expired,
	.recover_lock	= nfs41_lock_expired,
6958
	.establish_clid = nfs41_init_clientid,
6959
	.get_clid_cred	= nfs4_get_exchange_id_cred,
L
Linus Torvalds 已提交
6960
};
6961
#endif /* CONFIG_NFS_V4_1 */
L
Linus Torvalds 已提交
6962

6963
static const struct nfs4_state_maintenance_ops nfs40_state_renewal_ops = {
B
Benny Halevy 已提交
6964
	.sched_state_renewal = nfs4_proc_async_renew,
6965
	.get_state_renewal_cred_locked = nfs4_get_renew_cred_locked,
6966
	.renew_lease = nfs4_proc_renew,
B
Benny Halevy 已提交
6967 6968 6969
};

#if defined(CONFIG_NFS_V4_1)
6970
static const struct nfs4_state_maintenance_ops nfs41_state_renewal_ops = {
B
Benny Halevy 已提交
6971
	.sched_state_renewal = nfs41_proc_async_sequence,
6972
	.get_state_renewal_cred_locked = nfs4_get_machine_cred_locked,
6973
	.renew_lease = nfs4_proc_sequence,
B
Benny Halevy 已提交
6974 6975 6976
};
#endif

6977 6978
static const struct nfs4_minor_version_ops nfs_v4_0_minor_ops = {
	.minor_version = 0,
6979 6980 6981 6982
	.init_caps = NFS_CAP_READDIRPLUS
		| NFS_CAP_ATOMIC_OPEN
		| NFS_CAP_CHANGE_ATTR
		| NFS_CAP_POSIX_LOCK,
6983
	.call_sync = _nfs4_call_sync,
6984
	.match_stateid = nfs4_match_stateid,
6985
	.find_root_sec = nfs4_find_root_sec,
6986
	.free_lock_state = nfs4_release_lockowner,
6987 6988 6989
	.reboot_recovery_ops = &nfs40_reboot_recovery_ops,
	.nograce_recovery_ops = &nfs40_nograce_recovery_ops,
	.state_renewal_ops = &nfs40_state_renewal_ops,
6990 6991 6992 6993 6994
};

#if defined(CONFIG_NFS_V4_1)
static const struct nfs4_minor_version_ops nfs_v4_1_minor_ops = {
	.minor_version = 1,
6995 6996 6997
	.init_caps = NFS_CAP_READDIRPLUS
		| NFS_CAP_ATOMIC_OPEN
		| NFS_CAP_CHANGE_ATTR
6998
		| NFS_CAP_POSIX_LOCK
6999 7000
		| NFS_CAP_STATEID_NFSV41
		| NFS_CAP_ATOMIC_OPEN_V1,
7001
	.call_sync = nfs4_call_sync_sequence,
7002
	.match_stateid = nfs41_match_stateid,
7003
	.find_root_sec = nfs41_find_root_sec,
7004
	.free_lock_state = nfs41_free_lock_state,
7005 7006 7007
	.reboot_recovery_ops = &nfs41_reboot_recovery_ops,
	.nograce_recovery_ops = &nfs41_nograce_recovery_ops,
	.state_renewal_ops = &nfs41_state_renewal_ops,
7008 7009 7010 7011 7012 7013 7014 7015 7016 7017
};
#endif

/*
 * Minor-version operation tables; each entry sits at the index equal to
 * its .minor_version.  Entry [1] exists only when CONFIG_NFS_V4_1 is
 * defined.
 */
const struct nfs4_minor_version_ops *nfs_v4_minor_ops[] = {
	[0] = &nfs_v4_0_minor_ops,
#ifdef CONFIG_NFS_V4_1
	[1] = &nfs_v4_1_minor_ops,
#endif /* CONFIG_NFS_V4_1 */
};

7018 7019 7020 7021 7022 7023 7024 7025 7026 7027 7028 7029 7030 7031 7032 7033 7034 7035 7036 7037
const struct inode_operations nfs4_dir_inode_operations = {
	.create		= nfs_create,
	.lookup		= nfs_lookup,
	.atomic_open	= nfs_atomic_open,
	.link		= nfs_link,
	.unlink		= nfs_unlink,
	.symlink	= nfs_symlink,
	.mkdir		= nfs_mkdir,
	.rmdir		= nfs_rmdir,
	.mknod		= nfs_mknod,
	.rename		= nfs_rename,
	.permission	= nfs_permission,
	.getattr	= nfs_getattr,
	.setattr	= nfs_setattr,
	.getxattr	= generic_getxattr,
	.setxattr	= generic_setxattr,
	.listxattr	= generic_listxattr,
	.removexattr	= generic_removexattr,
};

7038
static const struct inode_operations nfs4_file_inode_operations = {
7039 7040 7041
	.permission	= nfs_permission,
	.getattr	= nfs_getattr,
	.setattr	= nfs_setattr,
7042 7043 7044 7045
	.getxattr	= generic_getxattr,
	.setxattr	= generic_setxattr,
	.listxattr	= generic_listxattr,
	.removexattr	= generic_removexattr,
7046 7047
};

D
David Howells 已提交
7048
const struct nfs_rpc_ops nfs_v4_clientops = {
L
Linus Torvalds 已提交
7049 7050 7051
	.version	= 4,			/* protocol version */
	.dentry_ops	= &nfs4_dentry_operations,
	.dir_inode_ops	= &nfs4_dir_inode_operations,
7052
	.file_inode_ops	= &nfs4_file_inode_operations,
7053
	.file_ops	= &nfs4_file_operations,
L
Linus Torvalds 已提交
7054
	.getroot	= nfs4_proc_get_root,
B
Bryan Schumaker 已提交
7055
	.submount	= nfs4_submount,
B
Bryan Schumaker 已提交
7056
	.try_mount	= nfs4_try_mount,
L
Linus Torvalds 已提交
7057 7058 7059 7060 7061 7062 7063 7064
	.getattr	= nfs4_proc_getattr,
	.setattr	= nfs4_proc_setattr,
	.lookup		= nfs4_proc_lookup,
	.access		= nfs4_proc_access,
	.readlink	= nfs4_proc_readlink,
	.create		= nfs4_proc_create,
	.remove		= nfs4_proc_remove,
	.unlink_setup	= nfs4_proc_unlink_setup,
7065
	.unlink_rpc_prepare = nfs4_proc_unlink_rpc_prepare,
L
Linus Torvalds 已提交
7066 7067
	.unlink_done	= nfs4_proc_unlink_done,
	.rename		= nfs4_proc_rename,
7068
	.rename_setup	= nfs4_proc_rename_setup,
7069
	.rename_rpc_prepare = nfs4_proc_rename_rpc_prepare,
7070
	.rename_done	= nfs4_proc_rename_done,
L
Linus Torvalds 已提交
7071 7072 7073 7074 7075 7076 7077 7078 7079
	.link		= nfs4_proc_link,
	.symlink	= nfs4_proc_symlink,
	.mkdir		= nfs4_proc_mkdir,
	.rmdir		= nfs4_proc_remove,
	.readdir	= nfs4_proc_readdir,
	.mknod		= nfs4_proc_mknod,
	.statfs		= nfs4_proc_statfs,
	.fsinfo		= nfs4_proc_fsinfo,
	.pathconf	= nfs4_proc_pathconf,
7080
	.set_capabilities = nfs4_server_capabilities,
L
Linus Torvalds 已提交
7081 7082
	.decode_dirent	= nfs4_decode_dirent,
	.read_setup	= nfs4_proc_read_setup,
7083
	.read_pageio_init = pnfs_pageio_init_read,
7084
	.read_rpc_prepare = nfs4_proc_read_rpc_prepare,
T
Trond Myklebust 已提交
7085
	.read_done	= nfs4_read_done,
L
Linus Torvalds 已提交
7086
	.write_setup	= nfs4_proc_write_setup,
7087
	.write_pageio_init = pnfs_pageio_init_write,
7088
	.write_rpc_prepare = nfs4_proc_write_rpc_prepare,
7089
	.write_done	= nfs4_write_done,
L
Linus Torvalds 已提交
7090
	.commit_setup	= nfs4_proc_commit_setup,
7091
	.commit_rpc_prepare = nfs4_proc_commit_rpc_prepare,
7092
	.commit_done	= nfs4_commit_done,
L
Linus Torvalds 已提交
7093
	.lock		= nfs4_proc_lock,
7094
	.clear_acl_cache = nfs4_zap_acl_attr,
T
Trond Myklebust 已提交
7095
	.close_context  = nfs4_close_context,
7096
	.open_context	= nfs4_atomic_open,
7097
	.have_delegation = nfs4_have_delegation,
7098
	.return_delegation = nfs4_inode_return_delegation,
7099
	.alloc_client	= nfs4_alloc_client,
7100
	.init_client	= nfs4_init_client,
7101
	.free_client	= nfs4_free_client,
7102 7103
	.create_server	= nfs4_create_server,
	.clone_server	= nfs_clone_server,
L
Linus Torvalds 已提交
7104 7105
};

7106 7107 7108 7109 7110 7111 7112 7113 7114 7115 7116 7117
/*
 * xattr handler for names with the XATTR_NAME_NFSV4_ACL prefix; the only
 * handler listed in nfs4_xattr_handlers.
 */
static const struct xattr_handler nfs4_xattr_nfs4_acl_handler = {
	.prefix = XATTR_NAME_NFSV4_ACL,
	.list = nfs4_xattr_list_nfs4_acl,
	.get = nfs4_xattr_get_nfs4_acl,
	.set = nfs4_xattr_set_nfs4_acl,
};

/* NULL-terminated list of xattr handlers. */
const struct xattr_handler *nfs4_xattr_handlers[] = {
	&nfs4_xattr_nfs4_acl_handler,
	NULL,
};

L
Linus Torvalds 已提交
7118 7119 7120 7121 7122
/*
 * Local variables:
 *  c-basic-offset: 8
 * End:
 */