callback_proc.c 15.2 KB
Newer Older
L
Linus Torvalds 已提交
1 2 3 4 5 6 7 8 9
/*
 * linux/fs/nfs/callback_proc.c
 *
 * Copyright (C) 2004 Trond Myklebust
 *
 * NFSv4 callback procedures
 */
#include <linux/nfs4.h>
#include <linux/nfs_fs.h>
10
#include <linux/slab.h>
11
#include <linux/rcupdate.h>
12
#include "nfs4_fs.h"
L
Linus Torvalds 已提交
13 14
#include "callback.h"
#include "delegation.h"
15
#include "internal.h"
F
Fred Isaman 已提交
16
#include "pnfs.h"
L
Linus Torvalds 已提交
17

18
#ifdef NFS_DEBUG
L
Linus Torvalds 已提交
19
#define NFSDBG_FACILITY NFSDBG_CALLBACK
20
#endif
21 22 23 24

__be32 nfs4_callback_getattr(struct cb_getattrargs *args,
			     struct cb_getattrres *res,
			     struct cb_process_state *cps)
L
Linus Torvalds 已提交
25 26 27 28
{
	struct nfs_delegation *delegation;
	struct nfs_inode *nfsi;
	struct inode *inode;
29

30 31 32 33
	res->status = htonl(NFS4ERR_OP_NOT_IN_SESSION);
	if (!cps->clp) /* Always set for v4.0. Set in cb_sequence for v4.1 */
		goto out;

L
Linus Torvalds 已提交
34 35
	res->bitmap[0] = res->bitmap[1] = 0;
	res->status = htonl(NFS4ERR_BADHANDLE);
36

37
	dprintk_rcu("NFS: GETATTR callback request from %s\n",
38
		rpc_peeraddr2str(cps->clp->cl_rpcclient, RPC_DISPLAY_ADDR));
39

40
	inode = nfs_delegation_find_inode(cps->clp, &args->fh);
L
Linus Torvalds 已提交
41
	if (inode == NULL)
42
		goto out;
L
Linus Torvalds 已提交
43
	nfsi = NFS_I(inode);
44 45
	rcu_read_lock();
	delegation = rcu_dereference(nfsi->delegation);
L
Linus Torvalds 已提交
46 47 48
	if (delegation == NULL || (delegation->type & FMODE_WRITE) == 0)
		goto out_iput;
	res->size = i_size_read(inode);
49 50 51
	res->change_attr = delegation->change_attr;
	if (nfsi->npages != 0)
		res->change_attr++;
L
Linus Torvalds 已提交
52 53 54 55 56 57 58 59
	res->ctime = inode->i_ctime;
	res->mtime = inode->i_mtime;
	res->bitmap[0] = (FATTR4_WORD0_CHANGE|FATTR4_WORD0_SIZE) &
		args->bitmap[0];
	res->bitmap[1] = (FATTR4_WORD1_TIME_METADATA|FATTR4_WORD1_TIME_MODIFY) &
		args->bitmap[1];
	res->status = 0;
out_iput:
60
	rcu_read_unlock();
L
Linus Torvalds 已提交
61 62
	iput(inode);
out:
63
	dprintk("%s: exit with status = %d\n", __func__, ntohl(res->status));
L
Linus Torvalds 已提交
64 65 66
	return res->status;
}

67 68
__be32 nfs4_callback_recall(struct cb_recallargs *args, void *dummy,
			    struct cb_process_state *cps)
L
Linus Torvalds 已提交
69 70
{
	struct inode *inode;
71
	__be32 res;
L
Linus Torvalds 已提交
72
	
73 74
	res = htonl(NFS4ERR_OP_NOT_IN_SESSION);
	if (!cps->clp) /* Always set for v4.0. Set in cb_sequence for v4.1 */
L
Linus Torvalds 已提交
75
		goto out;
76

77
	dprintk_rcu("NFS: RECALL callback request from %s\n",
78 79 80 81 82 83 84 85 86 87 88 89
		rpc_peeraddr2str(cps->clp->cl_rpcclient, RPC_DISPLAY_ADDR));

	res = htonl(NFS4ERR_BADHANDLE);
	inode = nfs_delegation_find_inode(cps->clp, &args->fh);
	if (inode == NULL)
		goto out;
	/* Set up a helper thread to actually return the delegation */
	switch (nfs_async_inode_return_delegation(inode, &args->stateid)) {
	case 0:
		res = 0;
		break;
	case -ENOENT:
90
		res = htonl(NFS4ERR_BAD_STATEID);
91 92 93 94 95
		break;
	default:
		res = htonl(NFS4ERR_RESOURCE);
	}
	iput(inode);
L
Linus Torvalds 已提交
96
out:
97
	dprintk("%s: exit with status = %d\n", __func__, ntohl(res));
L
Linus Torvalds 已提交
98 99
	return res;
}
100 101 102

#if defined(CONFIG_NFS_V4_1)

103 104 105 106 107 108 109 110 111 112
/*
 * Lookup a layout by filehandle.
 *
 * Note: gets a refcount on the layout hdr and on its respective inode.
 * Caller must put the layout hdr and the inode.
 *
 * TODO: keep track of all layouts (and delegations) in a hash table
 * hashed by filehandle.
 */
static struct pnfs_layout_hdr * get_layout_by_fh_locked(struct nfs_client *clp, struct nfs_fh *fh)
F
Fred Isaman 已提交
113
{
114
	struct nfs_server *server;
F
Fred Isaman 已提交
115
	struct inode *ino;
116
	struct pnfs_layout_hdr *lo;
F
Fred Isaman 已提交
117

118 119
	list_for_each_entry_rcu(server, &clp->cl_superblocks, client_link) {
		list_for_each_entry(lo, &server->layouts, plh_layouts) {
120
			if (nfs_compare_fh(fh, &NFS_I(lo->plh_inode)->fh))
121 122 123 124
				continue;
			ino = igrab(lo->plh_inode);
			if (!ino)
				continue;
125 126 127 128 129 130 131
			spin_lock(&ino->i_lock);
			/* Is this layout in the process of being freed? */
			if (NFS_I(ino)->layout != lo) {
				spin_unlock(&ino->i_lock);
				iput(ino);
				continue;
			}
132
			pnfs_get_layout_hdr(lo);
133
			spin_unlock(&ino->i_lock);
134
			return lo;
135
		}
F
Fred Isaman 已提交
136
	}
137 138 139 140 141 142 143 144 145 146 147

	return NULL;
}

/*
 * Locking wrapper around get_layout_by_fh_locked(): performs the lookup
 * with clp->cl_lock held and inside an RCU read-side critical section.
 * Returns whatever the lookup returned (a layout header or NULL).
 */
static struct pnfs_layout_hdr * get_layout_by_fh(struct nfs_client *clp, struct nfs_fh *fh)
{
	struct pnfs_layout_hdr *found;

	spin_lock(&clp->cl_lock);
	rcu_read_lock();

	found = get_layout_by_fh_locked(clp, fh);

	rcu_read_unlock();
	spin_unlock(&clp->cl_lock);

	return found;
}

static u32 initiate_file_draining(struct nfs_client *clp,
				  struct cb_layoutrecallargs *args)
{
	struct inode *ino;
	struct pnfs_layout_hdr *lo;
	u32 rv = NFS4ERR_NOMATCHING_LAYOUT;
	LIST_HEAD(free_me_list);

	lo = get_layout_by_fh(clp, &args->cbl_fh);
	if (!lo)
F
Fred Isaman 已提交
164 165
		return NFS4ERR_NOMATCHING_LAYOUT;

166
	ino = lo->plh_inode;
F
Fred Isaman 已提交
167 168
	spin_lock(&ino->i_lock);
	if (test_bit(NFS_LAYOUT_BULK_RECALL, &lo->plh_flags) ||
169
	    pnfs_mark_matching_lsegs_invalid(lo, &free_me_list,
170
					&args->cbl_range))
F
Fred Isaman 已提交
171 172 173 174 175 176
		rv = NFS4ERR_DELAY;
	else
		rv = NFS4ERR_NOMATCHING_LAYOUT;
	pnfs_set_layout_stateid(lo, &args->cbl_stateid, true);
	spin_unlock(&ino->i_lock);
	pnfs_free_lseg_list(&free_me_list);
177
	pnfs_put_layout_hdr(lo);
F
Fred Isaman 已提交
178 179 180 181 182 183 184
	iput(ino);
	return rv;
}

static u32 initiate_bulk_draining(struct nfs_client *clp,
				  struct cb_layoutrecallargs *args)
{
185
	struct nfs_server *server;
F
Fred Isaman 已提交
186 187 188 189 190 191 192 193 194 195 196 197 198
	struct pnfs_layout_hdr *lo;
	struct inode *ino;
	u32 rv = NFS4ERR_NOMATCHING_LAYOUT;
	struct pnfs_layout_hdr *tmp;
	LIST_HEAD(recall_list);
	LIST_HEAD(free_me_list);
	struct pnfs_layout_range range = {
		.iomode = IOMODE_ANY,
		.offset = 0,
		.length = NFS4_MAX_UINT64,
	};

	spin_lock(&clp->cl_lock);
199 200
	rcu_read_lock();
	list_for_each_entry_rcu(server, &clp->cl_superblocks, client_link) {
F
Fred Isaman 已提交
201
		if ((args->cbl_recall_type == RETURN_FSID) &&
202 203
		    memcmp(&server->fsid, &args->cbl_fsid,
			   sizeof(struct nfs_fsid)))
F
Fred Isaman 已提交
204
			continue;
205 206

		list_for_each_entry(lo, &server->layouts, plh_layouts) {
207 208 209 210 211 212 213 214
			ino = igrab(lo->plh_inode);
			if (ino)
				continue;
			spin_lock(&ino->i_lock);
			/* Is this layout in the process of being freed? */
			if (NFS_I(ino)->layout != lo) {
				spin_unlock(&ino->i_lock);
				iput(ino);
215
				continue;
216
			}
217
			pnfs_get_layout_hdr(lo);
218
			spin_unlock(&ino->i_lock);
219 220
			list_add(&lo->plh_bulk_recall, &recall_list);
		}
F
Fred Isaman 已提交
221
	}
222
	rcu_read_unlock();
F
Fred Isaman 已提交
223
	spin_unlock(&clp->cl_lock);
224

F
Fred Isaman 已提交
225 226 227 228 229
	list_for_each_entry_safe(lo, tmp,
				 &recall_list, plh_bulk_recall) {
		ino = lo->plh_inode;
		spin_lock(&ino->i_lock);
		set_bit(NFS_LAYOUT_BULK_RECALL, &lo->plh_flags);
230
		if (pnfs_mark_matching_lsegs_invalid(lo, &free_me_list, &range))
F
Fred Isaman 已提交
231 232 233
			rv = NFS4ERR_DELAY;
		list_del_init(&lo->plh_bulk_recall);
		spin_unlock(&ino->i_lock);
234
		pnfs_free_lseg_list(&free_me_list);
235
		pnfs_put_layout_hdr(lo);
F
Fred Isaman 已提交
236 237 238 239 240 241 242 243
		iput(ino);
	}
	return rv;
}

/*
 * Dispatch a layout recall: RETURN_FILE goes to the single-file path,
 * every other recall type goes to the bulk path.  Returns the NFS4 status
 * (host byte order) produced by the chosen path.
 */
static u32 do_callback_layoutrecall(struct nfs_client *clp,
				    struct cb_layoutrecallargs *args)
{
	u32 status;

	dprintk("%s enter, type=%i\n", __func__, args->cbl_recall_type);

	status = (args->cbl_recall_type == RETURN_FILE) ?
			initiate_file_draining(clp, args) :
			initiate_bulk_draining(clp, args);

	dprintk("%s returning %i\n", __func__, status);
	return status;
}

F
Fred Isaman 已提交
256 257 258
__be32 nfs4_callback_layoutrecall(struct cb_layoutrecallargs *args,
				  void *dummy, struct cb_process_state *cps)
{
F
Fred Isaman 已提交
259 260 261 262 263 264 265 266 267 268 269
	u32 res;

	dprintk("%s: -->\n", __func__);

	if (cps->clp)
		res = do_callback_layoutrecall(cps->clp, args);
	else
		res = NFS4ERR_OP_NOT_IN_SESSION;

	dprintk("%s: exit with status = %d\n", __func__, res);
	return cpu_to_be32(res);
F
Fred Isaman 已提交
270 271
}

272 273 274 275 276 277 278 279 280 281 282
static void pnfs_recall_all_layouts(struct nfs_client *clp)
{
	struct cb_layoutrecallargs args;

	/* Pretend we got a CB_LAYOUTRECALL(ALL) */
	memset(&args, 0, sizeof(args));
	args.cbl_recall_type = RETURN_ALL;
	/* FIXME we ignore errors, what should we do? */
	do_callback_layoutrecall(clp, &args);
}

M
Marc Eshel 已提交
283 284 285 286 287 288 289 290 291 292 293 294 295 296 297 298 299 300 301 302 303 304 305 306 307 308 309 310 311 312 313 314 315 316 317 318 319
__be32 nfs4_callback_devicenotify(struct cb_devicenotifyargs *args,
				  void *dummy, struct cb_process_state *cps)
{
	int i;
	__be32 res = 0;
	struct nfs_client *clp = cps->clp;
	struct nfs_server *server = NULL;

	dprintk("%s: -->\n", __func__);

	if (!clp) {
		res = cpu_to_be32(NFS4ERR_OP_NOT_IN_SESSION);
		goto out;
	}

	for (i = 0; i < args->ndevs; i++) {
		struct cb_devicenotifyitem *dev = &args->devs[i];

		if (!server ||
		    server->pnfs_curr_ld->id != dev->cbd_layout_type) {
			rcu_read_lock();
			list_for_each_entry_rcu(server, &clp->cl_superblocks, client_link)
				if (server->pnfs_curr_ld &&
				    server->pnfs_curr_ld->id == dev->cbd_layout_type) {
					rcu_read_unlock();
					goto found;
				}
			rcu_read_unlock();
			dprintk("%s: layout type %u not found\n",
				__func__, dev->cbd_layout_type);
			continue;
		}

	found:
		if (dev->cbd_notify_type == NOTIFY_DEVICEID4_CHANGE)
			dprintk("%s: NOTIFY_DEVICEID4_CHANGE not supported, "
				"deleting instead\n", __func__);
320
		nfs4_delete_deviceid(server->pnfs_curr_ld, clp, &dev->cbd_dev_id);
M
Marc Eshel 已提交
321 322 323 324 325 326 327 328 329
	}

out:
	kfree(args->devs);
	dprintk("%s: exit with status = %u\n",
		__func__, be32_to_cpu(res));
	return res;
}

330 331 332 333 334
/*
 * Validate the sequenceID sent by the server.
 * Return success if the sequenceID is one more than what we last saw on
 * this slot, accounting for wraparound.  Increments the slot's sequence.
 *
335 336
 * We don't yet implement a duplicate request cache, instead we set the
 * back channel ca_maxresponsesize_cached to zero. This is OK for now
337 338 339 340 341 342
 * since we only currently implement idempotent callbacks anyway.
 *
 * We have a single slot backchannel at this time, so we don't bother
 * checking the used_slots bit array on the table.  The lower layer guarantees
 * a single outstanding callback request at a time.
 */
343
static __be32
344
validate_seqid(struct nfs4_slot_table *tbl, struct cb_sequenceargs * args)
345 346 347 348
{
	struct nfs4_slot *slot;

	dprintk("%s enter. slotid %d seqid %d\n",
349
		__func__, args->csa_slotid, args->csa_sequenceid);
350

351
	if (args->csa_slotid >= NFS41_BC_MAX_CALLBACKS)
352 353
		return htonl(NFS4ERR_BADSLOT);

354
	slot = tbl->slots + args->csa_slotid;
355 356 357
	dprintk("%s slot table seqid: %d\n", __func__, slot->seq_nr);

	/* Normal */
358
	if (likely(args->csa_sequenceid == slot->seq_nr + 1)) {
359
		slot->seq_nr++;
360
		goto out_ok;
361 362 363
	}

	/* Replay */
364
	if (args->csa_sequenceid == slot->seq_nr) {
365
		dprintk("%s seqid %d is a replay\n",
366
			__func__, args->csa_sequenceid);
367 368 369 370 371 372 373
		/* Signal process_op to set this error on next op */
		if (args->csa_cachethis == 0)
			return htonl(NFS4ERR_RETRY_UNCACHED_REP);

		/* The ca_maxresponsesize_cached is 0 with no DRC */
		else if (args->csa_cachethis == 1)
			return htonl(NFS4ERR_REP_TOO_BIG_TO_CACHE);
374 375 376
	}

	/* Wraparound */
377
	if (args->csa_sequenceid == 1 && (slot->seq_nr + 1) == 0) {
378
		slot->seq_nr = 1;
379
		goto out_ok;
380 381 382 383
	}

	/* Misordered request */
	return htonl(NFS4ERR_SEQ_MISORDERED);
384 385 386
out_ok:
	tbl->highest_used_slotid = args->csa_slotid;
	return htonl(NFS4_OK);
387 388
}

389 390 391 392 393 394 395 396 397 398 399 400 401 402 403 404 405 406 407 408 409 410 411 412 413 414 415 416 417 418 419 420 421 422 423 424 425 426 427 428 429 430 431 432 433 434 435 436 437 438 439 440 441 442 443
/*
 * Check the referring call lists against the session's fore channel slot
 * table.
 *
 * Lists whose session ID differs from clp->cl_session are ignored.  For
 * every remaining (sequenceid, slotid) pair, the slot is examined under
 * the slot table lock: if it is marked in used_slots and its sequence
 * number equals the referring sequence ID, the client is still waiting
 * for a response to the original request and true is returned.
 *
 * Returns false when no referring call matches.
 */
static bool referring_call_exists(struct nfs_client *clp,
				  uint32_t nrclists,
				  struct referring_call_list *rclists)
{
	struct nfs4_session *session;
	struct nfs4_slot_table *tbl;
	struct referring_call_list *rclist;
	struct referring_call *ref;
	bool pending;
	int i, j;

	/*
	 * XXX When client trunking is implemented, this becomes
	 * a session lookup from within the loop
	 */
	session = clp->cl_session;
	tbl = &session->fc_slot_table;

	for (i = 0; i < nrclists; i++) {
		rclist = &rclists[i];

		/* Only lists that refer to our own session are relevant */
		if (memcmp(session->sess_id.data,
			   rclist->rcl_sessionid.data,
			   NFS4_MAX_SESSIONID_LEN) != 0)
			continue;

		for (j = 0; j < rclist->rcl_nrefcalls; j++) {
			ref = &rclist->rcl_refcalls[j];

			dprintk("%s: sessionid %x:%x:%x:%x sequenceid %u "
				"slotid %u\n", __func__,
				((u32 *)&rclist->rcl_sessionid.data)[0],
				((u32 *)&rclist->rcl_sessionid.data)[1],
				((u32 *)&rclist->rcl_sessionid.data)[2],
				((u32 *)&rclist->rcl_sessionid.data)[3],
				ref->rc_sequenceid, ref->rc_slotid);

			spin_lock(&tbl->slot_tbl_lock);
			pending = test_bit(ref->rc_slotid, tbl->used_slots) &&
				  tbl->slots[ref->rc_slotid].seq_nr ==
					ref->rc_sequenceid;
			spin_unlock(&tbl->slot_tbl_lock);

			if (pending)
				return true;
		}
	}

	return false;
}

444
__be32 nfs4_callback_sequence(struct cb_sequenceargs *args,
445 446
			      struct cb_sequenceres *res,
			      struct cb_process_state *cps)
447
{
448
	struct nfs4_slot_table *tbl;
449
	struct nfs_client *clp;
450
	int i;
451
	__be32 status = htonl(NFS4ERR_BADSESSION);
452

453
	clp = nfs4_find_client_sessionid(cps->net, args->csa_addr, &args->csa_sessionid);
454 455 456
	if (clp == NULL)
		goto out;

457 458 459
	tbl = &clp->cl_session->bc_slot_table;

	spin_lock(&tbl->slot_tbl_lock);
460 461
	/* state manager is resetting the session */
	if (test_bit(NFS4_SESSION_DRAINING, &clp->cl_session->session_state)) {
462 463
		spin_unlock(&tbl->slot_tbl_lock);
		status = htonl(NFS4ERR_DELAY);
464 465 466 467 468
		/* Return NFS4ERR_BADSESSION if we're draining the session
		 * in order to reset it.
		 */
		if (test_bit(NFS4CLNT_SESSION_RESET, &clp->cl_state))
			status = htonl(NFS4ERR_BADSESSION);
469 470 471
		goto out;
	}

472
	status = validate_seqid(&clp->cl_session->bc_slot_table, args);
473
	spin_unlock(&tbl->slot_tbl_lock);
474
	if (status)
475
		goto out;
476

477 478
	cps->slotid = args->csa_slotid;

479 480 481 482 483 484 485
	/*
	 * Check for pending referring calls.  If a match is found, a
	 * related callback was received before the response to the original
	 * call.
	 */
	if (referring_call_exists(clp, args->csa_nrclists, args->csa_rclists)) {
		status = htonl(NFS4ERR_DELAY);
486
		goto out;
487 488
	}

489 490 491 492 493 494 495
	memcpy(&res->csr_sessionid, &args->csa_sessionid,
	       sizeof(res->csr_sessionid));
	res->csr_sequenceid = args->csa_sequenceid;
	res->csr_slotid = args->csa_slotid;
	res->csr_highestslotid = NFS41_BC_MAX_CALLBACKS - 1;
	res->csr_target_highestslotid = NFS41_BC_MAX_CALLBACKS - 1;

496
out:
497
	cps->clp = clp; /* put in nfs4_callback_compound */
498 499 500 501
	for (i = 0; i < args->csa_nrclists; i++)
		kfree(args->csa_rclists[i].rcl_refcalls);
	kfree(args->csa_rclists);

502 503 504 505
	if (status == htonl(NFS4ERR_RETRY_UNCACHED_REP)) {
		cps->drc_status = status;
		status = 0;
	} else
506
		res->csr_status = status;
507

508 509 510
	dprintk("%s: exit with status = %d res->csr_status %d\n", __func__,
		ntohl(status), ntohl(res->csr_status));
	return status;
511 512
}

513 514 515 516 517 518
/*
 * Return true when the mask has no bits set outside RCA4_TYPE_MASK_ALL.
 */
static bool
validate_bitmap_values(unsigned long mask)
{
	unsigned long unknown_bits = mask & ~RCA4_TYPE_MASK_ALL;

	return unknown_bits == 0;
}

519 520
__be32 nfs4_callback_recallany(struct cb_recallanyargs *args, void *dummy,
			       struct cb_process_state *cps)
521
{
522
	__be32 status;
523 524
	fmode_t flags = 0;

525
	status = cpu_to_be32(NFS4ERR_OP_NOT_IN_SESSION);
526
	if (!cps->clp) /* set in cb_sequence */
527 528
		goto out;

529
	dprintk_rcu("NFS: RECALL_ANY callback request from %s\n",
530
		rpc_peeraddr2str(cps->clp->cl_rpcclient, RPC_DISPLAY_ADDR));
531

532 533 534 535 536
	status = cpu_to_be32(NFS4ERR_INVAL);
	if (!validate_bitmap_values(args->craa_type_mask))
		goto out;

	status = cpu_to_be32(NFS4_OK);
537 538 539 540 541 542
	if (test_bit(RCA4_TYPE_MASK_RDATA_DLG, (const unsigned long *)
		     &args->craa_type_mask))
		flags = FMODE_READ;
	if (test_bit(RCA4_TYPE_MASK_WDATA_DLG, (const unsigned long *)
		     &args->craa_type_mask))
		flags |= FMODE_WRITE;
543 544 545
	if (test_bit(RCA4_TYPE_MASK_FILE_LAYOUT, (const unsigned long *)
		     &args->craa_type_mask))
		pnfs_recall_all_layouts(cps->clp);
546
	if (flags)
547
		nfs_expire_all_delegation_types(cps->clp, flags);
548 549 550 551
out:
	dprintk("%s: exit with status = %d\n", __func__, ntohl(status));
	return status;
}
A
Andy Adamson 已提交
552 553

/* Reduce the fore channel's max_slots to the target value */
554 555
__be32 nfs4_callback_recallslot(struct cb_recallslotargs *args, void *dummy,
				struct cb_process_state *cps)
A
Andy Adamson 已提交
556 557
{
	struct nfs4_slot_table *fc_tbl;
558
	__be32 status;
A
Andy Adamson 已提交
559 560

	status = htonl(NFS4ERR_OP_NOT_IN_SESSION);
561
	if (!cps->clp) /* set in cb_sequence */
A
Andy Adamson 已提交
562 563
		goto out;

564
	dprintk_rcu("NFS: CB_RECALL_SLOT request from %s target highest slotid %d\n",
565
		rpc_peeraddr2str(cps->clp->cl_rpcclient, RPC_DISPLAY_ADDR),
566
		args->crsa_target_highest_slotid);
A
Andy Adamson 已提交
567

568
	fc_tbl = &cps->clp->cl_session->fc_slot_table;
A
Andy Adamson 已提交
569

570
	status = htonl(NFS4_OK);
A
Andy Adamson 已提交
571

572
	nfs41_set_target_slotid(fc_tbl, args->crsa_target_highest_slotid);
A
Andy Adamson 已提交
573 574 575 576
out:
	dprintk("%s: exit with status = %d\n", __func__, ntohl(status));
	return status;
}
577
#endif /* CONFIG_NFS_V4_1 */