delegation.c 14.8 KB
Newer Older
L
Linus Torvalds 已提交
1 2 3 4 5 6 7 8 9
/*
 * linux/fs/nfs/delegation.c
 *
 * Copyright (C) 2004 Trond Myklebust
 *
 * NFS file delegation management
 *
 */
#include <linux/completion.h>
10
#include <linux/kthread.h>
L
Linus Torvalds 已提交
11 12
#include <linux/module.h>
#include <linux/sched.h>
13
#include <linux/slab.h>
A
Alexey Dobriyan 已提交
14
#include <linux/smp_lock.h>
L
Linus Torvalds 已提交
15 16 17 18 19 20
#include <linux/spinlock.h>

#include <linux/nfs4.h>
#include <linux/nfs_fs.h>
#include <linux/nfs_xdr.h>

21
#include "nfs4_fs.h"
L
Linus Torvalds 已提交
22
#include "delegation.h"
23
#include "internal.h"
L
Linus Torvalds 已提交
24

25
static void nfs_do_free_delegation(struct nfs_delegation *delegation)
L
Linus Torvalds 已提交
26 27 28 29
{
	kfree(delegation);
}

30 31 32 33
static void nfs_free_delegation_callback(struct rcu_head *head)
{
	struct nfs_delegation *delegation = container_of(head, struct nfs_delegation, rcu);

34 35 36 37 38 39 40 41 42 43 44 45
	nfs_do_free_delegation(delegation);
}

static void nfs_free_delegation(struct nfs_delegation *delegation)
{
	struct rpc_cred *cred;

	cred = rcu_dereference(delegation->cred);
	rcu_assign_pointer(delegation->cred, NULL);
	call_rcu(&delegation->rcu, nfs_free_delegation_callback);
	if (cred)
		put_rpccred(cred);
46 47
}

48 49 50 51 52
void nfs_mark_delegation_referenced(struct nfs_delegation *delegation)
{
	set_bit(NFS_DELEGATION_REFERENCED, &delegation->flags);
}

53
int nfs_have_delegation(struct inode *inode, fmode_t flags)
54 55 56 57 58 59 60 61 62 63 64 65 66 67 68
{
	struct nfs_delegation *delegation;
	int ret = 0;

	flags &= FMODE_READ|FMODE_WRITE;
	rcu_read_lock();
	delegation = rcu_dereference(NFS_I(inode)->delegation);
	if (delegation != NULL && (delegation->type & flags) == flags) {
		nfs_mark_delegation_referenced(delegation);
		ret = 1;
	}
	rcu_read_unlock();
	return ret;
}

69 70 71 72
static int nfs_delegation_claim_locks(struct nfs_open_context *ctx, struct nfs4_state *state)
{
	struct inode *inode = state->inode;
	struct file_lock *fl;
73
	int status = 0;
74

75 76 77 78 79
	if (inode->i_flock == NULL)
		goto out;

	/* Protect inode->i_flock using the BKL */
	lock_kernel();
H
Harvey Harrison 已提交
80
	for (fl = inode->i_flock; fl != NULL; fl = fl->fl_next) {
81 82
		if (!(fl->fl_flags & (FL_POSIX|FL_FLOCK)))
			continue;
83
		if (nfs_file_open_context(fl->fl_file) != ctx)
84
			continue;
85
		unlock_kernel();
86
		status = nfs4_lock_delegation_recall(state, fl);
87
		if (status < 0)
88 89
			goto out;
		lock_kernel();
90
	}
91 92
	unlock_kernel();
out:
93 94 95
	return status;
}

96
static int nfs_delegation_claim_opens(struct inode *inode, const nfs4_stateid *stateid)
L
Linus Torvalds 已提交
97 98 99 100
{
	struct nfs_inode *nfsi = NFS_I(inode);
	struct nfs_open_context *ctx;
	struct nfs4_state *state;
101
	int err;
L
Linus Torvalds 已提交
102 103 104 105 106 107 108 109 110

again:
	spin_lock(&inode->i_lock);
	list_for_each_entry(ctx, &nfsi->open_files, list) {
		state = ctx->state;
		if (state == NULL)
			continue;
		if (!test_bit(NFS_DELEGATED_STATE, &state->flags))
			continue;
111 112
		if (memcmp(state->stateid.data, stateid->data, sizeof(state->stateid.data)) != 0)
			continue;
L
Linus Torvalds 已提交
113 114
		get_nfs_open_context(ctx);
		spin_unlock(&inode->i_lock);
115
		err = nfs4_open_delegation_recall(ctx, state, stateid);
116 117
		if (err >= 0)
			err = nfs_delegation_claim_locks(ctx, state);
L
Linus Torvalds 已提交
118
		put_nfs_open_context(ctx);
119
		if (err != 0)
120
			return err;
L
Linus Torvalds 已提交
121 122 123
		goto again;
	}
	spin_unlock(&inode->i_lock);
124
	return 0;
L
Linus Torvalds 已提交
125 126 127 128 129 130 131
}

/*
 * Set up a delegation on an inode
 */
void nfs_inode_reclaim_delegation(struct inode *inode, struct rpc_cred *cred, struct nfs_openres *res)
{
132 133
	struct nfs_delegation *delegation;
	struct rpc_cred *oldcred = NULL;
L
Linus Torvalds 已提交
134

135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160
	rcu_read_lock();
	delegation = rcu_dereference(NFS_I(inode)->delegation);
	if (delegation != NULL) {
		spin_lock(&delegation->lock);
		if (delegation->inode != NULL) {
			memcpy(delegation->stateid.data, res->delegation.data,
			       sizeof(delegation->stateid.data));
			delegation->type = res->delegation_type;
			delegation->maxsize = res->maxsize;
			oldcred = delegation->cred;
			delegation->cred = get_rpccred(cred);
			clear_bit(NFS_DELEGATION_NEED_RECLAIM,
				  &delegation->flags);
			NFS_I(inode)->delegation_state = delegation->type;
			spin_unlock(&delegation->lock);
			put_rpccred(oldcred);
			rcu_read_unlock();
		} else {
			/* We appear to have raced with a delegation return. */
			spin_unlock(&delegation->lock);
			rcu_read_unlock();
			nfs_inode_set_delegation(inode, cred, res);
		}
	} else {
		rcu_read_unlock();
	}
L
Linus Torvalds 已提交
161 162
}

163 164 165 166 167 168 169 170 171
static int nfs_do_return_delegation(struct inode *inode, struct nfs_delegation *delegation, int issync)
{
	int res = 0;

	res = nfs4_proc_delegreturn(inode, delegation->cred, &delegation->stateid, issync);
	nfs_free_delegation(delegation);
	return res;
}

172 173 174 175 176 177 178 179 180 181 182
static struct inode *nfs_delegation_grab_inode(struct nfs_delegation *delegation)
{
	struct inode *inode = NULL;

	spin_lock(&delegation->lock);
	if (delegation->inode != NULL)
		inode = igrab(delegation->inode);
	spin_unlock(&delegation->lock);
	return inode;
}

183 184 185 186 187 188
static struct nfs_delegation *nfs_detach_delegation_locked(struct nfs_inode *nfsi, const nfs4_stateid *stateid)
{
	struct nfs_delegation *delegation = rcu_dereference(nfsi->delegation);

	if (delegation == NULL)
		goto nomatch;
189
	spin_lock(&delegation->lock);
190 191
	if (stateid != NULL && memcmp(delegation->stateid.data, stateid->data,
				sizeof(delegation->stateid.data)) != 0)
192
		goto nomatch_unlock;
193
	list_del_rcu(&delegation->super_list);
194
	delegation->inode = NULL;
195 196
	nfsi->delegation_state = 0;
	rcu_assign_pointer(nfsi->delegation, NULL);
197
	spin_unlock(&delegation->lock);
198
	return delegation;
199 200
nomatch_unlock:
	spin_unlock(&delegation->lock);
201 202 203 204
nomatch:
	return NULL;
}

L
Linus Torvalds 已提交
205 206 207 208 209
/*
 * Set up a delegation on an inode
 */
int nfs_inode_set_delegation(struct inode *inode, struct rpc_cred *cred, struct nfs_openres *res)
{
210
	struct nfs_client *clp = NFS_SERVER(inode)->nfs_client;
L
Linus Torvalds 已提交
211 212
	struct nfs_inode *nfsi = NFS_I(inode);
	struct nfs_delegation *delegation;
213
	struct nfs_delegation *freeme = NULL;
L
Linus Torvalds 已提交
214 215
	int status = 0;

216
	delegation = kmalloc(sizeof(*delegation), GFP_KERNEL);
L
Linus Torvalds 已提交
217 218 219 220 221 222
	if (delegation == NULL)
		return -ENOMEM;
	memcpy(delegation->stateid.data, res->delegation.data,
			sizeof(delegation->stateid.data));
	delegation->type = res->delegation_type;
	delegation->maxsize = res->maxsize;
223
	delegation->change_attr = nfsi->change_attr;
L
Linus Torvalds 已提交
224 225
	delegation->cred = get_rpccred(cred);
	delegation->inode = inode;
226
	delegation->flags = 1<<NFS_DELEGATION_REFERENCED;
227
	spin_lock_init(&delegation->lock);
L
Linus Torvalds 已提交
228 229

	spin_lock(&clp->cl_lock);
230
	if (rcu_dereference(nfsi->delegation) != NULL) {
L
Linus Torvalds 已提交
231
		if (memcmp(&delegation->stateid, &nfsi->delegation->stateid,
232 233 234
					sizeof(delegation->stateid)) == 0 &&
				delegation->type == nfsi->delegation->type) {
			goto out;
L
Linus Torvalds 已提交
235
		}
236 237 238 239 240 241
		/*
		 * Deal with broken servers that hand out two
		 * delegations for the same file.
		 */
		dfprintk(FILE, "%s: server %s handed out "
				"a duplicate delegation!\n",
242
				__func__, clp->cl_hostname);
243 244 245 246 247 248
		if (delegation->type <= nfsi->delegation->type) {
			freeme = delegation;
			delegation = NULL;
			goto out;
		}
		freeme = nfs_detach_delegation_locked(nfsi, NULL);
L
Linus Torvalds 已提交
249
	}
250 251 252 253
	list_add_rcu(&delegation->super_list, &clp->cl_delegations);
	nfsi->delegation_state = delegation->type;
	rcu_assign_pointer(nfsi->delegation, delegation);
	delegation = NULL;
254 255 256 257 258 259

	/* Ensure we revalidate the attributes and page cache! */
	spin_lock(&inode->i_lock);
	nfsi->cache_validity |= NFS_INO_REVAL_FORCED;
	spin_unlock(&inode->i_lock);

260
out:
L
Linus Torvalds 已提交
261
	spin_unlock(&clp->cl_lock);
262 263
	if (delegation != NULL)
		nfs_free_delegation(delegation);
264 265
	if (freeme != NULL)
		nfs_do_return_delegation(inode, freeme, 0);
L
Linus Torvalds 已提交
266 267 268 269 270 271 272 273 274 275 276 277 278 279
	return status;
}

/* Sync all data to disk upon delegation return */
static void nfs_msync_inode(struct inode *inode)
{
	filemap_fdatawrite(inode->i_mapping);
	nfs_wb_all(inode);
	filemap_fdatawait(inode->i_mapping);
}

/*
 * Basic procedure for returning a delegation to the server
 */
280
static int __nfs_inode_return_delegation(struct inode *inode, struct nfs_delegation *delegation, int issync)
L
Linus Torvalds 已提交
281 282
{
	struct nfs_inode *nfsi = NFS_I(inode);
283
	int err;
L
Linus Torvalds 已提交
284

285 286 287 288
	/*
	 * Guard against new delegated open/lock/unlock calls and against
	 * state recovery
	 */
L
Linus Torvalds 已提交
289
	down_write(&nfsi->rwsem);
290
	err = nfs_delegation_claim_opens(inode, &delegation->stateid);
L
Linus Torvalds 已提交
291
	up_write(&nfsi->rwsem);
292 293
	if (err)
		goto out;
L
Linus Torvalds 已提交
294

295 296 297
	err = nfs_do_return_delegation(inode, delegation, issync);
out:
	return err;
298 299
}

300 301 302
/*
 * Return all delegations that have been marked for return
 */
303
int nfs_client_return_marked_delegations(struct nfs_client *clp)
304 305 306
{
	struct nfs_delegation *delegation;
	struct inode *inode;
307
	int err = 0;
308 309 310 311 312 313 314 315 316 317 318 319 320

restart:
	rcu_read_lock();
	list_for_each_entry_rcu(delegation, &clp->cl_delegations, super_list) {
		if (!test_and_clear_bit(NFS_DELEGATION_RETURN, &delegation->flags))
			continue;
		inode = nfs_delegation_grab_inode(delegation);
		if (inode == NULL)
			continue;
		spin_lock(&clp->cl_lock);
		delegation = nfs_detach_delegation_locked(NFS_I(inode), NULL);
		spin_unlock(&clp->cl_lock);
		rcu_read_unlock();
321 322 323 324
		if (delegation != NULL) {
			filemap_flush(inode->i_mapping);
			err = __nfs_inode_return_delegation(inode, delegation, 0);
		}
325
		iput(inode);
326 327 328 329
		if (!err)
			goto restart;
		set_bit(NFS4CLNT_DELEGRETURN, &clp->cl_state);
		return err;
330 331
	}
	rcu_read_unlock();
332
	return 0;
333 334
}

335 336 337 338 339 340 341 342 343 344 345 346 347 348 349 350 351 352 353 354 355
/*
 * This function returns the delegation without reclaiming opens
 * or protecting against delegation reclaims.
 * It is therefore really only safe to be called from
 * nfs4_clear_inode()
 */
void nfs_inode_return_delegation_noreclaim(struct inode *inode)
{
	struct nfs_client *clp = NFS_SERVER(inode)->nfs_client;
	struct nfs_inode *nfsi = NFS_I(inode);
	struct nfs_delegation *delegation;

	if (rcu_dereference(nfsi->delegation) != NULL) {
		spin_lock(&clp->cl_lock);
		delegation = nfs_detach_delegation_locked(nfsi, NULL);
		spin_unlock(&clp->cl_lock);
		if (delegation != NULL)
			nfs_do_return_delegation(inode, delegation, 0);
	}
}

356 357 358 359 360 361 362
int nfs_inode_return_delegation(struct inode *inode)
{
	struct nfs_client *clp = NFS_SERVER(inode)->nfs_client;
	struct nfs_inode *nfsi = NFS_I(inode);
	struct nfs_delegation *delegation;
	int err = 0;

363
	if (rcu_dereference(nfsi->delegation) != NULL) {
364 365 366
		spin_lock(&clp->cl_lock);
		delegation = nfs_detach_delegation_locked(nfsi, NULL);
		spin_unlock(&clp->cl_lock);
367 368 369 370
		if (delegation != NULL) {
			nfs_msync_inode(inode);
			err = __nfs_inode_return_delegation(inode, delegation, 1);
		}
371 372
	}
	return err;
L
Linus Torvalds 已提交
373 374
}

375 376 377 378 379 380
static void nfs_mark_return_delegation(struct nfs_client *clp, struct nfs_delegation *delegation)
{
	set_bit(NFS_DELEGATION_RETURN, &delegation->flags);
	set_bit(NFS4CLNT_DELEGRETURN, &clp->cl_state);
}

L
Linus Torvalds 已提交
381 382 383
/*
 * Return all delegations associated to a super block
 */
384
void nfs_super_return_all_delegations(struct super_block *sb)
L
Linus Torvalds 已提交
385
{
386
	struct nfs_client *clp = NFS_SB(sb)->nfs_client;
L
Linus Torvalds 已提交
387 388 389 390
	struct nfs_delegation *delegation;

	if (clp == NULL)
		return;
391 392
	rcu_read_lock();
	list_for_each_entry_rcu(delegation, &clp->cl_delegations, super_list) {
393 394
		spin_lock(&delegation->lock);
		if (delegation->inode != NULL && delegation->inode->i_sb == sb)
395
			set_bit(NFS_DELEGATION_RETURN, &delegation->flags);
396
		spin_unlock(&delegation->lock);
L
Linus Torvalds 已提交
397
	}
398
	rcu_read_unlock();
399 400
	if (nfs_client_return_marked_delegations(clp) != 0)
		nfs4_schedule_state_manager(clp);
401 402
}

403 404
static
void nfs_client_mark_return_all_delegation_types(struct nfs_client *clp, fmode_t flags)
405 406 407 408
{
	struct nfs_delegation *delegation;

	rcu_read_lock();
409
	list_for_each_entry_rcu(delegation, &clp->cl_delegations, super_list) {
410 411 412 413
		if ((delegation->type == (FMODE_READ|FMODE_WRITE)) && !(flags & FMODE_WRITE))
			continue;
		if (delegation->type & flags)
			nfs_mark_return_delegation(clp, delegation);
414
	}
415
	rcu_read_unlock();
L
Linus Torvalds 已提交
416 417
}

418 419 420 421 422
static void nfs_client_mark_return_all_delegations(struct nfs_client *clp)
{
	nfs_client_mark_return_all_delegation_types(clp, FMODE_READ|FMODE_WRITE);
}

423
static void nfs_delegation_run_state_manager(struct nfs_client *clp)
424
{
425 426
	if (test_bit(NFS4CLNT_DELEGRETURN, &clp->cl_state))
		nfs4_schedule_state_manager(clp);
427 428
}

429
void nfs_expire_all_delegation_types(struct nfs_client *clp, fmode_t flags)
430
{
431
	nfs_client_mark_return_all_delegation_types(clp, flags);
432
	nfs_delegation_run_state_manager(clp);
433 434
}

435 436 437 438 439
void nfs_expire_all_delegations(struct nfs_client *clp)
{
	nfs_expire_all_delegation_types(clp, FMODE_READ|FMODE_WRITE);
}

L
Linus Torvalds 已提交
440 441 442
/*
 * Return all delegations following an NFS4ERR_CB_PATH_DOWN error.
 */
443
void nfs_handle_cb_pathdown(struct nfs_client *clp)
L
Linus Torvalds 已提交
444 445 446
{
	if (clp == NULL)
		return;
447
	nfs_client_mark_return_all_delegations(clp);
L
Linus Torvalds 已提交
448 449
}

450 451 452 453 454 455 456 457
static void nfs_client_mark_return_unreferenced_delegations(struct nfs_client *clp)
{
	struct nfs_delegation *delegation;

	rcu_read_lock();
	list_for_each_entry_rcu(delegation, &clp->cl_delegations, super_list) {
		if (test_and_clear_bit(NFS_DELEGATION_REFERENCED, &delegation->flags))
			continue;
458
		nfs_mark_return_delegation(clp, delegation);
459 460 461 462 463 464 465 466 467 468
	}
	rcu_read_unlock();
}

void nfs_expire_unreferenced_delegations(struct nfs_client *clp)
{
	nfs_client_mark_return_unreferenced_delegations(clp);
	nfs_delegation_run_state_manager(clp);
}

L
Linus Torvalds 已提交
469 470 471
/*
 * Asynchronous delegation recall!
 */
A
Alexandros Batsakis 已提交
472 473 474
int nfs_async_inode_return_delegation(struct inode *inode, const nfs4_stateid *stateid,
				      int (*validate_stateid)(struct nfs_delegation *delegation,
							      const nfs4_stateid *stateid))
L
Linus Torvalds 已提交
475
{
476 477
	struct nfs_client *clp = NFS_SERVER(inode)->nfs_client;
	struct nfs_delegation *delegation;
L
Linus Torvalds 已提交
478

479 480
	rcu_read_lock();
	delegation = rcu_dereference(NFS_I(inode)->delegation);
A
Alexandros Batsakis 已提交
481 482

	if (!validate_stateid(delegation, stateid)) {
483 484 485
		rcu_read_unlock();
		return -ENOENT;
	}
A
Alexandros Batsakis 已提交
486

487 488 489 490
	nfs_mark_return_delegation(clp, delegation);
	rcu_read_unlock();
	nfs_delegation_run_state_manager(clp);
	return 0;
L
Linus Torvalds 已提交
491 492 493 494 495
}

/*
 * Retrieve the inode associated with a delegation
 */
496
struct inode *nfs_delegation_find_inode(struct nfs_client *clp, const struct nfs_fh *fhandle)
L
Linus Torvalds 已提交
497 498 499
{
	struct nfs_delegation *delegation;
	struct inode *res = NULL;
500 501
	rcu_read_lock();
	list_for_each_entry_rcu(delegation, &clp->cl_delegations, super_list) {
502 503 504
		spin_lock(&delegation->lock);
		if (delegation->inode != NULL &&
		    nfs_compare_fh(fhandle, &NFS_I(delegation->inode)->fh) == 0) {
L
Linus Torvalds 已提交
505 506
			res = igrab(delegation->inode);
		}
507 508 509
		spin_unlock(&delegation->lock);
		if (res != NULL)
			break;
L
Linus Torvalds 已提交
510
	}
511
	rcu_read_unlock();
L
Linus Torvalds 已提交
512 513 514 515 516 517
	return res;
}

/*
 * Mark all delegations as needing to be reclaimed
 */
518
void nfs_delegation_mark_reclaim(struct nfs_client *clp)
L
Linus Torvalds 已提交
519 520
{
	struct nfs_delegation *delegation;
521 522
	rcu_read_lock();
	list_for_each_entry_rcu(delegation, &clp->cl_delegations, super_list)
523
		set_bit(NFS_DELEGATION_NEED_RECLAIM, &delegation->flags);
524
	rcu_read_unlock();
L
Linus Torvalds 已提交
525 526 527 528 529
}

/*
 * Reap all unclaimed delegations after reboot recovery is done
 */
530
void nfs_delegation_reap_unclaimed(struct nfs_client *clp)
L
Linus Torvalds 已提交
531
{
532
	struct nfs_delegation *delegation;
533
	struct inode *inode;
534 535 536
restart:
	rcu_read_lock();
	list_for_each_entry_rcu(delegation, &clp->cl_delegations, super_list) {
537
		if (test_bit(NFS_DELEGATION_NEED_RECLAIM, &delegation->flags) == 0)
L
Linus Torvalds 已提交
538
			continue;
539 540 541
		inode = nfs_delegation_grab_inode(delegation);
		if (inode == NULL)
			continue;
542
		spin_lock(&clp->cl_lock);
543
		delegation = nfs_detach_delegation_locked(NFS_I(inode), NULL);
544 545 546
		spin_unlock(&clp->cl_lock);
		rcu_read_unlock();
		if (delegation != NULL)
547
			nfs_free_delegation(delegation);
548
		iput(inode);
549
		goto restart;
L
Linus Torvalds 已提交
550
	}
551
	rcu_read_unlock();
L
Linus Torvalds 已提交
552
}
553 554 555 556 557

int nfs4_copy_delegation_stateid(nfs4_stateid *dst, struct inode *inode)
{
	struct nfs_inode *nfsi = NFS_I(inode);
	struct nfs_delegation *delegation;
558
	int ret = 0;
559

560 561
	rcu_read_lock();
	delegation = rcu_dereference(nfsi->delegation);
562 563
	if (delegation != NULL) {
		memcpy(dst->data, delegation->stateid.data, sizeof(dst->data));
564
		ret = 1;
565
	}
566 567
	rcu_read_unlock();
	return ret;
568
}