/*
 * linux/fs/nfs/delegation.c
 *
 * Copyright (C) 2004 Trond Myklebust
 *
 * NFS file delegation management
 *
 */
#include <linux/completion.h>
#include <linux/kthread.h>
#include <linux/module.h>
#include <linux/sched.h>
#include <linux/smp_lock.h>
#include <linux/spinlock.h>

#include <linux/nfs4.h>
#include <linux/nfs_fs.h>
#include <linux/nfs_xdr.h>

#include "nfs4_fs.h"
#include "delegation.h"
#include "internal.h"

/*
 * Release the memory backing a delegation structure.
 */
static void nfs_do_free_delegation(struct nfs_delegation *delegation)
{
	kfree(delegation);
}

29 30 31 32
static void nfs_free_delegation_callback(struct rcu_head *head)
{
	struct nfs_delegation *delegation = container_of(head, struct nfs_delegation, rcu);

33 34 35 36 37 38 39 40 41 42 43 44
	nfs_do_free_delegation(delegation);
}

/*
 * Dispose of a delegation structure.
 *
 * The credential pointer is cleared, the structure is queued for freeing
 * through call_rcu(), and the reference on the credential it held (if
 * any) is dropped.
 */
static void nfs_free_delegation(struct nfs_delegation *delegation)
{
	struct rpc_cred *cred;

	cred = rcu_dereference(delegation->cred);
	rcu_assign_pointer(delegation->cred, NULL);
	call_rcu(&delegation->rcu, nfs_free_delegation_callback);
	if (cred)
		put_rpccred(cred);
}

47 48 49 50 51
void nfs_mark_delegation_referenced(struct nfs_delegation *delegation)
{
	set_bit(NFS_DELEGATION_REFERENCED, &delegation->flags);
}

52
int nfs_have_delegation(struct inode *inode, fmode_t flags)
53 54 55 56 57 58 59 60 61 62 63 64 65 66 67
{
	struct nfs_delegation *delegation;
	int ret = 0;

	flags &= FMODE_READ|FMODE_WRITE;
	rcu_read_lock();
	delegation = rcu_dereference(NFS_I(inode)->delegation);
	if (delegation != NULL && (delegation->type & flags) == flags) {
		nfs_mark_delegation_referenced(delegation);
		ret = 1;
	}
	rcu_read_unlock();
	return ret;
}

68 69 70 71
static int nfs_delegation_claim_locks(struct nfs_open_context *ctx, struct nfs4_state *state)
{
	struct inode *inode = state->inode;
	struct file_lock *fl;
72
	int status = 0;
73

74 75 76 77 78
	if (inode->i_flock == NULL)
		goto out;

	/* Protect inode->i_flock using the BKL */
	lock_kernel();
H
Harvey Harrison 已提交
79
	for (fl = inode->i_flock; fl != NULL; fl = fl->fl_next) {
80 81
		if (!(fl->fl_flags & (FL_POSIX|FL_FLOCK)))
			continue;
82
		if (nfs_file_open_context(fl->fl_file) != ctx)
83
			continue;
84
		unlock_kernel();
85
		status = nfs4_lock_delegation_recall(state, fl);
86
		if (status < 0)
87 88
			goto out;
		lock_kernel();
89
	}
90 91
	unlock_kernel();
out:
92 93 94
	return status;
}

95
static int nfs_delegation_claim_opens(struct inode *inode, const nfs4_stateid *stateid)
L
Linus Torvalds 已提交
96 97 98 99
{
	struct nfs_inode *nfsi = NFS_I(inode);
	struct nfs_open_context *ctx;
	struct nfs4_state *state;
100
	int err;
L
Linus Torvalds 已提交
101 102 103 104 105 106 107 108 109

again:
	spin_lock(&inode->i_lock);
	list_for_each_entry(ctx, &nfsi->open_files, list) {
		state = ctx->state;
		if (state == NULL)
			continue;
		if (!test_bit(NFS_DELEGATED_STATE, &state->flags))
			continue;
110 111
		if (memcmp(state->stateid.data, stateid->data, sizeof(state->stateid.data)) != 0)
			continue;
L
Linus Torvalds 已提交
112 113
		get_nfs_open_context(ctx);
		spin_unlock(&inode->i_lock);
114
		err = nfs4_open_delegation_recall(ctx, state, stateid);
115 116
		if (err >= 0)
			err = nfs_delegation_claim_locks(ctx, state);
L
Linus Torvalds 已提交
117
		put_nfs_open_context(ctx);
118
		if (err != 0)
119
			return err;
L
Linus Torvalds 已提交
120 121 122
		goto again;
	}
	spin_unlock(&inode->i_lock);
123
	return 0;
L
Linus Torvalds 已提交
124 125 126 127 128 129 130 131
}

/*
 * Set up a delegation on an inode
 */
void nfs_inode_reclaim_delegation(struct inode *inode, struct rpc_cred *cred, struct nfs_openres *res)
{
	struct nfs_delegation *delegation = NFS_I(inode)->delegation;
132
	struct rpc_cred *oldcred;
L
Linus Torvalds 已提交
133 134 135 136 137 138 139

	if (delegation == NULL)
		return;
	memcpy(delegation->stateid.data, res->delegation.data,
			sizeof(delegation->stateid.data));
	delegation->type = res->delegation_type;
	delegation->maxsize = res->maxsize;
140
	oldcred = delegation->cred;
L
Linus Torvalds 已提交
141
	delegation->cred = get_rpccred(cred);
142
	clear_bit(NFS_DELEGATION_NEED_RECLAIM, &delegation->flags);
L
Linus Torvalds 已提交
143 144
	NFS_I(inode)->delegation_state = delegation->type;
	smp_wmb();
145
	put_rpccred(oldcred);
L
Linus Torvalds 已提交
146 147
}

148 149 150 151 152 153 154 155 156
static int nfs_do_return_delegation(struct inode *inode, struct nfs_delegation *delegation, int issync)
{
	int res = 0;

	res = nfs4_proc_delegreturn(inode, delegation->cred, &delegation->stateid, issync);
	nfs_free_delegation(delegation);
	return res;
}

157 158 159 160 161 162 163 164 165 166 167
static struct inode *nfs_delegation_grab_inode(struct nfs_delegation *delegation)
{
	struct inode *inode = NULL;

	spin_lock(&delegation->lock);
	if (delegation->inode != NULL)
		inode = igrab(delegation->inode);
	spin_unlock(&delegation->lock);
	return inode;
}

168 169 170 171 172 173
static struct nfs_delegation *nfs_detach_delegation_locked(struct nfs_inode *nfsi, const nfs4_stateid *stateid)
{
	struct nfs_delegation *delegation = rcu_dereference(nfsi->delegation);

	if (delegation == NULL)
		goto nomatch;
174
	spin_lock(&delegation->lock);
175 176
	if (stateid != NULL && memcmp(delegation->stateid.data, stateid->data,
				sizeof(delegation->stateid.data)) != 0)
177
		goto nomatch_unlock;
178
	list_del_rcu(&delegation->super_list);
179
	delegation->inode = NULL;
180 181
	nfsi->delegation_state = 0;
	rcu_assign_pointer(nfsi->delegation, NULL);
182
	spin_unlock(&delegation->lock);
183
	return delegation;
184 185
nomatch_unlock:
	spin_unlock(&delegation->lock);
186 187 188 189
nomatch:
	return NULL;
}

L
Linus Torvalds 已提交
190 191 192 193 194
/*
 * Set up a delegation on an inode
 */
int nfs_inode_set_delegation(struct inode *inode, struct rpc_cred *cred, struct nfs_openres *res)
{
195
	struct nfs_client *clp = NFS_SERVER(inode)->nfs_client;
L
Linus Torvalds 已提交
196 197
	struct nfs_inode *nfsi = NFS_I(inode);
	struct nfs_delegation *delegation;
198
	struct nfs_delegation *freeme = NULL;
L
Linus Torvalds 已提交
199 200
	int status = 0;

201
	delegation = kmalloc(sizeof(*delegation), GFP_KERNEL);
L
Linus Torvalds 已提交
202 203 204 205 206 207
	if (delegation == NULL)
		return -ENOMEM;
	memcpy(delegation->stateid.data, res->delegation.data,
			sizeof(delegation->stateid.data));
	delegation->type = res->delegation_type;
	delegation->maxsize = res->maxsize;
208
	delegation->change_attr = nfsi->change_attr;
L
Linus Torvalds 已提交
209 210
	delegation->cred = get_rpccred(cred);
	delegation->inode = inode;
211
	delegation->flags = 1<<NFS_DELEGATION_REFERENCED;
212
	spin_lock_init(&delegation->lock);
L
Linus Torvalds 已提交
213 214

	spin_lock(&clp->cl_lock);
215
	if (rcu_dereference(nfsi->delegation) != NULL) {
L
Linus Torvalds 已提交
216
		if (memcmp(&delegation->stateid, &nfsi->delegation->stateid,
217 218 219
					sizeof(delegation->stateid)) == 0 &&
				delegation->type == nfsi->delegation->type) {
			goto out;
L
Linus Torvalds 已提交
220
		}
221 222 223 224 225 226
		/*
		 * Deal with broken servers that hand out two
		 * delegations for the same file.
		 */
		dfprintk(FILE, "%s: server %s handed out "
				"a duplicate delegation!\n",
227
				__func__, clp->cl_hostname);
228 229 230 231 232 233
		if (delegation->type <= nfsi->delegation->type) {
			freeme = delegation;
			delegation = NULL;
			goto out;
		}
		freeme = nfs_detach_delegation_locked(nfsi, NULL);
L
Linus Torvalds 已提交
234
	}
235 236 237 238
	list_add_rcu(&delegation->super_list, &clp->cl_delegations);
	nfsi->delegation_state = delegation->type;
	rcu_assign_pointer(nfsi->delegation, delegation);
	delegation = NULL;
239 240 241 242 243 244

	/* Ensure we revalidate the attributes and page cache! */
	spin_lock(&inode->i_lock);
	nfsi->cache_validity |= NFS_INO_REVAL_FORCED;
	spin_unlock(&inode->i_lock);

245
out:
L
Linus Torvalds 已提交
246
	spin_unlock(&clp->cl_lock);
247 248
	if (delegation != NULL)
		nfs_free_delegation(delegation);
249 250
	if (freeme != NULL)
		nfs_do_return_delegation(inode, freeme, 0);
L
Linus Torvalds 已提交
251 252 253 254 255 256 257 258 259 260 261 262 263 264
	return status;
}

/*
 * Flush an inode's data before its delegation is returned: start
 * writeback on the mapping, run nfs_wb_all(), then wait for the
 * writeback to finish.
 */
static void nfs_msync_inode(struct inode *inode)
{
	struct address_space *mapping = inode->i_mapping;

	filemap_fdatawrite(mapping);
	nfs_wb_all(inode);
	filemap_fdatawait(mapping);
}

/*
 * Basic procedure for returning a delegation to the server
 */
265
static int __nfs_inode_return_delegation(struct inode *inode, struct nfs_delegation *delegation, int issync)
L
Linus Torvalds 已提交
266 267
{
	struct nfs_inode *nfsi = NFS_I(inode);
268
	int err;
L
Linus Torvalds 已提交
269

270 271 272 273
	/*
	 * Guard against new delegated open/lock/unlock calls and against
	 * state recovery
	 */
L
Linus Torvalds 已提交
274
	down_write(&nfsi->rwsem);
275
	err = nfs_delegation_claim_opens(inode, &delegation->stateid);
L
Linus Torvalds 已提交
276
	up_write(&nfsi->rwsem);
277 278
	if (err)
		goto out;
L
Linus Torvalds 已提交
279

280 281 282
	err = nfs_do_return_delegation(inode, delegation, issync);
out:
	return err;
283 284
}

285 286 287
/*
 * Return all delegations that have been marked for return
 */
288
int nfs_client_return_marked_delegations(struct nfs_client *clp)
289 290 291
{
	struct nfs_delegation *delegation;
	struct inode *inode;
292
	int err = 0;
293 294 295 296 297 298 299 300 301 302 303 304 305

restart:
	rcu_read_lock();
	list_for_each_entry_rcu(delegation, &clp->cl_delegations, super_list) {
		if (!test_and_clear_bit(NFS_DELEGATION_RETURN, &delegation->flags))
			continue;
		inode = nfs_delegation_grab_inode(delegation);
		if (inode == NULL)
			continue;
		spin_lock(&clp->cl_lock);
		delegation = nfs_detach_delegation_locked(NFS_I(inode), NULL);
		spin_unlock(&clp->cl_lock);
		rcu_read_unlock();
306 307 308 309
		if (delegation != NULL) {
			filemap_flush(inode->i_mapping);
			err = __nfs_inode_return_delegation(inode, delegation, 0);
		}
310
		iput(inode);
311 312 313 314
		if (!err)
			goto restart;
		set_bit(NFS4CLNT_DELEGRETURN, &clp->cl_state);
		return err;
315 316
	}
	rcu_read_unlock();
317
	return 0;
318 319
}

320 321 322 323 324 325 326 327 328 329 330 331 332 333 334 335 336 337 338 339 340
/*
 * This function returns the delegation without reclaiming opens
 * or protecting against delegation reclaims.
 * It is therefore really only safe to be called from
 * nfs4_clear_inode()
 */
void nfs_inode_return_delegation_noreclaim(struct inode *inode)
{
	struct nfs_client *clp = NFS_SERVER(inode)->nfs_client;
	struct nfs_inode *nfsi = NFS_I(inode);
	struct nfs_delegation *delegation;

	if (rcu_dereference(nfsi->delegation) != NULL) {
		spin_lock(&clp->cl_lock);
		delegation = nfs_detach_delegation_locked(nfsi, NULL);
		spin_unlock(&clp->cl_lock);
		if (delegation != NULL)
			nfs_do_return_delegation(inode, delegation, 0);
	}
}

341 342 343 344 345 346 347
int nfs_inode_return_delegation(struct inode *inode)
{
	struct nfs_client *clp = NFS_SERVER(inode)->nfs_client;
	struct nfs_inode *nfsi = NFS_I(inode);
	struct nfs_delegation *delegation;
	int err = 0;

348
	if (rcu_dereference(nfsi->delegation) != NULL) {
349 350 351
		spin_lock(&clp->cl_lock);
		delegation = nfs_detach_delegation_locked(nfsi, NULL);
		spin_unlock(&clp->cl_lock);
352 353 354 355
		if (delegation != NULL) {
			nfs_msync_inode(inode);
			err = __nfs_inode_return_delegation(inode, delegation, 1);
		}
356 357
	}
	return err;
L
Linus Torvalds 已提交
358 359
}

360 361 362 363 364 365
static void nfs_mark_return_delegation(struct nfs_client *clp, struct nfs_delegation *delegation)
{
	set_bit(NFS_DELEGATION_RETURN, &delegation->flags);
	set_bit(NFS4CLNT_DELEGRETURN, &clp->cl_state);
}

L
Linus Torvalds 已提交
366 367 368
/*
 * Return all delegations associated to a super block
 */
369
void nfs_super_return_all_delegations(struct super_block *sb)
L
Linus Torvalds 已提交
370
{
371
	struct nfs_client *clp = NFS_SB(sb)->nfs_client;
L
Linus Torvalds 已提交
372 373 374 375
	struct nfs_delegation *delegation;

	if (clp == NULL)
		return;
376 377
	rcu_read_lock();
	list_for_each_entry_rcu(delegation, &clp->cl_delegations, super_list) {
378 379
		spin_lock(&delegation->lock);
		if (delegation->inode != NULL && delegation->inode->i_sb == sb)
380
			set_bit(NFS_DELEGATION_RETURN, &delegation->flags);
381
		spin_unlock(&delegation->lock);
L
Linus Torvalds 已提交
382
	}
383
	rcu_read_unlock();
384 385
	if (nfs_client_return_marked_delegations(clp) != 0)
		nfs4_schedule_state_manager(clp);
386 387
}

388 389
static
void nfs_client_mark_return_all_delegation_types(struct nfs_client *clp, fmode_t flags)
390 391 392 393
{
	struct nfs_delegation *delegation;

	rcu_read_lock();
394
	list_for_each_entry_rcu(delegation, &clp->cl_delegations, super_list) {
395 396 397 398
		if ((delegation->type == (FMODE_READ|FMODE_WRITE)) && !(flags & FMODE_WRITE))
			continue;
		if (delegation->type & flags)
			nfs_mark_return_delegation(clp, delegation);
399
	}
400
	rcu_read_unlock();
L
Linus Torvalds 已提交
401 402
}

403 404 405 406 407
static void nfs_client_mark_return_all_delegations(struct nfs_client *clp)
{
	nfs_client_mark_return_all_delegation_types(clp, FMODE_READ|FMODE_WRITE);
}

408
static void nfs_delegation_run_state_manager(struct nfs_client *clp)
409
{
410 411
	if (test_bit(NFS4CLNT_DELEGRETURN, &clp->cl_state))
		nfs4_schedule_state_manager(clp);
412 413
}

414
static void nfs_expire_all_delegation_types(struct nfs_client *clp, fmode_t flags)
415
{
416
	nfs_client_mark_return_all_delegation_types(clp, flags);
417
	nfs_delegation_run_state_manager(clp);
418 419
}

420 421 422 423 424
void nfs_expire_all_delegations(struct nfs_client *clp)
{
	nfs_expire_all_delegation_types(clp, FMODE_READ|FMODE_WRITE);
}

L
Linus Torvalds 已提交
425 426 427
/*
 * Return all delegations following an NFS4ERR_CB_PATH_DOWN error.
 */
428
void nfs_handle_cb_pathdown(struct nfs_client *clp)
L
Linus Torvalds 已提交
429 430 431
{
	if (clp == NULL)
		return;
432
	nfs_client_mark_return_all_delegations(clp);
L
Linus Torvalds 已提交
433 434
}

435 436 437 438 439 440 441 442
static void nfs_client_mark_return_unreferenced_delegations(struct nfs_client *clp)
{
	struct nfs_delegation *delegation;

	rcu_read_lock();
	list_for_each_entry_rcu(delegation, &clp->cl_delegations, super_list) {
		if (test_and_clear_bit(NFS_DELEGATION_REFERENCED, &delegation->flags))
			continue;
443
		nfs_mark_return_delegation(clp, delegation);
444 445 446 447 448 449 450 451 452 453
	}
	rcu_read_unlock();
}

/*
 * Mark the client's unreferenced delegations for return, then schedule
 * the state manager if any return is pending.
 */
void nfs_expire_unreferenced_delegations(struct nfs_client *clp)
{
	nfs_client_mark_return_unreferenced_delegations(clp);
	nfs_delegation_run_state_manager(clp);
}

L
Linus Torvalds 已提交
454 455 456 457 458
/*
 * Asynchronous delegation recall!
 */
int nfs_async_inode_return_delegation(struct inode *inode, const nfs4_stateid *stateid)
{
459 460
	struct nfs_client *clp = NFS_SERVER(inode)->nfs_client;
	struct nfs_delegation *delegation;
L
Linus Torvalds 已提交
461

462 463 464 465 466 467 468 469 470 471 472
	rcu_read_lock();
	delegation = rcu_dereference(NFS_I(inode)->delegation);
	if (delegation == NULL || memcmp(delegation->stateid.data, stateid->data,
				sizeof(delegation->stateid.data)) != 0) {
		rcu_read_unlock();
		return -ENOENT;
	}
	nfs_mark_return_delegation(clp, delegation);
	rcu_read_unlock();
	nfs_delegation_run_state_manager(clp);
	return 0;
L
Linus Torvalds 已提交
473 474 475 476 477
}

/*
 * Retrieve the inode associated with a delegation
 */
478
struct inode *nfs_delegation_find_inode(struct nfs_client *clp, const struct nfs_fh *fhandle)
L
Linus Torvalds 已提交
479 480 481
{
	struct nfs_delegation *delegation;
	struct inode *res = NULL;
482 483
	rcu_read_lock();
	list_for_each_entry_rcu(delegation, &clp->cl_delegations, super_list) {
484 485 486
		spin_lock(&delegation->lock);
		if (delegation->inode != NULL &&
		    nfs_compare_fh(fhandle, &NFS_I(delegation->inode)->fh) == 0) {
L
Linus Torvalds 已提交
487 488
			res = igrab(delegation->inode);
		}
489 490 491
		spin_unlock(&delegation->lock);
		if (res != NULL)
			break;
L
Linus Torvalds 已提交
492
	}
493
	rcu_read_unlock();
L
Linus Torvalds 已提交
494 495 496 497 498 499
	return res;
}

/*
 * Mark all delegations as needing to be reclaimed
 */
500
void nfs_delegation_mark_reclaim(struct nfs_client *clp)
L
Linus Torvalds 已提交
501 502
{
	struct nfs_delegation *delegation;
503 504
	rcu_read_lock();
	list_for_each_entry_rcu(delegation, &clp->cl_delegations, super_list)
505
		set_bit(NFS_DELEGATION_NEED_RECLAIM, &delegation->flags);
506
	rcu_read_unlock();
L
Linus Torvalds 已提交
507 508 509 510 511
}

/*
 * Reap all unclaimed delegations after reboot recovery is done
 */
512
void nfs_delegation_reap_unclaimed(struct nfs_client *clp)
L
Linus Torvalds 已提交
513
{
514
	struct nfs_delegation *delegation;
515
	struct inode *inode;
516 517 518
restart:
	rcu_read_lock();
	list_for_each_entry_rcu(delegation, &clp->cl_delegations, super_list) {
519
		if (test_bit(NFS_DELEGATION_NEED_RECLAIM, &delegation->flags) == 0)
L
Linus Torvalds 已提交
520
			continue;
521 522 523
		inode = nfs_delegation_grab_inode(delegation);
		if (inode == NULL)
			continue;
524
		spin_lock(&clp->cl_lock);
525
		delegation = nfs_detach_delegation_locked(NFS_I(inode), NULL);
526 527 528
		spin_unlock(&clp->cl_lock);
		rcu_read_unlock();
		if (delegation != NULL)
529
			nfs_free_delegation(delegation);
530
		iput(inode);
531
		goto restart;
L
Linus Torvalds 已提交
532
	}
533
	rcu_read_unlock();
L
Linus Torvalds 已提交
534
}
535 536 537 538 539

/*
 * Copy the stateid of an inode's delegation into @dst.
 *
 * Returns 1 if the inode has a delegation and its stateid was copied,
 * 0 if there is no delegation (in which case @dst is left untouched).
 */
int nfs4_copy_delegation_stateid(nfs4_stateid *dst, struct inode *inode)
{
	struct nfs_inode *nfsi = NFS_I(inode);
	struct nfs_delegation *delegation;
	int ret = 0;

	rcu_read_lock();
	delegation = rcu_dereference(nfsi->delegation);
	if (delegation != NULL) {
		memcpy(dst->data, delegation->stateid.data, sizeof(dst->data));
		ret = 1;
	}
	rcu_read_unlock();
	return ret;
}