/*
 * linux/fs/nfs/delegation.c
 *
 * Copyright (C) 2004 Trond Myklebust
 *
 * NFS file delegation management
 *
 */
#include <linux/completion.h>
10
#include <linux/kthread.h>
L
Linus Torvalds 已提交
11 12
#include <linux/module.h>
#include <linux/sched.h>
13
#include <linux/slab.h>
A
Alexey Dobriyan 已提交
14
#include <linux/smp_lock.h>
L
Linus Torvalds 已提交
15 16 17 18 19 20
#include <linux/spinlock.h>

#include <linux/nfs4.h>
#include <linux/nfs_fs.h>
#include <linux/nfs_xdr.h>

21
#include "nfs4_fs.h"
L
Linus Torvalds 已提交
22
#include "delegation.h"
23
#include "internal.h"
L
Linus Torvalds 已提交
24

25
/*
 * Release the memory that backs @delegation.
 */
static void nfs_do_free_delegation(struct nfs_delegation *delegation)
{
	kfree(delegation);
}

30 31 32 33
/*
 * RCU callback: map @head back to the nfs_delegation that embeds it
 * (through its "rcu" member) and free that delegation.
 */
static void nfs_free_delegation_callback(struct rcu_head *head)
{
	nfs_do_free_delegation(container_of(head, struct nfs_delegation, rcu));
}

/*
 * Dispose of @delegation: clear its credential pointer, queue the
 * structure to be freed through call_rcu(), and finally drop the
 * credential reference it was holding (if any).
 */
static void nfs_free_delegation(struct nfs_delegation *delegation)
{
	struct rpc_cred *old_cred = rcu_dereference(delegation->cred);

	rcu_assign_pointer(delegation->cred, NULL);
	call_rcu(&delegation->rcu, nfs_free_delegation_callback);
	if (old_cred != NULL)
		put_rpccred(old_cred);
}

48 49 50 51 52
/*
 * Set the NFS_DELEGATION_REFERENCED bit in @delegation's flags.
 */
void nfs_mark_delegation_referenced(struct nfs_delegation *delegation)
{
	set_bit(NFS_DELEGATION_REFERENCED, &delegation->flags);
}

53
/*
 * Report whether @inode holds a delegation covering every access mode
 * requested in @flags (only FMODE_READ and FMODE_WRITE are considered).
 *
 * Returns 1 and marks the delegation as referenced when it does,
 * 0 otherwise.
 */
int nfs_have_delegation(struct inode *inode, fmode_t flags)
{
	struct nfs_delegation *deleg;
	int found = 0;

	flags &= FMODE_READ|FMODE_WRITE;
	rcu_read_lock();
	deleg = rcu_dereference(NFS_I(inode)->delegation);
	if (deleg == NULL)
		goto out_unlock;
	if ((deleg->type & flags) != flags)
		goto out_unlock;
	nfs_mark_delegation_referenced(deleg);
	found = 1;
out_unlock:
	rcu_read_unlock();
	return found;
}

69 70 71 72
static int nfs_delegation_claim_locks(struct nfs_open_context *ctx, struct nfs4_state *state)
{
	struct inode *inode = state->inode;
	struct file_lock *fl;
73
	int status = 0;
74

75 76 77 78 79
	if (inode->i_flock == NULL)
		goto out;

	/* Protect inode->i_flock using the BKL */
	lock_kernel();
H
Harvey Harrison 已提交
80
	for (fl = inode->i_flock; fl != NULL; fl = fl->fl_next) {
81 82
		if (!(fl->fl_flags & (FL_POSIX|FL_FLOCK)))
			continue;
83
		if (nfs_file_open_context(fl->fl_file) != ctx)
84
			continue;
85
		unlock_kernel();
86
		status = nfs4_lock_delegation_recall(state, fl);
87
		if (status < 0)
88 89
			goto out;
		lock_kernel();
90
	}
91 92
	unlock_kernel();
out:
93 94 95
	return status;
}

96
static int nfs_delegation_claim_opens(struct inode *inode, const nfs4_stateid *stateid)
L
Linus Torvalds 已提交
97 98 99 100
{
	struct nfs_inode *nfsi = NFS_I(inode);
	struct nfs_open_context *ctx;
	struct nfs4_state *state;
101
	int err;
L
Linus Torvalds 已提交
102 103 104 105 106 107 108 109 110

again:
	spin_lock(&inode->i_lock);
	list_for_each_entry(ctx, &nfsi->open_files, list) {
		state = ctx->state;
		if (state == NULL)
			continue;
		if (!test_bit(NFS_DELEGATED_STATE, &state->flags))
			continue;
111 112
		if (memcmp(state->stateid.data, stateid->data, sizeof(state->stateid.data)) != 0)
			continue;
L
Linus Torvalds 已提交
113 114
		get_nfs_open_context(ctx);
		spin_unlock(&inode->i_lock);
115
		err = nfs4_open_delegation_recall(ctx, state, stateid);
116 117
		if (err >= 0)
			err = nfs_delegation_claim_locks(ctx, state);
L
Linus Torvalds 已提交
118
		put_nfs_open_context(ctx);
119
		if (err != 0)
120
			return err;
L
Linus Torvalds 已提交
121 122 123
		goto again;
	}
	spin_unlock(&inode->i_lock);
124
	return 0;
L
Linus Torvalds 已提交
125 126 127 128 129 130 131 132
}

/*
 * Set up a delegation on an inode
 */
void nfs_inode_reclaim_delegation(struct inode *inode, struct rpc_cred *cred, struct nfs_openres *res)
{
	struct nfs_delegation *delegation = NFS_I(inode)->delegation;
133
	struct rpc_cred *oldcred;
L
Linus Torvalds 已提交
134 135 136 137 138 139 140

	if (delegation == NULL)
		return;
	memcpy(delegation->stateid.data, res->delegation.data,
			sizeof(delegation->stateid.data));
	delegation->type = res->delegation_type;
	delegation->maxsize = res->maxsize;
141
	oldcred = delegation->cred;
L
Linus Torvalds 已提交
142
	delegation->cred = get_rpccred(cred);
143
	clear_bit(NFS_DELEGATION_NEED_RECLAIM, &delegation->flags);
L
Linus Torvalds 已提交
144 145
	NFS_I(inode)->delegation_state = delegation->type;
	smp_wmb();
146
	put_rpccred(oldcred);
L
Linus Torvalds 已提交
147 148
}

149 150 151 152 153 154 155 156 157
/*
 * Issue a DELEGRETURN for @delegation via nfs4_proc_delegreturn() and
 * then free the delegation, whatever the call returned.
 *
 * Returns the result of nfs4_proc_delegreturn().
 */
static int nfs_do_return_delegation(struct inode *inode, struct nfs_delegation *delegation, int issync)
{
	int status;

	status = nfs4_proc_delegreturn(inode, delegation->cred,
				       &delegation->stateid, issync);
	nfs_free_delegation(delegation);
	return status;
}

158 159 160 161 162 163 164 165 166 167 168
/*
 * Take a reference (igrab) on the inode that @delegation points at,
 * under delegation->lock.
 *
 * Returns the result of igrab(), or NULL when the delegation has no
 * inode attached.
 */
static struct inode *nfs_delegation_grab_inode(struct nfs_delegation *delegation)
{
	struct inode *inode;

	spin_lock(&delegation->lock);
	inode = delegation->inode;
	if (inode != NULL)
		inode = igrab(inode);
	spin_unlock(&delegation->lock);
	return inode;
}

169 170 171 172 173 174
static struct nfs_delegation *nfs_detach_delegation_locked(struct nfs_inode *nfsi, const nfs4_stateid *stateid)
{
	struct nfs_delegation *delegation = rcu_dereference(nfsi->delegation);

	if (delegation == NULL)
		goto nomatch;
175
	spin_lock(&delegation->lock);
176 177
	if (stateid != NULL && memcmp(delegation->stateid.data, stateid->data,
				sizeof(delegation->stateid.data)) != 0)
178
		goto nomatch_unlock;
179
	list_del_rcu(&delegation->super_list);
180
	delegation->inode = NULL;
181 182
	nfsi->delegation_state = 0;
	rcu_assign_pointer(nfsi->delegation, NULL);
183
	spin_unlock(&delegation->lock);
184
	return delegation;
185 186
nomatch_unlock:
	spin_unlock(&delegation->lock);
187 188 189 190
nomatch:
	return NULL;
}

L
Linus Torvalds 已提交
191 192 193 194 195
/*
 * Set up a delegation on an inode
 */
int nfs_inode_set_delegation(struct inode *inode, struct rpc_cred *cred, struct nfs_openres *res)
{
196
	struct nfs_client *clp = NFS_SERVER(inode)->nfs_client;
L
Linus Torvalds 已提交
197 198
	struct nfs_inode *nfsi = NFS_I(inode);
	struct nfs_delegation *delegation;
199
	struct nfs_delegation *freeme = NULL;
L
Linus Torvalds 已提交
200 201
	int status = 0;

202
	delegation = kmalloc(sizeof(*delegation), GFP_KERNEL);
L
Linus Torvalds 已提交
203 204 205 206 207 208
	if (delegation == NULL)
		return -ENOMEM;
	memcpy(delegation->stateid.data, res->delegation.data,
			sizeof(delegation->stateid.data));
	delegation->type = res->delegation_type;
	delegation->maxsize = res->maxsize;
209
	delegation->change_attr = nfsi->change_attr;
L
Linus Torvalds 已提交
210 211
	delegation->cred = get_rpccred(cred);
	delegation->inode = inode;
212
	delegation->flags = 1<<NFS_DELEGATION_REFERENCED;
213
	spin_lock_init(&delegation->lock);
L
Linus Torvalds 已提交
214 215

	spin_lock(&clp->cl_lock);
216
	if (rcu_dereference(nfsi->delegation) != NULL) {
L
Linus Torvalds 已提交
217
		if (memcmp(&delegation->stateid, &nfsi->delegation->stateid,
218 219 220
					sizeof(delegation->stateid)) == 0 &&
				delegation->type == nfsi->delegation->type) {
			goto out;
L
Linus Torvalds 已提交
221
		}
222 223 224 225 226 227
		/*
		 * Deal with broken servers that hand out two
		 * delegations for the same file.
		 */
		dfprintk(FILE, "%s: server %s handed out "
				"a duplicate delegation!\n",
228
				__func__, clp->cl_hostname);
229 230 231 232 233 234
		if (delegation->type <= nfsi->delegation->type) {
			freeme = delegation;
			delegation = NULL;
			goto out;
		}
		freeme = nfs_detach_delegation_locked(nfsi, NULL);
L
Linus Torvalds 已提交
235
	}
236 237 238 239
	list_add_rcu(&delegation->super_list, &clp->cl_delegations);
	nfsi->delegation_state = delegation->type;
	rcu_assign_pointer(nfsi->delegation, delegation);
	delegation = NULL;
240 241 242 243 244 245

	/* Ensure we revalidate the attributes and page cache! */
	spin_lock(&inode->i_lock);
	nfsi->cache_validity |= NFS_INO_REVAL_FORCED;
	spin_unlock(&inode->i_lock);

246
out:
L
Linus Torvalds 已提交
247
	spin_unlock(&clp->cl_lock);
248 249
	if (delegation != NULL)
		nfs_free_delegation(delegation);
250 251
	if (freeme != NULL)
		nfs_do_return_delegation(inode, freeme, 0);
L
Linus Torvalds 已提交
252 253 254 255 256 257 258 259 260 261 262 263 264 265
	return status;
}

/*
 * Sync all data to disk upon delegation return: start writeback on the
 * inode's mapping, call nfs_wb_all(), then wait for the writeback to
 * complete.  Return values of the three calls are not inspected.
 */
static void nfs_msync_inode(struct inode *inode)
{
	filemap_fdatawrite(inode->i_mapping);
	nfs_wb_all(inode);
	filemap_fdatawait(inode->i_mapping);
}

/*
 * Basic procedure for returning a delegation to the server
 */
266
static int __nfs_inode_return_delegation(struct inode *inode, struct nfs_delegation *delegation, int issync)
L
Linus Torvalds 已提交
267 268
{
	struct nfs_inode *nfsi = NFS_I(inode);
269
	int err;
L
Linus Torvalds 已提交
270

271 272 273 274
	/*
	 * Guard against new delegated open/lock/unlock calls and against
	 * state recovery
	 */
L
Linus Torvalds 已提交
275
	down_write(&nfsi->rwsem);
276
	err = nfs_delegation_claim_opens(inode, &delegation->stateid);
L
Linus Torvalds 已提交
277
	up_write(&nfsi->rwsem);
278 279
	if (err)
		goto out;
L
Linus Torvalds 已提交
280

281 282 283
	err = nfs_do_return_delegation(inode, delegation, issync);
out:
	return err;
284 285
}

286 287 288
/*
 * Return all delegations that have been marked for return
 */
289
int nfs_client_return_marked_delegations(struct nfs_client *clp)
290 291 292
{
	struct nfs_delegation *delegation;
	struct inode *inode;
293
	int err = 0;
294 295 296 297 298 299 300 301 302 303 304 305 306

restart:
	rcu_read_lock();
	list_for_each_entry_rcu(delegation, &clp->cl_delegations, super_list) {
		if (!test_and_clear_bit(NFS_DELEGATION_RETURN, &delegation->flags))
			continue;
		inode = nfs_delegation_grab_inode(delegation);
		if (inode == NULL)
			continue;
		spin_lock(&clp->cl_lock);
		delegation = nfs_detach_delegation_locked(NFS_I(inode), NULL);
		spin_unlock(&clp->cl_lock);
		rcu_read_unlock();
307 308 309 310
		if (delegation != NULL) {
			filemap_flush(inode->i_mapping);
			err = __nfs_inode_return_delegation(inode, delegation, 0);
		}
311
		iput(inode);
312 313 314 315
		if (!err)
			goto restart;
		set_bit(NFS4CLNT_DELEGRETURN, &clp->cl_state);
		return err;
316 317
	}
	rcu_read_unlock();
318
	return 0;
319 320
}

321 322 323 324 325 326 327 328 329 330 331 332 333 334 335 336 337 338 339 340 341
/*
 * This function returns the delegation without reclaiming opens
 * or protecting against delegation reclaims.
 * It is therefore really only safe to be called from
 * nfs4_clear_inode()
 *
 * The delegation is detached under clp->cl_lock and then returned
 * asynchronously; the result of the return is ignored.
 */
void nfs_inode_return_delegation_noreclaim(struct inode *inode)
{
	struct nfs_client *clp = NFS_SERVER(inode)->nfs_client;
	struct nfs_inode *nfsi = NFS_I(inode);
	struct nfs_delegation *delegation;

	if (rcu_dereference(nfsi->delegation) == NULL)
		return;

	spin_lock(&clp->cl_lock);
	delegation = nfs_detach_delegation_locked(nfsi, NULL);
	spin_unlock(&clp->cl_lock);

	if (delegation != NULL)
		nfs_do_return_delegation(inode, delegation, 0);
}

342 343 344 345 346 347 348
int nfs_inode_return_delegation(struct inode *inode)
{
	struct nfs_client *clp = NFS_SERVER(inode)->nfs_client;
	struct nfs_inode *nfsi = NFS_I(inode);
	struct nfs_delegation *delegation;
	int err = 0;

349
	if (rcu_dereference(nfsi->delegation) != NULL) {
350 351 352
		spin_lock(&clp->cl_lock);
		delegation = nfs_detach_delegation_locked(nfsi, NULL);
		spin_unlock(&clp->cl_lock);
353 354 355 356
		if (delegation != NULL) {
			nfs_msync_inode(inode);
			err = __nfs_inode_return_delegation(inode, delegation, 1);
		}
357 358
	}
	return err;
L
Linus Torvalds 已提交
359 360
}

361 362 363 364 365 366
/*
 * Flag @delegation for return (NFS_DELEGATION_RETURN) and record on the
 * client, via NFS4CLNT_DELEGRETURN in cl_state, that a return is pending.
 */
static void nfs_mark_return_delegation(struct nfs_client *clp, struct nfs_delegation *delegation)
{
	set_bit(NFS_DELEGATION_RETURN, &delegation->flags);
	set_bit(NFS4CLNT_DELEGRETURN, &clp->cl_state);
}

L
Linus Torvalds 已提交
367 368 369
/*
 * Return all delegations associated to a super block
 */
370
void nfs_super_return_all_delegations(struct super_block *sb)
L
Linus Torvalds 已提交
371
{
372
	struct nfs_client *clp = NFS_SB(sb)->nfs_client;
L
Linus Torvalds 已提交
373 374 375 376
	struct nfs_delegation *delegation;

	if (clp == NULL)
		return;
377 378
	rcu_read_lock();
	list_for_each_entry_rcu(delegation, &clp->cl_delegations, super_list) {
379 380
		spin_lock(&delegation->lock);
		if (delegation->inode != NULL && delegation->inode->i_sb == sb)
381
			set_bit(NFS_DELEGATION_RETURN, &delegation->flags);
382
		spin_unlock(&delegation->lock);
L
Linus Torvalds 已提交
383
	}
384
	rcu_read_unlock();
385 386
	if (nfs_client_return_marked_delegations(clp) != 0)
		nfs4_schedule_state_manager(clp);
387 388
}

389 390
/*
 * Mark for return every delegation of @clp whose type shares a mode bit
 * with @flags.  A delegation whose type is exactly
 * FMODE_READ|FMODE_WRITE is skipped unless @flags includes FMODE_WRITE.
 */
static void nfs_client_mark_return_all_delegation_types(struct nfs_client *clp, fmode_t flags)
{
	struct nfs_delegation *delegation;

	rcu_read_lock();
	list_for_each_entry_rcu(delegation, &clp->cl_delegations, super_list) {
		if (!(flags & FMODE_WRITE) &&
		    delegation->type == (FMODE_READ|FMODE_WRITE))
			continue;
		if (!(delegation->type & flags))
			continue;
		nfs_mark_return_delegation(clp, delegation);
	}
	rcu_read_unlock();
}

404 405 406 407 408
/*
 * Mark delegations of @clp for return, passing both FMODE_READ and
 * FMODE_WRITE as the type mask.
 */
static void nfs_client_mark_return_all_delegations(struct nfs_client *clp)
{
	nfs_client_mark_return_all_delegation_types(clp, FMODE_READ|FMODE_WRITE);
}

409
static void nfs_delegation_run_state_manager(struct nfs_client *clp)
410
{
411 412
	if (test_bit(NFS4CLNT_DELEGRETURN, &clp->cl_state))
		nfs4_schedule_state_manager(clp);
413 414
}

415
/*
 * Mark the delegations of @clp selected by @flags for return, then
 * schedule the state manager if a return is pending.
 */
void nfs_expire_all_delegation_types(struct nfs_client *clp, fmode_t flags)
{
	nfs_client_mark_return_all_delegation_types(clp, flags);
	nfs_delegation_run_state_manager(clp);
}

421 422 423 424 425
/*
 * Expire the delegations of @clp, passing both FMODE_READ and
 * FMODE_WRITE as the type mask.
 */
void nfs_expire_all_delegations(struct nfs_client *clp)
{
	nfs_expire_all_delegation_types(clp, FMODE_READ|FMODE_WRITE);
}

L
Linus Torvalds 已提交
426 427 428
/*
 * Return all delegations following an NFS4ERR_CB_PATH_DOWN error.
 */
429
void nfs_handle_cb_pathdown(struct nfs_client *clp)
L
Linus Torvalds 已提交
430 431 432
{
	if (clp == NULL)
		return;
433
	nfs_client_mark_return_all_delegations(clp);
L
Linus Torvalds 已提交
434 435
}

436 437 438 439 440 441 442 443
/*
 * Walk the delegations of @clp, clearing NFS_DELEGATION_REFERENCED on
 * each one.  Those that did not have the bit set are marked for return.
 */
static void nfs_client_mark_return_unreferenced_delegations(struct nfs_client *clp)
{
	struct nfs_delegation *delegation;

	rcu_read_lock();
	list_for_each_entry_rcu(delegation, &clp->cl_delegations, super_list) {
		if (!test_and_clear_bit(NFS_DELEGATION_REFERENCED, &delegation->flags))
			nfs_mark_return_delegation(clp, delegation);
	}
	rcu_read_unlock();
}

/*
 * Mark the unreferenced delegations of @clp for return, then schedule
 * the state manager if a return is pending.
 */
void nfs_expire_unreferenced_delegations(struct nfs_client *clp)
{
	nfs_client_mark_return_unreferenced_delegations(clp);
	nfs_delegation_run_state_manager(clp);
}

L
Linus Torvalds 已提交
455 456 457
/*
 * Asynchronous delegation recall!
 */
A
Alexandros Batsakis 已提交
458 459 460
int nfs_async_inode_return_delegation(struct inode *inode, const nfs4_stateid *stateid,
				      int (*validate_stateid)(struct nfs_delegation *delegation,
							      const nfs4_stateid *stateid))
L
Linus Torvalds 已提交
461
{
462 463
	struct nfs_client *clp = NFS_SERVER(inode)->nfs_client;
	struct nfs_delegation *delegation;
L
Linus Torvalds 已提交
464

465 466
	rcu_read_lock();
	delegation = rcu_dereference(NFS_I(inode)->delegation);
A
Alexandros Batsakis 已提交
467 468

	if (!validate_stateid(delegation, stateid)) {
469 470 471
		rcu_read_unlock();
		return -ENOENT;
	}
A
Alexandros Batsakis 已提交
472

473 474 475 476
	nfs_mark_return_delegation(clp, delegation);
	rcu_read_unlock();
	nfs_delegation_run_state_manager(clp);
	return 0;
L
Linus Torvalds 已提交
477 478 479 480 481
}

/*
 * Retrieve the inode associated with a delegation
 */
482
struct inode *nfs_delegation_find_inode(struct nfs_client *clp, const struct nfs_fh *fhandle)
L
Linus Torvalds 已提交
483 484 485
{
	struct nfs_delegation *delegation;
	struct inode *res = NULL;
486 487
	rcu_read_lock();
	list_for_each_entry_rcu(delegation, &clp->cl_delegations, super_list) {
488 489 490
		spin_lock(&delegation->lock);
		if (delegation->inode != NULL &&
		    nfs_compare_fh(fhandle, &NFS_I(delegation->inode)->fh) == 0) {
L
Linus Torvalds 已提交
491 492
			res = igrab(delegation->inode);
		}
493 494 495
		spin_unlock(&delegation->lock);
		if (res != NULL)
			break;
L
Linus Torvalds 已提交
496
	}
497
	rcu_read_unlock();
L
Linus Torvalds 已提交
498 499 500 501 502 503
	return res;
}

/*
 * Mark all delegations as needing to be reclaimed
 */
504
void nfs_delegation_mark_reclaim(struct nfs_client *clp)
L
Linus Torvalds 已提交
505 506
{
	struct nfs_delegation *delegation;
507 508
	rcu_read_lock();
	list_for_each_entry_rcu(delegation, &clp->cl_delegations, super_list)
509
		set_bit(NFS_DELEGATION_NEED_RECLAIM, &delegation->flags);
510
	rcu_read_unlock();
L
Linus Torvalds 已提交
511 512 513 514 515
}

/*
 * Reap all unclaimed delegations after reboot recovery is done
 */
516
void nfs_delegation_reap_unclaimed(struct nfs_client *clp)
L
Linus Torvalds 已提交
517
{
518
	struct nfs_delegation *delegation;
519
	struct inode *inode;
520 521 522
restart:
	rcu_read_lock();
	list_for_each_entry_rcu(delegation, &clp->cl_delegations, super_list) {
523
		if (test_bit(NFS_DELEGATION_NEED_RECLAIM, &delegation->flags) == 0)
L
Linus Torvalds 已提交
524
			continue;
525 526 527
		inode = nfs_delegation_grab_inode(delegation);
		if (inode == NULL)
			continue;
528
		spin_lock(&clp->cl_lock);
529
		delegation = nfs_detach_delegation_locked(NFS_I(inode), NULL);
530 531 532
		spin_unlock(&clp->cl_lock);
		rcu_read_unlock();
		if (delegation != NULL)
533
			nfs_free_delegation(delegation);
534
		iput(inode);
535
		goto restart;
L
Linus Torvalds 已提交
536
	}
537
	rcu_read_unlock();
L
Linus Torvalds 已提交
538
}
539 540 541 542 543

/*
 * Copy the stateid of the delegation held on @inode into @dst.
 *
 * Returns 1 if a delegation was present and its stateid was copied,
 * 0 if the inode has no delegation (@dst is then left untouched).
 */
int nfs4_copy_delegation_stateid(nfs4_stateid *dst, struct inode *inode)
{
	struct nfs_delegation *delegation;
	int copied = 0;

	rcu_read_lock();
	delegation = rcu_dereference(NFS_I(inode)->delegation);
	if (delegation != NULL) {
		memcpy(dst->data, delegation->stateid.data, sizeof(dst->data));
		copied = 1;
	}
	rcu_read_unlock();
	return copied;
}