unlink.c 15.5 KB
Newer Older
L
Linus Torvalds 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13
/*
 *  linux/fs/nfs/unlink.c
 *
 * nfs sillydelete handling
 *
 */

#include <linux/slab.h>
#include <linux/string.h>
#include <linux/dcache.h>
#include <linux/sunrpc/sched.h>
#include <linux/sunrpc/clnt.h>
#include <linux/nfs_fs.h>
14 15
#include <linux/sched.h>
#include <linux/wait.h>
16
#include <linux/namei.h>
17
#include <linux/fsnotify.h>
L
Linus Torvalds 已提交
18

19
#include "internal.h"
20
#include "nfs4_fs.h"
21 22
#include "iostat.h"
#include "delegation.h"
23

24 25
#include "nfstrace.h"

L
Linus Torvalds 已提交
26
/**
27
 * nfs_free_unlinkdata - release data from a sillydelete operation.
L
Linus Torvalds 已提交
28 29 30
 * @data: pointer to unlink structure.
 */
static void
31
nfs_free_unlinkdata(struct nfs_unlinkdata *data)
L
Linus Torvalds 已提交
32
{
33 34 35 36
	iput(data->dir);
	put_rpccred(data->cred);
	kfree(data->args.name.name);
	kfree(data);
L
Linus Torvalds 已提交
37 38 39 40 41 42 43 44
}

#define NAME_ALLOC_LEN(len)	((len+16) & ~15)
/**
 * nfs_copy_dname - copy dentry name to data structure
 * @dentry: pointer to dentry
 * @data: nfs_unlinkdata
 */
45
static int nfs_copy_dname(struct dentry *dentry, struct nfs_unlinkdata *data)
L
Linus Torvalds 已提交
46 47 48 49
{
	char		*str;
	int		len = dentry->d_name.len;

50
	str = kmemdup(dentry->d_name.name, NAME_ALLOC_LEN(len), GFP_KERNEL);
L
Linus Torvalds 已提交
51
	if (!str)
52 53 54 55
		return -ENOMEM;
	data->args.name.len = len;
	data->args.name.name = str;
	return 0;
L
Linus Torvalds 已提交
56 57
}

T
Trond Myklebust 已提交
58 59 60 61 62 63 64 65 66 67 68 69 70 71
/*
 * Release the name buffer stored in @data and reset the name to the
 * empty state (NULL pointer, zero length).
 */
static void nfs_free_dname(struct nfs_unlinkdata *data)
{
	kfree(data->args.name.name);

	/* Leave no stale pointer or length behind. */
	data->args.name.len = 0;
	data->args.name.name = NULL;
}

/*
 * Decrement the directory's silly_count and, when the new value is
 * exactly 1, wake up everything sleeping on the inode's waitqueue.
 */
static void nfs_dec_sillycount(struct inode *dir)
{
	struct nfs_inode *nfsi = NFS_I(dir);

	if (atomic_dec_return(&nfsi->silly_count) != 1)
		return;
	wake_up(&nfsi->waitqueue);
}

L
Linus Torvalds 已提交
72 73 74 75 76 77
/**
 * nfs_async_unlink_done - Sillydelete post-processing
 * @task: rpc_task of the sillydelete
 *
 * Do the directory attribute update.
 */
78
static void nfs_async_unlink_done(struct rpc_task *task, void *calldata)
L
Linus Torvalds 已提交
79
{
80 81 82
	struct nfs_unlinkdata *data = calldata;
	struct inode *dir = data->dir;

83
	trace_nfs_sillyrename_unlink(data, task->tk_status);
84
	if (!NFS_PROTO(dir)->unlink_done(task, dir))
85
		rpc_restart_call_prepare(task);
L
Linus Torvalds 已提交
86 87 88 89 90 91 92 93 94
}

/**
 * nfs_async_unlink_release - Release the sillydelete data.
 * @task: rpc_task of the sillydelete
 *
 * We need to call nfs_put_unlinkdata as a 'tk_release' task since the
 * rpc_task would be freed too.
 */
95
static void nfs_async_unlink_release(void *calldata)
L
Linus Torvalds 已提交
96
{
97
	struct nfs_unlinkdata	*data = calldata;
98
	struct super_block *sb = data->dir->i_sb;
T
Trond Myklebust 已提交
99 100

	nfs_dec_sillycount(data->dir);
101
	nfs_free_unlinkdata(data);
102
	nfs_sb_deactive(sb);
L
Linus Torvalds 已提交
103 104
}

105
static void nfs_unlink_prepare(struct rpc_task *task, void *calldata)
106 107
{
	struct nfs_unlinkdata *data = calldata;
108
	NFS_PROTO(data->dir)->unlink_rpc_prepare(task, data);
109 110
}

111 112 113
static const struct rpc_call_ops nfs_unlink_ops = {
	.rpc_call_done = nfs_async_unlink_done,
	.rpc_release = nfs_async_unlink_release,
114
	.rpc_call_prepare = nfs_unlink_prepare,
115 116
};

T
Trond Myklebust 已提交
117
static int nfs_do_call_unlink(struct dentry *parent, struct inode *dir, struct nfs_unlinkdata *data)
118
{
119 120 121 122 123
	struct rpc_message msg = {
		.rpc_argp = &data->args,
		.rpc_resp = &data->res,
		.rpc_cred = data->cred,
	};
T
Trond Myklebust 已提交
124
	struct rpc_task_setup task_setup_data = {
125
		.rpc_message = &msg,
T
Trond Myklebust 已提交
126 127
		.callback_ops = &nfs_unlink_ops,
		.callback_data = data,
128
		.workqueue = nfsiod_workqueue,
T
Trond Myklebust 已提交
129 130
		.flags = RPC_TASK_ASYNC,
	};
131
	struct rpc_task *task;
T
Trond Myklebust 已提交
132 133 134 135
	struct dentry *alias;

	alias = d_lookup(parent, &data->args.name);
	if (alias != NULL) {
136
		int ret;
137
		void *devname_garbage = NULL;
138

T
Trond Myklebust 已提交
139 140 141 142 143
		/*
		 * Hey, we raced with lookup... See if we need to transfer
		 * the sillyrename information to the aliased dentry.
		 */
		nfs_free_dname(data);
144
		ret = nfs_copy_dname(alias, data);
T
Trond Myklebust 已提交
145
		spin_lock(&alias->d_lock);
146
		if (ret == 0 && alias->d_inode != NULL &&
147
		    !(alias->d_flags & DCACHE_NFSFS_RENAMED)) {
148
			devname_garbage = alias->d_fsdata;
T
Trond Myklebust 已提交
149
			alias->d_fsdata = data;
T
Trond Myklebust 已提交
150
			alias->d_flags |= DCACHE_NFSFS_RENAMED;
T
Trond Myklebust 已提交
151
			ret = 1;
152 153
		} else
			ret = 0;
T
Trond Myklebust 已提交
154 155 156
		spin_unlock(&alias->d_lock);
		nfs_dec_sillycount(dir);
		dput(alias);
157 158 159 160 161
		/*
		 * If we'd displaced old cached devname, free it.  At that
		 * point dentry is definitely not a root, so we won't need
		 * that anymore.
		 */
162
		kfree(devname_garbage);
T
Trond Myklebust 已提交
163 164 165 166 167 168 169
		return ret;
	}
	data->dir = igrab(dir);
	if (!data->dir) {
		nfs_dec_sillycount(dir);
		return 0;
	}
170
	nfs_sb_active(dir->i_sb);
T
Trond Myklebust 已提交
171
	data->args.fh = NFS_FH(dir);
172
	nfs_fattr_init(data->res.dir_attr);
T
Trond Myklebust 已提交
173

174
	NFS_PROTO(dir)->unlink_setup(&msg, dir);
T
Trond Myklebust 已提交
175

176
	task_setup_data.rpc_client = NFS_CLIENT(dir);
T
Trond Myklebust 已提交
177
	task = rpc_run_task(&task_setup_data);
T
Trond Myklebust 已提交
178
	if (!IS_ERR(task))
179
		rpc_put_task_async(task);
T
Trond Myklebust 已提交
180 181 182 183 184
	return 1;
}

static int nfs_call_unlink(struct dentry *dentry, struct nfs_unlinkdata *data)
{
185 186
	struct dentry *parent;
	struct inode *dir;
T
Trond Myklebust 已提交
187
	int ret = 0;
188 189 190 191 192


	parent = dget_parent(dentry);
	if (parent == NULL)
		goto out_free;
T
Trond Myklebust 已提交
193 194 195 196 197 198 199 200 201 202 203 204 205
	dir = parent->d_inode;
	/* Non-exclusive lock protects against concurrent lookup() calls */
	spin_lock(&dir->i_lock);
	if (atomic_inc_not_zero(&NFS_I(dir)->silly_count) == 0) {
		/* Deferred delete */
		hlist_add_head(&data->list, &NFS_I(dir)->silly_list);
		spin_unlock(&dir->i_lock);
		ret = 1;
		goto out_dput;
	}
	spin_unlock(&dir->i_lock);
	ret = nfs_do_call_unlink(parent, dir, data);
out_dput:
206
	dput(parent);
T
Trond Myklebust 已提交
207 208 209
out_free:
	return ret;
}
210

211 212 213 214 215 216 217
/*
 * Sleep on the inode's waitqueue until the silly_count of @dentry's inode
 * is 1 or less.
 */
void nfs_wait_on_sillyrename(struct dentry *dentry)
{
	struct inode *inode = dentry->d_inode;
	struct nfs_inode *nfsi = NFS_I(inode);

	wait_event(nfsi->waitqueue, atomic_read(&nfsi->silly_count) <= 1);
}

T
Trond Myklebust 已提交
218 219 220
void nfs_block_sillyrename(struct dentry *dentry)
{
	struct nfs_inode *nfsi = NFS_I(dentry->d_inode);
221

T
Trond Myklebust 已提交
222 223 224 225 226 227 228 229 230 231 232 233 234 235 236 237 238 239 240 241 242 243
	wait_event(nfsi->waitqueue, atomic_cmpxchg(&nfsi->silly_count, 1, 0) == 1);
}

/*
 * Raise silly_count again and run every unlink that was queued on the
 * directory's silly_list.  Entries that nfs_do_call_unlink() does not take
 * over (return value 0) are freed here.
 */
void nfs_unblock_sillyrename(struct dentry *dentry)
{
	struct inode *dir = dentry->d_inode;
	struct nfs_inode *nfsi = NFS_I(dir);
	struct nfs_unlinkdata *pending;

	atomic_inc(&nfsi->silly_count);

	spin_lock(&dir->i_lock);
	/* Stop as soon as the list is empty or the count has gone to zero. */
	while (!hlist_empty(&nfsi->silly_list) &&
	       atomic_inc_not_zero(&nfsi->silly_count)) {
		pending = hlist_entry(nfsi->silly_list.first, struct nfs_unlinkdata, list);
		hlist_del(&pending->list);

		/* i_lock is released around the call and re-taken afterwards. */
		spin_unlock(&dir->i_lock);
		if (nfs_do_call_unlink(dentry, dir, pending) == 0)
			nfs_free_unlinkdata(pending);
		spin_lock(&dir->i_lock);
	}
	spin_unlock(&dir->i_lock);
}

L
Linus Torvalds 已提交
246 247
/**
 * nfs_async_unlink - asynchronous unlinking of a file
248
 * @dir: parent directory of dentry
L
Linus Torvalds 已提交
249 250
 * @dentry: dentry to unlink
 */
251
static int
252
nfs_async_unlink(struct inode *dir, struct dentry *dentry)
L
Linus Torvalds 已提交
253
{
254 255
	struct nfs_unlinkdata *data;
	int status = -ENOMEM;
256
	void *devname_garbage = NULL;
L
Linus Torvalds 已提交
257

258
	data = kzalloc(sizeof(*data), GFP_KERNEL);
259
	if (data == NULL)
L
Linus Torvalds 已提交
260 261
		goto out;

262
	data->cred = rpc_lookup_cred();
L
Linus Torvalds 已提交
263 264 265 266
	if (IS_ERR(data->cred)) {
		status = PTR_ERR(data->cred);
		goto out_free;
	}
267
	data->res.dir_attr = &data->dir_attr;
L
Linus Torvalds 已提交
268

269
	status = -EBUSY;
L
Linus Torvalds 已提交
270
	spin_lock(&dentry->d_lock);
271 272
	if (dentry->d_flags & DCACHE_NFSFS_RENAMED)
		goto out_unlock;
L
Linus Torvalds 已提交
273
	dentry->d_flags |= DCACHE_NFSFS_RENAMED;
274
	devname_garbage = dentry->d_fsdata;
275
	dentry->d_fsdata = data;
L
Linus Torvalds 已提交
276
	spin_unlock(&dentry->d_lock);
277 278 279 280 281
	/*
	 * If we'd displaced old cached devname, free it.  At that
	 * point dentry is definitely not a root, so we won't need
	 * that anymore.
	 */
282
	kfree(devname_garbage);
283 284 285 286
	return 0;
out_unlock:
	spin_unlock(&dentry->d_lock);
	put_rpccred(data->cred);
L
Linus Torvalds 已提交
287 288
out_free:
	kfree(data);
289
out:
L
Linus Torvalds 已提交
290 291 292 293 294 295
	return status;
}

/**
 * nfs_complete_unlink - Initialize completion of the sillydelete
 * @dentry: dentry to delete
296
 * @inode: inode
L
Linus Torvalds 已提交
297 298 299 300 301 302
 *
 * Since we're most likely to be called by dentry_iput(), we
 * only use the dentry to find the sillydelete. We then copy the name
 * into the qstr.
 */
void
303
nfs_complete_unlink(struct dentry *dentry, struct inode *inode)
L
Linus Torvalds 已提交
304
{
305
	struct nfs_unlinkdata	*data = NULL;
L
Linus Torvalds 已提交
306 307

	spin_lock(&dentry->d_lock);
308 309 310
	if (dentry->d_flags & DCACHE_NFSFS_RENAMED) {
		dentry->d_flags &= ~DCACHE_NFSFS_RENAMED;
		data = dentry->d_fsdata;
311
		dentry->d_fsdata = NULL;
312
	}
L
Linus Torvalds 已提交
313
	spin_unlock(&dentry->d_lock);
314 315 316

	if (data != NULL && (NFS_STALE(inode) || !nfs_call_unlink(dentry, data)))
		nfs_free_unlinkdata(data);
L
Linus Torvalds 已提交
317
}
318

319 320 321 322 323 324 325 326 327
/* Cancel a queued async unlink. Called when a sillyrename run fails. */
static void
nfs_cancel_async_unlink(struct dentry *dentry)
{
	spin_lock(&dentry->d_lock);
	if (dentry->d_flags & DCACHE_NFSFS_RENAMED) {
		struct nfs_unlinkdata *data = dentry->d_fsdata;

		dentry->d_flags &= ~DCACHE_NFSFS_RENAMED;
328
		dentry->d_fsdata = NULL;
329 330 331 332 333 334 335 336 337 338 339 340 341 342 343 344 345 346 347
		spin_unlock(&dentry->d_lock);
		nfs_free_unlinkdata(data);
		return;
	}
	spin_unlock(&dentry->d_lock);
}

/**
 * nfs_async_rename_done - Sillyrename post-processing
 * @task: rpc_task of the sillyrename
 * @calldata: nfs_renamedata for the sillyrename
 *
 * Do the directory attribute updates and the d_move
 */
static void nfs_async_rename_done(struct rpc_task *task, void *calldata)
{
	struct nfs_renamedata *data = calldata;
	struct inode *old_dir = data->old_dir;
	struct inode *new_dir = data->new_dir;
348
	struct dentry *old_dentry = data->old_dentry;
349

350 351
	trace_nfs_sillyrename_rename(old_dir, old_dentry,
			new_dir, data->new_dentry, task->tk_status);
352
	if (!NFS_PROTO(old_dir)->rename_done(task, old_dir, new_dir)) {
353
		rpc_restart_call_prepare(task);
354 355 356
		return;
	}

357 358
	if (data->complete)
		data->complete(task, data);
359 360 361 362 363 364 365 366 367 368 369 370 371 372 373 374 375 376 377 378 379 380 381 382 383 384
}

/**
 * nfs_async_rename_release - Release the sillyrename data.
 * @calldata: the struct nfs_renamedata to be released
 *
 * Marks the old dentry's inode (if it has one) for revalidation, then puts
 * both dentries, both directory inodes, the superblock activation and the
 * credential before freeing the structure.
 */
static void nfs_async_rename_release(void *calldata)
{
	struct nfs_renamedata	*data = calldata;
	/* Read the superblock before the directory inode is put below. */
	struct super_block *sb = data->old_dir->i_sb;
	struct inode *renamed = data->old_dentry->d_inode;

	if (renamed)
		nfs_mark_for_revalidate(renamed);

	dput(data->old_dentry);
	dput(data->new_dentry);
	iput(data->old_dir);
	iput(data->new_dir);
	nfs_sb_deactive(sb);
	put_rpccred(data->cred);
	kfree(data);
}

static void nfs_rename_prepare(struct rpc_task *task, void *calldata)
{
	struct nfs_renamedata *data = calldata;
385
	NFS_PROTO(data->old_dir)->rename_rpc_prepare(task, data);
386 387 388 389 390 391 392 393 394 395 396 397 398 399 400 401 402
}

/* RPC callbacks used by the asynchronous rename task. */
static const struct rpc_call_ops nfs_rename_ops = {
	.rpc_call_prepare = nfs_rename_prepare,
	.rpc_call_done = nfs_async_rename_done,
	.rpc_release = nfs_async_rename_release,
};

/**
 * nfs_async_rename - perform an asynchronous rename operation
 * @old_dir: directory that currently holds the dentry to be renamed
 * @new_dir: target directory for the rename
 * @old_dentry: original dentry to be renamed
 * @new_dentry: dentry to which the old_dentry should be renamed
 *
 * It's expected that valid references to the dentries and inodes are held
 */
403
struct rpc_task *
404
nfs_async_rename(struct inode *old_dir, struct inode *new_dir,
405 406
		 struct dentry *old_dentry, struct dentry *new_dentry,
		 void (*complete)(struct rpc_task *, struct nfs_renamedata *))
407 408 409 410 411 412 413 414 415 416 417
{
	struct nfs_renamedata *data;
	struct rpc_message msg = { };
	struct rpc_task_setup task_setup_data = {
		.rpc_message = &msg,
		.callback_ops = &nfs_rename_ops,
		.workqueue = nfsiod_workqueue,
		.rpc_client = NFS_CLIENT(old_dir),
		.flags = RPC_TASK_ASYNC,
	};

418
	data = kzalloc(sizeof(*data), GFP_KERNEL);
419 420
	if (data == NULL)
		return ERR_PTR(-ENOMEM);
421
	task_setup_data.callback_data = data;
422 423 424

	data->cred = rpc_lookup_cred();
	if (IS_ERR(data->cred)) {
425
		struct rpc_task *task = ERR_CAST(data->cred);
426 427 428 429 430 431 432 433 434 435
		kfree(data);
		return task;
	}

	msg.rpc_argp = &data->args;
	msg.rpc_resp = &data->res;
	msg.rpc_cred = data->cred;

	/* set up nfs_renamedata */
	data->old_dir = old_dir;
436
	ihold(old_dir);
437
	data->new_dir = new_dir;
438
	ihold(new_dir);
439 440 441 442
	data->old_dentry = dget(old_dentry);
	data->new_dentry = dget(new_dentry);
	nfs_fattr_init(&data->old_fattr);
	nfs_fattr_init(&data->new_fattr);
443
	data->complete = complete;
444 445 446 447 448 449 450 451 452 453 454 455 456 457 458

	/* set up nfs_renameargs */
	data->args.old_dir = NFS_FH(old_dir);
	data->args.old_name = &old_dentry->d_name;
	data->args.new_dir = NFS_FH(new_dir);
	data->args.new_name = &new_dentry->d_name;

	/* set up nfs_renameres */
	data->res.old_fattr = &data->old_fattr;
	data->res.new_fattr = &data->new_fattr;

	nfs_sb_active(old_dir->i_sb);

	NFS_PROTO(data->old_dir)->rename_setup(&msg, old_dir);

459
	return rpc_run_task(&task_setup_data);
460 461
}

462 463 464 465 466 467 468
/*
 * Perform tasks needed when a sillyrename is done such as cancelling the
 * queued async unlink if it failed.
 */
static void
nfs_complete_sillyrename(struct rpc_task *task, struct nfs_renamedata *data)
{
469 470 471 472 473 474 475 476 477 478 479 480
	struct dentry *dentry = data->old_dentry;

	if (task->tk_status != 0) {
		nfs_cancel_async_unlink(dentry);
		return;
	}

	/*
	 * vfs_unlink and the like do not issue this when a file is
	 * sillyrenamed, so do it here.
	 */
	fsnotify_nameremove(dentry, 0);
481 482
}

483 484 485 486 487 488 489 490
/*
 * Layout of a sillyrename target name: the ".nfs" prefix, then the file id
 * and a counter, each printed as zero-padded hex.  A byte takes two hex
 * digits, hence the "<< 1" on the sizeof values.  SILLYNAME_LEN is the
 * total length without the terminating NUL.
 */
#define SILLYNAME_PREFIX ".nfs"
#define SILLYNAME_PREFIX_LEN ((unsigned)sizeof(SILLYNAME_PREFIX) - 1)
#define SILLYNAME_FILEID_LEN ((unsigned)sizeof(u64) << 1)
#define SILLYNAME_COUNTER_LEN ((unsigned)sizeof(unsigned int) << 1)
#define SILLYNAME_LEN (SILLYNAME_PREFIX_LEN + \
		SILLYNAME_FILEID_LEN + \
		SILLYNAME_COUNTER_LEN)

491 492 493 494 495 496 497 498 499 500 501 502
/**
 * nfs_sillyrename - Perform a silly-rename of a dentry
 * @dir: inode of directory that contains dentry
 * @dentry: dentry to be sillyrenamed
 *
 * NFSv2/3 is stateless and the server doesn't know when the client is
 * holding a file open. To prevent application problems when a file is
 * unlinked while it's still open, the client performs a "silly-rename".
 * That is, it renames the file to a hidden file in the same directory,
 * and only performs the unlink once the last reference to it is put.
 *
 * The final cleanup is done during dentry_iput.
503 504 505 506 507 508 509 510
 *
 * (Note: NFSv4 is stateful, and has opens, so in theory an NFSv4 server
 * could take responsibility for keeping open files referenced.  The server
 * would also need to ensure that opened-but-deleted files were kept over
 * reboots.  However, we may not assume a server does so.  (RFC 5661
 * does provide an OPEN4_RESULT_PRESERVE_UNLINKED flag that a server can
 * use to advertise that it does this; some day we may take advantage of
 * it.))
511 512 513 514 515
 */
int
nfs_sillyrename(struct inode *dir, struct dentry *dentry)
{
	static unsigned int sillycounter;
516 517
	unsigned char silly[SILLYNAME_LEN + 1];
	unsigned long long fileid;
518
	struct dentry *sdentry;
519
	struct rpc_task *task;
520
	int            error = -EBUSY;
521

522 523
	dfprintk(VFS, "NFS: silly-rename(%pd2, ct=%d)\n",
		dentry, d_count(dentry));
524 525 526 527 528 529 530 531
	nfs_inc_stats(dir, NFSIOS_SILLYRENAME);

	/*
	 * We don't allow a dentry to be silly-renamed twice.
	 */
	if (dentry->d_flags & DCACHE_NFSFS_RENAMED)
		goto out;

532
	fileid = NFS_FILEID(dentry->d_inode);
533 534

	/* Return delegation in anticipation of the rename */
535
	NFS_PROTO(dentry->d_inode)->return_delegation(dentry->d_inode);
536 537 538

	sdentry = NULL;
	do {
539
		int slen;
540 541
		dput(sdentry);
		sillycounter++;
542 543 544 545
		slen = scnprintf(silly, sizeof(silly),
				SILLYNAME_PREFIX "%0*llx%0*x",
				SILLYNAME_FILEID_LEN, fileid,
				SILLYNAME_COUNTER_LEN, sillycounter);
546

547 548
		dfprintk(VFS, "NFS: trying to rename %pd to %s\n",
				dentry, silly);
549 550 551 552 553 554 555 556 557 558

		sdentry = lookup_one_len(silly, dentry->d_parent, slen);
		/*
		 * N.B. Better to return EBUSY here ... it could be
		 * dangerous to delete the file while it's in use.
		 */
		if (IS_ERR(sdentry))
			goto out;
	} while (sdentry->d_inode != NULL); /* need negative lookup */

559 560 561 562 563 564 565
	/* queue unlink first. Can't do this from rpc_release as it
	 * has to allocate memory
	 */
	error = nfs_async_unlink(dir, dentry);
	if (error)
		goto out_dput;

566 567 568 569 570 571 572 573
	/* populate unlinkdata with the right dname */
	error = nfs_copy_dname(sdentry,
				(struct nfs_unlinkdata *)dentry->d_fsdata);
	if (error) {
		nfs_cancel_async_unlink(dentry);
		goto out_dput;
	}

574
	/* run the rename task, undo unlink if it fails */
575 576
	task = nfs_async_rename(dir, dir, dentry, sdentry,
					nfs_complete_sillyrename);
577 578 579 580
	if (IS_ERR(task)) {
		error = -EBUSY;
		nfs_cancel_async_unlink(dentry);
		goto out_dput;
581
	}
582 583 584 585 586

	/* wait for the RPC task to complete, unless a SIGKILL intervenes */
	error = rpc_wait_for_completion_task(task);
	if (error == 0)
		error = task->tk_status;
587 588 589 590 591 592 593 594 595 596 597 598
	switch (error) {
	case 0:
		/* The rename succeeded */
		nfs_set_verifier(dentry, nfs_save_change_attribute(dir));
		d_move(dentry, sdentry);
		break;
	case -ERESTARTSYS:
		/* The result of the rename is unknown. Play it safe by
		 * forcing a new lookup */
		d_drop(dentry);
		d_drop(sdentry);
	}
599 600
	rpc_put_task(task);
out_dput:
601 602 603 604
	dput(sdentry);
out:
	return error;
}