dir.c 42.4 KB
Newer Older
1 2
/*
  FUSE: Filesystem in Userspace
  Copyright (C) 2001-2008  Miklos Szeredi <miklos@szeredi.hu>

  This program can be distributed under the terms of the GNU GPL.
  See the file COPYING.
*/

#include "fuse_i.h"

#include <linux/pagemap.h>
#include <linux/file.h>
#include <linux/sched.h>
#include <linux/namei.h>
15
#include <linux/slab.h>
S
Seth Forshee 已提交
16
#include <linux/xattr.h>
17
#include <linux/iversion.h>
S
Seth Forshee 已提交
18
#include <linux/posix_acl.h>
19

20 21 22 23 24 25 26
static void fuse_advise_use_readdirplus(struct inode *dir)
{
	struct fuse_inode *fi = get_fuse_inode(dir);

	set_bit(FUSE_I_ADVISE_RDPLUS, &fi->state);
}

M
Miklos Szeredi 已提交
27 28 29 30 31
/*
 * Per-dentry private data.  fuse_dentry_init() allocates one of these and
 * stores it in dentry->d_fsdata; fuse_dentry_release() frees it.
 */
union fuse_dentry {
	u64 time;		/* accessed via fuse_dentry_time()/fuse_dentry_settime() */
	struct rcu_head rcu;	/* handed to kfree_rcu() by fuse_dentry_release() */
};

M
Miklos Szeredi 已提交
32 33
/* Store @time in the union fuse_dentry referenced by @entry->d_fsdata. */
static inline void fuse_dentry_settime(struct dentry *entry, u64 time)
{
	union fuse_dentry *fd = entry->d_fsdata;

	fd->time = time;
}

static inline u64 fuse_dentry_time(struct dentry *entry)
{
M
Miklos Szeredi 已提交
39
	return ((union fuse_dentry *) entry->d_fsdata)->time;
M
Miklos Szeredi 已提交
40 41
}

42 43 44
/*
 * FUSE caches dentries and attributes with separate timeouts.  The
 * time in jiffies until the dentry/attributes are valid is stored in
 * dentry->d_fsdata and fuse_inode->i_time respectively.
 */

/*
 * Calculate the time in jiffies until a dentry/attributes are valid
 */
M
Miklos Szeredi 已提交
51
static u64 time_to_jiffies(u64 sec, u32 nsec)
52
{
M
Miklos Szeredi 已提交
53
	if (sec || nsec) {
M
Miklos Szeredi 已提交
54 55
		struct timespec64 ts = {
			sec,
56
			min_t(u32, nsec, NSEC_PER_SEC - 1)
M
Miklos Szeredi 已提交
57 58 59
		};

		return get_jiffies_64() + timespec64_to_jiffies(&ts);
M
Miklos Szeredi 已提交
60
	} else
M
Miklos Szeredi 已提交
61
		return 0;
62 63
}

64 65 66 67
/*
 * Set dentry and possibly attribute timeouts from the lookup/mk*
 * replies
 */
M
Miklos Szeredi 已提交
68
void fuse_change_entry_timeout(struct dentry *entry, struct fuse_entry_out *o)
69
{
M
Miklos Szeredi 已提交
70 71
	fuse_dentry_settime(entry,
		time_to_jiffies(o->entry_valid, o->entry_valid_nsec));
72 73 74 75 76 77 78
}

/* Attribute expiry (in jiffies) taken from the attr_valid fields of @o. */
static u64 attr_timeout(struct fuse_attr_out *o)
{
	u64 expiry = time_to_jiffies(o->attr_valid, o->attr_valid_nsec);

	return expiry;
}

M
Miklos Szeredi 已提交
79
u64 entry_attr_timeout(struct fuse_entry_out *o)
80 81
{
	return time_to_jiffies(o->attr_valid, o->attr_valid_nsec);
82 83
}

84 85 86 87 88
/* Set the bits of @mask in the inode's inval_mask (no bits are cleared). */
static void fuse_invalidate_attr_mask(struct inode *inode, u32 mask)
{
	struct fuse_inode *fi = get_fuse_inode(inode);

	set_mask_bits(&fi->inval_mask, 0, mask);
}

89 90 91 92
/*
 * Mark the attributes as stale, so that at the next call to
 * ->getattr() they will be fetched from userspace
 */
93 94
void fuse_invalidate_attr(struct inode *inode)
{
95
	fuse_invalidate_attr_mask(inode, STATX_BASIC_STATS);
96 97
}

98 99 100 101 102 103
/*
 * Called after the contents of directory @dir were modified: mark its
 * attributes stale and call inode_maybe_inc_iversion() on it.
 */
static void fuse_dir_changed(struct inode *dir)
{
	fuse_invalidate_attr(dir);
	/* second argument is false here; see inode_maybe_inc_iversion() for its meaning */
	inode_maybe_inc_iversion(dir, false);
}

104 105 106 107 108 109 110
/**
 * Mark the attributes as stale due to an atime change.  Avoid the invalidate if
 * atime is not used.
 */
void fuse_invalidate_atime(struct inode *inode)
{
	if (!IS_RDONLY(inode))
111
		fuse_invalidate_attr_mask(inode, STATX_ATIME);
112 113
}

114 115 116 117 118 119 120 121
/*
 * Just mark the entry as stale, so that a next attempt to look it up
 * will result in a new lookup call to userspace
 *
 * This is called when a dentry is about to become negative and the
 * timeout is unknown (unlink, rmdir, rename and in some cases
 * lookup)
 */
M
Miklos Szeredi 已提交
122
void fuse_invalidate_entry_cache(struct dentry *entry)
123
{
M
Miklos Szeredi 已提交
124
	fuse_dentry_settime(entry, 0);
125 126
}

127 128 129 130
/*
 * Like fuse_invalidate_entry_cache(), but first call d_invalidate() on
 * the dentry to try to remove it from the hash
 */
static void fuse_invalidate_entry(struct dentry *entry)
{
	/* order kept: d_invalidate() first, then expire the cached timeout */
	d_invalidate(entry);
	fuse_dentry_settime(entry, 0);
}

137
static void fuse_lookup_init(struct fuse_conn *fc, struct fuse_args *args,
A
Al Viro 已提交
138
			     u64 nodeid, const struct qstr *name,
139 140
			     struct fuse_entry_out *outarg)
{
141
	memset(outarg, 0, sizeof(struct fuse_entry_out));
142 143 144 145 146 147
	args->in.h.opcode = FUSE_LOOKUP;
	args->in.h.nodeid = nodeid;
	args->in.numargs = 1;
	args->in.args[0].size = name->len + 1;
	args->in.args[0].value = name->name;
	args->out.numargs = 1;
148
	args->out.args[0].size = sizeof(struct fuse_entry_out);
149
	args->out.args[0].value = outarg;
150 151
}

152
u64 fuse_get_attr_version(struct fuse_conn *fc)
153 154 155 156 157 158 159 160 161 162 163 164 165 166
{
	u64 curr_version;

	/*
	 * The spin lock isn't actually needed on 64bit archs, but we
	 * don't yet care too much about such optimizations.
	 */
	spin_lock(&fc->lock);
	curr_version = fc->attr_version;
	spin_unlock(&fc->lock);

	return curr_version;
}

167 168 169 170 171 172 173 174 175
/*
 * Check whether the dentry is still valid
 *
 * If the entry validity timeout has expired and the dentry is
 * positive, try to redo the lookup.  If the lookup results in a
 * different inode, then let the VFS invalidate the dentry and redo
 * the lookup once more.  If the lookup results in the same inode,
 * then refresh the attributes, timeouts and mark the dentry valid.
 */
176
static int fuse_dentry_revalidate(struct dentry *entry, unsigned int flags)
177
{
178
	struct inode *inode;
179 180
	struct dentry *parent;
	struct fuse_conn *fc;
M
Miklos Szeredi 已提交
181
	struct fuse_inode *fi;
182
	int ret;
183

184
	inode = d_inode_rcu(entry);
185
	if (inode && is_bad_inode(inode))
186
		goto invalid;
187 188
	else if (time_before64(fuse_dentry_time(entry), get_jiffies_64()) ||
		 (flags & LOOKUP_REVAL)) {
189
		struct fuse_entry_out outarg;
190
		FUSE_ARGS(args);
191
		struct fuse_forget_link *forget;
192
		u64 attr_version;
193

194
		/* For negative dentries, always do a fresh lookup */
195
		if (!inode)
196
			goto invalid;
197

198
		ret = -ECHILD;
199
		if (flags & LOOKUP_RCU)
200
			goto out;
201

202
		fc = get_fuse_conn(inode);
203

204
		forget = fuse_alloc_forget();
205 206
		ret = -ENOMEM;
		if (!forget)
207
			goto out;
M
Miklos Szeredi 已提交
208

209
		attr_version = fuse_get_attr_version(fc);
210

211
		parent = dget_parent(entry);
212
		fuse_lookup_init(fc, &args, get_node_id(d_inode(parent)),
213
				 &entry->d_name, &outarg);
214
		ret = fuse_simple_request(fc, &args);
215
		dput(parent);
216
		/* Zero nodeid is same as -ENOENT */
217 218 219
		if (!ret && !outarg.nodeid)
			ret = -ENOENT;
		if (!ret) {
M
Miklos Szeredi 已提交
220
			fi = get_fuse_inode(inode);
221
			if (outarg.nodeid != get_node_id(inode)) {
222
				fuse_queue_forget(fc, forget, outarg.nodeid, 1);
223
				goto invalid;
224
			}
225
			spin_lock(&fc->lock);
M
Miklos Szeredi 已提交
226
			fi->nlookup++;
227
			spin_unlock(&fc->lock);
228
		}
229
		kfree(forget);
230 231 232
		if (ret == -ENOMEM)
			goto out;
		if (ret || (outarg.attr.mode ^ inode->i_mode) & S_IFMT)
233
			goto invalid;
234

S
Seth Forshee 已提交
235
		forget_all_cached_acls(inode);
236 237 238 239
		fuse_change_attributes(inode, &outarg.attr,
				       entry_attr_timeout(&outarg),
				       attr_version);
		fuse_change_entry_timeout(entry, &outarg);
240
	} else if (inode) {
M
Miklos Szeredi 已提交
241 242 243 244 245
		fi = get_fuse_inode(inode);
		if (flags & LOOKUP_RCU) {
			if (test_bit(FUSE_I_INIT_RDPLUS, &fi->state))
				return -ECHILD;
		} else if (test_and_clear_bit(FUSE_I_INIT_RDPLUS, &fi->state)) {
246
			parent = dget_parent(entry);
247
			fuse_advise_use_readdirplus(d_inode(parent));
248 249
			dput(parent);
		}
250
	}
251 252 253 254 255 256 257
	ret = 1;
out:
	return ret;

invalid:
	ret = 0;
	goto out;
258 259
}

M
Miklos Szeredi 已提交
260 261 262 263 264 265 266 267 268 269 270 271 272
/*
 * ->d_init: allocate a zeroed union fuse_dentry and attach it to
 * @dentry->d_fsdata.  Returns 0 on success, -ENOMEM on allocation failure.
 */
static int fuse_dentry_init(struct dentry *dentry)
{
	union fuse_dentry *fd = kzalloc(sizeof(*fd), GFP_KERNEL);

	dentry->d_fsdata = fd;
	if (!fd)
		return -ENOMEM;

	return 0;
}
/* ->d_release: free the union fuse_dentry of @dentry via kfree_rcu(). */
static void fuse_dentry_release(struct dentry *dentry)
{
	union fuse_dentry *priv = dentry->d_fsdata;

	kfree_rcu(priv, rcu);
}

A
Al Viro 已提交
273
const struct dentry_operations fuse_dentry_operations = {
274
	.d_revalidate	= fuse_dentry_revalidate,
M
Miklos Szeredi 已提交
275 276
	.d_init		= fuse_dentry_init,
	.d_release	= fuse_dentry_release,
277 278
};

279 280 281 282 283
/*
 * Same d_init/d_release hooks as fuse_dentry_operations, but without a
 * d_revalidate callback.
 */
const struct dentry_operations fuse_root_dentry_operations = {
	.d_init		= fuse_dentry_init,
	.d_release	= fuse_dentry_release,
};

284
/*
 * Return 1 if the file-type bits of mode @m denote a regular file,
 * directory, symlink, character/block device, FIFO or socket; 0 otherwise.
 */
int fuse_valid_type(int m)
{
	if (S_ISREG(m) || S_ISDIR(m) || S_ISLNK(m))
		return 1;
	if (S_ISCHR(m) || S_ISBLK(m))
		return 1;
	if (S_ISFIFO(m) || S_ISSOCK(m))
		return 1;

	return 0;
}

A
Al Viro 已提交
290
/*
 * Send a FUSE_LOOKUP for @name under directory @nodeid and instantiate the
 * resulting inode.
 *
 * On success returns 0 with the reply in @outarg.  *@inode is the inode
 * obtained from fuse_iget(), or NULL when the reply carried a zero nodeid
 * (treated like -ENOENT, but @outarg still holds a valid timeout).
 *
 * Returns -ENAMETOOLONG if @name exceeds FUSE_NAME_MAX, -ENOMEM on
 * allocation failure, -EIO if the reply has an unsupported file type, or
 * the error from the request itself.
 */
int fuse_lookup_name(struct super_block *sb, u64 nodeid, const struct qstr *name,
		     struct fuse_entry_out *outarg, struct inode **inode)
{
	struct fuse_conn *fc = get_fuse_conn_super(sb);
	FUSE_ARGS(args);
	struct fuse_forget_link *forget;
	u64 attr_version;
	int err;

	*inode = NULL;
	err = -ENAMETOOLONG;
	if (name->len > FUSE_NAME_MAX)
		goto out;

	forget = fuse_alloc_forget();
	err = -ENOMEM;
	if (!forget)
		goto out;

	attr_version = fuse_get_attr_version(fc);

	fuse_lookup_init(fc, &args, nodeid, name, outarg);
	err = fuse_simple_request(fc, &args);
	/* Zero nodeid is same as -ENOENT, but with valid timeout */
	if (err || !outarg->nodeid)
		goto out_put_forget;

	/* nodeid is known to be non-zero from here on */
	err = -EIO;
	if (!fuse_valid_type(outarg->attr.mode))
		goto out_put_forget;

	*inode = fuse_iget(sb, outarg->nodeid, outarg->generation,
			   &outarg->attr, entry_attr_timeout(outarg),
			   attr_version);
	err = -ENOMEM;
	if (!*inode) {
		/* forget is handed over to fuse_queue_forget(), so skip the kfree */
		fuse_queue_forget(fc, forget, outarg->nodeid, 1);
		goto out;
	}
	err = 0;

 out_put_forget:
	kfree(forget);
 out:
	return err;
}

static struct dentry *fuse_lookup(struct inode *dir, struct dentry *entry,
A
Al Viro 已提交
341
				  unsigned int flags)
342 343 344 345 346 347
{
	int err;
	struct fuse_entry_out outarg;
	struct inode *inode;
	struct dentry *newent;
	bool outarg_valid = true;
348
	bool locked;
349

350
	locked = fuse_lock_inode(dir);
351 352
	err = fuse_lookup_name(dir->i_sb, get_node_id(dir), &entry->d_name,
			       &outarg, &inode);
353
	fuse_unlock_inode(dir, locked);
354 355 356 357 358 359 360 361 362 363
	if (err == -ENOENT) {
		outarg_valid = false;
		err = 0;
	}
	if (err)
		goto out_err;

	err = -EIO;
	if (inode && get_node_id(inode) == FUSE_ROOT_ID)
		goto out_iput;
364

365
	newent = d_splice_alias(inode, entry);
366 367 368
	err = PTR_ERR(newent);
	if (IS_ERR(newent))
		goto out_err;
369

370
	entry = newent ? newent : entry;
371
	if (outarg_valid)
372
		fuse_change_entry_timeout(entry, &outarg);
373 374
	else
		fuse_invalidate_entry_cache(entry);
375

376
	fuse_advise_use_readdirplus(dir);
377
	return newent;
378 379 380 381 382

 out_iput:
	iput(inode);
 out_err:
	return ERR_PTR(err);
383 384
}

385 386 387 388 389 390
/*
 * Atomic create+open operation
 *
 * If the filesystem doesn't support this, then fall back to separate
 * 'mknod' + 'open' requests.
 */
A
Al Viro 已提交
391
static int fuse_create_open(struct inode *dir, struct dentry *entry,
A
Al Viro 已提交
392
			    struct file *file, unsigned flags,
393
			    umode_t mode)
M
Miklos Szeredi 已提交
394 395 396 397
{
	int err;
	struct inode *inode;
	struct fuse_conn *fc = get_fuse_conn(dir);
398
	FUSE_ARGS(args);
399
	struct fuse_forget_link *forget;
400
	struct fuse_create_in inarg;
M
Miklos Szeredi 已提交
401 402
	struct fuse_open_out outopen;
	struct fuse_entry_out outentry;
403
	struct fuse_inode *fi;
M
Miklos Szeredi 已提交
404 405
	struct fuse_file *ff;

406 407 408
	/* Userspace expects S_IFREG in create mode */
	BUG_ON((mode & S_IFMT) != S_IFREG);

409
	forget = fuse_alloc_forget();
410
	err = -ENOMEM;
411
	if (!forget)
412
		goto out_err;
413

414
	err = -ENOMEM;
T
Tejun Heo 已提交
415
	ff = fuse_file_alloc(fc);
M
Miklos Szeredi 已提交
416
	if (!ff)
417
		goto out_put_forget_req;
M
Miklos Szeredi 已提交
418

419 420 421
	if (!fc->dont_mask)
		mode &= ~current_umask();

M
Miklos Szeredi 已提交
422 423
	flags &= ~O_NOCTTY;
	memset(&inarg, 0, sizeof(inarg));
424
	memset(&outentry, 0, sizeof(outentry));
M
Miklos Szeredi 已提交
425 426
	inarg.flags = flags;
	inarg.mode = mode;
427
	inarg.umask = current_umask();
428 429 430
	args.in.h.opcode = FUSE_CREATE;
	args.in.h.nodeid = get_node_id(dir);
	args.in.numargs = 2;
431
	args.in.args[0].size = sizeof(inarg);
432 433 434 435
	args.in.args[0].value = &inarg;
	args.in.args[1].size = entry->d_name.len + 1;
	args.in.args[1].value = entry->d_name.name;
	args.out.numargs = 2;
436
	args.out.args[0].size = sizeof(outentry);
437 438 439 440
	args.out.args[0].value = &outentry;
	args.out.args[1].size = sizeof(outopen);
	args.out.args[1].value = &outopen;
	err = fuse_simple_request(fc, &args);
441
	if (err)
M
Miklos Szeredi 已提交
442 443 444
		goto out_free_ff;

	err = -EIO;
445
	if (!S_ISREG(outentry.attr.mode) || invalid_nodeid(outentry.nodeid))
M
Miklos Szeredi 已提交
446 447
		goto out_free_ff;

448 449 450
	ff->fh = outopen.fh;
	ff->nodeid = outentry.nodeid;
	ff->open_flags = outopen.open_flags;
M
Miklos Szeredi 已提交
451
	inode = fuse_iget(dir->i_sb, outentry.nodeid, outentry.generation,
452
			  &outentry.attr, entry_attr_timeout(&outentry), 0);
M
Miklos Szeredi 已提交
453 454
	if (!inode) {
		flags &= ~(O_CREAT | O_EXCL | O_TRUNC);
455
		fuse_sync_release(NULL, ff, flags);
456
		fuse_queue_forget(fc, forget, outentry.nodeid, 1);
457 458
		err = -ENOMEM;
		goto out_err;
M
Miklos Szeredi 已提交
459
	}
460
	kfree(forget);
M
Miklos Szeredi 已提交
461
	d_instantiate(entry, inode);
462
	fuse_change_entry_timeout(entry, &outentry);
463
	fuse_dir_changed(dir);
464
	err = finish_open(file, entry, generic_file_open);
A
Al Viro 已提交
465
	if (err) {
466 467
		fi = get_fuse_inode(inode);
		fuse_sync_release(fi, ff, flags);
468
	} else {
469
		file->private_data = ff;
470
		fuse_finish_open(inode, file);
M
Miklos Szeredi 已提交
471
	}
A
Al Viro 已提交
472
	return err;
M
Miklos Szeredi 已提交
473

474
out_free_ff:
M
Miklos Szeredi 已提交
475
	fuse_file_free(ff);
476
out_put_forget_req:
477
	kfree(forget);
478
out_err:
A
Al Viro 已提交
479
	return err;
480 481 482
}

static int fuse_mknod(struct inode *, struct dentry *, umode_t, dev_t);

/*
 * ->atomic_open: look the entry up if that is still pending, then either
 * leave the open to the caller (no O_CREAT, or the entry is positive) or
 * create the file.  Creation uses fuse_create_open() and falls back to
 * fuse_mknod() once the filesystem has answered FUSE_CREATE with -ENOSYS.
 */
static int fuse_atomic_open(struct inode *dir, struct dentry *entry,
			    struct file *file, unsigned flags,
			    umode_t mode)
{
	struct fuse_conn *fc = get_fuse_conn(dir);
	struct dentry *res = NULL;
	int err;

	if (d_in_lookup(entry)) {
		res = fuse_lookup(dir, entry, 0);
		if (IS_ERR(res))
			return PTR_ERR(res);

		if (res)
			entry = res;
	}

	if (!(flags & O_CREAT) || d_really_is_positive(entry))
		return finish_no_open(file, res);

	/* Only creates */
	file->f_mode |= FMODE_CREATED;

	if (!fc->no_create) {
		err = fuse_create_open(dir, entry, file, flags, mode);
		if (err != -ENOSYS) {
			dput(res);
			return err;
		}
		/* remember that FUSE_CREATE is unsupported */
		fc->no_create = 1;
	}

	err = fuse_mknod(dir, entry, mode, 0);
	if (err) {
		dput(res);
		return err;
	}

	return finish_no_open(file, res);
}

526 527 528
/*
 * Code shared between mknod, mkdir, symlink and link
 */
529
static int create_new_entry(struct fuse_conn *fc, struct fuse_args *args,
530
			    struct inode *dir, struct dentry *entry,
A
Al Viro 已提交
531
			    umode_t mode)
532 533 534
{
	struct fuse_entry_out outarg;
	struct inode *inode;
A
Al Viro 已提交
535
	struct dentry *d;
536
	int err;
537
	struct fuse_forget_link *forget;
M
Miklos Szeredi 已提交
538

539
	forget = fuse_alloc_forget();
540
	if (!forget)
541
		return -ENOMEM;
542

543
	memset(&outarg, 0, sizeof(outarg));
544 545
	args->in.h.nodeid = get_node_id(dir);
	args->out.numargs = 1;
546
	args->out.args[0].size = sizeof(outarg);
547 548
	args->out.args[0].value = &outarg;
	err = fuse_simple_request(fc, args);
M
Miklos Szeredi 已提交
549 550 551
	if (err)
		goto out_put_forget_req;

552 553
	err = -EIO;
	if (invalid_nodeid(outarg.nodeid))
M
Miklos Szeredi 已提交
554
		goto out_put_forget_req;
555 556

	if ((outarg.attr.mode ^ mode) & S_IFMT)
M
Miklos Szeredi 已提交
557
		goto out_put_forget_req;
558

559
	inode = fuse_iget(dir->i_sb, outarg.nodeid, outarg.generation,
560
			  &outarg.attr, entry_attr_timeout(&outarg), 0);
561
	if (!inode) {
562
		fuse_queue_forget(fc, forget, outarg.nodeid, 1);
563 564
		return -ENOMEM;
	}
565
	kfree(forget);
566

A
Al Viro 已提交
567 568 569 570
	d_drop(entry);
	d = d_splice_alias(inode, entry);
	if (IS_ERR(d))
		return PTR_ERR(d);
571

A
Al Viro 已提交
572 573 574 575 576 577
	if (d) {
		fuse_change_entry_timeout(d, &outarg);
		dput(d);
	} else {
		fuse_change_entry_timeout(entry, &outarg);
	}
578
	fuse_dir_changed(dir);
579
	return 0;
580

M
Miklos Szeredi 已提交
581
 out_put_forget_req:
582
	kfree(forget);
583
	return err;
584 585
}

A
Al Viro 已提交
586
static int fuse_mknod(struct inode *dir, struct dentry *entry, umode_t mode,
587 588 589 590
		      dev_t rdev)
{
	struct fuse_mknod_in inarg;
	struct fuse_conn *fc = get_fuse_conn(dir);
591
	FUSE_ARGS(args);
592

593 594 595
	if (!fc->dont_mask)
		mode &= ~current_umask();

596 597 598
	memset(&inarg, 0, sizeof(inarg));
	inarg.mode = mode;
	inarg.rdev = new_encode_dev(rdev);
599
	inarg.umask = current_umask();
600 601
	args.in.h.opcode = FUSE_MKNOD;
	args.in.numargs = 2;
602
	args.in.args[0].size = sizeof(inarg);
603 604 605 606
	args.in.args[0].value = &inarg;
	args.in.args[1].size = entry->d_name.len + 1;
	args.in.args[1].value = entry->d_name.name;
	return create_new_entry(fc, &args, dir, entry, mode);
607 608
}

A
Al Viro 已提交
609
static int fuse_create(struct inode *dir, struct dentry *entry, umode_t mode,
A
Al Viro 已提交
610
		       bool excl)
611 612 613 614
{
	return fuse_mknod(dir, entry, mode, 0);
}

615
/*
 * ->mkdir: send FUSE_MKDIR for @entry in @dir.  The umask is applied to
 * @mode here unless fc->dont_mask is set; the reply is expected to
 * describe a directory.
 */
static int fuse_mkdir(struct inode *dir, struct dentry *entry, umode_t mode)
{
	struct fuse_conn *fc = get_fuse_conn(dir);
	struct fuse_mkdir_in inarg;
	FUSE_ARGS(args);

	if (!fc->dont_mask)
		mode &= ~current_umask();

	memset(&inarg, 0, sizeof(inarg));
	inarg.umask = current_umask();
	inarg.mode = mode;

	args.in.h.opcode = FUSE_MKDIR;
	args.in.numargs = 2;
	args.in.args[0].value = &inarg;
	args.in.args[0].size = sizeof(inarg);
	args.in.args[1].value = entry->d_name.name;
	args.in.args[1].size = entry->d_name.len + 1;

	return create_new_entry(fc, &args, dir, entry, S_IFDIR);
}

static int fuse_symlink(struct inode *dir, struct dentry *entry,
			const char *link)
{
	struct fuse_conn *fc = get_fuse_conn(dir);
	unsigned len = strlen(link) + 1;
641
	FUSE_ARGS(args);
642

643 644 645 646 647 648 649
	args.in.h.opcode = FUSE_SYMLINK;
	args.in.numargs = 2;
	args.in.args[0].size = entry->d_name.len + 1;
	args.in.args[0].value = entry->d_name.name;
	args.in.args[1].size = len;
	args.in.args[1].value = link;
	return create_new_entry(fc, &args, dir, entry, S_IFLNK);
650 651
}

S
Seth Forshee 已提交
652
void fuse_update_ctime(struct inode *inode)
M
Maxim Patlasov 已提交
653 654
{
	if (!IS_NOCMTIME(inode)) {
655
		inode->i_ctime = current_time(inode);
M
Maxim Patlasov 已提交
656 657 658 659
		mark_inode_dirty_sync(inode);
	}
}

660 661 662 663
static int fuse_unlink(struct inode *dir, struct dentry *entry)
{
	int err;
	struct fuse_conn *fc = get_fuse_conn(dir);
664 665 666 667 668 669 670 671
	FUSE_ARGS(args);

	args.in.h.opcode = FUSE_UNLINK;
	args.in.h.nodeid = get_node_id(dir);
	args.in.numargs = 1;
	args.in.args[0].size = entry->d_name.len + 1;
	args.in.args[0].value = entry->d_name.name;
	err = fuse_simple_request(fc, &args);
672
	if (!err) {
673
		struct inode *inode = d_inode(entry);
M
Miklos Szeredi 已提交
674
		struct fuse_inode *fi = get_fuse_inode(inode);
675

M
Miklos Szeredi 已提交
676 677
		spin_lock(&fc->lock);
		fi->attr_version = ++fc->attr_version;
678 679 680 681 682 683 684 685
		/*
		 * If i_nlink == 0 then unlink doesn't make sense, yet this can
		 * happen if userspace filesystem is careless.  It would be
		 * difficult to enforce correct nlink usage so just ignore this
		 * condition here
		 */
		if (inode->i_nlink > 0)
			drop_nlink(inode);
M
Miklos Szeredi 已提交
686
		spin_unlock(&fc->lock);
687
		fuse_invalidate_attr(inode);
688
		fuse_dir_changed(dir);
689
		fuse_invalidate_entry_cache(entry);
M
Maxim Patlasov 已提交
690
		fuse_update_ctime(inode);
691 692 693 694 695 696 697 698 699
	} else if (err == -EINTR)
		fuse_invalidate_entry(entry);
	return err;
}

static int fuse_rmdir(struct inode *dir, struct dentry *entry)
{
	int err;
	struct fuse_conn *fc = get_fuse_conn(dir);
700 701 702 703 704 705 706 707
	FUSE_ARGS(args);

	args.in.h.opcode = FUSE_RMDIR;
	args.in.h.nodeid = get_node_id(dir);
	args.in.numargs = 1;
	args.in.args[0].size = entry->d_name.len + 1;
	args.in.args[0].value = entry->d_name.name;
	err = fuse_simple_request(fc, &args);
708
	if (!err) {
709
		clear_nlink(d_inode(entry));
710
		fuse_dir_changed(dir);
711
		fuse_invalidate_entry_cache(entry);
712 713 714 715 716
	} else if (err == -EINTR)
		fuse_invalidate_entry(entry);
	return err;
}

M
Miklos Szeredi 已提交
717 718 719
/*
 * Shared implementation of FUSE_RENAME and FUSE_RENAME2.  @opcode selects
 * the request and @argsize is the number of bytes of the rename2 input
 * structure that are zeroed and sent as the first argument.
 */
static int fuse_rename_common(struct inode *olddir, struct dentry *oldent,
			      struct inode *newdir, struct dentry *newent,
			      unsigned int flags, int opcode, size_t argsize)
{
	struct fuse_conn *fc = get_fuse_conn(olddir);
	struct fuse_rename2_in inarg;
	bool exchange = flags & RENAME_EXCHANGE;
	FUSE_ARGS(args);
	int err;

	memset(&inarg, 0, argsize);
	inarg.newdir = get_node_id(newdir);
	inarg.flags = flags;

	args.in.h.opcode = opcode;
	args.in.h.nodeid = get_node_id(olddir);
	args.in.numargs = 3;
	args.in.args[0].value = &inarg;
	args.in.args[0].size = argsize;
	args.in.args[1].value = oldent->d_name.name;
	args.in.args[1].size = oldent->d_name.len + 1;
	args.in.args[2].value = newent->d_name.name;
	args.in.args[2].size = newent->d_name.len + 1;

	err = fuse_simple_request(fc, &args);
	if (err == -EINTR) {
		/* If request was interrupted, DEITY only knows if the
		   rename actually took place.  If the invalidation
		   fails (e.g. some process has CWD under the renamed
		   directory), then there can be inconsistency between
		   the dcache and the real filesystem.  Tough luck. */
		fuse_invalidate_entry(oldent);
		if (d_really_is_positive(newent))
			fuse_invalidate_entry(newent);
		return err;
	}
	if (err)
		return err;

	/* ctime changes */
	fuse_invalidate_attr(d_inode(oldent));
	fuse_update_ctime(d_inode(oldent));

	if (exchange) {
		fuse_invalidate_attr(d_inode(newent));
		fuse_update_ctime(d_inode(newent));
	}

	fuse_dir_changed(olddir);
	if (olddir != newdir)
		fuse_dir_changed(newdir);

	/* newent will end up negative */
	if (!exchange && d_really_is_positive(newent)) {
		fuse_invalidate_attr(d_inode(newent));
		fuse_invalidate_entry_cache(newent);
		fuse_update_ctime(d_inode(newent));
	}

	return 0;
}

M
Miklos Szeredi 已提交
773 774 775 776 777 778 779 780 781 782
static int fuse_rename2(struct inode *olddir, struct dentry *oldent,
			struct inode *newdir, struct dentry *newent,
			unsigned int flags)
{
	struct fuse_conn *fc = get_fuse_conn(olddir);
	int err;

	if (flags & ~(RENAME_NOREPLACE | RENAME_EXCHANGE))
		return -EINVAL;

M
Miklos Szeredi 已提交
783 784 785
	if (flags) {
		if (fc->no_rename2 || fc->minor < 23)
			return -EINVAL;
M
Miklos Szeredi 已提交
786

M
Miklos Szeredi 已提交
787 788 789 790 791 792 793 794 795 796 797
		err = fuse_rename_common(olddir, oldent, newdir, newent, flags,
					 FUSE_RENAME2,
					 sizeof(struct fuse_rename2_in));
		if (err == -ENOSYS) {
			fc->no_rename2 = 1;
			err = -EINVAL;
		}
	} else {
		err = fuse_rename_common(olddir, oldent, newdir, newent, 0,
					 FUSE_RENAME,
					 sizeof(struct fuse_rename_in));
M
Miklos Szeredi 已提交
798
	}
M
Miklos Szeredi 已提交
799

M
Miklos Szeredi 已提交
800
	return err;
M
Miklos Szeredi 已提交
801
}
M
Miklos Szeredi 已提交
802

803 804 805 806 807
static int fuse_link(struct dentry *entry, struct inode *newdir,
		     struct dentry *newent)
{
	int err;
	struct fuse_link_in inarg;
808
	struct inode *inode = d_inode(entry);
809
	struct fuse_conn *fc = get_fuse_conn(inode);
810
	FUSE_ARGS(args);
811 812 813

	memset(&inarg, 0, sizeof(inarg));
	inarg.oldnodeid = get_node_id(inode);
814 815 816 817 818 819 820
	args.in.h.opcode = FUSE_LINK;
	args.in.numargs = 2;
	args.in.args[0].size = sizeof(inarg);
	args.in.args[0].value = &inarg;
	args.in.args[1].size = newent->d_name.len + 1;
	args.in.args[1].value = newent->d_name.name;
	err = create_new_entry(fc, &args, newdir, newent, inode->i_mode);
821 822 823 824 825 826
	/* Contrary to "normal" filesystems it can happen that link
	   makes two "logical" inodes point to the same "physical"
	   inode.  We invalidate the attributes of the old one, so it
	   will reflect changes in the backing inode (link count,
	   etc.)
	*/
M
Miklos Szeredi 已提交
827 828 829 830 831 832 833
	if (!err) {
		struct fuse_inode *fi = get_fuse_inode(inode);

		spin_lock(&fc->lock);
		fi->attr_version = ++fc->attr_version;
		inc_nlink(inode);
		spin_unlock(&fc->lock);
834
		fuse_invalidate_attr(inode);
M
Maxim Patlasov 已提交
835
		fuse_update_ctime(inode);
M
Miklos Szeredi 已提交
836 837 838
	} else if (err == -EINTR) {
		fuse_invalidate_attr(inode);
	}
839 840 841
	return err;
}

842 843 844
static void fuse_fillattr(struct inode *inode, struct fuse_attr *attr,
			  struct kstat *stat)
{
M
Miklos Szeredi 已提交
845
	unsigned int blkbits;
P
Pavel Emelyanov 已提交
846 847 848
	struct fuse_conn *fc = get_fuse_conn(inode);

	/* see the comment in fuse_change_attributes() */
M
Maxim Patlasov 已提交
849
	if (fc->writeback_cache && S_ISREG(inode->i_mode)) {
P
Pavel Emelyanov 已提交
850
		attr->size = i_size_read(inode);
M
Maxim Patlasov 已提交
851 852
		attr->mtime = inode->i_mtime.tv_sec;
		attr->mtimensec = inode->i_mtime.tv_nsec;
M
Maxim Patlasov 已提交
853 854
		attr->ctime = inode->i_ctime.tv_sec;
		attr->ctimensec = inode->i_ctime.tv_nsec;
M
Maxim Patlasov 已提交
855
	}
M
Miklos Szeredi 已提交
856

857 858 859 860
	stat->dev = inode->i_sb->s_dev;
	stat->ino = attr->ino;
	stat->mode = (inode->i_mode & S_IFMT) | (attr->mode & 07777);
	stat->nlink = attr->nlink;
861 862
	stat->uid = make_kuid(fc->user_ns, attr->uid);
	stat->gid = make_kgid(fc->user_ns, attr->gid);
863 864 865 866 867 868 869 870 871
	stat->rdev = inode->i_rdev;
	stat->atime.tv_sec = attr->atime;
	stat->atime.tv_nsec = attr->atimensec;
	stat->mtime.tv_sec = attr->mtime;
	stat->mtime.tv_nsec = attr->mtimensec;
	stat->ctime.tv_sec = attr->ctime;
	stat->ctime.tv_nsec = attr->ctimensec;
	stat->size = attr->size;
	stat->blocks = attr->blocks;
M
Miklos Szeredi 已提交
872 873 874 875 876 877 878

	if (attr->blksize != 0)
		blkbits = ilog2(attr->blksize);
	else
		blkbits = inode->i_sb->s_blocksize_bits;

	stat->blksize = 1 << blkbits;
879 880
}

881 882
static int fuse_do_getattr(struct inode *inode, struct kstat *stat,
			   struct file *file)
883 884
{
	int err;
885 886
	struct fuse_getattr_in inarg;
	struct fuse_attr_out outarg;
887
	struct fuse_conn *fc = get_fuse_conn(inode);
888
	FUSE_ARGS(args);
889 890
	u64 attr_version;

891
	attr_version = fuse_get_attr_version(fc);
892

893
	memset(&inarg, 0, sizeof(inarg));
894
	memset(&outarg, 0, sizeof(outarg));
895 896 897 898 899 900 901
	/* Directories have separate file-handle space */
	if (file && S_ISREG(inode->i_mode)) {
		struct fuse_file *ff = file->private_data;

		inarg.getattr_flags |= FUSE_GETATTR_FH;
		inarg.fh = ff->fh;
	}
902 903 904 905 906 907
	args.in.h.opcode = FUSE_GETATTR;
	args.in.h.nodeid = get_node_id(inode);
	args.in.numargs = 1;
	args.in.args[0].size = sizeof(inarg);
	args.in.args[0].value = &inarg;
	args.out.numargs = 1;
908
	args.out.args[0].size = sizeof(outarg);
909 910
	args.out.args[0].value = &outarg;
	err = fuse_simple_request(fc, &args);
911
	if (!err) {
912
		if ((inode->i_mode ^ outarg.attr.mode) & S_IFMT) {
913 914 915
			make_bad_inode(inode);
			err = -EIO;
		} else {
916 917
			fuse_change_attributes(inode, &outarg.attr,
					       attr_timeout(&outarg),
918 919
					       attr_version);
			if (stat)
920
				fuse_fillattr(inode, &outarg.attr, stat);
921 922 923 924 925
		}
	}
	return err;
}

M
Miklos Szeredi 已提交
926
/*
 * Refresh the attributes from userspace if needed and optionally fill
 * @stat.
 *
 * A refresh is done when AT_STATX_FORCE_SYNC is set; it is skipped when
 * AT_STATX_DONT_SYNC is set; otherwise it is done when a requested
 * attribute is flagged in inval_mask or the attribute timeout (i_time)
 * has passed.
 */
static int fuse_update_get_attr(struct inode *inode, struct file *file,
				struct kstat *stat, u32 request_mask,
				unsigned int flags)
{
	struct fuse_inode *fi = get_fuse_inode(inode);
	bool sync;

	if (flags & AT_STATX_FORCE_SYNC)
		sync = true;
	else if (flags & AT_STATX_DONT_SYNC)
		sync = false;
	else if (request_mask & READ_ONCE(fi->inval_mask))
		sync = true;
	else
		sync = time_before64(fi->i_time, get_jiffies_64());

	if (!sync) {
		/* serve from the cache, reporting the original mode and ino */
		if (stat) {
			generic_fillattr(inode, stat);
			stat->mode = fi->orig_i_mode;
			stat->ino = fi->orig_ino;
		}
		return 0;
	}

	forget_all_cached_acls(inode);
	return fuse_do_getattr(inode, stat, file);
}

M
Miklos Szeredi 已提交
955 956
int fuse_update_attributes(struct inode *inode, struct file *file)
{
957 958 959
	/* Do *not* need to get atime for internal purposes */
	return fuse_update_get_attr(inode, file, NULL,
				    STATX_BASIC_STATS & ~STATX_ATIME, 0);
M
Miklos Szeredi 已提交
960 961
}

J
John Muir 已提交
962
/*
 * Invalidate the dentry @name in the directory with node id
 * @parent_nodeid.  If @child_nodeid is non-zero and the dentry is
 * positive, the dentry is additionally deleted, provided it refers to
 * @child_nodeid, is not a mountpoint and (for directories) is empty.
 *
 * Returns 0 on success, -ENOENT if the parent, its alias, the entry or the
 * expected child is not found, -ENOTDIR if the parent is not a directory,
 * -EBUSY for a mountpoint and -ENOTEMPTY for a non-empty directory.
 */
int fuse_reverse_inval_entry(struct super_block *sb, u64 parent_nodeid,
			     u64 child_nodeid, struct qstr *name)
{
	struct inode *parent;
	struct dentry *entry;
	struct dentry *dir;
	int err;

	parent = ilookup5(sb, parent_nodeid, fuse_inode_eq, &parent_nodeid);
	if (!parent)
		return -ENOENT;

	inode_lock(parent);

	err = -ENOTDIR;
	if (!S_ISDIR(parent->i_mode))
		goto out_unlock;

	err = -ENOENT;
	dir = d_find_alias(parent);
	if (!dir)
		goto out_unlock;

	name->hash = full_name_hash(dir, name->name, name->len);
	entry = d_lookup(dir, name);
	dput(dir);
	if (!entry)
		goto out_unlock;

	fuse_dir_changed(parent);
	fuse_invalidate_entry(entry);

	/* Plain invalidation only: nothing more to do */
	err = 0;
	if (child_nodeid == 0 || !d_really_is_positive(entry))
		goto out_dput;

	inode_lock(d_inode(entry));
	if (get_node_id(d_inode(entry)) != child_nodeid) {
		err = -ENOENT;
		goto out_unlock_child;
	}
	if (d_mountpoint(entry)) {
		err = -EBUSY;
		goto out_unlock_child;
	}
	if (d_is_dir(entry)) {
		shrink_dcache_parent(entry);
		if (!simple_empty(entry)) {
			err = -ENOTEMPTY;
			goto out_unlock_child;
		}
		d_inode(entry)->i_flags |= S_DEAD;
	}
	dont_mount(entry);
	clear_nlink(d_inode(entry));
	err = 0;

 out_unlock_child:
	inode_unlock(d_inode(entry));
	if (!err)
		d_delete(entry);

 out_dput:
	dput(entry);

 out_unlock:
	inode_unlock(parent);
	iput(parent);
	return err;
}

1028 1029
/*
 * Calling into a user-controlled filesystem gives the filesystem
1030
 * daemon ptrace-like capabilities over the current process.  This
1031 1032 1033 1034 1035 1036 1037 1038 1039 1040
 * means, that the filesystem daemon is able to record the exact
 * filesystem operations performed, and can also control the behavior
 * of the requester process in otherwise impossible ways.  For example
 * it can delay the operation for arbitrary length of time allowing
 * DoS against the requester.
 *
 * For this reason only those processes can call into the filesystem,
 * for which the owner of the mount has ptrace privilege.  This
 * excludes processes started by other users, suid or sgid processes.
 */
1041
int fuse_allow_current_process(struct fuse_conn *fc)
1042
{
1043
	const struct cred *cred;
1044

M
Miklos Szeredi 已提交
1045
	if (fc->allow_other)
1046
		return current_in_userns(fc->user_ns);
1047

1048
	cred = current_cred();
1049 1050 1051 1052 1053 1054
	if (uid_eq(cred->euid, fc->user_id) &&
	    uid_eq(cred->suid, fc->user_id) &&
	    uid_eq(cred->uid,  fc->user_id) &&
	    gid_eq(cred->egid, fc->group_id) &&
	    gid_eq(cred->sgid, fc->group_id) &&
	    gid_eq(cred->gid,  fc->group_id))
1055
		return 1;
1056

1057
	return 0;
1058 1059
}

M
Miklos Szeredi 已提交
1060 1061 1062
static int fuse_access(struct inode *inode, int mask)
{
	struct fuse_conn *fc = get_fuse_conn(inode);
1063
	FUSE_ARGS(args);
M
Miklos Szeredi 已提交
1064 1065 1066
	struct fuse_access_in inarg;
	int err;

1067 1068
	BUG_ON(mask & MAY_NOT_BLOCK);

M
Miklos Szeredi 已提交
1069 1070 1071 1072
	if (fc->no_access)
		return 0;

	memset(&inarg, 0, sizeof(inarg));
1073
	inarg.mask = mask & (MAY_READ | MAY_WRITE | MAY_EXEC);
1074 1075 1076 1077 1078 1079
	args.in.h.opcode = FUSE_ACCESS;
	args.in.h.nodeid = get_node_id(inode);
	args.in.numargs = 1;
	args.in.args[0].size = sizeof(inarg);
	args.in.args[0].value = &inarg;
	err = fuse_simple_request(fc, &args);
M
Miklos Szeredi 已提交
1080 1081 1082 1083 1084 1085 1086
	if (err == -ENOSYS) {
		fc->no_access = 1;
		err = 0;
	}
	return err;
}

1087
static int fuse_perm_getattr(struct inode *inode, int mask)
1088
{
1089
	if (mask & MAY_NOT_BLOCK)
1090 1091
		return -ECHILD;

S
Seth Forshee 已提交
1092
	forget_all_cached_acls(inode);
1093 1094 1095
	return fuse_do_getattr(inode, NULL, NULL);
}

1096 1097 1098 1099 1100 1101 1102 1103 1104 1105 1106 1107 1108
/*
 * Check permission.  The two basic access models of FUSE are:
 *
 * 1) Local access checking ('default_permissions' mount option) based
 * on file mode.  This is the plain old disk filesystem permission
 * modell.
 *
 * 2) "Remote" access checking, where server is responsible for
 * checking permission in each inode operation.  An exception to this
 * is if ->permission() was invoked from sys_access() in which case an
 * access request is sent.  Execute permission is still checked
 * locally based on file mode.
 */
1109
static int fuse_permission(struct inode *inode, int mask)
1110 1111
{
	struct fuse_conn *fc = get_fuse_conn(inode);
1112 1113
	bool refreshed = false;
	int err = 0;
1114

1115
	if (!fuse_allow_current_process(fc))
1116
		return -EACCES;
1117 1118

	/*
1119
	 * If attributes are needed, refresh them before proceeding
1120
	 */
M
Miklos Szeredi 已提交
1121
	if (fc->default_permissions ||
1122
	    ((mask & MAY_EXEC) && S_ISREG(inode->i_mode))) {
1123
		struct fuse_inode *fi = get_fuse_inode(inode);
1124
		u32 perm_mask = STATX_MODE | STATX_UID | STATX_GID;
1125

1126 1127
		if (perm_mask & READ_ONCE(fi->inval_mask) ||
		    time_before64(fi->i_time, get_jiffies_64())) {
1128 1129
			refreshed = true;

1130
			err = fuse_perm_getattr(inode, mask);
1131 1132 1133
			if (err)
				return err;
		}
1134 1135
	}

M
Miklos Szeredi 已提交
1136
	if (fc->default_permissions) {
1137
		err = generic_permission(inode, mask);
M
Miklos Szeredi 已提交
1138 1139 1140 1141

		/* If permission is denied, try to refresh file
		   attributes.  This is also needed, because the root
		   node will at first have no permissions */
1142
		if (err == -EACCES && !refreshed) {
1143
			err = fuse_perm_getattr(inode, mask);
M
Miklos Szeredi 已提交
1144
			if (!err)
1145
				err = generic_permission(inode, mask);
M
Miklos Szeredi 已提交
1146 1147
		}

1148 1149 1150 1151
		/* Note: the opposite of the above test does not
		   exist.  So if permissions are revoked this won't be
		   noticed immediately, only after the attribute
		   timeout has expired */
E
Eric Paris 已提交
1152
	} else if (mask & (MAY_ACCESS | MAY_CHDIR)) {
1153 1154 1155 1156 1157 1158
		err = fuse_access(inode, mask);
	} else if ((mask & MAY_EXEC) && S_ISREG(inode->i_mode)) {
		if (!(inode->i_mode & S_IXUGO)) {
			if (refreshed)
				return -EACCES;

1159
			err = fuse_perm_getattr(inode, mask);
1160 1161 1162
			if (!err && !(inode->i_mode & S_IXUGO))
				return -EACCES;
		}
1163
	}
1164
	return err;
1165 1166
}

D
Dan Schatzberg 已提交
1167
static int fuse_readlink_page(struct inode *inode, struct page *page)
1168 1169
{
	struct fuse_conn *fc = get_fuse_conn(inode);
D
Dan Schatzberg 已提交
1170 1171
	struct fuse_req *req;
	int err;
1172

D
Dan Schatzberg 已提交
1173 1174 1175 1176 1177 1178 1179 1180 1181 1182 1183 1184 1185 1186 1187 1188
	req = fuse_get_req(fc, 1);
	if (IS_ERR(req))
		return PTR_ERR(req);

	req->out.page_zeroing = 1;
	req->out.argpages = 1;
	req->num_pages = 1;
	req->pages[0] = page;
	req->page_descs[0].length = PAGE_SIZE - 1;
	req->in.h.opcode = FUSE_READLINK;
	req->in.h.nodeid = get_node_id(inode);
	req->out.argvar = 1;
	req->out.numargs = 1;
	req->out.args[0].size = PAGE_SIZE - 1;
	fuse_request_send(fc, req);
	err = req->out.h.error;
1189

D
Dan Schatzberg 已提交
1190 1191 1192
	if (!err) {
		char *link = page_address(page);
		size_t len = req->out.args[0].size;
1193

D
Dan Schatzberg 已提交
1194 1195
		BUG_ON(len >= PAGE_SIZE);
		link[len] = '\0';
1196
	}
D
Dan Schatzberg 已提交
1197 1198

	fuse_put_request(fc, req);
1199
	fuse_invalidate_atime(inode);
D
Dan Schatzberg 已提交
1200 1201 1202 1203 1204 1205 1206 1207 1208 1209 1210 1211 1212 1213 1214 1215 1216 1217 1218 1219 1220 1221 1222 1223 1224 1225 1226 1227 1228 1229 1230 1231 1232 1233 1234 1235 1236 1237 1238

	return err;
}

/*
 * ->get_link() for FUSE symlinks.
 *
 * With fc->cache_symlinks set the lookup is delegated to
 * page_get_link().  Otherwise a fresh page is allocated, filled by
 * fuse_readlink_page() and handed to @callback (page_put_link) for
 * release.
 *
 * Returns the link text, or an ERR_PTR: -EIO for a bad inode, -ECHILD
 * when @dentry is NULL in the uncached case, -ENOMEM if no page could
 * be allocated, or the error from fuse_readlink_page().
 */
static const char *fuse_get_link(struct dentry *dentry, struct inode *inode,
				 struct delayed_call *callback)
{
	struct fuse_conn *fc = get_fuse_conn(inode);
	struct page *page;
	int err;

	err = -EIO;
	if (is_bad_inode(inode))
		goto out_err;

	if (fc->cache_symlinks)
		return page_get_link(dentry, inode, callback);

	/* NOTE(review): NULL dentry presumably means RCU-walk mode; confirm */
	err = -ECHILD;
	if (!dentry)
		goto out_err;

	page = alloc_page(GFP_KERNEL);
	err = -ENOMEM;
	if (!page)
		goto out_err;

	err = fuse_readlink_page(inode, page);
	if (err) {
		__free_page(page);
		goto out_err;
	}

	set_delayed_call(callback, page_put_link, page);

	return page_address(page);

out_err:
	return ERR_PTR(err);
}

static int fuse_dir_open(struct inode *inode, struct file *file)
{
1243
	return fuse_open_common(inode, file, true);
1244 1245 1246 1247
}

static int fuse_dir_release(struct inode *inode, struct file *file)
{
1248
	fuse_release_common(file, true);
1249 1250

	return 0;
1251 1252
}

1253 1254
/*
 * ->fsync() for directories.
 *
 * Returns -EIO for a bad inode.  Returns 0 without doing anything once
 * fc->no_fsyncdir is set.  That flag is set the first time
 * FUSE_FSYNCDIR returns -ENOSYS, and that -ENOSYS is itself reported as
 * success.  The request is issued with the inode lock held.
 */
static int fuse_dir_fsync(struct file *file, loff_t start, loff_t end,
			  int datasync)
{
	struct inode *inode = file->f_mapping->host;
	struct fuse_conn *fc = get_fuse_conn(inode);
	int err;

	if (is_bad_inode(inode))
		return -EIO;

	if (fc->no_fsyncdir)
		return 0;

	inode_lock(inode);
	err = fuse_fsync_common(file, start, end, datasync, FUSE_FSYNCDIR);
	if (err == -ENOSYS) {
		/* Remember that FUSE_FSYNCDIR is unsupported */
		fc->no_fsyncdir = 1;
		err = 0;
	}
	inode_unlock(inode);

	return err;
}

/*
 * ioctl entry point for directories: forwards to fuse_ioctl_common()
 * with FUSE_IOCTL_DIR, or fails with -ENOTTY on connections whose minor
 * protocol version is below 18.
 */
static long fuse_dir_ioctl(struct file *file, unsigned int cmd,
			    unsigned long arg)
{
	struct inode *dir = file->f_mapping->host;
	struct fuse_conn *fc = get_fuse_conn(dir);

	/* FUSE_IOCTL_DIR only supported for API version >= 7.18 */
	if (fc->minor >= 18)
		return fuse_ioctl_common(file, cmd, arg, FUSE_IOCTL_DIR);

	return -ENOTTY;
}

/*
 * Compat ioctl entry point for directories: like fuse_dir_ioctl() but
 * additionally passes FUSE_IOCTL_COMPAT.  Returns -ENOTTY on
 * connections whose minor protocol version is below 18.
 */
static long fuse_dir_compat_ioctl(struct file *file, unsigned int cmd,
				   unsigned long arg)
{
	struct fuse_conn *fc = get_fuse_conn(file->f_mapping->host);

	if (fc->minor < 18)
		return -ENOTTY;

	return fuse_ioctl_common(file, cmd, arg,
				 FUSE_IOCTL_COMPAT | FUSE_IOCTL_DIR);
}

/*
 * Decide whether a setattr request should carry the mtime.
 *
 * @ivalid:            the iattr ia_valid bits of the request
 * @trust_local_mtime: true if the kernel's i_mtime is authoritative
 *
 * Returns false only for a size change that comes from open(O_TRUNC) or
 * ftruncate() when mtime is neither explicitly set nor locally trusted.
 */
static bool update_mtime(unsigned ivalid, bool trust_local_mtime)
{
	/* Always update if mtime is explicitly set  */
	if (ivalid & ATTR_MTIME_SET)
		return true;

	/* Or if kernel i_mtime is the official one */
	if (trust_local_mtime)
		return true;

	/* If it's an open(O_TRUNC) or an ftruncate(), don't update */
	if ((ivalid & ATTR_SIZE) && (ivalid & (ATTR_OPEN | ATTR_FILE)))
		return false;

	/* In all other cases update */
	return true;
}

/*
 * Translate the VFS attribute change @iattr into the FUSE wire format
 * @arg.
 *
 * Only fields selected in iattr->ia_valid are copied, and the matching
 * FATTR_* bit is or-ed into arg->valid.  The caller is expected to have
 * zeroed @arg beforehand, since this function only ever adds bits.
 *
 * @trust_local_cmtime: when true, mtime is always sent as an explicit
 * value (never FATTR_MTIME_NOW) and ctime is sent as well.
 */
static void iattr_to_fattr(struct fuse_conn *fc, struct iattr *iattr,
			   struct fuse_setattr_in *arg, bool trust_local_cmtime)
{
	unsigned ivalid = iattr->ia_valid;

	if (ivalid & ATTR_MODE) {
		arg->valid |= FATTR_MODE;
		arg->mode = iattr->ia_mode;
	}
	if (ivalid & ATTR_UID) {
		arg->valid |= FATTR_UID;
		arg->uid = from_kuid(fc->user_ns, iattr->ia_uid);
	}
	if (ivalid & ATTR_GID) {
		arg->valid |= FATTR_GID;
		arg->gid = from_kgid(fc->user_ns, iattr->ia_gid);
	}
	if (ivalid & ATTR_SIZE) {
		arg->valid |= FATTR_SIZE;
		arg->size = iattr->ia_size;
	}
	if (ivalid & ATTR_ATIME) {
		arg->valid |= FATTR_ATIME;
		arg->atime = iattr->ia_atime.tv_sec;
		arg->atimensec = iattr->ia_atime.tv_nsec;
		/* No explicit time given: flag the request as "now" */
		if (!(ivalid & ATTR_ATIME_SET))
			arg->valid |= FATTR_ATIME_NOW;
	}
	if ((ivalid & ATTR_MTIME) && update_mtime(ivalid, trust_local_cmtime)) {
		arg->valid |= FATTR_MTIME;
		arg->mtime = iattr->ia_mtime.tv_sec;
		arg->mtimensec = iattr->ia_mtime.tv_nsec;
		if (!(ivalid & ATTR_MTIME_SET) && !trust_local_cmtime)
			arg->valid |= FATTR_MTIME_NOW;
	}
	if ((ivalid & ATTR_CTIME) && trust_local_cmtime) {
		arg->valid |= FATTR_CTIME;
		arg->ctime = iattr->ia_ctime.tv_sec;
		arg->ctimensec = iattr->ia_ctime.tv_nsec;
	}
}

/*
 * Prevent concurrent writepages on inode
 *
 * This is done by adding a negative bias to the inode write counter
 * and waiting for all pending writes to finish.
 *
 * The inode must be locked by the caller, and the bias must not
 * already be applied (the write counter must not be negative).
 */
void fuse_set_nowrite(struct inode *inode)
{
	struct fuse_conn *fc = get_fuse_conn(inode);
	struct fuse_inode *fi = get_fuse_inode(inode);

	BUG_ON(!inode_is_locked(inode));

	spin_lock(&fc->lock);
	BUG_ON(fi->writectr < 0);
	fi->writectr += FUSE_NOWRITE;
	spin_unlock(&fc->lock);
	/* Sleep until only the bias itself remains in the counter */
	wait_event(fi->page_waitq, fi->writectr == FUSE_NOWRITE);
}

/*
 * Re-enable writepages on an inode.
 *
 * Drops the FUSE_NOWRITE bias from the write counter and flushes the
 * writepages that were queued meanwhile.  The counter must hold exactly
 * the bias on entry.  Both callers in this file invoke it with fc->lock
 * held.
 */
static void __fuse_release_nowrite(struct inode *inode)
{
	struct fuse_inode *finode = get_fuse_inode(inode);

	BUG_ON(finode->writectr != FUSE_NOWRITE);

	finode->writectr = 0;
	fuse_flush_writepages(inode);
}

/*
 * Locked wrapper around __fuse_release_nowrite(): takes fc->lock,
 * removes the nowrite bias from @inode and drops the lock again.
 */
void fuse_release_nowrite(struct inode *inode)
{
	struct fuse_conn *fc = get_fuse_conn(inode);

	spin_lock(&fc->lock);
	__fuse_release_nowrite(inode);
	spin_unlock(&fc->lock);
}

static void fuse_setattr_fill(struct fuse_conn *fc, struct fuse_args *args,
M
Maxim Patlasov 已提交
1398 1399 1400 1401
			      struct inode *inode,
			      struct fuse_setattr_in *inarg_p,
			      struct fuse_attr_out *outarg_p)
{
1402 1403 1404 1405 1406 1407
	args->in.h.opcode = FUSE_SETATTR;
	args->in.h.nodeid = get_node_id(inode);
	args->in.numargs = 1;
	args->in.args[0].size = sizeof(*inarg_p);
	args->in.args[0].value = inarg_p;
	args->out.numargs = 1;
1408
	args->out.args[0].size = sizeof(*outarg_p);
1409
	args->out.args[0].value = outarg_p;
M
Maxim Patlasov 已提交
1410 1411 1412 1413 1414
}

/*
 * Flush inode->i_mtime to the server
 */
1415
int fuse_flush_times(struct inode *inode, struct fuse_file *ff)
M
Maxim Patlasov 已提交
1416 1417
{
	struct fuse_conn *fc = get_fuse_conn(inode);
1418
	FUSE_ARGS(args);
M
Maxim Patlasov 已提交
1419 1420 1421 1422 1423 1424
	struct fuse_setattr_in inarg;
	struct fuse_attr_out outarg;

	memset(&inarg, 0, sizeof(inarg));
	memset(&outarg, 0, sizeof(outarg));

1425
	inarg.valid = FATTR_MTIME;
M
Maxim Patlasov 已提交
1426 1427
	inarg.mtime = inode->i_mtime.tv_sec;
	inarg.mtimensec = inode->i_mtime.tv_nsec;
1428 1429 1430 1431 1432
	if (fc->minor >= 23) {
		inarg.valid |= FATTR_CTIME;
		inarg.ctime = inode->i_ctime.tv_sec;
		inarg.ctimensec = inode->i_ctime.tv_nsec;
	}
M
Miklos Szeredi 已提交
1433 1434 1435 1436
	if (ff) {
		inarg.valid |= FATTR_FH;
		inarg.fh = ff->fh;
	}
1437
	fuse_setattr_fill(fc, &args, inode, &inarg, &outarg);
M
Maxim Patlasov 已提交
1438

1439
	return fuse_simple_request(fc, &args);
M
Maxim Patlasov 已提交
1440 1441
}

1442 1443 1444 1445 1446
/*
 * Set attributes, and at the same time refresh them.
 *
 * Truncation is slightly complicated, because the 'truncate' request
 * may fail, in which case we don't want to touch the mapping.
M
Miklos Szeredi 已提交
1447 1448
 * vmtruncate() doesn't allow for this case, so do the rlimit checking
 * and the actual truncation by hand.
1449
 */
1450
int fuse_do_setattr(struct dentry *dentry, struct iattr *attr,
1451
		    struct file *file)
1452
{
1453
	struct inode *inode = d_inode(dentry);
1454
	struct fuse_conn *fc = get_fuse_conn(inode);
1455
	struct fuse_inode *fi = get_fuse_inode(inode);
1456
	FUSE_ARGS(args);
1457 1458
	struct fuse_setattr_in inarg;
	struct fuse_attr_out outarg;
M
Miklos Szeredi 已提交
1459
	bool is_truncate = false;
P
Pavel Emelyanov 已提交
1460
	bool is_wb = fc->writeback_cache;
M
Miklos Szeredi 已提交
1461
	loff_t oldsize;
1462
	int err;
1463
	bool trust_local_cmtime = is_wb && S_ISREG(inode->i_mode);
1464

M
Miklos Szeredi 已提交
1465
	if (!fc->default_permissions)
1466 1467
		attr->ia_valid |= ATTR_FORCE;

1468
	err = setattr_prepare(dentry, attr);
1469 1470
	if (err)
		return err;
M
Miklos Szeredi 已提交
1471

M
Miklos Szeredi 已提交
1472
	if (attr->ia_valid & ATTR_OPEN) {
1473 1474 1475 1476 1477 1478 1479 1480 1481 1482 1483
		/* This is coming from open(..., ... | O_TRUNC); */
		WARN_ON(!(attr->ia_valid & ATTR_SIZE));
		WARN_ON(attr->ia_size != 0);
		if (fc->atomic_o_trunc) {
			/*
			 * No need to send request to userspace, since actual
			 * truncation has already been done by OPEN.  But still
			 * need to truncate page cache.
			 */
			i_size_write(inode, 0);
			truncate_pagecache(inode, 0);
M
Miklos Szeredi 已提交
1484
			return 0;
1485
		}
M
Miklos Szeredi 已提交
1486 1487
		file = NULL;
	}
1488

1489 1490 1491
	if (attr->ia_valid & ATTR_SIZE) {
		if (WARN_ON(!S_ISREG(inode->i_mode)))
			return -EIO;
M
Miklos Szeredi 已提交
1492
		is_truncate = true;
1493
	}
1494

1495
	if (is_truncate) {
M
Miklos Szeredi 已提交
1496
		fuse_set_nowrite(inode);
1497
		set_bit(FUSE_I_SIZE_UNSTABLE, &fi->state);
1498 1499
		if (trust_local_cmtime && attr->ia_size != inode->i_size)
			attr->ia_valid |= ATTR_MTIME | ATTR_CTIME;
1500
	}
M
Miklos Szeredi 已提交
1501

1502
	memset(&inarg, 0, sizeof(inarg));
1503
	memset(&outarg, 0, sizeof(outarg));
1504
	iattr_to_fattr(fc, attr, &inarg, trust_local_cmtime);
1505 1506 1507 1508 1509
	if (file) {
		struct fuse_file *ff = file->private_data;
		inarg.valid |= FATTR_FH;
		inarg.fh = ff->fh;
	}
1510 1511 1512 1513 1514
	if (attr->ia_valid & ATTR_SIZE) {
		/* For mandatory locking in truncate */
		inarg.valid |= FATTR_LOCKOWNER;
		inarg.lock_owner = fuse_lock_owner_id(fc, current->files);
	}
1515 1516
	fuse_setattr_fill(fc, &args, inode, &inarg, &outarg);
	err = fuse_simple_request(fc, &args);
1517 1518 1519
	if (err) {
		if (err == -EINTR)
			fuse_invalidate_attr(inode);
M
Miklos Szeredi 已提交
1520
		goto error;
1521
	}
1522

1523 1524
	if ((inode->i_mode ^ outarg.attr.mode) & S_IFMT) {
		make_bad_inode(inode);
M
Miklos Szeredi 已提交
1525 1526 1527 1528 1529
		err = -EIO;
		goto error;
	}

	spin_lock(&fc->lock);
M
Maxim Patlasov 已提交
1530
	/* the kernel maintains i_mtime locally */
1531 1532 1533 1534 1535
	if (trust_local_cmtime) {
		if (attr->ia_valid & ATTR_MTIME)
			inode->i_mtime = attr->ia_mtime;
		if (attr->ia_valid & ATTR_CTIME)
			inode->i_ctime = attr->ia_ctime;
M
Miklos Szeredi 已提交
1536
		/* FIXME: clear I_DIRTY_SYNC? */
M
Maxim Patlasov 已提交
1537 1538
	}

M
Miklos Szeredi 已提交
1539 1540 1541
	fuse_change_attributes_common(inode, &outarg.attr,
				      attr_timeout(&outarg));
	oldsize = inode->i_size;
P
Pavel Emelyanov 已提交
1542 1543 1544
	/* see the comment in fuse_change_attributes() */
	if (!is_wb || is_truncate || !S_ISREG(inode->i_mode))
		i_size_write(inode, outarg.attr.size);
M
Miklos Szeredi 已提交
1545 1546 1547 1548 1549 1550 1551 1552 1553 1554 1555

	if (is_truncate) {
		/* NOTE: this may release/reacquire fc->lock */
		__fuse_release_nowrite(inode);
	}
	spin_unlock(&fc->lock);

	/*
	 * Only call invalidate_inode_pages2() after removing
	 * FUSE_NOWRITE, otherwise fuse_launder_page() would deadlock.
	 */
P
Pavel Emelyanov 已提交
1556 1557
	if ((is_truncate || !is_wb) &&
	    S_ISREG(inode->i_mode) && oldsize != outarg.attr.size) {
1558
		truncate_pagecache(inode, outarg.attr.size);
M
Miklos Szeredi 已提交
1559
		invalidate_inode_pages2(inode->i_mapping);
1560 1561
	}

1562
	clear_bit(FUSE_I_SIZE_UNSTABLE, &fi->state);
1563
	return 0;
M
Miklos Szeredi 已提交
1564 1565 1566 1567 1568

error:
	if (is_truncate)
		fuse_release_nowrite(inode);

1569
	clear_bit(FUSE_I_SIZE_UNSTABLE, &fi->state);
M
Miklos Szeredi 已提交
1570
	return err;
1571 1572
}

1573 1574
static int fuse_setattr(struct dentry *entry, struct iattr *attr)
{
1575
	struct inode *inode = d_inode(entry);
1576
	struct fuse_conn *fc = get_fuse_conn(inode);
1577
	struct file *file = (attr->ia_valid & ATTR_FILE) ? attr->ia_file : NULL;
1578
	int ret;
1579 1580 1581 1582

	if (!fuse_allow_current_process(get_fuse_conn(inode)))
		return -EACCES;

1583 1584 1585
	if (attr->ia_valid & (ATTR_KILL_SUID | ATTR_KILL_SGID)) {
		attr->ia_valid &= ~(ATTR_KILL_SUID | ATTR_KILL_SGID |
				    ATTR_MODE);
1586

1587
		/*
1588 1589 1590 1591
		 * The only sane way to reliably kill suid/sgid is to do it in
		 * the userspace filesystem
		 *
		 * This should be done on write(), truncate() and chown().
1592
		 */
1593 1594 1595 1596 1597 1598 1599 1600 1601 1602
		if (!fc->handle_killpriv) {
			/*
			 * ia_mode calculation may have used stale i_mode.
			 * Refresh and recalculate.
			 */
			ret = fuse_do_getattr(inode, NULL, file);
			if (ret)
				return ret;

			attr->ia_mode = inode->i_mode;
1603
			if (inode->i_mode & S_ISUID) {
1604 1605 1606
				attr->ia_valid |= ATTR_MODE;
				attr->ia_mode &= ~S_ISUID;
			}
1607
			if ((inode->i_mode & (S_ISGID | S_IXGRP)) == (S_ISGID | S_IXGRP)) {
1608 1609 1610
				attr->ia_valid |= ATTR_MODE;
				attr->ia_mode &= ~S_ISGID;
			}
1611 1612 1613 1614
		}
	}
	if (!attr->ia_valid)
		return 0;
1615

1616
	ret = fuse_do_setattr(entry, attr, file);
1617
	if (!ret) {
S
Seth Forshee 已提交
1618 1619 1620 1621 1622 1623 1624
		/*
		 * If filesystem supports acls it may have updated acl xattrs in
		 * the filesystem, so forget cached acls for the inode.
		 */
		if (fc->posix_acl)
			forget_all_cached_acls(inode);

1625 1626 1627 1628 1629
		/* Directory mode changed, may need to revalidate access */
		if (d_is_dir(entry) && (attr->ia_valid & ATTR_MODE))
			fuse_invalidate_entry_cache(entry);
	}
	return ret;
1630 1631
}

1632 1633
/*
 * ->getattr() for FUSE inodes.  Returns -EACCES if the current process
 * is not allowed to call into the filesystem, otherwise the result of
 * fuse_update_get_attr().
 */
static int fuse_getattr(const struct path *path, struct kstat *stat,
			u32 request_mask, unsigned int flags)
{
	struct inode *inode = d_inode(path->dentry);
	struct fuse_conn *fc = get_fuse_conn(inode);

	if (!fuse_allow_current_process(fc))
		return -EACCES;

	return fuse_update_get_attr(inode, NULL, stat, request_mask, flags);
}

static const struct inode_operations fuse_dir_inode_operations = {
1645
	.lookup		= fuse_lookup,
1646 1647 1648 1649
	.mkdir		= fuse_mkdir,
	.symlink	= fuse_symlink,
	.unlink		= fuse_unlink,
	.rmdir		= fuse_rmdir,
1650
	.rename		= fuse_rename2,
1651 1652 1653
	.link		= fuse_link,
	.setattr	= fuse_setattr,
	.create		= fuse_create,
1654
	.atomic_open	= fuse_atomic_open,
1655
	.mknod		= fuse_mknod,
1656 1657
	.permission	= fuse_permission,
	.getattr	= fuse_getattr,
1658
	.listxattr	= fuse_listxattr,
S
Seth Forshee 已提交
1659 1660
	.get_acl	= fuse_get_acl,
	.set_acl	= fuse_set_acl,
1661 1662
};

1663
static const struct file_operations fuse_dir_operations = {
M
Miklos Szeredi 已提交
1664
	.llseek		= generic_file_llseek,
1665
	.read		= generic_read_dir,
A
Al Viro 已提交
1666
	.iterate_shared	= fuse_readdir,
1667 1668
	.open		= fuse_dir_open,
	.release	= fuse_dir_release,
1669
	.fsync		= fuse_dir_fsync,
1670 1671
	.unlocked_ioctl	= fuse_dir_ioctl,
	.compat_ioctl	= fuse_dir_compat_ioctl,
1672 1673
};

1674
static const struct inode_operations fuse_common_inode_operations = {
1675
	.setattr	= fuse_setattr,
1676 1677
	.permission	= fuse_permission,
	.getattr	= fuse_getattr,
1678
	.listxattr	= fuse_listxattr,
S
Seth Forshee 已提交
1679 1680
	.get_acl	= fuse_get_acl,
	.set_acl	= fuse_set_acl,
1681 1682
};

1683
static const struct inode_operations fuse_symlink_inode_operations = {
1684
	.setattr	= fuse_setattr,
1685
	.get_link	= fuse_get_link,
1686
	.getattr	= fuse_getattr,
1687
	.listxattr	= fuse_listxattr,
1688 1689 1690 1691 1692 1693 1694 1695 1696
};

/* Install the common (non-directory, non-symlink) inode operations on @inode */
void fuse_init_common(struct inode *inode)
{
	inode->i_op = &fuse_common_inode_operations;
}

void fuse_init_dir(struct inode *inode)
{
1697 1698
	struct fuse_inode *fi = get_fuse_inode(inode);

1699 1700
	inode->i_op = &fuse_dir_inode_operations;
	inode->i_fop = &fuse_dir_operations;
1701 1702 1703 1704 1705 1706

	spin_lock_init(&fi->rdc.lock);
	fi->rdc.cached = false;
	fi->rdc.size = 0;
	fi->rdc.pos = 0;
	fi->rdc.version = 0;
1707 1708
}

D
Dan Schatzberg 已提交
1709 1710 1711 1712 1713 1714 1715 1716 1717 1718 1719 1720 1721 1722 1723 1724
/*
 * ->readpage() for symlink inodes: fill @page with the link target via
 * fuse_readlink_page().  The page is marked up to date only on success
 * and is unlocked in either case.  The file argument is not used.
 */
static int fuse_symlink_readpage(struct file *null, struct page *page)
{
	struct inode *inode = page->mapping->host;
	int err;

	err = fuse_readlink_page(inode, page);
	if (err == 0)
		SetPageUptodate(page);

	unlock_page(page);

	return err;
}

/* Address space operations installed on symlinks by fuse_init_symlink() */
static const struct address_space_operations fuse_symlink_aops = {
	.readpage	= fuse_symlink_readpage,
};

void fuse_init_symlink(struct inode *inode)
{
	inode->i_op = &fuse_symlink_inode_operations;
D
Dan Schatzberg 已提交
1728 1729
	inode->i_data.a_ops = &fuse_symlink_aops;
	inode_nohighmem(inode);
1730
}