dir.c 47.6 KB
Newer Older
1 2
/*
  FUSE: Filesystem in Userspace
M
Miklos Szeredi 已提交
3
  Copyright (C) 2001-2008  Miklos Szeredi <miklos@szeredi.hu>
4 5 6 7 8 9 10 11 12

  This program can be distributed under the terms of the GNU GPL.
  See the file COPYING.
*/

#include "fuse_i.h"

#include <linux/pagemap.h>
#include <linux/file.h>
M
Max Reitz 已提交
13
#include <linux/fs_context.h>
14 15
#include <linux/sched.h>
#include <linux/namei.h>
16
#include <linux/slab.h>
S
Seth Forshee 已提交
17
#include <linux/xattr.h>
18
#include <linux/iversion.h>
S
Seth Forshee 已提交
19
#include <linux/posix_acl.h>
20

21 22 23 24 25 26 27
static void fuse_advise_use_readdirplus(struct inode *dir)
{
	struct fuse_inode *fi = get_fuse_inode(dir);

	set_bit(FUSE_I_ADVISE_RDPLUS, &fi->state);
}

28 29 30 31 32 33 34 35 36 37 38 39
#if BITS_PER_LONG >= 64
static inline void __fuse_dentry_settime(struct dentry *entry, u64 time)
{
	entry->d_fsdata = (void *) time;
}

static inline u64 fuse_dentry_time(const struct dentry *entry)
{
	return (u64)entry->d_fsdata;
}

#else
M
Miklos Szeredi 已提交
40 41 42 43 44
union fuse_dentry {
	u64 time;
	struct rcu_head rcu;
};

45 46 47 48 49 50 51 52 53 54 55
static inline void __fuse_dentry_settime(struct dentry *dentry, u64 time)
{
	((union fuse_dentry *) dentry->d_fsdata)->time = time;
}

static inline u64 fuse_dentry_time(const struct dentry *entry)
{
	return ((union fuse_dentry *) entry->d_fsdata)->time;
}
#endif

56
static void fuse_dentry_settime(struct dentry *dentry, u64 time)
M
Miklos Szeredi 已提交
57
{
58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73
	struct fuse_conn *fc = get_fuse_conn_super(dentry->d_sb);
	bool delete = !time && fc->delete_stale;
	/*
	 * Mess with DCACHE_OP_DELETE because dput() will be faster without it.
	 * Don't care about races, either way it's just an optimization
	 */
	if ((!delete && (dentry->d_flags & DCACHE_OP_DELETE)) ||
	    (delete && !(dentry->d_flags & DCACHE_OP_DELETE))) {
		spin_lock(&dentry->d_lock);
		if (!delete)
			dentry->d_flags &= ~DCACHE_OP_DELETE;
		else
			dentry->d_flags |= DCACHE_OP_DELETE;
		spin_unlock(&dentry->d_lock);
	}

74
	__fuse_dentry_settime(dentry, time);
M
Miklos Szeredi 已提交
75 76
}

77 78 79
/*
 * FUSE caches dentries and attributes with separate timeout.  The
 * time in jiffies until the dentry/attributes are valid is stored in
M
Miklos Szeredi 已提交
80
 * dentry->d_fsdata and fuse_inode->i_time respectively.
81 82 83 84 85
 */

/*
 * Calculate the time in jiffies until a dentry/attributes are valid
 */
M
Miklos Szeredi 已提交
86
static u64 time_to_jiffies(u64 sec, u32 nsec)
87
{
M
Miklos Szeredi 已提交
88
	if (sec || nsec) {
M
Miklos Szeredi 已提交
89 90
		struct timespec64 ts = {
			sec,
91
			min_t(u32, nsec, NSEC_PER_SEC - 1)
M
Miklos Szeredi 已提交
92 93 94
		};

		return get_jiffies_64() + timespec64_to_jiffies(&ts);
M
Miklos Szeredi 已提交
95
	} else
M
Miklos Szeredi 已提交
96
		return 0;
97 98
}

99 100 101 102
/*
 * Set dentry and possibly attribute timeouts from the lookup/mk*
 * replies
 */
M
Miklos Szeredi 已提交
103
void fuse_change_entry_timeout(struct dentry *entry, struct fuse_entry_out *o)
104
{
M
Miklos Szeredi 已提交
105 106
	fuse_dentry_settime(entry,
		time_to_jiffies(o->entry_valid, o->entry_valid_nsec));
107 108 109 110 111 112 113
}

static u64 attr_timeout(struct fuse_attr_out *o)
{
	return time_to_jiffies(o->attr_valid, o->attr_valid_nsec);
}

M
Miklos Szeredi 已提交
114
u64 entry_attr_timeout(struct fuse_entry_out *o)
115 116
{
	return time_to_jiffies(o->attr_valid, o->attr_valid_nsec);
117 118
}

119 120 121 122 123
static void fuse_invalidate_attr_mask(struct inode *inode, u32 mask)
{
	set_mask_bits(&get_fuse_inode(inode)->inval_mask, 0, mask);
}

124 125 126 127
/*
 * Mark the attributes as stale, so that at the next call to
 * ->getattr() they will be fetched from userspace
 */
128 129
void fuse_invalidate_attr(struct inode *inode)
{
130
	fuse_invalidate_attr_mask(inode, STATX_BASIC_STATS);
131 132
}

133 134 135 136 137 138
static void fuse_dir_changed(struct inode *dir)
{
	fuse_invalidate_attr(dir);
	inode_maybe_inc_iversion(dir, false);
}

139 140 141 142 143 144 145
/**
 * Mark the attributes as stale due to an atime change.  Avoid the invalidate if
 * atime is not used.
 */
void fuse_invalidate_atime(struct inode *inode)
{
	if (!IS_RDONLY(inode))
146
		fuse_invalidate_attr_mask(inode, STATX_ATIME);
147 148
}

149 150 151 152 153 154 155 156
/*
 * Just mark the entry as stale, so that a next attempt to look it up
 * will result in a new lookup call to userspace
 *
 * This is called when a dentry is about to become negative and the
 * timeout is unknown (unlink, rmdir, rename and in some cases
 * lookup)
 */
M
Miklos Szeredi 已提交
157
void fuse_invalidate_entry_cache(struct dentry *entry)
158
{
M
Miklos Szeredi 已提交
159
	fuse_dentry_settime(entry, 0);
160 161
}

162 163 164 165
/*
 * Same as fuse_invalidate_entry_cache(), but also try to remove the
 * dentry from the hash
 */
166 167 168 169
static void fuse_invalidate_entry(struct dentry *entry)
{
	d_invalidate(entry);
	fuse_invalidate_entry_cache(entry);
170 171
}

172
static void fuse_lookup_init(struct fuse_conn *fc, struct fuse_args *args,
A
Al Viro 已提交
173
			     u64 nodeid, const struct qstr *name,
174 175
			     struct fuse_entry_out *outarg)
{
176
	memset(outarg, 0, sizeof(struct fuse_entry_out));
177 178 179 180 181 182 183 184
	args->opcode = FUSE_LOOKUP;
	args->nodeid = nodeid;
	args->in_numargs = 1;
	args->in_args[0].size = name->len + 1;
	args->in_args[0].value = name->name;
	args->out_numargs = 1;
	args->out_args[0].size = sizeof(struct fuse_entry_out);
	args->out_args[0].value = outarg;
185 186
}

187 188 189 190 191 192 193 194 195
/*
 * Check whether the dentry is still valid
 *
 * If the entry validity timeout has expired and the dentry is
 * positive, try to redo the lookup.  If the lookup results in a
 * different inode, then let the VFS invalidate the dentry and redo
 * the lookup once more.  If the lookup results in the same inode,
 * then refresh the attributes, timeouts and mark the dentry valid.
 */
196
static int fuse_dentry_revalidate(struct dentry *entry, unsigned int flags)
197
{
198
	struct inode *inode;
199
	struct dentry *parent;
200
	struct fuse_mount *fm;
M
Miklos Szeredi 已提交
201
	struct fuse_inode *fi;
202
	int ret;
203

204
	inode = d_inode_rcu(entry);
M
Miklos Szeredi 已提交
205
	if (inode && fuse_is_bad(inode))
206
		goto invalid;
207
	else if (time_before64(fuse_dentry_time(entry), get_jiffies_64()) ||
208
		 (flags & (LOOKUP_EXCL | LOOKUP_REVAL))) {
209
		struct fuse_entry_out outarg;
210
		FUSE_ARGS(args);
211
		struct fuse_forget_link *forget;
212
		u64 attr_version;
213

214
		/* For negative dentries, always do a fresh lookup */
215
		if (!inode)
216
			goto invalid;
217

218
		ret = -ECHILD;
219
		if (flags & LOOKUP_RCU)
220
			goto out;
221

222
		fm = get_fuse_mount(inode);
223

224
		forget = fuse_alloc_forget();
225 226
		ret = -ENOMEM;
		if (!forget)
227
			goto out;
M
Miklos Szeredi 已提交
228

229
		attr_version = fuse_get_attr_version(fm->fc);
230

231
		parent = dget_parent(entry);
232
		fuse_lookup_init(fm->fc, &args, get_node_id(d_inode(parent)),
233
				 &entry->d_name, &outarg);
234
		ret = fuse_simple_request(fm, &args);
235
		dput(parent);
236
		/* Zero nodeid is same as -ENOENT */
237 238 239
		if (!ret && !outarg.nodeid)
			ret = -ENOENT;
		if (!ret) {
M
Miklos Szeredi 已提交
240
			fi = get_fuse_inode(inode);
M
Max Reitz 已提交
241 242
			if (outarg.nodeid != get_node_id(inode) ||
			    (bool) IS_AUTOMOUNT(inode) != (bool) (outarg.attr.flags & FUSE_ATTR_SUBMOUNT)) {
243 244
				fuse_queue_forget(fm->fc, forget,
						  outarg.nodeid, 1);
245
				goto invalid;
246
			}
247
			spin_lock(&fi->lock);
M
Miklos Szeredi 已提交
248
			fi->nlookup++;
249
			spin_unlock(&fi->lock);
250
		}
251
		kfree(forget);
252 253
		if (ret == -ENOMEM)
			goto out;
M
Miklos Szeredi 已提交
254 255
		if (ret || fuse_invalid_attr(&outarg.attr) ||
		    (outarg.attr.mode ^ inode->i_mode) & S_IFMT)
256
			goto invalid;
257

S
Seth Forshee 已提交
258
		forget_all_cached_acls(inode);
259 260 261 262
		fuse_change_attributes(inode, &outarg.attr,
				       entry_attr_timeout(&outarg),
				       attr_version);
		fuse_change_entry_timeout(entry, &outarg);
263
	} else if (inode) {
M
Miklos Szeredi 已提交
264 265 266 267 268
		fi = get_fuse_inode(inode);
		if (flags & LOOKUP_RCU) {
			if (test_bit(FUSE_I_INIT_RDPLUS, &fi->state))
				return -ECHILD;
		} else if (test_and_clear_bit(FUSE_I_INIT_RDPLUS, &fi->state)) {
269
			parent = dget_parent(entry);
270
			fuse_advise_use_readdirplus(d_inode(parent));
271 272
			dput(parent);
		}
273
	}
274 275 276 277 278 279 280
	ret = 1;
out:
	return ret;

invalid:
	ret = 0;
	goto out;
281 282
}

283
#if BITS_PER_LONG < 64
M
Miklos Szeredi 已提交
284 285
static int fuse_dentry_init(struct dentry *dentry)
{
286 287
	dentry->d_fsdata = kzalloc(sizeof(union fuse_dentry),
				   GFP_KERNEL_ACCOUNT | __GFP_RECLAIMABLE);
M
Miklos Szeredi 已提交
288 289 290 291 292 293 294 295 296

	return dentry->d_fsdata ? 0 : -ENOMEM;
}
static void fuse_dentry_release(struct dentry *dentry)
{
	union fuse_dentry *fd = dentry->d_fsdata;

	kfree_rcu(fd, rcu);
}
297
#endif
M
Miklos Szeredi 已提交
298

299 300 301 302 303
static int fuse_dentry_delete(const struct dentry *dentry)
{
	return time_before64(fuse_dentry_time(dentry), get_jiffies_64());
}

M
Max Reitz 已提交
304 305 306 307 308 309 310 311 312 313 314 315 316 317 318 319 320 321 322 323 324 325 326 327 328 329 330 331 332 333 334
/*
 * Create a fuse_mount object with a new superblock (with path->dentry
 * as the root), and return that mount so it can be auto-mounted on
 * @path.
 */
static struct vfsmount *fuse_dentry_automount(struct path *path)
{
	struct fs_context *fsc;
	struct fuse_mount *parent_fm = get_fuse_mount_super(path->mnt->mnt_sb);
	struct fuse_conn *fc = parent_fm->fc;
	struct fuse_mount *fm;
	struct vfsmount *mnt;
	struct fuse_inode *mp_fi = get_fuse_inode(d_inode(path->dentry));
	struct super_block *sb;
	int err;

	fsc = fs_context_for_submount(path->mnt->mnt_sb->s_type, path->dentry);
	if (IS_ERR(fsc)) {
		err = PTR_ERR(fsc);
		goto out;
	}

	err = -ENOMEM;
	fm = kzalloc(sizeof(struct fuse_mount), GFP_KERNEL);
	if (!fm)
		goto out_put_fsc;

	fsc->s_fs_info = fm;
	sb = sget_fc(fsc, NULL, set_anon_super_fc);
	if (IS_ERR(sb)) {
		err = PTR_ERR(sb);
335
		kfree(fm);
M
Max Reitz 已提交
336 337 338 339 340 341 342 343 344 345 346 347 348 349 350 351 352 353 354 355 356 357 358 359 360 361 362 363 364 365 366 367 368 369 370 371 372 373 374 375
		goto out_put_fsc;
	}
	fm->fc = fuse_conn_get(fc);

	/* Initialize superblock, making @mp_fi its root */
	err = fuse_fill_super_submount(sb, mp_fi);
	if (err)
		goto out_put_sb;

	sb->s_flags |= SB_ACTIVE;
	fsc->root = dget(sb->s_root);
	/* We are done configuring the superblock, so unlock it */
	up_write(&sb->s_umount);

	down_write(&fc->killsb);
	list_add_tail(&fm->fc_entry, &fc->mounts);
	up_write(&fc->killsb);

	/* Create the submount */
	mnt = vfs_create_mount(fsc);
	if (IS_ERR(mnt)) {
		err = PTR_ERR(mnt);
		goto out_put_fsc;
	}
	mntget(mnt);
	put_fs_context(fsc);
	return mnt;

out_put_sb:
	/*
	 * Only jump here when fsc->root is NULL and sb is still locked
	 * (otherwise put_fs_context() will put the superblock)
	 */
	deactivate_locked_super(sb);
out_put_fsc:
	put_fs_context(fsc);
out:
	return ERR_PTR(err);
}

A
Al Viro 已提交
376
const struct dentry_operations fuse_dentry_operations = {
377
	.d_revalidate	= fuse_dentry_revalidate,
378
	.d_delete	= fuse_dentry_delete,
379
#if BITS_PER_LONG < 64
M
Miklos Szeredi 已提交
380 381
	.d_init		= fuse_dentry_init,
	.d_release	= fuse_dentry_release,
382
#endif
M
Max Reitz 已提交
383
	.d_automount	= fuse_dentry_automount,
384 385
};

386
const struct dentry_operations fuse_root_dentry_operations = {
387
#if BITS_PER_LONG < 64
388 389
	.d_init		= fuse_dentry_init,
	.d_release	= fuse_dentry_release,
390
#endif
391 392
};

393
int fuse_valid_type(int m)
394 395 396 397 398
{
	return S_ISREG(m) || S_ISDIR(m) || S_ISLNK(m) || S_ISCHR(m) ||
		S_ISBLK(m) || S_ISFIFO(m) || S_ISSOCK(m);
}

M
Miklos Szeredi 已提交
399 400 401 402 403 404
bool fuse_invalid_attr(struct fuse_attr *attr)
{
	return !fuse_valid_type(attr->mode) ||
		attr->size > LLONG_MAX;
}

A
Al Viro 已提交
405
int fuse_lookup_name(struct super_block *sb, u64 nodeid, const struct qstr *name,
406
		     struct fuse_entry_out *outarg, struct inode **inode)
407
{
408
	struct fuse_mount *fm = get_fuse_mount_super(sb);
409
	FUSE_ARGS(args);
410
	struct fuse_forget_link *forget;
411
	u64 attr_version;
412
	int err;
413

414 415 416 417
	*inode = NULL;
	err = -ENAMETOOLONG;
	if (name->len > FUSE_NAME_MAX)
		goto out;
418 419


420 421
	forget = fuse_alloc_forget();
	err = -ENOMEM;
422
	if (!forget)
423
		goto out;
M
Miklos Szeredi 已提交
424

425
	attr_version = fuse_get_attr_version(fm->fc);
426

427 428
	fuse_lookup_init(fm->fc, &args, nodeid, name, outarg);
	err = fuse_simple_request(fm, &args);
429
	/* Zero nodeid is same as -ENOENT, but with valid timeout */
430 431 432 433 434 435
	if (err || !outarg->nodeid)
		goto out_put_forget;

	err = -EIO;
	if (!outarg->nodeid)
		goto out_put_forget;
M
Miklos Szeredi 已提交
436
	if (fuse_invalid_attr(&outarg->attr))
437 438 439 440 441 442 443
		goto out_put_forget;

	*inode = fuse_iget(sb, outarg->nodeid, outarg->generation,
			   &outarg->attr, entry_attr_timeout(outarg),
			   attr_version);
	err = -ENOMEM;
	if (!*inode) {
444
		fuse_queue_forget(fm->fc, forget, outarg->nodeid, 1);
445
		goto out;
446
	}
447 448 449
	err = 0;

 out_put_forget:
450
	kfree(forget);
451 452 453 454 455
 out:
	return err;
}

static struct dentry *fuse_lookup(struct inode *dir, struct dentry *entry,
A
Al Viro 已提交
456
				  unsigned int flags)
457 458 459 460 461 462
{
	int err;
	struct fuse_entry_out outarg;
	struct inode *inode;
	struct dentry *newent;
	bool outarg_valid = true;
463
	bool locked;
464

M
Miklos Szeredi 已提交
465 466 467
	if (fuse_is_bad(dir))
		return ERR_PTR(-EIO);

468
	locked = fuse_lock_inode(dir);
469 470
	err = fuse_lookup_name(dir->i_sb, get_node_id(dir), &entry->d_name,
			       &outarg, &inode);
471
	fuse_unlock_inode(dir, locked);
472 473 474 475 476 477 478 479 480 481
	if (err == -ENOENT) {
		outarg_valid = false;
		err = 0;
	}
	if (err)
		goto out_err;

	err = -EIO;
	if (inode && get_node_id(inode) == FUSE_ROOT_ID)
		goto out_iput;
482

483
	newent = d_splice_alias(inode, entry);
484 485 486
	err = PTR_ERR(newent);
	if (IS_ERR(newent))
		goto out_err;
487

488
	entry = newent ? newent : entry;
489
	if (outarg_valid)
490
		fuse_change_entry_timeout(entry, &outarg);
491 492
	else
		fuse_invalidate_entry_cache(entry);
493

494 495
	if (inode)
		fuse_advise_use_readdirplus(dir);
496
	return newent;
497 498 499 500 501

 out_iput:
	iput(inode);
 out_err:
	return ERR_PTR(err);
502 503
}

504 505 506 507 508 509
/*
 * Atomic create+open operation
 *
 * If the filesystem doesn't support this, then fall back to separate
 * 'mknod' + 'open' requests.
 */
A
Al Viro 已提交
510
static int fuse_create_open(struct inode *dir, struct dentry *entry,
M
Miklos Szeredi 已提交
511
			    struct file *file, unsigned int flags,
512
			    umode_t mode)
M
Miklos Szeredi 已提交
513 514 515
{
	int err;
	struct inode *inode;
516
	struct fuse_mount *fm = get_fuse_mount(dir);
517
	FUSE_ARGS(args);
518
	struct fuse_forget_link *forget;
519
	struct fuse_create_in inarg;
M
Miklos Szeredi 已提交
520 521
	struct fuse_open_out outopen;
	struct fuse_entry_out outentry;
522
	struct fuse_inode *fi;
M
Miklos Szeredi 已提交
523 524
	struct fuse_file *ff;

525 526 527
	/* Userspace expects S_IFREG in create mode */
	BUG_ON((mode & S_IFMT) != S_IFREG);

528
	forget = fuse_alloc_forget();
529
	err = -ENOMEM;
530
	if (!forget)
531
		goto out_err;
532

533
	err = -ENOMEM;
534
	ff = fuse_file_alloc(fm);
M
Miklos Szeredi 已提交
535
	if (!ff)
536
		goto out_put_forget_req;
M
Miklos Szeredi 已提交
537

538
	if (!fm->fc->dont_mask)
539 540
		mode &= ~current_umask();

M
Miklos Szeredi 已提交
541 542
	flags &= ~O_NOCTTY;
	memset(&inarg, 0, sizeof(inarg));
543
	memset(&outentry, 0, sizeof(outentry));
M
Miklos Szeredi 已提交
544 545
	inarg.flags = flags;
	inarg.mode = mode;
546
	inarg.umask = current_umask();
547 548 549 550 551 552

	if (fm->fc->handle_killpriv_v2 && (flags & O_TRUNC) &&
	    !(flags & O_EXCL) && !capable(CAP_FSETID)) {
		inarg.open_flags |= FUSE_OPEN_KILL_SUIDGID;
	}

553 554 555 556 557 558 559 560 561 562 563 564
	args.opcode = FUSE_CREATE;
	args.nodeid = get_node_id(dir);
	args.in_numargs = 2;
	args.in_args[0].size = sizeof(inarg);
	args.in_args[0].value = &inarg;
	args.in_args[1].size = entry->d_name.len + 1;
	args.in_args[1].value = entry->d_name.name;
	args.out_numargs = 2;
	args.out_args[0].size = sizeof(outentry);
	args.out_args[0].value = &outentry;
	args.out_args[1].size = sizeof(outopen);
	args.out_args[1].value = &outopen;
565
	err = fuse_simple_request(fm, &args);
566
	if (err)
M
Miklos Szeredi 已提交
567 568 569
		goto out_free_ff;

	err = -EIO;
M
Miklos Szeredi 已提交
570 571
	if (!S_ISREG(outentry.attr.mode) || invalid_nodeid(outentry.nodeid) ||
	    fuse_invalid_attr(&outentry.attr))
M
Miklos Szeredi 已提交
572 573
		goto out_free_ff;

574 575 576
	ff->fh = outopen.fh;
	ff->nodeid = outentry.nodeid;
	ff->open_flags = outopen.open_flags;
M
Miklos Szeredi 已提交
577
	inode = fuse_iget(dir->i_sb, outentry.nodeid, outentry.generation,
578
			  &outentry.attr, entry_attr_timeout(&outentry), 0);
M
Miklos Szeredi 已提交
579 580
	if (!inode) {
		flags &= ~(O_CREAT | O_EXCL | O_TRUNC);
581
		fuse_sync_release(NULL, ff, flags);
582
		fuse_queue_forget(fm->fc, forget, outentry.nodeid, 1);
583 584
		err = -ENOMEM;
		goto out_err;
M
Miklos Szeredi 已提交
585
	}
586
	kfree(forget);
M
Miklos Szeredi 已提交
587
	d_instantiate(entry, inode);
588
	fuse_change_entry_timeout(entry, &outentry);
589
	fuse_dir_changed(dir);
590
	err = finish_open(file, entry, generic_file_open);
A
Al Viro 已提交
591
	if (err) {
592 593
		fi = get_fuse_inode(inode);
		fuse_sync_release(fi, ff, flags);
594
	} else {
595
		file->private_data = ff;
596
		fuse_finish_open(inode, file);
M
Miklos Szeredi 已提交
597
	}
A
Al Viro 已提交
598
	return err;
M
Miklos Szeredi 已提交
599

600
out_free_ff:
M
Miklos Szeredi 已提交
601
	fuse_file_free(ff);
602
out_put_forget_req:
603
	kfree(forget);
604
out_err:
A
Al Viro 已提交
605
	return err;
606 607
}

608 609
static int fuse_mknod(struct user_namespace *, struct inode *, struct dentry *,
		      umode_t, dev_t);
A
Al Viro 已提交
610
static int fuse_atomic_open(struct inode *dir, struct dentry *entry,
A
Al Viro 已提交
611
			    struct file *file, unsigned flags,
612
			    umode_t mode)
613 614 615 616 617
{
	int err;
	struct fuse_conn *fc = get_fuse_conn(dir);
	struct dentry *res = NULL;

M
Miklos Szeredi 已提交
618 619 620
	if (fuse_is_bad(dir))
		return -EIO;

621
	if (d_in_lookup(entry)) {
A
Al Viro 已提交
622
		res = fuse_lookup(dir, entry, 0);
623
		if (IS_ERR(res))
A
Al Viro 已提交
624
			return PTR_ERR(res);
625 626 627 628 629

		if (res)
			entry = res;
	}

630
	if (!(flags & O_CREAT) || d_really_is_positive(entry))
631 632 633
		goto no_open;

	/* Only creates */
634
	file->f_mode |= FMODE_CREATED;
635 636 637 638

	if (fc->no_create)
		goto mknod;

639
	err = fuse_create_open(dir, entry, file, flags, mode);
A
Al Viro 已提交
640
	if (err == -ENOSYS) {
641 642 643 644 645
		fc->no_create = 1;
		goto mknod;
	}
out_dput:
	dput(res);
A
Al Viro 已提交
646
	return err;
647 648

mknod:
649
	err = fuse_mknod(&init_user_ns, dir, entry, mode, 0);
A
Al Viro 已提交
650
	if (err)
651 652
		goto out_dput;
no_open:
A
Al Viro 已提交
653
	return finish_no_open(file, res);
M
Miklos Szeredi 已提交
654 655
}

656 657 658
/*
 * Code shared between mknod, mkdir, symlink and link
 */
659
static int create_new_entry(struct fuse_mount *fm, struct fuse_args *args,
660
			    struct inode *dir, struct dentry *entry,
A
Al Viro 已提交
661
			    umode_t mode)
662 663 664
{
	struct fuse_entry_out outarg;
	struct inode *inode;
A
Al Viro 已提交
665
	struct dentry *d;
666
	int err;
667
	struct fuse_forget_link *forget;
M
Miklos Szeredi 已提交
668

M
Miklos Szeredi 已提交
669 670 671
	if (fuse_is_bad(dir))
		return -EIO;

672
	forget = fuse_alloc_forget();
673
	if (!forget)
674
		return -ENOMEM;
675

676
	memset(&outarg, 0, sizeof(outarg));
677 678 679 680
	args->nodeid = get_node_id(dir);
	args->out_numargs = 1;
	args->out_args[0].size = sizeof(outarg);
	args->out_args[0].value = &outarg;
681
	err = fuse_simple_request(fm, args);
M
Miklos Szeredi 已提交
682 683 684
	if (err)
		goto out_put_forget_req;

685
	err = -EIO;
M
Miklos Szeredi 已提交
686
	if (invalid_nodeid(outarg.nodeid) || fuse_invalid_attr(&outarg.attr))
M
Miklos Szeredi 已提交
687
		goto out_put_forget_req;
688 689

	if ((outarg.attr.mode ^ mode) & S_IFMT)
M
Miklos Szeredi 已提交
690
		goto out_put_forget_req;
691

692
	inode = fuse_iget(dir->i_sb, outarg.nodeid, outarg.generation,
693
			  &outarg.attr, entry_attr_timeout(&outarg), 0);
694
	if (!inode) {
695
		fuse_queue_forget(fm->fc, forget, outarg.nodeid, 1);
696 697
		return -ENOMEM;
	}
698
	kfree(forget);
699

A
Al Viro 已提交
700 701 702 703
	d_drop(entry);
	d = d_splice_alias(inode, entry);
	if (IS_ERR(d))
		return PTR_ERR(d);
704

A
Al Viro 已提交
705 706 707 708 709 710
	if (d) {
		fuse_change_entry_timeout(d, &outarg);
		dput(d);
	} else {
		fuse_change_entry_timeout(entry, &outarg);
	}
711
	fuse_dir_changed(dir);
712
	return 0;
713

M
Miklos Szeredi 已提交
714
 out_put_forget_req:
715
	kfree(forget);
716
	return err;
717 718
}

719 720
static int fuse_mknod(struct user_namespace *mnt_userns, struct inode *dir,
		      struct dentry *entry, umode_t mode, dev_t rdev)
721 722
{
	struct fuse_mknod_in inarg;
723
	struct fuse_mount *fm = get_fuse_mount(dir);
724
	FUSE_ARGS(args);
725

726
	if (!fm->fc->dont_mask)
727 728
		mode &= ~current_umask();

729 730 731
	memset(&inarg, 0, sizeof(inarg));
	inarg.mode = mode;
	inarg.rdev = new_encode_dev(rdev);
732
	inarg.umask = current_umask();
733 734 735 736 737 738
	args.opcode = FUSE_MKNOD;
	args.in_numargs = 2;
	args.in_args[0].size = sizeof(inarg);
	args.in_args[0].value = &inarg;
	args.in_args[1].size = entry->d_name.len + 1;
	args.in_args[1].value = entry->d_name.name;
739
	return create_new_entry(fm, &args, dir, entry, mode);
740 741
}

742 743
static int fuse_create(struct user_namespace *mnt_userns, struct inode *dir,
		       struct dentry *entry, umode_t mode, bool excl)
744
{
745
	return fuse_mknod(&init_user_ns, dir, entry, mode, 0);
746 747
}

748 749
static int fuse_mkdir(struct user_namespace *mnt_userns, struct inode *dir,
		      struct dentry *entry, umode_t mode)
750 751
{
	struct fuse_mkdir_in inarg;
752
	struct fuse_mount *fm = get_fuse_mount(dir);
753
	FUSE_ARGS(args);
754

755
	if (!fm->fc->dont_mask)
756 757
		mode &= ~current_umask();

758 759
	memset(&inarg, 0, sizeof(inarg));
	inarg.mode = mode;
760
	inarg.umask = current_umask();
761 762 763 764 765 766
	args.opcode = FUSE_MKDIR;
	args.in_numargs = 2;
	args.in_args[0].size = sizeof(inarg);
	args.in_args[0].value = &inarg;
	args.in_args[1].size = entry->d_name.len + 1;
	args.in_args[1].value = entry->d_name.name;
767
	return create_new_entry(fm, &args, dir, entry, S_IFDIR);
768 769
}

770 771
static int fuse_symlink(struct user_namespace *mnt_userns, struct inode *dir,
			struct dentry *entry, const char *link)
772
{
773
	struct fuse_mount *fm = get_fuse_mount(dir);
774
	unsigned len = strlen(link) + 1;
775
	FUSE_ARGS(args);
776

777 778 779 780 781 782
	args.opcode = FUSE_SYMLINK;
	args.in_numargs = 2;
	args.in_args[0].size = entry->d_name.len + 1;
	args.in_args[0].value = entry->d_name.name;
	args.in_args[1].size = len;
	args.in_args[1].value = link;
783
	return create_new_entry(fm, &args, dir, entry, S_IFLNK);
784 785
}

S
Seth Forshee 已提交
786
void fuse_update_ctime(struct inode *inode)
M
Maxim Patlasov 已提交
787 788
{
	if (!IS_NOCMTIME(inode)) {
789
		inode->i_ctime = current_time(inode);
M
Maxim Patlasov 已提交
790 791 792 793
		mark_inode_dirty_sync(inode);
	}
}

794 795 796
static int fuse_unlink(struct inode *dir, struct dentry *entry)
{
	int err;
797
	struct fuse_mount *fm = get_fuse_mount(dir);
798 799
	FUSE_ARGS(args);

M
Miklos Szeredi 已提交
800 801 802
	if (fuse_is_bad(dir))
		return -EIO;

803 804 805 806 807
	args.opcode = FUSE_UNLINK;
	args.nodeid = get_node_id(dir);
	args.in_numargs = 1;
	args.in_args[0].size = entry->d_name.len + 1;
	args.in_args[0].value = entry->d_name.name;
808
	err = fuse_simple_request(fm, &args);
809
	if (!err) {
810
		struct inode *inode = d_inode(entry);
M
Miklos Szeredi 已提交
811
		struct fuse_inode *fi = get_fuse_inode(inode);
812

813
		spin_lock(&fi->lock);
814
		fi->attr_version = atomic64_inc_return(&fm->fc->attr_version);
815 816 817 818 819 820 821 822
		/*
		 * If i_nlink == 0 then unlink doesn't make sense, yet this can
		 * happen if userspace filesystem is careless.  It would be
		 * difficult to enforce correct nlink usage so just ignore this
		 * condition here
		 */
		if (inode->i_nlink > 0)
			drop_nlink(inode);
823
		spin_unlock(&fi->lock);
824
		fuse_invalidate_attr(inode);
825
		fuse_dir_changed(dir);
826
		fuse_invalidate_entry_cache(entry);
M
Maxim Patlasov 已提交
827
		fuse_update_ctime(inode);
828 829 830 831 832 833 834 835
	} else if (err == -EINTR)
		fuse_invalidate_entry(entry);
	return err;
}

static int fuse_rmdir(struct inode *dir, struct dentry *entry)
{
	int err;
836
	struct fuse_mount *fm = get_fuse_mount(dir);
837 838
	FUSE_ARGS(args);

M
Miklos Szeredi 已提交
839 840 841
	if (fuse_is_bad(dir))
		return -EIO;

842 843 844 845 846
	args.opcode = FUSE_RMDIR;
	args.nodeid = get_node_id(dir);
	args.in_numargs = 1;
	args.in_args[0].size = entry->d_name.len + 1;
	args.in_args[0].value = entry->d_name.name;
847
	err = fuse_simple_request(fm, &args);
848
	if (!err) {
849
		clear_nlink(d_inode(entry));
850
		fuse_dir_changed(dir);
851
		fuse_invalidate_entry_cache(entry);
852 853 854 855 856
	} else if (err == -EINTR)
		fuse_invalidate_entry(entry);
	return err;
}

M
Miklos Szeredi 已提交
857 858 859
static int fuse_rename_common(struct inode *olddir, struct dentry *oldent,
			      struct inode *newdir, struct dentry *newent,
			      unsigned int flags, int opcode, size_t argsize)
860 861
{
	int err;
M
Miklos Szeredi 已提交
862
	struct fuse_rename2_in inarg;
863
	struct fuse_mount *fm = get_fuse_mount(olddir);
864
	FUSE_ARGS(args);
865

M
Miklos Szeredi 已提交
866
	memset(&inarg, 0, argsize);
867
	inarg.newdir = get_node_id(newdir);
M
Miklos Szeredi 已提交
868
	inarg.flags = flags;
869 870 871 872 873 874 875 876 877
	args.opcode = opcode;
	args.nodeid = get_node_id(olddir);
	args.in_numargs = 3;
	args.in_args[0].size = argsize;
	args.in_args[0].value = &inarg;
	args.in_args[1].size = oldent->d_name.len + 1;
	args.in_args[1].value = oldent->d_name.name;
	args.in_args[2].size = newent->d_name.len + 1;
	args.in_args[2].value = newent->d_name.name;
878
	err = fuse_simple_request(fm, &args);
879
	if (!err) {
880
		/* ctime changes */
881 882
		fuse_invalidate_attr(d_inode(oldent));
		fuse_update_ctime(d_inode(oldent));
883

M
Miklos Szeredi 已提交
884
		if (flags & RENAME_EXCHANGE) {
885 886
			fuse_invalidate_attr(d_inode(newent));
			fuse_update_ctime(d_inode(newent));
M
Miklos Szeredi 已提交
887 888
		}

889
		fuse_dir_changed(olddir);
890
		if (olddir != newdir)
891
			fuse_dir_changed(newdir);
892 893

		/* newent will end up negative */
894 895
		if (!(flags & RENAME_EXCHANGE) && d_really_is_positive(newent)) {
			fuse_invalidate_attr(d_inode(newent));
896
			fuse_invalidate_entry_cache(newent);
897
			fuse_update_ctime(d_inode(newent));
M
Miklos Szeredi 已提交
898
		}
899 900 901 902 903 904 905
	} else if (err == -EINTR) {
		/* If request was interrupted, DEITY only knows if the
		   rename actually took place.  If the invalidation
		   fails (e.g. some process has CWD under the renamed
		   directory), then there can be inconsistency between
		   the dcache and the real filesystem.  Tough luck. */
		fuse_invalidate_entry(oldent);
906
		if (d_really_is_positive(newent))
907 908 909 910 911 912
			fuse_invalidate_entry(newent);
	}

	return err;
}

913 914 915
static int fuse_rename2(struct user_namespace *mnt_userns, struct inode *olddir,
			struct dentry *oldent, struct inode *newdir,
			struct dentry *newent, unsigned int flags)
M
Miklos Szeredi 已提交
916 917 918 919
{
	struct fuse_conn *fc = get_fuse_conn(olddir);
	int err;

M
Miklos Szeredi 已提交
920 921 922
	if (fuse_is_bad(olddir))
		return -EIO;

V
Vivek Goyal 已提交
923
	if (flags & ~(RENAME_NOREPLACE | RENAME_EXCHANGE | RENAME_WHITEOUT))
M
Miklos Szeredi 已提交
924 925
		return -EINVAL;

M
Miklos Szeredi 已提交
926 927 928
	if (flags) {
		if (fc->no_rename2 || fc->minor < 23)
			return -EINVAL;
M
Miklos Szeredi 已提交
929

M
Miklos Szeredi 已提交
930 931 932 933 934 935 936 937 938 939 940
		err = fuse_rename_common(olddir, oldent, newdir, newent, flags,
					 FUSE_RENAME2,
					 sizeof(struct fuse_rename2_in));
		if (err == -ENOSYS) {
			fc->no_rename2 = 1;
			err = -EINVAL;
		}
	} else {
		err = fuse_rename_common(olddir, oldent, newdir, newent, 0,
					 FUSE_RENAME,
					 sizeof(struct fuse_rename_in));
M
Miklos Szeredi 已提交
941
	}
M
Miklos Szeredi 已提交
942

M
Miklos Szeredi 已提交
943
	return err;
M
Miklos Szeredi 已提交
944
}
M
Miklos Szeredi 已提交
945

946 947 948 949 950
static int fuse_link(struct dentry *entry, struct inode *newdir,
		     struct dentry *newent)
{
	int err;
	struct fuse_link_in inarg;
951
	struct inode *inode = d_inode(entry);
952
	struct fuse_mount *fm = get_fuse_mount(inode);
953
	FUSE_ARGS(args);
954 955 956

	memset(&inarg, 0, sizeof(inarg));
	inarg.oldnodeid = get_node_id(inode);
957 958 959 960 961 962
	args.opcode = FUSE_LINK;
	args.in_numargs = 2;
	args.in_args[0].size = sizeof(inarg);
	args.in_args[0].value = &inarg;
	args.in_args[1].size = newent->d_name.len + 1;
	args.in_args[1].value = newent->d_name.name;
963
	err = create_new_entry(fm, &args, newdir, newent, inode->i_mode);
964 965 966 967 968 969
	/* Contrary to "normal" filesystems it can happen that link
	   makes two "logical" inodes point to the same "physical"
	   inode.  We invalidate the attributes of the old one, so it
	   will reflect changes in the backing inode (link count,
	   etc.)
	*/
M
Miklos Szeredi 已提交
970 971 972
	if (!err) {
		struct fuse_inode *fi = get_fuse_inode(inode);

973
		spin_lock(&fi->lock);
974
		fi->attr_version = atomic64_inc_return(&fm->fc->attr_version);
M
Miklos Szeredi 已提交
975 976
		if (likely(inode->i_nlink < UINT_MAX))
			inc_nlink(inode);
977
		spin_unlock(&fi->lock);
978
		fuse_invalidate_attr(inode);
M
Maxim Patlasov 已提交
979
		fuse_update_ctime(inode);
M
Miklos Szeredi 已提交
980 981 982
	} else if (err == -EINTR) {
		fuse_invalidate_attr(inode);
	}
983 984 985
	return err;
}

986 987 988
static void fuse_fillattr(struct inode *inode, struct fuse_attr *attr,
			  struct kstat *stat)
{
M
Miklos Szeredi 已提交
989
	unsigned int blkbits;
P
Pavel Emelyanov 已提交
990 991 992
	struct fuse_conn *fc = get_fuse_conn(inode);

	/* see the comment in fuse_change_attributes() */
M
Maxim Patlasov 已提交
993
	if (fc->writeback_cache && S_ISREG(inode->i_mode)) {
P
Pavel Emelyanov 已提交
994
		attr->size = i_size_read(inode);
M
Maxim Patlasov 已提交
995 996
		attr->mtime = inode->i_mtime.tv_sec;
		attr->mtimensec = inode->i_mtime.tv_nsec;
M
Maxim Patlasov 已提交
997 998
		attr->ctime = inode->i_ctime.tv_sec;
		attr->ctimensec = inode->i_ctime.tv_nsec;
M
Maxim Patlasov 已提交
999
	}
M
Miklos Szeredi 已提交
1000

1001 1002 1003 1004
	stat->dev = inode->i_sb->s_dev;
	stat->ino = attr->ino;
	stat->mode = (inode->i_mode & S_IFMT) | (attr->mode & 07777);
	stat->nlink = attr->nlink;
1005 1006
	stat->uid = make_kuid(fc->user_ns, attr->uid);
	stat->gid = make_kgid(fc->user_ns, attr->gid);
1007 1008 1009 1010 1011 1012 1013 1014 1015
	stat->rdev = inode->i_rdev;
	stat->atime.tv_sec = attr->atime;
	stat->atime.tv_nsec = attr->atimensec;
	stat->mtime.tv_sec = attr->mtime;
	stat->mtime.tv_nsec = attr->mtimensec;
	stat->ctime.tv_sec = attr->ctime;
	stat->ctime.tv_nsec = attr->ctimensec;
	stat->size = attr->size;
	stat->blocks = attr->blocks;
M
Miklos Szeredi 已提交
1016 1017 1018 1019 1020 1021 1022

	if (attr->blksize != 0)
		blkbits = ilog2(attr->blksize);
	else
		blkbits = inode->i_sb->s_blocksize_bits;

	stat->blksize = 1 << blkbits;
1023 1024
}

1025 1026
static int fuse_do_getattr(struct inode *inode, struct kstat *stat,
			   struct file *file)
1027 1028
{
	int err;
1029 1030
	struct fuse_getattr_in inarg;
	struct fuse_attr_out outarg;
1031
	struct fuse_mount *fm = get_fuse_mount(inode);
1032
	FUSE_ARGS(args);
1033 1034
	u64 attr_version;

1035
	attr_version = fuse_get_attr_version(fm->fc);
1036

1037
	memset(&inarg, 0, sizeof(inarg));
1038
	memset(&outarg, 0, sizeof(outarg));
1039 1040 1041 1042 1043 1044 1045
	/* Directories have separate file-handle space */
	if (file && S_ISREG(inode->i_mode)) {
		struct fuse_file *ff = file->private_data;

		inarg.getattr_flags |= FUSE_GETATTR_FH;
		inarg.fh = ff->fh;
	}
1046 1047 1048 1049 1050 1051 1052 1053
	args.opcode = FUSE_GETATTR;
	args.nodeid = get_node_id(inode);
	args.in_numargs = 1;
	args.in_args[0].size = sizeof(inarg);
	args.in_args[0].value = &inarg;
	args.out_numargs = 1;
	args.out_args[0].size = sizeof(outarg);
	args.out_args[0].value = &outarg;
1054
	err = fuse_simple_request(fm, &args);
1055
	if (!err) {
M
Miklos Szeredi 已提交
1056 1057
		if (fuse_invalid_attr(&outarg.attr) ||
		    (inode->i_mode ^ outarg.attr.mode) & S_IFMT) {
M
Miklos Szeredi 已提交
1058
			fuse_make_bad(inode);
1059 1060
			err = -EIO;
		} else {
1061 1062
			fuse_change_attributes(inode, &outarg.attr,
					       attr_timeout(&outarg),
1063 1064
					       attr_version);
			if (stat)
1065
				fuse_fillattr(inode, &outarg.attr, stat);
1066 1067 1068 1069 1070
		}
	}
	return err;
}

M
Miklos Szeredi 已提交
1071
static int fuse_update_get_attr(struct inode *inode, struct file *file,
1072 1073
				struct kstat *stat, u32 request_mask,
				unsigned int flags)
M
Miklos Szeredi 已提交
1074 1075
{
	struct fuse_inode *fi = get_fuse_inode(inode);
M
Miklos Szeredi 已提交
1076
	int err = 0;
M
Miklos Szeredi 已提交
1077
	bool sync;
M
Miklos Szeredi 已提交
1078

M
Miklos Szeredi 已提交
1079 1080 1081 1082
	if (flags & AT_STATX_FORCE_SYNC)
		sync = true;
	else if (flags & AT_STATX_DONT_SYNC)
		sync = false;
1083 1084
	else if (request_mask & READ_ONCE(fi->inval_mask))
		sync = true;
M
Miklos Szeredi 已提交
1085 1086 1087 1088
	else
		sync = time_before64(fi->i_time, get_jiffies_64());

	if (sync) {
S
Seth Forshee 已提交
1089
		forget_all_cached_acls(inode);
M
Miklos Szeredi 已提交
1090
		err = fuse_do_getattr(inode, stat, file);
M
Miklos Szeredi 已提交
1091
	} else if (stat) {
C
Christian Brauner 已提交
1092
		generic_fillattr(&init_user_ns, inode, stat);
M
Miklos Szeredi 已提交
1093 1094
		stat->mode = fi->orig_i_mode;
		stat->ino = fi->orig_ino;
M
Miklos Szeredi 已提交
1095 1096 1097 1098 1099
	}

	return err;
}

M
Miklos Szeredi 已提交
1100 1101
int fuse_update_attributes(struct inode *inode, struct file *file)
{
1102 1103 1104
	/* Do *not* need to get atime for internal purposes */
	return fuse_update_get_attr(inode, file, NULL,
				    STATX_BASIC_STATS & ~STATX_ATIME, 0);
M
Miklos Szeredi 已提交
1105 1106
}

1107
int fuse_reverse_inval_entry(struct fuse_conn *fc, u64 parent_nodeid,
1108
			     u64 child_nodeid, struct qstr *name)
J
John Muir 已提交
1109 1110 1111 1112 1113 1114
{
	int err = -ENOTDIR;
	struct inode *parent;
	struct dentry *dir;
	struct dentry *entry;

1115
	parent = fuse_ilookup(fc, parent_nodeid, NULL);
J
John Muir 已提交
1116 1117 1118
	if (!parent)
		return -ENOENT;

A
Al Viro 已提交
1119
	inode_lock(parent);
J
John Muir 已提交
1120 1121 1122 1123 1124 1125 1126 1127
	if (!S_ISDIR(parent->i_mode))
		goto unlock;

	err = -ENOENT;
	dir = d_find_alias(parent);
	if (!dir)
		goto unlock;

1128
	name->hash = full_name_hash(dir, name->name, name->len);
J
John Muir 已提交
1129 1130 1131 1132 1133
	entry = d_lookup(dir, name);
	dput(dir);
	if (!entry)
		goto unlock;

1134
	fuse_dir_changed(parent);
J
John Muir 已提交
1135
	fuse_invalidate_entry(entry);
1136

1137
	if (child_nodeid != 0 && d_really_is_positive(entry)) {
A
Al Viro 已提交
1138
		inode_lock(d_inode(entry));
1139
		if (get_node_id(d_inode(entry)) != child_nodeid) {
1140 1141 1142 1143 1144 1145 1146
			err = -ENOENT;
			goto badentry;
		}
		if (d_mountpoint(entry)) {
			err = -EBUSY;
			goto badentry;
		}
1147
		if (d_is_dir(entry)) {
1148 1149 1150 1151 1152
			shrink_dcache_parent(entry);
			if (!simple_empty(entry)) {
				err = -ENOTEMPTY;
				goto badentry;
			}
1153
			d_inode(entry)->i_flags |= S_DEAD;
1154 1155
		}
		dont_mount(entry);
1156
		clear_nlink(d_inode(entry));
1157 1158
		err = 0;
 badentry:
A
Al Viro 已提交
1159
		inode_unlock(d_inode(entry));
1160 1161 1162 1163 1164
		if (!err)
			d_delete(entry);
	} else {
		err = 0;
	}
J
John Muir 已提交
1165 1166 1167
	dput(entry);

 unlock:
A
Al Viro 已提交
1168
	inode_unlock(parent);
J
John Muir 已提交
1169 1170 1171 1172
	iput(parent);
	return err;
}

1173 1174
/*
 * Calling into a user-controlled filesystem gives the filesystem
1175
 * daemon ptrace-like capabilities over the current process.  This
1176 1177 1178 1179 1180 1181 1182 1183 1184 1185
 * means, that the filesystem daemon is able to record the exact
 * filesystem operations performed, and can also control the behavior
 * of the requester process in otherwise impossible ways.  For example
 * it can delay the operation for arbitrary length of time allowing
 * DoS against the requester.
 *
 * For this reason only those processes can call into the filesystem,
 * for which the owner of the mount has ptrace privilege.  This
 * excludes processes started by other users, suid or sgid processes.
 */
1186
int fuse_allow_current_process(struct fuse_conn *fc)
1187
{
1188
	const struct cred *cred;
1189

M
Miklos Szeredi 已提交
1190
	if (fc->allow_other)
1191
		return current_in_userns(fc->user_ns);
1192

1193
	cred = current_cred();
1194 1195 1196 1197 1198 1199
	if (uid_eq(cred->euid, fc->user_id) &&
	    uid_eq(cred->suid, fc->user_id) &&
	    uid_eq(cred->uid,  fc->user_id) &&
	    gid_eq(cred->egid, fc->group_id) &&
	    gid_eq(cred->sgid, fc->group_id) &&
	    gid_eq(cred->gid,  fc->group_id))
1200
		return 1;
1201

1202
	return 0;
1203 1204
}

M
Miklos Szeredi 已提交
1205 1206
static int fuse_access(struct inode *inode, int mask)
{
1207
	struct fuse_mount *fm = get_fuse_mount(inode);
1208
	FUSE_ARGS(args);
M
Miklos Szeredi 已提交
1209 1210 1211
	struct fuse_access_in inarg;
	int err;

1212 1213
	BUG_ON(mask & MAY_NOT_BLOCK);

1214
	if (fm->fc->no_access)
M
Miklos Szeredi 已提交
1215 1216 1217
		return 0;

	memset(&inarg, 0, sizeof(inarg));
1218
	inarg.mask = mask & (MAY_READ | MAY_WRITE | MAY_EXEC);
1219 1220 1221 1222 1223
	args.opcode = FUSE_ACCESS;
	args.nodeid = get_node_id(inode);
	args.in_numargs = 1;
	args.in_args[0].size = sizeof(inarg);
	args.in_args[0].value = &inarg;
1224
	err = fuse_simple_request(fm, &args);
M
Miklos Szeredi 已提交
1225
	if (err == -ENOSYS) {
1226
		fm->fc->no_access = 1;
M
Miklos Szeredi 已提交
1227 1228 1229 1230 1231
		err = 0;
	}
	return err;
}

1232
static int fuse_perm_getattr(struct inode *inode, int mask)
1233
{
1234
	if (mask & MAY_NOT_BLOCK)
1235 1236
		return -ECHILD;

S
Seth Forshee 已提交
1237
	forget_all_cached_acls(inode);
1238 1239 1240
	return fuse_do_getattr(inode, NULL, NULL);
}

1241 1242 1243 1244 1245 1246 1247 1248 1249 1250 1251 1252 1253
/*
 * Check permission.  The two basic access models of FUSE are:
 *
 * 1) Local access checking ('default_permissions' mount option) based
 * on file mode.  This is the plain old disk filesystem permission
 * modell.
 *
 * 2) "Remote" access checking, where server is responsible for
 * checking permission in each inode operation.  An exception to this
 * is if ->permission() was invoked from sys_access() in which case an
 * access request is sent.  Execute permission is still checked
 * locally based on file mode.
 */
1254 1255
static int fuse_permission(struct user_namespace *mnt_userns,
			   struct inode *inode, int mask)
1256 1257
{
	struct fuse_conn *fc = get_fuse_conn(inode);
1258 1259
	bool refreshed = false;
	int err = 0;
1260

M
Miklos Szeredi 已提交
1261 1262 1263
	if (fuse_is_bad(inode))
		return -EIO;

1264
	if (!fuse_allow_current_process(fc))
1265
		return -EACCES;
1266 1267

	/*
1268
	 * If attributes are needed, refresh them before proceeding
1269
	 */
M
Miklos Szeredi 已提交
1270
	if (fc->default_permissions ||
1271
	    ((mask & MAY_EXEC) && S_ISREG(inode->i_mode))) {
1272
		struct fuse_inode *fi = get_fuse_inode(inode);
1273
		u32 perm_mask = STATX_MODE | STATX_UID | STATX_GID;
1274

1275 1276
		if (perm_mask & READ_ONCE(fi->inval_mask) ||
		    time_before64(fi->i_time, get_jiffies_64())) {
1277 1278
			refreshed = true;

1279
			err = fuse_perm_getattr(inode, mask);
1280 1281 1282
			if (err)
				return err;
		}
1283 1284
	}

M
Miklos Szeredi 已提交
1285
	if (fc->default_permissions) {
1286
		err = generic_permission(&init_user_ns, inode, mask);
M
Miklos Szeredi 已提交
1287 1288 1289 1290

		/* If permission is denied, try to refresh file
		   attributes.  This is also needed, because the root
		   node will at first have no permissions */
1291
		if (err == -EACCES && !refreshed) {
1292
			err = fuse_perm_getattr(inode, mask);
M
Miklos Szeredi 已提交
1293
			if (!err)
1294 1295
				err = generic_permission(&init_user_ns,
							 inode, mask);
M
Miklos Szeredi 已提交
1296 1297
		}

1298 1299 1300 1301
		/* Note: the opposite of the above test does not
		   exist.  So if permissions are revoked this won't be
		   noticed immediately, only after the attribute
		   timeout has expired */
E
Eric Paris 已提交
1302
	} else if (mask & (MAY_ACCESS | MAY_CHDIR)) {
1303 1304 1305 1306 1307 1308
		err = fuse_access(inode, mask);
	} else if ((mask & MAY_EXEC) && S_ISREG(inode->i_mode)) {
		if (!(inode->i_mode & S_IXUGO)) {
			if (refreshed)
				return -EACCES;

1309
			err = fuse_perm_getattr(inode, mask);
1310 1311 1312
			if (!err && !(inode->i_mode & S_IXUGO))
				return -EACCES;
		}
1313
	}
1314
	return err;
1315 1316
}

D
Dan Schatzberg 已提交
1317
static int fuse_readlink_page(struct inode *inode, struct page *page)
1318
{
1319
	struct fuse_mount *fm = get_fuse_mount(inode);
1320 1321 1322 1323 1324 1325 1326 1327 1328 1329 1330 1331 1332 1333 1334 1335
	struct fuse_page_desc desc = { .length = PAGE_SIZE - 1 };
	struct fuse_args_pages ap = {
		.num_pages = 1,
		.pages = &page,
		.descs = &desc,
	};
	char *link;
	ssize_t res;

	ap.args.opcode = FUSE_READLINK;
	ap.args.nodeid = get_node_id(inode);
	ap.args.out_pages = true;
	ap.args.out_argvar = true;
	ap.args.page_zeroing = true;
	ap.args.out_numargs = 1;
	ap.args.out_args[0].size = desc.length;
1336
	res = fuse_simple_request(fm, &ap.args);
1337

1338
	fuse_invalidate_atime(inode);
1339

1340 1341
	if (res < 0)
		return res;
1342

1343 1344
	if (WARN_ON(res >= PAGE_SIZE))
		return -EIO;
D
Dan Schatzberg 已提交
1345

1346 1347
	link = page_address(page);
	link[res] = '\0';
D
Dan Schatzberg 已提交
1348

1349
	return 0;
D
Dan Schatzberg 已提交
1350 1351 1352 1353 1354 1355 1356 1357 1358 1359
}

static const char *fuse_get_link(struct dentry *dentry, struct inode *inode,
				 struct delayed_call *callback)
{
	struct fuse_conn *fc = get_fuse_conn(inode);
	struct page *page;
	int err;

	err = -EIO;
M
Miklos Szeredi 已提交
1360
	if (fuse_is_bad(inode))
D
Dan Schatzberg 已提交
1361 1362 1363 1364 1365 1366 1367 1368 1369 1370 1371 1372 1373 1374 1375 1376 1377 1378 1379 1380 1381 1382 1383 1384 1385 1386
		goto out_err;

	if (fc->cache_symlinks)
		return page_get_link(dentry, inode, callback);

	err = -ECHILD;
	if (!dentry)
		goto out_err;

	page = alloc_page(GFP_KERNEL);
	err = -ENOMEM;
	if (!page)
		goto out_err;

	err = fuse_readlink_page(inode, page);
	if (err) {
		__free_page(page);
		goto out_err;
	}

	set_delayed_call(callback, page_put_link, page);

	return page_address(page);

out_err:
	return ERR_PTR(err);
1387 1388 1389 1390
}

static int fuse_dir_open(struct inode *inode, struct file *file)
{
1391
	return fuse_open_common(inode, file, true);
1392 1393 1394 1395
}

static int fuse_dir_release(struct inode *inode, struct file *file)
{
1396
	fuse_release_common(file, true);
1397 1398

	return 0;
1399 1400
}

1401 1402
static int fuse_dir_fsync(struct file *file, loff_t start, loff_t end,
			  int datasync)
1403
{
M
Miklos Szeredi 已提交
1404 1405 1406 1407
	struct inode *inode = file->f_mapping->host;
	struct fuse_conn *fc = get_fuse_conn(inode);
	int err;

M
Miklos Szeredi 已提交
1408
	if (fuse_is_bad(inode))
M
Miklos Szeredi 已提交
1409 1410 1411 1412 1413 1414 1415 1416 1417 1418 1419 1420 1421 1422
		return -EIO;

	if (fc->no_fsyncdir)
		return 0;

	inode_lock(inode);
	err = fuse_fsync_common(file, start, end, datasync, FUSE_FSYNCDIR);
	if (err == -ENOSYS) {
		fc->no_fsyncdir = 1;
		err = 0;
	}
	inode_unlock(inode);

	return err;
1423 1424
}

1425 1426 1427 1428 1429 1430 1431 1432 1433 1434 1435 1436 1437 1438 1439 1440 1441 1442 1443 1444 1445 1446 1447 1448
static long fuse_dir_ioctl(struct file *file, unsigned int cmd,
			    unsigned long arg)
{
	struct fuse_conn *fc = get_fuse_conn(file->f_mapping->host);

	/* FUSE_IOCTL_DIR only supported for API version >= 7.18 */
	if (fc->minor < 18)
		return -ENOTTY;

	return fuse_ioctl_common(file, cmd, arg, FUSE_IOCTL_DIR);
}

static long fuse_dir_compat_ioctl(struct file *file, unsigned int cmd,
				   unsigned long arg)
{
	struct fuse_conn *fc = get_fuse_conn(file->f_mapping->host);

	if (fc->minor < 18)
		return -ENOTTY;

	return fuse_ioctl_common(file, cmd, arg,
				 FUSE_IOCTL_COMPAT | FUSE_IOCTL_DIR);
}

M
Maxim Patlasov 已提交
1449
static bool update_mtime(unsigned ivalid, bool trust_local_mtime)
M
Miklos Szeredi 已提交
1450 1451 1452 1453 1454
{
	/* Always update if mtime is explicitly set  */
	if (ivalid & ATTR_MTIME_SET)
		return true;

M
Maxim Patlasov 已提交
1455 1456 1457 1458
	/* Or if kernel i_mtime is the official one */
	if (trust_local_mtime)
		return true;

M
Miklos Szeredi 已提交
1459 1460 1461 1462 1463 1464 1465 1466
	/* If it's an open(O_TRUNC) or an ftruncate(), don't update */
	if ((ivalid & ATTR_SIZE) && (ivalid & (ATTR_OPEN | ATTR_FILE)))
		return false;

	/* In all other cases update */
	return true;
}

1467 1468
static void iattr_to_fattr(struct fuse_conn *fc, struct iattr *iattr,
			   struct fuse_setattr_in *arg, bool trust_local_cmtime)
1469 1470 1471 1472
{
	unsigned ivalid = iattr->ia_valid;

	if (ivalid & ATTR_MODE)
1473
		arg->valid |= FATTR_MODE,   arg->mode = iattr->ia_mode;
1474
	if (ivalid & ATTR_UID)
1475
		arg->valid |= FATTR_UID,    arg->uid = from_kuid(fc->user_ns, iattr->ia_uid);
1476
	if (ivalid & ATTR_GID)
1477
		arg->valid |= FATTR_GID,    arg->gid = from_kgid(fc->user_ns, iattr->ia_gid);
1478
	if (ivalid & ATTR_SIZE)
1479
		arg->valid |= FATTR_SIZE,   arg->size = iattr->ia_size;
M
Miklos Szeredi 已提交
1480 1481
	if (ivalid & ATTR_ATIME) {
		arg->valid |= FATTR_ATIME;
1482
		arg->atime = iattr->ia_atime.tv_sec;
M
Miklos Szeredi 已提交
1483 1484 1485 1486
		arg->atimensec = iattr->ia_atime.tv_nsec;
		if (!(ivalid & ATTR_ATIME_SET))
			arg->valid |= FATTR_ATIME_NOW;
	}
1487
	if ((ivalid & ATTR_MTIME) && update_mtime(ivalid, trust_local_cmtime)) {
M
Miklos Szeredi 已提交
1488
		arg->valid |= FATTR_MTIME;
1489
		arg->mtime = iattr->ia_mtime.tv_sec;
M
Miklos Szeredi 已提交
1490
		arg->mtimensec = iattr->ia_mtime.tv_nsec;
1491
		if (!(ivalid & ATTR_MTIME_SET) && !trust_local_cmtime)
M
Miklos Szeredi 已提交
1492
			arg->valid |= FATTR_MTIME_NOW;
1493
	}
1494 1495 1496 1497 1498
	if ((ivalid & ATTR_CTIME) && trust_local_cmtime) {
		arg->valid |= FATTR_CTIME;
		arg->ctime = iattr->ia_ctime.tv_sec;
		arg->ctimensec = iattr->ia_ctime.tv_nsec;
	}
1499 1500
}

M
Miklos Szeredi 已提交
1501 1502 1503 1504 1505 1506 1507 1508 1509 1510
/*
 * Prevent concurrent writepages on inode
 *
 * This is done by adding a negative bias to the inode write counter
 * and waiting for all pending writes to finish.
 */
void fuse_set_nowrite(struct inode *inode)
{
	struct fuse_inode *fi = get_fuse_inode(inode);

A
Al Viro 已提交
1511
	BUG_ON(!inode_is_locked(inode));
M
Miklos Szeredi 已提交
1512

1513
	spin_lock(&fi->lock);
M
Miklos Szeredi 已提交
1514 1515
	BUG_ON(fi->writectr < 0);
	fi->writectr += FUSE_NOWRITE;
1516
	spin_unlock(&fi->lock);
M
Miklos Szeredi 已提交
1517 1518 1519 1520 1521 1522 1523 1524 1525 1526 1527 1528 1529 1530 1531 1532 1533 1534 1535 1536
	wait_event(fi->page_waitq, fi->writectr == FUSE_NOWRITE);
}

/*
 * Allow writepages on inode
 *
 * Remove the bias from the writecounter and send any queued
 * writepages.
 */
static void __fuse_release_nowrite(struct inode *inode)
{
	struct fuse_inode *fi = get_fuse_inode(inode);

	BUG_ON(fi->writectr != FUSE_NOWRITE);
	fi->writectr = 0;
	fuse_flush_writepages(inode);
}

void fuse_release_nowrite(struct inode *inode)
{
1537
	struct fuse_inode *fi = get_fuse_inode(inode);
M
Miklos Szeredi 已提交
1538

1539
	spin_lock(&fi->lock);
M
Miklos Szeredi 已提交
1540
	__fuse_release_nowrite(inode);
1541
	spin_unlock(&fi->lock);
M
Miklos Szeredi 已提交
1542 1543
}

1544
static void fuse_setattr_fill(struct fuse_conn *fc, struct fuse_args *args,
M
Maxim Patlasov 已提交
1545 1546 1547 1548
			      struct inode *inode,
			      struct fuse_setattr_in *inarg_p,
			      struct fuse_attr_out *outarg_p)
{
1549 1550 1551 1552 1553 1554 1555 1556
	args->opcode = FUSE_SETATTR;
	args->nodeid = get_node_id(inode);
	args->in_numargs = 1;
	args->in_args[0].size = sizeof(*inarg_p);
	args->in_args[0].value = inarg_p;
	args->out_numargs = 1;
	args->out_args[0].size = sizeof(*outarg_p);
	args->out_args[0].value = outarg_p;
M
Maxim Patlasov 已提交
1557 1558 1559 1560 1561
}

/*
 * Flush inode->i_mtime to the server
 */
1562
int fuse_flush_times(struct inode *inode, struct fuse_file *ff)
M
Maxim Patlasov 已提交
1563
{
1564
	struct fuse_mount *fm = get_fuse_mount(inode);
1565
	FUSE_ARGS(args);
M
Maxim Patlasov 已提交
1566 1567 1568 1569 1570 1571
	struct fuse_setattr_in inarg;
	struct fuse_attr_out outarg;

	memset(&inarg, 0, sizeof(inarg));
	memset(&outarg, 0, sizeof(outarg));

1572
	inarg.valid = FATTR_MTIME;
M
Maxim Patlasov 已提交
1573 1574
	inarg.mtime = inode->i_mtime.tv_sec;
	inarg.mtimensec = inode->i_mtime.tv_nsec;
1575
	if (fm->fc->minor >= 23) {
1576 1577 1578 1579
		inarg.valid |= FATTR_CTIME;
		inarg.ctime = inode->i_ctime.tv_sec;
		inarg.ctimensec = inode->i_ctime.tv_nsec;
	}
M
Miklos Szeredi 已提交
1580 1581 1582 1583
	if (ff) {
		inarg.valid |= FATTR_FH;
		inarg.fh = ff->fh;
	}
1584
	fuse_setattr_fill(fm->fc, &args, inode, &inarg, &outarg);
M
Maxim Patlasov 已提交
1585

1586
	return fuse_simple_request(fm, &args);
M
Maxim Patlasov 已提交
1587 1588
}

1589 1590 1591 1592 1593
/*
 * Set attributes, and at the same time refresh them.
 *
 * Truncation is slightly complicated, because the 'truncate' request
 * may fail, in which case we don't want to touch the mapping.
M
Miklos Szeredi 已提交
1594 1595
 * vmtruncate() doesn't allow for this case, so do the rlimit checking
 * and the actual truncation by hand.
1596
 */
1597
int fuse_do_setattr(struct dentry *dentry, struct iattr *attr,
1598
		    struct file *file)
1599
{
1600
	struct inode *inode = d_inode(dentry);
1601 1602
	struct fuse_mount *fm = get_fuse_mount(inode);
	struct fuse_conn *fc = fm->fc;
1603
	struct fuse_inode *fi = get_fuse_inode(inode);
1604
	FUSE_ARGS(args);
1605 1606
	struct fuse_setattr_in inarg;
	struct fuse_attr_out outarg;
M
Miklos Szeredi 已提交
1607
	bool is_truncate = false;
P
Pavel Emelyanov 已提交
1608
	bool is_wb = fc->writeback_cache;
M
Miklos Szeredi 已提交
1609
	loff_t oldsize;
1610
	int err;
1611
	bool trust_local_cmtime = is_wb && S_ISREG(inode->i_mode);
1612
	bool fault_blocked = false;
1613

M
Miklos Szeredi 已提交
1614
	if (!fc->default_permissions)
1615 1616
		attr->ia_valid |= ATTR_FORCE;

C
Christian Brauner 已提交
1617
	err = setattr_prepare(&init_user_ns, dentry, attr);
1618 1619
	if (err)
		return err;
M
Miklos Szeredi 已提交
1620

1621 1622 1623 1624 1625 1626 1627 1628 1629 1630 1631 1632 1633 1634 1635 1636
	if (attr->ia_valid & ATTR_SIZE) {
		if (WARN_ON(!S_ISREG(inode->i_mode)))
			return -EIO;
		is_truncate = true;
	}

	if (FUSE_IS_DAX(inode) && is_truncate) {
		down_write(&fi->i_mmap_sem);
		fault_blocked = true;
		err = fuse_dax_break_layouts(inode, 0, 0);
		if (err) {
			up_write(&fi->i_mmap_sem);
			return err;
		}
	}

M
Miklos Szeredi 已提交
1637
	if (attr->ia_valid & ATTR_OPEN) {
1638 1639 1640 1641 1642 1643 1644 1645 1646 1647 1648
		/* This is coming from open(..., ... | O_TRUNC); */
		WARN_ON(!(attr->ia_valid & ATTR_SIZE));
		WARN_ON(attr->ia_size != 0);
		if (fc->atomic_o_trunc) {
			/*
			 * No need to send request to userspace, since actual
			 * truncation has already been done by OPEN.  But still
			 * need to truncate page cache.
			 */
			i_size_write(inode, 0);
			truncate_pagecache(inode, 0);
1649
			goto out;
1650
		}
M
Miklos Szeredi 已提交
1651 1652
		file = NULL;
	}
1653

1654 1655 1656 1657 1658 1659 1660 1661 1662 1663 1664 1665 1666
	/* Flush dirty data/metadata before non-truncate SETATTR */
	if (is_wb && S_ISREG(inode->i_mode) &&
	    attr->ia_valid &
			(ATTR_MODE | ATTR_UID | ATTR_GID | ATTR_MTIME_SET |
			 ATTR_TIMES_SET)) {
		err = write_inode_now(inode, true);
		if (err)
			return err;

		fuse_set_nowrite(inode);
		fuse_release_nowrite(inode);
	}

1667
	if (is_truncate) {
M
Miklos Szeredi 已提交
1668
		fuse_set_nowrite(inode);
1669
		set_bit(FUSE_I_SIZE_UNSTABLE, &fi->state);
1670 1671
		if (trust_local_cmtime && attr->ia_size != inode->i_size)
			attr->ia_valid |= ATTR_MTIME | ATTR_CTIME;
1672
	}
M
Miklos Szeredi 已提交
1673

1674
	memset(&inarg, 0, sizeof(inarg));
1675
	memset(&outarg, 0, sizeof(outarg));
1676
	iattr_to_fattr(fc, attr, &inarg, trust_local_cmtime);
1677 1678 1679 1680 1681
	if (file) {
		struct fuse_file *ff = file->private_data;
		inarg.valid |= FATTR_FH;
		inarg.fh = ff->fh;
	}
1682 1683 1684 1685 1686 1687

	/* Kill suid/sgid for non-directory chown unconditionally */
	if (fc->handle_killpriv_v2 && !S_ISDIR(inode->i_mode) &&
	    attr->ia_valid & (ATTR_UID | ATTR_GID))
		inarg.valid |= FATTR_KILL_SUIDGID;

1688 1689 1690 1691
	if (attr->ia_valid & ATTR_SIZE) {
		/* For mandatory locking in truncate */
		inarg.valid |= FATTR_LOCKOWNER;
		inarg.lock_owner = fuse_lock_owner_id(fc, current->files);
1692 1693 1694 1695

		/* Kill suid/sgid for truncate only if no CAP_FSETID */
		if (fc->handle_killpriv_v2 && !capable(CAP_FSETID))
			inarg.valid |= FATTR_KILL_SUIDGID;
1696
	}
1697
	fuse_setattr_fill(fc, &args, inode, &inarg, &outarg);
1698
	err = fuse_simple_request(fm, &args);
1699 1700 1701
	if (err) {
		if (err == -EINTR)
			fuse_invalidate_attr(inode);
M
Miklos Szeredi 已提交
1702
		goto error;
1703
	}
1704

M
Miklos Szeredi 已提交
1705 1706
	if (fuse_invalid_attr(&outarg.attr) ||
	    (inode->i_mode ^ outarg.attr.mode) & S_IFMT) {
M
Miklos Szeredi 已提交
1707
		fuse_make_bad(inode);
M
Miklos Szeredi 已提交
1708 1709 1710 1711
		err = -EIO;
		goto error;
	}

1712
	spin_lock(&fi->lock);
M
Maxim Patlasov 已提交
1713
	/* the kernel maintains i_mtime locally */
1714 1715 1716 1717 1718
	if (trust_local_cmtime) {
		if (attr->ia_valid & ATTR_MTIME)
			inode->i_mtime = attr->ia_mtime;
		if (attr->ia_valid & ATTR_CTIME)
			inode->i_ctime = attr->ia_ctime;
M
Miklos Szeredi 已提交
1719
		/* FIXME: clear I_DIRTY_SYNC? */
M
Maxim Patlasov 已提交
1720 1721
	}

M
Miklos Szeredi 已提交
1722 1723 1724
	fuse_change_attributes_common(inode, &outarg.attr,
				      attr_timeout(&outarg));
	oldsize = inode->i_size;
P
Pavel Emelyanov 已提交
1725 1726 1727
	/* see the comment in fuse_change_attributes() */
	if (!is_wb || is_truncate || !S_ISREG(inode->i_mode))
		i_size_write(inode, outarg.attr.size);
M
Miklos Szeredi 已提交
1728 1729

	if (is_truncate) {
1730
		/* NOTE: this may release/reacquire fi->lock */
M
Miklos Szeredi 已提交
1731 1732
		__fuse_release_nowrite(inode);
	}
1733
	spin_unlock(&fi->lock);
M
Miklos Szeredi 已提交
1734 1735 1736 1737 1738

	/*
	 * Only call invalidate_inode_pages2() after removing
	 * FUSE_NOWRITE, otherwise fuse_launder_page() would deadlock.
	 */
P
Pavel Emelyanov 已提交
1739 1740
	if ((is_truncate || !is_wb) &&
	    S_ISREG(inode->i_mode) && oldsize != outarg.attr.size) {
1741
		truncate_pagecache(inode, outarg.attr.size);
M
Miklos Szeredi 已提交
1742
		invalidate_inode_pages2(inode->i_mapping);
1743 1744
	}

1745
	clear_bit(FUSE_I_SIZE_UNSTABLE, &fi->state);
1746 1747 1748 1749
out:
	if (fault_blocked)
		up_write(&fi->i_mmap_sem);

1750
	return 0;
M
Miklos Szeredi 已提交
1751 1752 1753 1754 1755

error:
	if (is_truncate)
		fuse_release_nowrite(inode);

1756
	clear_bit(FUSE_I_SIZE_UNSTABLE, &fi->state);
1757 1758 1759

	if (fault_blocked)
		up_write(&fi->i_mmap_sem);
M
Miklos Szeredi 已提交
1760
	return err;
1761 1762
}

1763 1764
static int fuse_setattr(struct user_namespace *mnt_userns, struct dentry *entry,
			struct iattr *attr)
1765
{
1766
	struct inode *inode = d_inode(entry);
1767
	struct fuse_conn *fc = get_fuse_conn(inode);
1768
	struct file *file = (attr->ia_valid & ATTR_FILE) ? attr->ia_file : NULL;
1769
	int ret;
1770

M
Miklos Szeredi 已提交
1771 1772 1773
	if (fuse_is_bad(inode))
		return -EIO;

1774 1775 1776
	if (!fuse_allow_current_process(get_fuse_conn(inode)))
		return -EACCES;

1777 1778 1779
	if (attr->ia_valid & (ATTR_KILL_SUID | ATTR_KILL_SGID)) {
		attr->ia_valid &= ~(ATTR_KILL_SUID | ATTR_KILL_SGID |
				    ATTR_MODE);
1780

1781
		/*
1782 1783 1784 1785
		 * The only sane way to reliably kill suid/sgid is to do it in
		 * the userspace filesystem
		 *
		 * This should be done on write(), truncate() and chown().
1786
		 */
1787
		if (!fc->handle_killpriv && !fc->handle_killpriv_v2) {
1788 1789 1790 1791 1792 1793 1794 1795 1796
			/*
			 * ia_mode calculation may have used stale i_mode.
			 * Refresh and recalculate.
			 */
			ret = fuse_do_getattr(inode, NULL, file);
			if (ret)
				return ret;

			attr->ia_mode = inode->i_mode;
1797
			if (inode->i_mode & S_ISUID) {
1798 1799 1800
				attr->ia_valid |= ATTR_MODE;
				attr->ia_mode &= ~S_ISUID;
			}
1801
			if ((inode->i_mode & (S_ISGID | S_IXGRP)) == (S_ISGID | S_IXGRP)) {
1802 1803 1804
				attr->ia_valid |= ATTR_MODE;
				attr->ia_mode &= ~S_ISGID;
			}
1805 1806 1807 1808
		}
	}
	if (!attr->ia_valid)
		return 0;
1809

1810
	ret = fuse_do_setattr(entry, attr, file);
1811
	if (!ret) {
S
Seth Forshee 已提交
1812 1813 1814 1815 1816 1817 1818
		/*
		 * If filesystem supports acls it may have updated acl xattrs in
		 * the filesystem, so forget cached acls for the inode.
		 */
		if (fc->posix_acl)
			forget_all_cached_acls(inode);

1819 1820 1821 1822 1823
		/* Directory mode changed, may need to revalidate access */
		if (d_is_dir(entry) && (attr->ia_valid & ATTR_MODE))
			fuse_invalidate_entry_cache(entry);
	}
	return ret;
1824 1825
}

1826 1827
static int fuse_getattr(struct user_namespace *mnt_userns,
			const struct path *path, struct kstat *stat,
1828
			u32 request_mask, unsigned int flags)
1829
{
1830
	struct inode *inode = d_inode(path->dentry);
1831 1832
	struct fuse_conn *fc = get_fuse_conn(inode);

M
Miklos Szeredi 已提交
1833 1834 1835
	if (fuse_is_bad(inode))
		return -EIO;

1836 1837 1838 1839 1840 1841 1842 1843 1844 1845
	if (!fuse_allow_current_process(fc)) {
		if (!request_mask) {
			/*
			 * If user explicitly requested *nothing* then don't
			 * error out, but return st_dev only.
			 */
			stat->result_mask = 0;
			stat->dev = inode->i_sb->s_dev;
			return 0;
		}
1846
		return -EACCES;
1847
	}
1848

1849
	return fuse_update_get_attr(inode, NULL, stat, request_mask, flags);
1850 1851
}

1852
static const struct inode_operations fuse_dir_inode_operations = {
1853
	.lookup		= fuse_lookup,
1854 1855 1856 1857
	.mkdir		= fuse_mkdir,
	.symlink	= fuse_symlink,
	.unlink		= fuse_unlink,
	.rmdir		= fuse_rmdir,
1858
	.rename		= fuse_rename2,
1859 1860 1861
	.link		= fuse_link,
	.setattr	= fuse_setattr,
	.create		= fuse_create,
1862
	.atomic_open	= fuse_atomic_open,
1863
	.mknod		= fuse_mknod,
1864 1865
	.permission	= fuse_permission,
	.getattr	= fuse_getattr,
1866
	.listxattr	= fuse_listxattr,
S
Seth Forshee 已提交
1867 1868
	.get_acl	= fuse_get_acl,
	.set_acl	= fuse_set_acl,
1869 1870
};

1871
static const struct file_operations fuse_dir_operations = {
M
Miklos Szeredi 已提交
1872
	.llseek		= generic_file_llseek,
1873
	.read		= generic_read_dir,
A
Al Viro 已提交
1874
	.iterate_shared	= fuse_readdir,
1875 1876
	.open		= fuse_dir_open,
	.release	= fuse_dir_release,
1877
	.fsync		= fuse_dir_fsync,
1878 1879
	.unlocked_ioctl	= fuse_dir_ioctl,
	.compat_ioctl	= fuse_dir_compat_ioctl,
1880 1881
};

1882
static const struct inode_operations fuse_common_inode_operations = {
1883
	.setattr	= fuse_setattr,
1884 1885
	.permission	= fuse_permission,
	.getattr	= fuse_getattr,
1886
	.listxattr	= fuse_listxattr,
S
Seth Forshee 已提交
1887 1888
	.get_acl	= fuse_get_acl,
	.set_acl	= fuse_set_acl,
1889 1890
};

1891
static const struct inode_operations fuse_symlink_inode_operations = {
1892
	.setattr	= fuse_setattr,
1893
	.get_link	= fuse_get_link,
1894
	.getattr	= fuse_getattr,
1895
	.listxattr	= fuse_listxattr,
1896 1897 1898 1899 1900 1901 1902 1903 1904
};

void fuse_init_common(struct inode *inode)
{
	inode->i_op = &fuse_common_inode_operations;
}

void fuse_init_dir(struct inode *inode)
{
1905 1906
	struct fuse_inode *fi = get_fuse_inode(inode);

1907 1908
	inode->i_op = &fuse_dir_inode_operations;
	inode->i_fop = &fuse_dir_operations;
1909 1910 1911 1912 1913 1914

	spin_lock_init(&fi->rdc.lock);
	fi->rdc.cached = false;
	fi->rdc.size = 0;
	fi->rdc.pos = 0;
	fi->rdc.version = 0;
1915 1916
}

D
Dan Schatzberg 已提交
1917 1918 1919 1920 1921 1922 1923 1924 1925 1926 1927 1928 1929 1930 1931 1932
static int fuse_symlink_readpage(struct file *null, struct page *page)
{
	int err = fuse_readlink_page(page->mapping->host, page);

	if (!err)
		SetPageUptodate(page);

	unlock_page(page);

	return err;
}

static const struct address_space_operations fuse_symlink_aops = {
	.readpage	= fuse_symlink_readpage,
};

1933 1934 1935
void fuse_init_symlink(struct inode *inode)
{
	inode->i_op = &fuse_symlink_inode_operations;
D
Dan Schatzberg 已提交
1936 1937
	inode->i_data.a_ops = &fuse_symlink_aops;
	inode_nohighmem(inode);
1938
}