/*
  FUSE: Filesystem in Userspace
  Copyright (C) 2001-2008  Miklos Szeredi <miklos@szeredi.hu>

  This program can be distributed under the terms of the GNU GPL.
  See the file COPYING.
*/

#include "fuse_i.h"

#include <linux/pagemap.h>
#include <linux/file.h>
#include <linux/sched.h>
#include <linux/namei.h>
15
#include <linux/slab.h>
16

A
Al Viro 已提交
17
static bool fuse_use_readdirplus(struct inode *dir, struct dir_context *ctx)
18 19 20 21 22 23
{
	struct fuse_conn *fc = get_fuse_conn(dir);
	struct fuse_inode *fi = get_fuse_inode(dir);

	if (!fc->do_readdirplus)
		return false;
24 25
	if (!fc->readdirplus_auto)
		return true;
26 27
	if (test_and_clear_bit(FUSE_I_ADVISE_RDPLUS, &fi->state))
		return true;
A
Al Viro 已提交
28
	if (ctx->pos == 0)
29 30 31 32 33 34 35 36 37 38 39
		return true;
	return false;
}

static void fuse_advise_use_readdirplus(struct inode *dir)
{
	struct fuse_inode *fi = get_fuse_inode(dir);

	set_bit(FUSE_I_ADVISE_RDPLUS, &fi->state);
}

M
Miklos Szeredi 已提交
40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66
#if BITS_PER_LONG >= 64
static inline void fuse_dentry_settime(struct dentry *entry, u64 time)
{
	entry->d_time = time;
}

static inline u64 fuse_dentry_time(struct dentry *entry)
{
	return entry->d_time;
}
#else
/*
 * On 32 bit archs store the high 32 bits of time in d_fsdata
 */
static void fuse_dentry_settime(struct dentry *entry, u64 time)
{
	entry->d_time = time;
	entry->d_fsdata = (void *) (unsigned long) (time >> 32);
}

static u64 fuse_dentry_time(struct dentry *entry)
{
	return (u64) entry->d_time +
		((u64) (unsigned long) entry->d_fsdata << 32);
}
#endif

67 68 69 70 71 72 73 74 75
/*
 * FUSE caches dentries and attributes with separate timeout.  The
 * time in jiffies until the dentry/attributes are valid is stored in
 * dentry->d_time and fuse_inode->i_time respectively.
 */

/*
 * Calculate the time in jiffies until a dentry/attributes are valid
 */
M
Miklos Szeredi 已提交
76
static u64 time_to_jiffies(unsigned long sec, unsigned long nsec)
77
{
M
Miklos Szeredi 已提交
78 79
	if (sec || nsec) {
		struct timespec ts = {sec, nsec};
M
Miklos Szeredi 已提交
80
		return get_jiffies_64() + timespec_to_jiffies(&ts);
M
Miklos Szeredi 已提交
81
	} else
M
Miklos Szeredi 已提交
82
		return 0;
83 84
}

85 86 87 88
/*
 * Set dentry and possibly attribute timeouts from the lookup/mk*
 * replies
 */
89 90
static void fuse_change_entry_timeout(struct dentry *entry,
				      struct fuse_entry_out *o)
91
{
M
Miklos Szeredi 已提交
92 93
	fuse_dentry_settime(entry,
		time_to_jiffies(o->entry_valid, o->entry_valid_nsec));
94 95 96 97 98 99 100 101 102 103
}

/* Attribute expiry (in jiffies) taken from a getattr-style reply */
static u64 attr_timeout(struct fuse_attr_out *o)
{
	u64 expires = time_to_jiffies(o->attr_valid, o->attr_valid_nsec);

	return expires;
}

/* Attribute expiry (in jiffies) taken from an entry (lookup/mk*) reply */
static u64 entry_attr_timeout(struct fuse_entry_out *o)
{
	u64 expires = time_to_jiffies(o->attr_valid, o->attr_valid_nsec);

	return expires;
}

106 107 108 109
/*
 * Mark the attributes as stale, so that at the next call to
 * ->getattr() they will be fetched from userspace
 */
110 111
void fuse_invalidate_attr(struct inode *inode)
{
M
Miklos Szeredi 已提交
112
	get_fuse_inode(inode)->i_time = 0;
113 114
}

115 116 117 118 119 120 121 122 123 124
/*
 * Mark the attributes as stale due to an atime change.  Avoid the
 * invalidate if atime is not used: nothing is done when IS_RDONLY()
 * holds for the inode.
 */
void fuse_invalidate_atime(struct inode *inode)
{
	if (IS_RDONLY(inode))
		return;

	fuse_invalidate_attr(inode);
}

125 126 127 128 129 130 131 132
/*
 * Just mark the entry as stale, so that a next attempt to look it up
 * will result in a new lookup call to userspace
 *
 * This is called when a dentry is about to become negative and the
 * timeout is unknown (unlink, rmdir, rename and in some cases
 * lookup)
 */
M
Miklos Szeredi 已提交
133
void fuse_invalidate_entry_cache(struct dentry *entry)
134
{
M
Miklos Szeredi 已提交
135
	fuse_dentry_settime(entry, 0);
136 137
}

138 139 140 141
/*
 * Like fuse_invalidate_entry_cache(), but first ask the dcache to
 * invalidate the dentry (try to remove it from the hash).
 */
static void fuse_invalidate_entry(struct dentry *entry)
{
	/* Unhash attempt first, then zero the timeout */
	d_invalidate(entry);
	fuse_invalidate_entry_cache(entry);
}

148 149
/*
 * Fill in @req as a FUSE_LOOKUP of @name under directory @nodeid.
 *
 * @outarg is zeroed and registered as the single reply argument.  For
 * protocol minor versions below 9 the reply size is the compat entry
 * size, otherwise the full struct fuse_entry_out.
 */
static void fuse_lookup_init(struct fuse_conn *fc, struct fuse_req *req,
			     u64 nodeid, struct qstr *name,
			     struct fuse_entry_out *outarg)
{
	memset(outarg, 0, sizeof(*outarg));

	/* Request: header plus the NUL-terminated name */
	req->in.h.opcode = FUSE_LOOKUP;
	req->in.h.nodeid = nodeid;
	req->in.numargs = 1;
	req->in.args[0].size = name->len + 1;
	req->in.args[0].value = name->name;

	/* Reply: one entry_out, sized according to protocol version */
	req->out.numargs = 1;
	req->out.args[0].size = fc->minor < 9 ? FUSE_COMPAT_ENTRY_OUT_SIZE :
						sizeof(*outarg);
	req->out.args[0].value = outarg;
}

166
u64 fuse_get_attr_version(struct fuse_conn *fc)
167 168 169 170 171 172 173 174 175 176 177 178 179 180
{
	u64 curr_version;

	/*
	 * The spin lock isn't actually needed on 64bit archs, but we
	 * don't yet care too much about such optimizations.
	 */
	spin_lock(&fc->lock);
	curr_version = fc->attr_version;
	spin_unlock(&fc->lock);

	return curr_version;
}

181 182 183 184 185 186 187 188 189
/*
 * Check whether the dentry is still valid
 *
 * If the entry validity timeout has expired and the dentry is
 * positive, try to redo the lookup.  If the lookup results in a
 * different inode, then let the VFS invalidate the dentry and redo
 * the lookup once more.  If the lookup results in the same inode,
 * then refresh the attributes, timeouts and mark the dentry valid.
 */
190
static int fuse_dentry_revalidate(struct dentry *entry, unsigned int flags)
191
{
192
	struct inode *inode;
193 194
	struct dentry *parent;
	struct fuse_conn *fc;
M
Miklos Szeredi 已提交
195
	struct fuse_inode *fi;
196
	int ret;
197

198
	inode = ACCESS_ONCE(entry->d_inode);
199
	if (inode && is_bad_inode(inode))
200
		goto invalid;
M
Miklos Szeredi 已提交
201
	else if (fuse_dentry_time(entry) < get_jiffies_64()) {
202 203
		int err;
		struct fuse_entry_out outarg;
204
		struct fuse_req *req;
205
		struct fuse_forget_link *forget;
206
		u64 attr_version;
207

208
		/* For negative dentries, always do a fresh lookup */
209
		if (!inode)
210
			goto invalid;
211

212
		ret = -ECHILD;
213
		if (flags & LOOKUP_RCU)
214
			goto out;
215

216
		fc = get_fuse_conn(inode);
M
Maxim Patlasov 已提交
217
		req = fuse_get_req_nopages(fc);
218
		ret = PTR_ERR(req);
219
		if (IS_ERR(req))
220
			goto out;
221

222 223
		forget = fuse_alloc_forget();
		if (!forget) {
M
Miklos Szeredi 已提交
224
			fuse_put_request(fc, req);
225 226
			ret = -ENOMEM;
			goto out;
M
Miklos Szeredi 已提交
227 228
		}

229
		attr_version = fuse_get_attr_version(fc);
230

231
		parent = dget_parent(entry);
232 233
		fuse_lookup_init(fc, req, get_node_id(parent->d_inode),
				 &entry->d_name, &outarg);
234
		fuse_request_send(fc, req);
235
		dput(parent);
236
		err = req->out.h.error;
M
Miklos Szeredi 已提交
237
		fuse_put_request(fc, req);
238 239 240
		/* Zero nodeid is same as -ENOENT */
		if (!err && !outarg.nodeid)
			err = -ENOENT;
241
		if (!err) {
M
Miklos Szeredi 已提交
242
			fi = get_fuse_inode(inode);
243
			if (outarg.nodeid != get_node_id(inode)) {
244
				fuse_queue_forget(fc, forget, outarg.nodeid, 1);
245
				goto invalid;
246
			}
247
			spin_lock(&fc->lock);
M
Miklos Szeredi 已提交
248
			fi->nlookup++;
249
			spin_unlock(&fc->lock);
250
		}
251
		kfree(forget);
252
		if (err || (outarg.attr.mode ^ inode->i_mode) & S_IFMT)
253
			goto invalid;
254

255 256 257 258
		fuse_change_attributes(inode, &outarg.attr,
				       entry_attr_timeout(&outarg),
				       attr_version);
		fuse_change_entry_timeout(entry, &outarg);
259
	} else if (inode) {
M
Miklos Szeredi 已提交
260 261 262 263 264
		fi = get_fuse_inode(inode);
		if (flags & LOOKUP_RCU) {
			if (test_bit(FUSE_I_INIT_RDPLUS, &fi->state))
				return -ECHILD;
		} else if (test_and_clear_bit(FUSE_I_INIT_RDPLUS, &fi->state)) {
265 266 267 268
			parent = dget_parent(entry);
			fuse_advise_use_readdirplus(parent->d_inode);
			dput(parent);
		}
269
	}
270 271 272 273 274 275
	ret = 1;
out:
	return ret;

invalid:
	ret = 0;
276 277

	if (!(flags & LOOKUP_RCU) && check_submounts_and_drop(entry) != 0)
278
		ret = 1;
279
	goto out;
280 281
}

282
/*
 * A node ID of zero or FUSE_ROOT_ID is rejected (non-zero return).
 */
static int invalid_nodeid(u64 nodeid)
{
	if (!nodeid)
		return 1;

	return nodeid == FUSE_ROOT_ID;
}

A
Al Viro 已提交
287
/* Dentry operations table for FUSE; only ->d_revalidate is set here. */
const struct dentry_operations fuse_dentry_operations = {
	.d_revalidate	= fuse_dentry_revalidate,
};

291
int fuse_valid_type(int m)
292 293 294 295 296
{
	return S_ISREG(m) || S_ISDIR(m) || S_ISLNK(m) || S_ISCHR(m) ||
		S_ISBLK(m) || S_ISFIFO(m) || S_ISSOCK(m);
}

297 298
/*
 * Look up @name under directory node @nodeid and, on success, obtain
 * the corresponding inode.
 *
 * @outarg receives the raw reply.  *@inode is set to NULL first and is
 * only replaced when an inode was obtained.
 *
 * Returns 0 on success.  A reply with a zero nodeid and no error also
 * returns 0 with *@inode left NULL (a negative entry with a valid
 * timeout).  Returns -ENAMETOOLONG if the name exceeds FUSE_NAME_MAX,
 * -EIO if the reply carries an unsupported file type, -ENOMEM on
 * allocation failure, or the error from the request.
 */
int fuse_lookup_name(struct super_block *sb, u64 nodeid, struct qstr *name,
		     struct fuse_entry_out *outarg, struct inode **inode)
{
	struct fuse_conn *fc = get_fuse_conn_super(sb);
	struct fuse_req *req;
	struct fuse_forget_link *forget;
	u64 attr_version;
	int err;

	*inode = NULL;
	err = -ENAMETOOLONG;
	if (name->len > FUSE_NAME_MAX)
		goto out;

	req = fuse_get_req_nopages(fc);
	err = PTR_ERR(req);
	if (IS_ERR(req))
		goto out;

	forget = fuse_alloc_forget();
	err = -ENOMEM;
	if (!forget) {
		fuse_put_request(fc, req);
		goto out;
	}

	/* Sampled before the request is sent */
	attr_version = fuse_get_attr_version(fc);

	fuse_lookup_init(fc, req, nodeid, name, outarg);
	fuse_request_send(fc, req);
	err = req->out.h.error;
	fuse_put_request(fc, req);
	/* Zero nodeid is same as -ENOENT, but with valid timeout */
	if (err || !outarg->nodeid)
		goto out_put_forget;

	/* nodeid is known to be non-zero from here on */
	err = -EIO;
	if (!fuse_valid_type(outarg->attr.mode))
		goto out_put_forget;

	*inode = fuse_iget(sb, outarg->nodeid, outarg->generation,
			   &outarg->attr, entry_attr_timeout(outarg),
			   attr_version);
	err = -ENOMEM;
	if (!*inode) {
		/* The forget link is handed over, so it is not freed here */
		fuse_queue_forget(fc, forget, outarg->nodeid, 1);
		goto out;
	}
	err = 0;

 out_put_forget:
	kfree(forget);
 out:
	return err;
}

static struct dentry *fuse_lookup(struct inode *dir, struct dentry *entry,
A
Al Viro 已提交
356
				  unsigned int flags)
357 358 359 360 361 362 363 364 365 366 367 368 369 370 371 372 373 374 375
{
	int err;
	struct fuse_entry_out outarg;
	struct inode *inode;
	struct dentry *newent;
	bool outarg_valid = true;

	err = fuse_lookup_name(dir->i_sb, get_node_id(dir), &entry->d_name,
			       &outarg, &inode);
	if (err == -ENOENT) {
		outarg_valid = false;
		err = 0;
	}
	if (err)
		goto out_err;

	err = -EIO;
	if (inode && get_node_id(inode) == FUSE_ROOT_ID)
		goto out_iput;
376

377
	newent = d_materialise_unique(entry, inode);
378 379 380
	err = PTR_ERR(newent);
	if (IS_ERR(newent))
		goto out_err;
381

382
	entry = newent ? newent : entry;
383
	if (outarg_valid)
384
		fuse_change_entry_timeout(entry, &outarg);
385 386
	else
		fuse_invalidate_entry_cache(entry);
387

388
	fuse_advise_use_readdirplus(dir);
389
	return newent;
390 391 392 393 394

 out_iput:
	iput(inode);
 out_err:
	return ERR_PTR(err);
395 396
}

397 398 399 400 401 402
/*
 * Atomic create+open operation
 *
 * If the filesystem doesn't support this, then fall back to separate
 * 'mknod' + 'open' requests.
 */
A
Al Viro 已提交
403
static int fuse_create_open(struct inode *dir, struct dentry *entry,
A
Al Viro 已提交
404
			    struct file *file, unsigned flags,
A
Al Viro 已提交
405
			    umode_t mode, int *opened)
M
Miklos Szeredi 已提交
406 407 408 409 410
{
	int err;
	struct inode *inode;
	struct fuse_conn *fc = get_fuse_conn(dir);
	struct fuse_req *req;
411
	struct fuse_forget_link *forget;
412
	struct fuse_create_in inarg;
M
Miklos Szeredi 已提交
413 414 415 416
	struct fuse_open_out outopen;
	struct fuse_entry_out outentry;
	struct fuse_file *ff;

417 418 419
	/* Userspace expects S_IFREG in create mode */
	BUG_ON((mode & S_IFMT) != S_IFREG);

420
	forget = fuse_alloc_forget();
421
	err = -ENOMEM;
422
	if (!forget)
423
		goto out_err;
424

M
Maxim Patlasov 已提交
425
	req = fuse_get_req_nopages(fc);
426
	err = PTR_ERR(req);
427
	if (IS_ERR(req))
428
		goto out_put_forget_req;
M
Miklos Szeredi 已提交
429

430
	err = -ENOMEM;
T
Tejun Heo 已提交
431
	ff = fuse_file_alloc(fc);
M
Miklos Szeredi 已提交
432 433 434
	if (!ff)
		goto out_put_request;

435 436 437
	if (!fc->dont_mask)
		mode &= ~current_umask();

M
Miklos Szeredi 已提交
438 439
	flags &= ~O_NOCTTY;
	memset(&inarg, 0, sizeof(inarg));
440
	memset(&outentry, 0, sizeof(outentry));
M
Miklos Szeredi 已提交
441 442
	inarg.flags = flags;
	inarg.mode = mode;
443
	inarg.umask = current_umask();
M
Miklos Szeredi 已提交
444 445 446
	req->in.h.opcode = FUSE_CREATE;
	req->in.h.nodeid = get_node_id(dir);
	req->in.numargs = 2;
447 448
	req->in.args[0].size = fc->minor < 12 ? sizeof(struct fuse_open_in) :
						sizeof(inarg);
M
Miklos Szeredi 已提交
449 450 451 452
	req->in.args[0].value = &inarg;
	req->in.args[1].size = entry->d_name.len + 1;
	req->in.args[1].value = entry->d_name.name;
	req->out.numargs = 2;
453 454 455 456
	if (fc->minor < 9)
		req->out.args[0].size = FUSE_COMPAT_ENTRY_OUT_SIZE;
	else
		req->out.args[0].size = sizeof(outentry);
M
Miklos Szeredi 已提交
457 458 459
	req->out.args[0].value = &outentry;
	req->out.args[1].size = sizeof(outopen);
	req->out.args[1].value = &outopen;
460
	fuse_request_send(fc, req);
M
Miklos Szeredi 已提交
461
	err = req->out.h.error;
462
	if (err)
M
Miklos Szeredi 已提交
463 464 465
		goto out_free_ff;

	err = -EIO;
466
	if (!S_ISREG(outentry.attr.mode) || invalid_nodeid(outentry.nodeid))
M
Miklos Szeredi 已提交
467 468
		goto out_free_ff;

469
	fuse_put_request(fc, req);
470 471 472
	ff->fh = outopen.fh;
	ff->nodeid = outentry.nodeid;
	ff->open_flags = outopen.open_flags;
M
Miklos Szeredi 已提交
473
	inode = fuse_iget(dir->i_sb, outentry.nodeid, outentry.generation,
474
			  &outentry.attr, entry_attr_timeout(&outentry), 0);
M
Miklos Szeredi 已提交
475 476
	if (!inode) {
		flags &= ~(O_CREAT | O_EXCL | O_TRUNC);
477
		fuse_sync_release(ff, flags);
478
		fuse_queue_forget(fc, forget, outentry.nodeid, 1);
479 480
		err = -ENOMEM;
		goto out_err;
M
Miklos Szeredi 已提交
481
	}
482
	kfree(forget);
M
Miklos Szeredi 已提交
483
	d_instantiate(entry, inode);
484
	fuse_change_entry_timeout(entry, &outentry);
485
	fuse_invalidate_attr(dir);
A
Al Viro 已提交
486 487
	err = finish_open(file, entry, generic_file_open, opened);
	if (err) {
488
		fuse_sync_release(ff, flags);
489 490 491
	} else {
		file->private_data = fuse_file_get(ff);
		fuse_finish_open(inode, file);
M
Miklos Szeredi 已提交
492
	}
A
Al Viro 已提交
493
	return err;
M
Miklos Szeredi 已提交
494

495
out_free_ff:
M
Miklos Szeredi 已提交
496
	fuse_file_free(ff);
497
out_put_request:
M
Miklos Szeredi 已提交
498
	fuse_put_request(fc, req);
499
out_put_forget_req:
500
	kfree(forget);
501
out_err:
A
Al Viro 已提交
502
	return err;
503 504 505
}

static int fuse_mknod(struct inode *, struct dentry *, umode_t, dev_t);
A
Al Viro 已提交
506
static int fuse_atomic_open(struct inode *dir, struct dentry *entry,
A
Al Viro 已提交
507
			    struct file *file, unsigned flags,
A
Al Viro 已提交
508
			    umode_t mode, int *opened)
509 510 511 512 513 514
{
	int err;
	struct fuse_conn *fc = get_fuse_conn(dir);
	struct dentry *res = NULL;

	if (d_unhashed(entry)) {
A
Al Viro 已提交
515
		res = fuse_lookup(dir, entry, 0);
516
		if (IS_ERR(res))
A
Al Viro 已提交
517
			return PTR_ERR(res);
518 519 520 521 522 523 524 525 526

		if (res)
			entry = res;
	}

	if (!(flags & O_CREAT) || entry->d_inode)
		goto no_open;

	/* Only creates */
527
	*opened |= FILE_CREATED;
528 529 530 531

	if (fc->no_create)
		goto mknod;

A
Al Viro 已提交
532
	err = fuse_create_open(dir, entry, file, flags, mode, opened);
A
Al Viro 已提交
533
	if (err == -ENOSYS) {
534 535 536 537 538
		fc->no_create = 1;
		goto mknod;
	}
out_dput:
	dput(res);
A
Al Viro 已提交
539
	return err;
540 541 542

mknod:
	err = fuse_mknod(dir, entry, mode, 0);
A
Al Viro 已提交
543
	if (err)
544 545
		goto out_dput;
no_open:
A
Al Viro 已提交
546
	return finish_no_open(file, res);
M
Miklos Szeredi 已提交
547 548
}

549 550 551
/*
 * Code shared between mknod, mkdir, symlink and link
 */
552 553
static int create_new_entry(struct fuse_conn *fc, struct fuse_req *req,
			    struct inode *dir, struct dentry *entry,
A
Al Viro 已提交
554
			    umode_t mode)
555 556 557 558
{
	struct fuse_entry_out outarg;
	struct inode *inode;
	int err;
559
	struct fuse_forget_link *forget;
M
Miklos Szeredi 已提交
560

561 562
	forget = fuse_alloc_forget();
	if (!forget) {
M
Miklos Szeredi 已提交
563
		fuse_put_request(fc, req);
564
		return -ENOMEM;
M
Miklos Szeredi 已提交
565
	}
566

567
	memset(&outarg, 0, sizeof(outarg));
568 569
	req->in.h.nodeid = get_node_id(dir);
	req->out.numargs = 1;
570 571 572 573
	if (fc->minor < 9)
		req->out.args[0].size = FUSE_COMPAT_ENTRY_OUT_SIZE;
	else
		req->out.args[0].size = sizeof(outarg);
574
	req->out.args[0].value = &outarg;
575
	fuse_request_send(fc, req);
576
	err = req->out.h.error;
M
Miklos Szeredi 已提交
577 578 579 580
	fuse_put_request(fc, req);
	if (err)
		goto out_put_forget_req;

581 582
	err = -EIO;
	if (invalid_nodeid(outarg.nodeid))
M
Miklos Szeredi 已提交
583
		goto out_put_forget_req;
584 585

	if ((outarg.attr.mode ^ mode) & S_IFMT)
M
Miklos Szeredi 已提交
586
		goto out_put_forget_req;
587

588
	inode = fuse_iget(dir->i_sb, outarg.nodeid, outarg.generation,
589
			  &outarg.attr, entry_attr_timeout(&outarg), 0);
590
	if (!inode) {
591
		fuse_queue_forget(fc, forget, outarg.nodeid, 1);
592 593
		return -ENOMEM;
	}
594
	kfree(forget);
595

596 597 598
	err = d_instantiate_no_diralias(entry, inode);
	if (err)
		return err;
599

600
	fuse_change_entry_timeout(entry, &outarg);
601 602
	fuse_invalidate_attr(dir);
	return 0;
603

M
Miklos Szeredi 已提交
604
 out_put_forget_req:
605
	kfree(forget);
606
	return err;
607 608
}

A
Al Viro 已提交
609
static int fuse_mknod(struct inode *dir, struct dentry *entry, umode_t mode,
610 611 612 613
		      dev_t rdev)
{
	struct fuse_mknod_in inarg;
	struct fuse_conn *fc = get_fuse_conn(dir);
M
Maxim Patlasov 已提交
614
	struct fuse_req *req = fuse_get_req_nopages(fc);
615 616
	if (IS_ERR(req))
		return PTR_ERR(req);
617

618 619 620
	if (!fc->dont_mask)
		mode &= ~current_umask();

621 622 623
	memset(&inarg, 0, sizeof(inarg));
	inarg.mode = mode;
	inarg.rdev = new_encode_dev(rdev);
624
	inarg.umask = current_umask();
625 626
	req->in.h.opcode = FUSE_MKNOD;
	req->in.numargs = 2;
627 628
	req->in.args[0].size = fc->minor < 12 ? FUSE_COMPAT_MKNOD_IN_SIZE :
						sizeof(inarg);
629 630 631 632 633 634
	req->in.args[0].value = &inarg;
	req->in.args[1].size = entry->d_name.len + 1;
	req->in.args[1].value = entry->d_name.name;
	return create_new_entry(fc, req, dir, entry, mode);
}

A
Al Viro 已提交
635
static int fuse_create(struct inode *dir, struct dentry *entry, umode_t mode,
A
Al Viro 已提交
636
		       bool excl)
637 638 639 640
{
	return fuse_mknod(dir, entry, mode, 0);
}

641
/*
 * ->mkdir: build a FUSE_MKDIR request for @entry in @dir and hand it
 * to create_new_entry(), which expects a directory in the reply.
 *
 * The umask is applied to @mode unless the connection has dont_mask
 * set; the current umask is also passed along in the request.
 */
static int fuse_mkdir(struct inode *dir, struct dentry *entry, umode_t mode)
{
	struct fuse_conn *fc = get_fuse_conn(dir);
	struct fuse_mkdir_in inarg;
	struct fuse_req *req;

	req = fuse_get_req_nopages(fc);
	if (IS_ERR(req))
		return PTR_ERR(req);

	if (!fc->dont_mask)
		mode &= ~current_umask();

	memset(&inarg, 0, sizeof(inarg));
	inarg.mode = mode;
	inarg.umask = current_umask();

	req->in.h.opcode = FUSE_MKDIR;
	req->in.numargs = 2;
	req->in.args[0].size = sizeof(inarg);
	req->in.args[0].value = &inarg;
	req->in.args[1].size = entry->d_name.len + 1;
	req->in.args[1].value = entry->d_name.name;

	return create_new_entry(fc, req, dir, entry, S_IFDIR);
}

static int fuse_symlink(struct inode *dir, struct dentry *entry,
			const char *link)
{
	struct fuse_conn *fc = get_fuse_conn(dir);
	unsigned len = strlen(link) + 1;
M
Maxim Patlasov 已提交
669
	struct fuse_req *req = fuse_get_req_nopages(fc);
670 671
	if (IS_ERR(req))
		return PTR_ERR(req);
672 673 674 675 676 677 678 679 680 681

	req->in.h.opcode = FUSE_SYMLINK;
	req->in.numargs = 2;
	req->in.args[0].size = entry->d_name.len + 1;
	req->in.args[0].value = entry->d_name.name;
	req->in.args[1].size = len;
	req->in.args[1].value = link;
	return create_new_entry(fc, req, dir, entry, S_IFLNK);
}

M
Maxim Patlasov 已提交
682 683 684 685 686 687 688 689
/*
 * Set the inode's ctime to the current filesystem time and mark the
 * inode dirty, unless IS_NOCMTIME() holds for it.
 */
static inline void fuse_update_ctime(struct inode *inode)
{
	if (IS_NOCMTIME(inode))
		return;

	inode->i_ctime = current_fs_time(inode->i_sb);
	mark_inode_dirty_sync(inode);
}

690 691 692 693
static int fuse_unlink(struct inode *dir, struct dentry *entry)
{
	int err;
	struct fuse_conn *fc = get_fuse_conn(dir);
M
Maxim Patlasov 已提交
694
	struct fuse_req *req = fuse_get_req_nopages(fc);
695 696
	if (IS_ERR(req))
		return PTR_ERR(req);
697 698 699 700 701 702

	req->in.h.opcode = FUSE_UNLINK;
	req->in.h.nodeid = get_node_id(dir);
	req->in.numargs = 1;
	req->in.args[0].size = entry->d_name.len + 1;
	req->in.args[0].value = entry->d_name.name;
703
	fuse_request_send(fc, req);
704 705 706 707
	err = req->out.h.error;
	fuse_put_request(fc, req);
	if (!err) {
		struct inode *inode = entry->d_inode;
M
Miklos Szeredi 已提交
708
		struct fuse_inode *fi = get_fuse_inode(inode);
709

M
Miklos Szeredi 已提交
710 711
		spin_lock(&fc->lock);
		fi->attr_version = ++fc->attr_version;
712 713 714 715 716 717 718 719
		/*
		 * If i_nlink == 0 then unlink doesn't make sense, yet this can
		 * happen if userspace filesystem is careless.  It would be
		 * difficult to enforce correct nlink usage so just ignore this
		 * condition here
		 */
		if (inode->i_nlink > 0)
			drop_nlink(inode);
M
Miklos Szeredi 已提交
720
		spin_unlock(&fc->lock);
721 722
		fuse_invalidate_attr(inode);
		fuse_invalidate_attr(dir);
723
		fuse_invalidate_entry_cache(entry);
M
Maxim Patlasov 已提交
724
		fuse_update_ctime(inode);
725 726 727 728 729 730 731 732 733
	} else if (err == -EINTR)
		fuse_invalidate_entry(entry);
	return err;
}

static int fuse_rmdir(struct inode *dir, struct dentry *entry)
{
	int err;
	struct fuse_conn *fc = get_fuse_conn(dir);
M
Maxim Patlasov 已提交
734
	struct fuse_req *req = fuse_get_req_nopages(fc);
735 736
	if (IS_ERR(req))
		return PTR_ERR(req);
737 738 739 740 741 742

	req->in.h.opcode = FUSE_RMDIR;
	req->in.h.nodeid = get_node_id(dir);
	req->in.numargs = 1;
	req->in.args[0].size = entry->d_name.len + 1;
	req->in.args[0].value = entry->d_name.name;
743
	fuse_request_send(fc, req);
744 745 746
	err = req->out.h.error;
	fuse_put_request(fc, req);
	if (!err) {
747
		clear_nlink(entry->d_inode);
748
		fuse_invalidate_attr(dir);
749
		fuse_invalidate_entry_cache(entry);
750 751 752 753 754 755 756 757 758 759 760
	} else if (err == -EINTR)
		fuse_invalidate_entry(entry);
	return err;
}

static int fuse_rename(struct inode *olddir, struct dentry *oldent,
		       struct inode *newdir, struct dentry *newent)
{
	int err;
	struct fuse_rename_in inarg;
	struct fuse_conn *fc = get_fuse_conn(olddir);
M
Maxim Patlasov 已提交
761
	struct fuse_req *req = fuse_get_req_nopages(fc);
762

763 764
	if (IS_ERR(req))
		return PTR_ERR(req);
765 766 767 768 769 770 771 772 773 774 775 776

	memset(&inarg, 0, sizeof(inarg));
	inarg.newdir = get_node_id(newdir);
	req->in.h.opcode = FUSE_RENAME;
	req->in.h.nodeid = get_node_id(olddir);
	req->in.numargs = 3;
	req->in.args[0].size = sizeof(inarg);
	req->in.args[0].value = &inarg;
	req->in.args[1].size = oldent->d_name.len + 1;
	req->in.args[1].value = oldent->d_name.name;
	req->in.args[2].size = newent->d_name.len + 1;
	req->in.args[2].value = newent->d_name.name;
777
	fuse_request_send(fc, req);
778 779 780
	err = req->out.h.error;
	fuse_put_request(fc, req);
	if (!err) {
781 782
		/* ctime changes */
		fuse_invalidate_attr(oldent->d_inode);
M
Maxim Patlasov 已提交
783
		fuse_update_ctime(oldent->d_inode);
784

785 786 787
		fuse_invalidate_attr(olddir);
		if (olddir != newdir)
			fuse_invalidate_attr(newdir);
788 789

		/* newent will end up negative */
M
Miklos Szeredi 已提交
790 791
		if (newent->d_inode) {
			fuse_invalidate_attr(newent->d_inode);
792
			fuse_invalidate_entry_cache(newent);
M
Maxim Patlasov 已提交
793
			fuse_update_ctime(newent->d_inode);
M
Miklos Szeredi 已提交
794
		}
795 796 797 798 799 800 801 802 803 804 805 806 807 808 809 810 811 812 813 814 815
	} else if (err == -EINTR) {
		/* If request was interrupted, DEITY only knows if the
		   rename actually took place.  If the invalidation
		   fails (e.g. some process has CWD under the renamed
		   directory), then there can be inconsistency between
		   the dcache and the real filesystem.  Tough luck. */
		fuse_invalidate_entry(oldent);
		if (newent->d_inode)
			fuse_invalidate_entry(newent);
	}

	return err;
}

static int fuse_link(struct dentry *entry, struct inode *newdir,
		     struct dentry *newent)
{
	int err;
	struct fuse_link_in inarg;
	struct inode *inode = entry->d_inode;
	struct fuse_conn *fc = get_fuse_conn(inode);
M
Maxim Patlasov 已提交
816
	struct fuse_req *req = fuse_get_req_nopages(fc);
817 818
	if (IS_ERR(req))
		return PTR_ERR(req);
819 820 821 822 823 824 825 826 827 828 829 830 831 832 833 834

	memset(&inarg, 0, sizeof(inarg));
	inarg.oldnodeid = get_node_id(inode);
	req->in.h.opcode = FUSE_LINK;
	req->in.numargs = 2;
	req->in.args[0].size = sizeof(inarg);
	req->in.args[0].value = &inarg;
	req->in.args[1].size = newent->d_name.len + 1;
	req->in.args[1].value = newent->d_name.name;
	err = create_new_entry(fc, req, newdir, newent, inode->i_mode);
	/* Contrary to "normal" filesystems it can happen that link
	   makes two "logical" inodes point to the same "physical"
	   inode.  We invalidate the attributes of the old one, so it
	   will reflect changes in the backing inode (link count,
	   etc.)
	*/
M
Miklos Szeredi 已提交
835 836 837 838 839 840 841
	if (!err) {
		struct fuse_inode *fi = get_fuse_inode(inode);

		spin_lock(&fc->lock);
		fi->attr_version = ++fc->attr_version;
		inc_nlink(inode);
		spin_unlock(&fc->lock);
842
		fuse_invalidate_attr(inode);
M
Maxim Patlasov 已提交
843
		fuse_update_ctime(inode);
M
Miklos Szeredi 已提交
844 845 846
	} else if (err == -EINTR) {
		fuse_invalidate_attr(inode);
	}
847 848 849
	return err;
}

850 851 852
static void fuse_fillattr(struct inode *inode, struct fuse_attr *attr,
			  struct kstat *stat)
{
M
Miklos Szeredi 已提交
853
	unsigned int blkbits;
P
Pavel Emelyanov 已提交
854 855 856
	struct fuse_conn *fc = get_fuse_conn(inode);

	/* see the comment in fuse_change_attributes() */
M
Maxim Patlasov 已提交
857
	if (fc->writeback_cache && S_ISREG(inode->i_mode)) {
P
Pavel Emelyanov 已提交
858
		attr->size = i_size_read(inode);
M
Maxim Patlasov 已提交
859 860
		attr->mtime = inode->i_mtime.tv_sec;
		attr->mtimensec = inode->i_mtime.tv_nsec;
M
Maxim Patlasov 已提交
861 862
		attr->ctime = inode->i_ctime.tv_sec;
		attr->ctimensec = inode->i_ctime.tv_nsec;
M
Maxim Patlasov 已提交
863
	}
M
Miklos Szeredi 已提交
864

865 866 867 868
	stat->dev = inode->i_sb->s_dev;
	stat->ino = attr->ino;
	stat->mode = (inode->i_mode & S_IFMT) | (attr->mode & 07777);
	stat->nlink = attr->nlink;
869 870
	stat->uid = make_kuid(&init_user_ns, attr->uid);
	stat->gid = make_kgid(&init_user_ns, attr->gid);
871 872 873 874 875 876 877 878 879
	stat->rdev = inode->i_rdev;
	stat->atime.tv_sec = attr->atime;
	stat->atime.tv_nsec = attr->atimensec;
	stat->mtime.tv_sec = attr->mtime;
	stat->mtime.tv_nsec = attr->mtimensec;
	stat->ctime.tv_sec = attr->ctime;
	stat->ctime.tv_nsec = attr->ctimensec;
	stat->size = attr->size;
	stat->blocks = attr->blocks;
M
Miklos Szeredi 已提交
880 881 882 883 884 885 886

	if (attr->blksize != 0)
		blkbits = ilog2(attr->blksize);
	else
		blkbits = inode->i_sb->s_blocksize_bits;

	stat->blksize = 1 << blkbits;
887 888
}

889 890
static int fuse_do_getattr(struct inode *inode, struct kstat *stat,
			   struct file *file)
891 892
{
	int err;
893 894
	struct fuse_getattr_in inarg;
	struct fuse_attr_out outarg;
895
	struct fuse_conn *fc = get_fuse_conn(inode);
896 897 898
	struct fuse_req *req;
	u64 attr_version;

M
Maxim Patlasov 已提交
899
	req = fuse_get_req_nopages(fc);
900 901
	if (IS_ERR(req))
		return PTR_ERR(req);
902

903
	attr_version = fuse_get_attr_version(fc);
904

905
	memset(&inarg, 0, sizeof(inarg));
906
	memset(&outarg, 0, sizeof(outarg));
907 908 909 910 911 912 913
	/* Directories have separate file-handle space */
	if (file && S_ISREG(inode->i_mode)) {
		struct fuse_file *ff = file->private_data;

		inarg.getattr_flags |= FUSE_GETATTR_FH;
		inarg.fh = ff->fh;
	}
914 915
	req->in.h.opcode = FUSE_GETATTR;
	req->in.h.nodeid = get_node_id(inode);
916 917 918
	req->in.numargs = 1;
	req->in.args[0].size = sizeof(inarg);
	req->in.args[0].value = &inarg;
919
	req->out.numargs = 1;
920 921 922 923
	if (fc->minor < 9)
		req->out.args[0].size = FUSE_COMPAT_ATTR_OUT_SIZE;
	else
		req->out.args[0].size = sizeof(outarg);
924
	req->out.args[0].value = &outarg;
925
	fuse_request_send(fc, req);
926 927 928
	err = req->out.h.error;
	fuse_put_request(fc, req);
	if (!err) {
929
		if ((inode->i_mode ^ outarg.attr.mode) & S_IFMT) {
930 931 932
			make_bad_inode(inode);
			err = -EIO;
		} else {
933 934
			fuse_change_attributes(inode, &outarg.attr,
					       attr_timeout(&outarg),
935 936
					       attr_version);
			if (stat)
937
				fuse_fillattr(inode, &outarg.attr, stat);
938 939 940 941 942
		}
	}
	return err;
}

M
Miklos Szeredi 已提交
943 944 945 946 947 948 949 950 951 952 953 954 955 956 957 958
/*
 * Make sure the inode attributes are current and optionally fill
 * @stat.
 *
 * If the attribute timeout has passed, the attributes are fetched via
 * fuse_do_getattr().  Otherwise @stat (if given) is filled from the
 * inode, with mode and ino taken from the saved orig_i_mode/orig_ino.
 * If @refreshed is non-NULL it is set to whether a fetch was issued.
 */
int fuse_update_attributes(struct inode *inode, struct kstat *stat,
			   struct file *file, bool *refreshed)
{
	struct fuse_inode *fi = get_fuse_inode(inode);
	bool expired = fi->i_time < get_jiffies_64();
	int err = 0;

	if (expired) {
		err = fuse_do_getattr(inode, stat, file);
	} else if (stat) {
		generic_fillattr(inode, stat);
		stat->mode = fi->orig_i_mode;
		stat->ino = fi->orig_ino;
	}

	if (refreshed)
		*refreshed = expired;

	return err;
}

J
John Muir 已提交
969
/*
 * Helper for fuse_reverse_inval_entry(): prepare the positive dentry
 * @entry for deletion.  Called with the child inode's i_mutex held.
 *
 * Returns 0 if the entry may be deleted, -ENOENT if its node ID is not
 * @child_nodeid, -EBUSY if it is a mountpoint, or -ENOTEMPTY if it is
 * a directory that is still not empty after shrinking its dcache
 * subtree.
 */
static int fuse_reverse_inval_child(struct dentry *entry, u64 child_nodeid)
{
	if (get_node_id(entry->d_inode) != child_nodeid)
		return -ENOENT;

	if (d_mountpoint(entry))
		return -EBUSY;

	if (S_ISDIR(entry->d_inode->i_mode)) {
		shrink_dcache_parent(entry);
		if (!simple_empty(entry))
			return -ENOTEMPTY;
		entry->d_inode->i_flags |= S_DEAD;
	}

	dont_mount(entry);
	clear_nlink(entry->d_inode);
	return 0;
}

/*
 * Invalidate the dentry called @name in the directory with node ID
 * @parent_nodeid.
 *
 * The parent's attributes and the dentry are invalidated.  If
 * @child_nodeid is non-zero and the dentry is positive, the dentry is
 * additionally deleted, provided it refers to @child_nodeid, is not a
 * mountpoint and (for directories) is empty.
 *
 * Returns 0 on success, -ENOENT if the parent inode, an alias of it or
 * the named dentry is not found, -ENOTDIR if the parent is not a
 * directory, or the error from the child checks.
 */
int fuse_reverse_inval_entry(struct super_block *sb, u64 parent_nodeid,
			     u64 child_nodeid, struct qstr *name)
{
	struct inode *parent;
	struct dentry *entry;
	struct dentry *dir;
	int err;

	parent = ilookup5(sb, parent_nodeid, fuse_inode_eq, &parent_nodeid);
	if (!parent)
		return -ENOENT;

	mutex_lock(&parent->i_mutex);

	err = -ENOTDIR;
	if (!S_ISDIR(parent->i_mode))
		goto unlock;

	err = -ENOENT;
	dir = d_find_alias(parent);
	if (!dir)
		goto unlock;

	entry = d_lookup(dir, name);
	dput(dir);
	if (!entry)
		goto unlock;

	fuse_invalidate_attr(parent);
	fuse_invalidate_entry(entry);

	if (child_nodeid == 0 || !entry->d_inode) {
		/* Nothing to delete */
		err = 0;
	} else {
		mutex_lock(&entry->d_inode->i_mutex);
		err = fuse_reverse_inval_child(entry, child_nodeid);
		mutex_unlock(&entry->d_inode->i_mutex);
		if (!err)
			d_delete(entry);
	}
	dput(entry);

 unlock:
	mutex_unlock(&parent->i_mutex);
	iput(parent);
	return err;
}

1034 1035
/*
 * Calling into a user-controlled filesystem gives the filesystem
1036
 * daemon ptrace-like capabilities over the current process.  This
1037 1038 1039 1040 1041 1042 1043 1044 1045 1046
 * means, that the filesystem daemon is able to record the exact
 * filesystem operations performed, and can also control the behavior
 * of the requester process in otherwise impossible ways.  For example
 * it can delay the operation for arbitrary length of time allowing
 * DoS against the requester.
 *
 * For this reason only those processes can call into the filesystem,
 * for which the owner of the mount has ptrace privilege.  This
 * excludes processes started by other users, suid or sgid processes.
 */
1047
int fuse_allow_current_process(struct fuse_conn *fc)
1048
{
1049
	const struct cred *cred;
1050

1051
	if (fc->flags & FUSE_ALLOW_OTHER)
1052 1053
		return 1;

1054
	cred = current_cred();
1055 1056 1057 1058 1059 1060
	if (uid_eq(cred->euid, fc->user_id) &&
	    uid_eq(cred->suid, fc->user_id) &&
	    uid_eq(cred->uid,  fc->user_id) &&
	    gid_eq(cred->egid, fc->group_id) &&
	    gid_eq(cred->sgid, fc->group_id) &&
	    gid_eq(cred->gid,  fc->group_id))
1061
		return 1;
1062

1063
	return 0;
1064 1065
}

M
Miklos Szeredi 已提交
1066 1067 1068 1069 1070 1071 1072
static int fuse_access(struct inode *inode, int mask)
{
	struct fuse_conn *fc = get_fuse_conn(inode);
	struct fuse_req *req;
	struct fuse_access_in inarg;
	int err;

1073 1074
	BUG_ON(mask & MAY_NOT_BLOCK);

M
Miklos Szeredi 已提交
1075 1076 1077
	if (fc->no_access)
		return 0;

M
Maxim Patlasov 已提交
1078
	req = fuse_get_req_nopages(fc);
1079 1080
	if (IS_ERR(req))
		return PTR_ERR(req);
M
Miklos Szeredi 已提交
1081 1082

	memset(&inarg, 0, sizeof(inarg));
1083
	inarg.mask = mask & (MAY_READ | MAY_WRITE | MAY_EXEC);
M
Miklos Szeredi 已提交
1084 1085 1086 1087 1088
	req->in.h.opcode = FUSE_ACCESS;
	req->in.h.nodeid = get_node_id(inode);
	req->in.numargs = 1;
	req->in.args[0].size = sizeof(inarg);
	req->in.args[0].value = &inarg;
1089
	fuse_request_send(fc, req);
M
Miklos Szeredi 已提交
1090 1091 1092 1093 1094 1095 1096 1097 1098
	err = req->out.h.error;
	fuse_put_request(fc, req);
	if (err == -ENOSYS) {
		fc->no_access = 1;
		err = 0;
	}
	return err;
}

1099
static int fuse_perm_getattr(struct inode *inode, int mask)
1100
{
1101
	if (mask & MAY_NOT_BLOCK)
1102 1103 1104 1105 1106
		return -ECHILD;

	return fuse_do_getattr(inode, NULL, NULL);
}

1107 1108 1109 1110 1111 1112 1113 1114 1115 1116 1117 1118 1119
/*
 * Check permission.  The two basic access models of FUSE are:
 *
 * 1) Local access checking ('default_permissions' mount option) based
 * on file mode.  This is the plain old disk filesystem permission
 * modell.
 *
 * 2) "Remote" access checking, where server is responsible for
 * checking permission in each inode operation.  An exception to this
 * is if ->permission() was invoked from sys_access() in which case an
 * access request is sent.  Execute permission is still checked
 * locally based on file mode.
 */
1120
static int fuse_permission(struct inode *inode, int mask)
1121 1122
{
	struct fuse_conn *fc = get_fuse_conn(inode);
1123 1124
	bool refreshed = false;
	int err = 0;
1125

1126
	if (!fuse_allow_current_process(fc))
1127
		return -EACCES;
1128 1129

	/*
1130
	 * If attributes are needed, refresh them before proceeding
1131
	 */
1132 1133
	if ((fc->flags & FUSE_DEFAULT_PERMISSIONS) ||
	    ((mask & MAY_EXEC) && S_ISREG(inode->i_mode))) {
1134 1135 1136 1137 1138
		struct fuse_inode *fi = get_fuse_inode(inode);

		if (fi->i_time < get_jiffies_64()) {
			refreshed = true;

1139
			err = fuse_perm_getattr(inode, mask);
1140 1141 1142
			if (err)
				return err;
		}
1143 1144 1145
	}

	if (fc->flags & FUSE_DEFAULT_PERMISSIONS) {
1146
		err = generic_permission(inode, mask);
M
Miklos Szeredi 已提交
1147 1148 1149 1150

		/* If permission is denied, try to refresh file
		   attributes.  This is also needed, because the root
		   node will at first have no permissions */
1151
		if (err == -EACCES && !refreshed) {
1152
			err = fuse_perm_getattr(inode, mask);
M
Miklos Szeredi 已提交
1153
			if (!err)
1154
				err = generic_permission(inode, mask);
M
Miklos Szeredi 已提交
1155 1156
		}

1157 1158 1159 1160
		/* Note: the opposite of the above test does not
		   exist.  So if permissions are revoked this won't be
		   noticed immediately, only after the attribute
		   timeout has expired */
E
Eric Paris 已提交
1161
	} else if (mask & (MAY_ACCESS | MAY_CHDIR)) {
1162 1163 1164 1165 1166 1167
		err = fuse_access(inode, mask);
	} else if ((mask & MAY_EXEC) && S_ISREG(inode->i_mode)) {
		if (!(inode->i_mode & S_IXUGO)) {
			if (refreshed)
				return -EACCES;

1168
			err = fuse_perm_getattr(inode, mask);
1169 1170 1171
			if (!err && !(inode->i_mode & S_IXUGO))
				return -EACCES;
		}
1172
	}
1173
	return err;
1174 1175 1176
}

static int parse_dirfile(char *buf, size_t nbytes, struct file *file,
A
Al Viro 已提交
1177
			 struct dir_context *ctx)
1178 1179 1180 1181 1182 1183 1184 1185
{
	while (nbytes >= FUSE_NAME_OFFSET) {
		struct fuse_dirent *dirent = (struct fuse_dirent *) buf;
		size_t reclen = FUSE_DIRENT_SIZE(dirent);
		if (!dirent->namelen || dirent->namelen > FUSE_NAME_MAX)
			return -EIO;
		if (reclen > nbytes)
			break;
1186 1187
		if (memchr(dirent->name, '/', dirent->namelen) != NULL)
			return -EIO;
1188

A
Al Viro 已提交
1189 1190
		if (!dir_emit(ctx, dirent->name, dirent->namelen,
			       dirent->ino, dirent->type))
1191 1192 1193 1194
			break;

		buf += reclen;
		nbytes -= reclen;
A
Al Viro 已提交
1195
		ctx->pos = dirent->off;
1196 1197 1198 1199 1200
	}

	return 0;
}

1201 1202 1203 1204 1205 1206 1207 1208 1209 1210 1211 1212 1213 1214 1215 1216 1217 1218 1219 1220 1221 1222 1223 1224 1225 1226 1227 1228 1229 1230 1231 1232 1233 1234 1235 1236
/*
 * Instantiate or refresh the dentry/inode described by one
 * FUSE_READDIRPLUS record under the directory that @file refers to.
 *
 * Returns 0 when the entry was linked or deliberately skipped (zero
 * nodeid, "." and ".."), and a negative errno otherwise.  The dentry
 * reference taken here is always dropped before returning.
 */
static int fuse_direntplus_link(struct file *file,
				struct fuse_direntplus *direntplus,
				u64 attr_version)
{
	struct fuse_entry_out *eo = &direntplus->entry_out;
	struct fuse_dirent *de = &direntplus->dirent;
	struct dentry *parent = file->f_path.dentry;
	struct inode *dir = parent->d_inode;
	struct qstr name = QSTR_INIT(de->name, de->namelen);
	struct dentry *dentry;
	struct dentry *alias;
	struct fuse_conn *fc;
	struct inode *inode;
	int err;

	/*
	 * Unlike in fuse_lookup, a zero nodeid does not mean ENOENT here.
	 * It only means the userspace filesystem did not want to return
	 * attributes/handle for this entry, so there is nothing to do.
	 */
	if (!eo->nodeid)
		return 0;

	/*
	 * Skip "." and "..".  We could potentially refresh the attributes
	 * of the directory and its parent instead?
	 */
	if (name.name[0] == '.' &&
	    (name.len == 1 || (name.len == 2 && name.name[1] == '.')))
		return 0;

	if (invalid_nodeid(eo->nodeid))
		return -EIO;
	if (!fuse_valid_type(eo->attr.mode))
		return -EIO;

	fc = get_fuse_conn(dir);

	name.hash = full_name_hash(name.name, name.len);
	dentry = d_lookup(parent, &name);
	if (dentry) {
		inode = dentry->d_inode;
		if (!inode) {
			/* negative dentry: unhash it and allocate afresh */
			d_drop(dentry);
		} else if (get_node_id(inode) != eo->nodeid ||
			   ((eo->attr.mode ^ inode->i_mode) & S_IFMT)) {
			/* cached dentry names a different node or type */
			err = d_invalidate(dentry);
			if (err)
				goto out;
		} else if (is_bad_inode(inode)) {
			err = -EIO;
			goto out;
		} else {
			struct fuse_inode *fi = get_fuse_inode(inode);

			/*
			 * The other path to 'found' goes through
			 * fuse_iget(), which bumps nlookup internally;
			 * do the equivalent by hand here.
			 */
			spin_lock(&fc->lock);
			fi->nlookup++;
			spin_unlock(&fc->lock);

			fuse_change_attributes(inode, &eo->attr,
					       entry_attr_timeout(eo),
					       attr_version);
			goto found;
		}
		dput(dentry);
	}

	dentry = d_alloc(parent, &name);
	err = -ENOMEM;
	if (!dentry)
		goto out;

	inode = fuse_iget(dir->i_sb, eo->nodeid, eo->generation,
			  &eo->attr, entry_attr_timeout(eo), attr_version);
	if (!inode)
		goto out;

	alias = d_materialise_unique(dentry, inode);
	err = PTR_ERR(alias);
	if (IS_ERR(alias))
		goto out;

	/* an existing alias replaces the dentry allocated above */
	if (alias) {
		dput(dentry);
		dentry = alias;
	}

found:
	if (fc->readdirplus_auto)
		set_bit(FUSE_I_INIT_RDPLUS, &get_fuse_inode(inode)->state);
	fuse_change_entry_timeout(dentry, eo);

	err = 0;
out:
	dput(dentry);
	return err;
}

/*
 * Walk the FUSE_READDIRPLUS reply in @buf (@nbytes long).
 *
 * Each record is handed to dir_emit() until the destination buffer is
 * full, and every record - emitted or not - is passed to
 * fuse_direntplus_link().  Records that could not be linked get an
 * explicit forget for their nodeid.
 *
 * ctx->pos only advances past entries that dir_emit() accepted.  When
 * dir_emit() fails, ctx->pos stays put so that the next readdir call
 * starts with the entry that did not fit instead of skipping it.
 *
 * Returns -EIO for a name that is empty, longer than FUSE_NAME_MAX or
 * contains '/', otherwise 0.
 */
static int parse_dirplusfile(char *buf, size_t nbytes, struct file *file,
			     struct dir_context *ctx, u64 attr_version)
{
	struct fuse_direntplus *direntplus;
	struct fuse_dirent *dirent;
	size_t reclen;
	int over = 0;
	int ret;

	while (nbytes >= FUSE_NAME_OFFSET_DIRENTPLUS) {
		direntplus = (struct fuse_direntplus *) buf;
		dirent = &direntplus->dirent;
		reclen = FUSE_DIRENTPLUS_SIZE(direntplus);

		if (!dirent->namelen || dirent->namelen > FUSE_NAME_MAX)
			return -EIO;
		/* record does not fit in what is left of the buffer */
		if (reclen > nbytes)
			break;
		if (memchr(dirent->name, '/', dirent->namelen) != NULL)
			return -EIO;

		if (!over) {
			/* We fill entries into dstbuf only as much as
			   it can hold. But we still continue iterating
			   over remaining entries to link them. If not,
			   we need to send a FORGET for each of those
			   which we did not link.
			*/
			over = !dir_emit(ctx, dirent->name, dirent->namelen,
				       dirent->ino, dirent->type);
			/* only move past an entry that was really emitted */
			if (!over)
				ctx->pos = dirent->off;
		}

		buf += reclen;
		nbytes -= reclen;

		ret = fuse_direntplus_link(file, direntplus, attr_version);
		if (ret)
			fuse_force_forget(file, direntplus->entry_out.nodeid);
	}

	return 0;
}

A
Al Viro 已提交
1354
static int fuse_readdir(struct file *file, struct dir_context *ctx)
1355
{
1356
	int plus, err;
1357 1358
	size_t nbytes;
	struct page *page;
A
Al Viro 已提交
1359
	struct inode *inode = file_inode(file);
1360
	struct fuse_conn *fc = get_fuse_conn(inode);
1361
	struct fuse_req *req;
1362
	u64 attr_version = 0;
1363 1364 1365 1366

	if (is_bad_inode(inode))
		return -EIO;

M
Maxim Patlasov 已提交
1367
	req = fuse_get_req(fc, 1);
1368 1369
	if (IS_ERR(req))
		return PTR_ERR(req);
1370

1371 1372 1373 1374 1375
	page = alloc_page(GFP_KERNEL);
	if (!page) {
		fuse_put_request(fc, req);
		return -ENOMEM;
	}
1376

A
Al Viro 已提交
1377
	plus = fuse_use_readdirplus(inode, ctx);
1378
	req->out.argpages = 1;
1379 1380
	req->num_pages = 1;
	req->pages[0] = page;
1381
	req->page_descs[0].length = PAGE_SIZE;
1382
	if (plus) {
1383
		attr_version = fuse_get_attr_version(fc);
A
Al Viro 已提交
1384
		fuse_read_fill(req, file, ctx->pos, PAGE_SIZE,
1385 1386
			       FUSE_READDIRPLUS);
	} else {
A
Al Viro 已提交
1387
		fuse_read_fill(req, file, ctx->pos, PAGE_SIZE,
1388 1389
			       FUSE_READDIR);
	}
1390
	fuse_request_send(fc, req);
1391
	nbytes = req->out.args[0].size;
1392 1393
	err = req->out.h.error;
	fuse_put_request(fc, req);
1394
	if (!err) {
1395
		if (plus) {
1396
			err = parse_dirplusfile(page_address(page), nbytes,
A
Al Viro 已提交
1397
						file, ctx,
1398 1399 1400
						attr_version);
		} else {
			err = parse_dirfile(page_address(page), nbytes, file,
A
Al Viro 已提交
1401
					    ctx);
1402 1403
		}
	}
1404

1405
	__free_page(page);
1406
	fuse_invalidate_atime(inode);
1407
	return err;
1408 1409 1410 1411 1412 1413
}

static char *read_link(struct dentry *dentry)
{
	struct inode *inode = dentry->d_inode;
	struct fuse_conn *fc = get_fuse_conn(inode);
M
Maxim Patlasov 已提交
1414
	struct fuse_req *req = fuse_get_req_nopages(fc);
1415 1416
	char *link;

1417
	if (IS_ERR(req))
1418
		return ERR_CAST(req);
1419 1420 1421 1422 1423 1424 1425 1426 1427 1428 1429 1430

	link = (char *) __get_free_page(GFP_KERNEL);
	if (!link) {
		link = ERR_PTR(-ENOMEM);
		goto out;
	}
	req->in.h.opcode = FUSE_READLINK;
	req->in.h.nodeid = get_node_id(inode);
	req->out.argvar = 1;
	req->out.numargs = 1;
	req->out.args[0].size = PAGE_SIZE - 1;
	req->out.args[0].value = link;
1431
	fuse_request_send(fc, req);
1432 1433 1434 1435 1436 1437 1438
	if (req->out.h.error) {
		free_page((unsigned long) link);
		link = ERR_PTR(req->out.h.error);
	} else
		link[req->out.args[0].size] = '\0';
 out:
	fuse_put_request(fc, req);
1439
	fuse_invalidate_atime(inode);
1440 1441 1442 1443 1444 1445 1446 1447 1448 1449 1450 1451 1452 1453 1454 1455 1456 1457 1458 1459 1460 1461
	return link;
}

/*
 * Release a buffer obtained from read_link().  An ERR_PTR value is
 * ignored.
 */
static void free_link(char *link)
{
	if (IS_ERR(link))
		return;

	free_page((unsigned long) link);
}

/*
 * ->follow_link(): read the link target and store it, or the ERR_PTR
 * returned by read_link(), in @nd.  Always returns NULL.
 */
static void *fuse_follow_link(struct dentry *dentry, struct nameidata *nd)
{
	char *target = read_link(dentry);

	nd_set_link(nd, target);
	return NULL;
}

/*
 * ->put_link(): free the link buffer that is stored in @nd.
 */
static void fuse_put_link(struct dentry *dentry, struct nameidata *nd, void *c)
{
	char *target = nd_get_link(nd);

	free_link(target);
}

/*
 * ->open() for directories: delegates to fuse_open_common() with its
 * last argument set to true (presumably the "is a directory" flag -
 * confirm against fuse_open_common()).
 */
static int fuse_dir_open(struct inode *inode, struct file *file)
{
	return fuse_open_common(inode, file, true);
}

static int fuse_dir_release(struct inode *inode, struct file *file)
{
1467 1468 1469
	fuse_release_common(file, FUSE_RELEASEDIR);

	return 0;
1470 1471
}

1472 1473
/*
 * ->fsync() for directories: delegates to fuse_fsync_common() with its
 * last argument set to 1 (presumably the "is a directory" flag -
 * confirm against fuse_fsync_common()).
 */
static int fuse_dir_fsync(struct file *file, loff_t start, loff_t end,
			  int datasync)
{
	return fuse_fsync_common(file, start, end, datasync, 1);
}

1478 1479 1480 1481 1482 1483 1484 1485 1486 1487 1488 1489 1490 1491 1492 1493 1494 1495 1496 1497 1498 1499 1500 1501
/*
 * ->unlocked_ioctl() for directories.  Returns -ENOTTY when the
 * connection's minor version is below 18, otherwise forwards to
 * fuse_ioctl_common() with FUSE_IOCTL_DIR.
 */
static long fuse_dir_ioctl(struct file *file, unsigned int cmd,
			    unsigned long arg)
{
	struct fuse_conn *fc = get_fuse_conn(file->f_mapping->host);

	/* FUSE_IOCTL_DIR only supported for API version >= 7.18 */
	return fc->minor < 18 ? -ENOTTY
			      : fuse_ioctl_common(file, cmd, arg,
						  FUSE_IOCTL_DIR);
}

/*
 * ->compat_ioctl() for directories.  Same as fuse_dir_ioctl() but with
 * FUSE_IOCTL_COMPAT added to the flags.
 */
static long fuse_dir_compat_ioctl(struct file *file, unsigned int cmd,
				   unsigned long arg)
{
	struct fuse_conn *fc = get_fuse_conn(file->f_mapping->host);
	const unsigned int flags = FUSE_IOCTL_COMPAT | FUSE_IOCTL_DIR;

	/* directory ioctls need a minor version of at least 18 */
	return fc->minor < 18 ? -ENOTTY
			      : fuse_ioctl_common(file, cmd, arg, flags);
}

M
Maxim Patlasov 已提交
1502
static bool update_mtime(unsigned ivalid, bool trust_local_mtime)
M
Miklos Szeredi 已提交
1503 1504 1505 1506 1507
{
	/* Always update if mtime is explicitly set  */
	if (ivalid & ATTR_MTIME_SET)
		return true;

M
Maxim Patlasov 已提交
1508 1509 1510 1511
	/* Or if kernel i_mtime is the official one */
	if (trust_local_mtime)
		return true;

M
Miklos Szeredi 已提交
1512 1513 1514 1515 1516 1517 1518 1519
	/* If it's an open(O_TRUNC) or an ftruncate(), don't update */
	if ((ivalid & ATTR_SIZE) && (ivalid & (ATTR_OPEN | ATTR_FILE)))
		return false;

	/* In all other cases update */
	return true;
}

M
Maxim Patlasov 已提交
1520 1521
static void iattr_to_fattr(struct iattr *iattr, struct fuse_setattr_in *arg,
			   bool trust_local_mtime)
1522 1523 1524 1525
{
	unsigned ivalid = iattr->ia_valid;

	if (ivalid & ATTR_MODE)
1526
		arg->valid |= FATTR_MODE,   arg->mode = iattr->ia_mode;
1527
	if (ivalid & ATTR_UID)
1528
		arg->valid |= FATTR_UID,    arg->uid = from_kuid(&init_user_ns, iattr->ia_uid);
1529
	if (ivalid & ATTR_GID)
1530
		arg->valid |= FATTR_GID,    arg->gid = from_kgid(&init_user_ns, iattr->ia_gid);
1531
	if (ivalid & ATTR_SIZE)
1532
		arg->valid |= FATTR_SIZE,   arg->size = iattr->ia_size;
M
Miklos Szeredi 已提交
1533 1534
	if (ivalid & ATTR_ATIME) {
		arg->valid |= FATTR_ATIME;
1535
		arg->atime = iattr->ia_atime.tv_sec;
M
Miklos Szeredi 已提交
1536 1537 1538 1539
		arg->atimensec = iattr->ia_atime.tv_nsec;
		if (!(ivalid & ATTR_ATIME_SET))
			arg->valid |= FATTR_ATIME_NOW;
	}
M
Maxim Patlasov 已提交
1540
	if ((ivalid & ATTR_MTIME) && update_mtime(ivalid, trust_local_mtime)) {
M
Miklos Szeredi 已提交
1541
		arg->valid |= FATTR_MTIME;
1542
		arg->mtime = iattr->ia_mtime.tv_sec;
M
Miklos Szeredi 已提交
1543
		arg->mtimensec = iattr->ia_mtime.tv_nsec;
M
Maxim Patlasov 已提交
1544
		if (!(ivalid & ATTR_MTIME_SET) && !trust_local_mtime)
M
Miklos Szeredi 已提交
1545
			arg->valid |= FATTR_MTIME_NOW;
1546
	}
1547 1548
}

M
Miklos Szeredi 已提交
1549 1550 1551 1552 1553 1554 1555 1556 1557 1558 1559 1560 1561 1562 1563 1564 1565 1566 1567 1568 1569 1570 1571 1572 1573 1574 1575 1576 1577 1578 1579 1580 1581 1582 1583 1584 1585 1586 1587 1588 1589 1590 1591 1592
/*
 * Prevent concurrent writepages on inode
 *
 * This is done by adding a negative bias to the inode write counter
 * and waiting for all pending writes to finish.
 *
 * The caller must hold inode->i_mutex (checked with BUG_ON).  The bias
 * is added under fc->lock; the wait is done after dropping it.
 */
void fuse_set_nowrite(struct inode *inode)
{
	struct fuse_conn *fc = get_fuse_conn(inode);
	struct fuse_inode *fi = get_fuse_inode(inode);

	BUG_ON(!mutex_is_locked(&inode->i_mutex));

	spin_lock(&fc->lock);
	/* a negative counter would mean the bias is already applied */
	BUG_ON(fi->writectr < 0);
	fi->writectr += FUSE_NOWRITE;
	spin_unlock(&fc->lock);
	/* sleep until only the bias is left in the counter */
	wait_event(fi->page_waitq, fi->writectr == FUSE_NOWRITE);
}

/*
 * Allow writepages on inode
 *
 * Remove the bias from the writecounter and send any queued
 * writepages.
 *
 * Both callers in this file invoke this with fc->lock held.  The
 * counter must hold exactly the bias (checked with BUG_ON).
 */
static void __fuse_release_nowrite(struct inode *inode)
{
	struct fuse_inode *fi = get_fuse_inode(inode);

	BUG_ON(fi->writectr != FUSE_NOWRITE);
	fi->writectr = 0;
	fuse_flush_writepages(inode);
}

/*
 * Locked variant of __fuse_release_nowrite(): takes fc->lock around the
 * call.
 */
void fuse_release_nowrite(struct inode *inode)
{
	struct fuse_conn *fc = get_fuse_conn(inode);

	spin_lock(&fc->lock);
	__fuse_release_nowrite(inode);
	spin_unlock(&fc->lock);
}

M
Maxim Patlasov 已提交
1593 1594 1595 1596 1597 1598 1599 1600 1601 1602 1603 1604 1605 1606 1607 1608 1609 1610 1611 1612 1613
/*
 * Set up @req as a FUSE_SETATTR request on @inode with @inarg_p as the
 * single input argument and @outarg_p as the single output argument.
 * Connections with a minor version below 9 use the shorter
 * FUSE_COMPAT_ATTR_OUT_SIZE for the reply.
 */
static void fuse_setattr_fill(struct fuse_conn *fc, struct fuse_req *req,
			      struct inode *inode,
			      struct fuse_setattr_in *inarg_p,
			      struct fuse_attr_out *outarg_p)
{
	req->in.h.opcode = FUSE_SETATTR;
	req->in.h.nodeid = get_node_id(inode);

	req->in.numargs = 1;
	req->in.args[0].size = sizeof(*inarg_p);
	req->in.args[0].value = inarg_p;

	req->out.numargs = 1;
	req->out.args[0].size = (fc->minor < 9) ? FUSE_COMPAT_ATTR_OUT_SIZE
						: sizeof(*outarg_p);
	req->out.args[0].value = outarg_p;
}

/*
 * Flush inode->i_mtime to the server
 */
1614
int fuse_flush_times(struct inode *inode, struct fuse_file *ff)
M
Maxim Patlasov 已提交
1615 1616
{
	struct fuse_conn *fc = get_fuse_conn(inode);
M
Miklos Szeredi 已提交
1617
	struct fuse_req *req;
M
Maxim Patlasov 已提交
1618 1619 1620 1621
	struct fuse_setattr_in inarg;
	struct fuse_attr_out outarg;
	int err;

M
Miklos Szeredi 已提交
1622 1623 1624
	req = fuse_get_req_nopages(fc);
	if (IS_ERR(req))
		return PTR_ERR(req);
M
Maxim Patlasov 已提交
1625 1626 1627 1628

	memset(&inarg, 0, sizeof(inarg));
	memset(&outarg, 0, sizeof(outarg));

1629
	inarg.valid = FATTR_MTIME;
M
Maxim Patlasov 已提交
1630 1631
	inarg.mtime = inode->i_mtime.tv_sec;
	inarg.mtimensec = inode->i_mtime.tv_nsec;
1632 1633 1634 1635 1636
	if (fc->minor >= 23) {
		inarg.valid |= FATTR_CTIME;
		inarg.ctime = inode->i_ctime.tv_sec;
		inarg.ctimensec = inode->i_ctime.tv_nsec;
	}
M
Miklos Szeredi 已提交
1637 1638 1639 1640
	if (ff) {
		inarg.valid |= FATTR_FH;
		inarg.fh = ff->fh;
	}
M
Maxim Patlasov 已提交
1641 1642 1643 1644 1645 1646 1647 1648
	fuse_setattr_fill(fc, req, inode, &inarg, &outarg);
	fuse_request_send(fc, req);
	err = req->out.h.error;
	fuse_put_request(fc, req);

	return err;
}

1649 1650 1651 1652 1653
/*
 * Set attributes, and at the same time refresh them.
 *
 * Truncation is slightly complicated, because the 'truncate' request
 * may fail, in which case we don't want to touch the mapping.
M
Miklos Szeredi 已提交
1654 1655
 * vmtruncate() doesn't allow for this case, so do the rlimit checking
 * and the actual truncation by hand.
1656
 */
1657 1658
int fuse_do_setattr(struct inode *inode, struct iattr *attr,
		    struct file *file)
1659 1660
{
	struct fuse_conn *fc = get_fuse_conn(inode);
1661
	struct fuse_inode *fi = get_fuse_inode(inode);
1662 1663 1664
	struct fuse_req *req;
	struct fuse_setattr_in inarg;
	struct fuse_attr_out outarg;
M
Miklos Szeredi 已提交
1665
	bool is_truncate = false;
P
Pavel Emelyanov 已提交
1666
	bool is_wb = fc->writeback_cache;
M
Miklos Szeredi 已提交
1667
	loff_t oldsize;
1668
	int err;
M
Maxim Patlasov 已提交
1669
	bool trust_local_mtime = is_wb && S_ISREG(inode->i_mode);
1670

1671 1672 1673 1674 1675 1676
	if (!(fc->flags & FUSE_DEFAULT_PERMISSIONS))
		attr->ia_valid |= ATTR_FORCE;

	err = inode_change_ok(inode, attr);
	if (err)
		return err;
M
Miklos Szeredi 已提交
1677

M
Miklos Szeredi 已提交
1678 1679 1680 1681 1682
	if (attr->ia_valid & ATTR_OPEN) {
		if (fc->atomic_o_trunc)
			return 0;
		file = NULL;
	}
1683

1684
	if (attr->ia_valid & ATTR_SIZE)
M
Miklos Szeredi 已提交
1685
		is_truncate = true;
1686

M
Maxim Patlasov 已提交
1687
	req = fuse_get_req_nopages(fc);
1688 1689
	if (IS_ERR(req))
		return PTR_ERR(req);
1690

1691
	if (is_truncate) {
M
Miklos Szeredi 已提交
1692
		fuse_set_nowrite(inode);
1693
		set_bit(FUSE_I_SIZE_UNSTABLE, &fi->state);
1694 1695
		if (trust_local_mtime && attr->ia_size != inode->i_size)
			attr->ia_valid |= ATTR_MTIME;
1696
	}
M
Miklos Szeredi 已提交
1697

1698
	memset(&inarg, 0, sizeof(inarg));
1699
	memset(&outarg, 0, sizeof(outarg));
M
Maxim Patlasov 已提交
1700
	iattr_to_fattr(attr, &inarg, trust_local_mtime);
1701 1702 1703 1704 1705
	if (file) {
		struct fuse_file *ff = file->private_data;
		inarg.valid |= FATTR_FH;
		inarg.fh = ff->fh;
	}
1706 1707 1708 1709 1710
	if (attr->ia_valid & ATTR_SIZE) {
		/* For mandatory locking in truncate */
		inarg.valid |= FATTR_LOCKOWNER;
		inarg.lock_owner = fuse_lock_owner_id(fc, current->files);
	}
M
Maxim Patlasov 已提交
1711
	fuse_setattr_fill(fc, req, inode, &inarg, &outarg);
1712
	fuse_request_send(fc, req);
1713 1714
	err = req->out.h.error;
	fuse_put_request(fc, req);
1715 1716 1717
	if (err) {
		if (err == -EINTR)
			fuse_invalidate_attr(inode);
M
Miklos Szeredi 已提交
1718
		goto error;
1719
	}
1720

1721 1722
	if ((inode->i_mode ^ outarg.attr.mode) & S_IFMT) {
		make_bad_inode(inode);
M
Miklos Szeredi 已提交
1723 1724 1725 1726 1727
		err = -EIO;
		goto error;
	}

	spin_lock(&fc->lock);
M
Maxim Patlasov 已提交
1728 1729 1730
	/* the kernel maintains i_mtime locally */
	if (trust_local_mtime && (attr->ia_valid & ATTR_MTIME)) {
		inode->i_mtime = attr->ia_mtime;
M
Miklos Szeredi 已提交
1731
		/* FIXME: clear I_DIRTY_SYNC? */
M
Maxim Patlasov 已提交
1732 1733
	}

M
Miklos Szeredi 已提交
1734 1735 1736
	fuse_change_attributes_common(inode, &outarg.attr,
				      attr_timeout(&outarg));
	oldsize = inode->i_size;
P
Pavel Emelyanov 已提交
1737 1738 1739
	/* see the comment in fuse_change_attributes() */
	if (!is_wb || is_truncate || !S_ISREG(inode->i_mode))
		i_size_write(inode, outarg.attr.size);
M
Miklos Szeredi 已提交
1740 1741 1742 1743 1744 1745 1746 1747 1748 1749 1750

	if (is_truncate) {
		/* NOTE: this may release/reacquire fc->lock */
		__fuse_release_nowrite(inode);
	}
	spin_unlock(&fc->lock);

	/*
	 * Only call invalidate_inode_pages2() after removing
	 * FUSE_NOWRITE, otherwise fuse_launder_page() would deadlock.
	 */
P
Pavel Emelyanov 已提交
1751 1752
	if ((is_truncate || !is_wb) &&
	    S_ISREG(inode->i_mode) && oldsize != outarg.attr.size) {
1753
		truncate_pagecache(inode, outarg.attr.size);
M
Miklos Szeredi 已提交
1754
		invalidate_inode_pages2(inode->i_mapping);
1755 1756
	}

1757
	clear_bit(FUSE_I_SIZE_UNSTABLE, &fi->state);
1758
	return 0;
M
Miklos Szeredi 已提交
1759 1760 1761 1762 1763

error:
	if (is_truncate)
		fuse_release_nowrite(inode);

1764
	clear_bit(FUSE_I_SIZE_UNSTABLE, &fi->state);
M
Miklos Szeredi 已提交
1765
	return err;
1766 1767
}

1768 1769
static int fuse_setattr(struct dentry *entry, struct iattr *attr)
{
1770 1771 1772 1773 1774
	struct inode *inode = entry->d_inode;

	if (!fuse_allow_current_process(get_fuse_conn(inode)))
		return -EACCES;

1775
	if (attr->ia_valid & ATTR_FILE)
1776
		return fuse_do_setattr(inode, attr, attr->ia_file);
1777
	else
1778
		return fuse_do_setattr(inode, attr, NULL);
1779 1780
}

1781 1782 1783 1784
static int fuse_getattr(struct vfsmount *mnt, struct dentry *entry,
			struct kstat *stat)
{
	struct inode *inode = entry->d_inode;
1785 1786
	struct fuse_conn *fc = get_fuse_conn(inode);

1787
	if (!fuse_allow_current_process(fc))
1788 1789
		return -EACCES;

M
Miklos Szeredi 已提交
1790
	return fuse_update_attributes(inode, stat, NULL, NULL);
1791 1792
}

1793 1794 1795 1796 1797 1798 1799 1800 1801 1802 1803 1804
static int fuse_setxattr(struct dentry *entry, const char *name,
			 const void *value, size_t size, int flags)
{
	struct inode *inode = entry->d_inode;
	struct fuse_conn *fc = get_fuse_conn(inode);
	struct fuse_req *req;
	struct fuse_setxattr_in inarg;
	int err;

	if (fc->no_setxattr)
		return -EOPNOTSUPP;

M
Maxim Patlasov 已提交
1805
	req = fuse_get_req_nopages(fc);
1806 1807
	if (IS_ERR(req))
		return PTR_ERR(req);
1808 1809 1810 1811 1812 1813 1814 1815 1816 1817 1818 1819 1820

	memset(&inarg, 0, sizeof(inarg));
	inarg.size = size;
	inarg.flags = flags;
	req->in.h.opcode = FUSE_SETXATTR;
	req->in.h.nodeid = get_node_id(inode);
	req->in.numargs = 3;
	req->in.args[0].size = sizeof(inarg);
	req->in.args[0].value = &inarg;
	req->in.args[1].size = strlen(name) + 1;
	req->in.args[1].value = name;
	req->in.args[2].size = size;
	req->in.args[2].value = value;
1821
	fuse_request_send(fc, req);
1822 1823 1824 1825 1826 1827
	err = req->out.h.error;
	fuse_put_request(fc, req);
	if (err == -ENOSYS) {
		fc->no_setxattr = 1;
		err = -EOPNOTSUPP;
	}
M
Maxim Patlasov 已提交
1828
	if (!err) {
1829
		fuse_invalidate_attr(inode);
M
Maxim Patlasov 已提交
1830 1831
		fuse_update_ctime(inode);
	}
1832 1833 1834 1835 1836 1837 1838 1839 1840 1841 1842 1843 1844 1845 1846 1847
	return err;
}

static ssize_t fuse_getxattr(struct dentry *entry, const char *name,
			     void *value, size_t size)
{
	struct inode *inode = entry->d_inode;
	struct fuse_conn *fc = get_fuse_conn(inode);
	struct fuse_req *req;
	struct fuse_getxattr_in inarg;
	struct fuse_getxattr_out outarg;
	ssize_t ret;

	if (fc->no_getxattr)
		return -EOPNOTSUPP;

M
Maxim Patlasov 已提交
1848
	req = fuse_get_req_nopages(fc);
1849 1850
	if (IS_ERR(req))
		return PTR_ERR(req);
1851 1852 1853 1854 1855 1856 1857 1858 1859 1860 1861 1862 1863 1864 1865 1866 1867 1868 1869 1870

	memset(&inarg, 0, sizeof(inarg));
	inarg.size = size;
	req->in.h.opcode = FUSE_GETXATTR;
	req->in.h.nodeid = get_node_id(inode);
	req->in.numargs = 2;
	req->in.args[0].size = sizeof(inarg);
	req->in.args[0].value = &inarg;
	req->in.args[1].size = strlen(name) + 1;
	req->in.args[1].value = name;
	/* This is really two different operations rolled into one */
	req->out.numargs = 1;
	if (size) {
		req->out.argvar = 1;
		req->out.args[0].size = size;
		req->out.args[0].value = value;
	} else {
		req->out.args[0].size = sizeof(outarg);
		req->out.args[0].value = &outarg;
	}
1871
	fuse_request_send(fc, req);
1872 1873 1874 1875 1876 1877 1878 1879 1880 1881 1882 1883 1884 1885 1886 1887 1888 1889 1890 1891 1892 1893
	ret = req->out.h.error;
	if (!ret)
		ret = size ? req->out.args[0].size : outarg.size;
	else {
		if (ret == -ENOSYS) {
			fc->no_getxattr = 1;
			ret = -EOPNOTSUPP;
		}
	}
	fuse_put_request(fc, req);
	return ret;
}

static ssize_t fuse_listxattr(struct dentry *entry, char *list, size_t size)
{
	struct inode *inode = entry->d_inode;
	struct fuse_conn *fc = get_fuse_conn(inode);
	struct fuse_req *req;
	struct fuse_getxattr_in inarg;
	struct fuse_getxattr_out outarg;
	ssize_t ret;

1894
	if (!fuse_allow_current_process(fc))
M
Miklos Szeredi 已提交
1895 1896
		return -EACCES;

1897 1898 1899
	if (fc->no_listxattr)
		return -EOPNOTSUPP;

M
Maxim Patlasov 已提交
1900
	req = fuse_get_req_nopages(fc);
1901 1902
	if (IS_ERR(req))
		return PTR_ERR(req);
1903 1904 1905 1906 1907 1908 1909 1910 1911 1912 1913 1914 1915 1916 1917 1918 1919 1920

	memset(&inarg, 0, sizeof(inarg));
	inarg.size = size;
	req->in.h.opcode = FUSE_LISTXATTR;
	req->in.h.nodeid = get_node_id(inode);
	req->in.numargs = 1;
	req->in.args[0].size = sizeof(inarg);
	req->in.args[0].value = &inarg;
	/* This is really two different operations rolled into one */
	req->out.numargs = 1;
	if (size) {
		req->out.argvar = 1;
		req->out.args[0].size = size;
		req->out.args[0].value = list;
	} else {
		req->out.args[0].size = sizeof(outarg);
		req->out.args[0].value = &outarg;
	}
1921
	fuse_request_send(fc, req);
1922 1923 1924 1925 1926 1927 1928 1929 1930 1931 1932 1933 1934 1935 1936 1937 1938 1939 1940 1941 1942 1943 1944
	ret = req->out.h.error;
	if (!ret)
		ret = size ? req->out.args[0].size : outarg.size;
	else {
		if (ret == -ENOSYS) {
			fc->no_listxattr = 1;
			ret = -EOPNOTSUPP;
		}
	}
	fuse_put_request(fc, req);
	return ret;
}

static int fuse_removexattr(struct dentry *entry, const char *name)
{
	struct inode *inode = entry->d_inode;
	struct fuse_conn *fc = get_fuse_conn(inode);
	struct fuse_req *req;
	int err;

	if (fc->no_removexattr)
		return -EOPNOTSUPP;

M
Maxim Patlasov 已提交
1945
	req = fuse_get_req_nopages(fc);
1946 1947
	if (IS_ERR(req))
		return PTR_ERR(req);
1948 1949 1950 1951 1952 1953

	req->in.h.opcode = FUSE_REMOVEXATTR;
	req->in.h.nodeid = get_node_id(inode);
	req->in.numargs = 1;
	req->in.args[0].size = strlen(name) + 1;
	req->in.args[0].value = name;
1954
	fuse_request_send(fc, req);
1955 1956 1957 1958 1959 1960
	err = req->out.h.error;
	fuse_put_request(fc, req);
	if (err == -ENOSYS) {
		fc->no_removexattr = 1;
		err = -EOPNOTSUPP;
	}
M
Maxim Patlasov 已提交
1961
	if (!err) {
1962
		fuse_invalidate_attr(inode);
M
Maxim Patlasov 已提交
1963 1964
		fuse_update_ctime(inode);
	}
1965 1966 1967
	return err;
}

1968
static const struct inode_operations fuse_dir_inode_operations = {
1969
	.lookup		= fuse_lookup,
1970 1971 1972 1973 1974 1975 1976 1977
	.mkdir		= fuse_mkdir,
	.symlink	= fuse_symlink,
	.unlink		= fuse_unlink,
	.rmdir		= fuse_rmdir,
	.rename		= fuse_rename,
	.link		= fuse_link,
	.setattr	= fuse_setattr,
	.create		= fuse_create,
1978
	.atomic_open	= fuse_atomic_open,
1979
	.mknod		= fuse_mknod,
1980 1981
	.permission	= fuse_permission,
	.getattr	= fuse_getattr,
1982 1983 1984 1985
	.setxattr	= fuse_setxattr,
	.getxattr	= fuse_getxattr,
	.listxattr	= fuse_listxattr,
	.removexattr	= fuse_removexattr,
1986 1987
};

1988
static const struct file_operations fuse_dir_operations = {
M
Miklos Szeredi 已提交
1989
	.llseek		= generic_file_llseek,
1990
	.read		= generic_read_dir,
A
Al Viro 已提交
1991
	.iterate	= fuse_readdir,
1992 1993
	.open		= fuse_dir_open,
	.release	= fuse_dir_release,
1994
	.fsync		= fuse_dir_fsync,
1995 1996
	.unlocked_ioctl	= fuse_dir_ioctl,
	.compat_ioctl	= fuse_dir_compat_ioctl,
1997 1998
};

1999
static const struct inode_operations fuse_common_inode_operations = {
2000
	.setattr	= fuse_setattr,
2001 2002
	.permission	= fuse_permission,
	.getattr	= fuse_getattr,
2003 2004 2005 2006
	.setxattr	= fuse_setxattr,
	.getxattr	= fuse_getxattr,
	.listxattr	= fuse_listxattr,
	.removexattr	= fuse_removexattr,
2007 2008
};

2009
static const struct inode_operations fuse_symlink_inode_operations = {
2010
	.setattr	= fuse_setattr,
2011 2012 2013 2014
	.follow_link	= fuse_follow_link,
	.put_link	= fuse_put_link,
	.readlink	= generic_readlink,
	.getattr	= fuse_getattr,
2015 2016 2017 2018
	.setxattr	= fuse_setxattr,
	.getxattr	= fuse_getxattr,
	.listxattr	= fuse_listxattr,
	.removexattr	= fuse_removexattr,
2019 2020 2021 2022 2023 2024 2025 2026 2027 2028 2029 2030 2031 2032 2033 2034 2035
};

/* Install fuse_common_inode_operations as the inode operations of @inode */
void fuse_init_common(struct inode *inode)
{
	inode->i_op = &fuse_common_inode_operations;
}

/*
 * Set up @inode as a directory: install the directory inode operations
 * and the directory file operations.
 */
void fuse_init_dir(struct inode *inode)
{
	inode->i_op = &fuse_dir_inode_operations;
	inode->i_fop = &fuse_dir_operations;
}

/* Install fuse_symlink_inode_operations as the inode operations of @inode */
void fuse_init_symlink(struct inode *inode)
{
	inode->i_op = &fuse_symlink_inode_operations;
}