xfs_ioctl.c 51.6 KB
Newer Older
D
Dave Chinner 已提交
1
// SPDX-License-Identifier: GPL-2.0
L
Linus Torvalds 已提交
2
/*
3 4
 * Copyright (c) 2000-2005 Silicon Graphics, Inc.
 * All Rights Reserved.
L
Linus Torvalds 已提交
5 6 7
 */
#include "xfs.h"
#include "xfs_fs.h"
8
#include "xfs_shared.h"
9 10 11
#include "xfs_format.h"
#include "xfs_log_format.h"
#include "xfs_trans_resv.h"
L
Linus Torvalds 已提交
12 13 14
#include "xfs_mount.h"
#include "xfs_inode.h"
#include "xfs_rtalloc.h"
15
#include "xfs_iwalk.h"
L
Linus Torvalds 已提交
16
#include "xfs_itable.h"
17
#include "xfs_error.h"
L
Linus Torvalds 已提交
18
#include "xfs_attr.h"
19
#include "xfs_bmap.h"
D
Dave Chinner 已提交
20
#include "xfs_bmap_util.h"
L
Linus Torvalds 已提交
21
#include "xfs_fsops.h"
C
Christoph Hellwig 已提交
22
#include "xfs_discard.h"
23
#include "xfs_quota.h"
24
#include "xfs_export.h"
C
Christoph Hellwig 已提交
25
#include "xfs_trace.h"
26
#include "xfs_icache.h"
27
#include "xfs_trans.h"
28
#include "xfs_acl.h"
29 30 31
#include "xfs_btree.h"
#include <linux/fsmap.h>
#include "xfs_fsmap.h"
32
#include "scrub/xfs_scrub.h"
33
#include "xfs_sb.h"
34
#include "xfs_ag.h"
35
#include "xfs_health.h"
36
#include "xfs_reflink.h"
D
Darrick J. Wong 已提交
37
#include "xfs_ioctl.h"
38 39
#include "xfs_da_format.h"
#include "xfs_da_btree.h"
L
Linus Torvalds 已提交
40 41 42 43 44 45 46 47 48 49 50 51 52 53 54

#include <linux/mount.h>
#include <linux/namei.h>

/*
 * xfs_find_handle maps from userspace xfs_fsop_handlereq structure to
 * a file or fs handle.
 *
 * XFS_IOC_PATH_TO_FSHANDLE
 *    returns fs handle for a mount point or path within that mount point
 * XFS_IOC_FD_TO_HANDLE
 *    returns full handle for a FD opened in user space
 * XFS_IOC_PATH_TO_HANDLE
 *    returns full handle for a path
 */
55
int
L
Linus Torvalds 已提交
56 57
xfs_find_handle(
	unsigned int		cmd,
58
	xfs_fsop_handlereq_t	*hreq)
L
Linus Torvalds 已提交
59 60 61 62
{
	int			hsize;
	xfs_handle_t		handle;
	struct inode		*inode;
63
	struct fd		f = {NULL};
C
Christoph Hellwig 已提交
64
	struct path		path;
65
	int			error;
C
Christoph Hellwig 已提交
66
	struct xfs_inode	*ip;
L
Linus Torvalds 已提交
67

C
Christoph Hellwig 已提交
68
	if (cmd == XFS_IOC_FD_TO_HANDLE) {
69 70
		f = fdget(hreq->fd);
		if (!f.file)
C
Christoph Hellwig 已提交
71
			return -EBADF;
A
Al Viro 已提交
72
		inode = file_inode(f.file);
C
Christoph Hellwig 已提交
73
	} else {
74
		error = user_path_at(AT_FDCWD, hreq->path, 0, &path);
C
Christoph Hellwig 已提交
75 76
		if (error)
			return error;
77
		inode = d_inode(path.dentry);
L
Linus Torvalds 已提交
78
	}
C
Christoph Hellwig 已提交
79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104
	ip = XFS_I(inode);

	/*
	 * We can only generate handles for inodes residing on a XFS filesystem,
	 * and only for regular files, directories or symbolic links.
	 */
	error = -EINVAL;
	if (inode->i_sb->s_magic != XFS_SB_MAGIC)
		goto out_put;

	error = -EBADF;
	if (!S_ISREG(inode->i_mode) &&
	    !S_ISDIR(inode->i_mode) &&
	    !S_ISLNK(inode->i_mode))
		goto out_put;


	memcpy(&handle.ha_fsid, ip->i_mount->m_fixedfsid, sizeof(xfs_fsid_t));

	if (cmd == XFS_IOC_PATH_TO_FSHANDLE) {
		/*
		 * This handle only contains an fsid, zero the rest.
		 */
		memset(&handle.ha_fid, 0, sizeof(handle.ha_fid));
		hsize = sizeof(xfs_fsid_t);
	} else {
C
Christoph Hellwig 已提交
105 106 107
		handle.ha_fid.fid_len = sizeof(xfs_fid_t) -
					sizeof(handle.ha_fid.fid_len);
		handle.ha_fid.fid_pad = 0;
108
		handle.ha_fid.fid_gen = inode->i_generation;
C
Christoph Hellwig 已提交
109
		handle.ha_fid.fid_ino = ip->i_ino;
C
Christoph Hellwig 已提交
110
		hsize = sizeof(xfs_handle_t);
L
Linus Torvalds 已提交
111 112
	}

C
Christoph Hellwig 已提交
113
	error = -EFAULT;
114
	if (copy_to_user(hreq->ohandle, &handle, hsize) ||
C
Christoph Hellwig 已提交
115 116
	    copy_to_user(hreq->ohandlen, &hsize, sizeof(__s32)))
		goto out_put;
L
Linus Torvalds 已提交
117

C
Christoph Hellwig 已提交
118 119 120 121
	error = 0;

 out_put:
	if (cmd == XFS_IOC_FD_TO_HANDLE)
122
		fdput(f);
C
Christoph Hellwig 已提交
123 124 125
	else
		path_put(&path);
	return error;
L
Linus Torvalds 已提交
126 127 128
}

/*
 * Acceptance callback handed to exportfs_decode_fh().  Handle operations
 * are privileged, so no permission checks on the pathname components are
 * needed: every candidate dentry is accepted.
 */
STATIC int
xfs_handle_acceptable(
	void			*context,
	struct dentry		*dentry)
{
	return 1;
}

/*
 * Convert userspace handle data into a dentry.
 *
 * @parfilp must refer to a directory; its mount is used for the lookup.
 * @uhandle points at @hlen bytes of handle data in user memory.
 *
 * Returns the result of exportfs_decode_fh(), or an ERR_PTR():
 *   -ENOTDIR  @parfilp is not a directory
 *   -EINVAL   @hlen or the fid length stored in the handle is wrong
 *   -EFAULT   the handle could not be copied from userspace
 */
struct dentry *
xfs_handle_to_dentry(
	struct file		*parfilp,
	void __user		*uhandle,
	u32			hlen)
{
	xfs_handle_t		handle;
	struct xfs_fid64	fid;

	/*
	 * Only allow handle opens under a directory.
	 */
	if (!S_ISDIR(file_inode(parfilp)->i_mode))
		return ERR_PTR(-ENOTDIR);

	if (hlen != sizeof(xfs_handle_t))
		return ERR_PTR(-EINVAL);
	if (copy_from_user(&handle, uhandle, hlen))
		return ERR_PTR(-EFAULT);
	if (handle.ha_fid.fid_len !=
	    sizeof(handle.ha_fid) - sizeof(handle.ha_fid.fid_len))
		return ERR_PTR(-EINVAL);

	/*
	 * Size the memset by the object itself.  The buffer is a struct
	 * xfs_fid64, not a struct fid, so sizeof(struct fid) is the wrong
	 * length to clear.
	 */
	memset(&fid, 0, sizeof(fid));
	fid.ino = handle.ha_fid.fid_ino;
	fid.gen = handle.ha_fid.fid_gen;

	return exportfs_decode_fh(parfilp->f_path.mnt, (struct fid *)&fid, 3,
			FILEID_INO32_GEN | XFS_FILEID_TYPE_64FLAG,
			xfs_handle_acceptable, NULL);
}
L
Linus Torvalds 已提交
174

175 176 177 178 179 180
/*
 * Decode the input handle carried in a handle request (hreq->ihandle,
 * hreq->ihandlen) into a dentry.  See xfs_handle_to_dentry() for the
 * possible ERR_PTR() results.
 */
STATIC struct dentry *
xfs_handlereq_to_dentry(
	struct file		*parfilp,
	xfs_fsop_handlereq_t	*hreq)
{
	return xfs_handle_to_dentry(parfilp,
				    hreq->ihandle,
				    hreq->ihandlen);
}

183
int
L
Linus Torvalds 已提交
184 185
xfs_open_by_handle(
	struct file		*parfilp,
186
	xfs_fsop_handlereq_t	*hreq)
L
Linus Torvalds 已提交
187
{
188
	const struct cred	*cred = current_cred();
L
Linus Torvalds 已提交
189
	int			error;
190
	int			fd;
L
Linus Torvalds 已提交
191 192 193 194
	int			permflag;
	struct file		*filp;
	struct inode		*inode;
	struct dentry		*dentry;
195
	fmode_t			fmode;
196
	struct path		path;
L
Linus Torvalds 已提交
197 198

	if (!capable(CAP_SYS_ADMIN))
E
Eric Sandeen 已提交
199
		return -EPERM;
L
Linus Torvalds 已提交
200

201 202 203
	dentry = xfs_handlereq_to_dentry(parfilp, hreq);
	if (IS_ERR(dentry))
		return PTR_ERR(dentry);
204
	inode = d_inode(dentry);
L
Linus Torvalds 已提交
205 206 207

	/* Restrict xfs_open_by_handle to directories & regular files. */
	if (!(S_ISREG(inode->i_mode) || S_ISDIR(inode->i_mode))) {
E
Eric Sandeen 已提交
208
		error = -EPERM;
209
		goto out_dput;
L
Linus Torvalds 已提交
210 211 212
	}

#if BITS_PER_LONG != 32
213
	hreq->oflags |= O_LARGEFILE;
L
Linus Torvalds 已提交
214
#endif
215

216
	permflag = hreq->oflags;
217
	fmode = OPEN_FMODE(permflag);
L
Linus Torvalds 已提交
218
	if ((!(permflag & O_APPEND) || (permflag & O_TRUNC)) &&
219
	    (fmode & FMODE_WRITE) && IS_APPEND(inode)) {
E
Eric Sandeen 已提交
220
		error = -EPERM;
221
		goto out_dput;
L
Linus Torvalds 已提交
222 223
	}

224
	if ((fmode & FMODE_WRITE) && IS_IMMUTABLE(inode)) {
E
Eryu Guan 已提交
225
		error = -EPERM;
226
		goto out_dput;
L
Linus Torvalds 已提交
227 228 229
	}

	/* Can't write directories. */
230
	if (S_ISDIR(inode->i_mode) && (fmode & FMODE_WRITE)) {
E
Eric Sandeen 已提交
231
		error = -EISDIR;
232
		goto out_dput;
L
Linus Torvalds 已提交
233 234
	}

235
	fd = get_unused_fd_flags(0);
236 237 238
	if (fd < 0) {
		error = fd;
		goto out_dput;
L
Linus Torvalds 已提交
239 240
	}

241 242 243 244
	path.mnt = parfilp->f_path.mnt;
	path.dentry = dentry;
	filp = dentry_open(&path, hreq->oflags, cred);
	dput(dentry);
L
Linus Torvalds 已提交
245
	if (IS_ERR(filp)) {
246 247
		put_unused_fd(fd);
		return PTR_ERR(filp);
L
Linus Torvalds 已提交
248
	}
249

A
Al Viro 已提交
250
	if (S_ISREG(inode->i_mode)) {
251
		filp->f_flags |= O_NOATIME;
252
		filp->f_mode |= FMODE_NOCMTIME;
253
	}
L
Linus Torvalds 已提交
254

255 256 257 258 259 260
	fd_install(fd, filp);
	return fd;

 out_dput:
	dput(dentry);
	return error;
L
Linus Torvalds 已提交
261 262
}

263
int
L
Linus Torvalds 已提交
264
xfs_readlink_by_handle(
265 266
	struct file		*parfilp,
	xfs_fsop_handlereq_t	*hreq)
L
Linus Torvalds 已提交
267
{
268
	struct dentry		*dentry;
L
Linus Torvalds 已提交
269
	__u32			olen;
270
	int			error;
L
Linus Torvalds 已提交
271 272

	if (!capable(CAP_SYS_ADMIN))
E
Eric Sandeen 已提交
273
		return -EPERM;
L
Linus Torvalds 已提交
274

275 276 277
	dentry = xfs_handlereq_to_dentry(parfilp, hreq);
	if (IS_ERR(dentry))
		return PTR_ERR(dentry);
L
Linus Torvalds 已提交
278 279

	/* Restrict this handle operation to symlinks only. */
280
	if (!d_is_symlink(dentry)) {
E
Eric Sandeen 已提交
281
		error = -EINVAL;
282
		goto out_dput;
L
Linus Torvalds 已提交
283 284
	}

285
	if (copy_from_user(&olen, hreq->ohandlen, sizeof(__u32))) {
E
Eric Sandeen 已提交
286
		error = -EFAULT;
287
		goto out_dput;
L
Linus Torvalds 已提交
288 289
	}

290
	error = vfs_readlink(dentry, hreq->ohandle, olen);
291

292 293
 out_dput:
	dput(dentry);
294
	return error;
L
Linus Torvalds 已提交
295 296 297 298
}

/*
 * List the extended attributes of the inode named by a handle.
 *
 * @arg points at a userspace struct xfs_fsop_attrlist_handlereq.  The
 * list is built in a kernel buffer of al_hreq.buflen bytes and copied to
 * al_hreq.buffer; the updated cursor is written back to the request's
 * pos field.  The caller needs CAP_SYS_ADMIN.
 *
 * Returns 0 on success or a negative errno.
 */
STATIC int
xfs_attrlist_by_handle(
	struct file		*parfilp,
	void			__user *arg)
{
	struct xfs_fsop_attrlist_handlereq __user	*p = arg;
	xfs_fsop_attrlist_handlereq_t al_hreq;
	attrlist_cursor_kern_t	*cursor;
	struct dentry		*dentry;
	char			*kbuf;
	int			error;

	if (!capable(CAP_SYS_ADMIN))
		return -EPERM;
	if (copy_from_user(&al_hreq, arg, sizeof(xfs_fsop_attrlist_handlereq_t)))
		return -EFAULT;

	/* The buffer must hold at least the list header and is capped. */
	if (al_hreq.buflen < sizeof(struct attrlist))
		return -EINVAL;
	if (al_hreq.buflen > XFS_XATTR_LIST_MAX)
		return -EINVAL;

	/*
	 * Reject flags, only allow namespaces, and not both namespaces at
	 * the same time.
	 */
	if (al_hreq.flags & ~(ATTR_ROOT | ATTR_SECURE))
		return -EINVAL;
	if (al_hreq.flags == (ATTR_ROOT | ATTR_SECURE))
		return -EINVAL;

	dentry = xfs_handlereq_to_dentry(parfilp, &al_hreq.hreq);
	if (IS_ERR(dentry))
		return PTR_ERR(dentry);

	kbuf = kmem_zalloc_large(al_hreq.buflen, 0);
	if (!kbuf) {
		error = -ENOMEM;
		goto out_dput;
	}

	/* The cursor lives inside our kernel copy of the request. */
	cursor = (attrlist_cursor_kern_t *)&al_hreq.pos;
	error = xfs_attr_list(XFS_I(d_inode(dentry)), kbuf, al_hreq.buflen,
					al_hreq.flags, cursor);
	if (error)
		goto out_kfree;

	/* Hand back the cursor first, then the attribute list itself. */
	if (copy_to_user(&p->pos, cursor, sizeof(attrlist_cursor_kern_t)) ||
	    copy_to_user(al_hreq.buffer, kbuf, al_hreq.buflen))
		error = -EFAULT;

out_kfree:
	kmem_free(kbuf);
out_dput:
	dput(dentry);
	return error;
}

354
static int
L
Linus Torvalds 已提交
355
xfs_attrmulti_attr_get(
356
	struct inode		*inode,
357 358
	unsigned char		*name,
	unsigned char		__user *ubuf,
359 360
	uint32_t		*len,
	uint32_t		flags)
L
Linus Torvalds 已提交
361
{
362 363 364 365 366 367 368 369
	struct xfs_da_args	args = {
		.dp		= XFS_I(inode),
		.flags		= flags,
		.name		= name,
		.namelen	= strlen(name),
		.valuelen	= *len,
	};
	int			error;
370

371
	if (*len > XFS_XATTR_SIZE_MAX)
D
Dave Chinner 已提交
372
		return -EINVAL;
373 374 375

	args.value = kmem_zalloc_large(*len, 0);
	if (!args.value)
D
Dave Chinner 已提交
376
		return -ENOMEM;
L
Linus Torvalds 已提交
377

378
	error = xfs_attr_get(&args);
L
Linus Torvalds 已提交
379 380 381
	if (error)
		goto out_kfree;

382 383
	*len = args.valuelen;
	if (copy_to_user(ubuf, args.value, args.valuelen))
D
Dave Chinner 已提交
384
		error = -EFAULT;
L
Linus Torvalds 已提交
385

386
out_kfree:
387
	kmem_free(args.value);
L
Linus Torvalds 已提交
388 389 390
	return error;
}

391
static int
L
Linus Torvalds 已提交
392
xfs_attrmulti_attr_set(
393
	struct inode		*inode,
394 395
	unsigned char		*name,
	const unsigned char	__user *ubuf,
396 397
	uint32_t		len,
	uint32_t		flags)
L
Linus Torvalds 已提交
398
{
399 400 401 402 403 404
	struct xfs_da_args	args = {
		.dp		= XFS_I(inode),
		.flags		= flags,
		.name		= name,
		.namelen	= strlen(name),
	};
405
	int			error;
L
Linus Torvalds 已提交
406

407
	if (IS_IMMUTABLE(inode) || IS_APPEND(inode))
D
Dave Chinner 已提交
408
		return -EPERM;
L
Linus Torvalds 已提交
409

410 411 412
	if (ubuf) {
		if (len > XFS_XATTR_SIZE_MAX)
			return -EINVAL;
413 414 415 416
		args.value = memdup_user(ubuf, len);
		if (IS_ERR(args.value))
			return PTR_ERR(args.value);
		args.valuelen = len;
417
	}
418

419
	error = xfs_attr_set(&args);
420 421
	if (!error)
		xfs_forget_acl(inode, name, flags);
422
	kfree(args.value);
423
	return error;
L
Linus Torvalds 已提交
424 425
}

426 427 428 429 430 431 432 433 434 435 436 437 438 439 440 441 442 443 444 445 446 447 448 449 450 451 452 453 454 455 456 457 458 459 460 461 462 463 464 465 466 467 468 469
/*
 * Perform a single attribute operation (@opcode is one of ATTR_OP_GET,
 * ATTR_OP_SET or ATTR_OP_REMOVE) on @inode.  @uname is the user pointer
 * to the attribute name, @value the user value buffer and *@len its
 * length.  Set and remove take write access on @parfilp's mount for the
 * duration of the change; remove also resets *@len to 0.
 *
 * Returns 0 on success or a negative errno.
 */
int
xfs_ioc_attrmulti_one(
	struct file		*parfilp,
	struct inode		*inode,
	uint32_t		opcode,
	void __user		*uname,
	void __user		*value,
	uint32_t		*len,
	uint32_t		flags)
{
	unsigned char		*name;
	int			error;

	/* The two namespace flags are mutually exclusive. */
	if ((flags & ATTR_ROOT) && (flags & ATTR_SECURE))
		return -EINVAL;

	name = strndup_user(uname, MAXNAMELEN);
	if (IS_ERR(name))
		return PTR_ERR(name);

	if (opcode == ATTR_OP_GET) {
		error = xfs_attrmulti_attr_get(inode, name, value, len, flags);
	} else if (opcode == ATTR_OP_SET || opcode == ATTR_OP_REMOVE) {
		if (opcode == ATTR_OP_REMOVE) {
			/* A remove is a set with no value attached. */
			value = NULL;
			*len = 0;
		}

		error = mnt_want_write_file(parfilp);
		if (!error) {
			error = xfs_attrmulti_attr_set(inode, name, value,
						       *len, flags);
			mnt_drop_write_file(parfilp);
		}
	} else {
		error = -EINVAL;
	}

	kfree(name);
	return error;
}

L
Linus Torvalds 已提交
470 471
STATIC int
xfs_attrmulti_by_handle(
472
	struct file		*parfilp,
473
	void			__user *arg)
L
Linus Torvalds 已提交
474 475 476 477
{
	int			error;
	xfs_attr_multiop_t	*ops;
	xfs_fsop_attrmulti_handlereq_t am_hreq;
478
	struct dentry		*dentry;
L
Linus Torvalds 已提交
479 480 481
	unsigned int		i, size;

	if (!capable(CAP_SYS_ADMIN))
E
Eric Sandeen 已提交
482
		return -EPERM;
L
Linus Torvalds 已提交
483
	if (copy_from_user(&am_hreq, arg, sizeof(xfs_fsop_attrmulti_handlereq_t)))
E
Eric Sandeen 已提交
484
		return -EFAULT;
L
Linus Torvalds 已提交
485

486 487 488 489
	/* overflow check */
	if (am_hreq.opcount >= INT_MAX / sizeof(xfs_attr_multiop_t))
		return -E2BIG;

490 491 492
	dentry = xfs_handlereq_to_dentry(parfilp, &am_hreq.hreq);
	if (IS_ERR(dentry))
		return PTR_ERR(dentry);
L
Linus Torvalds 已提交
493

D
Dave Chinner 已提交
494
	error = -E2BIG;
C
Christoph Hellwig 已提交
495
	size = am_hreq.opcount * sizeof(xfs_attr_multiop_t);
L
Linus Torvalds 已提交
496
	if (!size || size > 16 * PAGE_SIZE)
497
		goto out_dput;
L
Linus Torvalds 已提交
498

L
Li Zefan 已提交
499 500
	ops = memdup_user(am_hreq.ops, size);
	if (IS_ERR(ops)) {
D
Dave Chinner 已提交
501
		error = PTR_ERR(ops);
502
		goto out_dput;
L
Li Zefan 已提交
503
	}
L
Linus Torvalds 已提交
504 505 506

	error = 0;
	for (i = 0; i < am_hreq.opcount; i++) {
507 508 509 510
		ops[i].am_error = xfs_ioc_attrmulti_one(parfilp,
				d_inode(dentry), ops[i].am_opcode,
				ops[i].am_attrname, ops[i].am_attrvalue,
				&ops[i].am_length, ops[i].am_flags);
L
Linus Torvalds 已提交
511 512 513
	}

	if (copy_to_user(am_hreq.ops, ops, size))
D
Dave Chinner 已提交
514
		error = -EFAULT;
L
Linus Torvalds 已提交
515 516

	kfree(ops);
517 518
 out_dput:
	dput(dentry);
D
Dave Chinner 已提交
519
	return error;
L
Linus Torvalds 已提交
520 521
}

522
int
L
Linus Torvalds 已提交
523 524
xfs_ioc_space(
	struct file		*filp,
525
	xfs_flock64_t		*bf)
L
Linus Torvalds 已提交
526
{
527 528
	struct inode		*inode = file_inode(filp);
	struct xfs_inode	*ip = XFS_I(inode);
529
	struct iattr		iattr;
530
	enum xfs_prealloc_flags	flags = XFS_PREALLOC_CLEAR;
531
	uint			iolock = XFS_IOLOCK_EXCL | XFS_MMAPLOCK_EXCL;
L
Linus Torvalds 已提交
532 533
	int			error;

534
	if (inode->i_flags & (S_IMMUTABLE|S_APPEND))
E
Eric Sandeen 已提交
535
		return -EPERM;
L
Linus Torvalds 已提交
536

537
	if (!(filp->f_mode & FMODE_WRITE))
E
Eric Sandeen 已提交
538
		return -EBADF;
L
Linus Torvalds 已提交
539

540
	if (!S_ISREG(inode->i_mode))
E
Eric Sandeen 已提交
541
		return -EINVAL;
L
Linus Torvalds 已提交
542

543 544 545
	if (xfs_is_always_cow_inode(ip))
		return -EOPNOTSUPP;

546 547
	if (filp->f_flags & O_DSYNC)
		flags |= XFS_PREALLOC_SYNC;
548
	if (filp->f_mode & FMODE_NOCMTIME)
549 550
		flags |= XFS_PREALLOC_INVISIBLE;

J
Jan Kara 已提交
551 552 553
	error = mnt_want_write_file(filp);
	if (error)
		return error;
554

555
	xfs_ilock(ip, iolock);
556
	error = xfs_break_layouts(inode, &iolock, BREAK_UNMAP);
557 558
	if (error)
		goto out_unlock;
559
	inode_dio_wait(inode);
560 561 562 563 564 565 566 567 568 569 570

	switch (bf->l_whence) {
	case 0: /*SEEK_SET*/
		break;
	case 1: /*SEEK_CUR*/
		bf->l_start += filp->f_pos;
		break;
	case 2: /*SEEK_END*/
		bf->l_start += XFS_ISIZE(ip);
		break;
	default:
D
Dave Chinner 已提交
571
		error = -EINVAL;
572 573 574
		goto out_unlock;
	}

575
	if (bf->l_start < 0 || bf->l_start > inode->i_sb->s_maxbytes) {
D
Dave Chinner 已提交
576
		error = -EINVAL;
577 578 579
		goto out_unlock;
	}

580 581 582 583 584
	if (bf->l_start > XFS_ISIZE(ip)) {
		error = xfs_alloc_file_space(ip, XFS_ISIZE(ip),
				bf->l_start - XFS_ISIZE(ip), 0);
		if (error)
			goto out_unlock;
585 586
	}

587 588 589
	iattr.ia_valid = ATTR_SIZE;
	iattr.ia_size = bf->l_start;
	error = xfs_vn_setattr_size(file_dentry(filp), &iattr);
590 591 592
	if (error)
		goto out_unlock;

593
	error = xfs_update_prealloc_flags(ip, flags);
594 595

out_unlock:
596
	xfs_iunlock(ip, iolock);
J
Jan Kara 已提交
597
	mnt_drop_write_file(filp);
D
Dave Chinner 已提交
598
	return error;
L
Linus Torvalds 已提交
599 600
}

601 602
/* Return 0 on success or positive error */
int
D
Darrick J. Wong 已提交
603
xfs_fsbulkstat_one_fmt(
604 605
	struct xfs_ibulk		*breq,
	const struct xfs_bulkstat	*bstat)
606
{
607 608 609 610
	struct xfs_bstat		bs1;

	xfs_bulkstat_to_bstat(breq->mp, &bs1, bstat);
	if (copy_to_user(breq->ubuffer, &bs1, sizeof(bs1)))
611 612 613 614
		return -EFAULT;
	return xfs_ibulk_advance(breq, sizeof(struct xfs_bstat));
}

615
int
D
Darrick J. Wong 已提交
616
xfs_fsinumbers_fmt(
617 618
	struct xfs_ibulk		*breq,
	const struct xfs_inumbers	*igrp)
619
{
620 621 622 623
	struct xfs_inogrp		ig1;

	xfs_inumbers_to_inogrp(&ig1, igrp);
	if (copy_to_user(breq->ubuffer, &ig1, sizeof(struct xfs_inogrp)))
624 625 626 627
		return -EFAULT;
	return xfs_ibulk_advance(breq, sizeof(struct xfs_inogrp));
}

L
Linus Torvalds 已提交
628
STATIC int
D
Darrick J. Wong 已提交
629
xfs_ioc_fsbulkstat(
L
Linus Torvalds 已提交
630 631 632 633
	xfs_mount_t		*mp,
	unsigned int		cmd,
	void			__user *arg)
{
634 635 636 637 638 639
	struct xfs_fsop_bulkreq	bulkreq;
	struct xfs_ibulk	breq = {
		.mp		= mp,
		.ocount		= 0,
	};
	xfs_ino_t		lastino;
L
Linus Torvalds 已提交
640 641 642 643 644 645 646 647 648
	int			error;

	/* done = 1 if there are more stats to get and if bulkstat */
	/* should be called again (unused here, but used in dmapi) */

	if (!capable(CAP_SYS_ADMIN))
		return -EPERM;

	if (XFS_FORCED_SHUTDOWN(mp))
E
Eric Sandeen 已提交
649
		return -EIO;
L
Linus Torvalds 已提交
650

651
	if (copy_from_user(&bulkreq, arg, sizeof(struct xfs_fsop_bulkreq)))
E
Eric Sandeen 已提交
652
		return -EFAULT;
L
Linus Torvalds 已提交
653

654
	if (copy_from_user(&lastino, bulkreq.lastip, sizeof(__s64)))
E
Eric Sandeen 已提交
655
		return -EFAULT;
L
Linus Torvalds 已提交
656

657
	if (bulkreq.icount <= 0)
E
Eric Sandeen 已提交
658
		return -EINVAL;
L
Linus Torvalds 已提交
659

660
	if (bulkreq.ubuffer == NULL)
E
Eric Sandeen 已提交
661
		return -EINVAL;
662

663 664 665 666 667 668 669 670 671 672 673 674 675 676 677
	breq.ubuffer = bulkreq.ubuffer;
	breq.icount = bulkreq.icount;

	/*
	 * FSBULKSTAT_SINGLE expects that *lastip contains the inode number
	 * that we want to stat.  However, FSINUMBERS and FSBULKSTAT expect
	 * that *lastip contains either zero or the number of the last inode to
	 * be examined by the previous call and return results starting with
	 * the next inode after that.  The new bulk request back end functions
	 * take the inode to start with, so we have to compute the startino
	 * parameter from lastino to maintain correct function.  lastino == 0
	 * is a special case because it has traditionally meant "first inode
	 * in filesystem".
	 */
	if (cmd == XFS_IOC_FSINUMBERS) {
678
		breq.startino = lastino ? lastino + 1 : 0;
D
Darrick J. Wong 已提交
679
		error = xfs_inumbers(&breq, xfs_fsinumbers_fmt);
680
		lastino = breq.startino - 1;
681 682 683
	} else if (cmd == XFS_IOC_FSBULKSTAT_SINGLE) {
		breq.startino = lastino;
		breq.icount = 1;
D
Darrick J. Wong 已提交
684
		error = xfs_bulkstat_one(&breq, xfs_fsbulkstat_one_fmt);
685 686
	} else {	/* XFS_IOC_FSBULKSTAT */
		breq.startino = lastino ? lastino + 1 : 0;
D
Darrick J. Wong 已提交
687
		error = xfs_bulkstat(&breq, xfs_fsbulkstat_one_fmt);
688 689
		lastino = breq.startino - 1;
	}
L
Linus Torvalds 已提交
690 691

	if (error)
D
Dave Chinner 已提交
692
		return error;
L
Linus Torvalds 已提交
693

694
	if (bulkreq.lastip != NULL &&
695
	    copy_to_user(bulkreq.lastip, &lastino, sizeof(xfs_ino_t)))
696
		return -EFAULT;
L
Linus Torvalds 已提交
697

698
	if (bulkreq.ocount != NULL &&
699
	    copy_to_user(bulkreq.ocount, &breq.ocount, sizeof(__s32)))
700
		return -EFAULT;
L
Linus Torvalds 已提交
701 702 703 704

	return 0;
}

705 706 707 708 709 710 711 712 713 714 715 716 717 718
/*
 * Bulkstat formatter for the v5 ioctl: copy @bstat unchanged to the user
 * buffer in @breq and advance the request past it.  Returns -EFAULT if
 * the copy fails, otherwise the result of xfs_ibulk_advance().
 */
static int
xfs_bulkstat_fmt(
	struct xfs_ibulk		*breq,
	const struct xfs_bulkstat	*bstat)
{
	int				failed;

	failed = copy_to_user(breq->ubuffer, bstat, sizeof(struct xfs_bulkstat)) != 0;
	if (failed)
		return -EFAULT;

	return xfs_ibulk_advance(breq, sizeof(struct xfs_bulkstat));
}

/*
 * Check the incoming bulk request @hdr from userspace and initialize the
 * internal @breq bulk request appropriately.  @ubuffer is the userspace
 * record buffer to fill.
 *
 * Returns 0 if the bulk request should proceed; -ECANCELED if there's
 * nothing to do; or the usual negative error code (-EINVAL for a zero
 * icount, unknown flags, non-zero reserved fields, or an inconsistent
 * flag/agno/ino combination).
 */
static int
xfs_bulk_ireq_setup(
	struct xfs_mount	*mp,
	struct xfs_bulk_ireq	*hdr,
	struct xfs_ibulk	*breq,
	void __user		*ubuffer)
{
	if (hdr->icount == 0 ||
	    (hdr->flags & ~XFS_BULK_IREQ_FLAGS_ALL) ||
	    memchr_inv(hdr->reserved, 0, sizeof(hdr->reserved)))
		return -EINVAL;

	breq->startino = hdr->ino;
	breq->ubuffer = ubuffer;
	breq->icount = hdr->icount;
	breq->ocount = 0;
	breq->flags = 0;

	/*
	 * The @ino parameter is a special value, so we must look it up here.
	 * We're not allowed to have IREQ_AGNO, and we only return one inode
	 * worth of data.
	 */
	if (hdr->flags & XFS_BULK_IREQ_SPECIAL) {
		if (hdr->flags & XFS_BULK_IREQ_AGNO)
			return -EINVAL;

		switch (hdr->ino) {
		case XFS_BULK_IREQ_SPECIAL_ROOT:
			/*
			 * The walk starts at breq->startino, which was
			 * already loaded with the symbolic value above, so
			 * the resolved root inode number has to go there.
			 * Writing it to hdr->ino has no effect on the walk.
			 */
			breq->startino = mp->m_sb.sb_rootino;
			break;
		default:
			return -EINVAL;
		}
		breq->icount = 1;
	}

	/*
	 * The IREQ_AGNO flag means that we only want results from a given AG.
	 * If @hdr->ino is zero, we start iterating in that AG.  If @hdr->ino is
	 * beyond the specified AG then we return no results.
	 */
	if (hdr->flags & XFS_BULK_IREQ_AGNO) {
		if (hdr->agno >= mp->m_sb.sb_agcount)
			return -EINVAL;

		if (breq->startino == 0)
			breq->startino = XFS_AGINO_TO_INO(mp, hdr->agno, 0);
		else if (XFS_INO_TO_AGNO(mp, breq->startino) < hdr->agno)
			return -EINVAL;

		breq->flags |= XFS_IBULK_SAME_AG;

		/* Asking for an inode past the end of the AG?  We're done! */
		if (XFS_INO_TO_AGNO(mp, breq->startino) > hdr->agno)
			return -ECANCELED;
	} else if (hdr->agno)
		return -EINVAL;

	/* Asking for an inode past the end of the FS?  We're done! */
	if (XFS_INO_TO_AGNO(mp, breq->startino) >= mp->m_sb.sb_agcount)
		return -ECANCELED;

	return 0;
}

/*
 * Copy the end state of the internal bulk request @breq (next inode to
 * examine and number of records produced) into the userspace-visible
 * header @hdr, ready to be copied back out by the caller.
 */
static void
xfs_bulk_ireq_teardown(
	struct xfs_bulk_ireq	*hdr,
	struct xfs_ibulk	*breq)
{
	hdr->ocount = breq->ocount;
	hdr->ino = breq->startino;
}

/*
 * Handle the v5 bulkstat ioctl.
 *
 * Reads the request header from @arg, runs xfs_bulkstat() into the
 * caller's record array and writes the updated header back.  A request
 * that xfs_bulk_ireq_setup() reports as -ECANCELED skips the walk but
 * still has its header written back.  The caller needs CAP_SYS_ADMIN.
 *
 * Returns 0 on success or a negative errno.
 */
STATIC int
xfs_ioc_bulkstat(
	struct xfs_mount		*mp,
	unsigned int			cmd,
	struct xfs_bulkstat_req __user	*arg)
{
	struct xfs_bulk_ireq		hdr;
	struct xfs_ibulk		breq = {
		.mp			= mp,
	};
	int				error;

	if (!capable(CAP_SYS_ADMIN))
		return -EPERM;

	if (XFS_FORCED_SHUTDOWN(mp))
		return -EIO;

	if (copy_from_user(&hdr, &arg->hdr, sizeof(hdr)))
		return -EFAULT;

	error = xfs_bulk_ireq_setup(mp, &hdr, &breq, arg->bulkstat);
	if (error != -ECANCELED) {
		if (error < 0)
			return error;

		error = xfs_bulkstat(&breq, xfs_bulkstat_fmt);
		if (error)
			return error;
	}

	/* Report the end state, including for cancelled requests. */
	xfs_bulk_ireq_teardown(&hdr, &breq);
	if (copy_to_user(&arg->hdr, &hdr, sizeof(hdr)))
		return -EFAULT;

	return 0;
}

841 842 843 844 845 846 847 848 849 850 851 852 853 854 855 856 857 858 859 860 861 862 863 864 865 866 867 868 869 870 871 872 873
/*
 * Inumbers formatter for the v5 ioctl: copy @igrp unchanged to the user
 * buffer in @breq and advance the request past it.  Returns -EFAULT if
 * the copy fails, otherwise the result of xfs_ibulk_advance().
 */
STATIC int
xfs_inumbers_fmt(
	struct xfs_ibulk		*breq,
	const struct xfs_inumbers	*igrp)
{
	int				failed;

	failed = copy_to_user(breq->ubuffer, igrp, sizeof(struct xfs_inumbers)) != 0;
	if (failed)
		return -EFAULT;

	return xfs_ibulk_advance(breq, sizeof(struct xfs_inumbers));
}

/*
 * Handle the v5 inumbers ioctl.
 *
 * Reads the request header from @arg, runs xfs_inumbers() into the
 * caller's record array and writes the updated header back.  A request
 * that xfs_bulk_ireq_setup() reports as -ECANCELED skips the walk but
 * still has its header written back.  The caller needs CAP_SYS_ADMIN.
 *
 * Returns 0 on success or a negative errno.
 */
STATIC int
xfs_ioc_inumbers(
	struct xfs_mount		*mp,
	unsigned int			cmd,
	struct xfs_inumbers_req __user	*arg)
{
	struct xfs_bulk_ireq		hdr;
	struct xfs_ibulk		breq = {
		.mp			= mp,
	};
	int				error;

	if (!capable(CAP_SYS_ADMIN))
		return -EPERM;

	if (XFS_FORCED_SHUTDOWN(mp))
		return -EIO;

	if (copy_from_user(&hdr, &arg->hdr, sizeof(hdr)))
		return -EFAULT;

	error = xfs_bulk_ireq_setup(mp, &hdr, &breq, arg->inumbers);
	if (error != -ECANCELED) {
		if (error < 0)
			return error;

		error = xfs_inumbers(&breq, xfs_inumbers_fmt);
		if (error)
			return error;
	}

	/* Report the end state, including for cancelled requests. */
	xfs_bulk_ireq_teardown(&hdr, &breq);
	if (copy_to_user(&arg->hdr, &hdr, sizeof(hdr)))
		return -EFAULT;

	return 0;
}

/*
 * Copy the filesystem geometry to userspace.  @struct_version selects
 * how much of struct xfs_fsop_geom is copied out: versions up to 3 get
 * the v1 layout, version 4 the v4 layout, and anything newer the full
 * structure with the health fields filled in as well.
 *
 * Returns 0 on success or -EFAULT if the copy to @arg fails.
 */
STATIC int
xfs_ioc_fsgeometry(
	struct xfs_mount	*mp,
	void			__user *arg,
	int			struct_version)
{
	struct xfs_fsop_geom	fsgeo;
	size_t			len;

	xfs_fs_geometry(&mp->m_sb, &fsgeo, struct_version);

	if (struct_version > 4) {
		xfs_fsop_geom_health(mp, &fsgeo);
		len = sizeof(fsgeo);
	} else if (struct_version == 4) {
		len = sizeof(struct xfs_fsop_geom_v4);
	} else {
		len = sizeof(struct xfs_fsop_geom_v1);
	}

	return copy_to_user(arg, &fsgeo, len) ? -EFAULT : 0;
}

916 917 918 919 920 921 922 923 924 925
/*
 * Report the geometry of one allocation group.  The AG number comes from
 * the ag_number field of the struct xfs_ag_geometry at @arg; the flags
 * and reserved fields of the request must be zero.
 *
 * Returns 0 on success, -EFAULT on a failed user copy, -EINVAL for a
 * malformed request, or the error from xfs_ag_get_geometry().
 */
STATIC int
xfs_ioc_ag_geometry(
	struct xfs_mount	*mp,
	void			__user *arg)
{
	struct xfs_ag_geometry	ageo;
	int			error;

	if (copy_from_user(&ageo, arg, sizeof(ageo)))
		return -EFAULT;

	/* No flags are defined and the reserved area must be clear. */
	if (ageo.ag_flags ||
	    memchr_inv(&ageo.ag_reserved, 0, sizeof(ageo.ag_reserved)))
		return -EINVAL;

	error = xfs_ag_get_geometry(mp, ageo.ag_number, &ageo);
	if (error)
		return error;

	return copy_to_user(arg, &ageo, sizeof(ageo)) ? -EFAULT : 0;
}

L
Linus Torvalds 已提交
940 941 942 943 944 945 946 947 948 949 950
/*
 * Linux extended inode flags interface.
 */

STATIC unsigned int
xfs_merge_ioc_xflags(
	unsigned int	flags,
	unsigned int	start)
{
	unsigned int	xflags = start;

951
	if (flags & FS_IMMUTABLE_FL)
952
		xflags |= FS_XFLAG_IMMUTABLE;
L
Linus Torvalds 已提交
953
	else
954
		xflags &= ~FS_XFLAG_IMMUTABLE;
955
	if (flags & FS_APPEND_FL)
956
		xflags |= FS_XFLAG_APPEND;
L
Linus Torvalds 已提交
957
	else
958
		xflags &= ~FS_XFLAG_APPEND;
959
	if (flags & FS_SYNC_FL)
960
		xflags |= FS_XFLAG_SYNC;
L
Linus Torvalds 已提交
961
	else
962
		xflags &= ~FS_XFLAG_SYNC;
963
	if (flags & FS_NOATIME_FL)
964
		xflags |= FS_XFLAG_NOATIME;
L
Linus Torvalds 已提交
965
	else
966
		xflags &= ~FS_XFLAG_NOATIME;
967
	if (flags & FS_NODUMP_FL)
968
		xflags |= FS_XFLAG_NODUMP;
L
Linus Torvalds 已提交
969
	else
970
		xflags &= ~FS_XFLAG_NODUMP;
L
Linus Torvalds 已提交
971 972 973 974 975 976

	return xflags;
}

STATIC unsigned int
xfs_di2lxflags(
977
	uint16_t	di_flags)
L
Linus Torvalds 已提交
978 979 980 981
{
	unsigned int	flags = 0;

	if (di_flags & XFS_DIFLAG_IMMUTABLE)
982
		flags |= FS_IMMUTABLE_FL;
L
Linus Torvalds 已提交
983
	if (di_flags & XFS_DIFLAG_APPEND)
984
		flags |= FS_APPEND_FL;
L
Linus Torvalds 已提交
985
	if (di_flags & XFS_DIFLAG_SYNC)
986
		flags |= FS_SYNC_FL;
L
Linus Torvalds 已提交
987
	if (di_flags & XFS_DIFLAG_NOATIME)
988
		flags |= FS_NOATIME_FL;
L
Linus Torvalds 已提交
989
	if (di_flags & XFS_DIFLAG_NODUMP)
990
		flags |= FS_NODUMP_FL;
L
Linus Torvalds 已提交
991 992 993
	return flags;
}

994 995 996 997 998
/*
 * Fill @fa from the in-core inode @ip: xflags, extent size hints (the
 * on-disk values shifted left by sb_blocklog), project id and an extent
 * count.  @attr selects the fork that is counted: the attribute fork when
 * true (0 if the inode has none), the data fork otherwise.
 */
static void
xfs_fill_fsxattr(
	struct xfs_inode	*ip,
	bool			attr,
	struct fsxattr		*fa)
{
	simple_fill_fsxattr(fa, xfs_ip2xflags(ip));

	fa->fsx_extsize = ip->i_d.di_extsize << ip->i_mount->m_sb.sb_blocklog;
	fa->fsx_cowextsize = ip->i_d.di_cowextsize <<
			ip->i_mount->m_sb.sb_blocklog;
	fa->fsx_projid = ip->i_d.di_projid;

	/*
	 * Use the in-core extent list when the fork has XFS_IFEXTENTS set,
	 * and the count kept in the inode core otherwise.
	 */
	if (!attr) {
		if (ip->i_df.if_flags & XFS_IFEXTENTS)
			fa->fsx_nextents = xfs_iext_count(&ip->i_df);
		else
			fa->fsx_nextents = ip->i_d.di_nextents;
	} else if (!ip->i_afp) {
		fa->fsx_nextents = 0;
	} else if (ip->i_afp->if_flags & XFS_IFEXTENTS) {
		fa->fsx_nextents = xfs_iext_count(ip->i_afp);
	} else {
		fa->fsx_nextents = ip->i_d.di_anextents;
	}
}

/*
 * Copy the struct fsxattr of @ip to userspace.  The snapshot is taken
 * under XFS_ILOCK_SHARED; @attr selects which fork's extent count is
 * reported (see xfs_fill_fsxattr()).
 *
 * Returns 0 on success or -EFAULT if the copy to @arg fails.
 */
STATIC int
xfs_ioc_fsgetxattr(
	xfs_inode_t		*ip,
	int			attr,
	void			__user *arg)
{
	struct fsxattr		fa;

	xfs_ilock(ip, XFS_ILOCK_SHARED);
	xfs_fill_fsxattr(ip, attr, &fa);
	xfs_iunlock(ip, XFS_ILOCK_SHARED);

	/* The user copy happens after the inode lock has been dropped. */
	return copy_to_user(arg, &fa, sizeof(fa)) ? -EFAULT : 0;
}

1039 1040
/*
 * Translate FS_XFLAG_* bits in @xflags into the on-disk di_flags value
 * for @ip.  XFS_DIFLAG_PREALLOC cannot be set this way and is carried
 * over from the inode.  The inheritance and nosymlinks flags are only
 * honoured on directories; realtime and extsize only on regular files.
 */
STATIC uint16_t
xfs_flags2diflags(
	struct xfs_inode	*ip,
	unsigned int		xflags)
{
	/* can't set PREALLOC this way, just preserve it */
	uint16_t		di_flags =
		(ip->i_d.di_flags & XFS_DIFLAG_PREALLOC);

	/* Flags that apply to every kind of inode. */
	if (xflags & FS_XFLAG_IMMUTABLE)
		di_flags |= XFS_DIFLAG_IMMUTABLE;
	if (xflags & FS_XFLAG_APPEND)
		di_flags |= XFS_DIFLAG_APPEND;
	if (xflags & FS_XFLAG_SYNC)
		di_flags |= XFS_DIFLAG_SYNC;
	if (xflags & FS_XFLAG_NOATIME)
		di_flags |= XFS_DIFLAG_NOATIME;
	if (xflags & FS_XFLAG_NODUMP)
		di_flags |= XFS_DIFLAG_NODUMP;
	if (xflags & FS_XFLAG_NODEFRAG)
		di_flags |= XFS_DIFLAG_NODEFRAG;
	if (xflags & FS_XFLAG_FILESTREAM)
		di_flags |= XFS_DIFLAG_FILESTREAM;

	/* Regular-file-only flags. */
	if (S_ISREG(VFS_I(ip)->i_mode) && !S_ISDIR(VFS_I(ip)->i_mode)) {
		if (xflags & FS_XFLAG_REALTIME)
			di_flags |= XFS_DIFLAG_REALTIME;
		if (xflags & FS_XFLAG_EXTSIZE)
			di_flags |= XFS_DIFLAG_EXTSIZE;
		return di_flags;
	}

	/* Directory-only flags. */
	if (S_ISDIR(VFS_I(ip)->i_mode)) {
		if (xflags & FS_XFLAG_RTINHERIT)
			di_flags |= XFS_DIFLAG_RTINHERIT;
		if (xflags & FS_XFLAG_NOSYMLINKS)
			di_flags |= XFS_DIFLAG_NOSYMLINKS;
		if (xflags & FS_XFLAG_EXTSZINHERIT)
			di_flags |= XFS_DIFLAG_EXTSZINHERIT;
		if (xflags & FS_XFLAG_PROJINHERIT)
			di_flags |= XFS_DIFLAG_PROJINHERIT;
	}

	return di_flags;
}

/*
 * Translate FS_XFLAG_* bits in @xflags into the on-disk di_flags2 value
 * for @ip.  XFS_DIFLAG2_REFLINK is carried over from the inode; DAX and
 * COWEXTSIZE are taken from @xflags.
 */
STATIC uint64_t
xfs_flags2diflags2(
	struct xfs_inode	*ip,
	unsigned int		xflags)
{
	uint64_t		di_flags2;

	di_flags2 = ip->i_d.di_flags2 & XFS_DIFLAG2_REFLINK;
	di_flags2 |= (xflags & FS_XFLAG_DAX) ? XFS_DIFLAG2_DAX : 0;
	di_flags2 |= (xflags & FS_XFLAG_COWEXTSIZE) ?
			XFS_DIFLAG2_COWEXTSIZE : 0;

	return di_flags2;
}

1097 1098 1099 1100
STATIC void
xfs_diflags_to_linux(
	struct xfs_inode	*ip)
{
1101
	struct inode		*inode = VFS_I(ip);
1102 1103
	unsigned int		xflags = xfs_ip2xflags(ip);

1104
	if (xflags & FS_XFLAG_IMMUTABLE)
1105 1106 1107
		inode->i_flags |= S_IMMUTABLE;
	else
		inode->i_flags &= ~S_IMMUTABLE;
1108
	if (xflags & FS_XFLAG_APPEND)
1109 1110 1111
		inode->i_flags |= S_APPEND;
	else
		inode->i_flags &= ~S_APPEND;
1112
	if (xflags & FS_XFLAG_SYNC)
1113 1114 1115
		inode->i_flags |= S_SYNC;
	else
		inode->i_flags &= ~S_SYNC;
1116
	if (xflags & FS_XFLAG_NOATIME)
1117 1118 1119
		inode->i_flags |= S_NOATIME;
	else
		inode->i_flags &= ~S_NOATIME;
1120
#if 0	/* disabled until the flag switching races are sorted out */
1121 1122 1123 1124
	if (xflags & FS_XFLAG_DAX)
		inode->i_flags |= S_DAX;
	else
		inode->i_flags &= ~S_DAX;
1125
#endif
1126
}
1127

1128 1129 1130 1131 1132 1133 1134
static int
xfs_ioctl_setattr_xflags(
	struct xfs_trans	*tp,
	struct xfs_inode	*ip,
	struct fsxattr		*fa)
{
	struct xfs_mount	*mp = ip->i_mount;
1135
	uint64_t		di_flags2;
1136 1137 1138

	/* Can't change realtime flag if any extents are allocated. */
	if ((ip->i_d.di_nextents || ip->i_delayed_blks) &&
1139
	    XFS_IS_REALTIME_INODE(ip) != (fa->fsx_xflags & FS_XFLAG_REALTIME))
1140 1141 1142
		return -EINVAL;

	/* If realtime flag is set then must have realtime device */
1143
	if (fa->fsx_xflags & FS_XFLAG_REALTIME) {
1144 1145 1146 1147 1148
		if (mp->m_sb.sb_rblocks == 0 || mp->m_sb.sb_rextsize == 0 ||
		    (ip->i_d.di_extsize % mp->m_sb.sb_rextsize))
			return -EINVAL;
	}

1149
	/* Clear reflink if we are actually able to set the rt flag. */
1150
	if ((fa->fsx_xflags & FS_XFLAG_REALTIME) && xfs_is_reflink_inode(ip))
1151
		ip->i_d.di_flags2 &= ~XFS_DIFLAG2_REFLINK;
1152

1153 1154 1155 1156
	/* Don't allow us to set DAX mode for a reflinked file for now. */
	if ((fa->fsx_xflags & FS_XFLAG_DAX) && xfs_is_reflink_inode(ip))
		return -EINVAL;

1157 1158 1159 1160 1161 1162 1163 1164
	/* diflags2 only valid for v3 inodes. */
	di_flags2 = xfs_flags2diflags2(ip, fa->fsx_xflags);
	if (di_flags2 && ip->i_d.di_version < 3)
		return -EINVAL;

	ip->i_d.di_flags = xfs_flags2diflags(ip, fa->fsx_xflags);
	ip->i_d.di_flags2 = di_flags2;

1165 1166 1167
	xfs_diflags_to_linux(ip);
	xfs_trans_ichgtime(tp, ip, XFS_ICHGTIME_CHG);
	xfs_trans_log_inode(tp, ip, XFS_ILOG_CORE);
1168
	XFS_STATS_INC(mp, xs_ig_attrchg);
1169 1170 1171
	return 0;
}

1172 1173 1174 1175 1176 1177 1178 1179 1180 1181 1182 1183 1184 1185 1186
/*
 * If we are changing DAX flags, we have to ensure the file is clean and any
 * cached objects in the address space are invalidated and removed. This
 * requires us to lock out other IO and page faults similar to a truncate
 * operation. The locks need to be held until the transaction has been committed
 * so that the cache invalidation is atomic with respect to the DAX flag
 * manipulation.
 */
static int
xfs_ioctl_setattr_dax_invalidate(
	struct xfs_inode	*ip,
	struct fsxattr		*fa,
	int			*join_flags)
{
	struct inode		*inode = VFS_I(ip);
1187
	struct super_block	*sb = inode->i_sb;
1188 1189 1190 1191
	int			error;

	*join_flags = 0;

1192 1193
	/*
	 * It is only valid to set the DAX flag on regular files and
1194
	 * directories on filesystems where the block size is equal to the page
1195 1196
	 * size. On directories it serves as an inherited hint so we don't
	 * have to check the device for dax support or flush pagecache.
1197
	 */
1198
	if (fa->fsx_xflags & FS_XFLAG_DAX) {
1199 1200 1201
		struct xfs_buftarg	*target = xfs_inode_buftarg(ip);

		if (!bdev_dax_supported(target->bt_bdev, sb->s_blocksize))
1202 1203
			return -EINVAL;
	}
1204

1205 1206 1207 1208 1209 1210
	/* If the DAX state is not changing, we have nothing to do here. */
	if ((fa->fsx_xflags & FS_XFLAG_DAX) && IS_DAX(inode))
		return 0;
	if (!(fa->fsx_xflags & FS_XFLAG_DAX) && !IS_DAX(inode))
		return 0;

1211 1212 1213
	if (S_ISDIR(inode->i_mode))
		return 0;

1214 1215 1216 1217 1218 1219 1220 1221 1222 1223
	/* lock, flush and invalidate mapping in preparation for flag change */
	xfs_ilock(ip, XFS_MMAPLOCK_EXCL | XFS_IOLOCK_EXCL);
	error = filemap_write_and_wait(inode->i_mapping);
	if (error)
		goto out_unlock;
	error = invalidate_inode_pages2(inode->i_mapping);
	if (error)
		goto out_unlock;

	*join_flags = XFS_MMAPLOCK_EXCL | XFS_IOLOCK_EXCL;
1224
	return 0;
1225 1226 1227 1228 1229

out_unlock:
	xfs_iunlock(ip, XFS_MMAPLOCK_EXCL | XFS_IOLOCK_EXCL);
	return error;

1230 1231
}

1232 1233 1234 1235 1236
/*
 * Set up the transaction structure for the setattr operation, checking that we
 * have permission to do so. On success, return a clean transaction and the
 * inode locked exclusively ready for further operation specific checks. On
 * failure, return an error without modifying or locking the inode.
1237 1238 1239 1240 1241 1242
 *
 * The inode might already be IO locked on call. If this is the case, it is
 * indicated in @join_flags and we take full responsibility for ensuring they
 * are unlocked from now on. Hence if we have an error here, we still have to
 * unlock them. Otherwise, once they are joined to the transaction, they will
 * be unlocked on commit/cancel.
1243 1244 1245
 */
static struct xfs_trans *
xfs_ioctl_setattr_get_trans(
1246 1247
	struct xfs_inode	*ip,
	int			join_flags)
1248 1249 1250
{
	struct xfs_mount	*mp = ip->i_mount;
	struct xfs_trans	*tp;
1251
	int			error = -EROFS;
1252 1253

	if (mp->m_flags & XFS_MOUNT_RDONLY)
1254 1255
		goto out_unlock;
	error = -EIO;
1256
	if (XFS_FORCED_SHUTDOWN(mp))
1257
		goto out_unlock;
1258

1259
	error = xfs_trans_alloc(mp, &M_RES(mp)->tr_ichange, 0, 0, 0, &tp);
1260
	if (error)
1261
		goto out_unlock;
1262 1263

	xfs_ilock(ip, XFS_ILOCK_EXCL);
1264 1265
	xfs_trans_ijoin(tp, ip, XFS_ILOCK_EXCL | join_flags);
	join_flags = 0;
1266 1267 1268 1269 1270 1271 1272 1273 1274 1275 1276 1277 1278 1279 1280 1281 1282 1283

	/*
	 * CAP_FOWNER overrides the following restrictions:
	 *
	 * The user ID of the calling process must be equal to the file owner
	 * ID, except in cases where the CAP_FSETID capability is applicable.
	 */
	if (!inode_owner_or_capable(VFS_I(ip))) {
		error = -EPERM;
		goto out_cancel;
	}

	if (mp->m_flags & XFS_MOUNT_WSYNC)
		xfs_trans_set_sync(tp);

	return tp;

out_cancel:
1284
	xfs_trans_cancel(tp);
1285 1286 1287
out_unlock:
	if (join_flags)
		xfs_iunlock(ip, join_flags);
1288 1289 1290
	return ERR_PTR(error);
}

1291 1292 1293 1294
/*
 * extent size hint validation is somewhat cumbersome. Rules are:
 *
 * 1. extent size hint is only valid for directories and regular files
1295 1296
 * 2. FS_XFLAG_EXTSIZE is only valid for regular files
 * 3. FS_XFLAG_EXTSZINHERIT is only valid for directories.
1297 1298 1299 1300 1301 1302 1303
 * 4. can only be changed on regular files if no extents are allocated
 * 5. can be changed on directories at any time
 * 6. extsize hint of 0 turns off hints, clears inode flags.
 * 7. Extent size must be a multiple of the appropriate block size.
 * 8. for non-realtime files, the extent size hint must be limited
 *    to half the AG size to avoid alignment extending the extent beyond the
 *    limits of the AG.
D
Darrick J. Wong 已提交
1304 1305
 *
 * Please keep this function in sync with xfs_scrub_inode_extsize.
1306
 */
1307
static int
1308 1309 1310 1311 1312
xfs_ioctl_setattr_check_extsize(
	struct xfs_inode	*ip,
	struct fsxattr		*fa)
{
	struct xfs_mount	*mp = ip->i_mount;
1313 1314
	xfs_extlen_t		size;
	xfs_fsblock_t		extsize_fsb;
1315

D
Dave Chinner 已提交
1316
	if (S_ISREG(VFS_I(ip)->i_mode) && ip->i_d.di_nextents &&
1317 1318 1319
	    ((ip->i_d.di_extsize << mp->m_sb.sb_blocklog) != fa->fsx_extsize))
		return -EINVAL;

1320 1321
	if (fa->fsx_extsize == 0)
		return 0;
1322

1323 1324 1325
	extsize_fsb = XFS_B_TO_FSB(mp, fa->fsx_extsize);
	if (extsize_fsb > MAXEXTLEN)
		return -EINVAL;
1326

1327 1328 1329 1330 1331 1332
	if (XFS_IS_REALTIME_INODE(ip) ||
	    (fa->fsx_xflags & FS_XFLAG_REALTIME)) {
		size = mp->m_sb.sb_rextsize << mp->m_sb.sb_blocklog;
	} else {
		size = mp->m_sb.sb_blocksize;
		if (extsize_fsb > mp->m_sb.sb_agblocks / 2)
1333
			return -EINVAL;
1334 1335 1336 1337
	}

	if (fa->fsx_extsize % size)
		return -EINVAL;
1338

1339 1340 1341
	return 0;
}

1342 1343 1344 1345 1346 1347 1348 1349 1350 1351 1352 1353
/*
 * CoW extent size hint validation rules are:
 *
 * 1. CoW extent size hint can only be set if reflink is enabled on the fs.
 *    The inode does not have to have any shared blocks, but it must be a v3.
 * 2. FS_XFLAG_COWEXTSIZE is only valid for directories and regular files;
 *    for a directory, the hint is propagated to new files.
 * 3. Can be changed on files & directories at any time.
 * 4. CoW extsize hint of 0 turns off hints, clears inode flags.
 * 5. Extent size must be a multiple of the appropriate block size.
 * 6. The extent size hint must be limited to half the AG size to avoid
 *    alignment extending the extent beyond the limits of the AG.
D
Darrick J. Wong 已提交
1354 1355
 *
 * Please keep this function in sync with xfs_scrub_inode_cowextsize.
1356 1357 1358 1359 1360 1361 1362
 */
static int
xfs_ioctl_setattr_check_cowextsize(
	struct xfs_inode	*ip,
	struct fsxattr		*fa)
{
	struct xfs_mount	*mp = ip->i_mount;
1363 1364
	xfs_extlen_t		size;
	xfs_fsblock_t		cowextsize_fsb;
1365 1366 1367 1368 1369 1370 1371 1372

	if (!(fa->fsx_xflags & FS_XFLAG_COWEXTSIZE))
		return 0;

	if (!xfs_sb_version_hasreflink(&ip->i_mount->m_sb) ||
	    ip->i_d.di_version != 3)
		return -EINVAL;

1373 1374
	if (fa->fsx_cowextsize == 0)
		return 0;
1375

1376 1377 1378
	cowextsize_fsb = XFS_B_TO_FSB(mp, fa->fsx_cowextsize);
	if (cowextsize_fsb > MAXEXTLEN)
		return -EINVAL;
1379

1380 1381 1382
	size = mp->m_sb.sb_blocksize;
	if (cowextsize_fsb > mp->m_sb.sb_agblocks / 2)
		return -EINVAL;
1383

1384 1385
	if (fa->fsx_cowextsize % size)
		return -EINVAL;
1386 1387 1388 1389

	return 0;
}

1390
static int
1391 1392 1393 1394 1395
xfs_ioctl_setattr_check_projid(
	struct xfs_inode	*ip,
	struct fsxattr		*fa)
{
	/* Disallow 32bit project ids if projid32bit feature is not enabled. */
1396
	if (fa->fsx_projid > (uint16_t)-1 &&
1397 1398 1399 1400
	    !xfs_sb_version_hasprojid32bit(&ip->i_mount->m_sb))
		return -EINVAL;
	return 0;
}
1401 1402 1403 1404

/*
 * Apply the attributes described by @fa (xflags, project id, extent size and
 * CoW extent size hints) to @ip inside a single transaction.
 *
 * Returns 0 on success or a negative errno.  Any dquots acquired along the
 * way are released before returning, on both the success and error paths.
 */
STATIC int
xfs_ioctl_setattr(
	xfs_inode_t		*ip,
	struct fsxattr		*fa)
{
	struct fsxattr		old_fa;
	struct xfs_mount	*mp = ip->i_mount;
	struct inode		*inode = VFS_I(ip);
	struct xfs_trans	*tp;
	struct xfs_dquot	*udqp = NULL;
	struct xfs_dquot	*pdqp = NULL;
	struct xfs_dquot	*olddquot = NULL;
	int			code;
	int			join_flags = 0;

	trace_xfs_ioctl_setattr(ip);

	code = xfs_ioctl_setattr_check_projid(ip, fa);
	if (code)
		return code;

	/*
	 * If disk quotas is on, we make sure that the dquots do exist on disk,
	 * before we start any other transactions. Trying to do this later
	 * is messy. We don't care to take a readlock to look at the ids
	 * in inode here, because we can't hold it across the trans_reserve.
	 * If the IDs do change before we take the ilock, we're covered
	 * because the i_*dquot fields will get updated anyway.
	 */
	if (XFS_IS_QUOTA_ON(mp)) {
		code = xfs_qm_vop_dqalloc(ip, inode->i_uid, inode->i_gid,
				fa->fsx_projid, XFS_QMOPT_PQUOTA,
				&udqp, NULL, &pdqp);
		if (code)
			return code;
	}

	/*
	 * Changing DAX config may require inode locking for mapping
	 * invalidation. These need to be held all the way to transaction commit
	 * or cancel time, so need to be passed through to
	 * xfs_ioctl_setattr_get_trans() so it can apply them to the join call
	 * appropriately.
	 */
	code = xfs_ioctl_setattr_dax_invalidate(ip, fa, &join_flags);
	if (code)
		goto error_free_dquots;

	tp = xfs_ioctl_setattr_get_trans(ip, join_flags);
	if (IS_ERR(tp)) {
		code = PTR_ERR(tp);
		goto error_free_dquots;
	}

	/* A project id change needs quota reserved against the new project. */
	if (XFS_IS_QUOTA_RUNNING(mp) && XFS_IS_PQUOTA_ON(mp) &&
	    ip->i_d.di_projid != fa->fsx_projid) {
		code = xfs_qm_vop_chown_reserve(tp, ip, udqp, NULL, pdqp,
				capable(CAP_FOWNER) ?  XFS_QMOPT_FORCE_RES : 0);
		if (code)	/* out of quota */
			goto error_trans_cancel;
	}

	/* Generic VFS checks of the old attributes against the new ones. */
	xfs_fill_fsxattr(ip, false, &old_fa);
	code = vfs_ioc_fssetxattr_check(inode, &old_fa, fa);
	if (code)
		goto error_trans_cancel;

	code = xfs_ioctl_setattr_check_extsize(ip, fa);
	if (code)
		goto error_trans_cancel;

	code = xfs_ioctl_setattr_check_cowextsize(ip, fa);
	if (code)
		goto error_trans_cancel;

	code = xfs_ioctl_setattr_xflags(tp, ip, fa);
	if (code)
		goto error_trans_cancel;

	/*
	 * Change file ownership.  Must be the owner or privileged.  CAP_FSETID
	 * overrides the following restrictions:
	 *
	 * The set-user-ID and set-group-ID bits of a file will be cleared upon
	 * successful return from chown()
	 */
	if ((inode->i_mode & (S_ISUID|S_ISGID)) &&
	    !capable_wrt_inode_uidgid(inode, CAP_FSETID))
		inode->i_mode &= ~(S_ISUID|S_ISGID);

	/* Change the ownerships and register project quota modifications */
	if (ip->i_d.di_projid != fa->fsx_projid) {
		if (XFS_IS_QUOTA_RUNNING(mp) && XFS_IS_PQUOTA_ON(mp)) {
			olddquot = xfs_qm_vop_chown(tp, ip,
						&ip->i_pdquot, pdqp);
		}
		ASSERT(ip->i_d.di_version > 1);
		ip->i_d.di_projid = fa->fsx_projid;
	}

	/*
	 * Only set the extent size hint if we've already determined that the
	 * extent size hint should be set on the inode. If no extent size flags
	 * are set on the inode then unconditionally clear the extent size hint.
	 */
	ip->i_d.di_extsize =
		(ip->i_d.di_flags & (XFS_DIFLAG_EXTSIZE | XFS_DIFLAG_EXTSZINHERIT)) ?
			(fa->fsx_extsize >> mp->m_sb.sb_blocklog) : 0;

	/* Likewise for the CoW extent size hint, which needs a v3 inode. */
	ip->i_d.di_cowextsize =
		(ip->i_d.di_version == 3 &&
		 (ip->i_d.di_flags2 & XFS_DIFLAG2_COWEXTSIZE)) ?
			(fa->fsx_cowextsize >> mp->m_sb.sb_blocklog) : 0;

	code = xfs_trans_commit(tp);

	/*
	 * Release any dquot(s) the inode had kept before chown.
	 */
	xfs_qm_dqrele(olddquot);
	xfs_qm_dqrele(udqp);
	xfs_qm_dqrele(pdqp);

	return code;

error_trans_cancel:
	xfs_trans_cancel(tp);
error_free_dquots:
	xfs_qm_dqrele(udqp);
	xfs_qm_dqrele(pdqp);
	return code;
}

L
Linus Torvalds 已提交
1537
STATIC int
L
Lachlan McIlroy 已提交
1538
xfs_ioc_fssetxattr(
L
Linus Torvalds 已提交
1539 1540 1541 1542 1543
	xfs_inode_t		*ip,
	struct file		*filp,
	void			__user *arg)
{
	struct fsxattr		fa;
J
Jan Kara 已提交
1544
	int error;
L
Lachlan McIlroy 已提交
1545 1546 1547

	if (copy_from_user(&fa, arg, sizeof(fa)))
		return -EFAULT;
L
Linus Torvalds 已提交
1548

J
Jan Kara 已提交
1549 1550 1551
	error = mnt_want_write_file(filp);
	if (error)
		return error;
1552
	error = xfs_ioctl_setattr(ip, &fa);
J
Jan Kara 已提交
1553
	mnt_drop_write_file(filp);
D
Dave Chinner 已提交
1554
	return error;
L
Lachlan McIlroy 已提交
1555
}
L
Linus Torvalds 已提交
1556

L
Lachlan McIlroy 已提交
1557 1558 1559 1560 1561 1562
/*
 * ioctl entry point that reports the inode flags of @ip to userspace.
 *
 * The on-disk di_flags are converted with xfs_di2lxflags() and copied out to
 * @arg as an unsigned int.  Returns 0 on success or -EFAULT if the copy to
 * userspace fails.
 */
STATIC int
xfs_ioc_getxflags(
	xfs_inode_t		*ip,
	void			__user *arg)
{
	unsigned int		flags = xfs_di2lxflags(ip->i_d.di_flags);

	return copy_to_user(arg, &flags, sizeof(flags)) ? -EFAULT : 0;
}
L
Linus Torvalds 已提交
1569

L
Lachlan McIlroy 已提交
1570 1571
/*
 * ioctl entry point that sets inode flags on @ip from an unsigned int of
 * FS_*_FL bits supplied by userspace.
 *
 * Only the IMMUTABLE, APPEND, NOATIME, NODUMP and SYNC flags may be passed;
 * anything else yields -EOPNOTSUPP.  The accepted bits are merged with the
 * inode's current xflags and applied in a transaction.  Returns 0 on success
 * or a negative errno.
 */
STATIC int
xfs_ioc_setxflags(
	struct xfs_inode	*ip,
	struct file		*filp,
	void			__user *arg)
{
	struct xfs_trans	*tp;
	struct fsxattr		fa = { 0 };
	struct fsxattr		old_fa;
	unsigned int		flags;
	unsigned int		new_xflags;
	int			join_flags = 0;
	int			error;

	if (copy_from_user(&flags, arg, sizeof(flags)))
		return -EFAULT;

	if (flags & ~(FS_IMMUTABLE_FL | FS_APPEND_FL | \
		      FS_NOATIME_FL | FS_NODUMP_FL | \
		      FS_SYNC_FL))
		return -EOPNOTSUPP;

	new_xflags = xfs_merge_ioc_xflags(flags, xfs_ip2xflags(ip));
	fa.fsx_xflags = new_xflags;

	error = mnt_want_write_file(filp);
	if (error)
		return error;

	/*
	 * Changing DAX config may require inode locking for mapping
	 * invalidation. These need to be held all the way to transaction commit
	 * or cancel time, so need to be passed through to
	 * xfs_ioctl_setattr_get_trans() so it can apply them to the join call
	 * appropriately.
	 */
	error = xfs_ioctl_setattr_dax_invalidate(ip, &fa, &join_flags);
	if (error)
		goto out_drop_write;

	tp = xfs_ioctl_setattr_get_trans(ip, join_flags);
	if (IS_ERR(tp)) {
		error = PTR_ERR(tp);
		goto out_drop_write;
	}

	/*
	 * This ioctl only changes flags, but the whole of @fa is handed to
	 * vfs_ioc_fssetxattr_check().  Seed every other field from the
	 * inode's current attributes so the check compares like with like
	 * instead of reading uninitialised stack.
	 */
	xfs_fill_fsxattr(ip, false, &old_fa);
	fa = old_fa;
	fa.fsx_xflags = new_xflags;

	error = vfs_ioc_fssetxattr_check(VFS_I(ip), &old_fa, &fa);
	if (error) {
		xfs_trans_cancel(tp);
		goto out_drop_write;
	}

	error = xfs_ioctl_setattr_xflags(tp, ip, &fa);
	if (error) {
		xfs_trans_cancel(tp);
		goto out_drop_write;
	}

	error = xfs_trans_commit(tp);
out_drop_write:
	mnt_drop_write_file(filp);
	return error;
}

1633 1634 1635 1636 1637
/*
 * Copy one in-kernel bmap record @p out to the userspace record @u.
 *
 * The fields common to both record layouts are always written.  The extra
 * struct getbmapx fields are written only when @recsize is at least
 * sizeof(struct getbmapx).  Returns true on success, false as soon as any
 * write to userspace fails.
 */
static bool
xfs_getbmap_format(
	struct kgetbmap		*p,
	struct getbmapx __user	*u,
	size_t			recsize)
{
	bool			ok;

	ok = !put_user(p->bmv_offset, &u->bmv_offset) &&
	     !put_user(p->bmv_block, &u->bmv_block) &&
	     !put_user(p->bmv_length, &u->bmv_length) &&
	     !put_user(0, &u->bmv_count) &&
	     !put_user(0, &u->bmv_entries);
	if (!ok)
		return false;

	/* Short records end here. */
	if (recsize < sizeof(struct getbmapx))
		return true;

	return !put_user(0, &u->bmv_iflags) &&
	       !put_user(p->bmv_oflags, &u->bmv_oflags) &&
	       !put_user(0, &u->bmv_unused1) &&
	       !put_user(0, &u->bmv_unused2);
}

L
Linus Torvalds 已提交
1655 1656
/*
 * Handler for the XFS_IOC_GETBMAP, XFS_IOC_GETBMAPA and XFS_IOC_GETBMAPX
 * ioctls.
 *
 * @arg points at a header record followed by room for further records; the
 * record size depends on @cmd.  The header is read in, xfs_getbmap() fills a
 * kernel buffer, and then the updated header and bmv_entries records are
 * written back to @arg.
 *
 * Returns 0 on success, -EINVAL for an unknown @cmd or a bmv_count below 2,
 * -ENOMEM if the buffer cannot be sized or allocated, -EFAULT on a failed
 * user copy, or the error from xfs_getbmap().
 */
STATIC int
xfs_ioc_getbmap(
	struct file		*file,
	unsigned int		cmd,
	void			__user *arg)
{
	struct getbmapx		bmx = { 0 };
	struct kgetbmap		*buf;
	size_t			recsize;
	int			error, i;

	switch (cmd) {
	case XFS_IOC_GETBMAPA:
		bmx.bmv_iflags = BMV_IF_ATTRFORK;
		/*FALLTHRU*/
	case XFS_IOC_GETBMAP:
		if (file->f_mode & FMODE_NOCMTIME)
			bmx.bmv_iflags |= BMV_IF_NO_DMAPI_READ;
		/* struct getbmap is a strict subset of struct getbmapx. */
		recsize = sizeof(struct getbmap);
		break;
	case XFS_IOC_GETBMAPX:
		recsize = sizeof(struct getbmapx);
		break;
	default:
		return -EINVAL;
	}

	/* Only the first recsize bytes of the header come from userspace. */
	if (copy_from_user(&bmx, arg, recsize))
		return -EFAULT;

	if (bmx.bmv_count < 2)
		return -EINVAL;
	if (bmx.bmv_count > ULONG_MAX / recsize)
		return -ENOMEM;

	buf = kmem_zalloc_large(bmx.bmv_count * sizeof(*buf), 0);
	if (!buf)
		return -ENOMEM;

	error = xfs_getbmap(XFS_I(file_inode(file)), &bmx, buf);
	if (error)
		goto out_free_buf;

	/* Any failure from here on is a failed copy to userspace. */
	error = -EFAULT;
	if (copy_to_user(arg, &bmx, recsize))
		goto out_free_buf;

	/* The records follow the header, one recsize-sized slot each. */
	for (i = 0; i < bmx.bmv_entries; i++) {
		arg += recsize;
		if (!xfs_getbmap_format(&buf[i], arg, recsize))
			goto out_free_buf;
	}

	error = 0;
out_free_buf:
	kmem_free(buf);
	return error;
}
L
Lachlan McIlroy 已提交
1715

1716 1717
struct getfsmap_info {
	struct xfs_mount	*mp;
1718 1719
	struct fsmap_head __user *data;
	unsigned int		idx;
1720 1721 1722 1723 1724 1725 1726 1727 1728 1729 1730 1731 1732
	__u32			last_flags;
};

STATIC int
xfs_getfsmap_format(struct xfs_fsmap *xfm, void *priv)
{
	struct getfsmap_info	*info = priv;
	struct fsmap		fm;

	trace_xfs_getfsmap_mapping(info->mp, xfm);

	info->last_flags = xfm->fmr_flags;
	xfs_fsmap_from_internal(&fm, xfm);
1733 1734
	if (copy_to_user(&info->data->fmh_recs[info->idx++], &fm,
			sizeof(struct fsmap)))
1735 1736 1737 1738 1739 1740 1741 1742
		return -EFAULT;

	return 0;
}

STATIC int
xfs_ioc_getfsmap(
	struct xfs_inode	*ip,
1743
	struct fsmap_head	__user *arg)
1744
{
1745
	struct getfsmap_info	info = { NULL };
1746 1747 1748 1749 1750 1751 1752 1753 1754 1755 1756 1757 1758 1759 1760 1761 1762 1763 1764 1765 1766 1767 1768
	struct xfs_fsmap_head	xhead = {0};
	struct fsmap_head	head;
	bool			aborted = false;
	int			error;

	if (copy_from_user(&head, arg, sizeof(struct fsmap_head)))
		return -EFAULT;
	if (memchr_inv(head.fmh_reserved, 0, sizeof(head.fmh_reserved)) ||
	    memchr_inv(head.fmh_keys[0].fmr_reserved, 0,
		       sizeof(head.fmh_keys[0].fmr_reserved)) ||
	    memchr_inv(head.fmh_keys[1].fmr_reserved, 0,
		       sizeof(head.fmh_keys[1].fmr_reserved)))
		return -EINVAL;

	xhead.fmh_iflags = head.fmh_iflags;
	xhead.fmh_count = head.fmh_count;
	xfs_fsmap_to_internal(&xhead.fmh_keys[0], &head.fmh_keys[0]);
	xfs_fsmap_to_internal(&xhead.fmh_keys[1], &head.fmh_keys[1]);

	trace_xfs_getfsmap_low_key(ip->i_mount, &xhead.fmh_keys[0]);
	trace_xfs_getfsmap_high_key(ip->i_mount, &xhead.fmh_keys[1]);

	info.mp = ip->i_mount;
1769
	info.data = arg;
1770
	error = xfs_getfsmap(ip->i_mount, &xhead, xfs_getfsmap_format, &info);
1771
	if (error == -ECANCELED) {
1772 1773 1774 1775 1776 1777
		error = 0;
		aborted = true;
	} else if (error)
		return error;

	/* If we didn't abort, set the "last" flag in the last fmx */
1778
	if (!aborted && info.idx) {
1779
		info.last_flags |= FMR_OF_LAST;
1780 1781
		if (copy_to_user(&info.data->fmh_recs[info.idx - 1].fmr_flags,
				&info.last_flags, sizeof(info.last_flags)))
1782 1783 1784 1785 1786 1787 1788 1789 1790 1791 1792 1793
			return -EFAULT;
	}

	/* copy back header */
	head.fmh_entries = xhead.fmh_entries;
	head.fmh_oflags = xhead.fmh_oflags;
	if (copy_to_user(arg, &head, sizeof(struct fsmap_head)))
		return -EFAULT;

	return 0;
}

1794 1795 1796 1797 1798 1799 1800 1801 1802 1803 1804 1805 1806 1807 1808 1809 1810 1811 1812 1813 1814 1815 1816 1817
/*
 * Handler for the scrub-metadata ioctl.
 *
 * Requires CAP_SYS_ADMIN.  The request is copied in from @arg, passed to
 * xfs_scrub_metadata(), and the (possibly updated) structure is copied back
 * out on success.  Returns 0, -EPERM, -EFAULT, or the scrub error.
 */
STATIC int
xfs_ioc_scrub_metadata(
	struct xfs_inode		*ip,
	void				__user *arg)
{
	struct xfs_scrub_metadata	scrub;
	int				error;

	if (!capable(CAP_SYS_ADMIN))
		return -EPERM;

	if (copy_from_user(&scrub, arg, sizeof(scrub)))
		return -EFAULT;

	error = xfs_scrub_metadata(ip, &scrub);
	if (error)
		return error;

	return copy_to_user(arg, &scrub, sizeof(scrub)) ? -EFAULT : 0;
}

D
Dave Chinner 已提交
1818 1819 1820 1821 1822 1823 1824 1825 1826 1827 1828
/*
 * Validate the two file descriptors named in @sxp and, if they are suitable,
 * swap extents between them via xfs_swap_extents().
 *
 * Both descriptors must be open for read and write without O_APPEND, must
 * not be swapfiles, must refer to distinct XFS inodes on the same mount, and
 * the filesystem must not be shut down.
 *
 * Returns 0 on success; -EINVAL, -EBADF or -EIO when validation fails; or the
 * error from xfs_swap_extents().
 */
int
xfs_ioc_swapext(
	xfs_swapext_t	*sxp)
{
	const fmode_t	rw_mode = FMODE_READ | FMODE_WRITE;
	xfs_inode_t     *ip, *tip;
	struct fd	f, tmp;
	int		error;

	/* Pull information for the target fd */
	error = -EINVAL;
	f = fdget((int)sxp->sx_fdtarget);
	if (!f.file)
		goto out;

	error = -EBADF;
	if ((f.file->f_mode & rw_mode) != rw_mode ||
	    (f.file->f_flags & O_APPEND))
		goto out_put_file;

	/* ... and for the temporary fd. */
	error = -EINVAL;
	tmp = fdget((int)sxp->sx_fdtmp);
	if (!tmp.file)
		goto out_put_file;

	error = -EBADF;
	if ((tmp.file->f_mode & rw_mode) != rw_mode ||
	    (tmp.file->f_flags & O_APPEND))
		goto out_put_tmp_file;

	/* Every remaining validation failure except shutdown is -EINVAL. */
	error = -EINVAL;
	if (IS_SWAPFILE(file_inode(f.file)) ||
	    IS_SWAPFILE(file_inode(tmp.file)))
		goto out_put_tmp_file;

	/*
	 * We need to ensure that the fds passed in point to XFS inodes
	 * before we cast and access them as XFS structures as we have no
	 * control over what the user passes us here.
	 */
	if (f.file->f_op != &xfs_file_operations ||
	    tmp.file->f_op != &xfs_file_operations)
		goto out_put_tmp_file;

	ip = XFS_I(file_inode(f.file));
	tip = XFS_I(file_inode(tmp.file));

	if (ip->i_mount != tip->i_mount)
		goto out_put_tmp_file;

	if (ip->i_ino == tip->i_ino)
		goto out_put_tmp_file;

	if (XFS_FORCED_SHUTDOWN(ip->i_mount)) {
		error = -EIO;
		goto out_put_tmp_file;
	}

	error = xfs_swap_extents(ip, tip, sxp);

 out_put_tmp_file:
	fdput(tmp);
 out_put_file:
	fdput(f);
 out:
	return error;
}

1898 1899 1900 1901 1902 1903 1904 1905 1906 1907 1908
/*
 * Copy the filesystem label from the in-core superblock of @mp out to
 * @user_label.
 *
 * The label is sampled under m_sb_lock into a zeroed buffer that is one byte
 * larger than the copied length, so what userspace receives is always
 * NUL-terminated.  Returns 0 on success or -EFAULT if the copy-out fails.
 */
static int
xfs_ioc_getlabel(
	struct xfs_mount	*mp,
	char			__user *user_label)
{
	struct xfs_sb		*sbp = &mp->m_sb;
	/* 1 larger than sb_fname, so this ensures a trailing NUL char */
	char			label[XFSLABEL_MAX + 1] = { 0 };

	/* Paranoia */
	BUILD_BUG_ON(sizeof(sbp->sb_fname) > FSLABEL_MAX);

	spin_lock(&mp->m_sb_lock);
	strncpy(label, sbp->sb_fname, XFSLABEL_MAX);
	spin_unlock(&mp->m_sb_lock);

	return copy_to_user(user_label, label, sizeof(label)) ? -EFAULT : 0;
}

/*
 * FS_IOC_SETFSLABEL: set the filesystem label from userspace.
 *
 * Requires CAP_SYS_ADMIN.  The new label is copied in from @newlabel,
 * length-checked against the size of sb_fname, stored in the in-core
 * superblock under m_sb_lock, and then pushed out via xfs_sync_sb_buf()
 * and xfs_update_secondary_sbs().  The block device page cache is
 * invalidated afterwards so userspace re-reads the new label.
 *
 * Returns 0 on success, -EPERM without CAP_SYS_ADMIN, -EFAULT if the copy
 * from userspace fails, -EINVAL if the label is longer than sb_fname, or
 * the error returned by mnt_want_write_file(), xfs_sync_sb_buf() or
 * xfs_update_secondary_sbs().
 */
static int
xfs_ioc_setlabel(
	struct file		*filp,
	struct xfs_mount	*mp,
	char			__user *newlabel)
{
	struct xfs_sb		*sbp = &mp->m_sb;
	char			label[XFSLABEL_MAX + 1];
	size_t			len;
	int			error;

	if (!capable(CAP_SYS_ADMIN))
		return -EPERM;
	/*
	 * The generic ioctl allows up to FSLABEL_MAX chars, but XFS is much
	 * smaller, at 12 bytes.  We copy one more to be sure we find the
	 * (required) NUL character to test the incoming label length.
	 * NB: The on disk label doesn't need to be NUL terminated.
	 */
	if (copy_from_user(label, newlabel, XFSLABEL_MAX + 1))
		return -EFAULT;
	len = strnlen(label, XFSLABEL_MAX + 1);
	if (len > sizeof(sbp->sb_fname))
		return -EINVAL;

	error = mnt_want_write_file(filp);
	if (error)
		return error;

	/* Zero the old label first so a shorter new label leaves no tail. */
	spin_lock(&mp->m_sb_lock);
	memset(sbp->sb_fname, 0, sizeof(sbp->sb_fname));
	memcpy(sbp->sb_fname, label, len);
	spin_unlock(&mp->m_sb_lock);

	/*
	 * Now we do several things to satisfy userspace.
	 * In addition to normal logging of the primary superblock, we also
	 * immediately write these changes to sector zero for the primary, then
	 * update all backup supers (as xfs_db does for a label change), then
	 * invalidate the block device page cache.  This is so that any prior
	 * buffered reads from userspace (i.e. from blkid) are invalidated,
	 * and userspace will see the newly-written label.
	 */
	error = xfs_sync_sb_buf(mp);
	if (error)
		goto out;
	/*
	 * growfs also updates backup supers so lock against that.
	 */
	mutex_lock(&mp->m_growlock);
	error = xfs_update_secondary_sbs(mp);
	mutex_unlock(&mp->m_growlock);

	invalidate_bdev(mp->m_ddev_targp->bt_bdev);

out:
	mnt_drop_write_file(filp);
	return error;
}

1980 1981 1982 1983 1984 1985 1986 1987
/*
 * Note: some of the ioctl's return positive numbers as a
 * byte count indicating success, such as readlink_by_handle.
 * So we don't "sign flip" like most other routines.  This means
 * true errors need to be returned as a negative value.
 */
long
xfs_file_ioctl(
L
Lachlan McIlroy 已提交
1988 1989
	struct file		*filp,
	unsigned int		cmd,
1990
	unsigned long		p)
L
Lachlan McIlroy 已提交
1991
{
A
Al Viro 已提交
1992
	struct inode		*inode = file_inode(filp);
1993 1994 1995
	struct xfs_inode	*ip = XFS_I(inode);
	struct xfs_mount	*mp = ip->i_mount;
	void			__user *arg = (void __user *)p;
L
Lachlan McIlroy 已提交
1996 1997
	int			error;

C
Christoph Hellwig 已提交
1998
	trace_xfs_file_ioctl(ip);
1999 2000

	switch (cmd) {
C
Christoph Hellwig 已提交
2001 2002
	case FITRIM:
		return xfs_ioc_trim(mp, arg);
2003 2004 2005 2006
	case FS_IOC_GETFSLABEL:
		return xfs_ioc_getlabel(mp, arg);
	case FS_IOC_SETFSLABEL:
		return xfs_ioc_setlabel(filp, mp, arg);
L
Lachlan McIlroy 已提交
2007 2008 2009
	case XFS_IOC_ALLOCSP:
	case XFS_IOC_FREESP:
	case XFS_IOC_ALLOCSP64:
2010
	case XFS_IOC_FREESP64: {
2011
		xfs_flock64_t		bf;
L
Lachlan McIlroy 已提交
2012

2013
		if (copy_from_user(&bf, arg, sizeof(bf)))
E
Eric Sandeen 已提交
2014
			return -EFAULT;
2015
		return xfs_ioc_space(filp, &bf);
2016
	}
L
Lachlan McIlroy 已提交
2017
	case XFS_IOC_DIOINFO: {
2018 2019
		struct xfs_buftarg	*target = xfs_inode_buftarg(ip);
		struct dioattr		da;
L
Lachlan McIlroy 已提交
2020

2021
		da.d_mem =  da.d_miniosz = target->bt_logical_sectorsize;
L
Lachlan McIlroy 已提交
2022 2023 2024
		da.d_maxiosz = INT_MAX & ~(da.d_miniosz - 1);

		if (copy_to_user(arg, &da, sizeof(da)))
E
Eric Sandeen 已提交
2025
			return -EFAULT;
L
Lachlan McIlroy 已提交
2026 2027 2028 2029 2030 2031
		return 0;
	}

	case XFS_IOC_FSBULKSTAT_SINGLE:
	case XFS_IOC_FSBULKSTAT:
	case XFS_IOC_FSINUMBERS:
D
Darrick J. Wong 已提交
2032
		return xfs_ioc_fsbulkstat(mp, cmd, arg);
L
Lachlan McIlroy 已提交
2033

2034
	case XFS_IOC_BULKSTAT:
L
Lachlan McIlroy 已提交
2035
		return xfs_ioc_bulkstat(mp, cmd, arg);
2036 2037
	case XFS_IOC_INUMBERS:
		return xfs_ioc_inumbers(mp, cmd, arg);
L
Lachlan McIlroy 已提交
2038 2039

	case XFS_IOC_FSGEOMETRY_V1:
2040 2041 2042
		return xfs_ioc_fsgeometry(mp, arg, 3);
	case XFS_IOC_FSGEOMETRY_V4:
		return xfs_ioc_fsgeometry(mp, arg, 4);
L
Lachlan McIlroy 已提交
2043
	case XFS_IOC_FSGEOMETRY:
2044
		return xfs_ioc_fsgeometry(mp, arg, 5);
L
Lachlan McIlroy 已提交
2045

2046 2047 2048
	case XFS_IOC_AG_GEOMETRY:
		return xfs_ioc_ag_geometry(mp, arg);

L
Lachlan McIlroy 已提交
2049 2050 2051 2052 2053 2054 2055
	case XFS_IOC_GETVERSION:
		return put_user(inode->i_generation, (int __user *)arg);

	case XFS_IOC_FSGETXATTR:
		return xfs_ioc_fsgetxattr(ip, 0, arg);
	case XFS_IOC_FSGETXATTRA:
		return xfs_ioc_fsgetxattr(ip, 1, arg);
L
Lachlan McIlroy 已提交
2056 2057
	case XFS_IOC_FSSETXATTR:
		return xfs_ioc_fssetxattr(ip, filp, arg);
L
Lachlan McIlroy 已提交
2058
	case XFS_IOC_GETXFLAGS:
L
Lachlan McIlroy 已提交
2059
		return xfs_ioc_getxflags(ip, arg);
L
Lachlan McIlroy 已提交
2060
	case XFS_IOC_SETXFLAGS:
L
Lachlan McIlroy 已提交
2061
		return xfs_ioc_setxflags(ip, filp, arg);
L
Lachlan McIlroy 已提交
2062 2063 2064 2065

	case XFS_IOC_GETBMAP:
	case XFS_IOC_GETBMAPA:
	case XFS_IOC_GETBMAPX:
2066
		return xfs_ioc_getbmap(filp, cmd, arg);
L
Lachlan McIlroy 已提交
2067

2068 2069 2070
	case FS_IOC_GETFSMAP:
		return xfs_ioc_getfsmap(ip, arg);

2071 2072 2073
	case XFS_IOC_SCRUB_METADATA:
		return xfs_ioc_scrub_metadata(ip, arg);

L
Lachlan McIlroy 已提交
2074 2075
	case XFS_IOC_FD_TO_HANDLE:
	case XFS_IOC_PATH_TO_HANDLE:
2076 2077
	case XFS_IOC_PATH_TO_FSHANDLE: {
		xfs_fsop_handlereq_t	hreq;
L
Lachlan McIlroy 已提交
2078

2079
		if (copy_from_user(&hreq, arg, sizeof(hreq)))
E
Eric Sandeen 已提交
2080
			return -EFAULT;
2081 2082 2083 2084
		return xfs_find_handle(cmd, &hreq);
	}
	case XFS_IOC_OPEN_BY_HANDLE: {
		xfs_fsop_handlereq_t	hreq;
L
Lachlan McIlroy 已提交
2085

2086
		if (copy_from_user(&hreq, arg, sizeof(xfs_fsop_handlereq_t)))
E
Eric Sandeen 已提交
2087
			return -EFAULT;
2088
		return xfs_open_by_handle(filp, &hreq);
2089
	}
L
Lachlan McIlroy 已提交
2090

2091 2092
	case XFS_IOC_READLINK_BY_HANDLE: {
		xfs_fsop_handlereq_t	hreq;
L
Lachlan McIlroy 已提交
2093

2094
		if (copy_from_user(&hreq, arg, sizeof(xfs_fsop_handlereq_t)))
E
Eric Sandeen 已提交
2095
			return -EFAULT;
2096
		return xfs_readlink_by_handle(filp, &hreq);
2097
	}
L
Lachlan McIlroy 已提交
2098
	case XFS_IOC_ATTRLIST_BY_HANDLE:
2099
		return xfs_attrlist_by_handle(filp, arg);
L
Lachlan McIlroy 已提交
2100 2101

	case XFS_IOC_ATTRMULTI_BY_HANDLE:
2102
		return xfs_attrmulti_by_handle(filp, arg);
L
Lachlan McIlroy 已提交
2103 2104

	case XFS_IOC_SWAPEXT: {
2105 2106 2107
		struct xfs_swapext	sxp;

		if (copy_from_user(&sxp, arg, sizeof(xfs_swapext_t)))
E
Eric Sandeen 已提交
2108
			return -EFAULT;
J
Jan Kara 已提交
2109 2110 2111
		error = mnt_want_write_file(filp);
		if (error)
			return error;
D
Dave Chinner 已提交
2112
		error = xfs_ioc_swapext(&sxp);
J
Jan Kara 已提交
2113
		mnt_drop_write_file(filp);
D
Dave Chinner 已提交
2114
		return error;
L
Lachlan McIlroy 已提交
2115 2116 2117 2118 2119
	}

	case XFS_IOC_FSCOUNTS: {
		xfs_fsop_counts_t out;

2120
		xfs_fs_counts(mp, &out);
L
Lachlan McIlroy 已提交
2121 2122

		if (copy_to_user(arg, &out, sizeof(out)))
E
Eric Sandeen 已提交
2123
			return -EFAULT;
L
Lachlan McIlroy 已提交
2124 2125 2126 2127 2128
		return 0;
	}

	case XFS_IOC_SET_RESBLKS: {
		xfs_fsop_resblks_t inout;
2129
		uint64_t	   in;
L
Lachlan McIlroy 已提交
2130 2131 2132 2133

		if (!capable(CAP_SYS_ADMIN))
			return -EPERM;

E
Eric Sandeen 已提交
2134
		if (mp->m_flags & XFS_MOUNT_RDONLY)
E
Eric Sandeen 已提交
2135
			return -EROFS;
E
Eric Sandeen 已提交
2136

L
Lachlan McIlroy 已提交
2137
		if (copy_from_user(&inout, arg, sizeof(inout)))
E
Eric Sandeen 已提交
2138
			return -EFAULT;
L
Lachlan McIlroy 已提交
2139

J
Jan Kara 已提交
2140 2141 2142 2143
		error = mnt_want_write_file(filp);
		if (error)
			return error;

L
Lachlan McIlroy 已提交
2144 2145 2146
		/* input parameter is passed in resblks field of structure */
		in = inout.resblks;
		error = xfs_reserve_blocks(mp, &in, &inout);
J
Jan Kara 已提交
2147
		mnt_drop_write_file(filp);
L
Lachlan McIlroy 已提交
2148
		if (error)
D
Dave Chinner 已提交
2149
			return error;
L
Lachlan McIlroy 已提交
2150 2151

		if (copy_to_user(arg, &inout, sizeof(inout)))
E
Eric Sandeen 已提交
2152
			return -EFAULT;
L
Lachlan McIlroy 已提交
2153 2154 2155 2156 2157 2158 2159 2160 2161 2162 2163
		return 0;
	}

	case XFS_IOC_GET_RESBLKS: {
		xfs_fsop_resblks_t out;

		if (!capable(CAP_SYS_ADMIN))
			return -EPERM;

		error = xfs_reserve_blocks(mp, NULL, &out);
		if (error)
D
Dave Chinner 已提交
2164
			return error;
L
Lachlan McIlroy 已提交
2165 2166

		if (copy_to_user(arg, &out, sizeof(out)))
E
Eric Sandeen 已提交
2167
			return -EFAULT;
L
Lachlan McIlroy 已提交
2168 2169 2170 2171 2172 2173 2174 2175

		return 0;
	}

	case XFS_IOC_FSGROWFSDATA: {
		xfs_growfs_data_t in;

		if (copy_from_user(&in, arg, sizeof(in)))
E
Eric Sandeen 已提交
2176
			return -EFAULT;
L
Lachlan McIlroy 已提交
2177

J
Jan Kara 已提交
2178 2179 2180
		error = mnt_want_write_file(filp);
		if (error)
			return error;
L
Lachlan McIlroy 已提交
2181
		error = xfs_growfs_data(mp, &in);
J
Jan Kara 已提交
2182
		mnt_drop_write_file(filp);
D
Dave Chinner 已提交
2183
		return error;
L
Lachlan McIlroy 已提交
2184 2185 2186 2187 2188 2189
	}

	case XFS_IOC_FSGROWFSLOG: {
		xfs_growfs_log_t in;

		if (copy_from_user(&in, arg, sizeof(in)))
E
Eric Sandeen 已提交
2190
			return -EFAULT;
L
Lachlan McIlroy 已提交
2191

J
Jan Kara 已提交
2192 2193 2194
		error = mnt_want_write_file(filp);
		if (error)
			return error;
L
Lachlan McIlroy 已提交
2195
		error = xfs_growfs_log(mp, &in);
J
Jan Kara 已提交
2196
		mnt_drop_write_file(filp);
D
Dave Chinner 已提交
2197
		return error;
L
Lachlan McIlroy 已提交
2198 2199 2200 2201 2202 2203
	}

	case XFS_IOC_FSGROWFSRT: {
		xfs_growfs_rt_t in;

		if (copy_from_user(&in, arg, sizeof(in)))
E
Eric Sandeen 已提交
2204
			return -EFAULT;
L
Lachlan McIlroy 已提交
2205

J
Jan Kara 已提交
2206 2207 2208
		error = mnt_want_write_file(filp);
		if (error)
			return error;
L
Lachlan McIlroy 已提交
2209
		error = xfs_growfs_rt(mp, &in);
J
Jan Kara 已提交
2210
		mnt_drop_write_file(filp);
D
Dave Chinner 已提交
2211
		return error;
L
Lachlan McIlroy 已提交
2212 2213 2214
	}

	case XFS_IOC_GOINGDOWN: {
2215
		uint32_t in;
L
Lachlan McIlroy 已提交
2216 2217 2218 2219

		if (!capable(CAP_SYS_ADMIN))
			return -EPERM;

2220
		if (get_user(in, (uint32_t __user *)arg))
E
Eric Sandeen 已提交
2221
			return -EFAULT;
L
Lachlan McIlroy 已提交
2222

D
Dave Chinner 已提交
2223
		return xfs_fs_goingdown(mp, in);
L
Lachlan McIlroy 已提交
2224 2225 2226 2227 2228 2229 2230 2231 2232
	}

	case XFS_IOC_ERROR_INJECTION: {
		xfs_error_injection_t in;

		if (!capable(CAP_SYS_ADMIN))
			return -EPERM;

		if (copy_from_user(&in, arg, sizeof(in)))
E
Eric Sandeen 已提交
2233
			return -EFAULT;
L
Lachlan McIlroy 已提交
2234

2235
		return xfs_errortag_add(mp, in.errtag);
L
Lachlan McIlroy 已提交
2236 2237 2238 2239 2240 2241
	}

	case XFS_IOC_ERROR_CLEARALL:
		if (!capable(CAP_SYS_ADMIN))
			return -EPERM;

2242
		return xfs_errortag_clearall(mp);
L
Lachlan McIlroy 已提交
2243

2244
	case XFS_IOC_FREE_EOFBLOCKS: {
2245 2246
		struct xfs_fs_eofblocks eofb;
		struct xfs_eofblocks keofb;
2247

2248 2249 2250 2251
		if (!capable(CAP_SYS_ADMIN))
			return -EPERM;

		if (mp->m_flags & XFS_MOUNT_RDONLY)
E
Eric Sandeen 已提交
2252
			return -EROFS;
2253

2254
		if (copy_from_user(&eofb, arg, sizeof(eofb)))
E
Eric Sandeen 已提交
2255
			return -EFAULT;
2256

2257 2258
		error = xfs_fs_eofblocks_from_user(&eofb, &keofb);
		if (error)
D
Dave Chinner 已提交
2259
			return error;
2260

D
Dave Chinner 已提交
2261
		return xfs_icache_free_eofblocks(mp, &keofb);
2262 2263
	}

L
Lachlan McIlroy 已提交
2264 2265 2266 2267
	default:
		return -ENOTTY;
	}
}