// SPDX-License-Identifier: GPL-2.0
/*
 * Copyright (c) 2000-2005 Silicon Graphics, Inc.
 * All Rights Reserved.
 */
#include "xfs.h"
#include "xfs_fs.h"
8
#include "xfs_shared.h"
9 10 11
#include "xfs_format.h"
#include "xfs_log_format.h"
#include "xfs_trans_resv.h"
L
Linus Torvalds 已提交
12 13
#include "xfs_mount.h"
#include "xfs_inode.h"
14
#include "xfs_ioctl.h"
15
#include "xfs_alloc.h"
L
Linus Torvalds 已提交
16 17
#include "xfs_rtalloc.h"
#include "xfs_itable.h"
18
#include "xfs_error.h"
L
Linus Torvalds 已提交
19
#include "xfs_attr.h"
20
#include "xfs_bmap.h"
D
Dave Chinner 已提交
21
#include "xfs_bmap_util.h"
L
Linus Torvalds 已提交
22
#include "xfs_fsops.h"
C
Christoph Hellwig 已提交
23
#include "xfs_discard.h"
24
#include "xfs_quota.h"
25
#include "xfs_export.h"
C
Christoph Hellwig 已提交
26
#include "xfs_trace.h"
27
#include "xfs_icache.h"
D
Dave Chinner 已提交
28
#include "xfs_symlink.h"
29
#include "xfs_trans.h"
30
#include "xfs_pnfs.h"
31
#include "xfs_acl.h"
32 33 34
#include "xfs_btree.h"
#include <linux/fsmap.h>
#include "xfs_fsmap.h"
35
#include "scrub/xfs_scrub.h"
36
#include "xfs_sb.h"
L
Linus Torvalds 已提交
37

38
#include <linux/capability.h>
39
#include <linux/cred.h>
L
Linus Torvalds 已提交
40 41 42 43
#include <linux/dcache.h>
#include <linux/mount.h>
#include <linux/namei.h>
#include <linux/pagemap.h>
44
#include <linux/slab.h>
45
#include <linux/exportfs.h>
L
Linus Torvalds 已提交
46 47 48 49 50 51 52 53 54 55 56 57

/*
 * xfs_find_handle maps from userspace xfs_fsop_handlereq structure to
 * a file or fs handle.
 *
 * XFS_IOC_PATH_TO_FSHANDLE
 *    returns fs handle for a mount point or path within that mount point
 * XFS_IOC_FD_TO_HANDLE
 *    returns full handle for a FD opened in user space
 * XFS_IOC_PATH_TO_HANDLE
 *    returns full handle for a path
 */
58
int
L
Linus Torvalds 已提交
59 60
xfs_find_handle(
	unsigned int		cmd,
61
	xfs_fsop_handlereq_t	*hreq)
L
Linus Torvalds 已提交
62 63 64 65
{
	int			hsize;
	xfs_handle_t		handle;
	struct inode		*inode;
66
	struct fd		f = {NULL};
C
Christoph Hellwig 已提交
67
	struct path		path;
68
	int			error;
C
Christoph Hellwig 已提交
69
	struct xfs_inode	*ip;
L
Linus Torvalds 已提交
70

C
Christoph Hellwig 已提交
71
	if (cmd == XFS_IOC_FD_TO_HANDLE) {
72 73
		f = fdget(hreq->fd);
		if (!f.file)
C
Christoph Hellwig 已提交
74
			return -EBADF;
A
Al Viro 已提交
75
		inode = file_inode(f.file);
C
Christoph Hellwig 已提交
76 77 78 79
	} else {
		error = user_lpath((const char __user *)hreq->path, &path);
		if (error)
			return error;
80
		inode = d_inode(path.dentry);
L
Linus Torvalds 已提交
81
	}
C
Christoph Hellwig 已提交
82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107
	ip = XFS_I(inode);

	/*
	 * We can only generate handles for inodes residing on a XFS filesystem,
	 * and only for regular files, directories or symbolic links.
	 */
	error = -EINVAL;
	if (inode->i_sb->s_magic != XFS_SB_MAGIC)
		goto out_put;

	error = -EBADF;
	if (!S_ISREG(inode->i_mode) &&
	    !S_ISDIR(inode->i_mode) &&
	    !S_ISLNK(inode->i_mode))
		goto out_put;


	memcpy(&handle.ha_fsid, ip->i_mount->m_fixedfsid, sizeof(xfs_fsid_t));

	if (cmd == XFS_IOC_PATH_TO_FSHANDLE) {
		/*
		 * This handle only contains an fsid, zero the rest.
		 */
		memset(&handle.ha_fid, 0, sizeof(handle.ha_fid));
		hsize = sizeof(xfs_fsid_t);
	} else {
C
Christoph Hellwig 已提交
108 109 110
		handle.ha_fid.fid_len = sizeof(xfs_fid_t) -
					sizeof(handle.ha_fid.fid_len);
		handle.ha_fid.fid_pad = 0;
111
		handle.ha_fid.fid_gen = inode->i_generation;
C
Christoph Hellwig 已提交
112
		handle.ha_fid.fid_ino = ip->i_ino;
C
Christoph Hellwig 已提交
113
		hsize = sizeof(xfs_handle_t);
L
Linus Torvalds 已提交
114 115
	}

C
Christoph Hellwig 已提交
116
	error = -EFAULT;
117
	if (copy_to_user(hreq->ohandle, &handle, hsize) ||
C
Christoph Hellwig 已提交
118 119
	    copy_to_user(hreq->ohandlen, &hsize, sizeof(__s32)))
		goto out_put;
L
Linus Torvalds 已提交
120

C
Christoph Hellwig 已提交
121 122 123 124
	error = 0;

 out_put:
	if (cmd == XFS_IOC_FD_TO_HANDLE)
125
		fdput(f);
C
Christoph Hellwig 已提交
126 127 128
	else
		path_put(&path);
	return error;
L
Linus Torvalds 已提交
129 130 131
}

/*
 * No need to do permission checks on the various pathname components
 * as the handle operations are privileged.
 *
 * Both arguments are ignored and every dentry is accepted.
 */
STATIC int
xfs_handle_acceptable(
	void			*context,
	struct dentry		*dentry)
{
	return 1;
}

/*
 * Convert userspace handle data into a dentry.
 *
 * @parfilp must refer to a directory; its mount is used for the decode.
 * @uhandle points at a userspace xfs_handle_t and @hlen must be exactly
 * sizeof(xfs_handle_t).
 *
 * Returns the result of exportfs_decode_fh(), or ERR_PTR(-ENOTDIR) if
 * @parfilp is not a directory, ERR_PTR(-EINVAL) if either length field is
 * wrong, or ERR_PTR(-EFAULT) if the handle cannot be copied in.
 */
struct dentry *
xfs_handle_to_dentry(
	struct file		*parfilp,
	void __user		*uhandle,
	u32			hlen)
{
	xfs_handle_t		handle;
	struct xfs_fid64	fid;

	/*
	 * Only allow handle opens under a directory.
	 */
	if (!S_ISDIR(file_inode(parfilp)->i_mode))
		return ERR_PTR(-ENOTDIR);

	if (hlen != sizeof(xfs_handle_t))
		return ERR_PTR(-EINVAL);
	if (copy_from_user(&handle, uhandle, hlen))
		return ERR_PTR(-EFAULT);
	if (handle.ha_fid.fid_len !=
	    sizeof(handle.ha_fid) - sizeof(handle.ha_fid.fid_len))
		return ERR_PTR(-EINVAL);

	/*
	 * Clear the whole local object.  Sizing the memset by the object
	 * itself rather than by struct fid guarantees no field of the
	 * xfs_fid64 is left holding stack garbage.
	 */
	memset(&fid, 0, sizeof(fid));
	fid.ino = handle.ha_fid.fid_ino;
	fid.gen = handle.ha_fid.fid_gen;

	return exportfs_decode_fh(parfilp->f_path.mnt, (struct fid *)&fid, 3,
			FILEID_INO32_GEN | XFS_FILEID_TYPE_64FLAG,
			xfs_handle_acceptable, NULL);
}
L
Linus Torvalds 已提交
177

178 179 180 181 182 183
/*
 * Convenience wrapper: decode the input handle (ihandle/ihandlen) carried in
 * a handle request into a dentry via xfs_handle_to_dentry().
 */
STATIC struct dentry *
xfs_handlereq_to_dentry(
	struct file		*parfilp,
	xfs_fsop_handlereq_t	*hreq)
{
	return xfs_handle_to_dentry(parfilp, hreq->ihandle, hreq->ihandlen);
}

186
int
L
Linus Torvalds 已提交
187 188
xfs_open_by_handle(
	struct file		*parfilp,
189
	xfs_fsop_handlereq_t	*hreq)
L
Linus Torvalds 已提交
190
{
191
	const struct cred	*cred = current_cred();
L
Linus Torvalds 已提交
192
	int			error;
193
	int			fd;
L
Linus Torvalds 已提交
194 195 196 197
	int			permflag;
	struct file		*filp;
	struct inode		*inode;
	struct dentry		*dentry;
198
	fmode_t			fmode;
199
	struct path		path;
L
Linus Torvalds 已提交
200 201

	if (!capable(CAP_SYS_ADMIN))
E
Eric Sandeen 已提交
202
		return -EPERM;
L
Linus Torvalds 已提交
203

204 205 206
	dentry = xfs_handlereq_to_dentry(parfilp, hreq);
	if (IS_ERR(dentry))
		return PTR_ERR(dentry);
207
	inode = d_inode(dentry);
L
Linus Torvalds 已提交
208 209 210

	/* Restrict xfs_open_by_handle to directories & regular files. */
	if (!(S_ISREG(inode->i_mode) || S_ISDIR(inode->i_mode))) {
E
Eric Sandeen 已提交
211
		error = -EPERM;
212
		goto out_dput;
L
Linus Torvalds 已提交
213 214 215
	}

#if BITS_PER_LONG != 32
216
	hreq->oflags |= O_LARGEFILE;
L
Linus Torvalds 已提交
217
#endif
218

219
	permflag = hreq->oflags;
220
	fmode = OPEN_FMODE(permflag);
L
Linus Torvalds 已提交
221
	if ((!(permflag & O_APPEND) || (permflag & O_TRUNC)) &&
222
	    (fmode & FMODE_WRITE) && IS_APPEND(inode)) {
E
Eric Sandeen 已提交
223
		error = -EPERM;
224
		goto out_dput;
L
Linus Torvalds 已提交
225 226
	}

227
	if ((fmode & FMODE_WRITE) && IS_IMMUTABLE(inode)) {
E
Eryu Guan 已提交
228
		error = -EPERM;
229
		goto out_dput;
L
Linus Torvalds 已提交
230 231 232
	}

	/* Can't write directories. */
233
	if (S_ISDIR(inode->i_mode) && (fmode & FMODE_WRITE)) {
E
Eric Sandeen 已提交
234
		error = -EISDIR;
235
		goto out_dput;
L
Linus Torvalds 已提交
236 237
	}

238
	fd = get_unused_fd_flags(0);
239 240 241
	if (fd < 0) {
		error = fd;
		goto out_dput;
L
Linus Torvalds 已提交
242 243
	}

244 245 246 247
	path.mnt = parfilp->f_path.mnt;
	path.dentry = dentry;
	filp = dentry_open(&path, hreq->oflags, cred);
	dput(dentry);
L
Linus Torvalds 已提交
248
	if (IS_ERR(filp)) {
249 250
		put_unused_fd(fd);
		return PTR_ERR(filp);
L
Linus Torvalds 已提交
251
	}
252

A
Al Viro 已提交
253
	if (S_ISREG(inode->i_mode)) {
254
		filp->f_flags |= O_NOATIME;
255
		filp->f_mode |= FMODE_NOCMTIME;
256
	}
L
Linus Torvalds 已提交
257

258 259 260 261 262 263
	fd_install(fd, filp);
	return fd;

 out_dput:
	dput(dentry);
	return error;
L
Linus Torvalds 已提交
264 265
}

266
int
L
Linus Torvalds 已提交
267
xfs_readlink_by_handle(
268 269
	struct file		*parfilp,
	xfs_fsop_handlereq_t	*hreq)
L
Linus Torvalds 已提交
270
{
271
	struct dentry		*dentry;
L
Linus Torvalds 已提交
272
	__u32			olen;
273
	int			error;
L
Linus Torvalds 已提交
274 275

	if (!capable(CAP_SYS_ADMIN))
E
Eric Sandeen 已提交
276
		return -EPERM;
L
Linus Torvalds 已提交
277

278 279 280
	dentry = xfs_handlereq_to_dentry(parfilp, hreq);
	if (IS_ERR(dentry))
		return PTR_ERR(dentry);
L
Linus Torvalds 已提交
281 282

	/* Restrict this handle operation to symlinks only. */
283
	if (!d_is_symlink(dentry)) {
E
Eric Sandeen 已提交
284
		error = -EINVAL;
285
		goto out_dput;
L
Linus Torvalds 已提交
286 287
	}

288
	if (copy_from_user(&olen, hreq->ohandlen, sizeof(__u32))) {
E
Eric Sandeen 已提交
289
		error = -EFAULT;
290
		goto out_dput;
L
Linus Torvalds 已提交
291 292
	}

293
	error = vfs_readlink(dentry, hreq->ohandle, olen);
294

295 296
 out_dput:
	dput(dentry);
297
	return error;
L
Linus Torvalds 已提交
298 299
}

D
Dave Chinner 已提交
300 301 302
int
xfs_set_dmattrs(
	xfs_inode_t     *ip,
D
Darrick J. Wong 已提交
303 304
	uint		evmask,
	uint16_t	state)
D
Dave Chinner 已提交
305 306 307 308 309 310
{
	xfs_mount_t	*mp = ip->i_mount;
	xfs_trans_t	*tp;
	int		error;

	if (!capable(CAP_SYS_ADMIN))
D
Dave Chinner 已提交
311
		return -EPERM;
D
Dave Chinner 已提交
312 313

	if (XFS_FORCED_SHUTDOWN(mp))
D
Dave Chinner 已提交
314
		return -EIO;
D
Dave Chinner 已提交
315

316 317
	error = xfs_trans_alloc(mp, &M_RES(mp)->tr_ichange, 0, 0, 0, &tp);
	if (error)
D
Dave Chinner 已提交
318
		return error;
319

D
Dave Chinner 已提交
320 321 322 323 324 325 326
	xfs_ilock(ip, XFS_ILOCK_EXCL);
	xfs_trans_ijoin(tp, ip, XFS_ILOCK_EXCL);

	ip->i_d.di_dmevmask = evmask;
	ip->i_d.di_dmstate  = state;

	xfs_trans_log_inode(tp, ip, XFS_ILOG_CORE);
327
	error = xfs_trans_commit(tp);
D
Dave Chinner 已提交
328 329 330 331

	return error;
}

L
Linus Torvalds 已提交
332 333
/*
 * Set DMAPI attributes on the inode identified by a handle.
 *
 * @arg is a userspace xfs_fsop_setdm_handlereq_t.  Requires CAP_MKNOD here
 * (xfs_set_dmattrs() additionally checks CAP_SYS_ADMIN).  Immutable and
 * append-only inodes are rejected with -EPERM.  Write access to the mount
 * is held for the duration of the operation.
 */
STATIC int
xfs_fssetdm_by_handle(
	struct file		*parfilp,
	void			__user *arg)
{
	int			error;
	struct fsdmidata	fsd;
	xfs_fsop_setdm_handlereq_t dmhreq;
	struct dentry		*dentry;

	if (!capable(CAP_MKNOD))
		return -EPERM;
	if (copy_from_user(&dmhreq, arg, sizeof(xfs_fsop_setdm_handlereq_t)))
		return -EFAULT;

	error = mnt_want_write_file(parfilp);
	if (error)
		return error;

	dentry = xfs_handlereq_to_dentry(parfilp, &dmhreq.hreq);
	if (IS_ERR(dentry)) {
		mnt_drop_write_file(parfilp);
		return PTR_ERR(dentry);
	}

	if (IS_IMMUTABLE(d_inode(dentry)) || IS_APPEND(d_inode(dentry))) {
		error = -EPERM;
		goto out;
	}

	if (copy_from_user(&fsd, dmhreq.data, sizeof(fsd))) {
		error = -EFAULT;
		goto out;
	}

	error = xfs_set_dmattrs(XFS_I(d_inode(dentry)), fsd.fsd_dmevmask,
				 fsd.fsd_dmstate);

 out:
	mnt_drop_write_file(parfilp);
	dput(dentry);
	return error;
}

/*
 * List the extended attributes of the inode identified by a handle.
 *
 * @arg is a userspace xfs_fsop_attrlist_handlereq.  Requires CAP_SYS_ADMIN.
 * The buffer length must lie between sizeof(struct attrlist) and
 * XFS_XATTR_LIST_MAX, and only the ATTR_ROOT / ATTR_SECURE namespace flags
 * are accepted.  On success the updated cursor is written back to the
 * request's pos field and the listing is copied to the user buffer.
 */
STATIC int
xfs_attrlist_by_handle(
	struct file		*parfilp,
	void			__user *arg)
{
	int			error = -ENOMEM;
	attrlist_cursor_kern_t	*cursor;
	struct xfs_fsop_attrlist_handlereq __user	*p = arg;
	xfs_fsop_attrlist_handlereq_t al_hreq;
	struct dentry		*dentry;
	char			*kbuf;

	if (!capable(CAP_SYS_ADMIN))
		return -EPERM;
	if (copy_from_user(&al_hreq, arg, sizeof(xfs_fsop_attrlist_handlereq_t)))
		return -EFAULT;
	if (al_hreq.buflen < sizeof(struct attrlist) ||
	    al_hreq.buflen > XFS_XATTR_LIST_MAX)
		return -EINVAL;

	/*
	 * Reject flags, only allow namespaces.
	 */
	if (al_hreq.flags & ~(ATTR_ROOT | ATTR_SECURE))
		return -EINVAL;

	dentry = xfs_handlereq_to_dentry(parfilp, &al_hreq.hreq);
	if (IS_ERR(dentry))
		return PTR_ERR(dentry);

	/* error is still -ENOMEM here, which is what a failed allocation returns. */
	kbuf = kmem_zalloc_large(al_hreq.buflen, KM_SLEEP);
	if (!kbuf)
		goto out_dput;

	cursor = (attrlist_cursor_kern_t *)&al_hreq.pos;
	error = xfs_attr_list(XFS_I(d_inode(dentry)), kbuf, al_hreq.buflen,
					al_hreq.flags, cursor);
	if (error)
		goto out_kfree;

	if (copy_to_user(&p->pos, cursor, sizeof(attrlist_cursor_kern_t))) {
		error = -EFAULT;
		goto out_kfree;
	}

	if (copy_to_user(al_hreq.buffer, kbuf, al_hreq.buflen))
		error = -EFAULT;

out_kfree:
	kmem_free(kbuf);
out_dput:
	dput(dentry);
	return error;
}

431
int
L
Linus Torvalds 已提交
432
xfs_attrmulti_attr_get(
433
	struct inode		*inode,
434 435
	unsigned char		*name,
	unsigned char		__user *ubuf,
436 437
	uint32_t		*len,
	uint32_t		flags)
L
Linus Torvalds 已提交
438
{
439
	unsigned char		*kbuf;
D
Dave Chinner 已提交
440
	int			error = -EFAULT;
441

442
	if (*len > XFS_XATTR_SIZE_MAX)
D
Dave Chinner 已提交
443
		return -EINVAL;
444 445
	kbuf = kmem_zalloc_large(*len, KM_SLEEP);
	if (!kbuf)
D
Dave Chinner 已提交
446
		return -ENOMEM;
L
Linus Torvalds 已提交
447

448
	error = xfs_attr_get(XFS_I(inode), name, kbuf, (int *)len, flags);
L
Linus Torvalds 已提交
449 450 451 452
	if (error)
		goto out_kfree;

	if (copy_to_user(ubuf, kbuf, *len))
D
Dave Chinner 已提交
453
		error = -EFAULT;
L
Linus Torvalds 已提交
454

455 456
out_kfree:
	kmem_free(kbuf);
L
Linus Torvalds 已提交
457 458 459
	return error;
}

460
int
L
Linus Torvalds 已提交
461
xfs_attrmulti_attr_set(
462
	struct inode		*inode,
463 464
	unsigned char		*name,
	const unsigned char	__user *ubuf,
465 466
	uint32_t		len,
	uint32_t		flags)
L
Linus Torvalds 已提交
467
{
468
	unsigned char		*kbuf;
469
	int			error;
L
Linus Torvalds 已提交
470

471
	if (IS_IMMUTABLE(inode) || IS_APPEND(inode))
D
Dave Chinner 已提交
472
		return -EPERM;
473
	if (len > XFS_XATTR_SIZE_MAX)
D
Dave Chinner 已提交
474
		return -EINVAL;
L
Linus Torvalds 已提交
475

L
Li Zefan 已提交
476 477 478
	kbuf = memdup_user(ubuf, len);
	if (IS_ERR(kbuf))
		return PTR_ERR(kbuf);
479

480
	error = xfs_attr_set(XFS_I(inode), name, kbuf, len, flags);
481 482
	if (!error)
		xfs_forget_acl(inode, name, flags);
483 484
	kfree(kbuf);
	return error;
L
Linus Torvalds 已提交
485 486
}

487
int
L
Linus Torvalds 已提交
488
xfs_attrmulti_attr_remove(
489
	struct inode		*inode,
490
	unsigned char		*name,
491
	uint32_t		flags)
L
Linus Torvalds 已提交
492
{
493 494
	int			error;

495
	if (IS_IMMUTABLE(inode) || IS_APPEND(inode))
D
Dave Chinner 已提交
496
		return -EPERM;
497 498 499 500
	error = xfs_attr_remove(XFS_I(inode), name, flags);
	if (!error)
		xfs_forget_acl(inode, name, flags);
	return error;
L
Linus Torvalds 已提交
501 502 503 504
}

STATIC int
xfs_attrmulti_by_handle(
505
	struct file		*parfilp,
506
	void			__user *arg)
L
Linus Torvalds 已提交
507 508 509 510
{
	int			error;
	xfs_attr_multiop_t	*ops;
	xfs_fsop_attrmulti_handlereq_t am_hreq;
511
	struct dentry		*dentry;
L
Linus Torvalds 已提交
512
	unsigned int		i, size;
513
	unsigned char		*attr_name;
L
Linus Torvalds 已提交
514 515

	if (!capable(CAP_SYS_ADMIN))
E
Eric Sandeen 已提交
516
		return -EPERM;
L
Linus Torvalds 已提交
517
	if (copy_from_user(&am_hreq, arg, sizeof(xfs_fsop_attrmulti_handlereq_t)))
E
Eric Sandeen 已提交
518
		return -EFAULT;
L
Linus Torvalds 已提交
519

520 521 522 523
	/* overflow check */
	if (am_hreq.opcount >= INT_MAX / sizeof(xfs_attr_multiop_t))
		return -E2BIG;

524 525 526
	dentry = xfs_handlereq_to_dentry(parfilp, &am_hreq.hreq);
	if (IS_ERR(dentry))
		return PTR_ERR(dentry);
L
Linus Torvalds 已提交
527

D
Dave Chinner 已提交
528
	error = -E2BIG;
C
Christoph Hellwig 已提交
529
	size = am_hreq.opcount * sizeof(xfs_attr_multiop_t);
L
Linus Torvalds 已提交
530
	if (!size || size > 16 * PAGE_SIZE)
531
		goto out_dput;
L
Linus Torvalds 已提交
532

L
Li Zefan 已提交
533 534
	ops = memdup_user(am_hreq.ops, size);
	if (IS_ERR(ops)) {
D
Dave Chinner 已提交
535
		error = PTR_ERR(ops);
536
		goto out_dput;
L
Li Zefan 已提交
537
	}
L
Linus Torvalds 已提交
538

D
Dave Chinner 已提交
539
	error = -ENOMEM;
L
Linus Torvalds 已提交
540 541 542 543 544 545
	attr_name = kmalloc(MAXNAMELEN, GFP_KERNEL);
	if (!attr_name)
		goto out_kfree_ops;

	error = 0;
	for (i = 0; i < am_hreq.opcount; i++) {
546
		ops[i].am_error = strncpy_from_user((char *)attr_name,
L
Linus Torvalds 已提交
547 548
				ops[i].am_attrname, MAXNAMELEN);
		if (ops[i].am_error == 0 || ops[i].am_error == MAXNAMELEN)
D
Dave Chinner 已提交
549
			error = -ERANGE;
L
Linus Torvalds 已提交
550 551 552 553 554
		if (ops[i].am_error < 0)
			break;

		switch (ops[i].am_opcode) {
		case ATTR_OP_GET:
555
			ops[i].am_error = xfs_attrmulti_attr_get(
556
					d_inode(dentry), attr_name,
557 558
					ops[i].am_attrvalue, &ops[i].am_length,
					ops[i].am_flags);
L
Linus Torvalds 已提交
559 560
			break;
		case ATTR_OP_SET:
561
			ops[i].am_error = mnt_want_write_file(parfilp);
562 563
			if (ops[i].am_error)
				break;
564
			ops[i].am_error = xfs_attrmulti_attr_set(
565
					d_inode(dentry), attr_name,
566 567
					ops[i].am_attrvalue, ops[i].am_length,
					ops[i].am_flags);
A
Al Viro 已提交
568
			mnt_drop_write_file(parfilp);
L
Linus Torvalds 已提交
569 570
			break;
		case ATTR_OP_REMOVE:
571
			ops[i].am_error = mnt_want_write_file(parfilp);
572 573
			if (ops[i].am_error)
				break;
574
			ops[i].am_error = xfs_attrmulti_attr_remove(
575
					d_inode(dentry), attr_name,
576
					ops[i].am_flags);
A
Al Viro 已提交
577
			mnt_drop_write_file(parfilp);
L
Linus Torvalds 已提交
578 579
			break;
		default:
D
Dave Chinner 已提交
580
			ops[i].am_error = -EINVAL;
L
Linus Torvalds 已提交
581 582 583 584
		}
	}

	if (copy_to_user(am_hreq.ops, ops, size))
D
Dave Chinner 已提交
585
		error = -EFAULT;
L
Linus Torvalds 已提交
586 587 588 589

	kfree(attr_name);
 out_kfree_ops:
	kfree(ops);
590 591
 out_dput:
	dput(dentry);
D
Dave Chinner 已提交
592
	return error;
L
Linus Torvalds 已提交
593 594
}

595
int
L
Linus Torvalds 已提交
596 597 598
xfs_ioc_space(
	struct file		*filp,
	unsigned int		cmd,
599
	xfs_flock64_t		*bf)
L
Linus Torvalds 已提交
600
{
601 602
	struct inode		*inode = file_inode(filp);
	struct xfs_inode	*ip = XFS_I(inode);
603
	struct iattr		iattr;
604
	enum xfs_prealloc_flags	flags = 0;
605
	uint			iolock = XFS_IOLOCK_EXCL;
L
Linus Torvalds 已提交
606 607
	int			error;

608 609 610 611 612 613
	/*
	 * Only allow the sys admin to reserve space unless
	 * unwritten extents are enabled.
	 */
	if (!xfs_sb_version_hasextflgbit(&ip->i_mount->m_sb) &&
	    !capable(CAP_SYS_ADMIN))
E
Eric Sandeen 已提交
614
		return -EPERM;
615

616
	if (inode->i_flags & (S_IMMUTABLE|S_APPEND))
E
Eric Sandeen 已提交
617
		return -EPERM;
L
Linus Torvalds 已提交
618

619
	if (!(filp->f_mode & FMODE_WRITE))
E
Eric Sandeen 已提交
620
		return -EBADF;
L
Linus Torvalds 已提交
621

622
	if (!S_ISREG(inode->i_mode))
E
Eric Sandeen 已提交
623
		return -EINVAL;
L
Linus Torvalds 已提交
624

625 626
	if (filp->f_flags & O_DSYNC)
		flags |= XFS_PREALLOC_SYNC;
627
	if (filp->f_mode & FMODE_NOCMTIME)
628 629
		flags |= XFS_PREALLOC_INVISIBLE;

J
Jan Kara 已提交
630 631 632
	error = mnt_want_write_file(filp);
	if (error)
		return error;
633

634
	xfs_ilock(ip, iolock);
635
	error = xfs_break_layouts(inode, &iolock);
636 637
	if (error)
		goto out_unlock;
638

639 640 641
	xfs_ilock(ip, XFS_MMAPLOCK_EXCL);
	iolock |= XFS_MMAPLOCK_EXCL;

642 643 644 645 646 647 648 649 650 651
	switch (bf->l_whence) {
	case 0: /*SEEK_SET*/
		break;
	case 1: /*SEEK_CUR*/
		bf->l_start += filp->f_pos;
		break;
	case 2: /*SEEK_END*/
		bf->l_start += XFS_ISIZE(ip);
		break;
	default:
D
Dave Chinner 已提交
652
		error = -EINVAL;
653 654 655 656 657 658 659 660 661 662 663 664 665 666 667 668
		goto out_unlock;
	}

	/*
	 * length of <= 0 for resv/unresv/zero is invalid.  length for
	 * alloc/free is ignored completely and we have no idea what userspace
	 * might have set it to, so set it to zero to allow range
	 * checks to pass.
	 */
	switch (cmd) {
	case XFS_IOC_ZERO_RANGE:
	case XFS_IOC_RESVSP:
	case XFS_IOC_RESVSP64:
	case XFS_IOC_UNRESVSP:
	case XFS_IOC_UNRESVSP64:
		if (bf->l_len <= 0) {
D
Dave Chinner 已提交
669
			error = -EINVAL;
670 671 672 673 674 675 676 677 678
			goto out_unlock;
		}
		break;
	default:
		bf->l_len = 0;
		break;
	}

	if (bf->l_start < 0 ||
679
	    bf->l_start > inode->i_sb->s_maxbytes ||
680
	    bf->l_start + bf->l_len < 0 ||
681
	    bf->l_start + bf->l_len >= inode->i_sb->s_maxbytes) {
D
Dave Chinner 已提交
682
		error = -EINVAL;
683 684 685 686 687
		goto out_unlock;
	}

	switch (cmd) {
	case XFS_IOC_ZERO_RANGE:
688
		flags |= XFS_PREALLOC_SET;
689 690 691 692
		error = xfs_zero_file_space(ip, bf->l_start, bf->l_len);
		break;
	case XFS_IOC_RESVSP:
	case XFS_IOC_RESVSP64:
693
		flags |= XFS_PREALLOC_SET;
694 695 696 697 698 699 700 701 702 703 704
		error = xfs_alloc_file_space(ip, bf->l_start, bf->l_len,
						XFS_BMAPI_PREALLOC);
		break;
	case XFS_IOC_UNRESVSP:
	case XFS_IOC_UNRESVSP64:
		error = xfs_free_file_space(ip, bf->l_start, bf->l_len);
		break;
	case XFS_IOC_ALLOCSP:
	case XFS_IOC_ALLOCSP64:
	case XFS_IOC_FREESP:
	case XFS_IOC_FREESP64:
705
		flags |= XFS_PREALLOC_CLEAR;
706 707 708 709 710 711 712 713 714 715
		if (bf->l_start > XFS_ISIZE(ip)) {
			error = xfs_alloc_file_space(ip, XFS_ISIZE(ip),
					bf->l_start - XFS_ISIZE(ip), 0);
			if (error)
				goto out_unlock;
		}

		iattr.ia_valid = ATTR_SIZE;
		iattr.ia_size = bf->l_start;

716
		error = xfs_vn_setattr_size(file_dentry(filp), &iattr);
717 718 719
		break;
	default:
		ASSERT(0);
D
Dave Chinner 已提交
720
		error = -EINVAL;
721 722 723 724 725
	}

	if (error)
		goto out_unlock;

726
	error = xfs_update_prealloc_flags(ip, flags);
727 728

out_unlock:
729
	xfs_iunlock(ip, iolock);
J
Jan Kara 已提交
730
	mnt_drop_write_file(filp);
D
Dave Chinner 已提交
731
	return error;
L
Linus Torvalds 已提交
732 733 734 735 736 737 738 739 740 741 742 743 744 745 746 747 748 749 750 751 752
}

/*
 * Handle XFS_IOC_FSBULKSTAT, XFS_IOC_FSBULKSTAT_SINGLE and
 * XFS_IOC_FSINUMBERS.
 *
 * @arg is a userspace xfs_fsop_bulkreq_t.  Requires CAP_SYS_ADMIN.  The
 * starting inode number is read from bulkreq.lastip; when bulkreq.ocount is
 * non-NULL the updated inode number and the record count are written back.
 *
 * Returns 0 on success or a negative errno.
 */
STATIC int
xfs_ioc_bulkstat(
	xfs_mount_t		*mp,
	unsigned int		cmd,
	void			__user *arg)
{
	xfs_fsop_bulkreq_t	bulkreq;
	int			count;	/* # of records returned */
	xfs_ino_t		inlast;	/* last inode number */
	int			done;
	int			error;

	/* done = 1 if there are more stats to get and if bulkstat */
	/* should be called again (unused here, but used in dmapi) */

	if (!capable(CAP_SYS_ADMIN))
		return -EPERM;

	if (XFS_FORCED_SHUTDOWN(mp))
		return -EIO;

	if (copy_from_user(&bulkreq, arg, sizeof(xfs_fsop_bulkreq_t)))
		return -EFAULT;

	if (copy_from_user(&inlast, bulkreq.lastip, sizeof(__s64)))
		return -EFAULT;

	count = bulkreq.icount;
	if (count <= 0)
		return -EINVAL;

	if (bulkreq.ubuffer == NULL)
		return -EINVAL;

	if (cmd == XFS_IOC_FSINUMBERS)
		error = xfs_inumbers(mp, &inlast, &count,
					bulkreq.ubuffer, xfs_inumbers_fmt);
	else if (cmd == XFS_IOC_FSBULKSTAT_SINGLE)
		error = xfs_bulkstat_one(mp, inlast, bulkreq.ubuffer,
					sizeof(xfs_bstat_t), NULL, &done);
	else	/* XFS_IOC_FSBULKSTAT */
		error = xfs_bulkstat(mp, &inlast, &count, xfs_bulkstat_one,
				     sizeof(xfs_bstat_t), bulkreq.ubuffer,
				     &done);

	if (error)
		return error;

	if (bulkreq.ocount != NULL) {
		if (copy_to_user(bulkreq.lastip, &inlast,
						sizeof(xfs_ino_t)))
			return -EFAULT;

		if (copy_to_user(bulkreq.ocount, &count, sizeof(count)))
			return -EFAULT;
	}

	return 0;
}

/*
 * Return version 1 filesystem geometry to userspace.
 *
 * Fills a full xfs_fsop_geom_t via xfs_fs_geometry() (struct version 3) and
 * copies only the leading sizeof(xfs_fsop_geom_v1_t) bytes to @arg.
 */
STATIC int
xfs_ioc_fsgeometry_v1(
	xfs_mount_t		*mp,
	void			__user *arg)
{
	xfs_fsop_geom_t         fsgeo;
	int			error;

	error = xfs_fs_geometry(&mp->m_sb, &fsgeo, 3);
	if (error)
		return error;

	/*
	 * Caller should have passed an argument of type
	 * xfs_fsop_geom_v1_t.  This is a proper subset of the
	 * xfs_fsop_geom_t that xfs_fs_geometry() fills in.
	 */
	if (copy_to_user(arg, &fsgeo, sizeof(xfs_fsop_geom_v1_t)))
		return -EFAULT;
	return 0;
}

/*
 * Return filesystem geometry to userspace: fill an xfs_fsop_geom_t via
 * xfs_fs_geometry() (struct version 4) and copy all of it to @arg.
 */
STATIC int
xfs_ioc_fsgeometry(
	xfs_mount_t		*mp,
	void			__user *arg)
{
	xfs_fsop_geom_t		fsgeo;
	int			error;

	error = xfs_fs_geometry(&mp->m_sb, &fsgeo, 4);
	if (error)
		return error;

	if (copy_to_user(arg, &fsgeo, sizeof(fsgeo)))
		return -EFAULT;
	return 0;
}

/*
 * Linux extended inode flags interface.
 */

STATIC unsigned int
xfs_merge_ioc_xflags(
	unsigned int	flags,
	unsigned int	start)
{
	unsigned int	xflags = start;

843
	if (flags & FS_IMMUTABLE_FL)
844
		xflags |= FS_XFLAG_IMMUTABLE;
L
Linus Torvalds 已提交
845
	else
846
		xflags &= ~FS_XFLAG_IMMUTABLE;
847
	if (flags & FS_APPEND_FL)
848
		xflags |= FS_XFLAG_APPEND;
L
Linus Torvalds 已提交
849
	else
850
		xflags &= ~FS_XFLAG_APPEND;
851
	if (flags & FS_SYNC_FL)
852
		xflags |= FS_XFLAG_SYNC;
L
Linus Torvalds 已提交
853
	else
854
		xflags &= ~FS_XFLAG_SYNC;
855
	if (flags & FS_NOATIME_FL)
856
		xflags |= FS_XFLAG_NOATIME;
L
Linus Torvalds 已提交
857
	else
858
		xflags &= ~FS_XFLAG_NOATIME;
859
	if (flags & FS_NODUMP_FL)
860
		xflags |= FS_XFLAG_NODUMP;
L
Linus Torvalds 已提交
861
	else
862
		xflags &= ~FS_XFLAG_NODUMP;
L
Linus Torvalds 已提交
863 864 865 866 867 868

	return xflags;
}

STATIC unsigned int
xfs_di2lxflags(
869
	uint16_t	di_flags)
L
Linus Torvalds 已提交
870 871 872 873
{
	unsigned int	flags = 0;

	if (di_flags & XFS_DIFLAG_IMMUTABLE)
874
		flags |= FS_IMMUTABLE_FL;
L
Linus Torvalds 已提交
875
	if (di_flags & XFS_DIFLAG_APPEND)
876
		flags |= FS_APPEND_FL;
L
Linus Torvalds 已提交
877
	if (di_flags & XFS_DIFLAG_SYNC)
878
		flags |= FS_SYNC_FL;
L
Linus Torvalds 已提交
879
	if (di_flags & XFS_DIFLAG_NOATIME)
880
		flags |= FS_NOATIME_FL;
L
Linus Torvalds 已提交
881
	if (di_flags & XFS_DIFLAG_NODUMP)
882
		flags |= FS_NODUMP_FL;
L
Linus Torvalds 已提交
883 884 885
	return flags;
}

886 887 888 889 890 891 892 893
/*
 * Fill a struct fsxattr for an inode and copy it to userspace.
 *
 * @attr selects which fork's extent count goes into fsx_nextents: non-zero
 * for the attribute fork (0 if the inode has none), zero for the data fork.
 * The inode fields are sampled under XFS_ILOCK_SHARED.
 *
 * Returns 0 on success or -EFAULT if the copy-out fails.
 */
STATIC int
xfs_ioc_fsgetxattr(
	xfs_inode_t		*ip,
	int			attr,
	void			__user *arg)
{
	struct fsxattr		fa;

	/* Zero first so no uninitialised bytes are copied to userspace. */
	memset(&fa, 0, sizeof(struct fsxattr));

	xfs_ilock(ip, XFS_ILOCK_SHARED);
	fa.fsx_xflags = xfs_ip2xflags(ip);
	fa.fsx_extsize = ip->i_d.di_extsize << ip->i_mount->m_sb.sb_blocklog;
	fa.fsx_cowextsize = ip->i_d.di_cowextsize <<
			ip->i_mount->m_sb.sb_blocklog;
	fa.fsx_projid = xfs_get_projid(ip);

	if (attr) {
		if (ip->i_afp) {
			if (ip->i_afp->if_flags & XFS_IFEXTENTS)
				fa.fsx_nextents = xfs_iext_count(ip->i_afp);
			else
				fa.fsx_nextents = ip->i_d.di_anextents;
		} else
			fa.fsx_nextents = 0;
	} else {
		if (ip->i_df.if_flags & XFS_IFEXTENTS)
			fa.fsx_nextents = xfs_iext_count(&ip->i_df);
		else
			fa.fsx_nextents = ip->i_d.di_nextents;
	}
	xfs_iunlock(ip, XFS_ILOCK_SHARED);

	if (copy_to_user(arg, &fa, sizeof(fa)))
		return -EFAULT;
	return 0;
}

924 925
/*
 * Build the on-disk di_flags value for an inode from FS_XFLAG_* flags.
 *
 * The inode's current XFS_DIFLAG_PREALLOC bit is carried over; every other
 * bit comes from @xflags.  The inherit/nosymlinks flags are honoured only
 * for directories, and the realtime/extsize flags only for regular files.
 */
STATIC uint16_t
xfs_flags2diflags(
	struct xfs_inode	*ip,
	unsigned int		xflags)
{
	/* can't set PREALLOC this way, just preserve it */
	uint16_t		di_flags =
		(ip->i_d.di_flags & XFS_DIFLAG_PREALLOC);

	if (xflags & FS_XFLAG_IMMUTABLE)
		di_flags |= XFS_DIFLAG_IMMUTABLE;
	if (xflags & FS_XFLAG_APPEND)
		di_flags |= XFS_DIFLAG_APPEND;
	if (xflags & FS_XFLAG_SYNC)
		di_flags |= XFS_DIFLAG_SYNC;
	if (xflags & FS_XFLAG_NOATIME)
		di_flags |= XFS_DIFLAG_NOATIME;
	if (xflags & FS_XFLAG_NODUMP)
		di_flags |= XFS_DIFLAG_NODUMP;
	if (xflags & FS_XFLAG_NODEFRAG)
		di_flags |= XFS_DIFLAG_NODEFRAG;
	if (xflags & FS_XFLAG_FILESTREAM)
		di_flags |= XFS_DIFLAG_FILESTREAM;
	if (S_ISDIR(VFS_I(ip)->i_mode)) {
		if (xflags & FS_XFLAG_RTINHERIT)
			di_flags |= XFS_DIFLAG_RTINHERIT;
		if (xflags & FS_XFLAG_NOSYMLINKS)
			di_flags |= XFS_DIFLAG_NOSYMLINKS;
		if (xflags & FS_XFLAG_EXTSZINHERIT)
			di_flags |= XFS_DIFLAG_EXTSZINHERIT;
		if (xflags & FS_XFLAG_PROJINHERIT)
			di_flags |= XFS_DIFLAG_PROJINHERIT;
	} else if (S_ISREG(VFS_I(ip)->i_mode)) {
		if (xflags & FS_XFLAG_REALTIME)
			di_flags |= XFS_DIFLAG_REALTIME;
		if (xflags & FS_XFLAG_EXTSIZE)
			di_flags |= XFS_DIFLAG_EXTSIZE;
	}

	return di_flags;
}

/*
 * Build the on-disk di_flags2 value for an inode from FS_XFLAG_* flags.
 *
 * The inode's current XFS_DIFLAG2_REFLINK bit is carried over; the DAX and
 * COWEXTSIZE bits are taken from @xflags.
 */
STATIC uint64_t
xfs_flags2diflags2(
	struct xfs_inode	*ip,
	unsigned int		xflags)
{
	uint64_t		di_flags2 =
		(ip->i_d.di_flags2 & XFS_DIFLAG2_REFLINK);

	if (xflags & FS_XFLAG_DAX)
		di_flags2 |= XFS_DIFLAG2_DAX;
	if (xflags & FS_XFLAG_COWEXTSIZE)
		di_flags2 |= XFS_DIFLAG2_COWEXTSIZE;

	return di_flags2;
}

982 983 984 985
STATIC void
xfs_diflags_to_linux(
	struct xfs_inode	*ip)
{
986
	struct inode		*inode = VFS_I(ip);
987 988
	unsigned int		xflags = xfs_ip2xflags(ip);

989
	if (xflags & FS_XFLAG_IMMUTABLE)
990 991 992
		inode->i_flags |= S_IMMUTABLE;
	else
		inode->i_flags &= ~S_IMMUTABLE;
993
	if (xflags & FS_XFLAG_APPEND)
994 995 996
		inode->i_flags |= S_APPEND;
	else
		inode->i_flags &= ~S_APPEND;
997
	if (xflags & FS_XFLAG_SYNC)
998 999 1000
		inode->i_flags |= S_SYNC;
	else
		inode->i_flags &= ~S_SYNC;
1001
	if (xflags & FS_XFLAG_NOATIME)
1002 1003 1004
		inode->i_flags |= S_NOATIME;
	else
		inode->i_flags &= ~S_NOATIME;
1005
#if 0	/* disabled until the flag switching races are sorted out */
1006 1007 1008 1009
	if (xflags & FS_XFLAG_DAX)
		inode->i_flags |= S_DAX;
	else
		inode->i_flags &= ~S_DAX;
1010
#endif
1011
}
1012

1013 1014 1015 1016 1017 1018 1019
static int
xfs_ioctl_setattr_xflags(
	struct xfs_trans	*tp,
	struct xfs_inode	*ip,
	struct fsxattr		*fa)
{
	struct xfs_mount	*mp = ip->i_mount;
1020
	uint64_t		di_flags2;
1021 1022 1023

	/* Can't change realtime flag if any extents are allocated. */
	if ((ip->i_d.di_nextents || ip->i_delayed_blks) &&
1024
	    XFS_IS_REALTIME_INODE(ip) != (fa->fsx_xflags & FS_XFLAG_REALTIME))
1025 1026 1027
		return -EINVAL;

	/* If realtime flag is set then must have realtime device */
1028
	if (fa->fsx_xflags & FS_XFLAG_REALTIME) {
1029 1030 1031 1032 1033
		if (mp->m_sb.sb_rblocks == 0 || mp->m_sb.sb_rextsize == 0 ||
		    (ip->i_d.di_extsize % mp->m_sb.sb_rextsize))
			return -EINVAL;
	}

1034
	/* Clear reflink if we are actually able to set the rt flag. */
1035
	if ((fa->fsx_xflags & FS_XFLAG_REALTIME) && xfs_is_reflink_inode(ip))
1036
		ip->i_d.di_flags2 &= ~XFS_DIFLAG2_REFLINK;
1037

1038 1039 1040 1041
	/* Don't allow us to set DAX mode for a reflinked file for now. */
	if ((fa->fsx_xflags & FS_XFLAG_DAX) && xfs_is_reflink_inode(ip))
		return -EINVAL;

1042 1043 1044 1045 1046
	/*
	 * Can't modify an immutable/append-only file unless
	 * we have appropriate permission.
	 */
	if (((ip->i_d.di_flags & (XFS_DIFLAG_IMMUTABLE | XFS_DIFLAG_APPEND)) ||
1047
	     (fa->fsx_xflags & (FS_XFLAG_IMMUTABLE | FS_XFLAG_APPEND))) &&
1048 1049 1050
	    !capable(CAP_LINUX_IMMUTABLE))
		return -EPERM;

1051 1052 1053 1054 1055 1056 1057 1058
	/* diflags2 only valid for v3 inodes. */
	di_flags2 = xfs_flags2diflags2(ip, fa->fsx_xflags);
	if (di_flags2 && ip->i_d.di_version < 3)
		return -EINVAL;

	ip->i_d.di_flags = xfs_flags2diflags(ip, fa->fsx_xflags);
	ip->i_d.di_flags2 = di_flags2;

1059 1060 1061
	xfs_diflags_to_linux(ip);
	xfs_trans_ichgtime(tp, ip, XFS_ICHGTIME_CHG);
	xfs_trans_log_inode(tp, ip, XFS_ILOG_CORE);
1062
	XFS_STATS_INC(mp, xs_ig_attrchg);
1063 1064 1065
	return 0;
}

1066 1067 1068 1069 1070 1071 1072 1073 1074 1075 1076 1077 1078 1079 1080
/*
 * If we are changing DAX flags, we have to ensure the file is clean and any
 * cached objects in the address space are invalidated and removed. This
 * requires us to lock out other IO and page faults similar to a truncate
 * operation. The locks need to be held until the transaction has been committed
 * so that the cache invalidation is atomic with respect to the DAX flag
 * manipulation.
 */
static int
xfs_ioctl_setattr_dax_invalidate(
	struct xfs_inode	*ip,
	struct fsxattr		*fa,
	int			*join_flags)
{
	struct inode		*inode = VFS_I(ip);
1081
	struct super_block	*sb = inode->i_sb;
1082 1083 1084 1085
	int			error;

	*join_flags = 0;

1086 1087
	/*
	 * It is only valid to set the DAX flag on regular files and
1088
	 * directories on filesystems where the block size is equal to the page
1089 1090
	 * size. On directories it serves as an inherited hint so we don't
	 * have to check the device for dax support or flush pagecache.
1091
	 */
1092 1093 1094
	if (fa->fsx_xflags & FS_XFLAG_DAX) {
		if (!(S_ISREG(inode->i_mode) || S_ISDIR(inode->i_mode)))
			return -EINVAL;
1095 1096
		if (S_ISREG(inode->i_mode) &&
		    !bdev_dax_supported(xfs_find_bdev_for_inode(VFS_I(ip)),
1097
				sb->s_blocksize))
1098 1099
			return -EINVAL;
	}
1100

1101 1102 1103 1104 1105 1106
	/* If the DAX state is not changing, we have nothing to do here. */
	if ((fa->fsx_xflags & FS_XFLAG_DAX) && IS_DAX(inode))
		return 0;
	if (!(fa->fsx_xflags & FS_XFLAG_DAX) && !IS_DAX(inode))
		return 0;

1107 1108 1109
	if (S_ISDIR(inode->i_mode))
		return 0;

1110 1111 1112 1113 1114 1115 1116 1117 1118 1119
	/* lock, flush and invalidate mapping in preparation for flag change */
	xfs_ilock(ip, XFS_MMAPLOCK_EXCL | XFS_IOLOCK_EXCL);
	error = filemap_write_and_wait(inode->i_mapping);
	if (error)
		goto out_unlock;
	error = invalidate_inode_pages2(inode->i_mapping);
	if (error)
		goto out_unlock;

	*join_flags = XFS_MMAPLOCK_EXCL | XFS_IOLOCK_EXCL;
1120
	return 0;
1121 1122 1123 1124 1125

out_unlock:
	xfs_iunlock(ip, XFS_MMAPLOCK_EXCL | XFS_IOLOCK_EXCL);
	return error;

1126 1127
}

1128 1129 1130 1131 1132
/*
 * Set up the transaction structure for the setattr operation, checking that we
 * have permission to do so. On success, return a clean transaction and the
 * inode locked exclusively ready for further operation specific checks. On
 * failure, return an error without modifying or locking the inode.
1133 1134 1135 1136 1137 1138
 *
 * The inode might already be IO locked on call. If this is the case, it is
 * indicated in @join_flags and we take full responsibility for ensuring they
 * are unlocked from now on. Hence if we have an error here, we still have to
 * unlock them. Otherwise, once they are joined to the transaction, they will
 * be unlocked on commit/cancel.
1139 1140 1141
 */
static struct xfs_trans *
xfs_ioctl_setattr_get_trans(
1142 1143
	struct xfs_inode	*ip,
	int			join_flags)
1144 1145 1146
{
	struct xfs_mount	*mp = ip->i_mount;
	struct xfs_trans	*tp;
1147
	int			error = -EROFS;
1148 1149

	if (mp->m_flags & XFS_MOUNT_RDONLY)
1150 1151
		goto out_unlock;
	error = -EIO;
1152
	if (XFS_FORCED_SHUTDOWN(mp))
1153
		goto out_unlock;
1154

1155
	error = xfs_trans_alloc(mp, &M_RES(mp)->tr_ichange, 0, 0, 0, &tp);
1156
	if (error)
1157
		return ERR_PTR(error);
1158 1159

	xfs_ilock(ip, XFS_ILOCK_EXCL);
1160 1161
	xfs_trans_ijoin(tp, ip, XFS_ILOCK_EXCL | join_flags);
	join_flags = 0;
1162 1163 1164 1165 1166 1167 1168 1169 1170 1171 1172 1173 1174 1175 1176 1177 1178 1179

	/*
	 * CAP_FOWNER overrides the following restrictions:
	 *
	 * The user ID of the calling process must be equal to the file owner
	 * ID, except in cases where the CAP_FSETID capability is applicable.
	 */
	if (!inode_owner_or_capable(VFS_I(ip))) {
		error = -EPERM;
		goto out_cancel;
	}

	if (mp->m_flags & XFS_MOUNT_WSYNC)
		xfs_trans_set_sync(tp);

	return tp;

out_cancel:
1180
	xfs_trans_cancel(tp);
1181 1182 1183
out_unlock:
	if (join_flags)
		xfs_iunlock(ip, join_flags);
1184 1185 1186
	return ERR_PTR(error);
}

1187 1188 1189 1190
/*
 * extent size hint validation is somewhat cumbersome. Rules are:
 *
 * 1. extent size hint is only valid for directories and regular files
1191 1192
 * 2. FS_XFLAG_EXTSIZE is only valid for regular files
 * 3. FS_XFLAG_EXTSZINHERIT is only valid for directories.
1193 1194 1195 1196 1197 1198 1199
 * 4. can only be changed on regular files if no extents are allocated
 * 5. can be changed on directories at any time
 * 6. extsize hint of 0 turns off hints, clears inode flags.
 * 7. Extent size must be a multiple of the appropriate block size.
 * 8. for non-realtime files, the extent size hint must be limited
 *    to half the AG size to avoid alignment extending the extent beyond the
 *    limits of the AG.
D
Darrick J. Wong 已提交
1200 1201
 *
 * Please keep this function in sync with xfs_scrub_inode_extsize.
1202
 */
1203
static int
1204 1205 1206 1207 1208 1209
xfs_ioctl_setattr_check_extsize(
	struct xfs_inode	*ip,
	struct fsxattr		*fa)
{
	struct xfs_mount	*mp = ip->i_mount;

D
Dave Chinner 已提交
1210
	if ((fa->fsx_xflags & FS_XFLAG_EXTSIZE) && !S_ISREG(VFS_I(ip)->i_mode))
1211 1212
		return -EINVAL;

1213
	if ((fa->fsx_xflags & FS_XFLAG_EXTSZINHERIT) &&
D
Dave Chinner 已提交
1214
	    !S_ISDIR(VFS_I(ip)->i_mode))
1215 1216
		return -EINVAL;

D
Dave Chinner 已提交
1217
	if (S_ISREG(VFS_I(ip)->i_mode) && ip->i_d.di_nextents &&
1218 1219 1220 1221 1222 1223 1224 1225 1226 1227 1228 1229
	    ((ip->i_d.di_extsize << mp->m_sb.sb_blocklog) != fa->fsx_extsize))
		return -EINVAL;

	if (fa->fsx_extsize != 0) {
		xfs_extlen_t    size;
		xfs_fsblock_t   extsize_fsb;

		extsize_fsb = XFS_B_TO_FSB(mp, fa->fsx_extsize);
		if (extsize_fsb > MAXEXTLEN)
			return -EINVAL;

		if (XFS_IS_REALTIME_INODE(ip) ||
1230
		    (fa->fsx_xflags & FS_XFLAG_REALTIME)) {
1231 1232 1233 1234 1235 1236 1237 1238 1239
			size = mp->m_sb.sb_rextsize << mp->m_sb.sb_blocklog;
		} else {
			size = mp->m_sb.sb_blocksize;
			if (extsize_fsb > mp->m_sb.sb_agblocks / 2)
				return -EINVAL;
		}

		if (fa->fsx_extsize % size)
			return -EINVAL;
1240
	} else
1241
		fa->fsx_xflags &= ~(FS_XFLAG_EXTSIZE | FS_XFLAG_EXTSZINHERIT);
1242

1243 1244 1245
	return 0;
}

1246 1247 1248 1249 1250 1251 1252 1253 1254 1255 1256 1257
/*
 * CoW extent size hint validation rules are:
 *
 * 1. CoW extent size hint can only be set if reflink is enabled on the fs.
 *    The inode does not have to have any shared blocks, but it must be a v3.
 * 2. FS_XFLAG_COWEXTSIZE is only valid for directories and regular files;
 *    for a directory, the hint is propagated to new files.
 * 3. Can be changed on files & directories at any time.
 * 4. CoW extsize hint of 0 turns off hints, clears inode flags.
 * 5. Extent size must be a multiple of the appropriate block size.
 * 6. The extent size hint must be limited to half the AG size to avoid
 *    alignment extending the extent beyond the limits of the AG.
D
Darrick J. Wong 已提交
1258 1259
 *
 * Please keep this function in sync with xfs_scrub_inode_cowextsize.
1260 1261 1262 1263 1264 1265 1266 1267 1268 1269 1270 1271 1272 1273 1274 1275 1276 1277 1278 1279 1280 1281 1282 1283 1284 1285 1286 1287 1288 1289 1290 1291 1292 1293 1294 1295 1296 1297
 */
static int
xfs_ioctl_setattr_check_cowextsize(
	struct xfs_inode	*ip,
	struct fsxattr		*fa)
{
	struct xfs_mount	*mp = ip->i_mount;

	if (!(fa->fsx_xflags & FS_XFLAG_COWEXTSIZE))
		return 0;

	if (!xfs_sb_version_hasreflink(&ip->i_mount->m_sb) ||
	    ip->i_d.di_version != 3)
		return -EINVAL;

	if (!S_ISREG(VFS_I(ip)->i_mode) && !S_ISDIR(VFS_I(ip)->i_mode))
		return -EINVAL;

	if (fa->fsx_cowextsize != 0) {
		xfs_extlen_t    size;
		xfs_fsblock_t   cowextsize_fsb;

		cowextsize_fsb = XFS_B_TO_FSB(mp, fa->fsx_cowextsize);
		if (cowextsize_fsb > MAXEXTLEN)
			return -EINVAL;

		size = mp->m_sb.sb_blocksize;
		if (cowextsize_fsb > mp->m_sb.sb_agblocks / 2)
			return -EINVAL;

		if (fa->fsx_cowextsize % size)
			return -EINVAL;
	} else
		fa->fsx_xflags &= ~FS_XFLAG_COWEXTSIZE;

	return 0;
}

1298
static int
1299 1300 1301 1302 1303
xfs_ioctl_setattr_check_projid(
	struct xfs_inode	*ip,
	struct fsxattr		*fa)
{
	/* Disallow 32bit project ids if projid32bit feature is not enabled. */
1304
	if (fa->fsx_projid > (uint16_t)-1 &&
1305 1306 1307 1308 1309 1310 1311 1312 1313 1314 1315 1316 1317
	    !xfs_sb_version_hasprojid32bit(&ip->i_mount->m_sb))
		return -EINVAL;

	/*
	 * Project Quota ID state is only allowed to change from within the init
	 * namespace. Enforce that restriction only if we are trying to change
	 * the quota ID state. Everything else is allowed in user namespaces.
	 */
	if (current_user_ns() == &init_user_ns)
		return 0;

	if (xfs_get_projid(ip) != fa->fsx_projid)
		return -EINVAL;
1318
	if ((fa->fsx_xflags & FS_XFLAG_PROJINHERIT) !=
1319 1320 1321 1322 1323
	    (ip->i_d.di_flags & XFS_DIFLAG_PROJINHERIT))
		return -EINVAL;

	return 0;
}
1324 1325 1326 1327

/*
 * Apply the attributes described by @fa (project id, xflags, extent size and
 * CoW extent size hints) to @ip inside a single transaction.
 *
 * Returns 0 on success or a negative errno; on failure the transaction is
 * cancelled and any dquots obtained here are released.
 */
STATIC int
xfs_ioctl_setattr(
	xfs_inode_t		*ip,
	struct fsxattr		*fa)
{
	struct xfs_mount	*mp = ip->i_mount;
	struct inode		*inode = VFS_I(ip);
	struct xfs_trans	*tp;
	struct xfs_dquot	*udqp = NULL;
	struct xfs_dquot	*pdqp = NULL;
	struct xfs_dquot	*old_pdqp = NULL;
	int			join_flags = 0;
	int			error;

	trace_xfs_ioctl_setattr(ip);

	error = xfs_ioctl_setattr_check_projid(ip, fa);
	if (error)
		return error;

	/*
	 * With disk quotas on, make sure the dquots exist on disk before any
	 * other transaction is started; doing it later is messy.  No readlock
	 * is taken to look at the ids in the inode because it could not be
	 * held across the transaction reservation anyway.  Should the ids
	 * change before the ilock is taken we are still covered, because the
	 * i_*dquot fields get updated regardless.
	 */
	if (XFS_IS_QUOTA_ON(mp)) {
		error = xfs_qm_vop_dqalloc(ip, ip->i_d.di_uid, ip->i_d.di_gid,
				fa->fsx_projid, XFS_QMOPT_PQUOTA,
				&udqp, NULL, &pdqp);
		if (error)
			return error;
	}

	/*
	 * Changing the DAX configuration may need inode locks for mapping
	 * invalidation.  Those have to be held all the way to transaction
	 * commit or cancel, so they are handed to
	 * xfs_ioctl_setattr_get_trans() to be applied to the join call.
	 */
	error = xfs_ioctl_setattr_dax_invalidate(ip, fa, &join_flags);
	if (error)
		goto out_free_dquots;

	tp = xfs_ioctl_setattr_get_trans(ip, join_flags);
	if (IS_ERR(tp)) {
		error = PTR_ERR(tp);
		goto out_free_dquots;
	}

	/* Reserve project quota up front if the project id is changing. */
	if (XFS_IS_QUOTA_RUNNING(mp) && XFS_IS_PQUOTA_ON(mp) &&
	    xfs_get_projid(ip) != fa->fsx_projid) {
		unsigned int	resv_flags;

		resv_flags = capable(CAP_FOWNER) ? XFS_QMOPT_FORCE_RES : 0;
		error = xfs_qm_vop_chown_reserve(tp, ip, udqp, NULL, pdqp,
				resv_flags);
		if (error)	/* out of quota */
			goto out_trans_cancel;
	}

	error = xfs_ioctl_setattr_check_extsize(ip, fa);
	if (error)
		goto out_trans_cancel;

	error = xfs_ioctl_setattr_check_cowextsize(ip, fa);
	if (error)
		goto out_trans_cancel;

	error = xfs_ioctl_setattr_xflags(tp, ip, fa);
	if (error)
		goto out_trans_cancel;

	/*
	 * Change file ownership.  Must be the owner or privileged.  CAP_FSETID
	 * overrides the following restrictions:
	 *
	 * The set-user-ID and set-group-ID bits of a file will be cleared upon
	 * successful return from chown()
	 */
	if (inode->i_mode & (S_ISUID|S_ISGID)) {
		if (!capable_wrt_inode_uidgid(inode, CAP_FSETID))
			inode->i_mode &= ~(S_ISUID|S_ISGID);
	}

	/* Change the ownerships and register project quota modifications */
	if (xfs_get_projid(ip) != fa->fsx_projid) {
		if (XFS_IS_QUOTA_RUNNING(mp) && XFS_IS_PQUOTA_ON(mp))
			old_pdqp = xfs_qm_vop_chown(tp, ip, &ip->i_pdquot,
					pdqp);
		ASSERT(ip->i_d.di_version > 1);
		xfs_set_projid(ip, fa->fsx_projid);
	}

	/*
	 * Only store the extent size hint if the flags now on the inode say
	 * one should be set; with no extent size flag present the hint is
	 * unconditionally cleared.  The CoW hint follows the same pattern and
	 * additionally requires a v3 inode.
	 */
	ip->i_d.di_extsize =
		(ip->i_d.di_flags &
		 (XFS_DIFLAG_EXTSIZE | XFS_DIFLAG_EXTSZINHERIT)) ?
			fa->fsx_extsize >> mp->m_sb.sb_blocklog : 0;

	ip->i_d.di_cowextsize =
		(ip->i_d.di_version == 3 &&
		 (ip->i_d.di_flags2 & XFS_DIFLAG2_COWEXTSIZE)) ?
			fa->fsx_cowextsize >> mp->m_sb.sb_blocklog : 0;

	error = xfs_trans_commit(tp);

	/* Release any dquot(s) the inode had kept before chown. */
	xfs_qm_dqrele(old_pdqp);
	xfs_qm_dqrele(udqp);
	xfs_qm_dqrele(pdqp);

	return error;

out_trans_cancel:
	xfs_trans_cancel(tp);
out_free_dquots:
	xfs_qm_dqrele(udqp);
	xfs_qm_dqrele(pdqp);
	return error;
}

L
Linus Torvalds 已提交
1455
STATIC int
L
Lachlan McIlroy 已提交
1456
xfs_ioc_fssetxattr(
L
Linus Torvalds 已提交
1457 1458 1459 1460 1461
	xfs_inode_t		*ip,
	struct file		*filp,
	void			__user *arg)
{
	struct fsxattr		fa;
J
Jan Kara 已提交
1462
	int error;
L
Lachlan McIlroy 已提交
1463 1464 1465

	if (copy_from_user(&fa, arg, sizeof(fa)))
		return -EFAULT;
L
Linus Torvalds 已提交
1466

J
Jan Kara 已提交
1467 1468 1469
	error = mnt_want_write_file(filp);
	if (error)
		return error;
1470
	error = xfs_ioctl_setattr(ip, &fa);
J
Jan Kara 已提交
1471
	mnt_drop_write_file(filp);
D
Dave Chinner 已提交
1472
	return error;
L
Lachlan McIlroy 已提交
1473
}
L
Linus Torvalds 已提交
1474

L
Lachlan McIlroy 已提交
1475 1476 1477 1478 1479 1480
/*
 * XFS_IOC_GETXFLAGS: translate the inode's on-disk flags with
 * xfs_di2lxflags() and copy the result out to userspace.
 *
 * Returns 0 on success or -EFAULT if @arg cannot be written.
 */
STATIC int
xfs_ioc_getxflags(
	xfs_inode_t		*ip,
	void			__user *arg)
{
	unsigned int		lxflags = xfs_di2lxflags(ip->i_d.di_flags);

	return copy_to_user(arg, &lxflags, sizeof(lxflags)) ? -EFAULT : 0;
}
L
Linus Torvalds 已提交
1487

L
Lachlan McIlroy 已提交
1488 1489
/*
 * XFS_IOC_SETXFLAGS: update the inode flags from a FS_*_FL bitmask supplied
 * by userspace.
 *
 * Only FS_IMMUTABLE_FL, FS_APPEND_FL, FS_NOATIME_FL, FS_NODUMP_FL and
 * FS_SYNC_FL are accepted; any other bit yields -EOPNOTSUPP.  Returns 0 on
 * success, -EFAULT if @arg cannot be read, or the error from any of the
 * setattr helpers / transaction commit.
 */
STATIC int
xfs_ioc_setxflags(
	struct xfs_inode	*ip,
	struct file		*filp,
	void			__user *arg)
{
	const unsigned int	settable = FS_IMMUTABLE_FL | FS_APPEND_FL |
					   FS_NOATIME_FL | FS_NODUMP_FL |
					   FS_SYNC_FL;
	struct xfs_trans	*tp;
	struct fsxattr		fa;
	unsigned int		flags;
	int			join_flags = 0;
	int			error;

	if (copy_from_user(&flags, arg, sizeof(flags)))
		return -EFAULT;

	if (flags & ~settable)
		return -EOPNOTSUPP;

	/* Only fsx_xflags is filled in; it is merged with the current state. */
	fa.fsx_xflags = xfs_merge_ioc_xflags(flags, xfs_ip2xflags(ip));

	error = mnt_want_write_file(filp);
	if (error)
		return error;

	/*
	 * Changing the DAX configuration may need inode locks for mapping
	 * invalidation.  Those have to be held all the way to transaction
	 * commit or cancel, so they are handed to
	 * xfs_ioctl_setattr_get_trans() to be applied to the join call.
	 */
	error = xfs_ioctl_setattr_dax_invalidate(ip, &fa, &join_flags);
	if (error)
		goto out_drop_write;

	tp = xfs_ioctl_setattr_get_trans(ip, join_flags);
	if (IS_ERR(tp)) {
		error = PTR_ERR(tp);
		goto out_drop_write;
	}

	error = xfs_ioctl_setattr_xflags(tp, ip, &fa);
	if (error)
		xfs_trans_cancel(tp);
	else
		error = xfs_trans_commit(tp);

out_drop_write:
	mnt_drop_write_file(filp);
	return error;
}

1543 1544 1545 1546 1547
/*
 * Copy one in-kernel getbmap record @p out to the user record @u.
 *
 * The leading fields are always written.  The remaining getbmapx-only fields
 * are written only when @recsize is at least sizeof(struct getbmapx).
 *
 * Returns true on success, false as soon as any put_user() fails.
 */
static bool
xfs_getbmap_format(
	struct kgetbmap		*p,
	struct getbmapx __user	*u,
	size_t			recsize)
{
	if (put_user(p->bmv_offset, &u->bmv_offset))
		return false;
	if (put_user(p->bmv_block, &u->bmv_block))
		return false;
	if (put_user(p->bmv_length, &u->bmv_length))
		return false;
	if (put_user(0, &u->bmv_count))
		return false;
	if (put_user(0, &u->bmv_entries))
		return false;

	/* Shorter records stop here. */
	if (recsize < sizeof(struct getbmapx))
		return true;

	if (put_user(0, &u->bmv_iflags))
		return false;
	if (put_user(p->bmv_oflags, &u->bmv_oflags))
		return false;
	if (put_user(0, &u->bmv_unused1))
		return false;
	if (put_user(0, &u->bmv_unused2))
		return false;

	return true;
}

L
Linus Torvalds 已提交
1565 1566
/*
 * XFS_IOC_GETBMAP / XFS_IOC_GETBMAPA / XFS_IOC_GETBMAPX: report the block
 * mapping of the file behind @file.
 *
 * @arg points to a header record followed by room for further records; the
 * record size depends on @cmd (struct getbmap for GETBMAP/GETBMAPA, struct
 * getbmapx for GETBMAPX).  The header is read, xfs_getbmap() fills a kernel
 * buffer, and the updated header plus bmv_entries records are copied back.
 *
 * Returns 0 on success, -EINVAL for an unknown @cmd or bmv_count < 2,
 * -ENOMEM if the request is too large or the buffer cannot be allocated,
 * -EFAULT on a failed user copy, or the error returned by xfs_getbmap().
 */
STATIC int
xfs_ioc_getbmap(
	struct file		*file,
	unsigned int		cmd,
	void			__user *arg)
{
	struct getbmapx		bmx = { 0 };
	struct kgetbmap		*buf;
	size_t			recsize;
	int			error, i;

	switch (cmd) {
	case XFS_IOC_GETBMAPA:
		bmx.bmv_iflags = BMV_IF_ATTRFORK;
		/*FALLTHRU*/
	case XFS_IOC_GETBMAP:
		if (file->f_mode & FMODE_NOCMTIME)
			bmx.bmv_iflags |= BMV_IF_NO_DMAPI_READ;
		/* struct getbmap is a strict subset of struct getbmapx. */
		recsize = sizeof(struct getbmap);
		break;
	case XFS_IOC_GETBMAPX:
		recsize = sizeof(struct getbmapx);
		break;
	default:
		return -EINVAL;
	}

	/* Only the leading recsize bytes of the header come from userspace. */
	if (copy_from_user(&bmx, arg, recsize))
		return -EFAULT;

	if (bmx.bmv_count < 2)
		return -EINVAL;
	/*
	 * NOTE(review): this guard divides by recsize while the allocation
	 * below multiplies by sizeof(*buf) - confirm the two are meant to
	 * differ.
	 */
	if (bmx.bmv_count > ULONG_MAX / recsize)
		return -ENOMEM;

	buf = kmem_zalloc_large(bmx.bmv_count * sizeof(*buf), 0);
	if (!buf)
		return -ENOMEM;

	error = xfs_getbmap(XFS_I(file_inode(file)), &bmx, buf);
	if (error)
		goto out_free_buf;

	/* Any failure from here on is a failed copy to userspace. */
	error = -EFAULT;
	if (copy_to_user(arg, &bmx, recsize))
		goto out_free_buf;
	arg += recsize;

	for (i = 0; i < bmx.bmv_entries; i++) {
		if (!xfs_getbmap_format(buf + i, arg, recsize))
			goto out_free_buf;
		arg += recsize;
	}

	error = 0;
out_free_buf:
	kmem_free(buf);
	/* Propagate the error; returning 0 here would hide every failure. */
	return error;
}
L
Lachlan McIlroy 已提交
1625

1626 1627
struct getfsmap_info {
	struct xfs_mount	*mp;
1628 1629
	struct fsmap_head __user *data;
	unsigned int		idx;
1630 1631 1632 1633 1634 1635 1636 1637 1638 1639 1640 1641 1642
	__u32			last_flags;
};

STATIC int
xfs_getfsmap_format(struct xfs_fsmap *xfm, void *priv)
{
	struct getfsmap_info	*info = priv;
	struct fsmap		fm;

	trace_xfs_getfsmap_mapping(info->mp, xfm);

	info->last_flags = xfm->fmr_flags;
	xfs_fsmap_from_internal(&fm, xfm);
1643 1644
	if (copy_to_user(&info->data->fmh_recs[info->idx++], &fm,
			sizeof(struct fsmap)))
1645 1646 1647 1648 1649 1650 1651 1652
		return -EFAULT;

	return 0;
}

STATIC int
xfs_ioc_getfsmap(
	struct xfs_inode	*ip,
1653
	struct fsmap_head	__user *arg)
1654
{
1655
	struct getfsmap_info	info = { NULL };
1656 1657 1658 1659 1660 1661 1662 1663 1664 1665 1666 1667 1668 1669 1670 1671 1672 1673 1674 1675 1676 1677 1678
	struct xfs_fsmap_head	xhead = {0};
	struct fsmap_head	head;
	bool			aborted = false;
	int			error;

	if (copy_from_user(&head, arg, sizeof(struct fsmap_head)))
		return -EFAULT;
	if (memchr_inv(head.fmh_reserved, 0, sizeof(head.fmh_reserved)) ||
	    memchr_inv(head.fmh_keys[0].fmr_reserved, 0,
		       sizeof(head.fmh_keys[0].fmr_reserved)) ||
	    memchr_inv(head.fmh_keys[1].fmr_reserved, 0,
		       sizeof(head.fmh_keys[1].fmr_reserved)))
		return -EINVAL;

	xhead.fmh_iflags = head.fmh_iflags;
	xhead.fmh_count = head.fmh_count;
	xfs_fsmap_to_internal(&xhead.fmh_keys[0], &head.fmh_keys[0]);
	xfs_fsmap_to_internal(&xhead.fmh_keys[1], &head.fmh_keys[1]);

	trace_xfs_getfsmap_low_key(ip->i_mount, &xhead.fmh_keys[0]);
	trace_xfs_getfsmap_high_key(ip->i_mount, &xhead.fmh_keys[1]);

	info.mp = ip->i_mount;
1679
	info.data = arg;
1680 1681 1682 1683 1684 1685 1686 1687
	error = xfs_getfsmap(ip->i_mount, &xhead, xfs_getfsmap_format, &info);
	if (error == XFS_BTREE_QUERY_RANGE_ABORT) {
		error = 0;
		aborted = true;
	} else if (error)
		return error;

	/* If we didn't abort, set the "last" flag in the last fmx */
1688
	if (!aborted && info.idx) {
1689
		info.last_flags |= FMR_OF_LAST;
1690 1691
		if (copy_to_user(&info.data->fmh_recs[info.idx - 1].fmr_flags,
				&info.last_flags, sizeof(info.last_flags)))
1692 1693 1694 1695 1696 1697 1698 1699 1700 1701 1702 1703
			return -EFAULT;
	}

	/* copy back header */
	head.fmh_entries = xhead.fmh_entries;
	head.fmh_oflags = xhead.fmh_oflags;
	if (copy_to_user(arg, &head, sizeof(struct fsmap_head)))
		return -EFAULT;

	return 0;
}

1704 1705 1706 1707 1708 1709 1710 1711 1712 1713 1714 1715 1716 1717 1718 1719 1720 1721 1722 1723 1724 1725 1726 1727
/*
 * XFS_IOC_SCRUB_METADATA: copy a struct xfs_scrub_metadata in from userspace,
 * run xfs_scrub_metadata() on it and copy the structure back out.
 *
 * Requires CAP_SYS_ADMIN.  Returns 0 on success, -EPERM without the
 * capability, -EFAULT on a failed user copy, or the scrub error.
 */
STATIC int
xfs_ioc_scrub_metadata(
	struct xfs_inode		*ip,
	void				__user *arg)
{
	struct xfs_scrub_metadata	sm;
	int				ret;

	if (!capable(CAP_SYS_ADMIN))
		return -EPERM;

	if (copy_from_user(&sm, arg, sizeof(sm)))
		return -EFAULT;

	ret = xfs_scrub_metadata(ip, &sm);
	if (ret)
		return ret;

	return copy_to_user(arg, &sm, sizeof(sm)) ? -EFAULT : 0;
}

D
Dave Chinner 已提交
1728 1729 1730 1731 1732 1733 1734 1735 1736 1737 1738
/*
 * XFS_IOC_SWAPEXT: validate the two file descriptors named in @sxp and swap
 * the extents of the inodes behind them.
 *
 * Both descriptors must be open for reading and writing without O_APPEND,
 * must not be swapfiles, must be XFS files on the same mount, and must refer
 * to different inodes.
 *
 * Returns 0 on success, -EINVAL or -EBADF for an unsuitable descriptor,
 * -EIO if the filesystem has been shut down, or the error from
 * xfs_swap_extents().
 */
int
xfs_ioc_swapext(
	xfs_swapext_t	*sxp)
{
	const fmode_t	rw_mode = FMODE_READ | FMODE_WRITE;
	xfs_inode_t     *ip, *tip;
	struct fd	f, tmp;
	int		error;

	/* Pull information for the target fd */
	f = fdget((int)sxp->sx_fdtarget);
	if (!f.file)
		return -EINVAL;

	error = -EBADF;
	if ((f.file->f_mode & rw_mode) != rw_mode ||
	    (f.file->f_flags & O_APPEND))
		goto out_put_file;

	error = -EINVAL;
	tmp = fdget((int)sxp->sx_fdtmp);
	if (!tmp.file)
		goto out_put_file;

	error = -EBADF;
	if ((tmp.file->f_mode & rw_mode) != rw_mode ||
	    (tmp.file->f_flags & O_APPEND))
		goto out_put_tmp_file;

	/* Every remaining validation failure is reported as -EINVAL. */
	error = -EINVAL;
	if (IS_SWAPFILE(file_inode(f.file)) ||
	    IS_SWAPFILE(file_inode(tmp.file)))
		goto out_put_tmp_file;

	/*
	 * We need to ensure that the fds passed in point to XFS inodes
	 * before we cast and access them as XFS structures as we have no
	 * control over what the user passes us here.
	 */
	if (f.file->f_op != &xfs_file_operations ||
	    tmp.file->f_op != &xfs_file_operations)
		goto out_put_tmp_file;

	ip = XFS_I(file_inode(f.file));
	tip = XFS_I(file_inode(tmp.file));

	/* Same filesystem, but not the same inode. */
	if (ip->i_mount != tip->i_mount || ip->i_ino == tip->i_ino)
		goto out_put_tmp_file;

	error = -EIO;
	if (XFS_FORCED_SHUTDOWN(ip->i_mount))
		goto out_put_tmp_file;

	error = xfs_swap_extents(ip, tip, sxp);

 out_put_tmp_file:
	fdput(tmp);
 out_put_file:
	fdput(f);
	return error;
}

1808 1809 1810 1811 1812 1813 1814 1815 1816 1817 1818 1819 1820 1821 1822 1823 1824 1825 1826 1827 1828 1829 1830 1831 1832 1833 1834 1835 1836 1837 1838 1839 1840 1841 1842 1843 1844 1845 1846 1847 1848 1849 1850 1851 1852 1853 1854 1855 1856 1857 1858 1859 1860 1861 1862 1863 1864 1865 1866 1867 1868 1869 1870 1871 1872 1873 1874 1875 1876 1877 1878 1879 1880 1881 1882 1883 1884 1885 1886 1887 1888 1889
/*
 * FS_IOC_GETFSLABEL: copy the filesystem label out to userspace as a
 * NUL-terminated string.
 *
 * The superblock label (sb_fname) is not necessarily NUL-terminated, so it
 * is staged in a local buffer one byte larger and the whole buffer,
 * terminator included, is copied out.
 *
 * Returns 0 on success or -EFAULT if @user_label cannot be written.
 */
static int
xfs_ioc_getlabel(
	struct xfs_mount	*mp,
	char			__user *user_label)
{
	struct xfs_sb		*sbp = &mp->m_sb;
	char			label[XFSLABEL_MAX + 1];

	/* Paranoia */
	BUILD_BUG_ON(sizeof(sbp->sb_fname) > FSLABEL_MAX);

	/* Zero first so no uninitialised stack byte can reach userspace. */
	memset(label, 0, sizeof(label));
	spin_lock(&mp->m_sb_lock);
	strncpy(label, sbp->sb_fname, sizeof(sbp->sb_fname));
	spin_unlock(&mp->m_sb_lock);

	/* xfs on-disk label is 12 chars, be sure we send a null to user */
	label[XFSLABEL_MAX] = '\0';
	/* Copy the full buffer: sizeof(sb_fname) would drop the terminator. */
	if (copy_to_user(user_label, label, sizeof(label)))
		return -EFAULT;
	return 0;
}

/*
 * FS_IOC_SETFSLABEL: replace the filesystem label with the NUL-terminated
 * string at @newlabel and push the change to the primary and secondary
 * superblocks.
 *
 * Requires CAP_SYS_ADMIN.  Returns 0 on success, -EPERM without the
 * capability, -EFAULT if @newlabel cannot be read, -EINVAL if the label does
 * not fit in sb_fname, or the error from taking write access or from writing
 * the superblocks.
 */
static int
xfs_ioc_setlabel(
	struct file		*filp,
	struct xfs_mount	*mp,
	char			__user *newlabel)
{
	struct xfs_sb		*sbp = &mp->m_sb;
	char			label[XFSLABEL_MAX + 1];
	size_t			len;
	int			error;

	if (!capable(CAP_SYS_ADMIN))
		return -EPERM;

	/*
	 * The generic ioctl allows up to FSLABEL_MAX chars, but XFS is much
	 * smaller, at 12 bytes.  One extra byte is copied in so that the
	 * (required) NUL can be found when measuring the incoming label.
	 * NB: The on disk label doesn't need to be null terminated.
	 */
	if (copy_from_user(label, newlabel, XFSLABEL_MAX + 1))
		return -EFAULT;

	len = strnlen(label, XFSLABEL_MAX + 1);
	if (len > sizeof(sbp->sb_fname))
		return -EINVAL;

	error = mnt_want_write_file(filp);
	if (error)
		return error;

	/* Zero-fill the field, then lay the (already bounded) label over it. */
	spin_lock(&mp->m_sb_lock);
	memset(sbp->sb_fname, 0, sizeof(sbp->sb_fname));
	memcpy(sbp->sb_fname, label, len);
	spin_unlock(&mp->m_sb_lock);

	/*
	 * Now we do several things to satisfy userspace.
	 * In addition to normal logging of the primary superblock, we also
	 * immediately write these changes to sector zero for the primary, then
	 * update all backup supers (as xfs_db does for a label change), then
	 * invalidate the block device page cache.  This is so that any prior
	 * buffered reads from userspace (i.e. from blkid) are invalidated,
	 * and userspace will see the newly-written label.
	 */
	error = xfs_sync_sb_buf(mp);
	if (!error) {
		/* growfs also updates backup supers so lock against that. */
		mutex_lock(&mp->m_growlock);
		error = xfs_update_secondary_sbs(mp);
		mutex_unlock(&mp->m_growlock);

		invalidate_bdev(mp->m_ddev_targp->bt_bdev);
	}

	mnt_drop_write_file(filp);
	return error;
}

1890 1891 1892 1893 1894 1895 1896 1897
/*
 * Note: some of the ioctl's return positive numbers as a
 * byte count indicating success, such as readlink_by_handle.
 * So we don't "sign flip" like most other routines.  This means
 * true errors need to be returned as a negative value.
 */
long
xfs_file_ioctl(
L
Lachlan McIlroy 已提交
1898 1899
	struct file		*filp,
	unsigned int		cmd,
1900
	unsigned long		p)
L
Lachlan McIlroy 已提交
1901
{
A
Al Viro 已提交
1902
	struct inode		*inode = file_inode(filp);
1903 1904 1905
	struct xfs_inode	*ip = XFS_I(inode);
	struct xfs_mount	*mp = ip->i_mount;
	void			__user *arg = (void __user *)p;
L
Lachlan McIlroy 已提交
1906 1907
	int			error;

C
Christoph Hellwig 已提交
1908
	trace_xfs_file_ioctl(ip);
1909 1910

	switch (cmd) {
C
Christoph Hellwig 已提交
1911 1912
	case FITRIM:
		return xfs_ioc_trim(mp, arg);
1913 1914 1915 1916
	case FS_IOC_GETFSLABEL:
		return xfs_ioc_getlabel(mp, arg);
	case FS_IOC_SETFSLABEL:
		return xfs_ioc_setlabel(filp, mp, arg);
L
Lachlan McIlroy 已提交
1917 1918 1919 1920 1921 1922 1923
	case XFS_IOC_ALLOCSP:
	case XFS_IOC_FREESP:
	case XFS_IOC_RESVSP:
	case XFS_IOC_UNRESVSP:
	case XFS_IOC_ALLOCSP64:
	case XFS_IOC_FREESP64:
	case XFS_IOC_RESVSP64:
D
Dave Chinner 已提交
1924 1925
	case XFS_IOC_UNRESVSP64:
	case XFS_IOC_ZERO_RANGE: {
1926
		xfs_flock64_t		bf;
L
Lachlan McIlroy 已提交
1927

1928
		if (copy_from_user(&bf, arg, sizeof(bf)))
E
Eric Sandeen 已提交
1929
			return -EFAULT;
1930
		return xfs_ioc_space(filp, cmd, &bf);
1931
	}
L
Lachlan McIlroy 已提交
1932 1933 1934 1935 1936 1937
	case XFS_IOC_DIOINFO: {
		struct dioattr	da;
		xfs_buftarg_t	*target =
			XFS_IS_REALTIME_INODE(ip) ?
			mp->m_rtdev_targp : mp->m_ddev_targp;

1938
		da.d_mem =  da.d_miniosz = target->bt_logical_sectorsize;
L
Lachlan McIlroy 已提交
1939 1940 1941
		da.d_maxiosz = INT_MAX & ~(da.d_miniosz - 1);

		if (copy_to_user(arg, &da, sizeof(da)))
E
Eric Sandeen 已提交
1942
			return -EFAULT;
L
Lachlan McIlroy 已提交
1943 1944 1945 1946 1947 1948 1949 1950 1951 1952 1953 1954 1955 1956 1957 1958 1959 1960 1961 1962 1963
		return 0;
	}

	case XFS_IOC_FSBULKSTAT_SINGLE:
	case XFS_IOC_FSBULKSTAT:
	case XFS_IOC_FSINUMBERS:
		return xfs_ioc_bulkstat(mp, cmd, arg);

	case XFS_IOC_FSGEOMETRY_V1:
		return xfs_ioc_fsgeometry_v1(mp, arg);

	case XFS_IOC_FSGEOMETRY:
		return xfs_ioc_fsgeometry(mp, arg);

	case XFS_IOC_GETVERSION:
		return put_user(inode->i_generation, (int __user *)arg);

	case XFS_IOC_FSGETXATTR:
		return xfs_ioc_fsgetxattr(ip, 0, arg);
	case XFS_IOC_FSGETXATTRA:
		return xfs_ioc_fsgetxattr(ip, 1, arg);
L
Lachlan McIlroy 已提交
1964 1965
	case XFS_IOC_FSSETXATTR:
		return xfs_ioc_fssetxattr(ip, filp, arg);
L
Lachlan McIlroy 已提交
1966
	case XFS_IOC_GETXFLAGS:
L
Lachlan McIlroy 已提交
1967
		return xfs_ioc_getxflags(ip, arg);
L
Lachlan McIlroy 已提交
1968
	case XFS_IOC_SETXFLAGS:
L
Lachlan McIlroy 已提交
1969
		return xfs_ioc_setxflags(ip, filp, arg);
L
Lachlan McIlroy 已提交
1970 1971 1972 1973 1974

	case XFS_IOC_FSSETDM: {
		struct fsdmidata	dmi;

		if (copy_from_user(&dmi, arg, sizeof(dmi)))
E
Eric Sandeen 已提交
1975
			return -EFAULT;
L
Lachlan McIlroy 已提交
1976

J
Jan Kara 已提交
1977 1978 1979 1980
		error = mnt_want_write_file(filp);
		if (error)
			return error;

L
Lachlan McIlroy 已提交
1981 1982
		error = xfs_set_dmattrs(ip, dmi.fsd_dmevmask,
				dmi.fsd_dmstate);
J
Jan Kara 已提交
1983
		mnt_drop_write_file(filp);
D
Dave Chinner 已提交
1984
		return error;
L
Lachlan McIlroy 已提交
1985 1986 1987 1988 1989
	}

	case XFS_IOC_GETBMAP:
	case XFS_IOC_GETBMAPA:
	case XFS_IOC_GETBMAPX:
1990
		return xfs_ioc_getbmap(filp, cmd, arg);
L
Lachlan McIlroy 已提交
1991

1992 1993 1994
	case FS_IOC_GETFSMAP:
		return xfs_ioc_getfsmap(ip, arg);

1995 1996 1997
	case XFS_IOC_SCRUB_METADATA:
		return xfs_ioc_scrub_metadata(ip, arg);

L
Lachlan McIlroy 已提交
1998 1999
	case XFS_IOC_FD_TO_HANDLE:
	case XFS_IOC_PATH_TO_HANDLE:
2000 2001
	case XFS_IOC_PATH_TO_FSHANDLE: {
		xfs_fsop_handlereq_t	hreq;
L
Lachlan McIlroy 已提交
2002

2003
		if (copy_from_user(&hreq, arg, sizeof(hreq)))
E
Eric Sandeen 已提交
2004
			return -EFAULT;
2005 2006 2007 2008
		return xfs_find_handle(cmd, &hreq);
	}
	case XFS_IOC_OPEN_BY_HANDLE: {
		xfs_fsop_handlereq_t	hreq;
L
Lachlan McIlroy 已提交
2009

2010
		if (copy_from_user(&hreq, arg, sizeof(xfs_fsop_handlereq_t)))
E
Eric Sandeen 已提交
2011
			return -EFAULT;
2012
		return xfs_open_by_handle(filp, &hreq);
2013
	}
L
Lachlan McIlroy 已提交
2014
	case XFS_IOC_FSSETDM_BY_HANDLE:
2015
		return xfs_fssetdm_by_handle(filp, arg);
L
Lachlan McIlroy 已提交
2016

2017 2018
	case XFS_IOC_READLINK_BY_HANDLE: {
		xfs_fsop_handlereq_t	hreq;
L
Lachlan McIlroy 已提交
2019

2020
		if (copy_from_user(&hreq, arg, sizeof(xfs_fsop_handlereq_t)))
E
Eric Sandeen 已提交
2021
			return -EFAULT;
2022
		return xfs_readlink_by_handle(filp, &hreq);
2023
	}
L
Lachlan McIlroy 已提交
2024
	case XFS_IOC_ATTRLIST_BY_HANDLE:
2025
		return xfs_attrlist_by_handle(filp, arg);
L
Lachlan McIlroy 已提交
2026 2027

	case XFS_IOC_ATTRMULTI_BY_HANDLE:
2028
		return xfs_attrmulti_by_handle(filp, arg);
L
Lachlan McIlroy 已提交
2029 2030

	case XFS_IOC_SWAPEXT: {
2031 2032 2033
		struct xfs_swapext	sxp;

		if (copy_from_user(&sxp, arg, sizeof(xfs_swapext_t)))
E
Eric Sandeen 已提交
2034
			return -EFAULT;
J
Jan Kara 已提交
2035 2036 2037
		error = mnt_want_write_file(filp);
		if (error)
			return error;
D
Dave Chinner 已提交
2038
		error = xfs_ioc_swapext(&sxp);
J
Jan Kara 已提交
2039
		mnt_drop_write_file(filp);
D
Dave Chinner 已提交
2040
		return error;
L
Lachlan McIlroy 已提交
2041 2042 2043 2044 2045 2046 2047
	}

	case XFS_IOC_FSCOUNTS: {
		xfs_fsop_counts_t out;

		error = xfs_fs_counts(mp, &out);
		if (error)
D
Dave Chinner 已提交
2048
			return error;
L
Lachlan McIlroy 已提交
2049 2050

		if (copy_to_user(arg, &out, sizeof(out)))
E
Eric Sandeen 已提交
2051
			return -EFAULT;
L
Lachlan McIlroy 已提交
2052 2053 2054 2055 2056
		return 0;
	}

	case XFS_IOC_SET_RESBLKS: {
		xfs_fsop_resblks_t inout;
2057
		uint64_t	   in;
L
Lachlan McIlroy 已提交
2058 2059 2060 2061

		if (!capable(CAP_SYS_ADMIN))
			return -EPERM;

E
Eric Sandeen 已提交
2062
		if (mp->m_flags & XFS_MOUNT_RDONLY)
E
Eric Sandeen 已提交
2063
			return -EROFS;
E
Eric Sandeen 已提交
2064

L
Lachlan McIlroy 已提交
2065
		if (copy_from_user(&inout, arg, sizeof(inout)))
E
Eric Sandeen 已提交
2066
			return -EFAULT;
L
Lachlan McIlroy 已提交
2067

J
Jan Kara 已提交
2068 2069 2070 2071
		error = mnt_want_write_file(filp);
		if (error)
			return error;

L
Lachlan McIlroy 已提交
2072 2073 2074
		/* input parameter is passed in resblks field of structure */
		in = inout.resblks;
		error = xfs_reserve_blocks(mp, &in, &inout);
J
Jan Kara 已提交
2075
		mnt_drop_write_file(filp);
L
Lachlan McIlroy 已提交
2076
		if (error)
D
Dave Chinner 已提交
2077
			return error;
L
Lachlan McIlroy 已提交
2078 2079

		if (copy_to_user(arg, &inout, sizeof(inout)))
E
Eric Sandeen 已提交
2080
			return -EFAULT;
L
Lachlan McIlroy 已提交
2081 2082 2083 2084 2085 2086 2087 2088 2089 2090 2091
		return 0;
	}

	case XFS_IOC_GET_RESBLKS: {
		xfs_fsop_resblks_t out;

		if (!capable(CAP_SYS_ADMIN))
			return -EPERM;

		error = xfs_reserve_blocks(mp, NULL, &out);
		if (error)
D
Dave Chinner 已提交
2092
			return error;
L
Lachlan McIlroy 已提交
2093 2094

		if (copy_to_user(arg, &out, sizeof(out)))
E
Eric Sandeen 已提交
2095
			return -EFAULT;
L
Lachlan McIlroy 已提交
2096 2097 2098 2099 2100 2101 2102 2103

		return 0;
	}

	case XFS_IOC_FSGROWFSDATA: {
		xfs_growfs_data_t in;

		if (copy_from_user(&in, arg, sizeof(in)))
E
Eric Sandeen 已提交
2104
			return -EFAULT;
L
Lachlan McIlroy 已提交
2105

J
Jan Kara 已提交
2106 2107 2108
		error = mnt_want_write_file(filp);
		if (error)
			return error;
L
Lachlan McIlroy 已提交
2109
		error = xfs_growfs_data(mp, &in);
J
Jan Kara 已提交
2110
		mnt_drop_write_file(filp);
D
Dave Chinner 已提交
2111
		return error;
L
Lachlan McIlroy 已提交
2112 2113 2114 2115 2116 2117
	}

	case XFS_IOC_FSGROWFSLOG: {
		xfs_growfs_log_t in;

		if (copy_from_user(&in, arg, sizeof(in)))
E
Eric Sandeen 已提交
2118
			return -EFAULT;
L
Lachlan McIlroy 已提交
2119

J
Jan Kara 已提交
2120 2121 2122
		error = mnt_want_write_file(filp);
		if (error)
			return error;
L
Lachlan McIlroy 已提交
2123
		error = xfs_growfs_log(mp, &in);
J
Jan Kara 已提交
2124
		mnt_drop_write_file(filp);
D
Dave Chinner 已提交
2125
		return error;
L
Lachlan McIlroy 已提交
2126 2127 2128 2129 2130 2131
	}

	case XFS_IOC_FSGROWFSRT: {
		xfs_growfs_rt_t in;

		if (copy_from_user(&in, arg, sizeof(in)))
E
Eric Sandeen 已提交
2132
			return -EFAULT;
L
Lachlan McIlroy 已提交
2133

J
Jan Kara 已提交
2134 2135 2136
		error = mnt_want_write_file(filp);
		if (error)
			return error;
L
Lachlan McIlroy 已提交
2137
		error = xfs_growfs_rt(mp, &in);
J
Jan Kara 已提交
2138
		mnt_drop_write_file(filp);
D
Dave Chinner 已提交
2139
		return error;
L
Lachlan McIlroy 已提交
2140 2141 2142
	}

	case XFS_IOC_GOINGDOWN: {
2143
		uint32_t in;
L
Lachlan McIlroy 已提交
2144 2145 2146 2147

		if (!capable(CAP_SYS_ADMIN))
			return -EPERM;

2148
		if (get_user(in, (uint32_t __user *)arg))
E
Eric Sandeen 已提交
2149
			return -EFAULT;
L
Lachlan McIlroy 已提交
2150

D
Dave Chinner 已提交
2151
		return xfs_fs_goingdown(mp, in);
L
Lachlan McIlroy 已提交
2152 2153 2154 2155 2156 2157 2158 2159 2160
	}

	case XFS_IOC_ERROR_INJECTION: {
		xfs_error_injection_t in;

		if (!capable(CAP_SYS_ADMIN))
			return -EPERM;

		if (copy_from_user(&in, arg, sizeof(in)))
E
Eric Sandeen 已提交
2161
			return -EFAULT;
L
Lachlan McIlroy 已提交
2162

2163
		return xfs_errortag_add(mp, in.errtag);
L
Lachlan McIlroy 已提交
2164 2165 2166 2167 2168 2169
	}

	case XFS_IOC_ERROR_CLEARALL:
		if (!capable(CAP_SYS_ADMIN))
			return -EPERM;

2170
		return xfs_errortag_clearall(mp);
L
Lachlan McIlroy 已提交
2171

2172
	case XFS_IOC_FREE_EOFBLOCKS: {
2173 2174
		struct xfs_fs_eofblocks eofb;
		struct xfs_eofblocks keofb;
2175

2176 2177 2178 2179
		if (!capable(CAP_SYS_ADMIN))
			return -EPERM;

		if (mp->m_flags & XFS_MOUNT_RDONLY)
E
Eric Sandeen 已提交
2180
			return -EROFS;
2181

2182
		if (copy_from_user(&eofb, arg, sizeof(eofb)))
E
Eric Sandeen 已提交
2183
			return -EFAULT;
2184

2185 2186
		error = xfs_fs_eofblocks_from_user(&eofb, &keofb);
		if (error)
D
Dave Chinner 已提交
2187
			return error;
2188

D
Dave Chinner 已提交
2189
		return xfs_icache_free_eofblocks(mp, &keofb);
2190 2191
	}

L
Lachlan McIlroy 已提交
2192 2193 2194 2195
	default:
		return -ENOTTY;
	}
}