xfs_ioctl.c 49.2 KB
Newer Older
D
Dave Chinner 已提交
1
// SPDX-License-Identifier: GPL-2.0
L
Linus Torvalds 已提交
2
/*
3 4
 * Copyright (c) 2000-2005 Silicon Graphics, Inc.
 * All Rights Reserved.
L
Linus Torvalds 已提交
5 6 7
 */
#include "xfs.h"
#include "xfs_fs.h"
8
#include "xfs_shared.h"
9 10 11
#include "xfs_format.h"
#include "xfs_log_format.h"
#include "xfs_trans_resv.h"
L
Linus Torvalds 已提交
12 13
#include "xfs_mount.h"
#include "xfs_inode.h"
14
#include "xfs_ioctl.h"
15
#include "xfs_alloc.h"
L
Linus Torvalds 已提交
16 17
#include "xfs_rtalloc.h"
#include "xfs_itable.h"
18
#include "xfs_error.h"
L
Linus Torvalds 已提交
19
#include "xfs_attr.h"
20
#include "xfs_bmap.h"
D
Dave Chinner 已提交
21
#include "xfs_bmap_util.h"
L
Linus Torvalds 已提交
22
#include "xfs_fsops.h"
C
Christoph Hellwig 已提交
23
#include "xfs_discard.h"
24
#include "xfs_quota.h"
25
#include "xfs_export.h"
C
Christoph Hellwig 已提交
26
#include "xfs_trace.h"
27
#include "xfs_icache.h"
D
Dave Chinner 已提交
28
#include "xfs_symlink.h"
29
#include "xfs_trans.h"
30
#include "xfs_acl.h"
31 32 33
#include "xfs_btree.h"
#include <linux/fsmap.h>
#include "xfs_fsmap.h"
34
#include "scrub/xfs_scrub.h"
35
#include "xfs_sb.h"
36
#include "xfs_ag.h"
37
#include "xfs_health.h"
L
Linus Torvalds 已提交
38

39
#include <linux/capability.h>
40
#include <linux/cred.h>
L
Linus Torvalds 已提交
41 42 43 44
#include <linux/dcache.h>
#include <linux/mount.h>
#include <linux/namei.h>
#include <linux/pagemap.h>
45
#include <linux/slab.h>
46
#include <linux/exportfs.h>
L
Linus Torvalds 已提交
47 48 49 50 51 52 53 54 55 56 57 58

/*
 * xfs_find_handle maps from userspace xfs_fsop_handlereq structure to
 * a file or fs handle.
 *
 * XFS_IOC_PATH_TO_FSHANDLE
 *    returns fs handle for a mount point or path within that mount point
 * XFS_IOC_FD_TO_HANDLE
 *    returns full handle for a FD opened in user space
 * XFS_IOC_PATH_TO_HANDLE
 *    returns full handle for a path
 */
59
int
L
Linus Torvalds 已提交
60 61
xfs_find_handle(
	unsigned int		cmd,
62
	xfs_fsop_handlereq_t	*hreq)
L
Linus Torvalds 已提交
63 64 65 66
{
	int			hsize;
	xfs_handle_t		handle;
	struct inode		*inode;
67
	struct fd		f = {NULL};
C
Christoph Hellwig 已提交
68
	struct path		path;
69
	int			error;
C
Christoph Hellwig 已提交
70
	struct xfs_inode	*ip;
L
Linus Torvalds 已提交
71

C
Christoph Hellwig 已提交
72
	if (cmd == XFS_IOC_FD_TO_HANDLE) {
73 74
		f = fdget(hreq->fd);
		if (!f.file)
C
Christoph Hellwig 已提交
75
			return -EBADF;
A
Al Viro 已提交
76
		inode = file_inode(f.file);
C
Christoph Hellwig 已提交
77 78 79 80
	} else {
		error = user_lpath((const char __user *)hreq->path, &path);
		if (error)
			return error;
81
		inode = d_inode(path.dentry);
L
Linus Torvalds 已提交
82
	}
C
Christoph Hellwig 已提交
83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108
	ip = XFS_I(inode);

	/*
	 * We can only generate handles for inodes residing on a XFS filesystem,
	 * and only for regular files, directories or symbolic links.
	 */
	error = -EINVAL;
	if (inode->i_sb->s_magic != XFS_SB_MAGIC)
		goto out_put;

	error = -EBADF;
	if (!S_ISREG(inode->i_mode) &&
	    !S_ISDIR(inode->i_mode) &&
	    !S_ISLNK(inode->i_mode))
		goto out_put;


	memcpy(&handle.ha_fsid, ip->i_mount->m_fixedfsid, sizeof(xfs_fsid_t));

	if (cmd == XFS_IOC_PATH_TO_FSHANDLE) {
		/*
		 * This handle only contains an fsid, zero the rest.
		 */
		memset(&handle.ha_fid, 0, sizeof(handle.ha_fid));
		hsize = sizeof(xfs_fsid_t);
	} else {
C
Christoph Hellwig 已提交
109 110 111
		handle.ha_fid.fid_len = sizeof(xfs_fid_t) -
					sizeof(handle.ha_fid.fid_len);
		handle.ha_fid.fid_pad = 0;
112
		handle.ha_fid.fid_gen = inode->i_generation;
C
Christoph Hellwig 已提交
113
		handle.ha_fid.fid_ino = ip->i_ino;
C
Christoph Hellwig 已提交
114
		hsize = sizeof(xfs_handle_t);
L
Linus Torvalds 已提交
115 116
	}

C
Christoph Hellwig 已提交
117
	error = -EFAULT;
118
	if (copy_to_user(hreq->ohandle, &handle, hsize) ||
C
Christoph Hellwig 已提交
119 120
	    copy_to_user(hreq->ohandlen, &hsize, sizeof(__s32)))
		goto out_put;
L
Linus Torvalds 已提交
121

C
Christoph Hellwig 已提交
122 123 124 125
	error = 0;

 out_put:
	if (cmd == XFS_IOC_FD_TO_HANDLE)
126
		fdput(f);
C
Christoph Hellwig 已提交
127 128 129
	else
		path_put(&path);
	return error;
L
Linus Torvalds 已提交
130 131 132
}

/*
133 134
 * No need to do permission checks on the various pathname components
 * as the handle operations are privileged.
L
Linus Torvalds 已提交
135 136
 */
STATIC int
137 138 139 140 141 142 143 144 145 146 147 148 149 150 151
xfs_handle_acceptable(
	void			*context,
	struct dentry		*dentry)
{
	return 1;
}

/*
 * Convert userspace handle data into a dentry.
 */
struct dentry *
xfs_handle_to_dentry(
	struct file		*parfilp,
	void __user		*uhandle,
	u32			hlen)
L
Linus Torvalds 已提交
152 153
{
	xfs_handle_t		handle;
154
	struct xfs_fid64	fid;
L
Linus Torvalds 已提交
155 156 157 158

	/*
	 * Only allow handle opens under a directory.
	 */
A
Al Viro 已提交
159
	if (!S_ISDIR(file_inode(parfilp)->i_mode))
160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177
		return ERR_PTR(-ENOTDIR);

	if (hlen != sizeof(xfs_handle_t))
		return ERR_PTR(-EINVAL);
	if (copy_from_user(&handle, uhandle, hlen))
		return ERR_PTR(-EFAULT);
	if (handle.ha_fid.fid_len !=
	    sizeof(handle.ha_fid) - sizeof(handle.ha_fid.fid_len))
		return ERR_PTR(-EINVAL);

	memset(&fid, 0, sizeof(struct fid));
	fid.ino = handle.ha_fid.fid_ino;
	fid.gen = handle.ha_fid.fid_gen;

	return exportfs_decode_fh(parfilp->f_path.mnt, (struct fid *)&fid, 3,
			FILEID_INO32_GEN | XFS_FILEID_TYPE_64FLAG,
			xfs_handle_acceptable, NULL);
}
L
Linus Torvalds 已提交
178

179 180 181 182 183 184
STATIC struct dentry *
xfs_handlereq_to_dentry(
	struct file		*parfilp,
	xfs_fsop_handlereq_t	*hreq)
{
	return xfs_handle_to_dentry(parfilp, hreq->ihandle, hreq->ihandlen);
L
Linus Torvalds 已提交
185 186
}

187
int
L
Linus Torvalds 已提交
188 189
xfs_open_by_handle(
	struct file		*parfilp,
190
	xfs_fsop_handlereq_t	*hreq)
L
Linus Torvalds 已提交
191
{
192
	const struct cred	*cred = current_cred();
L
Linus Torvalds 已提交
193
	int			error;
194
	int			fd;
L
Linus Torvalds 已提交
195 196 197 198
	int			permflag;
	struct file		*filp;
	struct inode		*inode;
	struct dentry		*dentry;
199
	fmode_t			fmode;
200
	struct path		path;
L
Linus Torvalds 已提交
201 202

	if (!capable(CAP_SYS_ADMIN))
E
Eric Sandeen 已提交
203
		return -EPERM;
L
Linus Torvalds 已提交
204

205 206 207
	dentry = xfs_handlereq_to_dentry(parfilp, hreq);
	if (IS_ERR(dentry))
		return PTR_ERR(dentry);
208
	inode = d_inode(dentry);
L
Linus Torvalds 已提交
209 210 211

	/* Restrict xfs_open_by_handle to directories & regular files. */
	if (!(S_ISREG(inode->i_mode) || S_ISDIR(inode->i_mode))) {
E
Eric Sandeen 已提交
212
		error = -EPERM;
213
		goto out_dput;
L
Linus Torvalds 已提交
214 215 216
	}

#if BITS_PER_LONG != 32
217
	hreq->oflags |= O_LARGEFILE;
L
Linus Torvalds 已提交
218
#endif
219

220
	permflag = hreq->oflags;
221
	fmode = OPEN_FMODE(permflag);
L
Linus Torvalds 已提交
222
	if ((!(permflag & O_APPEND) || (permflag & O_TRUNC)) &&
223
	    (fmode & FMODE_WRITE) && IS_APPEND(inode)) {
E
Eric Sandeen 已提交
224
		error = -EPERM;
225
		goto out_dput;
L
Linus Torvalds 已提交
226 227
	}

228
	if ((fmode & FMODE_WRITE) && IS_IMMUTABLE(inode)) {
E
Eryu Guan 已提交
229
		error = -EPERM;
230
		goto out_dput;
L
Linus Torvalds 已提交
231 232 233
	}

	/* Can't write directories. */
234
	if (S_ISDIR(inode->i_mode) && (fmode & FMODE_WRITE)) {
E
Eric Sandeen 已提交
235
		error = -EISDIR;
236
		goto out_dput;
L
Linus Torvalds 已提交
237 238
	}

239
	fd = get_unused_fd_flags(0);
240 241 242
	if (fd < 0) {
		error = fd;
		goto out_dput;
L
Linus Torvalds 已提交
243 244
	}

245 246 247 248
	path.mnt = parfilp->f_path.mnt;
	path.dentry = dentry;
	filp = dentry_open(&path, hreq->oflags, cred);
	dput(dentry);
L
Linus Torvalds 已提交
249
	if (IS_ERR(filp)) {
250 251
		put_unused_fd(fd);
		return PTR_ERR(filp);
L
Linus Torvalds 已提交
252
	}
253

A
Al Viro 已提交
254
	if (S_ISREG(inode->i_mode)) {
255
		filp->f_flags |= O_NOATIME;
256
		filp->f_mode |= FMODE_NOCMTIME;
257
	}
L
Linus Torvalds 已提交
258

259 260 261 262 263 264
	fd_install(fd, filp);
	return fd;

 out_dput:
	dput(dentry);
	return error;
L
Linus Torvalds 已提交
265 266
}

267
int
L
Linus Torvalds 已提交
268
xfs_readlink_by_handle(
269 270
	struct file		*parfilp,
	xfs_fsop_handlereq_t	*hreq)
L
Linus Torvalds 已提交
271
{
272
	struct dentry		*dentry;
L
Linus Torvalds 已提交
273
	__u32			olen;
274
	int			error;
L
Linus Torvalds 已提交
275 276

	if (!capable(CAP_SYS_ADMIN))
E
Eric Sandeen 已提交
277
		return -EPERM;
L
Linus Torvalds 已提交
278

279 280 281
	dentry = xfs_handlereq_to_dentry(parfilp, hreq);
	if (IS_ERR(dentry))
		return PTR_ERR(dentry);
L
Linus Torvalds 已提交
282 283

	/* Restrict this handle operation to symlinks only. */
284
	if (!d_is_symlink(dentry)) {
E
Eric Sandeen 已提交
285
		error = -EINVAL;
286
		goto out_dput;
L
Linus Torvalds 已提交
287 288
	}

289
	if (copy_from_user(&olen, hreq->ohandlen, sizeof(__u32))) {
E
Eric Sandeen 已提交
290
		error = -EFAULT;
291
		goto out_dput;
L
Linus Torvalds 已提交
292 293
	}

294
	error = vfs_readlink(dentry, hreq->ohandle, olen);
295

296 297
 out_dput:
	dput(dentry);
298
	return error;
L
Linus Torvalds 已提交
299 300
}

D
Dave Chinner 已提交
301 302 303
int
xfs_set_dmattrs(
	xfs_inode_t     *ip,
D
Darrick J. Wong 已提交
304 305
	uint		evmask,
	uint16_t	state)
D
Dave Chinner 已提交
306 307 308 309 310 311
{
	xfs_mount_t	*mp = ip->i_mount;
	xfs_trans_t	*tp;
	int		error;

	if (!capable(CAP_SYS_ADMIN))
D
Dave Chinner 已提交
312
		return -EPERM;
D
Dave Chinner 已提交
313 314

	if (XFS_FORCED_SHUTDOWN(mp))
D
Dave Chinner 已提交
315
		return -EIO;
D
Dave Chinner 已提交
316

317 318
	error = xfs_trans_alloc(mp, &M_RES(mp)->tr_ichange, 0, 0, 0, &tp);
	if (error)
D
Dave Chinner 已提交
319
		return error;
320

D
Dave Chinner 已提交
321 322 323 324 325 326 327
	xfs_ilock(ip, XFS_ILOCK_EXCL);
	xfs_trans_ijoin(tp, ip, XFS_ILOCK_EXCL);

	ip->i_d.di_dmevmask = evmask;
	ip->i_d.di_dmstate  = state;

	xfs_trans_log_inode(tp, ip, XFS_ILOG_CORE);
328
	error = xfs_trans_commit(tp);
D
Dave Chinner 已提交
329 330 331 332

	return error;
}

L
Linus Torvalds 已提交
333 334
STATIC int
xfs_fssetdm_by_handle(
335 336
	struct file		*parfilp,
	void			__user *arg)
L
Linus Torvalds 已提交
337 338 339 340
{
	int			error;
	struct fsdmidata	fsd;
	xfs_fsop_setdm_handlereq_t dmhreq;
341
	struct dentry		*dentry;
L
Linus Torvalds 已提交
342 343

	if (!capable(CAP_MKNOD))
E
Eric Sandeen 已提交
344
		return -EPERM;
L
Linus Torvalds 已提交
345
	if (copy_from_user(&dmhreq, arg, sizeof(xfs_fsop_setdm_handlereq_t)))
E
Eric Sandeen 已提交
346
		return -EFAULT;
L
Linus Torvalds 已提交
347

J
Jan Kara 已提交
348 349 350 351
	error = mnt_want_write_file(parfilp);
	if (error)
		return error;

352
	dentry = xfs_handlereq_to_dentry(parfilp, &dmhreq.hreq);
J
Jan Kara 已提交
353 354
	if (IS_ERR(dentry)) {
		mnt_drop_write_file(parfilp);
355
		return PTR_ERR(dentry);
J
Jan Kara 已提交
356
	}
L
Linus Torvalds 已提交
357

358
	if (IS_IMMUTABLE(d_inode(dentry)) || IS_APPEND(d_inode(dentry))) {
E
Eric Sandeen 已提交
359
		error = -EPERM;
360
		goto out;
L
Linus Torvalds 已提交
361 362 363
	}

	if (copy_from_user(&fsd, dmhreq.data, sizeof(fsd))) {
E
Eric Sandeen 已提交
364
		error = -EFAULT;
365
		goto out;
L
Linus Torvalds 已提交
366 367
	}

368
	error = xfs_set_dmattrs(XFS_I(d_inode(dentry)), fsd.fsd_dmevmask,
369
				 fsd.fsd_dmstate);
L
Linus Torvalds 已提交
370

371
 out:
J
Jan Kara 已提交
372
	mnt_drop_write_file(parfilp);
373
	dput(dentry);
374
	return error;
L
Linus Torvalds 已提交
375 376 377 378
}

STATIC int
xfs_attrlist_by_handle(
379 380
	struct file		*parfilp,
	void			__user *arg)
L
Linus Torvalds 已提交
381
{
382
	int			error = -ENOMEM;
L
Linus Torvalds 已提交
383
	attrlist_cursor_kern_t	*cursor;
384
	struct xfs_fsop_attrlist_handlereq __user	*p = arg;
L
Linus Torvalds 已提交
385
	xfs_fsop_attrlist_handlereq_t al_hreq;
386
	struct dentry		*dentry;
L
Linus Torvalds 已提交
387 388 389
	char			*kbuf;

	if (!capable(CAP_SYS_ADMIN))
E
Eric Sandeen 已提交
390
		return -EPERM;
L
Linus Torvalds 已提交
391
	if (copy_from_user(&al_hreq, arg, sizeof(xfs_fsop_attrlist_handlereq_t)))
E
Eric Sandeen 已提交
392
		return -EFAULT;
393
	if (al_hreq.buflen < sizeof(struct attrlist) ||
J
Jan Tulak 已提交
394
	    al_hreq.buflen > XFS_XATTR_LIST_MAX)
E
Eric Sandeen 已提交
395
		return -EINVAL;
L
Linus Torvalds 已提交
396

397 398 399 400
	/*
	 * Reject flags, only allow namespaces.
	 */
	if (al_hreq.flags & ~(ATTR_ROOT | ATTR_SECURE))
E
Eric Sandeen 已提交
401
		return -EINVAL;
402

403 404 405
	dentry = xfs_handlereq_to_dentry(parfilp, &al_hreq.hreq);
	if (IS_ERR(dentry))
		return PTR_ERR(dentry);
L
Linus Torvalds 已提交
406

407 408 409
	kbuf = kmem_zalloc_large(al_hreq.buflen, KM_SLEEP);
	if (!kbuf)
		goto out_dput;
L
Linus Torvalds 已提交
410 411

	cursor = (attrlist_cursor_kern_t *)&al_hreq.pos;
412
	error = xfs_attr_list(XFS_I(d_inode(dentry)), kbuf, al_hreq.buflen,
413
					al_hreq.flags, cursor);
L
Linus Torvalds 已提交
414 415 416
	if (error)
		goto out_kfree;

417 418 419 420 421
	if (copy_to_user(&p->pos, cursor, sizeof(attrlist_cursor_kern_t))) {
		error = -EFAULT;
		goto out_kfree;
	}

L
Linus Torvalds 已提交
422 423 424
	if (copy_to_user(al_hreq.buffer, kbuf, al_hreq.buflen))
		error = -EFAULT;

425 426 427
out_kfree:
	kmem_free(kbuf);
out_dput:
428 429
	dput(dentry);
	return error;
L
Linus Torvalds 已提交
430 431
}

432
int
L
Linus Torvalds 已提交
433
xfs_attrmulti_attr_get(
434
	struct inode		*inode,
435 436
	unsigned char		*name,
	unsigned char		__user *ubuf,
437 438
	uint32_t		*len,
	uint32_t		flags)
L
Linus Torvalds 已提交
439
{
440
	unsigned char		*kbuf;
D
Dave Chinner 已提交
441
	int			error = -EFAULT;
442

443
	if (*len > XFS_XATTR_SIZE_MAX)
D
Dave Chinner 已提交
444
		return -EINVAL;
445 446
	kbuf = kmem_zalloc_large(*len, KM_SLEEP);
	if (!kbuf)
D
Dave Chinner 已提交
447
		return -ENOMEM;
L
Linus Torvalds 已提交
448

449
	error = xfs_attr_get(XFS_I(inode), name, kbuf, (int *)len, flags);
L
Linus Torvalds 已提交
450 451 452 453
	if (error)
		goto out_kfree;

	if (copy_to_user(ubuf, kbuf, *len))
D
Dave Chinner 已提交
454
		error = -EFAULT;
L
Linus Torvalds 已提交
455

456 457
out_kfree:
	kmem_free(kbuf);
L
Linus Torvalds 已提交
458 459 460
	return error;
}

461
int
L
Linus Torvalds 已提交
462
xfs_attrmulti_attr_set(
463
	struct inode		*inode,
464 465
	unsigned char		*name,
	const unsigned char	__user *ubuf,
466 467
	uint32_t		len,
	uint32_t		flags)
L
Linus Torvalds 已提交
468
{
469
	unsigned char		*kbuf;
470
	int			error;
L
Linus Torvalds 已提交
471

472
	if (IS_IMMUTABLE(inode) || IS_APPEND(inode))
D
Dave Chinner 已提交
473
		return -EPERM;
474
	if (len > XFS_XATTR_SIZE_MAX)
D
Dave Chinner 已提交
475
		return -EINVAL;
L
Linus Torvalds 已提交
476

L
Li Zefan 已提交
477 478 479
	kbuf = memdup_user(ubuf, len);
	if (IS_ERR(kbuf))
		return PTR_ERR(kbuf);
480

481
	error = xfs_attr_set(XFS_I(inode), name, kbuf, len, flags);
482 483
	if (!error)
		xfs_forget_acl(inode, name, flags);
484 485
	kfree(kbuf);
	return error;
L
Linus Torvalds 已提交
486 487
}

488
int
L
Linus Torvalds 已提交
489
xfs_attrmulti_attr_remove(
490
	struct inode		*inode,
491
	unsigned char		*name,
492
	uint32_t		flags)
L
Linus Torvalds 已提交
493
{
494 495
	int			error;

496
	if (IS_IMMUTABLE(inode) || IS_APPEND(inode))
D
Dave Chinner 已提交
497
		return -EPERM;
498 499 500 501
	error = xfs_attr_remove(XFS_I(inode), name, flags);
	if (!error)
		xfs_forget_acl(inode, name, flags);
	return error;
L
Linus Torvalds 已提交
502 503 504 505
}

STATIC int
xfs_attrmulti_by_handle(
506
	struct file		*parfilp,
507
	void			__user *arg)
L
Linus Torvalds 已提交
508 509 510 511
{
	int			error;
	xfs_attr_multiop_t	*ops;
	xfs_fsop_attrmulti_handlereq_t am_hreq;
512
	struct dentry		*dentry;
L
Linus Torvalds 已提交
513
	unsigned int		i, size;
514
	unsigned char		*attr_name;
L
Linus Torvalds 已提交
515 516

	if (!capable(CAP_SYS_ADMIN))
E
Eric Sandeen 已提交
517
		return -EPERM;
L
Linus Torvalds 已提交
518
	if (copy_from_user(&am_hreq, arg, sizeof(xfs_fsop_attrmulti_handlereq_t)))
E
Eric Sandeen 已提交
519
		return -EFAULT;
L
Linus Torvalds 已提交
520

521 522 523 524
	/* overflow check */
	if (am_hreq.opcount >= INT_MAX / sizeof(xfs_attr_multiop_t))
		return -E2BIG;

525 526 527
	dentry = xfs_handlereq_to_dentry(parfilp, &am_hreq.hreq);
	if (IS_ERR(dentry))
		return PTR_ERR(dentry);
L
Linus Torvalds 已提交
528

D
Dave Chinner 已提交
529
	error = -E2BIG;
C
Christoph Hellwig 已提交
530
	size = am_hreq.opcount * sizeof(xfs_attr_multiop_t);
L
Linus Torvalds 已提交
531
	if (!size || size > 16 * PAGE_SIZE)
532
		goto out_dput;
L
Linus Torvalds 已提交
533

L
Li Zefan 已提交
534 535
	ops = memdup_user(am_hreq.ops, size);
	if (IS_ERR(ops)) {
D
Dave Chinner 已提交
536
		error = PTR_ERR(ops);
537
		goto out_dput;
L
Li Zefan 已提交
538
	}
L
Linus Torvalds 已提交
539

D
Dave Chinner 已提交
540
	error = -ENOMEM;
L
Linus Torvalds 已提交
541 542 543 544 545 546
	attr_name = kmalloc(MAXNAMELEN, GFP_KERNEL);
	if (!attr_name)
		goto out_kfree_ops;

	error = 0;
	for (i = 0; i < am_hreq.opcount; i++) {
547
		ops[i].am_error = strncpy_from_user((char *)attr_name,
L
Linus Torvalds 已提交
548 549
				ops[i].am_attrname, MAXNAMELEN);
		if (ops[i].am_error == 0 || ops[i].am_error == MAXNAMELEN)
D
Dave Chinner 已提交
550
			error = -ERANGE;
L
Linus Torvalds 已提交
551 552 553 554 555
		if (ops[i].am_error < 0)
			break;

		switch (ops[i].am_opcode) {
		case ATTR_OP_GET:
556
			ops[i].am_error = xfs_attrmulti_attr_get(
557
					d_inode(dentry), attr_name,
558 559
					ops[i].am_attrvalue, &ops[i].am_length,
					ops[i].am_flags);
L
Linus Torvalds 已提交
560 561
			break;
		case ATTR_OP_SET:
562
			ops[i].am_error = mnt_want_write_file(parfilp);
563 564
			if (ops[i].am_error)
				break;
565
			ops[i].am_error = xfs_attrmulti_attr_set(
566
					d_inode(dentry), attr_name,
567 568
					ops[i].am_attrvalue, ops[i].am_length,
					ops[i].am_flags);
A
Al Viro 已提交
569
			mnt_drop_write_file(parfilp);
L
Linus Torvalds 已提交
570 571
			break;
		case ATTR_OP_REMOVE:
572
			ops[i].am_error = mnt_want_write_file(parfilp);
573 574
			if (ops[i].am_error)
				break;
575
			ops[i].am_error = xfs_attrmulti_attr_remove(
576
					d_inode(dentry), attr_name,
577
					ops[i].am_flags);
A
Al Viro 已提交
578
			mnt_drop_write_file(parfilp);
L
Linus Torvalds 已提交
579 580
			break;
		default:
D
Dave Chinner 已提交
581
			ops[i].am_error = -EINVAL;
L
Linus Torvalds 已提交
582 583 584 585
		}
	}

	if (copy_to_user(am_hreq.ops, ops, size))
D
Dave Chinner 已提交
586
		error = -EFAULT;
L
Linus Torvalds 已提交
587 588 589 590

	kfree(attr_name);
 out_kfree_ops:
	kfree(ops);
591 592
 out_dput:
	dput(dentry);
D
Dave Chinner 已提交
593
	return error;
L
Linus Torvalds 已提交
594 595
}

596
int
L
Linus Torvalds 已提交
597 598 599
xfs_ioc_space(
	struct file		*filp,
	unsigned int		cmd,
600
	xfs_flock64_t		*bf)
L
Linus Torvalds 已提交
601
{
602 603
	struct inode		*inode = file_inode(filp);
	struct xfs_inode	*ip = XFS_I(inode);
604
	struct iattr		iattr;
605
	enum xfs_prealloc_flags	flags = 0;
606
	uint			iolock = XFS_IOLOCK_EXCL | XFS_MMAPLOCK_EXCL;
L
Linus Torvalds 已提交
607 608
	int			error;

609
	if (inode->i_flags & (S_IMMUTABLE|S_APPEND))
E
Eric Sandeen 已提交
610
		return -EPERM;
L
Linus Torvalds 已提交
611

612
	if (!(filp->f_mode & FMODE_WRITE))
E
Eric Sandeen 已提交
613
		return -EBADF;
L
Linus Torvalds 已提交
614

615
	if (!S_ISREG(inode->i_mode))
E
Eric Sandeen 已提交
616
		return -EINVAL;
L
Linus Torvalds 已提交
617

618 619
	if (filp->f_flags & O_DSYNC)
		flags |= XFS_PREALLOC_SYNC;
620
	if (filp->f_mode & FMODE_NOCMTIME)
621 622
		flags |= XFS_PREALLOC_INVISIBLE;

J
Jan Kara 已提交
623 624 625
	error = mnt_want_write_file(filp);
	if (error)
		return error;
626

627
	xfs_ilock(ip, iolock);
628
	error = xfs_break_layouts(inode, &iolock, BREAK_UNMAP);
629 630
	if (error)
		goto out_unlock;
631 632 633 634 635 636 637 638 639 640 641

	switch (bf->l_whence) {
	case 0: /*SEEK_SET*/
		break;
	case 1: /*SEEK_CUR*/
		bf->l_start += filp->f_pos;
		break;
	case 2: /*SEEK_END*/
		bf->l_start += XFS_ISIZE(ip);
		break;
	default:
D
Dave Chinner 已提交
642
		error = -EINVAL;
643 644 645 646 647 648 649 650 651 652 653 654 655 656 657 658
		goto out_unlock;
	}

	/*
	 * length of <= 0 for resv/unresv/zero is invalid.  length for
	 * alloc/free is ignored completely and we have no idea what userspace
	 * might have set it to, so set it to zero to allow range
	 * checks to pass.
	 */
	switch (cmd) {
	case XFS_IOC_ZERO_RANGE:
	case XFS_IOC_RESVSP:
	case XFS_IOC_RESVSP64:
	case XFS_IOC_UNRESVSP:
	case XFS_IOC_UNRESVSP64:
		if (bf->l_len <= 0) {
D
Dave Chinner 已提交
659
			error = -EINVAL;
660 661 662 663 664 665 666 667 668
			goto out_unlock;
		}
		break;
	default:
		bf->l_len = 0;
		break;
	}

	if (bf->l_start < 0 ||
669
	    bf->l_start > inode->i_sb->s_maxbytes ||
670
	    bf->l_start + bf->l_len < 0 ||
671
	    bf->l_start + bf->l_len >= inode->i_sb->s_maxbytes) {
D
Dave Chinner 已提交
672
		error = -EINVAL;
673 674 675 676 677
		goto out_unlock;
	}

	switch (cmd) {
	case XFS_IOC_ZERO_RANGE:
678
		flags |= XFS_PREALLOC_SET;
679 680 681 682
		error = xfs_zero_file_space(ip, bf->l_start, bf->l_len);
		break;
	case XFS_IOC_RESVSP:
	case XFS_IOC_RESVSP64:
683
		flags |= XFS_PREALLOC_SET;
684 685 686 687 688 689 690 691 692 693 694
		error = xfs_alloc_file_space(ip, bf->l_start, bf->l_len,
						XFS_BMAPI_PREALLOC);
		break;
	case XFS_IOC_UNRESVSP:
	case XFS_IOC_UNRESVSP64:
		error = xfs_free_file_space(ip, bf->l_start, bf->l_len);
		break;
	case XFS_IOC_ALLOCSP:
	case XFS_IOC_ALLOCSP64:
	case XFS_IOC_FREESP:
	case XFS_IOC_FREESP64:
695
		flags |= XFS_PREALLOC_CLEAR;
696 697 698 699 700 701 702 703 704 705
		if (bf->l_start > XFS_ISIZE(ip)) {
			error = xfs_alloc_file_space(ip, XFS_ISIZE(ip),
					bf->l_start - XFS_ISIZE(ip), 0);
			if (error)
				goto out_unlock;
		}

		iattr.ia_valid = ATTR_SIZE;
		iattr.ia_size = bf->l_start;

706
		error = xfs_vn_setattr_size(file_dentry(filp), &iattr);
707 708 709
		break;
	default:
		ASSERT(0);
D
Dave Chinner 已提交
710
		error = -EINVAL;
711 712 713 714 715
	}

	if (error)
		goto out_unlock;

716
	error = xfs_update_prealloc_flags(ip, flags);
717 718

out_unlock:
719
	xfs_iunlock(ip, iolock);
J
Jan Kara 已提交
720
	mnt_drop_write_file(filp);
D
Dave Chinner 已提交
721
	return error;
L
Linus Torvalds 已提交
722 723 724 725 726 727 728 729 730 731 732 733 734 735 736 737 738 739 740 741 742
}

STATIC int
xfs_ioc_bulkstat(
	xfs_mount_t		*mp,
	unsigned int		cmd,
	void			__user *arg)
{
	xfs_fsop_bulkreq_t	bulkreq;
	int			count;	/* # of records returned */
	xfs_ino_t		inlast;	/* last inode number */
	int			done;
	int			error;

	/* done = 1 if there are more stats to get and if bulkstat */
	/* should be called again (unused here, but used in dmapi) */

	if (!capable(CAP_SYS_ADMIN))
		return -EPERM;

	if (XFS_FORCED_SHUTDOWN(mp))
E
Eric Sandeen 已提交
743
		return -EIO;
L
Linus Torvalds 已提交
744 745

	if (copy_from_user(&bulkreq, arg, sizeof(xfs_fsop_bulkreq_t)))
E
Eric Sandeen 已提交
746
		return -EFAULT;
L
Linus Torvalds 已提交
747 748

	if (copy_from_user(&inlast, bulkreq.lastip, sizeof(__s64)))
E
Eric Sandeen 已提交
749
		return -EFAULT;
L
Linus Torvalds 已提交
750 751

	if ((count = bulkreq.icount) <= 0)
E
Eric Sandeen 已提交
752
		return -EINVAL;
L
Linus Torvalds 已提交
753

754
	if (bulkreq.ubuffer == NULL)
E
Eric Sandeen 已提交
755
		return -EINVAL;
756

L
Linus Torvalds 已提交
757 758
	if (cmd == XFS_IOC_FSINUMBERS)
		error = xfs_inumbers(mp, &inlast, &count,
759
					bulkreq.ubuffer, xfs_inumbers_fmt);
L
Linus Torvalds 已提交
760
	else if (cmd == XFS_IOC_FSBULKSTAT_SINGLE)
761 762
		error = xfs_bulkstat_one(mp, inlast, bulkreq.ubuffer,
					sizeof(xfs_bstat_t), NULL, &done);
763
	else	/* XFS_IOC_FSBULKSTAT */
764 765 766
		error = xfs_bulkstat(mp, &inlast, &count, xfs_bulkstat_one,
				     sizeof(xfs_bstat_t), bulkreq.ubuffer,
				     &done);
L
Linus Torvalds 已提交
767 768

	if (error)
D
Dave Chinner 已提交
769
		return error;
L
Linus Torvalds 已提交
770 771 772 773

	if (bulkreq.ocount != NULL) {
		if (copy_to_user(bulkreq.lastip, &inlast,
						sizeof(xfs_ino_t)))
E
Eric Sandeen 已提交
774
			return -EFAULT;
L
Linus Torvalds 已提交
775 776

		if (copy_to_user(bulkreq.ocount, &count, sizeof(count)))
E
Eric Sandeen 已提交
777
			return -EFAULT;
L
Linus Torvalds 已提交
778 779 780 781 782 783 784
	}

	return 0;
}

STATIC int
xfs_ioc_fsgeometry(
785 786 787
	struct xfs_mount	*mp,
	void			__user *arg,
	int			struct_version)
L
Linus Torvalds 已提交
788
{
789 790
	struct xfs_fsop_geom	fsgeo;
	size_t			len;
L
Linus Torvalds 已提交
791

792
	xfs_fs_geometry(&mp->m_sb, &fsgeo, struct_version);
L
Linus Torvalds 已提交
793

794 795 796 797
	if (struct_version <= 3)
		len = sizeof(struct xfs_fsop_geom_v1);
	else if (struct_version == 4)
		len = sizeof(struct xfs_fsop_geom_v4);
798 799
	else {
		xfs_fsop_geom_health(mp, &fsgeo);
800
		len = sizeof(fsgeo);
801
	}
802 803

	if (copy_to_user(arg, &fsgeo, len))
E
Eric Sandeen 已提交
804
		return -EFAULT;
L
Linus Torvalds 已提交
805 806 807
	return 0;
}

808 809 810 811 812 813 814 815 816 817 818 819 820 821 822 823 824 825 826 827
STATIC int
xfs_ioc_ag_geometry(
	struct xfs_mount	*mp,
	void			__user *arg)
{
	struct xfs_ag_geometry	ageo;
	int			error;

	if (copy_from_user(&ageo, arg, sizeof(ageo)))
		return -EFAULT;

	error = xfs_ag_get_geometry(mp, ageo.ag_number, &ageo);
	if (error)
		return error;

	if (copy_to_user(arg, &ageo, sizeof(ageo)))
		return -EFAULT;
	return 0;
}

L
Linus Torvalds 已提交
828 829 830 831 832 833 834 835 836 837 838
/*
 * Linux extended inode flags interface.
 */

STATIC unsigned int
xfs_merge_ioc_xflags(
	unsigned int	flags,
	unsigned int	start)
{
	unsigned int	xflags = start;

839
	if (flags & FS_IMMUTABLE_FL)
840
		xflags |= FS_XFLAG_IMMUTABLE;
L
Linus Torvalds 已提交
841
	else
842
		xflags &= ~FS_XFLAG_IMMUTABLE;
843
	if (flags & FS_APPEND_FL)
844
		xflags |= FS_XFLAG_APPEND;
L
Linus Torvalds 已提交
845
	else
846
		xflags &= ~FS_XFLAG_APPEND;
847
	if (flags & FS_SYNC_FL)
848
		xflags |= FS_XFLAG_SYNC;
L
Linus Torvalds 已提交
849
	else
850
		xflags &= ~FS_XFLAG_SYNC;
851
	if (flags & FS_NOATIME_FL)
852
		xflags |= FS_XFLAG_NOATIME;
L
Linus Torvalds 已提交
853
	else
854
		xflags &= ~FS_XFLAG_NOATIME;
855
	if (flags & FS_NODUMP_FL)
856
		xflags |= FS_XFLAG_NODUMP;
L
Linus Torvalds 已提交
857
	else
858
		xflags &= ~FS_XFLAG_NODUMP;
L
Linus Torvalds 已提交
859 860 861 862 863 864

	return xflags;
}

STATIC unsigned int
xfs_di2lxflags(
865
	uint16_t	di_flags)
L
Linus Torvalds 已提交
866 867 868 869
{
	unsigned int	flags = 0;

	if (di_flags & XFS_DIFLAG_IMMUTABLE)
870
		flags |= FS_IMMUTABLE_FL;
L
Linus Torvalds 已提交
871
	if (di_flags & XFS_DIFLAG_APPEND)
872
		flags |= FS_APPEND_FL;
L
Linus Torvalds 已提交
873
	if (di_flags & XFS_DIFLAG_SYNC)
874
		flags |= FS_SYNC_FL;
L
Linus Torvalds 已提交
875
	if (di_flags & XFS_DIFLAG_NOATIME)
876
		flags |= FS_NOATIME_FL;
L
Linus Torvalds 已提交
877
	if (di_flags & XFS_DIFLAG_NODUMP)
878
		flags |= FS_NODUMP_FL;
L
Linus Torvalds 已提交
879 880 881
	return flags;
}

882 883 884 885 886
static void
xfs_fill_fsxattr(
	struct xfs_inode	*ip,
	bool			attr,
	struct fsxattr		*fa)
887
{
888 889 890
	simple_fill_fsxattr(fa, xfs_ip2xflags(ip));
	fa->fsx_extsize = ip->i_d.di_extsize << ip->i_mount->m_sb.sb_blocklog;
	fa->fsx_cowextsize = ip->i_d.di_cowextsize <<
891
			ip->i_mount->m_sb.sb_blocklog;
892
	fa->fsx_projid = xfs_get_projid(ip);
893 894 895 896

	if (attr) {
		if (ip->i_afp) {
			if (ip->i_afp->if_flags & XFS_IFEXTENTS)
897
				fa->fsx_nextents = xfs_iext_count(ip->i_afp);
898
			else
899
				fa->fsx_nextents = ip->i_d.di_anextents;
900
		} else
901
			fa->fsx_nextents = 0;
902 903
	} else {
		if (ip->i_df.if_flags & XFS_IFEXTENTS)
904
			fa->fsx_nextents = xfs_iext_count(&ip->i_df);
905
		else
906
			fa->fsx_nextents = ip->i_d.di_nextents;
907
	}
908 909 910 911 912 913 914 915 916 917 918 919
}

STATIC int
xfs_ioc_fsgetxattr(
	xfs_inode_t		*ip,
	int			attr,
	void			__user *arg)
{
	struct fsxattr		fa;

	xfs_ilock(ip, XFS_ILOCK_SHARED);
	xfs_fill_fsxattr(ip, attr, &fa);
920 921 922 923 924 925 926
	xfs_iunlock(ip, XFS_ILOCK_SHARED);

	if (copy_to_user(arg, &fa, sizeof(fa)))
		return -EFAULT;
	return 0;
}

927 928
STATIC uint16_t
xfs_flags2diflags(
929 930 931 932
	struct xfs_inode	*ip,
	unsigned int		xflags)
{
	/* can't set PREALLOC this way, just preserve it */
933 934 935
	uint16_t		di_flags =
		(ip->i_d.di_flags & XFS_DIFLAG_PREALLOC);

936
	if (xflags & FS_XFLAG_IMMUTABLE)
937
		di_flags |= XFS_DIFLAG_IMMUTABLE;
938
	if (xflags & FS_XFLAG_APPEND)
939
		di_flags |= XFS_DIFLAG_APPEND;
940
	if (xflags & FS_XFLAG_SYNC)
941
		di_flags |= XFS_DIFLAG_SYNC;
942
	if (xflags & FS_XFLAG_NOATIME)
943
		di_flags |= XFS_DIFLAG_NOATIME;
944
	if (xflags & FS_XFLAG_NODUMP)
945
		di_flags |= XFS_DIFLAG_NODUMP;
946
	if (xflags & FS_XFLAG_NODEFRAG)
947
		di_flags |= XFS_DIFLAG_NODEFRAG;
948
	if (xflags & FS_XFLAG_FILESTREAM)
949
		di_flags |= XFS_DIFLAG_FILESTREAM;
D
Dave Chinner 已提交
950
	if (S_ISDIR(VFS_I(ip)->i_mode)) {
951
		if (xflags & FS_XFLAG_RTINHERIT)
952
			di_flags |= XFS_DIFLAG_RTINHERIT;
953
		if (xflags & FS_XFLAG_NOSYMLINKS)
954
			di_flags |= XFS_DIFLAG_NOSYMLINKS;
955
		if (xflags & FS_XFLAG_EXTSZINHERIT)
956
			di_flags |= XFS_DIFLAG_EXTSZINHERIT;
957
		if (xflags & FS_XFLAG_PROJINHERIT)
958
			di_flags |= XFS_DIFLAG_PROJINHERIT;
D
Dave Chinner 已提交
959
	} else if (S_ISREG(VFS_I(ip)->i_mode)) {
960
		if (xflags & FS_XFLAG_REALTIME)
961
			di_flags |= XFS_DIFLAG_REALTIME;
962
		if (xflags & FS_XFLAG_EXTSIZE)
963 964
			di_flags |= XFS_DIFLAG_EXTSIZE;
	}
965

966 967 968 969 970 971 972 973 974 975
	return di_flags;
}

STATIC uint64_t
xfs_flags2diflags2(
	struct xfs_inode	*ip,
	unsigned int		xflags)
{
	uint64_t		di_flags2 =
		(ip->i_d.di_flags2 & XFS_DIFLAG2_REFLINK);
976 977 978

	if (xflags & FS_XFLAG_DAX)
		di_flags2 |= XFS_DIFLAG2_DAX;
979 980
	if (xflags & FS_XFLAG_COWEXTSIZE)
		di_flags2 |= XFS_DIFLAG2_COWEXTSIZE;
981

982
	return di_flags2;
983 984
}

985 986 987 988
STATIC void
xfs_diflags_to_linux(
	struct xfs_inode	*ip)
{
989
	struct inode		*inode = VFS_I(ip);
990 991
	unsigned int		xflags = xfs_ip2xflags(ip);

992
	if (xflags & FS_XFLAG_IMMUTABLE)
993 994 995
		inode->i_flags |= S_IMMUTABLE;
	else
		inode->i_flags &= ~S_IMMUTABLE;
996
	if (xflags & FS_XFLAG_APPEND)
997 998 999
		inode->i_flags |= S_APPEND;
	else
		inode->i_flags &= ~S_APPEND;
1000
	if (xflags & FS_XFLAG_SYNC)
1001 1002 1003
		inode->i_flags |= S_SYNC;
	else
		inode->i_flags &= ~S_SYNC;
1004
	if (xflags & FS_XFLAG_NOATIME)
1005 1006 1007
		inode->i_flags |= S_NOATIME;
	else
		inode->i_flags &= ~S_NOATIME;
1008
#if 0	/* disabled until the flag switching races are sorted out */
1009 1010 1011 1012
	if (xflags & FS_XFLAG_DAX)
		inode->i_flags |= S_DAX;
	else
		inode->i_flags &= ~S_DAX;
1013
#endif
1014
}
1015

1016 1017 1018 1019 1020 1021 1022
static int
xfs_ioctl_setattr_xflags(
	struct xfs_trans	*tp,
	struct xfs_inode	*ip,
	struct fsxattr		*fa)
{
	struct xfs_mount	*mp = ip->i_mount;
1023
	uint64_t		di_flags2;
1024 1025 1026

	/* Can't change realtime flag if any extents are allocated. */
	if ((ip->i_d.di_nextents || ip->i_delayed_blks) &&
1027
	    XFS_IS_REALTIME_INODE(ip) != (fa->fsx_xflags & FS_XFLAG_REALTIME))
1028 1029 1030
		return -EINVAL;

	/* If realtime flag is set then must have realtime device */
1031
	if (fa->fsx_xflags & FS_XFLAG_REALTIME) {
1032 1033 1034 1035 1036
		if (mp->m_sb.sb_rblocks == 0 || mp->m_sb.sb_rextsize == 0 ||
		    (ip->i_d.di_extsize % mp->m_sb.sb_rextsize))
			return -EINVAL;
	}

1037
	/* Clear reflink if we are actually able to set the rt flag. */
1038
	if ((fa->fsx_xflags & FS_XFLAG_REALTIME) && xfs_is_reflink_inode(ip))
1039
		ip->i_d.di_flags2 &= ~XFS_DIFLAG2_REFLINK;
1040

1041 1042 1043 1044
	/* Don't allow us to set DAX mode for a reflinked file for now. */
	if ((fa->fsx_xflags & FS_XFLAG_DAX) && xfs_is_reflink_inode(ip))
		return -EINVAL;

1045 1046 1047 1048 1049 1050 1051 1052
	/* diflags2 only valid for v3 inodes. */
	di_flags2 = xfs_flags2diflags2(ip, fa->fsx_xflags);
	if (di_flags2 && ip->i_d.di_version < 3)
		return -EINVAL;

	ip->i_d.di_flags = xfs_flags2diflags(ip, fa->fsx_xflags);
	ip->i_d.di_flags2 = di_flags2;

1053 1054 1055
	xfs_diflags_to_linux(ip);
	xfs_trans_ichgtime(tp, ip, XFS_ICHGTIME_CHG);
	xfs_trans_log_inode(tp, ip, XFS_ILOG_CORE);
1056
	XFS_STATS_INC(mp, xs_ig_attrchg);
1057 1058 1059
	return 0;
}

1060 1061 1062 1063 1064 1065 1066 1067 1068 1069 1070 1071 1072 1073 1074
/*
 * If we are changing DAX flags, we have to ensure the file is clean and any
 * cached objects in the address space are invalidated and removed. This
 * requires us to lock out other IO and page faults similar to a truncate
 * operation. The locks need to be held until the transaction has been committed
 * so that the cache invalidation is atomic with respect to the DAX flag
 * manipulation.
 */
static int
xfs_ioctl_setattr_dax_invalidate(
	struct xfs_inode	*ip,
	struct fsxattr		*fa,
	int			*join_flags)
{
	struct inode		*inode = VFS_I(ip);
1075
	struct super_block	*sb = inode->i_sb;
1076 1077 1078 1079
	int			error;

	*join_flags = 0;

1080 1081
	/*
	 * It is only valid to set the DAX flag on regular files and
1082
	 * directories on filesystems where the block size is equal to the page
1083 1084
	 * size. On directories it serves as an inherited hint so we don't
	 * have to check the device for dax support or flush pagecache.
1085
	 */
1086 1087 1088
	if (fa->fsx_xflags & FS_XFLAG_DAX) {
		if (!(S_ISREG(inode->i_mode) || S_ISDIR(inode->i_mode)))
			return -EINVAL;
1089 1090
		if (S_ISREG(inode->i_mode) &&
		    !bdev_dax_supported(xfs_find_bdev_for_inode(VFS_I(ip)),
1091
				sb->s_blocksize))
1092 1093
			return -EINVAL;
	}
1094

1095 1096 1097 1098 1099 1100
	/* If the DAX state is not changing, we have nothing to do here. */
	if ((fa->fsx_xflags & FS_XFLAG_DAX) && IS_DAX(inode))
		return 0;
	if (!(fa->fsx_xflags & FS_XFLAG_DAX) && !IS_DAX(inode))
		return 0;

1101 1102 1103
	if (S_ISDIR(inode->i_mode))
		return 0;

1104 1105 1106 1107 1108 1109 1110 1111 1112 1113
	/* lock, flush and invalidate mapping in preparation for flag change */
	xfs_ilock(ip, XFS_MMAPLOCK_EXCL | XFS_IOLOCK_EXCL);
	error = filemap_write_and_wait(inode->i_mapping);
	if (error)
		goto out_unlock;
	error = invalidate_inode_pages2(inode->i_mapping);
	if (error)
		goto out_unlock;

	*join_flags = XFS_MMAPLOCK_EXCL | XFS_IOLOCK_EXCL;
1114
	return 0;
1115 1116 1117 1118 1119

out_unlock:
	xfs_iunlock(ip, XFS_MMAPLOCK_EXCL | XFS_IOLOCK_EXCL);
	return error;

1120 1121
}

1122 1123 1124 1125 1126
/*
 * Set up the transaction structure for the setattr operation, checking that we
 * have permission to do so. On success, return a clean transaction and the
 * inode locked exclusively ready for further operation specific checks. On
 * failure, return an error without modifying or locking the inode.
1127 1128 1129 1130 1131 1132
 *
 * The inode might already be IO locked on call. If this is the case, it is
 * indicated in @join_flags and we take full responsibility for ensuring they
 * are unlocked from now on. Hence if we have an error here, we still have to
 * unlock them. Otherwise, once they are joined to the transaction, they will
 * be unlocked on commit/cancel.
1133 1134 1135
 */
static struct xfs_trans *
xfs_ioctl_setattr_get_trans(
1136 1137
	struct xfs_inode	*ip,
	int			join_flags)
1138 1139 1140
{
	struct xfs_mount	*mp = ip->i_mount;
	struct xfs_trans	*tp;
1141
	int			error = -EROFS;
1142 1143

	if (mp->m_flags & XFS_MOUNT_RDONLY)
1144 1145
		goto out_unlock;
	error = -EIO;
1146
	if (XFS_FORCED_SHUTDOWN(mp))
1147
		goto out_unlock;
1148

1149
	error = xfs_trans_alloc(mp, &M_RES(mp)->tr_ichange, 0, 0, 0, &tp);
1150
	if (error)
1151
		goto out_unlock;
1152 1153

	xfs_ilock(ip, XFS_ILOCK_EXCL);
1154 1155
	xfs_trans_ijoin(tp, ip, XFS_ILOCK_EXCL | join_flags);
	join_flags = 0;
1156 1157 1158 1159 1160 1161 1162 1163 1164 1165 1166 1167 1168 1169 1170 1171 1172 1173

	/*
	 * CAP_FOWNER overrides the following restrictions:
	 *
	 * The user ID of the calling process must be equal to the file owner
	 * ID, except in cases where the CAP_FSETID capability is applicable.
	 */
	if (!inode_owner_or_capable(VFS_I(ip))) {
		error = -EPERM;
		goto out_cancel;
	}

	if (mp->m_flags & XFS_MOUNT_WSYNC)
		xfs_trans_set_sync(tp);

	return tp;

out_cancel:
1174
	xfs_trans_cancel(tp);
1175 1176 1177
out_unlock:
	if (join_flags)
		xfs_iunlock(ip, join_flags);
1178 1179 1180
	return ERR_PTR(error);
}

1181 1182 1183 1184
/*
 * extent size hint validation is somewhat cumbersome. Rules are:
 *
 * 1. extent size hint is only valid for directories and regular files
1185 1186
 * 2. FS_XFLAG_EXTSIZE is only valid for regular files
 * 3. FS_XFLAG_EXTSZINHERIT is only valid for directories.
1187 1188 1189 1190 1191 1192 1193
 * 4. can only be changed on regular files if no extents are allocated
 * 5. can be changed on directories at any time
 * 6. extsize hint of 0 turns off hints, clears inode flags.
 * 7. Extent size must be a multiple of the appropriate block size.
 * 8. for non-realtime files, the extent size hint must be limited
 *    to half the AG size to avoid alignment extending the extent beyond the
 *    limits of the AG.
D
Darrick J. Wong 已提交
1194 1195
 *
 * Please keep this function in sync with xfs_scrub_inode_extsize.
1196
 */
1197
static int
1198 1199 1200 1201 1202
xfs_ioctl_setattr_check_extsize(
	struct xfs_inode	*ip,
	struct fsxattr		*fa)
{
	struct xfs_mount	*mp = ip->i_mount;
1203 1204
	xfs_extlen_t		size;
	xfs_fsblock_t		extsize_fsb;
1205

D
Dave Chinner 已提交
1206
	if (S_ISREG(VFS_I(ip)->i_mode) && ip->i_d.di_nextents &&
1207 1208 1209
	    ((ip->i_d.di_extsize << mp->m_sb.sb_blocklog) != fa->fsx_extsize))
		return -EINVAL;

1210 1211
	if (fa->fsx_extsize == 0)
		return 0;
1212

1213 1214 1215
	extsize_fsb = XFS_B_TO_FSB(mp, fa->fsx_extsize);
	if (extsize_fsb > MAXEXTLEN)
		return -EINVAL;
1216

1217 1218 1219 1220 1221 1222
	if (XFS_IS_REALTIME_INODE(ip) ||
	    (fa->fsx_xflags & FS_XFLAG_REALTIME)) {
		size = mp->m_sb.sb_rextsize << mp->m_sb.sb_blocklog;
	} else {
		size = mp->m_sb.sb_blocksize;
		if (extsize_fsb > mp->m_sb.sb_agblocks / 2)
1223
			return -EINVAL;
1224 1225 1226 1227
	}

	if (fa->fsx_extsize % size)
		return -EINVAL;
1228

1229 1230 1231
	return 0;
}

1232 1233 1234 1235 1236 1237 1238 1239 1240 1241 1242 1243
/*
 * CoW extent size hint validation rules are:
 *
 * 1. CoW extent size hint can only be set if reflink is enabled on the fs.
 *    The inode does not have to have any shared blocks, but it must be a v3.
 * 2. FS_XFLAG_COWEXTSIZE is only valid for directories and regular files;
 *    for a directory, the hint is propagated to new files.
 * 3. Can be changed on files & directories at any time.
 * 4. CoW extsize hint of 0 turns off hints, clears inode flags.
 * 5. Extent size must be a multiple of the appropriate block size.
 * 6. The extent size hint must be limited to half the AG size to avoid
 *    alignment extending the extent beyond the limits of the AG.
D
Darrick J. Wong 已提交
1244 1245
 *
 * Please keep this function in sync with xfs_scrub_inode_cowextsize.
1246 1247 1248 1249 1250 1251 1252
 */
static int
xfs_ioctl_setattr_check_cowextsize(
	struct xfs_inode	*ip,
	struct fsxattr		*fa)
{
	struct xfs_mount	*mp = ip->i_mount;
1253 1254
	xfs_extlen_t		size;
	xfs_fsblock_t		cowextsize_fsb;
1255 1256 1257 1258 1259 1260 1261 1262

	if (!(fa->fsx_xflags & FS_XFLAG_COWEXTSIZE))
		return 0;

	if (!xfs_sb_version_hasreflink(&ip->i_mount->m_sb) ||
	    ip->i_d.di_version != 3)
		return -EINVAL;

1263 1264
	if (fa->fsx_cowextsize == 0)
		return 0;
1265

1266 1267 1268
	cowextsize_fsb = XFS_B_TO_FSB(mp, fa->fsx_cowextsize);
	if (cowextsize_fsb > MAXEXTLEN)
		return -EINVAL;
1269

1270 1271 1272
	size = mp->m_sb.sb_blocksize;
	if (cowextsize_fsb > mp->m_sb.sb_agblocks / 2)
		return -EINVAL;
1273

1274 1275
	if (fa->fsx_cowextsize % size)
		return -EINVAL;
1276 1277 1278 1279

	return 0;
}

1280
static int
1281 1282 1283 1284 1285
xfs_ioctl_setattr_check_projid(
	struct xfs_inode	*ip,
	struct fsxattr		*fa)
{
	/* Disallow 32bit project ids if projid32bit feature is not enabled. */
1286
	if (fa->fsx_projid > (uint16_t)-1 &&
1287 1288 1289 1290
	    !xfs_sb_version_hasprojid32bit(&ip->i_mount->m_sb))
		return -EINVAL;
	return 0;
}
1291 1292 1293 1294

STATIC int
xfs_ioctl_setattr(
	xfs_inode_t		*ip,
1295
	struct fsxattr		*fa)
1296
{
1297
	struct fsxattr		old_fa;
1298 1299
	struct xfs_mount	*mp = ip->i_mount;
	struct xfs_trans	*tp;
C
Christoph Hellwig 已提交
1300
	struct xfs_dquot	*udqp = NULL;
1301
	struct xfs_dquot	*pdqp = NULL;
1302 1303
	struct xfs_dquot	*olddquot = NULL;
	int			code;
1304
	int			join_flags = 0;
1305

C
Christoph Hellwig 已提交
1306
	trace_xfs_ioctl_setattr(ip);
1307

1308 1309 1310
	code = xfs_ioctl_setattr_check_projid(ip, fa);
	if (code)
		return code;
1311

1312 1313 1314 1315 1316 1317 1318 1319
	/*
	 * If disk quotas is on, we make sure that the dquots do exist on disk,
	 * before we start any other transactions. Trying to do this later
	 * is messy. We don't care to take a readlock to look at the ids
	 * in inode here, because we can't hold it across the trans_reserve.
	 * If the IDs do change before we take the ilock, we're covered
	 * because the i_*dquot fields will get updated anyway.
	 */
1320
	if (XFS_IS_QUOTA_ON(mp)) {
C
Christoph Hellwig 已提交
1321
		code = xfs_qm_vop_dqalloc(ip, ip->i_d.di_uid,
1322
					 ip->i_d.di_gid, fa->fsx_projid,
1323
					 XFS_QMOPT_PQUOTA, &udqp, NULL, &pdqp);
1324 1325 1326 1327
		if (code)
			return code;
	}

1328 1329 1330 1331 1332 1333 1334 1335 1336 1337 1338 1339
	/*
	 * Changing DAX config may require inode locking for mapping
	 * invalidation. These need to be held all the way to transaction commit
	 * or cancel time, so need to be passed through to
	 * xfs_ioctl_setattr_get_trans() so it can apply them to the join call
	 * appropriately.
	 */
	code = xfs_ioctl_setattr_dax_invalidate(ip, fa, &join_flags);
	if (code)
		goto error_free_dquots;

	tp = xfs_ioctl_setattr_get_trans(ip, join_flags);
1340 1341 1342
	if (IS_ERR(tp)) {
		code = PTR_ERR(tp);
		goto error_free_dquots;
1343 1344
	}

1345 1346 1347 1348 1349
	if (XFS_IS_QUOTA_RUNNING(mp) && XFS_IS_PQUOTA_ON(mp) &&
	    xfs_get_projid(ip) != fa->fsx_projid) {
		code = xfs_qm_vop_chown_reserve(tp, ip, udqp, NULL, pdqp,
				capable(CAP_FOWNER) ?  XFS_QMOPT_FORCE_RES : 0);
		if (code)	/* out of quota */
1350
			goto error_trans_cancel;
1351 1352
	}

1353 1354 1355 1356 1357
	xfs_fill_fsxattr(ip, false, &old_fa);
	code = vfs_ioc_fssetxattr_check(VFS_I(ip), &old_fa, fa);
	if (code)
		goto error_trans_cancel;

1358 1359 1360
	code = xfs_ioctl_setattr_check_extsize(ip, fa);
	if (code)
		goto error_trans_cancel;
1361

1362 1363 1364 1365
	code = xfs_ioctl_setattr_check_cowextsize(ip, fa);
	if (code)
		goto error_trans_cancel;

1366 1367
	code = xfs_ioctl_setattr_xflags(tp, ip, fa);
	if (code)
1368
		goto error_trans_cancel;
1369 1370

	/*
1371 1372 1373 1374 1375
	 * Change file ownership.  Must be the owner or privileged.  CAP_FSETID
	 * overrides the following restrictions:
	 *
	 * The set-user-ID and set-group-ID bits of a file will be cleared upon
	 * successful return from chown()
1376 1377
	 */

D
Dave Chinner 已提交
1378
	if ((VFS_I(ip)->i_mode & (S_ISUID|S_ISGID)) &&
1379
	    !capable_wrt_inode_uidgid(VFS_I(ip), CAP_FSETID))
D
Dave Chinner 已提交
1380
		VFS_I(ip)->i_mode &= ~(S_ISUID|S_ISGID);
1381

1382 1383 1384 1385 1386 1387 1388 1389
	/* Change the ownerships and register project quota modifications */
	if (xfs_get_projid(ip) != fa->fsx_projid) {
		if (XFS_IS_QUOTA_RUNNING(mp) && XFS_IS_PQUOTA_ON(mp)) {
			olddquot = xfs_qm_vop_chown(tp, ip,
						&ip->i_pdquot, pdqp);
		}
		ASSERT(ip->i_d.di_version > 1);
		xfs_set_projid(ip, fa->fsx_projid);
1390
	}
1391

1392 1393 1394 1395 1396
	/*
	 * Only set the extent size hint if we've already determined that the
	 * extent size hint should be set on the inode. If no extent size flags
	 * are set on the inode then unconditionally clear the extent size hint.
	 */
1397 1398 1399 1400
	if (ip->i_d.di_flags & (XFS_DIFLAG_EXTSIZE | XFS_DIFLAG_EXTSZINHERIT))
		ip->i_d.di_extsize = fa->fsx_extsize >> mp->m_sb.sb_blocklog;
	else
		ip->i_d.di_extsize = 0;
1401 1402 1403 1404 1405 1406
	if (ip->i_d.di_version == 3 &&
	    (ip->i_d.di_flags2 & XFS_DIFLAG2_COWEXTSIZE))
		ip->i_d.di_cowextsize = fa->fsx_cowextsize >>
				mp->m_sb.sb_blocklog;
	else
		ip->i_d.di_cowextsize = 0;
1407

1408
	code = xfs_trans_commit(tp);
1409 1410 1411 1412

	/*
	 * Release any dquot(s) the inode had kept before chown.
	 */
C
Christoph Hellwig 已提交
1413 1414
	xfs_qm_dqrele(olddquot);
	xfs_qm_dqrele(udqp);
1415
	xfs_qm_dqrele(pdqp);
1416

C
Christoph Hellwig 已提交
1417
	return code;
1418

1419
error_trans_cancel:
1420
	xfs_trans_cancel(tp);
1421
error_free_dquots:
C
Christoph Hellwig 已提交
1422
	xfs_qm_dqrele(udqp);
1423
	xfs_qm_dqrele(pdqp);
1424 1425 1426
	return code;
}

L
Linus Torvalds 已提交
1427
STATIC int
L
Lachlan McIlroy 已提交
1428
xfs_ioc_fssetxattr(
L
Linus Torvalds 已提交
1429 1430 1431 1432 1433
	xfs_inode_t		*ip,
	struct file		*filp,
	void			__user *arg)
{
	struct fsxattr		fa;
J
Jan Kara 已提交
1434
	int error;
L
Lachlan McIlroy 已提交
1435 1436 1437

	if (copy_from_user(&fa, arg, sizeof(fa)))
		return -EFAULT;
L
Linus Torvalds 已提交
1438

J
Jan Kara 已提交
1439 1440 1441
	error = mnt_want_write_file(filp);
	if (error)
		return error;
1442
	error = xfs_ioctl_setattr(ip, &fa);
J
Jan Kara 已提交
1443
	mnt_drop_write_file(filp);
D
Dave Chinner 已提交
1444
	return error;
L
Lachlan McIlroy 已提交
1445
}
L
Linus Torvalds 已提交
1446

L
Lachlan McIlroy 已提交
1447 1448 1449 1450 1451 1452
STATIC int
xfs_ioc_getxflags(
	xfs_inode_t		*ip,
	void			__user *arg)
{
	unsigned int		flags;
L
Linus Torvalds 已提交
1453

L
Lachlan McIlroy 已提交
1454 1455 1456 1457 1458
	flags = xfs_di2lxflags(ip->i_d.di_flags);
	if (copy_to_user(arg, &flags, sizeof(flags)))
		return -EFAULT;
	return 0;
}
L
Linus Torvalds 已提交
1459

L
Lachlan McIlroy 已提交
1460 1461
STATIC int
xfs_ioc_setxflags(
1462
	struct xfs_inode	*ip,
L
Lachlan McIlroy 已提交
1463 1464 1465
	struct file		*filp,
	void			__user *arg)
{
1466
	struct xfs_trans	*tp;
1467
	struct fsxattr		fa;
1468
	struct fsxattr		old_fa;
L
Lachlan McIlroy 已提交
1469
	unsigned int		flags;
1470
	int			join_flags = 0;
1471
	int			error;
L
Linus Torvalds 已提交
1472

L
Lachlan McIlroy 已提交
1473 1474
	if (copy_from_user(&flags, arg, sizeof(flags)))
		return -EFAULT;
L
Linus Torvalds 已提交
1475

L
Lachlan McIlroy 已提交
1476 1477 1478 1479
	if (flags & ~(FS_IMMUTABLE_FL | FS_APPEND_FL | \
		      FS_NOATIME_FL | FS_NODUMP_FL | \
		      FS_SYNC_FL))
		return -EOPNOTSUPP;
L
Linus Torvalds 已提交
1480

1481
	fa.fsx_xflags = xfs_merge_ioc_xflags(flags, xfs_ip2xflags(ip));
L
Linus Torvalds 已提交
1482

J
Jan Kara 已提交
1483 1484 1485
	error = mnt_want_write_file(filp);
	if (error)
		return error;
1486

1487 1488 1489 1490 1491 1492 1493 1494 1495 1496 1497 1498
	/*
	 * Changing DAX config may require inode locking for mapping
	 * invalidation. These need to be held all the way to transaction commit
	 * or cancel time, so need to be passed through to
	 * xfs_ioctl_setattr_get_trans() so it can apply them to the join call
	 * appropriately.
	 */
	error = xfs_ioctl_setattr_dax_invalidate(ip, &fa, &join_flags);
	if (error)
		goto out_drop_write;

	tp = xfs_ioctl_setattr_get_trans(ip, join_flags);
1499 1500 1501 1502 1503
	if (IS_ERR(tp)) {
		error = PTR_ERR(tp);
		goto out_drop_write;
	}

1504 1505 1506 1507 1508 1509 1510
	xfs_fill_fsxattr(ip, false, &old_fa);
	error = vfs_ioc_fssetxattr_check(VFS_I(ip), &old_fa, &fa);
	if (error) {
		xfs_trans_cancel(tp);
		goto out_drop_write;
	}

1511 1512
	error = xfs_ioctl_setattr_xflags(tp, ip, &fa);
	if (error) {
1513
		xfs_trans_cancel(tp);
1514 1515 1516
		goto out_drop_write;
	}

1517
	error = xfs_trans_commit(tp);
1518
out_drop_write:
J
Jan Kara 已提交
1519
	mnt_drop_write_file(filp);
D
Dave Chinner 已提交
1520
	return error;
L
Linus Torvalds 已提交
1521 1522
}

1523 1524 1525 1526 1527
static bool
xfs_getbmap_format(
	struct kgetbmap		*p,
	struct getbmapx __user	*u,
	size_t			recsize)
1528
{
1529 1530 1531 1532 1533 1534 1535 1536 1537 1538 1539 1540 1541 1542
	if (put_user(p->bmv_offset, &u->bmv_offset) ||
	    put_user(p->bmv_block, &u->bmv_block) ||
	    put_user(p->bmv_length, &u->bmv_length) ||
	    put_user(0, &u->bmv_count) ||
	    put_user(0, &u->bmv_entries))
		return false;
	if (recsize < sizeof(struct getbmapx))
		return true;
	if (put_user(0, &u->bmv_iflags) ||
	    put_user(p->bmv_oflags, &u->bmv_oflags) ||
	    put_user(0, &u->bmv_unused1) ||
	    put_user(0, &u->bmv_unused2))
		return false;
	return true;
1543 1544
}

L
Linus Torvalds 已提交
1545 1546
STATIC int
xfs_ioc_getbmap(
1547
	struct file		*file,
L
Linus Torvalds 已提交
1548 1549 1550
	unsigned int		cmd,
	void			__user *arg)
{
1551
	struct getbmapx		bmx = { 0 };
1552 1553 1554
	struct kgetbmap		*buf;
	size_t			recsize;
	int			error, i;
L
Linus Torvalds 已提交
1555

1556 1557 1558 1559 1560 1561 1562 1563 1564 1565 1566 1567 1568 1569
	switch (cmd) {
	case XFS_IOC_GETBMAPA:
		bmx.bmv_iflags = BMV_IF_ATTRFORK;
		/*FALLTHRU*/
	case XFS_IOC_GETBMAP:
		if (file->f_mode & FMODE_NOCMTIME)
			bmx.bmv_iflags |= BMV_IF_NO_DMAPI_READ;
		/* struct getbmap is a strict subset of struct getbmapx. */
		recsize = sizeof(struct getbmap);
		break;
	case XFS_IOC_GETBMAPX:
		recsize = sizeof(struct getbmapx);
		break;
	default:
E
Eric Sandeen 已提交
1570
		return -EINVAL;
1571
	}
L
Linus Torvalds 已提交
1572

1573
	if (copy_from_user(&bmx, arg, recsize))
E
Eric Sandeen 已提交
1574
		return -EFAULT;
L
Linus Torvalds 已提交
1575 1576

	if (bmx.bmv_count < 2)
E
Eric Sandeen 已提交
1577
		return -EINVAL;
1578 1579
	if (bmx.bmv_count > ULONG_MAX / recsize)
		return -ENOMEM;
L
Linus Torvalds 已提交
1580

1581 1582 1583
	buf = kmem_zalloc_large(bmx.bmv_count * sizeof(*buf), 0);
	if (!buf)
		return -ENOMEM;
L
Linus Torvalds 已提交
1584

1585
	error = xfs_getbmap(XFS_I(file_inode(file)), &bmx, buf);
L
Linus Torvalds 已提交
1586
	if (error)
1587
		goto out_free_buf;
L
Linus Torvalds 已提交
1588

1589 1590 1591 1592 1593 1594 1595 1596 1597 1598
	error = -EFAULT;
	if (copy_to_user(arg, &bmx, recsize))
		goto out_free_buf;
	arg += recsize;

	for (i = 0; i < bmx.bmv_entries; i++) {
		if (!xfs_getbmap_format(buf + i, arg, recsize))
			goto out_free_buf;
		arg += recsize;
	}
L
Linus Torvalds 已提交
1599

1600 1601 1602
	error = 0;
out_free_buf:
	kmem_free(buf);
1603
	return error;
L
Linus Torvalds 已提交
1604
}
L
Lachlan McIlroy 已提交
1605

1606 1607
struct getfsmap_info {
	struct xfs_mount	*mp;
1608 1609
	struct fsmap_head __user *data;
	unsigned int		idx;
1610 1611 1612 1613 1614 1615 1616 1617 1618 1619 1620 1621 1622
	__u32			last_flags;
};

STATIC int
xfs_getfsmap_format(struct xfs_fsmap *xfm, void *priv)
{
	struct getfsmap_info	*info = priv;
	struct fsmap		fm;

	trace_xfs_getfsmap_mapping(info->mp, xfm);

	info->last_flags = xfm->fmr_flags;
	xfs_fsmap_from_internal(&fm, xfm);
1623 1624
	if (copy_to_user(&info->data->fmh_recs[info->idx++], &fm,
			sizeof(struct fsmap)))
1625 1626 1627 1628 1629 1630 1631 1632
		return -EFAULT;

	return 0;
}

STATIC int
xfs_ioc_getfsmap(
	struct xfs_inode	*ip,
1633
	struct fsmap_head	__user *arg)
1634
{
1635
	struct getfsmap_info	info = { NULL };
1636 1637 1638 1639 1640 1641 1642 1643 1644 1645 1646 1647 1648 1649 1650 1651 1652 1653 1654 1655 1656 1657 1658
	struct xfs_fsmap_head	xhead = {0};
	struct fsmap_head	head;
	bool			aborted = false;
	int			error;

	if (copy_from_user(&head, arg, sizeof(struct fsmap_head)))
		return -EFAULT;
	if (memchr_inv(head.fmh_reserved, 0, sizeof(head.fmh_reserved)) ||
	    memchr_inv(head.fmh_keys[0].fmr_reserved, 0,
		       sizeof(head.fmh_keys[0].fmr_reserved)) ||
	    memchr_inv(head.fmh_keys[1].fmr_reserved, 0,
		       sizeof(head.fmh_keys[1].fmr_reserved)))
		return -EINVAL;

	xhead.fmh_iflags = head.fmh_iflags;
	xhead.fmh_count = head.fmh_count;
	xfs_fsmap_to_internal(&xhead.fmh_keys[0], &head.fmh_keys[0]);
	xfs_fsmap_to_internal(&xhead.fmh_keys[1], &head.fmh_keys[1]);

	trace_xfs_getfsmap_low_key(ip->i_mount, &xhead.fmh_keys[0]);
	trace_xfs_getfsmap_high_key(ip->i_mount, &xhead.fmh_keys[1]);

	info.mp = ip->i_mount;
1659
	info.data = arg;
1660 1661 1662 1663 1664 1665 1666 1667
	error = xfs_getfsmap(ip->i_mount, &xhead, xfs_getfsmap_format, &info);
	if (error == XFS_BTREE_QUERY_RANGE_ABORT) {
		error = 0;
		aborted = true;
	} else if (error)
		return error;

	/* If we didn't abort, set the "last" flag in the last fmx */
1668
	if (!aborted && info.idx) {
1669
		info.last_flags |= FMR_OF_LAST;
1670 1671
		if (copy_to_user(&info.data->fmh_recs[info.idx - 1].fmr_flags,
				&info.last_flags, sizeof(info.last_flags)))
1672 1673 1674 1675 1676 1677 1678 1679 1680 1681 1682 1683
			return -EFAULT;
	}

	/* copy back header */
	head.fmh_entries = xhead.fmh_entries;
	head.fmh_oflags = xhead.fmh_oflags;
	if (copy_to_user(arg, &head, sizeof(struct fsmap_head)))
		return -EFAULT;

	return 0;
}

1684 1685 1686 1687 1688 1689 1690 1691 1692 1693 1694 1695 1696 1697 1698 1699 1700 1701 1702 1703 1704 1705 1706 1707
STATIC int
xfs_ioc_scrub_metadata(
	struct xfs_inode		*ip,
	void				__user *arg)
{
	struct xfs_scrub_metadata	scrub;
	int				error;

	if (!capable(CAP_SYS_ADMIN))
		return -EPERM;

	if (copy_from_user(&scrub, arg, sizeof(scrub)))
		return -EFAULT;

	error = xfs_scrub_metadata(ip, &scrub);
	if (error)
		return error;

	if (copy_to_user(arg, &scrub, sizeof(scrub)))
		return -EFAULT;

	return 0;
}

D
Dave Chinner 已提交
1708 1709 1710 1711 1712 1713 1714 1715 1716 1717 1718
int
xfs_ioc_swapext(
	xfs_swapext_t	*sxp)
{
	xfs_inode_t     *ip, *tip;
	struct fd	f, tmp;
	int		error = 0;

	/* Pull information for the target fd */
	f = fdget((int)sxp->sx_fdtarget);
	if (!f.file) {
D
Dave Chinner 已提交
1719
		error = -EINVAL;
D
Dave Chinner 已提交
1720 1721 1722 1723 1724 1725
		goto out;
	}

	if (!(f.file->f_mode & FMODE_WRITE) ||
	    !(f.file->f_mode & FMODE_READ) ||
	    (f.file->f_flags & O_APPEND)) {
D
Dave Chinner 已提交
1726
		error = -EBADF;
D
Dave Chinner 已提交
1727 1728 1729 1730 1731
		goto out_put_file;
	}

	tmp = fdget((int)sxp->sx_fdtmp);
	if (!tmp.file) {
D
Dave Chinner 已提交
1732
		error = -EINVAL;
D
Dave Chinner 已提交
1733 1734 1735 1736 1737 1738
		goto out_put_file;
	}

	if (!(tmp.file->f_mode & FMODE_WRITE) ||
	    !(tmp.file->f_mode & FMODE_READ) ||
	    (tmp.file->f_flags & O_APPEND)) {
D
Dave Chinner 已提交
1739
		error = -EBADF;
D
Dave Chinner 已提交
1740 1741 1742 1743 1744
		goto out_put_tmp_file;
	}

	if (IS_SWAPFILE(file_inode(f.file)) ||
	    IS_SWAPFILE(file_inode(tmp.file))) {
D
Dave Chinner 已提交
1745
		error = -EINVAL;
D
Dave Chinner 已提交
1746 1747 1748
		goto out_put_tmp_file;
	}

1749 1750 1751 1752 1753 1754 1755 1756 1757 1758 1759
	/*
	 * We need to ensure that the fds passed in point to XFS inodes
	 * before we cast and access them as XFS structures as we have no
	 * control over what the user passes us here.
	 */
	if (f.file->f_op != &xfs_file_operations ||
	    tmp.file->f_op != &xfs_file_operations) {
		error = -EINVAL;
		goto out_put_tmp_file;
	}

D
Dave Chinner 已提交
1760 1761 1762 1763
	ip = XFS_I(file_inode(f.file));
	tip = XFS_I(file_inode(tmp.file));

	if (ip->i_mount != tip->i_mount) {
D
Dave Chinner 已提交
1764
		error = -EINVAL;
D
Dave Chinner 已提交
1765 1766 1767 1768
		goto out_put_tmp_file;
	}

	if (ip->i_ino == tip->i_ino) {
D
Dave Chinner 已提交
1769
		error = -EINVAL;
D
Dave Chinner 已提交
1770 1771 1772 1773
		goto out_put_tmp_file;
	}

	if (XFS_FORCED_SHUTDOWN(ip->i_mount)) {
D
Dave Chinner 已提交
1774
		error = -EIO;
D
Dave Chinner 已提交
1775 1776 1777 1778 1779 1780 1781 1782 1783 1784 1785 1786 1787
		goto out_put_tmp_file;
	}

	error = xfs_swap_extents(ip, tip, sxp);

 out_put_tmp_file:
	fdput(tmp);
 out_put_file:
	fdput(f);
 out:
	return error;
}

1788 1789 1790 1791 1792 1793 1794 1795 1796 1797 1798
static int
xfs_ioc_getlabel(
	struct xfs_mount	*mp,
	char			__user *user_label)
{
	struct xfs_sb		*sbp = &mp->m_sb;
	char			label[XFSLABEL_MAX + 1];

	/* Paranoia */
	BUILD_BUG_ON(sizeof(sbp->sb_fname) > FSLABEL_MAX);

1799 1800
	/* 1 larger than sb_fname, so this ensures a trailing NUL char */
	memset(label, 0, sizeof(label));
1801
	spin_lock(&mp->m_sb_lock);
1802
	strncpy(label, sbp->sb_fname, XFSLABEL_MAX);
1803 1804
	spin_unlock(&mp->m_sb_lock);

1805
	if (copy_to_user(user_label, label, sizeof(label)))
1806 1807 1808 1809 1810 1811 1812 1813 1814 1815 1816 1817 1818 1819 1820 1821 1822 1823 1824 1825 1826 1827 1828 1829 1830 1831 1832 1833 1834 1835 1836 1837 1838 1839 1840
		return -EFAULT;
	return 0;
}

static int
xfs_ioc_setlabel(
	struct file		*filp,
	struct xfs_mount	*mp,
	char			__user *newlabel)
{
	struct xfs_sb		*sbp = &mp->m_sb;
	char			label[XFSLABEL_MAX + 1];
	size_t			len;
	int			error;

	if (!capable(CAP_SYS_ADMIN))
		return -EPERM;
	/*
	 * The generic ioctl allows up to FSLABEL_MAX chars, but XFS is much
	 * smaller, at 12 bytes.  We copy one more to be sure we find the
	 * (required) NULL character to test the incoming label length.
	 * NB: The on disk label doesn't need to be null terminated.
	 */
	if (copy_from_user(label, newlabel, XFSLABEL_MAX + 1))
		return -EFAULT;
	len = strnlen(label, XFSLABEL_MAX + 1);
	if (len > sizeof(sbp->sb_fname))
		return -EINVAL;

	error = mnt_want_write_file(filp);
	if (error)
		return error;

	spin_lock(&mp->m_sb_lock);
	memset(sbp->sb_fname, 0, sizeof(sbp->sb_fname));
1841
	memcpy(sbp->sb_fname, label, len);
1842 1843 1844 1845 1846 1847 1848 1849 1850 1851 1852 1853 1854 1855 1856 1857 1858 1859 1860 1861 1862 1863 1864 1865 1866 1867 1868 1869
	spin_unlock(&mp->m_sb_lock);

	/*
	 * Now we do several things to satisfy userspace.
	 * In addition to normal logging of the primary superblock, we also
	 * immediately write these changes to sector zero for the primary, then
	 * update all backup supers (as xfs_db does for a label change), then
	 * invalidate the block device page cache.  This is so that any prior
	 * buffered reads from userspace (i.e. from blkid) are invalidated,
	 * and userspace will see the newly-written label.
	 */
	error = xfs_sync_sb_buf(mp);
	if (error)
		goto out;
	/*
	 * growfs also updates backup supers so lock against that.
	 */
	mutex_lock(&mp->m_growlock);
	error = xfs_update_secondary_sbs(mp);
	mutex_unlock(&mp->m_growlock);

	invalidate_bdev(mp->m_ddev_targp->bt_bdev);

out:
	mnt_drop_write_file(filp);
	return error;
}

1870 1871 1872 1873 1874 1875 1876 1877
/*
 * Note: some of the ioctl's return positive numbers as a
 * byte count indicating success, such as readlink_by_handle.
 * So we don't "sign flip" like most other routines.  This means
 * true errors need to be returned as a negative value.
 */
long
xfs_file_ioctl(
L
Lachlan McIlroy 已提交
1878 1879
	struct file		*filp,
	unsigned int		cmd,
1880
	unsigned long		p)
L
Lachlan McIlroy 已提交
1881
{
A
Al Viro 已提交
1882
	struct inode		*inode = file_inode(filp);
1883 1884 1885
	struct xfs_inode	*ip = XFS_I(inode);
	struct xfs_mount	*mp = ip->i_mount;
	void			__user *arg = (void __user *)p;
L
Lachlan McIlroy 已提交
1886 1887
	int			error;

C
Christoph Hellwig 已提交
1888
	trace_xfs_file_ioctl(ip);
1889 1890

	switch (cmd) {
C
Christoph Hellwig 已提交
1891 1892
	case FITRIM:
		return xfs_ioc_trim(mp, arg);
1893 1894 1895 1896
	case FS_IOC_GETFSLABEL:
		return xfs_ioc_getlabel(mp, arg);
	case FS_IOC_SETFSLABEL:
		return xfs_ioc_setlabel(filp, mp, arg);
L
Lachlan McIlroy 已提交
1897 1898 1899 1900 1901 1902 1903
	case XFS_IOC_ALLOCSP:
	case XFS_IOC_FREESP:
	case XFS_IOC_RESVSP:
	case XFS_IOC_UNRESVSP:
	case XFS_IOC_ALLOCSP64:
	case XFS_IOC_FREESP64:
	case XFS_IOC_RESVSP64:
D
Dave Chinner 已提交
1904 1905
	case XFS_IOC_UNRESVSP64:
	case XFS_IOC_ZERO_RANGE: {
1906
		xfs_flock64_t		bf;
L
Lachlan McIlroy 已提交
1907

1908
		if (copy_from_user(&bf, arg, sizeof(bf)))
E
Eric Sandeen 已提交
1909
			return -EFAULT;
1910
		return xfs_ioc_space(filp, cmd, &bf);
1911
	}
L
Lachlan McIlroy 已提交
1912 1913 1914 1915 1916 1917
	case XFS_IOC_DIOINFO: {
		struct dioattr	da;
		xfs_buftarg_t	*target =
			XFS_IS_REALTIME_INODE(ip) ?
			mp->m_rtdev_targp : mp->m_ddev_targp;

1918
		da.d_mem =  da.d_miniosz = target->bt_logical_sectorsize;
L
Lachlan McIlroy 已提交
1919 1920 1921
		da.d_maxiosz = INT_MAX & ~(da.d_miniosz - 1);

		if (copy_to_user(arg, &da, sizeof(da)))
E
Eric Sandeen 已提交
1922
			return -EFAULT;
L
Lachlan McIlroy 已提交
1923 1924 1925 1926 1927 1928 1929 1930 1931
		return 0;
	}

	case XFS_IOC_FSBULKSTAT_SINGLE:
	case XFS_IOC_FSBULKSTAT:
	case XFS_IOC_FSINUMBERS:
		return xfs_ioc_bulkstat(mp, cmd, arg);

	case XFS_IOC_FSGEOMETRY_V1:
1932 1933 1934
		return xfs_ioc_fsgeometry(mp, arg, 3);
	case XFS_IOC_FSGEOMETRY_V4:
		return xfs_ioc_fsgeometry(mp, arg, 4);
L
Lachlan McIlroy 已提交
1935
	case XFS_IOC_FSGEOMETRY:
1936
		return xfs_ioc_fsgeometry(mp, arg, 5);
L
Lachlan McIlroy 已提交
1937

1938 1939 1940
	case XFS_IOC_AG_GEOMETRY:
		return xfs_ioc_ag_geometry(mp, arg);

L
Lachlan McIlroy 已提交
1941 1942 1943 1944 1945 1946 1947
	case XFS_IOC_GETVERSION:
		return put_user(inode->i_generation, (int __user *)arg);

	case XFS_IOC_FSGETXATTR:
		return xfs_ioc_fsgetxattr(ip, 0, arg);
	case XFS_IOC_FSGETXATTRA:
		return xfs_ioc_fsgetxattr(ip, 1, arg);
L
Lachlan McIlroy 已提交
1948 1949
	case XFS_IOC_FSSETXATTR:
		return xfs_ioc_fssetxattr(ip, filp, arg);
L
Lachlan McIlroy 已提交
1950
	case XFS_IOC_GETXFLAGS:
L
Lachlan McIlroy 已提交
1951
		return xfs_ioc_getxflags(ip, arg);
L
Lachlan McIlroy 已提交
1952
	case XFS_IOC_SETXFLAGS:
L
Lachlan McIlroy 已提交
1953
		return xfs_ioc_setxflags(ip, filp, arg);
L
Lachlan McIlroy 已提交
1954 1955 1956 1957 1958

	case XFS_IOC_FSSETDM: {
		struct fsdmidata	dmi;

		if (copy_from_user(&dmi, arg, sizeof(dmi)))
E
Eric Sandeen 已提交
1959
			return -EFAULT;
L
Lachlan McIlroy 已提交
1960

J
Jan Kara 已提交
1961 1962 1963 1964
		error = mnt_want_write_file(filp);
		if (error)
			return error;

L
Lachlan McIlroy 已提交
1965 1966
		error = xfs_set_dmattrs(ip, dmi.fsd_dmevmask,
				dmi.fsd_dmstate);
J
Jan Kara 已提交
1967
		mnt_drop_write_file(filp);
D
Dave Chinner 已提交
1968
		return error;
L
Lachlan McIlroy 已提交
1969 1970 1971 1972 1973
	}

	case XFS_IOC_GETBMAP:
	case XFS_IOC_GETBMAPA:
	case XFS_IOC_GETBMAPX:
1974
		return xfs_ioc_getbmap(filp, cmd, arg);
L
Lachlan McIlroy 已提交
1975

1976 1977 1978
	case FS_IOC_GETFSMAP:
		return xfs_ioc_getfsmap(ip, arg);

1979 1980 1981
	case XFS_IOC_SCRUB_METADATA:
		return xfs_ioc_scrub_metadata(ip, arg);

L
Lachlan McIlroy 已提交
1982 1983
	case XFS_IOC_FD_TO_HANDLE:
	case XFS_IOC_PATH_TO_HANDLE:
1984 1985
	case XFS_IOC_PATH_TO_FSHANDLE: {
		xfs_fsop_handlereq_t	hreq;
L
Lachlan McIlroy 已提交
1986

1987
		if (copy_from_user(&hreq, arg, sizeof(hreq)))
E
Eric Sandeen 已提交
1988
			return -EFAULT;
1989 1990 1991 1992
		return xfs_find_handle(cmd, &hreq);
	}
	case XFS_IOC_OPEN_BY_HANDLE: {
		xfs_fsop_handlereq_t	hreq;
L
Lachlan McIlroy 已提交
1993

1994
		if (copy_from_user(&hreq, arg, sizeof(xfs_fsop_handlereq_t)))
E
Eric Sandeen 已提交
1995
			return -EFAULT;
1996
		return xfs_open_by_handle(filp, &hreq);
1997
	}
L
Lachlan McIlroy 已提交
1998
	case XFS_IOC_FSSETDM_BY_HANDLE:
1999
		return xfs_fssetdm_by_handle(filp, arg);
L
Lachlan McIlroy 已提交
2000

2001 2002
	case XFS_IOC_READLINK_BY_HANDLE: {
		xfs_fsop_handlereq_t	hreq;
L
Lachlan McIlroy 已提交
2003

2004
		if (copy_from_user(&hreq, arg, sizeof(xfs_fsop_handlereq_t)))
E
Eric Sandeen 已提交
2005
			return -EFAULT;
2006
		return xfs_readlink_by_handle(filp, &hreq);
2007
	}
L
Lachlan McIlroy 已提交
2008
	case XFS_IOC_ATTRLIST_BY_HANDLE:
2009
		return xfs_attrlist_by_handle(filp, arg);
L
Lachlan McIlroy 已提交
2010 2011

	case XFS_IOC_ATTRMULTI_BY_HANDLE:
2012
		return xfs_attrmulti_by_handle(filp, arg);
L
Lachlan McIlroy 已提交
2013 2014

	case XFS_IOC_SWAPEXT: {
2015 2016 2017
		struct xfs_swapext	sxp;

		if (copy_from_user(&sxp, arg, sizeof(xfs_swapext_t)))
E
Eric Sandeen 已提交
2018
			return -EFAULT;
J
Jan Kara 已提交
2019 2020 2021
		error = mnt_want_write_file(filp);
		if (error)
			return error;
D
Dave Chinner 已提交
2022
		error = xfs_ioc_swapext(&sxp);
J
Jan Kara 已提交
2023
		mnt_drop_write_file(filp);
D
Dave Chinner 已提交
2024
		return error;
L
Lachlan McIlroy 已提交
2025 2026 2027 2028 2029
	}

	case XFS_IOC_FSCOUNTS: {
		xfs_fsop_counts_t out;

2030
		xfs_fs_counts(mp, &out);
L
Lachlan McIlroy 已提交
2031 2032

		if (copy_to_user(arg, &out, sizeof(out)))
E
Eric Sandeen 已提交
2033
			return -EFAULT;
L
Lachlan McIlroy 已提交
2034 2035 2036 2037 2038
		return 0;
	}

	case XFS_IOC_SET_RESBLKS: {
		xfs_fsop_resblks_t inout;
2039
		uint64_t	   in;
L
Lachlan McIlroy 已提交
2040 2041 2042 2043

		if (!capable(CAP_SYS_ADMIN))
			return -EPERM;

E
Eric Sandeen 已提交
2044
		if (mp->m_flags & XFS_MOUNT_RDONLY)
E
Eric Sandeen 已提交
2045
			return -EROFS;
E
Eric Sandeen 已提交
2046

L
Lachlan McIlroy 已提交
2047
		if (copy_from_user(&inout, arg, sizeof(inout)))
E
Eric Sandeen 已提交
2048
			return -EFAULT;
L
Lachlan McIlroy 已提交
2049

J
Jan Kara 已提交
2050 2051 2052 2053
		error = mnt_want_write_file(filp);
		if (error)
			return error;

L
Lachlan McIlroy 已提交
2054 2055 2056
		/* input parameter is passed in resblks field of structure */
		in = inout.resblks;
		error = xfs_reserve_blocks(mp, &in, &inout);
J
Jan Kara 已提交
2057
		mnt_drop_write_file(filp);
L
Lachlan McIlroy 已提交
2058
		if (error)
D
Dave Chinner 已提交
2059
			return error;
L
Lachlan McIlroy 已提交
2060 2061

		if (copy_to_user(arg, &inout, sizeof(inout)))
E
Eric Sandeen 已提交
2062
			return -EFAULT;
L
Lachlan McIlroy 已提交
2063 2064 2065 2066 2067 2068 2069 2070 2071 2072 2073
		return 0;
	}

	case XFS_IOC_GET_RESBLKS: {
		xfs_fsop_resblks_t out;

		if (!capable(CAP_SYS_ADMIN))
			return -EPERM;

		error = xfs_reserve_blocks(mp, NULL, &out);
		if (error)
D
Dave Chinner 已提交
2074
			return error;
L
Lachlan McIlroy 已提交
2075 2076

		if (copy_to_user(arg, &out, sizeof(out)))
E
Eric Sandeen 已提交
2077
			return -EFAULT;
L
Lachlan McIlroy 已提交
2078 2079 2080 2081 2082 2083 2084 2085

		return 0;
	}

	case XFS_IOC_FSGROWFSDATA: {
		xfs_growfs_data_t in;

		if (copy_from_user(&in, arg, sizeof(in)))
E
Eric Sandeen 已提交
2086
			return -EFAULT;
L
Lachlan McIlroy 已提交
2087

J
Jan Kara 已提交
2088 2089 2090
		error = mnt_want_write_file(filp);
		if (error)
			return error;
L
Lachlan McIlroy 已提交
2091
		error = xfs_growfs_data(mp, &in);
J
Jan Kara 已提交
2092
		mnt_drop_write_file(filp);
D
Dave Chinner 已提交
2093
		return error;
L
Lachlan McIlroy 已提交
2094 2095 2096 2097 2098 2099
	}

	case XFS_IOC_FSGROWFSLOG: {
		xfs_growfs_log_t in;

		if (copy_from_user(&in, arg, sizeof(in)))
E
Eric Sandeen 已提交
2100
			return -EFAULT;
L
Lachlan McIlroy 已提交
2101

J
Jan Kara 已提交
2102 2103 2104
		error = mnt_want_write_file(filp);
		if (error)
			return error;
L
Lachlan McIlroy 已提交
2105
		error = xfs_growfs_log(mp, &in);
J
Jan Kara 已提交
2106
		mnt_drop_write_file(filp);
D
Dave Chinner 已提交
2107
		return error;
L
Lachlan McIlroy 已提交
2108 2109 2110 2111 2112 2113
	}

	case XFS_IOC_FSGROWFSRT: {
		xfs_growfs_rt_t in;

		if (copy_from_user(&in, arg, sizeof(in)))
E
Eric Sandeen 已提交
2114
			return -EFAULT;
L
Lachlan McIlroy 已提交
2115

J
Jan Kara 已提交
2116 2117 2118
		error = mnt_want_write_file(filp);
		if (error)
			return error;
L
Lachlan McIlroy 已提交
2119
		error = xfs_growfs_rt(mp, &in);
J
Jan Kara 已提交
2120
		mnt_drop_write_file(filp);
D
Dave Chinner 已提交
2121
		return error;
L
Lachlan McIlroy 已提交
2122 2123 2124
	}

	case XFS_IOC_GOINGDOWN: {
2125
		uint32_t in;
L
Lachlan McIlroy 已提交
2126 2127 2128 2129

		if (!capable(CAP_SYS_ADMIN))
			return -EPERM;

2130
		if (get_user(in, (uint32_t __user *)arg))
E
Eric Sandeen 已提交
2131
			return -EFAULT;
L
Lachlan McIlroy 已提交
2132

D
Dave Chinner 已提交
2133
		return xfs_fs_goingdown(mp, in);
L
Lachlan McIlroy 已提交
2134 2135 2136 2137 2138 2139 2140 2141 2142
	}

	case XFS_IOC_ERROR_INJECTION: {
		xfs_error_injection_t in;

		if (!capable(CAP_SYS_ADMIN))
			return -EPERM;

		if (copy_from_user(&in, arg, sizeof(in)))
E
Eric Sandeen 已提交
2143
			return -EFAULT;
L
Lachlan McIlroy 已提交
2144

2145
		return xfs_errortag_add(mp, in.errtag);
L
Lachlan McIlroy 已提交
2146 2147 2148 2149 2150 2151
	}

	case XFS_IOC_ERROR_CLEARALL:
		if (!capable(CAP_SYS_ADMIN))
			return -EPERM;

2152
		return xfs_errortag_clearall(mp);
L
Lachlan McIlroy 已提交
2153

2154
	case XFS_IOC_FREE_EOFBLOCKS: {
2155 2156
		struct xfs_fs_eofblocks eofb;
		struct xfs_eofblocks keofb;
2157

2158 2159 2160 2161
		if (!capable(CAP_SYS_ADMIN))
			return -EPERM;

		if (mp->m_flags & XFS_MOUNT_RDONLY)
E
Eric Sandeen 已提交
2162
			return -EROFS;
2163

2164
		if (copy_from_user(&eofb, arg, sizeof(eofb)))
E
Eric Sandeen 已提交
2165
			return -EFAULT;
2166

2167 2168
		error = xfs_fs_eofblocks_from_user(&eofb, &keofb);
		if (error)
D
Dave Chinner 已提交
2169
			return error;
2170

D
Dave Chinner 已提交
2171
		return xfs_icache_free_eofblocks(mp, &keofb);
2172 2173
	}

L
Lachlan McIlroy 已提交
2174 2175 2176 2177
	default:
		return -ENOTTY;
	}
}