/*
 * Copyright (c) 2000-2005 Silicon Graphics, Inc.
 * All Rights Reserved.
 *
 * This program is free software; you can redistribute it and/or
 * modify it under the terms of the GNU General Public License as
 * published by the Free Software Foundation.
 *
 * This program is distributed in the hope that it would be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program; if not, write the Free Software Foundation,
 * Inc.,  51 Franklin St, Fifth Floor, Boston, MA  02110-1301  USA
 */
#include "xfs.h"
19
#include "xfs_bit.h"
L
Linus Torvalds 已提交
20
#include "xfs_log.h"
21
#include "xfs_inum.h"
L
Linus Torvalds 已提交
22
#include "xfs_sb.h"
23
#include "xfs_ag.h"
L
Linus Torvalds 已提交
24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43
#include "xfs_dir2.h"
#include "xfs_trans.h"
#include "xfs_dmapi.h"
#include "xfs_mount.h"
#include "xfs_bmap_btree.h"
#include "xfs_alloc_btree.h"
#include "xfs_ialloc_btree.h"
#include "xfs_alloc.h"
#include "xfs_btree.h"
#include "xfs_attr_sf.h"
#include "xfs_dir2_sf.h"
#include "xfs_dinode.h"
#include "xfs_inode.h"
#include "xfs_error.h"
#include "xfs_rw.h"
#include "xfs_ioctl32.h"

#include <linux/dcache.h>
#include <linux/smp_lock.h>

44
/*
 * Tentative declarations: the tables are filled in at the bottom of this
 * file, but xfs_file_mmap() takes their addresses before that point.
 */
static struct vm_operations_struct xfs_file_vm_ops;
#ifdef CONFIG_XFS_DMAPI
static struct vm_operations_struct xfs_dmapi_file_vm_ops;
#endif
L
Linus Torvalds 已提交
48

49
STATIC_INLINE ssize_t
50
__xfs_file_read(
L
Linus Torvalds 已提交
51
	struct kiocb		*iocb,
52 53
	const struct iovec	*iov,
	unsigned long		nr_segs,
L
Linus Torvalds 已提交
54 55 56 57
	int			ioflags,
	loff_t			pos)
{
	struct file		*file = iocb->ki_filp;
58
	bhv_vnode_t		*vp = vn_from_inode(file->f_path.dentry->d_inode);
L
Linus Torvalds 已提交
59 60 61 62

	BUG_ON(iocb->ki_pos != pos);
	if (unlikely(file->f_flags & O_DIRECT))
		ioflags |= IO_ISDIRECT;
63 64
	return bhv_vop_read(vp, iocb, iov, nr_segs, &iocb->ki_pos,
				ioflags, NULL);
L
Linus Torvalds 已提交
65 66 67
}

STATIC ssize_t
68
xfs_file_aio_read(
L
Linus Torvalds 已提交
69
	struct kiocb		*iocb,
70 71
	const struct iovec	*iov,
	unsigned long		nr_segs,
L
Linus Torvalds 已提交
72 73
	loff_t			pos)
{
74
	return __xfs_file_read(iocb, iov, nr_segs, IO_ISAIO, pos);
L
Linus Torvalds 已提交
75 76 77
}

STATIC ssize_t
78
xfs_file_aio_read_invis(
L
Linus Torvalds 已提交
79
	struct kiocb		*iocb,
80 81
	const struct iovec	*iov,
	unsigned long		nr_segs,
L
Linus Torvalds 已提交
82 83
	loff_t			pos)
{
84
	return __xfs_file_read(iocb, iov, nr_segs, IO_ISAIO|IO_INVIS, pos);
L
Linus Torvalds 已提交
85 86
}

87
STATIC_INLINE ssize_t
88
__xfs_file_write(
89 90 91 92 93
	struct kiocb		*iocb,
	const struct iovec	*iov,
	unsigned long		nr_segs,
	int			ioflags,
	loff_t			pos)
L
Linus Torvalds 已提交
94 95 96
{
	struct file	*file = iocb->ki_filp;
	struct inode	*inode = file->f_mapping->host;
97
	bhv_vnode_t	*vp = vn_from_inode(inode);
L
Linus Torvalds 已提交
98 99 100 101

	BUG_ON(iocb->ki_pos != pos);
	if (unlikely(file->f_flags & O_DIRECT))
		ioflags |= IO_ISDIRECT;
102 103
	return bhv_vop_write(vp, iocb, iov, nr_segs, &iocb->ki_pos,
				ioflags, NULL);
L
Linus Torvalds 已提交
104 105 106
}

STATIC ssize_t
107
xfs_file_aio_write(
L
Linus Torvalds 已提交
108
	struct kiocb		*iocb,
109 110
	const struct iovec	*iov,
	unsigned long		nr_segs,
L
Linus Torvalds 已提交
111 112
	loff_t			pos)
{
113
	return __xfs_file_write(iocb, iov, nr_segs, IO_ISAIO, pos);
L
Linus Torvalds 已提交
114 115 116
}

STATIC ssize_t
117
xfs_file_aio_write_invis(
L
Linus Torvalds 已提交
118
	struct kiocb		*iocb,
119 120
	const struct iovec	*iov,
	unsigned long		nr_segs,
L
Linus Torvalds 已提交
121 122
	loff_t			pos)
{
123
	return __xfs_file_write(iocb, iov, nr_segs, IO_ISAIO|IO_INVIS, pos);
L
Linus Torvalds 已提交
124 125
}

126 127 128
/*
 * .splice_read handler for xfs_file_operations.  Forwards to
 * bhv_vop_splice_read() on the vnode behind @infilp with no extra
 * I/O flags (0).
 */
STATIC ssize_t
xfs_file_splice_read(
	struct file		*infilp,
	loff_t			*ppos,
	struct pipe_inode_info	*pipe,
	size_t			len,
	unsigned int		flags)
{
	bhv_vnode_t		*vp = vn_from_inode(infilp->f_path.dentry->d_inode);

	return bhv_vop_splice_read(vp, infilp, ppos, pipe, len, flags,
				   0, NULL);
}

/*
 * .splice_read handler for xfs_invis_file_operations.  Identical to
 * xfs_file_splice_read() except that IO_INVIS is passed as the I/O flag.
 */
STATIC ssize_t
xfs_file_splice_read_invis(
	struct file		*infilp,
	loff_t			*ppos,
	struct pipe_inode_info	*pipe,
	size_t			len,
	unsigned int		flags)
{
	bhv_vnode_t		*vp = vn_from_inode(infilp->f_path.dentry->d_inode);

	return bhv_vop_splice_read(vp, infilp, ppos, pipe, len, flags,
				   IO_INVIS, NULL);
}

/*
 * .splice_write handler for xfs_file_operations.  Forwards to
 * bhv_vop_splice_write() on the vnode behind @outfilp with no extra
 * I/O flags (0).
 */
STATIC ssize_t
xfs_file_splice_write(
	struct pipe_inode_info	*pipe,
	struct file		*outfilp,
	loff_t			*ppos,
	size_t			len,
	unsigned int		flags)
{
	bhv_vnode_t		*vp = vn_from_inode(outfilp->f_path.dentry->d_inode);

	return bhv_vop_splice_write(vp, pipe, outfilp, ppos, len, flags,
				    0, NULL);
}

/*
 * .splice_write handler for xfs_invis_file_operations.  Identical to
 * xfs_file_splice_write() except that IO_INVIS is passed as the I/O flag.
 */
STATIC ssize_t
xfs_file_splice_write_invis(
	struct pipe_inode_info	*pipe,
	struct file		*outfilp,
	loff_t			*ppos,
	size_t			len,
	unsigned int		flags)
{
	bhv_vnode_t		*vp = vn_from_inode(outfilp->f_path.dentry->d_inode);

	return bhv_vop_splice_write(vp, pipe, outfilp, ppos, len, flags,
				    IO_INVIS, NULL);
}
L
Linus Torvalds 已提交
175 176

STATIC int
177
xfs_file_open(
L
Linus Torvalds 已提交
178 179 180 181 182
	struct inode	*inode,
	struct file	*filp)
{
	if (!(filp->f_flags & O_LARGEFILE) && i_size_read(inode) > MAX_NON_LFS)
		return -EFBIG;
183
	return -bhv_vop_open(vn_from_inode(inode), NULL);
L
Linus Torvalds 已提交
184 185 186
}

STATIC int
187
xfs_file_release(
L
Linus Torvalds 已提交
188 189 190
	struct inode	*inode,
	struct file	*filp)
{
191
	bhv_vnode_t	*vp = vn_from_inode(inode);
L
Linus Torvalds 已提交
192 193

	if (vp)
194 195
		return -bhv_vop_release(vp);
	return 0;
L
Linus Torvalds 已提交
196 197 198
}

STATIC int
199
xfs_file_fsync(
L
Linus Torvalds 已提交
200 201 202 203
	struct file	*filp,
	struct dentry	*dentry,
	int		datasync)
{
204
	bhv_vnode_t	*vp = vn_from_inode(dentry->d_inode);
L
Linus Torvalds 已提交
205 206 207 208
	int		flags = FSYNC_WAIT;

	if (datasync)
		flags |= FSYNC_DATA;
209 210
	if (VN_TRUNC(vp))
		VUNTRUNCATE(vp);
211
	return -bhv_vop_fsync(vp, flags, NULL, (xfs_off_t)0, (xfs_off_t)-1);
L
Linus Torvalds 已提交
212 213
}

214
#ifdef CONFIG_XFS_DMAPI
/*
 * .fault handler installed in xfs_dmapi_file_vm_ops.
 *
 * Asserts that the filesystem has VFS_DMI set, sends an mmap event with
 * flags 0 through XFS_SEND_MMAP(), and returns VM_FAULT_SIGBUS if that
 * reports failure (non-zero).  Otherwise the fault is handled by
 * filemap_fault().
 */
STATIC int
xfs_vm_fault(
	struct vm_area_struct	*vma,
	struct vm_fault	*vmf)
{
	bhv_vnode_t	*vp = vn_from_inode(vma->vm_file->f_path.dentry->d_inode);
	xfs_mount_t	*mp;

	ASSERT_ALWAYS(vp->v_vfsp->vfs_flag & VFS_DMI);

	mp = XFS_VFSTOM(vp->v_vfsp);
	if (XFS_SEND_MMAP(mp, vma, 0))
		return VM_FAULT_SIGBUS;

	return filemap_fault(vma, vmf);
}
#endif /* CONFIG_XFS_DMAPI */

L
Linus Torvalds 已提交
230
STATIC int
231
xfs_file_readdir(
L
Linus Torvalds 已提交
232 233 234 235 236
	struct file	*filp,
	void		*dirent,
	filldir_t	filldir)
{
	int		error = 0;
237
	bhv_vnode_t	*vp = vn_from_inode(filp->f_path.dentry->d_inode);
L
Linus Torvalds 已提交
238 239 240 241 242 243 244 245 246 247 248
	uio_t		uio;
	iovec_t		iov;
	int		eof = 0;
	caddr_t		read_buf;
	int		namelen, size = 0;
	size_t		rlen = PAGE_CACHE_SIZE;
	xfs_off_t	start_offset, curr_offset;
	xfs_dirent_t	*dbp = NULL;

	/* Try fairly hard to get memory */
	do {
249
		if ((read_buf = kmalloc(rlen, GFP_KERNEL)))
L
Linus Torvalds 已提交
250 251 252 253 254 255 256 257 258 259 260 261 262 263 264 265 266 267 268 269 270 271
			break;
		rlen >>= 1;
	} while (rlen >= 1024);

	if (read_buf == NULL)
		return -ENOMEM;

	uio.uio_iov = &iov;
	uio.uio_segflg = UIO_SYSSPACE;
	curr_offset = filp->f_pos;
	if (filp->f_pos != 0x7fffffff)
		uio.uio_offset = filp->f_pos;
	else
		uio.uio_offset = 0xffffffff;

	while (!eof) {
		uio.uio_resid = iov.iov_len = rlen;
		iov.iov_base = read_buf;
		uio.uio_iovcnt = 1;

		start_offset = uio.uio_offset;

272
		error = bhv_vop_readdir(vp, &uio, NULL, &eof);
L
Linus Torvalds 已提交
273 274 275 276 277 278 279 280 281 282 283 284 285 286 287 288 289 290
		if ((uio.uio_offset == start_offset) || error) {
			size = 0;
			break;
		}

		size = rlen - uio.uio_resid;
		dbp = (xfs_dirent_t *)read_buf;
		while (size > 0) {
			namelen = strlen(dbp->d_name);

			if (filldir(dirent, dbp->d_name, namelen,
					(loff_t) curr_offset & 0x7fffffff,
					(ino_t) dbp->d_ino,
					DT_UNKNOWN)) {
				goto done;
			}
			size -= dbp->d_reclen;
			curr_offset = (loff_t)dbp->d_off /* & 0x7fffffff */;
291
			dbp = (xfs_dirent_t *)((char *)dbp + dbp->d_reclen);
L
Linus Torvalds 已提交
292 293 294 295 296 297 298 299 300 301 302 303 304 305 306
		}
	}
done:
	if (!error) {
		if (size == 0)
			filp->f_pos = uio.uio_offset & 0x7fffffff;
		else if (dbp)
			filp->f_pos = curr_offset;
	}

	kfree(read_buf);
	return -error;
}

STATIC int
307
xfs_file_mmap(
L
Linus Torvalds 已提交
308 309 310
	struct file	*filp,
	struct vm_area_struct *vma)
{
311
	vma->vm_ops = &xfs_file_vm_ops;
N
Nick Piggin 已提交
312
	vma->vm_flags |= VM_CAN_NONLINEAR;
313 314

#ifdef CONFIG_XFS_DMAPI
315
	if (vn_from_inode(filp->f_path.dentry->d_inode)->v_vfsp->vfs_flag & VFS_DMI)
316
		vma->vm_ops = &xfs_dmapi_file_vm_ops;
317
#endif /* CONFIG_XFS_DMAPI */
L
Linus Torvalds 已提交
318

319
	file_accessed(filp);
L
Linus Torvalds 已提交
320 321 322 323
	return 0;
}

STATIC long
324
xfs_file_ioctl(
L
Linus Torvalds 已提交
325 326
	struct file	*filp,
	unsigned int	cmd,
327
	unsigned long	p)
L
Linus Torvalds 已提交
328 329
{
	int		error;
330
	struct inode	*inode = filp->f_path.dentry->d_inode;
331
	bhv_vnode_t	*vp = vn_from_inode(inode);
L
Linus Torvalds 已提交
332

333
	error = bhv_vop_ioctl(vp, inode, filp, 0, cmd, (void __user *)p);
L
Linus Torvalds 已提交
334 335 336 337 338 339 340 341 342 343 344 345
	VMODIFY(vp);

	/* NOTE:  some of the ioctl's return positive #'s as a
	 *	  byte count indicating success, such as
	 *	  readlink_by_handle.  So we don't "sign flip"
	 *	  like most other routines.  This means true
	 *	  errors need to be returned as a negative value.
	 */
	return error;
}

STATIC long
346
xfs_file_ioctl_invis(
L
Linus Torvalds 已提交
347 348
	struct file	*filp,
	unsigned int	cmd,
349
	unsigned long	p)
L
Linus Torvalds 已提交
350
{
351
	int		error;
352
	struct inode	*inode = filp->f_path.dentry->d_inode;
353
	bhv_vnode_t	*vp = vn_from_inode(inode);
L
Linus Torvalds 已提交
354

355
	error = bhv_vop_ioctl(vp, inode, filp, IO_INVIS, cmd, (void __user *)p);
L
Linus Torvalds 已提交
356 357 358 359 360 361 362 363 364 365 366
	VMODIFY(vp);

	/* NOTE:  some of the ioctl's return positive #'s as a
	 *	  byte count indicating success, such as
	 *	  readlink_by_handle.  So we don't "sign flip"
	 *	  like most other routines.  This means true
	 *	  errors need to be returned as a negative value.
	 */
	return error;
}

367
#ifdef CONFIG_XFS_DMAPI
#ifdef HAVE_VMOP_MPROTECT
/*
 * .mprotect handler installed in xfs_dmapi_file_vm_ops.
 *
 * An mmap event (XFS_SEND_MMAP with VM_WRITE) is sent only when all of
 * the following hold:
 *   - the filesystem has VFS_DMI set,
 *   - the mapping has VM_MAYSHARE,
 *   - @newflags adds VM_WRITE to a mapping that does not have it yet.
 * In every other case 0 is returned without sending anything; otherwise
 * the result of XFS_SEND_MMAP() is returned.
 */
STATIC int
xfs_vm_mprotect(
	struct vm_area_struct *vma,
	unsigned int	newflags)
{
	bhv_vnode_t	*vp = vn_from_inode(vma->vm_file->f_path.dentry->d_inode);

	if (!(vp->v_vfsp->vfs_flag & VFS_DMI))
		return 0;

	if (!(vma->vm_flags & VM_MAYSHARE))
		return 0;

	/* Only a transition from non-writable to writable is of interest. */
	if (!(newflags & VM_WRITE) || (vma->vm_flags & VM_WRITE))
		return 0;

	return XFS_SEND_MMAP(XFS_VFSTOM(vp->v_vfsp), vma, VM_WRITE);
}
#endif /* HAVE_VMOP_MPROTECT */
#endif /* CONFIG_XFS_DMAPI */
L
Linus Torvalds 已提交
389 390 391 392 393 394 395 396

#ifdef HAVE_FOP_OPEN_EXEC
/*
 * .open_exec handler.
 *
 * If the user is attempting to execute a file that is offline then we
 * have to trigger a DMAPI READ event before the file is marked as busy;
 * otherwise the invisible I/O will not be able to write to the file to
 * bring it back online.
 *
 * Returns 0 when the filesystem does not have VFS_DMI set or the READ
 * event is not enabled for the inode, -EINVAL when the vnode has no XFS
 * inode, and otherwise the negated result of XFS_SEND_DATA().
 */
STATIC int
xfs_file_open_exec(
	struct inode	*inode)
{
	bhv_vnode_t	*vp = vn_from_inode(inode);
	xfs_mount_t	*mp;
	xfs_inode_t	*ip;

	if (!unlikely(vp->v_vfsp->vfs_flag & VFS_DMI))
		return 0;

	mp = XFS_VFSTOM(vp->v_vfsp);
	ip = xfs_vtoi(vp);
	if (!ip)
		return -EINVAL;

	if (!DM_EVENT_ENABLED(ip, DM_EVENT_READ))
		return 0;

	return -XFS_SEND_DATA(mp, DM_EVENT_READ, vp,
			       0, 0, 0, NULL);
}
#endif /* HAVE_FOP_OPEN_EXEC */

416 417 418 419 420 421 422 423 424 425 426 427 428 429
/*
 * .page_mkwrite handler for both vm_operations tables in this file.
 *
 * Called when an mmap()ed page takes a write-protection fault and is
 * about to become writable.  Setting the page state up for a writable
 * page at this point allows correct delalloc accounting (ENOSPC
 * checking!) and unwritten extent mapping.  The work itself is done by
 * block_page_mkwrite() using xfs_get_blocks as the block-mapping callback.
 */
STATIC int
xfs_vm_page_mkwrite(
	struct vm_area_struct	*vma,
	struct page		*page)
{
	int			rval;

	rval = block_page_mkwrite(vma, page, xfs_get_blocks);
	return rval;
}

430
const struct file_operations xfs_file_operations = {
L
Linus Torvalds 已提交
431 432
	.llseek		= generic_file_llseek,
	.read		= do_sync_read,
433
	.write		= do_sync_write,
434 435
	.aio_read	= xfs_file_aio_read,
	.aio_write	= xfs_file_aio_write,
436 437
	.splice_read	= xfs_file_splice_read,
	.splice_write	= xfs_file_splice_write,
438
	.unlocked_ioctl	= xfs_file_ioctl,
L
Linus Torvalds 已提交
439
#ifdef CONFIG_COMPAT
440
	.compat_ioctl	= xfs_file_compat_ioctl,
L
Linus Torvalds 已提交
441
#endif
442 443 444 445
	.mmap		= xfs_file_mmap,
	.open		= xfs_file_open,
	.release	= xfs_file_release,
	.fsync		= xfs_file_fsync,
L
Linus Torvalds 已提交
446
#ifdef HAVE_FOP_OPEN_EXEC
447
	.open_exec	= xfs_file_open_exec,
L
Linus Torvalds 已提交
448 449 450
#endif
};

451
const struct file_operations xfs_invis_file_operations = {
L
Linus Torvalds 已提交
452 453
	.llseek		= generic_file_llseek,
	.read		= do_sync_read,
454
	.write		= do_sync_write,
455 456
	.aio_read	= xfs_file_aio_read_invis,
	.aio_write	= xfs_file_aio_write_invis,
457 458
	.splice_read	= xfs_file_splice_read_invis,
	.splice_write	= xfs_file_splice_write_invis,
459
	.unlocked_ioctl	= xfs_file_ioctl_invis,
L
Linus Torvalds 已提交
460
#ifdef CONFIG_COMPAT
461
	.compat_ioctl	= xfs_file_compat_invis_ioctl,
L
Linus Torvalds 已提交
462
#endif
463 464 465 466
	.mmap		= xfs_file_mmap,
	.open		= xfs_file_open,
	.release	= xfs_file_release,
	.fsync		= xfs_file_fsync,
L
Linus Torvalds 已提交
467 468 469
};


470
const struct file_operations xfs_dir_file_operations = {
L
Linus Torvalds 已提交
471
	.read		= generic_read_dir,
472 473
	.readdir	= xfs_file_readdir,
	.unlocked_ioctl	= xfs_file_ioctl,
474
#ifdef CONFIG_COMPAT
475
	.compat_ioctl	= xfs_file_compat_ioctl,
476
#endif
477
	.fsync		= xfs_file_fsync,
L
Linus Torvalds 已提交
478 479
};

480
static struct vm_operations_struct xfs_file_vm_ops = {
481
	.fault		= filemap_fault,
482
	.page_mkwrite	= xfs_vm_page_mkwrite,
483 484 485
};

#ifdef CONFIG_XFS_DMAPI
/*
 * vm operations installed by xfs_file_mmap() when the filesystem has
 * VFS_DMI set: faults go through xfs_vm_fault(), which sends an mmap
 * event before calling filemap_fault(); mprotect is hooked as well when
 * HAVE_VMOP_MPROTECT is defined.
 */
static struct vm_operations_struct xfs_dmapi_file_vm_ops = {
	.fault		= xfs_vm_fault,
	.page_mkwrite	= xfs_vm_page_mkwrite,
#ifdef HAVE_VMOP_MPROTECT
	.mprotect	= xfs_vm_mprotect,
#endif
};
#endif /* CONFIG_XFS_DMAPI */