xfs_file.c 10.6 KB
Newer Older
L
Linus Torvalds 已提交
1
/*
2 3
 * Copyright (c) 2000-2005 Silicon Graphics, Inc.
 * All Rights Reserved.
L
Linus Torvalds 已提交
4
 *
5 6
 * This program is free software; you can redistribute it and/or
 * modify it under the terms of the GNU General Public License as
L
Linus Torvalds 已提交
7 8
 * published by the Free Software Foundation.
 *
9 10 11 12
 * This program is distributed in the hope that it would be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU General Public License for more details.
L
Linus Torvalds 已提交
13
 *
14 15 16
 * You should have received a copy of the GNU General Public License
 * along with this program; if not, write the Free Software Foundation,
 * Inc.,  51 Franklin St, Fifth Floor, Boston, MA  02110-1301  USA
L
Linus Torvalds 已提交
17 18
 */
#include "xfs.h"
19
#include "xfs_bit.h"
L
Linus Torvalds 已提交
20
#include "xfs_log.h"
21
#include "xfs_inum.h"
L
Linus Torvalds 已提交
22
#include "xfs_sb.h"
23
#include "xfs_ag.h"
L
Linus Torvalds 已提交
24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39
#include "xfs_dir2.h"
#include "xfs_trans.h"
#include "xfs_dmapi.h"
#include "xfs_mount.h"
#include "xfs_bmap_btree.h"
#include "xfs_alloc_btree.h"
#include "xfs_ialloc_btree.h"
#include "xfs_alloc.h"
#include "xfs_btree.h"
#include "xfs_attr_sf.h"
#include "xfs_dir2_sf.h"
#include "xfs_dinode.h"
#include "xfs_inode.h"
#include "xfs_error.h"
#include "xfs_rw.h"
#include "xfs_ioctl32.h"
40
#include "xfs_vnodeops.h"
L
Linus Torvalds 已提交
41 42 43 44

#include <linux/dcache.h>
#include <linux/smp_lock.h>

45
static struct vm_operations_struct xfs_file_vm_ops;
46
#ifdef CONFIG_XFS_DMAPI
47
static struct vm_operations_struct xfs_dmapi_file_vm_ops;
48
#endif
L
Linus Torvalds 已提交
49

50
STATIC_INLINE ssize_t
51
__xfs_file_read(
L
Linus Torvalds 已提交
52
	struct kiocb		*iocb,
53 54
	const struct iovec	*iov,
	unsigned long		nr_segs,
L
Linus Torvalds 已提交
55 56 57 58 59 60 61 62
	int			ioflags,
	loff_t			pos)
{
	struct file		*file = iocb->ki_filp;

	BUG_ON(iocb->ki_pos != pos);
	if (unlikely(file->f_flags & O_DIRECT))
		ioflags |= IO_ISDIRECT;
63 64
	return xfs_read(XFS_I(file->f_path.dentry->d_inode), iocb, iov,
				nr_segs, &iocb->ki_pos, ioflags);
L
Linus Torvalds 已提交
65 66 67
}

STATIC ssize_t
68
xfs_file_aio_read(
L
Linus Torvalds 已提交
69
	struct kiocb		*iocb,
70 71
	const struct iovec	*iov,
	unsigned long		nr_segs,
L
Linus Torvalds 已提交
72 73
	loff_t			pos)
{
74
	return __xfs_file_read(iocb, iov, nr_segs, IO_ISAIO, pos);
L
Linus Torvalds 已提交
75 76 77
}

STATIC ssize_t
78
xfs_file_aio_read_invis(
L
Linus Torvalds 已提交
79
	struct kiocb		*iocb,
80 81
	const struct iovec	*iov,
	unsigned long		nr_segs,
L
Linus Torvalds 已提交
82 83
	loff_t			pos)
{
84
	return __xfs_file_read(iocb, iov, nr_segs, IO_ISAIO|IO_INVIS, pos);
L
Linus Torvalds 已提交
85 86
}

87
STATIC_INLINE ssize_t
88
__xfs_file_write(
89 90 91 92 93
	struct kiocb		*iocb,
	const struct iovec	*iov,
	unsigned long		nr_segs,
	int			ioflags,
	loff_t			pos)
L
Linus Torvalds 已提交
94 95 96 97 98 99
{
	struct file	*file = iocb->ki_filp;

	BUG_ON(iocb->ki_pos != pos);
	if (unlikely(file->f_flags & O_DIRECT))
		ioflags |= IO_ISDIRECT;
100 101
	return xfs_write(XFS_I(file->f_mapping->host), iocb, iov, nr_segs,
				&iocb->ki_pos, ioflags);
L
Linus Torvalds 已提交
102 103 104
}

STATIC ssize_t
105
xfs_file_aio_write(
L
Linus Torvalds 已提交
106
	struct kiocb		*iocb,
107 108
	const struct iovec	*iov,
	unsigned long		nr_segs,
L
Linus Torvalds 已提交
109 110
	loff_t			pos)
{
111
	return __xfs_file_write(iocb, iov, nr_segs, IO_ISAIO, pos);
L
Linus Torvalds 已提交
112 113 114
}

STATIC ssize_t
115
xfs_file_aio_write_invis(
L
Linus Torvalds 已提交
116
	struct kiocb		*iocb,
117 118
	const struct iovec	*iov,
	unsigned long		nr_segs,
L
Linus Torvalds 已提交
119 120
	loff_t			pos)
{
121
	return __xfs_file_write(iocb, iov, nr_segs, IO_ISAIO|IO_INVIS, pos);
L
Linus Torvalds 已提交
122 123
}

124 125 126
STATIC ssize_t
xfs_file_splice_read(
	struct file		*infilp,
127
	loff_t			*ppos,
128
	struct pipe_inode_info	*pipe,
129 130 131
	size_t			len,
	unsigned int		flags)
{
132 133
	return xfs_splice_read(XFS_I(infilp->f_path.dentry->d_inode),
				   infilp, ppos, pipe, len, flags, 0);
134 135 136 137 138
}

STATIC ssize_t
xfs_file_splice_read_invis(
	struct file		*infilp,
139
	loff_t			*ppos,
140
	struct pipe_inode_info	*pipe,
141 142 143
	size_t			len,
	unsigned int		flags)
{
144 145
	return xfs_splice_read(XFS_I(infilp->f_path.dentry->d_inode),
				   infilp, ppos, pipe, len, flags, IO_INVIS);
146 147 148 149
}

STATIC ssize_t
xfs_file_splice_write(
150
	struct pipe_inode_info	*pipe,
151
	struct file		*outfilp,
152
	loff_t			*ppos,
153 154 155
	size_t			len,
	unsigned int		flags)
{
156 157
	return xfs_splice_write(XFS_I(outfilp->f_path.dentry->d_inode),
				    pipe, outfilp, ppos, len, flags, 0);
158 159 160 161
}

STATIC ssize_t
xfs_file_splice_write_invis(
162
	struct pipe_inode_info	*pipe,
163
	struct file		*outfilp,
164
	loff_t			*ppos,
165 166 167
	size_t			len,
	unsigned int		flags)
{
168 169
	return xfs_splice_write(XFS_I(outfilp->f_path.dentry->d_inode),
				    pipe, outfilp, ppos, len, flags, IO_INVIS);
170
}
L
Linus Torvalds 已提交
171 172

STATIC int
173
xfs_file_open(
L
Linus Torvalds 已提交
174 175 176 177 178
	struct inode	*inode,
	struct file	*filp)
{
	if (!(filp->f_flags & O_LARGEFILE) && i_size_read(inode) > MAX_NON_LFS)
		return -EFBIG;
179
	return -xfs_open(XFS_I(inode));
L
Linus Torvalds 已提交
180 181 182
}

STATIC int
183
xfs_file_release(
L
Linus Torvalds 已提交
184 185 186
	struct inode	*inode,
	struct file	*filp)
{
187
	return -xfs_release(XFS_I(inode));
L
Linus Torvalds 已提交
188 189 190
}

STATIC int
191
xfs_file_fsync(
L
Linus Torvalds 已提交
192 193 194 195
	struct file	*filp,
	struct dentry	*dentry,
	int		datasync)
{
196
	bhv_vnode_t	*vp = vn_from_inode(dentry->d_inode);
L
Linus Torvalds 已提交
197 198 199 200
	int		flags = FSYNC_WAIT;

	if (datasync)
		flags |= FSYNC_DATA;
201 202
	if (VN_TRUNC(vp))
		VUNTRUNCATE(vp);
203 204
	return -xfs_fsync(XFS_I(dentry->d_inode), flags,
			(xfs_off_t)0, (xfs_off_t)-1);
L
Linus Torvalds 已提交
205 206
}

207
#ifdef CONFIG_XFS_DMAPI
N
Nick Piggin 已提交
208
STATIC int
209 210
xfs_vm_fault(
	struct vm_area_struct	*vma,
N
Nick Piggin 已提交
211
	struct vm_fault	*vmf)
212
{
213
	struct inode	*inode = vma->vm_file->f_path.dentry->d_inode;
214
	bhv_vnode_t	*vp = vn_from_inode(inode);
215 216

	ASSERT_ALWAYS(vp->v_vfsp->vfs_flag & VFS_DMI);
N
Nick Piggin 已提交
217 218 219
	if (XFS_SEND_MMAP(XFS_VFSTOM(vp->v_vfsp), vma, 0))
		return VM_FAULT_SIGBUS;
	return filemap_fault(vma, vmf);
220 221 222
}
#endif /* CONFIG_XFS_DMAPI */

L
Linus Torvalds 已提交
223
STATIC int
224
xfs_file_readdir(
L
Linus Torvalds 已提交
225 226 227 228
	struct file	*filp,
	void		*dirent,
	filldir_t	filldir)
{
C
Christoph Hellwig 已提交
229
	struct inode	*inode = filp->f_path.dentry->d_inode;
230
	xfs_inode_t	*ip = XFS_I(inode);
C
Christoph Hellwig 已提交
231 232 233 234 235 236 237 238 239 240 241 242 243 244 245 246 247
	int		error;
	size_t		bufsize;

	/*
	 * The Linux API doesn't pass down the total size of the buffer
	 * we read into down to the filesystem.  With the filldir concept
	 * it's not needed for correct information, but the XFS dir2 leaf
	 * code wants an estimate of the buffer size to calculate it's
	 * readahead window and size the buffers used for mapping to
	 * physical blocks.
	 *
	 * Try to give it an estimate that's good enough, maybe at some
	 * point we can change the ->readdir prototype to include the
	 * buffer size.
	 */
	bufsize = (size_t)min_t(loff_t, PAGE_SIZE, inode->i_size);

248
	error = xfs_readdir(ip, dirent, bufsize,
C
Christoph Hellwig 已提交
249 250 251 252
				(xfs_off_t *)&filp->f_pos, filldir);
	if (error)
		return -error;
	return 0;
L
Linus Torvalds 已提交
253 254 255
}

STATIC int
256
xfs_file_mmap(
L
Linus Torvalds 已提交
257 258 259
	struct file	*filp,
	struct vm_area_struct *vma)
{
260
	vma->vm_ops = &xfs_file_vm_ops;
N
Nick Piggin 已提交
261
	vma->vm_flags |= VM_CAN_NONLINEAR;
262 263

#ifdef CONFIG_XFS_DMAPI
264
	if (vn_from_inode(filp->f_path.dentry->d_inode)->v_vfsp->vfs_flag & VFS_DMI)
265
		vma->vm_ops = &xfs_dmapi_file_vm_ops;
266
#endif /* CONFIG_XFS_DMAPI */
L
Linus Torvalds 已提交
267

268
	file_accessed(filp);
L
Linus Torvalds 已提交
269 270 271 272
	return 0;
}

STATIC long
273
xfs_file_ioctl(
L
Linus Torvalds 已提交
274 275
	struct file	*filp,
	unsigned int	cmd,
276
	unsigned long	p)
L
Linus Torvalds 已提交
277 278
{
	int		error;
279
	struct inode	*inode = filp->f_path.dentry->d_inode;
280
	bhv_vnode_t	*vp = vn_from_inode(inode);
L
Linus Torvalds 已提交
281

282
	error = xfs_ioctl(XFS_I(inode), filp, 0, cmd, (void __user *)p);
L
Linus Torvalds 已提交
283 284 285 286 287 288 289 290 291 292 293 294
	VMODIFY(vp);

	/* NOTE:  some of the ioctl's return positive #'s as a
	 *	  byte count indicating success, such as
	 *	  readlink_by_handle.  So we don't "sign flip"
	 *	  like most other routines.  This means true
	 *	  errors need to be returned as a negative value.
	 */
	return error;
}

STATIC long
295
xfs_file_ioctl_invis(
L
Linus Torvalds 已提交
296 297
	struct file	*filp,
	unsigned int	cmd,
298
	unsigned long	p)
L
Linus Torvalds 已提交
299
{
300
	int		error;
301
	struct inode	*inode = filp->f_path.dentry->d_inode;
302
	bhv_vnode_t	*vp = vn_from_inode(inode);
L
Linus Torvalds 已提交
303

304
	error = xfs_ioctl(XFS_I(inode), filp, IO_INVIS, cmd, (void __user *)p);
L
Linus Torvalds 已提交
305 306 307 308 309 310 311 312 313 314 315
	VMODIFY(vp);

	/* NOTE:  some of the ioctl's return positive #'s as a
	 *	  byte count indicating success, such as
	 *	  readlink_by_handle.  So we don't "sign flip"
	 *	  like most other routines.  This means true
	 *	  errors need to be returned as a negative value.
	 */
	return error;
}

316
#ifdef CONFIG_XFS_DMAPI
L
Linus Torvalds 已提交
317 318
#ifdef HAVE_VMOP_MPROTECT
STATIC int
319
xfs_vm_mprotect(
L
Linus Torvalds 已提交
320 321 322
	struct vm_area_struct *vma,
	unsigned int	newflags)
{
323
	bhv_vnode_t	*vp = vn_from_inode(vma->vm_file->f_path.dentry->d_inode);
L
Linus Torvalds 已提交
324 325 326 327 328 329 330 331 332 333 334 335 336
	int		error = 0;

	if (vp->v_vfsp->vfs_flag & VFS_DMI) {
		if ((vma->vm_flags & VM_MAYSHARE) &&
		    (newflags & VM_WRITE) && !(vma->vm_flags & VM_WRITE)) {
			xfs_mount_t	*mp = XFS_VFSTOM(vp->v_vfsp);

			error = XFS_SEND_MMAP(mp, vma, VM_WRITE);
		    }
	}
	return error;
}
#endif /* HAVE_VMOP_MPROTECT */
337
#endif /* CONFIG_XFS_DMAPI */
L
Linus Torvalds 已提交
338 339 340 341 342 343 344 345

#ifdef HAVE_FOP_OPEN_EXEC
/* If the user is attempting to execute a file that is offline then
 * we have to trigger a DMAPI READ event before the file is marked as busy
 * otherwise the invisible I/O will not be able to write to the file to bring
 * it back online.
 */
STATIC int
346
xfs_file_open_exec(
L
Linus Torvalds 已提交
347 348
	struct inode	*inode)
{
349
	bhv_vnode_t	*vp = vn_from_inode(inode);
L
Linus Torvalds 已提交
350

351 352 353 354 355 356
	if (unlikely(vp->v_vfsp->vfs_flag & VFS_DMI)) {
		xfs_mount_t	*mp = XFS_VFSTOM(vp->v_vfsp);
		xfs_inode_t	*ip = xfs_vtoi(vp);

		if (!ip)
			return -EINVAL;
357
		if (DM_EVENT_ENABLED(ip, DM_EVENT_READ))
358
			return -XFS_SEND_DATA(mp, DM_EVENT_READ, vp,
L
Linus Torvalds 已提交
359 360
					       0, 0, 0, NULL);
	}
361
	return 0;
L
Linus Torvalds 已提交
362 363 364
}
#endif /* HAVE_FOP_OPEN_EXEC */

365 366 367 368 369 370 371 372 373 374 375 376 377 378
/*
 * mmap()d file has taken write protection fault and is being made
 * writable. We can set the page state up correctly for a writable
 * page, which means we can do correct delalloc accounting (ENOSPC
 * checking!) and unwritten extent mapping.
 */
STATIC int
xfs_vm_page_mkwrite(
	struct vm_area_struct	*vma,
	struct page		*page)
{
	return block_page_mkwrite(vma, page, xfs_get_blocks);
}

379
const struct file_operations xfs_file_operations = {
L
Linus Torvalds 已提交
380 381
	.llseek		= generic_file_llseek,
	.read		= do_sync_read,
382
	.write		= do_sync_write,
383 384
	.aio_read	= xfs_file_aio_read,
	.aio_write	= xfs_file_aio_write,
385 386
	.splice_read	= xfs_file_splice_read,
	.splice_write	= xfs_file_splice_write,
387
	.unlocked_ioctl	= xfs_file_ioctl,
L
Linus Torvalds 已提交
388
#ifdef CONFIG_COMPAT
389
	.compat_ioctl	= xfs_file_compat_ioctl,
L
Linus Torvalds 已提交
390
#endif
391 392 393 394
	.mmap		= xfs_file_mmap,
	.open		= xfs_file_open,
	.release	= xfs_file_release,
	.fsync		= xfs_file_fsync,
L
Linus Torvalds 已提交
395
#ifdef HAVE_FOP_OPEN_EXEC
396
	.open_exec	= xfs_file_open_exec,
L
Linus Torvalds 已提交
397 398 399
#endif
};

400
const struct file_operations xfs_invis_file_operations = {
L
Linus Torvalds 已提交
401 402
	.llseek		= generic_file_llseek,
	.read		= do_sync_read,
403
	.write		= do_sync_write,
404 405
	.aio_read	= xfs_file_aio_read_invis,
	.aio_write	= xfs_file_aio_write_invis,
406 407
	.splice_read	= xfs_file_splice_read_invis,
	.splice_write	= xfs_file_splice_write_invis,
408
	.unlocked_ioctl	= xfs_file_ioctl_invis,
L
Linus Torvalds 已提交
409
#ifdef CONFIG_COMPAT
410
	.compat_ioctl	= xfs_file_compat_invis_ioctl,
L
Linus Torvalds 已提交
411
#endif
412 413 414 415
	.mmap		= xfs_file_mmap,
	.open		= xfs_file_open,
	.release	= xfs_file_release,
	.fsync		= xfs_file_fsync,
L
Linus Torvalds 已提交
416 417 418
};


419
const struct file_operations xfs_dir_file_operations = {
L
Linus Torvalds 已提交
420
	.read		= generic_read_dir,
421 422
	.readdir	= xfs_file_readdir,
	.unlocked_ioctl	= xfs_file_ioctl,
423
#ifdef CONFIG_COMPAT
424
	.compat_ioctl	= xfs_file_compat_ioctl,
425
#endif
426
	.fsync		= xfs_file_fsync,
L
Linus Torvalds 已提交
427 428
};

429
static struct vm_operations_struct xfs_file_vm_ops = {
430
	.fault		= filemap_fault,
431
	.page_mkwrite	= xfs_vm_page_mkwrite,
432 433 434
};

#ifdef CONFIG_XFS_DMAPI
435
static struct vm_operations_struct xfs_dmapi_file_vm_ops = {
436
	.fault		= xfs_vm_fault,
437
	.page_mkwrite	= xfs_vm_page_mkwrite,
L
Linus Torvalds 已提交
438
#ifdef HAVE_VMOP_MPROTECT
439
	.mprotect	= xfs_vm_mprotect,
L
Linus Torvalds 已提交
440 441
#endif
};
442
#endif /* CONFIG_XFS_DMAPI */