/*
 * Copyright (c) 2000-2005 Silicon Graphics, Inc.
 * All Rights Reserved.
 *
 * This program is free software; you can redistribute it and/or
 * modify it under the terms of the GNU General Public License as
 * published by the Free Software Foundation.
 *
 * This program is distributed in the hope that it would be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program; if not, write the Free Software Foundation,
 * Inc.,  51 Franklin St, Fifth Floor, Boston, MA  02110-1301  USA
 */
#include "xfs.h"
19
#include "xfs_bit.h"
L
Linus Torvalds 已提交
20
#include "xfs_log.h"
21
#include "xfs_inum.h"
L
Linus Torvalds 已提交
22
#include "xfs_sb.h"
23
#include "xfs_ag.h"
L
Linus Torvalds 已提交
24 25 26 27 28 29 30 31 32 33 34 35 36 37 38
#include "xfs_dir2.h"
#include "xfs_trans.h"
#include "xfs_dmapi.h"
#include "xfs_mount.h"
#include "xfs_bmap_btree.h"
#include "xfs_alloc_btree.h"
#include "xfs_ialloc_btree.h"
#include "xfs_alloc.h"
#include "xfs_btree.h"
#include "xfs_attr_sf.h"
#include "xfs_dir2_sf.h"
#include "xfs_dinode.h"
#include "xfs_inode.h"
#include "xfs_error.h"
#include "xfs_rw.h"
39
#include "xfs_vnodeops.h"
40
#include "xfs_da_btree.h"
41
#include "xfs_ioctl.h"
L
Linus Torvalds 已提交
42 43 44 45

#include <linux/dcache.h>
#include <linux/smp_lock.h>

46
/*
 * Forward declaration: xfs_file_mmap() takes the address of this table,
 * which is only defined at the end of the file.
 */
static struct vm_operations_struct xfs_file_vm_ops;
L
Linus Torvalds 已提交
47

48
STATIC_INLINE ssize_t
49
__xfs_file_read(
L
Linus Torvalds 已提交
50
	struct kiocb		*iocb,
51 52
	const struct iovec	*iov,
	unsigned long		nr_segs,
L
Linus Torvalds 已提交
53 54 55 56 57 58 59 60
	int			ioflags,
	loff_t			pos)
{
	struct file		*file = iocb->ki_filp;

	BUG_ON(iocb->ki_pos != pos);
	if (unlikely(file->f_flags & O_DIRECT))
		ioflags |= IO_ISDIRECT;
61 62
	return xfs_read(XFS_I(file->f_path.dentry->d_inode), iocb, iov,
				nr_segs, &iocb->ki_pos, ioflags);
L
Linus Torvalds 已提交
63 64 65
}

STATIC ssize_t
66
xfs_file_aio_read(
L
Linus Torvalds 已提交
67
	struct kiocb		*iocb,
68 69
	const struct iovec	*iov,
	unsigned long		nr_segs,
L
Linus Torvalds 已提交
70 71
	loff_t			pos)
{
72
	return __xfs_file_read(iocb, iov, nr_segs, IO_ISAIO, pos);
L
Linus Torvalds 已提交
73 74 75
}

STATIC ssize_t
76
xfs_file_aio_read_invis(
L
Linus Torvalds 已提交
77
	struct kiocb		*iocb,
78 79
	const struct iovec	*iov,
	unsigned long		nr_segs,
L
Linus Torvalds 已提交
80 81
	loff_t			pos)
{
82
	return __xfs_file_read(iocb, iov, nr_segs, IO_ISAIO|IO_INVIS, pos);
L
Linus Torvalds 已提交
83 84
}

85
STATIC_INLINE ssize_t
86
__xfs_file_write(
87 88 89 90 91
	struct kiocb		*iocb,
	const struct iovec	*iov,
	unsigned long		nr_segs,
	int			ioflags,
	loff_t			pos)
L
Linus Torvalds 已提交
92 93 94 95 96 97
{
	struct file	*file = iocb->ki_filp;

	BUG_ON(iocb->ki_pos != pos);
	if (unlikely(file->f_flags & O_DIRECT))
		ioflags |= IO_ISDIRECT;
98 99
	return xfs_write(XFS_I(file->f_mapping->host), iocb, iov, nr_segs,
				&iocb->ki_pos, ioflags);
L
Linus Torvalds 已提交
100 101 102
}

STATIC ssize_t
103
xfs_file_aio_write(
L
Linus Torvalds 已提交
104
	struct kiocb		*iocb,
105 106
	const struct iovec	*iov,
	unsigned long		nr_segs,
L
Linus Torvalds 已提交
107 108
	loff_t			pos)
{
109
	return __xfs_file_write(iocb, iov, nr_segs, IO_ISAIO, pos);
L
Linus Torvalds 已提交
110 111 112
}

STATIC ssize_t
113
xfs_file_aio_write_invis(
L
Linus Torvalds 已提交
114
	struct kiocb		*iocb,
115 116
	const struct iovec	*iov,
	unsigned long		nr_segs,
L
Linus Torvalds 已提交
117 118
	loff_t			pos)
{
119
	return __xfs_file_write(iocb, iov, nr_segs, IO_ISAIO|IO_INVIS, pos);
L
Linus Torvalds 已提交
120 121
}

122 123 124
/*
 * .splice_read method of xfs_file_operations: forwards to
 * xfs_splice_read() for the inode behind @infilp with no extra
 * I/O flags (0).
 */
STATIC ssize_t
xfs_file_splice_read(
	struct file		*infilp,
	loff_t			*ppos,
	struct pipe_inode_info	*pipe,
	size_t			len,
	unsigned int		flags)
{
	struct inode		*inode = infilp->f_path.dentry->d_inode;

	return xfs_splice_read(XFS_I(inode), infilp, ppos, pipe, len,
			       flags, 0);
}

/*
 * .splice_read method of xfs_invis_file_operations: forwards to
 * xfs_splice_read() for the inode behind @infilp with IO_INVIS set.
 */
STATIC ssize_t
xfs_file_splice_read_invis(
	struct file		*infilp,
	loff_t			*ppos,
	struct pipe_inode_info	*pipe,
	size_t			len,
	unsigned int		flags)
{
	struct inode		*inode = infilp->f_path.dentry->d_inode;

	return xfs_splice_read(XFS_I(inode), infilp, ppos, pipe, len,
			       flags, IO_INVIS);
}

/*
 * .splice_write method of xfs_file_operations: forwards to
 * xfs_splice_write() for the inode behind @outfilp with no extra
 * I/O flags (0).
 */
STATIC ssize_t
xfs_file_splice_write(
	struct pipe_inode_info	*pipe,
	struct file		*outfilp,
	loff_t			*ppos,
	size_t			len,
	unsigned int		flags)
{
	struct inode		*inode = outfilp->f_path.dentry->d_inode;

	return xfs_splice_write(XFS_I(inode), pipe, outfilp, ppos, len,
				flags, 0);
}

/*
 * .splice_write method of xfs_invis_file_operations: forwards to
 * xfs_splice_write() for the inode behind @outfilp with IO_INVIS set.
 */
STATIC ssize_t
xfs_file_splice_write_invis(
	struct pipe_inode_info	*pipe,
	struct file		*outfilp,
	loff_t			*ppos,
	size_t			len,
	unsigned int		flags)
{
	struct inode		*inode = outfilp->f_path.dentry->d_inode;

	return xfs_splice_write(XFS_I(inode), pipe, outfilp, ppos, len,
				flags, IO_INVIS);
}
L
Linus Torvalds 已提交
169 170

STATIC int
171
xfs_file_open(
L
Linus Torvalds 已提交
172
	struct inode	*inode,
173
	struct file	*file)
L
Linus Torvalds 已提交
174
{
175
	if (!(file->f_flags & O_LARGEFILE) && i_size_read(inode) > MAX_NON_LFS)
L
Linus Torvalds 已提交
176
		return -EFBIG;
177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 199 200 201 202 203
	if (XFS_FORCED_SHUTDOWN(XFS_M(inode->i_sb)))
		return -EIO;
	return 0;
}

STATIC int
xfs_dir_open(
	struct inode	*inode,
	struct file	*file)
{
	struct xfs_inode *ip = XFS_I(inode);
	int		mode;
	int		error;

	error = xfs_file_open(inode, file);
	if (error)
		return error;

	/*
	 * If there are any blocks, read-ahead block 0 as we're almost
	 * certain to have the next operation be a read there.
	 */
	mode = xfs_ilock_map_shared(ip);
	if (ip->i_d.di_nextents > 0)
		xfs_da_reada_buf(NULL, ip, 0, XFS_DATA_FORK);
	xfs_iunlock(ip, mode);
	return 0;
L
Linus Torvalds 已提交
204 205 206
}

STATIC int
207
xfs_file_release(
L
Linus Torvalds 已提交
208 209 210
	struct inode	*inode,
	struct file	*filp)
{
211
	return -xfs_release(XFS_I(inode));
L
Linus Torvalds 已提交
212 213
}

D
David Chinner 已提交
214 215 216 217 218 219 220 221 222 223
/*
 * We ignore the datasync flag here because a datasync is effectively
 * identical to an fsync. That is, datasync implies that we need to write
 * only the metadata needed to be able to access the data that is written
 * if we crash after the call completes. Hence if we are writing beyond
 * EOF we have to log the inode size change as well, which makes it a
 * full fsync. If we don't write beyond EOF, the inode core will be
 * clean in memory and so we don't need to log the inode, just like
 * fsync.
 */
L
Linus Torvalds 已提交
224
STATIC int
225
xfs_file_fsync(
L
Linus Torvalds 已提交
226 227 228 229
	struct file	*filp,
	struct dentry	*dentry,
	int		datasync)
{
230
	xfs_iflags_clear(XFS_I(dentry->d_inode), XFS_ITRUNCATED);
D
David Chinner 已提交
231
	return -xfs_fsync(XFS_I(dentry->d_inode));
L
Linus Torvalds 已提交
232 233 234
}

STATIC int
235
xfs_file_readdir(
L
Linus Torvalds 已提交
236 237 238 239
	struct file	*filp,
	void		*dirent,
	filldir_t	filldir)
{
C
Christoph Hellwig 已提交
240
	struct inode	*inode = filp->f_path.dentry->d_inode;
241
	xfs_inode_t	*ip = XFS_I(inode);
C
Christoph Hellwig 已提交
242 243 244 245 246 247 248 249 250 251 252 253 254 255 256 257 258
	int		error;
	size_t		bufsize;

	/*
	 * The Linux API doesn't pass down the total size of the buffer
	 * we read into down to the filesystem.  With the filldir concept
	 * it's not needed for correct information, but the XFS dir2 leaf
	 * code wants an estimate of the buffer size to calculate it's
	 * readahead window and size the buffers used for mapping to
	 * physical blocks.
	 *
	 * Try to give it an estimate that's good enough, maybe at some
	 * point we can change the ->readdir prototype to include the
	 * buffer size.
	 */
	bufsize = (size_t)min_t(loff_t, PAGE_SIZE, inode->i_size);

259
	error = xfs_readdir(ip, dirent, bufsize,
C
Christoph Hellwig 已提交
260 261 262 263
				(xfs_off_t *)&filp->f_pos, filldir);
	if (error)
		return -error;
	return 0;
L
Linus Torvalds 已提交
264 265 266
}

STATIC int
267
xfs_file_mmap(
L
Linus Torvalds 已提交
268 269 270
	struct file	*filp,
	struct vm_area_struct *vma)
{
271
	vma->vm_ops = &xfs_file_vm_ops;
N
Nick Piggin 已提交
272
	vma->vm_flags |= VM_CAN_NONLINEAR;
273

274
	file_accessed(filp);
L
Linus Torvalds 已提交
275 276 277 278
	return 0;
}

STATIC long
279
xfs_file_ioctl(
L
Linus Torvalds 已提交
280 281
	struct file	*filp,
	unsigned int	cmd,
282
	unsigned long	p)
L
Linus Torvalds 已提交
283
{
284
	struct inode	*inode = filp->f_path.dentry->d_inode;
L
Linus Torvalds 已提交
285 286 287 288 289 290 291 292


	/* NOTE:  some of the ioctl's return positive #'s as a
	 *	  byte count indicating success, such as
	 *	  readlink_by_handle.  So we don't "sign flip"
	 *	  like most other routines.  This means true
	 *	  errors need to be returned as a negative value.
	 */
C
Christoph Hellwig 已提交
293
	return xfs_ioctl(XFS_I(inode), filp, 0, cmd, (void __user *)p);
L
Linus Torvalds 已提交
294 295 296
}

STATIC long
297
xfs_file_ioctl_invis(
L
Linus Torvalds 已提交
298 299
	struct file	*filp,
	unsigned int	cmd,
300
	unsigned long	p)
L
Linus Torvalds 已提交
301
{
302
	struct inode	*inode = filp->f_path.dentry->d_inode;
L
Linus Torvalds 已提交
303 304 305 306 307 308 309 310


	/* NOTE:  some of the ioctl's return positive #'s as a
	 *	  byte count indicating success, such as
	 *	  readlink_by_handle.  So we don't "sign flip"
	 *	  like most other routines.  This means true
	 *	  errors need to be returned as a negative value.
	 */
C
Christoph Hellwig 已提交
311
	return xfs_ioctl(XFS_I(inode), filp, IO_INVIS, cmd, (void __user *)p);
L
Linus Torvalds 已提交
312 313
}

314 315 316 317 318 319 320 321 322 323 324 325 326 327
/*
 * A page of an mmap()ed file has taken a write protection fault and is
 * about to become writable.  This is the point at which the page state
 * can be set up correctly for a writable page, which allows correct
 * delalloc accounting (ENOSPC checking!) and unwritten extent mapping.
 *
 * The work is delegated to block_page_mkwrite() using xfs_get_blocks.
 */
STATIC int
xfs_vm_page_mkwrite(
	struct vm_area_struct	*vma,
	struct page		*page)
{
	int			ret;

	ret = block_page_mkwrite(vma, page, xfs_get_blocks);
	return ret;
}

328
const struct file_operations xfs_file_operations = {
L
Linus Torvalds 已提交
329 330
	.llseek		= generic_file_llseek,
	.read		= do_sync_read,
331
	.write		= do_sync_write,
332 333
	.aio_read	= xfs_file_aio_read,
	.aio_write	= xfs_file_aio_write,
334 335
	.splice_read	= xfs_file_splice_read,
	.splice_write	= xfs_file_splice_write,
336
	.unlocked_ioctl	= xfs_file_ioctl,
L
Linus Torvalds 已提交
337
#ifdef CONFIG_COMPAT
338
	.compat_ioctl	= xfs_file_compat_ioctl,
L
Linus Torvalds 已提交
339
#endif
340 341 342 343
	.mmap		= xfs_file_mmap,
	.open		= xfs_file_open,
	.release	= xfs_file_release,
	.fsync		= xfs_file_fsync,
L
Linus Torvalds 已提交
344
#ifdef HAVE_FOP_OPEN_EXEC
345
	.open_exec	= xfs_file_open_exec,
L
Linus Torvalds 已提交
346 347 348
#endif
};

349
const struct file_operations xfs_invis_file_operations = {
L
Linus Torvalds 已提交
350 351
	.llseek		= generic_file_llseek,
	.read		= do_sync_read,
352
	.write		= do_sync_write,
353 354
	.aio_read	= xfs_file_aio_read_invis,
	.aio_write	= xfs_file_aio_write_invis,
355 356
	.splice_read	= xfs_file_splice_read_invis,
	.splice_write	= xfs_file_splice_write_invis,
357
	.unlocked_ioctl	= xfs_file_ioctl_invis,
L
Linus Torvalds 已提交
358
#ifdef CONFIG_COMPAT
359
	.compat_ioctl	= xfs_file_compat_invis_ioctl,
L
Linus Torvalds 已提交
360
#endif
361 362 363 364
	.mmap		= xfs_file_mmap,
	.open		= xfs_file_open,
	.release	= xfs_file_release,
	.fsync		= xfs_file_fsync,
L
Linus Torvalds 已提交
365 366 367
};


368
const struct file_operations xfs_dir_file_operations = {
369
	.open		= xfs_dir_open,
L
Linus Torvalds 已提交
370
	.read		= generic_read_dir,
371
	.readdir	= xfs_file_readdir,
372
	.llseek		= generic_file_llseek,
373
	.unlocked_ioctl	= xfs_file_ioctl,
374
#ifdef CONFIG_COMPAT
375
	.compat_ioctl	= xfs_file_compat_ioctl,
376
#endif
377
	.fsync		= xfs_file_fsync,
L
Linus Torvalds 已提交
378 379
};

380
static struct vm_operations_struct xfs_file_vm_ops = {
381
	.fault		= filemap_fault,
382
	.page_mkwrite	= xfs_vm_page_mkwrite,
383
};