xfs_file.c 12.9 KB
Newer Older
L
Linus Torvalds 已提交
1
/*
 * Copyright (c) 2000-2005 Silicon Graphics, Inc.
 * All Rights Reserved.
 *
 * This program is free software; you can redistribute it and/or
 * modify it under the terms of the GNU General Public License as
 * published by the Free Software Foundation.
 *
 * This program is distributed in the hope that it would be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program; if not, write the Free Software Foundation,
 * Inc.,  51 Franklin St, Fifth Floor, Boston, MA  02110-1301  USA
 */
#include "xfs.h"
19
#include "xfs_bit.h"
L
Linus Torvalds 已提交
20
#include "xfs_log.h"
21
#include "xfs_inum.h"
L
Linus Torvalds 已提交
22
#include "xfs_sb.h"
23
#include "xfs_ag.h"
L
Linus Torvalds 已提交
24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45
#include "xfs_dir.h"
#include "xfs_dir2.h"
#include "xfs_trans.h"
#include "xfs_dmapi.h"
#include "xfs_mount.h"
#include "xfs_bmap_btree.h"
#include "xfs_alloc_btree.h"
#include "xfs_ialloc_btree.h"
#include "xfs_alloc.h"
#include "xfs_btree.h"
#include "xfs_attr_sf.h"
#include "xfs_dir_sf.h"
#include "xfs_dir2_sf.h"
#include "xfs_dinode.h"
#include "xfs_inode.h"
#include "xfs_error.h"
#include "xfs_rw.h"
#include "xfs_ioctl32.h"

#include <linux/dcache.h>
#include <linux/smp_lock.h>

46
/*
 * Tentative declarations of the vm_operations tables; the initialised
 * definitions appear at the end of this file.
 */
static struct vm_operations_struct xfs_file_vm_ops;
#if defined(CONFIG_XFS_DMAPI)
static struct vm_operations_struct xfs_dmapi_file_vm_ops;
#endif /* CONFIG_XFS_DMAPI */
L
Linus Torvalds 已提交
50 51

STATIC inline ssize_t
52
__xfs_file_read(
L
Linus Torvalds 已提交
53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73
	struct kiocb		*iocb,
	char			__user *buf,
	int			ioflags,
	size_t			count,
	loff_t			pos)
{
	struct iovec		iov = {buf, count};
	struct file		*file = iocb->ki_filp;
	vnode_t			*vp = LINVFS_GET_VP(file->f_dentry->d_inode);
	ssize_t			rval;

	BUG_ON(iocb->ki_pos != pos);

	if (unlikely(file->f_flags & O_DIRECT))
		ioflags |= IO_ISDIRECT;
	VOP_READ(vp, iocb, &iov, 1, &iocb->ki_pos, ioflags, NULL, rval);
	return rval;
}


STATIC ssize_t
74
xfs_file_aio_read(
L
Linus Torvalds 已提交
75 76 77 78 79
	struct kiocb		*iocb,
	char			__user *buf,
	size_t			count,
	loff_t			pos)
{
80
	return __xfs_file_read(iocb, buf, IO_ISAIO, count, pos);
L
Linus Torvalds 已提交
81 82 83
}

STATIC ssize_t
84
xfs_file_aio_read_invis(
L
Linus Torvalds 已提交
85 86 87 88 89
	struct kiocb		*iocb,
	char			__user *buf,
	size_t			count,
	loff_t			pos)
{
90
	return __xfs_file_read(iocb, buf, IO_ISAIO|IO_INVIS, count, pos);
L
Linus Torvalds 已提交
91 92 93 94
}


STATIC inline ssize_t
95
__xfs_file_write(
L
Linus Torvalds 已提交
96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117
	struct kiocb	*iocb,
	const char	__user *buf,
	int		ioflags,
	size_t		count,
	loff_t		pos)
{
	struct iovec	iov = {(void __user *)buf, count};
	struct file	*file = iocb->ki_filp;
	struct inode	*inode = file->f_mapping->host;
	vnode_t		*vp = LINVFS_GET_VP(inode);
	ssize_t		rval;

	BUG_ON(iocb->ki_pos != pos);
	if (unlikely(file->f_flags & O_DIRECT))
		ioflags |= IO_ISDIRECT;

	VOP_WRITE(vp, iocb, &iov, 1, &iocb->ki_pos, ioflags, NULL, rval);
	return rval;
}


STATIC ssize_t
118
xfs_file_aio_write(
L
Linus Torvalds 已提交
119 120 121 122 123
	struct kiocb		*iocb,
	const char		__user *buf,
	size_t			count,
	loff_t			pos)
{
124
	return __xfs_file_write(iocb, buf, IO_ISAIO, count, pos);
L
Linus Torvalds 已提交
125 126 127
}

STATIC ssize_t
128
xfs_file_aio_write_invis(
L
Linus Torvalds 已提交
129 130 131 132 133
	struct kiocb		*iocb,
	const char		__user *buf,
	size_t			count,
	loff_t			pos)
{
134
	return __xfs_file_write(iocb, buf, IO_ISAIO|IO_INVIS, count, pos);
L
Linus Torvalds 已提交
135 136 137 138
}


STATIC inline ssize_t
139
__xfs_file_readv(
L
Linus Torvalds 已提交
140 141 142 143 144 145 146 147
	struct file		*file,
	const struct iovec 	*iov,
	int			ioflags,
	unsigned long		nr_segs,
	loff_t			*ppos)
{
	struct inode	*inode = file->f_mapping->host;
	vnode_t		*vp = LINVFS_GET_VP(inode);
148
	struct kiocb	*kiocb;
L
Linus Torvalds 已提交
149 150
	ssize_t		rval;

151 152 153 154 155 156
	kiocb = kmalloc(sizeof(*kiocb), GFP_KERNEL);
	if (unlikely(!kiocb))
		return -ENOMEM;

	init_sync_kiocb(kiocb, file);
	kiocb->ki_pos = *ppos;
L
Linus Torvalds 已提交
157 158 159

	if (unlikely(file->f_flags & O_DIRECT))
		ioflags |= IO_ISDIRECT;
160
	VOP_READ(vp, kiocb, iov, nr_segs, &kiocb->ki_pos, ioflags, NULL, rval);
L
Linus Torvalds 已提交
161

162 163
	*ppos = kiocb->ki_pos;
	kfree(kiocb);
L
Linus Torvalds 已提交
164 165 166 167
	return rval;
}

STATIC ssize_t
168
xfs_file_readv(
L
Linus Torvalds 已提交
169 170 171 172 173
	struct file		*file,
	const struct iovec 	*iov,
	unsigned long		nr_segs,
	loff_t			*ppos)
{
174
	return __xfs_file_readv(file, iov, 0, nr_segs, ppos);
L
Linus Torvalds 已提交
175 176 177
}

STATIC ssize_t
178
xfs_file_readv_invis(
L
Linus Torvalds 已提交
179 180 181 182 183
	struct file		*file,
	const struct iovec 	*iov,
	unsigned long		nr_segs,
	loff_t			*ppos)
{
184
	return __xfs_file_readv(file, iov, IO_INVIS, nr_segs, ppos);
L
Linus Torvalds 已提交
185 186 187 188
}


STATIC inline ssize_t
189
__xfs_file_writev(
L
Linus Torvalds 已提交
190 191 192 193 194 195 196 197
	struct file		*file,
	const struct iovec 	*iov,
	int			ioflags,
	unsigned long		nr_segs,
	loff_t			*ppos)
{
	struct inode	*inode = file->f_mapping->host;
	vnode_t		*vp = LINVFS_GET_VP(inode);
198
	struct kiocb	*kiocb;
L
Linus Torvalds 已提交
199 200
	ssize_t		rval;

201 202 203 204 205 206
	kiocb = kmalloc(sizeof(*kiocb), GFP_KERNEL);
	if (unlikely(!kiocb))
		return -ENOMEM;

	init_sync_kiocb(kiocb, file);
	kiocb->ki_pos = *ppos;
L
Linus Torvalds 已提交
207 208 209
	if (unlikely(file->f_flags & O_DIRECT))
		ioflags |= IO_ISDIRECT;

210
	VOP_WRITE(vp, kiocb, iov, nr_segs, &kiocb->ki_pos, ioflags, NULL, rval);
L
Linus Torvalds 已提交
211

212 213
	*ppos = kiocb->ki_pos;
	kfree(kiocb);
L
Linus Torvalds 已提交
214 215 216 217 218
	return rval;
}


STATIC ssize_t
219
xfs_file_writev(
L
Linus Torvalds 已提交
220 221 222 223 224
	struct file		*file,
	const struct iovec 	*iov,
	unsigned long		nr_segs,
	loff_t			*ppos)
{
225
	return __xfs_file_writev(file, iov, 0, nr_segs, ppos);
L
Linus Torvalds 已提交
226 227 228
}

STATIC ssize_t
229
xfs_file_writev_invis(
L
Linus Torvalds 已提交
230 231 232 233 234
	struct file		*file,
	const struct iovec 	*iov,
	unsigned long		nr_segs,
	loff_t			*ppos)
{
235
	return __xfs_file_writev(file, iov, IO_INVIS, nr_segs, ppos);
L
Linus Torvalds 已提交
236 237 238
}

STATIC ssize_t
239
xfs_file_sendfile(
L
Linus Torvalds 已提交
240 241 242 243 244 245 246 247 248 249 250 251 252 253 254
	struct file		*filp,
	loff_t			*ppos,
	size_t			count,
	read_actor_t		actor,
	void			*target)
{
	vnode_t			*vp = LINVFS_GET_VP(filp->f_dentry->d_inode);
	ssize_t			rval;

	VOP_SENDFILE(vp, filp, ppos, 0, count, actor, target, NULL, rval);
	return rval;
}


STATIC int
255
xfs_file_open(
L
Linus Torvalds 已提交
256 257 258 259 260 261 262 263 264 265 266 267 268 269 270 271
	struct inode	*inode,
	struct file	*filp)
{
	vnode_t		*vp = LINVFS_GET_VP(inode);
	int		error;

	if (!(filp->f_flags & O_LARGEFILE) && i_size_read(inode) > MAX_NON_LFS)
		return -EFBIG;

	ASSERT(vp);
	VOP_OPEN(vp, NULL, error);
	return -error;
}


STATIC int
272
xfs_file_release(
L
Linus Torvalds 已提交
273 274 275 276 277 278 279 280 281 282 283 284 285
	struct inode	*inode,
	struct file	*filp)
{
	vnode_t		*vp = LINVFS_GET_VP(inode);
	int		error = 0;

	if (vp)
		VOP_RELEASE(vp, error);
	return -error;
}


STATIC int
286
xfs_file_fsync(
L
Linus Torvalds 已提交
287 288 289 290 291 292 293 294 295 296 297 298 299 300 301 302 303 304
	struct file	*filp,
	struct dentry	*dentry,
	int		datasync)
{
	struct inode	*inode = dentry->d_inode;
	vnode_t		*vp = LINVFS_GET_VP(inode);
	int		error;
	int		flags = FSYNC_WAIT;

	if (datasync)
		flags |= FSYNC_DATA;

	ASSERT(vp);
	VOP_FSYNC(vp, flags, NULL, (xfs_off_t)0, (xfs_off_t)-1, error);
	return -error;
}

/*
 * xfs_file_readdir maps to VOP_READDIR().
 * We need to build a uio, cred, ...
 */

/*
 * Step from one xfs_dirent to the next: the following record starts
 * (dp)->d_reclen bytes after the start of dp.
 */
#define nextdp(dp)      ((struct xfs_dirent *)((char *)(dp) + (dp)->d_reclen))

311 312 313
#ifdef CONFIG_XFS_DMAPI

STATIC struct page *
314
xfs_vm_nopage(
315 316 317 318 319 320 321 322 323 324 325 326 327 328 329 330 331 332 333 334 335
	struct vm_area_struct	*area,
	unsigned long		address,
	int			*type)
{
	struct inode	*inode = area->vm_file->f_dentry->d_inode;
	vnode_t		*vp = LINVFS_GET_VP(inode);
	xfs_mount_t	*mp = XFS_VFSTOM(vp->v_vfsp);
	int		error;

	ASSERT_ALWAYS(vp->v_vfsp->vfs_flag & VFS_DMI);

	error = XFS_SEND_MMAP(mp, area, 0);
	if (error)
		return NULL;

	return filemap_nopage(area, address, type);
}

#endif /* CONFIG_XFS_DMAPI */


L
Linus Torvalds 已提交
336
STATIC int
337
xfs_file_readdir(
L
Linus Torvalds 已提交
338 339 340 341 342 343 344 345 346 347 348 349 350 351 352 353 354 355 356 357 358 359 360 361 362 363 364 365 366 367 368 369 370 371 372 373 374 375 376 377 378 379 380 381 382 383 384 385 386 387 388 389 390 391 392 393 394 395 396 397 398 399 400 401 402 403 404 405 406 407 408 409 410 411 412 413 414 415 416
	struct file	*filp,
	void		*dirent,
	filldir_t	filldir)
{
	int		error = 0;
	vnode_t		*vp;
	uio_t		uio;
	iovec_t		iov;
	int		eof = 0;
	caddr_t		read_buf;
	int		namelen, size = 0;
	size_t		rlen = PAGE_CACHE_SIZE;
	xfs_off_t	start_offset, curr_offset;
	xfs_dirent_t	*dbp = NULL;

	vp = LINVFS_GET_VP(filp->f_dentry->d_inode);
	ASSERT(vp);

	/* Try fairly hard to get memory */
	do {
		if ((read_buf = (caddr_t)kmalloc(rlen, GFP_KERNEL)))
			break;
		rlen >>= 1;
	} while (rlen >= 1024);

	if (read_buf == NULL)
		return -ENOMEM;

	uio.uio_iov = &iov;
	uio.uio_segflg = UIO_SYSSPACE;
	curr_offset = filp->f_pos;
	if (filp->f_pos != 0x7fffffff)
		uio.uio_offset = filp->f_pos;
	else
		uio.uio_offset = 0xffffffff;

	while (!eof) {
		uio.uio_resid = iov.iov_len = rlen;
		iov.iov_base = read_buf;
		uio.uio_iovcnt = 1;

		start_offset = uio.uio_offset;

		VOP_READDIR(vp, &uio, NULL, &eof, error);
		if ((uio.uio_offset == start_offset) || error) {
			size = 0;
			break;
		}

		size = rlen - uio.uio_resid;
		dbp = (xfs_dirent_t *)read_buf;
		while (size > 0) {
			namelen = strlen(dbp->d_name);

			if (filldir(dirent, dbp->d_name, namelen,
					(loff_t) curr_offset & 0x7fffffff,
					(ino_t) dbp->d_ino,
					DT_UNKNOWN)) {
				goto done;
			}
			size -= dbp->d_reclen;
			curr_offset = (loff_t)dbp->d_off /* & 0x7fffffff */;
			dbp = nextdp(dbp);
		}
	}
done:
	if (!error) {
		if (size == 0)
			filp->f_pos = uio.uio_offset & 0x7fffffff;
		else if (dbp)
			filp->f_pos = curr_offset;
	}

	kfree(read_buf);
	return -error;
}


STATIC int
417
xfs_file_mmap(
L
Linus Torvalds 已提交
418 419 420 421 422
	struct file	*filp,
	struct vm_area_struct *vma)
{
	struct inode	*ip = filp->f_dentry->d_inode;
	vnode_t		*vp = LINVFS_GET_VP(ip);
423
	vattr_t		*vattr;
L
Linus Torvalds 已提交
424 425
	int		error;

426
	vma->vm_ops = &xfs_file_vm_ops;
427 428

#ifdef CONFIG_XFS_DMAPI
429
	if (vp->v_vfsp->vfs_flag & VFS_DMI) {
430
		vma->vm_ops = &xfs_dmapi_file_vm_ops;
L
Linus Torvalds 已提交
431
	}
432
#endif /* CONFIG_XFS_DMAPI */
L
Linus Torvalds 已提交
433

434 435 436 437 438 439 440 441
	vattr = kmalloc(sizeof(*vattr), GFP_KERNEL);
	if (unlikely(!vattr))
		return -ENOMEM;
	vattr->va_mask = XFS_AT_UPDATIME;
	VOP_SETATTR(vp, vattr, XFS_AT_UPDATIME, NULL, error);
	if (likely(!error))
		__vn_revalidate(vp, vattr);	/* update flags */
	kfree(vattr);
L
Linus Torvalds 已提交
442 443 444 445 446
	return 0;
}


STATIC long
447
xfs_file_ioctl(
L
Linus Torvalds 已提交
448 449 450 451 452
	struct file	*filp,
	unsigned int	cmd,
	unsigned long	arg)
{
	int		error;
453
	struct inode	*inode = filp->f_dentry->d_inode;
L
Linus Torvalds 已提交
454 455 456 457 458 459 460 461 462 463 464 465 466 467 468
	vnode_t		*vp = LINVFS_GET_VP(inode);

	VOP_IOCTL(vp, inode, filp, 0, cmd, (void __user *)arg, error);
	VMODIFY(vp);

	/* NOTE:  some of the ioctl's return positive #'s as a
	 *	  byte count indicating success, such as
	 *	  readlink_by_handle.  So we don't "sign flip"
	 *	  like most other routines.  This means true
	 *	  errors need to be returned as a negative value.
	 */
	return error;
}

STATIC long
469
xfs_file_ioctl_invis(
L
Linus Torvalds 已提交
470 471 472 473 474
	struct file	*filp,
	unsigned int	cmd,
	unsigned long	arg)
{
	int		error;
475
	struct inode	*inode = filp->f_dentry->d_inode;
L
Linus Torvalds 已提交
476 477 478 479 480 481 482 483 484 485 486 487 488 489 490
	vnode_t		*vp = LINVFS_GET_VP(inode);

	ASSERT(vp);
	VOP_IOCTL(vp, inode, filp, IO_INVIS, cmd, (void __user *)arg, error);
	VMODIFY(vp);

	/* NOTE:  some of the ioctl's return positive #'s as a
	 *	  byte count indicating success, such as
	 *	  readlink_by_handle.  So we don't "sign flip"
	 *	  like most other routines.  This means true
	 *	  errors need to be returned as a negative value.
	 */
	return error;
}

491
#ifdef CONFIG_XFS_DMAPI
L
Linus Torvalds 已提交
492 493
#ifdef HAVE_VMOP_MPROTECT
STATIC int
494
xfs_vm_mprotect(
L
Linus Torvalds 已提交
495 496 497 498 499 500 501 502 503 504 505 506 507 508 509 510 511
	struct vm_area_struct *vma,
	unsigned int	newflags)
{
	vnode_t		*vp = LINVFS_GET_VP(vma->vm_file->f_dentry->d_inode);
	int		error = 0;

	if (vp->v_vfsp->vfs_flag & VFS_DMI) {
		if ((vma->vm_flags & VM_MAYSHARE) &&
		    (newflags & VM_WRITE) && !(vma->vm_flags & VM_WRITE)) {
			xfs_mount_t	*mp = XFS_VFSTOM(vp->v_vfsp);

			error = XFS_SEND_MMAP(mp, vma, VM_WRITE);
		    }
	}
	return error;
}
#endif /* HAVE_VMOP_MPROTECT */
512
#endif /* CONFIG_XFS_DMAPI */
L
Linus Torvalds 已提交
513 514 515 516 517 518 519 520

#ifdef HAVE_FOP_OPEN_EXEC
/* If the user is attempting to execute a file that is offline then
 * we have to trigger a DMAPI READ event before the file is marked as busy
 * otherwise the invisible I/O will not be able to write to the file to bring
 * it back online.
 */
STATIC int
521
xfs_file_open_exec(
L
Linus Torvalds 已提交
522 523 524 525 526 527 528 529
	struct inode	*inode)
{
	vnode_t		*vp = LINVFS_GET_VP(inode);
	xfs_mount_t	*mp = XFS_VFSTOM(vp->v_vfsp);
	int		error = 0;
	xfs_inode_t	*ip;

	if (vp->v_vfsp->vfs_flag & VFS_DMI) {
530 531
		ip = xfs_vtoi(vp);
		if (!ip) {
L
Linus Torvalds 已提交
532 533 534 535 536 537 538 539 540 541 542 543 544
			error = -EINVAL;
			goto open_exec_out;
		}
		if (DM_EVENT_ENABLED(vp->v_vfsp, ip, DM_EVENT_READ)) {
			error = -XFS_SEND_DATA(mp, DM_EVENT_READ, vp,
					       0, 0, 0, NULL);
		}
	}
open_exec_out:
	return error;
}
#endif /* HAVE_FOP_OPEN_EXEC */

545
struct file_operations xfs_file_operations = {
L
Linus Torvalds 已提交
546 547
	.llseek		= generic_file_llseek,
	.read		= do_sync_read,
548
	.write		= do_sync_write,
549 550 551 552 553 554
	.readv		= xfs_file_readv,
	.writev		= xfs_file_writev,
	.aio_read	= xfs_file_aio_read,
	.aio_write	= xfs_file_aio_write,
	.sendfile	= xfs_file_sendfile,
	.unlocked_ioctl	= xfs_file_ioctl,
L
Linus Torvalds 已提交
555
#ifdef CONFIG_COMPAT
556
	.compat_ioctl	= xfs_file_compat_ioctl,
L
Linus Torvalds 已提交
557
#endif
558 559 560 561
	.mmap		= xfs_file_mmap,
	.open		= xfs_file_open,
	.release	= xfs_file_release,
	.fsync		= xfs_file_fsync,
L
Linus Torvalds 已提交
562
#ifdef HAVE_FOP_OPEN_EXEC
563
	.open_exec	= xfs_file_open_exec,
L
Linus Torvalds 已提交
564 565 566
#endif
};

567
struct file_operations xfs_invis_file_operations = {
L
Linus Torvalds 已提交
568 569
	.llseek		= generic_file_llseek,
	.read		= do_sync_read,
570
	.write		= do_sync_write,
571 572 573 574 575 576
	.readv		= xfs_file_readv_invis,
	.writev		= xfs_file_writev_invis,
	.aio_read	= xfs_file_aio_read_invis,
	.aio_write	= xfs_file_aio_write_invis,
	.sendfile	= xfs_file_sendfile,
	.unlocked_ioctl	= xfs_file_ioctl_invis,
L
Linus Torvalds 已提交
577
#ifdef CONFIG_COMPAT
578
	.compat_ioctl	= xfs_file_compat_invis_ioctl,
L
Linus Torvalds 已提交
579
#endif
580 581 582 583
	.mmap		= xfs_file_mmap,
	.open		= xfs_file_open,
	.release	= xfs_file_release,
	.fsync		= xfs_file_fsync,
L
Linus Torvalds 已提交
584 585 586
};


587
struct file_operations xfs_dir_file_operations = {
L
Linus Torvalds 已提交
588
	.read		= generic_read_dir,
589 590
	.readdir	= xfs_file_readdir,
	.unlocked_ioctl	= xfs_file_ioctl,
591
#ifdef CONFIG_COMPAT
592
	.compat_ioctl	= xfs_file_compat_ioctl,
593
#endif
594
	.fsync		= xfs_file_fsync,
L
Linus Torvalds 已提交
595 596
};

597
static struct vm_operations_struct xfs_file_vm_ops = {
L
Linus Torvalds 已提交
598 599
	.nopage		= filemap_nopage,
	.populate	= filemap_populate,
600 601 602
};

#ifdef CONFIG_XFS_DMAPI
603 604
static struct vm_operations_struct xfs_dmapi_file_vm_ops = {
	.nopage		= xfs_vm_nopage,
605
	.populate	= filemap_populate,
L
Linus Torvalds 已提交
606
#ifdef HAVE_VMOP_MPROTECT
607
	.mprotect	= xfs_vm_mprotect,
L
Linus Torvalds 已提交
608 609
#endif
};
610
#endif /* CONFIG_XFS_DMAPI */