/*
 *  linux/fs/nfs/nfs4file.c
 *
 *  Copyright (C) 1992  Rick Sladkey
 */
#include <linux/fs.h>
#include <linux/file.h>
#include <linux/falloc.h>
#include <linux/nfs_fs.h>
#include "delegation.h"
#include "internal.h"
#include "iostat.h"
#include "fscache.h"
#include "pnfs.h"

#include "nfstrace.h"

#ifdef CONFIG_NFS_V4_2
#include "nfs42.h"
#endif

#define NFSDBG_FACILITY		NFSDBG_FILE

static int
nfs4_file_open(struct inode *inode, struct file *filp)
{
	struct nfs_open_context *ctx;
	struct dentry *dentry = filp->f_path.dentry;
	struct dentry *parent = NULL;
	struct inode *dir;
	unsigned openflags = filp->f_flags;
	struct iattr attr;
	int err;

	/*
	 * If no cached dentry exists or if it's negative, NFSv4 handled the
	 * opens in ->lookup() or ->create().
	 *
	 * We only get this far for a cached positive dentry.  We skipped
	 * revalidation, so handle it here by dropping the dentry and returning
	 * -EOPENSTALE.  The VFS will retry the lookup/create/open.
	 */

44
	dprintk("NFS: open file(%pd2)\n", dentry);
45

46 47 48 49
	err = nfs_check_flags(openflags);
	if (err)
		return err;

50 51 52 53 54 55 56
	if ((openflags & O_ACCMODE) == 3)
		openflags--;

	/* We can't create new files here */
	openflags &= ~(O_CREAT|O_EXCL);

	parent = dget_parent(dentry);
57
	dir = d_inode(parent);
58 59 60 61 62 63 64 65 66 67

	ctx = alloc_nfs_open_context(filp->f_path.dentry, filp->f_mode);
	err = PTR_ERR(ctx);
	if (IS_ERR(ctx))
		goto out;

	attr.ia_valid = ATTR_OPEN;
	if (openflags & O_TRUNC) {
		attr.ia_valid |= ATTR_SIZE;
		attr.ia_size = 0;
68
		nfs_sync_inode(inode);
69 70
	}

71
	inode = NFS_PROTO(dir)->open_context(dir, ctx, openflags, &attr, NULL);
72 73 74 75 76 77 78 79 80 81 82 83 84
	if (IS_ERR(inode)) {
		err = PTR_ERR(inode);
		switch (err) {
		case -EPERM:
		case -EACCES:
		case -EDQUOT:
		case -ENOSPC:
		case -EROFS:
			goto out_put_ctx;
		default:
			goto out_drop;
		}
	}
85
	if (inode != d_inode(dentry))
86 87 88 89
		goto out_drop;

	nfs_set_verifier(dentry, nfs_save_change_attribute(dir));
	nfs_file_set_open_context(filp, ctx);
90
	nfs_fscache_open_file(inode, filp);
91 92 93 94 95 96 97 98 99 100 101 102 103 104
	err = 0;

out_put_ctx:
	put_nfs_open_context(ctx);
out:
	dput(parent);
	return err;

out_drop:
	d_drop(dentry);
	err = -EOPENSTALE;
	goto out_put_ctx;
}

105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129
/*
 * Flush all dirty pages, and check for write errors.
 *
 * Returns 0 immediately for files not opened for writing; otherwise the
 * result of either vfs_fsync() or filemap_fdatawrite(), depending on what
 * nfs4_delegation_flush_on_close() reports for the inode.
 */
static int
nfs4_file_flush(struct file *file, fl_owner_t id)
{
	struct inode *inode = file_inode(file);

	dprintk("NFS: flush(%pD2)\n", file);
	nfs_inc_stats(inode, NFSIOS_VFSFLUSH);

	if (!(file->f_mode & FMODE_WRITE))
		return 0;

	/* Flush writes to the server and return any errors */
	if (nfs4_delegation_flush_on_close(inode))
		return vfs_fsync(file, 0);

	/*
	 * We're holding a write delegation that does not require flushing
	 * the i/o on close, so just start the i/o now.
	 */
	return filemap_fdatawrite(file->f_mapping);
}

130 131 132 133
/*
 * fsync handler for an NFSv4 file.
 *
 * @file:     file to synchronise.
 * @start:    first byte of the range to write back.
 * @end:      last byte of the range to write back.
 * @datasync: passed to nfs_file_fsync_commit() and, normalised to 0/1,
 *            to pnfs_sync_inode().
 *
 * Waits for outstanding direct I/O, then repeatedly writes back the range,
 * commits it and syncs pNFS state under the inode mutex.  The loop repeats
 * for as long as the result is -EAGAIN.  Returns 0 or the first other error.
 */
static int
nfs4_file_fsync(struct file *file, loff_t start, loff_t end, int datasync)
{
	int ret;
	struct inode *inode = file_inode(file);

	trace_nfs_fsync_enter(inode);

	nfs_inode_dio_wait(inode);
	do {
		ret = filemap_write_and_wait_range(inode->i_mapping, start, end);
		if (ret != 0)
			break;
		mutex_lock(&inode->i_mutex);
		ret = nfs_file_fsync_commit(file, start, end, datasync);
		if (!ret)
			ret = pnfs_sync_inode(inode, !!datasync);
		mutex_unlock(&inode->i_mutex);
		/*
		 * If nfs_file_fsync_commit detected a server reboot, then
		 * resend all dirty pages that might have been covered by
		 * the NFS_CONTEXT_RESEND_WRITES flag
		 */
		start = 0;
		end = LLONG_MAX;
	} while (ret == -EAGAIN);

	trace_nfs_fsync_exit(inode, ret);
	return ret;
}

#ifdef CONFIG_NFS_V4_2
/*
 * llseek handler: SEEK_HOLE and SEEK_DATA are first tried through
 * nfs42_proc_llseek(); every other whence value, and the case where that
 * call answers -ENOTSUPP, is served by nfs_file_llseek().
 */
static loff_t nfs4_file_llseek(struct file *filep, loff_t offset, int whence)
{
	if (whence == SEEK_HOLE || whence == SEEK_DATA) {
		loff_t pos = nfs42_proc_llseek(filep, offset, whence);

		if (pos != -ENOTSUPP)
			return pos;
	}

	return nfs_file_llseek(filep, offset, whence);
}
A
Anna Schumaker 已提交
176 177 178 179 180 181 182 183 184

/*
 * fallocate handler for NFSv4.2.
 *
 * @filep:  file to operate on; must refer to a regular file.
 * @mode:   either 0 (allocate) or exactly
 *          FALLOC_FL_PUNCH_HOLE | FALLOC_FL_KEEP_SIZE (deallocate).
 * @offset: start of the range.
 * @len:    length of the range.
 *
 * Returns -EOPNOTSUPP for non-regular files or any other mode, a negative
 * error from inode_newsize_ok() if offset + len is not an acceptable size,
 * and otherwise the result of nfs42_proc_deallocate() or
 * nfs42_proc_allocate().
 */
static long nfs42_fallocate(struct file *filep, int mode, loff_t offset, loff_t len)
{
	struct inode *inode = file_inode(filep);
	long ret;

	if (!S_ISREG(inode->i_mode))
		return -EOPNOTSUPP;

	if ((mode != 0) && (mode != (FALLOC_FL_PUNCH_HOLE | FALLOC_FL_KEEP_SIZE)))
		return -EOPNOTSUPP;

	ret = inode_newsize_ok(inode, offset + len);
	if (ret < 0)
		return ret;

	if (mode & FALLOC_FL_PUNCH_HOLE)
		return nfs42_proc_deallocate(filep, offset, len);
	return nfs42_proc_allocate(filep, offset, len);
}
P
Peng Tao 已提交
196 197 198 199 200 201

/*
 * Clone a byte range from another open file into @dst_file.
 *
 * @dst_file: destination; must be open for writing.
 * @srcfd:    file descriptor of the source; must be open for reading.
 * @src_off:  offset in the source file.
 * @dst_off:  offset in the destination file.
 * @count:    number of bytes to clone.
 *
 * Returns 0 on success or a negative errno:
 *   -EINVAL  destination not writable, source not readable, source and
 *            destination are the same inode, or the offsets/count violate
 *            the server's clone_blksize alignment;
 *   -EBADF   @srcfd is not a valid descriptor;
 *   -EISDIR  either file is not a regular file;
 *   -EXDEV   the files are on different mounts or superblocks;
 * or whatever mnt_want_write_file(), nfs_sync_inode() or nfs42_proc_clone()
 * report.
 */
static noinline long
nfs42_ioctl_clone(struct file *dst_file, unsigned long srcfd,
		  u64 src_off, u64 dst_off, u64 count)
{
	struct inode *dst_inode = file_inode(dst_file);
	struct nfs_server *server = NFS_SERVER(dst_inode);
	struct fd src_file;
	struct inode *src_inode;
	unsigned int bs = server->clone_blksize;
	int ret;

	/* dst file must be opened for writing */
	if (!(dst_file->f_mode & FMODE_WRITE))
		return -EINVAL;

	ret = mnt_want_write_file(dst_file);
	if (ret)
		return ret;

	src_file = fdget(srcfd);
	if (!src_file.file) {
		ret = -EBADF;
		goto out_drop_write;
	}

	src_inode = file_inode(src_file.file);

	/* src and dst must be different files */
	ret = -EINVAL;
	if (src_inode == dst_inode)
		goto out_fput;

	/* src file must be opened for reading */
	if (!(src_file.file->f_mode & FMODE_READ))
		goto out_fput;

	/* src and dst must be regular files */
	ret = -EISDIR;
	if (!S_ISREG(src_inode->i_mode) || !S_ISREG(dst_inode->i_mode))
		goto out_fput;

	ret = -EXDEV;
	if (src_file.file->f_path.mnt != dst_file->f_path.mnt ||
	    src_inode->i_sb != dst_inode->i_sb)
		goto out_fput;

	/*
	 * check alignment w.r.t. clone_blksize: both offsets must be aligned,
	 * and an unaligned count is only accepted when the range ends exactly
	 * at the source file's size.
	 */
	ret = -EINVAL;
	if (bs) {
		if (!IS_ALIGNED(src_off, bs) || !IS_ALIGNED(dst_off, bs))
			goto out_fput;
		if (!IS_ALIGNED(count, bs) && i_size_read(src_inode) != (src_off + count))
			goto out_fput;
	}

	/*
	 * XXX: do we lock at all? what if server needs CB_RECALL_LAYOUT?
	 *
	 * The two inode mutexes are always taken lowest address first so that
	 * concurrent clones between the same pair of files cannot deadlock.
	 */
	if (dst_inode < src_inode) {
		mutex_lock_nested(&dst_inode->i_mutex, I_MUTEX_PARENT);
		mutex_lock_nested(&src_inode->i_mutex, I_MUTEX_CHILD);
	} else {
		mutex_lock_nested(&src_inode->i_mutex, I_MUTEX_PARENT);
		mutex_lock_nested(&dst_inode->i_mutex, I_MUTEX_CHILD);
	}

	/* flush all pending writes on both src and dst so that server
	 * has the latest data */
	ret = nfs_sync_inode(src_inode);
	if (ret)
		goto out_unlock;
	ret = nfs_sync_inode(dst_inode);
	if (ret)
		goto out_unlock;

	ret = nfs42_proc_clone(src_file.file, dst_file, src_off, dst_off, count);

	/* truncate inode page cache of the dst range so that future reads can fetch
	 * new data from server */
	if (!ret) {
		/*
		 * With count == 0 the expression dst_off + count - 1 only
		 * covers the intended range when dst_off is also 0; for any
		 * other dst_off it describes an empty range and stale pages
		 * would be kept.  Pass -1 ("through end of file") explicitly.
		 * NOTE(review): assumes a zero count means "clone to EOF" in
		 * nfs42_proc_clone() - confirm.
		 */
		loff_t last = count ? (loff_t)(dst_off + count - 1) : (loff_t)-1;

		truncate_inode_pages_range(&dst_inode->i_data, dst_off, last);
	}

out_unlock:
	/* Release in the reverse of the acquisition order above. */
	if (dst_inode < src_inode) {
		mutex_unlock(&src_inode->i_mutex);
		mutex_unlock(&dst_inode->i_mutex);
	} else {
		mutex_unlock(&dst_inode->i_mutex);
		mutex_unlock(&src_inode->i_mutex);
	}
out_fput:
	fdput(src_file);
out_drop_write:
	mnt_drop_write_file(dst_file);
	return ret;
}
#endif /* CONFIG_NFS_V4_2 */

/*
 * ioctl entry point.  When CONFIG_NFS_V4_2 is enabled, NFS_IOC_CLONE is
 * forwarded to nfs42_ioctl_clone() with @arg as the source descriptor and
 * zero offsets/count; every other command yields -ENOTTY.
 */
long nfs4_ioctl(struct file *file, unsigned int cmd, unsigned long arg)
{
#ifdef CONFIG_NFS_V4_2
	if (cmd == NFS_IOC_CLONE)
		return nfs42_ioctl_clone(file, arg, 0, 0, 0);
#endif

	return -ENOTTY;
}

305
const struct file_operations nfs4_file_operations = {
A
Anna Schumaker 已提交
306 307 308
#ifdef CONFIG_NFS_V4_2
	.llseek		= nfs4_file_llseek,
#else
309
	.llseek		= nfs_file_llseek,
A
Anna Schumaker 已提交
310
#endif
A
Al Viro 已提交
311
	.read_iter	= nfs_file_read,
A
Al Viro 已提交
312
	.write_iter	= nfs_file_write,
313 314
	.mmap		= nfs_file_mmap,
	.open		= nfs4_file_open,
315
	.flush		= nfs4_file_flush,
316 317 318 319 320
	.release	= nfs_file_release,
	.fsync		= nfs4_file_fsync,
	.lock		= nfs_lock,
	.flock		= nfs_flock,
	.splice_read	= nfs_file_splice_read,
321
	.splice_write	= iter_file_splice_write,
A
Anna Schumaker 已提交
322 323 324
#ifdef CONFIG_NFS_V4_2
	.fallocate	= nfs42_fallocate,
#endif /* CONFIG_NFS_V4_2 */
325
	.check_flags	= nfs_check_flags,
326
	.setlease	= simple_nosetlease,
P
Peng Tao 已提交
327 328 329 330 331
#ifdef CONFIG_COMPAT
	.unlocked_ioctl = nfs4_ioctl,
#else
	.compat_ioctl	= nfs4_ioctl,
#endif /* CONFIG_COMPAT */
332
};