// SPDX-License-Identifier: GPL-2.0
/*
 * fs/f2fs/file.c
 *
 * Copyright (c) 2012 Samsung Electronics Co., Ltd.
 *             http://www.samsung.com/
 */
#include <linux/fs.h>
#include <linux/f2fs_fs.h>
#include <linux/stat.h>
#include <linux/buffer_head.h>
#include <linux/writeback.h>
13
#include <linux/blkdev.h>
J
Jaegeuk Kim 已提交
14 15
#include <linux/falloc.h>
#include <linux/types.h>
16
#include <linux/compat.h>
J
Jaegeuk Kim 已提交
17 18
#include <linux/uaccess.h>
#include <linux/mount.h>
19
#include <linux/pagevec.h>
20
#include <linux/uio.h>
21
#include <linux/uuid.h>
22
#include <linux/file.h>
C
Chao Yu 已提交
23
#include <linux/nls.h>
24
#include <linux/sched/signal.h>
J
Jaegeuk Kim 已提交
25 26 27 28 29 30

#include "f2fs.h"
#include "node.h"
#include "segment.h"
#include "xattr.h"
#include "acl.h"
31
#include "gc.h"
J
Jaegeuk Kim 已提交
32
#include "trace.h"
33
#include <trace/events/f2fs.h>
34
#include <uapi/linux/f2fs.h>
J
Jaegeuk Kim 已提交
35

36
static vm_fault_t f2fs_filemap_fault(struct vm_fault *vmf)
37 38
{
	struct inode *inode = file_inode(vmf->vma->vm_file);
39
	vm_fault_t ret;
40 41

	down_read(&F2FS_I(inode)->i_mmap_sem);
42
	ret = filemap_fault(vmf);
43 44
	up_read(&F2FS_I(inode)->i_mmap_sem);

C
Chao Yu 已提交
45 46 47 48
	if (!ret)
		f2fs_update_iostat(F2FS_I_SB(inode), APP_MAPPED_READ_IO,
							F2FS_BLKSIZE);

49 50
	trace_f2fs_filemap_fault(inode, vmf->pgoff, (unsigned long)ret);

51
	return ret;
52 53
}

54
static vm_fault_t f2fs_vm_page_mkwrite(struct vm_fault *vmf)
J
Jaegeuk Kim 已提交
55 56
{
	struct page *page = vmf->page;
57
	struct inode *inode = file_inode(vmf->vma->vm_file);
58
	struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
59
	struct dnode_of_data dn;
C
Chao Yu 已提交
60 61
	bool need_alloc = true;
	int err = 0;
J
Jaegeuk Kim 已提交
62

63 64 65 66 67
	if (unlikely(f2fs_cp_error(sbi))) {
		err = -EIO;
		goto err;
	}

68 69
	if (!f2fs_is_checkpoint_ready(sbi)) {
		err = -ENOSPC;
70
		goto err;
71
	}
72

C
Chao Yu 已提交
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88
#ifdef CONFIG_F2FS_FS_COMPRESSION
	if (f2fs_compressed_file(inode)) {
		int ret = f2fs_is_compressed_cluster(inode, page->index);

		if (ret < 0) {
			err = ret;
			goto err;
		} else if (ret) {
			if (ret < F2FS_I(inode)->i_cluster_size) {
				err = -EAGAIN;
				goto err;
			}
			need_alloc = false;
		}
	}
#endif
89
	/* should do out of any locked page */
C
Chao Yu 已提交
90 91
	if (need_alloc)
		f2fs_balance_fs(sbi, true);
92

J
Jaegeuk Kim 已提交
93
	sb_start_pagefault(inode->i_sb);
94 95

	f2fs_bug_on(sbi, f2fs_has_inline_data(inode));
96

97
	file_update_time(vmf->vma->vm_file);
98
	down_read(&F2FS_I(inode)->i_mmap_sem);
J
Jaegeuk Kim 已提交
99
	lock_page(page);
100
	if (unlikely(page->mapping != inode->i_mapping ||
101
			page_offset(page) > i_size_read(inode) ||
102
			!PageUptodate(page))) {
J
Jaegeuk Kim 已提交
103 104
		unlock_page(page);
		err = -EFAULT;
105
		goto out_sem;
J
Jaegeuk Kim 已提交
106 107
	}

C
Chao Yu 已提交
108 109
	if (need_alloc) {
		/* block allocation */
C
Chao Yu 已提交
110
		f2fs_do_map_lock(sbi, F2FS_GET_BLOCK_PRE_AIO, true);
C
Chao Yu 已提交
111 112 113
		set_new_dnode(&dn, inode, NULL, NULL, 0);
		err = f2fs_get_block(&dn, page->index);
		f2fs_put_dnode(&dn);
C
Chao Yu 已提交
114
		f2fs_do_map_lock(sbi, F2FS_GET_BLOCK_PRE_AIO, false);
C
Chao Yu 已提交
115 116
	}

117 118 119 120 121 122 123 124 125 126
#ifdef CONFIG_F2FS_FS_COMPRESSION
	if (!need_alloc) {
		set_new_dnode(&dn, inode, NULL, NULL, 0);
		err = f2fs_get_dnode_of_data(&dn, page->index, LOOKUP_NODE);
		f2fs_put_dnode(&dn);
	}
#endif
	if (err) {
		unlock_page(page);
		goto out_sem;
C
Chao Yu 已提交
127 128
	}

129
	f2fs_wait_on_page_writeback(page, DATA, false, true);
C
Chao Yu 已提交
130 131 132 133

	/* wait for GCed page writeback via META_MAPPING */
	f2fs_wait_on_block_writeback(inode, dn.data_blkaddr);

J
Jaegeuk Kim 已提交
134 135 136 137
	/*
	 * check to see if the page is mapped already (no holes)
	 */
	if (PageMappedToDisk(page))
C
Chao Yu 已提交
138
		goto out_sem;
J
Jaegeuk Kim 已提交
139 140

	/* page is wholly or partially inside EOF */
141
	if (((loff_t)(page->index + 1) << PAGE_SHIFT) >
C
Chao Yu 已提交
142
						i_size_read(inode)) {
143
		loff_t offset;
144

145 146
		offset = i_size_read(inode) & ~PAGE_MASK;
		zero_user_segment(page, offset, PAGE_SIZE);
J
Jaegeuk Kim 已提交
147 148
	}
	set_page_dirty(page);
149 150
	if (!PageUptodate(page))
		SetPageUptodate(page);
J
Jaegeuk Kim 已提交
151

C
Chao Yu 已提交
152
	f2fs_update_iostat(sbi, APP_MAPPED_IO, F2FS_BLKSIZE);
153
	f2fs_update_time(sbi, REQ_TIME);
C
Chao Yu 已提交
154

155
	trace_f2fs_vm_page_mkwrite(page, DATA);
156 157
out_sem:
	up_read(&F2FS_I(inode)->i_mmap_sem);
C
Chao Yu 已提交
158

J
Jaegeuk Kim 已提交
159
	sb_end_pagefault(inode->i_sb);
160
err:
J
Jaegeuk Kim 已提交
161 162 163 164
	return block_page_mkwrite_return(err);
}

static const struct vm_operations_struct f2fs_file_vm_ops = {
165
	.fault		= f2fs_filemap_fault,
166
	.map_pages	= filemap_map_pages,
167
	.page_mkwrite	= f2fs_vm_page_mkwrite,
J
Jaegeuk Kim 已提交
168 169
};

170 171 172 173
/*
 * Look up the parent inode number of @inode through one of its dentry
 * aliases.
 *
 * On success *@pino is set and 1 is returned; if no alias is found, 0 is
 * returned and *@pino is left untouched.
 */
static int get_parent_ino(struct inode *inode, nid_t *pino)
{
	struct dentry *dentry;

	/*
	 * Make sure to get the non-deleted alias.  The alias associated with
	 * the open file descriptor being fsync()'ed may be deleted already.
	 */
	dentry = d_find_alias(inode);
	if (!dentry)
		return 0;

	*pino = parent_ino(dentry);
	dput(dentry);
	return 1;
}

C
Chao Yu 已提交
187
static inline enum cp_reason_type need_do_checkpoint(struct inode *inode)
188
{
189
	struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
C
Chao Yu 已提交
190
	enum cp_reason_type cp_reason = CP_NO_NEEDED;
191

C
Chao Yu 已提交
192 193
	if (!S_ISREG(inode->i_mode))
		cp_reason = CP_NON_REGULAR;
C
Chao Yu 已提交
194 195
	else if (f2fs_compressed_file(inode))
		cp_reason = CP_COMPRESSED;
C
Chao Yu 已提交
196 197
	else if (inode->i_nlink != 1)
		cp_reason = CP_HARDLINK;
198
	else if (is_sbi_flag_set(sbi, SBI_NEED_CP))
C
Chao Yu 已提交
199
		cp_reason = CP_SB_NEED_CP;
200
	else if (file_wrong_pino(inode))
C
Chao Yu 已提交
201
		cp_reason = CP_WRONG_PINO;
C
Chao Yu 已提交
202
	else if (!f2fs_space_for_roll_forward(sbi))
C
Chao Yu 已提交
203
		cp_reason = CP_NO_SPC_ROLL;
C
Chao Yu 已提交
204
	else if (!f2fs_is_checkpointed_node(sbi, F2FS_I(inode)->i_pino))
C
Chao Yu 已提交
205
		cp_reason = CP_NODE_NEED_CP;
206
	else if (test_opt(sbi, FASTBOOT))
C
Chao Yu 已提交
207
		cp_reason = CP_FASTBOOT_MODE;
208
	else if (F2FS_OPTION(sbi).active_logs == 2)
C
Chao Yu 已提交
209
		cp_reason = CP_SPEC_LOG_NUM;
210
	else if (F2FS_OPTION(sbi).fsync_mode == FSYNC_MODE_STRICT &&
C
Chao Yu 已提交
211 212 213
		f2fs_need_dentry_mark(sbi, inode->i_ino) &&
		f2fs_exist_written_data(sbi, F2FS_I(inode)->i_pino,
							TRANS_DIR_INO))
214
		cp_reason = CP_RECOVER_DIR;
215

C
Chao Yu 已提交
216
	return cp_reason;
217 218
}

219 220 221 222 223
/*
 * Report whether the inode block of @ino still has to be written.
 *
 * Returns true when the inode's page is cached in the node mapping and
 * dirty, or when f2fs_need_inode_block_update() says so.  The page
 * reference taken by find_get_page() is released through f2fs_put_page()
 * (which is also called when no page was found).
 */
static bool need_inode_page_update(struct f2fs_sb_info *sbi, nid_t ino)
{
	struct page *i = find_get_page(NODE_MAPPING(sbi), ino);
	bool ret = false;
	/* But we need to avoid that there are some inode updates */
	if ((i && PageDirty(i)) || f2fs_need_inode_block_update(sbi, ino))
		ret = true;
	f2fs_put_page(i, 0);
	return ret;
}

230 231 232 233 234 235 236 237
/*
 * Repair the recorded parent inode number of @inode if it is flagged wrong.
 *
 * Under i_sem held for write: when the inode is marked as having a wrong
 * pino, has exactly one link, and a dentry alias can be found, the parent
 * ino is stored and the inode is marked as having a valid pino.
 */
static void try_to_fix_pino(struct inode *inode)
{
	struct f2fs_inode_info *fi = F2FS_I(inode);
	nid_t pino;

	down_write(&fi->i_sem);
	if (file_wrong_pino(inode) && inode->i_nlink == 1 &&
			get_parent_ino(inode, &pino)) {
		f2fs_i_pino_write(inode, pino);
		file_got_pino(inode);
	}
	up_write(&fi->i_sem);
}

244 245
/*
 * Core of fsync()/fdatasync() for f2fs.
 *
 * @file:     file being synced
 * @start:    start of the byte range handed to file_write_and_wait_range()
 * @end:      end of that byte range
 * @datasync: non-zero for fdatasync semantics
 * @atomic:   when true, node writeback is not waited for and no flush is
 *            issued (see the comment before the !atomic check below)
 *
 * Returns 0 immediately on a read-only filesystem or when checkpointing is
 * disabled.  Otherwise data is written back first; then either a full
 * checkpoint is taken (when need_do_checkpoint() gives a reason) or only
 * the inode's node pages are synced.  Returns 0 or a negative errno.
 */
static int f2fs_do_sync_file(struct file *file, loff_t start, loff_t end,
						int datasync, bool atomic)
{
	struct inode *inode = file->f_mapping->host;
	struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
	nid_t ino = inode->i_ino;
	int ret = 0;
	enum cp_reason_type cp_reason = 0;
	struct writeback_control wbc = {
		.sync_mode = WB_SYNC_ALL,
		.nr_to_write = LONG_MAX,
		.for_reclaim = 0,
	};
	unsigned int seq_id = 0;

	if (unlikely(f2fs_readonly(inode->i_sb) ||
				is_sbi_flag_set(sbi, SBI_CP_DISABLED)))
		return 0;

	trace_f2fs_sync_file_enter(inode);

	/* directories skip data writeback and go straight to node sync */
	if (S_ISDIR(inode->i_mode))
		goto go_write;

	/* if fdatasync is triggered, let's do in-place-update */
	if (datasync || get_dirty_pages(inode) <= SM_I(sbi)->min_fsync_blocks)
		set_inode_flag(inode, FI_NEED_IPU);
	ret = file_write_and_wait_range(file, start, end);
	clear_inode_flag(inode, FI_NEED_IPU);

	if (ret) {
		trace_f2fs_sync_file_exit(inode, cp_reason, datasync, ret);
		return ret;
	}

	/* if the inode is dirty, let's recover all the time */
	if (!f2fs_skip_inode_update(inode, datasync)) {
		f2fs_write_inode(inode, NULL);
		goto go_write;
	}

	/*
	 * if there is no written data, don't waste time to write recovery info.
	 */
	if (!is_inode_flag_set(inode, FI_APPEND_WRITE) &&
			!f2fs_exist_written_data(sbi, ino, APPEND_INO)) {

		/* it may call write_inode just prior to fsync */
		if (need_inode_page_update(sbi, ino))
			goto go_write;

		if (is_inode_flag_set(inode, FI_UPDATE_WRITE) ||
				f2fs_exist_written_data(sbi, ino, UPDATE_INO))
			goto flush_out;
		goto out;
	}
go_write:
	/*
	 * Both of fdatasync() and fsync() are able to be recovered from
	 * sudden-power-off.
	 */
	down_read(&F2FS_I(inode)->i_sem);
	cp_reason = need_do_checkpoint(inode);
	up_read(&F2FS_I(inode)->i_sem);

	if (cp_reason) {
		/* all the dirty node pages should be flushed for POR */
		ret = f2fs_sync_fs(inode->i_sb, 1);

		/*
		 * We've secured consistency through sync_fs. Following pino
		 * will be used only for fsynced inodes after checkpoint.
		 */
		try_to_fix_pino(inode);
		clear_inode_flag(inode, FI_APPEND_WRITE);
		clear_inode_flag(inode, FI_UPDATE_WRITE);
		goto out;
	}
sync_nodes:
	atomic_inc(&sbi->wb_sync_req[NODE]);
	ret = f2fs_fsync_node_pages(sbi, inode, &wbc, atomic, &seq_id);
	atomic_dec(&sbi->wb_sync_req[NODE]);
	if (ret)
		goto out;

	/* if cp_error was enabled, we should avoid infinite loop */
	if (unlikely(f2fs_cp_error(sbi))) {
		ret = -EIO;
		goto out;
	}

	/* the inode block changed again: rewrite it and sync nodes once more */
	if (f2fs_need_inode_block_update(sbi, ino)) {
		f2fs_mark_inode_dirty_sync(inode, true);
		f2fs_write_inode(inode, NULL);
		goto sync_nodes;
	}

	/*
	 * If it's atomic_write, it's just fine to keep write ordering. So
	 * here we don't need to wait for node write completion, since we use
	 * node chain which serializes node blocks. If one of node writes are
	 * reordered, we can see simply broken chain, resulting in stopping
	 * roll-forward recovery. It means we'll recover all or none node blocks
	 * given fsync mark.
	 */
	if (!atomic) {
		ret = f2fs_wait_on_node_pages_writeback(sbi, seq_id);
		if (ret)
			goto out;
	}

	/* once recovery info is written, don't need to track this */
	f2fs_remove_ino_entry(sbi, ino, APPEND_INO);
	clear_inode_flag(inode, FI_APPEND_WRITE);
flush_out:
	if (!atomic && F2FS_OPTION(sbi).fsync_mode != FSYNC_MODE_NOBARRIER)
		ret = f2fs_issue_flush(sbi, inode->i_ino);
	if (!ret) {
		f2fs_remove_ino_entry(sbi, ino, UPDATE_INO);
		clear_inode_flag(inode, FI_UPDATE_WRITE);
		f2fs_remove_ino_entry(sbi, ino, FLUSH_INO);
	}
	f2fs_update_time(sbi, REQ_TIME);
out:
	trace_f2fs_sync_file_exit(inode, cp_reason, datasync, ret);
	f2fs_trace_ios(NULL, 1);
	return ret;
}

373 374
/*
 * fsync entry point: returns -EIO if the filesystem hit a checkpoint error,
 * otherwise performs a non-atomic sync through f2fs_do_sync_file().
 */
int f2fs_sync_file(struct file *file, loff_t start, loff_t end, int datasync)
{
	if (unlikely(f2fs_cp_error(F2FS_I_SB(file_inode(file)))))
		return -EIO;
	return f2fs_do_sync_file(file, start, end, datasync, false);
}

380 381
/*
 * Test whether the block at @index with address @blkaddr satisfies the seek
 * request @whence.
 *
 * SEEK_DATA matches a valid data block address, or a NEW_ADDR block whose
 * page-cache entry carries the dirty tag.  SEEK_HOLE matches NULL_ADDR.
 * Any other @whence value never matches.
 */
static bool __found_offset(struct address_space *mapping, block_t blkaddr,
				pgoff_t index, int whence)
{
	switch (whence) {
	case SEEK_DATA:
		if (__is_valid_data_blkaddr(blkaddr))
			return true;
		if (blkaddr == NEW_ADDR &&
		    xa_get_mark(&mapping->i_pages, index, PAGECACHE_TAG_DIRTY))
			return true;
		break;
	case SEEK_HOLE:
		if (blkaddr == NULL_ADDR)
			return true;
		break;
	}
	return false;
}

399 400 401 402 403
/*
 * Implement SEEK_DATA / SEEK_HOLE for @file starting at @offset.
 *
 * Runs with the inode lock held.  Walks the dnodes covering the file from
 * @offset up to i_size and stops at the first block that __found_offset()
 * accepts for @whence.  Returns the new file position set via vfs_setpos(),
 * or -ENXIO when @offset is at or beyond i_size, when a lookup fails, when
 * an invalid block address is met, or when SEEK_DATA finds no data.
 */
static loff_t f2fs_seek_block(struct file *file, loff_t offset, int whence)
{
	struct inode *inode = file->f_mapping->host;
	loff_t maxbytes = inode->i_sb->s_maxbytes;
	struct dnode_of_data dn;
	pgoff_t pgofs, end_offset;
	loff_t data_ofs = offset;
	loff_t isize;
	int err = 0;

	inode_lock(inode);

	isize = i_size_read(inode);
	if (offset >= isize)
		goto fail;

	/* handle inline data case */
	if (f2fs_has_inline_data(inode)) {
		if (whence == SEEK_HOLE) {
			data_ofs = isize;
			goto found;
		} else if (whence == SEEK_DATA) {
			data_ofs = offset;
			goto found;
		}
	}

	pgofs = (pgoff_t)(offset >> PAGE_SHIFT);

	for (; data_ofs < isize; data_ofs = (loff_t)pgofs << PAGE_SHIFT) {
		set_new_dnode(&dn, inode, NULL, NULL, 0);
		err = f2fs_get_dnode_of_data(&dn, pgofs, LOOKUP_NODE);
		if (err && err != -ENOENT) {
			goto fail;
		} else if (err == -ENOENT) {
			/* direct node does not exist */
			if (whence == SEEK_DATA) {
				pgofs = f2fs_get_next_page_offset(&dn, pgofs);
				continue;
			} else {
				goto found;
			}
		}

		end_offset = ADDRS_PER_PAGE(dn.node_page, inode);

		/* find data/hole in dnode block */
		for (; dn.ofs_in_node < end_offset;
				dn.ofs_in_node++, pgofs++,
				data_ofs = (loff_t)pgofs << PAGE_SHIFT) {
			block_t blkaddr;

			blkaddr = f2fs_data_blkaddr(&dn);

			/* give up on a block address that fails validation */
			if (__is_valid_data_blkaddr(blkaddr) &&
				!f2fs_is_valid_blkaddr(F2FS_I_SB(inode),
					blkaddr, DATA_GENERIC_ENHANCE)) {
				f2fs_put_dnode(&dn);
				goto fail;
			}

			if (__found_offset(file->f_mapping, blkaddr,
							pgofs, whence)) {
				f2fs_put_dnode(&dn);
				goto found;
			}
		}
		f2fs_put_dnode(&dn);
	}

	if (whence == SEEK_DATA)
		goto fail;
found:
	/* a hole position is never reported beyond i_size */
	if (whence == SEEK_HOLE && data_ofs > isize)
		data_ofs = isize;
	inode_unlock(inode);
	return vfs_setpos(file, data_ofs, maxbytes);
fail:
	inode_unlock(inode);
	return -ENXIO;
}

/*
 * llseek handler.
 *
 * SEEK_SET/SEEK_CUR/SEEK_END are delegated to generic_file_llseek_size().
 * SEEK_DATA/SEEK_HOLE reject a negative @offset with -ENXIO and otherwise
 * go through f2fs_seek_block().  Any other @whence returns -EINVAL.
 */
static loff_t f2fs_llseek(struct file *file, loff_t offset, int whence)
{
	struct inode *inode = file->f_mapping->host;
	loff_t maxbytes = inode->i_sb->s_maxbytes;

	switch (whence) {
	case SEEK_SET:
	case SEEK_CUR:
	case SEEK_END:
		return generic_file_llseek_size(file, offset, whence,
						maxbytes, i_size_read(inode));
	case SEEK_DATA:
	case SEEK_HOLE:
		if (offset < 0)
			return -ENXIO;
		return f2fs_seek_block(file, offset, whence);
	}

	return -EINVAL;
}

J
Jaegeuk Kim 已提交
502 503
static int f2fs_file_mmap(struct file *file, struct vm_area_struct *vma)
{
504
	struct inode *inode = file_inode(file);
505
	int err;
506

507 508 509
	if (unlikely(f2fs_cp_error(F2FS_I_SB(inode))))
		return -EIO;

C
Chao Yu 已提交
510 511 512
	if (!f2fs_is_compress_backend_ready(inode))
		return -EOPNOTSUPP;

513
	/* we don't need to use inline_data strictly */
514 515 516
	err = f2fs_convert_inline_inode(inode);
	if (err)
		return err;
517

J
Jaegeuk Kim 已提交
518 519
	file_accessed(file);
	vma->vm_ops = &f2fs_file_vm_ops;
C
Chao Yu 已提交
520
	set_inode_flag(inode, FI_MMAP_FILE);
J
Jaegeuk Kim 已提交
521 522 523
	return 0;
}

524 525
static int f2fs_file_open(struct inode *inode, struct file *filp)
{
526
	int err = fscrypt_file_open(inode, filp);
527

E
Eric Biggers 已提交
528 529 530
	if (err)
		return err;

C
Chao Yu 已提交
531 532 533
	if (!f2fs_is_compress_backend_ready(inode))
		return -EOPNOTSUPP;

E
Eric Biggers 已提交
534
	err = fsverity_file_open(inode, filp);
535 536
	if (err)
		return err;
H
Hyunchul Lee 已提交
537 538 539

	filp->f_mode |= FMODE_NOWAIT;

C
Chao Yu 已提交
540
	return dquot_file_open(inode, filp);
541 542
}

C
Chao Yu 已提交
543
void f2fs_truncate_data_blocks_range(struct dnode_of_data *dn, int count)
J
Jaegeuk Kim 已提交
544
{
545
	struct f2fs_sb_info *sbi = F2FS_I_SB(dn->inode);
J
Jaegeuk Kim 已提交
546
	struct f2fs_node *raw_node;
C
Chao Yu 已提交
547
	int nr_free = 0, ofs = dn->ofs_in_node, len = count;
J
Jaegeuk Kim 已提交
548
	__le32 *addr;
549
	int base = 0;
C
Chao Yu 已提交
550 551 552
	bool compressed_cluster = false;
	int cluster_index = 0, valid_blocks = 0;
	int cluster_size = F2FS_I(dn->inode)->i_cluster_size;
553
	bool released = !atomic_read(&F2FS_I(dn->inode)->i_compr_blocks);
554 555 556

	if (IS_INODE(dn->node_page) && f2fs_has_extra_attr(dn->inode))
		base = get_extra_isize(dn->inode);
J
Jaegeuk Kim 已提交
557

558
	raw_node = F2FS_NODE(dn->node_page);
559
	addr = blkaddr_in_node(raw_node) + base + ofs;
J
Jaegeuk Kim 已提交
560

C
Chao Yu 已提交
561 562
	/* Assumption: truncateion starts with cluster */
	for (; count > 0; count--, addr++, dn->ofs_in_node++, cluster_index++) {
J
Jaegeuk Kim 已提交
563
		block_t blkaddr = le32_to_cpu(*addr);
564

C
Chao Yu 已提交
565 566 567 568 569 570 571 572 573
		if (f2fs_compressed_file(dn->inode) &&
					!(cluster_index & (cluster_size - 1))) {
			if (compressed_cluster)
				f2fs_i_compr_blocks_update(dn->inode,
							valid_blocks, false);
			compressed_cluster = (blkaddr == COMPRESS_ADDR);
			valid_blocks = 0;
		}

J
Jaegeuk Kim 已提交
574 575 576
		if (blkaddr == NULL_ADDR)
			continue;

J
Jaegeuk Kim 已提交
577
		dn->data_blkaddr = NULL_ADDR;
C
Chao Yu 已提交
578
		f2fs_set_data_blkaddr(dn);
579

C
Chao Yu 已提交
580 581
		if (__is_valid_data_blkaddr(blkaddr)) {
			if (!f2fs_is_valid_blkaddr(sbi, blkaddr,
C
Chao Yu 已提交
582
					DATA_GENERIC_ENHANCE))
C
Chao Yu 已提交
583 584 585 586
				continue;
			if (compressed_cluster)
				valid_blocks++;
		}
587

588
		if (dn->ofs_in_node == 0 && IS_INODE(dn->node_page))
589
			clear_inode_flag(dn->inode, FI_FIRST_BLOCK_WRITTEN);
C
Chao Yu 已提交
590 591

		f2fs_invalidate_blocks(sbi, blkaddr);
592 593 594

		if (!released || blkaddr != COMPRESS_ADDR)
			nr_free++;
J
Jaegeuk Kim 已提交
595
	}
C
Chao Yu 已提交
596

C
Chao Yu 已提交
597 598 599
	if (compressed_cluster)
		f2fs_i_compr_blocks_update(dn->inode, valid_blocks, false);

J
Jaegeuk Kim 已提交
600
	if (nr_free) {
C
Chao Yu 已提交
601 602 603 604 605
		pgoff_t fofs;
		/*
		 * once we invalidate valid blkaddr in range [ofs, ofs + count],
		 * we will invalidate all blkaddr in the whole range.
		 */
C
Chao Yu 已提交
606
		fofs = f2fs_start_bidx_of_node(ofs_of_node(dn->node_page),
607
							dn->inode) + ofs;
C
Chao Yu 已提交
608
		f2fs_update_extent_cache_range(dn, fofs, 0, len);
609
		dec_valid_block_count(sbi, dn->inode, nr_free);
J
Jaegeuk Kim 已提交
610 611
	}
	dn->ofs_in_node = ofs;
612

613
	f2fs_update_time(sbi, REQ_TIME);
614 615
	trace_f2fs_truncate_data_blocks_range(dn->inode, dn->nid,
					 dn->ofs_in_node, nr_free);
J
Jaegeuk Kim 已提交
616 617
}

C
Chao Yu 已提交
618
void f2fs_truncate_data_blocks(struct dnode_of_data *dn)
J
Jaegeuk Kim 已提交
619
{
620
	f2fs_truncate_data_blocks_range(dn, ADDRS_PER_BLOCK(dn->inode));
J
Jaegeuk Kim 已提交
621 622
}

623
static int truncate_partial_data_page(struct inode *inode, u64 from,
624
								bool cache_only)
J
Jaegeuk Kim 已提交
625
{
626
	loff_t offset = from & (PAGE_SIZE - 1);
627
	pgoff_t index = from >> PAGE_SHIFT;
628
	struct address_space *mapping = inode->i_mapping;
J
Jaegeuk Kim 已提交
629 630
	struct page *page;

631
	if (!offset && !cache_only)
632
		return 0;
J
Jaegeuk Kim 已提交
633

634
	if (cache_only) {
635
		page = find_lock_page(mapping, index);
636 637 638
		if (page && PageUptodate(page))
			goto truncate_out;
		f2fs_put_page(page, 1);
639
		return 0;
640
	}
J
Jaegeuk Kim 已提交
641

C
Chao Yu 已提交
642
	page = f2fs_get_lock_data_page(inode, index, true);
643
	if (IS_ERR(page))
644
		return PTR_ERR(page) == -ENOENT ? 0 : PTR_ERR(page);
645
truncate_out:
646
	f2fs_wait_on_page_writeback(page, DATA, true, true);
647
	zero_user(page, offset, PAGE_SIZE - offset);
648 649

	/* An encrypted inode should have a key and truncate the last page. */
650
	f2fs_bug_on(F2FS_I_SB(inode), cache_only && IS_ENCRYPTED(inode));
651
	if (!cache_only)
652
		set_page_dirty(page);
J
Jaegeuk Kim 已提交
653
	f2fs_put_page(page, 1);
654
	return 0;
J
Jaegeuk Kim 已提交
655 656
}

657
/*
 * Free all blocks of @inode at or beyond byte offset @from.
 *
 * @lock: when true, the work is bracketed by f2fs_lock_op()/f2fs_unlock_op().
 *
 * Inline-data inodes are truncated in place.  Otherwise the addresses left
 * in the dnode that covers the first freed block are truncated, followed by
 * the remaining node blocks through f2fs_truncate_inode_blocks().  If no
 * error occurred, the partial page at @from is zeroed last.  Returns 0 or a
 * negative errno.
 */
int f2fs_do_truncate_blocks(struct inode *inode, u64 from, bool lock)
{
	struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
	struct dnode_of_data dn;
	pgoff_t free_from;
	int count = 0, err = 0;
	struct page *ipage;
	bool truncate_page = false;

	trace_f2fs_truncate_blocks_enter(inode, from);

	free_from = (pgoff_t)F2FS_BLK_ALIGN(from);

	/* nothing to free past the maximum file size; only zero the page */
	if (free_from >= sbi->max_file_blocks)
		goto free_partial;

	if (lock)
		f2fs_lock_op(sbi);

	ipage = f2fs_get_node_page(sbi, inode->i_ino);
	if (IS_ERR(ipage)) {
		err = PTR_ERR(ipage);
		goto out;
	}

	if (f2fs_has_inline_data(inode)) {
		f2fs_truncate_inline_inode(inode, ipage, from);
		f2fs_put_page(ipage, 1);
		truncate_page = true;
		goto out;
	}

	set_new_dnode(&dn, inode, ipage, NULL, 0);
	err = f2fs_get_dnode_of_data(&dn, free_from, LOOKUP_NODE_RA);
	if (err) {
		if (err == -ENOENT)
			goto free_next;
		goto out;
	}

	count = ADDRS_PER_PAGE(dn.node_page, inode);

	count -= dn.ofs_in_node;
	f2fs_bug_on(sbi, count < 0);

	if (dn.ofs_in_node || IS_INODE(dn.node_page)) {
		f2fs_truncate_data_blocks_range(&dn, count);
		free_from += count;
	}

	f2fs_put_dnode(&dn);
free_next:
	err = f2fs_truncate_inode_blocks(inode, free_from);
out:
	if (lock)
		f2fs_unlock_op(sbi);
free_partial:
	/* lastly zero out the first data page */
	if (!err)
		err = truncate_partial_data_page(inode, from, truncate_page);

	trace_f2fs_truncate_blocks_exit(inode, err);
	return err;
}

C
Chao Yu 已提交
722 723 724
/*
 * Truncate @inode to byte offset @from.
 *
 * With CONFIG_F2FS_FS_COMPRESSION, a compressed file is first truncated at
 * @from rounded up to a cluster boundary; if that differs from @from, the
 * partial cluster is then handled by f2fs_truncate_partial_cluster().
 * Returns 0 or the first error encountered.
 */
int f2fs_truncate_blocks(struct inode *inode, u64 from, bool lock)
{
	u64 free_from = from;
	int err;

#ifdef CONFIG_F2FS_FS_COMPRESSION
	/*
	 * for compressed file, only support cluster size
	 * aligned truncation.
	 */
	if (f2fs_compressed_file(inode))
		free_from = round_up(from,
				F2FS_I(inode)->i_cluster_size << PAGE_SHIFT);
#endif

	err = f2fs_do_truncate_blocks(inode, free_from, lock);
	if (err)
		return err;

#ifdef CONFIG_F2FS_FS_COMPRESSION
	if (from != free_from) {
		err = f2fs_truncate_partial_cluster(inode, from, lock);
		if (err)
			return err;
	}
#endif

	return 0;
}

752
int f2fs_truncate(struct inode *inode)
J
Jaegeuk Kim 已提交
753
{
754 755
	int err;

756 757 758
	if (unlikely(f2fs_cp_error(F2FS_I_SB(inode))))
		return -EIO;

J
Jaegeuk Kim 已提交
759 760
	if (!(S_ISREG(inode->i_mode) || S_ISDIR(inode->i_mode) ||
				S_ISLNK(inode->i_mode)))
761
		return 0;
J
Jaegeuk Kim 已提交
762

763 764
	trace_f2fs_truncate(inode);

765
	if (time_to_inject(F2FS_I_SB(inode), FAULT_TRUNCATE)) {
766
		f2fs_show_injection_info(F2FS_I_SB(inode), FAULT_TRUNCATE);
767 768
		return -EIO;
	}
769

770
	/* we should check inline_data size */
771
	if (!f2fs_may_inline_data(inode)) {
772 773 774
		err = f2fs_convert_inline_inode(inode);
		if (err)
			return err;
775 776
	}

777
	err = f2fs_truncate_blocks(inode, i_size_read(inode), true);
778 779 780
	if (err)
		return err;

781
	inode->i_mtime = inode->i_ctime = current_time(inode);
782
	f2fs_mark_inode_dirty_sync(inode, false);
783
	return 0;
J
Jaegeuk Kim 已提交
784 785
}

786
int f2fs_getattr(const struct path *path, struct kstat *stat,
C
Chao Yu 已提交
787
		 u32 request_mask, unsigned int query_flags)
J
Jaegeuk Kim 已提交
788
{
789
	struct inode *inode = d_inode(path->dentry);
C
Chao Yu 已提交
790
	struct f2fs_inode_info *fi = F2FS_I(inode);
C
Chao Yu 已提交
791
	struct f2fs_inode *ri;
C
Chao Yu 已提交
792 793
	unsigned int flags;

C
Chao Yu 已提交
794
	if (f2fs_has_extra_attr(inode) &&
795
			f2fs_sb_has_inode_crtime(F2FS_I_SB(inode)) &&
C
Chao Yu 已提交
796 797 798 799 800 801
			F2FS_FITS_IN_INODE(ri, fi->i_extra_isize, i_crtime)) {
		stat->result_mask |= STATX_BTIME;
		stat->btime.tv_sec = fi->i_crtime.tv_sec;
		stat->btime.tv_nsec = fi->i_crtime.tv_nsec;
	}

802
	flags = fi->i_flags;
C
Chao Yu 已提交
803 804
	if (flags & F2FS_COMPR_FL)
		stat->attributes |= STATX_ATTR_COMPRESSED;
805
	if (flags & F2FS_APPEND_FL)
C
Chao Yu 已提交
806
		stat->attributes |= STATX_ATTR_APPEND;
807
	if (IS_ENCRYPTED(inode))
C
Chao Yu 已提交
808
		stat->attributes |= STATX_ATTR_ENCRYPTED;
809
	if (flags & F2FS_IMMUTABLE_FL)
C
Chao Yu 已提交
810
		stat->attributes |= STATX_ATTR_IMMUTABLE;
811
	if (flags & F2FS_NODUMP_FL)
C
Chao Yu 已提交
812
		stat->attributes |= STATX_ATTR_NODUMP;
E
Eric Biggers 已提交
813 814
	if (IS_VERITY(inode))
		stat->attributes |= STATX_ATTR_VERITY;
C
Chao Yu 已提交
815

C
Chao Yu 已提交
816 817
	stat->attributes_mask |= (STATX_ATTR_COMPRESSED |
				  STATX_ATTR_APPEND |
C
Chao Yu 已提交
818 819
				  STATX_ATTR_ENCRYPTED |
				  STATX_ATTR_IMMUTABLE |
E
Eric Biggers 已提交
820 821
				  STATX_ATTR_NODUMP |
				  STATX_ATTR_VERITY);
C
Chao Yu 已提交
822

J
Jaegeuk Kim 已提交
823
	generic_fillattr(inode, stat);
824 825 826 827 828 829

	/* we need to show initial sectors used for inline_data/dentries */
	if ((S_ISREG(inode->i_mode) && f2fs_has_inline_data(inode)) ||
					f2fs_has_inline_dentry(inode))
		stat->blocks += (stat->size + 511) >> 9;

J
Jaegeuk Kim 已提交
830 831 832 833 834 835 836 837 838 839 840 841
	return 0;
}

#ifdef CONFIG_F2FS_FS_POSIX_ACL
/*
 * Copy the attributes selected by attr->ia_valid into @inode.
 *
 * A new mode is not written to i_mode directly but handed to
 * set_acl_inode(); S_ISGID is dropped from it when the caller is neither in
 * the inode's group nor has CAP_FSETID.  Without POSIX ACL support the
 * generic setattr_copy() is used instead.
 */
static void __setattr_copy(struct inode *inode, const struct iattr *attr)
{
	unsigned int ia_valid = attr->ia_valid;

	if (ia_valid & ATTR_UID)
		inode->i_uid = attr->ia_uid;
	if (ia_valid & ATTR_GID)
		inode->i_gid = attr->ia_gid;
	if (ia_valid & ATTR_ATIME)
		inode->i_atime = attr->ia_atime;
	if (ia_valid & ATTR_MTIME)
		inode->i_mtime = attr->ia_mtime;
	if (ia_valid & ATTR_CTIME)
		inode->i_ctime = attr->ia_ctime;
	if (ia_valid & ATTR_MODE) {
		umode_t mode = attr->ia_mode;

		if (!in_group_p(inode->i_gid) && !capable(CAP_FSETID))
			mode &= ~S_ISGID;
		set_acl_inode(inode, mode);
	}
}
#else
#define __setattr_copy setattr_copy
#endif

int f2fs_setattr(struct dentry *dentry, struct iattr *attr)
{
862
	struct inode *inode = d_inode(dentry);
J
Jaegeuk Kim 已提交
863 864
	int err;

865 866 867
	if (unlikely(f2fs_cp_error(F2FS_I_SB(inode))))
		return -EIO;

C
Chao Yu 已提交
868 869 870 871
	if ((attr->ia_valid & ATTR_SIZE) &&
		!f2fs_is_compress_backend_ready(inode))
		return -EOPNOTSUPP;

872
	err = setattr_prepare(dentry, attr);
J
Jaegeuk Kim 已提交
873 874 875
	if (err)
		return err;

876 877 878 879
	err = fscrypt_prepare_setattr(dentry, attr);
	if (err)
		return err;

E
Eric Biggers 已提交
880 881 882 883
	err = fsverity_prepare_setattr(dentry, attr);
	if (err)
		return err;

C
Chao Yu 已提交
884 885 886 887 888 889 890 891 892
	if (is_quota_modification(inode, attr)) {
		err = dquot_initialize(inode);
		if (err)
			return err;
	}
	if ((attr->ia_valid & ATTR_UID &&
		!uid_eq(attr->ia_uid, inode->i_uid)) ||
		(attr->ia_valid & ATTR_GID &&
		!gid_eq(attr->ia_gid, inode->i_gid))) {
893
		f2fs_lock_op(F2FS_I_SB(inode));
C
Chao Yu 已提交
894
		err = dquot_transfer(inode, attr);
895 896 897 898
		if (err) {
			set_sbi_flag(F2FS_I_SB(inode),
					SBI_QUOTA_NEED_REPAIR);
			f2fs_unlock_op(F2FS_I_SB(inode));
C
Chao Yu 已提交
899
			return err;
900 901 902 903 904 905 906 907 908 909 910
		}
		/*
		 * update uid/gid under lock_op(), so that dquot and inode can
		 * be updated atomically.
		 */
		if (attr->ia_valid & ATTR_UID)
			inode->i_uid = attr->ia_uid;
		if (attr->ia_valid & ATTR_GID)
			inode->i_gid = attr->ia_gid;
		f2fs_mark_inode_dirty_sync(inode, true);
		f2fs_unlock_op(F2FS_I_SB(inode));
C
Chao Yu 已提交
911 912
	}

913
	if (attr->ia_valid & ATTR_SIZE) {
914 915 916 917 918 919 920 921 922 923 924
		loff_t old_size = i_size_read(inode);

		if (attr->ia_size > MAX_INLINE_DATA(inode)) {
			/*
			 * should convert inline inode before i_size_write to
			 * keep smaller than inline_data size with inline flag.
			 */
			err = f2fs_convert_inline_inode(inode);
			if (err)
				return err;
		}
925 926

		down_write(&F2FS_I(inode)->i_gc_rwsem[WRITE]);
927
		down_write(&F2FS_I(inode)->i_mmap_sem);
928 929 930

		truncate_setsize(inode, attr->ia_size);

931
		if (attr->ia_size <= old_size)
932
			err = f2fs_truncate(inode);
933 934 935 936 937
		/*
		 * do not trim all blocks after i_size if target size is
		 * larger than i_size.
		 */
		up_write(&F2FS_I(inode)->i_mmap_sem);
938
		up_write(&F2FS_I(inode)->i_gc_rwsem[WRITE]);
939 940
		if (err)
			return err;
941

942
		spin_lock(&F2FS_I(inode)->i_size_lock);
943
		inode->i_mtime = inode->i_ctime = current_time(inode);
944
		F2FS_I(inode)->last_disk_size = i_size_read(inode);
945
		spin_unlock(&F2FS_I(inode)->i_size_lock);
J
Jaegeuk Kim 已提交
946 947 948 949 950
	}

	__setattr_copy(inode, attr);

	if (attr->ia_valid & ATTR_MODE) {
C
Chao Yu 已提交
951
		err = posix_acl_chmod(inode, f2fs_get_inode_mode(inode));
952 953 954
		if (err || is_inode_flag_set(inode, FI_ACL_MODE)) {
			inode->i_mode = F2FS_I(inode)->i_acl_mode;
			clear_inode_flag(inode, FI_ACL_MODE);
J
Jaegeuk Kim 已提交
955 956 957
		}
	}

958
	/* file size may changed here */
959
	f2fs_mark_inode_dirty_sync(inode, true);
960 961 962 963

	/* inode change will produce dirty node pages flushed by checkpoint */
	f2fs_balance_fs(F2FS_I_SB(inode), true);

J
Jaegeuk Kim 已提交
964 965 966 967 968 969 970
	return err;
}

const struct inode_operations f2fs_file_inode_operations = {
	.getattr	= f2fs_getattr,
	.setattr	= f2fs_setattr,
	.get_acl	= f2fs_get_acl,
971
	.set_acl	= f2fs_set_acl,
J
Jaegeuk Kim 已提交
972
	.listxattr	= f2fs_listxattr,
J
Jaegeuk Kim 已提交
973
	.fiemap		= f2fs_fiemap,
J
Jaegeuk Kim 已提交
974 975
};

C
Chao Yu 已提交
976
/*
 * Zero @len bytes at in-page offset @start of the data page at @index.
 *
 * Does nothing when @len is 0.  The page is obtained with
 * f2fs_get_new_data_page() under f2fs_lock_op(), zeroed after any pending
 * writeback has finished, marked dirty and released.  Returns 0 on success
 * or the error from f2fs_get_new_data_page().
 */
static int fill_zero(struct inode *inode, pgoff_t index,
					loff_t start, loff_t len)
{
	struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
	struct page *page;

	if (!len)
		return 0;

	f2fs_balance_fs(sbi, true);

	f2fs_lock_op(sbi);
	page = f2fs_get_new_data_page(inode, NULL, index, false);
	f2fs_unlock_op(sbi);

	if (IS_ERR(page))
		return PTR_ERR(page);

	f2fs_wait_on_page_writeback(page, DATA, true, true);
	zero_user(page, start, len);
	set_page_dirty(page);
	f2fs_put_page(page, 1);
	return 0;
}

C
Chao Yu 已提交
1001
/*
 * Truncate the data block addresses backing file pages [pg_start, pg_end).
 *
 * The range is walked one dnode at a time.  When the dnode lookup reports
 * -ENOENT the walk jumps to the offset returned by
 * f2fs_get_next_page_offset(); any other lookup error is returned as is.
 *
 * Returns 0 once the whole range has been processed.
 */
int f2fs_truncate_hole(struct inode *inode, pgoff_t pg_start, pgoff_t pg_end)
{
	pgoff_t cur = pg_start;

	while (cur < pg_end) {
		struct dnode_of_data dn;
		pgoff_t nr_addrs, nr;
		int err;

		set_new_dnode(&dn, inode, NULL, NULL, 0);
		err = f2fs_get_dnode_of_data(&dn, cur, LOOKUP_NODE);
		if (err == -ENOENT) {
			/* no node here: skip ahead */
			cur = f2fs_get_next_page_offset(&dn, cur);
			continue;
		}
		if (err)
			return err;

		/* clamp to what is left in this node and in the request */
		nr_addrs = ADDRS_PER_PAGE(dn.node_page, inode);
		nr = min(nr_addrs - dn.ofs_in_node, pg_end - cur);

		f2fs_bug_on(F2FS_I_SB(inode), nr == 0 || nr > nr_addrs);

		f2fs_truncate_data_blocks_range(&dn, nr);
		f2fs_put_dnode(&dn);

		cur += nr;
	}
	return 0;
}

C
Chao Yu 已提交
1033
/*
 * Punch a hole covering bytes [offset, offset + len) of @inode.
 *
 * Partially covered pages at either end are zeroed with fill_zero(); the
 * fully covered pages in between are dropped from the page cache and their
 * block addresses truncated with f2fs_truncate_hole().
 *
 * Returns 0 on success or the first error encountered.
 */
static int punch_hole(struct inode *inode, loff_t offset, loff_t len)
{
	struct f2fs_inode_info *fi = F2FS_I(inode);
	struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
	pgoff_t first_pg, last_pg;
	loff_t head_off, tail_off;
	int ret;

	ret = f2fs_convert_inline_inode(inode);
	if (ret)
		return ret;

	first_pg = ((unsigned long long) offset) >> PAGE_SHIFT;
	last_pg = ((unsigned long long) offset + len) >> PAGE_SHIFT;

	head_off = offset & (PAGE_SIZE - 1);
	tail_off = (offset + len) & (PAGE_SIZE - 1);

	/* the whole hole sits inside a single page */
	if (first_pg == last_pg)
		return fill_zero(inode, first_pg, head_off,
						tail_off - head_off);

	/* partial leading page: zero its tail, then step past it */
	if (head_off) {
		ret = fill_zero(inode, first_pg++, head_off,
						PAGE_SIZE - head_off);
		if (ret)
			return ret;
	}

	/* partial trailing page: zero its head */
	if (tail_off) {
		ret = fill_zero(inode, last_pg, 0, tail_off);
		if (ret)
			return ret;
	}

	/* no fully covered page left */
	if (first_pg >= last_pg)
		return 0;

	f2fs_balance_fs(sbi, true);

	down_write(&fi->i_gc_rwsem[WRITE]);
	down_write(&fi->i_mmap_sem);

	truncate_inode_pages_range(inode->i_mapping,
			(loff_t)first_pg << PAGE_SHIFT,
			((loff_t)last_pg << PAGE_SHIFT) - 1);

	f2fs_lock_op(sbi);
	ret = f2fs_truncate_hole(inode, first_pg, last_pg);
	f2fs_unlock_op(sbi);

	up_write(&fi->i_mmap_sem);
	up_write(&fi->i_gc_rwsem[WRITE]);

	return ret;
}

1095 1096
/*
 * Collect the block addresses of @len pages of @inode starting at page
 * @off into @blkaddr[], and flag in @do_replace[] the entries whose block
 * is handed over to the caller instead of being copied.
 *
 * For every address that f2fs_is_checkpointed_data() rejects, the slot in
 * the node is overwritten with NULL_ADDR and the matching @do_replace[]
 * entry is set to 1.  That case is refused with -EOPNOTSUPP when
 * f2fs_lfs_mode() is true.  Ranges whose dnode lookup returns -ENOENT are
 * skipped, leaving the corresponding array entries untouched.
 *
 * Returns 0 on success, -EFSCORRUPTED for an address failing the validity
 * check, or a lookup error.
 */
static int __read_out_blkaddrs(struct inode *inode, block_t *blkaddr,
				int *do_replace, pgoff_t off, pgoff_t len)
{
	struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
	struct dnode_of_data dn;
	int ret, done, i;

	do {
		set_new_dnode(&dn, inode, NULL, NULL, 0);
		ret = f2fs_get_dnode_of_data(&dn, off, LOOKUP_NODE_RA);

		if (ret == -ENOENT) {
			if (dn.max_level == 0)
				return -ENOENT;

			/* hole: step over the rest of this node block */
			done = min((pgoff_t)ADDRS_PER_BLOCK(inode) -
						dn.ofs_in_node, len);
			blkaddr += done;
			do_replace += done;
		} else if (ret) {
			return ret;
		} else {
			done = min((pgoff_t)ADDRS_PER_PAGE(dn.node_page,
						inode) - dn.ofs_in_node, len);

			for (i = 0; i < done; i++, blkaddr++, do_replace++,
							dn.ofs_in_node++) {
				block_t addr = f2fs_data_blkaddr(&dn);

				*blkaddr = addr;

				if (__is_valid_data_blkaddr(addr) &&
					!f2fs_is_valid_blkaddr(sbi, addr,
						DATA_GENERIC_ENHANCE)) {
					f2fs_put_dnode(&dn);
					return -EFSCORRUPTED;
				}

				if (f2fs_is_checkpointed_data(sbi, addr))
					continue;

				if (f2fs_lfs_mode(sbi)) {
					f2fs_put_dnode(&dn);
					return -EOPNOTSUPP;
				}

				/* do not invalidate this block address */
				f2fs_update_data_blkaddr(&dn, NULL_ADDR);
				*do_replace = 1;
			}
			f2fs_put_dnode(&dn);
		}

		len -= done;
		off += done;
	} while (len);

	return 0;
}
C
Chao Yu 已提交
1149

1150 1151 1152 1153 1154 1155
/*
 * Undo the detaching done by __read_out_blkaddrs() for the @len pages
 * starting at page @off.
 *
 * Every entry flagged in @do_replace[] gets its saved address from
 * @blkaddr[] written back into the node.  If the dnode cannot be looked up
 * any more, the block is given up instead: the valid block count is
 * decremented and the address invalidated.
 *
 * Always returns 0.
 */
static int __roll_back_blkaddrs(struct inode *inode, block_t *blkaddr,
				int *do_replace, pgoff_t off, int len)
{
	struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
	int idx;

	for (idx = 0; idx < len; idx++) {
		struct dnode_of_data dn;

		if (!do_replace[idx])
			continue;

		set_new_dnode(&dn, inode, NULL, NULL, 0);
		if (f2fs_get_dnode_of_data(&dn, off + idx, LOOKUP_NODE_RA)) {
			/* cannot restore the mapping: release the block */
			dec_valid_block_count(sbi, inode, 1);
			f2fs_invalidate_blocks(sbi, blkaddr[idx]);
		} else {
			f2fs_update_data_blkaddr(&dn, blkaddr[idx]);
		}
		f2fs_put_dnode(&dn);
	}
	return 0;
}

/*
 * Move @len pages of @src_inode starting at page @src to page @dst of
 * @dst_inode, using the addresses and flags gathered by
 * __read_out_blkaddrs().
 *
 * For each index i:
 *  - blkaddr[i] == NULL_ADDR and !@full: nothing to do, entry is skipped;
 *  - do_replace[i] set, or blkaddr[i] == NULL_ADDR: the destination slot is
 *    truncated and, when do_replace[i] is set, the source block is attached
 *    to it via f2fs_replace_block() (block counts of both inodes adjusted);
 *  - otherwise the page content is copied into a new destination page and
 *    the source page is truncated with f2fs_truncate_hole().
 *
 * The destination i_size is grown as entries of the second kind are
 * processed.
 *
 * Returns 0 on success or the first error encountered.
 */
static int __clone_blkaddrs(struct inode *src_inode, struct inode *dst_inode,
			block_t *blkaddr, int *do_replace,
			pgoff_t src, pgoff_t dst, pgoff_t len, bool full)
{
	struct f2fs_sb_info *sbi = F2FS_I_SB(src_inode);
	pgoff_t i = 0;
	int ret;

	while (i < len) {
		if (blkaddr[i] == NULL_ADDR && !full) {
			i++;
			continue;
		}

		if (do_replace[i] || blkaddr[i] == NULL_ADDR) {
			struct dnode_of_data dn;
			struct node_info ni;
			/*
			 * Byte offset compared against i_size: must be loff_t.
			 * A size_t would truncate it where size_t is 32 bits.
			 */
			loff_t new_size;
			pgoff_t ilen;

			set_new_dnode(&dn, dst_inode, NULL, NULL, 0);
			ret = f2fs_get_dnode_of_data(&dn, dst + i, ALLOC_NODE);
			if (ret)
				return ret;

			ret = f2fs_get_node_info(sbi, dn.nid, &ni);
			if (ret) {
				f2fs_put_dnode(&dn);
				return ret;
			}

			/* entries left in this dnode, capped by the request */
			ilen = min((pgoff_t)
				ADDRS_PER_PAGE(dn.node_page, dst_inode) -
						dn.ofs_in_node, len - i);
			do {
				dn.data_blkaddr = f2fs_data_blkaddr(&dn);
				f2fs_truncate_data_blocks_range(&dn, 1);

				if (do_replace[i]) {
					f2fs_i_blocks_write(src_inode,
							1, false, false);
					f2fs_i_blocks_write(dst_inode,
							1, true, false);
					f2fs_replace_block(sbi, &dn, dn.data_blkaddr,
					blkaddr[i], ni.version, true, false);

					do_replace[i] = 0;
				}
				dn.ofs_in_node++;
				i++;
				new_size = (loff_t)(dst + i) << PAGE_SHIFT;
				if (dst_inode->i_size < new_size)
					f2fs_i_size_write(dst_inode, new_size);
				/*
				 * --ilen is tested first, so the arrays are
				 * not read at an index past the request.
				 */
			} while (--ilen && (do_replace[i] || blkaddr[i] == NULL_ADDR));

			f2fs_put_dnode(&dn);
		} else {
			struct page *psrc, *pdst;

			psrc = f2fs_get_lock_data_page(src_inode,
							src + i, true);
			if (IS_ERR(psrc))
				return PTR_ERR(psrc);
			pdst = f2fs_get_new_data_page(dst_inode, NULL, dst + i,
								true);
			if (IS_ERR(pdst)) {
				f2fs_put_page(psrc, 1);
				return PTR_ERR(pdst);
			}
			f2fs_copy_page(psrc, pdst);
			set_page_dirty(pdst);
			f2fs_put_page(pdst, 1);
			f2fs_put_page(psrc, 1);

			ret = f2fs_truncate_hole(src_inode,
						src + i, src + i + 1);
			if (ret)
				return ret;
			i++;
		}
	}
	return 0;
}
C
Chao Yu 已提交
1257

1258 1259
/*
 * Move @len pages from page @src of @src_inode to page @dst of @dst_inode.
 *
 * The work is done in chunks of at most 4 * ADDRS_PER_BLOCK(src_inode)
 * pages.  For each chunk two zeroed scratch arrays are allocated, the
 * source addresses are read out, then cloned into the destination.  If
 * either step fails, __roll_back_blkaddrs() is run on the chunk and the
 * error is returned.
 *
 * Returns 0 on success, -ENOMEM if a scratch array cannot be allocated, or
 * the error from the failing step.
 */
static int __exchange_data_block(struct inode *src_inode,
			struct inode *dst_inode, pgoff_t src, pgoff_t dst,
			pgoff_t len, bool full)
{
	struct f2fs_sb_info *sbi = F2FS_I_SB(src_inode);

	while (len) {
		pgoff_t chunk = min((pgoff_t)4 * ADDRS_PER_BLOCK(src_inode),
									len);
		block_t *addrs;
		int *replace;
		int ret;

		addrs = f2fs_kvzalloc(sbi, array_size(chunk, sizeof(block_t)),
					GFP_NOFS);
		if (!addrs)
			return -ENOMEM;

		replace = f2fs_kvzalloc(sbi, array_size(chunk, sizeof(int)),
					GFP_NOFS);
		if (!replace) {
			kvfree(addrs);
			return -ENOMEM;
		}

		ret = __read_out_blkaddrs(src_inode, addrs, replace,
								src, chunk);
		if (!ret)
			ret = __clone_blkaddrs(src_inode, dst_inode, addrs,
					replace, src, dst, chunk, full);
		if (ret)
			__roll_back_blkaddrs(src_inode, addrs, replace,
								src, chunk);

		kvfree(addrs);
		kvfree(replace);

		if (ret)
			return ret;

		src += chunk;
		dst += chunk;
		len -= chunk;
	}
	return 0;
}
C
Chao Yu 已提交
1309

1310
/*
 * Shift the pages located after the collapsed range down to @offset.
 *
 * Every page from (offset + len) up to the last page of the file is moved
 * to start at page (offset >> PAGE_SHIFT) through __exchange_data_block().
 * The extent tree is dropped and the page cache beyond @offset truncated
 * before the move.
 *
 * Returns the result of __exchange_data_block().
 */
static int f2fs_do_collapse(struct inode *inode, loff_t offset, loff_t len)
{
	struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
	struct f2fs_inode_info *fi = F2FS_I(inode);
	pgoff_t total_pgs = DIV_ROUND_UP(i_size_read(inode), PAGE_SIZE);
	pgoff_t dst_pg = offset >> PAGE_SHIFT;
	pgoff_t src_pg = (offset + len) >> PAGE_SHIFT;
	int ret;

	f2fs_balance_fs(sbi, true);

	/* avoid gc operation during block exchange */
	down_write(&fi->i_gc_rwsem[WRITE]);
	down_write(&fi->i_mmap_sem);

	f2fs_lock_op(sbi);
	f2fs_drop_extent_tree(inode);
	truncate_pagecache(inode, offset);
	ret = __exchange_data_block(inode, inode, src_pg, dst_pg,
					total_pgs - src_pg, true);
	f2fs_unlock_op(sbi);

	up_write(&fi->i_mmap_sem);
	up_write(&fi->i_gc_rwsem[WRITE]);

	return ret;
}

/*
 * FALLOC_FL_COLLAPSE_RANGE: remove bytes [offset, offset + len) from the
 * file and shrink it by @len.
 *
 * Returns -EINVAL when the range reaches or passes the end of file, or when
 * @offset or @len is not a multiple of F2FS_BLKSIZE; otherwise 0 or the
 * first error from the steps below.
 */
static int f2fs_collapse_range(struct inode *inode, loff_t offset, loff_t len)
{
	struct address_space *mapping = inode->i_mapping;
	struct f2fs_inode_info *fi = F2FS_I(inode);
	loff_t shrunk_size;
	int ret;

	if (offset + len >= i_size_read(inode))
		return -EINVAL;

	/* collapse range should be aligned to block size of f2fs. */
	if ((offset | len) & (F2FS_BLKSIZE - 1))
		return -EINVAL;

	ret = f2fs_convert_inline_inode(inode);
	if (ret)
		return ret;

	/* write out all dirty pages from offset */
	ret = filemap_write_and_wait_range(mapping, offset, LLONG_MAX);
	if (ret)
		return ret;

	ret = f2fs_do_collapse(inode, offset, len);
	if (ret)
		return ret;

	down_write(&fi->i_mmap_sem);

	/* write out all moved pages, if possible (result is ignored) */
	filemap_write_and_wait_range(mapping, offset, LLONG_MAX);
	truncate_pagecache(inode, offset);

	shrunk_size = i_size_read(inode) - len;
	ret = f2fs_truncate_blocks(inode, shrunk_size, true);

	up_write(&fi->i_mmap_sem);

	if (ret)
		return ret;

	f2fs_i_size_write(inode, shrunk_size);
	return 0;
}

1373 1374 1375 1376 1377 1378 1379 1380 1381 1382
/*
 * Turn the block addresses for pages [start, end) inside the dnode @dn
 * into NEW_ADDR.
 *
 * The first pass counts the NULL_ADDR slots and asks
 * f2fs_reserve_new_blocks() for that many blocks.  The second pass
 * invalidates every existing on-disk block and rewrites its slot as
 * NEW_ADDR.  It stops with -ENOSPC at the first slot that is still
 * NULL_ADDR.  The extent cache is then updated for the pages processed.
 *
 * @dn->ofs_in_node must address @start on entry; it is advanced as the
 * slots are walked.
 *
 * Returns 0, -ENOSPC, or the error from the reservation.
 */
static int f2fs_do_zero_range(struct dnode_of_data *dn, pgoff_t start,
								pgoff_t end)
{
	struct f2fs_sb_info *sbi = F2FS_I_SB(dn->inode);
	const unsigned int first_ofs = dn->ofs_in_node;
	blkcnt_t nr_missing = 0;
	pgoff_t pos;
	int ret;

	/* pass 1: how many slots have no block yet? */
	for (pos = start; pos < end; pos++) {
		if (f2fs_data_blkaddr(dn) == NULL_ADDR)
			nr_missing++;
		dn->ofs_in_node++;
	}

	dn->ofs_in_node = first_ofs;
	ret = f2fs_reserve_new_blocks(dn, nr_missing);
	if (ret)
		return ret;

	/* pass 2: rewind and convert each slot */
	dn->ofs_in_node = first_ofs;
	for (pos = start; pos < end; pos++, dn->ofs_in_node++) {
		dn->data_blkaddr = f2fs_data_blkaddr(dn);

		/*
		 * f2fs_reserve_new_blocks will not guarantee entire block
		 * allocation.
		 */
		if (dn->data_blkaddr == NULL_ADDR) {
			ret = -ENOSPC;
			break;
		}

		if (dn->data_blkaddr == NEW_ADDR)
			continue;

		f2fs_invalidate_blocks(sbi, dn->data_blkaddr);
		dn->data_blkaddr = NEW_ADDR;
		f2fs_set_data_blkaddr(dn);
	}

	f2fs_update_extent_cache_range(dn, start, 0, pos - start);

	return ret;
}

C
Chao Yu 已提交
1415 1416 1417 1418 1419 1420 1421 1422 1423 1424 1425 1426 1427 1428
/*
 * FALLOC_FL_ZERO_RANGE: make bytes [offset, offset + len) read back as
 * zero.
 *
 * Partially covered pages at either end are cleared with fill_zero().
 * Fully covered pages are handled one dnode at a time by
 * f2fs_do_zero_range().  The furthest position reached is tracked so that,
 * even on a late failure, i_size is extended over what was processed (or
 * the keep-size mark is set when FALLOC_FL_KEEP_SIZE is in @mode).
 *
 * Returns 0 on success or the first error encountered.
 */
static int f2fs_zero_range(struct inode *inode, loff_t offset, loff_t len,
								int mode)
{
	struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
	struct f2fs_inode_info *fi = F2FS_I(inode);
	struct address_space *mapping = inode->i_mapping;
	pgoff_t cur, first_pg, last_pg;
	loff_t reached = i_size_read(inode);
	loff_t head_off, tail_off;
	int ret = 0;

	ret = inode_newsize_ok(inode, (len + offset));
	if (ret)
		return ret;

	ret = f2fs_convert_inline_inode(inode);
	if (ret)
		return ret;

	ret = filemap_write_and_wait_range(mapping, offset, offset + len - 1);
	if (ret)
		return ret;

	first_pg = ((unsigned long long) offset) >> PAGE_SHIFT;
	last_pg = ((unsigned long long) offset + len) >> PAGE_SHIFT;

	head_off = offset & (PAGE_SIZE - 1);
	tail_off = (offset + len) & (PAGE_SIZE - 1);

	/* the whole range sits inside a single page */
	if (first_pg == last_pg) {
		ret = fill_zero(inode, first_pg, head_off,
						tail_off - head_off);
		if (ret)
			return ret;

		reached = max_t(loff_t, reached, offset + len);
		goto out;
	}

	/* partial leading page */
	if (head_off) {
		ret = fill_zero(inode, first_pg++, head_off,
						PAGE_SIZE - head_off);
		if (ret)
			return ret;

		reached = max_t(loff_t, reached,
					(loff_t)first_pg << PAGE_SHIFT);
	}

	/* fully covered pages, one dnode per iteration */
	cur = first_pg;
	while (cur < last_pg) {
		struct dnode_of_data dn;
		unsigned int end_offset;
		pgoff_t stop;

		down_write(&fi->i_gc_rwsem[WRITE]);
		down_write(&fi->i_mmap_sem);

		truncate_pagecache_range(inode,
			(loff_t)cur << PAGE_SHIFT,
			((loff_t)last_pg << PAGE_SHIFT) - 1);

		f2fs_lock_op(sbi);

		set_new_dnode(&dn, inode, NULL, NULL, 0);
		ret = f2fs_get_dnode_of_data(&dn, cur, ALLOC_NODE);
		if (ret) {
			f2fs_unlock_op(sbi);
			up_write(&fi->i_mmap_sem);
			up_write(&fi->i_gc_rwsem[WRITE]);
			goto out;
		}

		end_offset = ADDRS_PER_PAGE(dn.node_page, inode);
		stop = min(last_pg, end_offset - dn.ofs_in_node + cur);

		ret = f2fs_do_zero_range(&dn, cur, stop);
		f2fs_put_dnode(&dn);

		f2fs_unlock_op(sbi);
		up_write(&fi->i_mmap_sem);
		up_write(&fi->i_gc_rwsem[WRITE]);

		f2fs_balance_fs(sbi, dn.node_changed);

		if (ret)
			goto out;

		cur = stop;
		reached = max_t(loff_t, reached, (loff_t)cur << PAGE_SHIFT);
	}

	/* partial trailing page */
	if (tail_off) {
		ret = fill_zero(inode, last_pg, 0, tail_off);
		if (ret)
			goto out;

		reached = max_t(loff_t, reached, offset + len);
	}

out:
	if (reached > i_size_read(inode)) {
		if (mode & FALLOC_FL_KEEP_SIZE)
			file_set_keep_isize(inode);
		else
			f2fs_i_size_write(inode, reached);
	}
	return ret;
}

C
Chao Yu 已提交
1523 1524 1525
/*
 * FALLOC_FL_INSERT_RANGE: open a gap of @len bytes at @offset by shifting
 * everything from @offset onwards up by @len.
 *
 * Pages are moved from the end of the file backwards, at most
 * (len >> PAGE_SHIFT) pages per __exchange_data_block() call.
 *
 * Returns -EINVAL when @offset is at or past end of file, or when @offset
 * or @len is not a multiple of F2FS_BLKSIZE; otherwise 0 or the first
 * error encountered.  i_size grows by @len only on success.
 */
static int f2fs_insert_range(struct inode *inode, loff_t offset, loff_t len)
{
	struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
	struct f2fs_inode_info *fi = F2FS_I(inode);
	struct address_space *mapping = inode->i_mapping;
	pgoff_t first_pg, shift, tail;
	loff_t grown_size;
	int ret = 0;

	grown_size = i_size_read(inode) + len;
	ret = inode_newsize_ok(inode, grown_size);
	if (ret)
		return ret;

	if (offset >= i_size_read(inode))
		return -EINVAL;

	/* insert range should be aligned to block size of f2fs. */
	if ((offset | len) & (F2FS_BLKSIZE - 1))
		return -EINVAL;

	ret = f2fs_convert_inline_inode(inode);
	if (ret)
		return ret;

	f2fs_balance_fs(sbi, true);

	down_write(&fi->i_mmap_sem);
	ret = f2fs_truncate_blocks(inode, i_size_read(inode), true);
	up_write(&fi->i_mmap_sem);
	if (ret)
		return ret;

	/* write out all dirty pages from offset */
	ret = filemap_write_and_wait_range(mapping, offset, LLONG_MAX);
	if (ret)
		return ret;

	first_pg = offset >> PAGE_SHIFT;
	shift = ((offset + len) >> PAGE_SHIFT) - first_pg;
	tail = DIV_ROUND_UP(i_size_read(inode), PAGE_SIZE);

	/* avoid gc operation during block exchange */
	down_write(&fi->i_gc_rwsem[WRITE]);
	down_write(&fi->i_mmap_sem);
	truncate_pagecache(inode, offset);

	/* walk backwards so that source pages are never overwritten */
	while (!ret && tail > first_pg) {
		pgoff_t batch = min_t(pgoff_t, tail - first_pg, shift);

		tail -= batch;

		f2fs_lock_op(sbi);
		f2fs_drop_extent_tree(inode);

		ret = __exchange_data_block(inode, inode, tail,
					tail + shift, batch, false);
		f2fs_unlock_op(sbi);
	}
	up_write(&fi->i_mmap_sem);
	up_write(&fi->i_gc_rwsem[WRITE]);

	/* write out all moved pages, if possible (result is ignored) */
	down_write(&fi->i_mmap_sem);
	filemap_write_and_wait_range(mapping, offset, LLONG_MAX);
	truncate_pagecache(inode, offset);
	up_write(&fi->i_mmap_sem);

	if (ret)
		return ret;

	f2fs_i_size_write(inode, grown_size);
	return 0;
}

J
Jaegeuk Kim 已提交
1596 1597 1598
/*
 * Default fallocate mode: preallocate blocks for bytes
 * [offset, offset + len) of @inode.
 *
 * For a pinned file the request is rounded up to whole segments and mapped
 * one segment at a time into CURSEG_COLD_DATA_PINNED, running f2fs_gc()
 * first whenever has_not_enough_free_secs() says so.  Other files are
 * mapped with a single f2fs_map_blocks() call.
 *
 * @expanded counts the blocks mapped from @pg_start.  On failure the file
 * size is advanced only up to the end of those blocks, and nothing is
 * touched when no block was mapped.  When FALLOC_FL_KEEP_SIZE is set in
 * @mode the keep-size mark is set instead of changing i_size.
 *
 * Returns 0 on success or the first error encountered.
 */
static int expand_inode_data(struct inode *inode, loff_t offset,
					loff_t len, int mode)
{
	struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
	struct f2fs_map_blocks map = { .m_next_pgofs = NULL,
			.m_next_extent = NULL, .m_seg_type = NO_CHECK_TYPE,
			.m_may_create = true };
	pgoff_t pg_start, pg_end;
	loff_t new_size = i_size_read(inode);
	loff_t off_end;
	block_t expanded = 0;
	int err;

	err = inode_newsize_ok(inode, (len + offset));
	if (err)
		return err;

	err = f2fs_convert_inline_inode(inode);
	if (err)
		return err;

	f2fs_balance_fs(sbi, true);

	pg_start = ((unsigned long long)offset) >> PAGE_SHIFT;
	pg_end = ((unsigned long long)offset + len) >> PAGE_SHIFT;
	off_end = (offset + len) & (PAGE_SIZE - 1);

	map.m_lblk = pg_start;
	map.m_len = pg_end - pg_start;
	if (off_end)
		map.m_len++;

	if (!map.m_len)
		return 0;

	if (f2fs_is_pinned_file(inode)) {
		/* request rounded up to whole segments, in blocks */
		block_t sec_len = (map.m_len >> sbi->log_blocks_per_seg) <<
					sbi->log_blocks_per_seg;

		if (map.m_len % sbi->blocks_per_seg)
			sec_len += sbi->blocks_per_seg;

		map.m_len = sbi->blocks_per_seg;
next_alloc:
		if (has_not_enough_free_secs(sbi, 0,
			GET_SEC_FROM_SEG(sbi, overprovision_segments(sbi)))) {
			/*
			 * NOTE(review): no matching up_write() here, so
			 * gc_lock is presumably released inside f2fs_gc();
			 * confirm against its implementation.
			 */
			down_write(&sbi->gc_lock);
			err = f2fs_gc(sbi, true, false, NULL_SEGNO);
			/* -ENODATA and -EAGAIN from GC are tolerated */
			if (err && err != -ENODATA && err != -EAGAIN)
				goto out_err;
		}

		down_write(&sbi->pin_sem);

		f2fs_lock_op(sbi);
		f2fs_allocate_new_segment(sbi, CURSEG_COLD_DATA_PINNED);
		f2fs_unlock_op(sbi);

		map.m_seg_type = CURSEG_COLD_DATA_PINNED;
		err = f2fs_map_blocks(inode, &map, 1, F2FS_GET_BLOCK_PRE_DIO);

		up_write(&sbi->pin_sem);

		expanded += map.m_len;
		sec_len -= map.m_len;
		map.m_lblk += map.m_len;
		if (!err && sec_len)
			goto next_alloc;
	} else {
		err = f2fs_map_blocks(inode, &map, 1, F2FS_GET_BLOCK_PRE_AIO);
		expanded = map.m_len;
	}
out_err:
	if (err) {
		pgoff_t last_off;

		/* nothing was mapped: leave the size alone */
		if (!expanded)
			return err;

		/*
		 * Measure from the original start page.  map.m_lblk has been
		 * advanced on the pinned path, and map.m_len may describe a
		 * segment that was never mapped.
		 */
		last_off = pg_start + expanded - 1;

		/* update new size to the failed position */
		new_size = (last_off == pg_end) ? offset + len :
					(loff_t)(last_off + 1) << PAGE_SHIFT;
	} else {
		new_size = ((loff_t)pg_end << PAGE_SHIFT) + off_end;
	}

	if (new_size > i_size_read(inode)) {
		if (mode & FALLOC_FL_KEEP_SIZE)
			file_set_keep_isize(inode);
		else
			f2fs_i_size_write(inode, new_size);
	}

	return err;
}

/*
 * ->fallocate handler: validate @mode, then dispatch to the matching
 * helper while holding the inode lock.
 *
 * Returns -EIO after a checkpoint error, -ENOSPC when the checkpoint is
 * not ready, -EINVAL for non-regular files, and -EOPNOTSUPP for modes that
 * are unknown, or that are refused for encrypted or compressed files.
 * Otherwise returns the helper's result.  On success mtime/ctime are
 * refreshed and the inode is marked dirty.
 */
static long f2fs_fallocate(struct file *file, int mode,
				loff_t offset, loff_t len)
{
	struct inode *inode = file_inode(file);
	struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
	const int shift_modes = FALLOC_FL_COLLAPSE_RANGE |
				FALLOC_FL_INSERT_RANGE;
	const int rewrite_modes = FALLOC_FL_PUNCH_HOLE |
				FALLOC_FL_ZERO_RANGE | shift_modes;
	long ret = 0;

	if (unlikely(f2fs_cp_error(sbi)))
		return -EIO;
	if (!f2fs_is_checkpoint_ready(sbi))
		return -ENOSPC;
	if (!f2fs_is_compress_backend_ready(inode))
		return -EOPNOTSUPP;

	/* f2fs only support ->fallocate for regular file */
	if (!S_ISREG(inode->i_mode))
		return -EINVAL;

	/* encrypted files cannot have their contents shifted */
	if (IS_ENCRYPTED(inode) && (mode & shift_modes))
		return -EOPNOTSUPP;

	/* compressed files only take the plain preallocation mode */
	if (f2fs_compressed_file(inode) && (mode & rewrite_modes))
		return -EOPNOTSUPP;

	if (mode & ~(FALLOC_FL_KEEP_SIZE | rewrite_modes))
		return -EOPNOTSUPP;

	inode_lock(inode);

	if (mode & FALLOC_FL_PUNCH_HOLE) {
		/* a hole starting at or past EOF: nothing to do */
		if (offset >= inode->i_size)
			goto out;

		ret = punch_hole(inode, offset, len);
	} else if (mode & FALLOC_FL_COLLAPSE_RANGE) {
		ret = f2fs_collapse_range(inode, offset, len);
	} else if (mode & FALLOC_FL_ZERO_RANGE) {
		ret = f2fs_zero_range(inode, offset, len, mode);
	} else if (mode & FALLOC_FL_INSERT_RANGE) {
		ret = f2fs_insert_range(inode, offset, len);
	} else {
		ret = expand_inode_data(inode, offset, len, mode);
	}

	if (ret == 0) {
		inode->i_mtime = inode->i_ctime = current_time(inode);
		f2fs_mark_inode_dirty_sync(inode, false);
		f2fs_update_time(sbi, REQ_TIME);
	}

out:
	inode_unlock(inode);

	trace_f2fs_fallocate(inode, mode, offset, len, ret);
	return ret;
}

1755 1756
static int f2fs_release_file(struct inode *inode, struct file *filp)
{
1757 1758 1759 1760 1761 1762 1763 1764
	/*
	 * f2fs_relase_file is called at every close calls. So we should
	 * not drop any inmemory pages by close called by other process.
	 */
	if (!(filp->f_mode & FMODE_WRITE) ||
			atomic_read(&inode->i_writecount) != 1)
		return 0;

1765 1766
	/* some remained atomic pages should discarded */
	if (f2fs_is_atomic_file(inode))
C
Chao Yu 已提交
1767
		f2fs_drop_inmem_pages(inode);
1768
	if (f2fs_is_volatile_file(inode)) {
1769
		set_inode_flag(inode, FI_DROP_CACHE);
1770
		filemap_fdatawrite(inode->i_mapping);
1771
		clear_inode_flag(inode, FI_DROP_CACHE);
1772 1773
		clear_inode_flag(inode, FI_VOLATILE_FILE);
		stat_dec_volatile_write(inode);
1774 1775 1776 1777
	}
	return 0;
}

1778
/*
 * ->flush handler.  Always returns 0.
 *
 * If the process doing a transaction has crashed, the transaction must be
 * rolled back.  Otherwise other readers/writers could see a corrupted
 * database until all the writers close the file.  This has to happen
 * before the file lock is dropped, hence it is done in ->flush.
 */
static int f2fs_file_flush(struct file *file, fl_owner_t id)
{
	struct inode *inode = file_inode(file);

	if (!f2fs_is_atomic_file(inode))
		return 0;

	/* only the task recorded in inmem_task drops the pages */
	if (F2FS_I(inode)->inmem_task != current)
		return 0;

	f2fs_drop_inmem_pages(inode);
	return 0;
}

1794
/*
 * Replace the bits of the inode's i_flags selected by @mask with @iflags.
 *
 * @iflags must not contain bits outside @mask.  Before the update the
 * function checks:
 *  - quota files (IS_NOQUOTA) are refused with -EPERM;
 *  - toggling F2FS_CASEFOLD_FL needs the casefold feature (-EOPNOTSUPP)
 *    and a directory that f2fs_empty_dir() accepts (-ENOTEMPTY);
 *  - F2FS_COMPR_FL / F2FS_NOCOMP_FL need the compression feature
 *    (-EOPNOTSUPP), must not be requested together, and their transitions
 *    must pass the checks below (-EINVAL).
 *
 * Returns 0 on success, after refreshing ctime and marking the inode dirty.
 */
static int f2fs_setflags_common(struct inode *inode, u32 iflags, u32 mask)
{
	struct f2fs_inode_info *fi = F2FS_I(inode);
	struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
	const u32 compr_pair = F2FS_COMPR_FL | F2FS_NOCOMP_FL;
	/* snapshot taken before any helper below can touch i_flags */
	const u32 cur = fi->i_flags & mask;
	const u32 toggled = iflags ^ cur;

	f2fs_bug_on(sbi, (iflags & ~mask));

	/* Is it quota file? Do not allow user to mess with it */
	if (IS_NOQUOTA(inode))
		return -EPERM;

	if (toggled & F2FS_CASEFOLD_FL) {
		if (!f2fs_sb_has_casefold(sbi))
			return -EOPNOTSUPP;
		if (!f2fs_empty_dir(inode))
			return -ENOTEMPTY;
	}

	if (iflags & compr_pair) {
		if (!f2fs_sb_has_compression(sbi))
			return -EOPNOTSUPP;
		/* the two flags are mutually exclusive */
		if ((iflags & compr_pair) == compr_pair)
			return -EINVAL;
	}

	if (toggled & F2FS_COMPR_FL) {
		/* turning compression off */
		if ((cur & F2FS_COMPR_FL) &&
				!f2fs_disable_compressed_file(inode))
			return -EINVAL;

		if (iflags & F2FS_NOCOMP_FL)
			return -EINVAL;

		/* turning compression on */
		if (iflags & F2FS_COMPR_FL) {
			if (!f2fs_may_compress(inode))
				return -EINVAL;
			if (S_ISREG(inode->i_mode) && inode->i_size)
				return -EINVAL;

			set_compress_context(inode);
		}
	}

	if ((toggled & F2FS_NOCOMP_FL) && (cur & F2FS_COMPR_FL))
		return -EINVAL;

	fi->i_flags = iflags | (fi->i_flags & ~mask);
	f2fs_bug_on(sbi, (fi->i_flags & F2FS_COMPR_FL) &&
					(fi->i_flags & F2FS_NOCOMP_FL));

	/* mirror the project-inherit bit into the in-memory inode flag */
	if (fi->i_flags & F2FS_PROJINHERIT_FL)
		set_inode_flag(inode, FI_PROJ_INHERIT);
	else
		clear_inode_flag(inode, FI_PROJ_INHERIT);

	inode->i_ctime = current_time(inode);
	f2fs_set_inode_flags(inode);
	f2fs_mark_inode_dirty_sync(inode, true);
	return 0;
}

1855 1856 1857 1858 1859 1860 1861 1862 1863 1864 1865 1866 1867
/* FS_IOC_GETFLAGS and FS_IOC_SETFLAGS support */

/*
 * To make a new on-disk f2fs i_flag gettable via FS_IOC_GETFLAGS, add an entry
 * for it to f2fs_fsflags_map[], and add its FS_*_FL equivalent to
 * F2FS_GETTABLE_FS_FL.  To also make it settable via FS_IOC_SETFLAGS, also add
 * its FS_*_FL equivalent to F2FS_SETTABLE_FS_FL.
 */

static const struct {
	u32 iflag;
	u32 fsflag;
} f2fs_fsflags_map[] = {
C
Chao Yu 已提交
1868
	{ F2FS_COMPR_FL,	FS_COMPR_FL },
1869 1870 1871 1872 1873
	{ F2FS_SYNC_FL,		FS_SYNC_FL },
	{ F2FS_IMMUTABLE_FL,	FS_IMMUTABLE_FL },
	{ F2FS_APPEND_FL,	FS_APPEND_FL },
	{ F2FS_NODUMP_FL,	FS_NODUMP_FL },
	{ F2FS_NOATIME_FL,	FS_NOATIME_FL },
C
Chao Yu 已提交
1874
	{ F2FS_NOCOMP_FL,	FS_NOCOMP_FL },
1875 1876 1877
	{ F2FS_INDEX_FL,	FS_INDEX_FL },
	{ F2FS_DIRSYNC_FL,	FS_DIRSYNC_FL },
	{ F2FS_PROJINHERIT_FL,	FS_PROJINHERIT_FL },
1878
	{ F2FS_CASEFOLD_FL,	FS_CASEFOLD_FL },
1879 1880 1881
};

/* FS_*_FL bits that f2fs_ioc_getflags() may report. */
#define F2FS_GETTABLE_FS_FL (					\
		FS_COMPR_FL | FS_SYNC_FL | FS_IMMUTABLE_FL |	\
		FS_APPEND_FL | FS_NODUMP_FL | FS_NOATIME_FL |	\
		FS_NOCOMP_FL | FS_INDEX_FL | FS_DIRSYNC_FL |	\
		FS_PROJINHERIT_FL | FS_ENCRYPT_FL |		\
		FS_INLINE_DATA_FL | FS_NOCOW_FL |		\
		FS_VERITY_FL | FS_CASEFOLD_FL)
1897 1898

/* FS_*_FL bits that f2fs_ioc_setflags() lets the caller change. */
#define F2FS_SETTABLE_FS_FL (					\
		FS_COMPR_FL | FS_SYNC_FL | FS_IMMUTABLE_FL |	\
		FS_APPEND_FL | FS_NODUMP_FL | FS_NOATIME_FL |	\
		FS_NOCOMP_FL | FS_DIRSYNC_FL |			\
		FS_PROJINHERIT_FL | FS_CASEFOLD_FL)
1909 1910 1911 1912 1913 1914 1915 1916 1917 1918 1919 1920 1921 1922 1923 1924 1925 1926 1927 1928 1929 1930 1931 1932 1933 1934 1935 1936 1937 1938 1939 1940 1941 1942 1943

/*
 * Convert f2fs on-disk i_flags to FS_IOC_{GET,SET}FLAGS flags.
 *
 * Only bits listed in f2fs_fsflags_map[] are translated; every other bit
 * of @iflags is dropped.
 */
static inline u32 f2fs_iflags_to_fsflags(u32 iflags)
{
	u32 out = 0;
	int idx = 0;

	while (idx < ARRAY_SIZE(f2fs_fsflags_map)) {
		if (f2fs_fsflags_map[idx].iflag & iflags)
			out |= f2fs_fsflags_map[idx].fsflag;
		idx++;
	}

	return out;
}

/*
 * Convert FS_IOC_{GET,SET}FLAGS flags to f2fs on-disk i_flags.
 *
 * Only bits listed in f2fs_fsflags_map[] are translated; every other bit
 * of @fsflags is dropped.
 */
static inline u32 f2fs_fsflags_to_iflags(u32 fsflags)
{
	u32 out = 0;
	int idx = 0;

	while (idx < ARRAY_SIZE(f2fs_fsflags_map)) {
		if (f2fs_fsflags_map[idx].fsflag & fsflags)
			out |= f2fs_fsflags_map[idx].iflag;
		idx++;
	}

	return out;
}

static int f2fs_ioc_getflags(struct file *filp, unsigned long arg)
{
	struct inode *inode = file_inode(filp);
	struct f2fs_inode_info *fi = F2FS_I(inode);
	u32 fsflags = f2fs_iflags_to_fsflags(fi->i_flags);

	if (IS_ENCRYPTED(inode))
		fsflags |= FS_ENCRYPT_FL;
E
Eric Biggers 已提交
1944 1945
	if (IS_VERITY(inode))
		fsflags |= FS_VERITY_FL;
1946 1947 1948 1949 1950 1951 1952 1953 1954 1955
	if (f2fs_has_inline_data(inode) || f2fs_has_inline_dentry(inode))
		fsflags |= FS_INLINE_DATA_FL;
	if (is_inode_flag_set(inode, FI_PIN_FILE))
		fsflags |= FS_NOCOW_FL;

	fsflags &= F2FS_GETTABLE_FS_FL;

	return put_user(fsflags, (int __user *)arg);
}

1956 1957 1958
static int f2fs_ioc_setflags(struct file *filp, unsigned long arg)
{
	struct inode *inode = file_inode(filp);
1959 1960
	struct f2fs_inode_info *fi = F2FS_I(inode);
	u32 fsflags, old_fsflags;
1961
	u32 iflags;
1962
	int ret;
J
Jaegeuk Kim 已提交
1963

1964 1965 1966
	if (!inode_owner_or_capable(inode))
		return -EACCES;

1967
	if (get_user(fsflags, (int __user *)arg))
1968 1969
		return -EFAULT;

1970 1971 1972 1973 1974 1975 1976 1977
	if (fsflags & ~F2FS_GETTABLE_FS_FL)
		return -EOPNOTSUPP;
	fsflags &= F2FS_SETTABLE_FS_FL;

	iflags = f2fs_fsflags_to_iflags(fsflags);
	if (f2fs_mask_flags(inode->i_mode, iflags) != iflags)
		return -EOPNOTSUPP;

1978 1979 1980
	ret = mnt_want_write_file(filp);
	if (ret)
		return ret;
J
Jaegeuk Kim 已提交
1981

A
Al Viro 已提交
1982
	inode_lock(inode);
J
Jaegeuk Kim 已提交
1983

1984 1985 1986 1987 1988
	old_fsflags = f2fs_iflags_to_fsflags(fi->i_flags);
	ret = vfs_ioc_setflags_prepare(inode, old_fsflags, fsflags);
	if (ret)
		goto out;

1989 1990
	ret = f2fs_setflags_common(inode, iflags,
			f2fs_fsflags_to_iflags(F2FS_SETTABLE_FS_FL));
1991
out:
1992
	inode_unlock(inode);
1993 1994 1995
	mnt_drop_write_file(filp);
	return ret;
}
1996

C
Chao Yu 已提交
1997 1998 1999 2000 2001 2002 2003
static int f2fs_ioc_getversion(struct file *filp, unsigned long arg)
{
	struct inode *inode = file_inode(filp);

	return put_user(inode->i_generation, (int __user *)arg);
}

J
Jaegeuk Kim 已提交
2004 2005 2006
static int f2fs_ioc_start_atomic_write(struct file *filp)
{
	struct inode *inode = file_inode(filp);
2007 2008
	struct f2fs_inode_info *fi = F2FS_I(inode);
	struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
2009
	int ret;
J
Jaegeuk Kim 已提交
2010 2011 2012 2013

	if (!inode_owner_or_capable(inode))
		return -EACCES;

2014 2015 2016
	if (!S_ISREG(inode->i_mode))
		return -EINVAL;

2017 2018 2019
	if (filp->f_flags & O_DIRECT)
		return -EINVAL;

2020 2021 2022 2023
	ret = mnt_want_write_file(filp);
	if (ret)
		return ret;

2024 2025
	inode_lock(inode);

C
Chao Yu 已提交
2026 2027
	f2fs_disable_compressed_file(inode);

2028 2029 2030
	if (f2fs_is_atomic_file(inode)) {
		if (is_inode_flag_set(inode, FI_ATOMIC_REVOKE_REQUEST))
			ret = -EINVAL;
2031
		goto out;
2032
	}
J
Jaegeuk Kim 已提交
2033

2034 2035
	ret = f2fs_convert_inline_inode(inode);
	if (ret)
2036
		goto out;
J
Jaegeuk Kim 已提交
2037

2038 2039
	down_write(&F2FS_I(inode)->i_gc_rwsem[WRITE]);

2040 2041 2042 2043 2044
	/*
	 * Should wait end_io to count F2FS_WB_CP_DATA correctly by
	 * f2fs_is_atomic_file.
	 */
	if (get_dirty_pages(inode))
2045 2046
		f2fs_warn(F2FS_I_SB(inode), "Unexpected flush for atomic writes: ino=%lu, npages=%u",
			  inode->i_ino, get_dirty_pages(inode));
2047
	ret = filemap_write_and_wait_range(inode->i_mapping, 0, LLONG_MAX);
2048 2049
	if (ret) {
		up_write(&F2FS_I(inode)->i_gc_rwsem[WRITE]);
2050
		goto out;
2051
	}
2052

2053 2054 2055
	spin_lock(&sbi->inode_lock[ATOMIC_FILE]);
	if (list_empty(&fi->inmem_ilist))
		list_add_tail(&fi->inmem_ilist, &sbi->inode_list[ATOMIC_FILE]);
2056
	sbi->atomic_files++;
2057 2058 2059
	spin_unlock(&sbi->inode_lock[ATOMIC_FILE]);

	/* add inode in inmem_list first and set atomic_file */
2060
	set_inode_flag(inode, FI_ATOMIC_FILE);
2061
	clear_inode_flag(inode, FI_ATOMIC_REVOKE_REQUEST);
2062
	up_write(&F2FS_I(inode)->i_gc_rwsem[WRITE]);
2063

2064
	f2fs_update_time(F2FS_I_SB(inode), REQ_TIME);
2065
	F2FS_I(inode)->inmem_task = current;
2066
	stat_update_max_atomic_write(inode);
2067
out:
2068
	inode_unlock(inode);
2069
	mnt_drop_write_file(filp);
2070
	return ret;
J
Jaegeuk Kim 已提交
2071 2072 2073 2074 2075 2076 2077 2078 2079 2080 2081 2082 2083 2084
}

static int f2fs_ioc_commit_atomic_write(struct file *filp)
{
	struct inode *inode = file_inode(filp);
	int ret;

	if (!inode_owner_or_capable(inode))
		return -EACCES;

	ret = mnt_want_write_file(filp);
	if (ret)
		return ret;

2085
	f2fs_balance_fs(F2FS_I_SB(inode), true);
2086

2087
	inode_lock(inode);
2088

2089 2090
	if (f2fs_is_volatile_file(inode)) {
		ret = -EINVAL;
2091
		goto err_out;
2092
	}
2093

2094
	if (f2fs_is_atomic_file(inode)) {
C
Chao Yu 已提交
2095
		ret = f2fs_commit_inmem_pages(inode);
C
Chao Yu 已提交
2096
		if (ret)
2097
			goto err_out;
C
Chao Yu 已提交
2098

2099
		ret = f2fs_do_sync_file(filp, 0, LLONG_MAX, 0, true);
2100 2101
		if (!ret)
			f2fs_drop_inmem_pages(inode);
2102
	} else {
2103
		ret = f2fs_do_sync_file(filp, 0, LLONG_MAX, 1, false);
2104
	}
2105
err_out:
2106 2107 2108 2109
	if (is_inode_flag_set(inode, FI_ATOMIC_REVOKE_REQUEST)) {
		clear_inode_flag(inode, FI_ATOMIC_REVOKE_REQUEST);
		ret = -EINVAL;
	}
2110
	inode_unlock(inode);
J
Jaegeuk Kim 已提交
2111 2112 2113 2114
	mnt_drop_write_file(filp);
	return ret;
}

2115 2116 2117
static int f2fs_ioc_start_volatile_write(struct file *filp)
{
	struct inode *inode = file_inode(filp);
2118
	int ret;
2119 2120 2121 2122

	if (!inode_owner_or_capable(inode))
		return -EACCES;

2123 2124 2125
	if (!S_ISREG(inode->i_mode))
		return -EINVAL;

2126 2127 2128 2129
	ret = mnt_want_write_file(filp);
	if (ret)
		return ret;

2130 2131
	inode_lock(inode);

2132
	if (f2fs_is_volatile_file(inode))
2133
		goto out;
2134

2135 2136
	ret = f2fs_convert_inline_inode(inode);
	if (ret)
2137
		goto out;
2138

2139 2140 2141
	stat_inc_volatile_write(inode);
	stat_update_max_volatile_write(inode);

2142
	set_inode_flag(inode, FI_VOLATILE_FILE);
2143
	f2fs_update_time(F2FS_I_SB(inode), REQ_TIME);
2144
out:
2145
	inode_unlock(inode);
2146 2147
	mnt_drop_write_file(filp);
	return ret;
2148 2149
}

2150 2151 2152
static int f2fs_ioc_release_volatile_write(struct file *filp)
{
	struct inode *inode = file_inode(filp);
2153
	int ret;
2154 2155 2156 2157

	if (!inode_owner_or_capable(inode))
		return -EACCES;

2158 2159 2160 2161
	ret = mnt_want_write_file(filp);
	if (ret)
		return ret;

2162 2163
	inode_lock(inode);

2164
	if (!f2fs_is_volatile_file(inode))
2165
		goto out;
2166

2167 2168 2169 2170
	if (!f2fs_is_first_block_written(inode)) {
		ret = truncate_partial_data_page(inode, 0, true);
		goto out;
	}
2171

2172 2173
	ret = punch_hole(inode, 0, F2FS_BLKSIZE);
out:
2174
	inode_unlock(inode);
2175 2176
	mnt_drop_write_file(filp);
	return ret;
2177 2178 2179 2180 2181 2182 2183 2184 2185 2186 2187 2188 2189 2190
}

static int f2fs_ioc_abort_volatile_write(struct file *filp)
{
	struct inode *inode = file_inode(filp);
	int ret;

	if (!inode_owner_or_capable(inode))
		return -EACCES;

	ret = mnt_want_write_file(filp);
	if (ret)
		return ret;

2191 2192
	inode_lock(inode);

2193
	if (f2fs_is_atomic_file(inode))
C
Chao Yu 已提交
2194
		f2fs_drop_inmem_pages(inode);
2195
	if (f2fs_is_volatile_file(inode)) {
2196
		clear_inode_flag(inode, FI_VOLATILE_FILE);
2197
		stat_dec_volatile_write(inode);
2198
		ret = f2fs_do_sync_file(filp, 0, LLONG_MAX, 0, true);
2199
	}
2200

2201 2202
	clear_inode_flag(inode, FI_ATOMIC_REVOKE_REQUEST);

2203 2204
	inode_unlock(inode);

2205
	mnt_drop_write_file(filp);
2206
	f2fs_update_time(F2FS_I_SB(inode), REQ_TIME);
2207 2208 2209
	return ret;
}

J
Jaegeuk Kim 已提交
2210 2211 2212 2213 2214 2215
static int f2fs_ioc_shutdown(struct file *filp, unsigned long arg)
{
	struct inode *inode = file_inode(filp);
	struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
	struct super_block *sb = sbi->sb;
	__u32 in;
2216
	int ret = 0;
J
Jaegeuk Kim 已提交
2217 2218 2219 2220 2221 2222 2223

	if (!capable(CAP_SYS_ADMIN))
		return -EPERM;

	if (get_user(in, (__u32 __user *)arg))
		return -EFAULT;

2224 2225
	if (in != F2FS_GOING_DOWN_FULLSYNC) {
		ret = mnt_want_write_file(filp);
2226 2227 2228 2229 2230 2231 2232
		if (ret) {
			if (ret == -EROFS) {
				ret = 0;
				f2fs_stop_checkpoint(sbi, false);
				set_sbi_flag(sbi, SBI_IS_SHUTDOWN);
				trace_f2fs_shutdown(sbi, in, ret);
			}
2233
			return ret;
2234
		}
2235
	}
2236

J
Jaegeuk Kim 已提交
2237 2238 2239
	switch (in) {
	case F2FS_GOING_DOWN_FULLSYNC:
		sb = freeze_bdev(sb->s_bdev);
2240 2241 2242 2243 2244
		if (IS_ERR(sb)) {
			ret = PTR_ERR(sb);
			goto out;
		}
		if (sb) {
2245
			f2fs_stop_checkpoint(sbi, false);
2246
			set_sbi_flag(sbi, SBI_IS_SHUTDOWN);
J
Jaegeuk Kim 已提交
2247 2248 2249 2250 2251
			thaw_bdev(sb->s_bdev, sb);
		}
		break;
	case F2FS_GOING_DOWN_METASYNC:
		/* do checkpoint only */
2252 2253 2254
		ret = f2fs_sync_fs(sb, 1);
		if (ret)
			goto out;
2255
		f2fs_stop_checkpoint(sbi, false);
2256
		set_sbi_flag(sbi, SBI_IS_SHUTDOWN);
J
Jaegeuk Kim 已提交
2257 2258
		break;
	case F2FS_GOING_DOWN_NOSYNC:
2259
		f2fs_stop_checkpoint(sbi, false);
2260
		set_sbi_flag(sbi, SBI_IS_SHUTDOWN);
J
Jaegeuk Kim 已提交
2261
		break;
2262
	case F2FS_GOING_DOWN_METAFLUSH:
C
Chao Yu 已提交
2263
		f2fs_sync_meta_pages(sbi, META, LONG_MAX, FS_META_IO);
2264
		f2fs_stop_checkpoint(sbi, false);
2265
		set_sbi_flag(sbi, SBI_IS_SHUTDOWN);
2266
		break;
2267 2268
	case F2FS_GOING_DOWN_NEED_FSCK:
		set_sbi_flag(sbi, SBI_NEED_FSCK);
2269 2270
		set_sbi_flag(sbi, SBI_CP_DISABLED_QUICK);
		set_sbi_flag(sbi, SBI_IS_DIRTY);
2271 2272
		/* do checkpoint only */
		ret = f2fs_sync_fs(sb, 1);
2273
		goto out;
J
Jaegeuk Kim 已提交
2274
	default:
2275 2276
		ret = -EINVAL;
		goto out;
J
Jaegeuk Kim 已提交
2277
	}
2278

C
Chao Yu 已提交
2279 2280
	f2fs_stop_gc_thread(sbi);
	f2fs_stop_discard_thread(sbi);
2281

C
Chao Yu 已提交
2282
	f2fs_drop_discard_cmd(sbi);
2283 2284
	clear_opt(sbi, DISCARD);

2285
	f2fs_update_time(sbi, REQ_TIME);
2286
out:
2287 2288
	if (in != F2FS_GOING_DOWN_FULLSYNC)
		mnt_drop_write_file(filp);
C
Chao Yu 已提交
2289 2290 2291

	trace_f2fs_shutdown(sbi, in, ret);

2292
	return ret;
J
Jaegeuk Kim 已提交
2293 2294
}

2295 2296 2297 2298 2299 2300 2301
static int f2fs_ioc_fitrim(struct file *filp, unsigned long arg)
{
	struct inode *inode = file_inode(filp);
	struct super_block *sb = inode->i_sb;
	struct request_queue *q = bdev_get_queue(sb->s_bdev);
	struct fstrim_range range;
	int ret;
2302

2303 2304
	if (!capable(CAP_SYS_ADMIN))
		return -EPERM;
2305

2306
	if (!f2fs_hw_support_discard(F2FS_SB(sb)))
2307
		return -EOPNOTSUPP;
2308

2309 2310 2311
	if (copy_from_user(&range, (struct fstrim_range __user *)arg,
				sizeof(range)))
		return -EFAULT;
2312

2313 2314 2315 2316
	ret = mnt_want_write_file(filp);
	if (ret)
		return ret;

2317 2318 2319
	range.minlen = max((unsigned int)range.minlen,
				q->limits.discard_granularity);
	ret = f2fs_trim_fs(F2FS_SB(sb), &range);
2320
	mnt_drop_write_file(filp);
2321 2322
	if (ret < 0)
		return ret;
2323

2324 2325 2326
	if (copy_to_user((struct fstrim_range __user *)arg, &range,
				sizeof(range)))
		return -EFAULT;
2327
	f2fs_update_time(F2FS_I_SB(inode), REQ_TIME);
2328 2329 2330
	return 0;
}

2331 2332 2333 2334 2335 2336 2337 2338 2339 2340 2341 2342 2343 2344
/* Return true when at least one of the 16 bytes in @u is non-zero. */
static bool uuid_is_nonzero(__u8 u[16])
{
	__u8 seen = 0;
	int pos = 16;

	/* fold every byte together; any set bit survives the OR */
	while (pos-- > 0)
		seen |= u[pos];

	return seen != 0;
}

static int f2fs_ioc_set_encryption_policy(struct file *filp, unsigned long arg)
{
	struct inode *inode = file_inode(filp);

2345
	if (!f2fs_sb_has_encrypt(F2FS_I_SB(inode)))
2346 2347
		return -EOPNOTSUPP;

2348
	f2fs_update_time(F2FS_I_SB(inode), REQ_TIME);
2349

2350
	return fscrypt_ioctl_set_policy(filp, (const void __user *)arg);
2351 2352 2353 2354
}

static int f2fs_ioc_get_encryption_policy(struct file *filp, unsigned long arg)
{
2355
	if (!f2fs_sb_has_encrypt(F2FS_I_SB(file_inode(filp))))
2356
		return -EOPNOTSUPP;
2357
	return fscrypt_ioctl_get_policy(filp, (void __user *)arg);
2358 2359 2360 2361 2362 2363 2364 2365
}

static int f2fs_ioc_get_encryption_pwsalt(struct file *filp, unsigned long arg)
{
	struct inode *inode = file_inode(filp);
	struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
	int err;

2366
	if (!f2fs_sb_has_encrypt(sbi))
2367 2368 2369 2370 2371 2372
		return -EOPNOTSUPP;

	err = mnt_want_write_file(filp);
	if (err)
		return err;

2373
	down_write(&sbi->sb_lock);
2374 2375 2376 2377

	if (uuid_is_nonzero(sbi->raw_super->encrypt_pw_salt))
		goto got_it;

2378 2379 2380
	/* update superblock with uuid */
	generate_random_uuid(sbi->raw_super->encrypt_pw_salt);

C
Chao Yu 已提交
2381
	err = f2fs_commit_super(sbi, false);
2382 2383 2384
	if (err) {
		/* undo new data */
		memset(sbi->raw_super->encrypt_pw_salt, 0, 16);
2385
		goto out_err;
2386 2387 2388 2389
	}
got_it:
	if (copy_to_user((__u8 __user *)arg, sbi->raw_super->encrypt_pw_salt,
									16))
2390 2391
		err = -EFAULT;
out_err:
2392
	up_write(&sbi->sb_lock);
2393 2394
	mnt_drop_write_file(filp);
	return err;
2395 2396
}

E
Eric Biggers 已提交
2397 2398 2399 2400 2401 2402 2403 2404 2405 2406 2407 2408 2409 2410 2411 2412 2413 2414 2415 2416 2417 2418 2419 2420 2421 2422 2423 2424 2425 2426 2427 2428 2429 2430 2431 2432 2433 2434 2435 2436 2437 2438 2439
/*
 * Forward to fscrypt_ioctl_get_policy_ex() when the superblock has the
 * encrypt feature; otherwise fail with -EOPNOTSUPP.
 */
static int f2fs_ioc_get_encryption_policy_ex(struct file *filp,
					     unsigned long arg)
{
	struct f2fs_sb_info *sbi = F2FS_I_SB(file_inode(filp));

	if (f2fs_sb_has_encrypt(sbi))
		return fscrypt_ioctl_get_policy_ex(filp, (void __user *)arg);

	return -EOPNOTSUPP;
}

/*
 * Forward to fscrypt_ioctl_add_key() when the superblock has the encrypt
 * feature; otherwise fail with -EOPNOTSUPP.
 */
static int f2fs_ioc_add_encryption_key(struct file *filp, unsigned long arg)
{
	struct f2fs_sb_info *sbi = F2FS_I_SB(file_inode(filp));

	if (f2fs_sb_has_encrypt(sbi))
		return fscrypt_ioctl_add_key(filp, (void __user *)arg);

	return -EOPNOTSUPP;
}

/*
 * Forward to fscrypt_ioctl_remove_key() when the superblock has the
 * encrypt feature; otherwise fail with -EOPNOTSUPP.
 */
static int f2fs_ioc_remove_encryption_key(struct file *filp, unsigned long arg)
{
	struct f2fs_sb_info *sbi = F2FS_I_SB(file_inode(filp));

	if (f2fs_sb_has_encrypt(sbi))
		return fscrypt_ioctl_remove_key(filp, (void __user *)arg);

	return -EOPNOTSUPP;
}

/*
 * Forward to fscrypt_ioctl_remove_key_all_users() when the superblock has
 * the encrypt feature; otherwise fail with -EOPNOTSUPP.
 */
static int f2fs_ioc_remove_encryption_key_all_users(struct file *filp,
						    unsigned long arg)
{
	struct f2fs_sb_info *sbi = F2FS_I_SB(file_inode(filp));

	if (f2fs_sb_has_encrypt(sbi))
		return fscrypt_ioctl_remove_key_all_users(filp,
							  (void __user *)arg);

	return -EOPNOTSUPP;
}

/*
 * Forward to fscrypt_ioctl_get_key_status() when the superblock has the
 * encrypt feature; otherwise fail with -EOPNOTSUPP.
 */
static int f2fs_ioc_get_encryption_key_status(struct file *filp,
					      unsigned long arg)
{
	struct f2fs_sb_info *sbi = F2FS_I_SB(file_inode(filp));

	if (f2fs_sb_has_encrypt(sbi))
		return fscrypt_ioctl_get_key_status(filp, (void __user *)arg);

	return -EOPNOTSUPP;
}

2440 2441 2442 2443 2444 2445 2446 2447
/*
 * Forward to fscrypt_ioctl_get_nonce() when the superblock has the encrypt
 * feature; otherwise fail with -EOPNOTSUPP.
 */
static int f2fs_ioc_get_encryption_nonce(struct file *filp, unsigned long arg)
{
	struct f2fs_sb_info *sbi = F2FS_I_SB(file_inode(filp));

	if (f2fs_sb_has_encrypt(sbi))
		return fscrypt_ioctl_get_nonce(filp, (void __user *)arg);

	return -EOPNOTSUPP;
}

2448 2449 2450 2451
static int f2fs_ioc_gc(struct file *filp, unsigned long arg)
{
	struct inode *inode = file_inode(filp);
	struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
C
Chao Yu 已提交
2452
	__u32 sync;
2453
	int ret;
2454 2455 2456 2457

	if (!capable(CAP_SYS_ADMIN))
		return -EPERM;

C
Chao Yu 已提交
2458
	if (get_user(sync, (__u32 __user *)arg))
2459 2460
		return -EFAULT;

C
Chao Yu 已提交
2461 2462
	if (f2fs_readonly(sbi->sb))
		return -EROFS;
2463

2464 2465 2466 2467
	ret = mnt_want_write_file(filp);
	if (ret)
		return ret;

C
Chao Yu 已提交
2468
	if (!sync) {
C
Chao Yu 已提交
2469
		if (!down_write_trylock(&sbi->gc_lock)) {
2470 2471 2472
			ret = -EBUSY;
			goto out;
		}
C
Chao Yu 已提交
2473
	} else {
C
Chao Yu 已提交
2474
		down_write(&sbi->gc_lock);
2475 2476
	}

2477
	ret = f2fs_gc(sbi, sync, true, NULL_SEGNO);
2478 2479 2480
out:
	mnt_drop_write_file(filp);
	return ret;
2481 2482
}

2483 2484 2485 2486 2487 2488 2489 2490 2491 2492 2493 2494 2495 2496 2497 2498 2499 2500
static int f2fs_ioc_gc_range(struct file *filp, unsigned long arg)
{
	struct inode *inode = file_inode(filp);
	struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
	struct f2fs_gc_range range;
	u64 end;
	int ret;

	if (!capable(CAP_SYS_ADMIN))
		return -EPERM;

	if (copy_from_user(&range, (struct f2fs_gc_range __user *)arg,
							sizeof(range)))
		return -EFAULT;

	if (f2fs_readonly(sbi->sb))
		return -EROFS;

2501
	end = range.start + range.len;
2502 2503
	if (end < range.start || range.start < MAIN_BLKADDR(sbi) ||
					end >= MAX_BLKADDR(sbi))
2504 2505
		return -EINVAL;

2506 2507 2508 2509 2510 2511
	ret = mnt_want_write_file(filp);
	if (ret)
		return ret;

do_more:
	if (!range.sync) {
C
Chao Yu 已提交
2512
		if (!down_write_trylock(&sbi->gc_lock)) {
2513 2514 2515 2516
			ret = -EBUSY;
			goto out;
		}
	} else {
C
Chao Yu 已提交
2517
		down_write(&sbi->gc_lock);
2518 2519 2520
	}

	ret = f2fs_gc(sbi, range.sync, true, GET_SEGNO(sbi, range.start));
2521 2522 2523 2524 2525
	if (ret) {
		if (ret == -EBUSY)
			ret = -EAGAIN;
		goto out;
	}
2526
	range.start += BLKS_PER_SEC(sbi);
2527 2528 2529 2530 2531 2532 2533
	if (range.start <= end)
		goto do_more;
out:
	mnt_drop_write_file(filp);
	return ret;
}

C
Chao Yu 已提交
2534
static int f2fs_ioc_write_checkpoint(struct file *filp, unsigned long arg)
2535 2536 2537
{
	struct inode *inode = file_inode(filp);
	struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
2538
	int ret;
2539 2540 2541 2542 2543 2544 2545

	if (!capable(CAP_SYS_ADMIN))
		return -EPERM;

	if (f2fs_readonly(sbi->sb))
		return -EROFS;

D
Daniel Rosenberg 已提交
2546
	if (unlikely(is_sbi_flag_set(sbi, SBI_CP_DISABLED))) {
2547
		f2fs_info(sbi, "Skipping Checkpoint. Checkpoints currently disabled.");
D
Daniel Rosenberg 已提交
2548 2549 2550
		return -EINVAL;
	}

2551 2552 2553 2554 2555 2556 2557 2558
	ret = mnt_want_write_file(filp);
	if (ret)
		return ret;

	ret = f2fs_sync_fs(sbi->sb, 1);

	mnt_drop_write_file(filp);
	return ret;
2559 2560
}

C
Chao Yu 已提交
2561 2562 2563 2564 2565
static int f2fs_defragment_range(struct f2fs_sb_info *sbi,
					struct file *filp,
					struct f2fs_defragment *range)
{
	struct inode *inode = file_inode(filp);
2566
	struct f2fs_map_blocks map = { .m_next_extent = NULL,
2567 2568
					.m_seg_type = NO_CHECK_TYPE ,
					.m_may_create = false };
2569
	struct extent_info ei = {0, 0, 0};
2570
	pgoff_t pg_start, pg_end, next_pgofs;
2571
	unsigned int blk_per_seg = sbi->blocks_per_seg;
C
Chao Yu 已提交
2572 2573 2574 2575 2576 2577
	unsigned int total = 0, sec_num;
	block_t blk_end = 0;
	bool fragmented = false;
	int err;

	/* if in-place-update policy is enabled, don't waste time here */
C
Chao Yu 已提交
2578
	if (f2fs_should_update_inplace(inode, NULL))
C
Chao Yu 已提交
2579 2580
		return -EINVAL;

2581 2582
	pg_start = range->start >> PAGE_SHIFT;
	pg_end = (range->start + range->len) >> PAGE_SHIFT;
C
Chao Yu 已提交
2583

J
Jaegeuk Kim 已提交
2584
	f2fs_balance_fs(sbi, true);
C
Chao Yu 已提交
2585

A
Al Viro 已提交
2586
	inode_lock(inode);
C
Chao Yu 已提交
2587 2588 2589

	/* writeback all dirty pages in the range */
	err = filemap_write_and_wait_range(inode->i_mapping, range->start,
2590
						range->start + range->len - 1);
C
Chao Yu 已提交
2591 2592 2593 2594 2595 2596 2597 2598 2599 2600 2601 2602 2603
	if (err)
		goto out;

	/*
	 * lookup mapping info in extent cache, skip defragmenting if physical
	 * block addresses are continuous.
	 */
	if (f2fs_lookup_extent_cache(inode, pg_start, &ei)) {
		if (ei.fofs + ei.len >= pg_end)
			goto out;
	}

	map.m_lblk = pg_start;
2604
	map.m_next_pgofs = &next_pgofs;
C
Chao Yu 已提交
2605 2606 2607 2608 2609 2610 2611

	/*
	 * lookup mapping info in dnode page cache, skip defragmenting if all
	 * physical block addresses are continuous even if there are hole(s)
	 * in logical blocks.
	 */
	while (map.m_lblk < pg_end) {
F
Fan Li 已提交
2612
		map.m_len = pg_end - map.m_lblk;
2613
		err = f2fs_map_blocks(inode, &map, 0, F2FS_GET_BLOCK_DEFAULT);
C
Chao Yu 已提交
2614 2615 2616 2617
		if (err)
			goto out;

		if (!(map.m_flags & F2FS_MAP_FLAGS)) {
2618
			map.m_lblk = next_pgofs;
C
Chao Yu 已提交
2619 2620 2621
			continue;
		}

2622
		if (blk_end && blk_end != map.m_pblk)
C
Chao Yu 已提交
2623
			fragmented = true;
2624 2625 2626 2627

		/* record total count of block that we're going to move */
		total += map.m_len;

C
Chao Yu 已提交
2628 2629 2630 2631 2632
		blk_end = map.m_pblk + map.m_len;

		map.m_lblk += map.m_len;
	}

2633 2634
	if (!fragmented) {
		total = 0;
C
Chao Yu 已提交
2635
		goto out;
2636
	}
C
Chao Yu 已提交
2637

2638
	sec_num = DIV_ROUND_UP(total, BLKS_PER_SEC(sbi));
C
Chao Yu 已提交
2639 2640 2641 2642 2643 2644

	/*
	 * make sure there are enough free section for LFS allocation, this can
	 * avoid defragment running in SSR mode when free section are allocated
	 * intensively
	 */
2645
	if (has_not_enough_free_secs(sbi, 0, sec_num)) {
C
Chao Yu 已提交
2646 2647 2648 2649
		err = -EAGAIN;
		goto out;
	}

2650 2651 2652 2653
	map.m_lblk = pg_start;
	map.m_len = pg_end - pg_start;
	total = 0;

C
Chao Yu 已提交
2654 2655 2656 2657 2658
	while (map.m_lblk < pg_end) {
		pgoff_t idx;
		int cnt = 0;

do_map:
F
Fan Li 已提交
2659
		map.m_len = pg_end - map.m_lblk;
2660
		err = f2fs_map_blocks(inode, &map, 0, F2FS_GET_BLOCK_DEFAULT);
C
Chao Yu 已提交
2661 2662 2663 2664
		if (err)
			goto clear_out;

		if (!(map.m_flags & F2FS_MAP_FLAGS)) {
2665
			map.m_lblk = next_pgofs;
2666
			goto check;
C
Chao Yu 已提交
2667 2668
		}

2669
		set_inode_flag(inode, FI_DO_DEFRAG);
C
Chao Yu 已提交
2670 2671 2672 2673 2674

		idx = map.m_lblk;
		while (idx < map.m_lblk + map.m_len && cnt < blk_per_seg) {
			struct page *page;

C
Chao Yu 已提交
2675
			page = f2fs_get_lock_data_page(inode, idx, true);
C
Chao Yu 已提交
2676 2677 2678 2679 2680 2681 2682 2683 2684 2685 2686 2687 2688 2689
			if (IS_ERR(page)) {
				err = PTR_ERR(page);
				goto clear_out;
			}

			set_page_dirty(page);
			f2fs_put_page(page, 1);

			idx++;
			cnt++;
			total++;
		}

		map.m_lblk = idx;
2690 2691
check:
		if (map.m_lblk < pg_end && cnt < blk_per_seg)
C
Chao Yu 已提交
2692 2693
			goto do_map;

2694
		clear_inode_flag(inode, FI_DO_DEFRAG);
C
Chao Yu 已提交
2695 2696 2697 2698 2699 2700

		err = filemap_fdatawrite(inode->i_mapping);
		if (err)
			goto out;
	}
clear_out:
2701
	clear_inode_flag(inode, FI_DO_DEFRAG);
C
Chao Yu 已提交
2702
out:
A
Al Viro 已提交
2703
	inode_unlock(inode);
C
Chao Yu 已提交
2704
	if (!err)
2705
		range->len = (u64)total << PAGE_SHIFT;
C
Chao Yu 已提交
2706 2707 2708 2709 2710 2711 2712 2713 2714 2715 2716 2717 2718
	return err;
}

static int f2fs_ioc_defragment(struct file *filp, unsigned long arg)
{
	struct inode *inode = file_inode(filp);
	struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
	struct f2fs_defragment range;
	int err;

	if (!capable(CAP_SYS_ADMIN))
		return -EPERM;

2719
	if (!S_ISREG(inode->i_mode) || f2fs_is_atomic_file(inode))
C
Chao Yu 已提交
2720 2721
		return -EINVAL;

2722 2723
	if (f2fs_readonly(sbi->sb))
		return -EROFS;
C
Chao Yu 已提交
2724 2725

	if (copy_from_user(&range, (struct f2fs_defragment __user *)arg,
2726 2727
							sizeof(range)))
		return -EFAULT;
C
Chao Yu 已提交
2728 2729

	/* verify alignment of offset & size */
2730 2731
	if (range.start & (F2FS_BLKSIZE - 1) || range.len & (F2FS_BLKSIZE - 1))
		return -EINVAL;
C
Chao Yu 已提交
2732

S
Sheng Yong 已提交
2733
	if (unlikely((range.start + range.len) >> PAGE_SHIFT >
2734 2735 2736 2737 2738 2739
					sbi->max_file_blocks))
		return -EINVAL;

	err = mnt_want_write_file(filp);
	if (err)
		return err;
S
Sheng Yong 已提交
2740

C
Chao Yu 已提交
2741
	err = f2fs_defragment_range(sbi, filp, &range);
2742 2743
	mnt_drop_write_file(filp);

2744
	f2fs_update_time(sbi, REQ_TIME);
C
Chao Yu 已提交
2745
	if (err < 0)
2746
		return err;
C
Chao Yu 已提交
2747 2748 2749

	if (copy_to_user((struct f2fs_defragment __user *)arg, &range,
							sizeof(range)))
2750 2751 2752
		return -EFAULT;

	return 0;
C
Chao Yu 已提交
2753 2754
}

2755 2756 2757 2758 2759 2760 2761 2762 2763 2764 2765 2766 2767 2768 2769 2770 2771
/*
 * Move @len bytes of block mappings from @file_in at @pos_in to @file_out
 * at @pos_out by exchanging data blocks.
 *
 * Both files must be regular, unencrypted, on the same mount and
 * superblock. @pos_in, @pos_out and the end of the source range must be
 * F2FS_BLKSIZE-aligned; a range that ends exactly at the source i_size is
 * rounded up to the next block boundary. A @len of 0 means "to the end of
 * the source file". Overlapping forward moves within one file are
 * rejected.
 *
 * The destination inode lock and i_gc_rwsem[WRITE] are only try-locked
 * when the two inodes differ, so -EBUSY is returned instead of blocking.
 *
 * Returns 0 on success, -EXDEV, -EROFS, -EINVAL, -EOPNOTSUPP or -EBUSY as
 * described above, or an error from the helpers called.
 */
static int f2fs_move_file_range(struct file *file_in, loff_t pos_in,
			struct file *file_out, loff_t pos_out, size_t len)
{
	struct inode *src = file_inode(file_in);
	struct inode *dst = file_inode(file_out);
	struct f2fs_sb_info *sbi = F2FS_I_SB(src);
	size_t olen = len, dst_max_i_size = 0;
	size_t dst_osize;
	int ret;

	if (file_in->f_path.mnt != file_out->f_path.mnt ||
				src->i_sb != dst->i_sb)
		return -EXDEV;

	if (unlikely(f2fs_readonly(src->i_sb)))
		return -EROFS;

	if (!S_ISREG(src->i_mode) || !S_ISREG(dst->i_mode))
		return -EINVAL;

	if (IS_ENCRYPTED(src) || IS_ENCRYPTED(dst))
		return -EOPNOTSUPP;

	if (pos_out < 0 || pos_in < 0)
		return -EINVAL;

	if (src == dst) {
		if (pos_in == pos_out)
			return 0;
		if (pos_out > pos_in && pos_out < pos_in + len)
			return -EINVAL;
	}

	inode_lock(src);
	if (src != dst) {
		ret = -EBUSY;
		if (!inode_trylock(dst))
			goto out;
	}

	ret = -EINVAL;
	if (pos_in + len > src->i_size || pos_in + len < pos_in)
		goto out_unlock;
	if (len == 0)
		olen = len = src->i_size - pos_in;
	/* a range reaching EOF is extended to cover the whole last block */
	if (pos_in + len == src->i_size)
		len = ALIGN(src->i_size, F2FS_BLKSIZE) - pos_in;
	if (len == 0) {
		ret = 0;
		goto out_unlock;
	}

	/* olen (the unrounded length) decides the new destination size */
	dst_osize = dst->i_size;
	if (pos_out + olen > dst->i_size)
		dst_max_i_size = pos_out + olen;

	/* verify the end result is block aligned */
	if (!IS_ALIGNED(pos_in, F2FS_BLKSIZE) ||
			!IS_ALIGNED(pos_in + len, F2FS_BLKSIZE) ||
			!IS_ALIGNED(pos_out, F2FS_BLKSIZE))
		goto out_unlock;

	ret = f2fs_convert_inline_inode(src);
	if (ret)
		goto out_unlock;

	ret = f2fs_convert_inline_inode(dst);
	if (ret)
		goto out_unlock;

	/* write out all dirty pages from offset */
	ret = filemap_write_and_wait_range(src->i_mapping,
					pos_in, pos_in + len);
	if (ret)
		goto out_unlock;

	ret = filemap_write_and_wait_range(dst->i_mapping,
					pos_out, pos_out + len);
	if (ret)
		goto out_unlock;

	f2fs_balance_fs(sbi, true);

	down_write(&F2FS_I(src)->i_gc_rwsem[WRITE]);
	if (src != dst) {
		ret = -EBUSY;
		if (!down_write_trylock(&F2FS_I(dst)->i_gc_rwsem[WRITE]))
			goto out_src;
	}

	f2fs_lock_op(sbi);
	ret = __exchange_data_block(src, dst, pos_in >> F2FS_BLKSIZE_BITS,
				pos_out >> F2FS_BLKSIZE_BITS,
				len >> F2FS_BLKSIZE_BITS, false);

	if (!ret) {
		/* grow to the new end, or restore the size seen before the move */
		if (dst_max_i_size)
			f2fs_i_size_write(dst, dst_max_i_size);
		else if (dst_osize != dst->i_size)
			f2fs_i_size_write(dst, dst_osize);
	}
	f2fs_unlock_op(sbi);

	if (src != dst)
		up_write(&F2FS_I(dst)->i_gc_rwsem[WRITE]);
out_src:
	up_write(&F2FS_I(src)->i_gc_rwsem[WRITE]);
out_unlock:
	if (src != dst)
		inode_unlock(dst);
out:
	inode_unlock(src);
	return ret;
}

/*
 * Move-range ioctl entry point.
 *
 * @filp: source file; must be open for both reading and writing
 * @arg:  user pointer to a struct f2fs_move_range naming the destination
 *        fd, both offsets and the length; copied back on success
 *
 * Returns 0 on success, -EBADF when either file lacks the required access
 * mode or the destination fd is invalid, -EFAULT on a failed user copy, or
 * an error from mnt_want_write_file() / f2fs_move_file_range().
 */
static int f2fs_ioc_move_range(struct file *filp, unsigned long arg)
{
	struct f2fs_move_range range;
	struct fd dst;
	int err;

	if (!(filp->f_mode & FMODE_READ) ||
			!(filp->f_mode & FMODE_WRITE))
		return -EBADF;

	if (copy_from_user(&range, (struct f2fs_move_range __user *)arg,
							sizeof(range)))
		return -EFAULT;

	dst = fdget(range.dst_fd);
	if (!dst.file)
		return -EBADF;

	if (!(dst.file->f_mode & FMODE_WRITE)) {
		err = -EBADF;
		goto err_out;
	}

	err = mnt_want_write_file(filp);
	if (err)
		goto err_out;

	err = f2fs_move_file_range(filp, range.pos_in, dst.file,
					range.pos_out, range.len);

	mnt_drop_write_file(filp);
	if (err)
		goto err_out;

	if (copy_to_user((struct f2fs_move_range __user *)arg,
						&range, sizeof(range)))
		err = -EFAULT;
err_out:
	/* every path that obtained dst must drop it */
	fdput(dst);
	return err;
}

2912 2913 2914 2915 2916 2917 2918 2919 2920 2921 2922 2923 2924 2925 2926 2927
static int f2fs_ioc_flush_device(struct file *filp, unsigned long arg)
{
	struct inode *inode = file_inode(filp);
	struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
	struct sit_info *sm = SIT_I(sbi);
	unsigned int start_segno = 0, end_segno = 0;
	unsigned int dev_start_segno = 0, dev_end_segno = 0;
	struct f2fs_flush_device range;
	int ret;

	if (!capable(CAP_SYS_ADMIN))
		return -EPERM;

	if (f2fs_readonly(sbi->sb))
		return -EROFS;

D
Daniel Rosenberg 已提交
2928 2929 2930
	if (unlikely(is_sbi_flag_set(sbi, SBI_CP_DISABLED)))
		return -EINVAL;

2931 2932 2933 2934
	if (copy_from_user(&range, (struct f2fs_flush_device __user *)arg,
							sizeof(range)))
		return -EFAULT;

2935
	if (!f2fs_is_multi_device(sbi) || sbi->s_ndevs - 1 <= range.dev_num ||
2936
			__is_large_section(sbi)) {
2937 2938
		f2fs_warn(sbi, "Can't flush %u in %d for segs_per_sec %u != 1",
			  range.dev_num, sbi->s_ndevs, sbi->segs_per_sec);
2939 2940 2941 2942 2943 2944 2945 2946 2947 2948 2949 2950 2951 2952 2953 2954 2955
		return -EINVAL;
	}

	ret = mnt_want_write_file(filp);
	if (ret)
		return ret;

	if (range.dev_num != 0)
		dev_start_segno = GET_SEGNO(sbi, FDEV(range.dev_num).start_blk);
	dev_end_segno = GET_SEGNO(sbi, FDEV(range.dev_num).end_blk);

	start_segno = sm->last_victim[FLUSH_DEVICE];
	if (start_segno < dev_start_segno || start_segno >= dev_end_segno)
		start_segno = dev_start_segno;
	end_segno = min(start_segno + range.segments, dev_end_segno);

	while (start_segno < end_segno) {
C
Chao Yu 已提交
2956
		if (!down_write_trylock(&sbi->gc_lock)) {
2957 2958 2959 2960 2961 2962 2963 2964 2965 2966 2967 2968 2969 2970 2971 2972 2973 2974
			ret = -EBUSY;
			goto out;
		}
		sm->last_victim[GC_CB] = end_segno + 1;
		sm->last_victim[GC_GREEDY] = end_segno + 1;
		sm->last_victim[ALLOC_NEXT] = end_segno + 1;
		ret = f2fs_gc(sbi, true, true, start_segno);
		if (ret == -EAGAIN)
			ret = 0;
		else if (ret < 0)
			break;
		start_segno++;
	}
out:
	mnt_drop_write_file(filp);
	return ret;
}

2975 2976 2977 2978 2979 2980 2981 2982 2983 2984
static int f2fs_ioc_get_features(struct file *filp, unsigned long arg)
{
	struct inode *inode = file_inode(filp);
	u32 sb_feature = le32_to_cpu(F2FS_I_SB(inode)->raw_super->feature);

	/* Must validate to set it with SQLite behavior in Android. */
	sb_feature |= F2FS_FEATURE_ATOMIC_WRITE;

	return put_user(sb_feature, (u32 __user *)arg);
}
2985

2986
#ifdef CONFIG_QUOTA
2987 2988 2989 2990 2991 2992 2993 2994 2995 2996 2997 2998 2999 3000 3001 3002 3003
/*
 * Transfer the inode's project-quota accounting to @kprojid.
 *
 * Returns the result of __dquot_transfer(); on failure the superblock is
 * flagged SBI_QUOTA_NEED_REPAIR. If dqget() itself fails, nothing is
 * transferred and 0 is returned.
 *
 * NOTE(review): a dqget() error is reported as success -- confirm that
 * this is intentional before relying on the return value.
 */
int f2fs_transfer_project_quota(struct inode *inode, kprojid_t kprojid)
{
	struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
	struct dquot *transfer_to[MAXQUOTAS] = {};
	struct dquot *prj_dquot;
	int err;

	prj_dquot = dqget(sbi->sb, make_kqid_projid(kprojid));
	transfer_to[PRJQUOTA] = prj_dquot;
	if (IS_ERR(prj_dquot))
		return 0;

	err = __dquot_transfer(inode, transfer_to);
	if (err)
		set_sbi_flag(sbi, SBI_QUOTA_NEED_REPAIR);
	dqput(prj_dquot);

	return err;
}

3004 3005 3006 3007 3008 3009 3010 3011 3012
/*
 * Assign project id @projid to the file's inode and move its quota usage.
 *
 * Returns 0 on success or when the inode already carries @projid (or, on a
 * filesystem without the project-quota feature, when @projid is
 * F2FS_DEF_PROJID), and otherwise:
 *   -EOPNOTSUPP  no project-quota feature and a non-default id, or the
 *                inode has no extra attribute area
 *   -EPERM       the inode is a quota file (IS_NOQUOTA)
 *   -EOVERFLOW   i_projid does not fit in the inode's extra area
 *   any error from f2fs_get_node_page(), dquot_initialize() or
 *   f2fs_transfer_project_quota().
 */
static int f2fs_ioc_setproject(struct file *filp, __u32 projid)
{
	struct inode *inode = file_inode(filp);
	struct f2fs_inode_info *fi = F2FS_I(inode);
	struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
	struct page *ipage;
	kprojid_t kprojid;
	int err;

	if (!f2fs_sb_has_project_quota(sbi)) {
		if (projid != F2FS_DEF_PROJID)
			return -EOPNOTSUPP;
		return 0;
	}

	if (!f2fs_has_extra_attr(inode))
		return -EOPNOTSUPP;

	kprojid = make_kprojid(&init_user_ns, (projid_t)projid);

	if (projid_eq(kprojid, fi->i_projid))
		return 0;

	/* Is it quota file? Do not allow user to mess with it */
	if (IS_NOQUOTA(inode))
		return -EPERM;

	/* the node page is only needed to check that i_projid fits */
	ipage = f2fs_get_node_page(sbi, inode->i_ino);
	if (IS_ERR(ipage))
		return PTR_ERR(ipage);

	if (!F2FS_FITS_IN_INODE(F2FS_INODE(ipage), fi->i_extra_isize,
								i_projid)) {
		f2fs_put_page(ipage, 1);
		return -EOVERFLOW;
	}
	f2fs_put_page(ipage, 1);

	err = dquot_initialize(inode);
	if (err)
		return err;

	f2fs_lock_op(sbi);
	err = f2fs_transfer_project_quota(inode, kprojid);
	if (err)
		goto out_unlock;

	fi->i_projid = kprojid;
	inode->i_ctime = current_time(inode);
	f2fs_mark_inode_dirty_sync(inode, true);
out_unlock:
	f2fs_unlock_op(sbi);
	return err;
}
#else
3062 3063 3064 3065 3066
/*
 * Variant built when CONFIG_QUOTA is not defined: there is no quota
 * accounting to transfer, so this always reports success.
 */
int f2fs_transfer_project_quota(struct inode *inode, kprojid_t kprojid)
{
	return 0;
}

3067 3068 3069 3070 3071 3072 3073 3074
/*
 * Variant built when CONFIG_QUOTA is not defined: only the default project
 * id is accepted; any other id fails with -EOPNOTSUPP.
 */
static int f2fs_ioc_setproject(struct file *filp, __u32 projid)
{
	return projid == F2FS_DEF_PROJID ? 0 : -EOPNOTSUPP;
}
#endif

3075 3076 3077 3078 3079 3080 3081 3082 3083 3084 3085 3086 3087 3088 3089 3090 3091 3092 3093 3094 3095 3096 3097 3098 3099 3100 3101 3102 3103 3104 3105 3106 3107 3108 3109 3110 3111 3112
/* FS_IOC_FSGETXATTR and FS_IOC_FSSETXATTR support */

/*
 * To make a new on-disk f2fs i_flag gettable via FS_IOC_FSGETXATTR and settable
 * via FS_IOC_FSSETXATTR, add an entry for it to f2fs_xflags_map[], and add its
 * FS_XFLAG_* equivalent to F2FS_SUPPORTED_XFLAGS.
 */

/*
 * Pairs each on-disk f2fs i_flag with its FS_XFLAG_* counterpart; both
 * conversion helpers below iterate over this table.
 */
static const struct {
	u32 iflag;
	u32 xflag;
} f2fs_xflags_map[] = {
	{ .iflag = F2FS_SYNC_FL,	.xflag = FS_XFLAG_SYNC },
	{ .iflag = F2FS_IMMUTABLE_FL,	.xflag = FS_XFLAG_IMMUTABLE },
	{ .iflag = F2FS_APPEND_FL,	.xflag = FS_XFLAG_APPEND },
	{ .iflag = F2FS_NODUMP_FL,	.xflag = FS_XFLAG_NODUMP },
	{ .iflag = F2FS_NOATIME_FL,	.xflag = FS_XFLAG_NOATIME },
	{ .iflag = F2FS_PROJINHERIT_FL,	.xflag = FS_XFLAG_PROJINHERIT },
};

/*
 * Mask of the FS_XFLAG_* bits f2fs accepts from user space;
 * f2fs_ioc_fssetxattr() rejects any bit outside it with -EOPNOTSUPP.
 */
#define F2FS_SUPPORTED_XFLAGS (		\
		FS_XFLAG_SYNC |		\
		FS_XFLAG_IMMUTABLE |	\
		FS_XFLAG_APPEND |	\
		FS_XFLAG_NODUMP |	\
		FS_XFLAG_NOATIME |	\
		FS_XFLAG_PROJINHERIT)

/* Convert f2fs on-disk i_flags to FS_IOC_FS{GET,SET}XATTR flags */
static inline u32 f2fs_iflags_to_xflags(u32 iflags)
{
	u32 xflags = 0;
	int i;

	/*
	 * Walk f2fs_xflags_map[] and OR in the xflag of every entry whose
	 * iflag bit is set in @iflags; bits without a table entry are dropped.
	 */
	for (i = 0; i < ARRAY_SIZE(f2fs_xflags_map); i++)
		if (iflags & f2fs_xflags_map[i].iflag)
			xflags |= f2fs_xflags_map[i].xflag;

	return xflags;
}

3116 3117
/* Convert FS_IOC_FS{GET,SET}XATTR flags to f2fs on-disk i_flags */
static inline u32 f2fs_xflags_to_iflags(u32 xflags)
{
	u32 iflags = 0;
	int i;

	/*
	 * Walk f2fs_xflags_map[] and OR in the iflag of every entry whose
	 * xflag bit is set in @xflags; bits without a table entry are dropped.
	 */
	for (i = 0; i < ARRAY_SIZE(f2fs_xflags_map); i++)
		if (xflags & f2fs_xflags_map[i].xflag)
			iflags |= f2fs_xflags_map[i].iflag;

	return iflags;
}

3129
static void f2fs_fill_fsxattr(struct inode *inode, struct fsxattr *fa)
3130 3131 3132
{
	struct f2fs_inode_info *fi = F2FS_I(inode);

3133
	simple_fill_fsxattr(fa, f2fs_iflags_to_xflags(fi->i_flags));
3134

3135
	if (f2fs_sb_has_project_quota(F2FS_I_SB(inode)))
3136
		fa->fsx_projid = from_kprojid(&init_user_ns, fi->i_projid);
3137 3138
}

3139
static int f2fs_ioc_fsgetxattr(struct file *filp, unsigned long arg)
3140
{
3141 3142
	struct inode *inode = file_inode(filp);
	struct fsxattr fa;
3143

3144
	f2fs_fill_fsxattr(inode, &fa);
3145

3146 3147
	if (copy_to_user((struct fsxattr __user *)arg, &fa, sizeof(fa)))
		return -EFAULT;
3148 3149 3150
	return 0;
}

3151 3152 3153
static int f2fs_ioc_fssetxattr(struct file *filp, unsigned long arg)
{
	struct inode *inode = file_inode(filp);
3154
	struct fsxattr fa, old_fa;
3155
	u32 iflags;
3156 3157 3158 3159 3160 3161 3162 3163 3164
	int err;

	if (copy_from_user(&fa, (struct fsxattr __user *)arg, sizeof(fa)))
		return -EFAULT;

	/* Make sure caller has proper permission */
	if (!inode_owner_or_capable(inode))
		return -EACCES;

3165
	if (fa.fsx_xflags & ~F2FS_SUPPORTED_XFLAGS)
3166 3167
		return -EOPNOTSUPP;

3168 3169
	iflags = f2fs_xflags_to_iflags(fa.fsx_xflags);
	if (f2fs_mask_flags(inode->i_mode, iflags) != iflags)
3170 3171 3172 3173 3174 3175 3176
		return -EOPNOTSUPP;

	err = mnt_want_write_file(filp);
	if (err)
		return err;

	inode_lock(inode);
3177 3178 3179

	f2fs_fill_fsxattr(inode, &old_fa);
	err = vfs_ioc_fssetxattr_check(inode, &old_fa, &fa);
3180 3181
	if (err)
		goto out;
3182

3183 3184
	err = f2fs_setflags_common(inode, iflags,
			f2fs_xflags_to_iflags(F2FS_SUPPORTED_XFLAGS));
3185
	if (err)
3186
		goto out;
3187 3188

	err = f2fs_ioc_setproject(filp, fa.fsx_projid);
3189 3190 3191 3192
out:
	inode_unlock(inode);
	mnt_drop_write_file(filp);
	return err;
3193
}
3194

3195 3196 3197 3198 3199 3200 3201
/*
 * Account a GC failure against a pinned file and drop the pin once the
 * failure count exceeds the superblock's gc_pin_file_threshold.
 *
 * @inc: when true, bump i_gc_failures[GC_FAILURE_PIN] before the check.
 *
 * Returns 0 while the count is within the threshold; otherwise clears
 * FI_PIN_FILE, logs a warning and returns -EAGAIN.
 */
int f2fs_pin_file_control(struct inode *inode, bool inc)
{
	struct f2fs_inode_info *fi = F2FS_I(inode);
	struct f2fs_sb_info *sbi = F2FS_I_SB(inode);

	/* Use i_gc_failures for normal file as a risk signal. */
	if (inc)
		f2fs_i_gc_failures_write(inode,
				fi->i_gc_failures[GC_FAILURE_PIN] + 1);

	if (fi->i_gc_failures[GC_FAILURE_PIN] > sbi->gc_pin_file_threshold) {
		f2fs_warn(sbi, "%s: Enable GC = ino %lx after %x GC trials",
			  __func__, inode->i_ino,
			  fi->i_gc_failures[GC_FAILURE_PIN]);
		clear_inode_flag(inode, FI_PIN_FILE);
		return -EAGAIN;
	}
	return 0;
}

static int f2fs_ioc_set_pin_file(struct file *filp, unsigned long arg)
{
	struct inode *inode = file_inode(filp);
	__u32 pin;
	int ret = 0;

	if (get_user(pin, (__u32 __user *)arg))
		return -EFAULT;

	if (!S_ISREG(inode->i_mode))
		return -EINVAL;

	if (f2fs_readonly(F2FS_I_SB(inode)->sb))
		return -EROFS;

	ret = mnt_want_write_file(filp);
	if (ret)
		return ret;

	inode_lock(inode);

C
Chao Yu 已提交
3236
	if (f2fs_should_update_outplace(inode, NULL)) {
C
Chao Yu 已提交
3237 3238 3239 3240
		ret = -EINVAL;
		goto out;
	}

3241 3242
	if (!pin) {
		clear_inode_flag(inode, FI_PIN_FILE);
3243
		f2fs_i_gc_failures_write(inode, 0);
3244 3245 3246 3247 3248 3249 3250
		goto done;
	}

	if (f2fs_pin_file_control(inode, false)) {
		ret = -EAGAIN;
		goto out;
	}
C
Chao Yu 已提交
3251

3252 3253 3254 3255
	ret = f2fs_convert_inline_inode(inode);
	if (ret)
		goto out;

3256
	if (!f2fs_disable_compressed_file(inode)) {
C
Chao Yu 已提交
3257 3258 3259 3260
		ret = -EOPNOTSUPP;
		goto out;
	}

3261
	set_inode_flag(inode, FI_PIN_FILE);
3262
	ret = F2FS_I(inode)->i_gc_failures[GC_FAILURE_PIN];
3263 3264 3265 3266 3267 3268 3269 3270 3271 3272 3273 3274 3275 3276
done:
	f2fs_update_time(F2FS_I_SB(inode), REQ_TIME);
out:
	inode_unlock(inode);
	mnt_drop_write_file(filp);
	return ret;
}

static int f2fs_ioc_get_pin_file(struct file *filp, unsigned long arg)
{
	struct inode *inode = file_inode(filp);
	__u32 pin = 0;

	if (is_inode_flag_set(inode, FI_PIN_FILE))
3277
		pin = F2FS_I(inode)->i_gc_failures[GC_FAILURE_PIN];
3278 3279 3280
	return put_user(pin, (u32 __user *)arg);
}

3281 3282 3283 3284 3285 3286 3287 3288 3289 3290 3291 3292 3293 3294 3295
int f2fs_precache_extents(struct inode *inode)
{
	struct f2fs_inode_info *fi = F2FS_I(inode);
	struct f2fs_map_blocks map;
	pgoff_t m_next_extent;
	loff_t end;
	int err;

	if (is_inode_flag_set(inode, FI_NO_EXTENT))
		return -EOPNOTSUPP;

	map.m_lblk = 0;
	map.m_next_pgofs = NULL;
	map.m_next_extent = &m_next_extent;
	map.m_seg_type = NO_CHECK_TYPE;
3296
	map.m_may_create = false;
3297 3298 3299 3300 3301
	end = F2FS_I_SB(inode)->max_file_blocks;

	while (map.m_lblk < end) {
		map.m_len = end - map.m_lblk;

C
Chao Yu 已提交
3302
		down_write(&fi->i_gc_rwsem[WRITE]);
3303
		err = f2fs_map_blocks(inode, &map, 0, F2FS_GET_BLOCK_PRECACHE);
C
Chao Yu 已提交
3304
		up_write(&fi->i_gc_rwsem[WRITE]);
3305 3306 3307 3308 3309 3310 3311 3312 3313 3314 3315 3316 3317 3318
		if (err)
			return err;

		map.m_lblk = m_next_extent;
	}

	return err;
}

/* F2FS_IOC_PRECACHE_EXTENTS handler: @arg is unused. */
static int f2fs_ioc_precache_extents(struct file *filp, unsigned long arg)
{
	struct inode *inode = file_inode(filp);

	return f2fs_precache_extents(inode);
}

3319 3320 3321 3322 3323 3324 3325 3326 3327 3328 3329 3330 3331 3332 3333
/*
 * F2FS_IOC_RESIZE_FS handler: read the requested block count (a __u64) from
 * @arg and hand it to f2fs_resize_fs().
 *
 * Returns -EPERM without CAP_SYS_ADMIN, -EROFS on a read-only filesystem,
 * -EFAULT if the argument cannot be read, otherwise f2fs_resize_fs()'s result.
 */
static int f2fs_ioc_resize_fs(struct file *filp, unsigned long arg)
{
	struct f2fs_sb_info *sbi = F2FS_I_SB(file_inode(filp));
	__u64 block_count;

	if (!capable(CAP_SYS_ADMIN))
		return -EPERM;

	if (f2fs_readonly(sbi->sb))
		return -EROFS;

	if (copy_from_user(&block_count, (void __user *)arg,
			   sizeof(block_count)))
		return -EFAULT;

	return f2fs_resize_fs(sbi, block_count);
}

E
Eric Biggers 已提交
3337 3338 3339 3340 3341 3342 3343 3344 3345 3346 3347 3348 3349 3350 3351 3352 3353 3354 3355 3356 3357 3358 3359 3360
/*
 * FS_IOC_ENABLE_VERITY handler: refresh REQ_TIME, then forward to
 * fsverity_ioctl_enable() if the filesystem has the verity feature; otherwise
 * warn and return -EOPNOTSUPP.
 */
static int f2fs_ioc_enable_verity(struct file *filp, unsigned long arg)
{
	struct inode *inode = file_inode(filp);
	struct f2fs_sb_info *sbi = F2FS_I_SB(inode);

	f2fs_update_time(sbi, REQ_TIME);

	if (f2fs_sb_has_verity(sbi))
		return fsverity_ioctl_enable(filp, (const void __user *)arg);

	f2fs_warn(sbi,
		  "Can't enable fs-verity on inode %lu: the verity feature is not enabled on this filesystem.\n",
		  inode->i_ino);
	return -EOPNOTSUPP;
}

/*
 * FS_IOC_MEASURE_VERITY handler: forward to fsverity_ioctl_measure() when the
 * filesystem has the verity feature, else return -EOPNOTSUPP.
 */
static int f2fs_ioc_measure_verity(struct file *filp, unsigned long arg)
{
	struct f2fs_sb_info *sbi = F2FS_I_SB(file_inode(filp));

	if (f2fs_sb_has_verity(sbi))
		return fsverity_ioctl_measure(filp, (void __user *)arg);

	return -EOPNOTSUPP;
}

3361
static int f2fs_ioc_getfslabel(struct file *filp, unsigned long arg)
C
Chao Yu 已提交
3362 3363 3364 3365 3366 3367 3368 3369 3370 3371 3372 3373 3374 3375 3376 3377 3378 3379 3380 3381 3382
{
	struct inode *inode = file_inode(filp);
	struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
	char *vbuf;
	int count;
	int err = 0;

	vbuf = f2fs_kzalloc(sbi, MAX_VOLUME_NAME, GFP_KERNEL);
	if (!vbuf)
		return -ENOMEM;

	down_read(&sbi->sb_lock);
	count = utf16s_to_utf8s(sbi->raw_super->volume_name,
			ARRAY_SIZE(sbi->raw_super->volume_name),
			UTF16_LITTLE_ENDIAN, vbuf, MAX_VOLUME_NAME);
	up_read(&sbi->sb_lock);

	if (copy_to_user((char __user *)arg, vbuf,
				min(FSLABEL_MAX, count)))
		err = -EFAULT;

C
Chao Yu 已提交
3383
	kfree(vbuf);
C
Chao Yu 已提交
3384 3385 3386
	return err;
}

3387
static int f2fs_ioc_setfslabel(struct file *filp, unsigned long arg)
C
Chao Yu 已提交
3388 3389 3390 3391 3392 3393 3394 3395 3396 3397 3398 3399 3400 3401 3402 3403 3404 3405 3406 3407 3408 3409 3410 3411 3412 3413 3414 3415 3416 3417 3418 3419 3420 3421 3422
{
	struct inode *inode = file_inode(filp);
	struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
	char *vbuf;
	int err = 0;

	if (!capable(CAP_SYS_ADMIN))
		return -EPERM;

	vbuf = strndup_user((const char __user *)arg, FSLABEL_MAX);
	if (IS_ERR(vbuf))
		return PTR_ERR(vbuf);

	err = mnt_want_write_file(filp);
	if (err)
		goto out;

	down_write(&sbi->sb_lock);

	memset(sbi->raw_super->volume_name, 0,
			sizeof(sbi->raw_super->volume_name));
	utf8s_to_utf16s(vbuf, strlen(vbuf), UTF16_LITTLE_ENDIAN,
			sbi->raw_super->volume_name,
			ARRAY_SIZE(sbi->raw_super->volume_name));

	err = f2fs_commit_super(sbi, false);

	up_write(&sbi->sb_lock);

	mnt_drop_write_file(filp);
out:
	kfree(vbuf);
	return err;
}

3423 3424 3425 3426 3427 3428 3429 3430 3431 3432 3433
static int f2fs_get_compress_blocks(struct file *filp, unsigned long arg)
{
	struct inode *inode = file_inode(filp);
	__u64 blocks;

	if (!f2fs_sb_has_compression(F2FS_I_SB(inode)))
		return -EOPNOTSUPP;

	if (!f2fs_compressed_file(inode))
		return -EINVAL;

3434
	blocks = atomic_read(&F2FS_I(inode)->i_compr_blocks);
3435 3436 3437
	return put_user(blocks, (u64 __user *)arg);
}

3438 3439 3440 3441 3442 3443 3444 3445 3446 3447 3448 3449 3450 3451 3452 3453 3454 3455 3456 3457 3458 3459 3460 3461 3462 3463 3464 3465 3466 3467 3468 3469 3470 3471 3472 3473 3474 3475 3476 3477 3478 3479 3480 3481 3482 3483 3484 3485 3486 3487 3488 3489 3490 3491 3492 3493 3494 3495 3496 3497 3498 3499 3500 3501 3502 3503 3504 3505 3506 3507 3508 3509 3510 3511 3512 3513 3514 3515 3516 3517 3518
/*
 * Walk @count block slots of the dnode in @dn, starting at dn->ofs_in_node,
 * one cluster (i_cluster_size slots) at a time, and give back the blocks a
 * compressed cluster holds beyond its valid data blocks.
 *
 * dn->ofs_in_node is advanced past every cluster that is visited.
 *
 * Returns the number of blocks released, or -EFSCORRUPTED if any slot holds
 * an address that looks valid but fails f2fs_is_valid_blkaddr().
 */
static int release_compress_blocks(struct dnode_of_data *dn, pgoff_t count)
{
	struct f2fs_sb_info *sbi = F2FS_I_SB(dn->inode);
	unsigned int released_blocks = 0;
	int cluster_size = F2FS_I(dn->inode)->i_cluster_size;
	block_t blkaddr;
	int i;

	/* First pass: validate every address before anything is modified. */
	for (i = 0; i < count; i++) {
		blkaddr = data_blkaddr(dn->inode, dn->node_page,
						dn->ofs_in_node + i);

		if (!__is_valid_data_blkaddr(blkaddr))
			continue;
		if (unlikely(!f2fs_is_valid_blkaddr(sbi, blkaddr,
					DATA_GENERIC_ENHANCE)))
			return -EFSCORRUPTED;
	}

	/* Second pass: process one cluster per iteration. */
	while (count) {
		int compr_blocks = 0;

		for (i = 0; i < cluster_size; i++, dn->ofs_in_node++) {
			blkaddr = f2fs_data_blkaddr(dn);

			if (i == 0) {
				/* Only clusters headed by COMPRESS_ADDR are handled. */
				if (blkaddr == COMPRESS_ADDR)
					continue;
				/* Otherwise skip the whole cluster untouched. */
				dn->ofs_in_node += cluster_size;
				goto next;
			}

			if (__is_valid_data_blkaddr(blkaddr))
				compr_blocks++;

			if (blkaddr != NEW_ADDR)
				continue;

			/* Turn a NEW_ADDR slot into NULL_ADDR. */
			dn->data_blkaddr = NULL_ADDR;
			f2fs_set_data_blkaddr(dn);
		}

		f2fs_i_compr_blocks_update(dn->inode, compr_blocks, false);
		dec_valid_block_count(sbi, dn->inode,
					cluster_size - compr_blocks);

		released_blocks += cluster_size - compr_blocks;
next:
		/* NOTE(review): assumes the caller passes @count as a multiple of cluster_size. */
		count -= cluster_size;
	}

	return released_blocks;
}

static int f2fs_release_compress_blocks(struct file *filp, unsigned long arg)
{
	struct inode *inode = file_inode(filp);
	struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
	pgoff_t page_idx = 0, last_idx;
	unsigned int released_blocks = 0;
	int ret;
	int writecount;

	if (!f2fs_sb_has_compression(F2FS_I_SB(inode)))
		return -EOPNOTSUPP;

	if (!f2fs_compressed_file(inode))
		return -EINVAL;

	if (f2fs_readonly(sbi->sb))
		return -EROFS;

	ret = mnt_want_write_file(filp);
	if (ret)
		return ret;

	f2fs_balance_fs(F2FS_I_SB(inode), true);

	inode_lock(inode);

	writecount = atomic_read(&inode->i_writecount);
3519 3520
	if ((filp->f_mode & FMODE_WRITE && writecount != 1) ||
			(!(filp->f_mode & FMODE_WRITE) && writecount)) {
3521 3522 3523 3524 3525 3526 3527 3528 3529 3530 3531 3532 3533 3534 3535 3536 3537 3538
		ret = -EBUSY;
		goto out;
	}

	if (IS_IMMUTABLE(inode)) {
		ret = -EINVAL;
		goto out;
	}

	ret = filemap_write_and_wait_range(inode->i_mapping, 0, LLONG_MAX);
	if (ret)
		goto out;

	F2FS_I(inode)->i_flags |= F2FS_IMMUTABLE_FL;
	f2fs_set_inode_flags(inode);
	inode->i_ctime = current_time(inode);
	f2fs_mark_inode_dirty_sync(inode, true);

3539
	if (!atomic_read(&F2FS_I(inode)->i_compr_blocks))
3540 3541
		goto out;

3542 3543 3544 3545 3546 3547 3548 3549 3550 3551 3552 3553 3554 3555 3556 3557 3558 3559 3560 3561 3562 3563 3564
	down_write(&F2FS_I(inode)->i_gc_rwsem[WRITE]);
	down_write(&F2FS_I(inode)->i_mmap_sem);

	last_idx = DIV_ROUND_UP(i_size_read(inode), PAGE_SIZE);

	while (page_idx < last_idx) {
		struct dnode_of_data dn;
		pgoff_t end_offset, count;

		set_new_dnode(&dn, inode, NULL, NULL, 0);
		ret = f2fs_get_dnode_of_data(&dn, page_idx, LOOKUP_NODE);
		if (ret) {
			if (ret == -ENOENT) {
				page_idx = f2fs_get_next_page_offset(&dn,
								page_idx);
				ret = 0;
				continue;
			}
			break;
		}

		end_offset = ADDRS_PER_PAGE(dn.node_page, inode);
		count = min(end_offset - dn.ofs_in_node, last_idx - page_idx);
3565
		count = round_up(count, F2FS_I(inode)->i_cluster_size);
3566 3567 3568 3569 3570 3571 3572 3573 3574 3575 3576 3577 3578 3579 3580 3581 3582 3583 3584 3585 3586

		ret = release_compress_blocks(&dn, count);

		f2fs_put_dnode(&dn);

		if (ret < 0)
			break;

		page_idx += count;
		released_blocks += ret;
	}

	up_write(&F2FS_I(inode)->i_gc_rwsem[WRITE]);
	up_write(&F2FS_I(inode)->i_mmap_sem);
out:
	inode_unlock(inode);

	mnt_drop_write_file(filp);

	if (ret >= 0) {
		ret = put_user(released_blocks, (u64 __user *)arg);
3587 3588
	} else if (released_blocks &&
			atomic_read(&F2FS_I(inode)->i_compr_blocks)) {
3589 3590
		set_sbi_flag(sbi, SBI_NEED_FSCK);
		f2fs_warn(sbi, "%s: partial blocks were released i_ino=%lx "
3591
			"iblocks=%llu, released=%u, compr_blocks=%u, "
3592 3593 3594
			"run fsck to fix.",
			__func__, inode->i_ino, inode->i_blocks,
			released_blocks,
3595
			atomic_read(&F2FS_I(inode)->i_compr_blocks));
3596 3597 3598 3599 3600
	}

	return ret;
}

3601 3602 3603 3604 3605 3606 3607 3608 3609 3610 3611 3612 3613 3614 3615 3616 3617 3618 3619 3620 3621 3622 3623 3624 3625 3626 3627 3628 3629 3630 3631 3632 3633 3634 3635 3636 3637 3638 3639 3640 3641 3642 3643 3644 3645 3646 3647 3648 3649 3650 3651 3652 3653 3654 3655 3656 3657 3658 3659 3660 3661 3662 3663 3664 3665 3666 3667 3668 3669 3670 3671 3672 3673 3674 3675 3676 3677 3678 3679 3680 3681 3682
/*
 * Walk @count block slots of the dnode in @dn, starting at dn->ofs_in_node,
 * one cluster (i_cluster_size slots) at a time, and reserve blocks for every
 * slot of a compressed cluster that does not hold a valid data address.
 *
 * dn->ofs_in_node is advanced past every cluster that is visited.
 *
 * Returns the number of blocks reserved, -EFSCORRUPTED if a slot holds an
 * address that looks valid but fails f2fs_is_valid_blkaddr(), the error from
 * inc_valid_block_count(), or -ENOSPC if fewer blocks than requested were
 * granted.
 */
static int reserve_compress_blocks(struct dnode_of_data *dn, pgoff_t count)
{
	struct f2fs_sb_info *sbi = F2FS_I_SB(dn->inode);
	unsigned int reserved_blocks = 0;
	int cluster_size = F2FS_I(dn->inode)->i_cluster_size;
	block_t blkaddr;
	int i;

	/* First pass: validate every address before anything is modified. */
	for (i = 0; i < count; i++) {
		blkaddr = data_blkaddr(dn->inode, dn->node_page,
						dn->ofs_in_node + i);

		if (!__is_valid_data_blkaddr(blkaddr))
			continue;
		if (unlikely(!f2fs_is_valid_blkaddr(sbi, blkaddr,
					DATA_GENERIC_ENHANCE)))
			return -EFSCORRUPTED;
	}

	/* Second pass: process one cluster per iteration. */
	while (count) {
		int compr_blocks = 0;
		blkcnt_t reserved;
		int ret;

		for (i = 0; i < cluster_size; i++, dn->ofs_in_node++) {
			blkaddr = f2fs_data_blkaddr(dn);

			if (i == 0) {
				/* Only clusters headed by COMPRESS_ADDR are handled. */
				if (blkaddr == COMPRESS_ADDR)
					continue;
				/* Otherwise skip the whole cluster untouched. */
				dn->ofs_in_node += cluster_size;
				goto next;
			}

			if (__is_valid_data_blkaddr(blkaddr)) {
				compr_blocks++;
				continue;
			}

			/* Mark every remaining slot as NEW_ADDR. */
			dn->data_blkaddr = NEW_ADDR;
			f2fs_set_data_blkaddr(dn);
		}

		reserved = cluster_size - compr_blocks;
		ret = inc_valid_block_count(sbi, dn->inode, &reserved);
		if (ret)
			return ret;

		/* inc_valid_block_count() may grant less than was asked for. */
		if (reserved != cluster_size - compr_blocks)
			return -ENOSPC;

		f2fs_i_compr_blocks_update(dn->inode, compr_blocks, true);

		reserved_blocks += reserved;
next:
		/* NOTE(review): assumes the caller passes @count as a multiple of cluster_size. */
		count -= cluster_size;
	}

	return reserved_blocks;
}

/*
 * F2FS_IOC_RESERVE_COMPRESS_BLOCKS handler: re-reserve blocks for the
 * compressed clusters of an immutable compressed file, clear the immutable
 * flag on success, and report the number of reserved blocks through @arg.
 *
 * Returns put_user()'s result on success (0 blocks are reported when the
 * inode already has compressed blocks accounted).  Errors: -EOPNOTSUPP (no
 * compression feature), -EINVAL (file not compressed, or not immutable),
 * -EROFS, or the error of a helper.  If the walk fails after some blocks
 * were already reserved and the inode has compressed blocks, SBI_NEED_FSCK
 * is set and a warning is logged.
 */
static int f2fs_reserve_compress_blocks(struct file *filp, unsigned long arg)
{
	struct inode *inode = file_inode(filp);
	struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
	pgoff_t page_idx = 0, last_idx;
	unsigned int reserved_blocks = 0;
	int ret;

	if (!f2fs_sb_has_compression(F2FS_I_SB(inode)))
		return -EOPNOTSUPP;

	if (!f2fs_compressed_file(inode))
		return -EINVAL;

	if (f2fs_readonly(sbi->sb))
		return -EROFS;

	ret = mnt_want_write_file(filp);
	if (ret)
		return ret;

	/* ret is 0 here, so this path reports zero reserved blocks. */
	if (atomic_read(&F2FS_I(inode)->i_compr_blocks))
		goto out;

	f2fs_balance_fs(F2FS_I_SB(inode), true);

	inode_lock(inode);

	if (!IS_IMMUTABLE(inode)) {
		ret = -EINVAL;
		goto unlock_inode;
	}

	down_write(&F2FS_I(inode)->i_gc_rwsem[WRITE]);
	down_write(&F2FS_I(inode)->i_mmap_sem);

	last_idx = DIV_ROUND_UP(i_size_read(inode), PAGE_SIZE);

	while (page_idx < last_idx) {
		struct dnode_of_data dn;
		pgoff_t end_offset, count;

		set_new_dnode(&dn, inode, NULL, NULL, 0);
		ret = f2fs_get_dnode_of_data(&dn, page_idx, LOOKUP_NODE);
		if (ret) {
			if (ret == -ENOENT) {
				/* Hole: jump to the next mapped offset. */
				page_idx = f2fs_get_next_page_offset(&dn,
								page_idx);
				ret = 0;
				continue;
			}
			break;
		}

		/* Stay inside this dnode, rounded up to whole clusters. */
		end_offset = ADDRS_PER_PAGE(dn.node_page, inode);
		count = min(end_offset - dn.ofs_in_node, last_idx - page_idx);
		count = round_up(count, F2FS_I(inode)->i_cluster_size);

		ret = reserve_compress_blocks(&dn, count);

		f2fs_put_dnode(&dn);

		if (ret < 0)
			break;

		page_idx += count;
		reserved_blocks += ret;
	}

	up_write(&F2FS_I(inode)->i_gc_rwsem[WRITE]);
	up_write(&F2FS_I(inode)->i_mmap_sem);

	if (ret >= 0) {
		F2FS_I(inode)->i_flags &= ~F2FS_IMMUTABLE_FL;
		f2fs_set_inode_flags(inode);
		inode->i_ctime = current_time(inode);
		f2fs_mark_inode_dirty_sync(inode, true);
	}
unlock_inode:
	inode_unlock(inode);
out:
	mnt_drop_write_file(filp);

	if (ret >= 0) {
		ret = put_user(reserved_blocks, (u64 __user *)arg);
	} else if (reserved_blocks &&
			atomic_read(&F2FS_I(inode)->i_compr_blocks)) {
		set_sbi_flag(sbi, SBI_NEED_FSCK);
		/* This is the reserve path: the message must not say "released". */
		f2fs_warn(sbi, "%s: partial blocks were reserved i_ino=%lx "
			"iblocks=%llu, reserved=%u, compr_blocks=%u, "
			"run fsck to fix.",
			__func__, inode->i_ino, inode->i_blocks,
			reserved_blocks,
			atomic_read(&F2FS_I(inode)->i_compr_blocks));
	}

	return ret;
}

3761 3762 3763 3764 3765 3766 3767 3768 3769 3770 3771 3772 3773 3774 3775 3776 3777 3778 3779 3780 3781 3782 3783 3784 3785 3786 3787 3788 3789 3790 3791 3792 3793 3794 3795 3796 3797 3798 3799 3800 3801 3802 3803 3804 3805 3806 3807 3808 3809 3810 3811 3812 3813 3814 3815 3816 3817 3818 3819 3820 3821 3822 3823 3824 3825 3826 3827 3828 3829 3830 3831 3832 3833 3834 3835 3836 3837 3838 3839 3840 3841 3842 3843 3844 3845 3846 3847 3848 3849 3850 3851 3852 3853 3854 3855 3856 3857 3858 3859 3860 3861 3862 3863 3864 3865 3866 3867 3868 3869 3870 3871 3872 3873 3874 3875 3876 3877 3878 3879 3880 3881 3882 3883 3884 3885 3886 3887 3888 3889 3890 3891 3892 3893 3894 3895 3896 3897 3898 3899 3900 3901 3902 3903 3904 3905 3906 3907 3908 3909 3910 3911 3912 3913 3914 3915 3916 3917 3918 3919 3920 3921 3922 3923 3924 3925 3926 3927 3928 3929 3930 3931 3932 3933 3934 3935 3936 3937 3938 3939 3940 3941 3942 3943 3944 3945 3946 3947
/*
 * Erase @len blocks starting at device block @block on @bdev, as selected by
 * @flags: F2FS_TRIM_FILE_DISCARD issues a discard (a secure one when the
 * queue supports secure erase), F2FS_TRIM_FILE_ZEROOUT then zeroes the range
 * (through fscrypt for encrypted inodes, where @off is the file offset).
 * Zeroing is skipped if the discard failed.
 *
 * Returns 0 on success, -ENXIO if the device has no request queue, or the
 * error of the failing step.
 */
static int f2fs_secure_erase(struct block_device *bdev, struct inode *inode,
		pgoff_t off, block_t block, block_t len, u32 flags)
{
	struct request_queue *q = bdev_get_queue(bdev);
	sector_t sector = SECTOR_FROM_BLOCK(block);
	sector_t nr_sects = SECTOR_FROM_BLOCK(len);

	if (!q)
		return -ENXIO;

	if (flags & F2FS_TRIM_FILE_DISCARD) {
		int err = blkdev_issue_discard(bdev, sector, nr_sects, GFP_NOFS,
						blk_queue_secure_erase(q) ?
						BLKDEV_DISCARD_SECURE : 0);

		if (err)
			return err;
	}

	if (!(flags & F2FS_TRIM_FILE_ZEROOUT))
		return 0;

	if (IS_ENCRYPTED(inode))
		return fscrypt_zeroout_range(inode, off, block, len);

	return blkdev_issue_zeroout(bdev, sector, nr_sects, GFP_NOFS, 0);
}

static int f2fs_sec_trim_file(struct file *filp, unsigned long arg)
{
	struct inode *inode = file_inode(filp);
	struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
	struct address_space *mapping = inode->i_mapping;
	struct block_device *prev_bdev = NULL;
	struct f2fs_sectrim_range range;
	pgoff_t index, pg_end, prev_index = 0;
	block_t prev_block = 0, len = 0;
	loff_t end_addr;
	bool to_end = false;
	int ret = 0;

	if (!(filp->f_mode & FMODE_WRITE))
		return -EBADF;

	if (copy_from_user(&range, (struct f2fs_sectrim_range __user *)arg,
				sizeof(range)))
		return -EFAULT;

	if (range.flags == 0 || (range.flags & ~F2FS_TRIM_FILE_MASK) ||
			!S_ISREG(inode->i_mode))
		return -EINVAL;

	if (((range.flags & F2FS_TRIM_FILE_DISCARD) &&
			!f2fs_hw_support_discard(sbi)) ||
			((range.flags & F2FS_TRIM_FILE_ZEROOUT) &&
			 IS_ENCRYPTED(inode) && f2fs_is_multi_device(sbi)))
		return -EOPNOTSUPP;

	file_start_write(filp);
	inode_lock(inode);

	if (f2fs_is_atomic_file(inode) || f2fs_compressed_file(inode) ||
			range.start >= inode->i_size) {
		ret = -EINVAL;
		goto err;
	}

	if (range.len == 0)
		goto err;

	if (inode->i_size - range.start > range.len) {
		end_addr = range.start + range.len;
	} else {
		end_addr = range.len == (u64)-1 ?
			sbi->sb->s_maxbytes : inode->i_size;
		to_end = true;
	}

	if (!IS_ALIGNED(range.start, F2FS_BLKSIZE) ||
			(!to_end && !IS_ALIGNED(end_addr, F2FS_BLKSIZE))) {
		ret = -EINVAL;
		goto err;
	}

	index = F2FS_BYTES_TO_BLK(range.start);
	pg_end = DIV_ROUND_UP(end_addr, F2FS_BLKSIZE);

	ret = f2fs_convert_inline_inode(inode);
	if (ret)
		goto err;

	down_write(&F2FS_I(inode)->i_gc_rwsem[WRITE]);
	down_write(&F2FS_I(inode)->i_mmap_sem);

	ret = filemap_write_and_wait_range(mapping, range.start,
			to_end ? LLONG_MAX : end_addr - 1);
	if (ret)
		goto out;

	truncate_inode_pages_range(mapping, range.start,
			to_end ? -1 : end_addr - 1);

	while (index < pg_end) {
		struct dnode_of_data dn;
		pgoff_t end_offset, count;
		int i;

		set_new_dnode(&dn, inode, NULL, NULL, 0);
		ret = f2fs_get_dnode_of_data(&dn, index, LOOKUP_NODE);
		if (ret) {
			if (ret == -ENOENT) {
				index = f2fs_get_next_page_offset(&dn, index);
				continue;
			}
			goto out;
		}

		end_offset = ADDRS_PER_PAGE(dn.node_page, inode);
		count = min(end_offset - dn.ofs_in_node, pg_end - index);
		for (i = 0; i < count; i++, index++, dn.ofs_in_node++) {
			struct block_device *cur_bdev;
			block_t blkaddr = f2fs_data_blkaddr(&dn);

			if (!__is_valid_data_blkaddr(blkaddr))
				continue;

			if (!f2fs_is_valid_blkaddr(sbi, blkaddr,
						DATA_GENERIC_ENHANCE)) {
				ret = -EFSCORRUPTED;
				f2fs_put_dnode(&dn);
				goto out;
			}

			cur_bdev = f2fs_target_device(sbi, blkaddr, NULL);
			if (f2fs_is_multi_device(sbi)) {
				int di = f2fs_target_device_index(sbi, blkaddr);

				blkaddr -= FDEV(di).start_blk;
			}

			if (len) {
				if (prev_bdev == cur_bdev &&
						index == prev_index + len &&
						blkaddr == prev_block + len) {
					len++;
				} else {
					ret = f2fs_secure_erase(prev_bdev,
						inode, prev_index, prev_block,
						len, range.flags);
					if (ret) {
						f2fs_put_dnode(&dn);
						goto out;
					}

					len = 0;
				}
			}

			if (!len) {
				prev_bdev = cur_bdev;
				prev_index = index;
				prev_block = blkaddr;
				len = 1;
			}
		}

		f2fs_put_dnode(&dn);

		if (fatal_signal_pending(current)) {
			ret = -EINTR;
			goto out;
		}
		cond_resched();
	}

	if (len)
		ret = f2fs_secure_erase(prev_bdev, inode, prev_index,
				prev_block, len, range.flags);
out:
	up_write(&F2FS_I(inode)->i_mmap_sem);
	up_write(&F2FS_I(inode)->i_gc_rwsem[WRITE]);
err:
	inode_unlock(inode);
	file_end_write(filp);

	return ret;
}

3948 3949 3950 3951 3952 3953 3954 3955 3956 3957 3958 3959 3960 3961 3962 3963 3964 3965 3966 3967 3968 3969 3970 3971 3972 3973 3974
/*
 * F2FS_IOC_GET_COMPRESS_OPTION handler: copy the inode's compression
 * algorithm and log cluster size to the struct f2fs_comp_option at @arg.
 * Both values are sampled under the shared inode lock.
 *
 * Returns 0 on success, -EOPNOTSUPP when the filesystem lacks the
 * compression feature, -ENODATA when the file is not compressed, or -EFAULT
 * if the copy to user space fails.
 */
static int f2fs_ioc_get_compress_option(struct file *filp, unsigned long arg)
{
	struct inode *inode = file_inode(filp);
	struct f2fs_comp_option option;
	int err = 0;

	if (!f2fs_sb_has_compression(F2FS_I_SB(inode)))
		return -EOPNOTSUPP;

	inode_lock_shared(inode);
	if (f2fs_compressed_file(inode)) {
		option.algorithm = F2FS_I(inode)->i_compress_algorithm;
		option.log_cluster_size = F2FS_I(inode)->i_log_cluster_size;
	} else {
		err = -ENODATA;
	}
	inode_unlock_shared(inode);

	if (err)
		return err;

	if (copy_to_user((struct f2fs_comp_option __user *)arg, &option,
				sizeof(option)))
		return -EFAULT;

	return 0;
}

3975 3976
long f2fs_ioctl(struct file *filp, unsigned int cmd, unsigned long arg)
{
3977 3978
	if (unlikely(f2fs_cp_error(F2FS_I_SB(file_inode(filp)))))
		return -EIO;
3979 3980
	if (!f2fs_is_checkpoint_ready(F2FS_I_SB(file_inode(filp))))
		return -ENOSPC;
3981

3982
	switch (cmd) {
3983
	case FS_IOC_GETFLAGS:
3984
		return f2fs_ioc_getflags(filp, arg);
3985
	case FS_IOC_SETFLAGS:
3986
		return f2fs_ioc_setflags(filp, arg);
3987
	case FS_IOC_GETVERSION:
C
Chao Yu 已提交
3988
		return f2fs_ioc_getversion(filp, arg);
J
Jaegeuk Kim 已提交
3989 3990 3991 3992
	case F2FS_IOC_START_ATOMIC_WRITE:
		return f2fs_ioc_start_atomic_write(filp);
	case F2FS_IOC_COMMIT_ATOMIC_WRITE:
		return f2fs_ioc_commit_atomic_write(filp);
3993 3994
	case F2FS_IOC_START_VOLATILE_WRITE:
		return f2fs_ioc_start_volatile_write(filp);
3995 3996 3997 3998
	case F2FS_IOC_RELEASE_VOLATILE_WRITE:
		return f2fs_ioc_release_volatile_write(filp);
	case F2FS_IOC_ABORT_VOLATILE_WRITE:
		return f2fs_ioc_abort_volatile_write(filp);
J
Jaegeuk Kim 已提交
3999 4000
	case F2FS_IOC_SHUTDOWN:
		return f2fs_ioc_shutdown(filp, arg);
4001 4002
	case FITRIM:
		return f2fs_ioc_fitrim(filp, arg);
4003
	case FS_IOC_SET_ENCRYPTION_POLICY:
4004
		return f2fs_ioc_set_encryption_policy(filp, arg);
4005
	case FS_IOC_GET_ENCRYPTION_POLICY:
4006
		return f2fs_ioc_get_encryption_policy(filp, arg);
4007
	case FS_IOC_GET_ENCRYPTION_PWSALT:
4008
		return f2fs_ioc_get_encryption_pwsalt(filp, arg);
E
Eric Biggers 已提交
4009 4010 4011 4012 4013 4014 4015 4016 4017 4018
	case FS_IOC_GET_ENCRYPTION_POLICY_EX:
		return f2fs_ioc_get_encryption_policy_ex(filp, arg);
	case FS_IOC_ADD_ENCRYPTION_KEY:
		return f2fs_ioc_add_encryption_key(filp, arg);
	case FS_IOC_REMOVE_ENCRYPTION_KEY:
		return f2fs_ioc_remove_encryption_key(filp, arg);
	case FS_IOC_REMOVE_ENCRYPTION_KEY_ALL_USERS:
		return f2fs_ioc_remove_encryption_key_all_users(filp, arg);
	case FS_IOC_GET_ENCRYPTION_KEY_STATUS:
		return f2fs_ioc_get_encryption_key_status(filp, arg);
4019 4020
	case FS_IOC_GET_ENCRYPTION_NONCE:
		return f2fs_ioc_get_encryption_nonce(filp, arg);
4021 4022
	case F2FS_IOC_GARBAGE_COLLECT:
		return f2fs_ioc_gc(filp, arg);
4023 4024
	case F2FS_IOC_GARBAGE_COLLECT_RANGE:
		return f2fs_ioc_gc_range(filp, arg);
4025
	case F2FS_IOC_WRITE_CHECKPOINT:
C
Chao Yu 已提交
4026
		return f2fs_ioc_write_checkpoint(filp, arg);
C
Chao Yu 已提交
4027 4028
	case F2FS_IOC_DEFRAGMENT:
		return f2fs_ioc_defragment(filp, arg);
4029 4030
	case F2FS_IOC_MOVE_RANGE:
		return f2fs_ioc_move_range(filp, arg);
4031 4032
	case F2FS_IOC_FLUSH_DEVICE:
		return f2fs_ioc_flush_device(filp, arg);
4033 4034
	case F2FS_IOC_GET_FEATURES:
		return f2fs_ioc_get_features(filp, arg);
4035
	case FS_IOC_FSGETXATTR:
4036
		return f2fs_ioc_fsgetxattr(filp, arg);
4037
	case FS_IOC_FSSETXATTR:
4038
		return f2fs_ioc_fssetxattr(filp, arg);
4039 4040 4041 4042
	case F2FS_IOC_GET_PIN_FILE:
		return f2fs_ioc_get_pin_file(filp, arg);
	case F2FS_IOC_SET_PIN_FILE:
		return f2fs_ioc_set_pin_file(filp, arg);
4043 4044
	case F2FS_IOC_PRECACHE_EXTENTS:
		return f2fs_ioc_precache_extents(filp, arg);
4045 4046
	case F2FS_IOC_RESIZE_FS:
		return f2fs_ioc_resize_fs(filp, arg);
E
Eric Biggers 已提交
4047 4048 4049 4050
	case FS_IOC_ENABLE_VERITY:
		return f2fs_ioc_enable_verity(filp, arg);
	case FS_IOC_MEASURE_VERITY:
		return f2fs_ioc_measure_verity(filp, arg);
4051 4052 4053 4054
	case FS_IOC_GETFSLABEL:
		return f2fs_ioc_getfslabel(filp, arg);
	case FS_IOC_SETFSLABEL:
		return f2fs_ioc_setfslabel(filp, arg);
4055 4056
	case F2FS_IOC_GET_COMPRESS_BLOCKS:
		return f2fs_get_compress_blocks(filp, arg);
4057 4058
	case F2FS_IOC_RELEASE_COMPRESS_BLOCKS:
		return f2fs_release_compress_blocks(filp, arg);
4059 4060
	case F2FS_IOC_RESERVE_COMPRESS_BLOCKS:
		return f2fs_reserve_compress_blocks(filp, arg);
4061 4062
	case F2FS_IOC_SEC_TRIM_FILE:
		return f2fs_sec_trim_file(filp, arg);
4063 4064
	case F2FS_IOC_GET_COMPRESS_OPTION:
		return f2fs_ioc_get_compress_option(filp, arg);
J
Jaegeuk Kim 已提交
4065 4066 4067 4068 4069
	default:
		return -ENOTTY;
	}
}

C
Chao Yu 已提交
4070 4071 4072 4073
static ssize_t f2fs_file_read_iter(struct kiocb *iocb, struct iov_iter *iter)
{
	struct file *file = iocb->ki_filp;
	struct inode *inode = file_inode(file);
C
Chao Yu 已提交
4074
	int ret;
C
Chao Yu 已提交
4075 4076 4077 4078

	if (!f2fs_is_compress_backend_ready(inode))
		return -EOPNOTSUPP;

C
Chao Yu 已提交
4079 4080 4081 4082 4083 4084
	ret = generic_file_read_iter(iocb, iter);

	if (ret > 0)
		f2fs_update_iostat(F2FS_I_SB(inode), APP_READ_IO, ret);

	return ret;
C
Chao Yu 已提交
4085 4086
}

4087 4088
static ssize_t f2fs_file_write_iter(struct kiocb *iocb, struct iov_iter *from)
{
4089 4090 4091
	struct file *file = iocb->ki_filp;
	struct inode *inode = file_inode(file);
	ssize_t ret;
4092

4093 4094 4095 4096
	if (unlikely(f2fs_cp_error(F2FS_I_SB(inode)))) {
		ret = -EIO;
		goto out;
	}
4097

C
Chao Yu 已提交
4098 4099 4100 4101
	if (!f2fs_is_compress_backend_ready(inode)) {
		ret = -EOPNOTSUPP;
		goto out;
	}
C
Chao Yu 已提交
4102

4103 4104
	if (iocb->ki_flags & IOCB_NOWAIT) {
		if (!inode_trylock(inode)) {
4105 4106 4107
			ret = -EAGAIN;
			goto out;
		}
4108
	} else {
H
Hyunchul Lee 已提交
4109 4110 4111
		inode_lock(inode);
	}

4112 4113
	ret = generic_write_checks(iocb, from);
	if (ret > 0) {
4114 4115
		bool preallocated = false;
		size_t target_size = 0;
4116
		int err;
4117

4118 4119
		if (iov_iter_fault_in_readable(from, iov_iter_count(from)))
			set_inode_flag(inode, FI_NO_PREALLOC);
4120

4121 4122
		if ((iocb->ki_flags & IOCB_NOWAIT)) {
			if (!f2fs_overwrite_io(inode, iocb->ki_pos,
H
Hyunchul Lee 已提交
4123
						iov_iter_count(from)) ||
4124 4125 4126 4127 4128 4129 4130
				f2fs_has_inline_data(inode) ||
				f2fs_force_buffered_io(inode, iocb, from)) {
				clear_inode_flag(inode, FI_NO_PREALLOC);
				inode_unlock(inode);
				ret = -EAGAIN;
				goto out;
			}
4131 4132
			goto write;
		}
4133

4134 4135 4136 4137 4138 4139 4140 4141 4142 4143 4144 4145 4146 4147 4148 4149 4150 4151 4152 4153 4154 4155 4156 4157 4158 4159 4160 4161 4162 4163
		if (is_inode_flag_set(inode, FI_NO_PREALLOC))
			goto write;

		if (iocb->ki_flags & IOCB_DIRECT) {
			/*
			 * Convert inline data for Direct I/O before entering
			 * f2fs_direct_IO().
			 */
			err = f2fs_convert_inline_inode(inode);
			if (err)
				goto out_err;
			/*
			 * If force_buffere_io() is true, we have to allocate
			 * blocks all the time, since f2fs_direct_IO will fall
			 * back to buffered IO.
			 */
			if (!f2fs_force_buffered_io(inode, iocb, from) &&
					allow_outplace_dio(inode, iocb, from))
				goto write;
		}
		preallocated = true;
		target_size = iocb->ki_pos + iov_iter_count(from);

		err = f2fs_preallocate_blocks(iocb, from);
		if (err) {
out_err:
			clear_inode_flag(inode, FI_NO_PREALLOC);
			inode_unlock(inode);
			ret = err;
			goto out;
4164
		}
4165
write:
4166
		ret = __generic_file_write_iter(iocb, from);
4167
		clear_inode_flag(inode, FI_NO_PREALLOC);
C
Chao Yu 已提交
4168

4169 4170 4171 4172
		/* if we couldn't write data, we should deallocate blocks. */
		if (preallocated && i_size_read(inode) < target_size)
			f2fs_truncate(inode);

C
Chao Yu 已提交
4173 4174
		if (ret > 0)
			f2fs_update_iostat(F2FS_I_SB(inode), APP_WRITE_IO, ret);
4175 4176
	}
	inode_unlock(inode);
4177 4178 4179
out:
	trace_f2fs_file_write_iter(inode, iocb->ki_pos,
					iov_iter_count(from), ret);
4180 4181
	if (ret > 0)
		ret = generic_write_sync(iocb, ret);
4182
	return ret;
4183 4184
}

4185 4186 4187 4188
#ifdef CONFIG_COMPAT
/*
 * f2fs_compat_ioctl - compat ioctl entry point (built only with CONFIG_COMPAT)
 * @file: open file the ioctl is issued against
 * @cmd:  ioctl command number as supplied by the caller
 * @arg:  raw argument; passed through compat_ptr() before being forwarded
 *
 * The three FS_IOC32_* commands are rewritten to their FS_IOC_* counterparts.
 * Every other command listed in the switch is forwarded with its number
 * unchanged.  A command that is not listed is rejected with -ENOIOCTLCMD and
 * never reaches f2fs_ioctl().
 *
 * Return: the result of f2fs_ioctl() for an accepted command, otherwise
 * -ENOIOCTLCMD.
 */
long f2fs_compat_ioctl(struct file *file, unsigned int cmd, unsigned long arg)
{
	/* Command actually handed to f2fs_ioctl(); defaults to pass-through. */
	unsigned int native_cmd = cmd;

	switch (cmd) {
	/* Commands whose compat number differs from the native one. */
	case FS_IOC32_GETFLAGS:
		native_cmd = FS_IOC_GETFLAGS;
		break;
	case FS_IOC32_SETFLAGS:
		native_cmd = FS_IOC_SETFLAGS;
		break;
	case FS_IOC32_GETVERSION:
		native_cmd = FS_IOC_GETVERSION;
		break;

	/* Commands forwarded with the same number. */
	case F2FS_IOC_START_ATOMIC_WRITE:
	case F2FS_IOC_COMMIT_ATOMIC_WRITE:
	case F2FS_IOC_START_VOLATILE_WRITE:
	case F2FS_IOC_RELEASE_VOLATILE_WRITE:
	case F2FS_IOC_ABORT_VOLATILE_WRITE:
	case F2FS_IOC_SHUTDOWN:
	case FITRIM:
	case FS_IOC_SET_ENCRYPTION_POLICY:
	case FS_IOC_GET_ENCRYPTION_PWSALT:
	case FS_IOC_GET_ENCRYPTION_POLICY:
	case FS_IOC_GET_ENCRYPTION_POLICY_EX:
	case FS_IOC_ADD_ENCRYPTION_KEY:
	case FS_IOC_REMOVE_ENCRYPTION_KEY:
	case FS_IOC_REMOVE_ENCRYPTION_KEY_ALL_USERS:
	case FS_IOC_GET_ENCRYPTION_KEY_STATUS:
	case FS_IOC_GET_ENCRYPTION_NONCE:
	case F2FS_IOC_GARBAGE_COLLECT:
	case F2FS_IOC_GARBAGE_COLLECT_RANGE:
	case F2FS_IOC_WRITE_CHECKPOINT:
	case F2FS_IOC_DEFRAGMENT:
	case F2FS_IOC_MOVE_RANGE:
	case F2FS_IOC_FLUSH_DEVICE:
	case F2FS_IOC_GET_FEATURES:
	case FS_IOC_FSGETXATTR:
	case FS_IOC_FSSETXATTR:
	case F2FS_IOC_GET_PIN_FILE:
	case F2FS_IOC_SET_PIN_FILE:
	case F2FS_IOC_PRECACHE_EXTENTS:
	case F2FS_IOC_RESIZE_FS:
	case FS_IOC_ENABLE_VERITY:
	case FS_IOC_MEASURE_VERITY:
	case FS_IOC_GETFSLABEL:
	case FS_IOC_SETFSLABEL:
	case F2FS_IOC_GET_COMPRESS_BLOCKS:
	case F2FS_IOC_RELEASE_COMPRESS_BLOCKS:
	case F2FS_IOC_RESERVE_COMPRESS_BLOCKS:
	case F2FS_IOC_SEC_TRIM_FILE:
	case F2FS_IOC_GET_COMPRESS_OPTION:
		break;

	default:
		return -ENOIOCTLCMD;
	}

	return f2fs_ioctl(file, native_cmd, (unsigned long) compat_ptr(arg));
}
#endif

J
Jaegeuk Kim 已提交
4244
const struct file_operations f2fs_file_operations = {
4245
	.llseek		= f2fs_llseek,
C
Chao Yu 已提交
4246
	.read_iter	= f2fs_file_read_iter,
4247 4248
	.write_iter	= f2fs_file_write_iter,
	.open		= f2fs_file_open,
4249
	.release	= f2fs_release_file,
J
Jaegeuk Kim 已提交
4250
	.mmap		= f2fs_file_mmap,
4251
	.flush		= f2fs_file_flush,
J
Jaegeuk Kim 已提交
4252 4253 4254
	.fsync		= f2fs_sync_file,
	.fallocate	= f2fs_fallocate,
	.unlocked_ioctl	= f2fs_ioctl,
4255 4256 4257
#ifdef CONFIG_COMPAT
	.compat_ioctl	= f2fs_compat_ioctl,
#endif
J
Jaegeuk Kim 已提交
4258
	.splice_read	= generic_file_splice_read,
A
Al Viro 已提交
4259
	.splice_write	= iter_file_splice_write,
J
Jaegeuk Kim 已提交
4260
};