// SPDX-License-Identifier: GPL-2.0
/*
 * fs/f2fs/file.c
 *
 * Copyright (c) 2012 Samsung Electronics Co., Ltd.
 *             http://www.samsung.com/
 */
#include <linux/fs.h>
#include <linux/f2fs_fs.h>
#include <linux/stat.h>
#include <linux/buffer_head.h>
#include <linux/writeback.h>
#include <linux/blkdev.h>
#include <linux/falloc.h>
#include <linux/types.h>
#include <linux/compat.h>
#include <linux/uaccess.h>
#include <linux/mount.h>
#include <linux/pagevec.h>
#include <linux/uio.h>
#include <linux/uuid.h>
#include <linux/file.h>
#include <linux/nls.h>
#include <linux/sched/signal.h>
#include <linux/fileattr.h>

#include "f2fs.h"
#include "node.h"
#include "segment.h"
#include "xattr.h"
#include "acl.h"
#include "gc.h"
#include <trace/events/f2fs.h>
#include <uapi/linux/f2fs.h>

36
static vm_fault_t f2fs_filemap_fault(struct vm_fault *vmf)
37 38
{
	struct inode *inode = file_inode(vmf->vma->vm_file);
39
	vm_fault_t ret;
40 41

	down_read(&F2FS_I(inode)->i_mmap_sem);
42
	ret = filemap_fault(vmf);
43 44
	up_read(&F2FS_I(inode)->i_mmap_sem);

C
Chao Yu 已提交
45 46 47 48
	if (!ret)
		f2fs_update_iostat(F2FS_I_SB(inode), APP_MAPPED_READ_IO,
							F2FS_BLKSIZE);

49 50
	trace_f2fs_filemap_fault(inode, vmf->pgoff, (unsigned long)ret);

51
	return ret;
52 53
}

54
static vm_fault_t f2fs_vm_page_mkwrite(struct vm_fault *vmf)
J
Jaegeuk Kim 已提交
55 56
{
	struct page *page = vmf->page;
57
	struct inode *inode = file_inode(vmf->vma->vm_file);
58
	struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
59
	struct dnode_of_data dn;
C
Chao Yu 已提交
60 61
	bool need_alloc = true;
	int err = 0;
J
Jaegeuk Kim 已提交
62

63 64 65
	if (unlikely(IS_IMMUTABLE(inode)))
		return VM_FAULT_SIGBUS;

66 67 68 69 70
	if (unlikely(f2fs_cp_error(sbi))) {
		err = -EIO;
		goto err;
	}

71 72
	if (!f2fs_is_checkpoint_ready(sbi)) {
		err = -ENOSPC;
73
		goto err;
74
	}
75

76 77 78 79
	err = f2fs_convert_inline_inode(inode);
	if (err)
		goto err;

C
Chao Yu 已提交
80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95
#ifdef CONFIG_F2FS_FS_COMPRESSION
	if (f2fs_compressed_file(inode)) {
		int ret = f2fs_is_compressed_cluster(inode, page->index);

		if (ret < 0) {
			err = ret;
			goto err;
		} else if (ret) {
			if (ret < F2FS_I(inode)->i_cluster_size) {
				err = -EAGAIN;
				goto err;
			}
			need_alloc = false;
		}
	}
#endif
96
	/* should do out of any locked page */
C
Chao Yu 已提交
97 98
	if (need_alloc)
		f2fs_balance_fs(sbi, true);
99

J
Jaegeuk Kim 已提交
100
	sb_start_pagefault(inode->i_sb);
101 102

	f2fs_bug_on(sbi, f2fs_has_inline_data(inode));
103

104
	file_update_time(vmf->vma->vm_file);
105
	down_read(&F2FS_I(inode)->i_mmap_sem);
J
Jaegeuk Kim 已提交
106
	lock_page(page);
107
	if (unlikely(page->mapping != inode->i_mapping ||
108
			page_offset(page) > i_size_read(inode) ||
109
			!PageUptodate(page))) {
J
Jaegeuk Kim 已提交
110 111
		unlock_page(page);
		err = -EFAULT;
112
		goto out_sem;
J
Jaegeuk Kim 已提交
113 114
	}

C
Chao Yu 已提交
115 116
	if (need_alloc) {
		/* block allocation */
C
Chao Yu 已提交
117
		f2fs_do_map_lock(sbi, F2FS_GET_BLOCK_PRE_AIO, true);
C
Chao Yu 已提交
118 119 120
		set_new_dnode(&dn, inode, NULL, NULL, 0);
		err = f2fs_get_block(&dn, page->index);
		f2fs_put_dnode(&dn);
C
Chao Yu 已提交
121
		f2fs_do_map_lock(sbi, F2FS_GET_BLOCK_PRE_AIO, false);
C
Chao Yu 已提交
122 123
	}

124 125 126 127 128 129 130 131 132 133
#ifdef CONFIG_F2FS_FS_COMPRESSION
	if (!need_alloc) {
		set_new_dnode(&dn, inode, NULL, NULL, 0);
		err = f2fs_get_dnode_of_data(&dn, page->index, LOOKUP_NODE);
		f2fs_put_dnode(&dn);
	}
#endif
	if (err) {
		unlock_page(page);
		goto out_sem;
C
Chao Yu 已提交
134 135
	}

136
	f2fs_wait_on_page_writeback(page, DATA, false, true);
C
Chao Yu 已提交
137 138 139 140

	/* wait for GCed page writeback via META_MAPPING */
	f2fs_wait_on_block_writeback(inode, dn.data_blkaddr);

J
Jaegeuk Kim 已提交
141 142 143 144
	/*
	 * check to see if the page is mapped already (no holes)
	 */
	if (PageMappedToDisk(page))
C
Chao Yu 已提交
145
		goto out_sem;
J
Jaegeuk Kim 已提交
146 147

	/* page is wholly or partially inside EOF */
148
	if (((loff_t)(page->index + 1) << PAGE_SHIFT) >
C
Chao Yu 已提交
149
						i_size_read(inode)) {
150
		loff_t offset;
151

152 153
		offset = i_size_read(inode) & ~PAGE_MASK;
		zero_user_segment(page, offset, PAGE_SIZE);
J
Jaegeuk Kim 已提交
154 155
	}
	set_page_dirty(page);
156 157
	if (!PageUptodate(page))
		SetPageUptodate(page);
J
Jaegeuk Kim 已提交
158

C
Chao Yu 已提交
159
	f2fs_update_iostat(sbi, APP_MAPPED_IO, F2FS_BLKSIZE);
160
	f2fs_update_time(sbi, REQ_TIME);
C
Chao Yu 已提交
161

162
	trace_f2fs_vm_page_mkwrite(page, DATA);
163 164
out_sem:
	up_read(&F2FS_I(inode)->i_mmap_sem);
C
Chao Yu 已提交
165

J
Jaegeuk Kim 已提交
166
	sb_end_pagefault(inode->i_sb);
167
err:
J
Jaegeuk Kim 已提交
168 169 170 171
	return block_page_mkwrite_return(err);
}

static const struct vm_operations_struct f2fs_file_vm_ops = {
172
	.fault		= f2fs_filemap_fault,
173
	.map_pages	= filemap_map_pages,
174
	.page_mkwrite	= f2fs_vm_page_mkwrite,
J
Jaegeuk Kim 已提交
175 176
};

177 178 179 180
static int get_parent_ino(struct inode *inode, nid_t *pino)
{
	struct dentry *dentry;

181 182 183 184 185
	/*
	 * Make sure to get the non-deleted alias.  The alias associated with
	 * the open file descriptor being fsync()'ed may be deleted already.
	 */
	dentry = d_find_alias(inode);
186 187 188
	if (!dentry)
		return 0;

189 190
	*pino = parent_ino(dentry);
	dput(dentry);
191 192 193
	return 1;
}

C
Chao Yu 已提交
194
static inline enum cp_reason_type need_do_checkpoint(struct inode *inode)
195
{
196
	struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
C
Chao Yu 已提交
197
	enum cp_reason_type cp_reason = CP_NO_NEEDED;
198

C
Chao Yu 已提交
199 200
	if (!S_ISREG(inode->i_mode))
		cp_reason = CP_NON_REGULAR;
C
Chao Yu 已提交
201 202
	else if (f2fs_compressed_file(inode))
		cp_reason = CP_COMPRESSED;
C
Chao Yu 已提交
203 204
	else if (inode->i_nlink != 1)
		cp_reason = CP_HARDLINK;
205
	else if (is_sbi_flag_set(sbi, SBI_NEED_CP))
C
Chao Yu 已提交
206
		cp_reason = CP_SB_NEED_CP;
207
	else if (file_wrong_pino(inode))
C
Chao Yu 已提交
208
		cp_reason = CP_WRONG_PINO;
C
Chao Yu 已提交
209
	else if (!f2fs_space_for_roll_forward(sbi))
C
Chao Yu 已提交
210
		cp_reason = CP_NO_SPC_ROLL;
C
Chao Yu 已提交
211
	else if (!f2fs_is_checkpointed_node(sbi, F2FS_I(inode)->i_pino))
C
Chao Yu 已提交
212
		cp_reason = CP_NODE_NEED_CP;
213
	else if (test_opt(sbi, FASTBOOT))
C
Chao Yu 已提交
214
		cp_reason = CP_FASTBOOT_MODE;
215
	else if (F2FS_OPTION(sbi).active_logs == 2)
C
Chao Yu 已提交
216
		cp_reason = CP_SPEC_LOG_NUM;
217
	else if (F2FS_OPTION(sbi).fsync_mode == FSYNC_MODE_STRICT &&
C
Chao Yu 已提交
218 219 220
		f2fs_need_dentry_mark(sbi, inode->i_ino) &&
		f2fs_exist_written_data(sbi, F2FS_I(inode)->i_pino,
							TRANS_DIR_INO))
221
		cp_reason = CP_RECOVER_DIR;
222

C
Chao Yu 已提交
223
	return cp_reason;
224 225
}

226 227 228 229 230
static bool need_inode_page_update(struct f2fs_sb_info *sbi, nid_t ino)
{
	struct page *i = find_get_page(NODE_MAPPING(sbi), ino);
	bool ret = false;
	/* But we need to avoid that there are some inode updates */
C
Chao Yu 已提交
231
	if ((i && PageDirty(i)) || f2fs_need_inode_block_update(sbi, ino))
232 233 234 235 236
		ret = true;
	f2fs_put_page(i, 0);
	return ret;
}

237 238 239 240 241 242 243 244
static void try_to_fix_pino(struct inode *inode)
{
	struct f2fs_inode_info *fi = F2FS_I(inode);
	nid_t pino;

	down_write(&fi->i_sem);
	if (file_wrong_pino(inode) && inode->i_nlink == 1 &&
			get_parent_ino(inode, &pino)) {
245
		f2fs_i_pino_write(inode, pino);
246 247
		file_got_pino(inode);
	}
248
	up_write(&fi->i_sem);
249 250
}

251 252
static int f2fs_do_sync_file(struct file *file, loff_t start, loff_t end,
						int datasync, bool atomic)
J
Jaegeuk Kim 已提交
253 254
{
	struct inode *inode = file->f_mapping->host;
255
	struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
J
Jaegeuk Kim 已提交
256
	nid_t ino = inode->i_ino;
J
Jaegeuk Kim 已提交
257
	int ret = 0;
C
Chao Yu 已提交
258
	enum cp_reason_type cp_reason = 0;
J
Jaegeuk Kim 已提交
259
	struct writeback_control wbc = {
260
		.sync_mode = WB_SYNC_ALL,
J
Jaegeuk Kim 已提交
261 262 263
		.nr_to_write = LONG_MAX,
		.for_reclaim = 0,
	};
264
	unsigned int seq_id = 0;
J
Jaegeuk Kim 已提交
265

D
Daniel Rosenberg 已提交
266 267
	if (unlikely(f2fs_readonly(inode->i_sb) ||
				is_sbi_flag_set(sbi, SBI_CP_DISABLED)))
268 269
		return 0;

270
	trace_f2fs_sync_file_enter(inode);
271

272 273 274
	if (S_ISDIR(inode->i_mode))
		goto go_write;

275
	/* if fdatasync is triggered, let's do in-place-update */
J
Jaegeuk Kim 已提交
276
	if (datasync || get_dirty_pages(inode) <= SM_I(sbi)->min_fsync_blocks)
277
		set_inode_flag(inode, FI_NEED_IPU);
278
	ret = file_write_and_wait_range(file, start, end);
279
	clear_inode_flag(inode, FI_NEED_IPU);
280

281
	if (ret) {
C
Chao Yu 已提交
282
		trace_f2fs_sync_file_exit(inode, cp_reason, datasync, ret);
J
Jaegeuk Kim 已提交
283
		return ret;
284
	}
J
Jaegeuk Kim 已提交
285

286
	/* if the inode is dirty, let's recover all the time */
C
Chao Yu 已提交
287
	if (!f2fs_skip_inode_update(inode, datasync)) {
288
		f2fs_write_inode(inode, NULL);
289 290 291
		goto go_write;
	}

292 293 294
	/*
	 * if there is no written data, don't waste time to write recovery info.
	 */
295
	if (!is_inode_flag_set(inode, FI_APPEND_WRITE) &&
C
Chao Yu 已提交
296
			!f2fs_exist_written_data(sbi, ino, APPEND_INO)) {
297

298 299
		/* it may call write_inode just prior to fsync */
		if (need_inode_page_update(sbi, ino))
300 301
			goto go_write;

302
		if (is_inode_flag_set(inode, FI_UPDATE_WRITE) ||
C
Chao Yu 已提交
303
				f2fs_exist_written_data(sbi, ino, UPDATE_INO))
304 305 306
			goto flush_out;
		goto out;
	}
307
go_write:
308 309 310 311
	/*
	 * Both of fdatasync() and fsync() are able to be recovered from
	 * sudden-power-off.
	 */
312
	down_read(&F2FS_I(inode)->i_sem);
C
Chao Yu 已提交
313
	cp_reason = need_do_checkpoint(inode);
314
	up_read(&F2FS_I(inode)->i_sem);
315

C
Chao Yu 已提交
316
	if (cp_reason) {
J
Jaegeuk Kim 已提交
317 318
		/* all the dirty node pages should be flushed for POR */
		ret = f2fs_sync_fs(inode->i_sb, 1);
319

320 321 322 323 324
		/*
		 * We've secured consistency through sync_fs. Following pino
		 * will be used only for fsynced inodes after checkpoint.
		 */
		try_to_fix_pino(inode);
325 326
		clear_inode_flag(inode, FI_APPEND_WRITE);
		clear_inode_flag(inode, FI_UPDATE_WRITE);
327 328
		goto out;
	}
329
sync_nodes:
330
	atomic_inc(&sbi->wb_sync_req[NODE]);
331
	ret = f2fs_fsync_node_pages(sbi, inode, &wbc, atomic, &seq_id);
332
	atomic_dec(&sbi->wb_sync_req[NODE]);
333 334
	if (ret)
		goto out;
335

336
	/* if cp_error was enabled, we should avoid infinite loop */
C
Chao Yu 已提交
337 338
	if (unlikely(f2fs_cp_error(sbi))) {
		ret = -EIO;
339
		goto out;
C
Chao Yu 已提交
340
	}
341

C
Chao Yu 已提交
342
	if (f2fs_need_inode_block_update(sbi, ino)) {
343
		f2fs_mark_inode_dirty_sync(inode, true);
344 345
		f2fs_write_inode(inode, NULL);
		goto sync_nodes;
J
Jaegeuk Kim 已提交
346
	}
347

348 349 350 351 352 353 354 355 356
	/*
	 * If it's atomic_write, it's just fine to keep write ordering. So
	 * here we don't need to wait for node write completion, since we use
	 * node chain which serializes node blocks. If one of node writes are
	 * reordered, we can see simply broken chain, resulting in stopping
	 * roll-forward recovery. It means we'll recover all or none node blocks
	 * given fsync mark.
	 */
	if (!atomic) {
357
		ret = f2fs_wait_on_node_pages_writeback(sbi, seq_id);
358 359 360
		if (ret)
			goto out;
	}
361 362

	/* once recovery info is written, don't need to tack this */
C
Chao Yu 已提交
363
	f2fs_remove_ino_entry(sbi, ino, APPEND_INO);
364
	clear_inode_flag(inode, FI_APPEND_WRITE);
365
flush_out:
366
	if (!atomic && F2FS_OPTION(sbi).fsync_mode != FSYNC_MODE_NOBARRIER)
C
Chao Yu 已提交
367
		ret = f2fs_issue_flush(sbi, inode->i_ino);
368
	if (!ret) {
C
Chao Yu 已提交
369
		f2fs_remove_ino_entry(sbi, ino, UPDATE_INO);
370
		clear_inode_flag(inode, FI_UPDATE_WRITE);
C
Chao Yu 已提交
371
		f2fs_remove_ino_entry(sbi, ino, FLUSH_INO);
372
	}
373
	f2fs_update_time(sbi, REQ_TIME);
J
Jaegeuk Kim 已提交
374
out:
C
Chao Yu 已提交
375
	trace_f2fs_sync_file_exit(inode, cp_reason, datasync, ret);
J
Jaegeuk Kim 已提交
376 377 378
	return ret;
}

379 380
int f2fs_sync_file(struct file *file, loff_t start, loff_t end, int datasync)
{
381 382
	if (unlikely(f2fs_cp_error(F2FS_I_SB(file_inode(file)))))
		return -EIO;
383 384 385
	return f2fs_do_sync_file(file, start, end, datasync, false);
}

386 387
static bool __found_offset(struct address_space *mapping, block_t blkaddr,
				pgoff_t index, int whence)
388 389 390
{
	switch (whence) {
	case SEEK_DATA:
391 392 393 394
		if (__is_valid_data_blkaddr(blkaddr))
			return true;
		if (blkaddr == NEW_ADDR &&
		    xa_get_mark(&mapping->i_pages, index, PAGECACHE_TAG_DIRTY))
395 396 397 398 399 400 401 402 403 404
			return true;
		break;
	case SEEK_HOLE:
		if (blkaddr == NULL_ADDR)
			return true;
		break;
	}
	return false;
}

405 406 407 408 409
static loff_t f2fs_seek_block(struct file *file, loff_t offset, int whence)
{
	struct inode *inode = file->f_mapping->host;
	loff_t maxbytes = inode->i_sb->s_maxbytes;
	struct dnode_of_data dn;
410
	pgoff_t pgofs, end_offset;
411 412
	loff_t data_ofs = offset;
	loff_t isize;
413 414
	int err = 0;

A
Al Viro 已提交
415
	inode_lock(inode);
416 417 418 419 420 421

	isize = i_size_read(inode);
	if (offset >= isize)
		goto fail;

	/* handle inline data case */
422 423 424 425 426 427 428 429
	if (f2fs_has_inline_data(inode)) {
		if (whence == SEEK_HOLE) {
			data_ofs = isize;
			goto found;
		} else if (whence == SEEK_DATA) {
			data_ofs = offset;
			goto found;
		}
430 431
	}

432
	pgofs = (pgoff_t)(offset >> PAGE_SHIFT);
433

434
	for (; data_ofs < isize; data_ofs = (loff_t)pgofs << PAGE_SHIFT) {
435
		set_new_dnode(&dn, inode, NULL, NULL, 0);
C
Chao Yu 已提交
436
		err = f2fs_get_dnode_of_data(&dn, pgofs, LOOKUP_NODE);
437 438 439
		if (err && err != -ENOENT) {
			goto fail;
		} else if (err == -ENOENT) {
A
arter97 已提交
440
			/* direct node does not exists */
441
			if (whence == SEEK_DATA) {
C
Chao Yu 已提交
442
				pgofs = f2fs_get_next_page_offset(&dn, pgofs);
443 444 445 446 447 448
				continue;
			} else {
				goto found;
			}
		}

449
		end_offset = ADDRS_PER_PAGE(dn.node_page, inode);
450 451 452 453

		/* find data/hole in dnode block */
		for (; dn.ofs_in_node < end_offset;
				dn.ofs_in_node++, pgofs++,
454
				data_ofs = (loff_t)pgofs << PAGE_SHIFT) {
455
			block_t blkaddr;
456

457
			blkaddr = f2fs_data_blkaddr(&dn);
458

459 460
			if (__is_valid_data_blkaddr(blkaddr) &&
				!f2fs_is_valid_blkaddr(F2FS_I_SB(inode),
C
Chao Yu 已提交
461
					blkaddr, DATA_GENERIC_ENHANCE)) {
462 463 464 465
				f2fs_put_dnode(&dn);
				goto fail;
			}

466
			if (__found_offset(file->f_mapping, blkaddr,
467
							pgofs, whence)) {
468 469 470 471 472 473 474 475 476 477
				f2fs_put_dnode(&dn);
				goto found;
			}
		}
		f2fs_put_dnode(&dn);
	}

	if (whence == SEEK_DATA)
		goto fail;
found:
478 479
	if (whence == SEEK_HOLE && data_ofs > isize)
		data_ofs = isize;
A
Al Viro 已提交
480
	inode_unlock(inode);
481 482
	return vfs_setpos(file, data_ofs, maxbytes);
fail:
A
Al Viro 已提交
483
	inode_unlock(inode);
484 485 486 487 488 489 490 491
	return -ENXIO;
}

/*
 * llseek for f2fs files.
 *
 * SEEK_SET/SEEK_CUR/SEEK_END are delegated to generic_file_llseek_size()
 * with a size limit of s_maxbytes, or max_file_blocks() converted to bytes
 * for compressed files. SEEK_DATA/SEEK_HOLE return -ENXIO for a negative
 * @offset and otherwise go through f2fs_seek_block(). Any other @whence
 * returns -EINVAL.
 */
static loff_t f2fs_llseek(struct file *file, loff_t offset, int whence)
{
	struct inode *inode = file->f_mapping->host;
	loff_t maxbytes = inode->i_sb->s_maxbytes;

	if (f2fs_compressed_file(inode))
		maxbytes = max_file_blocks(inode) << F2FS_BLKSIZE_BITS;

	switch (whence) {
	case SEEK_SET:
	case SEEK_CUR:
	case SEEK_END:
		return generic_file_llseek_size(file, offset, whence,
						maxbytes, i_size_read(inode));
	case SEEK_DATA:
	case SEEK_HOLE:
		if (offset < 0)
			return -ENXIO;
		return f2fs_seek_block(file, offset, whence);
	}

	return -EINVAL;
}

J
Jaegeuk Kim 已提交
511 512
static int f2fs_file_mmap(struct file *file, struct vm_area_struct *vma)
{
513 514
	struct inode *inode = file_inode(file);

515 516 517
	if (unlikely(f2fs_cp_error(F2FS_I_SB(inode))))
		return -EIO;

C
Chao Yu 已提交
518 519 520
	if (!f2fs_is_compress_backend_ready(inode))
		return -EOPNOTSUPP;

J
Jaegeuk Kim 已提交
521 522
	file_accessed(file);
	vma->vm_ops = &f2fs_file_vm_ops;
C
Chao Yu 已提交
523
	set_inode_flag(inode, FI_MMAP_FILE);
J
Jaegeuk Kim 已提交
524 525 526
	return 0;
}

527 528
static int f2fs_file_open(struct inode *inode, struct file *filp)
{
529
	int err = fscrypt_file_open(inode, filp);
530

E
Eric Biggers 已提交
531 532 533
	if (err)
		return err;

C
Chao Yu 已提交
534 535 536
	if (!f2fs_is_compress_backend_ready(inode))
		return -EOPNOTSUPP;

E
Eric Biggers 已提交
537
	err = fsverity_file_open(inode, filp);
538 539
	if (err)
		return err;
H
Hyunchul Lee 已提交
540 541 542

	filp->f_mode |= FMODE_NOWAIT;

C
Chao Yu 已提交
543
	return dquot_file_open(inode, filp);
544 545
}

C
Chao Yu 已提交
546
void f2fs_truncate_data_blocks_range(struct dnode_of_data *dn, int count)
J
Jaegeuk Kim 已提交
547
{
548
	struct f2fs_sb_info *sbi = F2FS_I_SB(dn->inode);
J
Jaegeuk Kim 已提交
549
	struct f2fs_node *raw_node;
C
Chao Yu 已提交
550
	int nr_free = 0, ofs = dn->ofs_in_node, len = count;
J
Jaegeuk Kim 已提交
551
	__le32 *addr;
552
	int base = 0;
C
Chao Yu 已提交
553 554 555
	bool compressed_cluster = false;
	int cluster_index = 0, valid_blocks = 0;
	int cluster_size = F2FS_I(dn->inode)->i_cluster_size;
556
	bool released = !atomic_read(&F2FS_I(dn->inode)->i_compr_blocks);
557 558 559

	if (IS_INODE(dn->node_page) && f2fs_has_extra_attr(dn->inode))
		base = get_extra_isize(dn->inode);
J
Jaegeuk Kim 已提交
560

561
	raw_node = F2FS_NODE(dn->node_page);
562
	addr = blkaddr_in_node(raw_node) + base + ofs;
J
Jaegeuk Kim 已提交
563

C
Chao Yu 已提交
564 565
	/* Assumption: truncateion starts with cluster */
	for (; count > 0; count--, addr++, dn->ofs_in_node++, cluster_index++) {
J
Jaegeuk Kim 已提交
566
		block_t blkaddr = le32_to_cpu(*addr);
567

C
Chao Yu 已提交
568 569 570 571 572 573 574 575 576
		if (f2fs_compressed_file(dn->inode) &&
					!(cluster_index & (cluster_size - 1))) {
			if (compressed_cluster)
				f2fs_i_compr_blocks_update(dn->inode,
							valid_blocks, false);
			compressed_cluster = (blkaddr == COMPRESS_ADDR);
			valid_blocks = 0;
		}

J
Jaegeuk Kim 已提交
577 578 579
		if (blkaddr == NULL_ADDR)
			continue;

J
Jaegeuk Kim 已提交
580
		dn->data_blkaddr = NULL_ADDR;
C
Chao Yu 已提交
581
		f2fs_set_data_blkaddr(dn);
582

C
Chao Yu 已提交
583 584
		if (__is_valid_data_blkaddr(blkaddr)) {
			if (!f2fs_is_valid_blkaddr(sbi, blkaddr,
C
Chao Yu 已提交
585
					DATA_GENERIC_ENHANCE))
C
Chao Yu 已提交
586 587 588 589
				continue;
			if (compressed_cluster)
				valid_blocks++;
		}
590

591
		if (dn->ofs_in_node == 0 && IS_INODE(dn->node_page))
592
			clear_inode_flag(dn->inode, FI_FIRST_BLOCK_WRITTEN);
C
Chao Yu 已提交
593 594

		f2fs_invalidate_blocks(sbi, blkaddr);
595 596 597

		if (!released || blkaddr != COMPRESS_ADDR)
			nr_free++;
J
Jaegeuk Kim 已提交
598
	}
C
Chao Yu 已提交
599

C
Chao Yu 已提交
600 601 602
	if (compressed_cluster)
		f2fs_i_compr_blocks_update(dn->inode, valid_blocks, false);

J
Jaegeuk Kim 已提交
603
	if (nr_free) {
C
Chao Yu 已提交
604 605 606 607 608
		pgoff_t fofs;
		/*
		 * once we invalidate valid blkaddr in range [ofs, ofs + count],
		 * we will invalidate all blkaddr in the whole range.
		 */
C
Chao Yu 已提交
609
		fofs = f2fs_start_bidx_of_node(ofs_of_node(dn->node_page),
610
							dn->inode) + ofs;
C
Chao Yu 已提交
611
		f2fs_update_extent_cache_range(dn, fofs, 0, len);
612
		dec_valid_block_count(sbi, dn->inode, nr_free);
J
Jaegeuk Kim 已提交
613 614
	}
	dn->ofs_in_node = ofs;
615

616
	f2fs_update_time(sbi, REQ_TIME);
617 618
	trace_f2fs_truncate_data_blocks_range(dn->inode, dn->nid,
					 dn->ofs_in_node, nr_free);
J
Jaegeuk Kim 已提交
619 620
}

C
Chao Yu 已提交
621
void f2fs_truncate_data_blocks(struct dnode_of_data *dn)
J
Jaegeuk Kim 已提交
622
{
623
	f2fs_truncate_data_blocks_range(dn, ADDRS_PER_BLOCK(dn->inode));
J
Jaegeuk Kim 已提交
624 625
}

626
static int truncate_partial_data_page(struct inode *inode, u64 from,
627
								bool cache_only)
J
Jaegeuk Kim 已提交
628
{
629
	loff_t offset = from & (PAGE_SIZE - 1);
630
	pgoff_t index = from >> PAGE_SHIFT;
631
	struct address_space *mapping = inode->i_mapping;
J
Jaegeuk Kim 已提交
632 633
	struct page *page;

634
	if (!offset && !cache_only)
635
		return 0;
J
Jaegeuk Kim 已提交
636

637
	if (cache_only) {
638
		page = find_lock_page(mapping, index);
639 640 641
		if (page && PageUptodate(page))
			goto truncate_out;
		f2fs_put_page(page, 1);
642
		return 0;
643
	}
J
Jaegeuk Kim 已提交
644

C
Chao Yu 已提交
645
	page = f2fs_get_lock_data_page(inode, index, true);
646
	if (IS_ERR(page))
647
		return PTR_ERR(page) == -ENOENT ? 0 : PTR_ERR(page);
648
truncate_out:
649
	f2fs_wait_on_page_writeback(page, DATA, true, true);
650
	zero_user(page, offset, PAGE_SIZE - offset);
651 652

	/* An encrypted inode should have a key and truncate the last page. */
653
	f2fs_bug_on(F2FS_I_SB(inode), cache_only && IS_ENCRYPTED(inode));
654
	if (!cache_only)
655
		set_page_dirty(page);
J
Jaegeuk Kim 已提交
656
	f2fs_put_page(page, 1);
657
	return 0;
J
Jaegeuk Kim 已提交
658 659
}

660
int f2fs_do_truncate_blocks(struct inode *inode, u64 from, bool lock)
J
Jaegeuk Kim 已提交
661
{
662
	struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
J
Jaegeuk Kim 已提交
663 664
	struct dnode_of_data dn;
	pgoff_t free_from;
H
Huajun Li 已提交
665
	int count = 0, err = 0;
666
	struct page *ipage;
667
	bool truncate_page = false;
J
Jaegeuk Kim 已提交
668

669 670
	trace_f2fs_truncate_blocks_enter(inode, from);

C
Chao Yu 已提交
671
	free_from = (pgoff_t)F2FS_BLK_ALIGN(from);
J
Jaegeuk Kim 已提交
672

673
	if (free_from >= max_file_blocks(inode))
674 675
		goto free_partial;

676
	if (lock)
677
		f2fs_lock_op(sbi);
H
Huajun Li 已提交
678

C
Chao Yu 已提交
679
	ipage = f2fs_get_node_page(sbi, inode->i_ino);
680 681 682 683 684 685
	if (IS_ERR(ipage)) {
		err = PTR_ERR(ipage);
		goto out;
	}

	if (f2fs_has_inline_data(inode)) {
C
Chao Yu 已提交
686
		f2fs_truncate_inline_inode(inode, ipage, from);
687
		f2fs_put_page(ipage, 1);
688
		truncate_page = true;
689 690 691 692
		goto out;
	}

	set_new_dnode(&dn, inode, ipage, NULL, 0);
C
Chao Yu 已提交
693
	err = f2fs_get_dnode_of_data(&dn, free_from, LOOKUP_NODE_RA);
J
Jaegeuk Kim 已提交
694 695 696
	if (err) {
		if (err == -ENOENT)
			goto free_next;
697
		goto out;
698 699
	}

700
	count = ADDRS_PER_PAGE(dn.node_page, inode);
J
Jaegeuk Kim 已提交
701 702

	count -= dn.ofs_in_node;
703
	f2fs_bug_on(sbi, count < 0);
704

J
Jaegeuk Kim 已提交
705
	if (dn.ofs_in_node || IS_INODE(dn.node_page)) {
C
Chao Yu 已提交
706
		f2fs_truncate_data_blocks_range(&dn, count);
J
Jaegeuk Kim 已提交
707 708 709 710 711
		free_from += count;
	}

	f2fs_put_dnode(&dn);
free_next:
C
Chao Yu 已提交
712
	err = f2fs_truncate_inode_blocks(inode, free_from);
713 714
out:
	if (lock)
715
		f2fs_unlock_op(sbi);
716
free_partial:
717 718
	/* lastly zero out the first data page */
	if (!err)
719
		err = truncate_partial_data_page(inode, from, truncate_page);
J
Jaegeuk Kim 已提交
720

721
	trace_f2fs_truncate_blocks_exit(inode, err);
J
Jaegeuk Kim 已提交
722 723 724
	return err;
}

C
Chao Yu 已提交
725 726 727
int f2fs_truncate_blocks(struct inode *inode, u64 from, bool lock)
{
	u64 free_from = from;
728
	int err;
C
Chao Yu 已提交
729

730
#ifdef CONFIG_F2FS_FS_COMPRESSION
C
Chao Yu 已提交
731 732 733 734
	/*
	 * for compressed file, only support cluster size
	 * aligned truncation.
	 */
735 736 737
	if (f2fs_compressed_file(inode))
		free_from = round_up(from,
				F2FS_I(inode)->i_cluster_size << PAGE_SHIFT);
738 739 740 741 742 743 744
#endif

	err = f2fs_do_truncate_blocks(inode, free_from, lock);
	if (err)
		return err;

#ifdef CONFIG_F2FS_FS_COMPRESSION
C
Chao Yu 已提交
745
	if (from != free_from) {
746
		err = f2fs_truncate_partial_cluster(inode, from, lock);
C
Chao Yu 已提交
747 748 749
		if (err)
			return err;
	}
750
#endif
C
Chao Yu 已提交
751

C
Chao Yu 已提交
752
	return 0;
C
Chao Yu 已提交
753 754
}

755
int f2fs_truncate(struct inode *inode)
J
Jaegeuk Kim 已提交
756
{
757 758
	int err;

759 760 761
	if (unlikely(f2fs_cp_error(F2FS_I_SB(inode))))
		return -EIO;

J
Jaegeuk Kim 已提交
762 763
	if (!(S_ISREG(inode->i_mode) || S_ISDIR(inode->i_mode) ||
				S_ISLNK(inode->i_mode)))
764
		return 0;
J
Jaegeuk Kim 已提交
765

766 767
	trace_f2fs_truncate(inode);

768
	if (time_to_inject(F2FS_I_SB(inode), FAULT_TRUNCATE)) {
769
		f2fs_show_injection_info(F2FS_I_SB(inode), FAULT_TRUNCATE);
770 771
		return -EIO;
	}
772

773 774 775 776
	err = dquot_initialize(inode);
	if (err)
		return err;

777
	/* we should check inline_data size */
778
	if (!f2fs_may_inline_data(inode)) {
779 780 781
		err = f2fs_convert_inline_inode(inode);
		if (err)
			return err;
782 783
	}

784
	err = f2fs_truncate_blocks(inode, i_size_read(inode), true);
785 786 787
	if (err)
		return err;

788
	inode->i_mtime = inode->i_ctime = current_time(inode);
789
	f2fs_mark_inode_dirty_sync(inode, false);
790
	return 0;
J
Jaegeuk Kim 已提交
791 792
}

793 794
int f2fs_getattr(struct user_namespace *mnt_userns, const struct path *path,
		 struct kstat *stat, u32 request_mask, unsigned int query_flags)
J
Jaegeuk Kim 已提交
795
{
796
	struct inode *inode = d_inode(path->dentry);
C
Chao Yu 已提交
797
	struct f2fs_inode_info *fi = F2FS_I(inode);
C
Chao Yu 已提交
798
	struct f2fs_inode *ri;
C
Chao Yu 已提交
799 800
	unsigned int flags;

C
Chao Yu 已提交
801
	if (f2fs_has_extra_attr(inode) &&
802
			f2fs_sb_has_inode_crtime(F2FS_I_SB(inode)) &&
C
Chao Yu 已提交
803 804 805 806 807 808
			F2FS_FITS_IN_INODE(ri, fi->i_extra_isize, i_crtime)) {
		stat->result_mask |= STATX_BTIME;
		stat->btime.tv_sec = fi->i_crtime.tv_sec;
		stat->btime.tv_nsec = fi->i_crtime.tv_nsec;
	}

809
	flags = fi->i_flags;
C
Chao Yu 已提交
810 811
	if (flags & F2FS_COMPR_FL)
		stat->attributes |= STATX_ATTR_COMPRESSED;
812
	if (flags & F2FS_APPEND_FL)
C
Chao Yu 已提交
813
		stat->attributes |= STATX_ATTR_APPEND;
814
	if (IS_ENCRYPTED(inode))
C
Chao Yu 已提交
815
		stat->attributes |= STATX_ATTR_ENCRYPTED;
816
	if (flags & F2FS_IMMUTABLE_FL)
C
Chao Yu 已提交
817
		stat->attributes |= STATX_ATTR_IMMUTABLE;
818
	if (flags & F2FS_NODUMP_FL)
C
Chao Yu 已提交
819
		stat->attributes |= STATX_ATTR_NODUMP;
E
Eric Biggers 已提交
820 821
	if (IS_VERITY(inode))
		stat->attributes |= STATX_ATTR_VERITY;
C
Chao Yu 已提交
822

C
Chao Yu 已提交
823 824
	stat->attributes_mask |= (STATX_ATTR_COMPRESSED |
				  STATX_ATTR_APPEND |
C
Chao Yu 已提交
825 826
				  STATX_ATTR_ENCRYPTED |
				  STATX_ATTR_IMMUTABLE |
E
Eric Biggers 已提交
827 828
				  STATX_ATTR_NODUMP |
				  STATX_ATTR_VERITY);
C
Chao Yu 已提交
829

C
Christian Brauner 已提交
830
	generic_fillattr(&init_user_ns, inode, stat);
831 832 833 834 835 836

	/* we need to show initial sectors used for inline_data/dentries */
	if ((S_ISREG(inode->i_mode) && f2fs_has_inline_data(inode)) ||
					f2fs_has_inline_dentry(inode))
		stat->blocks += (stat->size + 511) >> 9;

J
Jaegeuk Kim 已提交
837 838 839 840
	return 0;
}

#ifdef CONFIG_F2FS_FS_POSIX_ACL
/*
 * Copy the attributes selected by attr->ia_valid from @attr into @inode.
 *
 * uid, gid and the three timestamps are copied directly. For ATTR_MODE,
 * S_ISGID is stripped when the caller is neither in the inode's group (as
 * mapped through @mnt_userns) nor capable of CAP_FSETID for the inode, and
 * the resulting mode is handed to set_acl_inode() rather than written to
 * i_mode here.
 *
 * Without CONFIG_F2FS_FS_POSIX_ACL this name is an alias for
 * setattr_copy().
 */
static void __setattr_copy(struct user_namespace *mnt_userns,
			   struct inode *inode, const struct iattr *attr)
{
	unsigned int ia_valid = attr->ia_valid;

	if (ia_valid & ATTR_UID)
		inode->i_uid = attr->ia_uid;
	if (ia_valid & ATTR_GID)
		inode->i_gid = attr->ia_gid;
	if (ia_valid & ATTR_ATIME)
		inode->i_atime = attr->ia_atime;
	if (ia_valid & ATTR_MTIME)
		inode->i_mtime = attr->ia_mtime;
	if (ia_valid & ATTR_CTIME)
		inode->i_ctime = attr->ia_ctime;
	if (ia_valid & ATTR_MODE) {
		umode_t mode = attr->ia_mode;
		kgid_t kgid = i_gid_into_mnt(mnt_userns, inode);

		if (!in_group_p(kgid) && !capable_wrt_inode_uidgid(mnt_userns, inode, CAP_FSETID))
			mode &= ~S_ISGID;
		set_acl_inode(inode, mode);
	}
}
#else
#define __setattr_copy setattr_copy
#endif

869 870
int f2fs_setattr(struct user_namespace *mnt_userns, struct dentry *dentry,
		 struct iattr *attr)
J
Jaegeuk Kim 已提交
871
{
872
	struct inode *inode = d_inode(dentry);
J
Jaegeuk Kim 已提交
873 874
	int err;

875 876 877
	if (unlikely(f2fs_cp_error(F2FS_I_SB(inode))))
		return -EIO;

878 879 880 881 882 883 884 885
	if (unlikely(IS_IMMUTABLE(inode)))
		return -EPERM;

	if (unlikely(IS_APPEND(inode) &&
			(attr->ia_valid & (ATTR_MODE | ATTR_UID |
				  ATTR_GID | ATTR_TIMES_SET))))
		return -EPERM;

C
Chao Yu 已提交
886 887 888 889
	if ((attr->ia_valid & ATTR_SIZE) &&
		!f2fs_is_compress_backend_ready(inode))
		return -EOPNOTSUPP;

C
Christian Brauner 已提交
890
	err = setattr_prepare(&init_user_ns, dentry, attr);
J
Jaegeuk Kim 已提交
891 892 893
	if (err)
		return err;

894 895 896 897
	err = fscrypt_prepare_setattr(dentry, attr);
	if (err)
		return err;

E
Eric Biggers 已提交
898 899 900 901
	err = fsverity_prepare_setattr(dentry, attr);
	if (err)
		return err;

C
Chao Yu 已提交
902 903 904 905 906 907 908 909 910
	if (is_quota_modification(inode, attr)) {
		err = dquot_initialize(inode);
		if (err)
			return err;
	}
	if ((attr->ia_valid & ATTR_UID &&
		!uid_eq(attr->ia_uid, inode->i_uid)) ||
		(attr->ia_valid & ATTR_GID &&
		!gid_eq(attr->ia_gid, inode->i_gid))) {
911
		f2fs_lock_op(F2FS_I_SB(inode));
C
Chao Yu 已提交
912
		err = dquot_transfer(inode, attr);
913 914 915 916
		if (err) {
			set_sbi_flag(F2FS_I_SB(inode),
					SBI_QUOTA_NEED_REPAIR);
			f2fs_unlock_op(F2FS_I_SB(inode));
C
Chao Yu 已提交
917
			return err;
918 919 920 921 922 923 924 925 926 927 928
		}
		/*
		 * update uid/gid under lock_op(), so that dquot and inode can
		 * be updated atomically.
		 */
		if (attr->ia_valid & ATTR_UID)
			inode->i_uid = attr->ia_uid;
		if (attr->ia_valid & ATTR_GID)
			inode->i_gid = attr->ia_gid;
		f2fs_mark_inode_dirty_sync(inode, true);
		f2fs_unlock_op(F2FS_I_SB(inode));
C
Chao Yu 已提交
929 930
	}

931
	if (attr->ia_valid & ATTR_SIZE) {
932 933 934 935 936 937 938 939 940 941 942
		loff_t old_size = i_size_read(inode);

		if (attr->ia_size > MAX_INLINE_DATA(inode)) {
			/*
			 * should convert inline inode before i_size_write to
			 * keep smaller than inline_data size with inline flag.
			 */
			err = f2fs_convert_inline_inode(inode);
			if (err)
				return err;
		}
943 944

		down_write(&F2FS_I(inode)->i_gc_rwsem[WRITE]);
945
		down_write(&F2FS_I(inode)->i_mmap_sem);
946 947 948

		truncate_setsize(inode, attr->ia_size);

949
		if (attr->ia_size <= old_size)
950
			err = f2fs_truncate(inode);
951 952 953 954 955
		/*
		 * do not trim all blocks after i_size if target size is
		 * larger than i_size.
		 */
		up_write(&F2FS_I(inode)->i_mmap_sem);
956
		up_write(&F2FS_I(inode)->i_gc_rwsem[WRITE]);
957 958
		if (err)
			return err;
959

960
		spin_lock(&F2FS_I(inode)->i_size_lock);
961
		inode->i_mtime = inode->i_ctime = current_time(inode);
962
		F2FS_I(inode)->last_disk_size = i_size_read(inode);
963
		spin_unlock(&F2FS_I(inode)->i_size_lock);
J
Jaegeuk Kim 已提交
964 965
	}

C
Christian Brauner 已提交
966
	__setattr_copy(&init_user_ns, inode, attr);
J
Jaegeuk Kim 已提交
967 968

	if (attr->ia_valid & ATTR_MODE) {
969
		err = posix_acl_chmod(&init_user_ns, inode, f2fs_get_inode_mode(inode));
970 971 972 973

		if (is_inode_flag_set(inode, FI_ACL_MODE)) {
			if (!err)
				inode->i_mode = F2FS_I(inode)->i_acl_mode;
974
			clear_inode_flag(inode, FI_ACL_MODE);
J
Jaegeuk Kim 已提交
975 976 977
		}
	}

978
	/* file size may changed here */
979
	f2fs_mark_inode_dirty_sync(inode, true);
980 981 982 983

	/* inode change will produce dirty node pages flushed by checkpoint */
	f2fs_balance_fs(F2FS_I_SB(inode), true);

J
Jaegeuk Kim 已提交
984 985 986 987 988 989 990
	return err;
}

const struct inode_operations f2fs_file_inode_operations = {
	.getattr	= f2fs_getattr,
	.setattr	= f2fs_setattr,
	.get_acl	= f2fs_get_acl,
991
	.set_acl	= f2fs_set_acl,
J
Jaegeuk Kim 已提交
992
	.listxattr	= f2fs_listxattr,
J
Jaegeuk Kim 已提交
993
	.fiemap		= f2fs_fiemap,
M
Miklos Szeredi 已提交
994 995
	.fileattr_get	= f2fs_fileattr_get,
	.fileattr_set	= f2fs_fileattr_set,
J
Jaegeuk Kim 已提交
996 997
};

C
Chao Yu 已提交
998
/*
 * Zero @len bytes, starting at byte @start, inside the data page at page
 * index @index of @inode and mark that page dirty.
 *
 * Returns 0 on success (a zero @len is a no-op that also returns 0), or the
 * error carried by the pointer that f2fs_get_new_data_page() returned.
 */
static int fill_zero(struct inode *inode, pgoff_t index,
					loff_t start, loff_t len)
{
	struct f2fs_sb_info *sbi;
	struct page *zpage;

	/* nothing to zero */
	if (len == 0)
		return 0;

	sbi = F2FS_I_SB(inode);
	f2fs_balance_fs(sbi, true);

	/* the page lookup/creation is done under f2fs_lock_op() */
	f2fs_lock_op(sbi);
	zpage = f2fs_get_new_data_page(inode, NULL, index, false);
	f2fs_unlock_op(sbi);
	if (IS_ERR(zpage))
		return PTR_ERR(zpage);

	/* wait for writeback on the page before modifying its contents */
	f2fs_wait_on_page_writeback(zpage, DATA, true, true);
	zero_user(zpage, start, len);
	set_page_dirty(zpage);
	f2fs_put_page(zpage, 1);

	return 0;
}

C
Chao Yu 已提交
1023
/*
 * Truncate the data block addresses of @inode for page indexes in
 * [@pg_start, @pg_end).
 *
 * The range is walked one dnode at a time.  When the dnode lookup reports
 * -ENOENT the walk jumps to the offset returned by
 * f2fs_get_next_page_offset(); any other lookup error is returned to the
 * caller.  Returns 0 once the whole range has been processed.
 */
int f2fs_truncate_hole(struct inode *inode, pgoff_t pg_start, pgoff_t pg_end)
{
	pgoff_t cur = pg_start;

	while (cur < pg_end) {
		struct dnode_of_data dn;
		pgoff_t nr_addrs, nr;
		int err;

		set_new_dnode(&dn, inode, NULL, NULL, 0);
		err = f2fs_get_dnode_of_data(&dn, cur, LOOKUP_NODE);
		if (err == -ENOENT) {
			/* no dnode here: skip ahead */
			cur = f2fs_get_next_page_offset(&dn, cur);
			continue;
		}
		if (err)
			return err;

		/* clamp to what is left in this dnode and in the range */
		nr_addrs = ADDRS_PER_PAGE(dn.node_page, inode);
		nr = min(nr_addrs - dn.ofs_in_node, pg_end - cur);

		f2fs_bug_on(F2FS_I_SB(inode), nr == 0 || nr > nr_addrs);

		f2fs_truncate_data_blocks_range(&dn, nr);
		f2fs_put_dnode(&dn);

		cur += nr;
	}

	return 0;
}

C
Chao Yu 已提交
1055
/*
 * Punch a hole of @len bytes at byte @offset in @inode.
 *
 * Partial pages at the head and tail of the range are zeroed through
 * fill_zero(); the whole pages in between are dropped from the page cache
 * and their block addresses truncated with f2fs_truncate_hole().
 *
 * Returns 0 on success or the first error reported by a helper.
 */
static int punch_hole(struct inode *inode, loff_t offset, loff_t len)
{
	pgoff_t pg_start, pg_end;
	loff_t off_start, off_end;
	int ret;

	ret = f2fs_convert_inline_inode(inode);
	if (ret)
		return ret;

	pg_start = ((unsigned long long) offset) >> PAGE_SHIFT;
	pg_end = ((unsigned long long) offset + len) >> PAGE_SHIFT;
	off_start = offset & (PAGE_SIZE - 1);
	off_end = (offset + len) & (PAGE_SIZE - 1);

	/* the range starts and ends in the same page: only zero bytes */
	if (pg_start == pg_end)
		return fill_zero(inode, pg_start, off_start,
						off_end - off_start);

	/* partial head page: zero its tail and step past it */
	if (off_start) {
		ret = fill_zero(inode, pg_start, off_start,
						PAGE_SIZE - off_start);
		pg_start++;
		if (ret)
			return ret;
	}

	/* partial tail page: zero its head */
	if (off_end) {
		ret = fill_zero(inode, pg_end, 0, off_end);
		if (ret)
			return ret;
	}

	/* whole pages in between */
	if (pg_start < pg_end) {
		struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
		struct f2fs_inode_info *fi = F2FS_I(inode);
		loff_t first_byte, end_byte;

		f2fs_balance_fs(sbi, true);

		first_byte = (loff_t)pg_start << PAGE_SHIFT;
		end_byte = (loff_t)pg_end << PAGE_SHIFT;

		down_write(&fi->i_gc_rwsem[WRITE]);
		down_write(&fi->i_mmap_sem);

		truncate_inode_pages_range(inode->i_mapping, first_byte,
						end_byte - 1);

		f2fs_lock_op(sbi);
		ret = f2fs_truncate_hole(inode, pg_start, pg_end);
		f2fs_unlock_op(sbi);

		up_write(&fi->i_mmap_sem);
		up_write(&fi->i_gc_rwsem[WRITE]);
	}

	return ret;
}

1117 1118
/*
 * Read the block addresses of @len pages of @inode, starting at page index
 * @off, into @blkaddr[].
 *
 * For every address that f2fs_is_checkpointed_data() does not report as
 * checkpointed, the on-disk slot is reset to NULL_ADDR and the matching
 * @do_replace[] entry is set to 1.  Ranges whose dnode lookup returns
 * -ENOENT are skipped, leaving their array entries untouched.
 *
 * Returns 0 on success, -ENOENT when the lookup fails with -ENOENT and
 * dn.max_level is 0, -EFSCORRUPTED for an address that fails the
 * DATA_GENERIC_ENHANCE validity check, -EOPNOTSUPP when a block would need
 * replacing while f2fs_lfs_mode() is true, or another lookup error.
 */
static int __read_out_blkaddrs(struct inode *inode, block_t *blkaddr,
				int *do_replace, pgoff_t off, pgoff_t len)
{
	struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
	struct dnode_of_data dn;
	int ret, done, i;

	/* one pass per dnode; always runs at least once, like the caller expects */
	do {
		set_new_dnode(&dn, inode, NULL, NULL, 0);
		ret = f2fs_get_dnode_of_data(&dn, off, LOOKUP_NODE_RA);
		if (ret && ret != -ENOENT)
			return ret;

		if (ret == -ENOENT) {
			if (dn.max_level == 0)
				return -ENOENT;

			/* skip the addresses this missing dnode would cover */
			done = min((pgoff_t)ADDRS_PER_BLOCK(inode) -
						dn.ofs_in_node, len);
			blkaddr += done;
			do_replace += done;
		} else {
			done = min((pgoff_t)ADDRS_PER_PAGE(dn.node_page, inode) -
							dn.ofs_in_node, len);

			for (i = 0; i < done; i++, blkaddr++, do_replace++,
							dn.ofs_in_node++) {
				*blkaddr = f2fs_data_blkaddr(&dn);

				if (__is_valid_data_blkaddr(*blkaddr) &&
					!f2fs_is_valid_blkaddr(sbi, *blkaddr,
							DATA_GENERIC_ENHANCE)) {
					f2fs_put_dnode(&dn);
					return -EFSCORRUPTED;
				}

				if (f2fs_is_checkpointed_data(sbi, *blkaddr))
					continue;

				if (f2fs_lfs_mode(sbi)) {
					f2fs_put_dnode(&dn);
					return -EOPNOTSUPP;
				}

				/* do not invalidate this block address */
				f2fs_update_data_blkaddr(&dn, NULL_ADDR);
				*do_replace = 1;
			}
			f2fs_put_dnode(&dn);
		}

		len -= done;
		off += done;
	} while (len);

	return 0;
}
C
Chao Yu 已提交
1171

1172 1173 1174 1175 1176 1177
/*
 * Undo __read_out_blkaddrs() for @len pages of @inode starting at page
 * index @off.
 *
 * Every entry with a non-zero @do_replace[] flag has its saved address from
 * @blkaddr[] written back into its dnode slot.  If the dnode cannot be
 * looked up, the block is dropped instead: the valid block count is
 * decremented and the address invalidated.  Always returns 0.
 */
static int __roll_back_blkaddrs(struct inode *inode, block_t *blkaddr,
				int *do_replace, pgoff_t off, int len)
{
	struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
	struct dnode_of_data dn;
	int idx;

	for (idx = 0; idx < len; idx++) {
		/* only slots that were cleared need restoring */
		if (do_replace[idx] == 0)
			continue;

		set_new_dnode(&dn, inode, NULL, NULL, 0);
		if (f2fs_get_dnode_of_data(&dn, off + idx, LOOKUP_NODE_RA)) {
			/* slot unreachable: give the block up */
			dec_valid_block_count(sbi, inode, 1);
			f2fs_invalidate_blocks(sbi, blkaddr[idx]);
		} else {
			f2fs_update_data_blkaddr(&dn, blkaddr[idx]);
		}
		f2fs_put_dnode(&dn);
	}

	return 0;
}

/*
 * Move @len pages from @src_inode (starting at page index @src) to
 * @dst_inode (starting at page index @dst), using the addresses and flags
 * collected in @blkaddr[] and @do_replace[].
 *
 * For each page one of three things happens:
 *  - blkaddr[i] is NULL_ADDR and @full is false: the page is skipped;
 *  - do_replace[i] is set or blkaddr[i] is NULL_ADDR: the destination slot
 *    is truncated and, when do_replace[i] is set, the source block is
 *    re-attached to the destination with f2fs_replace_block();
 *  - otherwise the page contents are copied through the page cache and the
 *    source page is truncated with f2fs_truncate_hole().
 *
 * The destination i_size is grown as pages are placed past it.
 *
 * Returns 0 on success or the first error reported by a helper.
 */
static int __clone_blkaddrs(struct inode *src_inode, struct inode *dst_inode,
			block_t *blkaddr, int *do_replace,
			pgoff_t src, pgoff_t dst, pgoff_t len, bool full)
{
	struct f2fs_sb_info *sbi = F2FS_I_SB(src_inode);
	pgoff_t i = 0;
	int ret;

	while (i < len) {
		if (blkaddr[i] == NULL_ADDR && !full) {
			i++;
			continue;
		}

		if (do_replace[i] || blkaddr[i] == NULL_ADDR) {
			struct dnode_of_data dn;
			struct node_info ni;
			/*
			 * Byte offset: must be loff_t.  A size_t would
			 * truncate offsets above 4 GiB on 32-bit builds and
			 * break the i_size comparison below.
			 */
			loff_t new_size;
			pgoff_t ilen;

			set_new_dnode(&dn, dst_inode, NULL, NULL, 0);
			ret = f2fs_get_dnode_of_data(&dn, dst + i, ALLOC_NODE);
			if (ret)
				return ret;

			ret = f2fs_get_node_info(sbi, dn.nid, &ni);
			if (ret) {
				f2fs_put_dnode(&dn);
				return ret;
			}

			/* number of slots we may handle inside this dnode */
			ilen = min((pgoff_t)
				ADDRS_PER_PAGE(dn.node_page, dst_inode) -
						dn.ofs_in_node, len - i);
			do {
				dn.data_blkaddr = f2fs_data_blkaddr(&dn);
				f2fs_truncate_data_blocks_range(&dn, 1);

				if (do_replace[i]) {
					/* move block accounting src -> dst */
					f2fs_i_blocks_write(src_inode,
							1, false, false);
					f2fs_i_blocks_write(dst_inode,
							1, true, false);
					f2fs_replace_block(sbi, &dn, dn.data_blkaddr,
					blkaddr[i], ni.version, true, false);

					do_replace[i] = 0;
				}
				dn.ofs_in_node++;
				i++;
				new_size = (loff_t)(dst + i) << PAGE_SHIFT;
				if (dst_inode->i_size < new_size)
					f2fs_i_size_write(dst_inode, new_size);
				/*
				 * --ilen is tested first, so blkaddr[i] and
				 * do_replace[i] are never read past the slots
				 * counted in ilen.
				 */
			} while (--ilen && (do_replace[i] || blkaddr[i] == NULL_ADDR));

			f2fs_put_dnode(&dn);
		} else {
			struct page *psrc, *pdst;

			psrc = f2fs_get_lock_data_page(src_inode,
							src + i, true);
			if (IS_ERR(psrc))
				return PTR_ERR(psrc);
			pdst = f2fs_get_new_data_page(dst_inode, NULL, dst + i,
								true);
			if (IS_ERR(pdst)) {
				f2fs_put_page(psrc, 1);
				return PTR_ERR(pdst);
			}
			f2fs_copy_page(psrc, pdst);
			set_page_dirty(pdst);
			f2fs_put_page(pdst, 1);
			f2fs_put_page(psrc, 1);

			/* the data now lives in dst: drop the source page */
			ret = f2fs_truncate_hole(src_inode,
						src + i, src + i + 1);
			if (ret)
				return ret;
			i++;
		}
	}
	return 0;
}
C
Chao Yu 已提交
1279

1280 1281
/*
 * Move @len pages from @src_inode at page index @src to @dst_inode at page
 * index @dst, working in chunks of at most 4 * ADDRS_PER_BLOCK() pages.
 *
 * Each chunk is first read out with __read_out_blkaddrs() and then placed
 * with __clone_blkaddrs().  If either step fails, the chunk is rolled back
 * with __roll_back_blkaddrs() and the error is returned.
 *
 * Returns 0 on success, -ENOMEM if a scratch array cannot be allocated, or
 * the error from the failing step.
 */
static int __exchange_data_block(struct inode *src_inode,
			struct inode *dst_inode, pgoff_t src, pgoff_t dst,
			pgoff_t len, bool full)
{
	block_t *src_blkaddr;
	int *do_replace;
	pgoff_t olen;
	int ret;

	while (len) {
		olen = min((pgoff_t)4 * ADDRS_PER_BLOCK(src_inode), len);

		src_blkaddr = f2fs_kvzalloc(F2FS_I_SB(src_inode),
					array_size(olen, sizeof(block_t)),
					GFP_NOFS);
		if (!src_blkaddr)
			return -ENOMEM;

		do_replace = f2fs_kvzalloc(F2FS_I_SB(src_inode),
					array_size(olen, sizeof(int)),
					GFP_NOFS);
		if (!do_replace) {
			kvfree(src_blkaddr);
			return -ENOMEM;
		}

		ret = __read_out_blkaddrs(src_inode, src_blkaddr,
					do_replace, src, olen);
		if (!ret)
			ret = __clone_blkaddrs(src_inode, dst_inode,
					src_blkaddr, do_replace,
					src, dst, olen, full);

		/* either step failed: put the source addresses back */
		if (ret)
			__roll_back_blkaddrs(src_inode, src_blkaddr,
					do_replace, src, olen);

		kvfree(src_blkaddr);
		kvfree(do_replace);

		if (ret)
			return ret;

		src += olen;
		dst += olen;
		len -= olen;
	}

	return 0;
}
C
Chao Yu 已提交
1331

1332
/*
 * Shift the blocks that follow the collapsed range [@offset, @offset + @len)
 * down to @offset by exchanging data blocks within @inode.
 *
 * Runs with i_gc_rwsem[WRITE], i_mmap_sem and f2fs_lock_op() held, after
 * dropping the extent tree and the page cache from @offset onwards.
 * Returns the result of __exchange_data_block().
 */
static int f2fs_do_collapse(struct inode *inode, loff_t offset, loff_t len)
{
	struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
	struct f2fs_inode_info *fi = F2FS_I(inode);
	pgoff_t total_pages = DIV_ROUND_UP(i_size_read(inode), PAGE_SIZE);
	pgoff_t dst_pg = offset >> PAGE_SHIFT;
	pgoff_t src_pg = (offset + len) >> PAGE_SHIFT;
	int ret;

	f2fs_balance_fs(sbi, true);

	/* avoid gc operation during block exchange */
	down_write(&fi->i_gc_rwsem[WRITE]);
	down_write(&fi->i_mmap_sem);

	f2fs_lock_op(sbi);
	f2fs_drop_extent_tree(inode);
	truncate_pagecache(inode, offset);
	/* move everything after the collapsed range down to its start */
	ret = __exchange_data_block(inode, inode, src_pg, dst_pg,
					total_pages - src_pg, true);
	f2fs_unlock_op(sbi);

	up_write(&fi->i_mmap_sem);
	up_write(&fi->i_gc_rwsem[WRITE]);

	return ret;
}

/*
 * Remove the byte range [@offset, @offset + @len) from @inode and shrink the
 * file by @len.
 *
 * Returns -EINVAL if the range reaches or passes the end of the file or is
 * not aligned to F2FS_BLKSIZE, otherwise 0 or the first helper error.
 */
static int f2fs_collapse_range(struct inode *inode, loff_t offset, loff_t len)
{
	struct f2fs_inode_info *fi = F2FS_I(inode);
	loff_t shrunk_size;
	int ret;

	if (offset + len >= i_size_read(inode))
		return -EINVAL;

	/* collapse range should be aligned to block size of f2fs. */
	if ((offset & (F2FS_BLKSIZE - 1)) || (len & (F2FS_BLKSIZE - 1)))
		return -EINVAL;

	ret = f2fs_convert_inline_inode(inode);
	if (ret)
		return ret;

	/* write out all dirty pages from offset */
	ret = filemap_write_and_wait_range(inode->i_mapping, offset, LLONG_MAX);
	if (ret)
		return ret;

	ret = f2fs_do_collapse(inode, offset, len);
	if (ret)
		return ret;

	down_write(&fi->i_mmap_sem);

	/* write out all moved pages, if possible; the result is ignored */
	filemap_write_and_wait_range(inode->i_mapping, offset, LLONG_MAX);
	truncate_pagecache(inode, offset);

	shrunk_size = i_size_read(inode) - len;
	ret = f2fs_truncate_blocks(inode, shrunk_size, true);

	up_write(&fi->i_mmap_sem);

	/* only publish the new size once the truncate succeeded */
	if (ret)
		return ret;

	f2fs_i_size_write(inode, shrunk_size);
	return 0;
}

1395 1396 1397 1398 1399 1400 1401 1402 1403 1404
/*
 * Turn the slots of @dn that cover page indexes [@start, @end) into
 * NEW_ADDR slots.
 *
 * First counts the NULL_ADDR slots in the range and asks
 * f2fs_reserve_new_blocks() for that many blocks.  Then walks the range
 * again: a slot still holding NULL_ADDR ends the walk with -ENOSPC, and a
 * slot holding anything other than NEW_ADDR has its block invalidated and
 * is rewritten as NEW_ADDR.  The extent cache is updated for the part of
 * the range that was walked.
 *
 * Returns 0, the reservation error, or -ENOSPC.
 */
static int f2fs_do_zero_range(struct dnode_of_data *dn, pgoff_t start,
								pgoff_t end)
{
	struct f2fs_sb_info *sbi = F2FS_I_SB(dn->inode);
	const unsigned int first_ofs = dn->ofs_in_node;
	blkcnt_t nr_holes = 0;
	pgoff_t pg;
	int ret;

	/* pass 1: count the slots that need a reservation */
	pg = start;
	while (pg < end) {
		if (f2fs_data_blkaddr(dn) == NULL_ADDR)
			nr_holes++;
		pg++;
		dn->ofs_in_node++;
	}

	dn->ofs_in_node = first_ofs;
	ret = f2fs_reserve_new_blocks(dn, nr_holes);
	if (ret)
		return ret;

	/* pass 2: rewind again and convert every slot to NEW_ADDR */
	dn->ofs_in_node = first_ofs;
	pg = start;
	while (pg < end) {
		dn->data_blkaddr = f2fs_data_blkaddr(dn);

		/*
		 * f2fs_reserve_new_blocks will not guarantee entire block
		 * allocation.
		 */
		if (dn->data_blkaddr == NULL_ADDR) {
			ret = -ENOSPC;
			break;
		}

		if (dn->data_blkaddr != NEW_ADDR) {
			f2fs_invalidate_blocks(sbi, dn->data_blkaddr);
			dn->data_blkaddr = NEW_ADDR;
			f2fs_set_data_blkaddr(dn);
		}

		pg++;
		dn->ofs_in_node++;
	}

	/* pg - start is the number of slots actually converted */
	f2fs_update_extent_cache_range(dn, start, 0, pg - start);

	return ret;
}

C
Chao Yu 已提交
1437 1438 1439 1440 1441 1442 1443 1444 1445 1446 1447 1448 1449 1450
/*
 * Zero the byte range [@offset, @offset + @len) of @inode.
 *
 * Partial pages at either end are zeroed with fill_zero(); whole pages in
 * between are converted dnode by dnode with f2fs_do_zero_range().  When the
 * zeroed range ends past the current i_size, the size is grown to match,
 * unless FALLOC_FL_KEEP_SIZE is set in @mode, in which case
 * file_set_keep_isize() is called instead.
 *
 * Returns 0 on success or the first error reported by a helper.
 */
static int f2fs_zero_range(struct inode *inode, loff_t offset, loff_t len,
								int mode)
{
	struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
	struct f2fs_inode_info *fi = F2FS_I(inode);
	struct address_space *mapping = inode->i_mapping;
	pgoff_t index, pg_start, pg_end;
	loff_t new_size = i_size_read(inode);
	loff_t off_start, off_end;
	int ret = 0;

	ret = inode_newsize_ok(inode, (len + offset));
	if (ret)
		return ret;

	ret = f2fs_convert_inline_inode(inode);
	if (ret)
		return ret;

	ret = filemap_write_and_wait_range(mapping, offset, offset + len - 1);
	if (ret)
		return ret;

	pg_start = ((unsigned long long) offset) >> PAGE_SHIFT;
	pg_end = ((unsigned long long) offset + len) >> PAGE_SHIFT;
	off_start = offset & (PAGE_SIZE - 1);
	off_end = (offset + len) & (PAGE_SIZE - 1);

	/* the range starts and ends in the same page */
	if (pg_start == pg_end) {
		ret = fill_zero(inode, pg_start, off_start,
						off_end - off_start);
		if (ret)
			return ret;

		new_size = max_t(loff_t, new_size, offset + len);
		goto out;
	}

	/* partial head page: zero its tail and step past it */
	if (off_start) {
		ret = fill_zero(inode, pg_start, off_start,
						PAGE_SIZE - off_start);
		pg_start++;
		if (ret)
			return ret;

		new_size = max_t(loff_t, new_size,
					(loff_t)pg_start << PAGE_SHIFT);
	}

	/* whole pages, one dnode per iteration */
	index = pg_start;
	while (index < pg_end) {
		struct dnode_of_data dn;
		unsigned int end_offset;
		pgoff_t end;

		down_write(&fi->i_gc_rwsem[WRITE]);
		down_write(&fi->i_mmap_sem);

		truncate_pagecache_range(inode,
			(loff_t)index << PAGE_SHIFT,
			((loff_t)pg_end << PAGE_SHIFT) - 1);

		f2fs_lock_op(sbi);

		set_new_dnode(&dn, inode, NULL, NULL, 0);
		ret = f2fs_get_dnode_of_data(&dn, index, ALLOC_NODE);
		if (ret) {
			f2fs_unlock_op(sbi);
			up_write(&fi->i_mmap_sem);
			up_write(&fi->i_gc_rwsem[WRITE]);
			goto out;
		}

		/* stop at the end of this dnode or of the range */
		end_offset = ADDRS_PER_PAGE(dn.node_page, inode);
		end = min(pg_end, end_offset - dn.ofs_in_node + index);

		ret = f2fs_do_zero_range(&dn, index, end);
		f2fs_put_dnode(&dn);

		f2fs_unlock_op(sbi);
		up_write(&fi->i_mmap_sem);
		up_write(&fi->i_gc_rwsem[WRITE]);

		f2fs_balance_fs(sbi, dn.node_changed);

		if (ret)
			goto out;

		index = end;
		new_size = max_t(loff_t, new_size,
					(loff_t)index << PAGE_SHIFT);
	}

	/* partial tail page: zero its head */
	if (off_end) {
		ret = fill_zero(inode, pg_end, 0, off_end);
		if (ret)
			goto out;

		new_size = max_t(loff_t, new_size, offset + len);
	}

out:
	/* record whatever progress was made, even on failure */
	if (new_size > i_size_read(inode)) {
		if (mode & FALLOC_FL_KEEP_SIZE)
			file_set_keep_isize(inode);
		else
			f2fs_i_size_write(inode, new_size);
	}
	return ret;
}

C
Chao Yu 已提交
1545 1546 1547
/*
 * Insert a hole of @len bytes at byte @offset in @inode, shifting the data
 * from @offset onwards up by @len and growing the file by @len.
 *
 * The data is moved from the end of the file backwards, at most
 * (@len >> PAGE_SHIFT) pages per step, via __exchange_data_block().
 *
 * Returns -EINVAL if @offset is at or beyond i_size or the range is not
 * aligned to F2FS_BLKSIZE, otherwise 0 or the first helper error.
 */
static int f2fs_insert_range(struct inode *inode, loff_t offset, loff_t len)
{
	struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
	struct f2fs_inode_info *fi = F2FS_I(inode);
	pgoff_t nr, pg_start, pg_end, delta, idx;
	loff_t new_size;
	int ret = 0;

	new_size = i_size_read(inode) + len;
	ret = inode_newsize_ok(inode, new_size);
	if (ret)
		return ret;

	if (offset >= i_size_read(inode))
		return -EINVAL;

	/* insert range should be aligned to block size of f2fs. */
	if ((offset & (F2FS_BLKSIZE - 1)) || (len & (F2FS_BLKSIZE - 1)))
		return -EINVAL;

	ret = f2fs_convert_inline_inode(inode);
	if (ret)
		return ret;

	f2fs_balance_fs(sbi, true);

	down_write(&fi->i_mmap_sem);
	ret = f2fs_truncate_blocks(inode, i_size_read(inode), true);
	up_write(&fi->i_mmap_sem);
	if (ret)
		return ret;

	/* write out all dirty pages from offset */
	ret = filemap_write_and_wait_range(inode->i_mapping, offset, LLONG_MAX);
	if (ret)
		return ret;

	pg_start = offset >> PAGE_SHIFT;
	pg_end = (offset + len) >> PAGE_SHIFT;
	delta = pg_end - pg_start;
	idx = DIV_ROUND_UP(i_size_read(inode), PAGE_SIZE);

	/* avoid gc operation during block exchange */
	down_write(&fi->i_gc_rwsem[WRITE]);
	down_write(&fi->i_mmap_sem);
	truncate_pagecache(inode, offset);

	/* walk backwards from the end of the file, up to delta pages a step */
	while (idx > pg_start) {
		nr = min(idx - pg_start, delta);
		idx -= nr;

		f2fs_lock_op(sbi);
		f2fs_drop_extent_tree(inode);

		ret = __exchange_data_block(inode, inode, idx,
					idx + delta, nr, false);
		f2fs_unlock_op(sbi);

		if (ret)
			break;
	}
	up_write(&fi->i_mmap_sem);
	up_write(&fi->i_gc_rwsem[WRITE]);

	/* write out all moved pages, if possible; the result is ignored */
	down_write(&fi->i_mmap_sem);
	filemap_write_and_wait_range(inode->i_mapping, offset, LLONG_MAX);
	truncate_pagecache(inode, offset);
	up_write(&fi->i_mmap_sem);

	if (ret)
		return ret;

	f2fs_i_size_write(inode, new_size);
	return 0;
}

J
Jaegeuk Kim 已提交
1618 1619 1620
/*
 * Preallocate blocks for the byte range [@offset, @offset + @len) of @inode
 * (the default fallocate mode).
 *
 * For a pinned file the range is allocated one segment
 * (sbi->blocks_per_seg blocks) at a time from CURSEG_COLD_DATA_PINNED,
 * running f2fs_gc() first whenever free sections run short.  Other files
 * are handled by a single f2fs_map_blocks() call.
 *
 * When the allocation fails part-way, i_size is advanced only up to the
 * blocks that were actually obtained.  That position is derived from the
 * first page of the request (@pg_start) plus the running count of mapped
 * blocks (@expanded).  It must not be derived from @map: in the pinned path
 * map.m_lblk has already been advanced and map.m_len holds either one
 * segment or the running total, which would overshoot the real position.
 *
 * FALLOC_FL_KEEP_SIZE in @mode keeps i_size unchanged and calls
 * file_set_keep_isize() instead.
 *
 * Returns 0 on success or the first error reported by a helper.
 */
static int expand_inode_data(struct inode *inode, loff_t offset,
					loff_t len, int mode)
{
	struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
	struct f2fs_map_blocks map = { .m_next_pgofs = NULL,
			.m_next_extent = NULL, .m_seg_type = NO_CHECK_TYPE,
			.m_may_create = true };
	pgoff_t pg_start, pg_end;
	loff_t new_size = i_size_read(inode);
	loff_t off_end;
	block_t expanded = 0;
	int err;

	err = inode_newsize_ok(inode, (len + offset));
	if (err)
		return err;

	err = f2fs_convert_inline_inode(inode);
	if (err)
		return err;

	f2fs_balance_fs(sbi, true);

	pg_start = ((unsigned long long)offset) >> PAGE_SHIFT;
	pg_end = ((unsigned long long)offset + len) >> PAGE_SHIFT;
	off_end = (offset + len) & (PAGE_SIZE - 1);

	map.m_lblk = pg_start;
	map.m_len = pg_end - pg_start;
	if (off_end)
		map.m_len++;

	if (!map.m_len)
		return 0;

	if (f2fs_is_pinned_file(inode)) {
		/* request length rounded up to whole segments, in blocks */
		block_t sec_len = (map.m_len >> sbi->log_blocks_per_seg) <<
					sbi->log_blocks_per_seg;

		if (map.m_len % sbi->blocks_per_seg)
			sec_len += sbi->blocks_per_seg;

		map.m_len = sbi->blocks_per_seg;
next_alloc:
		if (has_not_enough_free_secs(sbi, 0,
			GET_SEC_FROM_SEG(sbi, overprovision_segments(sbi)))) {
			down_write(&sbi->gc_lock);
			err = f2fs_gc(sbi, true, false, NULL_SEGNO);
			if (err && err != -ENODATA && err != -EAGAIN)
				goto out_err;
		}

		down_write(&sbi->pin_sem);

		f2fs_lock_op(sbi);
		f2fs_allocate_new_segment(sbi, CURSEG_COLD_DATA_PINNED);
		f2fs_unlock_op(sbi);

		map.m_seg_type = CURSEG_COLD_DATA_PINNED;
		err = f2fs_map_blocks(inode, &map, 1, F2FS_GET_BLOCK_PRE_DIO);

		up_write(&sbi->pin_sem);

		expanded += map.m_len;
		sec_len -= map.m_len;
		map.m_lblk += map.m_len;
		if (!err && sec_len)
			goto next_alloc;

		map.m_len = expanded;
	} else {
		err = f2fs_map_blocks(inode, &map, 1, F2FS_GET_BLOCK_PRE_AIO);
		expanded = map.m_len;
	}
out_err:
	if (err) {
		pgoff_t last_off;

		/* nothing was allocated: leave i_size alone */
		if (!expanded)
			return err;

		last_off = pg_start + expanded - 1;

		/* update new size to the failed position */
		new_size = (last_off == pg_end) ? offset + len :
					(loff_t)(last_off + 1) << PAGE_SHIFT;
	} else {
		new_size = ((loff_t)pg_end << PAGE_SHIFT) + off_end;
	}

	if (new_size > i_size_read(inode)) {
		if (mode & FALLOC_FL_KEEP_SIZE)
			file_set_keep_isize(inode);
		else
			f2fs_i_size_write(inode, new_size);
	}

	return err;
}

/*
 * fallocate entry point for f2fs files.
 *
 * Rejects the request up front when the filesystem is in checkpoint error
 * (-EIO), the checkpoint is not ready (-ENOSPC), the compression backend is
 * not ready (-EOPNOTSUPP), the inode is not a regular file (-EINVAL), or
 * @mode asks for something unsupported for this inode (-EOPNOTSUPP).
 * Otherwise dispatches on @mode under the inode lock and, on success,
 * refreshes mtime/ctime and marks the inode dirty.
 */
static long f2fs_fallocate(struct file *file, int mode,
				loff_t offset, loff_t len)
{
	const int shift_modes = FALLOC_FL_COLLAPSE_RANGE |
					FALLOC_FL_INSERT_RANGE;
	const int rewrite_modes = FALLOC_FL_PUNCH_HOLE |
					FALLOC_FL_ZERO_RANGE | shift_modes;
	const int known_modes = FALLOC_FL_KEEP_SIZE | rewrite_modes;
	struct inode *inode = file_inode(file);
	struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
	long ret = 0;

	if (unlikely(f2fs_cp_error(sbi)))
		return -EIO;
	if (!f2fs_is_checkpoint_ready(sbi))
		return -ENOSPC;
	if (!f2fs_is_compress_backend_ready(inode))
		return -EOPNOTSUPP;

	/* f2fs only support ->fallocate for regular file */
	if (!S_ISREG(inode->i_mode))
		return -EINVAL;

	/* encrypted files cannot be collapsed or have ranges inserted */
	if (IS_ENCRYPTED(inode) && (mode & shift_modes))
		return -EOPNOTSUPP;

	/* compressed files only accept plain preallocation */
	if (f2fs_compressed_file(inode) && (mode & rewrite_modes))
		return -EOPNOTSUPP;

	if (mode & ~known_modes)
		return -EOPNOTSUPP;

	inode_lock(inode);

	if (mode & FALLOC_FL_PUNCH_HOLE) {
		/* a hole starting at or past EOF is a no-op */
		if (offset >= inode->i_size)
			goto out;

		ret = punch_hole(inode, offset, len);
	} else if (mode & FALLOC_FL_COLLAPSE_RANGE) {
		ret = f2fs_collapse_range(inode, offset, len);
	} else if (mode & FALLOC_FL_ZERO_RANGE) {
		ret = f2fs_zero_range(inode, offset, len, mode);
	} else if (mode & FALLOC_FL_INSERT_RANGE) {
		ret = f2fs_insert_range(inode, offset, len);
	} else {
		ret = expand_inode_data(inode, offset, len, mode);
	}

	if (ret)
		goto out;

	inode->i_mtime = inode->i_ctime = current_time(inode);
	f2fs_mark_inode_dirty_sync(inode, false);
	f2fs_update_time(sbi, REQ_TIME);

out:
	inode_unlock(inode);

	trace_f2fs_fallocate(inode, mode, offset, len, ret);
	return ret;
}

1777 1778
static int f2fs_release_file(struct inode *inode, struct file *filp)
{
1779 1780 1781 1782 1783 1784 1785 1786
	/*
	 * f2fs_relase_file is called at every close calls. So we should
	 * not drop any inmemory pages by close called by other process.
	 */
	if (!(filp->f_mode & FMODE_WRITE) ||
			atomic_read(&inode->i_writecount) != 1)
		return 0;

1787 1788
	/* some remained atomic pages should discarded */
	if (f2fs_is_atomic_file(inode))
C
Chao Yu 已提交
1789
		f2fs_drop_inmem_pages(inode);
1790
	if (f2fs_is_volatile_file(inode)) {
1791
		set_inode_flag(inode, FI_DROP_CACHE);
1792
		filemap_fdatawrite(inode->i_mapping);
1793
		clear_inode_flag(inode, FI_DROP_CACHE);
1794 1795
		clear_inode_flag(inode, FI_VOLATILE_FILE);
		stat_dec_volatile_write(inode);
1796 1797 1798 1799
	}
	return 0;
}

1800
/*
 * Flush handler: drop the in-memory pages of an atomic file when the
 * flushing task is the one recorded in inmem_task.  Always returns 0.
 */
static int f2fs_file_flush(struct file *file, fl_owner_t id)
{
	struct inode *inode = file_inode(file);

	/*
	 * If the process doing a transaction has crashed, a roll-back is
	 * needed.  Otherwise other readers/writers could see a corrupted
	 * database until all writers close the file.  Since this has to
	 * happen before the file lock is dropped, it is done in ->flush.
	 */
	if (!f2fs_is_atomic_file(inode))
		return 0;

	if (F2FS_I(inode)->inmem_task == current)
		f2fs_drop_inmem_pages(inode);

	return 0;
}

1816
/*
 * Replace the bits of the inode's on-disk i_flags selected by @mask with
 * @iflags, after validating the requested change.
 *
 * Returns:
 *   -EPERM       the inode is a quota file (IS_NOQUOTA);
 *   -EOPNOTSUPP  casefold/compression flags on a filesystem without the
 *                corresponding feature;
 *   -ENOTEMPTY   the casefold flag is toggled and f2fs_empty_dir() fails;
 *   -EINVAL      an invalid compression flag combination or transition;
 *   0            on success, with ctime updated and the inode marked dirty.
 */
static int f2fs_setflags_common(struct inode *inode, u32 iflags, u32 mask)
{
	struct f2fs_inode_info *fi = F2FS_I(inode);
	struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
	const u32 cur_flags = fi->i_flags & mask;
	/* bits whose value differs between the request and the inode */
	const u32 toggled = iflags ^ cur_flags;

	f2fs_bug_on(sbi, (iflags & ~mask));

	/* Is it quota file? Do not allow user to mess with it */
	if (IS_NOQUOTA(inode))
		return -EPERM;

	if (toggled & F2FS_CASEFOLD_FL) {
		if (!f2fs_sb_has_casefold(sbi))
			return -EOPNOTSUPP;
		if (!f2fs_empty_dir(inode))
			return -ENOTEMPTY;
	}

	if (iflags & (F2FS_COMPR_FL | F2FS_NOCOMP_FL)) {
		if (!f2fs_sb_has_compression(sbi))
			return -EOPNOTSUPP;
		/* the two compression flags are mutually exclusive */
		if ((iflags & F2FS_COMPR_FL) && (iflags & F2FS_NOCOMP_FL))
			return -EINVAL;
	}

	if (toggled & F2FS_COMPR_FL) {
		/* compression is being switched off */
		if ((cur_flags & F2FS_COMPR_FL) &&
				!f2fs_disable_compressed_file(inode))
			return -EINVAL;

		if (iflags & F2FS_NOCOMP_FL)
			return -EINVAL;

		/* compression is being switched on */
		if (iflags & F2FS_COMPR_FL) {
			if (!f2fs_may_compress(inode))
				return -EINVAL;
			/* a regular file must still be empty */
			if (S_ISREG(inode->i_mode) && inode->i_size)
				return -EINVAL;

			set_compress_context(inode);
		}
	}

	if ((toggled & F2FS_NOCOMP_FL) && (cur_flags & F2FS_COMPR_FL))
		return -EINVAL;

	fi->i_flags = iflags | (fi->i_flags & ~mask);
	f2fs_bug_on(sbi, (fi->i_flags & F2FS_COMPR_FL) &&
					(fi->i_flags & F2FS_NOCOMP_FL));

	/* mirror the project-inherit bit into the in-memory inode flags */
	if (fi->i_flags & F2FS_PROJINHERIT_FL)
		set_inode_flag(inode, FI_PROJ_INHERIT);
	else
		clear_inode_flag(inode, FI_PROJ_INHERIT);

	inode->i_ctime = current_time(inode);
	f2fs_set_inode_flags(inode);
	f2fs_mark_inode_dirty_sync(inode, true);

	return 0;
}

M
Miklos Szeredi 已提交
1877
/* FS_IOC_[GS]ETFLAGS and FS_IOC_FS[GS]ETXATTR support */
1878 1879 1880 1881 1882 1883

/*
 * To make a new on-disk f2fs i_flag gettable via FS_IOC_GETFLAGS, add an entry
 * for it to f2fs_fsflags_map[], and add its FS_*_FL equivalent to
 * F2FS_GETTABLE_FS_FL.  To also make it settable via FS_IOC_SETFLAGS, also add
 * its FS_*_FL equivalent to F2FS_SETTABLE_FS_FL.
M
Miklos Szeredi 已提交
1884 1885 1886
 *
 * Translating flags to fsx_flags value used by FS_IOC_FSGETXATTR and
 * FS_IOC_FSSETXATTR is done by the VFS.
1887 1888 1889 1890 1891 1892
 */

static const struct {
	u32 iflag;
	u32 fsflag;
} f2fs_fsflags_map[] = {
C
Chao Yu 已提交
1893
	{ F2FS_COMPR_FL,	FS_COMPR_FL },
1894 1895 1896 1897 1898
	{ F2FS_SYNC_FL,		FS_SYNC_FL },
	{ F2FS_IMMUTABLE_FL,	FS_IMMUTABLE_FL },
	{ F2FS_APPEND_FL,	FS_APPEND_FL },
	{ F2FS_NODUMP_FL,	FS_NODUMP_FL },
	{ F2FS_NOATIME_FL,	FS_NOATIME_FL },
C
Chao Yu 已提交
1899
	{ F2FS_NOCOMP_FL,	FS_NOCOMP_FL },
1900 1901 1902
	{ F2FS_INDEX_FL,	FS_INDEX_FL },
	{ F2FS_DIRSYNC_FL,	FS_DIRSYNC_FL },
	{ F2FS_PROJINHERIT_FL,	FS_PROJINHERIT_FL },
1903
	{ F2FS_CASEFOLD_FL,	FS_CASEFOLD_FL },
1904 1905 1906
};

/* FS_*_FL flags listed as gettable (see the FS_IOC_GETFLAGS note above). */
#define F2FS_GETTABLE_FS_FL (					\
		FS_COMPR_FL | FS_SYNC_FL |			\
		FS_IMMUTABLE_FL | FS_APPEND_FL |		\
		FS_NODUMP_FL | FS_NOATIME_FL |			\
		FS_NOCOMP_FL | FS_INDEX_FL |			\
		FS_DIRSYNC_FL | FS_PROJINHERIT_FL |		\
		FS_ENCRYPT_FL | FS_INLINE_DATA_FL |		\
		FS_NOCOW_FL | FS_VERITY_FL |			\
		FS_CASEFOLD_FL)
1922 1923

/* FS_*_FL flags listed as settable (see the FS_IOC_SETFLAGS note above). */
#define F2FS_SETTABLE_FS_FL (					\
		FS_COMPR_FL | FS_SYNC_FL |			\
		FS_IMMUTABLE_FL | FS_APPEND_FL |		\
		FS_NODUMP_FL | FS_NOATIME_FL |			\
		FS_NOCOMP_FL | FS_DIRSYNC_FL |			\
		FS_PROJINHERIT_FL | FS_CASEFOLD_FL)
1934 1935 1936 1937 1938 1939 1940 1941 1942 1943 1944 1945 1946 1947 1948 1949 1950 1951 1952 1953 1954 1955 1956 1957 1958 1959 1960

/*
 * Convert f2fs on-disk i_flags to FS_IOC_{GET,SET}FLAGS flags.
 *
 * Returns the OR of the fsflag of every f2fs_fsflags_map[] entry whose
 * iflag is set in @iflags; bits with no entry in the map are dropped.
 */
static inline u32 f2fs_iflags_to_fsflags(u32 iflags)
{
	u32 result = 0;
	int idx = 0;

	while (idx < ARRAY_SIZE(f2fs_fsflags_map)) {
		if (iflags & f2fs_fsflags_map[idx].iflag)
			result |= f2fs_fsflags_map[idx].fsflag;
		idx++;
	}

	return result;
}

/*
 * Convert FS_IOC_{GET,SET}FLAGS flags to f2fs on-disk i_flags.
 *
 * Returns the OR of the iflag of every f2fs_fsflags_map[] entry whose
 * fsflag is set in @fsflags; bits with no entry in the map are dropped.
 */
static inline u32 f2fs_fsflags_to_iflags(u32 fsflags)
{
	u32 result = 0;
	int idx = 0;

	while (idx < ARRAY_SIZE(f2fs_fsflags_map)) {
		if (fsflags & f2fs_fsflags_map[idx].fsflag)
			result |= f2fs_fsflags_map[idx].iflag;
		idx++;
	}

	return result;
}

C
Chao Yu 已提交
1961 1962 1963 1964 1965 1966 1967
static int f2fs_ioc_getversion(struct file *filp, unsigned long arg)
{
	struct inode *inode = file_inode(filp);

	return put_user(inode->i_generation, (int __user *)arg);
}

J
Jaegeuk Kim 已提交
1968 1969 1970
static int f2fs_ioc_start_atomic_write(struct file *filp)
{
	struct inode *inode = file_inode(filp);
1971 1972
	struct f2fs_inode_info *fi = F2FS_I(inode);
	struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
1973
	int ret;
J
Jaegeuk Kim 已提交
1974

1975
	if (!inode_owner_or_capable(&init_user_ns, inode))
J
Jaegeuk Kim 已提交
1976 1977
		return -EACCES;

1978 1979 1980
	if (!S_ISREG(inode->i_mode))
		return -EINVAL;

1981 1982 1983
	if (filp->f_flags & O_DIRECT)
		return -EINVAL;

1984 1985 1986 1987
	ret = mnt_want_write_file(filp);
	if (ret)
		return ret;

1988 1989
	inode_lock(inode);

C
Chao Yu 已提交
1990 1991
	f2fs_disable_compressed_file(inode);

1992 1993 1994
	if (f2fs_is_atomic_file(inode)) {
		if (is_inode_flag_set(inode, FI_ATOMIC_REVOKE_REQUEST))
			ret = -EINVAL;
1995
		goto out;
1996
	}
J
Jaegeuk Kim 已提交
1997

1998 1999
	ret = f2fs_convert_inline_inode(inode);
	if (ret)
2000
		goto out;
J
Jaegeuk Kim 已提交
2001

2002 2003
	down_write(&F2FS_I(inode)->i_gc_rwsem[WRITE]);

2004 2005 2006 2007 2008
	/*
	 * Should wait end_io to count F2FS_WB_CP_DATA correctly by
	 * f2fs_is_atomic_file.
	 */
	if (get_dirty_pages(inode))
2009 2010
		f2fs_warn(F2FS_I_SB(inode), "Unexpected flush for atomic writes: ino=%lu, npages=%u",
			  inode->i_ino, get_dirty_pages(inode));
2011
	ret = filemap_write_and_wait_range(inode->i_mapping, 0, LLONG_MAX);
2012 2013
	if (ret) {
		up_write(&F2FS_I(inode)->i_gc_rwsem[WRITE]);
2014
		goto out;
2015
	}
2016

2017 2018 2019
	spin_lock(&sbi->inode_lock[ATOMIC_FILE]);
	if (list_empty(&fi->inmem_ilist))
		list_add_tail(&fi->inmem_ilist, &sbi->inode_list[ATOMIC_FILE]);
2020
	sbi->atomic_files++;
2021 2022 2023
	spin_unlock(&sbi->inode_lock[ATOMIC_FILE]);

	/* add inode in inmem_list first and set atomic_file */
2024
	set_inode_flag(inode, FI_ATOMIC_FILE);
2025
	clear_inode_flag(inode, FI_ATOMIC_REVOKE_REQUEST);
2026
	up_write(&F2FS_I(inode)->i_gc_rwsem[WRITE]);
2027

2028
	f2fs_update_time(F2FS_I_SB(inode), REQ_TIME);
2029
	F2FS_I(inode)->inmem_task = current;
2030
	stat_update_max_atomic_write(inode);
2031
out:
2032
	inode_unlock(inode);
2033
	mnt_drop_write_file(filp);
2034
	return ret;
J
Jaegeuk Kim 已提交
2035 2036 2037 2038 2039 2040 2041
}

static int f2fs_ioc_commit_atomic_write(struct file *filp)
{
	struct inode *inode = file_inode(filp);
	int ret;

2042
	if (!inode_owner_or_capable(&init_user_ns, inode))
J
Jaegeuk Kim 已提交
2043 2044 2045 2046 2047 2048
		return -EACCES;

	ret = mnt_want_write_file(filp);
	if (ret)
		return ret;

2049
	f2fs_balance_fs(F2FS_I_SB(inode), true);
2050

2051
	inode_lock(inode);
2052

2053 2054
	if (f2fs_is_volatile_file(inode)) {
		ret = -EINVAL;
2055
		goto err_out;
2056
	}
2057

2058
	if (f2fs_is_atomic_file(inode)) {
C
Chao Yu 已提交
2059
		ret = f2fs_commit_inmem_pages(inode);
C
Chao Yu 已提交
2060
		if (ret)
2061
			goto err_out;
C
Chao Yu 已提交
2062

2063
		ret = f2fs_do_sync_file(filp, 0, LLONG_MAX, 0, true);
2064 2065
		if (!ret)
			f2fs_drop_inmem_pages(inode);
2066
	} else {
2067
		ret = f2fs_do_sync_file(filp, 0, LLONG_MAX, 1, false);
2068
	}
2069
err_out:
2070 2071 2072 2073
	if (is_inode_flag_set(inode, FI_ATOMIC_REVOKE_REQUEST)) {
		clear_inode_flag(inode, FI_ATOMIC_REVOKE_REQUEST);
		ret = -EINVAL;
	}
2074
	inode_unlock(inode);
J
Jaegeuk Kim 已提交
2075 2076 2077 2078
	mnt_drop_write_file(filp);
	return ret;
}

2079 2080 2081
static int f2fs_ioc_start_volatile_write(struct file *filp)
{
	struct inode *inode = file_inode(filp);
2082
	int ret;
2083

2084
	if (!inode_owner_or_capable(&init_user_ns, inode))
2085 2086
		return -EACCES;

2087 2088 2089
	if (!S_ISREG(inode->i_mode))
		return -EINVAL;

2090 2091 2092 2093
	ret = mnt_want_write_file(filp);
	if (ret)
		return ret;

2094 2095
	inode_lock(inode);

2096
	if (f2fs_is_volatile_file(inode))
2097
		goto out;
2098

2099 2100
	ret = f2fs_convert_inline_inode(inode);
	if (ret)
2101
		goto out;
2102

2103 2104 2105
	stat_inc_volatile_write(inode);
	stat_update_max_volatile_write(inode);

2106
	set_inode_flag(inode, FI_VOLATILE_FILE);
2107
	f2fs_update_time(F2FS_I_SB(inode), REQ_TIME);
2108
out:
2109
	inode_unlock(inode);
2110 2111
	mnt_drop_write_file(filp);
	return ret;
2112 2113
}

2114 2115 2116
static int f2fs_ioc_release_volatile_write(struct file *filp)
{
	struct inode *inode = file_inode(filp);
2117
	int ret;
2118

2119
	if (!inode_owner_or_capable(&init_user_ns, inode))
2120 2121
		return -EACCES;

2122 2123 2124 2125
	ret = mnt_want_write_file(filp);
	if (ret)
		return ret;

2126 2127
	inode_lock(inode);

2128
	if (!f2fs_is_volatile_file(inode))
2129
		goto out;
2130

2131 2132 2133 2134
	if (!f2fs_is_first_block_written(inode)) {
		ret = truncate_partial_data_page(inode, 0, true);
		goto out;
	}
2135

2136 2137
	ret = punch_hole(inode, 0, F2FS_BLKSIZE);
out:
2138
	inode_unlock(inode);
2139 2140
	mnt_drop_write_file(filp);
	return ret;
2141 2142 2143 2144 2145 2146 2147
}

static int f2fs_ioc_abort_volatile_write(struct file *filp)
{
	struct inode *inode = file_inode(filp);
	int ret;

2148
	if (!inode_owner_or_capable(&init_user_ns, inode))
2149 2150 2151 2152 2153 2154
		return -EACCES;

	ret = mnt_want_write_file(filp);
	if (ret)
		return ret;

2155 2156
	inode_lock(inode);

2157
	if (f2fs_is_atomic_file(inode))
C
Chao Yu 已提交
2158
		f2fs_drop_inmem_pages(inode);
2159
	if (f2fs_is_volatile_file(inode)) {
2160
		clear_inode_flag(inode, FI_VOLATILE_FILE);
2161
		stat_dec_volatile_write(inode);
2162
		ret = f2fs_do_sync_file(filp, 0, LLONG_MAX, 0, true);
2163
	}
2164

2165 2166
	clear_inode_flag(inode, FI_ATOMIC_REVOKE_REQUEST);

2167 2168
	inode_unlock(inode);

2169
	mnt_drop_write_file(filp);
2170
	f2fs_update_time(F2FS_I_SB(inode), REQ_TIME);
2171 2172 2173
	return ret;
}

J
Jaegeuk Kim 已提交
2174 2175 2176 2177 2178 2179
static int f2fs_ioc_shutdown(struct file *filp, unsigned long arg)
{
	struct inode *inode = file_inode(filp);
	struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
	struct super_block *sb = sbi->sb;
	__u32 in;
2180
	int ret = 0;
J
Jaegeuk Kim 已提交
2181 2182 2183 2184 2185 2186 2187

	if (!capable(CAP_SYS_ADMIN))
		return -EPERM;

	if (get_user(in, (__u32 __user *)arg))
		return -EFAULT;

2188 2189
	if (in != F2FS_GOING_DOWN_FULLSYNC) {
		ret = mnt_want_write_file(filp);
2190 2191 2192 2193 2194 2195 2196
		if (ret) {
			if (ret == -EROFS) {
				ret = 0;
				f2fs_stop_checkpoint(sbi, false);
				set_sbi_flag(sbi, SBI_IS_SHUTDOWN);
				trace_f2fs_shutdown(sbi, in, ret);
			}
2197
			return ret;
2198
		}
2199
	}
2200

J
Jaegeuk Kim 已提交
2201 2202
	switch (in) {
	case F2FS_GOING_DOWN_FULLSYNC:
2203 2204
		ret = freeze_bdev(sb->s_bdev);
		if (ret)
2205
			goto out;
2206 2207 2208
		f2fs_stop_checkpoint(sbi, false);
		set_sbi_flag(sbi, SBI_IS_SHUTDOWN);
		thaw_bdev(sb->s_bdev);
J
Jaegeuk Kim 已提交
2209 2210 2211
		break;
	case F2FS_GOING_DOWN_METASYNC:
		/* do checkpoint only */
2212 2213 2214
		ret = f2fs_sync_fs(sb, 1);
		if (ret)
			goto out;
2215
		f2fs_stop_checkpoint(sbi, false);
2216
		set_sbi_flag(sbi, SBI_IS_SHUTDOWN);
J
Jaegeuk Kim 已提交
2217 2218
		break;
	case F2FS_GOING_DOWN_NOSYNC:
2219
		f2fs_stop_checkpoint(sbi, false);
2220
		set_sbi_flag(sbi, SBI_IS_SHUTDOWN);
J
Jaegeuk Kim 已提交
2221
		break;
2222
	case F2FS_GOING_DOWN_METAFLUSH:
C
Chao Yu 已提交
2223
		f2fs_sync_meta_pages(sbi, META, LONG_MAX, FS_META_IO);
2224
		f2fs_stop_checkpoint(sbi, false);
2225
		set_sbi_flag(sbi, SBI_IS_SHUTDOWN);
2226
		break;
2227 2228
	case F2FS_GOING_DOWN_NEED_FSCK:
		set_sbi_flag(sbi, SBI_NEED_FSCK);
2229 2230
		set_sbi_flag(sbi, SBI_CP_DISABLED_QUICK);
		set_sbi_flag(sbi, SBI_IS_DIRTY);
2231 2232
		/* do checkpoint only */
		ret = f2fs_sync_fs(sb, 1);
2233
		goto out;
J
Jaegeuk Kim 已提交
2234
	default:
2235 2236
		ret = -EINVAL;
		goto out;
J
Jaegeuk Kim 已提交
2237
	}
2238

C
Chao Yu 已提交
2239 2240
	f2fs_stop_gc_thread(sbi);
	f2fs_stop_discard_thread(sbi);
2241

C
Chao Yu 已提交
2242
	f2fs_drop_discard_cmd(sbi);
2243 2244
	clear_opt(sbi, DISCARD);

2245
	f2fs_update_time(sbi, REQ_TIME);
2246
out:
2247 2248
	if (in != F2FS_GOING_DOWN_FULLSYNC)
		mnt_drop_write_file(filp);
C
Chao Yu 已提交
2249 2250 2251

	trace_f2fs_shutdown(sbi, in, ret);

2252
	return ret;
J
Jaegeuk Kim 已提交
2253 2254
}

2255 2256 2257 2258 2259 2260 2261
static int f2fs_ioc_fitrim(struct file *filp, unsigned long arg)
{
	struct inode *inode = file_inode(filp);
	struct super_block *sb = inode->i_sb;
	struct request_queue *q = bdev_get_queue(sb->s_bdev);
	struct fstrim_range range;
	int ret;
2262

2263 2264
	if (!capable(CAP_SYS_ADMIN))
		return -EPERM;
2265

2266
	if (!f2fs_hw_support_discard(F2FS_SB(sb)))
2267
		return -EOPNOTSUPP;
2268

2269 2270 2271
	if (copy_from_user(&range, (struct fstrim_range __user *)arg,
				sizeof(range)))
		return -EFAULT;
2272

2273 2274 2275 2276
	ret = mnt_want_write_file(filp);
	if (ret)
		return ret;

2277 2278 2279
	range.minlen = max((unsigned int)range.minlen,
				q->limits.discard_granularity);
	ret = f2fs_trim_fs(F2FS_SB(sb), &range);
2280
	mnt_drop_write_file(filp);
2281 2282
	if (ret < 0)
		return ret;
2283

2284 2285 2286
	if (copy_to_user((struct fstrim_range __user *)arg, &range,
				sizeof(range)))
		return -EFAULT;
2287
	f2fs_update_time(F2FS_I_SB(inode), REQ_TIME);
2288 2289 2290
	return 0;
}

2291 2292 2293 2294 2295 2296 2297 2298 2299 2300 2301 2302 2303 2304
/* Return true if any of the 16 bytes of @u is non-zero, false otherwise. */
static bool uuid_is_nonzero(__u8 u[16])
{
	__u8 seen = 0;
	int pos;

	/* OR all bytes together; the result is non-zero iff some byte is */
	for (pos = 0; pos < 16; pos++)
		seen |= u[pos];

	return seen != 0;
}

static int f2fs_ioc_set_encryption_policy(struct file *filp, unsigned long arg)
{
	struct inode *inode = file_inode(filp);

2305
	if (!f2fs_sb_has_encrypt(F2FS_I_SB(inode)))
2306 2307
		return -EOPNOTSUPP;

2308
	f2fs_update_time(F2FS_I_SB(inode), REQ_TIME);
2309

2310
	return fscrypt_ioctl_set_policy(filp, (const void __user *)arg);
2311 2312 2313 2314
}

static int f2fs_ioc_get_encryption_policy(struct file *filp, unsigned long arg)
{
2315
	if (!f2fs_sb_has_encrypt(F2FS_I_SB(file_inode(filp))))
2316
		return -EOPNOTSUPP;
2317
	return fscrypt_ioctl_get_policy(filp, (void __user *)arg);
2318 2319 2320 2321 2322 2323 2324 2325
}

static int f2fs_ioc_get_encryption_pwsalt(struct file *filp, unsigned long arg)
{
	struct inode *inode = file_inode(filp);
	struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
	int err;

2326
	if (!f2fs_sb_has_encrypt(sbi))
2327 2328 2329 2330 2331 2332
		return -EOPNOTSUPP;

	err = mnt_want_write_file(filp);
	if (err)
		return err;

2333
	down_write(&sbi->sb_lock);
2334 2335 2336 2337

	if (uuid_is_nonzero(sbi->raw_super->encrypt_pw_salt))
		goto got_it;

2338 2339 2340
	/* update superblock with uuid */
	generate_random_uuid(sbi->raw_super->encrypt_pw_salt);

C
Chao Yu 已提交
2341
	err = f2fs_commit_super(sbi, false);
2342 2343 2344
	if (err) {
		/* undo new data */
		memset(sbi->raw_super->encrypt_pw_salt, 0, 16);
2345
		goto out_err;
2346 2347 2348 2349
	}
got_it:
	if (copy_to_user((__u8 __user *)arg, sbi->raw_super->encrypt_pw_salt,
									16))
2350 2351
		err = -EFAULT;
out_err:
2352
	up_write(&sbi->sb_lock);
2353 2354
	mnt_drop_write_file(filp);
	return err;
2355 2356
}

E
Eric Biggers 已提交
2357 2358 2359 2360 2361 2362 2363 2364 2365 2366 2367 2368 2369 2370 2371 2372 2373 2374 2375 2376 2377 2378 2379 2380 2381 2382 2383 2384 2385 2386 2387 2388 2389 2390 2391 2392 2393 2394 2395 2396 2397 2398 2399
/*
 * Hand the request to fscrypt_ioctl_get_policy_ex() when the superblock
 * has the encrypt feature; otherwise return -EOPNOTSUPP.
 */
static int f2fs_ioc_get_encryption_policy_ex(struct file *filp,
					     unsigned long arg)
{
	struct f2fs_sb_info *sbi = F2FS_I_SB(file_inode(filp));

	if (f2fs_sb_has_encrypt(sbi))
		return fscrypt_ioctl_get_policy_ex(filp, (void __user *)arg);

	return -EOPNOTSUPP;
}

/*
 * Hand the request to fscrypt_ioctl_add_key() when the superblock has the
 * encrypt feature; otherwise return -EOPNOTSUPP.
 */
static int f2fs_ioc_add_encryption_key(struct file *filp, unsigned long arg)
{
	struct f2fs_sb_info *sbi = F2FS_I_SB(file_inode(filp));

	if (f2fs_sb_has_encrypt(sbi))
		return fscrypt_ioctl_add_key(filp, (void __user *)arg);

	return -EOPNOTSUPP;
}

/*
 * Hand the request to fscrypt_ioctl_remove_key() when the superblock has
 * the encrypt feature; otherwise return -EOPNOTSUPP.
 */
static int f2fs_ioc_remove_encryption_key(struct file *filp, unsigned long arg)
{
	struct f2fs_sb_info *sbi = F2FS_I_SB(file_inode(filp));

	if (f2fs_sb_has_encrypt(sbi))
		return fscrypt_ioctl_remove_key(filp, (void __user *)arg);

	return -EOPNOTSUPP;
}

/*
 * Hand the request to fscrypt_ioctl_remove_key_all_users() when the
 * superblock has the encrypt feature; otherwise return -EOPNOTSUPP.
 */
static int f2fs_ioc_remove_encryption_key_all_users(struct file *filp,
						    unsigned long arg)
{
	struct f2fs_sb_info *sbi = F2FS_I_SB(file_inode(filp));

	if (f2fs_sb_has_encrypt(sbi))
		return fscrypt_ioctl_remove_key_all_users(filp,
							  (void __user *)arg);

	return -EOPNOTSUPP;
}

/*
 * Hand the request to fscrypt_ioctl_get_key_status() when the superblock
 * has the encrypt feature; otherwise return -EOPNOTSUPP.
 */
static int f2fs_ioc_get_encryption_key_status(struct file *filp,
					      unsigned long arg)
{
	struct f2fs_sb_info *sbi = F2FS_I_SB(file_inode(filp));

	if (f2fs_sb_has_encrypt(sbi))
		return fscrypt_ioctl_get_key_status(filp, (void __user *)arg);

	return -EOPNOTSUPP;
}

2400 2401 2402 2403 2404 2405 2406 2407
/*
 * Hand the request to fscrypt_ioctl_get_nonce() when the superblock has
 * the encrypt feature; otherwise return -EOPNOTSUPP.
 */
static int f2fs_ioc_get_encryption_nonce(struct file *filp, unsigned long arg)
{
	struct f2fs_sb_info *sbi = F2FS_I_SB(file_inode(filp));

	if (f2fs_sb_has_encrypt(sbi))
		return fscrypt_ioctl_get_nonce(filp, (void __user *)arg);

	return -EOPNOTSUPP;
}

2408 2409 2410 2411
static int f2fs_ioc_gc(struct file *filp, unsigned long arg)
{
	struct inode *inode = file_inode(filp);
	struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
C
Chao Yu 已提交
2412
	__u32 sync;
2413
	int ret;
2414 2415 2416 2417

	if (!capable(CAP_SYS_ADMIN))
		return -EPERM;

C
Chao Yu 已提交
2418
	if (get_user(sync, (__u32 __user *)arg))
2419 2420
		return -EFAULT;

C
Chao Yu 已提交
2421 2422
	if (f2fs_readonly(sbi->sb))
		return -EROFS;
2423

2424 2425 2426 2427
	ret = mnt_want_write_file(filp);
	if (ret)
		return ret;

C
Chao Yu 已提交
2428
	if (!sync) {
C
Chao Yu 已提交
2429
		if (!down_write_trylock(&sbi->gc_lock)) {
2430 2431 2432
			ret = -EBUSY;
			goto out;
		}
C
Chao Yu 已提交
2433
	} else {
C
Chao Yu 已提交
2434
		down_write(&sbi->gc_lock);
2435 2436
	}

2437
	ret = f2fs_gc(sbi, sync, true, NULL_SEGNO);
2438 2439 2440
out:
	mnt_drop_write_file(filp);
	return ret;
2441 2442
}

2443
static int __f2fs_ioc_gc_range(struct file *filp, struct f2fs_gc_range *range)
2444
{
2445
	struct f2fs_sb_info *sbi = F2FS_I_SB(file_inode(filp));
2446 2447 2448 2449 2450 2451 2452 2453
	u64 end;
	int ret;

	if (!capable(CAP_SYS_ADMIN))
		return -EPERM;
	if (f2fs_readonly(sbi->sb))
		return -EROFS;

2454 2455
	end = range->start + range->len;
	if (end < range->start || range->start < MAIN_BLKADDR(sbi) ||
2456
					end >= MAX_BLKADDR(sbi))
2457 2458
		return -EINVAL;

2459 2460 2461 2462 2463
	ret = mnt_want_write_file(filp);
	if (ret)
		return ret;

do_more:
2464
	if (!range->sync) {
C
Chao Yu 已提交
2465
		if (!down_write_trylock(&sbi->gc_lock)) {
2466 2467 2468 2469
			ret = -EBUSY;
			goto out;
		}
	} else {
C
Chao Yu 已提交
2470
		down_write(&sbi->gc_lock);
2471 2472
	}

2473
	ret = f2fs_gc(sbi, range->sync, true, GET_SEGNO(sbi, range->start));
2474 2475 2476 2477 2478
	if (ret) {
		if (ret == -EBUSY)
			ret = -EAGAIN;
		goto out;
	}
2479 2480
	range->start += BLKS_PER_SEC(sbi);
	if (range->start <= end)
2481 2482 2483 2484 2485 2486
		goto do_more;
out:
	mnt_drop_write_file(filp);
	return ret;
}

2487 2488 2489 2490 2491 2492 2493 2494 2495 2496
static int f2fs_ioc_gc_range(struct file *filp, unsigned long arg)
{
	struct f2fs_gc_range range;

	if (copy_from_user(&range, (struct f2fs_gc_range __user *)arg,
							sizeof(range)))
		return -EFAULT;
	return __f2fs_ioc_gc_range(filp, &range);
}

C
Chao Yu 已提交
2497
static int f2fs_ioc_write_checkpoint(struct file *filp, unsigned long arg)
2498 2499 2500
{
	struct inode *inode = file_inode(filp);
	struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
2501
	int ret;
2502 2503 2504 2505 2506 2507 2508

	if (!capable(CAP_SYS_ADMIN))
		return -EPERM;

	if (f2fs_readonly(sbi->sb))
		return -EROFS;

D
Daniel Rosenberg 已提交
2509
	if (unlikely(is_sbi_flag_set(sbi, SBI_CP_DISABLED))) {
2510
		f2fs_info(sbi, "Skipping Checkpoint. Checkpoints currently disabled.");
D
Daniel Rosenberg 已提交
2511 2512 2513
		return -EINVAL;
	}

2514 2515 2516 2517 2518 2519 2520 2521
	ret = mnt_want_write_file(filp);
	if (ret)
		return ret;

	ret = f2fs_sync_fs(sbi->sb, 1);

	mnt_drop_write_file(filp);
	return ret;
2522 2523
}

C
Chao Yu 已提交
2524 2525 2526 2527 2528
static int f2fs_defragment_range(struct f2fs_sb_info *sbi,
					struct file *filp,
					struct f2fs_defragment *range)
{
	struct inode *inode = file_inode(filp);
2529
	struct f2fs_map_blocks map = { .m_next_extent = NULL,
2530 2531
					.m_seg_type = NO_CHECK_TYPE ,
					.m_may_create = false };
2532
	struct extent_info ei = {0, 0, 0};
2533
	pgoff_t pg_start, pg_end, next_pgofs;
2534
	unsigned int blk_per_seg = sbi->blocks_per_seg;
C
Chao Yu 已提交
2535 2536 2537 2538 2539 2540
	unsigned int total = 0, sec_num;
	block_t blk_end = 0;
	bool fragmented = false;
	int err;

	/* if in-place-update policy is enabled, don't waste time here */
C
Chao Yu 已提交
2541
	if (f2fs_should_update_inplace(inode, NULL))
C
Chao Yu 已提交
2542 2543
		return -EINVAL;

2544 2545
	pg_start = range->start >> PAGE_SHIFT;
	pg_end = (range->start + range->len) >> PAGE_SHIFT;
C
Chao Yu 已提交
2546

J
Jaegeuk Kim 已提交
2547
	f2fs_balance_fs(sbi, true);
C
Chao Yu 已提交
2548

A
Al Viro 已提交
2549
	inode_lock(inode);
C
Chao Yu 已提交
2550 2551 2552

	/* writeback all dirty pages in the range */
	err = filemap_write_and_wait_range(inode->i_mapping, range->start,
2553
						range->start + range->len - 1);
C
Chao Yu 已提交
2554 2555 2556 2557 2558 2559 2560 2561 2562 2563 2564 2565 2566
	if (err)
		goto out;

	/*
	 * lookup mapping info in extent cache, skip defragmenting if physical
	 * block addresses are continuous.
	 */
	if (f2fs_lookup_extent_cache(inode, pg_start, &ei)) {
		if (ei.fofs + ei.len >= pg_end)
			goto out;
	}

	map.m_lblk = pg_start;
2567
	map.m_next_pgofs = &next_pgofs;
C
Chao Yu 已提交
2568 2569 2570 2571 2572 2573 2574

	/*
	 * lookup mapping info in dnode page cache, skip defragmenting if all
	 * physical block addresses are continuous even if there are hole(s)
	 * in logical blocks.
	 */
	while (map.m_lblk < pg_end) {
F
Fan Li 已提交
2575
		map.m_len = pg_end - map.m_lblk;
2576
		err = f2fs_map_blocks(inode, &map, 0, F2FS_GET_BLOCK_DEFAULT);
C
Chao Yu 已提交
2577 2578 2579 2580
		if (err)
			goto out;

		if (!(map.m_flags & F2FS_MAP_FLAGS)) {
2581
			map.m_lblk = next_pgofs;
C
Chao Yu 已提交
2582 2583 2584
			continue;
		}

2585
		if (blk_end && blk_end != map.m_pblk)
C
Chao Yu 已提交
2586
			fragmented = true;
2587 2588 2589 2590

		/* record total count of block that we're going to move */
		total += map.m_len;

C
Chao Yu 已提交
2591 2592 2593 2594 2595
		blk_end = map.m_pblk + map.m_len;

		map.m_lblk += map.m_len;
	}

2596 2597
	if (!fragmented) {
		total = 0;
C
Chao Yu 已提交
2598
		goto out;
2599
	}
C
Chao Yu 已提交
2600

2601
	sec_num = DIV_ROUND_UP(total, BLKS_PER_SEC(sbi));
C
Chao Yu 已提交
2602 2603 2604 2605 2606 2607

	/*
	 * make sure there are enough free section for LFS allocation, this can
	 * avoid defragment running in SSR mode when free section are allocated
	 * intensively
	 */
2608
	if (has_not_enough_free_secs(sbi, 0, sec_num)) {
C
Chao Yu 已提交
2609 2610 2611 2612
		err = -EAGAIN;
		goto out;
	}

2613 2614 2615 2616
	map.m_lblk = pg_start;
	map.m_len = pg_end - pg_start;
	total = 0;

C
Chao Yu 已提交
2617 2618 2619 2620 2621
	while (map.m_lblk < pg_end) {
		pgoff_t idx;
		int cnt = 0;

do_map:
F
Fan Li 已提交
2622
		map.m_len = pg_end - map.m_lblk;
2623
		err = f2fs_map_blocks(inode, &map, 0, F2FS_GET_BLOCK_DEFAULT);
C
Chao Yu 已提交
2624 2625 2626 2627
		if (err)
			goto clear_out;

		if (!(map.m_flags & F2FS_MAP_FLAGS)) {
2628
			map.m_lblk = next_pgofs;
2629
			goto check;
C
Chao Yu 已提交
2630 2631
		}

2632
		set_inode_flag(inode, FI_DO_DEFRAG);
C
Chao Yu 已提交
2633 2634 2635 2636 2637

		idx = map.m_lblk;
		while (idx < map.m_lblk + map.m_len && cnt < blk_per_seg) {
			struct page *page;

C
Chao Yu 已提交
2638
			page = f2fs_get_lock_data_page(inode, idx, true);
C
Chao Yu 已提交
2639 2640 2641 2642 2643 2644 2645 2646 2647 2648 2649 2650 2651 2652
			if (IS_ERR(page)) {
				err = PTR_ERR(page);
				goto clear_out;
			}

			set_page_dirty(page);
			f2fs_put_page(page, 1);

			idx++;
			cnt++;
			total++;
		}

		map.m_lblk = idx;
2653 2654
check:
		if (map.m_lblk < pg_end && cnt < blk_per_seg)
C
Chao Yu 已提交
2655 2656
			goto do_map;

2657
		clear_inode_flag(inode, FI_DO_DEFRAG);
C
Chao Yu 已提交
2658 2659 2660 2661 2662 2663

		err = filemap_fdatawrite(inode->i_mapping);
		if (err)
			goto out;
	}
clear_out:
2664
	clear_inode_flag(inode, FI_DO_DEFRAG);
C
Chao Yu 已提交
2665
out:
A
Al Viro 已提交
2666
	inode_unlock(inode);
C
Chao Yu 已提交
2667
	if (!err)
2668
		range->len = (u64)total << PAGE_SHIFT;
C
Chao Yu 已提交
2669 2670 2671 2672 2673 2674 2675 2676 2677 2678 2679 2680 2681
	return err;
}

static int f2fs_ioc_defragment(struct file *filp, unsigned long arg)
{
	struct inode *inode = file_inode(filp);
	struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
	struct f2fs_defragment range;
	int err;

	if (!capable(CAP_SYS_ADMIN))
		return -EPERM;

2682
	if (!S_ISREG(inode->i_mode) || f2fs_is_atomic_file(inode))
C
Chao Yu 已提交
2683 2684
		return -EINVAL;

2685 2686
	if (f2fs_readonly(sbi->sb))
		return -EROFS;
C
Chao Yu 已提交
2687 2688

	if (copy_from_user(&range, (struct f2fs_defragment __user *)arg,
2689 2690
							sizeof(range)))
		return -EFAULT;
C
Chao Yu 已提交
2691 2692

	/* verify alignment of offset & size */
2693 2694
	if (range.start & (F2FS_BLKSIZE - 1) || range.len & (F2FS_BLKSIZE - 1))
		return -EINVAL;
C
Chao Yu 已提交
2695

S
Sheng Yong 已提交
2696
	if (unlikely((range.start + range.len) >> PAGE_SHIFT >
2697
					max_file_blocks(inode)))
2698 2699 2700 2701 2702
		return -EINVAL;

	err = mnt_want_write_file(filp);
	if (err)
		return err;
S
Sheng Yong 已提交
2703

C
Chao Yu 已提交
2704
	err = f2fs_defragment_range(sbi, filp, &range);
2705 2706
	mnt_drop_write_file(filp);

2707
	f2fs_update_time(sbi, REQ_TIME);
C
Chao Yu 已提交
2708
	if (err < 0)
2709
		return err;
C
Chao Yu 已提交
2710 2711 2712

	if (copy_to_user((struct f2fs_defragment __user *)arg, &range,
							sizeof(range)))
2713 2714 2715
		return -EFAULT;

	return 0;
C
Chao Yu 已提交
2716 2717
}

2718 2719 2720 2721 2722 2723 2724 2725 2726 2727 2728 2729 2730 2731 2732 2733 2734
/*
 * Move @len bytes of block mappings from @file_in at @pos_in to @file_out
 * at @pos_out via __exchange_data_block().
 *
 * Both files must be regular, unencrypted and on the same mount and
 * superblock. @pos_in, @pos_out and the end of the source range must be
 * F2FS_BLKSIZE aligned; a range ending exactly at the source's i_size is
 * rounded up to the block boundary. @len == 0 means "up to the end of the
 * source file". For a move within one file the destination must not start
 * inside the source range.
 *
 * Locking: src is inode-locked; dst's inode lock and i_gc_rwsem are only
 * tried, returning -EBUSY on contention.
 *
 * Returns 0 on success, -EXDEV, -EROFS, -EINVAL, -EOPNOTSUPP, -EBUSY or
 * another negative errno.
 */
static int f2fs_move_file_range(struct file *file_in, loff_t pos_in,
			struct file *file_out, loff_t pos_out, size_t len)
{
	struct inode *src = file_inode(file_in);
	struct inode *dst = file_inode(file_out);
	struct f2fs_sb_info *sbi = F2FS_I_SB(src);
	size_t olen = len, dst_max_i_size = 0;
	size_t dst_osize;
	int ret;

	if (file_in->f_path.mnt != file_out->f_path.mnt ||
				src->i_sb != dst->i_sb)
		return -EXDEV;

	if (unlikely(f2fs_readonly(src->i_sb)))
		return -EROFS;

	if (!S_ISREG(src->i_mode) || !S_ISREG(dst->i_mode))
		return -EINVAL;

	if (IS_ENCRYPTED(src) || IS_ENCRYPTED(dst))
		return -EOPNOTSUPP;

	if (pos_out < 0 || pos_in < 0)
		return -EINVAL;

	if (src == dst) {
		if (pos_in == pos_out)
			return 0;
		if (pos_out > pos_in && pos_out < pos_in + len)
			return -EINVAL;
	}

	inode_lock(src);
	if (src != dst) {
		ret = -EBUSY;
		if (!inode_trylock(dst))
			goto out;
	}

	ret = -EINVAL;
	if (pos_in + len > src->i_size || pos_in + len < pos_in)
		goto out_unlock;
	if (len == 0)
		olen = len = src->i_size - pos_in;
	/* a range reaching EOF is extended to cover the whole last block */
	if (pos_in + len == src->i_size)
		len = ALIGN(src->i_size, F2FS_BLKSIZE) - pos_in;
	if (len == 0) {
		ret = 0;
		goto out_unlock;
	}

	dst_osize = dst->i_size;
	if (pos_out + olen > dst->i_size)
		dst_max_i_size = pos_out + olen;

	/* verify the end result is block aligned */
	if (!IS_ALIGNED(pos_in, F2FS_BLKSIZE) ||
			!IS_ALIGNED(pos_in + len, F2FS_BLKSIZE) ||
			!IS_ALIGNED(pos_out, F2FS_BLKSIZE))
		goto out_unlock;

	ret = f2fs_convert_inline_inode(src);
	if (ret)
		goto out_unlock;

	ret = f2fs_convert_inline_inode(dst);
	if (ret)
		goto out_unlock;

	/* write out all dirty pages from offset */
	ret = filemap_write_and_wait_range(src->i_mapping,
					pos_in, pos_in + len);
	if (ret)
		goto out_unlock;

	ret = filemap_write_and_wait_range(dst->i_mapping,
					pos_out, pos_out + len);
	if (ret)
		goto out_unlock;

	f2fs_balance_fs(sbi, true);

	down_write(&F2FS_I(src)->i_gc_rwsem[WRITE]);
	if (src != dst) {
		ret = -EBUSY;
		if (!down_write_trylock(&F2FS_I(dst)->i_gc_rwsem[WRITE]))
			goto out_src;
	}

	f2fs_lock_op(sbi);
	ret = __exchange_data_block(src, dst, pos_in >> F2FS_BLKSIZE_BITS,
				pos_out >> F2FS_BLKSIZE_BITS,
				len >> F2FS_BLKSIZE_BITS, false);

	if (!ret) {
		/* grow dst if the move extended it, else restore its old size */
		if (dst_max_i_size)
			f2fs_i_size_write(dst, dst_max_i_size);
		else if (dst_osize != dst->i_size)
			f2fs_i_size_write(dst, dst_osize);
	}
	f2fs_unlock_op(sbi);

	if (src != dst)
		up_write(&F2FS_I(dst)->i_gc_rwsem[WRITE]);
out_src:
	up_write(&F2FS_I(src)->i_gc_rwsem[WRITE]);
out_unlock:
	if (src != dst)
		inode_unlock(dst);
out:
	inode_unlock(src);
	return ret;
}

2833 2834
static int __f2fs_ioc_move_range(struct file *filp,
				struct f2fs_move_range *range)
2835 2836 2837 2838 2839 2840 2841 2842
{
	struct fd dst;
	int err;

	if (!(filp->f_mode & FMODE_READ) ||
			!(filp->f_mode & FMODE_WRITE))
		return -EBADF;

2843
	dst = fdget(range->dst_fd);
2844 2845 2846 2847 2848 2849 2850 2851 2852 2853 2854 2855
	if (!dst.file)
		return -EBADF;

	if (!(dst.file->f_mode & FMODE_WRITE)) {
		err = -EBADF;
		goto err_out;
	}

	err = mnt_want_write_file(filp);
	if (err)
		goto err_out;

2856 2857
	err = f2fs_move_file_range(filp, range->pos_in, dst.file,
					range->pos_out, range->len);
2858 2859 2860 2861 2862 2863 2864

	mnt_drop_write_file(filp);
err_out:
	fdput(dst);
	return err;
}

2865 2866 2867 2868 2869 2870 2871 2872 2873 2874
static int f2fs_ioc_move_range(struct file *filp, unsigned long arg)
{
	struct f2fs_move_range range;

	if (copy_from_user(&range, (struct f2fs_move_range __user *)arg,
							sizeof(range)))
		return -EFAULT;
	return __f2fs_ioc_move_range(filp, &range);
}

2875 2876 2877 2878 2879 2880 2881 2882 2883 2884 2885 2886 2887 2888 2889 2890
static int f2fs_ioc_flush_device(struct file *filp, unsigned long arg)
{
	struct inode *inode = file_inode(filp);
	struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
	struct sit_info *sm = SIT_I(sbi);
	unsigned int start_segno = 0, end_segno = 0;
	unsigned int dev_start_segno = 0, dev_end_segno = 0;
	struct f2fs_flush_device range;
	int ret;

	if (!capable(CAP_SYS_ADMIN))
		return -EPERM;

	if (f2fs_readonly(sbi->sb))
		return -EROFS;

D
Daniel Rosenberg 已提交
2891 2892 2893
	if (unlikely(is_sbi_flag_set(sbi, SBI_CP_DISABLED)))
		return -EINVAL;

2894 2895 2896 2897
	if (copy_from_user(&range, (struct f2fs_flush_device __user *)arg,
							sizeof(range)))
		return -EFAULT;

2898
	if (!f2fs_is_multi_device(sbi) || sbi->s_ndevs - 1 <= range.dev_num ||
2899
			__is_large_section(sbi)) {
2900 2901
		f2fs_warn(sbi, "Can't flush %u in %d for segs_per_sec %u != 1",
			  range.dev_num, sbi->s_ndevs, sbi->segs_per_sec);
2902 2903 2904 2905 2906 2907 2908 2909 2910 2911 2912 2913 2914 2915 2916 2917 2918
		return -EINVAL;
	}

	ret = mnt_want_write_file(filp);
	if (ret)
		return ret;

	if (range.dev_num != 0)
		dev_start_segno = GET_SEGNO(sbi, FDEV(range.dev_num).start_blk);
	dev_end_segno = GET_SEGNO(sbi, FDEV(range.dev_num).end_blk);

	start_segno = sm->last_victim[FLUSH_DEVICE];
	if (start_segno < dev_start_segno || start_segno >= dev_end_segno)
		start_segno = dev_start_segno;
	end_segno = min(start_segno + range.segments, dev_end_segno);

	while (start_segno < end_segno) {
C
Chao Yu 已提交
2919
		if (!down_write_trylock(&sbi->gc_lock)) {
2920 2921 2922 2923 2924 2925 2926 2927 2928 2929 2930 2931 2932 2933 2934 2935 2936 2937
			ret = -EBUSY;
			goto out;
		}
		sm->last_victim[GC_CB] = end_segno + 1;
		sm->last_victim[GC_GREEDY] = end_segno + 1;
		sm->last_victim[ALLOC_NEXT] = end_segno + 1;
		ret = f2fs_gc(sbi, true, true, start_segno);
		if (ret == -EAGAIN)
			ret = 0;
		else if (ret < 0)
			break;
		start_segno++;
	}
out:
	mnt_drop_write_file(filp);
	return ret;
}

2938 2939 2940 2941 2942 2943 2944 2945 2946 2947
static int f2fs_ioc_get_features(struct file *filp, unsigned long arg)
{
	struct inode *inode = file_inode(filp);
	u32 sb_feature = le32_to_cpu(F2FS_I_SB(inode)->raw_super->feature);

	/* Must validate to set it with SQLite behavior in Android. */
	sb_feature |= F2FS_FEATURE_ATOMIC_WRITE;

	return put_user(sb_feature, (u32 __user *)arg);
}
2948

2949
#ifdef CONFIG_QUOTA
2950 2951 2952 2953 2954 2955 2956 2957 2958 2959 2960 2961 2962 2963 2964 2965 2966
/*
 * Transfer @inode's project-quota accounting to the dquot of @kprojid.
 *
 * A failing dqget() is reported to the caller rather than being treated as
 * success, so callers do not go on to record a project ID whose quota was
 * never transferred. If __dquot_transfer() fails, SBI_QUOTA_NEED_REPAIR is
 * set on the superblock and the error is returned.
 *
 * Returns 0 on success or a negative errno.
 */
int f2fs_transfer_project_quota(struct inode *inode, kprojid_t kprojid)
{
	struct dquot *transfer_to[MAXQUOTAS] = {};
	struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
	struct super_block *sb = sbi->sb;
	int err;

	transfer_to[PRJQUOTA] = dqget(sb, make_kqid_projid(kprojid));
	if (IS_ERR(transfer_to[PRJQUOTA]))
		return PTR_ERR(transfer_to[PRJQUOTA]);

	err = __dquot_transfer(inode, transfer_to);
	if (err)
		set_sbi_flag(sbi, SBI_QUOTA_NEED_REPAIR);
	dqput(transfer_to[PRJQUOTA]);
	return err;
}

M
Miklos Szeredi 已提交
2967
/*
 * Set the project ID of @inode to @projid and transfer its project quota.
 *
 * Without the project-quota superblock feature only F2FS_DEF_PROJID is
 * accepted (as a no-op); anything else yields -EOPNOTSUPP. With the feature
 * the inode must have extra attributes (-EOPNOTSUPP otherwise), must not be
 * a quota file (-EPERM) and its on-disk inode must have room for i_projid
 * (-EOVERFLOW). Setting the ID the inode already has is a no-op.
 *
 * Returns 0 on success or a negative errno.
 */
static int f2fs_ioc_setproject(struct inode *inode, __u32 projid)
{
	struct f2fs_inode_info *fi = F2FS_I(inode);
	struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
	struct page *ipage;
	kprojid_t kprojid;
	int err;

	if (!f2fs_sb_has_project_quota(sbi)) {
		if (projid != F2FS_DEF_PROJID)
			return -EOPNOTSUPP;
		else
			return 0;
	}

	if (!f2fs_has_extra_attr(inode))
		return -EOPNOTSUPP;

	kprojid = make_kprojid(&init_user_ns, (projid_t)projid);

	if (projid_eq(kprojid, F2FS_I(inode)->i_projid))
		return 0;

	err = -EPERM;
	/* Is it quota file? Do not allow user to mess with it */
	if (IS_NOQUOTA(inode))
		return err;

	/* the inode page is only needed to check that i_projid fits */
	ipage = f2fs_get_node_page(sbi, inode->i_ino);
	if (IS_ERR(ipage))
		return PTR_ERR(ipage);

	if (!F2FS_FITS_IN_INODE(F2FS_INODE(ipage), fi->i_extra_isize,
								i_projid)) {
		err = -EOVERFLOW;
		f2fs_put_page(ipage, 1);
		return err;
	}
	f2fs_put_page(ipage, 1);

	err = dquot_initialize(inode);
	if (err)
		return err;

	f2fs_lock_op(sbi);
	err = f2fs_transfer_project_quota(inode, kprojid);
	if (err)
		goto out_unlock;

	F2FS_I(inode)->i_projid = kprojid;
	inode->i_ctime = current_time(inode);
	f2fs_mark_inode_dirty_sync(inode, true);
out_unlock:
	f2fs_unlock_op(sbi);
	return err;
}
#else
3024 3025 3026 3027 3028
/* Stub for builds without CONFIG_QUOTA: nothing to transfer, always 0. */
int f2fs_transfer_project_quota(struct inode *inode, kprojid_t kprojid)
{
	return 0;
}

M
Miklos Szeredi 已提交
3029
/*
 * Variant for builds without CONFIG_QUOTA: only F2FS_DEF_PROJID is
 * accepted (returning 0); any other project ID yields -EOPNOTSUPP.
 */
static int f2fs_ioc_setproject(struct inode *inode, __u32 projid)
{
	if (projid != F2FS_DEF_PROJID)
		return -EOPNOTSUPP;
	return 0;
}
#endif

M
Miklos Szeredi 已提交
3037
int f2fs_fileattr_get(struct dentry *dentry, struct fileattr *fa)
3038
{
M
Miklos Szeredi 已提交
3039
	struct inode *inode = d_inode(dentry);
3040
	struct f2fs_inode_info *fi = F2FS_I(inode);
M
Miklos Szeredi 已提交
3041
	u32 fsflags = f2fs_iflags_to_fsflags(fi->i_flags);
3042

M
Miklos Szeredi 已提交
3043 3044 3045 3046 3047 3048 3049 3050 3051 3052
	if (IS_ENCRYPTED(inode))
		fsflags |= FS_ENCRYPT_FL;
	if (IS_VERITY(inode))
		fsflags |= FS_VERITY_FL;
	if (f2fs_has_inline_data(inode) || f2fs_has_inline_dentry(inode))
		fsflags |= FS_INLINE_DATA_FL;
	if (is_inode_flag_set(inode, FI_PIN_FILE))
		fsflags |= FS_NOCOW_FL;

	fileattr_fill_flags(fa, fsflags & F2FS_GETTABLE_FS_FL);
3053

3054
	if (f2fs_sb_has_project_quota(F2FS_I_SB(inode)))
3055
		fa->fsx_projid = from_kprojid(&init_user_ns, fi->i_projid);
3056

3057 3058 3059
	return 0;
}

M
Miklos Szeredi 已提交
3060 3061
int f2fs_fileattr_set(struct user_namespace *mnt_userns,
		      struct dentry *dentry, struct fileattr *fa)
3062
{
M
Miklos Szeredi 已提交
3063 3064
	struct inode *inode = d_inode(dentry);
	u32 fsflags = fa->flags, mask = F2FS_SETTABLE_FS_FL;
3065
	u32 iflags;
3066 3067
	int err;

M
Miklos Szeredi 已提交
3068 3069 3070 3071 3072
	if (unlikely(f2fs_cp_error(F2FS_I_SB(inode))))
		return -EIO;
	if (!f2fs_is_checkpoint_ready(F2FS_I_SB(inode)))
		return -ENOSPC;
	if (fsflags & ~F2FS_GETTABLE_FS_FL)
3073
		return -EOPNOTSUPP;
M
Miklos Szeredi 已提交
3074 3075 3076
	fsflags &= F2FS_SETTABLE_FS_FL;
	if (!fa->flags_valid)
		mask &= FS_COMMON_FL;
3077

M
Miklos Szeredi 已提交
3078
	iflags = f2fs_fsflags_to_iflags(fsflags);
3079
	if (f2fs_mask_flags(inode->i_mode, iflags) != iflags)
3080 3081
		return -EOPNOTSUPP;

M
Miklos Szeredi 已提交
3082 3083 3084
	err = f2fs_setflags_common(inode, iflags, f2fs_fsflags_to_iflags(mask));
	if (!err)
		err = f2fs_ioc_setproject(inode, fa->fsx_projid);
3085

3086
	return err;
3087
}
3088

3089 3090 3091 3092 3093 3094 3095
/*
 * f2fs_pin_file_control - track GC failures on a pinned file
 * @inode: file being checked
 * @inc:   when true, bump the GC_FAILURE_PIN counter before checking it
 *
 * Once the counter exceeds sbi->gc_pin_file_threshold the FI_PIN_FILE
 * flag is cleared, a warning is logged and -EAGAIN is returned.
 * Returns 0 while the counter is within the threshold.
 */
int f2fs_pin_file_control(struct inode *inode, bool inc)
{
	struct f2fs_inode_info *fi = F2FS_I(inode);
	struct f2fs_sb_info *sbi = F2FS_I_SB(inode);

	/* Use i_gc_failures for normal file as a risk signal. */
	if (inc)
		f2fs_i_gc_failures_write(inode,
				fi->i_gc_failures[GC_FAILURE_PIN] + 1);

	if (fi->i_gc_failures[GC_FAILURE_PIN] > sbi->gc_pin_file_threshold) {
		f2fs_warn(sbi, "%s: Enable GC = ino %lx after %x GC trials",
			  __func__, inode->i_ino,
			  fi->i_gc_failures[GC_FAILURE_PIN]);
		clear_inode_flag(inode, FI_PIN_FILE);
		return -EAGAIN;
	}
	return 0;
}

static int f2fs_ioc_set_pin_file(struct file *filp, unsigned long arg)
{
	struct inode *inode = file_inode(filp);
	__u32 pin;
	int ret = 0;

	if (get_user(pin, (__u32 __user *)arg))
		return -EFAULT;

	if (!S_ISREG(inode->i_mode))
		return -EINVAL;

	if (f2fs_readonly(F2FS_I_SB(inode)->sb))
		return -EROFS;

	ret = mnt_want_write_file(filp);
	if (ret)
		return ret;

	inode_lock(inode);

C
Chao Yu 已提交
3130
	if (f2fs_should_update_outplace(inode, NULL)) {
C
Chao Yu 已提交
3131 3132 3133 3134
		ret = -EINVAL;
		goto out;
	}

3135 3136
	if (!pin) {
		clear_inode_flag(inode, FI_PIN_FILE);
3137
		f2fs_i_gc_failures_write(inode, 0);
3138 3139 3140 3141 3142 3143 3144
		goto done;
	}

	if (f2fs_pin_file_control(inode, false)) {
		ret = -EAGAIN;
		goto out;
	}
C
Chao Yu 已提交
3145

3146 3147 3148 3149
	ret = f2fs_convert_inline_inode(inode);
	if (ret)
		goto out;

3150
	if (!f2fs_disable_compressed_file(inode)) {
C
Chao Yu 已提交
3151 3152 3153 3154
		ret = -EOPNOTSUPP;
		goto out;
	}

3155
	set_inode_flag(inode, FI_PIN_FILE);
3156
	ret = F2FS_I(inode)->i_gc_failures[GC_FAILURE_PIN];
3157 3158 3159 3160 3161 3162 3163 3164 3165 3166 3167 3168 3169 3170
done:
	f2fs_update_time(F2FS_I_SB(inode), REQ_TIME);
out:
	inode_unlock(inode);
	mnt_drop_write_file(filp);
	return ret;
}

static int f2fs_ioc_get_pin_file(struct file *filp, unsigned long arg)
{
	struct inode *inode = file_inode(filp);
	__u32 pin = 0;

	if (is_inode_flag_set(inode, FI_PIN_FILE))
3171
		pin = F2FS_I(inode)->i_gc_failures[GC_FAILURE_PIN];
3172 3173 3174
	return put_user(pin, (u32 __user *)arg);
}

3175 3176 3177 3178 3179 3180 3181 3182 3183 3184 3185 3186 3187 3188 3189
int f2fs_precache_extents(struct inode *inode)
{
	struct f2fs_inode_info *fi = F2FS_I(inode);
	struct f2fs_map_blocks map;
	pgoff_t m_next_extent;
	loff_t end;
	int err;

	if (is_inode_flag_set(inode, FI_NO_EXTENT))
		return -EOPNOTSUPP;

	map.m_lblk = 0;
	map.m_next_pgofs = NULL;
	map.m_next_extent = &m_next_extent;
	map.m_seg_type = NO_CHECK_TYPE;
3190
	map.m_may_create = false;
3191
	end = max_file_blocks(inode);
3192 3193 3194 3195

	while (map.m_lblk < end) {
		map.m_len = end - map.m_lblk;

C
Chao Yu 已提交
3196
		down_write(&fi->i_gc_rwsem[WRITE]);
3197
		err = f2fs_map_blocks(inode, &map, 0, F2FS_GET_BLOCK_PRECACHE);
C
Chao Yu 已提交
3198
		up_write(&fi->i_gc_rwsem[WRITE]);
3199 3200 3201 3202 3203 3204 3205 3206 3207 3208 3209 3210 3211 3212
		if (err)
			return err;

		map.m_lblk = m_next_extent;
	}

	return err;
}

/* ioctl entry point: precache extents for the file behind @filp; @arg is unused. */
static int f2fs_ioc_precache_extents(struct file *filp, unsigned long arg)
{
	struct inode *inode = file_inode(filp);

	return f2fs_precache_extents(inode);
}

3213 3214 3215 3216 3217 3218 3219 3220 3221 3222 3223 3224 3225 3226 3227
/*
 * f2fs_ioc_resize_fs - resize the filesystem to a user-supplied block count
 * @arg: user pointer to a __u64 holding the requested block count
 *
 * Returns -EPERM without CAP_SYS_ADMIN, -EROFS on a read-only filesystem,
 * -EFAULT if the argument cannot be read, otherwise the result of
 * f2fs_resize_fs().
 */
static int f2fs_ioc_resize_fs(struct file *filp, unsigned long arg)
{
	struct f2fs_sb_info *sbi = F2FS_I_SB(file_inode(filp));
	__u64 block_count;

	if (!capable(CAP_SYS_ADMIN))
		return -EPERM;

	if (f2fs_readonly(sbi->sb))
		return -EROFS;

	if (copy_from_user(&block_count, (void __user *)arg,
			   sizeof(block_count)))
		return -EFAULT;

	return f2fs_resize_fs(sbi, block_count);
}

E
Eric Biggers 已提交
3231 3232 3233 3234 3235 3236 3237 3238 3239 3240 3241 3242 3243 3244 3245 3246 3247 3248 3249 3250 3251 3252 3253 3254
/*
 * f2fs_ioc_enable_verity - FS_IOC_ENABLE_VERITY handler
 *
 * Returns -EOPNOTSUPP (and logs a warning) when the verity feature is not
 * enabled on the filesystem, otherwise the result of
 * fsverity_ioctl_enable().
 */
static int f2fs_ioc_enable_verity(struct file *filp, unsigned long arg)
{
	struct inode *inode = file_inode(filp);

	f2fs_update_time(F2FS_I_SB(inode), REQ_TIME);

	if (!f2fs_sb_has_verity(F2FS_I_SB(inode))) {
		/*
		 * No trailing newline: the other f2fs_warn() callers in this
		 * file pass unterminated messages, so an explicit "\n" here
		 * would produce an extra blank log line.
		 */
		f2fs_warn(F2FS_I_SB(inode),
			  "Can't enable fs-verity on inode %lu: the verity feature is not enabled on this filesystem.",
			  inode->i_ino);
		return -EOPNOTSUPP;
	}

	return fsverity_ioctl_enable(filp, (const void __user *)arg);
}

/*
 * FS_IOC_MEASURE_VERITY handler: forwards to fsverity_ioctl_measure() when
 * the verity feature is enabled on the filesystem, -EOPNOTSUPP otherwise.
 */
static int f2fs_ioc_measure_verity(struct file *filp, unsigned long arg)
{
	struct inode *inode = file_inode(filp);

	if (f2fs_sb_has_verity(F2FS_I_SB(inode)))
		return fsverity_ioctl_measure(filp, (void __user *)arg);

	return -EOPNOTSUPP;
}

3255 3256 3257 3258 3259 3260 3261 3262
/*
 * FS_IOC_READ_VERITY_METADATA handler: forwards to
 * fsverity_ioctl_read_metadata() when the verity feature is enabled on the
 * filesystem, -EOPNOTSUPP otherwise.
 */
static int f2fs_ioc_read_verity_metadata(struct file *filp, unsigned long arg)
{
	struct inode *inode = file_inode(filp);

	if (f2fs_sb_has_verity(F2FS_I_SB(inode)))
		return fsverity_ioctl_read_metadata(filp,
						(const void __user *)arg);

	return -EOPNOTSUPP;
}

3263
static int f2fs_ioc_getfslabel(struct file *filp, unsigned long arg)
C
Chao Yu 已提交
3264 3265 3266 3267 3268 3269 3270 3271 3272 3273 3274 3275 3276 3277 3278 3279 3280 3281 3282 3283 3284
{
	struct inode *inode = file_inode(filp);
	struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
	char *vbuf;
	int count;
	int err = 0;

	vbuf = f2fs_kzalloc(sbi, MAX_VOLUME_NAME, GFP_KERNEL);
	if (!vbuf)
		return -ENOMEM;

	down_read(&sbi->sb_lock);
	count = utf16s_to_utf8s(sbi->raw_super->volume_name,
			ARRAY_SIZE(sbi->raw_super->volume_name),
			UTF16_LITTLE_ENDIAN, vbuf, MAX_VOLUME_NAME);
	up_read(&sbi->sb_lock);

	if (copy_to_user((char __user *)arg, vbuf,
				min(FSLABEL_MAX, count)))
		err = -EFAULT;

C
Chao Yu 已提交
3285
	kfree(vbuf);
C
Chao Yu 已提交
3286 3287 3288
	return err;
}

3289
static int f2fs_ioc_setfslabel(struct file *filp, unsigned long arg)
C
Chao Yu 已提交
3290 3291 3292 3293 3294 3295 3296 3297 3298 3299 3300 3301 3302 3303 3304 3305 3306 3307 3308 3309 3310 3311 3312 3313 3314 3315 3316 3317 3318 3319 3320 3321 3322 3323 3324
{
	struct inode *inode = file_inode(filp);
	struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
	char *vbuf;
	int err = 0;

	if (!capable(CAP_SYS_ADMIN))
		return -EPERM;

	vbuf = strndup_user((const char __user *)arg, FSLABEL_MAX);
	if (IS_ERR(vbuf))
		return PTR_ERR(vbuf);

	err = mnt_want_write_file(filp);
	if (err)
		goto out;

	down_write(&sbi->sb_lock);

	memset(sbi->raw_super->volume_name, 0,
			sizeof(sbi->raw_super->volume_name));
	utf8s_to_utf16s(vbuf, strlen(vbuf), UTF16_LITTLE_ENDIAN,
			sbi->raw_super->volume_name,
			ARRAY_SIZE(sbi->raw_super->volume_name));

	err = f2fs_commit_super(sbi, false);

	up_write(&sbi->sb_lock);

	mnt_drop_write_file(filp);
out:
	kfree(vbuf);
	return err;
}

3325 3326 3327 3328 3329 3330 3331 3332 3333 3334 3335
static int f2fs_get_compress_blocks(struct file *filp, unsigned long arg)
{
	struct inode *inode = file_inode(filp);
	__u64 blocks;

	if (!f2fs_sb_has_compression(F2FS_I_SB(inode)))
		return -EOPNOTSUPP;

	if (!f2fs_compressed_file(inode))
		return -EINVAL;

3336
	blocks = atomic_read(&F2FS_I(inode)->i_compr_blocks);
3337 3338 3339
	return put_user(blocks, (u64 __user *)arg);
}

3340 3341 3342 3343 3344 3345 3346 3347 3348 3349 3350 3351 3352 3353 3354 3355 3356 3357 3358 3359 3360 3361 3362 3363 3364 3365 3366 3367 3368 3369 3370 3371 3372 3373 3374 3375 3376 3377 3378 3379 3380 3381 3382 3383 3384 3385 3386 3387 3388 3389 3390 3391 3392 3393 3394 3395 3396 3397 3398 3399 3400 3401 3402 3403 3404 3405 3406 3407 3408 3409 3410 3411 3412 3413 3414 3415 3416 3417 3418 3419 3420
/*
 * release_compress_blocks - release reserved blocks of compressed clusters
 * @dn:    dnode positioned at the first slot to process; dn->ofs_in_node
 *         is advanced as slots are consumed
 * @count: number of slots to process (the caller in this file rounds it
 *         up to a multiple of the cluster size)
 *
 * Returns the number of blocks released, or -EFSCORRUPTED when a block
 * address in the range fails validation.
 */
static int release_compress_blocks(struct dnode_of_data *dn, pgoff_t count)
{
	struct f2fs_sb_info *sbi = F2FS_I_SB(dn->inode);
	unsigned int released_blocks = 0;
	int cluster_size = F2FS_I(dn->inode)->i_cluster_size;
	block_t blkaddr;
	int i;

	/* Pass 1: validate every address in the range before changing anything. */
	for (i = 0; i < count; i++) {
		blkaddr = data_blkaddr(dn->inode, dn->node_page,
						dn->ofs_in_node + i);

		if (!__is_valid_data_blkaddr(blkaddr))
			continue;
		if (unlikely(!f2fs_is_valid_blkaddr(sbi, blkaddr,
					DATA_GENERIC_ENHANCE)))
			return -EFSCORRUPTED;
	}

	/* Pass 2: handle the range one cluster at a time. */
	while (count) {
		int compr_blocks = 0;

		for (i = 0; i < cluster_size; i++, dn->ofs_in_node++) {
			blkaddr = f2fs_data_blkaddr(dn);

			if (i == 0) {
				if (blkaddr == COMPRESS_ADDR)
					continue;
				/*
				 * First slot is not COMPRESS_ADDR: skip the
				 * whole cluster.  The goto bypasses the loop
				 * increment, so the net advance is exactly
				 * cluster_size slots.
				 */
				dn->ofs_in_node += cluster_size;
				goto next;
			}

			if (__is_valid_data_blkaddr(blkaddr))
				compr_blocks++;

			if (blkaddr != NEW_ADDR)
				continue;

			/* Turn a NEW_ADDR slot into NULL_ADDR. */
			dn->data_blkaddr = NULL_ADDR;
			f2fs_set_data_blkaddr(dn);
		}

		f2fs_i_compr_blocks_update(dn->inode, compr_blocks, false);
		dec_valid_block_count(sbi, dn->inode,
					cluster_size - compr_blocks);

		released_blocks += cluster_size - compr_blocks;
next:
		count -= cluster_size;
	}

	return released_blocks;
}

static int f2fs_release_compress_blocks(struct file *filp, unsigned long arg)
{
	struct inode *inode = file_inode(filp);
	struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
	pgoff_t page_idx = 0, last_idx;
	unsigned int released_blocks = 0;
	int ret;
	int writecount;

	if (!f2fs_sb_has_compression(F2FS_I_SB(inode)))
		return -EOPNOTSUPP;

	if (!f2fs_compressed_file(inode))
		return -EINVAL;

	if (f2fs_readonly(sbi->sb))
		return -EROFS;

	ret = mnt_want_write_file(filp);
	if (ret)
		return ret;

	f2fs_balance_fs(F2FS_I_SB(inode), true);

	inode_lock(inode);

	writecount = atomic_read(&inode->i_writecount);
3421 3422
	if ((filp->f_mode & FMODE_WRITE && writecount != 1) ||
			(!(filp->f_mode & FMODE_WRITE) && writecount)) {
3423 3424 3425 3426 3427 3428 3429 3430 3431 3432 3433 3434 3435 3436 3437 3438 3439 3440
		ret = -EBUSY;
		goto out;
	}

	if (IS_IMMUTABLE(inode)) {
		ret = -EINVAL;
		goto out;
	}

	ret = filemap_write_and_wait_range(inode->i_mapping, 0, LLONG_MAX);
	if (ret)
		goto out;

	F2FS_I(inode)->i_flags |= F2FS_IMMUTABLE_FL;
	f2fs_set_inode_flags(inode);
	inode->i_ctime = current_time(inode);
	f2fs_mark_inode_dirty_sync(inode, true);

3441
	if (!atomic_read(&F2FS_I(inode)->i_compr_blocks))
3442 3443
		goto out;

3444 3445 3446 3447 3448 3449 3450 3451 3452 3453 3454 3455 3456 3457 3458 3459 3460 3461 3462 3463 3464 3465 3466
	down_write(&F2FS_I(inode)->i_gc_rwsem[WRITE]);
	down_write(&F2FS_I(inode)->i_mmap_sem);

	last_idx = DIV_ROUND_UP(i_size_read(inode), PAGE_SIZE);

	while (page_idx < last_idx) {
		struct dnode_of_data dn;
		pgoff_t end_offset, count;

		set_new_dnode(&dn, inode, NULL, NULL, 0);
		ret = f2fs_get_dnode_of_data(&dn, page_idx, LOOKUP_NODE);
		if (ret) {
			if (ret == -ENOENT) {
				page_idx = f2fs_get_next_page_offset(&dn,
								page_idx);
				ret = 0;
				continue;
			}
			break;
		}

		end_offset = ADDRS_PER_PAGE(dn.node_page, inode);
		count = min(end_offset - dn.ofs_in_node, last_idx - page_idx);
3467
		count = round_up(count, F2FS_I(inode)->i_cluster_size);
3468 3469 3470 3471 3472 3473 3474 3475 3476 3477 3478 3479 3480 3481 3482 3483 3484 3485 3486 3487 3488

		ret = release_compress_blocks(&dn, count);

		f2fs_put_dnode(&dn);

		if (ret < 0)
			break;

		page_idx += count;
		released_blocks += ret;
	}

	up_write(&F2FS_I(inode)->i_gc_rwsem[WRITE]);
	up_write(&F2FS_I(inode)->i_mmap_sem);
out:
	inode_unlock(inode);

	mnt_drop_write_file(filp);

	if (ret >= 0) {
		ret = put_user(released_blocks, (u64 __user *)arg);
3489 3490
	} else if (released_blocks &&
			atomic_read(&F2FS_I(inode)->i_compr_blocks)) {
3491 3492
		set_sbi_flag(sbi, SBI_NEED_FSCK);
		f2fs_warn(sbi, "%s: partial blocks were released i_ino=%lx "
3493
			"iblocks=%llu, released=%u, compr_blocks=%u, "
3494 3495 3496
			"run fsck to fix.",
			__func__, inode->i_ino, inode->i_blocks,
			released_blocks,
3497
			atomic_read(&F2FS_I(inode)->i_compr_blocks));
3498 3499 3500 3501 3502
	}

	return ret;
}

3503 3504 3505 3506 3507 3508 3509 3510 3511 3512 3513 3514 3515 3516 3517 3518 3519 3520 3521 3522 3523 3524 3525 3526 3527 3528 3529 3530 3531 3532 3533 3534 3535 3536 3537 3538 3539 3540 3541 3542 3543 3544 3545 3546 3547 3548 3549 3550 3551 3552 3553 3554 3555 3556 3557 3558 3559 3560 3561 3562 3563 3564 3565 3566 3567 3568 3569 3570 3571 3572 3573 3574 3575 3576 3577 3578 3579 3580 3581 3582 3583 3584
/*
 * reserve_compress_blocks - reserve blocks for compressed clusters
 * @dn:    dnode positioned at the first slot to process; dn->ofs_in_node
 *         is advanced as slots are consumed
 * @count: number of slots to process (the caller in this file rounds it
 *         up to a multiple of the cluster size)
 *
 * Returns the number of blocks reserved, -EFSCORRUPTED when a block
 * address in the range fails validation, the inc_valid_block_count()
 * error, or -ENOSPC when fewer blocks than requested were granted.
 */
static int reserve_compress_blocks(struct dnode_of_data *dn, pgoff_t count)
{
	struct f2fs_sb_info *sbi = F2FS_I_SB(dn->inode);
	unsigned int reserved_blocks = 0;
	int cluster_size = F2FS_I(dn->inode)->i_cluster_size;
	block_t blkaddr;
	int i;

	/* Pass 1: validate every address in the range before changing anything. */
	for (i = 0; i < count; i++) {
		blkaddr = data_blkaddr(dn->inode, dn->node_page,
						dn->ofs_in_node + i);

		if (!__is_valid_data_blkaddr(blkaddr))
			continue;
		if (unlikely(!f2fs_is_valid_blkaddr(sbi, blkaddr,
					DATA_GENERIC_ENHANCE)))
			return -EFSCORRUPTED;
	}

	/* Pass 2: handle the range one cluster at a time. */
	while (count) {
		int compr_blocks = 0;
		blkcnt_t reserved;
		int ret;

		for (i = 0; i < cluster_size; i++, dn->ofs_in_node++) {
			blkaddr = f2fs_data_blkaddr(dn);

			if (i == 0) {
				if (blkaddr == COMPRESS_ADDR)
					continue;
				/*
				 * First slot is not COMPRESS_ADDR: skip the
				 * whole cluster.  The goto bypasses the loop
				 * increment, so the net advance is exactly
				 * cluster_size slots.
				 */
				dn->ofs_in_node += cluster_size;
				goto next;
			}

			if (__is_valid_data_blkaddr(blkaddr)) {
				compr_blocks++;
				continue;
			}

			/* Every slot without a valid address becomes NEW_ADDR. */
			dn->data_blkaddr = NEW_ADDR;
			f2fs_set_data_blkaddr(dn);
		}

		reserved = cluster_size - compr_blocks;
		ret = inc_valid_block_count(sbi, dn->inode, &reserved);
		if (ret)
			return ret;

		/* 'reserved' is passed by pointer; a changed value means a short grant. */
		if (reserved != cluster_size - compr_blocks)
			return -ENOSPC;

		f2fs_i_compr_blocks_update(dn->inode, compr_blocks, true);

		reserved_blocks += reserved;
next:
		count -= cluster_size;
	}

	return reserved_blocks;
}

/*
 * f2fs_reserve_compress_blocks - F2FS_IOC_RESERVE_COMPRESS_BLOCKS handler
 * @arg: user pointer to a u64 that receives the number of reserved blocks
 *
 * Counterpart of the release ioctl: the file must currently be immutable.
 * Walks every dnode up to i_size, reserves the blocks of each compressed
 * cluster and, on success, clears F2FS_IMMUTABLE_FL again.
 *
 * Returns the put_user() result on success.  Errors: -EOPNOTSUPP,
 * -EINVAL (not compressed, or not immutable), -EROFS, or an error from the
 * dnode walk.  When the walk fails after some blocks were already
 * reserved, SBI_NEED_FSCK is set and a warning is logged.
 */
static int f2fs_reserve_compress_blocks(struct file *filp, unsigned long arg)
{
	struct inode *inode = file_inode(filp);
	struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
	pgoff_t page_idx = 0, last_idx;
	unsigned int reserved_blocks = 0;
	int ret;

	if (!f2fs_sb_has_compression(F2FS_I_SB(inode)))
		return -EOPNOTSUPP;

	if (!f2fs_compressed_file(inode))
		return -EINVAL;

	if (f2fs_readonly(sbi->sb))
		return -EROFS;

	ret = mnt_want_write_file(filp);
	if (ret)
		return ret;

	/* Non-zero i_compr_blocks: bail out with ret == 0, reporting 0 blocks. */
	if (atomic_read(&F2FS_I(inode)->i_compr_blocks))
		goto out;

	f2fs_balance_fs(F2FS_I_SB(inode), true);

	inode_lock(inode);

	if (!IS_IMMUTABLE(inode)) {
		ret = -EINVAL;
		goto unlock_inode;
	}

	down_write(&F2FS_I(inode)->i_gc_rwsem[WRITE]);
	down_write(&F2FS_I(inode)->i_mmap_sem);

	last_idx = DIV_ROUND_UP(i_size_read(inode), PAGE_SIZE);

	while (page_idx < last_idx) {
		struct dnode_of_data dn;
		pgoff_t end_offset, count;

		set_new_dnode(&dn, inode, NULL, NULL, 0);
		ret = f2fs_get_dnode_of_data(&dn, page_idx, LOOKUP_NODE);
		if (ret) {
			/* A hole is not an error: skip to the next offset. */
			if (ret == -ENOENT) {
				page_idx = f2fs_get_next_page_offset(&dn,
								page_idx);
				ret = 0;
				continue;
			}
			break;
		}

		end_offset = ADDRS_PER_PAGE(dn.node_page, inode);
		count = min(end_offset - dn.ofs_in_node, last_idx - page_idx);
		count = round_up(count, F2FS_I(inode)->i_cluster_size);

		ret = reserve_compress_blocks(&dn, count);

		f2fs_put_dnode(&dn);

		if (ret < 0)
			break;

		page_idx += count;
		reserved_blocks += ret;
	}

	up_write(&F2FS_I(inode)->i_gc_rwsem[WRITE]);
	up_write(&F2FS_I(inode)->i_mmap_sem);

	if (ret >= 0) {
		F2FS_I(inode)->i_flags &= ~F2FS_IMMUTABLE_FL;
		f2fs_set_inode_flags(inode);
		inode->i_ctime = current_time(inode);
		f2fs_mark_inode_dirty_sync(inode, true);
	}
unlock_inode:
	inode_unlock(inode);
out:
	mnt_drop_write_file(filp);

	if (ret >= 0) {
		ret = put_user(reserved_blocks, (u64 __user *)arg);
	} else if (reserved_blocks &&
			atomic_read(&F2FS_I(inode)->i_compr_blocks)) {
		set_sbi_flag(sbi, SBI_NEED_FSCK);
		/* This is the reserve path, so say "reserved", not "released". */
		f2fs_warn(sbi, "%s: partial blocks were reserved i_ino=%lx "
			"iblocks=%llu, reserved=%u, compr_blocks=%u, "
			"run fsck to fix.",
			__func__, inode->i_ino, inode->i_blocks,
			reserved_blocks,
			atomic_read(&F2FS_I(inode)->i_compr_blocks));
	}

	return ret;
}

3663 3664 3665 3666 3667 3668 3669 3670 3671 3672 3673 3674 3675 3676 3677 3678 3679 3680 3681 3682 3683 3684 3685 3686 3687 3688 3689 3690 3691 3692 3693 3694 3695 3696 3697 3698 3699 3700 3701 3702 3703 3704 3705 3706 3707 3708 3709 3710 3711 3712 3713 3714 3715 3716 3717 3718 3719 3720 3721 3722 3723 3724 3725 3726 3727 3728 3729 3730 3731 3732 3733 3734 3735 3736 3737 3738 3739 3740 3741 3742 3743 3744 3745 3746 3747 3748 3749 3750 3751 3752 3753 3754 3755 3756 3757 3758 3759 3760 3761 3762 3763 3764 3765 3766 3767 3768 3769 3770 3771 3772 3773 3774 3775 3776 3777 3778 3779 3780 3781 3782 3783 3784 3785 3786 3787 3788 3789 3790 3791 3792 3793 3794 3795 3796 3797 3798 3799 3800 3801 3802 3803 3804 3805 3806 3807 3808 3809 3810 3811 3812 3813 3814 3815 3816 3817 3818 3819 3820 3821 3822 3823 3824 3825 3826 3827 3828 3829 3830 3831 3832 3833 3834 3835 3836 3837 3838 3839 3840 3841 3842 3843 3844 3845 3846 3847 3848 3849
/*
 * f2fs_secure_erase - discard and/or zero out one contiguous block run
 * @bdev:  device holding the blocks
 * @inode: owning inode (consulted for encryption state)
 * @off:   file page offset of the run, passed to fscrypt_zeroout_range()
 * @block: first block of the run
 * @len:   number of blocks
 * @flags: F2FS_TRIM_FILE_DISCARD and/or F2FS_TRIM_FILE_ZEROOUT
 *
 * The discard, if requested, is issued first; the zero-out only runs when
 * the discard did not fail.  Returns -ENXIO when @bdev has no request
 * queue, otherwise 0 or the first error from the block layer / fscrypt.
 */
static int f2fs_secure_erase(struct block_device *bdev, struct inode *inode,
		pgoff_t off, block_t block, block_t len, u32 flags)
{
	struct request_queue *q = bdev_get_queue(bdev);
	sector_t sector = SECTOR_FROM_BLOCK(block);
	sector_t nr_sects = SECTOR_FROM_BLOCK(len);

	if (!q)
		return -ENXIO;

	if (flags & F2FS_TRIM_FILE_DISCARD) {
		unsigned long discard_flags = 0;
		int err;

		/* Use a secure discard when the queue supports it. */
		if (blk_queue_secure_erase(q))
			discard_flags = BLKDEV_DISCARD_SECURE;

		err = blkdev_issue_discard(bdev, sector, nr_sects, GFP_NOFS,
						discard_flags);
		if (err)
			return err;
	}

	if (!(flags & F2FS_TRIM_FILE_ZEROOUT))
		return 0;

	if (IS_ENCRYPTED(inode))
		return fscrypt_zeroout_range(inode, off, block, len);

	return blkdev_issue_zeroout(bdev, sector, nr_sects, GFP_NOFS, 0);
}

static int f2fs_sec_trim_file(struct file *filp, unsigned long arg)
{
	struct inode *inode = file_inode(filp);
	struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
	struct address_space *mapping = inode->i_mapping;
	struct block_device *prev_bdev = NULL;
	struct f2fs_sectrim_range range;
	pgoff_t index, pg_end, prev_index = 0;
	block_t prev_block = 0, len = 0;
	loff_t end_addr;
	bool to_end = false;
	int ret = 0;

	if (!(filp->f_mode & FMODE_WRITE))
		return -EBADF;

	if (copy_from_user(&range, (struct f2fs_sectrim_range __user *)arg,
				sizeof(range)))
		return -EFAULT;

	if (range.flags == 0 || (range.flags & ~F2FS_TRIM_FILE_MASK) ||
			!S_ISREG(inode->i_mode))
		return -EINVAL;

	if (((range.flags & F2FS_TRIM_FILE_DISCARD) &&
			!f2fs_hw_support_discard(sbi)) ||
			((range.flags & F2FS_TRIM_FILE_ZEROOUT) &&
			 IS_ENCRYPTED(inode) && f2fs_is_multi_device(sbi)))
		return -EOPNOTSUPP;

	file_start_write(filp);
	inode_lock(inode);

	if (f2fs_is_atomic_file(inode) || f2fs_compressed_file(inode) ||
			range.start >= inode->i_size) {
		ret = -EINVAL;
		goto err;
	}

	if (range.len == 0)
		goto err;

	if (inode->i_size - range.start > range.len) {
		end_addr = range.start + range.len;
	} else {
		end_addr = range.len == (u64)-1 ?
			sbi->sb->s_maxbytes : inode->i_size;
		to_end = true;
	}

	if (!IS_ALIGNED(range.start, F2FS_BLKSIZE) ||
			(!to_end && !IS_ALIGNED(end_addr, F2FS_BLKSIZE))) {
		ret = -EINVAL;
		goto err;
	}

	index = F2FS_BYTES_TO_BLK(range.start);
	pg_end = DIV_ROUND_UP(end_addr, F2FS_BLKSIZE);

	ret = f2fs_convert_inline_inode(inode);
	if (ret)
		goto err;

	down_write(&F2FS_I(inode)->i_gc_rwsem[WRITE]);
	down_write(&F2FS_I(inode)->i_mmap_sem);

	ret = filemap_write_and_wait_range(mapping, range.start,
			to_end ? LLONG_MAX : end_addr - 1);
	if (ret)
		goto out;

	truncate_inode_pages_range(mapping, range.start,
			to_end ? -1 : end_addr - 1);

	while (index < pg_end) {
		struct dnode_of_data dn;
		pgoff_t end_offset, count;
		int i;

		set_new_dnode(&dn, inode, NULL, NULL, 0);
		ret = f2fs_get_dnode_of_data(&dn, index, LOOKUP_NODE);
		if (ret) {
			if (ret == -ENOENT) {
				index = f2fs_get_next_page_offset(&dn, index);
				continue;
			}
			goto out;
		}

		end_offset = ADDRS_PER_PAGE(dn.node_page, inode);
		count = min(end_offset - dn.ofs_in_node, pg_end - index);
		for (i = 0; i < count; i++, index++, dn.ofs_in_node++) {
			struct block_device *cur_bdev;
			block_t blkaddr = f2fs_data_blkaddr(&dn);

			if (!__is_valid_data_blkaddr(blkaddr))
				continue;

			if (!f2fs_is_valid_blkaddr(sbi, blkaddr,
						DATA_GENERIC_ENHANCE)) {
				ret = -EFSCORRUPTED;
				f2fs_put_dnode(&dn);
				goto out;
			}

			cur_bdev = f2fs_target_device(sbi, blkaddr, NULL);
			if (f2fs_is_multi_device(sbi)) {
				int di = f2fs_target_device_index(sbi, blkaddr);

				blkaddr -= FDEV(di).start_blk;
			}

			if (len) {
				if (prev_bdev == cur_bdev &&
						index == prev_index + len &&
						blkaddr == prev_block + len) {
					len++;
				} else {
					ret = f2fs_secure_erase(prev_bdev,
						inode, prev_index, prev_block,
						len, range.flags);
					if (ret) {
						f2fs_put_dnode(&dn);
						goto out;
					}

					len = 0;
				}
			}

			if (!len) {
				prev_bdev = cur_bdev;
				prev_index = index;
				prev_block = blkaddr;
				len = 1;
			}
		}

		f2fs_put_dnode(&dn);

		if (fatal_signal_pending(current)) {
			ret = -EINTR;
			goto out;
		}
		cond_resched();
	}

	if (len)
		ret = f2fs_secure_erase(prev_bdev, inode, prev_index,
				prev_block, len, range.flags);
out:
	up_write(&F2FS_I(inode)->i_mmap_sem);
	up_write(&F2FS_I(inode)->i_gc_rwsem[WRITE]);
err:
	inode_unlock(inode);
	file_end_write(filp);

	return ret;
}

3850
static int f2fs_ioc_get_compress_option(struct file *filp, unsigned long arg)
3851
{
3852 3853 3854 3855 3856 3857 3858 3859 3860 3861 3862 3863 3864 3865 3866 3867 3868 3869 3870 3871 3872 3873 3874 3875 3876
	struct inode *inode = file_inode(filp);
	struct f2fs_comp_option option;

	if (!f2fs_sb_has_compression(F2FS_I_SB(inode)))
		return -EOPNOTSUPP;

	inode_lock_shared(inode);

	if (!f2fs_compressed_file(inode)) {
		inode_unlock_shared(inode);
		return -ENODATA;
	}

	option.algorithm = F2FS_I(inode)->i_compress_algorithm;
	option.log_cluster_size = F2FS_I(inode)->i_log_cluster_size;

	inode_unlock_shared(inode);

	if (copy_to_user((struct f2fs_comp_option __user *)arg, &option,
				sizeof(option)))
		return -EFAULT;

	return 0;
}

3877 3878 3879 3880 3881 3882
static int f2fs_ioc_set_compress_option(struct file *filp, unsigned long arg)
{
	struct inode *inode = file_inode(filp);
	struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
	struct f2fs_comp_option option;
	int ret = 0;
3883

3884 3885 3886 3887 3888 3889 3890 3891 3892 3893 3894 3895 3896 3897 3898 3899 3900 3901 3902 3903 3904 3905 3906 3907 3908 3909 3910 3911 3912 3913 3914 3915 3916 3917 3918 3919 3920 3921 3922 3923 3924 3925 3926 3927
	if (!f2fs_sb_has_compression(sbi))
		return -EOPNOTSUPP;

	if (!(filp->f_mode & FMODE_WRITE))
		return -EBADF;

	if (copy_from_user(&option, (struct f2fs_comp_option __user *)arg,
				sizeof(option)))
		return -EFAULT;

	if (!f2fs_compressed_file(inode) ||
			option.log_cluster_size < MIN_COMPRESS_LOG_SIZE ||
			option.log_cluster_size > MAX_COMPRESS_LOG_SIZE ||
			option.algorithm >= COMPRESS_MAX)
		return -EINVAL;

	file_start_write(filp);
	inode_lock(inode);

	if (f2fs_is_mmap_file(inode) || get_dirty_pages(inode)) {
		ret = -EBUSY;
		goto out;
	}

	if (inode->i_size != 0) {
		ret = -EFBIG;
		goto out;
	}

	F2FS_I(inode)->i_compress_algorithm = option.algorithm;
	F2FS_I(inode)->i_log_cluster_size = option.log_cluster_size;
	F2FS_I(inode)->i_cluster_size = 1 << option.log_cluster_size;
	f2fs_mark_inode_dirty_sync(inode, true);

	if (!f2fs_is_compress_backend_ready(inode))
		f2fs_warn(sbi, "compression algorithm is successfully set, "
			"but current kernel doesn't support this algorithm.");
out:
	inode_unlock(inode);
	file_end_write(filp);

	return ret;
}

3928 3929 3930 3931 3932 3933 3934 3935 3936 3937 3938 3939 3940 3941 3942 3943 3944 3945 3946 3947 3948
/*
 * redirty_blocks - read @len pages starting at @page_idx and mark them dirty
 *
 * The pages are first brought into the page cache (readahead plus
 * read_cache_page(), which leaves a reference on each), then each one is
 * looked up locked, dirtied and released.
 *
 * Returns 0 on success, the read_cache_page() error if a read failed
 * (pages read before the failure are still dirtied), or -ENOMEM when
 * find_lock_page() returns no page.
 */
static int redirty_blocks(struct inode *inode, pgoff_t page_idx, int len)
{
	DEFINE_READAHEAD(ractl, NULL, inode->i_mapping, page_idx);
	struct address_space *mapping = inode->i_mapping;
	struct page *page;
	pgoff_t redirty_idx = page_idx;
	int i, page_len = 0, ret = 0;

	page_cache_ra_unbounded(&ractl, len, 0);

	for (i = 0; i < len; i++, page_idx++) {
		page = read_cache_page(mapping, page_idx, NULL, NULL);
		if (IS_ERR(page)) {
			ret = PTR_ERR(page);
			break;
		}
		page_len++;
	}

	for (i = 0; i < page_len; i++, redirty_idx++) {
		page = find_lock_page(mapping, redirty_idx);
		if (!page) {
			ret = -ENOMEM;
			break;
		}
		set_page_dirty(page);
		/* One put (with unlock) for find_lock_page()... */
		f2fs_put_page(page, 1);
		/* ...and one for the reference taken by read_cache_page(). */
		f2fs_put_page(page, 0);
	}

	return ret;
}

/*
 * f2fs_ioc_decompress_file - F2FS_IOC_DECOMPRESS_FILE handler
 *
 * Only available with compress_mode == COMPR_MODE_USER.  Flushes the file,
 * then re-dirties it cluster by cluster and writes it back, kicking off
 * writeback early whenever a segment's worth of pages is dirty.
 *
 * Returns 0 on success (also when the file holds no compressed blocks).
 * Errors: -EOPNOTSUPP, -EBADF (file not opened for writing), -EINVAL (not
 * a compressed file), -EBUSY (file is mmapped), or an error from
 * redirty_blocks() / writeback, in which case a warning is logged.
 */
static int f2fs_ioc_decompress_file(struct file *filp, unsigned long arg)
{
	struct inode *inode = file_inode(filp);
	struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
	struct f2fs_inode_info *fi = F2FS_I(inode);
	pgoff_t page_idx = 0, last_idx;
	unsigned int blk_per_seg = sbi->blocks_per_seg;
	int cluster_size = F2FS_I(inode)->i_cluster_size;
	int count, ret;

	if (!f2fs_sb_has_compression(sbi) ||
			F2FS_OPTION(sbi).compress_mode != COMPR_MODE_USER)
		return -EOPNOTSUPP;

	if (!(filp->f_mode & FMODE_WRITE))
		return -EBADF;

	if (!f2fs_compressed_file(inode))
		return -EINVAL;

	f2fs_balance_fs(F2FS_I_SB(inode), true);

	file_start_write(filp);
	inode_lock(inode);

	if (!f2fs_is_compress_backend_ready(inode)) {
		ret = -EOPNOTSUPP;
		goto out;
	}

	if (f2fs_is_mmap_file(inode)) {
		ret = -EBUSY;
		goto out;
	}

	ret = filemap_write_and_wait_range(inode->i_mapping, 0, LLONG_MAX);
	if (ret)
		goto out;

	/* Nothing is compressed; ret is 0 at this point. */
	if (!atomic_read(&fi->i_compr_blocks))
		goto out;

	last_idx = DIV_ROUND_UP(i_size_read(inode), PAGE_SIZE);

	count = last_idx - page_idx;
	while (count) {
		int len = min(cluster_size, count);

		ret = redirty_blocks(inode, page_idx, len);
		if (ret < 0)
			break;

		if (get_dirty_pages(inode) >= blk_per_seg)
			filemap_fdatawrite(inode->i_mapping);

		count -= len;
		page_idx += len;
	}

	if (!ret)
		ret = filemap_write_and_wait_range(inode->i_mapping, 0,
							LLONG_MAX);

	/*
	 * No trailing newline: other f2fs_warn() callers in this file pass
	 * unterminated messages.
	 */
	if (ret)
		f2fs_warn(sbi, "%s: The file might be partially decompressed "
				"(errno=%d). Please delete the file.",
				__func__, ret);
out:
	inode_unlock(inode);
	file_end_write(filp);

	return ret;
}

/*
 * f2fs_ioc_compress_file - F2FS_IOC_COMPRESS_FILE handler
 *
 * Only available with compress_mode == COMPR_MODE_USER.  Flushes the file,
 * sets FI_ENABLE_COMPRESS, re-dirties the file cluster by cluster and
 * writes it back, then clears the flag again.
 *
 * Returns 0 on success.  Errors: -EOPNOTSUPP, -EBADF (file not opened for
 * writing), -EINVAL (not a compressed file), -EBUSY (file is mmapped), or
 * an error from redirty_blocks() / writeback, in which case a warning is
 * logged.
 */
static int f2fs_ioc_compress_file(struct file *filp, unsigned long arg)
{
	struct inode *inode = file_inode(filp);
	struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
	pgoff_t page_idx = 0, last_idx;
	unsigned int blk_per_seg = sbi->blocks_per_seg;
	int cluster_size = F2FS_I(inode)->i_cluster_size;
	int count, ret;

	if (!f2fs_sb_has_compression(sbi) ||
			F2FS_OPTION(sbi).compress_mode != COMPR_MODE_USER)
		return -EOPNOTSUPP;

	if (!(filp->f_mode & FMODE_WRITE))
		return -EBADF;

	if (!f2fs_compressed_file(inode))
		return -EINVAL;

	f2fs_balance_fs(F2FS_I_SB(inode), true);

	file_start_write(filp);
	inode_lock(inode);

	if (!f2fs_is_compress_backend_ready(inode)) {
		ret = -EOPNOTSUPP;
		goto out;
	}

	if (f2fs_is_mmap_file(inode)) {
		ret = -EBUSY;
		goto out;
	}

	ret = filemap_write_and_wait_range(inode->i_mapping, 0, LLONG_MAX);
	if (ret)
		goto out;

	set_inode_flag(inode, FI_ENABLE_COMPRESS);

	last_idx = DIV_ROUND_UP(i_size_read(inode), PAGE_SIZE);

	count = last_idx - page_idx;
	while (count) {
		int len = min(cluster_size, count);

		ret = redirty_blocks(inode, page_idx, len);
		if (ret < 0)
			break;

		if (get_dirty_pages(inode) >= blk_per_seg)
			filemap_fdatawrite(inode->i_mapping);

		count -= len;
		page_idx += len;
	}

	if (!ret)
		ret = filemap_write_and_wait_range(inode->i_mapping, 0,
							LLONG_MAX);

	clear_inode_flag(inode, FI_ENABLE_COMPRESS);

	/*
	 * No trailing newline: other f2fs_warn() callers in this file pass
	 * unterminated messages.
	 */
	if (ret)
		f2fs_warn(sbi, "%s: The file might be partially compressed "
				"(errno=%d). Please delete the file.",
				__func__, ret);
out:
	inode_unlock(inode);
	file_end_write(filp);

	return ret;
}

4109
static long __f2fs_ioctl(struct file *filp, unsigned int cmd, unsigned long arg)
4110 4111
{
	switch (cmd) {
4112
	case FS_IOC_GETVERSION:
C
Chao Yu 已提交
4113
		return f2fs_ioc_getversion(filp, arg);
J
Jaegeuk Kim 已提交
4114 4115 4116 4117
	case F2FS_IOC_START_ATOMIC_WRITE:
		return f2fs_ioc_start_atomic_write(filp);
	case F2FS_IOC_COMMIT_ATOMIC_WRITE:
		return f2fs_ioc_commit_atomic_write(filp);
4118 4119
	case F2FS_IOC_START_VOLATILE_WRITE:
		return f2fs_ioc_start_volatile_write(filp);
4120 4121 4122 4123
	case F2FS_IOC_RELEASE_VOLATILE_WRITE:
		return f2fs_ioc_release_volatile_write(filp);
	case F2FS_IOC_ABORT_VOLATILE_WRITE:
		return f2fs_ioc_abort_volatile_write(filp);
J
Jaegeuk Kim 已提交
4124 4125
	case F2FS_IOC_SHUTDOWN:
		return f2fs_ioc_shutdown(filp, arg);
4126 4127
	case FITRIM:
		return f2fs_ioc_fitrim(filp, arg);
4128
	case FS_IOC_SET_ENCRYPTION_POLICY:
4129
		return f2fs_ioc_set_encryption_policy(filp, arg);
4130
	case FS_IOC_GET_ENCRYPTION_POLICY:
4131
		return f2fs_ioc_get_encryption_policy(filp, arg);
4132
	case FS_IOC_GET_ENCRYPTION_PWSALT:
4133
		return f2fs_ioc_get_encryption_pwsalt(filp, arg);
E
Eric Biggers 已提交
4134 4135 4136 4137 4138 4139 4140 4141 4142 4143
	case FS_IOC_GET_ENCRYPTION_POLICY_EX:
		return f2fs_ioc_get_encryption_policy_ex(filp, arg);
	case FS_IOC_ADD_ENCRYPTION_KEY:
		return f2fs_ioc_add_encryption_key(filp, arg);
	case FS_IOC_REMOVE_ENCRYPTION_KEY:
		return f2fs_ioc_remove_encryption_key(filp, arg);
	case FS_IOC_REMOVE_ENCRYPTION_KEY_ALL_USERS:
		return f2fs_ioc_remove_encryption_key_all_users(filp, arg);
	case FS_IOC_GET_ENCRYPTION_KEY_STATUS:
		return f2fs_ioc_get_encryption_key_status(filp, arg);
4144 4145
	case FS_IOC_GET_ENCRYPTION_NONCE:
		return f2fs_ioc_get_encryption_nonce(filp, arg);
4146 4147
	case F2FS_IOC_GARBAGE_COLLECT:
		return f2fs_ioc_gc(filp, arg);
4148 4149
	case F2FS_IOC_GARBAGE_COLLECT_RANGE:
		return f2fs_ioc_gc_range(filp, arg);
4150
	case F2FS_IOC_WRITE_CHECKPOINT:
C
Chao Yu 已提交
4151
		return f2fs_ioc_write_checkpoint(filp, arg);
C
Chao Yu 已提交
4152 4153
	case F2FS_IOC_DEFRAGMENT:
		return f2fs_ioc_defragment(filp, arg);
4154 4155
	case F2FS_IOC_MOVE_RANGE:
		return f2fs_ioc_move_range(filp, arg);
4156 4157
	case F2FS_IOC_FLUSH_DEVICE:
		return f2fs_ioc_flush_device(filp, arg);
4158 4159
	case F2FS_IOC_GET_FEATURES:
		return f2fs_ioc_get_features(filp, arg);
4160 4161 4162 4163
	case F2FS_IOC_GET_PIN_FILE:
		return f2fs_ioc_get_pin_file(filp, arg);
	case F2FS_IOC_SET_PIN_FILE:
		return f2fs_ioc_set_pin_file(filp, arg);
4164 4165
	case F2FS_IOC_PRECACHE_EXTENTS:
		return f2fs_ioc_precache_extents(filp, arg);
4166 4167
	case F2FS_IOC_RESIZE_FS:
		return f2fs_ioc_resize_fs(filp, arg);
E
Eric Biggers 已提交
4168 4169 4170 4171
	case FS_IOC_ENABLE_VERITY:
		return f2fs_ioc_enable_verity(filp, arg);
	case FS_IOC_MEASURE_VERITY:
		return f2fs_ioc_measure_verity(filp, arg);
4172 4173
	case FS_IOC_READ_VERITY_METADATA:
		return f2fs_ioc_read_verity_metadata(filp, arg);
4174 4175 4176 4177
	case FS_IOC_GETFSLABEL:
		return f2fs_ioc_getfslabel(filp, arg);
	case FS_IOC_SETFSLABEL:
		return f2fs_ioc_setfslabel(filp, arg);
4178 4179
	case F2FS_IOC_GET_COMPRESS_BLOCKS:
		return f2fs_get_compress_blocks(filp, arg);
4180 4181
	case F2FS_IOC_RELEASE_COMPRESS_BLOCKS:
		return f2fs_release_compress_blocks(filp, arg);
4182 4183
	case F2FS_IOC_RESERVE_COMPRESS_BLOCKS:
		return f2fs_reserve_compress_blocks(filp, arg);
4184 4185
	case F2FS_IOC_SEC_TRIM_FILE:
		return f2fs_sec_trim_file(filp, arg);
4186 4187
	case F2FS_IOC_GET_COMPRESS_OPTION:
		return f2fs_ioc_get_compress_option(filp, arg);
4188 4189
	case F2FS_IOC_SET_COMPRESS_OPTION:
		return f2fs_ioc_set_compress_option(filp, arg);
4190 4191 4192 4193
	case F2FS_IOC_DECOMPRESS_FILE:
		return f2fs_ioc_decompress_file(filp, arg);
	case F2FS_IOC_COMPRESS_FILE:
		return f2fs_ioc_compress_file(filp, arg);
J
Jaegeuk Kim 已提交
4194 4195 4196 4197 4198
	default:
		return -ENOTTY;
	}
}

4199 4200 4201 4202 4203 4204 4205 4206 4207 4208
/*
 * f2fs_ioctl - ioctl entry point
 *
 * Rejects the call with -EIO after a checkpoint error and with -ENOSPC
 * while the checkpoint is not ready; otherwise hands the command to
 * __f2fs_ioctl().
 */
long f2fs_ioctl(struct file *filp, unsigned int cmd, unsigned long arg)
{
	struct f2fs_sb_info *sbi = F2FS_I_SB(file_inode(filp));

	if (unlikely(f2fs_cp_error(sbi)))
		return -EIO;

	if (!f2fs_is_checkpoint_ready(sbi))
		return -ENOSPC;

	return __f2fs_ioctl(filp, cmd, arg);
}

C
Chao Yu 已提交
4209 4210 4211 4212
static ssize_t f2fs_file_read_iter(struct kiocb *iocb, struct iov_iter *iter)
{
	struct file *file = iocb->ki_filp;
	struct inode *inode = file_inode(file);
C
Chao Yu 已提交
4213
	int ret;
C
Chao Yu 已提交
4214 4215 4216 4217

	if (!f2fs_is_compress_backend_ready(inode))
		return -EOPNOTSUPP;

C
Chao Yu 已提交
4218 4219 4220 4221 4222 4223
	ret = generic_file_read_iter(iocb, iter);

	if (ret > 0)
		f2fs_update_iostat(F2FS_I_SB(inode), APP_READ_IO, ret);

	return ret;
C
Chao Yu 已提交
4224 4225
}

4226 4227
static ssize_t f2fs_file_write_iter(struct kiocb *iocb, struct iov_iter *from)
{
4228 4229 4230
	struct file *file = iocb->ki_filp;
	struct inode *inode = file_inode(file);
	ssize_t ret;
4231

4232 4233 4234 4235
	if (unlikely(f2fs_cp_error(F2FS_I_SB(inode)))) {
		ret = -EIO;
		goto out;
	}
4236

C
Chao Yu 已提交
4237 4238 4239 4240
	if (!f2fs_is_compress_backend_ready(inode)) {
		ret = -EOPNOTSUPP;
		goto out;
	}
C
Chao Yu 已提交
4241

4242 4243
	if (iocb->ki_flags & IOCB_NOWAIT) {
		if (!inode_trylock(inode)) {
4244 4245 4246
			ret = -EAGAIN;
			goto out;
		}
4247
	} else {
H
Hyunchul Lee 已提交
4248 4249 4250
		inode_lock(inode);
	}

4251 4252 4253 4254 4255
	if (unlikely(IS_IMMUTABLE(inode))) {
		ret = -EPERM;
		goto unlock;
	}

4256 4257
	ret = generic_write_checks(iocb, from);
	if (ret > 0) {
4258 4259
		bool preallocated = false;
		size_t target_size = 0;
4260
		int err;
4261

4262 4263
		if (iov_iter_fault_in_readable(from, iov_iter_count(from)))
			set_inode_flag(inode, FI_NO_PREALLOC);
4264

4265 4266
		if ((iocb->ki_flags & IOCB_NOWAIT)) {
			if (!f2fs_overwrite_io(inode, iocb->ki_pos,
H
Hyunchul Lee 已提交
4267
						iov_iter_count(from)) ||
4268 4269 4270 4271 4272 4273 4274
				f2fs_has_inline_data(inode) ||
				f2fs_force_buffered_io(inode, iocb, from)) {
				clear_inode_flag(inode, FI_NO_PREALLOC);
				inode_unlock(inode);
				ret = -EAGAIN;
				goto out;
			}
4275 4276
			goto write;
		}
4277

4278 4279 4280 4281 4282 4283 4284 4285 4286 4287 4288 4289 4290 4291 4292 4293 4294 4295 4296 4297 4298 4299 4300 4301 4302 4303 4304 4305 4306 4307
		if (is_inode_flag_set(inode, FI_NO_PREALLOC))
			goto write;

		if (iocb->ki_flags & IOCB_DIRECT) {
			/*
			 * Convert inline data for Direct I/O before entering
			 * f2fs_direct_IO().
			 */
			err = f2fs_convert_inline_inode(inode);
			if (err)
				goto out_err;
			/*
			 * If force_buffere_io() is true, we have to allocate
			 * blocks all the time, since f2fs_direct_IO will fall
			 * back to buffered IO.
			 */
			if (!f2fs_force_buffered_io(inode, iocb, from) &&
					allow_outplace_dio(inode, iocb, from))
				goto write;
		}
		preallocated = true;
		target_size = iocb->ki_pos + iov_iter_count(from);

		err = f2fs_preallocate_blocks(iocb, from);
		if (err) {
out_err:
			clear_inode_flag(inode, FI_NO_PREALLOC);
			inode_unlock(inode);
			ret = err;
			goto out;
4308
		}
4309
write:
4310
		ret = __generic_file_write_iter(iocb, from);
4311
		clear_inode_flag(inode, FI_NO_PREALLOC);
C
Chao Yu 已提交
4312

4313 4314 4315 4316
		/* if we couldn't write data, we should deallocate blocks. */
		if (preallocated && i_size_read(inode) < target_size)
			f2fs_truncate(inode);

C
Chao Yu 已提交
4317 4318
		if (ret > 0)
			f2fs_update_iostat(F2FS_I_SB(inode), APP_WRITE_IO, ret);
4319
	}
4320
unlock:
4321
	inode_unlock(inode);
4322 4323 4324
out:
	trace_f2fs_file_write_iter(inode, iocb->ki_pos,
					iov_iter_count(from), ret);
4325 4326
	if (ret > 0)
		ret = generic_write_sync(iocb, ret);
4327
	return ret;
4328 4329
}

4330
#ifdef CONFIG_COMPAT
4331 4332 4333 4334 4335 4336 4337 4338 4339 4340 4341 4342 4343 4344 4345 4346 4347 4348 4349 4350 4351 4352 4353 4354 4355 4356 4357 4358 4359 4360 4361 4362 4363 4364 4365 4366 4367 4368 4369 4370 4371 4372 4373 4374 4375 4376 4377 4378 4379 4380
/*
 * Argument of F2FS_IOC32_GARBAGE_COLLECT_RANGE as laid out by the caller.
 * f2fs_compat_ioc_gc_range() reads each member with get_user() and stores
 * it into the same-named member of struct f2fs_gc_range.
 *
 * NOTE(review): compat_u64 is presumably used so the member offsets match
 * what a 32-bit userspace passes -- confirm against <linux/compat.h>.
 */
struct compat_f2fs_gc_range {
	u32 sync;
	compat_u64 start;
	compat_u64 len;
};
/* ioctl number (magic F2FS_IOCTL_MAGIC, nr 11) sized for the compat struct. */
#define F2FS_IOC32_GARBAGE_COLLECT_RANGE	_IOW(F2FS_IOCTL_MAGIC, 11,\
						struct compat_f2fs_gc_range)

static int f2fs_compat_ioc_gc_range(struct file *file, unsigned long arg)
{
	struct compat_f2fs_gc_range __user *urange;
	struct f2fs_gc_range range;
	int err;

	urange = compat_ptr(arg);
	err = get_user(range.sync, &urange->sync);
	err |= get_user(range.start, &urange->start);
	err |= get_user(range.len, &urange->len);
	if (err)
		return -EFAULT;

	return __f2fs_ioc_gc_range(file, &range);
}

/*
 * Argument of F2FS_IOC32_MOVE_RANGE as laid out by the caller.
 * f2fs_compat_ioc_move_range() reads each member with get_user() and stores
 * it into the same-named member of struct f2fs_move_range.
 *
 * NOTE(review): compat_u64 is presumably used so the member offsets match
 * what a 32-bit userspace passes -- confirm against <linux/compat.h>.
 */
struct compat_f2fs_move_range {
	u32 dst_fd;
	compat_u64 pos_in;
	compat_u64 pos_out;
	compat_u64 len;
};
/* ioctl number (magic F2FS_IOCTL_MAGIC, nr 9) sized for the compat struct. */
#define F2FS_IOC32_MOVE_RANGE		_IOWR(F2FS_IOCTL_MAGIC, 9,	\
					struct compat_f2fs_move_range)

static int f2fs_compat_ioc_move_range(struct file *file, unsigned long arg)
{
	struct compat_f2fs_move_range __user *urange;
	struct f2fs_move_range range;
	int err;

	urange = compat_ptr(arg);
	err = get_user(range.dst_fd, &urange->dst_fd);
	err |= get_user(range.pos_in, &urange->pos_in);
	err |= get_user(range.pos_out, &urange->pos_out);
	err |= get_user(range.len, &urange->len);
	if (err)
		return -EFAULT;

	return __f2fs_ioc_move_range(file, &range);
}

4381 4382
long f2fs_compat_ioctl(struct file *file, unsigned int cmd, unsigned long arg)
{
4383 4384 4385 4386 4387
	if (unlikely(f2fs_cp_error(F2FS_I_SB(file_inode(file)))))
		return -EIO;
	if (!f2fs_is_checkpoint_ready(F2FS_I_SB(file_inode(file))))
		return -ENOSPC;

4388
	switch (cmd) {
4389 4390
	case FS_IOC32_GETVERSION:
		cmd = FS_IOC_GETVERSION;
4391
		break;
4392 4393 4394 4395
	case F2FS_IOC32_GARBAGE_COLLECT_RANGE:
		return f2fs_compat_ioc_gc_range(file, arg);
	case F2FS_IOC32_MOVE_RANGE:
		return f2fs_compat_ioc_move_range(file, arg);
4396 4397 4398 4399 4400 4401
	case F2FS_IOC_START_ATOMIC_WRITE:
	case F2FS_IOC_COMMIT_ATOMIC_WRITE:
	case F2FS_IOC_START_VOLATILE_WRITE:
	case F2FS_IOC_RELEASE_VOLATILE_WRITE:
	case F2FS_IOC_ABORT_VOLATILE_WRITE:
	case F2FS_IOC_SHUTDOWN:
4402
	case FITRIM:
4403 4404 4405
	case FS_IOC_SET_ENCRYPTION_POLICY:
	case FS_IOC_GET_ENCRYPTION_PWSALT:
	case FS_IOC_GET_ENCRYPTION_POLICY:
E
Eric Biggers 已提交
4406 4407 4408 4409 4410
	case FS_IOC_GET_ENCRYPTION_POLICY_EX:
	case FS_IOC_ADD_ENCRYPTION_KEY:
	case FS_IOC_REMOVE_ENCRYPTION_KEY:
	case FS_IOC_REMOVE_ENCRYPTION_KEY_ALL_USERS:
	case FS_IOC_GET_ENCRYPTION_KEY_STATUS:
4411
	case FS_IOC_GET_ENCRYPTION_NONCE:
4412 4413 4414
	case F2FS_IOC_GARBAGE_COLLECT:
	case F2FS_IOC_WRITE_CHECKPOINT:
	case F2FS_IOC_DEFRAGMENT:
4415
	case F2FS_IOC_FLUSH_DEVICE:
4416
	case F2FS_IOC_GET_FEATURES:
4417 4418
	case F2FS_IOC_GET_PIN_FILE:
	case F2FS_IOC_SET_PIN_FILE:
4419
	case F2FS_IOC_PRECACHE_EXTENTS:
4420
	case F2FS_IOC_RESIZE_FS:
E
Eric Biggers 已提交
4421 4422
	case FS_IOC_ENABLE_VERITY:
	case FS_IOC_MEASURE_VERITY:
4423
	case FS_IOC_READ_VERITY_METADATA:
4424 4425
	case FS_IOC_GETFSLABEL:
	case FS_IOC_SETFSLABEL:
4426
	case F2FS_IOC_GET_COMPRESS_BLOCKS:
4427
	case F2FS_IOC_RELEASE_COMPRESS_BLOCKS:
4428
	case F2FS_IOC_RESERVE_COMPRESS_BLOCKS:
4429
	case F2FS_IOC_SEC_TRIM_FILE:
4430
	case F2FS_IOC_GET_COMPRESS_OPTION:
4431
	case F2FS_IOC_SET_COMPRESS_OPTION:
4432 4433
	case F2FS_IOC_DECOMPRESS_FILE:
	case F2FS_IOC_COMPRESS_FILE:
4434
		break;
4435 4436 4437
	default:
		return -ENOIOCTLCMD;
	}
4438
	return __f2fs_ioctl(file, cmd, (unsigned long) compat_ptr(arg));
4439 4440 4441
}
#endif

J
Jaegeuk Kim 已提交
4442
const struct file_operations f2fs_file_operations = {
4443
	.llseek		= f2fs_llseek,
C
Chao Yu 已提交
4444
	.read_iter	= f2fs_file_read_iter,
4445 4446
	.write_iter	= f2fs_file_write_iter,
	.open		= f2fs_file_open,
4447
	.release	= f2fs_release_file,
J
Jaegeuk Kim 已提交
4448
	.mmap		= f2fs_file_mmap,
4449
	.flush		= f2fs_file_flush,
J
Jaegeuk Kim 已提交
4450 4451 4452
	.fsync		= f2fs_sync_file,
	.fallocate	= f2fs_fallocate,
	.unlocked_ioctl	= f2fs_ioctl,
4453 4454 4455
#ifdef CONFIG_COMPAT
	.compat_ioctl	= f2fs_compat_ioctl,
#endif
J
Jaegeuk Kim 已提交
4456
	.splice_read	= generic_file_splice_read,
A
Al Viro 已提交
4457
	.splice_write	= iter_file_splice_write,
J
Jaegeuk Kim 已提交
4458
};