/*
 * Copyright (C) Sistina Software, Inc.  1997-2003 All rights reserved.
 * Copyright (C) 2004-2008 Red Hat, Inc.  All rights reserved.
 *
 * This copyrighted material is made available to anyone wishing to use,
 * modify, copy, or redistribute it subject to the terms and conditions
 * of the GNU General Public License version 2.
 */

#include <linux/sched.h>
#include <linux/slab.h>
#include <linux/spinlock.h>
#include <linux/completion.h>
#include <linux/buffer_head.h>
#include <linux/pagemap.h>
S
Steven Whitehouse 已提交
16
#include <linux/pagevec.h>
17
#include <linux/mpage.h>
18
#include <linux/fs.h>
19
#include <linux/writeback.h>
S
Steven Whitehouse 已提交
20
#include <linux/swap.h>
21
#include <linux/gfs2_ondisk.h>
22
#include <linux/backing-dev.h>
23
#include <linux/uio.h>
24
#include <trace/events/writeback.h>
D
David Teigland 已提交
25 26

#include "gfs2.h"
27
#include "incore.h"
D
David Teigland 已提交
28 29 30 31 32 33 34
#include "bmap.h"
#include "glock.h"
#include "inode.h"
#include "log.h"
#include "meta_io.h"
#include "quota.h"
#include "trans.h"
35
#include "rgrp.h"
36
#include "super.h"
37
#include "util.h"
S
Steven Whitehouse 已提交
38
#include "glops.h"
D
David Teigland 已提交
39

S
Steven Whitehouse 已提交
40

41 42
static void gfs2_page_add_databufs(struct gfs2_inode *ip, struct page *page,
				   unsigned int from, unsigned int to)
S
Steven Whitehouse 已提交
43 44 45 46 47 48 49 50 51 52 53
{
	struct buffer_head *head = page_buffers(page);
	unsigned int bsize = head->b_size;
	struct buffer_head *bh;
	unsigned int start, end;

	for (bh = head, start = 0; bh != head || !start;
	     bh = bh->b_this_page, start = end) {
		end = start + bsize;
		if (end <= from || start >= to)
			continue;
B
Benjamin Marzinski 已提交
54 55
		if (gfs2_is_jdata(ip))
			set_buffer_uptodate(bh);
56
		gfs2_trans_add_data(ip->i_gl, bh);
S
Steven Whitehouse 已提交
57 58 59
	}
}

D
David Teigland 已提交
60
/**
61
 * gfs2_get_block_noalloc - Fills in a buffer head with details about a block
D
David Teigland 已提交
62 63 64 65 66 67 68 69
 * @inode: The inode
 * @lblock: The block number to look up
 * @bh_result: The buffer head to return the result in
 * @create: Non-zero if we may add block to the file
 *
 * Returns: errno
 */

70 71
static int gfs2_get_block_noalloc(struct inode *inode, sector_t lblock,
				  struct buffer_head *bh_result, int create)
D
David Teigland 已提交
72 73 74
{
	int error;

75
	error = gfs2_block_map(inode, lblock, bh_result, 0);
D
David Teigland 已提交
76 77
	if (error)
		return error;
W
Wendy Cheng 已提交
78
	if (!buffer_mapped(bh_result))
79 80
		return -EIO;
	return 0;
D
David Teigland 已提交
81 82
}

83 84
/**
 * gfs2_get_block_direct - Map a block without allocating
 * @inode: The inode
 * @lblock: The block number to look up
 * @bh_result: The buffer head to return the result in
 * @create: Ignored; gfs2_block_map() is always called with create == 0
 *
 * Unlike gfs2_get_block_noalloc(), an unmapped result is not turned into
 * an error here.
 *
 * Returns: the result of gfs2_block_map()
 */
static int gfs2_get_block_direct(struct inode *inode, sector_t lblock,
				 struct buffer_head *bh_result, int create)
{
	return gfs2_block_map(inode, lblock, bh_result, 0);
}
88

D
David Teigland 已提交
89
/**
90 91 92
 * gfs2_writepage_common - Common bits of writepage
 * @page: The page to be written
 * @wbc: The writeback control
D
David Teigland 已提交
93
 *
94
 * Returns: 1 if writepage is ok, otherwise an error code or zero if no error.
D
David Teigland 已提交
95 96
 */

97 98
static int gfs2_writepage_common(struct page *page,
				 struct writeback_control *wbc)
D
David Teigland 已提交
99
{
100
	struct inode *inode = page->mapping->host;
101 102
	struct gfs2_inode *ip = GFS2_I(inode);
	struct gfs2_sbd *sdp = GFS2_SB(inode);
103
	loff_t i_size = i_size_read(inode);
104
	pgoff_t end_index = i_size >> PAGE_SHIFT;
105
	unsigned offset;
D
David Teigland 已提交
106

107 108
	if (gfs2_assert_withdraw(sdp, gfs2_glock_is_held_excl(ip->i_gl)))
		goto out;
109
	if (current->journal_info)
110
		goto redirty;
111
	/* Is the page fully outside i_size? (truncate in progress) */
112
	offset = i_size & (PAGE_SIZE-1);
113
	if (page->index > end_index || (page->index == end_index && !offset)) {
114
		page->mapping->a_ops->invalidatepage(page, 0, PAGE_SIZE);
115
		goto out;
D
David Teigland 已提交
116
	}
117 118 119 120 121 122 123 124 125
	return 1;
redirty:
	redirty_page_for_writepage(wbc, page);
out:
	unlock_page(page);
	return 0;
}

/**
126
 * gfs2_writepage - Write page for writeback mappings
127 128 129 130 131
 * @page: The page
 * @wbc: The writeback control
 *
 */

132
static int gfs2_writepage(struct page *page, struct writeback_control *wbc)
133 134 135 136 137 138 139
{
	int ret;

	ret = gfs2_writepage_common(page, wbc);
	if (ret <= 0)
		return ret;

S
Steven Whitehouse 已提交
140
	return nobh_writepage(page, gfs2_get_block_noalloc, wbc);
141 142
}

143 144 145
/* This is the same as calling block_write_full_page, but it also
 * writes pages outside of i_size
 */
146 147
static int gfs2_write_full_page(struct page *page, get_block_t *get_block,
				struct writeback_control *wbc)
148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168
{
	struct inode * const inode = page->mapping->host;
	loff_t i_size = i_size_read(inode);
	const pgoff_t end_index = i_size >> PAGE_SHIFT;
	unsigned offset;

	/*
	 * The page straddles i_size.  It must be zeroed out on each and every
	 * writepage invocation because it may be mmapped.  "A file is mapped
	 * in multiples of the page size.  For a file that is not a multiple of
	 * the  page size, the remaining memory is zeroed when mapped, and
	 * writes to that region are not written out to the file."
	 */
	offset = i_size & (PAGE_SIZE-1);
	if (page->index == end_index && offset)
		zero_user_segment(page, offset, PAGE_SIZE);

	return __block_write_full_page(inode, page, get_block, wbc,
				       end_buffer_async_write);
}

169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189
/**
 * __gfs2_jdata_writepage - The core of jdata writepage
 * @page: The page to write
 * @wbc: The writeback control
 *
 * This is shared between writepage and writepages and implements the
 * core of the writepage operation. If a transaction is required then
 * PageChecked will have been set and the transaction will have
 * already been started before this is called.
 */

static int __gfs2_jdata_writepage(struct page *page, struct writeback_control *wbc)
{
	struct inode *inode = page->mapping->host;
	struct gfs2_inode *ip = GFS2_I(inode);
	struct gfs2_sbd *sdp = GFS2_SB(inode);

	if (PageChecked(page)) {
		ClearPageChecked(page);
		if (!page_has_buffers(page)) {
			create_empty_buffers(page, inode->i_sb->s_blocksize,
F
Fabian Frederick 已提交
190
					     BIT(BH_Dirty)|BIT(BH_Uptodate));
191 192 193
		}
		gfs2_page_add_databufs(ip, page, 0, sdp->sd_vfs->s_blocksize-1);
	}
194
	return gfs2_write_full_page(page, gfs2_get_block_noalloc, wbc);
195 196
}

197 198 199
/**
 * gfs2_jdata_writepage - Write complete page
 * @page: Page to write
F
Fabian Frederick 已提交
200
 * @wbc: The writeback control
201 202 203 204 205 206 207 208
 *
 * Returns: errno
 *
 */

static int gfs2_jdata_writepage(struct page *page, struct writeback_control *wbc)
{
	struct inode *inode = page->mapping->host;
209
	struct gfs2_inode *ip = GFS2_I(inode);
210
	struct gfs2_sbd *sdp = GFS2_SB(inode);
211
	int ret;
212

213 214 215 216 217
	if (gfs2_assert_withdraw(sdp, gfs2_glock_is_held_excl(ip->i_gl)))
		goto out;
	if (PageChecked(page) || current->journal_info)
		goto out_ignore;
	ret = __gfs2_jdata_writepage(page, wbc);
218
	return ret;
219 220 221

out_ignore:
	redirty_page_for_writepage(wbc, page);
222
out:
223 224
	unlock_page(page);
	return 0;
D
David Teigland 已提交
225 226
}

227
/**
228
 * gfs2_writepages - Write a bunch of dirty pages back to disk
229 230 231
 * @mapping: The mapping to write
 * @wbc: Write-back control
 *
232
 * Used for both ordered and writeback modes.
233
 */
234 235
static int gfs2_writepages(struct address_space *mapping,
			   struct writeback_control *wbc)
236
{
237 238 239 240 241 242 243 244 245 246 247 248 249
	struct gfs2_sbd *sdp = gfs2_mapping2sbd(mapping);
	int ret = mpage_writepages(mapping, wbc, gfs2_get_block_noalloc);

	/*
	 * Even if we didn't write any pages here, we might still be holding
	 * dirty pages in the ail. We forcibly flush the ail because we don't
	 * want balance_dirty_pages() to loop indefinitely trying to write out
	 * pages held in the ail that it can't find.
	 */
	if (ret == 0)
		set_bit(SDF_FORCE_AIL_FLUSH, &sdp->sd_flags);

	return ret;
250 251
}

252 253 254 255 256 257
/**
 * gfs2_write_jdata_pagevec - Write back a pagevec's worth of pages
 * @mapping: The mapping
 * @wbc: The writeback control
 * @pvec: The vector of pages
 * @nr_pages: The number of pages to write
 * @end: End position
 * @done_index: Page index
 *
 * A single transaction, sized for every block of every page in @pvec, is
 * opened before any page lock is taken and closed once the loop finishes.
 *
 * Returns: non-zero if loop should terminate, zero otherwise
 */

static int gfs2_write_jdata_pagevec(struct address_space *mapping,
				    struct writeback_control *wbc,
				    struct pagevec *pvec,
				    int nr_pages, pgoff_t end,
				    pgoff_t *done_index)
{
	struct inode *inode = mapping->host;
	struct gfs2_sbd *sdp = GFS2_SB(inode);
	unsigned nrblocks = nr_pages * (PAGE_SIZE/inode->i_sb->s_blocksize);
	int i;
	int ret;

	ret = gfs2_trans_begin(sdp, nrblocks, nrblocks);
	if (ret < 0)
		return ret;

	for(i = 0; i < nr_pages; i++) {
		struct page *page = pvec->pages[i];

		/*
		 * At this point, the page may be truncated or
		 * invalidated (changing page->mapping to NULL), or
		 * even swizzled back from swapper_space to tmpfs file
		 * mapping. However, page->index will not change
		 * because we have a reference on the page.
		 */
		if (page->index > end) {
			/*
			 * can't be range_cyclic (1st pass) because
			 * end == -1 in that case.
			 */
			ret = 1;
			break;
		}

		*done_index = page->index;

		lock_page(page);

		if (unlikely(page->mapping != mapping)) {
continue_unlock:
			unlock_page(page);
			continue;
		}

		if (!PageDirty(page)) {
			/* someone wrote it for us */
			goto continue_unlock;
		}

		if (PageWriteback(page)) {
			if (wbc->sync_mode != WB_SYNC_NONE)
				wait_on_page_writeback(page);
			else
				goto continue_unlock;
		}

		BUG_ON(PageWriteback(page));
		if (!clear_page_dirty_for_io(page))
			goto continue_unlock;

		trace_wbc_writepage(wbc, inode_to_bdi(inode));

		ret = __gfs2_jdata_writepage(page, wbc);
		if (unlikely(ret)) {
			if (ret == AOP_WRITEPAGE_ACTIVATE) {
				unlock_page(page);
				ret = 0;
			} else {

				/*
				 * done_index is set past this page,
				 * so media errors will not choke
				 * background writeout for the entire
				 * file. This has consequences for
				 * range_cyclic semantics (ie. it may
				 * not be suitable for data integrity
				 * writeout).
				 */
				*done_index = page->index + 1;
				ret = 1;
				break;
			}
		}

		/*
		 * We stop writing back only if we are not doing
		 * integrity sync. In case of integrity sync we have to
		 * keep going until we have written all the pages
		 * we tagged for writeback prior to entering this loop.
		 */
		if (--wbc->nr_to_write <= 0 && wbc->sync_mode == WB_SYNC_NONE) {
			ret = 1;
			break;
		}

	}
	gfs2_trans_end(sdp);
	return ret;
}

/**
 * gfs2_write_cache_jdata - Like write_cache_pages but different
 * @mapping: The mapping to write
 * @wbc: The writeback control
 *
 * The reason that we use our own function here is that we need to
 * start transactions before we grab page locks. This allows us
 * to get the ordering right.
 */

static int gfs2_write_cache_jdata(struct address_space *mapping,
				  struct writeback_control *wbc)
{
	int ret = 0;
	int done = 0;
	struct pagevec pvec;
	int nr_pages;
382
	pgoff_t uninitialized_var(writeback_index);
383 384
	pgoff_t index;
	pgoff_t end;
385 386
	pgoff_t done_index;
	int cycled;
387
	int range_whole = 0;
388
	int tag;
389 390 391

	pagevec_init(&pvec, 0);
	if (wbc->range_cyclic) {
392 393 394 395 396 397
		writeback_index = mapping->writeback_index; /* prev offset */
		index = writeback_index;
		if (index == 0)
			cycled = 1;
		else
			cycled = 0;
398 399
		end = -1;
	} else {
400 401
		index = wbc->range_start >> PAGE_SHIFT;
		end = wbc->range_end >> PAGE_SHIFT;
402 403
		if (wbc->range_start == 0 && wbc->range_end == LLONG_MAX)
			range_whole = 1;
404
		cycled = 1; /* ignore range_cyclic tests */
405
	}
406 407 408 409
	if (wbc->sync_mode == WB_SYNC_ALL || wbc->tagged_writepages)
		tag = PAGECACHE_TAG_TOWRITE;
	else
		tag = PAGECACHE_TAG_DIRTY;
410 411

retry:
412 413 414 415 416 417 418 419 420 421
	if (wbc->sync_mode == WB_SYNC_ALL || wbc->tagged_writepages)
		tag_pages_for_writeback(mapping, index, end);
	done_index = index;
	while (!done && (index <= end)) {
		nr_pages = pagevec_lookup_tag(&pvec, mapping, &index, tag,
			      min(end - index, (pgoff_t)PAGEVEC_SIZE-1) + 1);
		if (nr_pages == 0)
			break;

		ret = gfs2_write_jdata_pagevec(mapping, wbc, &pvec, nr_pages, end, &done_index);
422 423 424 425 426 427 428 429
		if (ret)
			done = 1;
		if (ret > 0)
			ret = 0;
		pagevec_release(&pvec);
		cond_resched();
	}

430
	if (!cycled && !done) {
431
		/*
432
		 * range_cyclic:
433 434 435
		 * We hit the last page and there is more work to be done: wrap
		 * back to the start of the file
		 */
436
		cycled = 1;
437
		index = 0;
438
		end = writeback_index - 1;
439 440 441 442
		goto retry;
	}

	if (wbc->range_cyclic || (range_whole && wbc->nr_to_write > 0))
443 444
		mapping->writeback_index = done_index;

445 446 447 448 449 450 451 452 453 454 455 456 457 458 459 460 461 462 463 464
	return ret;
}


/**
 * gfs2_jdata_writepages - Write a bunch of dirty pages back to disk
 * @mapping: The mapping to write
 * @wbc: The writeback control
 * 
 */

static int gfs2_jdata_writepages(struct address_space *mapping,
				 struct writeback_control *wbc)
{
	struct gfs2_inode *ip = GFS2_I(mapping->host);
	struct gfs2_sbd *sdp = GFS2_SB(mapping->host);
	int ret;

	ret = gfs2_write_cache_jdata(mapping, wbc);
	if (ret == 0 && wbc->sync_mode == WB_SYNC_ALL) {
465
		gfs2_log_flush(sdp, ip->i_gl, NORMAL_FLUSH);
466 467 468 469 470
		ret = gfs2_write_cache_jdata(mapping, wbc);
	}
	return ret;
}

D
David Teigland 已提交
471 472 473 474 475 476 477 478 479 480 481
/**
 * stuffed_readpage - Fill in a Linux page with stuffed file data
 * @ip: the inode
 * @page: the page
 *
 * Returns: errno
 */

static int stuffed_readpage(struct gfs2_inode *ip, struct page *page)
{
	struct buffer_head *dibh;
482
	u64 dsize = i_size_read(&ip->i_inode);
D
David Teigland 已提交
483 484 485
	void *kaddr;
	int error;

486
	/*
N
Nick Piggin 已提交
487
	 * Due to the order of unstuffing files and ->fault(), we can be
488 489 490 491
	 * asked for a zero page in the case of a stuffed file being extended,
	 * so we need to supply one here. It doesn't happen often.
	 */
	if (unlikely(page->index)) {
492
		zero_user(page, 0, PAGE_SIZE);
493
		SetPageUptodate(page);
494 495
		return 0;
	}
S
Steven Whitehouse 已提交
496

D
David Teigland 已提交
497 498 499 500
	error = gfs2_meta_inode_buffer(ip, &dibh);
	if (error)
		return error;

501
	kaddr = kmap_atomic(page);
502 503 504
	if (dsize > (dibh->b_size - sizeof(struct gfs2_dinode)))
		dsize = (dibh->b_size - sizeof(struct gfs2_dinode));
	memcpy(kaddr, dibh->b_data + sizeof(struct gfs2_dinode), dsize);
505
	memset(kaddr + dsize, 0, PAGE_SIZE - dsize);
506
	kunmap_atomic(kaddr);
507
	flush_dcache_page(page);
D
David Teigland 已提交
508 509 510 511 512 513 514 515
	brelse(dibh);
	SetPageUptodate(page);

	return 0;
}


/**
516 517
 * __gfs2_readpage - readpage
 * @file: The file to read a page for
D
David Teigland 已提交
518 519
 * @page: The page to read
 *
520 521 522 523
 * This is the core of gfs2's readpage. Its used by the internal file
 * reading code as in that case we already hold the glock. Also its
 * called by gfs2_readpage() once the required lock has been granted.
 *
D
David Teigland 已提交
524 525
 */

526
static int __gfs2_readpage(void *file, struct page *page)
D
David Teigland 已提交
527
{
528 529
	struct gfs2_inode *ip = GFS2_I(page->mapping->host);
	struct gfs2_sbd *sdp = GFS2_SB(page->mapping->host);
D
David Teigland 已提交
530 531
	int error;

532
	if (gfs2_is_stuffed(ip)) {
S
Steven Whitehouse 已提交
533 534
		error = stuffed_readpage(ip, page);
		unlock_page(page);
535
	} else {
536
		error = mpage_readpage(page, gfs2_block_map);
537
	}
D
David Teigland 已提交
538 539

	if (unlikely(test_bit(SDF_SHUTDOWN, &sdp->sd_flags)))
540
		return -EIO;
D
David Teigland 已提交
541

542 543 544 545 546 547 548 549
	return error;
}

/**
 * gfs2_readpage - read a page of a file
 * @file: The file to read
 * @page: The page of the file
 *
550 551 552
 * This deals with the locking required. We have to unlock and
 * relock the page in order to get the locking in the right
 * order.
553 554 555 556
 */

static int gfs2_readpage(struct file *file, struct page *page)
{
557 558
	struct address_space *mapping = page->mapping;
	struct gfs2_inode *ip = GFS2_I(mapping->host);
559
	struct gfs2_holder gh;
560 561
	int error;

562
	unlock_page(page);
563 564
	gfs2_holder_init(ip->i_gl, LM_ST_SHARED, 0, &gh);
	error = gfs2_glock_nq(&gh);
565
	if (unlikely(error))
566
		goto out;
567 568 569 570 571 572
	error = AOP_TRUNCATED_PAGE;
	lock_page(page);
	if (page->mapping == mapping && !PageUptodate(page))
		error = __gfs2_readpage(file, page);
	else
		unlock_page(page);
573
	gfs2_glock_dq(&gh);
574
out:
575
	gfs2_holder_uninit(&gh);
576 577
	if (error && error != AOP_TRUNCATED_PAGE)
		lock_page(page);
578 579 580 581 582 583 584 585 586 587 588 589
	return error;
}

/**
 * gfs2_internal_read - read an internal file
 * @ip: The gfs2 inode
 * @buf: The buffer to fill
 * @pos: The file position
 * @size: The amount to read
 *
 */

590 591
int gfs2_internal_read(struct gfs2_inode *ip, char *buf, loff_t *pos,
                       unsigned size)
592 593
{
	struct address_space *mapping = ip->i_inode.i_mapping;
594 595
	unsigned long index = *pos / PAGE_SIZE;
	unsigned offset = *pos & (PAGE_SIZE - 1);
596 597 598 599 600 601 602
	unsigned copied = 0;
	unsigned amt;
	struct page *page;
	void *p;

	do {
		amt = size - copied;
603 604
		if (offset + size > PAGE_SIZE)
			amt = PAGE_SIZE - offset;
605 606 607
		page = read_cache_page(mapping, index, __gfs2_readpage, NULL);
		if (IS_ERR(page))
			return PTR_ERR(page);
608
		p = kmap_atomic(page);
609
		memcpy(buf + copied, p + offset, amt);
610
		kunmap_atomic(p);
611
		put_page(page);
612 613 614 615 616 617
		copied += amt;
		index++;
		offset = 0;
	} while(copied < size);
	(*pos) += size;
	return size;
S
Steven Whitehouse 已提交
618 619 620 621
}

/**
 * gfs2_readpages - Read a bunch of pages at once
F
Fabian Frederick 已提交
622 623 624 625
 * @file: The file to read from
 * @mapping: Address space info
 * @pages: List of pages to read
 * @nr_pages: Number of pages to read
S
Steven Whitehouse 已提交
626 627 628 629 630 631 632
 *
 * Some notes:
 * 1. This is only for readahead, so we can simply ignore any things
 *    which are slightly inconvenient (such as locking conflicts between
 *    the page lock and the glock) and return having done no I/O. Its
 *    obviously not something we'd want to do on too regular a basis.
 *    Any I/O we ignore at this time will be done via readpage later.
633
 * 2. We don't handle stuffed files here we let readpage do the honours.
S
Steven Whitehouse 已提交
634
 * 3. mpage_readpages() does most of the heavy lifting in the common case.
635
 * 4. gfs2_block_map() is relied upon to set BH_Boundary in the right places.
S
Steven Whitehouse 已提交
636
 */
637

S
Steven Whitehouse 已提交
638 639 640 641
static int gfs2_readpages(struct file *file, struct address_space *mapping,
			  struct list_head *pages, unsigned nr_pages)
{
	struct inode *inode = mapping->host;
642 643
	struct gfs2_inode *ip = GFS2_I(inode);
	struct gfs2_sbd *sdp = GFS2_SB(inode);
S
Steven Whitehouse 已提交
644
	struct gfs2_holder gh;
645
	int ret;
S
Steven Whitehouse 已提交
646

647 648
	gfs2_holder_init(ip->i_gl, LM_ST_SHARED, 0, &gh);
	ret = gfs2_glock_nq(&gh);
649
	if (unlikely(ret))
650
		goto out_uninit;
651
	if (!gfs2_is_stuffed(ip))
652
		ret = mpage_readpages(mapping, pages, nr_pages, gfs2_block_map);
653 654 655
	gfs2_glock_dq(&gh);
out_uninit:
	gfs2_holder_uninit(&gh);
S
Steven Whitehouse 已提交
656 657 658
	if (unlikely(test_bit(SDF_SHUTDOWN, &sdp->sd_flags)))
		ret = -EIO;
	return ret;
D
David Teigland 已提交
659 660 661
}

/**
S
Steven Whitehouse 已提交
662
 * gfs2_write_begin - Begin to write to a file
D
David Teigland 已提交
663
 * @file: The file to write to
S
Steven Whitehouse 已提交
664 665 666 667 668 669
 * @mapping: The mapping in which to write
 * @pos: The file offset at which to start writing
 * @len: Length of the write
 * @flags: Various flags
 * @pagep: Pointer to return the page
 * @fsdata: Pointer to return fs data (unused by GFS2)
D
David Teigland 已提交
670 671 672 673
 *
 * Returns: errno
 */

S
Steven Whitehouse 已提交
674 675 676
static int gfs2_write_begin(struct file *file, struct address_space *mapping,
			    loff_t pos, unsigned len, unsigned flags,
			    struct page **pagep, void **fsdata)
D
David Teigland 已提交
677
{
S
Steven Whitehouse 已提交
678 679
	struct gfs2_inode *ip = GFS2_I(mapping->host);
	struct gfs2_sbd *sdp = GFS2_SB(mapping->host);
680
	struct gfs2_inode *m_ip = GFS2_I(sdp->sd_statfs_inode);
681
	unsigned int data_blocks = 0, ind_blocks = 0, rblocks;
682
	unsigned requested = 0;
683
	int alloc_required;
D
David Teigland 已提交
684
	int error = 0;
685 686
	pgoff_t index = pos >> PAGE_SHIFT;
	unsigned from = pos & (PAGE_SIZE - 1);
S
Steven Whitehouse 已提交
687
	struct page *page;
688

689 690
	gfs2_holder_init(ip->i_gl, LM_ST_EXCLUSIVE, 0, &ip->i_gh);
	error = gfs2_glock_nq(&ip->i_gh);
S
Steven Whitehouse 已提交
691
	if (unlikely(error))
692
		goto out_uninit;
693 694 695 696 697 698 699 700
	if (&ip->i_inode == sdp->sd_rindex) {
		error = gfs2_glock_nq_init(m_ip->i_gl, LM_ST_EXCLUSIVE,
					   GL_NOCACHE, &m_ip->i_gh);
		if (unlikely(error)) {
			gfs2_glock_dq(&ip->i_gh);
			goto out_uninit;
		}
	}
D
David Teigland 已提交
701

702
	alloc_required = gfs2_write_alloc_required(ip, pos, len);
703

704 705 706
	if (alloc_required || gfs2_is_jdata(ip))
		gfs2_write_calc_reserv(ip, len, &data_blocks, &ind_blocks);

707
	if (alloc_required) {
708
		struct gfs2_alloc_parms ap = { .aflags = 0, };
709 710 711
		requested = data_blocks + ind_blocks;
		ap.target = requested;
		error = gfs2_quota_lock_check(ip, &ap);
712
		if (error)
713
			goto out_unlock;
714

715
		error = gfs2_inplace_reserve(ip, &ap);
716 717 718 719 720 721 722 723 724
		if (error)
			goto out_qunlock;
	}

	rblocks = RES_DINODE + ind_blocks;
	if (gfs2_is_jdata(ip))
		rblocks += data_blocks ? data_blocks : 1;
	if (ind_blocks || data_blocks)
		rblocks += RES_STATFS + RES_QUOTA;
725 726
	if (&ip->i_inode == sdp->sd_rindex)
		rblocks += 2 * RES_STATFS;
727
	if (alloc_required)
728
		rblocks += gfs2_rg_blocks(ip, requested);
729

730
	error = gfs2_trans_begin(sdp, rblocks,
731
				 PAGE_SIZE/sdp->sd_sb.sb_bsize);
732
	if (error)
733
		goto out_trans_fail;
734

735
	error = -ENOMEM;
736
	flags |= AOP_FLAG_NOFS;
737
	page = grab_cache_page_write_begin(mapping, index, flags);
738 739 740 741
	*pagep = page;
	if (unlikely(!page))
		goto out_endtrans;

742
	if (gfs2_is_stuffed(ip)) {
743
		error = 0;
S
Steven Whitehouse 已提交
744
		if (pos + len > sdp->sd_sb.sb_bsize - sizeof(struct gfs2_dinode)) {
745
			error = gfs2_unstuff_dinode(ip, page);
746 747
			if (error == 0)
				goto prepare_write;
748
		} else if (!PageUptodate(page)) {
D
David Teigland 已提交
749
			error = stuffed_readpage(ip, page);
750
		}
751
		goto out;
752 753
	}

754
prepare_write:
C
Christoph Hellwig 已提交
755
	error = __block_write_begin(page, from, len, gfs2_block_map);
756
out:
757 758 759
	if (error == 0)
		return 0;

M
Maxim 已提交
760
	unlock_page(page);
761
	put_page(page);
762

S
Steven Whitehouse 已提交
763
	gfs2_trans_end(sdp);
764
	if (pos + len > ip->i_inode.i_size)
S
Steven Whitehouse 已提交
765 766 767
		gfs2_trim_blocks(&ip->i_inode);
	goto out_trans_fail;

768 769
out_endtrans:
	gfs2_trans_end(sdp);
770
out_trans_fail:
771 772
	if (alloc_required) {
		gfs2_inplace_release(ip);
773
out_qunlock:
774 775
		gfs2_quota_unlock(ip);
	}
776
out_unlock:
777 778 779 780
	if (&ip->i_inode == sdp->sd_rindex) {
		gfs2_glock_dq(&m_ip->i_gh);
		gfs2_holder_uninit(&m_ip->i_gh);
	}
781
	gfs2_glock_dq(&ip->i_gh);
782
out_uninit:
783
	gfs2_holder_uninit(&ip->i_gh);
D
David Teigland 已提交
784 785 786
	return error;
}

787 788 789 790 791 792 793
/**
 * adjust_fs_space - Adjusts the free space available due to gfs2_grow
 * @inode: the rindex inode
 */
static void adjust_fs_space(struct inode *inode)
{
	struct gfs2_sbd *sdp = inode->i_sb->s_fs_info;
794 795
	struct gfs2_inode *m_ip = GFS2_I(sdp->sd_statfs_inode);
	struct gfs2_inode *l_ip = GFS2_I(sdp->sd_sc_inode);
796 797
	struct gfs2_statfs_change_host *m_sc = &sdp->sd_statfs_master;
	struct gfs2_statfs_change_host *l_sc = &sdp->sd_statfs_local;
798
	struct buffer_head *m_bh, *l_bh;
799 800 801 802
	u64 fs_total, new_free;

	/* Total up the file system space, according to the latest rindex. */
	fs_total = gfs2_ri_total(sdp);
803 804
	if (gfs2_meta_inode_buffer(m_ip, &m_bh) != 0)
		return;
805 806

	spin_lock(&sdp->sd_statfs_spin);
807 808
	gfs2_statfs_change_in(m_sc, m_bh->b_data +
			      sizeof(struct gfs2_dinode));
809 810 811 812 813
	if (fs_total > (m_sc->sc_total + l_sc->sc_total))
		new_free = fs_total - (m_sc->sc_total + l_sc->sc_total);
	else
		new_free = 0;
	spin_unlock(&sdp->sd_statfs_spin);
814 815
	fs_warn(sdp, "File system extended by %llu blocks.\n",
		(unsigned long long)new_free);
816
	gfs2_statfs_change(sdp, new_free, new_free, 0);
817 818 819 820 821 822 823

	if (gfs2_meta_inode_buffer(l_ip, &l_bh) != 0)
		goto out;
	update_statfs(sdp, m_bh, l_bh);
	brelse(l_bh);
out:
	brelse(m_bh);
824 825
}

D
David Teigland 已提交
826
/**
 * gfs2_stuffed_write_end - Write end for stuffed files
 * @inode: The inode
 * @dibh: The buffer_head containing the on-disk inode
 * @pos: The file position
 * @len: The length of the write
 * @copied: How much was actually copied by the VFS
 * @page: The page
 *
 * This copies the data from the page into the inode block after
 * the inode data structure itself. The page is unlocked and released,
 * @dibh is released, the transaction is ended and the glock(s) held in
 * ip->i_gh (and the statfs inode's i_gh for the rindex inode) are dropped.
 *
 * Returns: @copied
 */
static int gfs2_stuffed_write_end(struct inode *inode, struct buffer_head *dibh,
				  loff_t pos, unsigned len, unsigned copied,
				  struct page *page)
{
	struct gfs2_inode *ip = GFS2_I(inode);
	struct gfs2_sbd *sdp = GFS2_SB(inode);
	struct gfs2_inode *m_ip = GFS2_I(sdp->sd_statfs_inode);
	u64 to = pos + copied;
	void *kaddr;
	unsigned char *buf = dibh->b_data + sizeof(struct gfs2_dinode);

	BUG_ON((pos + len) > (dibh->b_size - sizeof(struct gfs2_dinode)));
	kaddr = kmap_atomic(page);
	memcpy(buf + pos, kaddr + pos, copied);
	flush_dcache_page(page);
	kunmap_atomic(kaddr);

	WARN_ON(!PageUptodate(page));
	unlock_page(page);
	put_page(page);

	if (copied) {
		if (inode->i_size < to)
			i_size_write(inode, to);
		mark_inode_dirty(inode);
	}

	if (inode == sdp->sd_rindex) {
		adjust_fs_space(inode);
		sdp->sd_rindex_uptodate = 0;
	}

	brelse(dibh);
	gfs2_trans_end(sdp);
	if (inode == sdp->sd_rindex) {
		gfs2_glock_dq(&m_ip->i_gh);
		gfs2_holder_uninit(&m_ip->i_gh);
	}
	gfs2_glock_dq(&ip->i_gh);
	gfs2_holder_uninit(&ip->i_gh);
	return copied;
}

/**
 * gfs2_write_end
D
David Teigland 已提交
885
 * @file: The file to write to
S
Steven Whitehouse 已提交
886 887 888
 * @mapping: The address space to write to
 * @pos: The file position
 * @len: The length of the data
F
Fabian Frederick 已提交
889
 * @copied: How much was actually copied by the VFS
S
Steven Whitehouse 已提交
890 891 892 893 894 895
 * @page: The page that has been written
 * @fsdata: The fsdata (unused in GFS2)
 *
 * The main write_end function for GFS2. We have a separate one for
 * stuffed files as they are slightly different, otherwise we just
 * put our locking around the VFS provided functions.
D
David Teigland 已提交
896 897 898 899
 *
 * Returns: errno
 */

S
Steven Whitehouse 已提交
900 901 902
static int gfs2_write_end(struct file *file, struct address_space *mapping,
			  loff_t pos, unsigned len, unsigned copied,
			  struct page *page, void *fsdata)
D
David Teigland 已提交
903 904
{
	struct inode *inode = page->mapping->host;
905 906
	struct gfs2_inode *ip = GFS2_I(inode);
	struct gfs2_sbd *sdp = GFS2_SB(inode);
907
	struct gfs2_inode *m_ip = GFS2_I(sdp->sd_statfs_inode);
908
	struct buffer_head *dibh;
909
	unsigned int from = pos & (PAGE_SIZE - 1);
S
Steven Whitehouse 已提交
910 911
	unsigned int to = from + len;
	int ret;
912 913
	struct gfs2_trans *tr = current->journal_info;
	BUG_ON(!tr);
D
David Teigland 已提交
914

915
	BUG_ON(gfs2_glock_is_locked_by_me(ip->i_gl) == NULL);
916

S
Steven Whitehouse 已提交
917 918 919
	ret = gfs2_meta_inode_buffer(ip, &dibh);
	if (unlikely(ret)) {
		unlock_page(page);
920
		put_page(page);
S
Steven Whitehouse 已提交
921 922
		goto failed;
	}
923

S
Steven Whitehouse 已提交
924 925
	if (gfs2_is_stuffed(ip))
		return gfs2_stuffed_write_end(inode, dibh, pos, len, copied, page);
D
David Teigland 已提交
926

927
	if (!gfs2_is_writeback(ip))
S
Steven Whitehouse 已提交
928
		gfs2_page_add_databufs(ip, page, from, to);
D
David Teigland 已提交
929

S
Steven Whitehouse 已提交
930
	ret = generic_write_end(file, mapping, pos, len, copied, page, fsdata);
931 932 933 934 935
	if (tr->tr_num_buf_new)
		__mark_inode_dirty(inode, I_DIRTY_DATASYNC);
	else
		gfs2_trans_add_meta(ip->i_gl, dibh);

936

937
	if (inode == sdp->sd_rindex) {
938
		adjust_fs_space(inode);
939
		sdp->sd_rindex_uptodate = 0;
940
	}
941

942
	brelse(dibh);
S
Steven Whitehouse 已提交
943
failed:
944
	gfs2_trans_end(sdp);
945
	gfs2_inplace_release(ip);
946
	if (ip->i_qadata && ip->i_qadata->qa_qd_num)
947
		gfs2_quota_unlock(ip);
948 949 950 951
	if (inode == sdp->sd_rindex) {
		gfs2_glock_dq(&m_ip->i_gh);
		gfs2_holder_uninit(&m_ip->i_gh);
	}
S
Steven Whitehouse 已提交
952
	gfs2_glock_dq(&ip->i_gh);
953
	gfs2_holder_uninit(&ip->i_gh);
S
Steven Whitehouse 已提交
954
	return ret;
D
David Teigland 已提交
955 956
}

957 958 959 960 961 962 963 964 965
/**
 * gfs2_set_page_dirty - Page dirtying function
 * @page: The page to dirty
 *
 * Sets PageChecked on the page before handing it to
 * __set_page_dirty_buffers().
 *
 * Returns: 1 if it dirtied the page, or 0 otherwise
 */

static int gfs2_set_page_dirty(struct page *page)
{
	SetPageChecked(page);
	return __set_page_dirty_buffers(page);
}

D
David Teigland 已提交
970 971 972 973 974 975 976 977 978 979
/**
 * gfs2_bmap - Block map function
 * @mapping: Address space info
 * @lblock: The block to map
 *
 * The inode glock is taken in shared mode around the lookup. Stuffed
 * files are never looked up and always yield 0.
 *
 * Returns: The disk address for the block or 0 on hole or error
 */

static sector_t gfs2_bmap(struct address_space *mapping, sector_t lblock)
{
	struct gfs2_inode *ip = GFS2_I(mapping->host);
	struct gfs2_holder i_gh;
	sector_t dblock = 0;
	int error;

	error = gfs2_glock_nq_init(ip->i_gl, LM_ST_SHARED, LM_FLAG_ANY, &i_gh);
	if (error)
		return 0;

	if (!gfs2_is_stuffed(ip))
		dblock = generic_block_bmap(mapping, lblock, gfs2_block_map);

	gfs2_glock_dq_uninit(&i_gh);

	return dblock;
}

997 998 999 1000 1001 1002 1003 1004 1005
static void gfs2_discard(struct gfs2_sbd *sdp, struct buffer_head *bh)
{
	struct gfs2_bufdata *bd;

	lock_buffer(bh);
	gfs2_log_lock(sdp);
	clear_buffer_dirty(bh);
	bd = bh->b_private;
	if (bd) {
1006 1007
		if (!list_empty(&bd->bd_list) && !buffer_pinned(bh))
			list_del_init(&bd->bd_list);
1008
		else
1009
			gfs2_remove_from_journal(bh, REMOVE_JDATA);
1010 1011 1012 1013 1014 1015 1016 1017 1018
	}
	bh->b_bdev = NULL;
	clear_buffer_mapped(bh);
	clear_buffer_req(bh);
	clear_buffer_new(bh);
	gfs2_log_unlock(sdp);
	unlock_buffer(bh);
}

1019 1020
static void gfs2_invalidatepage(struct page *page, unsigned int offset,
				unsigned int length)
D
David Teigland 已提交
1021
{
1022
	struct gfs2_sbd *sdp = GFS2_SB(page->mapping->host);
1023
	unsigned int stop = offset + length;
1024
	int partial_page = (offset || length < PAGE_SIZE);
1025 1026 1027
	struct buffer_head *bh, *head;
	unsigned long pos = 0;

D
David Teigland 已提交
1028
	BUG_ON(!PageLocked(page));
1029
	if (!partial_page)
1030
		ClearPageChecked(page);
1031 1032
	if (!page_has_buffers(page))
		goto out;
D
David Teigland 已提交
1033

1034 1035
	bh = head = page_buffers(page);
	do {
1036 1037 1038
		if (pos + bh->b_size > stop)
			return;

1039 1040 1041 1042 1043 1044
		if (offset <= pos)
			gfs2_discard(sdp, bh);
		pos += bh->b_size;
		bh = bh->b_this_page;
	} while (bh != head);
out:
1045
	if (!partial_page)
1046
		try_to_release_page(page, 0);
D
David Teigland 已提交
1047 1048
}

S
Steven Whitehouse 已提交
1049 1050 1051 1052 1053 1054 1055 1056
/**
 * gfs2_ok_for_dio - check that dio is valid on this file
 * @ip: The inode
 * @offset: The offset at which we are reading or writing
 *
 * Returns: 0 (to ignore the i/o request and thus fall back to buffered i/o)
 *          1 (to accept the i/o request)
 */
1057
static int gfs2_ok_for_dio(struct gfs2_inode *ip, loff_t offset)
S
Steven Whitehouse 已提交
1058 1059 1060
{
	/*
	 * Should we return an error here? I can't see that O_DIRECT for
1061 1062
	 * a stuffed file makes any sense. For now we'll silently fall
	 * back to buffered I/O
S
Steven Whitehouse 已提交
1063 1064 1065 1066
	 */
	if (gfs2_is_stuffed(ip))
		return 0;

1067
	if (offset >= i_size_read(&ip->i_inode))
S
Steven Whitehouse 已提交
1068 1069 1070 1071 1072 1073
		return 0;
	return 1;
}



1074
static ssize_t gfs2_direct_IO(struct kiocb *iocb, struct iov_iter *iter)
1075 1076 1077
{
	struct file *file = iocb->ki_filp;
	struct inode *inode = file->f_mapping->host;
1078
	struct address_space *mapping = inode->i_mapping;
1079
	struct gfs2_inode *ip = GFS2_I(inode);
1080
	loff_t offset = iocb->ki_pos;
1081 1082 1083 1084
	struct gfs2_holder gh;
	int rv;

	/*
S
Steven Whitehouse 已提交
1085 1086 1087 1088 1089 1090
	 * Deferred lock, even if its a write, since we do no allocation
	 * on this path. All we need change is atime, and this lock mode
	 * ensures that other nodes have flushed their buffered read caches
	 * (i.e. their page cache entries for this inode). We do not,
	 * unfortunately have the option of only flushing a range like
	 * the VFS does.
1091
	 */
1092 1093
	gfs2_holder_init(ip->i_gl, LM_ST_DEFERRED, 0, &gh);
	rv = gfs2_glock_nq(&gh);
1094
	if (rv)
1095
		goto out_uninit;
1096
	rv = gfs2_ok_for_dio(ip, offset);
S
Steven Whitehouse 已提交
1097 1098 1099
	if (rv != 1)
		goto out; /* dio not valid, fall back to buffered i/o */

1100 1101 1102 1103 1104 1105 1106 1107 1108 1109 1110 1111 1112 1113
	/*
	 * Now since we are holding a deferred (CW) lock at this point, you
	 * might be wondering why this is ever needed. There is a case however
	 * where we've granted a deferred local lock against a cached exclusive
	 * glock. That is ok provided all granted local locks are deferred, but
	 * it also means that it is possible to encounter pages which are
	 * cached and possibly also mapped. So here we check for that and sort
	 * them out ahead of the dio. The glock state machine will take care of
	 * everything else.
	 *
	 * If in fact the cached glock state (gl->gl_state) is deferred (CW) in
	 * the first place, mapping->nr_pages will always be zero.
	 */
	if (mapping->nrpages) {
1114
		loff_t lstart = offset & ~(PAGE_SIZE - 1);
1115
		loff_t len = iov_iter_count(iter);
1116 1117 1118 1119 1120 1121 1122 1123 1124
		loff_t end = PAGE_ALIGN(offset + len) - 1;

		rv = 0;
		if (len == 0)
			goto out;
		if (test_and_clear_bit(GIF_SW_PAGED, &ip->i_flags))
			unmap_shared_mapping_range(ip->i_inode.i_mapping, offset, len);
		rv = filemap_write_and_wait_range(mapping, lstart, end);
		if (rv)
1125
			goto out;
1126
		if (iov_iter_rw(iter) == WRITE)
1127
			truncate_inode_pages_range(mapping, lstart, end);
1128 1129
	}

1130
	rv = __blockdev_direct_IO(iocb, inode, inode->i_sb->s_bdev, iter,
1131
				  gfs2_get_block_direct, NULL, NULL, 0);
1132
out:
1133
	gfs2_glock_dq(&gh);
1134
out_uninit:
1135 1136 1137 1138
	gfs2_holder_uninit(&gh);
	return rv;
}

S
Steven Whitehouse 已提交
1139
/**
1140
 * gfs2_releasepage - free the metadata associated with a page
S
Steven Whitehouse 已提交
1141 1142 1143 1144 1145 1146 1147 1148 1149 1150 1151
 * @page: the page that's being released
 * @gfp_mask: passed from Linux VFS, ignored by us
 *
 * Call try_to_free_buffers() if the buffers in this page can be
 * released.
 *
 * Returns: 0
 */

int gfs2_releasepage(struct page *page, gfp_t gfp_mask)
{
1152 1153
	struct address_space *mapping = page->mapping;
	struct gfs2_sbd *sdp = gfs2_mapping2sbd(mapping);
S
Steven Whitehouse 已提交
1154 1155 1156 1157
	struct buffer_head *bh, *head;
	struct gfs2_bufdata *bd;

	if (!page_has_buffers(page))
1158
		return 0;
S
Steven Whitehouse 已提交
1159

1160 1161 1162 1163 1164 1165 1166 1167 1168 1169
	/*
	 * From xfs_vm_releasepage: mm accommodates an old ext3 case where
	 * clean pages might not have had the dirty bit cleared.  Thus, it can
	 * send actual dirty pages to ->releasepage() via shrink_active_list().
	 *
	 * As a workaround, we skip pages that contain dirty buffers below.
	 * Once ->releasepage isn't called on dirty pages anymore, we can warn
	 * on dirty buffers like we used to here again.
	 */

1170
	gfs2_log_lock(sdp);
1171
	spin_lock(&sdp->sd_ail_lock);
S
Steven Whitehouse 已提交
1172 1173
	head = bh = page_buffers(page);
	do {
1174 1175 1176
		if (atomic_read(&bh->b_count))
			goto cannot_release;
		bd = bh->b_private;
1177
		if (bd && bd->bd_tr)
1178
			goto cannot_release;
1179 1180
		if (buffer_dirty(bh) || WARN_ON(buffer_pinned(bh)))
			goto cannot_release;
1181 1182
		bh = bh->b_this_page;
	} while(bh != head);
1183
	spin_unlock(&sdp->sd_ail_lock);
S
Steven Whitehouse 已提交
1184

1185 1186
	head = bh = page_buffers(page);
	do {
S
Steven Whitehouse 已提交
1187 1188 1189
		bd = bh->b_private;
		if (bd) {
			gfs2_assert_warn(sdp, bd->bd_bh == bh);
S
Steven Whitehouse 已提交
1190 1191 1192
			if (!list_empty(&bd->bd_list))
				list_del_init(&bd->bd_list);
			bd->bd_bh = NULL;
S
Steven Whitehouse 已提交
1193
			bh->b_private = NULL;
1194
			kmem_cache_free(gfs2_bufdata_cachep, bd);
S
Steven Whitehouse 已提交
1195
		}
S
Steven Whitehouse 已提交
1196 1197

		bh = bh->b_this_page;
1198
	} while (bh != head);
S
Steven Whitehouse 已提交
1199
	gfs2_log_unlock(sdp);
S
Steven Whitehouse 已提交
1200 1201

	return try_to_free_buffers(page);
1202

1203
cannot_release:
1204
	spin_unlock(&sdp->sd_ail_lock);
1205 1206
	gfs2_log_unlock(sdp);
	return 0;
S
Steven Whitehouse 已提交
1207 1208
}

1209
static const struct address_space_operations gfs2_writeback_aops = {
1210
	.writepage = gfs2_writepage,
1211
	.writepages = gfs2_writepages,
1212 1213 1214 1215 1216 1217 1218 1219
	.readpage = gfs2_readpage,
	.readpages = gfs2_readpages,
	.write_begin = gfs2_write_begin,
	.write_end = gfs2_write_end,
	.bmap = gfs2_bmap,
	.invalidatepage = gfs2_invalidatepage,
	.releasepage = gfs2_releasepage,
	.direct_IO = gfs2_direct_IO,
1220
	.migratepage = buffer_migrate_page,
1221
	.is_partially_uptodate = block_is_partially_uptodate,
1222
	.error_remove_page = generic_error_remove_page,
1223 1224 1225
};

static const struct address_space_operations gfs2_ordered_aops = {
1226
	.writepage = gfs2_writepage,
1227
	.writepages = gfs2_writepages,
D
David Teigland 已提交
1228
	.readpage = gfs2_readpage,
S
Steven Whitehouse 已提交
1229
	.readpages = gfs2_readpages,
S
Steven Whitehouse 已提交
1230 1231
	.write_begin = gfs2_write_begin,
	.write_end = gfs2_write_end,
1232
	.set_page_dirty = gfs2_set_page_dirty,
D
David Teigland 已提交
1233 1234
	.bmap = gfs2_bmap,
	.invalidatepage = gfs2_invalidatepage,
S
Steven Whitehouse 已提交
1235
	.releasepage = gfs2_releasepage,
D
David Teigland 已提交
1236
	.direct_IO = gfs2_direct_IO,
1237
	.migratepage = buffer_migrate_page,
1238
	.is_partially_uptodate = block_is_partially_uptodate,
1239
	.error_remove_page = generic_error_remove_page,
D
David Teigland 已提交
1240 1241
};

1242
static const struct address_space_operations gfs2_jdata_aops = {
1243
	.writepage = gfs2_jdata_writepage,
1244
	.writepages = gfs2_jdata_writepages,
1245 1246 1247 1248 1249 1250 1251 1252
	.readpage = gfs2_readpage,
	.readpages = gfs2_readpages,
	.write_begin = gfs2_write_begin,
	.write_end = gfs2_write_end,
	.set_page_dirty = gfs2_set_page_dirty,
	.bmap = gfs2_bmap,
	.invalidatepage = gfs2_invalidatepage,
	.releasepage = gfs2_releasepage,
1253
	.is_partially_uptodate = block_is_partially_uptodate,
1254
	.error_remove_page = generic_error_remove_page,
1255 1256 1257 1258 1259 1260 1261 1262 1263 1264 1265 1266 1267 1268 1269 1270
};

/*
 * gfs2_set_aops - install the address space operations for an inode
 * @inode: the inode whose mapping is being set up
 *
 * Picks the writeback, ordered or jdata operations table according to
 * which of gfs2_is_writeback(), gfs2_is_ordered() or gfs2_is_jdata()
 * holds first, in that order.  Hitting none of them is a BUG().
 */
void gfs2_set_aops(struct inode *inode)
{
	struct gfs2_inode *ip = GFS2_I(inode);
	const struct address_space_operations *aops;

	if (gfs2_is_writeback(ip))
		aops = &gfs2_writeback_aops;
	else if (gfs2_is_ordered(ip))
		aops = &gfs2_ordered_aops;
	else if (gfs2_is_jdata(ip))
		aops = &gfs2_jdata_aops;
	else
		BUG();

	inode->i_mapping->a_ops = aops;
}