/*
 *   Copyright (C) International Business Machines Corp., 2000-2005
 *   Portions Copyright (C) Christoph Hellwig, 2001-2002
 *
 *   This program is free software;  you can redistribute it and/or modify
 *   it under the terms of the GNU General Public License as published by
 *   the Free Software Foundation; either version 2 of the License, or
 *   (at your option) any later version.
 *
 *   This program is distributed in the hope that it will be useful,
 *   but WITHOUT ANY WARRANTY;  without even the implied warranty of
 *   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See
 *   the GNU General Public License for more details.
 *
 *   You should have received a copy of the GNU General Public License
 *   along with this program;  if not, write to the Free Software
 *   Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
 */

#include <linux/fs.h>
21
#include <linux/mm.h>
A
Alexey Dobriyan 已提交
22
#include <linux/module.h>
23
#include <linux/bio.h>
24
#include <linux/slab.h>
L
Linus Torvalds 已提交
25 26 27
#include <linux/init.h>
#include <linux/buffer_head.h>
#include <linux/mempool.h>
A
Alexey Dobriyan 已提交
28
#include <linux/seq_file.h>
L
Linus Torvalds 已提交
29 30 31 32 33 34 35 36 37 38 39 40 41 42 43
#include "jfs_incore.h"
#include "jfs_superblock.h"
#include "jfs_filsys.h"
#include "jfs_metapage.h"
#include "jfs_txnmgr.h"
#include "jfs_debug.h"

#ifdef CONFIG_JFS_STATISTICS
/*
 * Metapage counters, only built with CONFIG_JFS_STATISTICS.  They are
 * bumped through INCREMENT() in this file and printed by
 * jfs_mpstat_proc_show().
 */
static struct {
	uint	pagealloc;	/* # of page allocations */
	uint	pagefree;	/* # of page frees */
	uint	lockwait;	/* # of sleeping lock_metapage() calls */
} mpStat;
#endif

44
/* Non-zero while the META_locked bit is set in mp->flag. */
#define metapage_locked(mp) test_bit(META_locked, &(mp)->flag)
/*
 * Try to set META_locked.  The result is the bit's previous value, so a
 * non-zero result means the metapage was already locked and the lock was
 * NOT taken (see lock_metapage(), which sleeps in that case).
 */
#define trylock_metapage(mp) test_and_set_bit_lock(META_locked, &(mp)->flag)
L
Linus Torvalds 已提交
46 47 48

static inline void unlock_metapage(struct metapage *mp)
{
N
Nick Piggin 已提交
49
	clear_bit_unlock(META_locked, &mp->flag);
L
Linus Torvalds 已提交
50 51 52
	wake_up(&mp->wait);
}

53
static inline void __lock_metapage(struct metapage *mp)
L
Linus Torvalds 已提交
54 55 56 57 58 59 60
{
	DECLARE_WAITQUEUE(wait, current);
	INCREMENT(mpStat.lockwait);
	add_wait_queue_exclusive(&mp->wait, &wait);
	do {
		set_current_state(TASK_UNINTERRUPTIBLE);
		if (metapage_locked(mp)) {
61
			unlock_page(mp->page);
62
			io_schedule();
63
			lock_page(mp->page);
L
Linus Torvalds 已提交
64 65 66 67 68 69
		}
	} while (trylock_metapage(mp));
	__set_current_state(TASK_RUNNING);
	remove_wait_queue(&mp->wait, &wait);
}

70 71 72
/*
 * Take the metapage lock, sleeping in __lock_metapage() if it is already
 * held.
 *
 * Must have mp->page locked
 */
static inline void lock_metapage(struct metapage *mp)
{
	if (trylock_metapage(mp))
		__lock_metapage(mp);
}

#define METAPOOL_MIN_PAGES 32
80
static struct kmem_cache *metapage_cache;
L
Linus Torvalds 已提交
81 82
static mempool_t *metapage_mempool;

83 84 85 86 87 88 89 90 91
/* Number of PSIZE-sized metapages that fit in one page-cache page */
#define MPS_PER_PAGE (PAGE_CACHE_SIZE >> L2PSIZE)

#if MPS_PER_PAGE > 1

/*
 * Per-page bookkeeping used when one page holds several metapages.  It is
 * stored in the page's private field (see mp_anchor()).
 */
struct meta_anchor {
	int mp_count;		/* entries in mp[] that are in use */
	atomic_t io_count;	/* adjusted by inc_io() / dec_io() */
	struct metapage *mp[MPS_PER_PAGE];	/* one slot per metapage in the page */
};
H
Hugh Dickins 已提交
92
/* The meta_anchor stored in page's private field; only meaningful if PagePrivate */
#define mp_anchor(page) ((struct meta_anchor *)page_private(page))
93

94
static inline struct metapage *page_to_mp(struct page *page, int offset)
95 96 97 98 99 100 101 102 103 104 105 106 107 108 109
{
	if (!PagePrivate(page))
		return NULL;
	return mp_anchor(page)->mp[offset >> L2PSIZE];
}

static inline int insert_metapage(struct page *page, struct metapage *mp)
{
	struct meta_anchor *a;
	int index;
	int l2mp_blocks;	/* log2 blocks per metapage */

	if (PagePrivate(page))
		a = mp_anchor(page);
	else {
E
Eric Sesterhenn 已提交
110
		a = kzalloc(sizeof(struct meta_anchor), GFP_NOFS);
111 112
		if (!a)
			return -ENOMEM;
H
Hugh Dickins 已提交
113
		set_page_private(page, (unsigned long)a);
114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140
		SetPagePrivate(page);
		kmap(page);
	}

	if (mp) {
		l2mp_blocks = L2PSIZE - page->mapping->host->i_blkbits;
		index = (mp->index >> l2mp_blocks) & (MPS_PER_PAGE - 1);
		a->mp_count++;
		a->mp[index] = mp;
	}

	return 0;
}

/*
 * Detach @mp from @page.  When the last metapage goes away the anchor is
 * freed, the page's private state is cleared and the page is kunmap()ed.
 *
 * BUGs if the slot computed from mp->index does not hold @mp.
 */
static inline void remove_metapage(struct page *page, struct metapage *mp)
{
	struct meta_anchor *a = mp_anchor(page);
	int l2mp_blocks = L2PSIZE - page->mapping->host->i_blkbits;
	int index;

	index = (mp->index >> l2mp_blocks) & (MPS_PER_PAGE - 1);

	BUG_ON(a->mp[index] != mp);

	a->mp[index] = NULL;
	if (--a->mp_count == 0) {
		kfree(a);
		set_page_private(page, 0);
		ClearPagePrivate(page);
		kunmap(page);
	}
}

static inline void inc_io(struct page *page)
{
	atomic_inc(&mp_anchor(page)->io_count);
}

static inline void dec_io(struct page *page, void (*handler) (struct page *))
{
	if (atomic_dec_and_test(&mp_anchor(page)->io_count))
		handler(page);
}

#else
159
static inline struct metapage *page_to_mp(struct page *page, int offset)
160
{
H
Hugh Dickins 已提交
161
	return PagePrivate(page) ? (struct metapage *)page_private(page) : NULL;
162 163 164 165 166
}

/*
 * One metapage per page: store @mp directly in the page's private field.
 * A NULL @mp is a no-op.  Always returns 0.
 */
static inline int insert_metapage(struct page *page, struct metapage *mp)
{
	if (mp) {
		set_page_private(page, (unsigned long)mp);
		SetPagePrivate(page);
		/* paired with the kunmap() in remove_metapage() */
		kmap(page);
	}
	return 0;
}

/*
 * One metapage per page: clear the page's private state and kunmap() it.
 * @mp is unused in this variant.
 */
static inline void remove_metapage(struct page *page, struct metapage *mp)
{
	set_page_private(page, 0);
	ClearPagePrivate(page);
	kunmap(page);
}

/*
 * One metapage per page: there is no per-page I/O counter, so inc_io() does
 * nothing and dec_io() runs the completion handler straight away.
 */
#define inc_io(page) do {} while(0)
#define dec_io(page, handler) handler(page)

#endif

186
static void init_once(void *foo)
L
Linus Torvalds 已提交
187 188 189
{
	struct metapage *mp = (struct metapage *)foo;

C
Christoph Lameter 已提交
190 191 192 193 194 195 196 197
	mp->lid = 0;
	mp->lsn = 0;
	mp->flag = 0;
	mp->data = NULL;
	mp->clsn = 0;
	mp->log = NULL;
	set_bit(META_free, &mp->flag);
	init_waitqueue_head(&mp->wait);
L
Linus Torvalds 已提交
198 199
}

A
Al Viro 已提交
200
/* Allocate a struct metapage from metapage_mempool using @gfp_mask. */
static inline struct metapage *alloc_metapage(gfp_t gfp_mask)
{
	return mempool_alloc(metapage_mempool, gfp_mask);
}

/*
 * Return @mp to metapage_mempool.  Its flag word is reset so that only
 * META_free is set, matching the state init_once() leaves it in.
 */
static inline void free_metapage(struct metapage *mp)
{
	mp->flag = 0;
	set_bit(META_free, &mp->flag);

	mempool_free(mp, metapage_mempool);
}

/*
 * Create the metapage slab cache and the mempool layered on top of it.
 *
 * Returns 0 on success, -ENOMEM if either allocation fails (the cache is
 * destroyed again if only the mempool could not be created).
 */
int __init metapage_init(void)
{
	/*
	 * Allocate the metapage structures
	 */
	metapage_cache = kmem_cache_create("jfs_mp", sizeof(struct metapage),
					   0, 0, init_once);
	if (metapage_cache == NULL)
		return -ENOMEM;

	metapage_mempool = mempool_create_slab_pool(METAPOOL_MIN_PAGES,
						    metapage_cache);

	if (metapage_mempool == NULL) {
		kmem_cache_destroy(metapage_cache);
		return -ENOMEM;
	}

	return 0;
}

/*
 * Tear down what metapage_init() set up.  The mempool goes first because it
 * was created on top of metapage_cache.
 */
void metapage_exit(void)
{
	mempool_destroy(metapage_mempool);
	kmem_cache_destroy(metapage_cache);
}

240 241 242 243 244 245 246 247 248 249
/*
 * Detach @mp from @page and free it, unless it is still in use: a non-zero
 * count or nohomeok, or a set META_dirty / META_io flag, leaves it alone.
 */
static inline void drop_metapage(struct page *page, struct metapage *mp)
{
	/* still referenced, or not yet allowed to go home */
	if (mp->count || mp->nohomeok)
		return;

	/* still dirty, or I/O is in flight */
	if (test_bit(META_dirty, &mp->flag) || test_bit(META_io, &mp->flag))
		return;

	remove_metapage(page, mp);
	INCREMENT(mpStat.pagefree);
	free_metapage(mp);
}

L
Linus Torvalds 已提交
250
/*
 * Metapage address space operations
 */
253 254

/*
 * Map logical block @lblock of @inode to a block number.
 *
 * @len is in/out: on entry the number of blocks wanted.  It is first
 * clamped so the range does not run past the end of the file, and for
 * inodes with a non-zero i_ino it is also handed to xtLookup() as the
 * output length.
 *
 * Returns 0 if @lblock is at or beyond the end of the file, or if
 * xtLookup() fails or reports a zero length.  For an inode whose i_ino is
 * 0 no lookup is done and @lblock is returned unchanged.
 */
static sector_t metapage_get_blocks(struct inode *inode, sector_t lblock,
				    int *len)
{
	int rc = 0;
	int xflag;
	s64 xaddr;
	/* file size in blocks, rounded up */
	sector_t file_blocks = (inode->i_size + inode->i_sb->s_blocksize - 1) >>
			       inode->i_blkbits;

	if (lblock >= file_blocks)
		return 0;
	if (lblock + *len > file_blocks)
		*len = file_blocks - lblock;

	if (inode->i_ino) {
		rc = xtLookup(inode, (s64)lblock, *len, &xflag, &xaddr, len, 0);
		if ((rc == 0) && *len)
			lblock = (sector_t)xaddr;
		else
			lblock = 0;
	} /* else no mapping */

	return lblock;
}

279
/*
 * Completion handler passed to dec_io() on the read side: mark the page
 * uptodate unless an error was flagged on it, then unlock it.
 */
static void last_read_complete(struct page *page)
{
	if (!PageError(page))
		SetPageUptodate(page);
	unlock_page(page);
}

286
static void metapage_read_end_io(struct bio *bio, int err)
287 288 289 290 291 292
{
	struct page *page = bio->bi_private;

	if (!test_bit(BIO_UPTODATE, &bio->bi_flags)) {
		printk(KERN_ERR "metapage_read_end_io: I/O error\n");
		SetPageError(page);
L
Linus Torvalds 已提交
293 294
	}

295 296
	dec_io(page, last_read_complete);
	bio_put(bio);
L
Linus Torvalds 已提交
297 298
}

299
static void remove_from_logsync(struct metapage *mp)
L
Linus Torvalds 已提交
300
{
301 302 303 304 305 306 307 308 309 310 311 312 313 314 315 316 317 318 319
	struct jfs_log *log = mp->log;
	unsigned long flags;
/*
 * This can race.  Recheck that log hasn't been set to null, and after
 * acquiring logsync lock, recheck lsn
 */
	if (!log)
		return;

	LOGSYNC_LOCK(log, flags);
	if (mp->lsn) {
		mp->log = NULL;
		mp->lsn = 0;
		mp->clsn = 0;
		log->count--;
		list_del(&mp->synclist);
	}
	LOGSYNC_UNLOCK(log, flags);
}
L
Linus Torvalds 已提交
320

321 322 323 324 325 326 327 328 329 330 331 332 333 334 335 336 337 338
/*
 * Completion handler passed to dec_io() on the write side.  For every
 * metapage in @page that has META_io set, remove it from the log sync list
 * (if it has an lsn) and clear META_io; then end writeback on the page.
 */
static void last_write_complete(struct page *page)
{
	struct metapage *mp;
	unsigned int offset;

	for (offset = 0; offset < PAGE_CACHE_SIZE; offset += PSIZE) {
		mp = page_to_mp(page, offset);
		if (mp && test_bit(META_io, &mp->flag)) {
			if (mp->lsn)
				remove_from_logsync(mp);
			clear_bit(META_io, &mp->flag);
		}
		/*
		 * I'd like to call drop_metapage here, but I don't think it's
		 * safe unless I have the page locked
		 */
	}
	end_page_writeback(page);
}

341
static void metapage_write_end_io(struct bio *bio, int err)
L
Linus Torvalds 已提交
342
{
343 344 345 346 347 348 349 350 351 352 353 354 355 356 357
	struct page *page = bio->bi_private;

	BUG_ON(!PagePrivate(page));

	if (! test_bit(BIO_UPTODATE, &bio->bi_flags)) {
		printk(KERN_ERR "metapage_write_end_io: I/O error\n");
		SetPageError(page);
	}
	dec_io(page, last_write_complete);
	bio_put(bio);
}

static int metapage_writepage(struct page *page, struct writeback_control *wbc)
{
	struct bio *bio = NULL;
358
	int block_offset;	/* block offset of mp within page */
359
	struct inode *inode = page->mapping->host;
360 361 362
	int blocks_per_mp = JFS_SBI(inode->i_sb)->nbperpage;
	int len;
	int xlen;
363 364 365
	struct metapage *mp;
	int redirty = 0;
	sector_t lblock;
366
	int nr_underway = 0;
367 368 369 370 371
	sector_t pblock;
	sector_t next_block = 0;
	sector_t page_start;
	unsigned long bio_bytes = 0;
	unsigned long bio_offset = 0;
372
	int offset;
373
	int bad_blocks = 0;
374 375 376 377 378

	page_start = (sector_t)page->index <<
		     (PAGE_CACHE_SHIFT - inode->i_blkbits);
	BUG_ON(!PageLocked(page));
	BUG_ON(PageWriteback(page));
379
	set_page_writeback(page);
380 381 382 383 384 385 386 387 388

	for (offset = 0; offset < PAGE_CACHE_SIZE; offset += PSIZE) {
		mp = page_to_mp(page, offset);

		if (!mp || !test_bit(META_dirty, &mp->flag))
			continue;

		if (mp->nohomeok && !test_bit(META_forcewrite, &mp->flag)) {
			redirty = 1;
389 390 391 392 393 394
			/*
			 * Make sure this page isn't blocked indefinitely.
			 * If the journal isn't undergoing I/O, push it
			 */
			if (mp->log && !(mp->log->cflag & logGC_PAGEOUT))
				jfs_flush_journal(mp->log, 0);
395 396 397 398
			continue;
		}

		clear_bit(META_dirty, &mp->flag);
399
		set_bit(META_io, &mp->flag);
400 401 402 403 404 405 406 407 408 409 410 411 412 413 414 415 416 417 418 419 420 421
		block_offset = offset >> inode->i_blkbits;
		lblock = page_start + block_offset;
		if (bio) {
			if (xlen && lblock == next_block) {
				/* Contiguous, in memory & on disk */
				len = min(xlen, blocks_per_mp);
				xlen -= len;
				bio_bytes += len << inode->i_blkbits;
				continue;
			}
			/* Not contiguous */
			if (bio_add_page(bio, page, bio_bytes, bio_offset) <
			    bio_bytes)
				goto add_failed;
			/*
			 * Increment counter before submitting i/o to keep
			 * count from hitting zero before we're through
			 */
			inc_io(page);
			if (!bio->bi_size)
				goto dump_bio;
			submit_bio(WRITE, bio);
422
			nr_underway++;
423
			bio = NULL;
424
		} else
425 426 427 428 429
			inc_io(page);
		xlen = (PAGE_CACHE_SIZE - offset) >> inode->i_blkbits;
		pblock = metapage_get_blocks(inode, lblock, &xlen);
		if (!pblock) {
			printk(KERN_ERR "JFS: metapage_get_blocks failed\n");
430 431 432 433 434
			/*
			 * We already called inc_io(), but can't cancel it
			 * with dec_io() until we're done with the page
			 */
			bad_blocks++;
435 436
			continue;
		}
437
		len = min(xlen, (int)JFS_SBI(inode->i_sb)->nbperpage);
438 439 440 441 442 443 444 445 446 447 448 449 450 451 452 453 454 455 456

		bio = bio_alloc(GFP_NOFS, 1);
		bio->bi_bdev = inode->i_sb->s_bdev;
		bio->bi_sector = pblock << (inode->i_blkbits - 9);
		bio->bi_end_io = metapage_write_end_io;
		bio->bi_private = page;

		/* Don't call bio_add_page yet, we may add to this vec */
		bio_offset = offset;
		bio_bytes = len << inode->i_blkbits;

		xlen -= len;
		next_block = lblock + len;
	}
	if (bio) {
		if (bio_add_page(bio, page, bio_bytes, bio_offset) < bio_bytes)
				goto add_failed;
		if (!bio->bi_size)
			goto dump_bio;
D
Dave Kleikamp 已提交
457

458
		submit_bio(WRITE, bio);
459
		nr_underway++;
460 461 462 463 464 465
	}
	if (redirty)
		redirty_page_for_writepage(wbc, page);

	unlock_page(page);

466 467 468
	if (bad_blocks)
		goto err_out;

469 470 471
	if (nr_underway == 0)
		end_page_writeback(page);

472 473 474 475 476 477
	return 0;
add_failed:
	/* We should never reach here, since we're only adding one vec */
	printk(KERN_ERR "JFS: bio_add_page failed unexpectedly\n");
	goto skip;
dump_bio:
478 479
	print_hex_dump(KERN_ERR, "JFS: dump of bio: ", DUMP_PREFIX_ADDRESS, 16,
		       4, bio, sizeof(*bio), 0);
480 481 482 483
skip:
	bio_put(bio);
	unlock_page(page);
	dec_io(page, last_write_complete);
484 485 486
err_out:
	while (bad_blocks--)
		dec_io(page, last_write_complete);
487 488 489 490 491 492 493
	return -EIO;
}

static int metapage_readpage(struct file *fp, struct page *page)
{
	struct inode *inode = page->mapping->host;
	struct bio *bio = NULL;
494 495
	int block_offset;
	int blocks_per_page = PAGE_CACHE_SIZE >> inode->i_blkbits;
496 497
	sector_t page_start;	/* address of page in fs blocks */
	sector_t pblock;
498
	int xlen;
499
	unsigned int len;
500
	int offset;
501 502 503 504 505 506 507 508 509 510 511 512 513 514 515 516 517 518 519 520 521 522 523 524 525 526 527 528 529

	BUG_ON(!PageLocked(page));
	page_start = (sector_t)page->index <<
		     (PAGE_CACHE_SHIFT - inode->i_blkbits);

	block_offset = 0;
	while (block_offset < blocks_per_page) {
		xlen = blocks_per_page - block_offset;
		pblock = metapage_get_blocks(inode, page_start + block_offset,
					     &xlen);
		if (pblock) {
			if (!PagePrivate(page))
				insert_metapage(page, NULL);
			inc_io(page);
			if (bio)
				submit_bio(READ, bio);

			bio = bio_alloc(GFP_NOFS, 1);
			bio->bi_bdev = inode->i_sb->s_bdev;
			bio->bi_sector = pblock << (inode->i_blkbits - 9);
			bio->bi_end_io = metapage_read_end_io;
			bio->bi_private = page;
			len = xlen << inode->i_blkbits;
			offset = block_offset << inode->i_blkbits;
			if (bio_add_page(bio, page, len, offset) < len)
				goto add_failed;
			block_offset += xlen;
		} else
			block_offset++;
L
Linus Torvalds 已提交
530
	}
531 532 533 534 535 536
	if (bio)
		submit_bio(READ, bio);
	else
		unlock_page(page);

	return 0;
L
Linus Torvalds 已提交
537

538 539 540 541 542
add_failed:
	printk(KERN_ERR "JFS: bio_add_page failed unexpectedly\n");
	bio_put(bio);
	dec_io(page, last_read_complete);
	return -EIO;
L
Linus Torvalds 已提交
543 544
}

A
Al Viro 已提交
545
/*
 * ->releasepage for the metapage address space.
 *
 * Frees every metapage in @page that is idle (zero count, nohomeok clear,
 * not META_dirty), removing it from the log sync list first if it has an
 * lsn.  @gfp_mask is unused.
 *
 * Returns 1 if no busy metapage was found, 0 if at least one metapage had
 * to be left in place.
 */
static int metapage_releasepage(struct page *page, gfp_t gfp_mask)
{
	struct metapage *mp;
	int ret = 1;
	int offset;

	for (offset = 0; offset < PAGE_CACHE_SIZE; offset += PSIZE) {
		mp = page_to_mp(page, offset);

		if (!mp)
			continue;

		jfs_info("metapage_releasepage: mp = 0x%p", mp);
		if (mp->count || mp->nohomeok ||
		    test_bit(META_dirty, &mp->flag)) {
			jfs_info("count = %ld, nohomeok = %d", mp->count,
				 mp->nohomeok);
			ret = 0;
			continue;
		}
		if (mp->lsn)
			remove_from_logsync(mp);
		remove_metapage(page, mp);
		INCREMENT(mpStat.pagefree);
		free_metapage(mp);
	}
	return ret;
}

574
/*
 * ->invalidatepage for the metapage address space.  Only whole-page
 * invalidation is supported (@offset must be 0) and the page must not be
 * under writeback.  The work is delegated to metapage_releasepage(), whose
 * result is ignored.
 */
static void metapage_invalidatepage(struct page *page, unsigned long offset)
{
	BUG_ON(offset);

	BUG_ON(PageWriteback(page));

	metapage_releasepage(page, 0);
}

583
const struct address_space_operations jfs_metapage_aops = {
584 585 586 587 588 589 590
	.readpage	= metapage_readpage,
	.writepage	= metapage_writepage,
	.releasepage	= metapage_releasepage,
	.invalidatepage	= metapage_invalidatepage,
	.set_page_dirty	= __set_page_dirty_nobuffers,
};

L
Linus Torvalds 已提交
591 592 593 594 595 596 597
struct metapage *__get_metapage(struct inode *inode, unsigned long lblock,
				unsigned int size, int absolute,
				unsigned long new)
{
	int l2BlocksPerPage;
	int l2bsize;
	struct address_space *mapping;
598 599
	struct metapage *mp = NULL;
	struct page *page;
L
Linus Torvalds 已提交
600 601 602
	unsigned long page_index;
	unsigned long page_offset;

603 604 605 606 607 608 609 610 611 612 613 614 615
	jfs_info("__get_metapage: ino = %ld, lblock = 0x%lx, abs=%d",
		 inode->i_ino, lblock, absolute);

	l2bsize = inode->i_blkbits;
	l2BlocksPerPage = PAGE_CACHE_SHIFT - l2bsize;
	page_index = lblock >> l2BlocksPerPage;
	page_offset = (lblock - (page_index << l2BlocksPerPage)) << l2bsize;
	if ((page_offset + size) > PAGE_CACHE_SIZE) {
		jfs_err("MetaData crosses page boundary!!");
		jfs_err("lblock = %lx, size  = %d", lblock, size);
		dump_stack();
		return NULL;
	}
L
Linus Torvalds 已提交
616
	if (absolute)
617
		mapping = JFS_SBI(inode->i_sb)->direct_inode->i_mapping;
L
Linus Torvalds 已提交
618 619 620 621 622 623 624 625 626 627 628
	else {
		/*
		 * If an nfs client tries to read an inode that is larger
		 * than any existing inodes, we may try to read past the
		 * end of the inode map
		 */
		if ((lblock << inode->i_blkbits) >= inode->i_size)
			return NULL;
		mapping = inode->i_mapping;
	}

629 630 631 632 633 634 635 636
	if (new && (PSIZE == PAGE_CACHE_SIZE)) {
		page = grab_cache_page(mapping, page_index);
		if (!page) {
			jfs_err("grab_cache_page failed!");
			return NULL;
		}
		SetPageUptodate(page);
	} else {
637
		page = read_mapping_page(mapping, page_index, NULL);
D
Dave Kleikamp 已提交
638
		if (IS_ERR(page) || !PageUptodate(page)) {
639
			jfs_err("read_mapping_page failed!");
640 641 642 643 644 645
			return NULL;
		}
		lock_page(page);
	}

	mp = page_to_mp(page, page_offset);
L
Linus Torvalds 已提交
646
	if (mp) {
647 648 649 650 651 652
		if (mp->logical_size != size) {
			jfs_error(inode->i_sb,
				  "__get_metapage: mp->logical_size != size");
			jfs_err("logical_size = %d, size = %d",
				mp->logical_size, size);
			dump_stack();
D
Dave Kleikamp 已提交
653
			goto unlock;
L
Linus Torvalds 已提交
654 655 656 657 658 659 660 661
		}
		mp->count++;
		lock_metapage(mp);
		if (test_bit(META_discard, &mp->flag)) {
			if (!new) {
				jfs_error(inode->i_sb,
					  "__get_metapage: using a "
					  "discarded metapage");
662
				discard_metapage(mp);
D
Dave Kleikamp 已提交
663
				goto unlock;
L
Linus Torvalds 已提交
664 665 666 667
			}
			clear_bit(META_discard, &mp->flag);
		}
	} else {
668 669 670
		INCREMENT(mpStat.pagealloc);
		mp = alloc_metapage(GFP_NOFS);
		mp->page = page;
L
Linus Torvalds 已提交
671 672 673
		mp->flag = 0;
		mp->xflag = COMMIT_PAGE;
		mp->count = 1;
674
		mp->nohomeok = 0;
L
Linus Torvalds 已提交
675
		mp->logical_size = size;
676 677 678 679 680
		mp->data = page_address(page) + page_offset;
		mp->index = lblock;
		if (unlikely(insert_metapage(page, mp))) {
			free_metapage(mp);
			goto unlock;
L
Linus Torvalds 已提交
681
		}
682
		lock_metapage(mp);
L
Linus Torvalds 已提交
683 684
	}

685 686
	if (new) {
		jfs_info("zeroing mp = 0x%p", mp);
L
Linus Torvalds 已提交
687
		memset(mp->data, 0, PSIZE);
688
	}
L
Linus Torvalds 已提交
689

690 691
	unlock_page(page);
	jfs_info("__get_metapage: returning = 0x%p data = 0x%p", mp, mp->data);
L
Linus Torvalds 已提交
692 693
	return mp;

694 695
unlock:
	unlock_page(page);
L
Linus Torvalds 已提交
696 697 698
	return NULL;
}

699
void grab_metapage(struct metapage * mp)
L
Linus Torvalds 已提交
700
{
701 702 703
	jfs_info("grab_metapage: mp = 0x%p", mp);
	page_cache_get(mp->page);
	lock_page(mp->page);
L
Linus Torvalds 已提交
704
	mp->count++;
705 706
	lock_metapage(mp);
	unlock_page(mp->page);
L
Linus Torvalds 已提交
707 708
}

709
void force_metapage(struct metapage *mp)
L
Linus Torvalds 已提交
710
{
711 712 713 714 715 716 717 718 719 720 721
	struct page *page = mp->page;
	jfs_info("force_metapage: mp = 0x%p", mp);
	set_bit(META_forcewrite, &mp->flag);
	clear_bit(META_sync, &mp->flag);
	page_cache_get(page);
	lock_page(page);
	set_page_dirty(page);
	write_one_page(page, 1);
	clear_bit(META_forcewrite, &mp->flag);
	page_cache_release(page);
}
L
Linus Torvalds 已提交
722

723
void hold_metapage(struct metapage *mp)
724
{
L
Linus Torvalds 已提交
725
	lock_page(mp->page);
726 727
}

728
void put_metapage(struct metapage *mp)
729 730 731
{
	if (mp->count || mp->nohomeok) {
		/* Someone else will release this */
L
Linus Torvalds 已提交
732 733 734
		unlock_page(mp->page);
		return;
	}
735 736 737
	page_cache_get(mp->page);
	mp->count++;
	lock_metapage(mp);
L
Linus Torvalds 已提交
738
	unlock_page(mp->page);
739
	release_metapage(mp);
L
Linus Torvalds 已提交
740 741 742 743
}

void release_metapage(struct metapage * mp)
{
744
	struct page *page = mp->page;
L
Linus Torvalds 已提交
745 746
	jfs_info("release_metapage: mp = 0x%p, flag = 0x%lx", mp, mp->flag);

747 748 749 750
	BUG_ON(!page);

	lock_page(page);
	unlock_metapage(mp);
L
Linus Torvalds 已提交
751 752

	assert(mp->count);
753 754 755
	if (--mp->count || mp->nohomeok) {
		unlock_page(page);
		page_cache_release(page);
L
Linus Torvalds 已提交
756 757 758
		return;
	}

759 760
	if (test_bit(META_dirty, &mp->flag)) {
		set_page_dirty(page);
L
Linus Torvalds 已提交
761 762
		if (test_bit(META_sync, &mp->flag)) {
			clear_bit(META_sync, &mp->flag);
763 764
			write_one_page(page, 1);
			lock_page(page); /* write_one_page unlocks the page */
L
Linus Torvalds 已提交
765
		}
766 767
	} else if (mp->lsn)	/* discard_metapage doesn't remove it */
		remove_from_logsync(mp);
L
Linus Torvalds 已提交
768

769 770
	/* Try to keep metapages from using up too much memory */
	drop_metapage(page, mp);
771

772 773
	unlock_page(page);
	page_cache_release(page);
L
Linus Torvalds 已提交
774 775 776 777
}

/*
 * Mark every cached metapage whose index lies in [@addr, @addr + @len) as
 * discarded: META_dirty is cleared, META_discard is set and the metapage is
 * taken off the log sync list.  Pages that are not in the page cache are
 * skipped.  Only the direct_inode mapping of @ip's superblock is searched.
 */
void __invalidate_metapages(struct inode *ip, s64 addr, int len)
{
	sector_t lblock;
	int l2BlocksPerPage = PAGE_CACHE_SHIFT - ip->i_blkbits;
	int BlocksPerPage = 1 << l2BlocksPerPage;
	/* All callers are interested in block device's mapping */
	struct address_space *mapping =
		JFS_SBI(ip->i_sb)->direct_inode->i_mapping;
	struct metapage *mp;
	struct page *page;
	unsigned int offset;

	/*
	 * Mark metapages to discard.  They will eventually be
	 * released, but should not be written.
	 */
	/* start at the first block of the page that contains addr */
	for (lblock = addr & ~(BlocksPerPage - 1); lblock < addr + len;
	     lblock += BlocksPerPage) {
		page = find_lock_page(mapping, lblock >> l2BlocksPerPage);
		if (!page)
			continue;
		for (offset = 0; offset < PAGE_CACHE_SIZE; offset += PSIZE) {
			mp = page_to_mp(page, offset);
			if (!mp)
				continue;
			if (mp->index < addr)
				continue;
			if (mp->index >= addr + len)
				break;

			clear_bit(META_dirty, &mp->flag);
			set_bit(META_discard, &mp->flag);
			if (mp->lsn)
				remove_from_logsync(mp);
		}
		unlock_page(page);
		page_cache_release(page);
	}
}

#ifdef CONFIG_JFS_STATISTICS
A
Alexey Dobriyan 已提交
817
static int jfs_mpstat_proc_show(struct seq_file *m, void *v)
L
Linus Torvalds 已提交
818
{
A
Alexey Dobriyan 已提交
819
	seq_printf(m,
L
Linus Torvalds 已提交
820 821 822 823 824 825 826 827
		       "JFS Metapage statistics\n"
		       "=======================\n"
		       "page allocations = %d\n"
		       "page frees = %d\n"
		       "lock waits = %d\n",
		       mpStat.pagealloc,
		       mpStat.pagefree,
		       mpStat.lockwait);
A
Alexey Dobriyan 已提交
828 829
	return 0;
}
L
Linus Torvalds 已提交
830

A
Alexey Dobriyan 已提交
831 832 833
/* open callback: bind jfs_mpstat_proc_show() to @file via single_open(). */
static int jfs_mpstat_proc_open(struct inode *inode, struct file *file)
{
	return single_open(file, jfs_mpstat_proc_show, NULL);
}
A
Alexey Dobriyan 已提交
835 836 837 838 839 840 841 842

/* File operations for the metapage statistics file (seq_file single_open style) */
const struct file_operations jfs_mpstat_proc_fops = {
	.owner		= THIS_MODULE,
	.open		= jfs_mpstat_proc_open,
	.read		= seq_read,
	.llseek		= seq_lseek,
	.release	= single_release,
};
L
Linus Torvalds 已提交
843
#endif