// SPDX-License-Identifier: GPL-2.0
/*
 * Copyright (c) 2014 Red Hat, Inc.
 * All Rights Reserved.
 */
#include "xfs.h"
#include "xfs_fs.h"
#include "xfs_shared.h"
#include "xfs_format.h"
#include "xfs_log_format.h"
#include "xfs_trans_resv.h"
#include "xfs_mount.h"
#include "xfs_trans.h"
#include "xfs_alloc.h"
#include "xfs_btree.h"
#include "xfs_btree_staging.h"
#include "xfs_rmap.h"
#include "xfs_rmap_btree.h"
#include "xfs_trace.h"
#include "xfs_error.h"
#include "xfs_extent_busy.h"
#include "xfs_ag.h"
#include "xfs_ag_resv.h"
/*
 * Reverse map btree.
 *
 * This is a per-ag tree used to track the owner(s) of a given extent. With
 * reflink it is possible for there to be multiple owners, which is a departure
 * from classic XFS. Owner records for data extents are inserted when the
 * extent is mapped and removed when an extent is unmapped.  Owner records for
 * all other block types (i.e. metadata) are inserted when an extent is
 * allocated and removed when an extent is freed. There can only be one owner
 * of a metadata extent, usually an inode or some other metadata structure like
 * an AG btree.
 *
 * The rmap btree is part of the free space management, so blocks for the tree
 * are sourced from the agfl. Hence we need transaction reservation support for
 * this tree so that the freelist is always large enough. This also impacts on
 * the minimum space we need to leave free in the AG.
 *
 * The tree is ordered by [ag block, owner, offset]. This is a large key size,
 * but it is the only way to enforce unique keys when a block can be owned by
 * multiple files at any offset. There's no need to order/search by extent
 * size for online updating/management of the tree. It is intended that most
 * reverse lookups will be to find the owner(s) of a particular block, or to
 * try to recover tree and file data from corrupt primary metadata.
 */

/*
 * Duplicate a cursor: build a fresh rmapbt cursor that uses the same mount,
 * transaction, AGF buffer and AG number as @cur.
 */
static struct xfs_btree_cur *
xfs_rmapbt_dup_cursor(
	struct xfs_btree_cur	*cur)
{
	return xfs_rmapbt_init_cursor(cur->bc_mp, cur->bc_tp,
			cur->bc_ag.agbp, cur->bc_ag.agno);
}

STATIC void
xfs_rmapbt_set_root(
	struct xfs_btree_cur	*cur,
	union xfs_btree_ptr	*ptr,
	int			inc)
{
64
	struct xfs_buf		*agbp = cur->bc_ag.agbp;
C
Christoph Hellwig 已提交
65
	struct xfs_agf		*agf = agbp->b_addr;
D
Darrick J. Wong 已提交
66
	int			btnum = cur->bc_btnum;
67
	struct xfs_perag	*pag = agbp->b_pag;
D
Darrick J. Wong 已提交
68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84

	ASSERT(ptr->s != 0);

	agf->agf_roots[btnum] = ptr->s;
	be32_add_cpu(&agf->agf_levels[btnum], inc);
	pag->pagf_levels[btnum] += inc;

	xfs_alloc_log_agf(cur->bc_tp, agbp, XFS_AGF_ROOTS | XFS_AGF_LEVELS);
}

STATIC int
xfs_rmapbt_alloc_block(
	struct xfs_btree_cur	*cur,
	union xfs_btree_ptr	*start,
	union xfs_btree_ptr	*new,
	int			*stat)
{
85
	struct xfs_buf		*agbp = cur->bc_ag.agbp;
C
Christoph Hellwig 已提交
86
	struct xfs_agf		*agf = agbp->b_addr;
D
Darrick J. Wong 已提交
87 88 89 90
	int			error;
	xfs_agblock_t		bno;

	/* Allocate the new block from the freelist. If we can't, give up.  */
91
	error = xfs_alloc_get_freelist(cur->bc_tp, cur->bc_ag.agbp,
D
Darrick J. Wong 已提交
92
				       &bno, 1);
C
Carlos Maiolino 已提交
93
	if (error)
D
Darrick J. Wong 已提交
94 95
		return error;

96
	trace_xfs_rmapbt_alloc_block(cur->bc_mp, cur->bc_ag.agno,
D
Darrick J. Wong 已提交
97 98 99 100 101 102
			bno, 1);
	if (bno == NULLAGBLOCK) {
		*stat = 0;
		return 0;
	}

103
	xfs_extent_busy_reuse(cur->bc_mp, cur->bc_ag.agno, bno, 1,
D
Darrick J. Wong 已提交
104 105 106
			false);

	new->s = cpu_to_be32(bno);
107 108
	be32_add_cpu(&agf->agf_rmap_blocks, 1);
	xfs_alloc_log_agf(cur->bc_tp, agbp, XFS_AGF_RMAP_BLOCKS);
D
Darrick J. Wong 已提交
109

110
	xfs_ag_resv_rmapbt_alloc(cur->bc_mp, cur->bc_ag.agno);
111

D
Darrick J. Wong 已提交
112 113 114 115 116 117 118 119 120
	*stat = 1;
	return 0;
}

STATIC int
xfs_rmapbt_free_block(
	struct xfs_btree_cur	*cur,
	struct xfs_buf		*bp)
{
121
	struct xfs_buf		*agbp = cur->bc_ag.agbp;
C
Christoph Hellwig 已提交
122
	struct xfs_agf		*agf = agbp->b_addr;
123
	struct xfs_perag	*pag;
D
Darrick J. Wong 已提交
124 125 126 127
	xfs_agblock_t		bno;
	int			error;

	bno = xfs_daddr_to_agbno(cur->bc_mp, XFS_BUF_ADDR(bp));
128
	trace_xfs_rmapbt_free_block(cur->bc_mp, cur->bc_ag.agno,
D
Darrick J. Wong 已提交
129
			bno, 1);
130 131
	be32_add_cpu(&agf->agf_rmap_blocks, -1);
	xfs_alloc_log_agf(cur->bc_tp, agbp, XFS_AGF_RMAP_BLOCKS);
D
Darrick J. Wong 已提交
132 133 134 135 136 137 138
	error = xfs_alloc_put_freelist(cur->bc_tp, agbp, NULL, bno, 1);
	if (error)
		return error;

	xfs_extent_busy_insert(cur->bc_tp, be32_to_cpu(agf->agf_seqno), bno, 1,
			      XFS_EXTENT_BUSY_SKIP_DISCARD);

139 140
	pag = cur->bc_ag.agbp->b_pag;
	xfs_ag_resv_free_extent(pag, XFS_AG_RESV_RMAPBT, NULL, 1);
D
Darrick J. Wong 已提交
141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169
	return 0;
}

/*
 * Look up the minimum number of records for a block at @level.  The mount
 * keeps two values: index 0 is used for level 0, index 1 for every other
 * level.
 */
STATIC int
xfs_rmapbt_get_minrecs(
	struct xfs_btree_cur	*cur,
	int			level)
{
	int			idx = (level != 0);

	return cur->bc_mp->m_rmap_mnr[idx];
}

/*
 * Look up the maximum number of records for a block at @level.  The mount
 * keeps two values: index 0 is used for level 0, index 1 for every other
 * level.
 */
STATIC int
xfs_rmapbt_get_maxrecs(
	struct xfs_btree_cur	*cur,
	int			level)
{
	int			idx = (level != 0);

	return cur->bc_mp->m_rmap_mxr[idx];
}

STATIC void
xfs_rmapbt_init_key_from_rec(
	union xfs_btree_key	*key,
	union xfs_btree_rec	*rec)
{
	key->rmap.rm_startblock = rec->rmap.rm_startblock;
	key->rmap.rm_owner = rec->rmap.rm_owner;
	key->rmap.rm_offset = rec->rmap.rm_offset;
}

/*
 * The high key for a reverse mapping record can be computed by shifting
 * the startblock and offset to the highest value that would still map
 * to that record.  In practice this means that we add blockcount-1 to
 * the startblock for all records, and if the record is for a data/attr
 * fork mapping, we add blockcount-1 to the offset too.
 */
STATIC void
xfs_rmapbt_init_high_key_from_rec(
	union xfs_btree_key	*key,
	union xfs_btree_rec	*rec)
{
182
	uint64_t		off;
183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198
	int			adj;

	adj = be32_to_cpu(rec->rmap.rm_blockcount) - 1;

	key->rmap.rm_startblock = rec->rmap.rm_startblock;
	be32_add_cpu(&key->rmap.rm_startblock, adj);
	key->rmap.rm_owner = rec->rmap.rm_owner;
	key->rmap.rm_offset = rec->rmap.rm_offset;
	if (XFS_RMAP_NON_INODE_OWNER(be64_to_cpu(rec->rmap.rm_owner)) ||
	    XFS_RMAP_IS_BMBT_BLOCK(be64_to_cpu(rec->rmap.rm_offset)))
		return;
	off = be64_to_cpu(key->rmap.rm_offset);
	off = (XFS_RMAP_OFF(off) + adj) | (off & ~XFS_RMAP_OFF_MASK);
	key->rmap.rm_offset = cpu_to_be64(off);
}

STATIC void
xfs_rmapbt_init_rec_from_cur(
	struct xfs_btree_cur	*cur,
	union xfs_btree_rec	*rec)
{
	rec->rmap.rm_startblock = cpu_to_be32(cur->bc_rec.r.rm_startblock);
	rec->rmap.rm_blockcount = cpu_to_be32(cur->bc_rec.r.rm_blockcount);
	rec->rmap.rm_owner = cpu_to_be64(cur->bc_rec.r.rm_owner);
	rec->rmap.rm_offset = cpu_to_be64(
			xfs_rmap_irec_offset_pack(&cur->bc_rec.r));
}

STATIC void
xfs_rmapbt_init_ptr_from_cur(
	struct xfs_btree_cur	*cur,
	union xfs_btree_ptr	*ptr)
{
216
	struct xfs_agf		*agf = cur->bc_ag.agbp->b_addr;
D
Darrick J. Wong 已提交
217

218
	ASSERT(cur->bc_ag.agno == be32_to_cpu(agf->agf_seqno));
D
Darrick J. Wong 已提交
219 220 221 222

	ptr->s = agf->agf_roots[cur->bc_btnum];
}

STATIC int64_t
D
Darrick J. Wong 已提交
224 225 226 227 228 229 230
xfs_rmapbt_key_diff(
	struct xfs_btree_cur	*cur,
	union xfs_btree_key	*key)
{
	struct xfs_rmap_irec	*rec = &cur->bc_rec.r;
	struct xfs_rmap_key	*kp = &key->rmap;
	__u64			x, y;
231
	int64_t			d;
D
Darrick J. Wong 已提交
232

233
	d = (int64_t)be32_to_cpu(kp->rm_startblock) - rec->rm_startblock;
D
Darrick J. Wong 已提交
234 235 236 237 238 239 240 241 242 243
	if (d)
		return d;

	x = be64_to_cpu(kp->rm_owner);
	y = rec->rm_owner;
	if (x > y)
		return 1;
	else if (y > x)
		return -1;

244 245
	x = XFS_RMAP_OFF(be64_to_cpu(kp->rm_offset));
	y = rec->rm_offset;
D
Darrick J. Wong 已提交
246 247 248 249 250 251 252
	if (x > y)
		return 1;
	else if (y > x)
		return -1;
	return 0;
}

STATIC int64_t
254 255 256 257 258 259 260
xfs_rmapbt_diff_two_keys(
	struct xfs_btree_cur	*cur,
	union xfs_btree_key	*k1,
	union xfs_btree_key	*k2)
{
	struct xfs_rmap_key	*kp1 = &k1->rmap;
	struct xfs_rmap_key	*kp2 = &k2->rmap;
261
	int64_t			d;
262 263
	__u64			x, y;

264
	d = (int64_t)be32_to_cpu(kp1->rm_startblock) -
265 266 267 268 269 270 271 272 273 274 275
		       be32_to_cpu(kp2->rm_startblock);
	if (d)
		return d;

	x = be64_to_cpu(kp1->rm_owner);
	y = be64_to_cpu(kp2->rm_owner);
	if (x > y)
		return 1;
	else if (y > x)
		return -1;

276 277
	x = XFS_RMAP_OFF(be64_to_cpu(kp1->rm_offset));
	y = XFS_RMAP_OFF(be64_to_cpu(kp2->rm_offset));
278 279 280 281 282 283 284
	if (x > y)
		return 1;
	else if (y > x)
		return -1;
	return 0;
}

static xfs_failaddr_t
286 287 288
xfs_rmapbt_verify(
	struct xfs_buf		*bp)
{
289
	struct xfs_mount	*mp = bp->b_mount;
290 291
	struct xfs_btree_block	*block = XFS_BUF_TO_BLOCK(bp);
	struct xfs_perag	*pag = bp->b_pag;
292
	xfs_failaddr_t		fa;
293 294 295 296 297 298 299 300 301 302 303 304 305 306
	unsigned int		level;

	/*
	 * magic number and level verification
	 *
	 * During growfs operations, we can't verify the exact level or owner as
	 * the perag is not fully initialised and hence not attached to the
	 * buffer.  In this case, check against the maximum tree depth.
	 *
	 * Similarly, during log recovery we will have a perag structure
	 * attached, but the agf information will not yet have been initialised
	 * from the on disk AGF. Again, we can only check against maximum limits
	 * in this case.
	 */
307
	if (!xfs_verify_magic(bp, block->bb_magic))
308
		return __this_address;
309 310

	if (!xfs_sb_version_hasrmapbt(&mp->m_sb))
311 312 313 314
		return __this_address;
	fa = xfs_btree_sblock_v5hdr_verify(bp);
	if (fa)
		return fa;
315 316 317 318

	level = be16_to_cpu(block->bb_level);
	if (pag && pag->pagf_init) {
		if (level >= pag->pagf_levels[XFS_BTNUM_RMAPi])
319
			return __this_address;
320
	} else if (level >= mp->m_rmap_maxlevels)
321
		return __this_address;
322 323 324 325 326 327 328 329

	return xfs_btree_sblock_verify(bp, mp->m_rmap_mxr[level != 0]);
}

static void
xfs_rmapbt_read_verify(
	struct xfs_buf	*bp)
{
330 331
	xfs_failaddr_t	fa;

332
	if (!xfs_btree_sblock_verify_crc(bp))
333 334 335 336 337 338
		xfs_verifier_error(bp, -EFSBADCRC, __this_address);
	else {
		fa = xfs_rmapbt_verify(bp);
		if (fa)
			xfs_verifier_error(bp, -EFSCORRUPTED, fa);
	}
339

340
	if (bp->b_error)
341 342 343 344 345 346 347
		trace_xfs_btree_corrupt(bp, _RET_IP_);
}

static void
xfs_rmapbt_write_verify(
	struct xfs_buf	*bp)
{
348 349 350 351
	xfs_failaddr_t	fa;

	fa = xfs_rmapbt_verify(bp);
	if (fa) {
352
		trace_xfs_btree_corrupt(bp, _RET_IP_);
353
		xfs_verifier_error(bp, -EFSCORRUPTED, fa);
354 355 356 357 358 359 360 361
		return;
	}
	xfs_btree_sblock_calc_crc(bp);

}

const struct xfs_buf_ops xfs_rmapbt_buf_ops = {
	.name			= "xfs_rmapbt",
362
	.magic			= { 0, cpu_to_be32(XFS_RMAP_CRC_MAGIC) },
363 364
	.verify_read		= xfs_rmapbt_read_verify,
	.verify_write		= xfs_rmapbt_write_verify,
365
	.verify_struct		= xfs_rmapbt_verify,
366 367
};

/*
 * Return 1 if @k1 sorts at or before @k2, 0 otherwise.  Keys are ordered by
 * startblock, then owner, then the offset portion of the offset field;
 * fully equal keys count as in order.
 */
STATIC int
xfs_rmapbt_keys_inorder(
	struct xfs_btree_cur	*cur,
	union xfs_btree_key	*k1,
	union xfs_btree_key	*k2)
{
	uint32_t		x;
	uint32_t		y;
	uint64_t		a;
	uint64_t		b;

	x = be32_to_cpu(k1->rmap.rm_startblock);
	y = be32_to_cpu(k2->rmap.rm_startblock);
	if (x < y)
		return 1;
	else if (x > y)
		return 0;
	a = be64_to_cpu(k1->rmap.rm_owner);
	b = be64_to_cpu(k2->rmap.rm_owner);
	if (a < b)
		return 1;
	else if (a > b)
		return 0;
	a = XFS_RMAP_OFF(be64_to_cpu(k1->rmap.rm_offset));
	b = XFS_RMAP_OFF(be64_to_cpu(k2->rmap.rm_offset));
	if (a <= b)
		return 1;
	return 0;
}

/*
 * Return 1 if @r1 sorts at or before @r2, 0 otherwise.  Records are ordered
 * by startblock, then owner, then the offset portion of the offset field;
 * records equal in all three count as in order.
 */
STATIC int
xfs_rmapbt_recs_inorder(
	struct xfs_btree_cur	*cur,
	union xfs_btree_rec	*r1,
	union xfs_btree_rec	*r2)
{
	uint32_t		x;
	uint32_t		y;
	uint64_t		a;
	uint64_t		b;

	x = be32_to_cpu(r1->rmap.rm_startblock);
	y = be32_to_cpu(r2->rmap.rm_startblock);
	if (x < y)
		return 1;
	else if (x > y)
		return 0;
	a = be64_to_cpu(r1->rmap.rm_owner);
	b = be64_to_cpu(r2->rmap.rm_owner);
	if (a < b)
		return 1;
	else if (a > b)
		return 0;
	a = XFS_RMAP_OFF(be64_to_cpu(r1->rmap.rm_offset));
	b = XFS_RMAP_OFF(be64_to_cpu(r2->rmap.rm_offset));
	if (a <= b)
		return 1;
	return 0;
}

static const struct xfs_btree_ops xfs_rmapbt_ops = {
	.rec_len		= sizeof(struct xfs_rmap_rec),
	.key_len		= 2 * sizeof(struct xfs_rmap_key),

	.dup_cursor		= xfs_rmapbt_dup_cursor,
D
Darrick J. Wong 已提交
433 434 435 436 437 438
	.set_root		= xfs_rmapbt_set_root,
	.alloc_block		= xfs_rmapbt_alloc_block,
	.free_block		= xfs_rmapbt_free_block,
	.get_minrecs		= xfs_rmapbt_get_minrecs,
	.get_maxrecs		= xfs_rmapbt_get_maxrecs,
	.init_key_from_rec	= xfs_rmapbt_init_key_from_rec,
439
	.init_high_key_from_rec	= xfs_rmapbt_init_high_key_from_rec,
D
Darrick J. Wong 已提交
440 441 442
	.init_rec_from_cur	= xfs_rmapbt_init_rec_from_cur,
	.init_ptr_from_cur	= xfs_rmapbt_init_ptr_from_cur,
	.key_diff		= xfs_rmapbt_key_diff,
443
	.buf_ops		= &xfs_rmapbt_buf_ops,
444
	.diff_two_keys		= xfs_rmapbt_diff_two_keys,
D
Darrick J. Wong 已提交
445 446
	.keys_inorder		= xfs_rmapbt_keys_inorder,
	.recs_inorder		= xfs_rmapbt_recs_inorder,
447 448
};

/*
 * Allocate a zeroed btree cursor and fill in the fields shared by regular
 * and staging rmapbt cursors.  The allocation uses __GFP_NOFAIL, so the
 * result is used without a NULL check.  The caller still has to set up the
 * root (AGF buffer or fake root).
 */
static struct xfs_btree_cur *
xfs_rmapbt_init_common(
	struct xfs_mount	*mp,
	struct xfs_trans	*tp,
	xfs_agnumber_t		agno)
{
	struct xfs_btree_cur	*cur;

	cur = kmem_cache_zalloc(xfs_btree_cur_zone, GFP_NOFS | __GFP_NOFAIL);
	cur->bc_tp = tp;
	cur->bc_mp = mp;
	cur->bc_btnum = XFS_BTNUM_RMAP;
	/* Overlapping btree; 2 keys per pointer. */
	cur->bc_flags = XFS_BTREE_CRC_BLOCKS | XFS_BTREE_OVERLAPPING;
	cur->bc_blocklog = mp->m_sb.sb_blocklog;
	cur->bc_statoff = XFS_STATS_CALC_INDEX(xs_rmap_2);
	cur->bc_ag.agno = agno;
	cur->bc_ops = &xfs_rmapbt_ops;

	return cur;
}

/*
 * Create a new reverse mapping btree cursor.
 *
 * The tree height is read from the AGF held in @agbp, and @agbp is attached
 * to the cursor.
 */
struct xfs_btree_cur *
xfs_rmapbt_init_cursor(
	struct xfs_mount	*mp,
	struct xfs_trans	*tp,
	struct xfs_buf		*agbp,
	xfs_agnumber_t		agno)
{
	struct xfs_agf		*agf = agbp->b_addr;
	struct xfs_btree_cur	*cur;

	cur = xfs_rmapbt_init_common(mp, tp, agno);
	cur->bc_nlevels = be32_to_cpu(agf->agf_levels[XFS_BTNUM_RMAP]);
	cur->bc_ag.agbp = agbp;
	return cur;
}

/*
 * Create a new reverse mapping btree cursor with a fake root for staging.
 * The cursor is created without a transaction.
 */
struct xfs_btree_cur *
xfs_rmapbt_stage_cursor(
	struct xfs_mount	*mp,
	struct xbtree_afakeroot	*afake,
	xfs_agnumber_t		agno)
{
	struct xfs_btree_cur	*cur;

	cur = xfs_rmapbt_init_common(mp, NULL, agno);
	xfs_btree_stage_afakeroot(cur, afake);
	return cur;
}

/*
 * Switch the AGF over to a staged reverse mapping btree: copy the root,
 * height and block count from the cursor's fake root into the AGF, log those
 * fields in @tp, then commit the fake root so the cursor uses the regular
 * rmapbt operations.  The old btree blocks are not touched here; the caller
 * must invalidate and free them.
 */
void
xfs_rmapbt_commit_staged_btree(
	struct xfs_btree_cur	*cur,
	struct xfs_trans	*tp,
	struct xfs_buf		*agbp)
{
	struct xbtree_afakeroot	*fakeroot = cur->bc_ag.afake;
	struct xfs_agf		*agf = agbp->b_addr;
	int			btnum = cur->bc_btnum;

	ASSERT(cur->bc_flags & XFS_BTREE_STAGING);

	agf->agf_rmap_blocks = cpu_to_be32(fakeroot->af_blocks);
	agf->agf_levels[btnum] = cpu_to_be32(fakeroot->af_levels);
	agf->agf_roots[btnum] = cpu_to_be32(fakeroot->af_root);

	xfs_alloc_log_agf(tp, agbp,
			XFS_AGF_ROOTS | XFS_AGF_LEVELS | XFS_AGF_RMAP_BLOCKS);
	xfs_btree_commit_afakeroot(cur, tp, agbp, &xfs_rmapbt_ops);
}

/*
 * Calculate number of records in an rmap btree block.
 *
 * @blocklen is the block size in bytes; the rmap block header length is
 * subtracted first.  For a leaf the remainder is divided by the record size;
 * otherwise each entry needs two keys plus one pointer.
 */
int
xfs_rmapbt_maxrecs(
	int			blocklen,
	int			leaf)
{
	blocklen -= XFS_RMAP_BLOCK_LEN;

	if (leaf)
		return blocklen / sizeof(struct xfs_rmap_rec);
	return blocklen /
		(2 * sizeof(struct xfs_rmap_key) + sizeof(xfs_rmap_ptr_t));
}

/* Compute the maximum height of an rmap btree. */
void
xfs_rmapbt_compute_maxlevels(
	struct xfs_mount		*mp)
{
546 547 548 549 550 551 552 553 554 555 556 557 558 559 560 561 562 563
	/*
	 * On a non-reflink filesystem, the maximum number of rmap
	 * records is the number of blocks in the AG, hence the max
	 * rmapbt height is log_$maxrecs($agblocks).  However, with
	 * reflink each AG block can have up to 2^32 (per the refcount
	 * record format) owners, which means that theoretically we
	 * could face up to 2^64 rmap records.
	 *
	 * That effectively means that the max rmapbt height must be
	 * XFS_BTREE_MAXLEVELS.  "Fortunately" we'll run out of AG
	 * blocks to feed the rmapbt long before the rmapbt reaches
	 * maximum height.  The reflink code uses ag_resv_critical to
	 * disallow reflinking when less than 10% of the per-AG metadata
	 * block reservation since the fallback is a regular file copy.
	 */
	if (xfs_sb_version_hasreflink(&mp->m_sb))
		mp->m_rmap_maxlevels = XFS_BTREE_MAXLEVELS;
	else
564
		mp->m_rmap_maxlevels = xfs_btree_compute_maxlevels(
565
				mp->m_rmap_mnr, mp->m_sb.sb_agblocks);
566
}

/* Calculate the refcount btree size for some records. */
xfs_extlen_t
xfs_rmapbt_calc_size(
	struct xfs_mount	*mp,
	unsigned long long	len)
{
574
	return xfs_btree_calc_size(mp->m_rmap_mnr, len);
575 576 577 578 579 580 581
}

/*
 * Calculate the maximum rmap btree size, in blocks, for an AG of @agblocks
 * blocks (one record per block).  Returns 0 if the rmapbt geometry in the
 * mount has not been set up yet.
 */
xfs_extlen_t
xfs_rmapbt_max_size(
	struct xfs_mount	*mp,
	xfs_agblock_t		agblocks)
{
	/* Bail out if we're uninitialized, which can happen in mkfs. */
	if (mp->m_rmap_mxr[0] == 0)
		return 0;

	return xfs_rmapbt_calc_size(mp, agblocks);
}

/*
 * Figure out how many blocks to reserve and how many are used by this btree.
 */
int
xfs_rmapbt_calc_reserves(
	struct xfs_mount	*mp,
598
	struct xfs_trans	*tp,
599 600 601 602 603 604
	xfs_agnumber_t		agno,
	xfs_extlen_t		*ask,
	xfs_extlen_t		*used)
{
	struct xfs_buf		*agbp;
	struct xfs_agf		*agf;
605
	xfs_agblock_t		agblocks;
606 607 608 609 610 611
	xfs_extlen_t		tree_len;
	int			error;

	if (!xfs_sb_version_hasrmapbt(&mp->m_sb))
		return 0;

612
	error = xfs_alloc_read_agf(mp, tp, agno, 0, &agbp);
613 614 615
	if (error)
		return error;

C
Christoph Hellwig 已提交
616
	agf = agbp->b_addr;
617
	agblocks = be32_to_cpu(agf->agf_length);
618
	tree_len = be32_to_cpu(agf->agf_rmap_blocks);
619
	xfs_trans_brelse(tp, agbp);
620

621 622 623 624 625 626 627 628 629
	/*
	 * The log is permanently allocated, so the space it occupies will
	 * never be available for the kinds of things that would require btree
	 * expansion.  We therefore can pretend the space isn't there.
	 */
	if (mp->m_sb.sb_logstart &&
	    XFS_FSB_TO_AGNO(mp, mp->m_sb.sb_logstart) == agno)
		agblocks -= mp->m_sb.sb_logblocks;

630 631
	/* Reserve 1% of the AG or enough for 1 block per record. */
	*ask += max(agblocks / 100, xfs_rmapbt_max_size(mp, agblocks));
632 633 634 635
	*used += tree_len;

	return error;
}