xfs_attr_leaf.c 81.6 KB
Newer Older
D
Dave Chinner 已提交
1
// SPDX-License-Identifier: GPL-2.0
L
Linus Torvalds 已提交
2
/*
3
 * Copyright (c) 2000-2005 Silicon Graphics, Inc.
D
Dave Chinner 已提交
4
 * Copyright (c) 2013 Red Hat, Inc.
5
 * All Rights Reserved.
L
Linus Torvalds 已提交
6 7
 */
#include "xfs.h"
8
#include "xfs_fs.h"
9
#include "xfs_shared.h"
10
#include "xfs_format.h"
11 12
#include "xfs_log_format.h"
#include "xfs_trans_resv.h"
13
#include "xfs_bit.h"
L
Linus Torvalds 已提交
14 15
#include "xfs_sb.h"
#include "xfs_mount.h"
16
#include "xfs_da_format.h"
17
#include "xfs_da_btree.h"
L
Linus Torvalds 已提交
18
#include "xfs_inode.h"
19
#include "xfs_trans.h"
20
#include "xfs_inode_item.h"
21
#include "xfs_bmap_btree.h"
L
Linus Torvalds 已提交
22
#include "xfs_bmap.h"
23 24
#include "xfs_attr_sf.h"
#include "xfs_attr_remote.h"
L
Linus Torvalds 已提交
25 26 27
#include "xfs_attr.h"
#include "xfs_attr_leaf.h"
#include "xfs_error.h"
C
Christoph Hellwig 已提交
28
#include "xfs_trace.h"
D
Dave Chinner 已提交
29 30
#include "xfs_buf_item.h"
#include "xfs_cksum.h"
D
Dave Chinner 已提交
31
#include "xfs_dir2.h"
32
#include "xfs_log.h"
D
Dave Chinner 已提交
33

L
Linus Torvalds 已提交
34 35 36 37 38 39 40 41 42 43 44 45 46 47

/*
 * xfs_attr_leaf.c
 *
 * Routines to implement leaf blocks of attributes as Btrees of hashed names.
 */

/*========================================================================
 * Function prototypes for the kernel.
 *========================================================================*/

/*
 * Routines used for growing the Btree.
 */
D
Dave Chinner 已提交
48 49 50 51 52 53 54 55 56
STATIC int xfs_attr3_leaf_create(struct xfs_da_args *args,
				 xfs_dablk_t which_block, struct xfs_buf **bpp);
STATIC int xfs_attr3_leaf_add_work(struct xfs_buf *leaf_buffer,
				   struct xfs_attr3_icleaf_hdr *ichdr,
				   struct xfs_da_args *args, int freemap_index);
STATIC void xfs_attr3_leaf_compact(struct xfs_da_args *args,
				   struct xfs_attr3_icleaf_hdr *ichdr,
				   struct xfs_buf *leaf_buffer);
STATIC void xfs_attr3_leaf_rebalance(xfs_da_state_t *state,
L
Linus Torvalds 已提交
57 58
						   xfs_da_state_blk_t *blk1,
						   xfs_da_state_blk_t *blk2);
D
Dave Chinner 已提交
59 60 61 62 63 64 65
STATIC int xfs_attr3_leaf_figure_balance(xfs_da_state_t *state,
			xfs_da_state_blk_t *leaf_blk_1,
			struct xfs_attr3_icleaf_hdr *ichdr1,
			xfs_da_state_blk_t *leaf_blk_2,
			struct xfs_attr3_icleaf_hdr *ichdr2,
			int *number_entries_in_blk1,
			int *number_usedbytes_in_blk1);
L
Linus Torvalds 已提交
66 67 68 69

/*
 * Utility routines.
 */
70 71
STATIC void xfs_attr3_leaf_moveents(struct xfs_da_args *args,
			struct xfs_attr_leafblock *src_leaf,
D
Dave Chinner 已提交
72 73 74
			struct xfs_attr3_icleaf_hdr *src_ichdr, int src_start,
			struct xfs_attr_leafblock *dst_leaf,
			struct xfs_attr3_icleaf_hdr *dst_ichdr, int dst_start,
75
			int move_count);
76
STATIC int xfs_attr_leaf_entsize(xfs_attr_leafblock_t *leaf, int index);
77

78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151
/*
 * attr3 block 'firstused' conversion helpers.
 *
 * firstused refers to the offset of the first used byte of the nameval region
 * of an attr leaf block. The region starts at the tail of the block and expands
 * backwards towards the middle. As such, firstused is initialized to the block
 * size for an empty leaf block and is reduced from there.
 *
 * The attr3 block size is pegged to the fsb size and the maximum fsb is 64k.
 * The in-core firstused field is 32-bit and thus supports the maximum fsb size.
 * The on-disk field is only 16-bit, however, and overflows at 64k. Since this
 * only occurs at exactly 64k, we use zero as a magic on-disk value to represent
 * the attr block size. The following helpers manage the conversion between the
 * in-core and on-disk formats.
 */

/*
 * Fill in to->firstused from the on-disk leaf block @from, picking the field
 * from whichever header layout the block's magic number selects.  If the disk
 * carries XFS_ATTR3_LEAF_NULLOFF, the in-core value becomes geo->blksize.
 *
 * to->count and to->usedbytes must already be populated; they are only
 * consulted by the debug assertions.
 */
static void
xfs_attr3_leaf_firstused_from_disk(
	struct xfs_da_geometry		*geo,
	struct xfs_attr3_icleaf_hdr	*to,
	struct xfs_attr_leafblock	*from)
{
	if (from->hdr.info.magic != cpu_to_be16(XFS_ATTR3_LEAF_MAGIC)) {
		to->firstused = be16_to_cpu(from->hdr.firstused);
	} else {
		struct xfs_attr3_leaf_hdr	*v3hdr;

		v3hdr = (struct xfs_attr3_leaf_hdr *) from;
		to->firstused = be16_to_cpu(v3hdr->firstused);
	}

	/* Anything but the magic value is already a real offset. */
	if (to->firstused != XFS_ATTR3_LEAF_NULLOFF)
		return;

	/*
	 * The magic value stands in for the block size, which should only
	 * happen for an empty block whose size does not fit in 16 bits.
	 */
	ASSERT(!to->count && !to->usedbytes);
	ASSERT(geo->blksize > USHRT_MAX);
	to->firstused = geo->blksize;
}

/*
 * Store from->firstused into the on-disk leaf block @to as a big-endian 16-bit
 * value, in the header layout selected by from->magic.  A value that does not
 * fit in 16 bits is written as XFS_ATTR3_LEAF_NULLOFF.
 */
static void
xfs_attr3_leaf_firstused_to_disk(
	struct xfs_da_geometry		*geo,
	struct xfs_attr_leafblock	*to,
	struct xfs_attr3_icleaf_hdr	*from)
{
	uint32_t			ondisk = from->firstused;

	/* The magic value must never appear in the in-core header. */
	ASSERT(from->firstused != XFS_ATTR3_LEAF_NULLOFF);

	/*
	 * The only in-core value expected to exceed 16 bits is the block size
	 * itself; encode it with the magic on-disk value.
	 */
	if (ondisk > USHRT_MAX) {
		ASSERT(from->firstused == geo->blksize);
		ondisk = XFS_ATTR3_LEAF_NULLOFF;
	}

	if (from->magic != XFS_ATTR3_LEAF_MAGIC) {
		to->hdr.firstused = cpu_to_be16(ondisk);
		return;
	}

	((struct xfs_attr3_leaf_hdr *) to)->firstused = cpu_to_be16(ondisk);
}

D
Dave Chinner 已提交
152 153
void
xfs_attr3_leaf_hdr_from_disk(
154
	struct xfs_da_geometry		*geo,
D
Dave Chinner 已提交
155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170
	struct xfs_attr3_icleaf_hdr	*to,
	struct xfs_attr_leafblock	*from)
{
	int	i;

	ASSERT(from->hdr.info.magic == cpu_to_be16(XFS_ATTR_LEAF_MAGIC) ||
	       from->hdr.info.magic == cpu_to_be16(XFS_ATTR3_LEAF_MAGIC));

	if (from->hdr.info.magic == cpu_to_be16(XFS_ATTR3_LEAF_MAGIC)) {
		struct xfs_attr3_leaf_hdr *hdr3 = (struct xfs_attr3_leaf_hdr *)from;

		to->forw = be32_to_cpu(hdr3->info.hdr.forw);
		to->back = be32_to_cpu(hdr3->info.hdr.back);
		to->magic = be16_to_cpu(hdr3->info.hdr.magic);
		to->count = be16_to_cpu(hdr3->count);
		to->usedbytes = be16_to_cpu(hdr3->usedbytes);
171
		xfs_attr3_leaf_firstused_from_disk(geo, to, from);
D
Dave Chinner 已提交
172 173 174 175 176 177 178 179 180 181 182 183 184
		to->holes = hdr3->holes;

		for (i = 0; i < XFS_ATTR_LEAF_MAPSIZE; i++) {
			to->freemap[i].base = be16_to_cpu(hdr3->freemap[i].base);
			to->freemap[i].size = be16_to_cpu(hdr3->freemap[i].size);
		}
		return;
	}
	to->forw = be32_to_cpu(from->hdr.info.forw);
	to->back = be32_to_cpu(from->hdr.info.back);
	to->magic = be16_to_cpu(from->hdr.info.magic);
	to->count = be16_to_cpu(from->hdr.count);
	to->usedbytes = be16_to_cpu(from->hdr.usedbytes);
185
	xfs_attr3_leaf_firstused_from_disk(geo, to, from);
D
Dave Chinner 已提交
186 187 188 189 190 191 192 193 194 195
	to->holes = from->hdr.holes;

	for (i = 0; i < XFS_ATTR_LEAF_MAPSIZE; i++) {
		to->freemap[i].base = be16_to_cpu(from->hdr.freemap[i].base);
		to->freemap[i].size = be16_to_cpu(from->hdr.freemap[i].size);
	}
}

void
xfs_attr3_leaf_hdr_to_disk(
196
	struct xfs_da_geometry		*geo,
D
Dave Chinner 已提交
197 198 199
	struct xfs_attr_leafblock	*to,
	struct xfs_attr3_icleaf_hdr	*from)
{
200
	int				i;
D
Dave Chinner 已提交
201 202 203 204 205 206 207 208 209 210 211 212

	ASSERT(from->magic == XFS_ATTR_LEAF_MAGIC ||
	       from->magic == XFS_ATTR3_LEAF_MAGIC);

	if (from->magic == XFS_ATTR3_LEAF_MAGIC) {
		struct xfs_attr3_leaf_hdr *hdr3 = (struct xfs_attr3_leaf_hdr *)to;

		hdr3->info.hdr.forw = cpu_to_be32(from->forw);
		hdr3->info.hdr.back = cpu_to_be32(from->back);
		hdr3->info.hdr.magic = cpu_to_be16(from->magic);
		hdr3->count = cpu_to_be16(from->count);
		hdr3->usedbytes = cpu_to_be16(from->usedbytes);
213
		xfs_attr3_leaf_firstused_to_disk(geo, to, from);
D
Dave Chinner 已提交
214 215 216 217 218 219 220 221 222 223 224 225 226 227
		hdr3->holes = from->holes;
		hdr3->pad1 = 0;

		for (i = 0; i < XFS_ATTR_LEAF_MAPSIZE; i++) {
			hdr3->freemap[i].base = cpu_to_be16(from->freemap[i].base);
			hdr3->freemap[i].size = cpu_to_be16(from->freemap[i].size);
		}
		return;
	}
	to->hdr.info.forw = cpu_to_be32(from->forw);
	to->hdr.info.back = cpu_to_be32(from->back);
	to->hdr.info.magic = cpu_to_be16(from->magic);
	to->hdr.count = cpu_to_be16(from->count);
	to->hdr.usedbytes = cpu_to_be16(from->usedbytes);
228
	xfs_attr3_leaf_firstused_to_disk(geo, to, from);
D
Dave Chinner 已提交
229 230 231 232 233 234 235 236 237
	to->hdr.holes = from->holes;
	to->hdr.pad1 = 0;

	for (i = 0; i < XFS_ATTR_LEAF_MAPSIZE; i++) {
		to->hdr.freemap[i].base = cpu_to_be16(from->freemap[i].base);
		to->hdr.freemap[i].size = cpu_to_be16(from->freemap[i].size);
	}
}

238
static xfs_failaddr_t
D
Dave Chinner 已提交
239
xfs_attr3_leaf_verify(
240
	struct xfs_buf			*bp)
241
{
242 243 244 245 246
	struct xfs_attr3_icleaf_hdr	ichdr;
	struct xfs_mount		*mp = bp->b_target->bt_mount;
	struct xfs_attr_leafblock	*leaf = bp->b_addr;
	struct xfs_perag		*pag = bp->b_pag;
	struct xfs_attr_leaf_entry	*entries;
247 248
	uint16_t			end;
	int				i;
249

250
	xfs_attr3_leaf_hdr_from_disk(mp->m_attr_geo, &ichdr, leaf);
D
Dave Chinner 已提交
251 252 253 254 255

	if (xfs_sb_version_hascrc(&mp->m_sb)) {
		struct xfs_da3_node_hdr *hdr3 = bp->b_addr;

		if (ichdr.magic != XFS_ATTR3_LEAF_MAGIC)
256
			return __this_address;
D
Dave Chinner 已提交
257

258
		if (!uuid_equal(&hdr3->info.uuid, &mp->m_sb.sb_meta_uuid))
259
			return __this_address;
D
Dave Chinner 已提交
260
		if (be64_to_cpu(hdr3->info.blkno) != bp->b_bn)
261
			return __this_address;
262
		if (!xfs_log_check_lsn(mp, be64_to_cpu(hdr3->info.lsn)))
263
			return __this_address;
D
Dave Chinner 已提交
264 265
	} else {
		if (ichdr.magic != XFS_ATTR_LEAF_MAGIC)
266
			return __this_address;
267
	}
268 269 270 271 272 273
	/*
	 * In recovery there is a transient state where count == 0 is valid
	 * because we may have transitioned an empty shortform attr to a leaf
	 * if the attr didn't fit in shortform.
	 */
	if (pag && pag->pagf_init && ichdr.count == 0)
274
		return __this_address;
D
Dave Chinner 已提交
275

276 277 278 279 280 281 282 283 284 285 286 287 288 289 290
	/*
	 * firstused is the block offset of the first name info structure.
	 * Make sure it doesn't go off the block or crash into the header.
	 */
	if (ichdr.firstused > mp->m_attr_geo->blksize)
		return __this_address;
	if (ichdr.firstused < xfs_attr3_leaf_hdr_size(leaf))
		return __this_address;

	/* Make sure the entries array doesn't crash into the name info. */
	entries = xfs_attr3_leaf_entryp(bp->b_addr);
	if ((char *)&entries[ichdr.count] >
	    (char *)bp->b_addr + ichdr.firstused)
		return __this_address;

D
Dave Chinner 已提交
291 292 293
	/* XXX: need to range check rest of attr header values */
	/* XXX: hash order check? */

294 295 296 297 298 299 300 301 302 303 304 305 306 307 308 309 310 311 312 313
	/*
	 * Quickly check the freemap information.  Attribute data has to be
	 * aligned to 4-byte boundaries, and likewise for the free space.
	 */
	for (i = 0; i < XFS_ATTR_LEAF_MAPSIZE; i++) {
		if (ichdr.freemap[i].base > mp->m_attr_geo->blksize)
			return __this_address;
		if (ichdr.freemap[i].base & 0x3)
			return __this_address;
		if (ichdr.freemap[i].size > mp->m_attr_geo->blksize)
			return __this_address;
		if (ichdr.freemap[i].size & 0x3)
			return __this_address;
		end = ichdr.freemap[i].base + ichdr.freemap[i].size;
		if (end < ichdr.freemap[i].base)
			return __this_address;
		if (end > mp->m_attr_geo->blksize)
			return __this_address;
	}

314
	return NULL;
315 316 317
}

static void
D
Dave Chinner 已提交
318
xfs_attr3_leaf_write_verify(
319 320
	struct xfs_buf	*bp)
{
D
Dave Chinner 已提交
321
	struct xfs_mount	*mp = bp->b_target->bt_mount;
C
Carlos Maiolino 已提交
322
	struct xfs_buf_log_item	*bip = bp->b_log_item;
D
Dave Chinner 已提交
323
	struct xfs_attr3_leaf_hdr *hdr3 = bp->b_addr;
324
	xfs_failaddr_t		fa;
D
Dave Chinner 已提交
325

326 327 328
	fa = xfs_attr3_leaf_verify(bp);
	if (fa) {
		xfs_verifier_error(bp, -EFSCORRUPTED, fa);
D
Dave Chinner 已提交
329 330 331 332 333 334 335 336 337
		return;
	}

	if (!xfs_sb_version_hascrc(&mp->m_sb))
		return;

	if (bip)
		hdr3->info.lsn = cpu_to_be64(bip->bli_item.li_lsn);

338
	xfs_buf_update_cksum(bp, XFS_ATTR3_LEAF_CRC_OFF);
339
}
340

D
Dave Chinner 已提交
341 342 343 344 345 346
/*
 * leaf/node format detection on trees is sketchy, so a node read can be done on
 * leaf level blocks when detection identifies the tree as a node format tree
 * incorrectly. In this case, we need to swap the verifier to match the correct
 * format of the block being read.
 */
347
static void
D
Dave Chinner 已提交
348 349
xfs_attr3_leaf_read_verify(
	struct xfs_buf		*bp)
350
{
D
Dave Chinner 已提交
351
	struct xfs_mount	*mp = bp->b_target->bt_mount;
352
	xfs_failaddr_t		fa;
D
Dave Chinner 已提交
353

354 355
	if (xfs_sb_version_hascrc(&mp->m_sb) &&
	     !xfs_buf_verify_cksum(bp, XFS_ATTR3_LEAF_CRC_OFF))
356 357 358 359 360 361
		xfs_verifier_error(bp, -EFSBADCRC, __this_address);
	else {
		fa = xfs_attr3_leaf_verify(bp);
		if (fa)
			xfs_verifier_error(bp, -EFSCORRUPTED, fa);
	}
362 363
}

D
Dave Chinner 已提交
364
const struct xfs_buf_ops xfs_attr3_leaf_buf_ops = {
365
	.name = "xfs_attr3_leaf",
D
Dave Chinner 已提交
366 367
	.verify_read = xfs_attr3_leaf_read_verify,
	.verify_write = xfs_attr3_leaf_write_verify,
368
	.verify_struct = xfs_attr3_leaf_verify,
369
};
370

371
int
D
Dave Chinner 已提交
372
xfs_attr3_leaf_read(
373 374 375 376 377 378
	struct xfs_trans	*tp,
	struct xfs_inode	*dp,
	xfs_dablk_t		bno,
	xfs_daddr_t		mappedbno,
	struct xfs_buf		**bpp)
{
379 380 381
	int			err;

	err = xfs_da_read_buf(tp, dp, bno, mappedbno, bpp,
D
Dave Chinner 已提交
382
				XFS_ATTR_FORK, &xfs_attr3_leaf_buf_ops);
383
	if (!err && tp && *bpp)
384
		xfs_trans_buf_set_type(tp, *bpp, XFS_BLFT_ATTR_LEAF_BUF);
385
	return err;
386 387
}

388 389 390 391 392 393 394 395
/*========================================================================
 * Namespace helper routines
 *========================================================================*/

/*
 * If namespace bits don't match return 0.
 * If all match then return 1.
 */
396
STATIC int
397 398 399 400 401
xfs_attr_namesp_match(int arg_flags, int ondisk_flags)
{
	return XFS_ATTR_NSP_ONDISK(ondisk_flags) == XFS_ATTR_NSP_ARGS_TO_ONDISK(arg_flags);
}

L
Linus Torvalds 已提交
402 403

/*========================================================================
404
 * External routines when attribute fork size < XFS_LITINO(mp).
L
Linus Torvalds 已提交
405 406 407
 *========================================================================*/

/*
408 409
 * Query whether the requested number of additional bytes of extended
 * attribute space will be able to fit inline.
410
 *
411 412 413 414 415
 * Returns zero if not, else the di_forkoff fork offset to be used in the
 * literal area for attribute data once the new bytes have been added.
 *
 * di_forkoff must be 8 byte aligned, hence is stored as a >>3 value;
 * special case for dev/uuid inodes, they have fixed size data forks.
L
Linus Torvalds 已提交
416 417
 */
int
418 419 420 421 422
xfs_attr_shortform_bytesfit(xfs_inode_t *dp, int bytes)
{
	int offset;
	int minforkoff;	/* lower limit on valid forkoff locations */
	int maxforkoff;	/* upper limit on valid forkoff locations */
423
	int dsize;
424 425
	xfs_mount_t *mp = dp->i_mount;

426 427
	/* rounded down */
	offset = (XFS_LITINO(mp, dp->i_d.di_version) - bytes) >> 3;
428

429
	if (dp->i_d.di_format == XFS_DINODE_FMT_DEV) {
430 431 432 433
		minforkoff = roundup(sizeof(xfs_dev_t), 8) >> 3;
		return (offset >= minforkoff) ? minforkoff : 0;
	}

434 435 436 437 438 439 440 441 442 443 444 445 446 447 448 449 450 451 452
	/*
	 * If the requested numbers of bytes is smaller or equal to the
	 * current attribute fork size we can always proceed.
	 *
	 * Note that if_bytes in the data fork might actually be larger than
	 * the current data fork size is due to delalloc extents. In that
	 * case either the extent count will go down when they are converted
	 * to real extents, or the delalloc conversion will take care of the
	 * literal area rebalancing.
	 */
	if (bytes <= XFS_IFORK_ASIZE(dp))
		return dp->i_d.di_forkoff;

	/*
	 * For attr2 we can try to move the forkoff if there is space in the
	 * literal area, but for the old format we are done if there is no
	 * space in the fixed attribute fork.
	 */
	if (!(mp->m_flags & XFS_MOUNT_ATTR2))
453 454
		return 0;

455
	dsize = dp->i_df.if_bytes;
456

457 458
	switch (dp->i_d.di_format) {
	case XFS_DINODE_FMT_EXTENTS:
459
		/*
460
		 * If there is no attr fork and the data fork is extents, 
461 462 463
		 * determine if creating the default attr fork will result
		 * in the extents form migrating to btree. If so, the
		 * minimum offset only needs to be the space required for
464
		 * the btree root.
465
		 */
C
Christoph Hellwig 已提交
466 467
		if (!dp->i_d.di_forkoff && dp->i_df.if_bytes >
		    xfs_default_attroffset(dp))
468 469 470 471
			dsize = XFS_BMDR_SPACE_CALC(MINDBTPTRS);
		break;
	case XFS_DINODE_FMT_BTREE:
		/*
472 473 474
		 * If we have a data btree then keep forkoff if we have one,
		 * otherwise we are adding a new attr, so then we set
		 * minforkoff to where the btree root can finish so we have
475 476 477
		 * plenty of room for attrs
		 */
		if (dp->i_d.di_forkoff) {
478
			if (offset < dp->i_d.di_forkoff)
479
				return 0;
480 481
			return dp->i_d.di_forkoff;
		}
482
		dsize = XFS_BMAP_BROOT_SPACE(mp, dp->i_df.if_broot);
483 484
		break;
	}
485 486 487

	/*
	 * A data fork btree root must have space for at least
488 489
	 * MINDBTPTRS key/ptr pairs if the data fork is small or empty.
	 */
D
Dave Chinner 已提交
490
	minforkoff = max(dsize, XFS_BMDR_SPACE_CALC(MINDBTPTRS));
491 492 493
	minforkoff = roundup(minforkoff, 8) >> 3;

	/* attr fork btree root can have at least this many key/ptr pairs */
494 495
	maxforkoff = XFS_LITINO(mp, dp->i_d.di_version) -
			XFS_BMDR_SPACE_CALC(MINABTPTRS);
496 497 498 499
	maxforkoff = maxforkoff >> 3;	/* rounded down */

	if (offset >= maxforkoff)
		return maxforkoff;
500 501
	if (offset >= minforkoff)
		return offset;
502 503 504 505 506 507 508 509 510
	return 0;
}

/*
 * Switch on the ATTR2 superblock bit (implies also FEATURES2).
 *
 * Does nothing unless the mount has XFS_MOUNT_ATTR2 set and the superblock
 * does not yet have the feature.  The feature bit is re-checked under
 * m_sb_lock; the superblock is logged after the lock is dropped.
 */
STATIC void
xfs_sbversion_add_attr2(xfs_mount_t *mp, xfs_trans_t *tp)
{
	if (!(mp->m_flags & XFS_MOUNT_ATTR2))
		return;
	if (xfs_sb_version_hasattr2(&mp->m_sb))
		return;

	spin_lock(&mp->m_sb_lock);
	if (xfs_sb_version_hasattr2(&mp->m_sb)) {
		/* the bit was set between the unlocked check and the lock */
		spin_unlock(&mp->m_sb_lock);
		return;
	}
	xfs_sb_version_addattr2(&mp->m_sb);
	spin_unlock(&mp->m_sb_lock);

	xfs_log_sb(tp);
}

/*
 * Create the initial contents of a shortform attribute list.
 */
void
L
Linus Torvalds 已提交
527 528 529 530 531 532
xfs_attr_shortform_create(xfs_da_args_t *args)
{
	xfs_attr_sf_hdr_t *hdr;
	xfs_inode_t *dp;
	xfs_ifork_t *ifp;

533 534
	trace_xfs_attr_sf_create(args);

L
Linus Torvalds 已提交
535 536 537 538 539 540 541 542 543 544 545 546 547 548 549
	dp = args->dp;
	ASSERT(dp != NULL);
	ifp = dp->i_afp;
	ASSERT(ifp != NULL);
	ASSERT(ifp->if_bytes == 0);
	if (dp->i_d.di_aformat == XFS_DINODE_FMT_EXTENTS) {
		ifp->if_flags &= ~XFS_IFEXTENTS;	/* just in case */
		dp->i_d.di_aformat = XFS_DINODE_FMT_LOCAL;
		ifp->if_flags |= XFS_IFINLINE;
	} else {
		ASSERT(ifp->if_flags & XFS_IFINLINE);
	}
	xfs_idata_realloc(dp, sizeof(*hdr), XFS_ATTR_FORK);
	hdr = (xfs_attr_sf_hdr_t *)ifp->if_u1.if_data;
	hdr->count = 0;
550
	hdr->totsize = cpu_to_be16(sizeof(*hdr));
L
Linus Torvalds 已提交
551 552 553 554 555 556 557
	xfs_trans_log_inode(args->trans, dp, XFS_ILOG_CORE | XFS_ILOG_ADATA);
}

/*
 * Add a name/value pair to the shortform attribute list.
 * Overflow from the inode has already been checked for.
 */
558 559
void
xfs_attr_shortform_add(xfs_da_args_t *args, int forkoff)
L
Linus Torvalds 已提交
560 561 562 563
{
	xfs_attr_shortform_t *sf;
	xfs_attr_sf_entry_t *sfe;
	int i, offset, size;
564
	xfs_mount_t *mp;
L
Linus Torvalds 已提交
565 566 567
	xfs_inode_t *dp;
	xfs_ifork_t *ifp;

568 569
	trace_xfs_attr_sf_add(args);

L
Linus Torvalds 已提交
570
	dp = args->dp;
571 572 573
	mp = dp->i_mount;
	dp->i_d.di_forkoff = forkoff;

L
Linus Torvalds 已提交
574 575 576 577
	ifp = dp->i_afp;
	ASSERT(ifp->if_flags & XFS_IFINLINE);
	sf = (xfs_attr_shortform_t *)ifp->if_u1.if_data;
	sfe = &sf->list[0];
578
	for (i = 0; i < sf->hdr.count; sfe = XFS_ATTR_SF_NEXTENTRY(sfe), i++) {
579
#ifdef DEBUG
L
Linus Torvalds 已提交
580 581 582 583
		if (sfe->namelen != args->namelen)
			continue;
		if (memcmp(args->name, sfe->nameval, args->namelen) != 0)
			continue;
584
		if (!xfs_attr_namesp_match(args->flags, sfe->flags))
L
Linus Torvalds 已提交
585
			continue;
586 587
		ASSERT(0);
#endif
L
Linus Torvalds 已提交
588 589 590 591 592 593 594 595 596
	}

	offset = (char *)sfe - (char *)sf;
	size = XFS_ATTR_SF_ENTSIZE_BYNAME(args->namelen, args->valuelen);
	xfs_idata_realloc(dp, size, XFS_ATTR_FORK);
	sf = (xfs_attr_shortform_t *)ifp->if_u1.if_data;
	sfe = (xfs_attr_sf_entry_t *)((char *)sf + offset);

	sfe->namelen = args->namelen;
597
	sfe->valuelen = args->valuelen;
598
	sfe->flags = XFS_ATTR_NSP_ARGS_TO_ONDISK(args->flags);
L
Linus Torvalds 已提交
599 600
	memcpy(sfe->nameval, args->name, args->namelen);
	memcpy(&sfe->nameval[args->namelen], args->value, args->valuelen);
601
	sf->hdr.count++;
602
	be16_add_cpu(&sf->hdr.totsize, size);
L
Linus Torvalds 已提交
603 604
	xfs_trans_log_inode(args->trans, dp, XFS_ILOG_CORE | XFS_ILOG_ADATA);

605
	xfs_sbversion_add_attr2(mp, args->trans);
L
Linus Torvalds 已提交
606 607
}

608 609 610 611
/*
 * After the last attribute is removed revert to original inode format,
 * making all literal area available to the data fork once more.
 */
612 613
void
xfs_attr_fork_remove(
614 615 616 617 618 619 620 621 622 623 624 625 626
	struct xfs_inode	*ip,
	struct xfs_trans	*tp)
{
	xfs_idestroy_fork(ip, XFS_ATTR_FORK);
	ip->i_d.di_forkoff = 0;
	ip->i_d.di_aformat = XFS_DINODE_FMT_EXTENTS;

	ASSERT(ip->i_d.di_anextents == 0);
	ASSERT(ip->i_afp == NULL);

	xfs_trans_log_inode(tp, ip, XFS_ILOG_CORE);
}

L
Linus Torvalds 已提交
627
/*
 * Remove an attribute from the shortform attribute list structure.
 *
 * Returns -ENOATTR if no entry matches the name and namespace in @args,
 * otherwise 0 once the entry has been cut out of the list.
 */
int
xfs_attr_shortform_remove(xfs_da_args_t *args)
{
	xfs_inode_t *dp = args->dp;
	xfs_mount_t *mp;
	xfs_attr_shortform_t *sf;
	xfs_attr_sf_entry_t *sfe;
	int base, size=0, end, totsize, i;
	int nents;

	trace_xfs_attr_sf_remove(args);

	mp = dp->i_mount;
	sf = (xfs_attr_shortform_t *)dp->i_afp->if_u1.if_data;

	/*
	 * Search for the entry, tracking its byte offset from the start of
	 * the fork data in 'base' and its size in 'size'.
	 */
	base = sizeof(xfs_attr_sf_hdr_t);
	sfe = &sf->list[0];
	nents = sf->hdr.count;
	for (i = 0; i < nents; i++) {
		size = XFS_ATTR_SF_ENTSIZE(sfe);
		if (sfe->namelen == args->namelen &&
		    memcmp(sfe->nameval, args->name, args->namelen) == 0 &&
		    xfs_attr_namesp_match(args->flags, sfe->flags))
			break;
		sfe = XFS_ATTR_SF_NEXTENTRY(sfe);
		base += size;
	}
	if (i == nents)
		return -ENOATTR;

	/*
	 * Fix up the attribute fork data, covering the hole
	 */
	end = base + size;
	totsize = be16_to_cpu(sf->hdr.totsize);
	if (end != totsize)
		memmove((char *)sf + base, (char *)sf + end, totsize - end);
	sf->hdr.count--;
	be16_add_cpu(&sf->hdr.totsize, -size);

	/*
	 * Fix up the start offset of the attribute fork
	 */
	totsize -= size;
	if (totsize == sizeof(xfs_attr_sf_hdr_t) &&
	    (mp->m_flags & XFS_MOUNT_ATTR2) &&
	    (dp->i_d.di_format != XFS_DINODE_FMT_BTREE) &&
	    !(args->op_flags & XFS_DA_OP_ADDNAME)) {
		/* only the header is left: drop the attr fork entirely */
		xfs_attr_fork_remove(dp, args->trans);
	} else {
		xfs_idata_realloc(dp, -size, XFS_ATTR_FORK);
		dp->i_d.di_forkoff = xfs_attr_shortform_bytesfit(dp, totsize);
		ASSERT(dp->i_d.di_forkoff);
		ASSERT(totsize > sizeof(xfs_attr_sf_hdr_t) ||
				(args->op_flags & XFS_DA_OP_ADDNAME) ||
				!(mp->m_flags & XFS_MOUNT_ATTR2) ||
				dp->i_d.di_format == XFS_DINODE_FMT_BTREE);
		xfs_trans_log_inode(args->trans, dp,
					XFS_ILOG_CORE | XFS_ILOG_ADATA);
	}

	xfs_sbversion_add_attr2(mp, args->trans);

	return 0;
}

/*
 * Look up a name in a shortform attribute list structure.
 *
 * Returns -EEXIST if an entry with the same name and namespace is present,
 * -ENOATTR if not.
 */
/*ARGSUSED*/
int
xfs_attr_shortform_lookup(xfs_da_args_t *args)
{
	xfs_ifork_t *ifp = args->dp->i_afp;
	xfs_attr_shortform_t *sf;
	xfs_attr_sf_entry_t *sfe;
	int i;

	trace_xfs_attr_sf_lookup(args);

	ASSERT(ifp->if_flags & XFS_IFINLINE);
	sf = (xfs_attr_shortform_t *)ifp->if_u1.if_data;

	sfe = &sf->list[0];
	for (i = 0; i < sf->hdr.count; i++) {
		if (sfe->namelen == args->namelen &&
		    memcmp(args->name, sfe->nameval, args->namelen) == 0 &&
		    xfs_attr_namesp_match(args->flags, sfe->flags))
			return -EEXIST;
		sfe = XFS_ATTR_SF_NEXTENTRY(sfe);
	}
	return -ENOATTR;
}

/*
 * Retrieve the value of a named attribute from a shortform attribute list.
 *
 * Returns -ENOATTR if there is no matching entry.  For a match,
 * args->valuelen is always set to the stored value length, and:
 *   - with ATTR_KERNOVAL set, no data is copied and -EEXIST is returned;
 *   - if the caller's args->valuelen was smaller than the stored value,
 *     no data is copied and -ERANGE is returned;
 *   - otherwise the value is copied to args->value and -EEXIST is returned.
 */
/*ARGSUSED*/
int
xfs_attr_shortform_getvalue(xfs_da_args_t *args)
{
	xfs_attr_shortform_t *sf;
	xfs_attr_sf_entry_t *sfe;
	int i;
	int length_only;
	int too_small;

	ASSERT(args->dp->i_afp->if_flags == XFS_IFINLINE);
	sf = (xfs_attr_shortform_t *)args->dp->i_afp->if_u1.if_data;

	sfe = &sf->list[0];
	for (i = 0; i < sf->hdr.count; sfe = XFS_ATTR_SF_NEXTENTRY(sfe), i++) {
		if (sfe->namelen != args->namelen ||
		    memcmp(args->name, sfe->nameval, args->namelen) != 0 ||
		    !xfs_attr_namesp_match(args->flags, sfe->flags))
			continue;

		/* decide the outcome before valuelen is overwritten */
		length_only = args->flags & ATTR_KERNOVAL;
		too_small = !length_only && args->valuelen < sfe->valuelen;

		args->valuelen = sfe->valuelen;
		if (too_small)
			return -ERANGE;
		if (!length_only)
			memcpy(args->value, &sfe->nameval[args->namelen],
							    args->valuelen);
		return -EEXIST;
	}
	return -ENOATTR;
}

/*
767 768
 * Convert from using the shortform to the leaf.  On success, return the
 * buffer so that we can keep it locked until we're totally done with it.
L
Linus Torvalds 已提交
769 770
 */
int
771
xfs_attr_shortform_to_leaf(
772 773
	struct xfs_da_args		*args,
	struct xfs_buf			**leaf_bp)
L
Linus Torvalds 已提交
774
{
775 776 777 778 779 780 781 782 783
	struct xfs_inode		*dp;
	struct xfs_attr_shortform	*sf;
	struct xfs_attr_sf_entry	*sfe;
	struct xfs_da_args		nargs;
	char				*tmpbuffer;
	int				error, i, size;
	xfs_dablk_t			blkno;
	struct xfs_buf			*bp;
	struct xfs_ifork		*ifp;
L
Linus Torvalds 已提交
784

785 786
	trace_xfs_attr_sf_to_leaf(args);

L
Linus Torvalds 已提交
787 788 789
	dp = args->dp;
	ifp = dp->i_afp;
	sf = (xfs_attr_shortform_t *)ifp->if_u1.if_data;
790
	size = be16_to_cpu(sf->hdr.totsize);
L
Linus Torvalds 已提交
791 792 793 794 795 796
	tmpbuffer = kmem_alloc(size, KM_SLEEP);
	ASSERT(tmpbuffer != NULL);
	memcpy(tmpbuffer, ifp->if_u1.if_data, size);
	sf = (xfs_attr_shortform_t *)tmpbuffer;

	xfs_idata_realloc(dp, -size, XFS_ATTR_FORK);
797 798
	xfs_bmap_local_to_extents_empty(dp, XFS_ATTR_FORK);

L
Linus Torvalds 已提交
799 800 801 802 803 804 805
	bp = NULL;
	error = xfs_da_grow_inode(args, &blkno);
	if (error) {
		/*
		 * If we hit an IO error middle of the transaction inside
		 * grow_inode(), we may have inconsistent data. Bail out.
		 */
D
Dave Chinner 已提交
806
		if (error == -EIO)
L
Linus Torvalds 已提交
807 808 809 810 811 812 813
			goto out;
		xfs_idata_realloc(dp, size, XFS_ATTR_FORK);	/* try to put */
		memcpy(ifp->if_u1.if_data, tmpbuffer, size);	/* it back */
		goto out;
	}

	ASSERT(blkno == 0);
D
Dave Chinner 已提交
814
	error = xfs_attr3_leaf_create(args, blkno, &bp);
L
Linus Torvalds 已提交
815
	if (error) {
816 817
		/* xfs_attr3_leaf_create may not have instantiated a block */
		if (bp && (xfs_da_shrink_inode(args, 0, bp) != 0))
L
Linus Torvalds 已提交
818 819 820 821 822 823 824 825
			goto out;
		xfs_idata_realloc(dp, size, XFS_ATTR_FORK);	/* try to put */
		memcpy(ifp->if_u1.if_data, tmpbuffer, size);	/* it back */
		goto out;
	}

	memset((char *)&nargs, 0, sizeof(nargs));
	nargs.dp = dp;
826
	nargs.geo = args->geo;
L
Linus Torvalds 已提交
827 828 829
	nargs.total = args->total;
	nargs.whichfork = XFS_ATTR_FORK;
	nargs.trans = args->trans;
830
	nargs.op_flags = XFS_DA_OP_OKNOENT;
L
Linus Torvalds 已提交
831 832

	sfe = &sf->list[0];
833
	for (i = 0; i < sf->hdr.count; i++) {
834
		nargs.name = sfe->nameval;
L
Linus Torvalds 已提交
835
		nargs.namelen = sfe->namelen;
836
		nargs.value = &sfe->nameval[nargs.namelen];
837
		nargs.valuelen = sfe->valuelen;
838
		nargs.hashval = xfs_da_hashname(sfe->nameval,
L
Linus Torvalds 已提交
839
						sfe->namelen);
840
		nargs.flags = XFS_ATTR_NSP_ONDISK_TO_ARGS(sfe->flags);
D
Dave Chinner 已提交
841
		error = xfs_attr3_leaf_lookup_int(bp, &nargs); /* set a->index */
D
Dave Chinner 已提交
842
		ASSERT(error == -ENOATTR);
D
Dave Chinner 已提交
843
		error = xfs_attr3_leaf_add(bp, &nargs);
D
Dave Chinner 已提交
844
		ASSERT(error != -ENOSPC);
L
Linus Torvalds 已提交
845 846 847 848 849
		if (error)
			goto out;
		sfe = XFS_ATTR_SF_NEXTENTRY(sfe);
	}
	error = 0;
850
	*leaf_bp = bp;
L
Linus Torvalds 已提交
851
out:
852
	kmem_free(tmpbuffer);
E
Eric Sandeen 已提交
853
	return error;
L
Linus Torvalds 已提交
854 855 856 857 858 859 860
}

/*
 * Check a leaf attribute block to see if all the entries would fit into
 * a shortform attribute list.
 */
int
861
xfs_attr_shortform_allfit(
862 863
	struct xfs_buf		*bp,
	struct xfs_inode	*dp)
L
Linus Torvalds 已提交
864
{
865 866
	struct xfs_attr_leafblock *leaf;
	struct xfs_attr_leaf_entry *entry;
L
Linus Torvalds 已提交
867
	xfs_attr_leaf_name_local_t *name_loc;
868 869 870
	struct xfs_attr3_icleaf_hdr leafhdr;
	int			bytes;
	int			i;
871
	struct xfs_mount	*mp = bp->b_target->bt_mount;
L
Linus Torvalds 已提交
872

873
	leaf = bp->b_addr;
874
	xfs_attr3_leaf_hdr_from_disk(mp->m_attr_geo, &leafhdr, leaf);
875
	entry = xfs_attr3_leaf_entryp(leaf);
L
Linus Torvalds 已提交
876 877

	bytes = sizeof(struct xfs_attr_sf_hdr);
878
	for (i = 0; i < leafhdr.count; entry++, i++) {
L
Linus Torvalds 已提交
879 880 881
		if (entry->flags & XFS_ATTR_INCOMPLETE)
			continue;		/* don't copy partial entries */
		if (!(entry->flags & XFS_ATTR_LOCAL))
E
Eric Sandeen 已提交
882
			return 0;
D
Dave Chinner 已提交
883
		name_loc = xfs_attr3_leaf_name_local(leaf, i);
L
Linus Torvalds 已提交
884
		if (name_loc->namelen >= XFS_ATTR_SF_ENTSIZE_MAX)
E
Eric Sandeen 已提交
885
			return 0;
886
		if (be16_to_cpu(name_loc->valuelen) >= XFS_ATTR_SF_ENTSIZE_MAX)
E
Eric Sandeen 已提交
887
			return 0;
888
		bytes += sizeof(struct xfs_attr_sf_entry) - 1
L
Linus Torvalds 已提交
889
				+ name_loc->namelen
890
				+ be16_to_cpu(name_loc->valuelen);
L
Linus Torvalds 已提交
891
	}
892
	if ((dp->i_mount->m_flags & XFS_MOUNT_ATTR2) &&
893
	    (dp->i_d.di_format != XFS_DINODE_FMT_BTREE) &&
894
	    (bytes == sizeof(struct xfs_attr_sf_hdr)))
895 896
		return -1;
	return xfs_attr_shortform_bytesfit(dp, bytes);
L
Linus Torvalds 已提交
897 898
}

899 900 901 902 903 904 905 906 907 908 909 910 911 912 913 914 915 916 917 918 919 920 921 922 923 924 925 926 927 928 929 930 931 932 933 934 935 936 937 938 939 940 941 942 943 944 945 946 947 948 949 950 951 952 953 954 955 956 957 958 959 960 961 962 963 964 965 966 967 968 969 970 971 972
/*
 * Verify the consistency of an inline attribute fork.
 *
 * Walks the hdr.count entries of the shortform attribute list held in the
 * inode's attr fork and checks that each entry lies inside the if_bytes of
 * fork data, has a non-zero name length, and carries at most one namespace
 * flag and no other flag bits.  After the last entry the walk must end
 * exactly at the end of the fork data.
 *
 * Returns NULL if the fork looks sane, otherwise the address of the check
 * that failed (__this_address).
 */
xfs_failaddr_t
xfs_attr_shortform_verify(
	struct xfs_inode		*ip)
{
	struct xfs_attr_shortform	*sfp;
	struct xfs_attr_sf_entry	*sfep;
	struct xfs_attr_sf_entry	*next_sfep;
	char				*endp;
	struct xfs_ifork		*ifp;
	int				i;
	int				size;

	ASSERT(ip->i_d.di_aformat == XFS_DINODE_FMT_LOCAL);
	ifp = XFS_IFORK_PTR(ip, XFS_ATTR_FORK);
	sfp = (struct xfs_attr_shortform *)ifp->if_u1.if_data;
	size = ifp->if_bytes;

	/*
	 * Give up if the attribute is way too short.
	 */
	if (size < sizeof(struct xfs_attr_sf_hdr))
		return __this_address;

	endp = (char *)sfp + size;

	/* Check all reported entries */
	sfep = &sfp->list[0];
	for (i = 0; i < sfp->hdr.count; i++) {
		/*
		 * struct xfs_attr_sf_entry has a variable length.
		 * Check the fixed-offset parts of the structure are
		 * within the data buffer.
		 *
		 * sizeof(*sfep) also counts the first byte of the
		 * variable-length name array, so that byte has to be
		 * subtracted here.  Without the "- 1" a final entry with a
		 * one byte name and an empty value, which ends exactly at
		 * endp, would be rejected even though it is valid.
		 */
		if (((char *)sfep + sizeof(*sfep) - 1) >= endp)
			return __this_address;

		/* Don't allow names with known bad length. */
		if (sfep->namelen == 0)
			return __this_address;

		/*
		 * Check that the variable-length part of the structure is
		 * within the data buffer.  The next entry starts after the
		 * name component, so nextentry is an acceptable test.
		 */
		next_sfep = XFS_ATTR_SF_NEXTENTRY(sfep);
		if ((char *)next_sfep > endp)
			return __this_address;

		/*
		 * Check for unknown flags.  Short form doesn't support
		 * the incomplete or local bits, so we can use the namespace
		 * mask here.
		 */
		if (sfep->flags & ~XFS_ATTR_NSP_ONDISK_MASK)
			return __this_address;

		/*
		 * Check for invalid namespace combinations.  We only allow
		 * one namespace flag per xattr, so we can just count the
		 * bits (i.e. hweight) here.
		 */
		if (hweight8(sfep->flags & XFS_ATTR_NSP_ONDISK_MASK) > 1)
			return __this_address;

		sfep = next_sfep;
	}

	/* The entries must account for every byte of the fork data. */
	if ((void *)sfep != (void *)endp)
		return __this_address;

	return NULL;
}

L
Linus Torvalds 已提交
973 974 975 976
/*
 * Convert a leaf attribute list to shortform attribute list
 */
int
D
Dave Chinner 已提交
977 978 979 980
xfs_attr3_leaf_to_shortform(
	struct xfs_buf		*bp,
	struct xfs_da_args	*args,
	int			forkoff)
L
Linus Torvalds 已提交
981
{
D
Dave Chinner 已提交
982 983 984 985 986 987 988 989 990
	struct xfs_attr_leafblock *leaf;
	struct xfs_attr3_icleaf_hdr ichdr;
	struct xfs_attr_leaf_entry *entry;
	struct xfs_attr_leaf_name_local *name_loc;
	struct xfs_da_args	nargs;
	struct xfs_inode	*dp = args->dp;
	char			*tmpbuffer;
	int			error;
	int			i;
L
Linus Torvalds 已提交
991

992 993
	trace_xfs_attr_leaf_to_sf(args);

994
	tmpbuffer = kmem_alloc(args->geo->blksize, KM_SLEEP);
D
Dave Chinner 已提交
995
	if (!tmpbuffer)
D
Dave Chinner 已提交
996
		return -ENOMEM;
L
Linus Torvalds 已提交
997

998
	memcpy(tmpbuffer, bp->b_addr, args->geo->blksize);
D
Dave Chinner 已提交
999

L
Linus Torvalds 已提交
1000
	leaf = (xfs_attr_leafblock_t *)tmpbuffer;
1001
	xfs_attr3_leaf_hdr_from_disk(args->geo, &ichdr, leaf);
D
Dave Chinner 已提交
1002 1003 1004
	entry = xfs_attr3_leaf_entryp(leaf);

	/* XXX (dgc): buffer is about to be marked stale - why zero it? */
1005
	memset(bp->b_addr, 0, args->geo->blksize);
L
Linus Torvalds 已提交
1006 1007 1008 1009 1010 1011 1012

	/*
	 * Clean out the prior contents of the attribute list.
	 */
	error = xfs_da_shrink_inode(args, 0, bp);
	if (error)
		goto out;
1013 1014

	if (forkoff == -1) {
1015
		ASSERT(dp->i_mount->m_flags & XFS_MOUNT_ATTR2);
1016
		ASSERT(dp->i_d.di_format != XFS_DINODE_FMT_BTREE);
1017
		xfs_attr_fork_remove(dp, args->trans);
L
Linus Torvalds 已提交
1018
		goto out;
1019 1020 1021
	}

	xfs_attr_shortform_create(args);
L
Linus Torvalds 已提交
1022 1023 1024 1025 1026

	/*
	 * Copy the attributes
	 */
	memset((char *)&nargs, 0, sizeof(nargs));
1027
	nargs.geo = args->geo;
L
Linus Torvalds 已提交
1028 1029 1030 1031
	nargs.dp = dp;
	nargs.total = args->total;
	nargs.whichfork = XFS_ATTR_FORK;
	nargs.trans = args->trans;
1032
	nargs.op_flags = XFS_DA_OP_OKNOENT;
D
Dave Chinner 已提交
1033 1034

	for (i = 0; i < ichdr.count; entry++, i++) {
L
Linus Torvalds 已提交
1035 1036 1037 1038 1039
		if (entry->flags & XFS_ATTR_INCOMPLETE)
			continue;	/* don't copy partial entries */
		if (!entry->nameidx)
			continue;
		ASSERT(entry->flags & XFS_ATTR_LOCAL);
D
Dave Chinner 已提交
1040
		name_loc = xfs_attr3_leaf_name_local(leaf, i);
1041
		nargs.name = name_loc->nameval;
L
Linus Torvalds 已提交
1042
		nargs.namelen = name_loc->namelen;
1043
		nargs.value = &name_loc->nameval[nargs.namelen];
1044
		nargs.valuelen = be16_to_cpu(name_loc->valuelen);
1045
		nargs.hashval = be32_to_cpu(entry->hashval);
1046
		nargs.flags = XFS_ATTR_NSP_ONDISK_TO_ARGS(entry->flags);
1047
		xfs_attr_shortform_add(&nargs, forkoff);
L
Linus Torvalds 已提交
1048 1049 1050 1051
	}
	error = 0;

out:
1052
	kmem_free(tmpbuffer);
D
Dave Chinner 已提交
1053
	return error;
L
Linus Torvalds 已提交
1054 1055 1056 1057 1058 1059
}

/*
 * Convert from using a single leaf to a root node and a leaf.
 */
int
D
Dave Chinner 已提交
1060 1061
xfs_attr3_leaf_to_node(
	struct xfs_da_args	*args)
L
Linus Torvalds 已提交
1062
{
D
Dave Chinner 已提交
1063 1064 1065
	struct xfs_attr_leafblock *leaf;
	struct xfs_attr3_icleaf_hdr icleafhdr;
	struct xfs_attr_leaf_entry *entries;
1066
	struct xfs_da_node_entry *btree;
D
Dave Chinner 已提交
1067 1068 1069 1070 1071 1072 1073 1074
	struct xfs_da3_icnode_hdr icnodehdr;
	struct xfs_da_intnode	*node;
	struct xfs_inode	*dp = args->dp;
	struct xfs_mount	*mp = dp->i_mount;
	struct xfs_buf		*bp1 = NULL;
	struct xfs_buf		*bp2 = NULL;
	xfs_dablk_t		blkno;
	int			error;
L
Linus Torvalds 已提交
1075

1076 1077
	trace_xfs_attr_leaf_to_node(args);

L
Linus Torvalds 已提交
1078 1079 1080
	error = xfs_da_grow_inode(args, &blkno);
	if (error)
		goto out;
D
Dave Chinner 已提交
1081
	error = xfs_attr3_leaf_read(args->trans, dp, 0, -1, &bp1);
L
Linus Torvalds 已提交
1082 1083
	if (error)
		goto out;
1084

D
Dave Chinner 已提交
1085
	error = xfs_da_get_buf(args->trans, dp, blkno, -1, &bp2, XFS_ATTR_FORK);
L
Linus Torvalds 已提交
1086 1087
	if (error)
		goto out;
D
Dave Chinner 已提交
1088 1089

	/* copy leaf to new buffer, update identifiers */
1090
	xfs_trans_buf_set_type(args->trans, bp2, XFS_BLFT_ATTR_LEAF_BUF);
1091
	bp2->b_ops = bp1->b_ops;
1092
	memcpy(bp2->b_addr, bp1->b_addr, args->geo->blksize);
D
Dave Chinner 已提交
1093 1094 1095 1096
	if (xfs_sb_version_hascrc(&mp->m_sb)) {
		struct xfs_da3_blkinfo *hdr3 = bp2->b_addr;
		hdr3->blkno = cpu_to_be64(bp2->b_bn);
	}
1097
	xfs_trans_log_buf(args->trans, bp2, 0, args->geo->blksize - 1);
L
Linus Torvalds 已提交
1098 1099 1100 1101

	/*
	 * Set up the new root node.
	 */
1102
	error = xfs_da3_node_create(args, 0, 1, &bp1, XFS_ATTR_FORK);
L
Linus Torvalds 已提交
1103 1104
	if (error)
		goto out;
1105
	node = bp1->b_addr;
1106
	dp->d_ops->node_hdr_from_disk(&icnodehdr, node);
D
Dave Chinner 已提交
1107
	btree = dp->d_ops->node_tree_p(node);
D
Dave Chinner 已提交
1108

1109
	leaf = bp2->b_addr;
1110
	xfs_attr3_leaf_hdr_from_disk(args->geo, &icleafhdr, leaf);
D
Dave Chinner 已提交
1111 1112
	entries = xfs_attr3_leaf_entryp(leaf);

L
Linus Torvalds 已提交
1113
	/* both on-disk, don't endian-flip twice */
D
Dave Chinner 已提交
1114
	btree[0].hashval = entries[icleafhdr.count - 1].hashval;
1115
	btree[0].before = cpu_to_be32(blkno);
D
Dave Chinner 已提交
1116
	icnodehdr.count = 1;
1117
	dp->d_ops->node_hdr_to_disk(node, &icnodehdr);
1118
	xfs_trans_log_buf(args->trans, bp1, 0, args->geo->blksize - 1);
L
Linus Torvalds 已提交
1119 1120
	error = 0;
out:
D
Dave Chinner 已提交
1121
	return error;
L
Linus Torvalds 已提交
1122 1123 1124 1125 1126 1127 1128 1129 1130 1131
}

/*========================================================================
 * Routines used for growing the Btree.
 *========================================================================*/

/*
 * Create the initial contents of a leaf attribute list
 * or a leaf in a node attribute list.
 */
1132
STATIC int
D
Dave Chinner 已提交
1133 1134 1135 1136
xfs_attr3_leaf_create(
	struct xfs_da_args	*args,
	xfs_dablk_t		blkno,
	struct xfs_buf		**bpp)
L
Linus Torvalds 已提交
1137
{
D
Dave Chinner 已提交
1138 1139 1140 1141 1142 1143
	struct xfs_attr_leafblock *leaf;
	struct xfs_attr3_icleaf_hdr ichdr;
	struct xfs_inode	*dp = args->dp;
	struct xfs_mount	*mp = dp->i_mount;
	struct xfs_buf		*bp;
	int			error;
L
Linus Torvalds 已提交
1144

1145 1146
	trace_xfs_attr_leaf_create(args);

L
Linus Torvalds 已提交
1147 1148 1149
	error = xfs_da_get_buf(args->trans, args->dp, blkno, -1, &bp,
					    XFS_ATTR_FORK);
	if (error)
D
Dave Chinner 已提交
1150 1151
		return error;
	bp->b_ops = &xfs_attr3_leaf_buf_ops;
1152
	xfs_trans_buf_set_type(args->trans, bp, XFS_BLFT_ATTR_LEAF_BUF);
1153
	leaf = bp->b_addr;
1154
	memset(leaf, 0, args->geo->blksize);
D
Dave Chinner 已提交
1155 1156

	memset(&ichdr, 0, sizeof(ichdr));
1157
	ichdr.firstused = args->geo->blksize;
D
Dave Chinner 已提交
1158 1159 1160 1161 1162 1163 1164 1165

	if (xfs_sb_version_hascrc(&mp->m_sb)) {
		struct xfs_da3_blkinfo *hdr3 = bp->b_addr;

		ichdr.magic = XFS_ATTR3_LEAF_MAGIC;

		hdr3->blkno = cpu_to_be64(bp->b_bn);
		hdr3->owner = cpu_to_be64(dp->i_ino);
1166
		uuid_copy(&hdr3->uuid, &mp->m_sb.sb_meta_uuid);
L
Linus Torvalds 已提交
1167

D
Dave Chinner 已提交
1168 1169 1170 1171 1172 1173
		ichdr.freemap[0].base = sizeof(struct xfs_attr3_leaf_hdr);
	} else {
		ichdr.magic = XFS_ATTR_LEAF_MAGIC;
		ichdr.freemap[0].base = sizeof(struct xfs_attr_leaf_hdr);
	}
	ichdr.freemap[0].size = ichdr.firstused - ichdr.freemap[0].base;
L
Linus Torvalds 已提交
1174

1175
	xfs_attr3_leaf_hdr_to_disk(args->geo, leaf, &ichdr);
1176
	xfs_trans_log_buf(args->trans, bp, 0, args->geo->blksize - 1);
L
Linus Torvalds 已提交
1177 1178

	*bpp = bp;
D
Dave Chinner 已提交
1179
	return 0;
L
Linus Torvalds 已提交
1180 1181 1182 1183 1184 1185
}

/*
 * Split the leaf node, rebalance, then add the new entry.
 */
int
D
Dave Chinner 已提交
1186 1187 1188 1189
xfs_attr3_leaf_split(
	struct xfs_da_state	*state,
	struct xfs_da_state_blk	*oldblk,
	struct xfs_da_state_blk	*newblk)
L
Linus Torvalds 已提交
1190 1191 1192 1193
{
	xfs_dablk_t blkno;
	int error;

1194 1195
	trace_xfs_attr_leaf_split(state->args);

L
Linus Torvalds 已提交
1196 1197 1198 1199 1200 1201
	/*
	 * Allocate space for a new leaf node.
	 */
	ASSERT(oldblk->magic == XFS_ATTR_LEAF_MAGIC);
	error = xfs_da_grow_inode(state->args, &blkno);
	if (error)
E
Eric Sandeen 已提交
1202
		return error;
D
Dave Chinner 已提交
1203
	error = xfs_attr3_leaf_create(state->args, blkno, &newblk->bp);
L
Linus Torvalds 已提交
1204
	if (error)
E
Eric Sandeen 已提交
1205
		return error;
L
Linus Torvalds 已提交
1206 1207 1208 1209 1210 1211 1212
	newblk->blkno = blkno;
	newblk->magic = XFS_ATTR_LEAF_MAGIC;

	/*
	 * Rebalance the entries across the two leaves.
	 * NOTE: rebalance() currently depends on the 2nd block being empty.
	 */
D
Dave Chinner 已提交
1213
	xfs_attr3_leaf_rebalance(state, oldblk, newblk);
1214
	error = xfs_da3_blk_link(state, oldblk, newblk);
L
Linus Torvalds 已提交
1215
	if (error)
E
Eric Sandeen 已提交
1216
		return error;
L
Linus Torvalds 已提交
1217 1218 1219 1220 1221 1222 1223 1224

	/*
	 * Save info on "old" attribute for "atomic rename" ops, leaf_add()
	 * modifies the index/blkno/rmtblk/rmtblkcnt fields to show the
	 * "new" attrs info.  Will need the "old" info to remove it later.
	 *
	 * Insert the "new" entry in the correct block.
	 */
1225 1226
	if (state->inleaf) {
		trace_xfs_attr_leaf_add_old(state->args);
D
Dave Chinner 已提交
1227
		error = xfs_attr3_leaf_add(oldblk->bp, state->args);
1228 1229
	} else {
		trace_xfs_attr_leaf_add_new(state->args);
D
Dave Chinner 已提交
1230
		error = xfs_attr3_leaf_add(newblk->bp, state->args);
1231
	}
L
Linus Torvalds 已提交
1232 1233 1234 1235 1236 1237

	/*
	 * Update last hashval in each block since we added the name.
	 */
	oldblk->hashval = xfs_attr_leaf_lasthash(oldblk->bp, NULL);
	newblk->hashval = xfs_attr_leaf_lasthash(newblk->bp, NULL);
E
Eric Sandeen 已提交
1238
	return error;
L
Linus Torvalds 已提交
1239 1240 1241 1242 1243 1244
}

/*
 * Add a name to the leaf attribute list structure.
 */
int
D
Dave Chinner 已提交
1245
xfs_attr3_leaf_add(
1246 1247
	struct xfs_buf		*bp,
	struct xfs_da_args	*args)
L
Linus Torvalds 已提交
1248
{
D
Dave Chinner 已提交
1249 1250 1251 1252 1253 1254 1255
	struct xfs_attr_leafblock *leaf;
	struct xfs_attr3_icleaf_hdr ichdr;
	int			tablesize;
	int			entsize;
	int			sum;
	int			tmp;
	int			i;
L
Linus Torvalds 已提交
1256

1257 1258
	trace_xfs_attr_leaf_add(args);

1259
	leaf = bp->b_addr;
1260
	xfs_attr3_leaf_hdr_from_disk(args->geo, &ichdr, leaf);
D
Dave Chinner 已提交
1261
	ASSERT(args->index >= 0 && args->index <= ichdr.count);
1262
	entsize = xfs_attr_leaf_newentsize(args, NULL);
L
Linus Torvalds 已提交
1263 1264 1265 1266 1267

	/*
	 * Search through freemap for first-fit on new name length.
	 * (may need to figure in size of entry struct too)
	 */
D
Dave Chinner 已提交
1268 1269 1270 1271 1272
	tablesize = (ichdr.count + 1) * sizeof(xfs_attr_leaf_entry_t)
					+ xfs_attr3_leaf_hdr_size(leaf);
	for (sum = 0, i = XFS_ATTR_LEAF_MAPSIZE - 1; i >= 0; i--) {
		if (tablesize > ichdr.firstused) {
			sum += ichdr.freemap[i].size;
L
Linus Torvalds 已提交
1273 1274
			continue;
		}
D
Dave Chinner 已提交
1275
		if (!ichdr.freemap[i].size)
L
Linus Torvalds 已提交
1276 1277
			continue;	/* no space in this map */
		tmp = entsize;
D
Dave Chinner 已提交
1278
		if (ichdr.freemap[i].base < ichdr.firstused)
L
Linus Torvalds 已提交
1279
			tmp += sizeof(xfs_attr_leaf_entry_t);
D
Dave Chinner 已提交
1280 1281 1282
		if (ichdr.freemap[i].size >= tmp) {
			tmp = xfs_attr3_leaf_add_work(bp, &ichdr, args, i);
			goto out_log_hdr;
L
Linus Torvalds 已提交
1283
		}
D
Dave Chinner 已提交
1284
		sum += ichdr.freemap[i].size;
L
Linus Torvalds 已提交
1285 1286 1287 1288 1289 1290 1291
	}

	/*
	 * If there are no holes in the address space of the block,
	 * and we don't have enough freespace, then compaction will do us
	 * no good and we should just give up.
	 */
D
Dave Chinner 已提交
1292
	if (!ichdr.holes && sum < entsize)
D
Dave Chinner 已提交
1293
		return -ENOSPC;
L
Linus Torvalds 已提交
1294 1295 1296 1297 1298

	/*
	 * Compact the entries to coalesce free space.
	 * This may change the hdr->count via dropping INCOMPLETE entries.
	 */
D
Dave Chinner 已提交
1299
	xfs_attr3_leaf_compact(args, &ichdr, bp);
L
Linus Torvalds 已提交
1300 1301 1302 1303 1304

	/*
	 * After compaction, the block is guaranteed to have only one
	 * free region, in freemap[0].  If it is not big enough, give up.
	 */
D
Dave Chinner 已提交
1305
	if (ichdr.freemap[0].size < (entsize + sizeof(xfs_attr_leaf_entry_t))) {
D
Dave Chinner 已提交
1306
		tmp = -ENOSPC;
D
Dave Chinner 已提交
1307 1308 1309 1310
		goto out_log_hdr;
	}

	tmp = xfs_attr3_leaf_add_work(bp, &ichdr, args, 0);
L
Linus Torvalds 已提交
1311

D
Dave Chinner 已提交
1312
out_log_hdr:
1313
	xfs_attr3_leaf_hdr_to_disk(args->geo, leaf, &ichdr);
D
Dave Chinner 已提交
1314 1315 1316 1317
	xfs_trans_log_buf(args->trans, bp,
		XFS_DA_LOGRANGE(leaf, &leaf->hdr,
				xfs_attr3_leaf_hdr_size(leaf)));
	return tmp;
L
Linus Torvalds 已提交
1318 1319 1320 1321 1322 1323
}

/*
 * Add a name to a leaf attribute list structure.
 */
STATIC int
D
Dave Chinner 已提交
1324 1325 1326 1327 1328
xfs_attr3_leaf_add_work(
	struct xfs_buf		*bp,
	struct xfs_attr3_icleaf_hdr *ichdr,
	struct xfs_da_args	*args,
	int			mapindex)
L
Linus Torvalds 已提交
1329
{
D
Dave Chinner 已提交
1330 1331 1332 1333 1334 1335 1336
	struct xfs_attr_leafblock *leaf;
	struct xfs_attr_leaf_entry *entry;
	struct xfs_attr_leaf_name_local *name_loc;
	struct xfs_attr_leaf_name_remote *name_rmt;
	struct xfs_mount	*mp;
	int			tmp;
	int			i;
L
Linus Torvalds 已提交
1337

1338 1339
	trace_xfs_attr_leaf_add_work(args);

1340
	leaf = bp->b_addr;
D
Dave Chinner 已提交
1341 1342
	ASSERT(mapindex >= 0 && mapindex < XFS_ATTR_LEAF_MAPSIZE);
	ASSERT(args->index >= 0 && args->index <= ichdr->count);
L
Linus Torvalds 已提交
1343 1344 1345 1346

	/*
	 * Force open some space in the entry array and fill it in.
	 */
D
Dave Chinner 已提交
1347 1348 1349
	entry = &xfs_attr3_leaf_entryp(leaf)[args->index];
	if (args->index < ichdr->count) {
		tmp  = ichdr->count - args->index;
L
Linus Torvalds 已提交
1350
		tmp *= sizeof(xfs_attr_leaf_entry_t);
D
Dave Chinner 已提交
1351
		memmove(entry + 1, entry, tmp);
1352
		xfs_trans_log_buf(args->trans, bp,
L
Linus Torvalds 已提交
1353 1354
		    XFS_DA_LOGRANGE(leaf, entry, tmp + sizeof(*entry)));
	}
D
Dave Chinner 已提交
1355
	ichdr->count++;
L
Linus Torvalds 已提交
1356 1357 1358 1359 1360

	/*
	 * Allocate space for the new string (at the end of the run).
	 */
	mp = args->trans->t_mountp;
1361
	ASSERT(ichdr->freemap[mapindex].base < args->geo->blksize);
D
Dave Chinner 已提交
1362 1363
	ASSERT((ichdr->freemap[mapindex].base & 0x3) == 0);
	ASSERT(ichdr->freemap[mapindex].size >=
1364
		xfs_attr_leaf_newentsize(args, NULL));
1365
	ASSERT(ichdr->freemap[mapindex].size < args->geo->blksize);
D
Dave Chinner 已提交
1366 1367
	ASSERT((ichdr->freemap[mapindex].size & 0x3) == 0);

1368
	ichdr->freemap[mapindex].size -= xfs_attr_leaf_newentsize(args, &tmp);
D
Dave Chinner 已提交
1369 1370 1371

	entry->nameidx = cpu_to_be16(ichdr->freemap[mapindex].base +
				     ichdr->freemap[mapindex].size);
1372
	entry->hashval = cpu_to_be32(args->hashval);
L
Linus Torvalds 已提交
1373
	entry->flags = tmp ? XFS_ATTR_LOCAL : 0;
1374
	entry->flags |= XFS_ATTR_NSP_ARGS_TO_ONDISK(args->flags);
1375
	if (args->op_flags & XFS_DA_OP_RENAME) {
L
Linus Torvalds 已提交
1376 1377 1378 1379 1380 1381
		entry->flags |= XFS_ATTR_INCOMPLETE;
		if ((args->blkno2 == args->blkno) &&
		    (args->index2 <= args->index)) {
			args->index2++;
		}
	}
1382
	xfs_trans_log_buf(args->trans, bp,
L
Linus Torvalds 已提交
1383
			  XFS_DA_LOGRANGE(leaf, entry, sizeof(*entry)));
1384 1385
	ASSERT((args->index == 0) ||
	       (be32_to_cpu(entry->hashval) >= be32_to_cpu((entry-1)->hashval)));
D
Dave Chinner 已提交
1386
	ASSERT((args->index == ichdr->count - 1) ||
1387
	       (be32_to_cpu(entry->hashval) <= be32_to_cpu((entry+1)->hashval)));
L
Linus Torvalds 已提交
1388 1389 1390 1391 1392 1393 1394 1395 1396

	/*
	 * For "remote" attribute values, simply note that we need to
	 * allocate space for the "remote" value.  We can't actually
	 * allocate the extents in this transaction, and we can't decide
	 * which blocks they should be as we might allocate more blocks
	 * as part of this transaction (a split operation for example).
	 */
	if (entry->flags & XFS_ATTR_LOCAL) {
D
Dave Chinner 已提交
1397
		name_loc = xfs_attr3_leaf_name_local(leaf, args->index);
L
Linus Torvalds 已提交
1398
		name_loc->namelen = args->namelen;
1399
		name_loc->valuelen = cpu_to_be16(args->valuelen);
L
Linus Torvalds 已提交
1400 1401
		memcpy((char *)name_loc->nameval, args->name, args->namelen);
		memcpy((char *)&name_loc->nameval[args->namelen], args->value,
1402
				   be16_to_cpu(name_loc->valuelen));
L
Linus Torvalds 已提交
1403
	} else {
D
Dave Chinner 已提交
1404
		name_rmt = xfs_attr3_leaf_name_remote(leaf, args->index);
L
Linus Torvalds 已提交
1405 1406 1407 1408 1409 1410 1411
		name_rmt->namelen = args->namelen;
		memcpy((char *)name_rmt->name, args->name, args->namelen);
		entry->flags |= XFS_ATTR_INCOMPLETE;
		/* just in case */
		name_rmt->valuelen = 0;
		name_rmt->valueblk = 0;
		args->rmtblkno = 1;
D
Dave Chinner 已提交
1412
		args->rmtblkcnt = xfs_attr3_rmt_blocks(mp, args->valuelen);
1413
		args->rmtvaluelen = args->valuelen;
L
Linus Torvalds 已提交
1414
	}
1415
	xfs_trans_log_buf(args->trans, bp,
D
Dave Chinner 已提交
1416
	     XFS_DA_LOGRANGE(leaf, xfs_attr3_leaf_name(leaf, args->index),
L
Linus Torvalds 已提交
1417 1418 1419 1420 1421
				   xfs_attr_leaf_entsize(leaf, args->index)));

	/*
	 * Update the control info for this leaf node
	 */
D
Dave Chinner 已提交
1422 1423 1424 1425 1426 1427 1428 1429 1430 1431 1432 1433
	if (be16_to_cpu(entry->nameidx) < ichdr->firstused)
		ichdr->firstused = be16_to_cpu(entry->nameidx);

	ASSERT(ichdr->firstused >= ichdr->count * sizeof(xfs_attr_leaf_entry_t)
					+ xfs_attr3_leaf_hdr_size(leaf));
	tmp = (ichdr->count - 1) * sizeof(xfs_attr_leaf_entry_t)
					+ xfs_attr3_leaf_hdr_size(leaf);

	for (i = 0; i < XFS_ATTR_LEAF_MAPSIZE; i++) {
		if (ichdr->freemap[i].base == tmp) {
			ichdr->freemap[i].base += sizeof(xfs_attr_leaf_entry_t);
			ichdr->freemap[i].size -= sizeof(xfs_attr_leaf_entry_t);
L
Linus Torvalds 已提交
1434 1435
		}
	}
D
Dave Chinner 已提交
1436 1437
	ichdr->usedbytes += xfs_attr_leaf_entsize(leaf, args->index);
	return 0;
L
Linus Torvalds 已提交
1438 1439 1440 1441 1442 1443
}

/*
 * Garbage collect a leaf attribute list block by copying it to a new buffer.
 */
STATIC void
D
Dave Chinner 已提交
1444
xfs_attr3_leaf_compact(
1445
	struct xfs_da_args	*args,
1446
	struct xfs_attr3_icleaf_hdr *ichdr_dst,
1447
	struct xfs_buf		*bp)
L
Linus Torvalds 已提交
1448
{
1449 1450 1451
	struct xfs_attr_leafblock *leaf_src;
	struct xfs_attr_leafblock *leaf_dst;
	struct xfs_attr3_icleaf_hdr ichdr_src;
1452 1453 1454 1455
	struct xfs_trans	*trans = args->trans;
	char			*tmpbuffer;

	trace_xfs_attr_leaf_compact(args);
L
Linus Torvalds 已提交
1456

1457 1458 1459
	tmpbuffer = kmem_alloc(args->geo->blksize, KM_SLEEP);
	memcpy(tmpbuffer, bp->b_addr, args->geo->blksize);
	memset(bp->b_addr, 0, args->geo->blksize);
1460 1461
	leaf_src = (xfs_attr_leafblock_t *)tmpbuffer;
	leaf_dst = bp->b_addr;
L
Linus Torvalds 已提交
1462 1463

	/*
1464 1465 1466
	 * Copy the on-disk header back into the destination buffer to ensure
	 * all the information in the header that is not part of the incore
	 * header structure is preserved.
L
Linus Torvalds 已提交
1467
	 */
1468 1469 1470 1471
	memcpy(bp->b_addr, tmpbuffer, xfs_attr3_leaf_hdr_size(leaf_src));

	/* Initialise the incore headers */
	ichdr_src = *ichdr_dst;	/* struct copy */
1472
	ichdr_dst->firstused = args->geo->blksize;
1473 1474 1475 1476 1477 1478 1479 1480
	ichdr_dst->usedbytes = 0;
	ichdr_dst->count = 0;
	ichdr_dst->holes = 0;
	ichdr_dst->freemap[0].base = xfs_attr3_leaf_hdr_size(leaf_src);
	ichdr_dst->freemap[0].size = ichdr_dst->firstused -
						ichdr_dst->freemap[0].base;

	/* write the header back to initialise the underlying buffer */
1481
	xfs_attr3_leaf_hdr_to_disk(args->geo, leaf_dst, ichdr_dst);
L
Linus Torvalds 已提交
1482 1483 1484 1485 1486

	/*
	 * Copy all entry's in the same (sorted) order,
	 * but allocate name/value pairs packed and in sequence.
	 */
1487 1488
	xfs_attr3_leaf_moveents(args, leaf_src, &ichdr_src, 0,
				leaf_dst, ichdr_dst, 0, ichdr_src.count);
D
Dave Chinner 已提交
1489 1490 1491 1492
	/*
	 * this logs the entire buffer, but the caller must write the header
	 * back to the buffer when it is finished modifying it.
	 */
1493
	xfs_trans_log_buf(trans, bp, 0, args->geo->blksize - 1);
L
Linus Torvalds 已提交
1494

1495
	kmem_free(tmpbuffer);
L
Linus Torvalds 已提交
1496 1497
}

D
Dave Chinner 已提交
1498 1499 1500 1501 1502 1503 1504 1505 1506 1507 1508 1509 1510 1511 1512 1513 1514 1515 1516 1517 1518 1519 1520 1521 1522 1523 1524 1525 1526 1527 1528 1529 1530
/*
 * Compare the "order" of two leaf blocks.
 *
 * Returns 1 if both leaves hold entries and either the first or the last
 * hash value of leaf2 is smaller than the corresponding hash value of
 * leaf1, i.e. leaf2 should go before leaf1.  Returns 0 otherwise.
 */
static int
xfs_attr3_leaf_order(
	struct xfs_buf	*leaf1_bp,
	struct xfs_attr3_icleaf_hdr *leaf1hdr,
	struct xfs_buf	*leaf2_bp,
	struct xfs_attr3_icleaf_hdr *leaf2hdr)
{
	struct xfs_attr_leaf_entry *ents1 = xfs_attr3_leaf_entryp(leaf1_bp->b_addr);
	struct xfs_attr_leaf_entry *ents2 = xfs_attr3_leaf_entryp(leaf2_bp->b_addr);

	/* An empty leaf never forces a reordering. */
	if (!(leaf1hdr->count > 0 && leaf2hdr->count > 0))
		return 0;

	/* Compare the lowest hash values ... */
	if (be32_to_cpu(ents2[0].hashval) < be32_to_cpu(ents1[0].hashval))
		return 1;

	/* ... and then the highest ones. */
	if (be32_to_cpu(ents2[leaf2hdr->count - 1].hashval) <
	    be32_to_cpu(ents1[leaf1hdr->count - 1].hashval))
		return 1;

	return 0;
}

int
xfs_attr_leaf_order(
	struct xfs_buf	*leaf1_bp,
	struct xfs_buf	*leaf2_bp)
{
	struct xfs_attr3_icleaf_hdr ichdr1;
	struct xfs_attr3_icleaf_hdr ichdr2;
1531
	struct xfs_mount *mp = leaf1_bp->b_target->bt_mount;
D
Dave Chinner 已提交
1532

1533 1534
	xfs_attr3_leaf_hdr_from_disk(mp->m_attr_geo, &ichdr1, leaf1_bp->b_addr);
	xfs_attr3_leaf_hdr_from_disk(mp->m_attr_geo, &ichdr2, leaf2_bp->b_addr);
D
Dave Chinner 已提交
1535 1536 1537
	return xfs_attr3_leaf_order(leaf1_bp, &ichdr1, leaf2_bp, &ichdr2);
}

L
Linus Torvalds 已提交
1538 1539 1540 1541 1542 1543 1544 1545 1546 1547 1548 1549 1550
/*
 * Redistribute the attribute list entries between two leaf nodes,
 * taking into account the size of the new entry.
 *
 * NOTE: if new block is empty, then it will get the upper half of the
 * old block.  At present, all (one) callers pass in an empty second block.
 *
 * This code adjusts the args->index/blkno and args->index2/blkno2 fields
 * to match what it is doing in splitting the attribute leaf block.  Those
 * values are used in "atomic rename" operations on attributes.  Note that
 * the "new" and "old" values can end up in different blocks.
 */
STATIC void
D
Dave Chinner 已提交
1551 1552 1553 1554
xfs_attr3_leaf_rebalance(
	struct xfs_da_state	*state,
	struct xfs_da_state_blk	*blk1,
	struct xfs_da_state_blk	*blk2)
L
Linus Torvalds 已提交
1555
{
D
Dave Chinner 已提交
1556 1557 1558 1559 1560 1561 1562 1563 1564 1565 1566 1567
	struct xfs_da_args	*args;
	struct xfs_attr_leafblock *leaf1;
	struct xfs_attr_leafblock *leaf2;
	struct xfs_attr3_icleaf_hdr ichdr1;
	struct xfs_attr3_icleaf_hdr ichdr2;
	struct xfs_attr_leaf_entry *entries1;
	struct xfs_attr_leaf_entry *entries2;
	int			count;
	int			totallen;
	int			max;
	int			space;
	int			swap;
L
Linus Torvalds 已提交
1568 1569 1570 1571 1572 1573

	/*
	 * Set up environment.
	 */
	ASSERT(blk1->magic == XFS_ATTR_LEAF_MAGIC);
	ASSERT(blk2->magic == XFS_ATTR_LEAF_MAGIC);
1574 1575
	leaf1 = blk1->bp->b_addr;
	leaf2 = blk2->bp->b_addr;
1576 1577
	xfs_attr3_leaf_hdr_from_disk(state->args->geo, &ichdr1, leaf1);
	xfs_attr3_leaf_hdr_from_disk(state->args->geo, &ichdr2, leaf2);
D
Dave Chinner 已提交
1578
	ASSERT(ichdr2.count == 0);
L
Linus Torvalds 已提交
1579 1580
	args = state->args;

1581 1582
	trace_xfs_attr_leaf_rebalance(args);

L
Linus Torvalds 已提交
1583 1584 1585 1586 1587 1588 1589
	/*
	 * Check ordering of blocks, reverse if it makes things simpler.
	 *
	 * NOTE: Given that all (current) callers pass in an empty
	 * second block, this code should never set "swap".
	 */
	swap = 0;
D
Dave Chinner 已提交
1590
	if (xfs_attr3_leaf_order(blk1->bp, &ichdr1, blk2->bp, &ichdr2)) {
1591
		swap(blk1, blk2);
D
Dave Chinner 已提交
1592

1593 1594
		/* swap structures rather than reconverting them */
		swap(ichdr1, ichdr2);
D
Dave Chinner 已提交
1595

1596 1597
		leaf1 = blk1->bp->b_addr;
		leaf2 = blk2->bp->b_addr;
L
Linus Torvalds 已提交
1598 1599 1600 1601 1602 1603 1604 1605 1606 1607 1608
		swap = 1;
	}

	/*
	 * Examine entries until we reduce the absolute difference in
	 * byte usage between the two blocks to a minimum.  Then get
	 * the direction to copy and the number of elements to move.
	 *
	 * "inleaf" is true if the new entry should be inserted into blk1.
	 * If "swap" is also true, then reverse the sense of "inleaf".
	 */
D
Dave Chinner 已提交
1609 1610 1611
	state->inleaf = xfs_attr3_leaf_figure_balance(state, blk1, &ichdr1,
						      blk2, &ichdr2,
						      &count, &totallen);
L
Linus Torvalds 已提交
1612 1613 1614 1615 1616 1617
	if (swap)
		state->inleaf = !state->inleaf;

	/*
	 * Move any entries required from leaf to leaf:
	 */
D
Dave Chinner 已提交
1618
	if (count < ichdr1.count) {
L
Linus Torvalds 已提交
1619 1620 1621 1622
		/*
		 * Figure the total bytes to be added to the destination leaf.
		 */
		/* number entries being moved */
D
Dave Chinner 已提交
1623 1624
		count = ichdr1.count - count;
		space  = ichdr1.usedbytes - totallen;
L
Linus Torvalds 已提交
1625 1626 1627 1628 1629
		space += count * sizeof(xfs_attr_leaf_entry_t);

		/*
		 * leaf2 is the destination, compact it if it looks tight.
		 */
D
Dave Chinner 已提交
1630 1631
		max  = ichdr2.firstused - xfs_attr3_leaf_hdr_size(leaf1);
		max -= ichdr2.count * sizeof(xfs_attr_leaf_entry_t);
1632
		if (space > max)
D
Dave Chinner 已提交
1633
			xfs_attr3_leaf_compact(args, &ichdr2, blk2->bp);
L
Linus Torvalds 已提交
1634 1635 1636 1637

		/*
		 * Move high entries from leaf1 to low end of leaf2.
		 */
1638 1639
		xfs_attr3_leaf_moveents(args, leaf1, &ichdr1,
				ichdr1.count - count, leaf2, &ichdr2, 0, count);
L
Linus Torvalds 已提交
1640

D
Dave Chinner 已提交
1641
	} else if (count > ichdr1.count) {
L
Linus Torvalds 已提交
1642 1643 1644 1645
		/*
		 * I assert that since all callers pass in an empty
		 * second buffer, this code should never execute.
		 */
1646
		ASSERT(0);
L
Linus Torvalds 已提交
1647 1648 1649 1650 1651

		/*
		 * Figure the total bytes to be added to the destination leaf.
		 */
		/* number entries being moved */
D
Dave Chinner 已提交
1652 1653
		count -= ichdr1.count;
		space  = totallen - ichdr1.usedbytes;
L
Linus Torvalds 已提交
1654 1655 1656 1657 1658
		space += count * sizeof(xfs_attr_leaf_entry_t);

		/*
		 * leaf1 is the destination, compact it if it looks tight.
		 */
D
Dave Chinner 已提交
1659 1660
		max  = ichdr1.firstused - xfs_attr3_leaf_hdr_size(leaf1);
		max -= ichdr1.count * sizeof(xfs_attr_leaf_entry_t);
1661
		if (space > max)
D
Dave Chinner 已提交
1662
			xfs_attr3_leaf_compact(args, &ichdr1, blk1->bp);
L
Linus Torvalds 已提交
1663 1664 1665 1666

		/*
		 * Move low entries from leaf2 to high end of leaf1.
		 */
1667 1668
		xfs_attr3_leaf_moveents(args, leaf2, &ichdr2, 0, leaf1, &ichdr1,
					ichdr1.count, count);
L
Linus Torvalds 已提交
1669 1670
	}

1671 1672
	xfs_attr3_leaf_hdr_to_disk(state->args->geo, leaf1, &ichdr1);
	xfs_attr3_leaf_hdr_to_disk(state->args->geo, leaf2, &ichdr2);
1673 1674
	xfs_trans_log_buf(args->trans, blk1->bp, 0, args->geo->blksize - 1);
	xfs_trans_log_buf(args->trans, blk2->bp, 0, args->geo->blksize - 1);
D
Dave Chinner 已提交
1675

L
Linus Torvalds 已提交
1676 1677 1678
	/*
	 * Copy out last hashval in each block for B-tree code.
	 */
D
Dave Chinner 已提交
1679 1680 1681 1682
	entries1 = xfs_attr3_leaf_entryp(leaf1);
	entries2 = xfs_attr3_leaf_entryp(leaf2);
	blk1->hashval = be32_to_cpu(entries1[ichdr1.count - 1].hashval);
	blk2->hashval = be32_to_cpu(entries2[ichdr2.count - 1].hashval);
L
Linus Torvalds 已提交
1683 1684 1685 1686 1687 1688 1689 1690 1691 1692 1693 1694 1695

	/*
	 * Adjust the expected index for insertion.
	 * NOTE: this code depends on the (current) situation that the
	 * second block was originally empty.
	 *
	 * If the insertion point moved to the 2nd block, we must adjust
	 * the index.  We must also track the entry just following the
	 * new entry for use in an "atomic rename" operation, that entry
	 * is always the "old" entry and the "new" entry is what we are
	 * inserting.  The index/blkno fields refer to the "old" entry,
	 * while the index2/blkno2 fields refer to the "new" entry.
	 */
D
Dave Chinner 已提交
1696
	if (blk1->index > ichdr1.count) {
L
Linus Torvalds 已提交
1697
		ASSERT(state->inleaf == 0);
D
Dave Chinner 已提交
1698
		blk2->index = blk1->index - ichdr1.count;
L
Linus Torvalds 已提交
1699 1700
		args->index = args->index2 = blk2->index;
		args->blkno = args->blkno2 = blk2->blkno;
D
Dave Chinner 已提交
1701
	} else if (blk1->index == ichdr1.count) {
L
Linus Torvalds 已提交
1702 1703 1704 1705 1706 1707
		if (state->inleaf) {
			args->index = blk1->index;
			args->blkno = blk1->blkno;
			args->index2 = 0;
			args->blkno2 = blk2->blkno;
		} else {
1708 1709 1710 1711 1712
			/*
			 * On a double leaf split, the original attr location
			 * is already stored in blkno2/index2, so don't
			 * overwrite it overwise we corrupt the tree.
			 */
D
Dave Chinner 已提交
1713
			blk2->index = blk1->index - ichdr1.count;
1714 1715 1716 1717 1718 1719 1720 1721 1722 1723 1724
			args->index = blk2->index;
			args->blkno = blk2->blkno;
			if (!state->extravalid) {
				/*
				 * set the new attr location to match the old
				 * one and let the higher level split code
				 * decide where in the leaf to place it.
				 */
				args->index2 = blk2->index;
				args->blkno2 = blk2->blkno;
			}
L
Linus Torvalds 已提交
1725 1726 1727 1728 1729 1730 1731 1732 1733 1734 1735 1736 1737 1738 1739 1740
		}
	} else {
		ASSERT(state->inleaf == 1);
		args->index = args->index2 = blk1->index;
		args->blkno = args->blkno2 = blk1->blkno;
	}
}

/*
 * Examine entries until we reduce the absolute difference in
 * byte usage between the two blocks to a minimum.
 * GROT: Is this really necessary?  With other than a 512 byte blocksize,
 * GROT: there will always be enough room in either block for a new entry.
 * GROT: Do a double-split for this case?
 */
STATIC int
D
Dave Chinner 已提交
1741 1742 1743 1744 1745 1746 1747 1748
xfs_attr3_leaf_figure_balance(
	struct xfs_da_state		*state,
	struct xfs_da_state_blk		*blk1,
	struct xfs_attr3_icleaf_hdr	*ichdr1,
	struct xfs_da_state_blk		*blk2,
	struct xfs_attr3_icleaf_hdr	*ichdr2,
	int				*countarg,
	int				*usedbytesarg)
L
Linus Torvalds 已提交
1749
{
D
Dave Chinner 已提交
1750 1751 1752 1753 1754 1755 1756 1757 1758 1759 1760
	struct xfs_attr_leafblock	*leaf1 = blk1->bp->b_addr;
	struct xfs_attr_leafblock	*leaf2 = blk2->bp->b_addr;
	struct xfs_attr_leaf_entry	*entry;
	int				count;
	int				max;
	int				index;
	int				totallen = 0;
	int				half;
	int				lastdelta;
	int				foundit = 0;
	int				tmp;
L
Linus Torvalds 已提交
1761 1762 1763 1764 1765

	/*
	 * Examine entries until we reduce the absolute difference in
	 * byte usage between the two blocks to a minimum.
	 */
D
Dave Chinner 已提交
1766 1767 1768
	max = ichdr1->count + ichdr2->count;
	half = (max + 1) * sizeof(*entry);
	half += ichdr1->usedbytes + ichdr2->usedbytes +
1769
			xfs_attr_leaf_newentsize(state->args, NULL);
L
Linus Torvalds 已提交
1770
	half /= 2;
1771
	lastdelta = state->args->geo->blksize;
D
Dave Chinner 已提交
1772
	entry = xfs_attr3_leaf_entryp(leaf1);
L
Linus Torvalds 已提交
1773 1774 1775 1776 1777 1778 1779 1780
	for (count = index = 0; count < max; entry++, index++, count++) {

#define XFS_ATTR_ABS(A)	(((A) < 0) ? -(A) : (A))
		/*
		 * The new entry is in the first block, account for it.
		 */
		if (count == blk1->index) {
			tmp = totallen + sizeof(*entry) +
1781
				xfs_attr_leaf_newentsize(state->args, NULL);
L
Linus Torvalds 已提交
1782 1783 1784 1785 1786 1787 1788 1789 1790 1791
			if (XFS_ATTR_ABS(half - tmp) > lastdelta)
				break;
			lastdelta = XFS_ATTR_ABS(half - tmp);
			totallen = tmp;
			foundit = 1;
		}

		/*
		 * Wrap around into the second block if necessary.
		 */
D
Dave Chinner 已提交
1792
		if (count == ichdr1->count) {
L
Linus Torvalds 已提交
1793
			leaf1 = leaf2;
D
Dave Chinner 已提交
1794
			entry = xfs_attr3_leaf_entryp(leaf1);
L
Linus Torvalds 已提交
1795 1796 1797 1798 1799 1800 1801 1802 1803 1804 1805 1806 1807 1808 1809 1810 1811 1812 1813 1814 1815 1816
			index = 0;
		}

		/*
		 * Figure out if next leaf entry would be too much.
		 */
		tmp = totallen + sizeof(*entry) + xfs_attr_leaf_entsize(leaf1,
									index);
		if (XFS_ATTR_ABS(half - tmp) > lastdelta)
			break;
		lastdelta = XFS_ATTR_ABS(half - tmp);
		totallen = tmp;
#undef XFS_ATTR_ABS
	}

	/*
	 * Calculate the number of usedbytes that will end up in lower block.
	 * If new entry not in lower block, fix up the count.
	 */
	totallen -= count * sizeof(*entry);
	if (foundit) {
		totallen -= sizeof(*entry) +
1817
				xfs_attr_leaf_newentsize(state->args, NULL);
L
Linus Torvalds 已提交
1818 1819 1820 1821
	}

	*countarg = count;
	*usedbytesarg = totallen;
D
Dave Chinner 已提交
1822
	return foundit;
L
Linus Torvalds 已提交
1823 1824 1825 1826 1827 1828 1829 1830 1831 1832 1833 1834 1835 1836 1837 1838 1839 1840
}

/*========================================================================
 * Routines used for shrinking the Btree.
 *========================================================================*/

/*
 * Check a leaf block and its neighbors to see if the block should be
 * collapsed into one or the other neighbor.  Always keep the block
 * with the smaller block number.
 * If the current block is over 50% full, don't try to join it, return 0.
 * If the block is empty, fill in the state structure and return 2.
 * If it can be collapsed, fill in the state structure and return 1.
 * If nothing can be done, return 0.
 *
 * GROT: allow for INCOMPLETE entries in calculation.
 */
int
D
Dave Chinner 已提交
1841 1842 1843
xfs_attr3_leaf_toosmall(
	struct xfs_da_state	*state,
	int			*action)
L
Linus Torvalds 已提交
1844
{
D
Dave Chinner 已提交
1845 1846 1847 1848 1849 1850 1851 1852 1853 1854
	struct xfs_attr_leafblock *leaf;
	struct xfs_da_state_blk	*blk;
	struct xfs_attr3_icleaf_hdr ichdr;
	struct xfs_buf		*bp;
	xfs_dablk_t		blkno;
	int			bytes;
	int			forward;
	int			error;
	int			retval;
	int			i;
L
Linus Torvalds 已提交
1855

1856 1857
	trace_xfs_attr_leaf_toosmall(state->args);

L
Linus Torvalds 已提交
1858 1859 1860 1861 1862 1863
	/*
	 * Check for the degenerate case of the block being over 50% full.
	 * If so, it's not worth even looking to see if we might be able
	 * to coalesce with a sibling.
	 */
	blk = &state->path.blk[ state->path.active-1 ];
D
Dave Chinner 已提交
1864
	leaf = blk->bp->b_addr;
1865
	xfs_attr3_leaf_hdr_from_disk(state->args->geo, &ichdr, leaf);
D
Dave Chinner 已提交
1866 1867 1868
	bytes = xfs_attr3_leaf_hdr_size(leaf) +
		ichdr.count * sizeof(xfs_attr_leaf_entry_t) +
		ichdr.usedbytes;
1869
	if (bytes > (state->args->geo->blksize >> 1)) {
L
Linus Torvalds 已提交
1870
		*action = 0;	/* blk over 50%, don't try to join */
E
Eric Sandeen 已提交
1871
		return 0;
L
Linus Torvalds 已提交
1872 1873 1874 1875 1876
	}

	/*
	 * Check for the degenerate case of the block being empty.
	 * If the block is empty, we'll simply delete it, no need to
1877
	 * coalesce it with a sibling block.  We choose (arbitrarily)
L
Linus Torvalds 已提交
1878 1879
	 * to merge with the forward block unless it is NULL.
	 */
D
Dave Chinner 已提交
1880
	if (ichdr.count == 0) {
L
Linus Torvalds 已提交
1881 1882 1883 1884
		/*
		 * Make altpath point to the block we want to keep and
		 * path point to the block we want to drop (this one).
		 */
D
Dave Chinner 已提交
1885
		forward = (ichdr.forw != 0);
L
Linus Torvalds 已提交
1886
		memcpy(&state->altpath, &state->path, sizeof(state->path));
1887
		error = xfs_da3_path_shift(state, &state->altpath, forward,
L
Linus Torvalds 已提交
1888 1889
						 0, &retval);
		if (error)
E
Eric Sandeen 已提交
1890
			return error;
L
Linus Torvalds 已提交
1891 1892 1893 1894 1895
		if (retval) {
			*action = 0;
		} else {
			*action = 2;
		}
D
Dave Chinner 已提交
1896
		return 0;
L
Linus Torvalds 已提交
1897 1898 1899 1900 1901 1902 1903 1904 1905 1906
	}

	/*
	 * Examine each sibling block to see if we can coalesce with
	 * at least 25% free space to spare.  We need to figure out
	 * whether to merge with the forward or the backward block.
	 * We prefer coalescing with the lower numbered sibling so as
	 * to shrink an attribute list over time.
	 */
	/* start with smaller blk num */
D
Dave Chinner 已提交
1907
	forward = ichdr.forw < ichdr.back;
L
Linus Torvalds 已提交
1908
	for (i = 0; i < 2; forward = !forward, i++) {
D
Dave Chinner 已提交
1909
		struct xfs_attr3_icleaf_hdr ichdr2;
L
Linus Torvalds 已提交
1910
		if (forward)
D
Dave Chinner 已提交
1911
			blkno = ichdr.forw;
L
Linus Torvalds 已提交
1912
		else
D
Dave Chinner 已提交
1913
			blkno = ichdr.back;
L
Linus Torvalds 已提交
1914 1915
		if (blkno == 0)
			continue;
D
Dave Chinner 已提交
1916
		error = xfs_attr3_leaf_read(state->args->trans, state->args->dp,
1917
					blkno, -1, &bp);
L
Linus Torvalds 已提交
1918
		if (error)
E
Eric Sandeen 已提交
1919
			return error;
L
Linus Torvalds 已提交
1920

1921
		xfs_attr3_leaf_hdr_from_disk(state->args->geo, &ichdr2, bp->b_addr);
D
Dave Chinner 已提交
1922

1923 1924
		bytes = state->args->geo->blksize -
			(state->args->geo->blksize >> 2) -
D
Dave Chinner 已提交
1925 1926 1927 1928 1929
			ichdr.usedbytes - ichdr2.usedbytes -
			((ichdr.count + ichdr2.count) *
					sizeof(xfs_attr_leaf_entry_t)) -
			xfs_attr3_leaf_hdr_size(leaf);

1930
		xfs_trans_brelse(state->args->trans, bp);
L
Linus Torvalds 已提交
1931 1932 1933 1934 1935
		if (bytes >= 0)
			break;	/* fits with at least 25% to spare */
	}
	if (i >= 2) {
		*action = 0;
E
Eric Sandeen 已提交
1936
		return 0;
L
Linus Torvalds 已提交
1937 1938 1939 1940 1941 1942 1943 1944
	}

	/*
	 * Make altpath point to the block we want to keep (the lower
	 * numbered block) and path point to the block we want to drop.
	 */
	memcpy(&state->altpath, &state->path, sizeof(state->path));
	if (blkno < blk->blkno) {
1945
		error = xfs_da3_path_shift(state, &state->altpath, forward,
L
Linus Torvalds 已提交
1946 1947
						 0, &retval);
	} else {
1948
		error = xfs_da3_path_shift(state, &state->path, forward,
L
Linus Torvalds 已提交
1949 1950 1951
						 0, &retval);
	}
	if (error)
E
Eric Sandeen 已提交
1952
		return error;
L
Linus Torvalds 已提交
1953 1954 1955 1956 1957
	if (retval) {
		*action = 0;
	} else {
		*action = 1;
	}
E
Eric Sandeen 已提交
1958
	return 0;
L
Linus Torvalds 已提交
1959 1960 1961 1962 1963 1964 1965 1966 1967
}

/*
 * Remove a name from the leaf attribute list structure.
 *
 * Return 1 if leaf is less than 37% full, 0 if >= 37% full.
 * If two leaves are 37% full, when combined they will leave 25% free.
 */
int
D
Dave Chinner 已提交
1968 1969 1970
xfs_attr3_leaf_remove(
	struct xfs_buf		*bp,
	struct xfs_da_args	*args)
L
Linus Torvalds 已提交
1971
{
D
Dave Chinner 已提交
1972 1973 1974 1975 1976 1977 1978 1979 1980 1981
	struct xfs_attr_leafblock *leaf;
	struct xfs_attr3_icleaf_hdr ichdr;
	struct xfs_attr_leaf_entry *entry;
	int			before;
	int			after;
	int			smallest;
	int			entsize;
	int			tablesize;
	int			tmp;
	int			i;
L
Linus Torvalds 已提交
1982

1983 1984
	trace_xfs_attr_leaf_remove(args);

1985
	leaf = bp->b_addr;
1986
	xfs_attr3_leaf_hdr_from_disk(args->geo, &ichdr, leaf);
D
Dave Chinner 已提交
1987

1988
	ASSERT(ichdr.count > 0 && ichdr.count < args->geo->blksize / 8);
D
Dave Chinner 已提交
1989 1990 1991 1992 1993 1994 1995
	ASSERT(args->index >= 0 && args->index < ichdr.count);
	ASSERT(ichdr.firstused >= ichdr.count * sizeof(*entry) +
					xfs_attr3_leaf_hdr_size(leaf));

	entry = &xfs_attr3_leaf_entryp(leaf)[args->index];

	ASSERT(be16_to_cpu(entry->nameidx) >= ichdr.firstused);
1996
	ASSERT(be16_to_cpu(entry->nameidx) < args->geo->blksize);
L
Linus Torvalds 已提交
1997 1998 1999 2000 2001 2002 2003

	/*
	 * Scan through free region table:
	 *    check for adjacency of free'd entry with an existing one,
	 *    find smallest free region in case we need to replace it,
	 *    adjust any map that borders the entry table,
	 */
D
Dave Chinner 已提交
2004 2005 2006
	tablesize = ichdr.count * sizeof(xfs_attr_leaf_entry_t)
					+ xfs_attr3_leaf_hdr_size(leaf);
	tmp = ichdr.freemap[0].size;
L
Linus Torvalds 已提交
2007 2008 2009
	before = after = -1;
	smallest = XFS_ATTR_LEAF_MAPSIZE - 1;
	entsize = xfs_attr_leaf_entsize(leaf, args->index);
D
Dave Chinner 已提交
2010
	for (i = 0; i < XFS_ATTR_LEAF_MAPSIZE; i++) {
2011 2012
		ASSERT(ichdr.freemap[i].base < args->geo->blksize);
		ASSERT(ichdr.freemap[i].size < args->geo->blksize);
D
Dave Chinner 已提交
2013 2014 2015
		if (ichdr.freemap[i].base == tablesize) {
			ichdr.freemap[i].base -= sizeof(xfs_attr_leaf_entry_t);
			ichdr.freemap[i].size += sizeof(xfs_attr_leaf_entry_t);
L
Linus Torvalds 已提交
2016 2017
		}

D
Dave Chinner 已提交
2018 2019
		if (ichdr.freemap[i].base + ichdr.freemap[i].size ==
				be16_to_cpu(entry->nameidx)) {
L
Linus Torvalds 已提交
2020
			before = i;
D
Dave Chinner 已提交
2021 2022
		} else if (ichdr.freemap[i].base ==
				(be16_to_cpu(entry->nameidx) + entsize)) {
L
Linus Torvalds 已提交
2023
			after = i;
D
Dave Chinner 已提交
2024 2025
		} else if (ichdr.freemap[i].size < tmp) {
			tmp = ichdr.freemap[i].size;
L
Linus Torvalds 已提交
2026 2027 2028 2029 2030 2031 2032 2033 2034 2035
			smallest = i;
		}
	}

	/*
	 * Coalesce adjacent freemap regions,
	 * or replace the smallest region.
	 */
	if ((before >= 0) || (after >= 0)) {
		if ((before >= 0) && (after >= 0)) {
D
Dave Chinner 已提交
2036 2037 2038 2039
			ichdr.freemap[before].size += entsize;
			ichdr.freemap[before].size += ichdr.freemap[after].size;
			ichdr.freemap[after].base = 0;
			ichdr.freemap[after].size = 0;
L
Linus Torvalds 已提交
2040
		} else if (before >= 0) {
D
Dave Chinner 已提交
2041
			ichdr.freemap[before].size += entsize;
L
Linus Torvalds 已提交
2042
		} else {
D
Dave Chinner 已提交
2043 2044
			ichdr.freemap[after].base = be16_to_cpu(entry->nameidx);
			ichdr.freemap[after].size += entsize;
L
Linus Torvalds 已提交
2045 2046 2047 2048 2049
		}
	} else {
		/*
		 * Replace smallest region (if it is smaller than free'd entry)
		 */
D
Dave Chinner 已提交
2050 2051 2052
		if (ichdr.freemap[smallest].size < entsize) {
			ichdr.freemap[smallest].base = be16_to_cpu(entry->nameidx);
			ichdr.freemap[smallest].size = entsize;
L
Linus Torvalds 已提交
2053 2054 2055 2056 2057 2058
		}
	}

	/*
	 * Did we remove the first entry?
	 */
D
Dave Chinner 已提交
2059
	if (be16_to_cpu(entry->nameidx) == ichdr.firstused)
L
Linus Torvalds 已提交
2060 2061 2062 2063 2064 2065 2066
		smallest = 1;
	else
		smallest = 0;

	/*
	 * Compress the remaining entries and zero out the removed stuff.
	 */
D
Dave Chinner 已提交
2067 2068
	memset(xfs_attr3_leaf_name(leaf, args->index), 0, entsize);
	ichdr.usedbytes -= entsize;
2069
	xfs_trans_log_buf(args->trans, bp,
D
Dave Chinner 已提交
2070
	     XFS_DA_LOGRANGE(leaf, xfs_attr3_leaf_name(leaf, args->index),
L
Linus Torvalds 已提交
2071 2072
				   entsize));

D
Dave Chinner 已提交
2073 2074 2075
	tmp = (ichdr.count - args->index) * sizeof(xfs_attr_leaf_entry_t);
	memmove(entry, entry + 1, tmp);
	ichdr.count--;
2076
	xfs_trans_log_buf(args->trans, bp,
D
Dave Chinner 已提交
2077 2078 2079 2080
	    XFS_DA_LOGRANGE(leaf, entry, tmp + sizeof(xfs_attr_leaf_entry_t)));

	entry = &xfs_attr3_leaf_entryp(leaf)[ichdr.count];
	memset(entry, 0, sizeof(xfs_attr_leaf_entry_t));
L
Linus Torvalds 已提交
2081 2082 2083 2084 2085 2086 2087 2088

	/*
	 * If we removed the first entry, re-find the first used byte
	 * in the name area.  Note that if the entry was the "firstused",
	 * then we don't have a "hole" in our block resulting from
	 * removing the name.
	 */
	if (smallest) {
2089
		tmp = args->geo->blksize;
D
Dave Chinner 已提交
2090 2091 2092
		entry = xfs_attr3_leaf_entryp(leaf);
		for (i = ichdr.count - 1; i >= 0; entry++, i--) {
			ASSERT(be16_to_cpu(entry->nameidx) >= ichdr.firstused);
2093
			ASSERT(be16_to_cpu(entry->nameidx) < args->geo->blksize);
2094 2095 2096

			if (be16_to_cpu(entry->nameidx) < tmp)
				tmp = be16_to_cpu(entry->nameidx);
L
Linus Torvalds 已提交
2097
		}
D
Dave Chinner 已提交
2098
		ichdr.firstused = tmp;
2099
		ASSERT(ichdr.firstused != 0);
L
Linus Torvalds 已提交
2100
	} else {
D
Dave Chinner 已提交
2101
		ichdr.holes = 1;	/* mark as needing compaction */
L
Linus Torvalds 已提交
2102
	}
2103
	xfs_attr3_leaf_hdr_to_disk(args->geo, leaf, &ichdr);
2104
	xfs_trans_log_buf(args->trans, bp,
D
Dave Chinner 已提交
2105 2106
			  XFS_DA_LOGRANGE(leaf, &leaf->hdr,
					  xfs_attr3_leaf_hdr_size(leaf)));
L
Linus Torvalds 已提交
2107 2108 2109 2110 2111

	/*
	 * Check if leaf is less than 50% full, caller may want to
	 * "join" the leaf with a sibling if so.
	 */
D
Dave Chinner 已提交
2112 2113 2114
	tmp = ichdr.usedbytes + xfs_attr3_leaf_hdr_size(leaf) +
	      ichdr.count * sizeof(xfs_attr_leaf_entry_t);

2115
	return tmp < args->geo->magicpct; /* leaf is < 37% full */
L
Linus Torvalds 已提交
2116 2117 2118 2119 2120 2121
}

/*
 * Move all the attribute list entries from drop_leaf into save_leaf.
 */
void
D
Dave Chinner 已提交
2122 2123 2124 2125
xfs_attr3_leaf_unbalance(
	struct xfs_da_state	*state,
	struct xfs_da_state_blk	*drop_blk,
	struct xfs_da_state_blk	*save_blk)
L
Linus Torvalds 已提交
2126
{
D
Dave Chinner 已提交
2127 2128 2129 2130 2131
	struct xfs_attr_leafblock *drop_leaf = drop_blk->bp->b_addr;
	struct xfs_attr_leafblock *save_leaf = save_blk->bp->b_addr;
	struct xfs_attr3_icleaf_hdr drophdr;
	struct xfs_attr3_icleaf_hdr savehdr;
	struct xfs_attr_leaf_entry *entry;
L
Linus Torvalds 已提交
2132

2133 2134
	trace_xfs_attr_leaf_unbalance(state->args);

2135 2136
	drop_leaf = drop_blk->bp->b_addr;
	save_leaf = save_blk->bp->b_addr;
2137 2138
	xfs_attr3_leaf_hdr_from_disk(state->args->geo, &drophdr, drop_leaf);
	xfs_attr3_leaf_hdr_from_disk(state->args->geo, &savehdr, save_leaf);
D
Dave Chinner 已提交
2139
	entry = xfs_attr3_leaf_entryp(drop_leaf);
L
Linus Torvalds 已提交
2140 2141 2142 2143

	/*
	 * Save last hashval from dying block for later Btree fixup.
	 */
D
Dave Chinner 已提交
2144
	drop_blk->hashval = be32_to_cpu(entry[drophdr.count - 1].hashval);
L
Linus Torvalds 已提交
2145 2146 2147 2148 2149 2150

	/*
	 * Check if we need a temp buffer, or can we do it in place.
	 * Note that we don't check "leaf" for holes because we will
	 * always be dropping it, toosmall() decided that for us already.
	 */
D
Dave Chinner 已提交
2151
	if (savehdr.holes == 0) {
L
Linus Torvalds 已提交
2152 2153 2154 2155
		/*
		 * dest leaf has no holes, so we add there.  May need
		 * to make some room in the entry array.
		 */
D
Dave Chinner 已提交
2156 2157
		if (xfs_attr3_leaf_order(save_blk->bp, &savehdr,
					 drop_blk->bp, &drophdr)) {
2158 2159
			xfs_attr3_leaf_moveents(state->args,
						drop_leaf, &drophdr, 0,
D
Dave Chinner 已提交
2160
						save_leaf, &savehdr, 0,
2161
						drophdr.count);
L
Linus Torvalds 已提交
2162
		} else {
2163 2164
			xfs_attr3_leaf_moveents(state->args,
						drop_leaf, &drophdr, 0,
D
Dave Chinner 已提交
2165
						save_leaf, &savehdr,
2166
						savehdr.count, drophdr.count);
L
Linus Torvalds 已提交
2167 2168 2169 2170 2171 2172
		}
	} else {
		/*
		 * Destination has holes, so we make a temporary copy
		 * of the leaf and add them both to that.
		 */
D
Dave Chinner 已提交
2173 2174 2175
		struct xfs_attr_leafblock *tmp_leaf;
		struct xfs_attr3_icleaf_hdr tmphdr;

2176
		tmp_leaf = kmem_zalloc(state->args->geo->blksize, KM_SLEEP);
2177 2178 2179 2180 2181 2182 2183

		/*
		 * Copy the header into the temp leaf so that all the stuff
		 * not in the incore header is present and gets copied back in
		 * once we've moved all the entries.
		 */
		memcpy(tmp_leaf, save_leaf, xfs_attr3_leaf_hdr_size(save_leaf));
D
Dave Chinner 已提交
2184

2185
		memset(&tmphdr, 0, sizeof(tmphdr));
D
Dave Chinner 已提交
2186 2187 2188
		tmphdr.magic = savehdr.magic;
		tmphdr.forw = savehdr.forw;
		tmphdr.back = savehdr.back;
2189
		tmphdr.firstused = state->args->geo->blksize;
2190 2191

		/* write the header to the temp buffer to initialise it */
2192
		xfs_attr3_leaf_hdr_to_disk(state->args->geo, tmp_leaf, &tmphdr);
2193

D
Dave Chinner 已提交
2194 2195
		if (xfs_attr3_leaf_order(save_blk->bp, &savehdr,
					 drop_blk->bp, &drophdr)) {
2196 2197
			xfs_attr3_leaf_moveents(state->args,
						drop_leaf, &drophdr, 0,
D
Dave Chinner 已提交
2198
						tmp_leaf, &tmphdr, 0,
2199 2200 2201
						drophdr.count);
			xfs_attr3_leaf_moveents(state->args,
						save_leaf, &savehdr, 0,
D
Dave Chinner 已提交
2202
						tmp_leaf, &tmphdr, tmphdr.count,
2203
						savehdr.count);
L
Linus Torvalds 已提交
2204
		} else {
2205 2206
			xfs_attr3_leaf_moveents(state->args,
						save_leaf, &savehdr, 0,
D
Dave Chinner 已提交
2207
						tmp_leaf, &tmphdr, 0,
2208 2209 2210
						savehdr.count);
			xfs_attr3_leaf_moveents(state->args,
						drop_leaf, &drophdr, 0,
D
Dave Chinner 已提交
2211
						tmp_leaf, &tmphdr, tmphdr.count,
2212
						drophdr.count);
L
Linus Torvalds 已提交
2213
		}
2214
		memcpy(save_leaf, tmp_leaf, state->args->geo->blksize);
D
Dave Chinner 已提交
2215 2216
		savehdr = tmphdr; /* struct copy */
		kmem_free(tmp_leaf);
L
Linus Torvalds 已提交
2217 2218
	}

2219
	xfs_attr3_leaf_hdr_to_disk(state->args->geo, save_leaf, &savehdr);
2220
	xfs_trans_log_buf(state->args->trans, save_blk->bp, 0,
2221
					   state->args->geo->blksize - 1);
L
Linus Torvalds 已提交
2222 2223 2224 2225

	/*
	 * Copy out last hashval in each block for B-tree code.
	 */
D
Dave Chinner 已提交
2226 2227
	entry = xfs_attr3_leaf_entryp(save_leaf);
	save_blk->hashval = be32_to_cpu(entry[savehdr.count - 1].hashval);
L
Linus Torvalds 已提交
2228 2229 2230 2231 2232 2233 2234 2235 2236 2237 2238 2239 2240 2241 2242 2243 2244 2245 2246 2247
}

/*========================================================================
 * Routines used for finding things in the Btree.
 *========================================================================*/

/*
 * Look up a name in a leaf attribute list structure.
 * This is the internal routine, it uses the caller's buffer.
 *
 * Note that duplicate keys are allowed, but only check within the
 * current leaf node.  The Btree code must check in adjacent leaf nodes.
 *
 * Return in args->index the index into the entry[] array of either
 * the found entry, or where the entry should have been (insert before
 * that entry).
 *
 * Don't change the args->value unless we find the attribute.
 */
int
D
Dave Chinner 已提交
2248 2249 2250
xfs_attr3_leaf_lookup_int(
	struct xfs_buf		*bp,
	struct xfs_da_args	*args)
L
Linus Torvalds 已提交
2251
{
D
Dave Chinner 已提交
2252 2253 2254 2255 2256 2257 2258 2259 2260
	struct xfs_attr_leafblock *leaf;
	struct xfs_attr3_icleaf_hdr ichdr;
	struct xfs_attr_leaf_entry *entry;
	struct xfs_attr_leaf_entry *entries;
	struct xfs_attr_leaf_name_local *name_loc;
	struct xfs_attr_leaf_name_remote *name_rmt;
	xfs_dahash_t		hashval;
	int			probe;
	int			span;
L
Linus Torvalds 已提交
2261

2262 2263
	trace_xfs_attr_leaf_lookup(args);

2264
	leaf = bp->b_addr;
2265
	xfs_attr3_leaf_hdr_from_disk(args->geo, &ichdr, leaf);
D
Dave Chinner 已提交
2266
	entries = xfs_attr3_leaf_entryp(leaf);
2267 2268
	if (ichdr.count >= args->geo->blksize / 8)
		return -EFSCORRUPTED;
L
Linus Torvalds 已提交
2269 2270 2271 2272 2273

	/*
	 * Binary search.  (note: small blocks will skip this loop)
	 */
	hashval = args->hashval;
D
Dave Chinner 已提交
2274 2275
	probe = span = ichdr.count / 2;
	for (entry = &entries[probe]; span > 4; entry = &entries[probe]) {
L
Linus Torvalds 已提交
2276
		span /= 2;
2277
		if (be32_to_cpu(entry->hashval) < hashval)
L
Linus Torvalds 已提交
2278
			probe += span;
2279
		else if (be32_to_cpu(entry->hashval) > hashval)
L
Linus Torvalds 已提交
2280 2281 2282 2283
			probe -= span;
		else
			break;
	}
2284 2285 2286 2287
	if (!(probe >= 0 && (!ichdr.count || probe < ichdr.count)))
		return -EFSCORRUPTED;
	if (!(span <= 4 || be32_to_cpu(entry->hashval) == hashval))
		return -EFSCORRUPTED;
L
Linus Torvalds 已提交
2288 2289 2290 2291 2292

	/*
	 * Since we may have duplicate hashval's, find the first matching
	 * hashval in the leaf.
	 */
D
Dave Chinner 已提交
2293
	while (probe > 0 && be32_to_cpu(entry->hashval) >= hashval) {
L
Linus Torvalds 已提交
2294 2295 2296
		entry--;
		probe--;
	}
D
Dave Chinner 已提交
2297 2298
	while (probe < ichdr.count &&
	       be32_to_cpu(entry->hashval) < hashval) {
L
Linus Torvalds 已提交
2299 2300 2301
		entry++;
		probe++;
	}
D
Dave Chinner 已提交
2302
	if (probe == ichdr.count || be32_to_cpu(entry->hashval) != hashval) {
L
Linus Torvalds 已提交
2303
		args->index = probe;
D
Dave Chinner 已提交
2304
		return -ENOATTR;
L
Linus Torvalds 已提交
2305 2306 2307 2308 2309
	}

	/*
	 * Duplicate keys may be present, so search all of them for a match.
	 */
D
Dave Chinner 已提交
2310
	for (; probe < ichdr.count && (be32_to_cpu(entry->hashval) == hashval);
L
Linus Torvalds 已提交
2311 2312 2313 2314 2315 2316 2317 2318 2319 2320 2321 2322 2323
			entry++, probe++) {
/*
 * GROT: Add code to remove incomplete entries.
 */
		/*
		 * If we are looking for INCOMPLETE entries, show only those.
		 * If we are looking for complete entries, show only those.
		 */
		if ((args->flags & XFS_ATTR_INCOMPLETE) !=
		    (entry->flags & XFS_ATTR_INCOMPLETE)) {
			continue;
		}
		if (entry->flags & XFS_ATTR_LOCAL) {
D
Dave Chinner 已提交
2324
			name_loc = xfs_attr3_leaf_name_local(leaf, probe);
L
Linus Torvalds 已提交
2325 2326
			if (name_loc->namelen != args->namelen)
				continue;
D
Dave Chinner 已提交
2327 2328
			if (memcmp(args->name, name_loc->nameval,
							args->namelen) != 0)
L
Linus Torvalds 已提交
2329
				continue;
2330
			if (!xfs_attr_namesp_match(args->flags, entry->flags))
L
Linus Torvalds 已提交
2331 2332
				continue;
			args->index = probe;
D
Dave Chinner 已提交
2333
			return -EEXIST;
L
Linus Torvalds 已提交
2334
		} else {
D
Dave Chinner 已提交
2335
			name_rmt = xfs_attr3_leaf_name_remote(leaf, probe);
L
Linus Torvalds 已提交
2336 2337
			if (name_rmt->namelen != args->namelen)
				continue;
D
Dave Chinner 已提交
2338 2339
			if (memcmp(args->name, name_rmt->name,
							args->namelen) != 0)
L
Linus Torvalds 已提交
2340
				continue;
2341
			if (!xfs_attr_namesp_match(args->flags, entry->flags))
L
Linus Torvalds 已提交
2342 2343
				continue;
			args->index = probe;
2344
			args->rmtvaluelen = be32_to_cpu(name_rmt->valuelen);
2345
			args->rmtblkno = be32_to_cpu(name_rmt->valueblk);
D
Dave Chinner 已提交
2346 2347
			args->rmtblkcnt = xfs_attr3_rmt_blocks(
							args->dp->i_mount,
2348
							args->rmtvaluelen);
D
Dave Chinner 已提交
2349
			return -EEXIST;
L
Linus Torvalds 已提交
2350 2351 2352
		}
	}
	args->index = probe;
D
Dave Chinner 已提交
2353
	return -ENOATTR;
L
Linus Torvalds 已提交
2354 2355 2356 2357 2358 2359 2360
}

/*
 * Get the value associated with an attribute name from a leaf attribute
 * list structure.
 */
int
D
Dave Chinner 已提交
2361 2362 2363
xfs_attr3_leaf_getvalue(
	struct xfs_buf		*bp,
	struct xfs_da_args	*args)
L
Linus Torvalds 已提交
2364
{
D
Dave Chinner 已提交
2365 2366 2367 2368 2369 2370
	struct xfs_attr_leafblock *leaf;
	struct xfs_attr3_icleaf_hdr ichdr;
	struct xfs_attr_leaf_entry *entry;
	struct xfs_attr_leaf_name_local *name_loc;
	struct xfs_attr_leaf_name_remote *name_rmt;
	int			valuelen;
L
Linus Torvalds 已提交
2371

2372
	leaf = bp->b_addr;
2373
	xfs_attr3_leaf_hdr_from_disk(args->geo, &ichdr, leaf);
2374
	ASSERT(ichdr.count < args->geo->blksize / 8);
D
Dave Chinner 已提交
2375
	ASSERT(args->index < ichdr.count);
L
Linus Torvalds 已提交
2376

D
Dave Chinner 已提交
2377
	entry = &xfs_attr3_leaf_entryp(leaf)[args->index];
L
Linus Torvalds 已提交
2378
	if (entry->flags & XFS_ATTR_LOCAL) {
D
Dave Chinner 已提交
2379
		name_loc = xfs_attr3_leaf_name_local(leaf, args->index);
L
Linus Torvalds 已提交
2380 2381
		ASSERT(name_loc->namelen == args->namelen);
		ASSERT(memcmp(args->name, name_loc->nameval, args->namelen) == 0);
2382
		valuelen = be16_to_cpu(name_loc->valuelen);
L
Linus Torvalds 已提交
2383 2384
		if (args->flags & ATTR_KERNOVAL) {
			args->valuelen = valuelen;
D
Dave Chinner 已提交
2385
			return 0;
L
Linus Torvalds 已提交
2386 2387 2388
		}
		if (args->valuelen < valuelen) {
			args->valuelen = valuelen;
D
Dave Chinner 已提交
2389
			return -ERANGE;
L
Linus Torvalds 已提交
2390 2391 2392 2393
		}
		args->valuelen = valuelen;
		memcpy(args->value, &name_loc->nameval[args->namelen], valuelen);
	} else {
D
Dave Chinner 已提交
2394
		name_rmt = xfs_attr3_leaf_name_remote(leaf, args->index);
L
Linus Torvalds 已提交
2395 2396
		ASSERT(name_rmt->namelen == args->namelen);
		ASSERT(memcmp(args->name, name_rmt->name, args->namelen) == 0);
2397
		args->rmtvaluelen = be32_to_cpu(name_rmt->valuelen);
2398
		args->rmtblkno = be32_to_cpu(name_rmt->valueblk);
D
Dave Chinner 已提交
2399
		args->rmtblkcnt = xfs_attr3_rmt_blocks(args->dp->i_mount,
2400
						       args->rmtvaluelen);
L
Linus Torvalds 已提交
2401
		if (args->flags & ATTR_KERNOVAL) {
2402
			args->valuelen = args->rmtvaluelen;
D
Dave Chinner 已提交
2403
			return 0;
L
Linus Torvalds 已提交
2404
		}
2405 2406
		if (args->valuelen < args->rmtvaluelen) {
			args->valuelen = args->rmtvaluelen;
D
Dave Chinner 已提交
2407
			return -ERANGE;
L
Linus Torvalds 已提交
2408
		}
2409
		args->valuelen = args->rmtvaluelen;
L
Linus Torvalds 已提交
2410
	}
D
Dave Chinner 已提交
2411
	return 0;
L
Linus Torvalds 已提交
2412 2413 2414 2415 2416 2417 2418 2419 2420 2421 2422 2423
}

/*========================================================================
 * Utility routines.
 *========================================================================*/

/*
 * Move the indicated entries from one leaf to another.
 * NOTE: this routine modifies both source and destination leaves.
 */
/*ARGSUSED*/
STATIC void
D
Dave Chinner 已提交
2424
xfs_attr3_leaf_moveents(
2425
	struct xfs_da_args		*args,
D
Dave Chinner 已提交
2426 2427 2428 2429 2430 2431
	struct xfs_attr_leafblock	*leaf_s,
	struct xfs_attr3_icleaf_hdr	*ichdr_s,
	int				start_s,
	struct xfs_attr_leafblock	*leaf_d,
	struct xfs_attr3_icleaf_hdr	*ichdr_d,
	int				start_d,
2432
	int				count)
L
Linus Torvalds 已提交
2433
{
D
Dave Chinner 已提交
2434 2435 2436 2437 2438
	struct xfs_attr_leaf_entry	*entry_s;
	struct xfs_attr_leaf_entry	*entry_d;
	int				desti;
	int				tmp;
	int				i;
L
Linus Torvalds 已提交
2439 2440 2441 2442 2443 2444 2445 2446 2447 2448

	/*
	 * Check for nothing to do.
	 */
	if (count == 0)
		return;

	/*
	 * Set up environment.
	 */
D
Dave Chinner 已提交
2449 2450 2451
	ASSERT(ichdr_s->magic == XFS_ATTR_LEAF_MAGIC ||
	       ichdr_s->magic == XFS_ATTR3_LEAF_MAGIC);
	ASSERT(ichdr_s->magic == ichdr_d->magic);
2452
	ASSERT(ichdr_s->count > 0 && ichdr_s->count < args->geo->blksize / 8);
D
Dave Chinner 已提交
2453 2454
	ASSERT(ichdr_s->firstused >= (ichdr_s->count * sizeof(*entry_s))
					+ xfs_attr3_leaf_hdr_size(leaf_s));
2455
	ASSERT(ichdr_d->count < args->geo->blksize / 8);
D
Dave Chinner 已提交
2456 2457 2458 2459 2460 2461 2462
	ASSERT(ichdr_d->firstused >= (ichdr_d->count * sizeof(*entry_d))
					+ xfs_attr3_leaf_hdr_size(leaf_d));

	ASSERT(start_s < ichdr_s->count);
	ASSERT(start_d <= ichdr_d->count);
	ASSERT(count <= ichdr_s->count);

L
Linus Torvalds 已提交
2463 2464 2465 2466

	/*
	 * Move the entries in the destination leaf up to make a hole?
	 */
D
Dave Chinner 已提交
2467 2468
	if (start_d < ichdr_d->count) {
		tmp  = ichdr_d->count - start_d;
L
Linus Torvalds 已提交
2469
		tmp *= sizeof(xfs_attr_leaf_entry_t);
D
Dave Chinner 已提交
2470 2471 2472
		entry_s = &xfs_attr3_leaf_entryp(leaf_d)[start_d];
		entry_d = &xfs_attr3_leaf_entryp(leaf_d)[start_d + count];
		memmove(entry_d, entry_s, tmp);
L
Linus Torvalds 已提交
2473 2474 2475 2476 2477 2478
	}

	/*
	 * Copy all entry's in the same (sorted) order,
	 * but allocate attribute info packed and in sequence.
	 */
D
Dave Chinner 已提交
2479 2480
	entry_s = &xfs_attr3_leaf_entryp(leaf_s)[start_s];
	entry_d = &xfs_attr3_leaf_entryp(leaf_d)[start_d];
L
Linus Torvalds 已提交
2481 2482
	desti = start_d;
	for (i = 0; i < count; entry_s++, entry_d++, desti++, i++) {
D
Dave Chinner 已提交
2483
		ASSERT(be16_to_cpu(entry_s->nameidx) >= ichdr_s->firstused);
L
Linus Torvalds 已提交
2484 2485 2486 2487 2488 2489 2490 2491
		tmp = xfs_attr_leaf_entsize(leaf_s, start_s + i);
#ifdef GROT
		/*
		 * Code to drop INCOMPLETE entries.  Difficult to use as we
		 * may also need to change the insertion index.  Code turned
		 * off for 6.2, should be revisited later.
		 */
		if (entry_s->flags & XFS_ATTR_INCOMPLETE) { /* skip partials? */
D
Dave Chinner 已提交
2492 2493 2494
			memset(xfs_attr3_leaf_name(leaf_s, start_s + i), 0, tmp);
			ichdr_s->usedbytes -= tmp;
			ichdr_s->count -= 1;
L
Linus Torvalds 已提交
2495 2496 2497 2498 2499 2500
			entry_d--;	/* to compensate for ++ in loop hdr */
			desti--;
			if ((start_s + i) < offset)
				result++;	/* insertion index adjustment */
		} else {
#endif /* GROT */
D
Dave Chinner 已提交
2501
			ichdr_d->firstused -= tmp;
L
Linus Torvalds 已提交
2502 2503
			/* both on-disk, don't endian flip twice */
			entry_d->hashval = entry_s->hashval;
D
Dave Chinner 已提交
2504
			entry_d->nameidx = cpu_to_be16(ichdr_d->firstused);
L
Linus Torvalds 已提交
2505
			entry_d->flags = entry_s->flags;
2506
			ASSERT(be16_to_cpu(entry_d->nameidx) + tmp
2507
							<= args->geo->blksize);
D
Dave Chinner 已提交
2508 2509
			memmove(xfs_attr3_leaf_name(leaf_d, desti),
				xfs_attr3_leaf_name(leaf_s, start_s + i), tmp);
2510
			ASSERT(be16_to_cpu(entry_s->nameidx) + tmp
2511
							<= args->geo->blksize);
D
Dave Chinner 已提交
2512 2513 2514 2515 2516 2517 2518 2519
			memset(xfs_attr3_leaf_name(leaf_s, start_s + i), 0, tmp);
			ichdr_s->usedbytes -= tmp;
			ichdr_d->usedbytes += tmp;
			ichdr_s->count -= 1;
			ichdr_d->count += 1;
			tmp = ichdr_d->count * sizeof(xfs_attr_leaf_entry_t)
					+ xfs_attr3_leaf_hdr_size(leaf_d);
			ASSERT(ichdr_d->firstused >= tmp);
L
Linus Torvalds 已提交
2520 2521 2522 2523 2524 2525 2526 2527
#ifdef GROT
		}
#endif /* GROT */
	}

	/*
	 * Zero out the entries we just copied.
	 */
D
Dave Chinner 已提交
2528
	if (start_s == ichdr_s->count) {
L
Linus Torvalds 已提交
2529
		tmp = count * sizeof(xfs_attr_leaf_entry_t);
D
Dave Chinner 已提交
2530
		entry_s = &xfs_attr3_leaf_entryp(leaf_s)[start_s];
L
Linus Torvalds 已提交
2531
		ASSERT(((char *)entry_s + tmp) <=
2532
		       ((char *)leaf_s + args->geo->blksize));
D
Dave Chinner 已提交
2533
		memset(entry_s, 0, tmp);
L
Linus Torvalds 已提交
2534 2535 2536 2537 2538
	} else {
		/*
		 * Move the remaining entries down to fill the hole,
		 * then zero the entries at the top.
		 */
D
Dave Chinner 已提交
2539 2540 2541 2542
		tmp  = (ichdr_s->count - count) * sizeof(xfs_attr_leaf_entry_t);
		entry_s = &xfs_attr3_leaf_entryp(leaf_s)[start_s + count];
		entry_d = &xfs_attr3_leaf_entryp(leaf_s)[start_s];
		memmove(entry_d, entry_s, tmp);
L
Linus Torvalds 已提交
2543 2544

		tmp = count * sizeof(xfs_attr_leaf_entry_t);
D
Dave Chinner 已提交
2545
		entry_s = &xfs_attr3_leaf_entryp(leaf_s)[ichdr_s->count];
L
Linus Torvalds 已提交
2546
		ASSERT(((char *)entry_s + tmp) <=
2547
		       ((char *)leaf_s + args->geo->blksize));
D
Dave Chinner 已提交
2548
		memset(entry_s, 0, tmp);
L
Linus Torvalds 已提交
2549 2550 2551 2552 2553
	}

	/*
	 * Fill in the freemap information
	 */
D
Dave Chinner 已提交
2554 2555 2556 2557 2558 2559 2560 2561
	ichdr_d->freemap[0].base = xfs_attr3_leaf_hdr_size(leaf_d);
	ichdr_d->freemap[0].base += ichdr_d->count * sizeof(xfs_attr_leaf_entry_t);
	ichdr_d->freemap[0].size = ichdr_d->firstused - ichdr_d->freemap[0].base;
	ichdr_d->freemap[1].base = 0;
	ichdr_d->freemap[2].base = 0;
	ichdr_d->freemap[1].size = 0;
	ichdr_d->freemap[2].size = 0;
	ichdr_s->holes = 1;	/* leaf may not be compact */
L
Linus Torvalds 已提交
2562 2563 2564 2565 2566 2567
}

/*
 * Pick up the last hashvalue from a leaf block.
 */
xfs_dahash_t
2568 2569 2570
xfs_attr_leaf_lasthash(
	struct xfs_buf	*bp,
	int		*count)
L
Linus Torvalds 已提交
2571
{
D
Dave Chinner 已提交
2572 2573
	struct xfs_attr3_icleaf_hdr ichdr;
	struct xfs_attr_leaf_entry *entries;
2574
	struct xfs_mount *mp = bp->b_target->bt_mount;
L
Linus Torvalds 已提交
2575

2576
	xfs_attr3_leaf_hdr_from_disk(mp->m_attr_geo, &ichdr, bp->b_addr);
D
Dave Chinner 已提交
2577
	entries = xfs_attr3_leaf_entryp(bp->b_addr);
L
Linus Torvalds 已提交
2578
	if (count)
D
Dave Chinner 已提交
2579 2580 2581 2582
		*count = ichdr.count;
	if (!ichdr.count)
		return 0;
	return be32_to_cpu(entries[ichdr.count - 1].hashval);
L
Linus Torvalds 已提交
2583 2584 2585 2586 2587 2588
}

/*
 * Calculate the number of bytes used to store the indicated attribute
 * (whether local or remote only calculate bytes in this block).
 */
2589
STATIC int
L
Linus Torvalds 已提交
2590 2591
xfs_attr_leaf_entsize(xfs_attr_leafblock_t *leaf, int index)
{
D
Dave Chinner 已提交
2592
	struct xfs_attr_leaf_entry *entries;
L
Linus Torvalds 已提交
2593 2594 2595 2596
	xfs_attr_leaf_name_local_t *name_loc;
	xfs_attr_leaf_name_remote_t *name_rmt;
	int size;

D
Dave Chinner 已提交
2597 2598 2599
	entries = xfs_attr3_leaf_entryp(leaf);
	if (entries[index].flags & XFS_ATTR_LOCAL) {
		name_loc = xfs_attr3_leaf_name_local(leaf, index);
2600
		size = xfs_attr_leaf_entsize_local(name_loc->namelen,
2601
						   be16_to_cpu(name_loc->valuelen));
L
Linus Torvalds 已提交
2602
	} else {
D
Dave Chinner 已提交
2603
		name_rmt = xfs_attr3_leaf_name_remote(leaf, index);
2604
		size = xfs_attr_leaf_entsize_remote(name_rmt->namelen);
L
Linus Torvalds 已提交
2605
	}
D
Dave Chinner 已提交
2606
	return size;
L
Linus Torvalds 已提交
2607 2608 2609 2610 2611 2612 2613 2614 2615
}

/*
 * Calculate the number of bytes that would be required to store the new
 * attribute (whether local or remote only calculate bytes in this block).
 * This routine decides as a side effect whether the attribute will be
 * a "local" or a "remote" attribute.
 */
int
2616 2617 2618
xfs_attr_leaf_newentsize(
	struct xfs_da_args	*args,
	int			*local)
L
Linus Torvalds 已提交
2619
{
2620
	int			size;
L
Linus Torvalds 已提交
2621

2622 2623 2624
	size = xfs_attr_leaf_entsize_local(args->namelen, args->valuelen);
	if (size < xfs_attr_leaf_entsize_local_max(args->geo->blksize)) {
		if (local)
L
Linus Torvalds 已提交
2625
			*local = 1;
2626
		return size;
L
Linus Torvalds 已提交
2627
	}
2628 2629 2630
	if (local)
		*local = 0;
	return xfs_attr_leaf_entsize_remote(args->namelen);
L
Linus Torvalds 已提交
2631 2632 2633 2634 2635 2636 2637 2638 2639 2640 2641
}


/*========================================================================
 * Manage the INCOMPLETE flag in a leaf entry
 *========================================================================*/

/*
 * Clear the INCOMPLETE flag on an entry in a leaf block.
 */
int
D
Dave Chinner 已提交
2642 2643
xfs_attr3_leaf_clearflag(
	struct xfs_da_args	*args)
L
Linus Torvalds 已提交
2644
{
D
Dave Chinner 已提交
2645 2646 2647 2648 2649
	struct xfs_attr_leafblock *leaf;
	struct xfs_attr_leaf_entry *entry;
	struct xfs_attr_leaf_name_remote *name_rmt;
	struct xfs_buf		*bp;
	int			error;
L
Linus Torvalds 已提交
2650
#ifdef DEBUG
D
Dave Chinner 已提交
2651
	struct xfs_attr3_icleaf_hdr ichdr;
L
Linus Torvalds 已提交
2652 2653 2654 2655 2656
	xfs_attr_leaf_name_local_t *name_loc;
	int namelen;
	char *name;
#endif /* DEBUG */

2657
	trace_xfs_attr_leaf_clearflag(args);
L
Linus Torvalds 已提交
2658 2659 2660
	/*
	 * Set up the operation.
	 */
D
Dave Chinner 已提交
2661
	error = xfs_attr3_leaf_read(args->trans, args->dp, args->blkno, -1, &bp);
2662
	if (error)
E
Eric Sandeen 已提交
2663
		return error;
L
Linus Torvalds 已提交
2664

2665
	leaf = bp->b_addr;
D
Dave Chinner 已提交
2666
	entry = &xfs_attr3_leaf_entryp(leaf)[args->index];
L
Linus Torvalds 已提交
2667 2668 2669
	ASSERT(entry->flags & XFS_ATTR_INCOMPLETE);

#ifdef DEBUG
2670
	xfs_attr3_leaf_hdr_from_disk(args->geo, &ichdr, leaf);
D
Dave Chinner 已提交
2671 2672 2673
	ASSERT(args->index < ichdr.count);
	ASSERT(args->index >= 0);

L
Linus Torvalds 已提交
2674
	if (entry->flags & XFS_ATTR_LOCAL) {
D
Dave Chinner 已提交
2675
		name_loc = xfs_attr3_leaf_name_local(leaf, args->index);
L
Linus Torvalds 已提交
2676 2677 2678
		namelen = name_loc->namelen;
		name = (char *)name_loc->nameval;
	} else {
D
Dave Chinner 已提交
2679
		name_rmt = xfs_attr3_leaf_name_remote(leaf, args->index);
L
Linus Torvalds 已提交
2680 2681 2682
		namelen = name_rmt->namelen;
		name = (char *)name_rmt->name;
	}
2683
	ASSERT(be32_to_cpu(entry->hashval) == args->hashval);
L
Linus Torvalds 已提交
2684 2685 2686 2687 2688
	ASSERT(namelen == args->namelen);
	ASSERT(memcmp(name, args->name, namelen) == 0);
#endif /* DEBUG */

	entry->flags &= ~XFS_ATTR_INCOMPLETE;
2689
	xfs_trans_log_buf(args->trans, bp,
L
Linus Torvalds 已提交
2690 2691 2692 2693
			 XFS_DA_LOGRANGE(leaf, entry, sizeof(*entry)));

	if (args->rmtblkno) {
		ASSERT((entry->flags & XFS_ATTR_LOCAL) == 0);
D
Dave Chinner 已提交
2694
		name_rmt = xfs_attr3_leaf_name_remote(leaf, args->index);
2695
		name_rmt->valueblk = cpu_to_be32(args->rmtblkno);
2696
		name_rmt->valuelen = cpu_to_be32(args->rmtvaluelen);
2697
		xfs_trans_log_buf(args->trans, bp,
L
Linus Torvalds 已提交
2698 2699 2700 2701 2702 2703
			 XFS_DA_LOGRANGE(leaf, name_rmt, sizeof(*name_rmt)));
	}

	/*
	 * Commit the flag value change and start the next trans in series.
	 */
C
Christoph Hellwig 已提交
2704
	return xfs_trans_roll_inode(&args->trans, args->dp);
L
Linus Torvalds 已提交
2705 2706 2707 2708 2709 2710
}

/*
 * Set the INCOMPLETE flag on an entry in a leaf block.
 */
int
D
Dave Chinner 已提交
2711 2712
xfs_attr3_leaf_setflag(
	struct xfs_da_args	*args)
L
Linus Torvalds 已提交
2713
{
D
Dave Chinner 已提交
2714 2715 2716 2717
	struct xfs_attr_leafblock *leaf;
	struct xfs_attr_leaf_entry *entry;
	struct xfs_attr_leaf_name_remote *name_rmt;
	struct xfs_buf		*bp;
L
Linus Torvalds 已提交
2718
	int error;
D
Dave Chinner 已提交
2719 2720 2721
#ifdef DEBUG
	struct xfs_attr3_icleaf_hdr ichdr;
#endif
L
Linus Torvalds 已提交
2722

2723 2724
	trace_xfs_attr_leaf_setflag(args);

L
Linus Torvalds 已提交
2725 2726 2727
	/*
	 * Set up the operation.
	 */
D
Dave Chinner 已提交
2728
	error = xfs_attr3_leaf_read(args->trans, args->dp, args->blkno, -1, &bp);
2729
	if (error)
E
Eric Sandeen 已提交
2730
		return error;
L
Linus Torvalds 已提交
2731

2732
	leaf = bp->b_addr;
D
Dave Chinner 已提交
2733
#ifdef DEBUG
2734
	xfs_attr3_leaf_hdr_from_disk(args->geo, &ichdr, leaf);
D
Dave Chinner 已提交
2735
	ASSERT(args->index < ichdr.count);
L
Linus Torvalds 已提交
2736
	ASSERT(args->index >= 0);
D
Dave Chinner 已提交
2737 2738
#endif
	entry = &xfs_attr3_leaf_entryp(leaf)[args->index];
L
Linus Torvalds 已提交
2739 2740 2741

	ASSERT((entry->flags & XFS_ATTR_INCOMPLETE) == 0);
	entry->flags |= XFS_ATTR_INCOMPLETE;
2742
	xfs_trans_log_buf(args->trans, bp,
L
Linus Torvalds 已提交
2743 2744
			XFS_DA_LOGRANGE(leaf, entry, sizeof(*entry)));
	if ((entry->flags & XFS_ATTR_LOCAL) == 0) {
D
Dave Chinner 已提交
2745
		name_rmt = xfs_attr3_leaf_name_remote(leaf, args->index);
L
Linus Torvalds 已提交
2746 2747
		name_rmt->valueblk = 0;
		name_rmt->valuelen = 0;
2748
		xfs_trans_log_buf(args->trans, bp,
L
Linus Torvalds 已提交
2749 2750 2751 2752 2753 2754
			 XFS_DA_LOGRANGE(leaf, name_rmt, sizeof(*name_rmt)));
	}

	/*
	 * Commit the flag value change and start the next trans in series.
	 */
C
Christoph Hellwig 已提交
2755
	return xfs_trans_roll_inode(&args->trans, args->dp);
L
Linus Torvalds 已提交
2756 2757 2758 2759 2760 2761 2762 2763 2764 2765
}

/*
 * In a single transaction, clear the INCOMPLETE flag on the leaf entry
 * given by args->blkno/index and set the INCOMPLETE flag on the leaf
 * entry given by args->blkno2/index2.
 *
 * Note that they could be in different blocks, or in the same block.
 */
int
D
Dave Chinner 已提交
2766 2767
xfs_attr3_leaf_flipflags(
	struct xfs_da_args	*args)
L
Linus Torvalds 已提交
2768
{
D
Dave Chinner 已提交
2769 2770 2771 2772 2773 2774 2775
	struct xfs_attr_leafblock *leaf1;
	struct xfs_attr_leafblock *leaf2;
	struct xfs_attr_leaf_entry *entry1;
	struct xfs_attr_leaf_entry *entry2;
	struct xfs_attr_leaf_name_remote *name_rmt;
	struct xfs_buf		*bp1;
	struct xfs_buf		*bp2;
L
Linus Torvalds 已提交
2776 2777
	int error;
#ifdef DEBUG
D
Dave Chinner 已提交
2778 2779
	struct xfs_attr3_icleaf_hdr ichdr1;
	struct xfs_attr3_icleaf_hdr ichdr2;
L
Linus Torvalds 已提交
2780 2781 2782 2783 2784
	xfs_attr_leaf_name_local_t *name_loc;
	int namelen1, namelen2;
	char *name1, *name2;
#endif /* DEBUG */

2785 2786
	trace_xfs_attr_leaf_flipflags(args);

L
Linus Torvalds 已提交
2787 2788 2789
	/*
	 * Read the block containing the "old" attr
	 */
D
Dave Chinner 已提交
2790
	error = xfs_attr3_leaf_read(args->trans, args->dp, args->blkno, -1, &bp1);
2791 2792
	if (error)
		return error;
L
Linus Torvalds 已提交
2793 2794 2795 2796 2797

	/*
	 * Read the block containing the "new" attr, if it is different
	 */
	if (args->blkno2 != args->blkno) {
D
Dave Chinner 已提交
2798
		error = xfs_attr3_leaf_read(args->trans, args->dp, args->blkno2,
2799 2800 2801
					   -1, &bp2);
		if (error)
			return error;
L
Linus Torvalds 已提交
2802 2803 2804 2805
	} else {
		bp2 = bp1;
	}

2806
	leaf1 = bp1->b_addr;
D
Dave Chinner 已提交
2807
	entry1 = &xfs_attr3_leaf_entryp(leaf1)[args->index];
L
Linus Torvalds 已提交
2808

2809
	leaf2 = bp2->b_addr;
D
Dave Chinner 已提交
2810
	entry2 = &xfs_attr3_leaf_entryp(leaf2)[args->index2];
L
Linus Torvalds 已提交
2811 2812

#ifdef DEBUG
2813
	xfs_attr3_leaf_hdr_from_disk(args->geo, &ichdr1, leaf1);
D
Dave Chinner 已提交
2814 2815 2816
	ASSERT(args->index < ichdr1.count);
	ASSERT(args->index >= 0);

2817
	xfs_attr3_leaf_hdr_from_disk(args->geo, &ichdr2, leaf2);
D
Dave Chinner 已提交
2818 2819 2820
	ASSERT(args->index2 < ichdr2.count);
	ASSERT(args->index2 >= 0);

L
Linus Torvalds 已提交
2821
	if (entry1->flags & XFS_ATTR_LOCAL) {
D
Dave Chinner 已提交
2822
		name_loc = xfs_attr3_leaf_name_local(leaf1, args->index);
L
Linus Torvalds 已提交
2823 2824 2825
		namelen1 = name_loc->namelen;
		name1 = (char *)name_loc->nameval;
	} else {
D
Dave Chinner 已提交
2826
		name_rmt = xfs_attr3_leaf_name_remote(leaf1, args->index);
L
Linus Torvalds 已提交
2827 2828 2829 2830
		namelen1 = name_rmt->namelen;
		name1 = (char *)name_rmt->name;
	}
	if (entry2->flags & XFS_ATTR_LOCAL) {
D
Dave Chinner 已提交
2831
		name_loc = xfs_attr3_leaf_name_local(leaf2, args->index2);
L
Linus Torvalds 已提交
2832 2833 2834
		namelen2 = name_loc->namelen;
		name2 = (char *)name_loc->nameval;
	} else {
D
Dave Chinner 已提交
2835
		name_rmt = xfs_attr3_leaf_name_remote(leaf2, args->index2);
L
Linus Torvalds 已提交
2836 2837 2838
		namelen2 = name_rmt->namelen;
		name2 = (char *)name_rmt->name;
	}
2839
	ASSERT(be32_to_cpu(entry1->hashval) == be32_to_cpu(entry2->hashval));
L
Linus Torvalds 已提交
2840 2841 2842 2843 2844 2845 2846 2847
	ASSERT(namelen1 == namelen2);
	ASSERT(memcmp(name1, name2, namelen1) == 0);
#endif /* DEBUG */

	ASSERT(entry1->flags & XFS_ATTR_INCOMPLETE);
	ASSERT((entry2->flags & XFS_ATTR_INCOMPLETE) == 0);

	entry1->flags &= ~XFS_ATTR_INCOMPLETE;
2848
	xfs_trans_log_buf(args->trans, bp1,
L
Linus Torvalds 已提交
2849 2850 2851
			  XFS_DA_LOGRANGE(leaf1, entry1, sizeof(*entry1)));
	if (args->rmtblkno) {
		ASSERT((entry1->flags & XFS_ATTR_LOCAL) == 0);
D
Dave Chinner 已提交
2852
		name_rmt = xfs_attr3_leaf_name_remote(leaf1, args->index);
2853
		name_rmt->valueblk = cpu_to_be32(args->rmtblkno);
2854
		name_rmt->valuelen = cpu_to_be32(args->rmtvaluelen);
2855
		xfs_trans_log_buf(args->trans, bp1,
L
Linus Torvalds 已提交
2856 2857 2858 2859
			 XFS_DA_LOGRANGE(leaf1, name_rmt, sizeof(*name_rmt)));
	}

	entry2->flags |= XFS_ATTR_INCOMPLETE;
2860
	xfs_trans_log_buf(args->trans, bp2,
L
Linus Torvalds 已提交
2861 2862
			  XFS_DA_LOGRANGE(leaf2, entry2, sizeof(*entry2)));
	if ((entry2->flags & XFS_ATTR_LOCAL) == 0) {
D
Dave Chinner 已提交
2863
		name_rmt = xfs_attr3_leaf_name_remote(leaf2, args->index2);
L
Linus Torvalds 已提交
2864 2865
		name_rmt->valueblk = 0;
		name_rmt->valuelen = 0;
2866
		xfs_trans_log_buf(args->trans, bp2,
L
Linus Torvalds 已提交
2867 2868 2869 2870 2871 2872
			 XFS_DA_LOGRANGE(leaf2, name_rmt, sizeof(*name_rmt)));
	}

	/*
	 * Commit the flag value change and start the next trans in series.
	 */
C
Christoph Hellwig 已提交
2873
	error = xfs_trans_roll_inode(&args->trans, args->dp);
L
Linus Torvalds 已提交
2874

D
Dave Chinner 已提交
2875
	return error;
L
Linus Torvalds 已提交
2876
}