xfs_attr.c 40.1 KB
Newer Older
D
Dave Chinner 已提交
1
// SPDX-License-Identifier: GPL-2.0
L
Linus Torvalds 已提交
2
/*
3 4
 * Copyright (c) 2000-2005 Silicon Graphics, Inc.
 * All Rights Reserved.
L
Linus Torvalds 已提交
5 6
 */
#include "xfs.h"
7
#include "xfs_fs.h"
8
#include "xfs_shared.h"
9 10 11
#include "xfs_format.h"
#include "xfs_log_format.h"
#include "xfs_trans_resv.h"
L
Linus Torvalds 已提交
12
#include "xfs_mount.h"
13
#include "xfs_defer.h"
14
#include "xfs_da_format.h"
15 16
#include "xfs_da_btree.h"
#include "xfs_attr_sf.h"
L
Linus Torvalds 已提交
17
#include "xfs_inode.h"
18
#include "xfs_trans.h"
L
Linus Torvalds 已提交
19
#include "xfs_bmap.h"
20
#include "xfs_bmap_btree.h"
L
Linus Torvalds 已提交
21 22
#include "xfs_attr.h"
#include "xfs_attr_leaf.h"
23
#include "xfs_attr_remote.h"
L
Linus Torvalds 已提交
24 25
#include "xfs_quota.h"
#include "xfs_trans_space.h"
C
Christoph Hellwig 已提交
26
#include "xfs_trace.h"
27
#include "xfs_attr_item.h"
28
#include "xfs_xattr.h"
29

30
struct kmem_cache		*xfs_attr_intent_cache;
L
Linus Torvalds 已提交
31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49

/*
 * xfs_attr.c
 *
 * Provide the external interfaces to manage attribute lists.
 */

/*========================================================================
 * Function prototypes for the kernel.
 *========================================================================*/

/*
 * Internal routines when attribute list fits inside the inode.
 */
STATIC int xfs_attr_shortform_addname(xfs_da_args_t *args);

/*
 * Internal routines when attribute list is one block.
 */
50
STATIC int xfs_attr_leaf_get(xfs_da_args_t *args);
L
Linus Torvalds 已提交
51
STATIC int xfs_attr_leaf_removename(xfs_da_args_t *args);
52
STATIC int xfs_attr_leaf_hasname(struct xfs_da_args *args, struct xfs_buf **bp);
53
STATIC int xfs_attr_leaf_try_add(struct xfs_da_args *args, struct xfs_buf *bp);
L
Linus Torvalds 已提交
54 55 56 57

/*
 * Internal routines when attribute list is more than one block.
 */
58
STATIC int xfs_attr_node_get(xfs_da_args_t *args);
59
STATIC void xfs_attr_restore_rmt_blk(struct xfs_da_args *args);
60 61 62
static int xfs_attr_node_try_addname(struct xfs_attr_intent *attr);
STATIC int xfs_attr_node_addname_find_attr(struct xfs_attr_intent *attr);
STATIC int xfs_attr_node_remove_attr(struct xfs_attr_intent *attr);
63 64
STATIC int xfs_attr_node_lookup(struct xfs_da_args *args,
		struct xfs_da_state *state);
L
Linus Torvalds 已提交
65

66
int
67 68 69
xfs_inode_hasattr(
	struct xfs_inode	*ip)
{
70 71 72 73 74 75
	if (!XFS_IFORK_Q(ip))
		return 0;
	if (!ip->i_afp)
		return 0;
	if (ip->i_afp->if_format == XFS_DINODE_FMT_EXTENTS &&
	    ip->i_afp->if_nextents == 0)
76 77 78 79
		return 0;
	return 1;
}

80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99
/*
 * Returns true if the there is exactly only block in the attr fork, in which
 * case the attribute fork consists of a single leaf block entry.
 */
bool
xfs_attr_is_leaf(
	struct xfs_inode	*ip)
{
	struct xfs_ifork	*ifp = ip->i_afp;
	struct xfs_iext_cursor	icur;
	struct xfs_bmbt_irec	imap;

	if (ifp->if_nextents != 1 || ifp->if_format != XFS_DINODE_FMT_EXTENTS)
		return false;

	xfs_iext_first(ifp, &icur);
	xfs_iext_get_extent(ifp, &icur, &imap);
	return imap.br_startoff == 0 && imap.br_blockcount == 1;
}

D
Dave Chinner 已提交
100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 208 209 210 211 212 213 214 215 216
/*
 * XXX (dchinner): name path state saving and refilling is an optimisation to
 * avoid needing to look up name entries after rolling transactions removing
 * remote xattr blocks between the name entry lookup and name entry removal.
 * This optimisation got sidelined when combining the set and remove state
 * machines, but the code has been left in place because it is worthwhile to
 * restore the optimisation once the combined state machine paths have settled.
 *
 * This comment is a public service announcement to remind Future Dave that he
 * still needs to restore this code to working order.
 */
#if 0
/*
 * Fill in the disk block numbers in the state structure for the buffers
 * that are attached to the state structure.
 * This is done so that we can quickly reattach ourselves to those buffers
 * after some set of transaction commits have released these buffers.
 *
 * Both state->path and state->altpath are walked.  For every active level
 * the buffer pointer is replaced by its disk address (or 0 when no buffer
 * was attached).  Always returns 0.
 */
static int
xfs_attr_fillstate(xfs_da_state_t *state)
{
	xfs_da_state_path_t *path;
	xfs_da_state_blk_t *blk;
	int level;

	trace_xfs_attr_fillstate(state->args);

	/*
	 * Roll down the "path" in the state structure, storing the on-disk
	 * block number for those buffers in the "path".
	 */
	path = &state->path;
	ASSERT((path->active >= 0) && (path->active < XFS_DA_NODE_MAXDEPTH));
	for (blk = path->blk, level = 0; level < path->active; blk++, level++) {
		if (blk->bp) {
			/* Remember where the buffer lives, then drop the pointer. */
			blk->disk_blkno = xfs_buf_daddr(blk->bp);
			blk->bp = NULL;
		} else {
			/* 0 marks "no buffer at this level". */
			blk->disk_blkno = 0;
		}
	}

	/*
	 * Roll down the "altpath" in the state structure, storing the on-disk
	 * block number for those buffers in the "altpath".
	 */
	path = &state->altpath;
	ASSERT((path->active >= 0) && (path->active < XFS_DA_NODE_MAXDEPTH));
	for (blk = path->blk, level = 0; level < path->active; blk++, level++) {
		if (blk->bp) {
			blk->disk_blkno = xfs_buf_daddr(blk->bp);
			blk->bp = NULL;
		} else {
			blk->disk_blkno = 0;
		}
	}

	return 0;
}

/*
 * Reattach the buffers to the state structure based on the disk block
 * numbers stored in the state structure.
 * This is done after some set of transaction commits have released those
 * buffers from our grip.
 *
 * Both state->path and state->altpath are walked.  Returns 0 on success or
 * the first error returned by xfs_da3_node_read_mapped().
 */
static int
xfs_attr_refillstate(xfs_da_state_t *state)
{
	xfs_da_state_path_t *path;
	xfs_da_state_blk_t *blk;
	int level, error;

	trace_xfs_attr_refillstate(state->args);

	/*
	 * Roll down the "path" in the state structure, re-reading the buffer
	 * for every level that has a stored on-disk block number.
	 */
	path = &state->path;
	ASSERT((path->active >= 0) && (path->active < XFS_DA_NODE_MAXDEPTH));
	for (blk = path->blk, level = 0; level < path->active; blk++, level++) {
		if (blk->disk_blkno) {
			error = xfs_da3_node_read_mapped(state->args->trans,
					state->args->dp, blk->disk_blkno,
					&blk->bp, XFS_ATTR_FORK);
			if (error)
				return error;
		} else {
			/* A zero disk_blkno means no buffer at this level. */
			blk->bp = NULL;
		}
	}

	/*
	 * Roll down the "altpath" in the state structure, re-reading the
	 * buffer for every level that has a stored on-disk block number.
	 */
	path = &state->altpath;
	ASSERT((path->active >= 0) && (path->active < XFS_DA_NODE_MAXDEPTH));
	for (blk = path->blk, level = 0; level < path->active; blk++, level++) {
		if (blk->disk_blkno) {
			error = xfs_da3_node_read_mapped(state->args->trans,
					state->args->dp, blk->disk_blkno,
					&blk->bp, XFS_ATTR_FORK);
			if (error)
				return error;
		} else {
			blk->bp = NULL;
		}
	}

	return 0;
}
#else
/*
 * No-op stand-in used while the real state save code is compiled out; it
 * ignores @state and always reports success.
 */
static int
xfs_attr_fillstate(
	xfs_da_state_t		*state)
{
	return 0;
}
#endif

L
Linus Torvalds 已提交
217 218 219 220
/*========================================================================
 * Overall external interface routines.
 *========================================================================*/

221 222 223 224
/*
 * Retrieve an extended attribute and its value.  Must have ilock.
 * Returns 0 on successful retrieval, otherwise an error.
 */
225 226 227 228
int
xfs_attr_get_ilocked(
	struct xfs_da_args	*args)
{
229
	ASSERT(xfs_isilocked(args->dp, XFS_ILOCK_SHARED | XFS_ILOCK_EXCL));
230

231
	if (!xfs_inode_hasattr(args->dp))
232
		return -ENOATTR;
233

234
	if (args->dp->i_afp->if_format == XFS_DINODE_FMT_LOCAL)
235
		return xfs_attr_shortform_getvalue(args);
236
	if (xfs_attr_is_leaf(args->dp))
237
		return xfs_attr_leaf_get(args);
238
	return xfs_attr_node_get(args);
239 240
}

241 242 243
/*
 * Retrieve an extended attribute by name, and its value if requested.
 *
C
Christoph Hellwig 已提交
244 245 246
 * If args->valuelen is zero, then the caller does not want the value, just an
 * indication whether the attribute exists and the size of the value if it
 * exists. The size is returned in args.valuelen.
247
 *
248 249 250 251 252
 * If args->value is NULL but args->valuelen is non-zero, allocate the buffer
 * for the value after existence of the attribute has been determined. The
 * caller always has to free args->value if it is set, no matter if this
 * function was successful or not.
 *
253
 * If the attribute is found, but exceeds the size limit set by the caller in
254 255
 * args->valuelen, return -ERANGE with the size of the attribute that was found
 * in args->valuelen.
256
 */
257 258
int
xfs_attr_get(
259
	struct xfs_da_args	*args)
L
Linus Torvalds 已提交
260
{
261 262 263
	uint			lock_mode;
	int			error;

264
	XFS_STATS_INC(args->dp->i_mount, xs_attr_get);
265

266
	if (xfs_is_shutdown(args->dp->i_mount))
D
Dave Chinner 已提交
267
		return -EIO;
L
Linus Torvalds 已提交
268

269 270 271
	args->geo = args->dp->i_mount->m_attr_geo;
	args->whichfork = XFS_ATTR_FORK;
	args->hashval = xfs_da_hashname(args->name, args->namelen);
272

273
	/* Entirely possible to look up a name which doesn't exist */
274
	args->op_flags = XFS_DA_OP_OKNOENT;
L
Linus Torvalds 已提交
275

276
	lock_mode = xfs_ilock_attr_map_shared(args->dp);
277
	error = xfs_attr_get_ilocked(args);
278
	xfs_iunlock(args->dp, lock_mode);
279

280
	return error;
L
Linus Torvalds 已提交
281 282
}

283 284 285
/*
 * Calculate how many blocks we need for the new attribute,
 */
286
int
287
xfs_attr_calc_size(
288
	struct xfs_da_args	*args,
289 290
	int			*local)
{
291
	struct xfs_mount	*mp = args->dp->i_mount;
292 293 294 295 296 297 298
	int			size;
	int			nblks;

	/*
	 * Determine space new attribute will use, and if it would be
	 * "local" or "remote" (note: local != inline).
	 */
299
	size = xfs_attr_leaf_newentsize(args, local);
300 301
	nblks = XFS_DAENTER_SPACE_RES(mp, XFS_ATTR_FORK);
	if (*local) {
302
		if (size > (args->geo->blksize / 2)) {
303 304 305 306 307 308 309 310
			/* Double split possible */
			nblks *= 2;
		}
	} else {
		/*
		 * Out of line attribute, cannot double split, but
		 * make room for the attribute value itself.
		 */
311
		uint	dblocks = xfs_attr3_rmt_blocks(mp, args->valuelen);
312 313 314 315 316 317 318
		nblks += dblocks;
		nblks += XFS_NEXTENTADD_SPACE_RES(mp, dblocks, XFS_ATTR_FORK);
	}

	return nblks;
}

319 320 321 322 323 324 325 326 327 328 329 330 331 332 333 334 335 336 337 338 339 340
/*
 * Set up the transaction reservation and block count for an attr operation.
 *
 * A NULL args->value selects the attr remove reservation; otherwise the set
 * reservation is built from the attrsetm/attrsetrt log reservations, scaled
 * by args->total.
 */
void
xfs_init_attr_trans(
	struct xfs_da_args	*args,
	struct xfs_trans_res	*tres,
	unsigned int		*total)
{
	struct xfs_mount	*mp = args->dp->i_mount;

	if (!args->value) {
		/* Removal: use the precomputed remove reservation as is. */
		*tres = M_RES(mp)->tr_attrrm;
		*total = XFS_ATTRRM_SPACE_RES(mp);
		return;
	}

	tres->tr_logres = M_RES(mp)->tr_attrsetm.tr_logres +
			 M_RES(mp)->tr_attrsetrt.tr_logres * args->total;
	tres->tr_logcount = XFS_ATTRSET_LOG_COUNT;
	tres->tr_logflags = XFS_TRANS_PERM_LOG_RES;
	*total = args->total;
}

341 342 343 344 345
/*
 * Add an attr to a shortform fork. If there is no space,
 * xfs_attr_shortform_addname() will convert to leaf format and return -ENOSPC.
 * to use.
 */
346 347 348 349 350 351
STATIC int
xfs_attr_try_sf_addname(
	struct xfs_inode	*dp,
	struct xfs_da_args	*args)
{

352 353 354 355 356 357 358
	int			error;

	/*
	 * Build initial attribute list (if required).
	 */
	if (dp->i_afp->if_format == XFS_DINODE_FMT_EXTENTS)
		xfs_attr_shortform_create(args);
359 360 361 362 363 364 365 366 367

	error = xfs_attr_shortform_addname(args);
	if (error == -ENOSPC)
		return error;

	/*
	 * Commit the shortform mods, and we're done.
	 * NOTE: this is also the error path (EEXIST, etc).
	 */
368
	if (!error && !(args->op_flags & XFS_DA_OP_NOTIME))
369 370
		xfs_trans_ichgtime(args->trans, dp, XFS_ICHGTIME_CHG);

371
	if (xfs_has_wsync(dp->i_mount))
372 373
		xfs_trans_set_sync(args->trans);

374
	return error;
375 376
}

377
static int
378
xfs_attr_sf_addname(
379
	struct xfs_attr_intent		*attr)
380
{
381
	struct xfs_da_args		*args = attr->xattri_da_args;
382 383
	struct xfs_inode		*dp = args->dp;
	int				error = 0;
384 385

	error = xfs_attr_try_sf_addname(dp, args);
386 387 388 389 390
	if (error != -ENOSPC) {
		ASSERT(!error || error == -EEXIST);
		attr->xattri_dela_state = XFS_DAS_DONE;
		goto out;
	}
391

392 393 394 395
	/*
	 * It won't fit in the shortform, transform to a leaf block.  GROT:
	 * another possible req'mt for a double-split btree op.
	 */
396
	error = xfs_attr_shortform_to_leaf(args, &attr->xattri_leaf_bp);
397 398 399 400 401 402
	if (error)
		return error;

	/*
	 * Prevent the leaf buffer from being unlocked so that a concurrent AIL
	 * push cannot grab the half-baked leaf buffer and run into problems
403
	 * with the write verifier.
404
	 */
405
	xfs_trans_bhold(args->trans, attr->xattri_leaf_bp);
406 407 408 409
	attr->xattri_dela_state = XFS_DAS_LEAF_ADD;
out:
	trace_xfs_attr_sf_addname_return(attr->xattri_dela_state, args->dp);
	return error;
410 411
}

412
/*
413 414 415 416 417 418 419 420 421
 * Handle the state change on completion of a multi-state attr operation.
 *
 * If the XFS_DA_OP_REPLACE flag is set, this means the operation was the first
 * modification in a attr replace operation and we still have to do the second
 * state, indicated by @replace_state.
 *
 * We consume the XFS_DA_OP_REPLACE flag so that when we are called again on
 * completion of the second half of the attr replace operation we correctly
 * signal that it is done.
422
 */
423 424
static enum xfs_delattr_state
xfs_attr_complete_op(
425
	struct xfs_attr_intent	*attr,
426
	enum xfs_delattr_state	replace_state)
427 428
{
	struct xfs_da_args	*args = attr->xattri_da_args;
429
	bool			do_replace = args->op_flags & XFS_DA_OP_REPLACE;
430

431 432 433 434 435 436
	args->op_flags &= ~XFS_DA_OP_REPLACE;
	if (do_replace) {
		args->attr_filter &= ~XFS_ATTR_INCOMPLETE;
		return replace_state;
	}
	return XFS_DAS_DONE;
437 438
}

439
static int
440
xfs_attr_leaf_addname(
441
	struct xfs_attr_intent	*attr)
442 443 444 445
{
	struct xfs_da_args	*args = attr->xattri_da_args;
	int			error;

446
	ASSERT(xfs_attr_is_leaf(args->dp));
447

448 449 450 451 452 453 454
	/*
	 * Use the leaf buffer we may already hold locked as a result of
	 * a sf-to-leaf conversion. The held buffer is no longer valid
	 * after this call, regardless of the result.
	 */
	error = xfs_attr_leaf_try_add(args, attr->xattri_leaf_bp);
	attr->xattri_leaf_bp = NULL;
455

456 457
	if (error == -ENOSPC) {
		error = xfs_attr3_leaf_to_node(args);
458 459 460
		if (error)
			return error;

461 462 463 464 465 466
		/*
		 * We're not in leaf format anymore, so roll the transaction and
		 * retry the add to the newly allocated node block.
		 */
		attr->xattri_dela_state = XFS_DAS_NODE_ADD;
		goto out;
467 468 469
	}
	if (error)
		return error;
470

471 472 473 474 475
	/*
	 * We need to commit and roll if we need to allocate remote xattr blocks
	 * or perform more xattr manipulations. Otherwise there is nothing more
	 * to do and we can return success.
	 */
476
	if (args->rmtblkno)
477
		attr->xattri_dela_state = XFS_DAS_LEAF_SET_RMT;
478
	else
479 480
		attr->xattri_dela_state = xfs_attr_complete_op(attr,
							XFS_DAS_LEAF_REPLACE);
481
out:
482
	trace_xfs_attr_leaf_addname_return(attr->xattri_dela_state, args->dp);
483
	return error;
484 485
}

486 487 488 489 490 491 492
/*
 * Add an entry to a node format attr tree.
 *
 * Note that we might still have a leaf here - xfs_attr_is_leaf() cannot tell
 * the difference between leaf + remote attr blocks and a node format tree,
 * so we may still end up having to convert from leaf to node format here.
 */
493 494
static int
xfs_attr_node_addname(
495
	struct xfs_attr_intent	*attr)
496 497 498 499 500 501 502 503 504 505 506
{
	struct xfs_da_args	*args = attr->xattri_da_args;
	int			error;

	ASSERT(!attr->xattri_leaf_bp);

	error = xfs_attr_node_addname_find_attr(attr);
	if (error)
		return error;

	error = xfs_attr_node_try_addname(attr);
507 508 509 510 511 512 513 514 515 516
	if (error == -ENOSPC) {
		error = xfs_attr3_leaf_to_node(args);
		if (error)
			return error;
		/*
		 * No state change, we really are in node form now
		 * but we need the transaction rolled to continue.
		 */
		goto out;
	}
517 518 519
	if (error)
		return error;

520
	if (args->rmtblkno)
521
		attr->xattri_dela_state = XFS_DAS_NODE_SET_RMT;
522
	else
523 524
		attr->xattri_dela_state = xfs_attr_complete_op(attr,
							XFS_DAS_NODE_REPLACE);
525
out:
526 527 528 529
	trace_xfs_attr_node_addname_return(attr->xattri_dela_state, args->dp);
	return error;
}

530 531
static int
xfs_attr_rmtval_alloc(
532
	struct xfs_attr_intent		*attr)
533 534 535 536 537 538 539 540 541 542 543 544 545 546
{
	struct xfs_da_args              *args = attr->xattri_da_args;
	int				error = 0;

	/*
	 * If there was an out-of-line value, allocate the blocks we
	 * identified for its storage and copy the value.  This is done
	 * after we create the attribute so that we don't overflow the
	 * maximum size of a transaction and/or hit a deadlock.
	 */
	if (attr->xattri_blkcnt > 0) {
		error = xfs_attr_rmtval_set_blk(attr);
		if (error)
			return error;
547
		/* Roll the transaction only if there is more to allocate. */
548
		if (attr->xattri_blkcnt > 0)
549
			goto out;
550 551 552 553 554 555
	}

	error = xfs_attr_rmtval_set_value(args);
	if (error)
		return error;

556 557 558 559 560 561 562 563
	attr->xattri_dela_state = xfs_attr_complete_op(attr,
						++attr->xattri_dela_state);
	/*
	 * If we are not doing a rename, we've finished the operation but still
	 * have to clear the incomplete flag protecting the new attr from
	 * exposing partially initialised state if we crash during creation.
	 */
	if (attr->xattri_dela_state == XFS_DAS_DONE)
564 565 566 567 568
		error = xfs_attr3_leaf_clearflag(args);
out:
	trace_xfs_attr_rmtval_alloc(attr->xattri_dela_state, args->dp);
	return error;
}
569

570 571 572 573 574 575 576 577 578 579 580 581 582 583 584 585 586 587 588 589 590 591 592 593 594 595
/*
 * Flag an attribute entry as INCOMPLETE ahead of its removal.
 *
 * The da state is first passed through xfs_attr_fillstate() so that the disk
 * block numbers are recorded and the buffers can be found again after the
 * transactions that follow; only if that succeeds is the INCOMPLETE flag set
 * on the entry.
 */
static int
xfs_attr_leaf_mark_incomplete(
	struct xfs_da_args	*args,
	struct xfs_da_state	*state)
{
	int			err = xfs_attr_fillstate(state);

	if (!err)
		err = xfs_attr3_leaf_setflag(args);
	return err;
}

596 597 598
/* Ensure the da state of an xattr deferred work item is ready to go. */
static inline void
xfs_attr_item_init_da_state(
599
	struct xfs_attr_intent	*attr)
600 601 602 603 604 605 606 607 608
{
	struct xfs_da_args	*args = attr->xattri_da_args;

	if (!attr->xattri_da_state)
		attr->xattri_da_state = xfs_da_state_alloc(args);
	else
		xfs_da_state_reset(attr->xattri_da_state, args);
}

609 610 611 612 613 614 615
/*
 * Initial setup for xfs_attr_node_removename.  Make sure the attr is there and
 * the blocks are valid.  Attr keys with remote blocks will be marked
 * incomplete.
 */
static
int xfs_attr_node_removename_setup(
616
	struct xfs_attr_intent		*attr)
617 618
{
	struct xfs_da_args		*args = attr->xattri_da_args;
619
	struct xfs_da_state		*state;
620 621
	int				error;

622 623
	xfs_attr_item_init_da_state(attr);
	error = xfs_attr_node_lookup(args, attr->xattri_da_state);
624 625 626 627
	if (error != -EEXIST)
		goto out;
	error = 0;

628 629 630
	state = attr->xattri_da_state;
	ASSERT(state->path.blk[state->path.active - 1].bp != NULL);
	ASSERT(state->path.blk[state->path.active - 1].magic ==
631 632
		XFS_ATTR_LEAF_MAGIC);

633
	error = xfs_attr_leaf_mark_incomplete(args, state);
634 635 636
	if (error)
		goto out;
	if (args->rmtblkno > 0)
637 638
		error = xfs_attr_rmtval_invalidate(args);
out:
639 640 641 642
	if (error) {
		xfs_da_state_free(attr->xattri_da_state);
		attr->xattri_da_state = NULL;
	}
643 644 645 646

	return error;
}

647 648 649 650 651 652 653
/*
 * Remove the original attr we have just replaced. This is dependent on the
 * original lookup and insert placing the old attr in args->blkno/args->index
 * and the new attr in args->blkno2/args->index2.
 */
static int
xfs_attr_leaf_remove_attr(
654
	struct xfs_attr_intent		*attr)
655 656 657 658 659 660 661 662 663 664 665 666 667 668 669 670 671 672 673 674 675 676 677 678 679 680 681 682 683
{
	struct xfs_da_args              *args = attr->xattri_da_args;
	struct xfs_inode		*dp = args->dp;
	struct xfs_buf			*bp = NULL;
	int				forkoff;
	int				error;

	error = xfs_attr3_leaf_read(args->trans, args->dp, args->blkno,
				   &bp);
	if (error)
		return error;

	xfs_attr3_leaf_remove(bp, args);

	forkoff = xfs_attr_shortform_allfit(bp, dp);
	if (forkoff)
		error = xfs_attr3_leaf_to_shortform(bp, args, forkoff);
		/* bp is gone due to xfs_da_shrink_inode */

	return error;
}

/*
 * Shrink an attribute from leaf to shortform. Used by the node format remove
 * path when the node format collapses to a single block and so we have to check
 * if it can be collapsed further.
 */
static int
xfs_attr_leaf_shrink(
D
Dave Chinner 已提交
684
	struct xfs_da_args	*args)
685 686 687
{
	struct xfs_inode	*dp = args->dp;
	struct xfs_buf		*bp;
D
Dave Chinner 已提交
688 689
	int			forkoff;
	int			error;
690 691 692 693 694 695 696 697 698 699 700 701 702 703 704 705 706 707 708

	if (!xfs_attr_is_leaf(dp))
		return 0;

	error = xfs_attr3_leaf_read(args->trans, args->dp, 0, &bp);
	if (error)
		return error;

	forkoff = xfs_attr_shortform_allfit(bp, dp);
	if (forkoff) {
		error = xfs_attr3_leaf_to_shortform(bp, args, forkoff);
		/* bp is gone due to xfs_da_shrink_inode */
	} else {
		xfs_trans_brelse(args->trans, bp);
	}

	return error;
}

709
/*
710 711 712 713 714 715
 * Run the attribute operation specified in @attr.
 *
 * This routine is meant to function as a delayed operation and will set the
 * state to XFS_DAS_DONE when the operation is complete.  Calling functions will
 * need to handle this, and recall the function until either an error or
 * XFS_DAS_DONE is detected.
716 717
 */
int
718
xfs_attr_set_iter(
719
	struct xfs_attr_intent		*attr)
720
{
721
	struct xfs_da_args              *args = attr->xattri_da_args;
722
	int				error = 0;
723 724

	/* State machine switch */
725
next_state:
726
	switch (attr->xattri_dela_state) {
727
	case XFS_DAS_UNINIT:
728 729 730 731 732
		ASSERT(0);
		return -EFSCORRUPTED;
	case XFS_DAS_SF_ADD:
		return xfs_attr_sf_addname(attr);
	case XFS_DAS_LEAF_ADD:
733
		return xfs_attr_leaf_addname(attr);
734 735
	case XFS_DAS_NODE_ADD:
		return xfs_attr_node_addname(attr);
736

737
	case XFS_DAS_SF_REMOVE:
738 739 740 741
		error = xfs_attr_sf_removename(args);
		attr->xattri_dela_state = xfs_attr_complete_op(attr,
						xfs_attr_init_add_state(args));
		break;
742
	case XFS_DAS_LEAF_REMOVE:
743 744 745 746
		error = xfs_attr_leaf_removename(args);
		attr->xattri_dela_state = xfs_attr_complete_op(attr,
						xfs_attr_init_add_state(args));
		break;
747 748
	case XFS_DAS_NODE_REMOVE:
		error = xfs_attr_node_removename_setup(attr);
749 750 751 752 753 754 755
		if (error == -ENOATTR &&
		    (args->op_flags & XFS_DA_OP_RECOVERY)) {
			attr->xattri_dela_state = xfs_attr_complete_op(attr,
						xfs_attr_init_add_state(args));
			error = 0;
			break;
		}
756 757 758 759 760 761 762
		if (error)
			return error;
		attr->xattri_dela_state = XFS_DAS_NODE_REMOVE_RMT;
		if (args->rmtblkno == 0)
			attr->xattri_dela_state++;
		break;

763 764 765 766 767
	case XFS_DAS_LEAF_SET_RMT:
	case XFS_DAS_NODE_SET_RMT:
		error = xfs_attr_rmtval_find_space(attr);
		if (error)
			return error;
768
		attr->xattri_dela_state++;
769
		fallthrough;
770

771
	case XFS_DAS_LEAF_ALLOC_RMT:
772
	case XFS_DAS_NODE_ALLOC_RMT:
773 774
		error = xfs_attr_rmtval_alloc(attr);
		if (error)
775
			return error;
776 777
		if (attr->xattri_dela_state == XFS_DAS_DONE)
			break;
778
		goto next_state;
779

780 781
	case XFS_DAS_LEAF_REPLACE:
	case XFS_DAS_NODE_REPLACE:
782
		/*
783 784
		 * We must "flip" the incomplete flags on the "new" and "old"
		 * attribute/value pairs so that one disappears and one appears
785
		 * atomically.
786
		 */
787 788 789 790
		error = xfs_attr3_leaf_flipflags(args);
		if (error)
			return error;
		/*
791 792
		 * We must commit the flag value change now to make it atomic
		 * and then we can start the next trans in series at REMOVE_OLD.
793
		 */
794
		attr->xattri_dela_state++;
795 796 797 798
		break;

	case XFS_DAS_LEAF_REMOVE_OLD:
	case XFS_DAS_NODE_REMOVE_OLD:
799
		/*
800 801 802 803 804
		 * If we have a remote attr, start the process of removing it
		 * by invalidating any cached buffers.
		 *
		 * If we don't have a remote attr, we skip the remote block
		 * removal state altogether with a second state increment.
805 806 807
		 */
		xfs_attr_restore_rmt_blk(args);
		if (args->rmtblkno) {
808
			error = xfs_attr_rmtval_invalidate(args);
809 810
			if (error)
				return error;
811 812
		} else {
			attr->xattri_dela_state++;
813 814
		}

815 816 817 818 819 820
		attr->xattri_dela_state++;
		goto next_state;

	case XFS_DAS_LEAF_REMOVE_RMT:
	case XFS_DAS_NODE_REMOVE_RMT:
		error = xfs_attr_rmtval_remove(attr);
821 822
		if (error == -EAGAIN) {
			error = 0;
823
			break;
824
		}
825 826 827
		if (error)
			return error;

828
		/*
829 830 831 832 833 834
		 * We've finished removing the remote attr blocks, so commit the
		 * transaction and move on to removing the attr name from the
		 * leaf/node block. Removing the attr might require a full
		 * transaction reservation for btree block freeing, so we
		 * can't do that in the same transaction where we removed the
		 * remote attr blocks.
835 836
		 */
		attr->xattri_dela_state++;
837
		break;
838

839 840
	case XFS_DAS_LEAF_REMOVE_ATTR:
		error = xfs_attr_leaf_remove_attr(attr);
841 842
		attr->xattri_dela_state = xfs_attr_complete_op(attr,
						xfs_attr_init_add_state(args));
843
		break;
844

845 846 847
	case XFS_DAS_NODE_REMOVE_ATTR:
		error = xfs_attr_node_remove_attr(attr);
		if (!error)
D
Dave Chinner 已提交
848
			error = xfs_attr_leaf_shrink(args);
849 850
		attr->xattri_dela_state = xfs_attr_complete_op(attr,
						xfs_attr_init_add_state(args));
851 852
		break;
	default:
853
		ASSERT(0);
854 855
		break;
	}
856 857

	trace_xfs_attr_set_iter_return(attr->xattri_dela_state, args->dp);
858
	return error;
859 860
}

861

862 863 864
/*
 * Return EEXIST if attr is found, or ENOATTR if not
 */
D
Dave Chinner 已提交
865 866
static int
xfs_attr_lookup(
867 868 869 870
	struct xfs_da_args	*args)
{
	struct xfs_inode	*dp = args->dp;
	struct xfs_buf		*bp = NULL;
871
	struct xfs_da_state	*state;
872 873 874 875 876
	int			error;

	if (!xfs_inode_hasattr(dp))
		return -ENOATTR;

C
Christoph Hellwig 已提交
877
	if (dp->i_afp->if_format == XFS_DINODE_FMT_LOCAL)
878 879
		return xfs_attr_sf_findname(args, NULL, NULL);

880
	if (xfs_attr_is_leaf(dp)) {
881 882 883 884 885 886 887 888
		error = xfs_attr_leaf_hasname(args, &bp);

		if (bp)
			xfs_trans_brelse(args->trans, bp);

		return error;
	}

889 890 891 892
	state = xfs_da_state_alloc(args);
	error = xfs_attr_node_lookup(args, state);
	xfs_da_state_free(state);
	return error;
893 894
}

895
static int
896
xfs_attr_intent_init(
897 898
	struct xfs_da_args	*args,
	unsigned int		op_flags,	/* op flag (set or remove) */
899
	struct xfs_attr_intent	**attr)		/* new xfs_attr_intent */
900 901
{

902
	struct xfs_attr_intent	*new;
903

904
	new = kmem_cache_zalloc(xfs_attr_intent_cache, GFP_NOFS | __GFP_NOFAIL);
905 906 907 908 909 910 911 912 913 914 915 916
	new->xattri_op_flags = op_flags;
	new->xattri_da_args = args;

	*attr = new;
	return 0;
}

/* Sets an attribute for an inode as a deferred operation */
static int
xfs_attr_defer_add(
	struct xfs_da_args	*args)
{
917
	struct xfs_attr_intent	*new;
918 919
	int			error = 0;

920
	error = xfs_attr_intent_init(args, XFS_ATTRI_OP_FLAGS_SET, &new);
921 922 923
	if (error)
		return error;

924
	new->xattri_dela_state = xfs_attr_init_add_state(args);
925 926 927 928 929 930 931 932 933 934 935
	xfs_defer_add(args->trans, XFS_DEFER_OPS_TYPE_ATTR, &new->xattri_list);
	trace_xfs_attr_defer_add(new->xattri_dela_state, args->dp);

	return 0;
}

/* Sets an attribute for an inode as a deferred operation */
static int
xfs_attr_defer_replace(
	struct xfs_da_args	*args)
{
936
	struct xfs_attr_intent	*new;
937 938
	int			error = 0;

939
	error = xfs_attr_intent_init(args, XFS_ATTRI_OP_FLAGS_REPLACE, &new);
940 941 942
	if (error)
		return error;

943
	new->xattri_dela_state = xfs_attr_init_replace_state(args);
944 945 946 947 948 949 950 951 952 953 954 955
	xfs_defer_add(args->trans, XFS_DEFER_OPS_TYPE_ATTR, &new->xattri_list);
	trace_xfs_attr_defer_replace(new->xattri_dela_state, args->dp);

	return 0;
}

/* Removes an attribute for an inode as a deferred operation */
static int
xfs_attr_defer_remove(
	struct xfs_da_args	*args)
{

956
	struct xfs_attr_intent	*new;
957 958
	int			error;

959
	error  = xfs_attr_intent_init(args, XFS_ATTRI_OP_FLAGS_REMOVE, &new);
960 961 962
	if (error)
		return error;

963
	new->xattri_dela_state = xfs_attr_init_remove_state(args);
964 965 966 967 968 969
	xfs_defer_add(args->trans, XFS_DEFER_OPS_TYPE_ATTR, &new->xattri_list);
	trace_xfs_attr_defer_remove(new->xattri_dela_state, args->dp);

	return 0;
}

970
/*
971
 * Note: If args->value is NULL the attribute will be removed, just like the
972 973
 * Linux ->setattr API.
 */
974 975
int
xfs_attr_set(
976
	struct xfs_da_args	*args)
L
Linus Torvalds 已提交
977
{
978
	struct xfs_inode	*dp = args->dp;
979 980
	struct xfs_mount	*mp = dp->i_mount;
	struct xfs_trans_res	tres;
981
	bool			rsvd = (args->attr_filter & XFS_ATTR_ROOT);
982
	int			error, local;
983
	int			rmt_blks = 0;
984
	unsigned int		total;
985

986
	if (xfs_is_shutdown(dp->i_mount))
D
Dave Chinner 已提交
987
		return -EIO;
988

989 990 991 992
	error = xfs_qm_dqattach(dp);
	if (error)
		return error;

993 994 995
	args->geo = mp->m_attr_geo;
	args->whichfork = XFS_ATTR_FORK;
	args->hashval = xfs_da_hashname(args->name, args->namelen);
L
Linus Torvalds 已提交
996 997

	/*
998 999
	 * We have no control over the attribute names that userspace passes us
	 * to remove, so we have to allow the name lookup prior to attribute
1000 1001
	 * removal to fail as well.  Preserve the logged flag, since we need
	 * to pass that through to the logging code.
L
Linus Torvalds 已提交
1002
	 */
1003 1004
	args->op_flags = XFS_DA_OP_OKNOENT |
					(args->op_flags & XFS_DA_OP_LOGGED);
1005

1006
	if (args->value) {
1007
		XFS_STATS_INC(mp, xs_attr_set);
1008
		args->total = xfs_attr_calc_size(args, &local);
1009 1010 1011 1012 1013 1014 1015

		/*
		 * If the inode doesn't have an attribute fork, add one.
		 * (inode must not be locked when we call this routine)
		 */
		if (XFS_IFORK_Q(dp) == 0) {
			int sf_size = sizeof(struct xfs_attr_sf_hdr) +
1016
				xfs_attr_sf_entsize_byname(args->namelen,
1017
						args->valuelen);
1018 1019 1020 1021 1022 1023

			error = xfs_bmap_add_attrfork(dp, sf_size, rsvd);
			if (error)
				return error;
		}

1024 1025
		if (!local)
			rmt_blks = xfs_attr3_rmt_blocks(mp, args->valuelen);
1026 1027
	} else {
		XFS_STATS_INC(mp, xs_attr_remove);
1028
		rmt_blks = xfs_attr3_rmt_blocks(mp, XFS_XATTR_SIZE_MAX);
1029
	}
L
Linus Torvalds 已提交
1030 1031 1032 1033 1034

	/*
	 * Root fork attributes can use reserved data blocks for this
	 * operation if necessary
	 */
1035
	xfs_init_attr_trans(args, &tres, &total);
1036
	error = xfs_trans_alloc_inode(dp, &tres, total, 0, rsvd, &args->trans);
1037
	if (error)
1038
		return error;
L
Linus Torvalds 已提交
1039

1040 1041 1042
	if (args->value || xfs_inode_hasattr(dp)) {
		error = xfs_iext_count_may_overflow(dp, XFS_ATTR_FORK,
				XFS_IEXT_ATTR_MANIP_CNT(rmt_blks));
1043 1044 1045
		if (error == -EFBIG)
			error = xfs_iext_count_upgrade(args->trans, dp,
					XFS_IEXT_ATTR_MANIP_CNT(rmt_blks));
1046 1047 1048 1049
		if (error)
			goto out_trans_cancel;
	}

D
Dave Chinner 已提交
1050
	error = xfs_attr_lookup(args);
1051 1052 1053 1054 1055 1056 1057 1058 1059
	switch (error) {
	case -EEXIST:
		/* if no value, we are performing a remove operation */
		if (!args->value) {
			error = xfs_attr_defer_remove(args);
			break;
		}
		/* Pure create fails if the attr already exists */
		if (args->attr_flags & XATTR_CREATE)
1060 1061
			goto out_trans_cancel;

1062 1063 1064 1065 1066
		error = xfs_attr_defer_replace(args);
		break;
	case -ENOATTR:
		/* Can't remove what isn't there. */
		if (!args->value)
1067
			goto out_trans_cancel;
1068

1069 1070
		/* Pure replace fails if no existing attr to replace. */
		if (args->attr_flags & XATTR_REPLACE)
1071 1072
			goto out_trans_cancel;

1073 1074 1075 1076
		error = xfs_attr_defer_add(args);
		break;
	default:
		goto out_trans_cancel;
1077
	}
1078 1079
	if (error)
		goto out_trans_cancel;
L
Linus Torvalds 已提交
1080 1081 1082 1083 1084

	/*
	 * If this is a synchronous mount, make sure that the
	 * transaction goes to disk before returning to the user.
	 */
1085
	if (xfs_has_wsync(mp))
1086
		xfs_trans_set_sync(args->trans);
L
Linus Torvalds 已提交
1087

1088
	if (!(args->op_flags & XFS_DA_OP_NOTIME))
1089
		xfs_trans_ichgtime(args->trans, dp, XFS_ICHGTIME_CHG);
1090

L
Linus Torvalds 已提交
1091 1092 1093
	/*
	 * Commit the last in the sequence of transactions.
	 */
1094 1095
	xfs_trans_log_inode(args->trans, dp, XFS_ILOG_CORE);
	error = xfs_trans_commit(args->trans);
1096
out_unlock:
L
Linus Torvalds 已提交
1097
	xfs_iunlock(dp, XFS_ILOCK_EXCL);
1098
	return error;
L
Linus Torvalds 已提交
1099

1100
out_trans_cancel:
1101 1102
	if (args->trans)
		xfs_trans_cancel(args->trans);
1103
	goto out_unlock;
L
Linus Torvalds 已提交
1104 1105 1106 1107 1108 1109
}

/*========================================================================
 * External routines when attribute list is inside the inode
 *========================================================================*/

1110 1111 1112 1113 1114 1115 1116 1117
/*
 * Return the totsize field of the shortform attribute header stored in the
 * inode's attr fork data, converted from big-endian to CPU byte order.
 */
static inline int xfs_attr_sf_totsize(struct xfs_inode *dp)
{
	struct xfs_attr_shortform *sf_hdr =
		(struct xfs_attr_shortform *)dp->i_afp->if_u1.if_data;

	return be16_to_cpu(sf_hdr->hdr.totsize);
}

L
Linus Torvalds 已提交
1118 1119 1120 1121
/*
 * Add a name to the shortform attribute list structure
 * This is the external routine.
 */
1122 1123 1124
static int
xfs_attr_shortform_addname(
	struct xfs_da_args	*args)
L
Linus Torvalds 已提交
1125
{
1126 1127
	int			newsize, forkoff;
	int			error;
L
Linus Torvalds 已提交
1128

1129 1130
	trace_xfs_attr_sf_addname(args);

1131 1132 1133 1134 1135 1136 1137 1138 1139 1140 1141 1142 1143 1144
	error = xfs_attr_shortform_lookup(args);
	switch (error) {
	case -ENOATTR:
		if (args->op_flags & XFS_DA_OP_REPLACE)
			return error;
		break;
	case -EEXIST:
		if (!(args->op_flags & XFS_DA_OP_REPLACE))
			return error;

		error = xfs_attr_sf_removename(args);
		if (error)
			return error;

1145
		/*
1146 1147 1148 1149
		 * Since we have removed the old attr, clear XFS_DA_OP_REPLACE
		 * so that the new attr doesn't fit in shortform format, the
		 * leaf format add routine won't trip over the attr not being
		 * around.
1150
		 */
1151 1152 1153 1154 1155 1156
		args->op_flags &= ~XFS_DA_OP_REPLACE;
		break;
	case 0:
		break;
	default:
		return error;
L
Linus Torvalds 已提交
1157 1158
	}

1159 1160
	if (args->namelen >= XFS_ATTR_SF_ENTSIZE_MAX ||
	    args->valuelen >= XFS_ATTR_SF_ENTSIZE_MAX)
D
Dave Chinner 已提交
1161
		return -ENOSPC;
1162

1163 1164
	newsize = xfs_attr_sf_totsize(args->dp);
	newsize += xfs_attr_sf_entsize_byname(args->namelen, args->valuelen);
1165 1166 1167

	forkoff = xfs_attr_shortform_bytesfit(args->dp, newsize);
	if (!forkoff)
D
Dave Chinner 已提交
1168
		return -ENOSPC;
1169 1170

	xfs_attr_shortform_add(args, forkoff);
E
Eric Sandeen 已提交
1171
	return 0;
L
Linus Torvalds 已提交
1172 1173 1174 1175 1176 1177 1178
}


/*========================================================================
 * External routines when attribute list is one block
 *========================================================================*/

1179 1180
/* Save the current remote block info and clear the current pointers. */
static void
1181 1182 1183 1184 1185 1186 1187 1188
xfs_attr_save_rmt_blk(
	struct xfs_da_args	*args)
{
	args->blkno2 = args->blkno;
	args->index2 = args->index;
	args->rmtblkno2 = args->rmtblkno;
	args->rmtblkcnt2 = args->rmtblkcnt;
	args->rmtvaluelen2 = args->rmtvaluelen;
1189 1190 1191
	args->rmtblkno = 0;
	args->rmtblkcnt = 0;
	args->rmtvaluelen = 0;
1192 1193 1194
}

/* Set stored info about a remote block */
1195
static void
1196 1197 1198 1199 1200 1201 1202 1203 1204 1205
xfs_attr_restore_rmt_blk(
	struct xfs_da_args	*args)
{
	args->blkno = args->blkno2;
	args->index = args->index2;
	args->rmtblkno = args->rmtblkno2;
	args->rmtblkcnt = args->rmtblkcnt2;
	args->rmtvaluelen = args->rmtvaluelen2;
}

L
Linus Torvalds 已提交
1206
/*
1207
 * Tries to add an attribute to an inode in leaf form
L
Linus Torvalds 已提交
1208
 *
1209 1210 1211 1212 1213 1214
 * This function is meant to execute as part of a delayed operation and leaves
 * the transaction handling to the caller.  On success the attribute is added
 * and the inode and transaction are left dirty.  If there is not enough space,
 * the attr data is converted to node format and -ENOSPC is returned. Caller is
 * responsible for handling the dirty inode and transaction or adding the attr
 * in node format.
L
Linus Torvalds 已提交
1215
 */
D
David Chinner 已提交
1216
STATIC int
1217 1218 1219
xfs_attr_leaf_try_add(
	struct xfs_da_args	*args,
	struct xfs_buf		*bp)
L
Linus Torvalds 已提交
1220
{
1221
	int			error;
1222

L
Linus Torvalds 已提交
1223
	/*
1224 1225 1226 1227
	 * If the caller provided a buffer to us, it is locked and held in
	 * the transaction because it just did a shortform to leaf conversion.
	 * Hence we don't need to read it again. Otherwise read in the leaf
	 * buffer.
L
Linus Torvalds 已提交
1228
	 */
1229 1230 1231 1232 1233 1234 1235 1236 1237 1238 1239 1240
	if (bp) {
		xfs_trans_bhold_release(args->trans, bp);
	} else {
		error = xfs_attr3_leaf_read(args->trans, args->dp, 0, &bp);
		if (error)
			return error;
	}

	/*
	 * Look up the xattr name to set the insertion point for the new xattr.
	 */
	error = xfs_attr3_leaf_lookup_int(bp, args);
1241 1242 1243 1244 1245 1246 1247
	switch (error) {
	case -ENOATTR:
		if (args->op_flags & XFS_DA_OP_REPLACE)
			goto out_brelse;
		break;
	case -EEXIST:
		if (!(args->op_flags & XFS_DA_OP_REPLACE))
1248
			goto out_brelse;
1249 1250

		trace_xfs_attr_leaf_replace(args);
1251
		/*
1252 1253
		 * Save the existing remote attr state so that the current
		 * values reflect the state of the new attribute we are about to
1254 1255
		 * add, not the attribute we just found and will remove later.
		 */
1256 1257 1258 1259 1260 1261
		xfs_attr_save_rmt_blk(args);
		break;
	case 0:
		break;
	default:
		goto out_brelse;
L
Linus Torvalds 已提交
1262 1263
	}

1264 1265
	return xfs_attr3_leaf_add(bp, args);

1266 1267
out_brelse:
	xfs_trans_brelse(args->trans, bp);
1268
	return error;
1269
}
L
Linus Torvalds 已提交
1270

1271 1272 1273 1274 1275 1276 1277 1278 1279 1280 1281 1282 1283 1284 1285 1286 1287 1288 1289 1290 1291
/*
 * Return EEXIST if attr is found, or ENOATTR if not.
 *
 * Reads the leaf block at offset 0 of the attr fork into *bp and looks the
 * name up in it.  On -EEXIST or -ENOATTR the buffer is left in *bp for the
 * caller to release; on any other lookup result it is released here.  If the
 * read itself fails, its error is returned without touching the buffer.
 */
STATIC int
xfs_attr_leaf_hasname(
	struct xfs_da_args	*args,
	struct xfs_buf		**bp)
{
	int			error;

	error = xfs_attr3_leaf_read(args->trans, args->dp, 0, bp);
	if (error)
		return error;

	error = xfs_attr3_leaf_lookup_int(*bp, args);
	switch (error) {
	case -ENOATTR:
	case -EEXIST:
		/* Expected answers: hand the buffer back to the caller. */
		break;
	default:
		xfs_trans_brelse(args->trans, *bp);
		break;
	}

	return error;
}

L
Linus Torvalds 已提交
1292 1293 1294 1295 1296 1297 1298
/*
 * Remove a name from the leaf attribute list structure
 *
 * This leaf block cannot have a "remote" value, we only call this routine
 * if bmap_one_block() says there is only one block (ie: no remote blks).
 */
STATIC int
1299 1300
xfs_attr_leaf_removename(
	struct xfs_da_args	*args)
L
Linus Torvalds 已提交
1301
{
1302 1303 1304
	struct xfs_inode	*dp;
	struct xfs_buf		*bp;
	int			error, forkoff;
L
Linus Torvalds 已提交
1305

1306 1307
	trace_xfs_attr_leaf_removename(args);

L
Linus Torvalds 已提交
1308 1309 1310 1311 1312
	/*
	 * Remove the attribute.
	 */
	dp = args->dp;

1313
	error = xfs_attr_leaf_hasname(args, &bp);
D
Dave Chinner 已提交
1314
	if (error == -ENOATTR) {
1315
		xfs_trans_brelse(args->trans, bp);
1316 1317
		if (args->op_flags & XFS_DA_OP_RECOVERY)
			return 0;
D
Dave Chinner 已提交
1318
		return error;
1319 1320
	} else if (error != -EEXIST)
		return error;
L
Linus Torvalds 已提交
1321

D
Dave Chinner 已提交
1322
	xfs_attr3_leaf_remove(bp, args);
L
Linus Torvalds 已提交
1323 1324 1325 1326

	/*
	 * If the result is small enough, shrink it all into the inode.
	 */
1327 1328 1329
	forkoff = xfs_attr_shortform_allfit(bp, dp);
	if (forkoff)
		return xfs_attr3_leaf_to_shortform(bp, args, forkoff);
L
Linus Torvalds 已提交
1330
		/* bp is gone due to xfs_da_shrink_inode */
1331

D
Dave Chinner 已提交
1332
	return 0;
L
Linus Torvalds 已提交
1333 1334 1335 1336 1337 1338 1339
}

/*
 * Look up a name in a leaf attribute list structure.
 *
 * This leaf block cannot have a "remote" value, we only call this routine
 * if bmap_one_block() says there is only one block (ie: no remote blks).
1340 1341
 *
 * Returns 0 on successful retrieval, otherwise an error.
L
Linus Torvalds 已提交
1342
 */
1343
STATIC int
L
Linus Torvalds 已提交
1344 1345
xfs_attr_leaf_get(xfs_da_args_t *args)
{
1346
	struct xfs_buf *bp;
L
Linus Torvalds 已提交
1347 1348
	int error;

1349 1350
	trace_xfs_attr_leaf_get(args);

1351
	error = xfs_attr_leaf_hasname(args, &bp);
L
Linus Torvalds 已提交
1352

1353
	if (error == -ENOATTR)  {
1354
		xfs_trans_brelse(args->trans, bp);
D
Dave Chinner 已提交
1355
		return error;
1356 1357 1358 1359
	} else if (error != -EEXIST)
		return error;


D
Dave Chinner 已提交
1360
	error = xfs_attr3_leaf_getvalue(bp, args);
1361
	xfs_trans_brelse(args->trans, bp);
1362
	return error;
L
Linus Torvalds 已提交
1363 1364
}

1365
/* Return EEXIST if attr is found, or ENOATTR if not. */
1366
STATIC int
1367
xfs_attr_node_lookup(
1368
	struct xfs_da_args	*args,
1369
	struct xfs_da_state	*state)
1370 1371 1372 1373 1374 1375 1376
{
	int			retval, error;

	/*
	 * Search to see if name exists, and get back a pointer to it.
	 */
	error = xfs_da3_node_lookup_int(state, &retval);
1377
	if (error)
1378
		return error;
1379

1380 1381 1382
	return retval;
}

L
Linus Torvalds 已提交
1383
/*========================================================================
1384
 * External routines when attribute list size > geo->blksize
L
Linus Torvalds 已提交
1385 1386 1387
 *========================================================================*/

STATIC int
1388
xfs_attr_node_addname_find_attr(
1389
	 struct xfs_attr_intent	*attr)
L
Linus Torvalds 已提交
1390
{
1391 1392
	struct xfs_da_args	*args = attr->xattri_da_args;
	int			error;
1393

L
Linus Torvalds 已提交
1394 1395 1396 1397
	/*
	 * Search to see if name already exists, and get back a pointer
	 * to where it should go.
	 */
1398 1399
	xfs_attr_item_init_da_state(attr);
	error = xfs_attr_node_lookup(args, attr->xattri_da_state);
1400 1401 1402 1403 1404 1405 1406
	switch (error) {
	case -ENOATTR:
		if (args->op_flags & XFS_DA_OP_REPLACE)
			goto error;
		break;
	case -EEXIST:
		if (!(args->op_flags & XFS_DA_OP_REPLACE))
1407
			goto error;
1408

1409

1410
		trace_xfs_attr_node_replace(args);
1411
		/*
1412 1413
		 * Save the existing remote attr state so that the current
		 * values reflect the state of the new attribute we are about to
1414 1415
		 * add, not the attribute we just found and will remove later.
		 */
1416 1417 1418 1419 1420 1421
		xfs_attr_save_rmt_blk(args);
		break;
	case 0:
		break;
	default:
		goto error;
L
Linus Torvalds 已提交
1422 1423
	}

1424 1425
	return 0;
error:
1426
	if (attr->xattri_da_state) {
1427
		xfs_da_state_free(attr->xattri_da_state);
1428 1429
		attr->xattri_da_state = NULL;
	}
1430
	return error;
1431 1432 1433 1434 1435 1436 1437 1438 1439
}

/*
 * Add a name to a Btree-format attribute list.
 *
 * This will involve walking down the Btree, and may involve splitting
 * leaf nodes and even splitting intermediate nodes up to and including
 * the root node (a special case of an intermediate node).
 */
1440 1441
static int
xfs_attr_node_try_addname(
1442
	struct xfs_attr_intent		*attr)
1443
{
1444 1445
	struct xfs_da_args		*args = attr->xattri_da_args;
	struct xfs_da_state		*state = attr->xattri_da_state;
1446 1447
	struct xfs_da_state_blk		*blk;
	int				error;
1448 1449 1450 1451 1452 1453

	trace_xfs_attr_node_addname(args);

	blk = &state->path.blk[state->path.active-1];
	ASSERT(blk->magic == XFS_ATTR_LEAF_MAGIC);

1454 1455
	error = xfs_attr3_leaf_add(blk->bp, state->args);
	if (error == -ENOSPC) {
L
Linus Torvalds 已提交
1456 1457 1458 1459
		if (state->path.active == 1) {
			/*
			 * Its really a single leaf node, but it had
			 * out-of-line values so it looked like it *might*
1460
			 * have been a b-tree. Let the caller deal with this.
L
Linus Torvalds 已提交
1461
			 */
1462
			goto out;
L
Linus Torvalds 已提交
1463 1464 1465 1466 1467 1468 1469 1470
		}

		/*
		 * Split as many Btree elements as required.
		 * This code tracks the new and old attr's location
		 * in the index/blkno/rmtblkno/rmtblkcnt fields and
		 * in the index2/blkno2/rmtblkno2/rmtblkcnt2 fields.
		 */
1471
		error = xfs_da3_split(state);
1472
		if (error)
1473
			goto out;
L
Linus Torvalds 已提交
1474 1475 1476 1477
	} else {
		/*
		 * Addition succeeded, update Btree hashvals.
		 */
1478
		xfs_da3_fixhashpath(state, &state->path);
L
Linus Torvalds 已提交
1479 1480
	}

1481
out:
1482
	xfs_da_state_free(state);
1483
	attr->xattri_da_state = NULL;
1484
	return error;
1485 1486
}

D
Dave Chinner 已提交
1487 1488 1489 1490 1491 1492 1493 1494 1495 1496 1497 1498 1499 1500 1501 1502 1503 1504
/*
 * Remove the name from the leaf block at the end of the @state path and
 * update the hashvals in the tree.  Returns whatever xfs_attr3_leaf_remove()
 * returned.
 */
static int
xfs_attr_node_removename(
	struct xfs_da_args	*args,
	struct xfs_da_state	*state)
{
	struct xfs_da_state_blk	*leaf_blk =
				&state->path.blk[state->path.active - 1];
	int			ret;

	ASSERT(leaf_blk->magic == XFS_ATTR_LEAF_MAGIC);

	ret = xfs_attr3_leaf_remove(leaf_blk->bp, args);
	xfs_da3_fixhashpath(state, &state->path);

	return ret;
}
1505

1506 1507
static int
xfs_attr_node_remove_attr(
1508
	struct xfs_attr_intent		*attr)
1509
{
1510
	struct xfs_da_args		*args = attr->xattri_da_args;
1511
	struct xfs_da_state		*state = xfs_da_state_alloc(args);
1512 1513 1514
	int				retval = 0;
	int				error = 0;

1515
	/*
1516 1517 1518
	 * The attr we are removing has already been marked incomplete, so
	 * we need to set the filter appropriately to re-find the "old"
	 * attribute entry after any split ops.
1519
	 */
1520
	args->attr_filter |= XFS_ATTR_INCOMPLETE;
1521 1522 1523
	error = xfs_da3_node_lookup_int(state, &retval);
	if (error)
		goto out;
L
Linus Torvalds 已提交
1524

1525
	error = xfs_attr_node_removename(args, state);
L
Linus Torvalds 已提交
1526

1527 1528 1529 1530 1531
	/*
	 * Check to see if the tree needs to be collapsed.
	 */
	if (retval && (state->path.active > 1)) {
		error = xfs_da3_join(state);
L
Linus Torvalds 已提交
1532 1533 1534 1535 1536 1537
		if (error)
			goto out;
	}
	retval = error = 0;

out:
1538
	xfs_da_state_free(state);
L
Linus Torvalds 已提交
1539
	if (error)
E
Eric Sandeen 已提交
1540 1541
		return error;
	return retval;
L
Linus Torvalds 已提交
1542 1543 1544
}

/*
1545
 * Retrieve the attribute data from a node attribute list.
L
Linus Torvalds 已提交
1546 1547 1548 1549
 *
 * This routine gets called for any attribute fork that has more than one
 * block, ie: both true Btree attr lists and for single-leaf-blocks with
 * "remote" values taking up more blocks.
1550 1551
 *
 * Returns 0 on successful retrieval, otherwise an error.
L
Linus Torvalds 已提交
1552
 */
1553
STATIC int
1554 1555
xfs_attr_node_get(
	struct xfs_da_args	*args)
L
Linus Torvalds 已提交
1556
{
1557
	struct xfs_da_state	*state;
1558 1559 1560
	struct xfs_da_state_blk	*blk;
	int			i;
	int			error;
L
Linus Torvalds 已提交
1561

1562 1563
	trace_xfs_attr_node_get(args);

L
Linus Torvalds 已提交
1564 1565 1566
	/*
	 * Search to see if name exists, and get back a pointer to it.
	 */
1567 1568
	state = xfs_da_state_alloc(args);
	error = xfs_attr_node_lookup(args, state);
1569
	if (error != -EEXIST)
1570 1571 1572 1573 1574 1575
		goto out_release;

	/*
	 * Get the value, local or "remote"
	 */
	blk = &state->path.blk[state->path.active - 1];
1576
	error = xfs_attr3_leaf_getvalue(blk->bp, args);
L
Linus Torvalds 已提交
1577 1578 1579 1580

	/*
	 * If not in a transaction, we have to release all the buffers.
	 */
1581
out_release:
1582
	for (i = 0; state != NULL && i < state->path.active; i++) {
1583
		xfs_trans_brelse(args->trans, state->path.blk[i].bp);
L
Linus Torvalds 已提交
1584 1585 1586
		state->path.blk[i].bp = NULL;
	}

1587
	xfs_da_state_free(state);
1588
	return error;
L
Linus Torvalds 已提交
1589
}
1590 1591 1592 1593 1594 1595 1596 1597 1598 1599 1600 1601 1602 1603 1604 1605 1606

/*
 * Returns true if the attribute entry name is valid.
 *
 * A name is valid when its length is below MAXNAMELEN and none of its first
 * @length bytes is a null byte.
 */
bool
xfs_attr_namecheck(
	const void	*name,
	size_t		length)
{
	/*
	 * MAXNAMELEN includes the trailing null, but (name/length) leave it
	 * out, so the length has to be strictly smaller.
	 */
	bool		fits = length < MAXNAMELEN;

	/* There shouldn't be any nulls inside the name itself. */
	return fits && memchr(name, 0, length) == NULL;
}
1607 1608 1609 1610

/*
 * Create the kmem cache used for struct xfs_attr_intent allocations and
 * store it in xfs_attr_intent_cache.  Returns 0 on success or -ENOMEM if the
 * cache could not be created.
 */
int __init
xfs_attr_intent_init_cache(void)
{
	xfs_attr_intent_cache = kmem_cache_create("xfs_attr_intent",
			sizeof(struct xfs_attr_intent), 0, 0, NULL);
	if (!xfs_attr_intent_cache)
		return -ENOMEM;

	return 0;
}

/*
 * Destroy the xfs_attr_intent kmem cache and reset the global pointer to
 * NULL afterwards.
 */
void
xfs_attr_intent_destroy_cache(void)
{
	struct kmem_cache	*cache = xfs_attr_intent_cache;

	kmem_cache_destroy(cache);
	xfs_attr_intent_cache = NULL;
}