// SPDX-License-Identifier: GPL-2.0
/*
 * Copyright (c) 2000-2005 Silicon Graphics, Inc.
 * All Rights Reserved.
 */
#include "xfs.h"
7
#include "xfs_fs.h"
8
#include "xfs_shared.h"
9 10 11
#include "xfs_format.h"
#include "xfs_log_format.h"
#include "xfs_trans_resv.h"
L
Linus Torvalds 已提交
12
#include "xfs_mount.h"
13
#include "xfs_defer.h"
14
#include "xfs_da_format.h"
15 16
#include "xfs_da_btree.h"
#include "xfs_attr_sf.h"
L
Linus Torvalds 已提交
17
#include "xfs_inode.h"
18
#include "xfs_trans.h"
L
Linus Torvalds 已提交
19
#include "xfs_bmap.h"
20
#include "xfs_bmap_btree.h"
L
Linus Torvalds 已提交
21 22
#include "xfs_attr.h"
#include "xfs_attr_leaf.h"
23
#include "xfs_attr_remote.h"
L
Linus Torvalds 已提交
24 25
#include "xfs_quota.h"
#include "xfs_trans_space.h"
C
Christoph Hellwig 已提交
26
#include "xfs_trace.h"
L
Linus Torvalds 已提交
27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45

/*
 * xfs_attr.c
 *
 * Provide the external interfaces to manage attribute lists.
 */

/*========================================================================
 * Function prototypes for the kernel.
 *========================================================================*/

/*
 * Internal routines when attribute list fits inside the inode.
 */
STATIC int xfs_attr_shortform_addname(xfs_da_args_t *args);

/*
 * Internal routines when attribute list is one block.
 */
46
STATIC int xfs_attr_leaf_get(xfs_da_args_t *args);
L
Linus Torvalds 已提交
47
STATIC int xfs_attr_leaf_removename(xfs_da_args_t *args);
48
STATIC int xfs_attr_leaf_hasname(struct xfs_da_args *args, struct xfs_buf **bp);
49
STATIC int xfs_attr_leaf_try_add(struct xfs_da_args *args, struct xfs_buf *bp);
L
Linus Torvalds 已提交
50 51 52 53

/*
 * Internal routines when attribute list is more than one block.
 */
54
STATIC int xfs_attr_node_get(xfs_da_args_t *args);
55
STATIC void xfs_attr_restore_rmt_blk(struct xfs_da_args *args);
56 57 58 59
STATIC int xfs_attr_node_addname(struct xfs_delattr_context *dac);
STATIC int xfs_attr_node_addname_find_attr(struct xfs_delattr_context *dac);
STATIC int xfs_attr_node_addname_clear_incomplete(
				struct xfs_delattr_context *dac);
60 61
STATIC int xfs_attr_node_hasname(xfs_da_args_t *args,
				 struct xfs_da_state **state);
L
Linus Torvalds 已提交
62 63
STATIC int xfs_attr_fillstate(xfs_da_state_t *state);
STATIC int xfs_attr_refillstate(xfs_da_state_t *state);
64 65
STATIC int xfs_attr_set_iter(struct xfs_delattr_context *dac,
			     struct xfs_buf **leaf_bp);
66 67
STATIC int xfs_attr_node_removename(struct xfs_da_args *args,
				    struct xfs_da_state *state);
L
Linus Torvalds 已提交
68

69
int
70 71 72 73
xfs_inode_hasattr(
	struct xfs_inode	*ip)
{
	if (!XFS_IFORK_Q(ip) ||
74
	    (ip->i_afp->if_format == XFS_DINODE_FMT_EXTENTS &&
75
	     ip->i_afp->if_nextents == 0))
76 77 78 79
		return 0;
	return 1;
}

80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99
/*
 * Returns true if the there is exactly only block in the attr fork, in which
 * case the attribute fork consists of a single leaf block entry.
 */
bool
xfs_attr_is_leaf(
	struct xfs_inode	*ip)
{
	struct xfs_ifork	*ifp = ip->i_afp;
	struct xfs_iext_cursor	icur;
	struct xfs_bmbt_irec	imap;

	if (ifp->if_nextents != 1 || ifp->if_format != XFS_DINODE_FMT_EXTENTS)
		return false;

	xfs_iext_first(ifp, &icur);
	xfs_iext_get_extent(ifp, &icur, &imap);
	return imap.br_startoff == 0 && imap.br_blockcount == 1;
}

L
Linus Torvalds 已提交
100 101 102 103
/*========================================================================
 * Overall external interface routines.
 *========================================================================*/

104 105 106 107
/*
 * Retrieve an extended attribute and its value.  Must have ilock.
 * Returns 0 on successful retrieval, otherwise an error.
 */
108 109 110 111
int
xfs_attr_get_ilocked(
	struct xfs_da_args	*args)
{
112
	ASSERT(xfs_isilocked(args->dp, XFS_ILOCK_SHARED | XFS_ILOCK_EXCL));
113

114
	if (!xfs_inode_hasattr(args->dp))
115
		return -ENOATTR;
116

117
	if (args->dp->i_afp->if_format == XFS_DINODE_FMT_LOCAL)
118
		return xfs_attr_shortform_getvalue(args);
119
	if (xfs_attr_is_leaf(args->dp))
120
		return xfs_attr_leaf_get(args);
121
	return xfs_attr_node_get(args);
122 123
}

124 125 126
/*
 * Retrieve an extended attribute by name, and its value if requested.
 *
C
Christoph Hellwig 已提交
127 128 129
 * If args->valuelen is zero, then the caller does not want the value, just an
 * indication whether the attribute exists and the size of the value if it
 * exists. The size is returned in args.valuelen.
130
 *
131 132 133 134 135
 * If args->value is NULL but args->valuelen is non-zero, allocate the buffer
 * for the value after existence of the attribute has been determined. The
 * caller always has to free args->value if it is set, no matter if this
 * function was successful or not.
 *
136
 * If the attribute is found, but exceeds the size limit set by the caller in
137 138
 * args->valuelen, return -ERANGE with the size of the attribute that was found
 * in args->valuelen.
139
 */
140 141
int
xfs_attr_get(
142
	struct xfs_da_args	*args)
L
Linus Torvalds 已提交
143
{
144 145 146
	uint			lock_mode;
	int			error;

147
	XFS_STATS_INC(args->dp->i_mount, xs_attr_get);
148

149
	if (xfs_is_shutdown(args->dp->i_mount))
D
Dave Chinner 已提交
150
		return -EIO;
L
Linus Torvalds 已提交
151

152 153 154
	args->geo = args->dp->i_mount->m_attr_geo;
	args->whichfork = XFS_ATTR_FORK;
	args->hashval = xfs_da_hashname(args->name, args->namelen);
155

156
	/* Entirely possible to look up a name which doesn't exist */
157
	args->op_flags = XFS_DA_OP_OKNOENT;
L
Linus Torvalds 已提交
158

159
	lock_mode = xfs_ilock_attr_map_shared(args->dp);
160
	error = xfs_attr_get_ilocked(args);
161
	xfs_iunlock(args->dp, lock_mode);
162

163
	return error;
L
Linus Torvalds 已提交
164 165
}

166 167 168
/*
 * Calculate how many blocks we need for the new attribute,
 */
169
STATIC int
170
xfs_attr_calc_size(
171
	struct xfs_da_args	*args,
172 173
	int			*local)
{
174
	struct xfs_mount	*mp = args->dp->i_mount;
175 176 177 178 179 180 181
	int			size;
	int			nblks;

	/*
	 * Determine space new attribute will use, and if it would be
	 * "local" or "remote" (note: local != inline).
	 */
182
	size = xfs_attr_leaf_newentsize(args, local);
183 184
	nblks = XFS_DAENTER_SPACE_RES(mp, XFS_ATTR_FORK);
	if (*local) {
185
		if (size > (args->geo->blksize / 2)) {
186 187 188 189 190 191 192 193
			/* Double split possible */
			nblks *= 2;
		}
	} else {
		/*
		 * Out of line attribute, cannot double split, but
		 * make room for the attribute value itself.
		 */
194
		uint	dblocks = xfs_attr3_rmt_blocks(mp, args->valuelen);
195 196 197 198 199 200 201
		nblks += dblocks;
		nblks += XFS_NEXTENTADD_SPACE_RES(mp, dblocks, XFS_ATTR_FORK);
	}

	return nblks;
}

202 203 204 205 206 207
STATIC int
xfs_attr_try_sf_addname(
	struct xfs_inode	*dp,
	struct xfs_da_args	*args)
{

208 209 210 211 212 213 214
	int			error;

	/*
	 * Build initial attribute list (if required).
	 */
	if (dp->i_afp->if_format == XFS_DINODE_FMT_EXTENTS)
		xfs_attr_shortform_create(args);
215 216 217 218 219 220 221 222 223

	error = xfs_attr_shortform_addname(args);
	if (error == -ENOSPC)
		return error;

	/*
	 * Commit the shortform mods, and we're done.
	 * NOTE: this is also the error path (EEXIST, etc).
	 */
224
	if (!error && !(args->op_flags & XFS_DA_OP_NOTIME))
225 226
		xfs_trans_ichgtime(args->trans, dp, XFS_ICHGTIME_CHG);

227
	if (xfs_has_wsync(dp->i_mount))
228 229
		xfs_trans_set_sync(args->trans);

230
	return error;
231 232
}

233 234 235 236 237 238 239 240 241 242 243 244 245
/*
 * Check to see if the attr should be upgraded from non-existent or shortform to
 * single-leaf-block attribute list.
 */
static inline bool
xfs_attr_is_shortform(
	struct xfs_inode    *ip)
{
	return ip->i_afp->if_format == XFS_DINODE_FMT_LOCAL ||
	       (ip->i_afp->if_format == XFS_DINODE_FMT_EXTENTS &&
		ip->i_afp->if_nextents == 0);
}

246 247 248 249
/*
 * Checks to see if a delayed attribute transaction should be rolled.  If so,
 * transaction is finished or rolled as needed.
 */
250
STATIC int
251 252 253 254 255 256 257 258 259 260 261 262 263 264 265 266 267 268 269 270
xfs_attr_trans_roll(
	struct xfs_delattr_context	*dac)
{
	struct xfs_da_args		*args = dac->da_args;
	int				error;

	if (dac->flags & XFS_DAC_DEFER_FINISH) {
		/*
		 * The caller wants us to finish all the deferred ops so that we
		 * avoid pinning the log tail with a large number of deferred
		 * ops.
		 */
		dac->flags &= ~XFS_DAC_DEFER_FINISH;
		error = xfs_defer_finish(&args->trans);
	} else
		error = xfs_trans_roll_inode(&args->trans, args->dp);

	return error;
}

271 272 273 274 275 276 277 278 279 280 281 282 283 284 285 286 287 288 289 290 291 292 293 294 295 296 297 298 299
/*
 * Set the attribute specified in @args.
 *
 * Drives xfs_attr_set_iter() to completion: every time it asks for another
 * pass with -EAGAIN the transaction is rolled and the iterator is called
 * again.  Any other return value from the iterator ends the loop and is
 * returned as is.
 */
int
xfs_attr_set_args(
	struct xfs_da_args		*args)
{
	struct xfs_buf			*leaf_bp = NULL;
	struct xfs_delattr_context	dac = {
		.da_args	= args,
	};
	int				error;

	for (;;) {
		error = xfs_attr_set_iter(&dac, &leaf_bp);
		if (error != -EAGAIN)
			return error;

		error = xfs_attr_trans_roll(&dac);
		if (error)
			break;
	}

	/* The roll failed; drop the leaf buffer if the iterator left one. */
	if (leaf_bp)
		xfs_trans_brelse(args->trans, leaf_bp);
	return error;
}

300
STATIC int
301
xfs_attr_sf_addname(
302 303
	struct xfs_delattr_context	*dac,
	struct xfs_buf			**leaf_bp)
304
{
305 306 307
	struct xfs_da_args		*args = dac->da_args;
	struct xfs_inode		*dp = args->dp;
	int				error = 0;
308 309 310 311 312

	/*
	 * Try to add the attr to the attribute list in the inode.
	 */
	error = xfs_attr_try_sf_addname(dp, args);
313 314 315 316

	/* Should only be 0, -EEXIST or -ENOSPC */
	if (error != -ENOSPC)
		return error;
317

318 319 320 321
	/*
	 * It won't fit in the shortform, transform to a leaf block.  GROT:
	 * another possible req'mt for a double-split btree op.
	 */
322
	error = xfs_attr_shortform_to_leaf(args, leaf_bp);
323 324 325 326 327 328
	if (error)
		return error;

	/*
	 * Prevent the leaf buffer from being unlocked so that a concurrent AIL
	 * push cannot grab the half-baked leaf buffer and run into problems
329
	 * with the write verifier.
330
	 */
331
	xfs_trans_bhold(args->trans, *leaf_bp);
332

333 334 335 336 337
	/*
	 * We're still in XFS_DAS_UNINIT state here.  We've converted
	 * the attr fork to leaf format and will restart with the leaf
	 * add.
	 */
338
	trace_xfs_attr_sf_addname_return(XFS_DAS_UNINIT, args->dp);
339
	dac->flags |= XFS_DAC_DEFER_FINISH;
340
	return -EAGAIN;
341 342
}

343 344
/*
 * Set the attribute specified in @args.
345 346 347 348
 * This routine is meant to function as a delayed operation, and may return
 * -EAGAIN when the transaction needs to be rolled.  Calling functions will need
 * to handle this, and recall the function until a successful error code is
 * returned.
349 350
 */
int
351 352 353
xfs_attr_set_iter(
	struct xfs_delattr_context	*dac,
	struct xfs_buf			**leaf_bp)
354
{
355 356 357 358 359 360 361 362 363 364 365 366 367 368 369 370
	struct xfs_da_args              *args = dac->da_args;
	struct xfs_inode		*dp = args->dp;
	struct xfs_buf			*bp = NULL;
	int				forkoff, error = 0;

	/* State machine switch */
	switch (dac->dela_state) {
	case XFS_DAS_UNINIT:
		/*
		 * If the fork is shortform, attempt to add the attr. If there
		 * is no space, this converts to leaf format and returns
		 * -EAGAIN with the leaf buffer held across the roll. The caller
		 * will deal with a transaction roll error, but otherwise
		 * release the hold once we return with a clean transaction.
		 */
		if (xfs_attr_is_shortform(dp))
371
			return xfs_attr_sf_addname(dac, leaf_bp);
372 373 374 375
		if (*leaf_bp != NULL) {
			xfs_trans_bhold_release(args->trans, *leaf_bp);
			*leaf_bp = NULL;
		}
376

377 378 379 380 381 382 383 384 385 386 387 388 389 390 391 392 393 394 395 396 397
		if (xfs_attr_is_leaf(dp)) {
			error = xfs_attr_leaf_try_add(args, *leaf_bp);
			if (error == -ENOSPC) {
				error = xfs_attr3_leaf_to_node(args);
				if (error)
					return error;

				/*
				 * Finish any deferred work items and roll the
				 * transaction once more.  The goal here is to
				 * call node_addname with the inode and
				 * transaction in the same state (inode locked
				 * and joined, transaction clean) no matter how
				 * we got to this step.
				 *
				 * At this point, we are still in
				 * XFS_DAS_UNINIT, but when we come back, we'll
				 * be a node, so we'll fall down into the node
				 * handling code below
				 */
				dac->flags |= XFS_DAC_DEFER_FINISH;
398 399
				trace_xfs_attr_set_iter_return(
					dac->dela_state, args->dp);
400 401
				return -EAGAIN;
			} else if (error) {
402
				return error;
403
			}
404

405 406 407
			dac->dela_state = XFS_DAS_FOUND_LBLK;
		} else {
			error = xfs_attr_node_addname_find_attr(dac);
408 409 410
			if (error)
				return error;

411
			error = xfs_attr_node_addname(dac);
412 413 414
			if (error)
				return error;

415
			dac->dela_state = XFS_DAS_FOUND_NBLK;
416
		}
417
		trace_xfs_attr_set_iter_return(dac->dela_state,	args->dp);
418 419
		return -EAGAIN;
	case XFS_DAS_FOUND_LBLK:
420 421 422 423 424 425
		/*
		 * If there was an out-of-line value, allocate the blocks we
		 * identified for its storage and copy the value.  This is done
		 * after we create the attribute so that we don't overflow the
		 * maximum size of a transaction and/or hit a deadlock.
		 */
426 427 428 429 430 431 432 433 434 435 436 437 438 439 440 441 442

		/* Open coded xfs_attr_rmtval_set without trans handling */
		if ((dac->flags & XFS_DAC_LEAF_ADDNAME_INIT) == 0) {
			dac->flags |= XFS_DAC_LEAF_ADDNAME_INIT;
			if (args->rmtblkno > 0) {
				error = xfs_attr_rmtval_find_space(dac);
				if (error)
					return error;
			}
		}

		/*
		 * Repeat allocating remote blocks for the attr value until
		 * blkcnt drops to zero.
		 */
		if (dac->blkcnt > 0) {
			error = xfs_attr_rmtval_set_blk(dac);
443 444
			if (error)
				return error;
445 446
			trace_xfs_attr_set_iter_return(dac->dela_state,
						       args->dp);
447
			return -EAGAIN;
448 449
		}

450 451 452 453 454 455 456 457
		error = xfs_attr_rmtval_set_value(args);
		if (error)
			return error;

		/*
		 * If this is not a rename, clear the incomplete flag and we're
		 * done.
		 */
458 459 460
		if (!(args->op_flags & XFS_DA_OP_RENAME)) {
			if (args->rmtblkno > 0)
				error = xfs_attr3_leaf_clearflag(args);
461
			return error;
462
		}
463

464 465 466 467 468 469 470 471 472 473 474 475 476 477 478 479
		/*
		 * If this is an atomic rename operation, we must "flip" the
		 * incomplete flags on the "new" and "old" attribute/value pairs
		 * so that one disappears and one appears atomically.  Then we
		 * must remove the "old" attribute/value pair.
		 *
		 * In a separate transaction, set the incomplete flag on the
		 * "old" attr and clear the incomplete flag on the "new" attr.
		 */
		error = xfs_attr3_leaf_flipflags(args);
		if (error)
			return error;
		/*
		 * Commit the flag value change and start the next trans in
		 * series.
		 */
480
		dac->dela_state = XFS_DAS_FLIP_LFLAG;
481
		trace_xfs_attr_set_iter_return(dac->dela_state, args->dp);
482 483
		return -EAGAIN;
	case XFS_DAS_FLIP_LFLAG:
484 485 486 487 488
		/*
		 * Dismantle the "old" attribute/value pair by removing a
		 * "remote" value (if it exists).
		 */
		xfs_attr_restore_rmt_blk(args);
489 490 491
		error = xfs_attr_rmtval_invalidate(args);
		if (error)
			return error;
492

493
		fallthrough;
494 495 496
	case XFS_DAS_RM_LBLK:
		/* Set state in case xfs_attr_rmtval_remove returns -EAGAIN */
		dac->dela_state = XFS_DAS_RM_LBLK;
497
		if (args->rmtblkno) {
498
			error = xfs_attr_rmtval_remove(dac);
499 500 501
			if (error == -EAGAIN)
				trace_xfs_attr_set_iter_return(
					dac->dela_state, args->dp);
502 503 504
			if (error)
				return error;

505
			dac->dela_state = XFS_DAS_RD_LEAF;
506
			trace_xfs_attr_set_iter_return(dac->dela_state, args->dp);
507
			return -EAGAIN;
508 509
		}

510
		fallthrough;
511
	case XFS_DAS_RD_LEAF:
512
		/*
513 514 515
		 * This is the last step for leaf format. Read the block with
		 * the old attr, remove the old attr, check for shortform
		 * conversion and return.
516 517 518 519 520 521 522 523 524 525 526 527 528 529
		 */
		error = xfs_attr3_leaf_read(args->trans, args->dp, args->blkno,
					   &bp);
		if (error)
			return error;

		xfs_attr3_leaf_remove(bp, args);

		forkoff = xfs_attr_shortform_allfit(bp, dp);
		if (forkoff)
			error = xfs_attr3_leaf_to_shortform(bp, args, forkoff);
			/* bp is gone due to xfs_da_shrink_inode */

		return error;
530

531 532 533 534 535 536 537 538 539 540
	case XFS_DAS_FOUND_NBLK:
		/*
		 * Find space for remote blocks and fall into the allocation
		 * state.
		 */
		if (args->rmtblkno > 0) {
			error = xfs_attr_rmtval_find_space(dac);
			if (error)
				return error;
		}
541

542
		fallthrough;
543 544 545 546 547 548 549 550 551 552 553 554 555
	case XFS_DAS_ALLOC_NODE:
		/*
		 * If there was an out-of-line value, allocate the blocks we
		 * identified for its storage and copy the value.  This is done
		 * after we create the attribute so that we don't overflow the
		 * maximum size of a transaction and/or hit a deadlock.
		 */
		dac->dela_state = XFS_DAS_ALLOC_NODE;
		if (args->rmtblkno > 0) {
			if (dac->blkcnt > 0) {
				error = xfs_attr_rmtval_set_blk(dac);
				if (error)
					return error;
556 557
				trace_xfs_attr_set_iter_return(
					dac->dela_state, args->dp);
558 559 560 561 562 563 564
				return -EAGAIN;
			}

			error = xfs_attr_rmtval_set_value(args);
			if (error)
				return error;
		}
565

566 567 568 569 570 571 572 573 574
		/*
		 * If this was not a rename, clear the incomplete flag and we're
		 * done.
		 */
		if (!(args->op_flags & XFS_DA_OP_RENAME)) {
			if (args->rmtblkno > 0)
				error = xfs_attr3_leaf_clearflag(args);
			goto out;
		}
575

576 577 578 579 580 581 582 583 584 585
		/*
		 * If this is an atomic rename operation, we must "flip" the
		 * incomplete flags on the "new" and "old" attribute/value pairs
		 * so that one disappears and one appears atomically.  Then we
		 * must remove the "old" attribute/value pair.
		 *
		 * In a separate transaction, set the incomplete flag on the
		 * "old" attr and clear the incomplete flag on the "new" attr.
		 */
		error = xfs_attr3_leaf_flipflags(args);
586
		if (error)
587
			goto out;
588
		/*
589 590
		 * Commit the flag value change and start the next trans in
		 * series
591
		 */
592
		dac->dela_state = XFS_DAS_FLIP_NFLAG;
593
		trace_xfs_attr_set_iter_return(dac->dela_state, args->dp);
594
		return -EAGAIN;
595

596 597 598 599 600 601
	case XFS_DAS_FLIP_NFLAG:
		/*
		 * Dismantle the "old" attribute/value pair by removing a
		 * "remote" value (if it exists).
		 */
		xfs_attr_restore_rmt_blk(args);
602 603 604 605 606

		error = xfs_attr_rmtval_invalidate(args);
		if (error)
			return error;

607
		fallthrough;
608 609 610 611
	case XFS_DAS_RM_NBLK:
		/* Set state in case xfs_attr_rmtval_remove returns -EAGAIN */
		dac->dela_state = XFS_DAS_RM_NBLK;
		if (args->rmtblkno) {
612
			error = xfs_attr_rmtval_remove(dac);
613 614 615 616
			if (error == -EAGAIN)
				trace_xfs_attr_set_iter_return(
					dac->dela_state, args->dp);

617 618 619 620
			if (error)
				return error;

			dac->dela_state = XFS_DAS_CLR_FLAG;
621
			trace_xfs_attr_set_iter_return(dac->dela_state, args->dp);
622 623
			return -EAGAIN;
		}
624

625
		fallthrough;
626 627 628 629 630 631 632 633
	case XFS_DAS_CLR_FLAG:
		/*
		 * The last state for node format. Look up the old attr and
		 * remove it.
		 */
		error = xfs_attr_node_addname_clear_incomplete(dac);
		break;
	default:
634
		ASSERT(0);
635 636
		break;
	}
637
out:
638
	return error;
639 640
}

641

642 643 644
/*
 * Return EEXIST if attr is found, or ENOATTR if not
 */
D
Dave Chinner 已提交
645 646
static int
xfs_attr_lookup(
647 648 649 650 651 652 653 654 655
	struct xfs_da_args	*args)
{
	struct xfs_inode	*dp = args->dp;
	struct xfs_buf		*bp = NULL;
	int			error;

	if (!xfs_inode_hasattr(dp))
		return -ENOATTR;

C
Christoph Hellwig 已提交
656
	if (dp->i_afp->if_format == XFS_DINODE_FMT_LOCAL)
657 658
		return xfs_attr_sf_findname(args, NULL, NULL);

659
	if (xfs_attr_is_leaf(dp)) {
660 661 662 663 664 665 666 667 668 669 670
		error = xfs_attr_leaf_hasname(args, &bp);

		if (bp)
			xfs_trans_brelse(args->trans, bp);

		return error;
	}

	return xfs_attr_node_hasname(args, NULL);
}

671 672 673 674 675
/*
 * Remove the attribute specified in @args.
 */
int
xfs_attr_remove_args(
676
	struct xfs_da_args	*args)
677
{
678 679 680 681
	int				error;
	struct xfs_delattr_context	dac = {
		.da_args	= args,
	};
682

683 684 685 686 687 688 689 690 691 692 693 694
	do {
		error = xfs_attr_remove_iter(&dac);
		if (error != -EAGAIN)
			break;

		error = xfs_attr_trans_roll(&dac);
		if (error)
			return error;

	} while (true);

	return error;
695 696
}

697
/*
698
 * Note: If args->value is NULL the attribute will be removed, just like the
699 700
 * Linux ->setattr API.
 */
701 702
int
xfs_attr_set(
703
	struct xfs_da_args	*args)
L
Linus Torvalds 已提交
704
{
705
	struct xfs_inode	*dp = args->dp;
706 707
	struct xfs_mount	*mp = dp->i_mount;
	struct xfs_trans_res	tres;
708
	bool			rsvd = (args->attr_filter & XFS_ATTR_ROOT);
709
	int			error, local;
710
	int			rmt_blks = 0;
711
	unsigned int		total;
712

713
	if (xfs_is_shutdown(dp->i_mount))
D
Dave Chinner 已提交
714
		return -EIO;
715

716 717 718 719
	error = xfs_qm_dqattach(dp);
	if (error)
		return error;

720 721 722
	args->geo = mp->m_attr_geo;
	args->whichfork = XFS_ATTR_FORK;
	args->hashval = xfs_da_hashname(args->name, args->namelen);
L
Linus Torvalds 已提交
723 724

	/*
725 726 727
	 * We have no control over the attribute names that userspace passes us
	 * to remove, so we have to allow the name lookup prior to attribute
	 * removal to fail as well.
L
Linus Torvalds 已提交
728
	 */
729
	args->op_flags = XFS_DA_OP_OKNOENT;
730

731
	if (args->value) {
732 733
		XFS_STATS_INC(mp, xs_attr_set);

734 735
		args->op_flags |= XFS_DA_OP_ADDNAME;
		args->total = xfs_attr_calc_size(args, &local);
736 737 738 739 740 741 742

		/*
		 * If the inode doesn't have an attribute fork, add one.
		 * (inode must not be locked when we call this routine)
		 */
		if (XFS_IFORK_Q(dp) == 0) {
			int sf_size = sizeof(struct xfs_attr_sf_hdr) +
743
				xfs_attr_sf_entsize_byname(args->namelen,
744
						args->valuelen);
745 746 747 748 749 750 751

			error = xfs_bmap_add_attrfork(dp, sf_size, rsvd);
			if (error)
				return error;
		}

		tres.tr_logres = M_RES(mp)->tr_attrsetm.tr_logres +
752 753
				 M_RES(mp)->tr_attrsetrt.tr_logres *
					args->total;
754 755
		tres.tr_logcount = XFS_ATTRSET_LOG_COUNT;
		tres.tr_logflags = XFS_TRANS_PERM_LOG_RES;
756
		total = args->total;
757 758 759

		if (!local)
			rmt_blks = xfs_attr3_rmt_blocks(mp, args->valuelen);
760 761
	} else {
		XFS_STATS_INC(mp, xs_attr_remove);
L
Linus Torvalds 已提交
762

763 764
		tres = M_RES(mp)->tr_attrrm;
		total = XFS_ATTRRM_SPACE_RES(mp);
765
		rmt_blks = xfs_attr3_rmt_blocks(mp, XFS_XATTR_SIZE_MAX);
766
	}
L
Linus Torvalds 已提交
767 768 769 770 771

	/*
	 * Root fork attributes can use reserved data blocks for this
	 * operation if necessary
	 */
772
	error = xfs_trans_alloc_inode(dp, &tres, total, 0, rsvd, &args->trans);
773
	if (error)
774
		return error;
L
Linus Torvalds 已提交
775

776 777 778
	if (args->value || xfs_inode_hasattr(dp)) {
		error = xfs_iext_count_may_overflow(dp, XFS_ATTR_FORK,
				XFS_IEXT_ATTR_MANIP_CNT(rmt_blks));
779 780 781
		if (error == -EFBIG)
			error = xfs_iext_count_upgrade(args->trans, dp,
					XFS_IEXT_ATTR_MANIP_CNT(rmt_blks));
782 783 784 785
		if (error)
			goto out_trans_cancel;
	}

D
Dave Chinner 已提交
786
	error = xfs_attr_lookup(args);
787
	if (args->value) {
788 789 790 791 792 793 794
		if (error == -EEXIST && (args->attr_flags & XATTR_CREATE))
			goto out_trans_cancel;
		if (error == -ENOATTR && (args->attr_flags & XATTR_REPLACE))
			goto out_trans_cancel;
		if (error != -ENOATTR && error != -EEXIST)
			goto out_trans_cancel;

795
		error = xfs_attr_set_args(args);
796 797
		if (error)
			goto out_trans_cancel;
798
		/* shortform attribute has already been committed */
799
		if (!args->trans)
800 801
			goto out_unlock;
	} else {
802 803 804
		if (error != -EEXIST)
			goto out_trans_cancel;

805
		error = xfs_attr_remove_args(args);
806 807
		if (error)
			goto out_trans_cancel;
808
	}
L
Linus Torvalds 已提交
809 810 811 812 813

	/*
	 * If this is a synchronous mount, make sure that the
	 * transaction goes to disk before returning to the user.
	 */
814
	if (xfs_has_wsync(mp))
815
		xfs_trans_set_sync(args->trans);
L
Linus Torvalds 已提交
816

817
	if (!(args->op_flags & XFS_DA_OP_NOTIME))
818
		xfs_trans_ichgtime(args->trans, dp, XFS_ICHGTIME_CHG);
819

L
Linus Torvalds 已提交
820 821 822
	/*
	 * Commit the last in the sequence of transactions.
	 */
823 824
	xfs_trans_log_inode(args->trans, dp, XFS_ILOG_CORE);
	error = xfs_trans_commit(args->trans);
825
out_unlock:
L
Linus Torvalds 已提交
826
	xfs_iunlock(dp, XFS_ILOCK_EXCL);
827
	return error;
L
Linus Torvalds 已提交
828

829
out_trans_cancel:
830 831
	if (args->trans)
		xfs_trans_cancel(args->trans);
832
	goto out_unlock;
L
Linus Torvalds 已提交
833 834 835 836 837 838
}

/*========================================================================
 * External routines when attribute list is inside the inode
 *========================================================================*/

839 840 841 842 843 844 845 846
/*
 * Return the totsize field of the shortform attribute header stored in the
 * attr fork data of @dp, converted from big-endian to CPU byte order.
 */
static inline int xfs_attr_sf_totsize(struct xfs_inode *dp)
{
	struct xfs_attr_shortform *sf =
		(struct xfs_attr_shortform *)dp->i_afp->if_u1.if_data;

	return be16_to_cpu(sf->hdr.totsize);
}

L
Linus Torvalds 已提交
847 848 849 850 851 852 853
/*
 * Add a name to the shortform attribute list structure.
 * This is the external routine.
 *
 * Returns 0 once the attribute has been added, -ENOATTR / -EEXIST when the
 * lookup result conflicts with XATTR_REPLACE / XATTR_CREATE, the error from
 * removing an existing entry, or -ENOSPC when the entry cannot be stored in
 * shortform.
 */
STATIC int
xfs_attr_shortform_addname(xfs_da_args_t *args)
{
	struct xfs_inode	*dp = args->dp;
	int			newsize;
	int			forkoff;
	int			retval;

	trace_xfs_attr_sf_addname(args);

	retval = xfs_attr_shortform_lookup(args);
	if (retval == -ENOATTR) {
		if (args->attr_flags & XATTR_REPLACE)
			return retval;
	} else if (retval == -EEXIST) {
		if (args->attr_flags & XATTR_CREATE)
			return retval;

		retval = xfs_attr_sf_removename(args);
		if (retval)
			return retval;

		/*
		 * Since we have removed the old attr, clear XATTR_REPLACE so
		 * that the leaf format add routine won't trip over the attr
		 * not being around.
		 */
		args->attr_flags &= ~XATTR_REPLACE;
	}

	/* Names or values at or over the shortform limit cannot be inline. */
	if (args->namelen >= XFS_ATTR_SF_ENTSIZE_MAX ||
	    args->valuelen >= XFS_ATTR_SF_ENTSIZE_MAX)
		return -ENOSPC;

	/* Size of the shortform list once the new entry has been added. */
	newsize = xfs_attr_sf_totsize(dp);
	newsize += xfs_attr_sf_entsize_byname(args->namelen, args->valuelen);

	forkoff = xfs_attr_shortform_bytesfit(dp, newsize);
	if (!forkoff)
		return -ENOSPC;

	xfs_attr_shortform_add(args, forkoff);
	return 0;
}


/*========================================================================
 * External routines when attribute list is one block
 *========================================================================*/

895 896 897 898 899 900 901 902 903 904 905 906 907 908 909 910 911 912 913 914 915 916 917 918
/*
 * Stash the current block, index and remote value fields of @args in their
 * "2" counterparts so that xfs_attr_restore_rmt_blk() can bring them back.
 */
STATIC void
xfs_attr_save_rmt_blk(
	struct xfs_da_args	*args)
{
	/* Where the entry lives. */
	args->blkno2 = args->blkno;
	args->index2 = args->index;

	/* Where its remote value lives and how large it is. */
	args->rmtblkno2 = args->rmtblkno;
	args->rmtblkcnt2 = args->rmtblkcnt;
	args->rmtvaluelen2 = args->rmtvaluelen;
}

/*
 * Copy the block, index and remote value fields saved by
 * xfs_attr_save_rmt_blk() back from the "2" fields of @args into the primary
 * fields.
 */
STATIC void
xfs_attr_restore_rmt_blk(
	struct xfs_da_args	*args)
{
	/* Where the entry lives. */
	args->blkno = args->blkno2;
	args->index = args->index2;

	/* Where its remote value lives and how large it is. */
	args->rmtblkno = args->rmtblkno2;
	args->rmtblkcnt = args->rmtblkcnt2;
	args->rmtvaluelen = args->rmtvaluelen2;
}

L
Linus Torvalds 已提交
919
/*
920
 * Tries to add an attribute to an inode in leaf form
L
Linus Torvalds 已提交
921
 *
922 923 924 925 926 927
 * This function is meant to execute as part of a delayed operation and leaves
 * the transaction handling to the caller.  On success the attribute is added
 * and the inode and transaction are left dirty.  If there is not enough space,
 * the attr data is converted to node format and -ENOSPC is returned. Caller is
 * responsible for handling the dirty inode and transaction or adding the attr
 * in node format.
L
Linus Torvalds 已提交
928
 */
D
David Chinner 已提交
929
STATIC int
930 931 932
xfs_attr_leaf_try_add(
	struct xfs_da_args	*args,
	struct xfs_buf		*bp)
L
Linus Torvalds 已提交
933
{
934
	int			retval;
935

L
Linus Torvalds 已提交
936 937 938 939
	/*
	 * Look up the given attribute in the leaf block.  Figure out if
	 * the given flags produce an error or call for an atomic rename.
	 */
940 941 942
	retval = xfs_attr_leaf_hasname(args, &bp);
	if (retval != -ENOATTR && retval != -EEXIST)
		return retval;
943
	if (retval == -ENOATTR && (args->attr_flags & XATTR_REPLACE))
944 945
		goto out_brelse;
	if (retval == -EEXIST) {
946
		if (args->attr_flags & XATTR_CREATE)
947
			goto out_brelse;
948 949 950

		trace_xfs_attr_leaf_replace(args);

951
		/* save the attribute state for later removal*/
952
		args->op_flags |= XFS_DA_OP_RENAME;	/* an atomic rename */
953
		xfs_attr_save_rmt_blk(args);
954 955 956 957 958 959 960 961 962

		/*
		 * clear the remote attr state now that it is saved so that the
		 * values reflect the state of the attribute we are about to
		 * add, not the attribute we just found and will remove later.
		 */
		args->rmtblkno = 0;
		args->rmtblkcnt = 0;
		args->rmtvaluelen = 0;
L
Linus Torvalds 已提交
963 964 965
	}

	/*
966
	 * Add the attribute to the leaf block
L
Linus Torvalds 已提交
967
	 */
968 969
	return xfs_attr3_leaf_add(bp, args);

970 971 972 973
out_brelse:
	xfs_trans_brelse(args->trans, bp);
	return retval;
}
L
Linus Torvalds 已提交
974

975 976 977 978 979 980 981 982 983 984 985 986 987 988 989 990 991 992 993 994 995
/*
 * Return EEXIST if attr is found, or ENOATTR if not
 */
STATIC int
xfs_attr_leaf_hasname(
	struct xfs_da_args	*args,
	struct xfs_buf		**bp)
{
	int                     error = 0;

	error = xfs_attr3_leaf_read(args->trans, args->dp, 0, bp);
	if (error)
		return error;

	error = xfs_attr3_leaf_lookup_int(*bp, args);
	if (error != -ENOATTR && error != -EEXIST)
		xfs_trans_brelse(args->trans, *bp);

	return error;
}

L
Linus Torvalds 已提交
996 997 998 999 1000 1001 1002
/*
 * Remove a name from the leaf attribute list structure
 *
 * This leaf block cannot have a "remote" value, we only call this routine
 * if bmap_one_block() says there is only one block (ie: no remote blks).
 */
STATIC int
1003 1004
xfs_attr_leaf_removename(
	struct xfs_da_args	*args)
L
Linus Torvalds 已提交
1005
{
1006 1007 1008
	struct xfs_inode	*dp;
	struct xfs_buf		*bp;
	int			error, forkoff;
L
Linus Torvalds 已提交
1009

1010 1011
	trace_xfs_attr_leaf_removename(args);

L
Linus Torvalds 已提交
1012 1013 1014 1015 1016
	/*
	 * Remove the attribute.
	 */
	dp = args->dp;

1017 1018
	error = xfs_attr_leaf_hasname(args, &bp);

D
Dave Chinner 已提交
1019
	if (error == -ENOATTR) {
1020
		xfs_trans_brelse(args->trans, bp);
D
Dave Chinner 已提交
1021
		return error;
1022 1023
	} else if (error != -EEXIST)
		return error;
L
Linus Torvalds 已提交
1024

D
Dave Chinner 已提交
1025
	xfs_attr3_leaf_remove(bp, args);
L
Linus Torvalds 已提交
1026 1027 1028 1029

	/*
	 * If the result is small enough, shrink it all into the inode.
	 */
1030 1031 1032
	forkoff = xfs_attr_shortform_allfit(bp, dp);
	if (forkoff)
		return xfs_attr3_leaf_to_shortform(bp, args, forkoff);
L
Linus Torvalds 已提交
1033
		/* bp is gone due to xfs_da_shrink_inode */
1034

D
Dave Chinner 已提交
1035
	return 0;
L
Linus Torvalds 已提交
1036 1037 1038 1039 1040 1041 1042
}

/*
 * Look up a name in a leaf attribute list structure.
 *
 * This leaf block cannot have a "remote" value, we only call this routine
 * if bmap_one_block() says there is only one block (ie: no remote blks).
1043 1044
 *
 * Returns 0 on successful retrieval, otherwise an error.
L
Linus Torvalds 已提交
1045
 */
1046
STATIC int
L
Linus Torvalds 已提交
1047 1048
xfs_attr_leaf_get(xfs_da_args_t *args)
{
1049
	struct xfs_buf *bp;
L
Linus Torvalds 已提交
1050 1051
	int error;

1052 1053
	trace_xfs_attr_leaf_get(args);

1054
	error = xfs_attr_leaf_hasname(args, &bp);
L
Linus Torvalds 已提交
1055

1056
	if (error == -ENOATTR)  {
1057
		xfs_trans_brelse(args->trans, bp);
D
Dave Chinner 已提交
1058
		return error;
1059 1060 1061 1062
	} else if (error != -EEXIST)
		return error;


D
Dave Chinner 已提交
1063
	error = xfs_attr3_leaf_getvalue(bp, args);
1064
	xfs_trans_brelse(args->trans, bp);
1065
	return error;
L
Linus Torvalds 已提交
1066 1067
}

1068 1069 1070 1071 1072 1073 1074 1075 1076 1077 1078 1079 1080 1081 1082
/*
 * Look up the name described by @args in a node-format attribute fork.
 *
 * Returns -EEXIST if the attr is found, -ENOATTR if not, or the error
 * reported by the lookup itself.
 *
 * statep: If not NULL, it is pointed at the lookup state before the lookup
 *         runs, and the caller becomes responsible for freeing that state
 *         whatever the return value is.  If NULL, the state is freed here.
 */
STATIC int
xfs_attr_node_hasname(
	struct xfs_da_args	*args,
	struct xfs_da_state	**statep)
{
	struct xfs_da_state	*cursor;
	int			found;
	int			rc;

	cursor = xfs_da_state_alloc(args);
	if (statep)
		*statep = cursor;

	/*
	 * Search to see if name exists, and get back a pointer to it.
	 * A lookup failure takes precedence over the found/not-found result.
	 */
	rc = xfs_da3_node_lookup_int(cursor, &found);
	if (rc)
		found = rc;

	/* Nobody asked for the state, so it must not outlive this call. */
	if (!statep)
		xfs_da_state_free(cursor);

	return found;
}

L
Linus Torvalds 已提交
1098
/*========================================================================
1099
 * External routines when attribute list size > geo->blksize
L
Linus Torvalds 已提交
1100 1101 1102
 *========================================================================*/

STATIC int
1103
xfs_attr_node_addname_find_attr(
1104
	struct xfs_delattr_context	*dac)
L
Linus Torvalds 已提交
1105
{
1106 1107
	struct xfs_da_args		*args = dac->da_args;
	int				retval;
1108

L
Linus Torvalds 已提交
1109 1110 1111 1112
	/*
	 * Search to see if name already exists, and get back a pointer
	 * to where it should go.
	 */
1113
	retval = xfs_attr_node_hasname(args, &dac->da_state);
1114
	if (retval != -ENOATTR && retval != -EEXIST)
1115
		goto error;
1116

1117
	if (retval == -ENOATTR && (args->attr_flags & XATTR_REPLACE))
1118
		goto error;
1119
	if (retval == -EEXIST) {
1120
		if (args->attr_flags & XATTR_CREATE)
1121
			goto error;
1122 1123 1124

		trace_xfs_attr_node_replace(args);

1125
		/* save the attribute state for later removal*/
1126
		args->op_flags |= XFS_DA_OP_RENAME;	/* atomic rename op */
1127
		xfs_attr_save_rmt_blk(args);
1128 1129 1130 1131 1132 1133

		/*
		 * clear the remote attr state now that it is saved so that the
		 * values reflect the state of the attribute we are about to
		 * add, not the attribute we just found and will remove later.
		 */
L
Linus Torvalds 已提交
1134 1135
		args->rmtblkno = 0;
		args->rmtblkcnt = 0;
1136
		args->rmtvaluelen = 0;
L
Linus Torvalds 已提交
1137 1138
	}

1139 1140
	return 0;
error:
1141 1142
	if (dac->da_state)
		xfs_da_state_free(dac->da_state);
1143 1144 1145 1146 1147 1148 1149 1150 1151 1152 1153 1154
	return retval;
}

/*
 * Add a name to a Btree-format attribute list.
 *
 * This will involve walking down the Btree, and may involve splitting
 * leaf nodes and even splitting intermediate nodes up to and including
 * the root node (a special case of an intermediate node).
 *
 * "Remote" attribute values confuse the issue and atomic rename operations
 * add a whole extra layer of confusion on top of that.
1155 1156 1157 1158 1159
 *
 * This routine is meant to function as a delayed operation, and may return
 * -EAGAIN when the transaction needs to be rolled.  Calling functions will need
 * to handle this, and recall the function until a successful error code is
 *returned.
1160 1161 1162
 */
STATIC int
xfs_attr_node_addname(
1163
	struct xfs_delattr_context	*dac)
1164
{
1165 1166 1167 1168
	struct xfs_da_args		*args = dac->da_args;
	struct xfs_da_state		*state = dac->da_state;
	struct xfs_da_state_blk		*blk;
	int				error;
1169 1170 1171 1172 1173 1174

	trace_xfs_attr_node_addname(args);

	blk = &state->path.blk[state->path.active-1];
	ASSERT(blk->magic == XFS_ATTR_LEAF_MAGIC);

1175 1176
	error = xfs_attr3_leaf_add(blk->bp, state->args);
	if (error == -ENOSPC) {
L
Linus Torvalds 已提交
1177 1178 1179 1180 1181 1182 1183
		if (state->path.active == 1) {
			/*
			 * Its really a single leaf node, but it had
			 * out-of-line values so it looked like it *might*
			 * have been a b-tree.
			 */
			xfs_da_state_free(state);
1184
			state = NULL;
D
Dave Chinner 已提交
1185
			error = xfs_attr3_leaf_to_node(args);
1186
			if (error)
1187
				goto out;
L
Linus Torvalds 已提交
1188 1189

			/*
1190 1191 1192 1193 1194
			 * Now that we have converted the leaf to a node, we can
			 * roll the transaction, and try xfs_attr3_leaf_add
			 * again on re-entry.  No need to set dela_state to do
			 * this. dela_state is still unset by this function at
			 * this point.
L
Linus Torvalds 已提交
1195
			 */
1196
			dac->flags |= XFS_DAC_DEFER_FINISH;
1197 1198
			trace_xfs_attr_node_addname_return(
					dac->dela_state, args->dp);
1199
			return -EAGAIN;
L
Linus Torvalds 已提交
1200 1201 1202 1203 1204 1205 1206 1207
		}

		/*
		 * Split as many Btree elements as required.
		 * This code tracks the new and old attr's location
		 * in the index/blkno/rmtblkno/rmtblkcnt fields and
		 * in the index2/blkno2/rmtblkno2/rmtblkcnt2 fields.
		 */
1208
		error = xfs_da3_split(state);
1209
		if (error)
1210
			goto out;
1211
		dac->flags |= XFS_DAC_DEFER_FINISH;
L
Linus Torvalds 已提交
1212 1213 1214 1215
	} else {
		/*
		 * Addition succeeded, update Btree hashvals.
		 */
1216
		xfs_da3_fixhashpath(state, &state->path);
L
Linus Torvalds 已提交
1217 1218
	}

1219 1220 1221
out:
	if (state)
		xfs_da_state_free(state);
1222
	return error;
1223 1224 1225 1226 1227
}


STATIC int
xfs_attr_node_addname_clear_incomplete(
1228
	struct xfs_delattr_context	*dac)
1229
{
1230
	struct xfs_da_args		*args = dac->da_args;
1231 1232 1233 1234
	struct xfs_da_state		*state = NULL;
	int				retval = 0;
	int				error = 0;

1235 1236 1237 1238 1239 1240 1241 1242 1243 1244
	/*
	 * Re-find the "old" attribute entry after any split ops. The INCOMPLETE
	 * flag means that we will find the "old" attr, not the "new" one.
	 */
	args->attr_filter |= XFS_ATTR_INCOMPLETE;
	state = xfs_da_state_alloc(args);
	state->inleaf = 0;
	error = xfs_da3_node_lookup_int(state, &retval);
	if (error)
		goto out;
L
Linus Torvalds 已提交
1245

1246
	error = xfs_attr_node_removename(args, state);
L
Linus Torvalds 已提交
1247

1248 1249 1250 1251 1252
	/*
	 * Check to see if the tree needs to be collapsed.
	 */
	if (retval && (state->path.active > 1)) {
		error = xfs_da3_join(state);
L
Linus Torvalds 已提交
1253 1254 1255 1256 1257 1258 1259 1260 1261
		if (error)
			goto out;
	}
	retval = error = 0;

out:
	if (state)
		xfs_da_state_free(state);
	if (error)
E
Eric Sandeen 已提交
1262 1263
		return error;
	return retval;
L
Linus Torvalds 已提交
1264 1265
}

1266 1267 1268 1269 1270 1271 1272 1273 1274 1275 1276 1277 1278 1279 1280 1281 1282 1283 1284 1285 1286 1287 1288 1289 1290 1291 1292 1293 1294 1295
/*
 * Shrink an attribute from leaf to shortform
 *
 * Re-reads the leaf at offset 0 of the attr fork and, if its contents fit in
 * the inode, converts it to shortform.  Returns 0 if nothing needed doing,
 * otherwise the result of the read or of the conversion.
 */
STATIC int
xfs_attr_node_shrink(
	struct xfs_da_args	*args,
	struct xfs_da_state     *state)
{
	struct xfs_inode	*ip = args->dp;
	struct xfs_buf		*leaf_bp;
	int			sf_forkoff;
	int			rc;

	/*
	 * Have to get rid of the copy of this dabuf in the state.
	 */
	ASSERT(state->path.active == 1);
	ASSERT(state->path.blk[0].bp);
	state->path.blk[0].bp = NULL;

	rc = xfs_attr3_leaf_read(args->trans, args->dp, 0, &leaf_bp);
	if (rc)
		return rc;

	sf_forkoff = xfs_attr_shortform_allfit(leaf_bp, ip);
	if (!sf_forkoff) {
		/* Too big for the inode: leave the leaf alone. */
		xfs_trans_brelse(args->trans, leaf_bp);
		return 0;
	}

	/* bp is gone due to xfs_da_shrink_inode */
	return xfs_attr3_leaf_to_shortform(leaf_bp, args, sf_forkoff);
}

1299 1300 1301 1302 1303 1304 1305 1306 1307 1308 1309 1310 1311 1312 1313 1314 1315 1316 1317 1318 1319 1320 1321 1322 1323 1324
/*
 * Mark an attribute entry INCOMPLETE and save pointers to the relevant buffers
 * for later deletion of the entry.
 */
STATIC int
xfs_attr_leaf_mark_incomplete(
	struct xfs_da_args	*args,
	struct xfs_da_state	*state)
{
	int			error;

	/*
	 * Fill in disk block numbers in the state structure
	 * so that we can get the buffers back after we commit
	 * several transactions in the following calls.
	 */
	error = xfs_attr_fillstate(state);
	if (error)
		return error;

	/*
	 * Mark the attribute as INCOMPLETE
	 */
	return xfs_attr3_leaf_setflag(args);
}

1325 1326 1327 1328 1329 1330 1331
/*
 * Initial setup for xfs_attr_node_removename.  Make sure the attr is there and
 * the blocks are valid.  Attr keys with remote blocks will be marked
 * incomplete.
 */
STATIC
int xfs_attr_node_removename_setup(
1332
	struct xfs_delattr_context	*dac)
1333
{
1334 1335 1336
	struct xfs_da_args		*args = dac->da_args;
	struct xfs_da_state		**state = &dac->da_state;
	int				error;
1337 1338 1339

	error = xfs_attr_node_hasname(args, state);
	if (error != -EEXIST)
1340
		goto out;
1341
	error = 0;
1342 1343 1344 1345 1346 1347 1348 1349

	ASSERT((*state)->path.blk[(*state)->path.active - 1].bp != NULL);
	ASSERT((*state)->path.blk[(*state)->path.active - 1].magic ==
		XFS_ATTR_LEAF_MAGIC);

	if (args->rmtblkno > 0) {
		error = xfs_attr_leaf_mark_incomplete(args, *state);
		if (error)
1350
			goto out;
1351

1352
		error = xfs_attr_rmtval_invalidate(args);
1353
	}
1354 1355 1356
out:
	if (error)
		xfs_da_state_free(*state);
1357

1358
	return error;
1359 1360
}

1361
STATIC int
1362
xfs_attr_node_removename(
1363 1364 1365 1366 1367 1368 1369 1370 1371 1372 1373 1374 1375 1376 1377 1378 1379
	struct xfs_da_args	*args,
	struct xfs_da_state	*state)
{
	struct xfs_da_state_blk	*blk;
	int			retval;

	/*
	 * Remove the name and update the hashvals in the tree.
	 */
	blk = &state->path.blk[state->path.active-1];
	ASSERT(blk->magic == XFS_ATTR_LEAF_MAGIC);
	retval = xfs_attr3_leaf_remove(blk->bp, args);
	xfs_da3_fixhashpath(state, &state->path);

	return retval;
}

L
Linus Torvalds 已提交
1380
/*
1381
 * Remove the attribute specified in @args.
L
Linus Torvalds 已提交
1382 1383 1384 1385
 *
 * This will involve walking down the Btree, and may involve joining
 * leaf nodes and even joining intermediate nodes up to and including
 * the root node (a special case of an intermediate node).
1386 1387 1388 1389 1390
 *
 * This routine is meant to function as either an in-line or delayed operation,
 * and may return -EAGAIN when the transaction needs to be rolled.  Calling
 * functions will need to handle this, and call the function until a
 * successful error code is returned.
L
Linus Torvalds 已提交
1391
 */
1392 1393 1394
int
xfs_attr_remove_iter(
	struct xfs_delattr_context	*dac)
L
Linus Torvalds 已提交
1395
{
1396 1397
	struct xfs_da_args		*args = dac->da_args;
	struct xfs_da_state		*state = dac->da_state;
1398
	int				retval, error = 0;
1399
	struct xfs_inode		*dp = args->dp;
L
Linus Torvalds 已提交
1400

1401 1402
	trace_xfs_attr_node_removename(args);

1403 1404 1405 1406
	switch (dac->dela_state) {
	case XFS_DAS_UNINIT:
		if (!xfs_inode_hasattr(dp))
			return -ENOATTR;
L
Linus Torvalds 已提交
1407

1408 1409 1410 1411 1412
		/*
		 * Shortform or leaf formats don't require transaction rolls and
		 * thus state transitions. Call the right helper and return.
		 */
		if (dp->i_afp->if_format == XFS_DINODE_FMT_LOCAL)
1413
			return xfs_attr_sf_removename(args);
1414 1415 1416

		if (xfs_attr_is_leaf(dp))
			return xfs_attr_leaf_removename(args);
1417 1418

		/*
1419 1420
		 * Node format may require transaction rolls. Set up the
		 * state context and fall into the state machine.
1421
		 */
1422 1423 1424 1425 1426 1427 1428
		if (!dac->da_state) {
			error = xfs_attr_node_removename_setup(dac);
			if (error)
				return error;
			state = dac->da_state;
		}

1429
		fallthrough;
1430 1431
	case XFS_DAS_RMTBLK:
		dac->dela_state = XFS_DAS_RMTBLK;
L
Linus Torvalds 已提交
1432 1433

		/*
1434 1435 1436 1437
		 * If there is an out-of-line value, de-allocate the blocks.
		 * This is done before we remove the attribute so that we don't
		 * overflow the maximum size of a transaction and/or hit a
		 * deadlock.
L
Linus Torvalds 已提交
1438
		 */
1439 1440 1441 1442 1443
		if (args->rmtblkno > 0) {
			/*
			 * May return -EAGAIN. Roll and repeat until all remote
			 * blocks are removed.
			 */
1444
			error = xfs_attr_rmtval_remove(dac);
1445 1446 1447
			if (error == -EAGAIN) {
				trace_xfs_attr_remove_iter_return(
						dac->dela_state, args->dp);
1448
				return error;
1449
			} else if (error) {
1450
				goto out;
1451
			}
L
Linus Torvalds 已提交
1452

1453 1454 1455 1456 1457 1458 1459 1460 1461 1462 1463
			/*
			 * Refill the state structure with buffers (the prior
			 * calls released our buffers) and close out this
			 * transaction before proceeding.
			 */
			ASSERT(args->rmtblkno == 0);
			error = xfs_attr_refillstate(state);
			if (error)
				goto out;
			dac->dela_state = XFS_DAS_RM_NAME;
			dac->flags |= XFS_DAC_DEFER_FINISH;
1464
			trace_xfs_attr_remove_iter_return(dac->dela_state, args->dp);
1465 1466 1467
			return -EAGAIN;
		}

1468
		fallthrough;
1469 1470 1471 1472 1473 1474 1475 1476 1477 1478
	case XFS_DAS_RM_NAME:
		/*
		 * If we came here fresh from a transaction roll, reattach all
		 * the buffers to the current transaction.
		 */
		if (dac->dela_state == XFS_DAS_RM_NAME) {
			error = xfs_attr_refillstate(state);
			if (error)
				goto out;
		}
L
Linus Torvalds 已提交
1479

1480
		retval = xfs_attr_node_removename(args, state);
1481 1482 1483 1484 1485 1486 1487 1488 1489 1490 1491 1492

		/*
		 * Check to see if the tree needs to be collapsed. If so, roll
		 * the transacton and fall into the shrink state.
		 */
		if (retval && (state->path.active > 1)) {
			error = xfs_da3_join(state);
			if (error)
				goto out;

			dac->flags |= XFS_DAC_DEFER_FINISH;
			dac->dela_state = XFS_DAS_RM_SHRINK;
1493 1494
			trace_xfs_attr_remove_iter_return(
					dac->dela_state, args->dp);
1495 1496 1497
			return -EAGAIN;
		}

1498
		fallthrough;
1499 1500 1501 1502 1503 1504 1505 1506 1507 1508 1509 1510 1511 1512 1513
	case XFS_DAS_RM_SHRINK:
		/*
		 * If the result is small enough, push it all into the inode.
		 * This is our final state so it's safe to return a dirty
		 * transaction.
		 */
		if (xfs_attr_is_leaf(dp))
			error = xfs_attr_node_shrink(args, state);
		ASSERT(error != -EAGAIN);
		break;
	default:
		ASSERT(0);
		error = -EINVAL;
		goto out;
	}
L
Linus Torvalds 已提交
1514
out:
1515 1516
	if (state)
		xfs_da_state_free(state);
E
Eric Sandeen 已提交
1517
	return error;
L
Linus Torvalds 已提交
1518 1519 1520 1521 1522 1523
}

/*
 * Fill in the disk block numbers in the state structure for the buffers
 * that are attached to the state structure.
 * This is done so that we can quickly reattach ourselves to those buffers
1524
 * after some set of transaction commits have released these buffers.
L
Linus Torvalds 已提交
1525 1526 1527 1528 1529 1530 1531 1532
 */
STATIC int
xfs_attr_fillstate(xfs_da_state_t *state)
{
	xfs_da_state_path_t *path;
	xfs_da_state_blk_t *blk;
	int level;

1533 1534
	trace_xfs_attr_fillstate(state->args);

L
Linus Torvalds 已提交
1535 1536 1537 1538 1539 1540 1541 1542
	/*
	 * Roll down the "path" in the state structure, storing the on-disk
	 * block number for those buffers in the "path".
	 */
	path = &state->path;
	ASSERT((path->active >= 0) && (path->active < XFS_DA_NODE_MAXDEPTH));
	for (blk = path->blk, level = 0; level < path->active; blk++, level++) {
		if (blk->bp) {
D
Dave Chinner 已提交
1543
			blk->disk_blkno = xfs_buf_daddr(blk->bp);
L
Linus Torvalds 已提交
1544 1545 1546 1547 1548 1549 1550 1551 1552 1553 1554 1555 1556 1557
			blk->bp = NULL;
		} else {
			blk->disk_blkno = 0;
		}
	}

	/*
	 * Roll down the "altpath" in the state structure, storing the on-disk
	 * block number for those buffers in the "altpath".
	 */
	path = &state->altpath;
	ASSERT((path->active >= 0) && (path->active < XFS_DA_NODE_MAXDEPTH));
	for (blk = path->blk, level = 0; level < path->active; blk++, level++) {
		if (blk->bp) {
D
Dave Chinner 已提交
1558
			blk->disk_blkno = xfs_buf_daddr(blk->bp);
L
Linus Torvalds 已提交
1559 1560 1561 1562 1563 1564
			blk->bp = NULL;
		} else {
			blk->disk_blkno = 0;
		}
	}

E
Eric Sandeen 已提交
1565
	return 0;
L
Linus Torvalds 已提交
1566 1567 1568 1569 1570
}

/*
 * Reattach the buffers to the state structure based on the disk block
 * numbers stored in the state structure.
1571
 * This is done after some set of transaction commits have released those
L
Linus Torvalds 已提交
1572 1573 1574 1575 1576 1577 1578 1579 1580
 * buffers from our grip.
 */
STATIC int
xfs_attr_refillstate(xfs_da_state_t *state)
{
	xfs_da_state_path_t *path;
	xfs_da_state_blk_t *blk;
	int level, error;

1581 1582
	trace_xfs_attr_refillstate(state->args);

L
Linus Torvalds 已提交
1583 1584 1585 1586 1587 1588 1589 1590
	/*
	 * Roll down the "path" in the state structure, storing the on-disk
	 * block number for those buffers in the "path".
	 */
	path = &state->path;
	ASSERT((path->active >= 0) && (path->active < XFS_DA_NODE_MAXDEPTH));
	for (blk = path->blk, level = 0; level < path->active; blk++, level++) {
		if (blk->disk_blkno) {
C
Christoph Hellwig 已提交
1591 1592 1593
			error = xfs_da3_node_read_mapped(state->args->trans,
					state->args->dp, blk->disk_blkno,
					&blk->bp, XFS_ATTR_FORK);
L
Linus Torvalds 已提交
1594
			if (error)
E
Eric Sandeen 已提交
1595
				return error;
L
Linus Torvalds 已提交
1596 1597 1598 1599 1600 1601 1602 1603 1604 1605 1606 1607 1608
		} else {
			blk->bp = NULL;
		}
	}

	/*
	 * Roll down the "altpath" in the state structure, storing the on-disk
	 * block number for those buffers in the "altpath".
	 */
	path = &state->altpath;
	ASSERT((path->active >= 0) && (path->active < XFS_DA_NODE_MAXDEPTH));
	for (blk = path->blk, level = 0; level < path->active; blk++, level++) {
		if (blk->disk_blkno) {
C
Christoph Hellwig 已提交
1609 1610 1611
			error = xfs_da3_node_read_mapped(state->args->trans,
					state->args->dp, blk->disk_blkno,
					&blk->bp, XFS_ATTR_FORK);
L
Linus Torvalds 已提交
1612
			if (error)
E
Eric Sandeen 已提交
1613
				return error;
L
Linus Torvalds 已提交
1614 1615 1616 1617 1618
		} else {
			blk->bp = NULL;
		}
	}

E
Eric Sandeen 已提交
1619
	return 0;
L
Linus Torvalds 已提交
1620 1621 1622
}

/*
1623
 * Retrieve the attribute data from a node attribute list.
L
Linus Torvalds 已提交
1624 1625 1626 1627
 *
 * This routine gets called for any attribute fork that has more than one
 * block, ie: both true Btree attr lists and for single-leaf-blocks with
 * "remote" values taking up more blocks.
1628 1629
 *
 * Returns 0 on successful retrieval, otherwise an error.
L
Linus Torvalds 已提交
1630
 */
1631
STATIC int
1632 1633
xfs_attr_node_get(
	struct xfs_da_args	*args)
L
Linus Torvalds 已提交
1634
{
1635 1636 1637 1638
	struct xfs_da_state	*state;
	struct xfs_da_state_blk	*blk;
	int			i;
	int			error;
L
Linus Torvalds 已提交
1639

1640 1641
	trace_xfs_attr_node_get(args);

L
Linus Torvalds 已提交
1642 1643 1644
	/*
	 * Search to see if name exists, and get back a pointer to it.
	 */
1645 1646
	error = xfs_attr_node_hasname(args, &state);
	if (error != -EEXIST)
1647 1648 1649 1650 1651 1652
		goto out_release;

	/*
	 * Get the value, local or "remote"
	 */
	blk = &state->path.blk[state->path.active - 1];
1653
	error = xfs_attr3_leaf_getvalue(blk->bp, args);
L
Linus Torvalds 已提交
1654 1655 1656 1657

	/*
	 * If not in a transaction, we have to release all the buffers.
	 */
1658
out_release:
1659
	for (i = 0; state != NULL && i < state->path.active; i++) {
1660
		xfs_trans_brelse(args->trans, state->path.blk[i].bp);
L
Linus Torvalds 已提交
1661 1662 1663
		state->path.blk[i].bp = NULL;
	}

1664 1665 1666
	if (state)
		xfs_da_state_free(state);
	return error;
L
Linus Torvalds 已提交
1667
}
1668 1669 1670 1671 1672 1673 1674 1675 1676 1677 1678 1679 1680 1681 1682 1683 1684

/*
 * Returns true if the attribute entry name is valid, i.e. it is shorter than
 * MAXNAMELEN and contains no NUL byte within its first @length bytes.
 */
bool
xfs_attr_namecheck(
	const void	*name,
	size_t		length)
{
	/*
	 * MAXNAMELEN includes the trailing null, but (name/length) leave it
	 * out, so a length equal to MAXNAMELEN is already too long.
	 */
	if (length < MAXNAMELEN) {
		/* There shouldn't be any nulls here */
		return memchr(name, 0, length) == NULL;
	}

	return false;
}