/*
 * Copyright (c) 2000-2003,2005 Silicon Graphics, Inc.
 * Copyright (c) 2013 Red Hat, Inc.
 * All Rights Reserved.
 *
 * This program is free software; you can redistribute it and/or
 * modify it under the terms of the GNU General Public License as
 * published by the Free Software Foundation.
 *
 * This program is distributed in the hope that it would be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program; if not, write the Free Software Foundation,
 * Inc.,  51 Franklin St, Fifth Floor, Boston, MA  02110-1301  USA
 */
#include "xfs.h"
20
#include "xfs_fs.h"
21
#include "xfs_format.h"
22 23
#include "xfs_log_format.h"
#include "xfs_trans_resv.h"
L
Linus Torvalds 已提交
24
#include "xfs_mount.h"
25
#include "xfs_da_format.h"
26
#include "xfs_da_btree.h"
L
Linus Torvalds 已提交
27
#include "xfs_inode.h"
28
#include "xfs_trans.h"
29
#include "xfs_inode_item.h"
30
#include "xfs_bmap.h"
31
#include "xfs_buf_item.h"
32
#include "xfs_dir2.h"
C
Christoph Hellwig 已提交
33
#include "xfs_dir2_priv.h"
L
Linus Torvalds 已提交
34
#include "xfs_error.h"
C
Christoph Hellwig 已提交
35
#include "xfs_trace.h"
36
#include "xfs_cksum.h"
37
#include "xfs_log.h"
L
Linus Torvalds 已提交
38 39 40 41

/*
 * Local function prototypes.
 */
42 43 44 45
static void xfs_dir2_block_log_leaf(xfs_trans_t *tp, struct xfs_buf *bp,
				    int first, int last);
static void xfs_dir2_block_log_tail(xfs_trans_t *tp, struct xfs_buf *bp);
static int xfs_dir2_block_lookup_int(xfs_da_args_t *args, struct xfs_buf **bpp,
L
Linus Torvalds 已提交
46 47 48
				     int *entno);
static int xfs_dir2_block_sort(const void *a, const void *b);

49 50 51 52 53 54 55 56
static xfs_dahash_t xfs_dir_hash_dot, xfs_dir_hash_dotdot;

/*
 * One-time startup routine called from xfs_init().
 */
void
xfs_dir_startup(void)
{
57 58
	xfs_dir_hash_dot = xfs_da_hashname((unsigned char *)".", 1);
	xfs_dir_hash_dotdot = xfs_da_hashname((unsigned char *)"..", 2);
59 60
}

61
static xfs_failaddr_t
62
xfs_dir3_block_verify(
63 64 65
	struct xfs_buf		*bp)
{
	struct xfs_mount	*mp = bp->b_target->bt_mount;
66 67 68 69
	struct xfs_dir3_blk_hdr	*hdr3 = bp->b_addr;

	if (xfs_sb_version_hascrc(&mp->m_sb)) {
		if (hdr3->magic != cpu_to_be32(XFS_DIR3_BLOCK_MAGIC))
70
			return __this_address;
71
		if (!uuid_equal(&hdr3->uuid, &mp->m_sb.sb_meta_uuid))
72
			return __this_address;
73
		if (be64_to_cpu(hdr3->blkno) != bp->b_bn)
74
			return __this_address;
75
		if (!xfs_log_check_lsn(mp, be64_to_cpu(hdr3->lsn)))
76
			return __this_address;
77 78
	} else {
		if (hdr3->magic != cpu_to_be32(XFS_DIR2_BLOCK_MAGIC))
79
			return __this_address;
80
	}
81
	return __xfs_dir3_data_check(NULL, bp);
82
}
83

84
static void
85
xfs_dir3_block_read_verify(
86 87
	struct xfs_buf	*bp)
{
88
	struct xfs_mount	*mp = bp->b_target->bt_mount;
89
	xfs_failaddr_t		fa;
90

91 92
	if (xfs_sb_version_hascrc(&mp->m_sb) &&
	     !xfs_buf_verify_cksum(bp, XFS_DIR3_DATA_CRC_OFF))
93 94 95 96 97 98
		xfs_verifier_error(bp, -EFSBADCRC, __this_address);
	else {
		fa = xfs_dir3_block_verify(bp);
		if (fa)
			xfs_verifier_error(bp, -EFSCORRUPTED, fa);
	}
99 100
}

101
static void
102
xfs_dir3_block_write_verify(
103 104
	struct xfs_buf	*bp)
{
105 106 107
	struct xfs_mount	*mp = bp->b_target->bt_mount;
	struct xfs_buf_log_item	*bip = bp->b_fspriv;
	struct xfs_dir3_blk_hdr	*hdr3 = bp->b_addr;
108
	xfs_failaddr_t		fa;
109

110 111 112
	fa = xfs_dir3_block_verify(bp);
	if (fa) {
		xfs_verifier_error(bp, -EFSCORRUPTED, fa);
113 114 115 116 117 118 119 120 121
		return;
	}

	if (!xfs_sb_version_hascrc(&mp->m_sb))
		return;

	if (bip)
		hdr3->lsn = cpu_to_be64(bip->bli_item.li_lsn);

122
	xfs_buf_update_cksum(bp, XFS_DIR3_DATA_CRC_OFF);
123 124
}

125
const struct xfs_buf_ops xfs_dir3_block_buf_ops = {
126
	.name = "xfs_dir3_block",
127 128
	.verify_read = xfs_dir3_block_read_verify,
	.verify_write = xfs_dir3_block_write_verify,
129
	.verify_struct = xfs_dir3_block_verify,
130 131
};

132
int
133
xfs_dir3_block_read(
134 135 136 137 138
	struct xfs_trans	*tp,
	struct xfs_inode	*dp,
	struct xfs_buf		**bpp)
{
	struct xfs_mount	*mp = dp->i_mount;
139
	int			err;
140

141
	err = xfs_da_read_buf(tp, dp, mp->m_dir_geo->datablk, -1, bpp,
142
				XFS_DATA_FORK, &xfs_dir3_block_buf_ops);
143
	if (!err && tp && *bpp)
144
		xfs_trans_buf_set_type(tp, *bpp, XFS_BLFT_DIR_BLOCK_BUF);
145
	return err;
146 147 148 149 150
}

static void
xfs_dir3_block_init(
	struct xfs_mount	*mp,
151
	struct xfs_trans	*tp,
152 153 154 155 156 157
	struct xfs_buf		*bp,
	struct xfs_inode	*dp)
{
	struct xfs_dir3_blk_hdr *hdr3 = bp->b_addr;

	bp->b_ops = &xfs_dir3_block_buf_ops;
158
	xfs_trans_buf_set_type(tp, bp, XFS_BLFT_DIR_BLOCK_BUF);
159 160 161 162 163 164

	if (xfs_sb_version_hascrc(&mp->m_sb)) {
		memset(hdr3, 0, sizeof(*hdr3));
		hdr3->magic = cpu_to_be32(XFS_DIR3_BLOCK_MAGIC);
		hdr3->blkno = cpu_to_be64(bp->b_bn);
		hdr3->owner = cpu_to_be64(dp->i_ino);
165
		uuid_copy(&hdr3->uuid, &mp->m_sb.sb_meta_uuid);
166 167 168 169
		return;

	}
	hdr3->magic = cpu_to_be32(XFS_DIR2_BLOCK_MAGIC);
170 171 172 173
}

/*
 * Work out where a new entry of @len bytes (plus its leaf entry) could go.
 *
 * Outputs:
 *   *compact  - set to 1 when the leaf table must be compacted first,
 *               otherwise 0.
 *   *dupp     - the unused region chosen for the new data entry, or NULL
 *               when the entry does not fit in this block.
 *   *enddupp  - in the no-stale case, the data object located through the
 *               tag just before the leaf table; NULL otherwise.
 *   *tagpp    - the tag just before the first leaf entry when it was
 *               examined, otherwise NULL.
 */
static void
xfs_dir2_block_need_space(
	struct xfs_inode		*dp,
	struct xfs_dir2_data_hdr	*hdr,
	struct xfs_dir2_block_tail	*btp,
	struct xfs_dir2_leaf_entry	*blp,
	__be16				**tagpp,
	struct xfs_dir2_data_unused	**dupp,
	struct xfs_dir2_data_unused	**enddupp,
	int				*compact,
	int				len)
{
	struct xfs_dir2_data_free	*bf;
	__be16				*tagp = NULL;
	struct xfs_dir2_data_unused	*dup = NULL;
	struct xfs_dir2_data_unused	*enddup = NULL;

	*compact = 0;
	bf = dp->d_ops->data_bestfree_p(hdr);

	/*
	 * If there are stale entries we'll use one for the leaf.
	 */
	if (btp->stale) {
		if (be16_to_cpu(bf[0].length) >= len) {
			/*
			 * The biggest free entry is large enough, so no
			 * compaction is needed.
			 */
			dup = (xfs_dir2_data_unused_t *)
			      ((char *)hdr + be16_to_cpu(bf[0].offset));
			goto out;
		}

		/*
		 * Will need to compact to make this work.
		 * Tag just before the first leaf entry.
		 */
		*compact = 1;
		tagp = (__be16 *)blp - 1;

		/* Data object just before the first leaf entry.  */
		dup = (xfs_dir2_data_unused_t *)((char *)hdr + be16_to_cpu(*tagp));

		/*
		 * If it's not free then the data will go where the
		 * leaf data starts now, if it works at all.
		 */
		if (be16_to_cpu(dup->freetag) == XFS_DIR2_DATA_FREE_TAG) {
			if (be16_to_cpu(dup->length) + (be32_to_cpu(btp->stale) - 1) *
			    (uint)sizeof(*blp) < len)
				dup = NULL;
		} else if ((be32_to_cpu(btp->stale) - 1) * (uint)sizeof(*blp) < len)
			dup = NULL;
		else
			dup = (xfs_dir2_data_unused_t *)blp;
		goto out;
	}

	/*
	 * no stale entries, so just use free space.
	 * Tag just before the first leaf entry.
	 */
	tagp = (__be16 *)blp - 1;

	/* Data object just before the first leaf entry.  */
	enddup = (xfs_dir2_data_unused_t *)((char *)hdr + be16_to_cpu(*tagp));

	/*
	 * If it's not free then can't do this add without cleaning up:
	 * the space before the first leaf entry needs to be free so it
	 * can be expanded to hold the pointer to the new entry.
	 */
	if (be16_to_cpu(enddup->freetag) == XFS_DIR2_DATA_FREE_TAG) {
		/*
		 * Check out the biggest freespace and see if it's the same one.
		 */
		dup = (xfs_dir2_data_unused_t *)
		      ((char *)hdr + be16_to_cpu(bf[0].offset));
		if (dup != enddup) {
			/*
			 * Not the same free entry, just check its length.
			 */
			if (be16_to_cpu(dup->length) < len)
				dup = NULL;
			goto out;
		}

		/*
		 * It is the biggest freespace, can it hold the leaf too?
		 */
		if (be16_to_cpu(dup->length) < len + (uint)sizeof(*blp)) {
			/*
			 * No, it cannot hold both; use the second-largest
			 * entry instead if it works.
			 */
			if (be16_to_cpu(bf[1].length) >= len)
				dup = (xfs_dir2_data_unused_t *)
				      ((char *)hdr + be16_to_cpu(bf[1].offset));
			else
				dup = NULL;
		}
	}
out:
	*tagpp = tagp;
	*dupp = dup;
	*enddupp = enddup;
}

/*
 * compact the leaf entries.
 * Leave the highest-numbered stale entry stale.
 * XXX should be the one closest to mid but mid is not yet computed.
 */
static void
xfs_dir2_block_compact(
286
	struct xfs_da_args		*args,
287 288 289 290 291 292 293 294 295 296 297 298 299 300 301 302 303 304 305 306 307 308 309 310 311 312 313 314 315 316 317 318
	struct xfs_buf			*bp,
	struct xfs_dir2_data_hdr	*hdr,
	struct xfs_dir2_block_tail	*btp,
	struct xfs_dir2_leaf_entry	*blp,
	int				*needlog,
	int				*lfloghigh,
	int				*lfloglow)
{
	int			fromidx;	/* source leaf index */
	int			toidx;		/* target leaf index */
	int			needscan = 0;
	int			highstale;	/* high stale index */

	fromidx = toidx = be32_to_cpu(btp->count) - 1;
	highstale = *lfloghigh = -1;
	for (; fromidx >= 0; fromidx--) {
		if (blp[fromidx].address == cpu_to_be32(XFS_DIR2_NULL_DATAPTR)) {
			if (highstale == -1)
				highstale = toidx;
			else {
				if (*lfloghigh == -1)
					*lfloghigh = toidx;
				continue;
			}
		}
		if (fromidx < toidx)
			blp[toidx] = blp[fromidx];
		toidx--;
	}
	*lfloglow = toidx + 1 - (be32_to_cpu(btp->stale) - 1);
	*lfloghigh -= be32_to_cpu(btp->stale) - 1;
	be32_add_cpu(&btp->count, -(be32_to_cpu(btp->stale) - 1));
319
	xfs_dir2_data_make_free(args, bp,
320 321 322 323 324 325 326 327 328
		(xfs_dir2_data_aoff_t)((char *)blp - (char *)hdr),
		(xfs_dir2_data_aoff_t)((be32_to_cpu(btp->stale) - 1) * sizeof(*blp)),
		needlog, &needscan);
	btp->stale = cpu_to_be32(1);
	/*
	 * If we now need to rebuild the bestfree map, do so.
	 * This needs to happen before the next call to use_free.
	 */
	if (needscan)
329
		xfs_dir2_data_freescan(args->dp, hdr, needlog);
330 331
}

L
Linus Torvalds 已提交
332 333 334 335 336 337 338
/*
 * Add an entry to a block directory.
 *
 * Reads the single directory block, decides where the new data entry and
 * its leaf entry can go, and inserts both.  With XFS_DA_OP_JUSTCHECK set
 * only the space check is done: the buffer is released and 0 or -ENOSPC
 * is returned.  When the entry does not fit, the directory is converted
 * to leaf format and the add is retried there, unless args->total is 0,
 * in which case -ENOSPC is returned.
 *
 * Returns 0 on success or a negative error code.
 */
int						/* error */
xfs_dir2_block_addname(
	xfs_da_args_t		*args)		/* directory op arguments */
{
	xfs_dir2_data_hdr_t	*hdr;		/* block header */
	xfs_dir2_leaf_entry_t	*blp;		/* block leaf entries */
	struct xfs_buf		*bp;		/* buffer for block */
	xfs_dir2_block_tail_t	*btp;		/* block tail */
	int			compact;	/* need to compact leaf ents */
	xfs_dir2_data_entry_t	*dep;		/* block data entry */
	xfs_inode_t		*dp;		/* directory inode */
	xfs_dir2_data_unused_t	*dup;		/* block unused entry */
	int			error;		/* error return value */
	xfs_dir2_data_unused_t	*enddup = NULL;	/* unused at end of data */
	xfs_dahash_t		hash;		/* hash value of found entry */
	int			high;		/* high index for binary srch */
	int			highstale;	/* high stale index */
	int			lfloghigh = 0;	/* last final leaf to log */
	int			lfloglow = 0;	/* first final leaf to log */
	int			len;		/* length of the new entry */
	int			low;		/* low index for binary srch */
	int			lowstale;	/* low stale index */
	int			mid = 0;	/* midpoint for binary srch */
	int			needlog;	/* need to log header */
	int			needscan;	/* need to rescan freespace */
	__be16			*tagp;		/* pointer to tag value */
	xfs_trans_t		*tp;		/* transaction structure */

	trace_xfs_dir2_block_addname(args);

	dp = args->dp;
	tp = args->trans;

	/* Read the (one and only) directory block into bp. */
	error = xfs_dir3_block_read(tp, dp, &bp);
	if (error)
		return error;

	len = dp->d_ops->data_entsize(args->namelen);

	/*
	 * Set up pointers to parts of the block.
	 */
	hdr = bp->b_addr;
	btp = xfs_dir2_block_tail_p(args->geo, hdr);
	blp = xfs_dir2_block_leaf_p(btp);

	/*
	 * Find out if we can reuse stale entries or whether we need extra
	 * space for entry and new leaf.
	 */
	xfs_dir2_block_need_space(dp, hdr, btp, blp, &tagp, &dup,
				  &enddup, &compact, len);

	/*
	 * Done everything we need for a space check now.
	 */
	if (args->op_flags & XFS_DA_OP_JUSTCHECK) {
		xfs_trans_brelse(tp, bp);
		if (!dup)
			return -ENOSPC;
		return 0;
	}

	/*
	 * If we don't have space for the new entry & leaf ...
	 */
	if (!dup) {
		/* Don't have a space reservation: return no-space.  */
		if (args->total == 0)
			return -ENOSPC;
		/*
		 * Convert to the next larger format.
		 * Then add the new entry in that format.
		 */
		error = xfs_dir2_block_to_leaf(args, bp);
		if (error)
			return error;
		return xfs_dir2_leaf_addname(args);
	}

	needlog = needscan = 0;

	/*
	 * If need to compact the leaf entries, do it now.
	 */
	if (compact) {
		xfs_dir2_block_compact(args, bp, hdr, btp, blp, &needlog,
				      &lfloghigh, &lfloglow);
		/* recalculate blp post-compaction */
		blp = xfs_dir2_block_leaf_p(btp);
	} else if (btp->stale) {
		/*
		 * Set leaf logging boundaries to impossible state.
		 * For the no-stale case they're set explicitly.
		 */
		lfloglow = be32_to_cpu(btp->count);
		lfloghigh = -1;
	}

	/*
	 * Find the slot that's first lower than our hash value, -1 if none.
	 */
	for (low = 0, high = be32_to_cpu(btp->count) - 1; low <= high; ) {
		mid = (low + high) >> 1;
		if ((hash = be32_to_cpu(blp[mid].hashval)) == args->hashval)
			break;
		if (hash < args->hashval)
			low = mid + 1;
		else
			high = mid - 1;
	}
	while (mid >= 0 && be32_to_cpu(blp[mid].hashval) >= args->hashval) {
		mid--;
	}
	/*
	 * No stale entries, will use enddup space to hold new leaf.
	 */
	if (!btp->stale) {
		/*
		 * Mark the space needed for the new leaf entry, now in use.
		 */
		xfs_dir2_data_use_free(args, bp, enddup,
			(xfs_dir2_data_aoff_t)
			((char *)enddup - (char *)hdr + be16_to_cpu(enddup->length) -
			 sizeof(*blp)),
			(xfs_dir2_data_aoff_t)sizeof(*blp),
			&needlog, &needscan);
		/*
		 * Update the tail (entry count).
		 */
		be32_add_cpu(&btp->count, 1);
		/*
		 * If we now need to rebuild the bestfree map, do so.
		 * This needs to happen before the next call to use_free.
		 */
		if (needscan) {
			xfs_dir2_data_freescan(dp, hdr, &needlog);
			needscan = 0;
		}
		/*
		 * Adjust pointer to the first leaf entry, we're about to move
		 * the table up one to open up space for the new leaf entry.
		 * Then adjust our index to match.
		 */
		blp--;
		mid++;
		if (mid)
			memmove(blp, &blp[1], mid * sizeof(*blp));
		lfloglow = 0;
		lfloghigh = mid;
	}
	/*
	 * Use a stale leaf for our new entry.
	 */
	else {
		/* Nearest stale entry at or below mid, -1 if none. */
		for (lowstale = mid;
		     lowstale >= 0 &&
			blp[lowstale].address !=
			cpu_to_be32(XFS_DIR2_NULL_DATAPTR);
		     lowstale--)
			continue;
		/*
		 * Nearest stale entry above mid; the scan stops early once
		 * it is no closer to mid than lowstale.
		 */
		for (highstale = mid + 1;
		     highstale < be32_to_cpu(btp->count) &&
			blp[highstale].address !=
			cpu_to_be32(XFS_DIR2_NULL_DATAPTR) &&
			(lowstale < 0 || mid - lowstale > highstale - mid);
		     highstale++)
			continue;
		/*
		 * Move entries toward the low-numbered stale entry.
		 */
		if (lowstale >= 0 &&
		    (highstale == be32_to_cpu(btp->count) ||
		     mid - lowstale <= highstale - mid)) {
			if (mid - lowstale)
				memmove(&blp[lowstale], &blp[lowstale + 1],
					(mid - lowstale) * sizeof(*blp));
			lfloglow = MIN(lowstale, lfloglow);
			lfloghigh = MAX(mid, lfloghigh);
		}
		/*
		 * Move entries toward the high-numbered stale entry.
		 */
		else {
			ASSERT(highstale < be32_to_cpu(btp->count));
			mid++;
			if (highstale - mid)
				memmove(&blp[mid + 1], &blp[mid],
					(highstale - mid) * sizeof(*blp));
			lfloglow = MIN(mid, lfloglow);
			lfloghigh = MAX(highstale, lfloghigh);
		}
		be32_add_cpu(&btp->stale, -1);
	}
	/*
	 * Point to the new data entry.
	 */
	dep = (xfs_dir2_data_entry_t *)dup;
	/*
	 * Fill in the leaf entry.
	 */
	blp[mid].hashval = cpu_to_be32(args->hashval);
	blp[mid].address = cpu_to_be32(xfs_dir2_byte_to_dataptr(
				(char *)dep - (char *)hdr));
	xfs_dir2_block_log_leaf(tp, bp, lfloglow, lfloghigh);
	/*
	 * Mark space for the data entry used.
	 */
	xfs_dir2_data_use_free(args, bp, dup,
		(xfs_dir2_data_aoff_t)((char *)dup - (char *)hdr),
		(xfs_dir2_data_aoff_t)len, &needlog, &needscan);
	/*
	 * Create the new data entry.
	 */
	dep->inumber = cpu_to_be64(args->inumber);
	dep->namelen = args->namelen;
	memcpy(dep->name, args->name, args->namelen);
	dp->d_ops->data_put_ftype(dep, args->filetype);
	tagp = dp->d_ops->data_entry_tag_p(dep);
	*tagp = cpu_to_be16((char *)dep - (char *)hdr);
	/*
	 * Clean up the bestfree array and log the header, tail, and entry.
	 */
	if (needscan)
		xfs_dir2_data_freescan(dp, hdr, &needlog);
	if (needlog)
		xfs_dir2_data_log_header(args, bp);
	xfs_dir2_block_log_tail(tp, bp);
	xfs_dir2_data_log_entry(args, bp, dep);
	xfs_dir3_data_check(dp, bp);
	return 0;
}

/*
 * Log leaf entries from the block.
 *
 * Logs the byte range from the start of leaf entry @first through the
 * last byte of leaf entry @last (both indexes inclusive), located via
 * the block tail of the buffer.
 */
static void
xfs_dir2_block_log_leaf(
	xfs_trans_t		*tp,		/* transaction structure */
	struct xfs_buf		*bp,		/* block buffer */
	int			first,		/* index of first logged leaf */
	int			last)		/* index of last logged leaf */
{
	xfs_dir2_data_hdr_t	*hdr = bp->b_addr;
	xfs_dir2_leaf_entry_t	*blp;
	xfs_dir2_block_tail_t	*btp;

	btp = xfs_dir2_block_tail_p(tp->t_mountp->m_dir_geo, hdr);
	blp = xfs_dir2_block_leaf_p(btp);
	xfs_trans_log_buf(tp, bp, (uint)((char *)&blp[first] - (char *)hdr),
		(uint)((char *)&blp[last + 1] - (char *)hdr - 1));
}

/*
 * Log the block tail.
 *
 * Logs the byte range covering the whole xfs_dir2_block_tail_t structure
 * of the buffer.
 */
static void
xfs_dir2_block_log_tail(
	xfs_trans_t		*tp,		/* transaction structure */
	struct xfs_buf		*bp)		/* block buffer */
{
	xfs_dir2_data_hdr_t	*hdr = bp->b_addr;
	xfs_dir2_block_tail_t	*btp;

	btp = xfs_dir2_block_tail_p(tp->t_mountp->m_dir_geo, hdr);
	xfs_trans_log_buf(tp, bp, (uint)((char *)btp - (char *)hdr),
		(uint)((char *)(btp + 1) - (char *)hdr - 1));
}

/*
 * Look up an entry in the block.  This is the external routine,
 * xfs_dir2_block_lookup_int does the real work.
 *
 * On a successful lookup args->inumber and args->filetype are filled in
 * from the data entry, the found name is passed to
 * xfs_dir_cilookup_result(), the buffer is released, and that helper's
 * return value is returned.  A lookup failure is returned unchanged.
 */
int						/* error */
xfs_dir2_block_lookup(
	xfs_da_args_t		*args)		/* dir lookup arguments */
{
	xfs_dir2_data_hdr_t	*hdr;		/* block header */
	xfs_dir2_leaf_entry_t	*blp;		/* block leaf entries */
	struct xfs_buf		*bp;		/* block buffer */
	xfs_dir2_block_tail_t	*btp;		/* block tail */
	xfs_dir2_data_entry_t	*dep;		/* block data entry */
	xfs_inode_t		*dp;		/* incore inode */
	int			ent;		/* entry index */
	int			error;		/* error return value */

	trace_xfs_dir2_block_lookup(args);

	/*
	 * Get the buffer, look up the entry.
	 * If not found (ENOENT) then return, have no buffer.
	 */
	if ((error = xfs_dir2_block_lookup_int(args, &bp, &ent)))
		return error;
	dp = args->dp;
	hdr = bp->b_addr;
	xfs_dir3_data_check(dp, bp);
	btp = xfs_dir2_block_tail_p(args->geo, hdr);
	blp = xfs_dir2_block_leaf_p(btp);
	/*
	 * Get the offset from the leaf entry, to point to the data.
	 */
	dep = (xfs_dir2_data_entry_t *)((char *)hdr +
			xfs_dir2_dataptr_to_off(args->geo,
						be32_to_cpu(blp[ent].address)));
	/*
	 * Fill in inode number, CI name if appropriate, release the block.
	 */
	args->inumber = be64_to_cpu(dep->inumber);
	args->filetype = dp->d_ops->data_get_ftype(dep);
	error = xfs_dir_cilookup_result(args, dep->name, dep->namelen);
	xfs_trans_brelse(args->trans, bp);
	return error;
}

/*
 * Internal block lookup routine.
 *
 * Reads the directory block, binary-searches the leaf table for
 * args->hashval, then walks every leaf entry with that hash comparing
 * names through mp->m_dirnameops->compname().
 *
 * On success returns 0 with *bpp set to the (still held) buffer and
 * *entno set to the matching leaf index.  An exact match returns
 * immediately; a case-insensitive match is remembered in args->cmpresult
 * and returned only if no exact match follows.  When nothing matches the
 * buffer is released and -ENOENT is returned.  A read failure is
 * returned as-is.
 */
static int					/* error */
xfs_dir2_block_lookup_int(
	xfs_da_args_t		*args,		/* dir lookup arguments */
	struct xfs_buf		**bpp,		/* returned block buffer */
	int			*entno)		/* returned entry number */
{
	xfs_dir2_dataptr_t	addr;		/* data entry address */
	xfs_dir2_data_hdr_t	*hdr;		/* block header */
	xfs_dir2_leaf_entry_t	*blp;		/* block leaf entries */
	struct xfs_buf		*bp;		/* block buffer */
	xfs_dir2_block_tail_t	*btp;		/* block tail */
	xfs_dir2_data_entry_t	*dep;		/* block data entry */
	xfs_inode_t		*dp;		/* incore inode */
	int			error;		/* error return value */
	xfs_dahash_t		hash;		/* found hash value */
	int			high;		/* binary search high index */
	int			low;		/* binary search low index */
	int			mid;		/* binary search current idx */
	xfs_mount_t		*mp;		/* filesystem mount point */
	xfs_trans_t		*tp;		/* transaction pointer */
	enum xfs_dacmp		cmp;		/* comparison result */

	dp = args->dp;
	tp = args->trans;
	mp = dp->i_mount;

	error = xfs_dir3_block_read(tp, dp, &bp);
	if (error)
		return error;

	hdr = bp->b_addr;
	xfs_dir3_data_check(dp, bp);
	btp = xfs_dir2_block_tail_p(args->geo, hdr);
	blp = xfs_dir2_block_leaf_p(btp);
	/*
	 * Loop doing a binary search for our hash value.
	 * Find our entry, ENOENT if it's not there.
	 */
	for (low = 0, high = be32_to_cpu(btp->count) - 1; ; ) {
		ASSERT(low <= high);
		mid = (low + high) >> 1;
		if ((hash = be32_to_cpu(blp[mid].hashval)) == args->hashval)
			break;
		if (hash < args->hashval)
			low = mid + 1;
		else
			high = mid - 1;
		if (low > high) {
			ASSERT(args->op_flags & XFS_DA_OP_OKNOENT);
			xfs_trans_brelse(tp, bp);
			return -ENOENT;
		}
	}
	/*
	 * Back up to the first one with the right hash value.
	 */
	while (mid > 0 && be32_to_cpu(blp[mid - 1].hashval) == args->hashval) {
		mid--;
	}
	/*
	 * Now loop forward through all the entries with the
	 * right hash value looking for our name.
	 */
	do {
		/* Stale leaf entries have no data entry to compare. */
		if ((addr = be32_to_cpu(blp[mid].address)) == XFS_DIR2_NULL_DATAPTR)
			continue;
		/*
		 * Get pointer to the entry from the leaf.
		 */
		dep = (xfs_dir2_data_entry_t *)
			((char *)hdr + xfs_dir2_dataptr_to_off(args->geo, addr));
		/*
		 * Compare name and if it's an exact match, return the index
		 * and buffer. If it's the first case-insensitive match, store
		 * the index and buffer and continue looking for an exact match.
		 */
		cmp = mp->m_dirnameops->compname(args, dep->name, dep->namelen);
		if (cmp != XFS_CMP_DIFFERENT && cmp != args->cmpresult) {
			args->cmpresult = cmp;
			*bpp = bp;
			*entno = mid;
			if (cmp == XFS_CMP_EXACT)
				return 0;
		}
	} while (++mid < be32_to_cpu(btp->count) &&
			be32_to_cpu(blp[mid].hashval) == hash);

	ASSERT(args->op_flags & XFS_DA_OP_OKNOENT);
	/*
	 * Here, we can only be doing a lookup (not a rename or replace).
	 * If a case-insensitive match was found earlier, return success.
	 */
	if (args->cmpresult == XFS_CMP_CASE)
		return 0;
	/*
	 * No match, release the buffer and return ENOENT.
	 */
	xfs_trans_brelse(tp, bp);
	return -ENOENT;
}

/*
 * Remove an entry from a block format directory.
 * If that makes the block small enough to fit in shortform, transform it.
 *
 * The data entry's space is freed, the leaf entry is marked stale and
 * the tail's stale count is bumped, with each change logged.  The
 * shortform size is then computed; if it fits in the inode's data fork
 * the directory is converted via xfs_dir2_block_to_sf(), whose result is
 * returned.  Otherwise 0 is returned.  A lookup failure is returned
 * unchanged.
 */
int						/* error */
xfs_dir2_block_removename(
	xfs_da_args_t		*args)		/* directory operation args */
{
	xfs_dir2_data_hdr_t	*hdr;		/* block header */
	xfs_dir2_leaf_entry_t	*blp;		/* block leaf pointer */
	struct xfs_buf		*bp;		/* block buffer */
	xfs_dir2_block_tail_t	*btp;		/* block tail */
	xfs_dir2_data_entry_t	*dep;		/* block data entry */
	xfs_inode_t		*dp;		/* incore inode */
	int			ent;		/* block leaf entry index */
	int			error;		/* error return value */
	int			needlog;	/* need to log block header */
	int			needscan;	/* need to fixup bestfree */
	xfs_dir2_sf_hdr_t	sfh;		/* shortform header */
	int			size;		/* shortform size */
	xfs_trans_t		*tp;		/* transaction pointer */

	trace_xfs_dir2_block_removename(args);

	/*
	 * Look up the entry in the block.  Gets the buffer and entry index.
	 * It will always be there, the vnodeops level does a lookup first.
	 */
	if ((error = xfs_dir2_block_lookup_int(args, &bp, &ent))) {
		return error;
	}
	dp = args->dp;
	tp = args->trans;
	hdr = bp->b_addr;
	btp = xfs_dir2_block_tail_p(args->geo, hdr);
	blp = xfs_dir2_block_leaf_p(btp);
	/*
	 * Point to the data entry using the leaf entry.
	 */
	dep = (xfs_dir2_data_entry_t *)((char *)hdr +
			xfs_dir2_dataptr_to_off(args->geo,
						be32_to_cpu(blp[ent].address)));
	/*
	 * Mark the data entry's space free.
	 */
	needlog = needscan = 0;
	xfs_dir2_data_make_free(args, bp,
		(xfs_dir2_data_aoff_t)((char *)dep - (char *)hdr),
		dp->d_ops->data_entsize(dep->namelen), &needlog, &needscan);
	/*
	 * Fix up the block tail.
	 */
	be32_add_cpu(&btp->stale, 1);
	xfs_dir2_block_log_tail(tp, bp);
	/*
	 * Remove the leaf entry by marking it stale.
	 */
	blp[ent].address = cpu_to_be32(XFS_DIR2_NULL_DATAPTR);
	xfs_dir2_block_log_leaf(tp, bp, ent, ent);
	/*
	 * Fix up bestfree, log the header if necessary.
	 */
	if (needscan)
		xfs_dir2_data_freescan(dp, hdr, &needlog);
	if (needlog)
		xfs_dir2_data_log_header(args, bp);
	xfs_dir3_data_check(dp, bp);
	/*
	 * See if the size as a shortform is good enough.
	 */
	size = xfs_dir2_block_sfsize(dp, hdr, &sfh);
	if (size > XFS_IFORK_DSIZE(dp))
		return 0;

	/*
	 * If it works, do the conversion.
	 */
	return xfs_dir2_block_to_sf(args, bp, size, &sfh);
}

/*
 * Replace an entry in a V2 block directory.
 * Change the inode number to the new value.
 *
 * The existing entry is looked up, its inode number and file type are
 * overwritten from @args, and the data entry is logged.  Returns 0 on
 * success or the error from the lookup.
 */
int						/* error */
xfs_dir2_block_replace(
	xfs_da_args_t		*args)		/* directory operation args */
{
	xfs_dir2_data_hdr_t	*hdr;		/* block header */
	xfs_dir2_leaf_entry_t	*blp;		/* block leaf entries */
	struct xfs_buf		*bp;		/* block buffer */
	xfs_dir2_block_tail_t	*btp;		/* block tail */
	xfs_dir2_data_entry_t	*dep;		/* block data entry */
	xfs_inode_t		*dp;		/* incore inode */
	int			ent;		/* leaf entry index */
	int			error;		/* error return value */

	trace_xfs_dir2_block_replace(args);

	/*
	 * Lookup the entry in the directory.  Get buffer and entry index.
	 * This will always succeed since the caller has already done a lookup.
	 */
	if ((error = xfs_dir2_block_lookup_int(args, &bp, &ent))) {
		return error;
	}
	dp = args->dp;
	hdr = bp->b_addr;
	btp = xfs_dir2_block_tail_p(args->geo, hdr);
	blp = xfs_dir2_block_leaf_p(btp);
	/*
	 * Point to the data entry we need to change.
	 */
	dep = (xfs_dir2_data_entry_t *)((char *)hdr +
			xfs_dir2_dataptr_to_off(args->geo,
						be32_to_cpu(blp[ent].address)));
	ASSERT(be64_to_cpu(dep->inumber) != args->inumber);
	/*
	 * Change the inode number to the new value.
	 */
	dep->inumber = cpu_to_be64(args->inumber);
	dp->d_ops->data_put_ftype(dep, args->filetype);
	xfs_dir2_data_log_entry(args, bp, dep);
	xfs_dir3_data_check(dp, bp);
	return 0;
}

/*
 * Qsort comparison routine for the block leaf entries.
 */
static int					/* sort order */
xfs_dir2_block_sort(
	const void			*a,	/* first leaf entry */
	const void			*b)	/* second leaf entry */
{
	const xfs_dir2_leaf_entry_t	*la;	/* first leaf entry */
	const xfs_dir2_leaf_entry_t	*lb;	/* second leaf entry */

	la = a;
	lb = b;
895 896
	return be32_to_cpu(la->hashval) < be32_to_cpu(lb->hashval) ? -1 :
		(be32_to_cpu(la->hashval) > be32_to_cpu(lb->hashval) ? 1 : 0);
L
Linus Torvalds 已提交
897 898 899 900 901 902 903 904
}

/*
 * Convert a V2 leaf directory to a V2 block directory if possible.
 *
 * @args: operation arguments (directory inode, transaction, geometry)
 * @lbp:  buffer holding the leaf block
 * @dbp:  buffer holding the data block, or NULL to have it read here
 *
 * Trailing empty data blocks are trimmed first.  The conversion is then
 * only performed when a single data block remains and its last entry is a
 * free region large enough to hold the block tail plus the live leaf
 * entries.  If either condition does not hold the function returns 0
 * without converting.  After a successful conversion the leaf block is
 * removed and, if the result fits in the inode's data fork, the directory
 * is further converted to shortform.
 *
 * Returns 0 or an error from one of the helpers called.
 */
int						/* error */
xfs_dir2_leaf_to_block(
	xfs_da_args_t		*args,		/* operation arguments */
	struct xfs_buf		*lbp,		/* leaf buffer */
	struct xfs_buf		*dbp)		/* data buffer */
{
	__be16			*bestsp;	/* leaf bests table */
	xfs_dir2_data_hdr_t	*hdr;		/* block header */
	xfs_dir2_block_tail_t	*btp;		/* block tail */
	xfs_inode_t		*dp;		/* incore directory inode */
	xfs_dir2_data_unused_t	*dup;		/* unused data entry */
	int			error;		/* error return value */
	int			from;		/* leaf from index */
	xfs_dir2_leaf_t		*leaf;		/* leaf structure */
	xfs_dir2_leaf_entry_t	*lep;		/* leaf entry */
	xfs_dir2_leaf_tail_t	*ltp;		/* leaf tail structure */
	xfs_mount_t		*mp;		/* file system mount point */
	int			needlog;	/* need to log data header */
	int			needscan;	/* need to scan for bestfree */
	xfs_dir2_sf_hdr_t	sfh;		/* shortform header */
	int			size;		/* bytes used */
	__be16			*tagp;		/* end of entry (tag) */
	int			to;		/* block/leaf to index */
	xfs_trans_t		*tp;		/* transaction pointer */
	struct xfs_dir2_leaf_entry *ents;	/* leaf entry array */
	struct xfs_dir3_icleaf_hdr leafhdr;	/* incore leaf header */

	trace_xfs_dir2_leaf_to_block(args);

	dp = args->dp;
	tp = args->trans;
	mp = dp->i_mount;
	leaf = lbp->b_addr;
	dp->d_ops->leaf_hdr_from_disk(&leafhdr, leaf);
	ents = dp->d_ops->leaf_ents_p(leaf);
	ltp = xfs_dir2_leaf_tail_p(args->geo, leaf);

	ASSERT(leafhdr.magic == XFS_DIR2_LEAF1_MAGIC ||
	       leafhdr.magic == XFS_DIR3_LEAF1_MAGIC);
	/*
	 * If there are data blocks other than the first one, take this
	 * opportunity to remove trailing empty data blocks that may have
	 * been left behind during no-space-reservation operations.
	 * These will show up in the leaf bests table.
	 */
	while (dp->i_d.di_size > args->geo->blksize) {
		int hdrsz;

		hdrsz = dp->d_ops->data_entry_offset;
		bestsp = xfs_dir2_leaf_bests_p(ltp);
		/*
		 * The last data block is only trimmable when its best free
		 * size covers everything after the header.  Otherwise more
		 * than one data block is in use and we cannot convert.
		 */
		if (be16_to_cpu(bestsp[be32_to_cpu(ltp->bestcount) - 1]) !=
					    args->geo->blksize - hdrsz)
			return 0;

		error = xfs_dir2_leaf_trim_data(args, lbp,
			    (xfs_dir2_db_t)(be32_to_cpu(ltp->bestcount) - 1));
		if (error)
			return error;
	}
	/*
	 * Read the data block if we don't already have it, give up if it fails.
	 */
	if (!dbp) {
		error = xfs_dir3_data_read(tp, dp, args->geo->datablk, -1, &dbp);
		if (error)
			return error;
	}
	hdr = dbp->b_addr;
	ASSERT(hdr->magic == cpu_to_be32(XFS_DIR2_DATA_MAGIC) ||
	       hdr->magic == cpu_to_be32(XFS_DIR3_DATA_MAGIC));

	/*
	 * Size of the "leaf" area in the block: the tail plus one leaf
	 * entry per non-stale entry in the old leaf.
	 */
	size = (uint)sizeof(xfs_dir2_block_tail_t) +
	       (uint)sizeof(*lep) * (leafhdr.count - leafhdr.stale);
	/*
	 * Look at the last data entry.  The final __be16 of the block is
	 * the tag holding that entry's starting offset.
	 */
	tagp = (__be16 *)((char *)hdr + args->geo->blksize) - 1;
	dup = (xfs_dir2_data_unused_t *)((char *)hdr + be16_to_cpu(*tagp));
	/*
	 * If it's not free or is too short we can't do it.
	 */
	if (be16_to_cpu(dup->freetag) != XFS_DIR2_DATA_FREE_TAG ||
	    be16_to_cpu(dup->length) < size)
		return 0;

	/*
	 * Start converting it to block form.
	 */
	xfs_dir3_block_init(mp, tp, dbp, dp);

	needlog = 1;
	needscan = 0;
	/*
	 * Use up the space at the end of the block (blp/btp).
	 */
	xfs_dir2_data_use_free(args, dbp, dup, args->geo->blksize - size, size,
		&needlog, &needscan);
	/*
	 * Initialize the block tail.
	 */
	btp = xfs_dir2_block_tail_p(args->geo, hdr);
	btp->count = cpu_to_be32(leafhdr.count - leafhdr.stale);
	btp->stale = 0;
	xfs_dir2_block_log_tail(tp, dbp);
	/*
	 * Initialize the block leaf area.  We compact out stale entries.
	 */
	lep = xfs_dir2_block_leaf_p(btp);
	for (from = to = 0; from < leafhdr.count; from++) {
		if (ents[from].address == cpu_to_be32(XFS_DIR2_NULL_DATAPTR))
			continue;
		lep[to++] = ents[from];
	}
	ASSERT(to == be32_to_cpu(btp->count));
	xfs_dir2_block_log_leaf(tp, dbp, 0, be32_to_cpu(btp->count) - 1);
	/*
	 * Scan the bestfree if we need it and log the data block header.
	 */
	if (needscan)
		xfs_dir2_data_freescan(dp, hdr, &needlog);
	if (needlog)
		xfs_dir2_data_log_header(args, dbp);
	/*
	 * Pitch the old leaf block.
	 */
	error = xfs_da_shrink_inode(args, args->geo->leafblk, lbp);
	if (error)
		return error;

	/*
	 * Now see if the resulting block can be shrunken to shortform.
	 */
	size = xfs_dir2_block_sfsize(dp, hdr, &sfh);
	if (size > XFS_IFORK_DSIZE(dp))
		return 0;

	return xfs_dir2_block_to_sf(args, dbp, size, &sfh);
}

/*
 * Convert the shortform directory to block form.
 *
 * The inline shortform data is copied to a temporary buffer, the inode's
 * data fork is switched to (empty) extents format, block 0 is added to
 * the directory and initialized as a block-format directory block.  The
 * "." and ".." entries are created, then every shortform entry is copied
 * to the offset recorded for it in the shortform directory, with unused
 * (free) entries inserted for any gaps.  Finally the leaf entries are
 * sorted by hash value and the leaf area and tail are logged.
 *
 * Returns 0 on success, -EIO if the shortform directory is shorter than
 * the start of the header's parent field, or the error from growing the
 * inode or initializing the data block.  The temporary copy is always
 * freed before returning.
 */
int						/* error */
xfs_dir2_sf_to_block(
	xfs_da_args_t		*args)		/* operation arguments */
{
	xfs_dir2_db_t		blkno;		/* dir-relative block # (0) */
	xfs_dir2_data_hdr_t	*hdr;		/* block header */
	xfs_dir2_leaf_entry_t	*blp;		/* block leaf entries */
	struct xfs_buf		*bp;		/* block buffer */
	xfs_dir2_block_tail_t	*btp;		/* block tail pointer */
	xfs_dir2_data_entry_t	*dep;		/* data entry pointer */
	xfs_inode_t		*dp;		/* incore directory inode */
	int			dummy;		/* trash */
	xfs_dir2_data_unused_t	*dup;		/* unused entry pointer */
	int			endoffset;	/* end of data objects */
	int			error;		/* error return value */
	int			i;		/* tail size, then sf index */
	xfs_mount_t		*mp;		/* filesystem mount point */
	int			needlog;	/* need to log block header */
	int			needscan;	/* need to scan block freespc */
	int			newoffset;	/* offset from current entry */
	int			offset;		/* target block offset */
	xfs_dir2_sf_entry_t	*sfep;		/* sf entry pointer */
	xfs_dir2_sf_hdr_t	*oldsfp;	/* old shortform header */
	xfs_dir2_sf_hdr_t	*sfp;		/* shortform header */
	__be16			*tagp;		/* end of data entry */
	xfs_trans_t		*tp;		/* transaction pointer */
	struct xfs_name		name;		/* name handed to hashname */
	struct xfs_ifork	*ifp;		/* data fork of the inode */

	trace_xfs_dir2_sf_to_block(args);

	dp = args->dp;
	tp = args->trans;
	mp = dp->i_mount;
	ifp = XFS_IFORK_PTR(dp, XFS_DATA_FORK);
	ASSERT(ifp->if_flags & XFS_IFINLINE);
	/*
	 * Bomb out if the shortform directory is way too short.
	 */
	if (dp->i_d.di_size < offsetof(xfs_dir2_sf_hdr_t, parent)) {
		ASSERT(XFS_FORCED_SHUTDOWN(mp));
		return -EIO;
	}

	oldsfp = (xfs_dir2_sf_hdr_t *)ifp->if_u1.if_data;

	ASSERT(ifp->if_bytes == dp->i_d.di_size);
	ASSERT(ifp->if_u1.if_data != NULL);
	ASSERT(dp->i_d.di_size >= xfs_dir2_sf_hdr_size(oldsfp->i8count));
	ASSERT(dp->i_d.di_nextents == 0);

	/*
	 * Copy the directory into a temporary buffer.
	 * Then pitch the incore inode data so we can make extents.
	 */
	sfp = kmem_alloc(ifp->if_bytes, KM_SLEEP);
	memcpy(sfp, oldsfp, ifp->if_bytes);

	xfs_idata_realloc(dp, -ifp->if_bytes, XFS_DATA_FORK);
	xfs_bmap_local_to_extents_empty(dp, XFS_DATA_FORK);
	dp->i_d.di_size = 0;

	/*
	 * Add block 0 to the inode.
	 */
	error = xfs_dir2_grow_inode(args, XFS_DIR2_DATA_SPACE, &blkno);
	if (error)
		goto out_free;
	/*
	 * Initialize the data block, then convert it to block format.
	 */
	error = xfs_dir3_data_init(args, blkno, &bp);
	if (error)
		goto out_free;
	xfs_dir3_block_init(mp, tp, bp, dp);
	hdr = bp->b_addr;

	/*
	 * Compute size of block "tail" area: the tail structure plus one
	 * leaf entry per shortform entry and two more for "." and "..".
	 */
	i = (uint)sizeof(*btp) +
	    (sfp->count + 2) * (uint)sizeof(xfs_dir2_leaf_entry_t);
	/*
	 * The whole thing is initialized to free by the init routine.
	 * Say we're using the leaf and tail area.
	 */
	dup = dp->d_ops->data_unused_p(hdr);
	needlog = needscan = 0;
	xfs_dir2_data_use_free(args, bp, dup, args->geo->blksize - i,
			       i, &needlog, &needscan);
	ASSERT(needscan == 0);
	/*
	 * Fill in the tail.
	 */
	btp = xfs_dir2_block_tail_p(args->geo, hdr);
	btp->count = cpu_to_be32(sfp->count + 2);	/* ., .. */
	btp->stale = 0;
	blp = xfs_dir2_block_leaf_p(btp);
	endoffset = (uint)((char *)blp - (char *)hdr);
	/*
	 * Remove the freespace, we'll manage it.
	 */
	xfs_dir2_data_use_free(args, bp, dup,
		(xfs_dir2_data_aoff_t)((char *)dup - (char *)hdr),
		be16_to_cpu(dup->length), &needlog, &needscan);
	/*
	 * Create entry for .
	 */
	dep = dp->d_ops->data_dot_entry_p(hdr);
	dep->inumber = cpu_to_be64(dp->i_ino);
	dep->namelen = 1;
	dep->name[0] = '.';
	dp->d_ops->data_put_ftype(dep, XFS_DIR3_FT_DIR);
	tagp = dp->d_ops->data_entry_tag_p(dep);
	*tagp = cpu_to_be16((char *)dep - (char *)hdr);
	xfs_dir2_data_log_entry(args, bp, dep);
	blp[0].hashval = cpu_to_be32(xfs_dir_hash_dot);
	blp[0].address = cpu_to_be32(xfs_dir2_byte_to_dataptr(
				(char *)dep - (char *)hdr));
	/*
	 * Create entry for ..
	 */
	dep = dp->d_ops->data_dotdot_entry_p(hdr);
	dep->inumber = cpu_to_be64(dp->d_ops->sf_get_parent_ino(sfp));
	dep->namelen = 2;
	dep->name[0] = dep->name[1] = '.';
	dp->d_ops->data_put_ftype(dep, XFS_DIR3_FT_DIR);
	tagp = dp->d_ops->data_entry_tag_p(dep);
	*tagp = cpu_to_be16((char *)dep - (char *)hdr);
	xfs_dir2_data_log_entry(args, bp, dep);
	blp[1].hashval = cpu_to_be32(xfs_dir_hash_dotdot);
	blp[1].address = cpu_to_be32(xfs_dir2_byte_to_dataptr(
				(char *)dep - (char *)hdr));
	offset = dp->d_ops->data_first_offset;
	/*
	 * Loop over existing entries, stuff them in.
	 * From here on i counts the shortform entries copied so far.
	 */
	i = 0;
	if (!sfp->count)
		sfep = NULL;
	else
		sfep = xfs_dir2_sf_firstentry(sfp);
	/*
	 * Need to preserve the existing offset values in the sf directory.
	 * Insert holes (unused entries) where necessary.
	 */
	while (offset < endoffset) {
		/*
		 * sfep is null when we reach the end of the list.
		 */
		if (sfep == NULL)
			newoffset = endoffset;
		else
			newoffset = xfs_dir2_sf_get_offset(sfep);
		/*
		 * There should be a hole here, make one.
		 */
		if (offset < newoffset) {
			dup = (xfs_dir2_data_unused_t *)((char *)hdr + offset);
			dup->freetag = cpu_to_be16(XFS_DIR2_DATA_FREE_TAG);
			dup->length = cpu_to_be16(newoffset - offset);
			*xfs_dir2_data_unused_tag_p(dup) = cpu_to_be16(
				((char *)dup - (char *)hdr));
			xfs_dir2_data_log_unused(args, bp, dup);
			xfs_dir2_data_freeinsert(hdr,
						 dp->d_ops->data_bestfree_p(hdr),
						 dup, &dummy);
			offset += be16_to_cpu(dup->length);
			continue;
		}
		/*
		 * Copy a real entry.
		 */
		dep = (xfs_dir2_data_entry_t *)((char *)hdr + newoffset);
		dep->inumber = cpu_to_be64(dp->d_ops->sf_get_ino(sfp, sfep));
		dep->namelen = sfep->namelen;
		dp->d_ops->data_put_ftype(dep, dp->d_ops->sf_get_ftype(sfep));
		memcpy(dep->name, sfep->name, dep->namelen);
		tagp = dp->d_ops->data_entry_tag_p(dep);
		*tagp = cpu_to_be16((char *)dep - (char *)hdr);
		xfs_dir2_data_log_entry(args, bp, dep);
		name.name = sfep->name;
		name.len = sfep->namelen;
		/* Leaf slots 0 and 1 belong to "." and "..". */
		blp[2 + i].hashval = cpu_to_be32(mp->m_dirnameops->
							hashname(&name));
		blp[2 + i].address = cpu_to_be32(xfs_dir2_byte_to_dataptr(
						 (char *)dep - (char *)hdr));
		/* The next object starts right after this entry's tag. */
		offset = (int)((char *)(tagp + 1) - (char *)hdr);
		if (++i == sfp->count)
			sfep = NULL;
		else
			sfep = dp->d_ops->sf_nextentry(sfp, sfep);
	}
	/* Done with the temporary buffer */
	kmem_free(sfp);
	/*
	 * Sort the leaf entries by hash value.
	 */
	xfs_sort(blp, be32_to_cpu(btp->count), sizeof(*blp), xfs_dir2_block_sort);
	/*
	 * Log the leaf entry area and tail.
	 * Already logged the header in data_init, ignore needlog.
	 */
	ASSERT(needscan == 0);
	xfs_dir2_block_log_leaf(tp, bp, 0, be32_to_cpu(btp->count) - 1);
	xfs_dir2_block_log_tail(tp, bp);
	xfs_dir3_data_check(dp, bp);
	return 0;

out_free:
	/* Error before the copy loop: release the temporary sf copy. */
	kmem_free(sfp);
	return error;
}