/*
 * Copyright (c) 2000-2003,2005 Silicon Graphics, Inc.
 * Copyright (c) 2013 Red Hat, Inc.
 * All Rights Reserved.
 *
 * This program is free software; you can redistribute it and/or
 * modify it under the terms of the GNU General Public License as
 * published by the Free Software Foundation.
 *
 * This program is distributed in the hope that it would be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program; if not, write the Free Software Foundation,
 * Inc.,  51 Franklin St, Fifth Floor, Boston, MA  02110-1301  USA
 */
#include "xfs.h"
20
#include "xfs_fs.h"
21
#include "xfs_format.h"
22 23
#include "xfs_log_format.h"
#include "xfs_trans_resv.h"
L
Linus Torvalds 已提交
24
#include "xfs_mount.h"
25
#include "xfs_da_format.h"
26
#include "xfs_da_btree.h"
L
Linus Torvalds 已提交
27
#include "xfs_inode.h"
28
#include "xfs_trans.h"
29
#include "xfs_inode_item.h"
30
#include "xfs_bmap.h"
31
#include "xfs_buf_item.h"
32
#include "xfs_dir2.h"
C
Christoph Hellwig 已提交
33
#include "xfs_dir2_priv.h"
L
Linus Torvalds 已提交
34
#include "xfs_error.h"
C
Christoph Hellwig 已提交
35
#include "xfs_trace.h"
36
#include "xfs_cksum.h"
37
#include "xfs_log.h"
L
Linus Torvalds 已提交
38 39 40 41

/*
 * Local function prototypes.
 *
 * Forward declarations for file-local helpers whose definitions appear
 * further down in this file.
 */
static void xfs_dir2_block_log_leaf(xfs_trans_t *tp, struct xfs_buf *bp,
				    int first, int last);
static void xfs_dir2_block_log_tail(xfs_trans_t *tp, struct xfs_buf *bp);
static int xfs_dir2_block_lookup_int(xfs_da_args_t *args, struct xfs_buf **bpp,
				     int *entno);
static int xfs_dir2_block_sort(const void *a, const void *b);

49 50 51 52 53 54 55 56
/* Name hashes of "." and "..", filled in once by xfs_dir_startup(). */
static xfs_dahash_t xfs_dir_hash_dot, xfs_dir_hash_dotdot;

/*
 * One-time startup routine called from xfs_init().
 *
 * Computes the name hashes of "." (length 1) and ".." (length 2) with
 * xfs_da_hashname() and caches them in the file-scope variables above.
 */
void
xfs_dir_startup(void)
{
	xfs_dir_hash_dot = xfs_da_hashname((unsigned char *)".", 1);
	xfs_dir_hash_dotdot = xfs_da_hashname((unsigned char *)"..", 2);
}

61
static xfs_failaddr_t
62
xfs_dir3_block_verify(
63 64 65
	struct xfs_buf		*bp)
{
	struct xfs_mount	*mp = bp->b_target->bt_mount;
66 67 68 69
	struct xfs_dir3_blk_hdr	*hdr3 = bp->b_addr;

	if (xfs_sb_version_hascrc(&mp->m_sb)) {
		if (hdr3->magic != cpu_to_be32(XFS_DIR3_BLOCK_MAGIC))
70
			return __this_address;
71
		if (!uuid_equal(&hdr3->uuid, &mp->m_sb.sb_meta_uuid))
72
			return __this_address;
73
		if (be64_to_cpu(hdr3->blkno) != bp->b_bn)
74
			return __this_address;
75
		if (!xfs_log_check_lsn(mp, be64_to_cpu(hdr3->lsn)))
76
			return __this_address;
77 78
	} else {
		if (hdr3->magic != cpu_to_be32(XFS_DIR2_BLOCK_MAGIC))
79
			return __this_address;
80
	}
81
	return __xfs_dir3_data_check(NULL, bp);
82
}
83

84
static void
85
xfs_dir3_block_read_verify(
86 87
	struct xfs_buf	*bp)
{
88 89
	struct xfs_mount	*mp = bp->b_target->bt_mount;

90 91
	if (xfs_sb_version_hascrc(&mp->m_sb) &&
	     !xfs_buf_verify_cksum(bp, XFS_DIR3_DATA_CRC_OFF))
92
		xfs_verifier_error(bp, -EFSBADCRC);
93
	else if (xfs_dir3_block_verify(bp))
94
		xfs_verifier_error(bp, -EFSCORRUPTED);
95 96
}

97
static void
98
xfs_dir3_block_write_verify(
99 100
	struct xfs_buf	*bp)
{
101 102 103 104
	struct xfs_mount	*mp = bp->b_target->bt_mount;
	struct xfs_buf_log_item	*bip = bp->b_fspriv;
	struct xfs_dir3_blk_hdr	*hdr3 = bp->b_addr;

105
	if (xfs_dir3_block_verify(bp)) {
106
		xfs_verifier_error(bp, -EFSCORRUPTED);
107 108 109 110 111 112 113 114 115
		return;
	}

	if (!xfs_sb_version_hascrc(&mp->m_sb))
		return;

	if (bip)
		hdr3->lsn = cpu_to_be64(bip->bli_item.li_lsn);

116
	xfs_buf_update_cksum(bp, XFS_DIR3_DATA_CRC_OFF);
117 118
}

119
const struct xfs_buf_ops xfs_dir3_block_buf_ops = {
120
	.name = "xfs_dir3_block",
121 122
	.verify_read = xfs_dir3_block_read_verify,
	.verify_write = xfs_dir3_block_write_verify,
123 124
};

125
int
126
xfs_dir3_block_read(
127 128 129 130 131
	struct xfs_trans	*tp,
	struct xfs_inode	*dp,
	struct xfs_buf		**bpp)
{
	struct xfs_mount	*mp = dp->i_mount;
132
	int			err;
133

134
	err = xfs_da_read_buf(tp, dp, mp->m_dir_geo->datablk, -1, bpp,
135
				XFS_DATA_FORK, &xfs_dir3_block_buf_ops);
136
	if (!err && tp && *bpp)
137
		xfs_trans_buf_set_type(tp, *bpp, XFS_BLFT_DIR_BLOCK_BUF);
138
	return err;
139 140 141 142 143
}

static void
xfs_dir3_block_init(
	struct xfs_mount	*mp,
144
	struct xfs_trans	*tp,
145 146 147 148 149 150
	struct xfs_buf		*bp,
	struct xfs_inode	*dp)
{
	struct xfs_dir3_blk_hdr *hdr3 = bp->b_addr;

	bp->b_ops = &xfs_dir3_block_buf_ops;
151
	xfs_trans_buf_set_type(tp, bp, XFS_BLFT_DIR_BLOCK_BUF);
152 153 154 155 156 157

	if (xfs_sb_version_hascrc(&mp->m_sb)) {
		memset(hdr3, 0, sizeof(*hdr3));
		hdr3->magic = cpu_to_be32(XFS_DIR3_BLOCK_MAGIC);
		hdr3->blkno = cpu_to_be64(bp->b_bn);
		hdr3->owner = cpu_to_be64(dp->i_ino);
158
		uuid_copy(&hdr3->uuid, &mp->m_sb.sb_meta_uuid);
159 160 161 162
		return;

	}
	hdr3->magic = cpu_to_be32(XFS_DIR2_BLOCK_MAGIC);
163 164 165 166
}

/*
 * Work out where a new entry of @len bytes (and its leaf slot) can go.
 *
 * Results are returned through the pointer arguments:
 *   *compact - set to 1 when the leaf table must be compacted first,
 *              0 otherwise;
 *   *tagpp   - the tag just before the first leaf entry, or NULL when it
 *              was not looked at;
 *   *dupp    - where the new data entry will be placed, or NULL when the
 *              block cannot take the entry;
 *   *enddupp - the data object just before the first leaf entry; only set
 *              in the no-stale case, NULL otherwise.
 */
static void
xfs_dir2_block_need_space(
	struct xfs_inode		*dp,
	struct xfs_dir2_data_hdr	*hdr,
	struct xfs_dir2_block_tail	*btp,
	struct xfs_dir2_leaf_entry	*blp,
	__be16				**tagpp,
	struct xfs_dir2_data_unused	**dupp,
	struct xfs_dir2_data_unused	**enddupp,
	int				*compact,
	int				len)
{
	struct xfs_dir2_data_free	*bf;
	__be16				*tagp = NULL;
	struct xfs_dir2_data_unused	*dup = NULL;
	struct xfs_dir2_data_unused	*enddup = NULL;

	*compact = 0;
	bf = dp->d_ops->data_bestfree_p(hdr);

	/*
	 * If there are stale entries we'll use one for the leaf.
	 */
	if (btp->stale) {
		if (be16_to_cpu(bf[0].length) >= len) {
			/*
			 * The biggest free entry is large enough, so
			 * compaction can be avoided.
			 */
			dup = (xfs_dir2_data_unused_t *)
			      ((char *)hdr + be16_to_cpu(bf[0].offset));
			goto out;
		}

		/*
		 * Will need to compact to make this work.
		 * Tag just before the first leaf entry.
		 */
		*compact = 1;
		tagp = (__be16 *)blp - 1;

		/* Data object just before the first leaf entry.  */
		dup = (xfs_dir2_data_unused_t *)((char *)hdr + be16_to_cpu(*tagp));

		/*
		 * If it's not free then the data will go where the
		 * leaf data starts now, if it works at all.
		 */
		if (be16_to_cpu(dup->freetag) == XFS_DIR2_DATA_FREE_TAG) {
			if (be16_to_cpu(dup->length) + (be32_to_cpu(btp->stale) - 1) *
			    (uint)sizeof(*blp) < len)
				dup = NULL;
		} else if ((be32_to_cpu(btp->stale) - 1) * (uint)sizeof(*blp) < len)
			dup = NULL;
		else
			dup = (xfs_dir2_data_unused_t *)blp;
		goto out;
	}

	/*
	 * no stale entries, so just use free space.
	 * Tag just before the first leaf entry.
	 */
	tagp = (__be16 *)blp - 1;

	/* Data object just before the first leaf entry.  */
	enddup = (xfs_dir2_data_unused_t *)((char *)hdr + be16_to_cpu(*tagp));

	/*
	 * If it's not free then can't do this add without cleaning up:
	 * the space before the first leaf entry needs to be free so it
	 * can be expanded to hold the pointer to the new entry.
	 */
	if (be16_to_cpu(enddup->freetag) == XFS_DIR2_DATA_FREE_TAG) {
		/*
		 * Check out the biggest freespace and see if it's the same one.
		 */
		dup = (xfs_dir2_data_unused_t *)
		      ((char *)hdr + be16_to_cpu(bf[0].offset));
		if (dup != enddup) {
			/*
			 * Not the same free entry, just check its length.
			 */
			if (be16_to_cpu(dup->length) < len)
				dup = NULL;
			goto out;
		}

		/*
		 * It is the biggest freespace, can it hold the leaf too?
		 */
		if (be16_to_cpu(dup->length) < len + (uint)sizeof(*blp)) {
			/*
			 * No, use the second-largest entry instead if it works.
			 */
			if (be16_to_cpu(bf[1].length) >= len)
				dup = (xfs_dir2_data_unused_t *)
				      ((char *)hdr + be16_to_cpu(bf[1].offset));
			else
				dup = NULL;
		}
	}
out:
	*tagpp = tagp;
	*dupp = dup;
	*enddupp = enddup;
}

/*
 * compact the leaf entries.
 * Leave the highest-numbered stale entry stale.
 * XXX should be the one closest to mid but mid is not yet computed.
 */
static void
xfs_dir2_block_compact(
279
	struct xfs_da_args		*args,
280 281 282 283 284 285 286 287 288 289 290 291 292 293 294 295 296 297 298 299 300 301 302 303 304 305 306 307 308 309 310 311
	struct xfs_buf			*bp,
	struct xfs_dir2_data_hdr	*hdr,
	struct xfs_dir2_block_tail	*btp,
	struct xfs_dir2_leaf_entry	*blp,
	int				*needlog,
	int				*lfloghigh,
	int				*lfloglow)
{
	int			fromidx;	/* source leaf index */
	int			toidx;		/* target leaf index */
	int			needscan = 0;
	int			highstale;	/* high stale index */

	fromidx = toidx = be32_to_cpu(btp->count) - 1;
	highstale = *lfloghigh = -1;
	for (; fromidx >= 0; fromidx--) {
		if (blp[fromidx].address == cpu_to_be32(XFS_DIR2_NULL_DATAPTR)) {
			if (highstale == -1)
				highstale = toidx;
			else {
				if (*lfloghigh == -1)
					*lfloghigh = toidx;
				continue;
			}
		}
		if (fromidx < toidx)
			blp[toidx] = blp[fromidx];
		toidx--;
	}
	*lfloglow = toidx + 1 - (be32_to_cpu(btp->stale) - 1);
	*lfloghigh -= be32_to_cpu(btp->stale) - 1;
	be32_add_cpu(&btp->count, -(be32_to_cpu(btp->stale) - 1));
312
	xfs_dir2_data_make_free(args, bp,
313 314 315 316 317 318 319 320 321
		(xfs_dir2_data_aoff_t)((char *)blp - (char *)hdr),
		(xfs_dir2_data_aoff_t)((be32_to_cpu(btp->stale) - 1) * sizeof(*blp)),
		needlog, &needscan);
	btp->stale = cpu_to_be32(1);
	/*
	 * If we now need to rebuild the bestfree map, do so.
	 * This needs to happen before the next call to use_free.
	 */
	if (needscan)
322
		xfs_dir2_data_freescan(args->dp, hdr, needlog);
323 324
}

L
Linus Torvalds 已提交
325 326 327 328 329 330 331
/*
 * Add an entry to a block directory.
 *
 * Reads the directory block, asks xfs_dir2_block_need_space() where the
 * new entry can go, and then either:
 *  - for XFS_DA_OP_JUSTCHECK, releases the buffer and reports whether
 *    space exists (0 or -ENOSPC);
 *  - when there is no room, returns -ENOSPC if args->total is 0, otherwise
 *    converts the directory to leaf format and adds the name there;
 *  - otherwise inserts a leaf entry in hash order (reusing a stale slot or
 *    growing the table into the free space before it), writes the data
 *    entry, and logs the leaf range, tail, entry and (if needed) header.
 *
 * Returns 0 on success or a negative error.
 */
int						/* error */
xfs_dir2_block_addname(
	xfs_da_args_t		*args)		/* directory op arguments */
{
	xfs_dir2_data_hdr_t	*hdr;		/* block header */
	xfs_dir2_leaf_entry_t	*blp;		/* block leaf entries */
	struct xfs_buf		*bp;		/* buffer for block */
	xfs_dir2_block_tail_t	*btp;		/* block tail */
	int			compact;	/* need to compact leaf ents */
	xfs_dir2_data_entry_t	*dep;		/* block data entry */
	xfs_inode_t		*dp;		/* directory inode */
	xfs_dir2_data_unused_t	*dup;		/* block unused entry */
	int			error;		/* error return value */
	xfs_dir2_data_unused_t	*enddup=NULL;	/* unused at end of data */
	xfs_dahash_t		hash;		/* hash value of found entry */
	int			high;		/* high index for binary srch */
	int			highstale;	/* high stale index */
	int			lfloghigh=0;	/* last final leaf to log */
	int			lfloglow=0;	/* first final leaf to log */
	int			len;		/* length of the new entry */
	int			low;		/* low index for binary srch */
	int			lowstale;	/* low stale index */
	int			mid=0;		/* midpoint for binary srch */
	int			needlog;	/* need to log header */
	int			needscan;	/* need to rescan freespace */
	__be16			*tagp;		/* pointer to tag value */
	xfs_trans_t		*tp;		/* transaction structure */

	trace_xfs_dir2_block_addname(args);

	dp = args->dp;
	tp = args->trans;

	/* Read the (one and only) directory block into bp. */
	error = xfs_dir3_block_read(tp, dp, &bp);
	if (error)
		return error;

	len = dp->d_ops->data_entsize(args->namelen);

	/*
	 * Set up pointers to parts of the block.
	 */
	hdr = bp->b_addr;
	btp = xfs_dir2_block_tail_p(args->geo, hdr);
	blp = xfs_dir2_block_leaf_p(btp);

	/*
	 * Find out if we can reuse stale entries or whether we need extra
	 * space for entry and new leaf.
	 */
	xfs_dir2_block_need_space(dp, hdr, btp, blp, &tagp, &dup,
				  &enddup, &compact, len);

	/*
	 * Done everything we need for a space check now.
	 */
	if (args->op_flags & XFS_DA_OP_JUSTCHECK) {
		xfs_trans_brelse(tp, bp);
		if (!dup)
			return -ENOSPC;
		return 0;
	}

	/*
	 * If we don't have space for the new entry & leaf ...
	 */
	if (!dup) {
		/* Don't have a space reservation: return no-space.  */
		if (args->total == 0)
			return -ENOSPC;
		/*
		 * Convert to the next larger format.
		 * Then add the new entry in that format.
		 */
		error = xfs_dir2_block_to_leaf(args, bp);
		if (error)
			return error;
		return xfs_dir2_leaf_addname(args);
	}

	needlog = needscan = 0;

	/*
	 * If need to compact the leaf entries, do it now.
	 */
	if (compact) {
		xfs_dir2_block_compact(args, bp, hdr, btp, blp, &needlog,
				      &lfloghigh, &lfloglow);
		/* recalculate blp post-compaction */
		blp = xfs_dir2_block_leaf_p(btp);
	} else if (btp->stale) {
		/*
		 * Set leaf logging boundaries to impossible state.
		 * For the no-stale case they're set explicitly.
		 */
		lfloglow = be32_to_cpu(btp->count);
		lfloghigh = -1;
	}

	/*
	 * Find the slot that's first lower than our hash value, -1 if none.
	 */
	for (low = 0, high = be32_to_cpu(btp->count) - 1; low <= high; ) {
		mid = (low + high) >> 1;
		if ((hash = be32_to_cpu(blp[mid].hashval)) == args->hashval)
			break;
		if (hash < args->hashval)
			low = mid + 1;
		else
			high = mid - 1;
	}
	while (mid >= 0 && be32_to_cpu(blp[mid].hashval) >= args->hashval) {
		mid--;
	}
	/*
	 * No stale entries, will use enddup space to hold new leaf.
	 */
	if (!btp->stale) {
		/*
		 * Mark the space needed for the new leaf entry, now in use.
		 */
		xfs_dir2_data_use_free(args, bp, enddup,
			(xfs_dir2_data_aoff_t)
			((char *)enddup - (char *)hdr + be16_to_cpu(enddup->length) -
			 sizeof(*blp)),
			(xfs_dir2_data_aoff_t)sizeof(*blp),
			&needlog, &needscan);
		/*
		 * Update the tail (entry count).
		 */
		be32_add_cpu(&btp->count, 1);
		/*
		 * If we now need to rebuild the bestfree map, do so.
		 * This needs to happen before the next call to use_free.
		 */
		if (needscan) {
			xfs_dir2_data_freescan(dp, hdr, &needlog);
			needscan = 0;
		}
		/*
		 * Adjust pointer to the first leaf entry, we're about to move
		 * the table up one to open up space for the new leaf entry.
		 * Then adjust our index to match.
		 */
		blp--;
		mid++;
		if (mid)
			memmove(blp, &blp[1], mid * sizeof(*blp));
		lfloglow = 0;
		lfloghigh = mid;
	}
	/*
	 * Use a stale leaf for our new entry.
	 */
	else {
		/* Nearest stale slot at or below mid, -1 if none. */
		for (lowstale = mid;
		     lowstale >= 0 &&
			blp[lowstale].address !=
			cpu_to_be32(XFS_DIR2_NULL_DATAPTR);
		     lowstale--)
			continue;
		/*
		 * Nearest stale slot above mid; the scan stops early once it
		 * is no closer to mid than lowstale is.
		 */
		for (highstale = mid + 1;
		     highstale < be32_to_cpu(btp->count) &&
			blp[highstale].address !=
			cpu_to_be32(XFS_DIR2_NULL_DATAPTR) &&
			(lowstale < 0 || mid - lowstale > highstale - mid);
		     highstale++)
			continue;
		/*
		 * Move entries toward the low-numbered stale entry.
		 */
		if (lowstale >= 0 &&
		    (highstale == be32_to_cpu(btp->count) ||
		     mid - lowstale <= highstale - mid)) {
			if (mid - lowstale)
				memmove(&blp[lowstale], &blp[lowstale + 1],
					(mid - lowstale) * sizeof(*blp));
			lfloglow = MIN(lowstale, lfloglow);
			lfloghigh = MAX(mid, lfloghigh);
		}
		/*
		 * Move entries toward the high-numbered stale entry.
		 */
		else {
			ASSERT(highstale < be32_to_cpu(btp->count));
			mid++;
			if (highstale - mid)
				memmove(&blp[mid + 1], &blp[mid],
					(highstale - mid) * sizeof(*blp));
			lfloglow = MIN(mid, lfloglow);
			lfloghigh = MAX(highstale, lfloghigh);
		}
		be32_add_cpu(&btp->stale, -1);
	}
	/*
	 * Point to the new data entry.
	 */
	dep = (xfs_dir2_data_entry_t *)dup;
	/*
	 * Fill in the leaf entry.
	 */
	blp[mid].hashval = cpu_to_be32(args->hashval);
	blp[mid].address = cpu_to_be32(xfs_dir2_byte_to_dataptr(
				(char *)dep - (char *)hdr));
	xfs_dir2_block_log_leaf(tp, bp, lfloglow, lfloghigh);
	/*
	 * Mark space for the data entry used.
	 */
	xfs_dir2_data_use_free(args, bp, dup,
		(xfs_dir2_data_aoff_t)((char *)dup - (char *)hdr),
		(xfs_dir2_data_aoff_t)len, &needlog, &needscan);
	/*
	 * Create the new data entry.
	 */
	dep->inumber = cpu_to_be64(args->inumber);
	dep->namelen = args->namelen;
	memcpy(dep->name, args->name, args->namelen);
	dp->d_ops->data_put_ftype(dep, args->filetype);
	tagp = dp->d_ops->data_entry_tag_p(dep);
	*tagp = cpu_to_be16((char *)dep - (char *)hdr);
	/*
	 * Clean up the bestfree array and log the header, tail, and entry.
	 */
	if (needscan)
		xfs_dir2_data_freescan(dp, hdr, &needlog);
	if (needlog)
		xfs_dir2_data_log_header(args, bp);
	xfs_dir2_block_log_tail(tp, bp);
	xfs_dir2_data_log_entry(args, bp, dep);
	xfs_dir3_data_check(dp, bp);
	return 0;
}

/*
 * Log leaf entries from the block.
 *
 * Logs the byte range of the buffer covering leaf entries @first through
 * @last inclusive: from the first byte of blp[first] to the last byte of
 * blp[last].
 */
static void
xfs_dir2_block_log_leaf(
	xfs_trans_t		*tp,		/* transaction structure */
	struct xfs_buf		*bp,		/* block buffer */
	int			first,		/* index of first logged leaf */
	int			last)		/* index of last logged leaf */
{
	xfs_dir2_data_hdr_t	*hdr = bp->b_addr;
	xfs_dir2_leaf_entry_t	*blp;
	xfs_dir2_block_tail_t	*btp;

	btp = xfs_dir2_block_tail_p(tp->t_mountp->m_dir_geo, hdr);
	blp = xfs_dir2_block_leaf_p(btp);
	xfs_trans_log_buf(tp, bp, (uint)((char *)&blp[first] - (char *)hdr),
		(uint)((char *)&blp[last + 1] - (char *)hdr - 1));
}

/*
 * Log the block tail.
 *
 * Logs the byte range of the buffer occupied by the block tail structure,
 * from its first byte to its last byte inclusive.
 */
static void
xfs_dir2_block_log_tail(
	xfs_trans_t		*tp,		/* transaction structure */
	struct xfs_buf		*bp)		/* block buffer */
{
	xfs_dir2_data_hdr_t	*hdr = bp->b_addr;
	xfs_dir2_block_tail_t	*btp;

	btp = xfs_dir2_block_tail_p(tp->t_mountp->m_dir_geo, hdr);
	xfs_trans_log_buf(tp, bp, (uint)((char *)btp - (char *)hdr),
		(uint)((char *)(btp + 1) - (char *)hdr - 1));
}

/*
 * Look up an entry in the block.  This is the external routine,
 * xfs_dir2_block_lookup_int does the real work.
 *
 * On a successful lookup, args->inumber and args->filetype are filled in
 * from the data entry, the buffer is released, and the result of
 * xfs_dir_cilookup_result() is returned.  Any error from the internal
 * lookup is returned unchanged.
 */
int						/* error */
xfs_dir2_block_lookup(
	xfs_da_args_t		*args)		/* dir lookup arguments */
{
	xfs_dir2_data_hdr_t	*hdr;		/* block header */
	xfs_dir2_leaf_entry_t	*blp;		/* block leaf entries */
	struct xfs_buf		*bp;		/* block buffer */
	xfs_dir2_block_tail_t	*btp;		/* block tail */
	xfs_dir2_data_entry_t	*dep;		/* block data entry */
	xfs_inode_t		*dp;		/* incore inode */
	int			ent;		/* entry index */
	int			error;		/* error return value */

	trace_xfs_dir2_block_lookup(args);

	/*
	 * Get the buffer, look up the entry.
	 * If not found (ENOENT) then return, have no buffer.
	 */
	if ((error = xfs_dir2_block_lookup_int(args, &bp, &ent)))
		return error;
	dp = args->dp;
	hdr = bp->b_addr;
	xfs_dir3_data_check(dp, bp);
	btp = xfs_dir2_block_tail_p(args->geo, hdr);
	blp = xfs_dir2_block_leaf_p(btp);
	/*
	 * Get the offset from the leaf entry, to point to the data.
	 */
	dep = (xfs_dir2_data_entry_t *)((char *)hdr +
			xfs_dir2_dataptr_to_off(args->geo,
						be32_to_cpu(blp[ent].address)));
	/*
	 * Fill in inode number, CI name if appropriate, release the block.
	 */
	args->inumber = be64_to_cpu(dep->inumber);
	args->filetype = dp->d_ops->data_get_ftype(dep);
	error = xfs_dir_cilookup_result(args, dep->name, dep->namelen);
	xfs_trans_brelse(args->trans, bp);
	return error;
}

/*
 * Internal block lookup routine.
 *
 * Reads the directory block, binary-searches the leaf table for
 * args->hashval, then scans every entry with that hash comparing names
 * through the mount's compname operation.
 *
 * On success returns 0 with the buffer in *bpp (still held) and the leaf
 * index in *entno.  An exact match returns immediately; a case-insensitive
 * match is remembered and returned if no exact match follows.  On failure
 * returns the read error, or -ENOENT after releasing the buffer.
 */
static int					/* error */
xfs_dir2_block_lookup_int(
	xfs_da_args_t		*args,		/* dir lookup arguments */
	struct xfs_buf		**bpp,		/* returned block buffer */
	int			*entno)		/* returned entry number */
{
	xfs_dir2_dataptr_t	addr;		/* data entry address */
	xfs_dir2_data_hdr_t	*hdr;		/* block header */
	xfs_dir2_leaf_entry_t	*blp;		/* block leaf entries */
	struct xfs_buf		*bp;		/* block buffer */
	xfs_dir2_block_tail_t	*btp;		/* block tail */
	xfs_dir2_data_entry_t	*dep;		/* block data entry */
	xfs_inode_t		*dp;		/* incore inode */
	int			error;		/* error return value */
	xfs_dahash_t		hash;		/* found hash value */
	int			high;		/* binary search high index */
	int			low;		/* binary search low index */
	int			mid;		/* binary search current idx */
	xfs_mount_t		*mp;		/* filesystem mount point */
	xfs_trans_t		*tp;		/* transaction pointer */
	enum xfs_dacmp		cmp;		/* comparison result */

	dp = args->dp;
	tp = args->trans;
	mp = dp->i_mount;

	error = xfs_dir3_block_read(tp, dp, &bp);
	if (error)
		return error;

	hdr = bp->b_addr;
	xfs_dir3_data_check(dp, bp);
	btp = xfs_dir2_block_tail_p(args->geo, hdr);
	blp = xfs_dir2_block_leaf_p(btp);
	/*
	 * Loop doing a binary search for our hash value.
	 * Find our entry, ENOENT if it's not there.
	 */
	for (low = 0, high = be32_to_cpu(btp->count) - 1; ; ) {
		ASSERT(low <= high);
		mid = (low + high) >> 1;
		if ((hash = be32_to_cpu(blp[mid].hashval)) == args->hashval)
			break;
		if (hash < args->hashval)
			low = mid + 1;
		else
			high = mid - 1;
		if (low > high) {
			ASSERT(args->op_flags & XFS_DA_OP_OKNOENT);
			xfs_trans_brelse(tp, bp);
			return -ENOENT;
		}
	}
	/*
	 * Back up to the first one with the right hash value.
	 */
	while (mid > 0 && be32_to_cpu(blp[mid - 1].hashval) == args->hashval) {
		mid--;
	}
	/*
	 * Now loop forward through all the entries with the
	 * right hash value looking for our name.
	 */
	do {
		/* Stale leaf entries have no data entry to compare. */
		if ((addr = be32_to_cpu(blp[mid].address)) == XFS_DIR2_NULL_DATAPTR)
			continue;
		/*
		 * Get pointer to the entry from the leaf.
		 */
		dep = (xfs_dir2_data_entry_t *)
			((char *)hdr + xfs_dir2_dataptr_to_off(args->geo, addr));
		/*
		 * Compare name and if it's an exact match, return the index
		 * and buffer. If it's the first case-insensitive match, store
		 * the index and buffer and continue looking for an exact match.
		 */
		cmp = mp->m_dirnameops->compname(args, dep->name, dep->namelen);
		if (cmp != XFS_CMP_DIFFERENT && cmp != args->cmpresult) {
			args->cmpresult = cmp;
			*bpp = bp;
			*entno = mid;
			if (cmp == XFS_CMP_EXACT)
				return 0;
		}
	} while (++mid < be32_to_cpu(btp->count) &&
			be32_to_cpu(blp[mid].hashval) == hash);

	ASSERT(args->op_flags & XFS_DA_OP_OKNOENT);
	/*
	 * Here, we can only be doing a lookup (not a rename or replace).
	 * If a case-insensitive match was found earlier, return success.
	 */
	if (args->cmpresult == XFS_CMP_CASE)
		return 0;
	/*
	 * No match, release the buffer and return ENOENT.
	 */
	xfs_trans_brelse(tp, bp);
	return -ENOENT;
}

/*
 * Remove an entry from a block format directory.
 * If that makes the block small enough to fit in shortform, transform it.
 *
 * The data entry's space is marked free, the tail's stale count is
 * incremented, and the leaf entry is marked stale by setting its address
 * to XFS_DIR2_NULL_DATAPTR; the affected ranges are logged.  Returns the
 * lookup error if the entry is not found, 0 when the directory stays in
 * block format, or the result of xfs_dir2_block_to_sf() otherwise.
 */
int						/* error */
xfs_dir2_block_removename(
	xfs_da_args_t		*args)		/* directory operation args */
{
	xfs_dir2_data_hdr_t	*hdr;		/* block header */
	xfs_dir2_leaf_entry_t	*blp;		/* block leaf pointer */
	struct xfs_buf		*bp;		/* block buffer */
	xfs_dir2_block_tail_t	*btp;		/* block tail */
	xfs_dir2_data_entry_t	*dep;		/* block data entry */
	xfs_inode_t		*dp;		/* incore inode */
	int			ent;		/* block leaf entry index */
	int			error;		/* error return value */
	int			needlog;	/* need to log block header */
	int			needscan;	/* need to fixup bestfree */
	xfs_dir2_sf_hdr_t	sfh;		/* shortform header */
	int			size;		/* shortform size */
	xfs_trans_t		*tp;		/* transaction pointer */

	trace_xfs_dir2_block_removename(args);

	/*
	 * Look up the entry in the block.  Gets the buffer and entry index.
	 * It will always be there, the vnodeops level does a lookup first.
	 */
	if ((error = xfs_dir2_block_lookup_int(args, &bp, &ent))) {
		return error;
	}
	dp = args->dp;
	tp = args->trans;
	hdr = bp->b_addr;
	btp = xfs_dir2_block_tail_p(args->geo, hdr);
	blp = xfs_dir2_block_leaf_p(btp);
	/*
	 * Point to the data entry using the leaf entry.
	 */
	dep = (xfs_dir2_data_entry_t *)((char *)hdr +
			xfs_dir2_dataptr_to_off(args->geo,
						be32_to_cpu(blp[ent].address)));
	/*
	 * Mark the data entry's space free.
	 */
	needlog = needscan = 0;
	xfs_dir2_data_make_free(args, bp,
		(xfs_dir2_data_aoff_t)((char *)dep - (char *)hdr),
		dp->d_ops->data_entsize(dep->namelen), &needlog, &needscan);
	/*
	 * Fix up the block tail.
	 */
	be32_add_cpu(&btp->stale, 1);
	xfs_dir2_block_log_tail(tp, bp);
	/*
	 * Remove the leaf entry by marking it stale.
	 */
	blp[ent].address = cpu_to_be32(XFS_DIR2_NULL_DATAPTR);
	xfs_dir2_block_log_leaf(tp, bp, ent, ent);
	/*
	 * Fix up bestfree, log the header if necessary.
	 */
	if (needscan)
		xfs_dir2_data_freescan(dp, hdr, &needlog);
	if (needlog)
		xfs_dir2_data_log_header(args, bp);
	xfs_dir3_data_check(dp, bp);
	/*
	 * See if the size as a shortform is good enough.
	 */
	size = xfs_dir2_block_sfsize(dp, hdr, &sfh);
	if (size > XFS_IFORK_DSIZE(dp))
		return 0;

	/*
	 * If it works, do the conversion.
	 */
	return xfs_dir2_block_to_sf(args, bp, size, &sfh);
}

/*
 * Replace an entry in a V2 block directory.
 * Change the inode number to the new value.
 *
 * Looks the name up, overwrites the data entry's inode number and file
 * type with the values from @args, and logs the entry.  Returns the lookup
 * error if the entry is not found, 0 otherwise.
 */
int						/* error */
xfs_dir2_block_replace(
	xfs_da_args_t		*args)		/* directory operation args */
{
	xfs_dir2_data_hdr_t	*hdr;		/* block header */
	xfs_dir2_leaf_entry_t	*blp;		/* block leaf entries */
	struct xfs_buf		*bp;		/* block buffer */
	xfs_dir2_block_tail_t	*btp;		/* block tail */
	xfs_dir2_data_entry_t	*dep;		/* block data entry */
	xfs_inode_t		*dp;		/* incore inode */
	int			ent;		/* leaf entry index */
	int			error;		/* error return value */

	trace_xfs_dir2_block_replace(args);

	/*
	 * Lookup the entry in the directory.  Get buffer and entry index.
	 * This will always succeed since the caller has already done a lookup.
	 */
	if ((error = xfs_dir2_block_lookup_int(args, &bp, &ent))) {
		return error;
	}
	dp = args->dp;
	hdr = bp->b_addr;
	btp = xfs_dir2_block_tail_p(args->geo, hdr);
	blp = xfs_dir2_block_leaf_p(btp);
	/*
	 * Point to the data entry we need to change.
	 */
	dep = (xfs_dir2_data_entry_t *)((char *)hdr +
			xfs_dir2_dataptr_to_off(args->geo,
						be32_to_cpu(blp[ent].address)));
	ASSERT(be64_to_cpu(dep->inumber) != args->inumber);
	/*
	 * Change the inode number to the new value.
	 */
	dep->inumber = cpu_to_be64(args->inumber);
	dp->d_ops->data_put_ftype(dep, args->filetype);
	xfs_dir2_data_log_entry(args, bp, dep);
	xfs_dir3_data_check(dp, bp);
	return 0;
}

/*
 * Qsort comparison routine for the block leaf entries.
 */
static int					/* sort order */
xfs_dir2_block_sort(
	const void			*a,	/* first leaf entry */
	const void			*b)	/* second leaf entry */
{
	const xfs_dir2_leaf_entry_t	*la;	/* first leaf entry */
	const xfs_dir2_leaf_entry_t	*lb;	/* second leaf entry */

	la = a;
	lb = b;
888 889
	return be32_to_cpu(la->hashval) < be32_to_cpu(lb->hashval) ? -1 :
		(be32_to_cpu(la->hashval) > be32_to_cpu(lb->hashval) ? 1 : 0);
L
Linus Torvalds 已提交
890 891 892 893 894 895 896 897
}

/*
 * Convert a V2 leaf directory to a V2 block directory if possible.
 *
 * lbp is the leaf block buffer.  dbp is the buffer for the data block; when
 * it is NULL the data block is read here.
 *
 * Returns 0 both when the conversion was done and when it was not possible
 * (more than one non-empty data block, or not enough free space at the end
 * of the data block to hold the leaf entries and block tail).  Any error
 * from trimming, reading, shrinking or the follow-on shortform conversion
 * is returned as is.
 */
int						/* error */
xfs_dir2_leaf_to_block(
	xfs_da_args_t		*args,		/* operation arguments */
	struct xfs_buf		*lbp,		/* leaf buffer */
	struct xfs_buf		*dbp)		/* data buffer */
{
	xfs_inode_t		*dp = args->dp;	/* incore directory inode */
	xfs_trans_t		*tp = args->trans; /* transaction pointer */
	xfs_mount_t		*mp = dp->i_mount; /* file system mount point */
	xfs_dir2_leaf_t		*leaf = lbp->b_addr; /* leaf structure */
	xfs_dir2_leaf_tail_t	*ltp;		/* leaf tail structure */
	struct xfs_dir2_leaf_entry *ents;	/* entries in the leaf block */
	struct xfs_dir3_icleaf_hdr leafhdr;	/* incore copy of leaf header */
	xfs_dir2_data_hdr_t	*hdr;		/* block header */
	xfs_dir2_block_tail_t	*btp;		/* block tail */
	xfs_dir2_leaf_entry_t	*lep;		/* block leaf entries */
	xfs_dir2_data_unused_t	*dup;		/* unused data entry */
	xfs_dir2_sf_hdr_t	sfh;		/* shortform header */
	__be16			*bestsp;	/* leaf bests table */
	__be16			*tagp;		/* end of entry (tag) */
	int			needlog = 1;	/* need to log data header */
	int			needscan = 0;	/* need to scan for bestfree */
	int			error;		/* error return value */
	int			size;		/* bytes used */
	int			src;		/* index into leaf entries */
	int			dst;		/* index into block entries */

	trace_xfs_dir2_leaf_to_block(args);

	dp->d_ops->leaf_hdr_from_disk(&leafhdr, leaf);
	ents = dp->d_ops->leaf_ents_p(leaf);
	ltp = xfs_dir2_leaf_tail_p(args->geo, leaf);

	ASSERT(leafhdr.magic == XFS_DIR2_LEAF1_MAGIC ||
	       leafhdr.magic == XFS_DIR3_LEAF1_MAGIC);

	/*
	 * While the directory is larger than one block, try to drop trailing
	 * data blocks that are completely empty (they may have been left
	 * behind during no-space-reservation operations).  An empty block is
	 * one whose bests table entry equals the block size less the data
	 * header.  If the last block is not empty we cannot convert.
	 */
	while (dp->i_d.di_size > args->geo->blksize) {
		xfs_dir2_db_t	lastdb;		/* last data block number */
		int		hdrsz;		/* data block header size */

		hdrsz = dp->d_ops->data_entry_offset;
		bestsp = xfs_dir2_leaf_bests_p(ltp);
		lastdb = be32_to_cpu(ltp->bestcount) - 1;

		if (be16_to_cpu(bestsp[lastdb]) != args->geo->blksize - hdrsz)
			return 0;

		error = xfs_dir2_leaf_trim_data(args, lbp, lastdb);
		if (error)
			return error;
	}

	/*
	 * Get the data block if the caller did not supply it.
	 */
	if (!dbp) {
		error = xfs_dir3_data_read(tp, dp, args->geo->datablk, -1,
					   &dbp);
		if (error)
			return error;
	}
	hdr = dbp->b_addr;
	ASSERT(hdr->magic == cpu_to_be32(XFS_DIR2_DATA_MAGIC) ||
	       hdr->magic == cpu_to_be32(XFS_DIR3_DATA_MAGIC));

	/*
	 * Bytes needed for the block tail plus one leaf entry for every
	 * non-stale entry in the leaf block.
	 */
	size = (uint)sizeof(*btp) +
	       (uint)sizeof(*lep) * (leafhdr.count - leafhdr.stale);

	/*
	 * The tag in the last two bytes of the block gives the offset of the
	 * last data entry.
	 */
	tagp = (__be16 *)((char *)hdr + args->geo->blksize) - 1;
	dup = (xfs_dir2_data_unused_t *)((char *)hdr + be16_to_cpu(*tagp));

	/*
	 * That last entry must be free space and big enough, otherwise the
	 * conversion is not possible.
	 */
	if (be16_to_cpu(dup->freetag) != XFS_DIR2_DATA_FREE_TAG ||
	    be16_to_cpu(dup->length) < size)
		return 0;

	/*
	 * Start converting it to block form.
	 */
	xfs_dir3_block_init(mp, tp, dbp, dp);

	/*
	 * Claim the space at the end of the block for the leaf entries and
	 * the tail.
	 */
	xfs_dir2_data_use_free(args, dbp, dup, args->geo->blksize - size, size,
			       &needlog, &needscan);

	/*
	 * Fill in and log the block tail.
	 */
	btp = xfs_dir2_block_tail_p(args->geo, hdr);
	btp->count = cpu_to_be32(leafhdr.count - leafhdr.stale);
	btp->stale = 0;
	xfs_dir2_block_log_tail(tp, dbp);

	/*
	 * Copy the leaf entries across, leaving the stale ones behind.
	 */
	lep = xfs_dir2_block_leaf_p(btp);
	dst = 0;
	for (src = 0; src < leafhdr.count; src++) {
		if (ents[src].address != cpu_to_be32(XFS_DIR2_NULL_DATAPTR))
			lep[dst++] = ents[src];
	}
	ASSERT(dst == be32_to_cpu(btp->count));
	xfs_dir2_block_log_leaf(tp, dbp, 0, be32_to_cpu(btp->count) - 1);

	/*
	 * Rescan the bestfree table if required, then log the data block
	 * header if required.
	 */
	if (needscan)
		xfs_dir2_data_freescan(dp, hdr, &needlog);
	if (needlog)
		xfs_dir2_data_log_header(args, dbp);

	/*
	 * The old leaf block is no longer needed.
	 */
	error = xfs_da_shrink_inode(args, args->geo->leafblk, lbp);
	if (error)
		return error;

	/*
	 * If the resulting block is small enough to fit in the inode fork,
	 * carry on and convert it to shortform.
	 */
	size = xfs_dir2_block_sfsize(dp, hdr, &sfh);
	if (size > XFS_IFORK_DSIZE(dp))
		return 0;

	return xfs_dir2_block_to_sf(args, dbp, size, &sfh);
}

/*
 * Convert the shortform directory to block form.
 *
 * The inline shortform data is copied to a temporary buffer and the inline
 * fork is emptied, then directory block 0 is added and initialised in block
 * format.  Entries for "." and ".." are created, followed by every
 * shortform entry at the offset recorded for it in the shortform directory;
 * gaps between entries become unused (free) data entries.  Finally the leaf
 * entries are sorted by hash value and the leaf area and tail are logged.
 *
 * Returns 0 on success, -EIO if the inline data is too small to hold a
 * shortform header, or the error from adding or initialising the block.
 */
int						/* error */
xfs_dir2_sf_to_block(
	xfs_da_args_t		*args)		/* operation arguments */
{
	xfs_inode_t		*dp = args->dp;	/* incore directory inode */
	xfs_trans_t		*tp = args->trans; /* transaction pointer */
	xfs_mount_t		*mp = dp->i_mount; /* filesystem mount point */
	struct xfs_ifork	*ifp;		/* data fork of the directory */
	struct xfs_buf		*bp;		/* block buffer */
	struct xfs_name		name;		/* name of entry being hashed */
	xfs_dir2_db_t		blkno;		/* dir-relative block # (0) */
	xfs_dir2_data_hdr_t	*hdr;		/* block header */
	xfs_dir2_block_tail_t	*btp;		/* block tail pointer */
	xfs_dir2_leaf_entry_t	*blp;		/* block leaf entries */
	xfs_dir2_data_entry_t	*dep;		/* data entry pointer */
	xfs_dir2_data_unused_t	*dup;		/* unused entry pointer */
	xfs_dir2_sf_hdr_t	*oldsfp;	/* old shortform header  */
	xfs_dir2_sf_hdr_t	*sfp;		/* shortform header  */
	xfs_dir2_sf_entry_t	*sfep;		/* sf entry pointer */
	__be16			*tagp;		/* end of data entry */
	int			junk;		/* ignored "need log" result */
	int			endoffset;	/* end of data objects */
	int			error;		/* error return value */
	int			idx;		/* shortform entry index */
	int			needlog;	/* need to log block header */
	int			needscan;	/* need to scan block freespc */
	int			newoffset;	/* offset from current entry */
	int			offset;		/* target block offset */
	int			tailsz;		/* size of leaf + tail area */

	trace_xfs_dir2_sf_to_block(args);

	ifp = XFS_IFORK_PTR(dp, XFS_DATA_FORK);
	ASSERT(ifp->if_flags & XFS_IFINLINE);

	/*
	 * Give up if the shortform directory is way too short.
	 */
	if (dp->i_d.di_size < offsetof(xfs_dir2_sf_hdr_t, parent)) {
		ASSERT(XFS_FORCED_SHUTDOWN(mp));
		return -EIO;
	}

	oldsfp = (xfs_dir2_sf_hdr_t *)ifp->if_u1.if_data;

	ASSERT(ifp->if_bytes == dp->i_d.di_size);
	ASSERT(ifp->if_u1.if_data != NULL);
	ASSERT(dp->i_d.di_size >= xfs_dir2_sf_hdr_size(oldsfp->i8count));
	ASSERT(dp->i_d.di_nextents == 0);

	/*
	 * Take a private copy of the shortform directory, then release the
	 * incore inline data so the fork can hold extents.
	 */
	sfp = kmem_alloc(ifp->if_bytes, KM_SLEEP);
	memcpy(sfp, oldsfp, ifp->if_bytes);

	xfs_idata_realloc(dp, -ifp->if_bytes, XFS_DATA_FORK);
	xfs_bmap_local_to_extents_empty(dp, XFS_DATA_FORK);
	dp->i_d.di_size = 0;

	/*
	 * Add block 0 to the inode.
	 */
	error = xfs_dir2_grow_inode(args, XFS_DIR2_DATA_SPACE, &blkno);
	if (error)
		goto out_free_sfp;

	/*
	 * Initialize the data block, then convert it to block format.
	 */
	error = xfs_dir3_data_init(args, blkno, &bp);
	if (error)
		goto out_free_sfp;

	xfs_dir3_block_init(mp, tp, bp, dp);
	hdr = bp->b_addr;

	/*
	 * Size of the leaf + tail area: one leaf entry per shortform entry
	 * plus two more for "." and "..".
	 */
	tailsz = (uint)sizeof(*btp) +
		 (sfp->count + 2) * (uint)sizeof(xfs_dir2_leaf_entry_t);

	/*
	 * The init routine left the whole block as one free entry.  Mark the
	 * leaf and tail area at the end of it as in use.
	 */
	dup = dp->d_ops->data_unused_p(hdr);
	needlog = 0;
	needscan = 0;
	xfs_dir2_data_use_free(args, bp, dup, args->geo->blksize - tailsz,
			       tailsz, &needlog, &needscan);
	ASSERT(needscan == 0);

	/*
	 * Fill in the tail.
	 */
	btp = xfs_dir2_block_tail_p(args->geo, hdr);
	btp->count = cpu_to_be32(sfp->count + 2);	/* ., .. */
	btp->stale = 0;
	blp = xfs_dir2_block_leaf_p(btp);
	endoffset = (uint)((char *)blp - (char *)hdr);

	/*
	 * Take the remaining free space off the books; it is managed by
	 * hand below.
	 */
	xfs_dir2_data_use_free(args, bp, dup,
			       (xfs_dir2_data_aoff_t)((char *)dup - (char *)hdr),
			       be16_to_cpu(dup->length), &needlog, &needscan);

	/*
	 * Create the "." entry, which refers to the directory itself.
	 */
	dep = dp->d_ops->data_dot_entry_p(hdr);
	dep->inumber = cpu_to_be64(dp->i_ino);
	dep->namelen = 1;
	dep->name[0] = '.';
	dp->d_ops->data_put_ftype(dep, XFS_DIR3_FT_DIR);
	tagp = dp->d_ops->data_entry_tag_p(dep);
	*tagp = cpu_to_be16((char *)dep - (char *)hdr);
	xfs_dir2_data_log_entry(args, bp, dep);
	blp[0].hashval = cpu_to_be32(xfs_dir_hash_dot);
	blp[0].address = cpu_to_be32(xfs_dir2_byte_to_dataptr(
					(char *)dep - (char *)hdr));

	/*
	 * Create the ".." entry from the parent inode number held in the
	 * shortform header.
	 */
	dep = dp->d_ops->data_dotdot_entry_p(hdr);
	dep->inumber = cpu_to_be64(dp->d_ops->sf_get_parent_ino(sfp));
	dep->namelen = 2;
	dep->name[0] = '.';
	dep->name[1] = '.';
	dp->d_ops->data_put_ftype(dep, XFS_DIR3_FT_DIR);
	tagp = dp->d_ops->data_entry_tag_p(dep);
	*tagp = cpu_to_be16((char *)dep - (char *)hdr);
	xfs_dir2_data_log_entry(args, bp, dep);
	blp[1].hashval = cpu_to_be32(xfs_dir_hash_dotdot);
	blp[1].address = cpu_to_be32(xfs_dir2_byte_to_dataptr(
					(char *)dep - (char *)hdr));

	/*
	 * Walk the shortform entries.  Each one must land at the offset
	 * recorded for it in the shortform directory, so any gap in front of
	 * it is filled with an unused entry.  sfep is NULL once the list is
	 * exhausted, at which point the rest of the space up to the leaf
	 * area becomes one last hole.
	 */
	offset = dp->d_ops->data_first_offset;
	idx = 0;
	sfep = sfp->count ? xfs_dir2_sf_firstentry(sfp) : NULL;

	while (offset < endoffset) {
		newoffset = sfep ? (int)xfs_dir2_sf_get_offset(sfep) :
				   endoffset;

		/*
		 * There should be a hole here, make one.
		 */
		if (offset < newoffset) {
			dup = (xfs_dir2_data_unused_t *)((char *)hdr + offset);
			dup->freetag = cpu_to_be16(XFS_DIR2_DATA_FREE_TAG);
			dup->length = cpu_to_be16(newoffset - offset);
			*xfs_dir2_data_unused_tag_p(dup) =
				cpu_to_be16(((char *)dup - (char *)hdr));
			xfs_dir2_data_log_unused(args, bp, dup);
			xfs_dir2_data_freeinsert(hdr,
					dp->d_ops->data_bestfree_p(hdr),
					dup, &junk);
			offset += be16_to_cpu(dup->length);
			continue;
		}

		/*
		 * Copy a real entry into the data area ...
		 */
		dep = (xfs_dir2_data_entry_t *)((char *)hdr + newoffset);
		dep->inumber = cpu_to_be64(dp->d_ops->sf_get_ino(sfp, sfep));
		dep->namelen = sfep->namelen;
		dp->d_ops->data_put_ftype(dep, dp->d_ops->sf_get_ftype(sfep));
		memcpy(dep->name, sfep->name, dep->namelen);
		tagp = dp->d_ops->data_entry_tag_p(dep);
		*tagp = cpu_to_be16((char *)dep - (char *)hdr);
		xfs_dir2_data_log_entry(args, bp, dep);

		/*
		 * ... and add its leaf entry after the two used for "." and
		 * "..".
		 */
		name.name = sfep->name;
		name.len = sfep->namelen;
		blp[2 + idx].hashval =
			cpu_to_be32(mp->m_dirnameops->hashname(&name));
		blp[2 + idx].address = cpu_to_be32(xfs_dir2_byte_to_dataptr(
						(char *)dep - (char *)hdr));

		/*
		 * The next object starts right after this entry's tag.
		 */
		offset = (int)((char *)(tagp + 1) - (char *)hdr);

		idx++;
		sfep = (idx == sfp->count) ?
				NULL : dp->d_ops->sf_nextentry(sfp, sfep);
	}

	/* Done with the temporary buffer */
	kmem_free(sfp);

	/*
	 * Sort the leaf entries by hash value.
	 */
	xfs_sort(blp, be32_to_cpu(btp->count), sizeof(*blp),
		 xfs_dir2_block_sort);

	/*
	 * Log the leaf entry area and tail.
	 * Already logged the header in data_init, ignore needlog.
	 */
	ASSERT(needscan == 0);
	xfs_dir2_block_log_leaf(tp, bp, 0, be32_to_cpu(btp->count) - 1);
	xfs_dir2_block_log_tail(tp, bp);
	xfs_dir3_data_check(dp, bp);
	return 0;

out_free_sfp:
	/* Error before the copy was consumed: release it and bail out. */
	kmem_free(sfp);
	return error;
}