/*
 * Copyright (c) 2000-2003,2005 Silicon Graphics, Inc.
 * Copyright (c) 2013 Red Hat, Inc.
 * All Rights Reserved.
 *
 * This program is free software; you can redistribute it and/or
 * modify it under the terms of the GNU General Public License as
 * published by the Free Software Foundation.
 *
 * This program is distributed in the hope that it would be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program; if not, write the Free Software Foundation,
 * Inc.,  51 Franklin St, Fifth Floor, Boston, MA  02110-1301  USA
 */
#include "xfs.h"
20
#include "xfs_fs.h"
21
#include "xfs_format.h"
22 23
#include "xfs_log_format.h"
#include "xfs_trans_resv.h"
L
Linus Torvalds 已提交
24
#include "xfs_mount.h"
25
#include "xfs_da_format.h"
26
#include "xfs_da_btree.h"
L
Linus Torvalds 已提交
27
#include "xfs_inode.h"
28
#include "xfs_trans.h"
29
#include "xfs_inode_item.h"
30
#include "xfs_bmap.h"
31
#include "xfs_buf_item.h"
32
#include "xfs_dir2.h"
C
Christoph Hellwig 已提交
33
#include "xfs_dir2_priv.h"
L
Linus Torvalds 已提交
34
#include "xfs_error.h"
C
Christoph Hellwig 已提交
35
#include "xfs_trace.h"
36
#include "xfs_cksum.h"
37
#include "xfs_log.h"
L
Linus Torvalds 已提交
38 39 40 41

/*
 * Forward declarations of the file-local helpers defined further down.
 */
static void
xfs_dir2_block_log_leaf(
	xfs_trans_t		*tp,
	struct xfs_buf		*bp,
	int			first,
	int			last);

static void
xfs_dir2_block_log_tail(
	xfs_trans_t		*tp,
	struct xfs_buf		*bp);

static int
xfs_dir2_block_lookup_int(
	xfs_da_args_t		*args,
	struct xfs_buf		**bpp,
	int			*entno);

static int
xfs_dir2_block_sort(
	const void		*a,
	const void		*b);

49 50 51 52 53 54 55 56
/* Name hashes of "." and "..", filled in once by xfs_dir_startup(). */
static xfs_dahash_t xfs_dir_hash_dot;
static xfs_dahash_t xfs_dir_hash_dotdot;

/*
 * One-time startup routine called from xfs_init(): hash the one-byte
 * name "." and the two-byte name ".." and stash the results in the
 * file-scope variables above.
 */
void
xfs_dir_startup(void)
{
	const char	*dot = ".";
	const char	*dotdot = "..";

	xfs_dir_hash_dot = xfs_da_hashname((unsigned char *)dot, 1);
	xfs_dir_hash_dotdot = xfs_da_hashname((unsigned char *)dotdot, 2);
}

61 62
static bool
xfs_dir3_block_verify(
63 64 65
	struct xfs_buf		*bp)
{
	struct xfs_mount	*mp = bp->b_target->bt_mount;
66 67 68 69 70
	struct xfs_dir3_blk_hdr	*hdr3 = bp->b_addr;

	if (xfs_sb_version_hascrc(&mp->m_sb)) {
		if (hdr3->magic != cpu_to_be32(XFS_DIR3_BLOCK_MAGIC))
			return false;
71
		if (!uuid_equal(&hdr3->uuid, &mp->m_sb.sb_meta_uuid))
72 73 74
			return false;
		if (be64_to_cpu(hdr3->blkno) != bp->b_bn)
			return false;
75 76
		if (!xfs_log_check_lsn(mp, be64_to_cpu(hdr3->lsn)))
			return false;
77 78 79
	} else {
		if (hdr3->magic != cpu_to_be32(XFS_DIR2_BLOCK_MAGIC))
			return false;
80
	}
81
	if (__xfs_dir3_data_check(NULL, bp))
82 83
		return false;
	return true;
84
}
85

86
static void
87
xfs_dir3_block_read_verify(
88 89
	struct xfs_buf	*bp)
{
90 91
	struct xfs_mount	*mp = bp->b_target->bt_mount;

92 93
	if (xfs_sb_version_hascrc(&mp->m_sb) &&
	     !xfs_buf_verify_cksum(bp, XFS_DIR3_DATA_CRC_OFF))
D
Dave Chinner 已提交
94
		xfs_buf_ioerror(bp, -EFSBADCRC);
95
	else if (!xfs_dir3_block_verify(bp))
D
Dave Chinner 已提交
96
		xfs_buf_ioerror(bp, -EFSCORRUPTED);
97 98 99

	if (bp->b_error)
		xfs_verifier_error(bp);
100 101
}

102
static void
103
xfs_dir3_block_write_verify(
104 105
	struct xfs_buf	*bp)
{
106 107 108 109 110
	struct xfs_mount	*mp = bp->b_target->bt_mount;
	struct xfs_buf_log_item	*bip = bp->b_fspriv;
	struct xfs_dir3_blk_hdr	*hdr3 = bp->b_addr;

	if (!xfs_dir3_block_verify(bp)) {
D
Dave Chinner 已提交
111
		xfs_buf_ioerror(bp, -EFSCORRUPTED);
112
		xfs_verifier_error(bp);
113 114 115 116 117 118 119 120 121
		return;
	}

	if (!xfs_sb_version_hascrc(&mp->m_sb))
		return;

	if (bip)
		hdr3->lsn = cpu_to_be64(bip->bli_item.li_lsn);

122
	xfs_buf_update_cksum(bp, XFS_DIR3_DATA_CRC_OFF);
123 124
}

125
const struct xfs_buf_ops xfs_dir3_block_buf_ops = {
126
	.name = "xfs_dir3_block",
127 128
	.verify_read = xfs_dir3_block_read_verify,
	.verify_write = xfs_dir3_block_write_verify,
129 130
};

131
int
132
xfs_dir3_block_read(
133 134 135 136 137
	struct xfs_trans	*tp,
	struct xfs_inode	*dp,
	struct xfs_buf		**bpp)
{
	struct xfs_mount	*mp = dp->i_mount;
138
	int			err;
139

140
	err = xfs_da_read_buf(tp, dp, mp->m_dir_geo->datablk, -1, bpp,
141
				XFS_DATA_FORK, &xfs_dir3_block_buf_ops);
142
	if (!err && tp)
143
		xfs_trans_buf_set_type(tp, *bpp, XFS_BLFT_DIR_BLOCK_BUF);
144
	return err;
145 146 147 148 149
}

static void
xfs_dir3_block_init(
	struct xfs_mount	*mp,
150
	struct xfs_trans	*tp,
151 152 153 154 155 156
	struct xfs_buf		*bp,
	struct xfs_inode	*dp)
{
	struct xfs_dir3_blk_hdr *hdr3 = bp->b_addr;

	bp->b_ops = &xfs_dir3_block_buf_ops;
157
	xfs_trans_buf_set_type(tp, bp, XFS_BLFT_DIR_BLOCK_BUF);
158 159 160 161 162 163

	if (xfs_sb_version_hascrc(&mp->m_sb)) {
		memset(hdr3, 0, sizeof(*hdr3));
		hdr3->magic = cpu_to_be32(XFS_DIR3_BLOCK_MAGIC);
		hdr3->blkno = cpu_to_be64(bp->b_bn);
		hdr3->owner = cpu_to_be64(dp->i_ino);
164
		uuid_copy(&hdr3->uuid, &mp->m_sb.sb_meta_uuid);
165 166 167 168
		return;

	}
	hdr3->magic = cpu_to_be32(XFS_DIR2_BLOCK_MAGIC);
169 170 171 172
}

/*
 * Work out where a new entry of @len bytes (plus its leaf slot) could go.
 *
 * Outputs:
 *   *compact  - set to 1 when the leaf table must be compacted first,
 *               otherwise 0.
 *   *tagpp    - the tag immediately before the first leaf entry, or NULL
 *               when that tag was never looked at.
 *   *dupp     - the location chosen for the new data entry, or NULL when
 *               nothing suitable was found (the caller treats NULL as
 *               "no space").
 *   *enddupp  - in the no-stale case, the data object just before the
 *               first leaf entry; NULL otherwise.
 */
static void
xfs_dir2_block_need_space(
	struct xfs_inode		*dp,
	struct xfs_dir2_data_hdr	*hdr,
	struct xfs_dir2_block_tail	*btp,
	struct xfs_dir2_leaf_entry	*blp,
	__be16				**tagpp,
	struct xfs_dir2_data_unused	**dupp,
	struct xfs_dir2_data_unused	**enddupp,
	int				*compact,
	int				len)
{
	struct xfs_dir2_data_free	*bf;
	__be16				*tagp = NULL;
	struct xfs_dir2_data_unused	*dup = NULL;
	struct xfs_dir2_data_unused	*enddup = NULL;

	*compact = 0;
	bf = dp->d_ops->data_bestfree_p(hdr);

	/*
	 * If there are stale entries we'll use one for the leaf.
	 */
	if (btp->stale) {
		if (be16_to_cpu(bf[0].length) >= len) {
			/*
			 * The biggest free region is large enough for the
			 * data entry, so compaction can be avoided.
			 */
			dup = (xfs_dir2_data_unused_t *)
			      ((char *)hdr + be16_to_cpu(bf[0].offset));
			goto out;
		}

		/*
		 * Will need to compact to make this work.
		 * Tag just before the first leaf entry.
		 */
		*compact = 1;
		tagp = (__be16 *)blp - 1;

		/* Data object just before the first leaf entry.  */
		dup = (xfs_dir2_data_unused_t *)((char *)hdr + be16_to_cpu(*tagp));

		/*
		 * If that object is free, it is usable when its length plus
		 * the space of all stale leaf slots but one reaches len.
		 * If it's not free then the data will go where the
		 * leaf data starts now, if it works at all.
		 */
		if (be16_to_cpu(dup->freetag) == XFS_DIR2_DATA_FREE_TAG) {
			if (be16_to_cpu(dup->length) + (be32_to_cpu(btp->stale) - 1) *
			    (uint)sizeof(*blp) < len)
				dup = NULL;
		} else if ((be32_to_cpu(btp->stale) - 1) * (uint)sizeof(*blp) < len)
			dup = NULL;
		else
			dup = (xfs_dir2_data_unused_t *)blp;
		goto out;
	}

	/*
	 * No stale entries, so just use free space.
	 * Tag just before the first leaf entry.
	 */
	tagp = (__be16 *)blp - 1;

	/* Data object just before the first leaf entry.  */
	enddup = (xfs_dir2_data_unused_t *)((char *)hdr + be16_to_cpu(*tagp));

	/*
	 * If it's not free then can't do this add without cleaning up:
	 * the space before the first leaf entry needs to be free so it
	 * can be expanded to hold the pointer to the new entry.
	 * In that case dup stays NULL.
	 */
	if (be16_to_cpu(enddup->freetag) == XFS_DIR2_DATA_FREE_TAG) {
		/*
		 * Check out the biggest freespace and see if it's the same one.
		 */
		dup = (xfs_dir2_data_unused_t *)
		      ((char *)hdr + be16_to_cpu(bf[0].offset));
		if (dup != enddup) {
			/*
			 * Not the same free entry, just check its length.
			 */
			if (be16_to_cpu(dup->length) < len)
				dup = NULL;
			goto out;
		}

		/*
		 * It is the biggest freespace, can it hold the leaf too?
		 */
		if (be16_to_cpu(dup->length) < len + (uint)sizeof(*blp)) {
			/*
			 * No, it cannot hold both the entry and the new leaf
			 * slot.  Use the second-largest free region for the
			 * entry instead, if that one is big enough.
			 */
			if (be16_to_cpu(bf[1].length) >= len)
				dup = (xfs_dir2_data_unused_t *)
				      ((char *)hdr + be16_to_cpu(bf[1].offset));
			else
				dup = NULL;
		}
	}
out:
	*tagpp = tagp;
	*dupp = dup;
	*enddupp = enddup;
}

/*
 * compact the leaf entries.
 * Leave the highest-numbered stale entry stale.
 * XXX should be the one closest to mid but mid is not yet computed.
 */
static void
xfs_dir2_block_compact(
285
	struct xfs_da_args		*args,
286 287 288 289 290 291 292 293 294 295 296 297 298 299 300 301 302 303 304 305 306 307 308 309 310 311 312 313 314 315 316 317
	struct xfs_buf			*bp,
	struct xfs_dir2_data_hdr	*hdr,
	struct xfs_dir2_block_tail	*btp,
	struct xfs_dir2_leaf_entry	*blp,
	int				*needlog,
	int				*lfloghigh,
	int				*lfloglow)
{
	int			fromidx;	/* source leaf index */
	int			toidx;		/* target leaf index */
	int			needscan = 0;
	int			highstale;	/* high stale index */

	fromidx = toidx = be32_to_cpu(btp->count) - 1;
	highstale = *lfloghigh = -1;
	for (; fromidx >= 0; fromidx--) {
		if (blp[fromidx].address == cpu_to_be32(XFS_DIR2_NULL_DATAPTR)) {
			if (highstale == -1)
				highstale = toidx;
			else {
				if (*lfloghigh == -1)
					*lfloghigh = toidx;
				continue;
			}
		}
		if (fromidx < toidx)
			blp[toidx] = blp[fromidx];
		toidx--;
	}
	*lfloglow = toidx + 1 - (be32_to_cpu(btp->stale) - 1);
	*lfloghigh -= be32_to_cpu(btp->stale) - 1;
	be32_add_cpu(&btp->count, -(be32_to_cpu(btp->stale) - 1));
318
	xfs_dir2_data_make_free(args, bp,
319 320 321 322 323 324 325 326 327
		(xfs_dir2_data_aoff_t)((char *)blp - (char *)hdr),
		(xfs_dir2_data_aoff_t)((be32_to_cpu(btp->stale) - 1) * sizeof(*blp)),
		needlog, &needscan);
	btp->stale = cpu_to_be32(1);
	/*
	 * If we now need to rebuild the bestfree map, do so.
	 * This needs to happen before the next call to use_free.
	 */
	if (needscan)
328
		xfs_dir2_data_freescan(args->dp, hdr, needlog);
329 330
}

L
Linus Torvalds 已提交
331 332 333 334 335 336 337
/*
 * Add an entry to a block directory.
 *
 * Reads the single directory block, asks xfs_dir2_block_need_space()
 * where the entry could go, and then either:
 *   - for XFS_DA_OP_JUSTCHECK, releases the buffer and reports whether
 *     space exists (0 or -ENOSPC);
 *   - when no space exists, returns -ENOSPC if args->total is zero, else
 *     converts the directory to leaf format and adds the name there;
 *   - otherwise inserts a leaf entry in hash order (reusing a stale slot
 *     or growing the table down by one), writes the data entry, and logs
 *     everything that changed.
 *
 * Returns 0 on success or a negative errno.
 */
int						/* error */
xfs_dir2_block_addname(
	xfs_da_args_t		*args)		/* directory op arguments */
{
	xfs_dir2_data_hdr_t	*hdr;		/* block header */
	xfs_dir2_leaf_entry_t	*blp;		/* block leaf entries */
	struct xfs_buf		*bp;		/* buffer for block */
	xfs_dir2_block_tail_t	*btp;		/* block tail */
	int			compact;	/* need to compact leaf ents */
	xfs_dir2_data_entry_t	*dep;		/* block data entry */
	xfs_inode_t		*dp;		/* directory inode */
	xfs_dir2_data_unused_t	*dup;		/* block unused entry */
	int			error;		/* error return value */
	xfs_dir2_data_unused_t	*enddup=NULL;	/* unused at end of data */
	xfs_dahash_t		hash;		/* hash value of found entry */
	int			high;		/* high index for binary srch */
	int			highstale;	/* high stale index */
	int			lfloghigh=0;	/* last final leaf to log */
	int			lfloglow=0;	/* first final leaf to log */
	int			len;		/* length of the new entry */
	int			low;		/* low index for binary srch */
	int			lowstale;	/* low stale index */
	int			mid=0;		/* midpoint for binary srch */
	int			needlog;	/* need to log header */
	int			needscan;	/* need to rescan freespace */
	__be16			*tagp;		/* pointer to tag value */
	xfs_trans_t		*tp;		/* transaction structure */

	trace_xfs_dir2_block_addname(args);

	dp = args->dp;
	tp = args->trans;

	/* Read the (one and only) directory block into bp. */
	error = xfs_dir3_block_read(tp, dp, &bp);
	if (error)
		return error;

	len = dp->d_ops->data_entsize(args->namelen);

	/*
	 * Set up pointers to parts of the block.
	 */
	hdr = bp->b_addr;
	btp = xfs_dir2_block_tail_p(args->geo, hdr);
	blp = xfs_dir2_block_leaf_p(btp);

	/*
	 * Find out if we can reuse stale entries or whether we need extra
	 * space for entry and new leaf.
	 */
	xfs_dir2_block_need_space(dp, hdr, btp, blp, &tagp, &dup,
				  &enddup, &compact, len);

	/*
	 * Done everything we need for a space check now.
	 */
	if (args->op_flags & XFS_DA_OP_JUSTCHECK) {
		xfs_trans_brelse(tp, bp);
		if (!dup)
			return -ENOSPC;
		return 0;
	}

	/*
	 * If we don't have space for the new entry & leaf ...
	 */
	if (!dup) {
		/* Don't have a space reservation: return no-space.  */
		if (args->total == 0)
			return -ENOSPC;
		/*
		 * Convert to the next larger format.
		 * Then add the new entry in that format.
		 */
		error = xfs_dir2_block_to_leaf(args, bp);
		if (error)
			return error;
		return xfs_dir2_leaf_addname(args);
	}

	needlog = needscan = 0;

	/*
	 * If need to compact the leaf entries, do it now.
	 */
	if (compact) {
		xfs_dir2_block_compact(args, bp, hdr, btp, blp, &needlog,
				      &lfloghigh, &lfloglow);
		/* recalculate blp post-compaction */
		blp = xfs_dir2_block_leaf_p(btp);
	} else if (btp->stale) {
		/*
		 * Set leaf logging boundaries to impossible state.
		 * For the no-stale case they're set explicitly.
		 */
		lfloglow = be32_to_cpu(btp->count);
		lfloghigh = -1;
	}

	/*
	 * Find the slot that's first lower than our hash value, -1 if none.
	 */
	for (low = 0, high = be32_to_cpu(btp->count) - 1; low <= high; ) {
		mid = (low + high) >> 1;
		hash = be32_to_cpu(blp[mid].hashval);
		if (hash == args->hashval)
			break;
		if (hash < args->hashval)
			low = mid + 1;
		else
			high = mid - 1;
	}
	/* Step back past every entry whose hash is >= ours. */
	while (mid >= 0 && be32_to_cpu(blp[mid].hashval) >= args->hashval)
		mid--;

	if (!btp->stale) {
		/*
		 * No stale entries, will use enddup space to hold new leaf.
		 * Mark the space needed for the new leaf entry, now in use:
		 * it is the last sizeof(*blp) bytes of enddup.
		 */
		xfs_dir2_data_use_free(args, bp, enddup,
			(xfs_dir2_data_aoff_t)
			((char *)enddup - (char *)hdr + be16_to_cpu(enddup->length) -
			 sizeof(*blp)),
			(xfs_dir2_data_aoff_t)sizeof(*blp),
			&needlog, &needscan);
		/*
		 * Update the tail (entry count).
		 */
		be32_add_cpu(&btp->count, 1);
		/*
		 * If we now need to rebuild the bestfree map, do so.
		 * This needs to happen before the next call to use_free.
		 */
		if (needscan) {
			xfs_dir2_data_freescan(dp, hdr, &needlog);
			needscan = 0;
		}
		/*
		 * Adjust pointer to the first leaf entry, we're about to move
		 * the table up one to open up space for the new leaf entry.
		 * Then adjust our index to match.
		 */
		blp--;
		mid++;
		if (mid)
			memmove(blp, &blp[1], mid * sizeof(*blp));
		lfloglow = 0;
		lfloghigh = mid;
	} else {
		/*
		 * Use a stale leaf for our new entry.  Look downwards from
		 * mid for the nearest stale slot ...
		 */
		for (lowstale = mid;
		     lowstale >= 0 &&
			blp[lowstale].address !=
			cpu_to_be32(XFS_DIR2_NULL_DATAPTR);
		     lowstale--)
			continue;
		/*
		 * ... and upwards from mid + 1, giving up once the search
		 * has gone at least as far as the low stale slot is away.
		 */
		for (highstale = mid + 1;
		     highstale < be32_to_cpu(btp->count) &&
			blp[highstale].address !=
			cpu_to_be32(XFS_DIR2_NULL_DATAPTR) &&
			(lowstale < 0 || mid - lowstale > highstale - mid);
		     highstale++)
			continue;
		if (lowstale >= 0 &&
		    (highstale == be32_to_cpu(btp->count) ||
		     mid - lowstale <= highstale - mid)) {
			/*
			 * Move entries toward the low-numbered stale entry.
			 */
			if (mid - lowstale)
				memmove(&blp[lowstale], &blp[lowstale + 1],
					(mid - lowstale) * sizeof(*blp));
			lfloglow = MIN(lowstale, lfloglow);
			lfloghigh = MAX(mid, lfloghigh);
		} else {
			/*
			 * Move entries toward the high-numbered stale entry.
			 */
			ASSERT(highstale < be32_to_cpu(btp->count));
			mid++;
			if (highstale - mid)
				memmove(&blp[mid + 1], &blp[mid],
					(highstale - mid) * sizeof(*blp));
			lfloglow = MIN(mid, lfloglow);
			lfloghigh = MAX(highstale, lfloghigh);
		}
		be32_add_cpu(&btp->stale, -1);
	}
	/*
	 * Point to the new data entry.
	 */
	dep = (xfs_dir2_data_entry_t *)dup;
	/*
	 * Fill in the leaf entry.
	 */
	blp[mid].hashval = cpu_to_be32(args->hashval);
	blp[mid].address = cpu_to_be32(xfs_dir2_byte_to_dataptr(
				(char *)dep - (char *)hdr));
	xfs_dir2_block_log_leaf(tp, bp, lfloglow, lfloghigh);
	/*
	 * Mark space for the data entry used.
	 */
	xfs_dir2_data_use_free(args, bp, dup,
		(xfs_dir2_data_aoff_t)((char *)dup - (char *)hdr),
		(xfs_dir2_data_aoff_t)len, &needlog, &needscan);
	/*
	 * Create the new data entry.
	 */
	dep->inumber = cpu_to_be64(args->inumber);
	dep->namelen = args->namelen;
	memcpy(dep->name, args->name, args->namelen);
	dp->d_ops->data_put_ftype(dep, args->filetype);
	tagp = dp->d_ops->data_entry_tag_p(dep);
	*tagp = cpu_to_be16((char *)dep - (char *)hdr);
	/*
	 * Clean up the bestfree array and log the header, tail, and entry.
	 */
	if (needscan)
		xfs_dir2_data_freescan(dp, hdr, &needlog);
	if (needlog)
		xfs_dir2_data_log_header(args, bp);
	xfs_dir2_block_log_tail(tp, bp);
	xfs_dir2_data_log_entry(args, bp, dep);
	xfs_dir3_data_check(dp, bp);
	return 0;
}

/*
 * Log the leaf entries with indices first..last (inclusive) of the block.
 */
static void
xfs_dir2_block_log_leaf(
	xfs_trans_t		*tp,		/* transaction structure */
	struct xfs_buf		*bp,		/* block buffer */
	int			first,		/* index of first logged leaf */
	int			last)		/* index of last logged leaf */
{
	xfs_dir2_data_hdr_t	*hdr = bp->b_addr;
	xfs_dir2_block_tail_t	*btp =
		xfs_dir2_block_tail_p(tp->t_mountp->m_dir_geo, hdr);
	xfs_dir2_leaf_entry_t	*blp = xfs_dir2_block_leaf_p(btp);
	uint			first_byte;	/* offset of first leaf byte */
	uint			last_byte;	/* offset of last leaf byte */

	first_byte = (uint)((char *)&blp[first] - (char *)hdr);
	last_byte = (uint)((char *)&blp[last + 1] - (char *)hdr - 1);
	xfs_trans_log_buf(tp, bp, first_byte, last_byte);
}

/*
 * Log the block tail structure of the block.
 */
static void
xfs_dir2_block_log_tail(
	xfs_trans_t		*tp,		/* transaction structure */
	struct xfs_buf		*bp)		/* block buffer */
{
	xfs_dir2_data_hdr_t	*hdr = bp->b_addr;
	xfs_dir2_block_tail_t	*btp =
		xfs_dir2_block_tail_p(tp->t_mountp->m_dir_geo, hdr);
	uint			first_byte;	/* offset of first tail byte */
	uint			last_byte;	/* offset of last tail byte */

	first_byte = (uint)((char *)btp - (char *)hdr);
	last_byte = (uint)((char *)(btp + 1) - (char *)hdr - 1);
	xfs_trans_log_buf(tp, bp, first_byte, last_byte);
}

/*
 * Look up an entry in the block.  This is the external routine;
 * xfs_dir2_block_lookup_int() does the real work.
 *
 * On a hit the inode number and file type of the entry are stored in
 * args, the result of xfs_dir_cilookup_result() becomes the return value,
 * and the buffer is released.  On a miss the error from the internal
 * lookup is returned and there is no buffer to release.
 */
int						/* error */
xfs_dir2_block_lookup(
	xfs_da_args_t		*args)		/* dir lookup arguments */
{
	struct xfs_buf		*bp;		/* block buffer */
	xfs_dir2_data_hdr_t	*hdr;		/* block header */
	xfs_dir2_block_tail_t	*btp;		/* block tail */
	xfs_dir2_leaf_entry_t	*blp;		/* block leaf entries */
	xfs_dir2_data_entry_t	*dep;		/* block data entry */
	xfs_inode_t		*dp;		/* incore inode */
	int			ent;		/* entry index */
	int			error;		/* error return value */

	trace_xfs_dir2_block_lookup(args);

	/* Get the buffer and the index of the matching leaf entry. */
	error = xfs_dir2_block_lookup_int(args, &bp, &ent);
	if (error)
		return error;

	dp = args->dp;
	hdr = bp->b_addr;
	xfs_dir3_data_check(dp, bp);
	btp = xfs_dir2_block_tail_p(args->geo, hdr);
	blp = xfs_dir2_block_leaf_p(btp);

	/* The leaf entry's address gives the data entry's offset. */
	dep = (xfs_dir2_data_entry_t *)((char *)hdr +
			xfs_dir2_dataptr_to_off(args->geo,
						be32_to_cpu(blp[ent].address)));

	/* Fill in inode number, CI name if appropriate, release the block. */
	args->inumber = be64_to_cpu(dep->inumber);
	args->filetype = dp->d_ops->data_get_ftype(dep);
	error = xfs_dir_cilookup_result(args, dep->name, dep->namelen);
	xfs_trans_brelse(args->trans, bp);
	return error;
}

/*
 * Internal block lookup routine.
 *
 * Reads the directory block, binary-searches the leaf table for
 * args->hashval, then scans every leaf entry carrying that hash and
 * compares names through mp->m_dirnameops->compname().
 *
 * On success (return 0) *bpp holds the still-referenced buffer and
 * *entno the index of the matching leaf entry; args->cmpresult records
 * whether the match was exact or case-insensitive.  When nothing matches,
 * the buffer is released and -ENOENT is returned.  A read failure returns
 * the error from xfs_dir3_block_read().
 */
static int					/* error */
xfs_dir2_block_lookup_int(
	xfs_da_args_t		*args,		/* dir lookup arguments */
	struct xfs_buf		**bpp,		/* returned block buffer */
	int			*entno)		/* returned entry number */
{
	xfs_dir2_dataptr_t	addr;		/* data entry address */
	xfs_dir2_data_hdr_t	*hdr;		/* block header */
	xfs_dir2_leaf_entry_t	*blp;		/* block leaf entries */
	struct xfs_buf		*bp;		/* block buffer */
	xfs_dir2_block_tail_t	*btp;		/* block tail */
	xfs_dir2_data_entry_t	*dep;		/* block data entry */
	xfs_inode_t		*dp;		/* incore inode */
	int			error;		/* error return value */
	xfs_dahash_t		hash;		/* found hash value */
	int			high;		/* binary search high index */
	int			low;		/* binary search low index */
	int			mid;		/* binary search current idx */
	xfs_mount_t		*mp;		/* filesystem mount point */
	xfs_trans_t		*tp;		/* transaction pointer */
	enum xfs_dacmp		cmp;		/* comparison result */

	dp = args->dp;
	tp = args->trans;
	mp = dp->i_mount;

	error = xfs_dir3_block_read(tp, dp, &bp);
	if (error)
		return error;

	hdr = bp->b_addr;
	xfs_dir3_data_check(dp, bp);
	btp = xfs_dir2_block_tail_p(args->geo, hdr);
	blp = xfs_dir2_block_leaf_p(btp);

	/*
	 * Loop doing a binary search for our hash value.
	 * Find our entry, ENOENT if it's not there.
	 *
	 * The range is tested before blp[] is indexed so that an empty
	 * leaf table (count == 0) ends in ENOENT instead of a read at
	 * index -1.
	 */
	low = 0;
	high = be32_to_cpu(btp->count) - 1;
	for (;;) {
		if (low > high) {
			ASSERT(args->op_flags & XFS_DA_OP_OKNOENT);
			xfs_trans_brelse(tp, bp);
			return -ENOENT;
		}
		mid = (low + high) >> 1;
		hash = be32_to_cpu(blp[mid].hashval);
		if (hash == args->hashval)
			break;
		if (hash < args->hashval)
			low = mid + 1;
		else
			high = mid - 1;
	}

	/*
	 * Back up to the first one with the right hash value.
	 */
	while (mid > 0 && be32_to_cpu(blp[mid - 1].hashval) == args->hashval)
		mid--;

	/*
	 * Now loop forward through all the entries with the
	 * right hash value looking for our name.
	 */
	do {
		/* Stale leaf entries carry no data entry; skip them. */
		addr = be32_to_cpu(blp[mid].address);
		if (addr == XFS_DIR2_NULL_DATAPTR)
			continue;
		/*
		 * Get pointer to the entry from the leaf.
		 */
		dep = (xfs_dir2_data_entry_t *)
			((char *)hdr + xfs_dir2_dataptr_to_off(args->geo, addr));
		/*
		 * Compare name and if it's an exact match, return the index
		 * and buffer. If it's the first case-insensitive match, store
		 * the index and buffer and continue looking for an exact match.
		 */
		cmp = mp->m_dirnameops->compname(args, dep->name, dep->namelen);
		if (cmp != XFS_CMP_DIFFERENT && cmp != args->cmpresult) {
			args->cmpresult = cmp;
			*bpp = bp;
			*entno = mid;
			if (cmp == XFS_CMP_EXACT)
				return 0;
		}
	} while (++mid < be32_to_cpu(btp->count) &&
			be32_to_cpu(blp[mid].hashval) == hash);

	ASSERT(args->op_flags & XFS_DA_OP_OKNOENT);
	/*
	 * Here, we can only be doing a lookup (not a rename or replace).
	 * If a case-insensitive match was found earlier, return success.
	 */
	if (args->cmpresult == XFS_CMP_CASE)
		return 0;
	/*
	 * No match, release the buffer and return ENOENT.
	 */
	xfs_trans_brelse(tp, bp);
	return -ENOENT;
}

/*
 * Remove an entry from a block format directory.
 * If that makes the block small enough to fit in shortform, transform it.
 *
 * Returns the lookup error if the entry cannot be found, 0 when the
 * entry was removed and the directory stays in block form, or the result
 * of xfs_dir2_block_to_sf() when the conversion is attempted.
 */
int						/* error */
xfs_dir2_block_removename(
	xfs_da_args_t		*args)		/* directory operation args */
{
	struct xfs_buf		*bp;		/* block buffer */
	xfs_dir2_data_hdr_t	*hdr;		/* block header */
	xfs_dir2_block_tail_t	*btp;		/* block tail */
	xfs_dir2_leaf_entry_t	*blp;		/* block leaf pointer */
	xfs_dir2_data_entry_t	*dep;		/* block data entry */
	xfs_dir2_sf_hdr_t	sfh;		/* shortform header */
	xfs_inode_t		*dp;		/* incore inode */
	xfs_trans_t		*tp;		/* transaction pointer */
	int			ent;		/* block leaf entry index */
	int			error;		/* error return value */
	int			needlog = 0;	/* need to log block header */
	int			needscan = 0;	/* need to fixup bestfree */
	int			size;		/* shortform size */

	trace_xfs_dir2_block_removename(args);

	/*
	 * Look up the entry in the block.  Gets the buffer and entry index.
	 * It will always be there, the vnodeops level does a lookup first.
	 */
	error = xfs_dir2_block_lookup_int(args, &bp, &ent);
	if (error)
		return error;

	dp = args->dp;
	tp = args->trans;
	hdr = bp->b_addr;
	btp = xfs_dir2_block_tail_p(args->geo, hdr);
	blp = xfs_dir2_block_leaf_p(btp);

	/* Locate the data entry through its leaf entry and free its space. */
	dep = (xfs_dir2_data_entry_t *)((char *)hdr +
			xfs_dir2_dataptr_to_off(args->geo,
						be32_to_cpu(blp[ent].address)));
	xfs_dir2_data_make_free(args, bp,
		(xfs_dir2_data_aoff_t)((char *)dep - (char *)hdr),
		dp->d_ops->data_entsize(dep->namelen), &needlog, &needscan);

	/* One more stale leaf entry: fix up and log the block tail. */
	be32_add_cpu(&btp->stale, 1);
	xfs_dir2_block_log_tail(tp, bp);

	/* Remove the leaf entry by marking it stale, and log it. */
	blp[ent].address = cpu_to_be32(XFS_DIR2_NULL_DATAPTR);
	xfs_dir2_block_log_leaf(tp, bp, ent, ent);

	/* Fix up bestfree, log the header if necessary. */
	if (needscan)
		xfs_dir2_data_freescan(dp, hdr, &needlog);
	if (needlog)
		xfs_dir2_data_log_header(args, bp);
	xfs_dir3_data_check(dp, bp);

	/*
	 * Convert to shortform only when the shortform size fits in the
	 * inode's data fork; otherwise we are done.
	 */
	size = xfs_dir2_block_sfsize(dp, hdr, &sfh);
	if (size <= XFS_IFORK_DSIZE(dp))
		return xfs_dir2_block_to_sf(args, bp, size, &sfh);
	return 0;
}

/*
 * Replace an entry in a V2 block directory: the named entry keeps its
 * name but gets args->inumber and args->filetype.
 *
 * Returns the lookup error if the entry cannot be found, else 0.
 */
int						/* error */
xfs_dir2_block_replace(
	xfs_da_args_t		*args)		/* directory operation args */
{
	struct xfs_buf		*bp;		/* block buffer */
	xfs_dir2_data_hdr_t	*hdr;		/* block header */
	xfs_dir2_block_tail_t	*btp;		/* block tail */
	xfs_dir2_leaf_entry_t	*blp;		/* block leaf entries */
	xfs_dir2_data_entry_t	*dep;		/* block data entry */
	xfs_inode_t		*dp;		/* incore inode */
	int			ent;		/* leaf entry index */
	int			error;		/* error return value */

	trace_xfs_dir2_block_replace(args);

	/*
	 * Lookup the entry in the directory.  Get buffer and entry index.
	 * This will always succeed since the caller has already done a lookup.
	 */
	error = xfs_dir2_block_lookup_int(args, &bp, &ent);
	if (error)
		return error;

	dp = args->dp;
	hdr = bp->b_addr;
	btp = xfs_dir2_block_tail_p(args->geo, hdr);
	blp = xfs_dir2_block_leaf_p(btp);

	/* Point to the data entry we need to change. */
	dep = (xfs_dir2_data_entry_t *)((char *)hdr +
			xfs_dir2_dataptr_to_off(args->geo,
						be32_to_cpu(blp[ent].address)));
	ASSERT(be64_to_cpu(dep->inumber) != args->inumber);

	/* Store the new inode number and file type, then log the entry. */
	dep->inumber = cpu_to_be64(args->inumber);
	dp->d_ops->data_put_ftype(dep, args->filetype);
	xfs_dir2_data_log_entry(args, bp, dep);
	xfs_dir3_data_check(dp, bp);
	return 0;
}

/*
 * Qsort comparison routine for the block leaf entries.
 */
static int					/* sort order */
xfs_dir2_block_sort(
	const void			*a,	/* first leaf entry */
	const void			*b)	/* second leaf entry */
{
	const xfs_dir2_leaf_entry_t	*la;	/* first leaf entry */
	const xfs_dir2_leaf_entry_t	*lb;	/* second leaf entry */

	la = a;
	lb = b;
894 895
	return be32_to_cpu(la->hashval) < be32_to_cpu(lb->hashval) ? -1 :
		(be32_to_cpu(la->hashval) > be32_to_cpu(lb->hashval) ? 1 : 0);
L
Linus Torvalds 已提交
896 897 898 899 900 901 902 903
}

/*
 * Convert a V2 leaf directory to a V2 block directory if possible.
 *
 * @args: operation arguments (supplies the inode, transaction and geometry)
 * @lbp:  leaf buffer
 * @dbp:  data buffer; may be NULL, in which case the data block at
 *        args->geo->datablk is read here
 *
 * Returns 0 both when the conversion was carried out and when it was not
 * possible (a trailing data block is not empty, or the last entry of the
 * data block is not a free region large enough to hold the leaf entries
 * and block tail).  A non-zero value is an error passed back from one of
 * the helpers called along the way.  After a successful conversion the
 * block is further converted to shortform when it fits in the inode fork.
 */
int						/* error */
xfs_dir2_leaf_to_block(
	xfs_da_args_t		*args,		/* operation arguments */
	struct xfs_buf		*lbp,		/* leaf buffer */
	struct xfs_buf		*dbp)		/* data buffer */
{
	__be16			*bestsp;	/* leaf bests table */
	xfs_dir2_data_hdr_t	*hdr;		/* block header */
	xfs_dir2_block_tail_t	*btp;		/* block tail */
	xfs_inode_t		*dp;		/* incore directory inode */
	xfs_dir2_data_unused_t	*dup;		/* unused data entry */
	int			error;		/* error return value */
	int			from;		/* leaf from index */
	xfs_dir2_leaf_t		*leaf;		/* leaf structure */
	xfs_dir2_leaf_entry_t	*lep;		/* leaf entry */
	xfs_dir2_leaf_tail_t	*ltp;		/* leaf tail structure */
	xfs_mount_t		*mp;		/* file system mount point */
	int			needlog;	/* need to log data header */
	int			needscan;	/* need to scan for bestfree */
	xfs_dir2_sf_hdr_t	sfh;		/* shortform header */
	int			size;		/* bytes used */
	__be16			*tagp;		/* end of entry (tag) */
	int			to;		/* block/leaf to index */
	xfs_trans_t		*tp;		/* transaction pointer */
	struct xfs_dir2_leaf_entry *ents;	/* leaf entry array */
	struct xfs_dir3_icleaf_hdr leafhdr;	/* incore leaf header */

	trace_xfs_dir2_leaf_to_block(args);

	dp = args->dp;
	tp = args->trans;
	mp = dp->i_mount;
	leaf = lbp->b_addr;
	dp->d_ops->leaf_hdr_from_disk(&leafhdr, leaf);
	ents = dp->d_ops->leaf_ents_p(leaf);
	ltp = xfs_dir2_leaf_tail_p(args->geo, leaf);

	ASSERT(leafhdr.magic == XFS_DIR2_LEAF1_MAGIC ||
	       leafhdr.magic == XFS_DIR3_LEAF1_MAGIC);
	/*
	 * If there are data blocks other than the first one, take this
	 * opportunity to remove trailing empty data blocks that may have
	 * been left behind during no-space-reservation operations.
	 * These will show up in the leaf bests table.
	 */
	while (dp->i_d.di_size > args->geo->blksize) {
		int hdrsz;

		hdrsz = dp->d_ops->data_entry_offset;
		bestsp = xfs_dir2_leaf_bests_p(ltp);
		/*
		 * The last block is only trimmed when its best-free value
		 * equals the block size minus the data header; otherwise
		 * there is more than one block in use and we give up.
		 */
		if (be16_to_cpu(bestsp[be32_to_cpu(ltp->bestcount) - 1]) !=
					    args->geo->blksize - hdrsz)
			return 0;

		error = xfs_dir2_leaf_trim_data(args, lbp,
				(xfs_dir2_db_t)(be32_to_cpu(ltp->bestcount) - 1));
		if (error)
			return error;
	}
	/*
	 * Read the data block if we don't already have it, give up if it fails.
	 */
	if (!dbp) {
		error = xfs_dir3_data_read(tp, dp, args->geo->datablk, -1, &dbp);
		if (error)
			return error;
	}
	hdr = dbp->b_addr;
	ASSERT(hdr->magic == cpu_to_be32(XFS_DIR2_DATA_MAGIC) ||
	       hdr->magic == cpu_to_be32(XFS_DIR3_DATA_MAGIC));

	/*
	 * Size of the "leaf" area in the block: the block tail plus one
	 * leaf entry for every non-stale entry in the leaf.
	 */
	size = (uint)sizeof(xfs_dir2_block_tail_t) +
	       (uint)sizeof(*lep) * (leafhdr.count - leafhdr.stale);
	/*
	 * Look at the last data entry.  The final __be16 of the block is
	 * read as the offset of that entry from the block start.
	 */
	tagp = (__be16 *)((char *)hdr + args->geo->blksize) - 1;
	dup = (xfs_dir2_data_unused_t *)((char *)hdr + be16_to_cpu(*tagp));
	/*
	 * If it's not free or is too short we can't do it.
	 */
	if (be16_to_cpu(dup->freetag) != XFS_DIR2_DATA_FREE_TAG ||
	    be16_to_cpu(dup->length) < size)
		return 0;

	/*
	 * Start converting it to block form.
	 */
	xfs_dir3_block_init(mp, tp, dbp, dp);

	needlog = 1;
	needscan = 0;
	/*
	 * Use up the space at the end of the block (blp/btp).
	 */
	xfs_dir2_data_use_free(args, dbp, dup, args->geo->blksize - size, size,
		&needlog, &needscan);
	/*
	 * Initialize the block tail.
	 */
	btp = xfs_dir2_block_tail_p(args->geo, hdr);
	btp->count = cpu_to_be32(leafhdr.count - leafhdr.stale);
	btp->stale = 0;
	xfs_dir2_block_log_tail(tp, dbp);
	/*
	 * Initialize the block leaf area.  We compact out stale entries,
	 * i.e. those whose address is XFS_DIR2_NULL_DATAPTR.
	 */
	lep = xfs_dir2_block_leaf_p(btp);
	for (from = to = 0; from < leafhdr.count; from++) {
		if (ents[from].address == cpu_to_be32(XFS_DIR2_NULL_DATAPTR))
			continue;
		lep[to++] = ents[from];
	}
	ASSERT(to == be32_to_cpu(btp->count));
	xfs_dir2_block_log_leaf(tp, dbp, 0, be32_to_cpu(btp->count) - 1);
	/*
	 * Scan the bestfree if we need it and log the data block header.
	 */
	if (needscan)
		xfs_dir2_data_freescan(dp, hdr, &needlog);
	if (needlog)
		xfs_dir2_data_log_header(args, dbp);
	/*
	 * Pitch the old leaf block.
	 */
	error = xfs_da_shrink_inode(args, args->geo->leafblk, lbp);
	if (error)
		return error;

	/*
	 * Now see if the resulting block can be shrunken to shortform.
	 */
	size = xfs_dir2_block_sfsize(dp, hdr, &sfh);
	if (size > XFS_IFORK_DSIZE(dp))
		return 0;

	return xfs_dir2_block_to_sf(args, dbp, size, &sfh);
}

/*
 * Convert the shortform directory to block form.
 *
 * The inline (shortform) directory data is copied to a temporary buffer,
 * the inode's inline data is released, directory block 0 is added and
 * initialised, and then "." and ".." plus every shortform entry are
 * written into the new block at the offsets recorded in the shortform
 * entries.  Gaps between entries become unused (free) regions.  Finally
 * the leaf entries at the end of the block are sorted by hash value and
 * the leaf area and tail are logged.
 *
 * Returns 0 on success, -EIO when the inode size is smaller than the
 * offset of the parent field in the shortform header, or the error
 * returned by xfs_dir2_grow_inode() / xfs_dir3_data_init().
 */
int						/* error */
xfs_dir2_sf_to_block(
	xfs_da_args_t		*args)		/* operation arguments */
{
	xfs_dir2_db_t		blkno;		/* dir-relative block # (0) */
	xfs_dir2_data_hdr_t	*hdr;		/* block header */
	xfs_dir2_leaf_entry_t	*blp;		/* block leaf entries */
	struct xfs_buf		*bp;		/* block buffer */
	xfs_dir2_block_tail_t	*btp;		/* block tail pointer */
	xfs_dir2_data_entry_t	*dep;		/* data entry pointer */
	xfs_inode_t		*dp;		/* incore directory inode */
	int			dummy;		/* trash */
	xfs_dir2_data_unused_t	*dup;		/* unused entry pointer */
	int			endoffset;	/* end of data objects */
	int			error;		/* error return value */
	int			i;		/* index */
	xfs_mount_t		*mp;		/* filesystem mount point */
	int			needlog;	/* need to log block header */
	int			needscan;	/* need to scan block freespc */
	int			newoffset;	/* offset from current entry */
	int			offset;		/* target block offset */
	xfs_dir2_sf_entry_t	*sfep;		/* sf entry pointer */
	xfs_dir2_sf_hdr_t	*oldsfp;	/* old shortform header  */
	xfs_dir2_sf_hdr_t	*sfp;		/* shortform header  */
	__be16			*tagp;		/* end of data entry */
	xfs_trans_t		*tp;		/* transaction pointer */
	struct xfs_name		name;		/* name passed to hashname */
	struct xfs_ifork	*ifp;		/* data fork of the inode */

	trace_xfs_dir2_sf_to_block(args);

	dp = args->dp;
	tp = args->trans;
	mp = dp->i_mount;
	ifp = XFS_IFORK_PTR(dp, XFS_DATA_FORK);
	ASSERT(ifp->if_flags & XFS_IFINLINE);
	/*
	 * Bomb out if the shortform directory is way too short.
	 */
	if (dp->i_d.di_size < offsetof(xfs_dir2_sf_hdr_t, parent)) {
		ASSERT(XFS_FORCED_SHUTDOWN(mp));
		return -EIO;
	}

	oldsfp = (xfs_dir2_sf_hdr_t *)ifp->if_u1.if_data;

	ASSERT(ifp->if_bytes == dp->i_d.di_size);
	ASSERT(ifp->if_u1.if_data != NULL);
	ASSERT(dp->i_d.di_size >= xfs_dir2_sf_hdr_size(oldsfp->i8count));
	ASSERT(dp->i_d.di_nextents == 0);

	/*
	 * Copy the directory into a temporary buffer.
	 * Then pitch the incore inode data so we can make extents.
	 */
	sfp = kmem_alloc(ifp->if_bytes, KM_SLEEP);
	memcpy(sfp, oldsfp, ifp->if_bytes);

	xfs_idata_realloc(dp, -ifp->if_bytes, XFS_DATA_FORK);
	xfs_bmap_local_to_extents_empty(dp, XFS_DATA_FORK);
	dp->i_d.di_size = 0;

	/*
	 * Add block 0 to the inode.  The temporary copy must be freed on
	 * every error return from here on.
	 */
	error = xfs_dir2_grow_inode(args, XFS_DIR2_DATA_SPACE, &blkno);
	if (error) {
		kmem_free(sfp);
		return error;
	}
	/*
	 * Initialize the data block, then convert it to block format.
	 */
	error = xfs_dir3_data_init(args, blkno, &bp);
	if (error) {
		kmem_free(sfp);
		return error;
	}
	xfs_dir3_block_init(mp, tp, bp, dp);
	hdr = bp->b_addr;

	/*
	 * Compute size of block "tail" area: the tail structure plus one
	 * leaf entry per shortform entry and two more for "." and "..".
	 */
	i = (uint)sizeof(*btp) +
	    (sfp->count + 2) * (uint)sizeof(xfs_dir2_leaf_entry_t);
	/*
	 * The whole thing is initialized to free by the init routine.
	 * Say we're using the leaf and tail area.
	 */
	dup = dp->d_ops->data_unused_p(hdr);
	needlog = needscan = 0;
	xfs_dir2_data_use_free(args, bp, dup, args->geo->blksize - i,
			       i, &needlog, &needscan);
	ASSERT(needscan == 0);
	/*
	 * Fill in the tail.
	 */
	btp = xfs_dir2_block_tail_p(args->geo, hdr);
	btp->count = cpu_to_be32(sfp->count + 2);	/* ., .. */
	btp->stale = 0;
	blp = xfs_dir2_block_leaf_p(btp);
	/* Data entries may only occupy the space before the leaf array. */
	endoffset = (uint)((char *)blp - (char *)hdr);
	/*
	 * Remove the freespace, we'll manage it.
	 */
	xfs_dir2_data_use_free(args, bp, dup,
		(xfs_dir2_data_aoff_t)((char *)dup - (char *)hdr),
		be16_to_cpu(dup->length), &needlog, &needscan);
	/*
	 * Create entry for .
	 */
	dep = dp->d_ops->data_dot_entry_p(hdr);
	dep->inumber = cpu_to_be64(dp->i_ino);
	dep->namelen = 1;
	dep->name[0] = '.';
	dp->d_ops->data_put_ftype(dep, XFS_DIR3_FT_DIR);
	/* The tag of an entry records the entry's offset in the block. */
	tagp = dp->d_ops->data_entry_tag_p(dep);
	*tagp = cpu_to_be16((char *)dep - (char *)hdr);
	xfs_dir2_data_log_entry(args, bp, dep);
	blp[0].hashval = cpu_to_be32(xfs_dir_hash_dot);
	blp[0].address = cpu_to_be32(xfs_dir2_byte_to_dataptr(
				(char *)dep - (char *)hdr));
	/*
	 * Create entry for ..
	 */
	dep = dp->d_ops->data_dotdot_entry_p(hdr);
	dep->inumber = cpu_to_be64(dp->d_ops->sf_get_parent_ino(sfp));
	dep->namelen = 2;
	dep->name[0] = dep->name[1] = '.';
	dp->d_ops->data_put_ftype(dep, XFS_DIR3_FT_DIR);
	tagp = dp->d_ops->data_entry_tag_p(dep);
	*tagp = cpu_to_be16((char *)dep - (char *)hdr);
	xfs_dir2_data_log_entry(args, bp, dep);
	blp[1].hashval = cpu_to_be32(xfs_dir_hash_dotdot);
	blp[1].address = cpu_to_be32(xfs_dir2_byte_to_dataptr(
				(char *)dep - (char *)hdr));
	offset = dp->d_ops->data_first_offset;
	/*
	 * Loop over existing entries, stuff them in.
	 */
	i = 0;
	if (!sfp->count)
		sfep = NULL;
	else
		sfep = xfs_dir2_sf_firstentry(sfp);
	/*
	 * Need to preserve the existing offset values in the sf directory.
	 * Insert holes (unused entries) where necessary.
	 */
	while (offset < endoffset) {
		/*
		 * sfep is null when we reach the end of the list.
		 */
		if (sfep == NULL)
			newoffset = endoffset;
		else
			newoffset = xfs_dir2_sf_get_offset(sfep);
		/*
		 * There should be a hole here, make one.  The hole spans
		 * from the current offset up to the next entry (or up to
		 * the leaf area once the entries are exhausted).
		 */
		if (offset < newoffset) {
			dup = (xfs_dir2_data_unused_t *)((char *)hdr + offset);
			dup->freetag = cpu_to_be16(XFS_DIR2_DATA_FREE_TAG);
			dup->length = cpu_to_be16(newoffset - offset);
			*xfs_dir2_data_unused_tag_p(dup) = cpu_to_be16(
				((char *)dup - (char *)hdr));
			xfs_dir2_data_log_unused(args, bp, dup);
			xfs_dir2_data_freeinsert(hdr,
						 dp->d_ops->data_bestfree_p(hdr),
						 dup, &dummy);
			offset += be16_to_cpu(dup->length);
			continue;
		}
		/*
		 * Copy a real entry.
		 */
		dep = (xfs_dir2_data_entry_t *)((char *)hdr + newoffset);
		dep->inumber = cpu_to_be64(dp->d_ops->sf_get_ino(sfp, sfep));
		dep->namelen = sfep->namelen;
		dp->d_ops->data_put_ftype(dep, dp->d_ops->sf_get_ftype(sfep));
		memcpy(dep->name, sfep->name, dep->namelen);
		tagp = dp->d_ops->data_entry_tag_p(dep);
		*tagp = cpu_to_be16((char *)dep - (char *)hdr);
		xfs_dir2_data_log_entry(args, bp, dep);
		/* Leaf slots 0 and 1 are taken by "." and "..". */
		name.name = sfep->name;
		name.len = sfep->namelen;
		blp[2 + i].hashval = cpu_to_be32(mp->m_dirnameops->
							hashname(&name));
		blp[2 + i].address = cpu_to_be32(xfs_dir2_byte_to_dataptr(
						 (char *)dep - (char *)hdr));
		/* Continue right after this entry's tag. */
		offset = (int)((char *)(tagp + 1) - (char *)hdr);
		if (++i == sfp->count)
			sfep = NULL;
		else
			sfep = dp->d_ops->sf_nextentry(sfp, sfep);
	}
	/* Done with the temporary buffer */
	kmem_free(sfp);
	/*
	 * Sort the leaf entries by hash value.
	 */
	xfs_sort(blp, be32_to_cpu(btp->count), sizeof(*blp), xfs_dir2_block_sort);
	/*
	 * Log the leaf entry area and tail.
	 * Already logged the header in data_init, ignore needlog.
	 */
	ASSERT(needscan == 0);
	xfs_dir2_block_log_leaf(tp, bp, 0, be32_to_cpu(btp->count) - 1);
	xfs_dir2_block_log_tail(tp, bp);
	xfs_dir3_data_check(dp, bp);
	return 0;
}