extent-tree.c 26.0 KB
Newer Older
1
#include <linux/module.h>
2 3 4
#include "ctree.h"
#include "disk-io.h"
#include "print-tree.h"
5
#include "transaction.h"
6

7 8 9 10 11
static int find_free_extent(struct btrfs_trans_handle *trans, struct btrfs_root
			    *orig_root, u64 num_blocks, u64 search_start, u64
			    search_end, struct btrfs_key *ins);
static int finish_current_insert(struct btrfs_trans_handle *trans, struct
				 btrfs_root *extent_root);
C
Chris Mason 已提交
12 13
static int del_pending_extents(struct btrfs_trans_handle *trans, struct
			       btrfs_root *extent_root);
14

C
Chris Mason 已提交
15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71
static int find_search_start(struct btrfs_root *root, int data)
{
	struct btrfs_block_group_cache *cache[8];
	struct btrfs_fs_info *info = root->fs_info;
	u64 used;
	u64 last;
	int i;
	int ret;

	cache[0] = info->block_group_cache;
	if (!cache[0])
		goto find_new;
	used = btrfs_block_group_used(&cache[0]->item);
	if (used < (cache[0]->key.offset * 3 / 2))
		return 0;
find_new:
	last = 0;
	while(1) {
		ret = radix_tree_gang_lookup_tag(&info->block_group_radix,
						 (void **)cache,
						 last, ARRAY_SIZE(cache),
						 BTRFS_BLOCK_GROUP_DIRTY);
		if (!ret)
			break;
		for (i = 0; i < ret; i++) {
			used = btrfs_block_group_used(&cache[i]->item);
			if (used < (cache[i]->key.offset * 3 / 2)) {
				info->block_group_cache = cache[i];
				cache[i]->last_alloc = cache[i]->first_free;
				return 0;
			}
			last = cache[i]->key.objectid +
				cache[i]->key.offset - 1;
		}
	}
	last = 0;
	while(1) {
		ret = radix_tree_gang_lookup(&info->block_group_radix,
						 (void **)cache,
						 last, ARRAY_SIZE(cache));
		if (!ret)
			break;
		for (i = 0; i < ret; i++) {
			used = btrfs_block_group_used(&cache[i]->item);
			if (used < (cache[i]->key.offset * 3 / 2)) {
				info->block_group_cache = cache[i];
				cache[i]->last_alloc = cache[i]->first_free;
				return 0;
			}
			last = cache[i]->key.objectid +
				cache[i]->key.offset - 1;
		}
	}
	info->block_group_cache = NULL;
	return 0;
}

C
Chris Mason 已提交
72 73 74
int btrfs_inc_extent_ref(struct btrfs_trans_handle *trans,
				struct btrfs_root *root,
				u64 blocknr, u64 num_blocks)
C
Chris Mason 已提交
75
{
76
	struct btrfs_path *path;
C
Chris Mason 已提交
77
	int ret;
C
Chris Mason 已提交
78
	struct btrfs_key key;
C
Chris Mason 已提交
79 80
	struct btrfs_leaf *l;
	struct btrfs_extent_item *item;
C
Chris Mason 已提交
81
	struct btrfs_key ins;
C
Chris Mason 已提交
82
	u32 refs;
C
Chris Mason 已提交
83

84 85
	find_free_extent(trans, root->fs_info->extent_root, 0, 0, (u64)-1,
			 &ins);
86 87 88
	path = btrfs_alloc_path();
	BUG_ON(!path);
	btrfs_init_path(path);
C
Chris Mason 已提交
89 90
	key.objectid = blocknr;
	key.flags = 0;
91
	btrfs_set_key_type(&key, BTRFS_EXTENT_ITEM_KEY);
92
	key.offset = num_blocks;
93
	ret = btrfs_search_slot(trans, root->fs_info->extent_root, &key, path,
94
				0, 1);
95 96
	if (ret != 0) {
printk("can't find block %Lu %Lu\n", blocknr, num_blocks);
97
		BUG();
98
	}
C
Chris Mason 已提交
99
	BUG_ON(ret != 0);
100 101
	l = btrfs_buffer_leaf(path->nodes[0]);
	item = btrfs_item_ptr(l, path->slots[0], struct btrfs_extent_item);
C
Chris Mason 已提交
102 103
	refs = btrfs_extent_refs(item);
	btrfs_set_extent_refs(item, refs + 1);
104
	btrfs_mark_buffer_dirty(path->nodes[0]);
105

106 107
	btrfs_release_path(root->fs_info->extent_root, path);
	btrfs_free_path(path);
108
	finish_current_insert(trans, root->fs_info->extent_root);
C
Chris Mason 已提交
109
	del_pending_extents(trans, root->fs_info->extent_root);
C
Chris Mason 已提交
110 111 112
	return 0;
}

C
Chris Mason 已提交
113 114 115
static int lookup_extent_ref(struct btrfs_trans_handle *trans,
			     struct btrfs_root *root, u64 blocknr,
			     u64 num_blocks, u32 *refs)
116
{
117
	struct btrfs_path *path;
118
	int ret;
C
Chris Mason 已提交
119
	struct btrfs_key key;
C
Chris Mason 已提交
120 121
	struct btrfs_leaf *l;
	struct btrfs_extent_item *item;
122 123 124

	path = btrfs_alloc_path();
	btrfs_init_path(path);
125
	key.objectid = blocknr;
126
	key.offset = num_blocks;
127 128
	key.flags = 0;
	btrfs_set_key_type(&key, BTRFS_EXTENT_ITEM_KEY);
129
	ret = btrfs_search_slot(trans, root->fs_info->extent_root, &key, path,
130
				0, 0);
131 132
	if (ret != 0)
		BUG();
133 134
	l = btrfs_buffer_leaf(path->nodes[0]);
	item = btrfs_item_ptr(l, path->slots[0], struct btrfs_extent_item);
C
Chris Mason 已提交
135
	*refs = btrfs_extent_refs(item);
136 137
	btrfs_release_path(root->fs_info->extent_root, path);
	btrfs_free_path(path);
138 139 140
	return 0;
}

C
Chris Mason 已提交
141 142 143
int btrfs_inc_root_ref(struct btrfs_trans_handle *trans,
		       struct btrfs_root *root)
{
C
Chris Mason 已提交
144
	return btrfs_inc_extent_ref(trans, root, bh_blocknr(root->node), 1);
C
Chris Mason 已提交
145 146
}

147
int btrfs_inc_ref(struct btrfs_trans_handle *trans, struct btrfs_root *root,
C
Chris Mason 已提交
148
		  struct buffer_head *buf)
C
Chris Mason 已提交
149 150
{
	u64 blocknr;
C
Chris Mason 已提交
151
	struct btrfs_node *buf_node;
152 153 154
	struct btrfs_leaf *buf_leaf;
	struct btrfs_disk_key *key;
	struct btrfs_file_extent_item *fi;
C
Chris Mason 已提交
155
	int i;
156 157
	int leaf;
	int ret;
158

159
	if (!root->ref_cows)
160
		return 0;
C
Chris Mason 已提交
161
	buf_node = btrfs_buffer_node(buf);
162 163
	leaf = btrfs_is_leaf(buf_node);
	buf_leaf = btrfs_buffer_leaf(buf);
C
Chris Mason 已提交
164
	for (i = 0; i < btrfs_header_nritems(&buf_node->header); i++) {
165 166 167 168 169 170
		if (leaf) {
			key = &buf_leaf->items[i].key;
			if (btrfs_disk_key_type(key) != BTRFS_EXTENT_DATA_KEY)
				continue;
			fi = btrfs_item_ptr(buf_leaf, i,
					    struct btrfs_file_extent_item);
171 172 173
			if (btrfs_file_extent_type(fi) ==
			    BTRFS_FILE_EXTENT_INLINE)
				continue;
C
Chris Mason 已提交
174
			ret = btrfs_inc_extent_ref(trans, root,
175 176 177 178 179
				    btrfs_file_extent_disk_blocknr(fi),
				    btrfs_file_extent_disk_num_blocks(fi));
			BUG_ON(ret);
		} else {
			blocknr = btrfs_node_blockptr(buf_node, i);
C
Chris Mason 已提交
180
			ret = btrfs_inc_extent_ref(trans, root, blocknr, 1);
181 182
			BUG_ON(ret);
		}
C
Chris Mason 已提交
183 184 185 186
	}
	return 0;
}

C
Chris Mason 已提交
187 188 189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 223 224 225 226 227 228 229 230 231 232 233 234 235 236 237 238 239 240 241 242 243 244 245 246 247 248 249 250 251 252 253 254 255 256 257 258 259 260 261 262 263 264
static int write_one_cache_group(struct btrfs_trans_handle *trans,
				 struct btrfs_root *root,
				 struct btrfs_path *path,
				 struct btrfs_block_group_cache *cache)
{
	int ret;
	int pending_ret;
	struct btrfs_root *extent_root = root->fs_info->extent_root;
	struct btrfs_block_group_item *bi;
	struct btrfs_key ins;

	find_free_extent(trans, extent_root, 0, 0, (u64)-1, &ins);
	ret = btrfs_search_slot(trans, extent_root, &cache->key, path, 0, 1);
	BUG_ON(ret);
	bi = btrfs_item_ptr(btrfs_buffer_leaf(path->nodes[0]), path->slots[0],
			    struct btrfs_block_group_item);
	memcpy(bi, &cache->item, sizeof(*bi));
	mark_buffer_dirty(path->nodes[0]);
	btrfs_release_path(extent_root, path);

	finish_current_insert(trans, extent_root);
	pending_ret = del_pending_extents(trans, extent_root);
	if (ret)
		return ret;
	if (pending_ret)
		return pending_ret;
	return 0;

}

int btrfs_write_dirty_block_groups(struct btrfs_trans_handle *trans,
				    struct btrfs_root *root)
{
	struct btrfs_block_group_cache *cache[8];
	int ret;
	int err = 0;
	int werr = 0;
	struct radix_tree_root *radix = &root->fs_info->block_group_radix;
	int i;
	struct btrfs_path *path;

	path = btrfs_alloc_path();
	if (!path)
		return -ENOMEM;

	while(1) {
		ret = radix_tree_gang_lookup_tag(radix, (void **)cache,
						 0, ARRAY_SIZE(cache),
						 BTRFS_BLOCK_GROUP_DIRTY);
		if (!ret)
			break;
		for (i = 0; i < ret; i++) {
			radix_tree_tag_clear(radix, cache[i]->key.objectid +
					     cache[i]->key.offset - 1,
					     BTRFS_BLOCK_GROUP_DIRTY);
			err = write_one_cache_group(trans, root,
						    path, cache[i]);
			if (err)
				werr = err;
		}
	}
	btrfs_free_path(path);
	return werr;
}

static int update_block_group(struct btrfs_trans_handle *trans,
			      struct btrfs_root *root,
			      u64 blocknr, u64 num, int alloc)
{
	struct btrfs_block_group_cache *cache;
	struct btrfs_fs_info *info = root->fs_info;
	u64 total = num;
	u64 old_val;
	u64 block_in_group;
	int ret;
	while(total) {
		ret = radix_tree_gang_lookup(&info->block_group_radix,
					     (void **)&cache, blocknr, 1);
C
Chris Mason 已提交
265 266 267
		if (!ret) {
			printk(KERN_CRIT "blocknr %Lu lookup failed\n",
			       blocknr);
C
Chris Mason 已提交
268
			return -1;
C
Chris Mason 已提交
269
		}
C
Chris Mason 已提交
270 271 272 273 274 275 276 277 278 279
		block_in_group = blocknr - cache->key.objectid;
		WARN_ON(block_in_group > cache->key.offset);
		radix_tree_tag_set(&info->block_group_radix,
				   cache->key.objectid + cache->key.offset - 1,
				   BTRFS_BLOCK_GROUP_DIRTY);

		old_val = btrfs_block_group_used(&cache->item);
		num = min(total, cache->key.offset - block_in_group);
		total -= num;
		blocknr += num;
C
Chris Mason 已提交
280
		if (alloc) {
C
Chris Mason 已提交
281
			old_val += num;
C
Chris Mason 已提交
282 283 284
			if (blocknr > cache->last_alloc)
				cache->last_alloc = blocknr;
		} else {
C
Chris Mason 已提交
285
			old_val -= num;
C
Chris Mason 已提交
286 287 288
			if (blocknr < cache->first_free)
				cache->first_free = blocknr;
		}
C
Chris Mason 已提交
289 290 291 292 293
		btrfs_set_block_group_used(&cache->item, old_val);
	}
	return 0;
}

294 295
int btrfs_finish_extent_commit(struct btrfs_trans_handle *trans, struct
			       btrfs_root *root)
296
{
C
Chris Mason 已提交
297
	unsigned long gang[8];
298
	u64 first = 0;
299 300
	int ret;
	int i;
C
Chris Mason 已提交
301
	struct radix_tree_root *pinned_radix = &root->fs_info->pinned_radix;
302 303

	while(1) {
C
Chris Mason 已提交
304 305
		ret = find_first_radix_bit(pinned_radix, gang,
					   ARRAY_SIZE(gang));
306 307
		if (!ret)
			break;
308
		if (!first)
C
Chris Mason 已提交
309
			first = gang[0];
310
		for (i = 0; i < ret; i++) {
C
Chris Mason 已提交
311
			clear_radix_bit(pinned_radix, gang[i]);
312
		}
313
	}
C
Chris Mason 已提交
314
	root->fs_info->block_group_cache = NULL;
315 316 317
	return 0;
}

318 319
static int finish_current_insert(struct btrfs_trans_handle *trans, struct
				 btrfs_root *extent_root)
C
Chris Mason 已提交
320
{
C
Chris Mason 已提交
321
	struct btrfs_key ins;
C
Chris Mason 已提交
322
	struct btrfs_extent_item extent_item;
C
Chris Mason 已提交
323 324
	int i;
	int ret;
325 326
	u64 super_blocks_used;
	struct btrfs_fs_info *info = extent_root->fs_info;
C
Chris Mason 已提交
327

C
Chris Mason 已提交
328
	btrfs_set_extent_refs(&extent_item, 1);
C
Chris Mason 已提交
329 330
	ins.offset = 1;
	ins.flags = 0;
331
	btrfs_set_key_type(&ins, BTRFS_EXTENT_ITEM_KEY);
332
	btrfs_set_extent_owner(&extent_item, extent_root->root_key.objectid);
C
Chris Mason 已提交
333

334 335
	for (i = 0; i < extent_root->fs_info->extent_tree_insert_nr; i++) {
		ins.objectid = extent_root->fs_info->extent_tree_insert[i];
336 337 338
		super_blocks_used = btrfs_super_blocks_used(info->disk_super);
		btrfs_set_super_blocks_used(info->disk_super,
					    super_blocks_used + 1);
339 340
		ret = btrfs_insert_item(trans, extent_root, &ins, &extent_item,
					sizeof(extent_item));
C
Chris Mason 已提交
341 342
		BUG_ON(ret);
	}
343 344
	extent_root->fs_info->extent_tree_insert_nr = 0;
	extent_root->fs_info->extent_tree_prealloc_nr = 0;
C
Chris Mason 已提交
345 346 347
	return 0;
}

C
Chris Mason 已提交
348
static int pin_down_block(struct btrfs_root *root, u64 blocknr, int pending)
C
Chris Mason 已提交
349 350
{
	int err;
C
Chris Mason 已提交
351
	struct btrfs_header *header;
C
Chris Mason 已提交
352 353
	struct buffer_head *bh;

C
Chris Mason 已提交
354
	if (!pending) {
355
		bh = btrfs_find_tree_block(root, blocknr);
C
Chris Mason 已提交
356 357 358 359 360 361 362 363 364 365
		if (bh) {
			if (buffer_uptodate(bh)) {
				u64 transid =
				    root->fs_info->running_transaction->transid;
				header = btrfs_buffer_header(bh);
				if (btrfs_header_generation(header) ==
				    transid) {
					btrfs_block_release(root, bh);
					return 0;
				}
C
Chris Mason 已提交
366
			}
C
Chris Mason 已提交
367
			btrfs_block_release(root, bh);
C
Chris Mason 已提交
368 369
		}
		err = set_radix_bit(&root->fs_info->pinned_radix, blocknr);
C
Chris Mason 已提交
370 371 372
	} else {
		err = set_radix_bit(&root->fs_info->pending_del_radix, blocknr);
	}
C
Chris Mason 已提交
373
	BUG_ON(err);
C
Chris Mason 已提交
374 375 376
	return 0;
}

377
/*
378
 * remove an extent from the root, returns 0 on success
379
 */
380
static int __free_extent(struct btrfs_trans_handle *trans, struct btrfs_root
C
Chris Mason 已提交
381
			 *root, u64 blocknr, u64 num_blocks, int pin)
382
{
383
	struct btrfs_path *path;
C
Chris Mason 已提交
384
	struct btrfs_key key;
385 386
	struct btrfs_fs_info *info = root->fs_info;
	struct btrfs_root *extent_root = info->extent_root;
387
	int ret;
C
Chris Mason 已提交
388
	struct btrfs_extent_item *ei;
C
Chris Mason 已提交
389
	struct btrfs_key ins;
C
Chris Mason 已提交
390
	u32 refs;
C
Chris Mason 已提交
391

392 393
	key.objectid = blocknr;
	key.flags = 0;
394
	btrfs_set_key_type(&key, BTRFS_EXTENT_ITEM_KEY);
395 396
	key.offset = num_blocks;

397
	find_free_extent(trans, root, 0, 0, (u64)-1, &ins);
398 399 400
	path = btrfs_alloc_path();
	BUG_ON(!path);
	btrfs_init_path(path);
401

402
	ret = btrfs_search_slot(trans, extent_root, &key, path, -1, 1);
403
	if (ret) {
404
		printk("failed to find %Lu\n", key.objectid);
C
Chris Mason 已提交
405
		btrfs_print_tree(extent_root, extent_root->node);
406
		printk("failed to find %Lu\n", key.objectid);
407 408
		BUG();
	}
409
	ei = btrfs_item_ptr(btrfs_buffer_leaf(path->nodes[0]), path->slots[0],
C
Chris Mason 已提交
410
			    struct btrfs_extent_item);
411
	BUG_ON(ei->refs == 0);
C
Chris Mason 已提交
412 413
	refs = btrfs_extent_refs(ei) - 1;
	btrfs_set_extent_refs(ei, refs);
414
	btrfs_mark_buffer_dirty(path->nodes[0]);
C
Chris Mason 已提交
415
	if (refs == 0) {
416
		u64 super_blocks_used;
C
Chris Mason 已提交
417 418

		if (pin) {
C
Chris Mason 已提交
419
			ret = pin_down_block(root, blocknr, 0);
C
Chris Mason 已提交
420 421 422
			BUG_ON(ret);
		}

423 424 425
		super_blocks_used = btrfs_super_blocks_used(info->disk_super);
		btrfs_set_super_blocks_used(info->disk_super,
					    super_blocks_used - num_blocks);
426
		ret = btrfs_del_item(trans, extent_root, path);
427 428
		if (ret)
			BUG();
C
Chris Mason 已提交
429 430
		ret = update_block_group(trans, root, blocknr, num_blocks, 0);
		BUG_ON(ret);
431
	}
432 433
	btrfs_release_path(extent_root, path);
	btrfs_free_path(path);
434
	finish_current_insert(trans, extent_root);
435 436 437 438 439 440 441
	return ret;
}

/*
 * find all the blocks marked as pending in the radix tree and remove
 * them from the extent map
 */
442 443
static int del_pending_extents(struct btrfs_trans_handle *trans, struct
			       btrfs_root *extent_root)
444 445
{
	int ret;
C
Chris Mason 已提交
446 447
	int wret;
	int err = 0;
C
Chris Mason 已提交
448
	unsigned long gang[4];
449
	int i;
C
Chris Mason 已提交
450 451 452 453 454
	struct radix_tree_root *pending_radix;
	struct radix_tree_root *pinned_radix;

	pending_radix = &extent_root->fs_info->pending_del_radix;
	pinned_radix = &extent_root->fs_info->pinned_radix;
455 456

	while(1) {
C
Chris Mason 已提交
457 458
		ret = find_first_radix_bit(pending_radix, gang,
					   ARRAY_SIZE(gang));
459 460 461
		if (!ret)
			break;
		for (i = 0; i < ret; i++) {
C
Chris Mason 已提交
462 463 464 465
			wret = set_radix_bit(pinned_radix, gang[i]);
			BUG_ON(wret);
			wret = clear_radix_bit(pending_radix, gang[i]);
			BUG_ON(wret);
466
			wret = __free_extent(trans, extent_root,
C
Chris Mason 已提交
467
					     gang[i], 1, 0);
C
Chris Mason 已提交
468 469
			if (wret)
				err = wret;
470 471
		}
	}
C
Chris Mason 已提交
472
	return err;
473 474 475 476 477
}

/*
 * remove an extent from the root, returns 0 on success
 */
478 479
int btrfs_free_extent(struct btrfs_trans_handle *trans, struct btrfs_root
		      *root, u64 blocknr, u64 num_blocks, int pin)
480
{
481
	struct btrfs_root *extent_root = root->fs_info->extent_root;
482 483
	int pending_ret;
	int ret;
484

485
	if (root == extent_root) {
C
Chris Mason 已提交
486
		pin_down_block(root, blocknr, 1);
487 488
		return 0;
	}
C
Chris Mason 已提交
489
	ret = __free_extent(trans, root, blocknr, num_blocks, pin);
C
Chris Mason 已提交
490
	pending_ret = del_pending_extents(trans, root->fs_info->extent_root);
491 492 493 494 495 496 497
	return ret ? ret : pending_ret;
}

/*
 * walks the btree of allocated extents and find a hole of a given size.
 * The key ins is changed to record the hole:
 * ins->objectid == block start
498
 * ins->flags = BTRFS_EXTENT_ITEM_KEY
499 500 501
 * ins->offset == number of blocks
 * Any available blocks before search_start are skipped.
 */
502 503 504
static int find_free_extent(struct btrfs_trans_handle *trans, struct btrfs_root
			    *orig_root, u64 num_blocks, u64 search_start, u64
			    search_end, struct btrfs_key *ins)
505
{
506
	struct btrfs_path *path;
C
Chris Mason 已提交
507
	struct btrfs_key key;
508 509 510
	int ret;
	u64 hole_size = 0;
	int slot = 0;
C
Chris Mason 已提交
511
	u64 last_block = 0;
C
Chris Mason 已提交
512
	u64 test_block;
513
	int start_found;
C
Chris Mason 已提交
514
	struct btrfs_leaf *l;
515
	struct btrfs_root * root = orig_root->fs_info->extent_root;
516
	struct btrfs_fs_info *info = root->fs_info;
517
	int total_needed = num_blocks;
518 519
	int total_found = 0;
	int fill_prealloc = 0;
C
Chris Mason 已提交
520
	int level;
521

522 523 524 525
	path = btrfs_alloc_path();
	ins->flags = 0;
	btrfs_set_key_type(ins, BTRFS_EXTENT_ITEM_KEY);

C
Chris Mason 已提交
526
	level = btrfs_header_level(btrfs_buffer_header(root->node));
527 528 529 530 531
	if (num_blocks == 0) {
		fill_prealloc = 1;
		num_blocks = 1;
		total_needed = min(level + 2, BTRFS_MAX_LEVEL) * 3;
	}
C
Chris Mason 已提交
532 533 534 535
	find_search_start(root, 0);
	if (info->block_group_cache &&
	    info->block_group_cache->last_alloc > search_start)
		search_start = info->block_group_cache->last_alloc;
536

537
check_failed:
538
	btrfs_init_path(path);
539 540 541
	ins->objectid = search_start;
	ins->offset = 0;
	start_found = 0;
542
	ret = btrfs_search_slot(trans, root, ins, path, 0, 0);
C
Chris Mason 已提交
543 544
	if (ret < 0)
		goto error;
C
Chris Mason 已提交
545

546 547
	if (path->slots[0] > 0)
		path->slots[0]--;
548

549
	while (1) {
550 551
		l = btrfs_buffer_leaf(path->nodes[0]);
		slot = path->slots[0];
552
		if (slot >= btrfs_header_nritems(&l->header)) {
553 554 555 556
			if (fill_prealloc) {
				info->extent_tree_prealloc_nr = 0;
				total_found = 0;
			}
557
			ret = btrfs_next_leaf(root, path);
558 559
			if (ret == 0)
				continue;
C
Chris Mason 已提交
560 561
			if (ret < 0)
				goto error;
562 563
			if (!start_found) {
				ins->objectid = search_start;
564
				ins->offset = (u64)-1 - search_start;
565 566 567 568 569
				start_found = 1;
				goto check_pending;
			}
			ins->objectid = last_block > search_start ?
					last_block : search_start;
570
			ins->offset = (u64)-1 - ins->objectid;
571 572
			goto check_pending;
		}
C
Chris Mason 已提交
573
		btrfs_disk_key_to_cpu(&key, &l->items[slot].key);
C
Chris Mason 已提交
574 575
		if (btrfs_key_type(&key) != BTRFS_EXTENT_ITEM_KEY)
			goto next;
C
Chris Mason 已提交
576
		if (key.objectid >= search_start) {
577
			if (start_found) {
578 579
				if (last_block < search_start)
					last_block = search_start;
C
Chris Mason 已提交
580
				hole_size = key.objectid - last_block;
581
				if (hole_size > num_blocks) {
582
					ins->objectid = last_block;
C
Chris Mason 已提交
583
					ins->offset = hole_size;
584 585
					goto check_pending;
				}
586
			}
587
		}
588
		start_found = 1;
C
Chris Mason 已提交
589
		last_block = key.objectid + key.offset;
C
Chris Mason 已提交
590
next:
591
		path->slots[0]++;
592 593 594 595 596 597
	}
	// FIXME -ENOSPC
check_pending:
	/* we have to make sure we didn't find an extent that has already
	 * been allocated by the map tree or the original allocation
	 */
598
	btrfs_release_path(root, path);
599
	BUG_ON(ins->objectid < search_start);
C
Chris Mason 已提交
600
	for (test_block = ins->objectid;
601 602
	     test_block < ins->objectid + num_blocks; test_block++) {
		if (test_radix_bit(&info->pinned_radix, test_block)) {
C
Chris Mason 已提交
603
			search_start = test_block + 1;
604 605 606
			goto check_failed;
		}
	}
607 608 609 610 611 612 613 614 615 616 617 618 619 620 621 622 623 624 625 626 627 628 629 630 631 632 633 634
	if (!fill_prealloc && info->extent_tree_insert_nr) {
		u64 last =
		  info->extent_tree_insert[info->extent_tree_insert_nr - 1];
		if (ins->objectid + num_blocks >
		    info->extent_tree_insert[0] &&
		    ins->objectid <= last) {
			search_start = last + 1;
			WARN_ON(1);
			goto check_failed;
		}
	}
	if (!fill_prealloc && info->extent_tree_prealloc_nr) {
		u64 first =
		  info->extent_tree_prealloc[info->extent_tree_prealloc_nr - 1];
		if (ins->objectid + num_blocks > first &&
		    ins->objectid <= info->extent_tree_prealloc[0]) {
			search_start = info->extent_tree_prealloc[0] + 1;
			WARN_ON(1);
			goto check_failed;
		}
	}
	if (fill_prealloc) {
		int nr;
		test_block = ins->objectid;
		while(test_block < ins->objectid + ins->offset &&
		      total_found < total_needed) {
			nr = total_needed - total_found - 1;
			BUG_ON(nr < 0);
C
Chris Mason 已提交
635
			info->extent_tree_prealloc[nr] = test_block;
636 637 638 639 640 641 642
			total_found++;
			test_block++;
		}
		if (total_found < total_needed) {
			search_start = test_block;
			goto check_failed;
		}
C
Chris Mason 已提交
643 644 645 646 647 648 649
		info->extent_tree_prealloc_nr = total_found;
	}
	ret = radix_tree_gang_lookup(&info->block_group_radix,
				     (void **)&info->block_group_cache,
				     ins->objectid, 1);
	if (ret) {
		info->block_group_cache->last_alloc = ins->objectid;
650
	}
C
Chris Mason 已提交
651
	ins->offset = num_blocks;
652
	btrfs_free_path(path);
653
	return 0;
C
Chris Mason 已提交
654
error:
655 656
	btrfs_release_path(root, path);
	btrfs_free_path(path);
C
Chris Mason 已提交
657
	return ret;
658 659 660 661 662 663 664 665
}
/*
 * finds a free extent and does all the dirty work required for allocation
 * returns the key for the extent through ins, and a tree buffer for
 * the first block of the extent through buf.
 *
 * returns 0 if everything worked, non-zero otherwise.
 */
666 667
int btrfs_alloc_extent(struct btrfs_trans_handle *trans,
		       struct btrfs_root *root, u64 owner,
668
		       u64 num_blocks, u64 search_start,
669
		       u64 search_end, struct btrfs_key *ins)
670 671 672
{
	int ret;
	int pending_ret;
673 674 675
	u64 super_blocks_used;
	struct btrfs_fs_info *info = root->fs_info;
	struct btrfs_root *extent_root = info->extent_root;
C
Chris Mason 已提交
676
	struct btrfs_extent_item extent_item;
677
	struct btrfs_key prealloc_key;
C
Chris Mason 已提交
678

C
Chris Mason 已提交
679
	btrfs_set_extent_refs(&extent_item, 1);
680
	btrfs_set_extent_owner(&extent_item, owner);
681

C
Chris Mason 已提交
682
	if (root == extent_root) {
683 684
		int nr;
		BUG_ON(info->extent_tree_prealloc_nr == 0);
C
Chris Mason 已提交
685 686
		BUG_ON(num_blocks != 1);
		ins->offset = 1;
687 688 689 690 691
		info->extent_tree_prealloc_nr--;
		nr = info->extent_tree_prealloc_nr;
		ins->objectid = info->extent_tree_prealloc[nr];
		info->extent_tree_insert[info->extent_tree_insert_nr++] =
			ins->objectid;
C
Chris Mason 已提交
692 693 694
		ret = update_block_group(trans, root,
					 ins->objectid, ins->offset, 1);
		BUG_ON(ret);
695 696
		return 0;
	}
697
	/* do the real allocation */
698
	ret = find_free_extent(trans, root, num_blocks, search_start,
C
Chris Mason 已提交
699 700 701
			       search_end, ins);
	if (ret)
		return ret;
702

703 704 705 706 707 708
	/* then do prealloc for the extent tree */
	ret = find_free_extent(trans, root, 0, ins->objectid + ins->offset,
			       search_end, &prealloc_key);
	if (ret)
		return ret;

709 710 711
	super_blocks_used = btrfs_super_blocks_used(info->disk_super);
	btrfs_set_super_blocks_used(info->disk_super, super_blocks_used +
				    num_blocks);
712 713
	ret = btrfs_insert_item(trans, extent_root, ins, &extent_item,
				sizeof(extent_item));
C
Chris Mason 已提交
714

715
	finish_current_insert(trans, extent_root);
C
Chris Mason 已提交
716
	pending_ret = del_pending_extents(trans, extent_root);
C
Chris Mason 已提交
717 718 719 720
	if (ret)
		return ret;
	if (pending_ret)
		return pending_ret;
C
Chris Mason 已提交
721
	ret = update_block_group(trans, root, ins->objectid, ins->offset, 1);
C
Chris Mason 已提交
722
	return 0;
723 724 725 726 727 728
}

/*
 * helper function to allocate a block for a given tree
 * returns the tree buffer or NULL.
 */
C
Chris Mason 已提交
729
struct buffer_head *btrfs_alloc_free_block(struct btrfs_trans_handle *trans,
730
					   struct btrfs_root *root)
731
{
C
Chris Mason 已提交
732
	struct btrfs_key ins;
733
	int ret;
C
Chris Mason 已提交
734
	struct buffer_head *buf;
735

736 737
	ret = btrfs_alloc_extent(trans, root, root->root_key.objectid,
				 1, 0, (unsigned long)-1, &ins);
738 739 740 741
	if (ret) {
		BUG();
		return NULL;
	}
C
Chris Mason 已提交
742
	BUG_ON(ret);
743
	buf = btrfs_find_create_tree_block(root, ins.objectid);
744
	set_buffer_uptodate(buf);
745 746
	return buf;
}
747

748 749 750 751 752 753 754 755 756 757 758 759 760 761 762 763 764 765
static int drop_leaf_ref(struct btrfs_trans_handle *trans,
			 struct btrfs_root *root, struct buffer_head *cur)
{
	struct btrfs_disk_key *key;
	struct btrfs_leaf *leaf;
	struct btrfs_file_extent_item *fi;
	int i;
	int nritems;
	int ret;

	BUG_ON(!btrfs_is_leaf(btrfs_buffer_node(cur)));
	leaf = btrfs_buffer_leaf(cur);
	nritems = btrfs_header_nritems(&leaf->header);
	for (i = 0; i < nritems; i++) {
		key = &leaf->items[i].key;
		if (btrfs_disk_key_type(key) != BTRFS_EXTENT_DATA_KEY)
			continue;
		fi = btrfs_item_ptr(leaf, i, struct btrfs_file_extent_item);
766 767
		if (btrfs_file_extent_type(fi) == BTRFS_FILE_EXTENT_INLINE)
			continue;
768 769 770 771 772 773 774 775 776 777 778 779 780
		/*
		 * FIXME make sure to insert a trans record that
		 * repeats the snapshot del on crash
		 */
		ret = btrfs_free_extent(trans, root,
					btrfs_file_extent_disk_blocknr(fi),
					btrfs_file_extent_disk_num_blocks(fi),
					0);
		BUG_ON(ret);
	}
	return 0;
}

C
Chris Mason 已提交
781 782 783 784
/*
 * helper function for drop_snapshot, this walks down the tree dropping ref
 * counts as it goes.
 */
785 786
static int walk_down_tree(struct btrfs_trans_handle *trans, struct btrfs_root
			  *root, struct btrfs_path *path, int *level)
C
Chris Mason 已提交
787
{
C
Chris Mason 已提交
788 789
	struct buffer_head *next;
	struct buffer_head *cur;
C
Chris Mason 已提交
790 791 792 793
	u64 blocknr;
	int ret;
	u32 refs;

794 795
	WARN_ON(*level < 0);
	WARN_ON(*level >= BTRFS_MAX_LEVEL);
C
Chris Mason 已提交
796
	ret = lookup_extent_ref(trans, root, bh_blocknr(path->nodes[*level]),
797
			       1, &refs);
C
Chris Mason 已提交
798 799 800
	BUG_ON(ret);
	if (refs > 1)
		goto out;
C
Chris Mason 已提交
801 802 803
	/*
	 * walk down to the last node level and free all the leaves
	 */
804
	while(*level >= 0) {
805 806
		WARN_ON(*level < 0);
		WARN_ON(*level >= BTRFS_MAX_LEVEL);
C
Chris Mason 已提交
807
		cur = path->nodes[*level];
C
Chris Mason 已提交
808 809
		if (btrfs_header_level(btrfs_buffer_header(cur)) != *level)
			WARN_ON(1);
810
		if (path->slots[*level] >=
C
Chris Mason 已提交
811
		    btrfs_header_nritems(btrfs_buffer_header(cur)))
C
Chris Mason 已提交
812
			break;
813 814 815 816 817
		if (*level == 0) {
			ret = drop_leaf_ref(trans, root, cur);
			BUG_ON(ret);
			break;
		}
C
Chris Mason 已提交
818 819
		blocknr = btrfs_node_blockptr(btrfs_buffer_node(cur),
					      path->slots[*level]);
C
Chris Mason 已提交
820
		ret = lookup_extent_ref(trans, root, blocknr, 1, &refs);
821 822
		BUG_ON(ret);
		if (refs != 1) {
C
Chris Mason 已提交
823
			path->slots[*level]++;
824
			ret = btrfs_free_extent(trans, root, blocknr, 1, 1);
C
Chris Mason 已提交
825 826 827 828
			BUG_ON(ret);
			continue;
		}
		next = read_tree_block(root, blocknr);
829
		WARN_ON(*level <= 0);
C
Chris Mason 已提交
830
		if (path->nodes[*level-1])
C
Chris Mason 已提交
831
			btrfs_block_release(root, path->nodes[*level-1]);
C
Chris Mason 已提交
832
		path->nodes[*level-1] = next;
C
Chris Mason 已提交
833
		*level = btrfs_header_level(btrfs_buffer_header(next));
C
Chris Mason 已提交
834 835 836
		path->slots[*level] = 0;
	}
out:
837 838
	WARN_ON(*level < 0);
	WARN_ON(*level >= BTRFS_MAX_LEVEL);
839
	ret = btrfs_free_extent(trans, root,
840
				bh_blocknr(path->nodes[*level]), 1, 1);
C
Chris Mason 已提交
841
	btrfs_block_release(root, path->nodes[*level]);
C
Chris Mason 已提交
842 843 844 845 846 847
	path->nodes[*level] = NULL;
	*level += 1;
	BUG_ON(ret);
	return 0;
}

C
Chris Mason 已提交
848 849 850 851 852
/*
 * helper for dropping snapshots.  This walks back up the tree in the path
 * to find the first node higher up where we haven't yet gone through
 * all the slots
 */
853 854
static int walk_up_tree(struct btrfs_trans_handle *trans, struct btrfs_root
			*root, struct btrfs_path *path, int *level)
C
Chris Mason 已提交
855 856 857 858
{
	int i;
	int slot;
	int ret;
C
Chris Mason 已提交
859
	for(i = *level; i < BTRFS_MAX_LEVEL - 1 && path->nodes[i]; i++) {
C
Chris Mason 已提交
860
		slot = path->slots[i];
C
Chris Mason 已提交
861 862
		if (slot < btrfs_header_nritems(
		    btrfs_buffer_header(path->nodes[i])) - 1) {
C
Chris Mason 已提交
863 864 865 866
			path->slots[i]++;
			*level = i;
			return 0;
		} else {
867
			ret = btrfs_free_extent(trans, root,
868
						bh_blocknr(path->nodes[*level]),
869
						1, 1);
870
			BUG_ON(ret);
C
Chris Mason 已提交
871
			btrfs_block_release(root, path->nodes[*level]);
C
Chris Mason 已提交
872
			path->nodes[*level] = NULL;
C
Chris Mason 已提交
873 874 875 876 877 878
			*level = i + 1;
		}
	}
	return 1;
}

C
Chris Mason 已提交
879 880 881 882 883
/*
 * drop the reference count on the tree rooted at 'snap'.  This traverses
 * the tree freeing any blocks that have a ref count of zero after being
 * decremented.
 */
884
int btrfs_drop_snapshot(struct btrfs_trans_handle *trans, struct btrfs_root
C
Chris Mason 已提交
885
			*root, struct buffer_head *snap)
C
Chris Mason 已提交
886
{
887
	int ret = 0;
C
Chris Mason 已提交
888
	int wret;
C
Chris Mason 已提交
889
	int level;
890
	struct btrfs_path *path;
C
Chris Mason 已提交
891 892 893
	int i;
	int orig_level;

894 895 896
	path = btrfs_alloc_path();
	BUG_ON(!path);
	btrfs_init_path(path);
C
Chris Mason 已提交
897

C
Chris Mason 已提交
898
	level = btrfs_header_level(btrfs_buffer_header(snap));
C
Chris Mason 已提交
899
	orig_level = level;
900 901
	path->nodes[level] = snap;
	path->slots[level] = 0;
C
Chris Mason 已提交
902
	while(1) {
903
		wret = walk_down_tree(trans, root, path, &level);
C
Chris Mason 已提交
904
		if (wret > 0)
C
Chris Mason 已提交
905
			break;
C
Chris Mason 已提交
906 907 908
		if (wret < 0)
			ret = wret;

909
		wret = walk_up_tree(trans, root, path, &level);
C
Chris Mason 已提交
910
		if (wret > 0)
C
Chris Mason 已提交
911
			break;
C
Chris Mason 已提交
912 913
		if (wret < 0)
			ret = wret;
C
Chris Mason 已提交
914
	}
C
Chris Mason 已提交
915
	for (i = 0; i <= orig_level; i++) {
916 917
		if (path->nodes[i]) {
			btrfs_block_release(root, path->nodes[i]);
C
Chris Mason 已提交
918
		}
C
Chris Mason 已提交
919
	}
920
	btrfs_free_path(path);
C
Chris Mason 已提交
921
	return ret;
C
Chris Mason 已提交
922
}
C
Chris Mason 已提交
923 924 925 926 927 928 929 930 931 932 933 934 935 936 937 938 939 940 941 942 943 944 945 946 947 948 949 950 951 952 953 954 955 956 957 958 959 960 961 962 963 964 965 966 967 968 969 970 971 972 973 974 975 976 977 978 979 980 981 982 983 984 985 986

int btrfs_free_block_groups(struct btrfs_fs_info *info)
{
	int ret;
	struct btrfs_block_group_cache *cache[8];
	int i;

	while(1) {
		ret = radix_tree_gang_lookup(&info->block_group_radix,
					     (void **)cache, 0,
					     ARRAY_SIZE(cache));
		if (!ret)
			break;
		for (i = 0; i < ret; i++) {
			radix_tree_delete(&info->block_group_radix,
					  cache[i]->key.objectid +
					  cache[i]->key.offset - 1);
			kfree(cache[i]);
		}
	}
	return 0;
}

int btrfs_read_block_groups(struct btrfs_root *root)
{
	struct btrfs_path *path;
	int ret;
	int err = 0;
	struct btrfs_block_group_item *bi;
	struct btrfs_block_group_cache *cache;
	struct btrfs_key key;
	struct btrfs_key found_key;
	struct btrfs_leaf *leaf;
	u64 group_size_blocks = BTRFS_BLOCK_GROUP_SIZE / root->blocksize;

	root = root->fs_info->extent_root;
	key.objectid = 0;
	key.offset = group_size_blocks;
	key.flags = 0;
	btrfs_set_key_type(&key, BTRFS_BLOCK_GROUP_ITEM_KEY);

	path = btrfs_alloc_path();
	if (!path)
		return -ENOMEM;

	while(1) {
		ret = btrfs_search_slot(NULL, root->fs_info->extent_root,
					&key, path, 0, 0);
		if (ret != 0) {
			err = ret;
			break;
		}
		leaf = btrfs_buffer_leaf(path->nodes[0]);
		btrfs_disk_key_to_cpu(&found_key,
				      &leaf->items[path->slots[0]].key);
		cache = kmalloc(sizeof(*cache), GFP_NOFS);
		if (!cache) {
			err = -1;
			break;
		}
		bi = btrfs_item_ptr(leaf, path->slots[0],
				    struct btrfs_block_group_item);
		memcpy(&cache->item, bi, sizeof(*bi));
		memcpy(&cache->key, &found_key, sizeof(found_key));
C
Chris Mason 已提交
987 988
		cache->last_alloc = 0;
		cache->first_free = 0;
C
Chris Mason 已提交
989 990 991 992 993 994 995 996 997 998 999 1000 1001 1002 1003
		key.objectid = found_key.objectid + found_key.offset;
		btrfs_release_path(root, path);
		ret = radix_tree_insert(&root->fs_info->block_group_radix,
					found_key.objectid +
					found_key.offset - 1,
					(void *)cache);
		BUG_ON(ret);
		if (key.objectid >=
		    btrfs_super_total_blocks(root->fs_info->disk_super))
			break;
	}

	btrfs_free_path(path);
	return 0;
}