extent-tree.c 11.3 KB
Newer Older
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15
#include <stdio.h>
#include <stdlib.h>
#include "kerncompat.h"
#include "radix-tree.h"
#include "ctree.h"
#include "disk-io.h"
#include "print-tree.h"

/*
 * pending extents are blocks that we're trying to allocate in the extent
 * map while trying to grow the map because of other allocations.  To avoid
 * recursing, they are tagged in the radix tree and cleaned up after
 * other allocations are done.  The pending tag is also used in the same
 * manner for deletes.
 */
16 17
#define CTREE_EXTENT_PENDING_ADD 0
#define CTREE_EXTENT_PENDING_DEL 1
18

C
Chris Mason 已提交
19 20 21 22 23 24 25 26 27 28 29 30
static int inc_block_ref(struct ctree_root *root, u64 blocknr)
{
	struct ctree_path path;
	int ret;
	struct key key;
	struct leaf *l;
	struct extent_item *item;
	init_path(&path);
	key.objectid = blocknr;
	key.flags = 0;
	key.offset = 1;
	ret = search_slot(root->extent_root, &key, &path, 0, 1);
31 32
	if (ret != 0)
		BUG();
C
Chris Mason 已提交
33 34 35 36 37
	BUG_ON(ret != 0);
	l = &path.nodes[0]->leaf;
	item = (struct extent_item *)(l->data +
				      l->items[path.slots[0]].offset);
	item->refs++;
38

C
Chris Mason 已提交
39 40 41 42 43
	BUG_ON(list_empty(&path.nodes[0]->dirty));
	release_path(root->extent_root, &path);
	return 0;
}

44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65
static int lookup_block_ref(struct ctree_root *root, u64 blocknr, int *refs)
{
	struct ctree_path path;
	int ret;
	struct key key;
	struct leaf *l;
	struct extent_item *item;
	init_path(&path);
	key.objectid = blocknr;
	key.flags = 0;
	key.offset = 1;
	ret = search_slot(root->extent_root, &key, &path, 0, 0);
	if (ret != 0)
		BUG();
	l = &path.nodes[0]->leaf;
	item = (struct extent_item *)(l->data +
				      l->items[path.slots[0]].offset);
	*refs = item->refs;
	release_path(root->extent_root, &path);
	return 0;
}

C
Chris Mason 已提交
66 67 68 69
int btrfs_inc_ref(struct ctree_root *root, struct tree_buffer *buf)
{
	u64 blocknr;
	int i;
70 71 72 73 74 75

	if (root == root->extent_root)
		return 0;
	if (is_leaf(buf->node.header.flags))
		return 0;

C
Chris Mason 已提交
76 77 78 79 80 81 82
	for (i = 0; i < buf->node.header.nritems; i++) {
		blocknr = buf->node.blockptrs[i];
		inc_block_ref(root, blocknr);
	}
	return 0;
}

83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101
int btrfs_finish_extent_commit(struct ctree_root *root)
{
	struct ctree_root *extent_root = root->extent_root;
	unsigned long gang[8];
	int ret;
	int i;

	while(1) {
		ret = radix_tree_gang_lookup(&extent_root->pinned_radix,
						 (void **)gang, 0,
						 ARRAY_SIZE(gang));
		if (!ret)
			break;
		for (i = 0; i < ret; i++)
			radix_tree_delete(&extent_root->pinned_radix, gang[i]);
	}
	return 0;
}

102
/*
103
 * remove an extent from the root, returns 0 on success
104
 */
105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150
int __free_extent(struct ctree_root *root, u64 blocknr, u64 num_blocks)
{
	struct ctree_path path;
	struct key key;
	struct ctree_root *extent_root = root->extent_root;
	int ret;
	struct item *item;
	struct extent_item *ei;
	key.objectid = blocknr;
	key.flags = 0;
	key.offset = num_blocks;

	init_path(&path);
	ret = search_slot(extent_root, &key, &path, -1, 1);
	if (ret) {
		printf("failed to find %Lu\n", key.objectid);
		print_tree(extent_root, extent_root->node);
		printf("failed to find %Lu\n", key.objectid);
		BUG();
	}
	item = path.nodes[0]->leaf.items + path.slots[0];
	ei = (struct extent_item *)(path.nodes[0]->leaf.data + item->offset);
	BUG_ON(ei->refs == 0);
	ei->refs--;
	if (ei->refs == 0) {
		if (root == extent_root) {
			int err;
			radix_tree_preload(GFP_KERNEL);
			err = radix_tree_insert(&extent_root->pinned_radix,
					  blocknr, (void *)blocknr);
			BUG_ON(err);
			radix_tree_preload_end();
		}
		ret = del_item(extent_root, &path);
		if (ret)
			BUG();
	}
	release_path(extent_root, &path);
	return ret;
}

/*
 * insert all of the pending extents reserved during the original
 * allocation.  (CTREE_EXTENT_PENDING).  Returns zero if it all worked out
 */
static int insert_pending_extents(struct ctree_root *extent_root)
151 152 153
{
	int ret;
	struct key key;
154
	struct extent_item item;
155 156 157
	struct tree_buffer *gang[4];
	int i;

158 159 160
	// FIXME -ENOSPC
	item.owner = extent_root->node->node.header.parentid;
	item.refs = 1;
161 162 163 164
	while(1) {
		ret = radix_tree_gang_lookup_tag(&extent_root->cache_radix,
						 (void **)gang, 0,
						 ARRAY_SIZE(gang),
165
						 CTREE_EXTENT_PENDING_ADD);
166 167 168 169 170 171
		if (!ret)
			break;
		for (i = 0; i < ret; i++) {
			key.objectid = gang[i]->blocknr;
			key.flags = 0;
			key.offset = 1;
172 173
			ret = insert_item(extent_root, &key, &item,
					  sizeof(item));
174
			if (ret) {
175
				printf("%Lu already in tree\n", key.objectid);
176 177 178 179 180
				print_tree(extent_root, extent_root->node);
				BUG();
				// FIXME undo it and return sane
				return ret;
			}
181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 208
			radix_tree_tag_clear(&extent_root->cache_radix,
					     gang[i]->blocknr,
					     CTREE_EXTENT_PENDING_ADD);
			tree_block_release(extent_root, gang[i]);
		}
	}
	return 0;
}

/*
 * find all the blocks marked as pending in the radix tree and remove
 * them from the extent map
 */
static int del_pending_extents(struct ctree_root *extent_root)
{
	int ret;
	struct tree_buffer *gang[4];
	int i;

	while(1) {
		ret = radix_tree_gang_lookup_tag(&extent_root->cache_radix,
						 (void **)gang, 0,
						 ARRAY_SIZE(gang),
						 CTREE_EXTENT_PENDING_DEL);
		if (!ret)
			break;
		for (i = 0; i < ret; i++) {
			ret = __free_extent(extent_root, gang[i]->blocknr, 1);
209 210
			radix_tree_tag_clear(&extent_root->cache_radix,
						gang[i]->blocknr,
211
						CTREE_EXTENT_PENDING_DEL);
212 213 214 215 216 217
			tree_block_release(extent_root, gang[i]);
		}
	}
	return 0;
}

218 219 220 221 222 223 224 225 226 227 228 229 230
static int run_pending(struct ctree_root *extent_root)
{
	while(radix_tree_tagged(&extent_root->cache_radix,
			        CTREE_EXTENT_PENDING_DEL) ||
	      radix_tree_tagged(&extent_root->cache_radix,
				CTREE_EXTENT_PENDING_ADD)) {
		insert_pending_extents(extent_root);
		del_pending_extents(extent_root);
	}
	return 0;
}


231 232 233 234 235 236 237 238 239 240
/*
 * remove an extent from the root, returns 0 on success
 */
int free_extent(struct ctree_root *root, u64 blocknr, u64 num_blocks)
{
	struct key key;
	struct ctree_root *extent_root = root->extent_root;
	struct tree_buffer *t;
	int pending_ret;
	int ret;
241

242
	if (root == extent_root) {
243 244 245 246 247 248 249 250 251 252 253 254 255 256
		t = find_tree_block(root, blocknr);
		if (radix_tree_tag_get(&root->cache_radix, blocknr,
				      CTREE_EXTENT_PENDING_ADD)) {
			radix_tree_tag_clear(&root->cache_radix,
					     blocknr,
					     CTREE_EXTENT_PENDING_ADD);
			/* once for us */
			tree_block_release(root, t);
			/* once for the pending add */
			tree_block_release(root, t);
		} else {
			radix_tree_tag_set(&root->cache_radix, blocknr,
				   CTREE_EXTENT_PENDING_DEL);
		}
257 258
		return 0;
	}
259 260 261 262 263
	key.objectid = blocknr;
	key.flags = 0;
	key.offset = num_blocks;
	ret = __free_extent(root, blocknr, num_blocks);
	pending_ret = run_pending(root->extent_root);
264 265 266 267 268 269 270 271 272 273 274
	return ret ? ret : pending_ret;
}

/*
 * walks the btree of allocated extents and find a hole of a given size.
 * The key ins is changed to record the hole:
 * ins->objectid == block start
 * ins->flags = 0
 * ins->offset == number of blocks
 * Any available blocks before search_start are skipped.
 */
C
Chris Mason 已提交
275 276
static int find_free_extent(struct ctree_root *orig_root, u64 num_blocks,
			    u64 search_start, u64 search_end, struct key *ins)
277 278 279 280 281 282 283 284 285 286 287 288 289 290 291 292 293
{
	struct ctree_path path;
	struct key *key;
	int ret;
	u64 hole_size = 0;
	int slot = 0;
	u64 last_block;
	int start_found;
	struct leaf *l;
	struct ctree_root * root = orig_root->extent_root;

check_failed:
	init_path(&path);
	ins->objectid = search_start;
	ins->offset = 0;
	ins->flags = 0;
	start_found = 0;
C
Chris Mason 已提交
294
	ret = search_slot(root, ins, &path, 0, 0);
C
Chris Mason 已提交
295 296
	if (ret < 0)
		goto error;
C
Chris Mason 已提交
297

298 299 300 301 302 303 304
	while (1) {
		l = &path.nodes[0]->leaf;
		slot = path.slots[0];
		if (slot >= l->header.nritems) {
			ret = next_leaf(root, &path);
			if (ret == 0)
				continue;
C
Chris Mason 已提交
305 306
			if (ret < 0)
				goto error;
307 308 309 310 311 312 313 314 315 316 317 318 319 320 321 322 323 324 325 326 327 328 329 330 331 332 333 334 335 336 337 338 339
			if (!start_found) {
				ins->objectid = search_start;
				ins->offset = num_blocks;
				start_found = 1;
				goto check_pending;
			}
			ins->objectid = last_block > search_start ?
					last_block : search_start;
			ins->offset = num_blocks;
			goto check_pending;
		}
		key = &l->items[slot].key;
		if (key->objectid >= search_start) {
			if (start_found) {
				hole_size = key->objectid - last_block;
				if (hole_size > num_blocks) {
					ins->objectid = last_block;
					ins->offset = num_blocks;
					goto check_pending;
				}
			} else
				start_found = 1;
			last_block = key->objectid + key->offset;
		}
		path.slots[0]++;
	}
	// FIXME -ENOSPC
check_pending:
	/* we have to make sure we didn't find an extent that has already
	 * been allocated by the map tree or the original allocation
	 */
	release_path(root, &path);
	BUG_ON(ins->objectid < search_start);
340
	if (1 || orig_root->extent_root == orig_root) {
341 342 343 344 345 346 347
		BUG_ON(num_blocks != 1);
		if ((root->current_insert.objectid <= ins->objectid &&
		    root->current_insert.objectid +
		    root->current_insert.offset > ins->objectid) ||
		   (root->current_insert.objectid > ins->objectid &&
		    root->current_insert.objectid <= ins->objectid +
		    ins->offset) ||
348
		   radix_tree_lookup(&root->pinned_radix, ins->objectid) ||
349
		   radix_tree_tag_get(&root->cache_radix, ins->objectid,
350
				      CTREE_EXTENT_PENDING_ADD)) {
351 352 353 354 355 356 357
			search_start = ins->objectid + 1;
			goto check_failed;
		}
	}
	if (ins->offset != 1)
		BUG();
	return 0;
C
Chris Mason 已提交
358 359 360
error:
	release_path(root, &path);
	return ret;
361 362 363 364 365 366 367 368 369 370 371 372 373 374 375 376 377 378 379 380 381 382 383 384 385 386 387 388
}

/*
 * finds a free extent and does all the dirty work required for allocation
 * returns the key for the extent through ins, and a tree buffer for
 * the first block of the extent through buf.
 *
 * returns 0 if everything worked, non-zero otherwise.
 */
int alloc_extent(struct ctree_root *root, u64 num_blocks, u64 search_start,
			 u64 search_end, u64 owner, struct key *ins,
			 struct tree_buffer **buf)
{
	int ret;
	int pending_ret;
	struct extent_item extent_item;
	extent_item.refs = 1;
	extent_item.owner = owner;

	ret = find_free_extent(root, num_blocks, search_start, search_end, ins);
	if (ret)
		return ret;
	if (root != root->extent_root) {
		memcpy(&root->extent_root->current_insert, ins, sizeof(*ins));
		ret = insert_item(root->extent_root, ins, &extent_item,
				  sizeof(extent_item));
		memset(&root->extent_root->current_insert, 0,
		       sizeof(struct key));
389
		pending_ret = run_pending(root->extent_root);
390 391 392 393 394
		if (ret)
			return ret;
		if (pending_ret)
			return pending_ret;
		*buf = find_tree_block(root, ins->objectid);
C
Chris Mason 已提交
395
		dirty_tree_block(root, *buf);
396 397 398 399 400 401 402
		return 0;
	}
	/* we're allocating an extent for the extent tree, don't recurse */
	BUG_ON(ins->offset != 1);
	*buf = find_tree_block(root, ins->objectid);
	BUG_ON(!*buf);
	radix_tree_tag_set(&root->cache_radix, ins->objectid,
403
			   CTREE_EXTENT_PENDING_ADD);
404
	(*buf)->count++;
C
Chris Mason 已提交
405
	dirty_tree_block(root, *buf);
406 407 408 409 410 411 412 413 414 415 416 417 418 419 420 421 422 423 424 425 426 427 428
	return 0;

}

/*
 * helper function to allocate a block for a given tree
 * returns the tree buffer or NULL.
 */
struct tree_buffer *alloc_free_block(struct ctree_root *root)
{
	struct key ins;
	int ret;
	struct tree_buffer *buf = NULL;

	ret = alloc_extent(root, 1, 0, (unsigned long)-1,
			   root->node->node.header.parentid,
			   &ins, &buf);
	if (ret) {
		BUG();
		return NULL;
	}
	if (root != root->extent_root)
		BUG_ON(radix_tree_tag_get(&root->extent_root->cache_radix,
429 430
					  buf->blocknr,
					  CTREE_EXTENT_PENDING_ADD));
431 432
	return buf;
}
433 434 435 436 437 438 439 440 441 442 443 444 445 446 447 448 449 450 451 452 453 454 455 456 457 458 459 460

int btrfs_drop_snapshot(struct ctree_root *root, struct tree_buffer *snap)
{
	int ret;
	int level;
	int refs;
	u64 blocknr = snap->blocknr;

	level = node_level(snap->node.header.flags);
	ret = lookup_block_ref(root, snap->blocknr, &refs);
	BUG_ON(ret);
	if (refs == 1 && level != 0) {
		struct node *n = &snap->node;
		struct tree_buffer *b;
		int i;
		for (i = 0; i < n->header.nritems; i++) {
			b = read_tree_block(root, n->blockptrs[i]);
			/* FIXME, don't recurse here */
			ret = btrfs_drop_snapshot(root, b);
			BUG_ON(ret);
			tree_block_release(root, b);
		}
	}
	ret = free_extent(root, blocknr, 1);
	BUG_ON(ret);
	return 0;
}