123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674 |
- #include <linux/module.h>
- #include "ctree.h"
- #include "disk-io.h"
- #include "print-tree.h"
- #include "transaction.h"
- static int find_free_extent(struct btrfs_trans_handle *trans, struct btrfs_root
- *orig_root, u64 num_blocks, u64 search_start, u64
- search_end, struct btrfs_key *ins);
- static int finish_current_insert(struct btrfs_trans_handle *trans, struct
- btrfs_root *extent_root);
- static int del_pending_extents(struct btrfs_trans_handle *trans, struct
- btrfs_root *extent_root);
- static int inc_block_ref(struct btrfs_trans_handle *trans, struct btrfs_root
- *root, u64 blocknr, u64 num_blocks)
- {
- struct btrfs_path *path;
- int ret;
- struct btrfs_key key;
- struct btrfs_leaf *l;
- struct btrfs_extent_item *item;
- struct btrfs_key ins;
- u32 refs;
- find_free_extent(trans, root->fs_info->extent_root, 0, 0, (u64)-1,
- &ins);
- path = btrfs_alloc_path();
- BUG_ON(!path);
- btrfs_init_path(path);
- key.objectid = blocknr;
- key.flags = 0;
- btrfs_set_key_type(&key, BTRFS_EXTENT_ITEM_KEY);
- key.offset = num_blocks;
- ret = btrfs_search_slot(trans, root->fs_info->extent_root, &key, path,
- 0, 1);
- if (ret != 0)
- BUG();
- BUG_ON(ret != 0);
- l = btrfs_buffer_leaf(path->nodes[0]);
- item = btrfs_item_ptr(l, path->slots[0], struct btrfs_extent_item);
- refs = btrfs_extent_refs(item);
- btrfs_set_extent_refs(item, refs + 1);
- btrfs_mark_buffer_dirty(path->nodes[0]);
- btrfs_release_path(root->fs_info->extent_root, path);
- btrfs_free_path(path);
- finish_current_insert(trans, root->fs_info->extent_root);
- del_pending_extents(trans, root->fs_info->extent_root);
- return 0;
- }
- static int lookup_block_ref(struct btrfs_trans_handle *trans, struct btrfs_root
- *root, u64 blocknr, u64 num_blocks, u32 *refs)
- {
- struct btrfs_path *path;
- int ret;
- struct btrfs_key key;
- struct btrfs_leaf *l;
- struct btrfs_extent_item *item;
- path = btrfs_alloc_path();
- btrfs_init_path(path);
- key.objectid = blocknr;
- key.offset = num_blocks;
- key.flags = 0;
- btrfs_set_key_type(&key, BTRFS_EXTENT_ITEM_KEY);
- ret = btrfs_search_slot(trans, root->fs_info->extent_root, &key, path,
- 0, 0);
- if (ret != 0)
- BUG();
- l = btrfs_buffer_leaf(path->nodes[0]);
- item = btrfs_item_ptr(l, path->slots[0], struct btrfs_extent_item);
- *refs = btrfs_extent_refs(item);
- btrfs_release_path(root->fs_info->extent_root, path);
- btrfs_free_path(path);
- return 0;
- }
- int btrfs_inc_ref(struct btrfs_trans_handle *trans, struct btrfs_root *root,
- struct buffer_head *buf)
- {
- u64 blocknr;
- struct btrfs_node *buf_node;
- struct btrfs_leaf *buf_leaf;
- struct btrfs_disk_key *key;
- struct btrfs_file_extent_item *fi;
- int i;
- int leaf;
- int ret;
- if (!root->ref_cows)
- return 0;
- buf_node = btrfs_buffer_node(buf);
- leaf = btrfs_is_leaf(buf_node);
- buf_leaf = btrfs_buffer_leaf(buf);
- for (i = 0; i < btrfs_header_nritems(&buf_node->header); i++) {
- if (leaf) {
- key = &buf_leaf->items[i].key;
- if (btrfs_disk_key_type(key) != BTRFS_EXTENT_DATA_KEY)
- continue;
- fi = btrfs_item_ptr(buf_leaf, i,
- struct btrfs_file_extent_item);
- ret = inc_block_ref(trans, root,
- btrfs_file_extent_disk_blocknr(fi),
- btrfs_file_extent_disk_num_blocks(fi));
- BUG_ON(ret);
- } else {
- blocknr = btrfs_node_blockptr(buf_node, i);
- ret = inc_block_ref(trans, root, blocknr, 1);
- BUG_ON(ret);
- }
- }
- return 0;
- }
- int btrfs_finish_extent_commit(struct btrfs_trans_handle *trans, struct
- btrfs_root *root)
- {
- unsigned long gang[8];
- u64 first = 0;
- int ret;
- int i;
- struct radix_tree_root *pinned_radix = &root->fs_info->pinned_radix;
- while(1) {
- ret = find_first_radix_bit(pinned_radix, gang,
- ARRAY_SIZE(gang));
- if (!ret)
- break;
- if (!first)
- first = gang[0];
- for (i = 0; i < ret; i++) {
- clear_radix_bit(pinned_radix, gang[i]);
- }
- }
- if (root->fs_info->last_insert.objectid > first)
- root->fs_info->last_insert.objectid = first;
- root->fs_info->last_insert.offset = 0;
- return 0;
- }
- static int finish_current_insert(struct btrfs_trans_handle *trans, struct
- btrfs_root *extent_root)
- {
- struct btrfs_key ins;
- struct btrfs_extent_item extent_item;
- int i;
- int ret;
- u64 super_blocks_used;
- struct btrfs_fs_info *info = extent_root->fs_info;
- btrfs_set_extent_refs(&extent_item, 1);
- btrfs_set_extent_owner(&extent_item,
- btrfs_header_parentid(btrfs_buffer_header(extent_root->node)));
- ins.offset = 1;
- ins.flags = 0;
- btrfs_set_key_type(&ins, BTRFS_EXTENT_ITEM_KEY);
- for (i = 0; i < extent_root->fs_info->current_insert.flags; i++) {
- ins.objectid = extent_root->fs_info->current_insert.objectid +
- i;
- super_blocks_used = btrfs_super_blocks_used(info->disk_super);
- btrfs_set_super_blocks_used(info->disk_super,
- super_blocks_used + 1);
- ret = btrfs_insert_item(trans, extent_root, &ins, &extent_item,
- sizeof(extent_item));
- BUG_ON(ret);
- }
- extent_root->fs_info->current_insert.offset = 0;
- return 0;
- }
- static int pin_down_block(struct btrfs_root *root, u64 blocknr, int pending)
- {
- int err;
- struct btrfs_header *header;
- struct buffer_head *bh;
- if (!pending) {
- bh = btrfs_find_tree_block(root, blocknr);
- if (bh) {
- if (buffer_uptodate(bh)) {
- u64 transid =
- root->fs_info->running_transaction->transid;
- header = btrfs_buffer_header(bh);
- if (btrfs_header_generation(header) ==
- transid) {
- btrfs_block_release(root, bh);
- return 0;
- }
- }
- btrfs_block_release(root, bh);
- }
- err = set_radix_bit(&root->fs_info->pinned_radix, blocknr);
- } else {
- err = set_radix_bit(&root->fs_info->pending_del_radix, blocknr);
- }
- BUG_ON(err);
- return 0;
- }
- /*
- * remove an extent from the root, returns 0 on success
- */
- static int __free_extent(struct btrfs_trans_handle *trans, struct btrfs_root
- *root, u64 blocknr, u64 num_blocks, int pin)
- {
- struct btrfs_path *path;
- struct btrfs_key key;
- struct btrfs_fs_info *info = root->fs_info;
- struct btrfs_root *extent_root = info->extent_root;
- int ret;
- struct btrfs_extent_item *ei;
- struct btrfs_key ins;
- u32 refs;
- key.objectid = blocknr;
- key.flags = 0;
- btrfs_set_key_type(&key, BTRFS_EXTENT_ITEM_KEY);
- key.offset = num_blocks;
- find_free_extent(trans, root, 0, 0, (u64)-1, &ins);
- path = btrfs_alloc_path();
- BUG_ON(!path);
- btrfs_init_path(path);
- ret = btrfs_search_slot(trans, extent_root, &key, path, -1, 1);
- if (ret) {
- printk("failed to find %Lu\n", key.objectid);
- btrfs_print_tree(extent_root, extent_root->node);
- printk("failed to find %Lu\n", key.objectid);
- BUG();
- }
- ei = btrfs_item_ptr(btrfs_buffer_leaf(path->nodes[0]), path->slots[0],
- struct btrfs_extent_item);
- BUG_ON(ei->refs == 0);
- refs = btrfs_extent_refs(ei) - 1;
- btrfs_set_extent_refs(ei, refs);
- btrfs_mark_buffer_dirty(path->nodes[0]);
- if (refs == 0) {
- u64 super_blocks_used;
- if (pin) {
- ret = pin_down_block(root, blocknr, 0);
- BUG_ON(ret);
- }
- super_blocks_used = btrfs_super_blocks_used(info->disk_super);
- btrfs_set_super_blocks_used(info->disk_super,
- super_blocks_used - num_blocks);
- ret = btrfs_del_item(trans, extent_root, path);
- if (ret)
- BUG();
- }
- btrfs_release_path(extent_root, path);
- btrfs_free_path(path);
- finish_current_insert(trans, extent_root);
- return ret;
- }
- /*
- * find all the blocks marked as pending in the radix tree and remove
- * them from the extent map
- */
- static int del_pending_extents(struct btrfs_trans_handle *trans, struct
- btrfs_root *extent_root)
- {
- int ret;
- int wret;
- int err = 0;
- unsigned long gang[4];
- int i;
- struct radix_tree_root *pending_radix;
- struct radix_tree_root *pinned_radix;
- pending_radix = &extent_root->fs_info->pending_del_radix;
- pinned_radix = &extent_root->fs_info->pinned_radix;
- while(1) {
- ret = find_first_radix_bit(pending_radix, gang,
- ARRAY_SIZE(gang));
- if (!ret)
- break;
- for (i = 0; i < ret; i++) {
- wret = set_radix_bit(pinned_radix, gang[i]);
- BUG_ON(wret);
- wret = clear_radix_bit(pending_radix, gang[i]);
- BUG_ON(wret);
- wret = __free_extent(trans, extent_root,
- gang[i], 1, 0);
- if (wret)
- err = wret;
- }
- }
- return err;
- }
- /*
- * remove an extent from the root, returns 0 on success
- */
- int btrfs_free_extent(struct btrfs_trans_handle *trans, struct btrfs_root
- *root, u64 blocknr, u64 num_blocks, int pin)
- {
- struct btrfs_root *extent_root = root->fs_info->extent_root;
- int pending_ret;
- int ret;
- if (root == extent_root) {
- pin_down_block(root, blocknr, 1);
- return 0;
- }
- ret = __free_extent(trans, root, blocknr, num_blocks, pin);
- pending_ret = del_pending_extents(trans, root->fs_info->extent_root);
- return ret ? ret : pending_ret;
- }
- /*
- * walks the btree of allocated extents and find a hole of a given size.
- * The key ins is changed to record the hole:
- * ins->objectid == block start
- * ins->flags = BTRFS_EXTENT_ITEM_KEY
- * ins->offset == number of blocks
- * Any available blocks before search_start are skipped.
- */
- static int find_free_extent(struct btrfs_trans_handle *trans, struct btrfs_root
- *orig_root, u64 num_blocks, u64 search_start, u64
- search_end, struct btrfs_key *ins)
- {
- struct btrfs_path *path;
- struct btrfs_key key;
- int ret;
- u64 hole_size = 0;
- int slot = 0;
- u64 last_block = 0;
- u64 test_block;
- int start_found;
- struct btrfs_leaf *l;
- struct btrfs_root * root = orig_root->fs_info->extent_root;
- int total_needed = num_blocks;
- int level;
- level = btrfs_header_level(btrfs_buffer_header(root->node));
- total_needed += (level + 1) * 3;
- if (root->fs_info->last_insert.objectid > search_start)
- search_start = root->fs_info->last_insert.objectid;
- ins->flags = 0;
- btrfs_set_key_type(ins, BTRFS_EXTENT_ITEM_KEY);
- path = btrfs_alloc_path();
- check_failed:
- btrfs_init_path(path);
- ins->objectid = search_start;
- ins->offset = 0;
- start_found = 0;
- ret = btrfs_search_slot(trans, root, ins, path, 0, 0);
- if (ret < 0)
- goto error;
- if (path->slots[0] > 0)
- path->slots[0]--;
- while (1) {
- l = btrfs_buffer_leaf(path->nodes[0]);
- slot = path->slots[0];
- if (slot >= btrfs_header_nritems(&l->header)) {
- ret = btrfs_next_leaf(root, path);
- if (ret == 0)
- continue;
- if (ret < 0)
- goto error;
- if (!start_found) {
- ins->objectid = search_start;
- ins->offset = (u64)-1;
- start_found = 1;
- goto check_pending;
- }
- ins->objectid = last_block > search_start ?
- last_block : search_start;
- ins->offset = (u64)-1;
- goto check_pending;
- }
- btrfs_disk_key_to_cpu(&key, &l->items[slot].key);
- if (key.objectid >= search_start) {
- if (start_found) {
- if (last_block < search_start)
- last_block = search_start;
- hole_size = key.objectid - last_block;
- if (hole_size > total_needed) {
- ins->objectid = last_block;
- ins->offset = hole_size;
- goto check_pending;
- }
- }
- }
- start_found = 1;
- last_block = key.objectid + key.offset;
- path->slots[0]++;
- }
- // FIXME -ENOSPC
- check_pending:
- /* we have to make sure we didn't find an extent that has already
- * been allocated by the map tree or the original allocation
- */
- btrfs_release_path(root, path);
- BUG_ON(ins->objectid < search_start);
- for (test_block = ins->objectid;
- test_block < ins->objectid + total_needed; test_block++) {
- if (test_radix_bit(&root->fs_info->pinned_radix,
- test_block)) {
- search_start = test_block + 1;
- goto check_failed;
- }
- }
- BUG_ON(root->fs_info->current_insert.offset);
- root->fs_info->current_insert.offset = total_needed - num_blocks;
- root->fs_info->current_insert.objectid = ins->objectid + num_blocks;
- root->fs_info->current_insert.flags = 0;
- root->fs_info->last_insert.objectid = ins->objectid;
- ins->offset = num_blocks;
- btrfs_free_path(path);
- return 0;
- error:
- btrfs_release_path(root, path);
- btrfs_free_path(path);
- return ret;
- }
- /*
- * finds a free extent and does all the dirty work required for allocation
- * returns the key for the extent through ins, and a tree buffer for
- * the first block of the extent through buf.
- *
- * returns 0 if everything worked, non-zero otherwise.
- */
- int btrfs_alloc_extent(struct btrfs_trans_handle *trans, struct btrfs_root
- *root, u64 num_blocks, u64 search_start, u64
- search_end, u64 owner, struct btrfs_key *ins)
- {
- int ret;
- int pending_ret;
- u64 super_blocks_used;
- struct btrfs_fs_info *info = root->fs_info;
- struct btrfs_root *extent_root = info->extent_root;
- struct btrfs_extent_item extent_item;
- btrfs_set_extent_refs(&extent_item, 1);
- btrfs_set_extent_owner(&extent_item, owner);
- if (root == extent_root) {
- BUG_ON(extent_root->fs_info->current_insert.offset == 0);
- BUG_ON(num_blocks != 1);
- BUG_ON(extent_root->fs_info->current_insert.flags ==
- extent_root->fs_info->current_insert.offset);
- ins->offset = 1;
- ins->objectid = extent_root->fs_info->current_insert.objectid +
- extent_root->fs_info->current_insert.flags++;
- return 0;
- }
- ret = find_free_extent(trans, root, num_blocks, search_start,
- search_end, ins);
- if (ret)
- return ret;
- super_blocks_used = btrfs_super_blocks_used(info->disk_super);
- btrfs_set_super_blocks_used(info->disk_super, super_blocks_used +
- num_blocks);
- ret = btrfs_insert_item(trans, extent_root, ins, &extent_item,
- sizeof(extent_item));
- finish_current_insert(trans, extent_root);
- pending_ret = del_pending_extents(trans, extent_root);
- if (ret)
- return ret;
- if (pending_ret)
- return pending_ret;
- return 0;
- }
- /*
- * helper function to allocate a block for a given tree
- * returns the tree buffer or NULL.
- */
- struct buffer_head *btrfs_alloc_free_block(struct btrfs_trans_handle *trans,
- struct btrfs_root *root)
- {
- struct btrfs_key ins;
- int ret;
- struct buffer_head *buf;
- ret = btrfs_alloc_extent(trans, root, 1, 0, (unsigned long)-1,
- btrfs_header_parentid(btrfs_buffer_header(root->node)), &ins);
- if (ret) {
- BUG();
- return NULL;
- }
- buf = btrfs_find_create_tree_block(root, ins.objectid);
- set_buffer_uptodate(buf);
- return buf;
- }
- static int drop_leaf_ref(struct btrfs_trans_handle *trans,
- struct btrfs_root *root, struct buffer_head *cur)
- {
- struct btrfs_disk_key *key;
- struct btrfs_leaf *leaf;
- struct btrfs_file_extent_item *fi;
- int i;
- int nritems;
- int ret;
- BUG_ON(!btrfs_is_leaf(btrfs_buffer_node(cur)));
- leaf = btrfs_buffer_leaf(cur);
- nritems = btrfs_header_nritems(&leaf->header);
- for (i = 0; i < nritems; i++) {
- key = &leaf->items[i].key;
- if (btrfs_disk_key_type(key) != BTRFS_EXTENT_DATA_KEY)
- continue;
- fi = btrfs_item_ptr(leaf, i, struct btrfs_file_extent_item);
- /*
- * FIXME make sure to insert a trans record that
- * repeats the snapshot del on crash
- */
- ret = btrfs_free_extent(trans, root,
- btrfs_file_extent_disk_blocknr(fi),
- btrfs_file_extent_disk_num_blocks(fi),
- 0);
- BUG_ON(ret);
- }
- return 0;
- }
- /*
- * helper function for drop_snapshot, this walks down the tree dropping ref
- * counts as it goes.
- */
- static int walk_down_tree(struct btrfs_trans_handle *trans, struct btrfs_root
- *root, struct btrfs_path *path, int *level)
- {
- struct buffer_head *next;
- struct buffer_head *cur;
- u64 blocknr;
- int ret;
- u32 refs;
- WARN_ON(*level < 0);
- WARN_ON(*level >= BTRFS_MAX_LEVEL);
- ret = lookup_block_ref(trans, root, path->nodes[*level]->b_blocknr,
- 1, &refs);
- BUG_ON(ret);
- if (refs > 1)
- goto out;
- /*
- * walk down to the last node level and free all the leaves
- */
- while(*level >= 0) {
- WARN_ON(*level < 0);
- WARN_ON(*level >= BTRFS_MAX_LEVEL);
- cur = path->nodes[*level];
- if (btrfs_header_level(btrfs_buffer_header(cur)) != *level)
- WARN_ON(1);
- if (path->slots[*level] >=
- btrfs_header_nritems(btrfs_buffer_header(cur)))
- break;
- if (*level == 0) {
- ret = drop_leaf_ref(trans, root, cur);
- BUG_ON(ret);
- break;
- }
- blocknr = btrfs_node_blockptr(btrfs_buffer_node(cur),
- path->slots[*level]);
- ret = lookup_block_ref(trans, root, blocknr, 1, &refs);
- BUG_ON(ret);
- if (refs != 1) {
- path->slots[*level]++;
- ret = btrfs_free_extent(trans, root, blocknr, 1, 1);
- BUG_ON(ret);
- continue;
- }
- next = read_tree_block(root, blocknr);
- WARN_ON(*level <= 0);
- if (path->nodes[*level-1])
- btrfs_block_release(root, path->nodes[*level-1]);
- path->nodes[*level-1] = next;
- *level = btrfs_header_level(btrfs_buffer_header(next));
- path->slots[*level] = 0;
- }
- out:
- WARN_ON(*level < 0);
- WARN_ON(*level >= BTRFS_MAX_LEVEL);
- ret = btrfs_free_extent(trans, root,
- path->nodes[*level]->b_blocknr, 1, 1);
- btrfs_block_release(root, path->nodes[*level]);
- path->nodes[*level] = NULL;
- *level += 1;
- BUG_ON(ret);
- return 0;
- }
- /*
- * helper for dropping snapshots. This walks back up the tree in the path
- * to find the first node higher up where we haven't yet gone through
- * all the slots
- */
- static int walk_up_tree(struct btrfs_trans_handle *trans, struct btrfs_root
- *root, struct btrfs_path *path, int *level)
- {
- int i;
- int slot;
- int ret;
- for(i = *level; i < BTRFS_MAX_LEVEL - 1 && path->nodes[i]; i++) {
- slot = path->slots[i];
- if (slot < btrfs_header_nritems(
- btrfs_buffer_header(path->nodes[i])) - 1) {
- path->slots[i]++;
- *level = i;
- return 0;
- } else {
- ret = btrfs_free_extent(trans, root,
- path->nodes[*level]->b_blocknr,
- 1, 1);
- BUG_ON(ret);
- btrfs_block_release(root, path->nodes[*level]);
- path->nodes[*level] = NULL;
- *level = i + 1;
- }
- }
- return 1;
- }
- /*
- * drop the reference count on the tree rooted at 'snap'. This traverses
- * the tree freeing any blocks that have a ref count of zero after being
- * decremented.
- */
- int btrfs_drop_snapshot(struct btrfs_trans_handle *trans, struct btrfs_root
- *root, struct buffer_head *snap)
- {
- int ret = 0;
- int wret;
- int level;
- struct btrfs_path *path;
- int i;
- int orig_level;
- path = btrfs_alloc_path();
- BUG_ON(!path);
- btrfs_init_path(path);
- level = btrfs_header_level(btrfs_buffer_header(snap));
- orig_level = level;
- path->nodes[level] = snap;
- path->slots[level] = 0;
- while(1) {
- wret = walk_down_tree(trans, root, path, &level);
- if (wret > 0)
- break;
- if (wret < 0)
- ret = wret;
- wret = walk_up_tree(trans, root, path, &level);
- if (wret > 0)
- break;
- if (wret < 0)
- ret = wret;
- }
- for (i = 0; i <= orig_level; i++) {
- if (path->nodes[i]) {
- btrfs_block_release(root, path->nodes[i]);
- }
- }
- btrfs_free_path(path);
- return ret;
- }
|