/* extent-tree.c */
  1. #include <linux/module.h>
  2. #include "ctree.h"
  3. #include "disk-io.h"
  4. #include "print-tree.h"
  5. #include "transaction.h"
  6. static int find_free_extent(struct btrfs_trans_handle *trans, struct btrfs_root
  7. *orig_root, u64 num_blocks, u64 search_start, u64
  8. search_end, struct btrfs_key *ins);
  9. static int finish_current_insert(struct btrfs_trans_handle *trans, struct
  10. btrfs_root *extent_root);
  11. static int del_pending_extents(struct btrfs_trans_handle *trans, struct
  12. btrfs_root *extent_root);
  13. static int inc_block_ref(struct btrfs_trans_handle *trans, struct btrfs_root
  14. *root, u64 blocknr)
  15. {
  16. struct btrfs_path path;
  17. int ret;
  18. struct btrfs_key key;
  19. struct btrfs_leaf *l;
  20. struct btrfs_extent_item *item;
  21. struct btrfs_key ins;
  22. u32 refs;
  23. find_free_extent(trans, root->fs_info->extent_root, 0, 0, (u64)-1,
  24. &ins);
  25. btrfs_init_path(&path);
  26. key.objectid = blocknr;
  27. key.flags = 0;
  28. btrfs_set_key_type(&key, BTRFS_EXTENT_ITEM_KEY);
  29. key.offset = 1;
  30. ret = btrfs_search_slot(trans, root->fs_info->extent_root, &key, &path,
  31. 0, 1);
  32. if (ret != 0)
  33. BUG();
  34. BUG_ON(ret != 0);
  35. l = btrfs_buffer_leaf(path.nodes[0]);
  36. item = btrfs_item_ptr(l, path.slots[0], struct btrfs_extent_item);
  37. refs = btrfs_extent_refs(item);
  38. btrfs_set_extent_refs(item, refs + 1);
  39. mark_buffer_dirty(path.nodes[0]);
  40. btrfs_release_path(root->fs_info->extent_root, &path);
  41. finish_current_insert(trans, root->fs_info->extent_root);
  42. del_pending_extents(trans, root->fs_info->extent_root);
  43. return 0;
  44. }
  45. static int lookup_block_ref(struct btrfs_trans_handle *trans, struct btrfs_root
  46. *root, u64 blocknr, u32 *refs)
  47. {
  48. struct btrfs_path path;
  49. int ret;
  50. struct btrfs_key key;
  51. struct btrfs_leaf *l;
  52. struct btrfs_extent_item *item;
  53. btrfs_init_path(&path);
  54. key.objectid = blocknr;
  55. key.offset = 1;
  56. key.flags = 0;
  57. btrfs_set_key_type(&key, BTRFS_EXTENT_ITEM_KEY);
  58. ret = btrfs_search_slot(trans, root->fs_info->extent_root, &key, &path,
  59. 0, 0);
  60. if (ret != 0)
  61. BUG();
  62. l = btrfs_buffer_leaf(path.nodes[0]);
  63. item = btrfs_item_ptr(l, path.slots[0], struct btrfs_extent_item);
  64. *refs = btrfs_extent_refs(item);
  65. btrfs_release_path(root->fs_info->extent_root, &path);
  66. return 0;
  67. }
  68. int btrfs_inc_ref(struct btrfs_trans_handle *trans, struct btrfs_root *root,
  69. struct buffer_head *buf)
  70. {
  71. u64 blocknr;
  72. struct btrfs_node *buf_node;
  73. int i;
  74. if (!root->ref_cows)
  75. return 0;
  76. buf_node = btrfs_buffer_node(buf);
  77. if (btrfs_is_leaf(buf_node))
  78. return 0;
  79. for (i = 0; i < btrfs_header_nritems(&buf_node->header); i++) {
  80. blocknr = btrfs_node_blockptr(buf_node, i);
  81. inc_block_ref(trans, root, blocknr);
  82. }
  83. return 0;
  84. }
  85. int btrfs_finish_extent_commit(struct btrfs_trans_handle *trans, struct
  86. btrfs_root *root)
  87. {
  88. unsigned long gang[8];
  89. u64 first = 0;
  90. int ret;
  91. int i;
  92. struct radix_tree_root *pinned_radix = &root->fs_info->pinned_radix;
  93. while(1) {
  94. ret = find_first_radix_bit(pinned_radix, gang,
  95. ARRAY_SIZE(gang));
  96. if (!ret)
  97. break;
  98. if (!first)
  99. first = gang[0];
  100. for (i = 0; i < ret; i++) {
  101. clear_radix_bit(pinned_radix, gang[i]);
  102. }
  103. }
  104. if (root->fs_info->last_insert.objectid > first)
  105. root->fs_info->last_insert.objectid = first;
  106. root->fs_info->last_insert.offset = 0;
  107. return 0;
  108. }
  109. static int finish_current_insert(struct btrfs_trans_handle *trans, struct
  110. btrfs_root *extent_root)
  111. {
  112. struct btrfs_key ins;
  113. struct btrfs_extent_item extent_item;
  114. int i;
  115. int ret;
  116. u64 super_blocks_used;
  117. struct btrfs_fs_info *info = extent_root->fs_info;
  118. btrfs_set_extent_refs(&extent_item, 1);
  119. btrfs_set_extent_owner(&extent_item,
  120. btrfs_header_parentid(btrfs_buffer_header(extent_root->node)));
  121. ins.offset = 1;
  122. ins.flags = 0;
  123. btrfs_set_key_type(&ins, BTRFS_EXTENT_ITEM_KEY);
  124. for (i = 0; i < extent_root->fs_info->current_insert.flags; i++) {
  125. ins.objectid = extent_root->fs_info->current_insert.objectid +
  126. i;
  127. super_blocks_used = btrfs_super_blocks_used(info->disk_super);
  128. btrfs_set_super_blocks_used(info->disk_super,
  129. super_blocks_used + 1);
  130. ret = btrfs_insert_item(trans, extent_root, &ins, &extent_item,
  131. sizeof(extent_item));
  132. BUG_ON(ret);
  133. }
  134. extent_root->fs_info->current_insert.offset = 0;
  135. return 0;
  136. }
  137. static int pin_down_block(struct btrfs_root *root, u64 blocknr, int pending)
  138. {
  139. int err;
  140. struct btrfs_header *header;
  141. struct buffer_head *bh;
  142. bh = sb_find_get_block(root->fs_info->sb, blocknr);
  143. if (bh) {
  144. header = btrfs_buffer_header(bh);
  145. if (btrfs_header_generation(header) ==
  146. root->fs_info->running_transaction->transid) {
  147. brelse(bh);
  148. return 0;
  149. }
  150. brelse(bh);
  151. }
  152. if (pending)
  153. err = set_radix_bit(&root->fs_info->pending_del_radix, blocknr);
  154. else
  155. err = set_radix_bit(&root->fs_info->pinned_radix, blocknr);
  156. BUG_ON(err);
  157. return 0;
  158. }
  159. /*
  160. * remove an extent from the root, returns 0 on success
  161. */
  162. static int __free_extent(struct btrfs_trans_handle *trans, struct btrfs_root
  163. *root, u64 blocknr, u64 num_blocks, int pin)
  164. {
  165. struct btrfs_path path;
  166. struct btrfs_key key;
  167. struct btrfs_fs_info *info = root->fs_info;
  168. struct btrfs_root *extent_root = info->extent_root;
  169. int ret;
  170. struct btrfs_extent_item *ei;
  171. struct btrfs_key ins;
  172. u32 refs;
  173. key.objectid = blocknr;
  174. key.flags = 0;
  175. btrfs_set_key_type(&key, BTRFS_EXTENT_ITEM_KEY);
  176. key.offset = num_blocks;
  177. find_free_extent(trans, root, 0, 0, (u64)-1, &ins);
  178. btrfs_init_path(&path);
  179. ret = btrfs_search_slot(trans, extent_root, &key, &path, -1, 1);
  180. if (ret) {
  181. printk("failed to find %Lu\n", key.objectid);
  182. btrfs_print_tree(extent_root, extent_root->node);
  183. printk("failed to find %Lu\n", key.objectid);
  184. BUG();
  185. }
  186. ei = btrfs_item_ptr(btrfs_buffer_leaf(path.nodes[0]), path.slots[0],
  187. struct btrfs_extent_item);
  188. BUG_ON(ei->refs == 0);
  189. refs = btrfs_extent_refs(ei) - 1;
  190. btrfs_set_extent_refs(ei, refs);
  191. if (refs == 0) {
  192. u64 super_blocks_used;
  193. if (pin) {
  194. ret = pin_down_block(root, blocknr, 0);
  195. BUG_ON(ret);
  196. }
  197. super_blocks_used = btrfs_super_blocks_used(info->disk_super);
  198. btrfs_set_super_blocks_used(info->disk_super,
  199. super_blocks_used - num_blocks);
  200. ret = btrfs_del_item(trans, extent_root, &path);
  201. if (extent_root->fs_info->last_insert.objectid > blocknr)
  202. extent_root->fs_info->last_insert.objectid = blocknr;
  203. if (ret)
  204. BUG();
  205. }
  206. mark_buffer_dirty(path.nodes[0]);
  207. btrfs_release_path(extent_root, &path);
  208. finish_current_insert(trans, extent_root);
  209. return ret;
  210. }
  211. /*
  212. * find all the blocks marked as pending in the radix tree and remove
  213. * them from the extent map
  214. */
  215. static int del_pending_extents(struct btrfs_trans_handle *trans, struct
  216. btrfs_root *extent_root)
  217. {
  218. int ret;
  219. int wret;
  220. int err = 0;
  221. unsigned long gang[4];
  222. int i;
  223. struct radix_tree_root *pending_radix;
  224. struct radix_tree_root *pinned_radix;
  225. pending_radix = &extent_root->fs_info->pending_del_radix;
  226. pinned_radix = &extent_root->fs_info->pinned_radix;
  227. while(1) {
  228. ret = find_first_radix_bit(pending_radix, gang,
  229. ARRAY_SIZE(gang));
  230. if (!ret)
  231. break;
  232. for (i = 0; i < ret; i++) {
  233. wret = set_radix_bit(pinned_radix, gang[i]);
  234. BUG_ON(wret);
  235. wret = clear_radix_bit(pending_radix, gang[i]);
  236. BUG_ON(wret);
  237. wret = __free_extent(trans, extent_root,
  238. gang[i], 1, 0);
  239. if (wret)
  240. err = wret;
  241. }
  242. }
  243. return err;
  244. }
  245. /*
  246. * remove an extent from the root, returns 0 on success
  247. */
  248. int btrfs_free_extent(struct btrfs_trans_handle *trans, struct btrfs_root
  249. *root, u64 blocknr, u64 num_blocks, int pin)
  250. {
  251. struct btrfs_root *extent_root = root->fs_info->extent_root;
  252. struct buffer_head *t;
  253. int pending_ret;
  254. int ret;
  255. if (root == extent_root) {
  256. t = find_tree_block(root, blocknr);
  257. pin_down_block(root, blocknr, 1);
  258. return 0;
  259. }
  260. ret = __free_extent(trans, root, blocknr, num_blocks, pin);
  261. pending_ret = del_pending_extents(trans, root->fs_info->extent_root);
  262. return ret ? ret : pending_ret;
  263. }
  264. /*
  265. * walks the btree of allocated extents and find a hole of a given size.
  266. * The key ins is changed to record the hole:
  267. * ins->objectid == block start
  268. * ins->flags = BTRFS_EXTENT_ITEM_KEY
  269. * ins->offset == number of blocks
  270. * Any available blocks before search_start are skipped.
  271. */
  272. static int find_free_extent(struct btrfs_trans_handle *trans, struct btrfs_root
  273. *orig_root, u64 num_blocks, u64 search_start, u64
  274. search_end, struct btrfs_key *ins)
  275. {
  276. struct btrfs_path path;
  277. struct btrfs_key key;
  278. int ret;
  279. u64 hole_size = 0;
  280. int slot = 0;
  281. u64 last_block = 0;
  282. u64 test_block;
  283. int start_found;
  284. struct btrfs_leaf *l;
  285. struct btrfs_root * root = orig_root->fs_info->extent_root;
  286. int total_needed = num_blocks;
  287. int level;
  288. level = btrfs_header_level(btrfs_buffer_header(root->node));
  289. total_needed += (level + 1) * 3;
  290. if (root->fs_info->last_insert.objectid > search_start)
  291. search_start = root->fs_info->last_insert.objectid;
  292. ins->flags = 0;
  293. btrfs_set_key_type(ins, BTRFS_EXTENT_ITEM_KEY);
  294. check_failed:
  295. btrfs_init_path(&path);
  296. ins->objectid = search_start;
  297. ins->offset = 0;
  298. start_found = 0;
  299. ret = btrfs_search_slot(trans, root, ins, &path, 0, 0);
  300. if (ret < 0)
  301. goto error;
  302. if (path.slots[0] > 0)
  303. path.slots[0]--;
  304. while (1) {
  305. l = btrfs_buffer_leaf(path.nodes[0]);
  306. slot = path.slots[0];
  307. if (slot >= btrfs_header_nritems(&l->header)) {
  308. ret = btrfs_next_leaf(root, &path);
  309. if (ret == 0)
  310. continue;
  311. if (ret < 0)
  312. goto error;
  313. if (!start_found) {
  314. ins->objectid = search_start;
  315. ins->offset = (u64)-1;
  316. start_found = 1;
  317. goto check_pending;
  318. }
  319. ins->objectid = last_block > search_start ?
  320. last_block : search_start;
  321. ins->offset = (u64)-1;
  322. goto check_pending;
  323. }
  324. btrfs_disk_key_to_cpu(&key, &l->items[slot].key);
  325. if (key.objectid >= search_start) {
  326. if (start_found) {
  327. if (last_block < search_start)
  328. last_block = search_start;
  329. hole_size = key.objectid - last_block;
  330. if (hole_size > total_needed) {
  331. ins->objectid = last_block;
  332. ins->offset = hole_size;
  333. goto check_pending;
  334. }
  335. }
  336. }
  337. start_found = 1;
  338. last_block = key.objectid + key.offset;
  339. path.slots[0]++;
  340. }
  341. // FIXME -ENOSPC
  342. check_pending:
  343. /* we have to make sure we didn't find an extent that has already
  344. * been allocated by the map tree or the original allocation
  345. */
  346. btrfs_release_path(root, &path);
  347. BUG_ON(ins->objectid < search_start);
  348. for (test_block = ins->objectid;
  349. test_block < ins->objectid + total_needed; test_block++) {
  350. if (test_radix_bit(&root->fs_info->pinned_radix,
  351. test_block)) {
  352. search_start = test_block + 1;
  353. goto check_failed;
  354. }
  355. }
  356. BUG_ON(root->fs_info->current_insert.offset);
  357. root->fs_info->current_insert.offset = total_needed - num_blocks;
  358. root->fs_info->current_insert.objectid = ins->objectid + num_blocks;
  359. root->fs_info->current_insert.flags = 0;
  360. root->fs_info->last_insert.objectid = ins->objectid;
  361. ins->offset = num_blocks;
  362. return 0;
  363. error:
  364. btrfs_release_path(root, &path);
  365. return ret;
  366. }
  367. /*
  368. * finds a free extent and does all the dirty work required for allocation
  369. * returns the key for the extent through ins, and a tree buffer for
  370. * the first block of the extent through buf.
  371. *
  372. * returns 0 if everything worked, non-zero otherwise.
  373. */
  374. static int alloc_extent(struct btrfs_trans_handle *trans, struct btrfs_root
  375. *root, u64 num_blocks, u64 search_start, u64
  376. search_end, u64 owner, struct btrfs_key *ins)
  377. {
  378. int ret;
  379. int pending_ret;
  380. u64 super_blocks_used;
  381. struct btrfs_fs_info *info = root->fs_info;
  382. struct btrfs_root *extent_root = info->extent_root;
  383. struct btrfs_extent_item extent_item;
  384. btrfs_set_extent_refs(&extent_item, 1);
  385. btrfs_set_extent_owner(&extent_item, owner);
  386. if (root == extent_root) {
  387. BUG_ON(extent_root->fs_info->current_insert.offset == 0);
  388. BUG_ON(num_blocks != 1);
  389. BUG_ON(extent_root->fs_info->current_insert.flags ==
  390. extent_root->fs_info->current_insert.offset);
  391. ins->offset = 1;
  392. ins->objectid = extent_root->fs_info->current_insert.objectid +
  393. extent_root->fs_info->current_insert.flags++;
  394. return 0;
  395. }
  396. ret = find_free_extent(trans, root, num_blocks, search_start,
  397. search_end, ins);
  398. if (ret)
  399. return ret;
  400. super_blocks_used = btrfs_super_blocks_used(info->disk_super);
  401. btrfs_set_super_blocks_used(info->disk_super, super_blocks_used +
  402. num_blocks);
  403. ret = btrfs_insert_item(trans, extent_root, ins, &extent_item,
  404. sizeof(extent_item));
  405. finish_current_insert(trans, extent_root);
  406. pending_ret = del_pending_extents(trans, extent_root);
  407. if (ret)
  408. return ret;
  409. if (pending_ret)
  410. return pending_ret;
  411. return 0;
  412. }
  413. /*
  414. * helper function to allocate a block for a given tree
  415. * returns the tree buffer or NULL.
  416. */
  417. struct buffer_head *btrfs_alloc_free_block(struct btrfs_trans_handle *trans,
  418. struct btrfs_root *root)
  419. {
  420. struct btrfs_key ins;
  421. int ret;
  422. struct buffer_head *buf;
  423. ret = alloc_extent(trans, root, 1, 0, (unsigned long)-1,
  424. btrfs_header_parentid(btrfs_buffer_header(root->node)), &ins);
  425. if (ret) {
  426. BUG();
  427. return NULL;
  428. }
  429. buf = find_tree_block(root, ins.objectid);
  430. set_buffer_uptodate(buf);
  431. return buf;
  432. }
  433. /*
  434. * helper function for drop_snapshot, this walks down the tree dropping ref
  435. * counts as it goes.
  436. */
  437. static int walk_down_tree(struct btrfs_trans_handle *trans, struct btrfs_root
  438. *root, struct btrfs_path *path, int *level)
  439. {
  440. struct buffer_head *next;
  441. struct buffer_head *cur;
  442. u64 blocknr;
  443. int ret;
  444. u32 refs;
  445. ret = lookup_block_ref(trans, root, path->nodes[*level]->b_blocknr,
  446. &refs);
  447. BUG_ON(ret);
  448. if (refs > 1)
  449. goto out;
  450. /*
  451. * walk down to the last node level and free all the leaves
  452. */
  453. while(*level > 0) {
  454. cur = path->nodes[*level];
  455. if (path->slots[*level] >=
  456. btrfs_header_nritems(btrfs_buffer_header(cur)))
  457. break;
  458. blocknr = btrfs_node_blockptr(btrfs_buffer_node(cur),
  459. path->slots[*level]);
  460. ret = lookup_block_ref(trans, root, blocknr, &refs);
  461. if (refs != 1 || *level == 1) {
  462. path->slots[*level]++;
  463. ret = btrfs_free_extent(trans, root, blocknr, 1, 1);
  464. BUG_ON(ret);
  465. continue;
  466. }
  467. BUG_ON(ret);
  468. next = read_tree_block(root, blocknr);
  469. if (path->nodes[*level-1])
  470. btrfs_block_release(root, path->nodes[*level-1]);
  471. path->nodes[*level-1] = next;
  472. *level = btrfs_header_level(btrfs_buffer_header(next));
  473. path->slots[*level] = 0;
  474. }
  475. out:
  476. ret = btrfs_free_extent(trans, root, path->nodes[*level]->b_blocknr,
  477. 1, 1);
  478. btrfs_block_release(root, path->nodes[*level]);
  479. path->nodes[*level] = NULL;
  480. *level += 1;
  481. BUG_ON(ret);
  482. return 0;
  483. }
  484. /*
  485. * helper for dropping snapshots. This walks back up the tree in the path
  486. * to find the first node higher up where we haven't yet gone through
  487. * all the slots
  488. */
  489. static int walk_up_tree(struct btrfs_trans_handle *trans, struct btrfs_root
  490. *root, struct btrfs_path *path, int *level)
  491. {
  492. int i;
  493. int slot;
  494. int ret;
  495. for(i = *level; i < BTRFS_MAX_LEVEL - 1 && path->nodes[i]; i++) {
  496. slot = path->slots[i];
  497. if (slot < btrfs_header_nritems(
  498. btrfs_buffer_header(path->nodes[i])) - 1) {
  499. path->slots[i]++;
  500. *level = i;
  501. return 0;
  502. } else {
  503. ret = btrfs_free_extent(trans, root,
  504. path->nodes[*level]->b_blocknr,
  505. 1, 1);
  506. btrfs_block_release(root, path->nodes[*level]);
  507. path->nodes[*level] = NULL;
  508. *level = i + 1;
  509. BUG_ON(ret);
  510. }
  511. }
  512. return 1;
  513. }
  514. /*
  515. * drop the reference count on the tree rooted at 'snap'. This traverses
  516. * the tree freeing any blocks that have a ref count of zero after being
  517. * decremented.
  518. */
  519. int btrfs_drop_snapshot(struct btrfs_trans_handle *trans, struct btrfs_root
  520. *root, struct buffer_head *snap)
  521. {
  522. int ret = 0;
  523. int wret;
  524. int level;
  525. struct btrfs_path path;
  526. int i;
  527. int orig_level;
  528. btrfs_init_path(&path);
  529. level = btrfs_header_level(btrfs_buffer_header(snap));
  530. orig_level = level;
  531. path.nodes[level] = snap;
  532. path.slots[level] = 0;
  533. while(1) {
  534. wret = walk_down_tree(trans, root, &path, &level);
  535. if (wret > 0)
  536. break;
  537. if (wret < 0)
  538. ret = wret;
  539. wret = walk_up_tree(trans, root, &path, &level);
  540. if (wret > 0)
  541. break;
  542. if (wret < 0)
  543. ret = wret;
  544. }
  545. for (i = 0; i <= orig_level; i++) {
  546. if (path.nodes[i]) {
  547. btrfs_block_release(root, path.nodes[i]);
  548. }
  549. }
  550. return ret;
  551. }