extent-tree.c 11 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441
  1. #include <stdio.h>
  2. #include <stdlib.h>
  3. #include "kerncompat.h"
  4. #include "radix-tree.h"
  5. #include "ctree.h"
  6. #include "disk-io.h"
  7. #include "print-tree.h"
  8. static int find_free_extent(struct ctree_root *orig_root, u64 num_blocks,
  9. u64 search_start, u64 search_end, struct key *ins);
  10. static int finish_current_insert(struct ctree_root *extent_root);
  11. static int run_pending(struct ctree_root *extent_root);
  12. /*
  13. * pending extents are blocks that we're trying to allocate in the extent
  14. * map while trying to grow the map because of other allocations. To avoid
  15. * recursing, they are tagged in the radix tree and cleaned up after
  16. * other allocations are done. The pending tag is also used in the same
  17. * manner for deletes.
  18. */
  19. #define CTREE_EXTENT_PENDING_DEL 0
  20. static int inc_block_ref(struct ctree_root *root, u64 blocknr)
  21. {
  22. struct ctree_path path;
  23. int ret;
  24. struct key key;
  25. struct leaf *l;
  26. struct extent_item *item;
  27. struct key ins;
  28. find_free_extent(root->extent_root, 0, 0, (u64)-1, &ins);
  29. init_path(&path);
  30. key.objectid = blocknr;
  31. key.flags = 0;
  32. key.offset = 1;
  33. ret = search_slot(root->extent_root, &key, &path, 0, 1);
  34. if (ret != 0)
  35. BUG();
  36. BUG_ON(ret != 0);
  37. l = &path.nodes[0]->leaf;
  38. item = (struct extent_item *)(l->data +
  39. l->items[path.slots[0]].offset);
  40. item->refs++;
  41. BUG_ON(list_empty(&path.nodes[0]->dirty));
  42. release_path(root->extent_root, &path);
  43. finish_current_insert(root->extent_root);
  44. run_pending(root->extent_root);
  45. return 0;
  46. }
  47. static int lookup_block_ref(struct ctree_root *root, u64 blocknr, int *refs)
  48. {
  49. struct ctree_path path;
  50. int ret;
  51. struct key key;
  52. struct leaf *l;
  53. struct extent_item *item;
  54. init_path(&path);
  55. key.objectid = blocknr;
  56. key.flags = 0;
  57. key.offset = 1;
  58. ret = search_slot(root->extent_root, &key, &path, 0, 0);
  59. if (ret != 0)
  60. BUG();
  61. l = &path.nodes[0]->leaf;
  62. item = (struct extent_item *)(l->data +
  63. l->items[path.slots[0]].offset);
  64. *refs = item->refs;
  65. release_path(root->extent_root, &path);
  66. return 0;
  67. }
  68. int btrfs_inc_ref(struct ctree_root *root, struct tree_buffer *buf)
  69. {
  70. u64 blocknr;
  71. int i;
  72. if (root == root->extent_root)
  73. return 0;
  74. if (is_leaf(buf->node.header.flags))
  75. return 0;
  76. for (i = 0; i < buf->node.header.nritems; i++) {
  77. blocknr = buf->node.blockptrs[i];
  78. inc_block_ref(root, blocknr);
  79. }
  80. return 0;
  81. }
  82. int btrfs_finish_extent_commit(struct ctree_root *root)
  83. {
  84. struct ctree_root *extent_root = root->extent_root;
  85. unsigned long gang[8];
  86. int ret;
  87. int i;
  88. while(1) {
  89. ret = radix_tree_gang_lookup(&extent_root->pinned_radix,
  90. (void **)gang, 0,
  91. ARRAY_SIZE(gang));
  92. if (!ret)
  93. break;
  94. for (i = 0; i < ret; i++)
  95. radix_tree_delete(&extent_root->pinned_radix, gang[i]);
  96. }
  97. return 0;
  98. }
  99. static int finish_current_insert(struct ctree_root *extent_root)
  100. {
  101. struct key ins;
  102. struct extent_item extent_item;
  103. int i;
  104. int ret;
  105. extent_item.refs = 1;
  106. extent_item.owner = extent_root->node->node.header.parentid;
  107. ins.offset = 1;
  108. ins.flags = 0;
  109. for (i = 0; i < extent_root->current_insert.flags; i++) {
  110. ins.objectid = extent_root->current_insert.objectid + i;
  111. ret = insert_item(extent_root, &ins, &extent_item,
  112. sizeof(extent_item));
  113. BUG_ON(ret);
  114. }
  115. extent_root->current_insert.offset = 0;
  116. return 0;
  117. }
  118. /*
  119. * remove an extent from the root, returns 0 on success
  120. */
  121. int __free_extent(struct ctree_root *root, u64 blocknr, u64 num_blocks)
  122. {
  123. struct ctree_path path;
  124. struct key key;
  125. struct ctree_root *extent_root = root->extent_root;
  126. int ret;
  127. struct item *item;
  128. struct extent_item *ei;
  129. struct key ins;
  130. key.objectid = blocknr;
  131. key.flags = 0;
  132. key.offset = num_blocks;
  133. find_free_extent(root, 0, 0, (u64)-1, &ins);
  134. init_path(&path);
  135. ret = search_slot(extent_root, &key, &path, -1, 1);
  136. if (ret) {
  137. printf("failed to find %Lu\n", key.objectid);
  138. print_tree(extent_root, extent_root->node);
  139. printf("failed to find %Lu\n", key.objectid);
  140. BUG();
  141. }
  142. item = path.nodes[0]->leaf.items + path.slots[0];
  143. ei = (struct extent_item *)(path.nodes[0]->leaf.data + item->offset);
  144. BUG_ON(ei->refs == 0);
  145. ei->refs--;
  146. if (ei->refs == 0) {
  147. if (root == extent_root) {
  148. int err;
  149. radix_tree_preload(GFP_KERNEL);
  150. err = radix_tree_insert(&extent_root->pinned_radix,
  151. blocknr, (void *)blocknr);
  152. BUG_ON(err);
  153. radix_tree_preload_end();
  154. }
  155. ret = del_item(extent_root, &path);
  156. if (ret)
  157. BUG();
  158. }
  159. release_path(extent_root, &path);
  160. finish_current_insert(extent_root);
  161. return ret;
  162. }
  163. /*
  164. * find all the blocks marked as pending in the radix tree and remove
  165. * them from the extent map
  166. */
  167. static int del_pending_extents(struct ctree_root *extent_root)
  168. {
  169. int ret;
  170. struct tree_buffer *gang[4];
  171. int i;
  172. while(1) {
  173. ret = radix_tree_gang_lookup_tag(&extent_root->cache_radix,
  174. (void **)gang, 0,
  175. ARRAY_SIZE(gang),
  176. CTREE_EXTENT_PENDING_DEL);
  177. if (!ret)
  178. break;
  179. for (i = 0; i < ret; i++) {
  180. ret = __free_extent(extent_root, gang[i]->blocknr, 1);
  181. radix_tree_tag_clear(&extent_root->cache_radix,
  182. gang[i]->blocknr,
  183. CTREE_EXTENT_PENDING_DEL);
  184. tree_block_release(extent_root, gang[i]);
  185. }
  186. }
  187. return 0;
  188. }
  189. static int run_pending(struct ctree_root *extent_root)
  190. {
  191. while(radix_tree_tagged(&extent_root->cache_radix,
  192. CTREE_EXTENT_PENDING_DEL))
  193. del_pending_extents(extent_root);
  194. return 0;
  195. }
  196. /*
  197. * remove an extent from the root, returns 0 on success
  198. */
  199. int free_extent(struct ctree_root *root, u64 blocknr, u64 num_blocks)
  200. {
  201. struct key key;
  202. struct ctree_root *extent_root = root->extent_root;
  203. struct tree_buffer *t;
  204. int pending_ret;
  205. int ret;
  206. if (root == extent_root) {
  207. t = find_tree_block(root, blocknr);
  208. radix_tree_tag_set(&root->cache_radix, blocknr,
  209. CTREE_EXTENT_PENDING_DEL);
  210. return 0;
  211. }
  212. key.objectid = blocknr;
  213. key.flags = 0;
  214. key.offset = num_blocks;
  215. ret = __free_extent(root, blocknr, num_blocks);
  216. pending_ret = run_pending(root->extent_root);
  217. return ret ? ret : pending_ret;
  218. }
  219. /*
  220. * walks the btree of allocated extents and find a hole of a given size.
  221. * The key ins is changed to record the hole:
  222. * ins->objectid == block start
  223. * ins->flags = 0
  224. * ins->offset == number of blocks
  225. * Any available blocks before search_start are skipped.
  226. */
  227. static int find_free_extent(struct ctree_root *orig_root, u64 num_blocks,
  228. u64 search_start, u64 search_end, struct key *ins)
  229. {
  230. struct ctree_path path;
  231. struct key *key;
  232. int ret;
  233. u64 hole_size = 0;
  234. int slot = 0;
  235. u64 last_block;
  236. u64 test_block;
  237. int start_found;
  238. struct leaf *l;
  239. struct ctree_root * root = orig_root->extent_root;
  240. int total_needed = num_blocks + MAX_LEVEL * 3;
  241. check_failed:
  242. init_path(&path);
  243. ins->objectid = search_start;
  244. ins->offset = 0;
  245. ins->flags = 0;
  246. start_found = 0;
  247. ret = search_slot(root, ins, &path, 0, 0);
  248. if (ret < 0)
  249. goto error;
  250. while (1) {
  251. l = &path.nodes[0]->leaf;
  252. slot = path.slots[0];
  253. if (slot >= l->header.nritems) {
  254. ret = next_leaf(root, &path);
  255. if (ret == 0)
  256. continue;
  257. if (ret < 0)
  258. goto error;
  259. if (!start_found) {
  260. ins->objectid = search_start;
  261. ins->offset = (u64)-1;
  262. start_found = 1;
  263. goto check_pending;
  264. }
  265. ins->objectid = last_block > search_start ?
  266. last_block : search_start;
  267. ins->offset = (u64)-1;
  268. goto check_pending;
  269. }
  270. if (slot == 0) {
  271. int last_slot = l->header.nritems - 1;
  272. u64 span = l->items[last_slot].key.objectid;
  273. span -= l->items[slot].key.objectid;
  274. if (span + total_needed > last_slot - slot) {
  275. path.slots[0] = last_slot + 1;
  276. key = &l->items[last_slot].key;
  277. last_block = key->objectid + key->offset;
  278. start_found = 1;
  279. continue;
  280. }
  281. }
  282. key = &l->items[slot].key;
  283. if (key->objectid >= search_start) {
  284. if (start_found) {
  285. hole_size = key->objectid - last_block;
  286. if (hole_size > total_needed) {
  287. ins->objectid = last_block;
  288. ins->offset = hole_size;
  289. goto check_pending;
  290. }
  291. } else
  292. start_found = 1;
  293. last_block = key->objectid + key->offset;
  294. }
  295. path.slots[0]++;
  296. }
  297. // FIXME -ENOSPC
  298. check_pending:
  299. /* we have to make sure we didn't find an extent that has already
  300. * been allocated by the map tree or the original allocation
  301. */
  302. release_path(root, &path);
  303. BUG_ON(ins->objectid < search_start);
  304. for (test_block = ins->objectid;
  305. test_block < ins->objectid + total_needed; test_block++) {
  306. if (radix_tree_lookup(&root->pinned_radix, test_block)) {
  307. search_start = test_block + 1;
  308. goto check_failed;
  309. }
  310. }
  311. BUG_ON(root->current_insert.offset);
  312. root->current_insert.offset = total_needed;
  313. root->current_insert.objectid = ins->objectid + num_blocks;
  314. root->current_insert.flags = 0;
  315. ins->offset = num_blocks;
  316. return 0;
  317. error:
  318. release_path(root, &path);
  319. return ret;
  320. }
  321. /*
  322. * finds a free extent and does all the dirty work required for allocation
  323. * returns the key for the extent through ins, and a tree buffer for
  324. * the first block of the extent through buf.
  325. *
  326. * returns 0 if everything worked, non-zero otherwise.
  327. */
  328. int alloc_extent(struct ctree_root *root, u64 num_blocks, u64 search_start,
  329. u64 search_end, u64 owner, struct key *ins)
  330. {
  331. int ret;
  332. int pending_ret;
  333. struct ctree_root *extent_root = root->extent_root;
  334. struct extent_item extent_item;
  335. extent_item.refs = 1;
  336. extent_item.owner = owner;
  337. if (root == extent_root) {
  338. BUG_ON(extent_root->current_insert.offset == 0);
  339. BUG_ON(num_blocks != 1);
  340. BUG_ON(extent_root->current_insert.flags ==
  341. extent_root->current_insert.offset);
  342. ins->offset = 1;
  343. ins->objectid = extent_root->current_insert.objectid +
  344. extent_root->current_insert.flags++;
  345. return 0;
  346. }
  347. ret = find_free_extent(root, num_blocks, search_start,
  348. search_end, ins);
  349. if (ret)
  350. return ret;
  351. ret = insert_item(extent_root, ins, &extent_item,
  352. sizeof(extent_item));
  353. finish_current_insert(extent_root);
  354. pending_ret = run_pending(extent_root);
  355. if (ret)
  356. return ret;
  357. if (pending_ret)
  358. return pending_ret;
  359. return 0;
  360. }
  361. /*
  362. * helper function to allocate a block for a given tree
  363. * returns the tree buffer or NULL.
  364. */
  365. struct tree_buffer *alloc_free_block(struct ctree_root *root)
  366. {
  367. struct key ins;
  368. int ret;
  369. struct tree_buffer *buf;
  370. ret = alloc_extent(root, 1, 0, (unsigned long)-1,
  371. root->node->node.header.parentid,
  372. &ins);
  373. if (ret) {
  374. BUG();
  375. return NULL;
  376. }
  377. buf = find_tree_block(root, ins.objectid);
  378. dirty_tree_block(root, buf);
  379. return buf;
  380. }
  381. int btrfs_drop_snapshot(struct ctree_root *root, struct tree_buffer *snap)
  382. {
  383. int ret;
  384. int level;
  385. int refs;
  386. u64 blocknr = snap->blocknr;
  387. level = node_level(snap->node.header.flags);
  388. ret = lookup_block_ref(root, snap->blocknr, &refs);
  389. BUG_ON(ret);
  390. if (refs == 1 && level != 0) {
  391. struct node *n = &snap->node;
  392. struct tree_buffer *b;
  393. int i;
  394. for (i = 0; i < n->header.nritems; i++) {
  395. b = read_tree_block(root, n->blockptrs[i]);
  396. /* FIXME, don't recurse here */
  397. ret = btrfs_drop_snapshot(root, b);
  398. BUG_ON(ret);
  399. tree_block_release(root, b);
  400. }
  401. }
  402. ret = free_extent(root, blocknr, 1);
  403. BUG_ON(ret);
  404. return 0;
  405. }