disk-io.c 27 KB

1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253545556575859606162636465666768697071727374757677787980818283848586878889909192939495969798991001011021031041051061071081091101111121131141151161171181191201211221231241251261271281291301311321331341351361371381391401411421431441451461471481491501511521531541551561571581591601611621631641651661671681691701711721731741751761771781791801811821831841851861871881891901911921931941951961971981992002012022032042052062072082092102112122132142152162172182192202212222232242252262272282292302312322332342352362372382392402412422432442452462472482492502512522532542552562572582592602612622632642652662672682692702712722732742752762772782792802812822832842852862872882892902912922932942952962972982993003013023033043053063073083093103113123133143153163173183193203213223233243253263273283293303313323333343353363373383393403413423433443453463473483493503513523533543553563573583593603613623633643653663673683693703713723733743753763773783793803813823833843853863873883893903913923933943953963973983994004014024034044054064074084094104114124134144154164174184194204214224234244254264274284294304314324334344354364374384394404414424434444454464474484494504514524534544554564574584594604614624634644654664674684694704714724734744754764774784794804814824834844854864874884894904914924934944954964974984995005015025035045055065075085095105115125135145155165175185195205215225235245255265275285295305315325335345355365375385395405415425435445455465475485495505515525535545555565575585595605615625635645655665675685695705715725735745755765775785795805815825835845855865875885895905915925935945955965975985996006016026036046056066076086096106116126136146156166176186196206216226236246256266276286296306316326336346356366376386396406416426436446456466476486496506516526536546556566576586596606616626636646656666676686696706716726736746756766776786796806816826836846856866876886896906916926936946956966976986997007017027037047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012
  1. /*
  2. * Copyright (C) 2007 Oracle. All rights reserved.
  3. *
  4. * This program is free software; you can redistribute it and/or
  5. * modify it under the terms of the GNU General Public
  6. * License v2 as published by the Free Software Foundation.
  7. *
  8. * This program is distributed in the hope that it will be useful,
  9. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  10. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  11. * General Public License for more details.
  12. *
  13. * You should have received a copy of the GNU General Public
  14. * License along with this program; if not, write to the
  15. * Free Software Foundation, Inc., 59 Temple Place - Suite 330,
  16. * Boston, MA 021110-1307, USA.
  17. */
  18. #include <linux/fs.h>
  19. #include <linux/blkdev.h>
  20. #include <linux/crc32c.h>
  21. #include <linux/scatterlist.h>
  22. #include <linux/swap.h>
  23. #include <linux/radix-tree.h>
  24. #include <linux/writeback.h>
  25. #include <linux/buffer_head.h> // for block_sync_page
  26. #include "ctree.h"
  27. #include "disk-io.h"
  28. #include "transaction.h"
  29. #include "btrfs_inode.h"
  30. #include "print-tree.h"
  31. #if 0
  32. static int check_tree_block(struct btrfs_root *root, struct extent_buffer *buf)
  33. {
  34. if (extent_buffer_blocknr(buf) != btrfs_header_blocknr(buf)) {
  35. printk(KERN_CRIT "buf blocknr(buf) is %llu, header is %llu\n",
  36. (unsigned long long)extent_buffer_blocknr(buf),
  37. (unsigned long long)btrfs_header_blocknr(buf));
  38. return 1;
  39. }
  40. return 0;
  41. }
  42. #endif
  43. static struct extent_io_ops btree_extent_io_ops;
  44. struct extent_buffer *btrfs_find_tree_block(struct btrfs_root *root,
  45. u64 bytenr, u32 blocksize)
  46. {
  47. struct inode *btree_inode = root->fs_info->btree_inode;
  48. struct extent_buffer *eb;
  49. eb = find_extent_buffer(&BTRFS_I(btree_inode)->io_tree,
  50. bytenr, blocksize, GFP_NOFS);
  51. return eb;
  52. }
  53. struct extent_buffer *btrfs_find_create_tree_block(struct btrfs_root *root,
  54. u64 bytenr, u32 blocksize)
  55. {
  56. struct inode *btree_inode = root->fs_info->btree_inode;
  57. struct extent_buffer *eb;
  58. eb = alloc_extent_buffer(&BTRFS_I(btree_inode)->io_tree,
  59. bytenr, blocksize, NULL, GFP_NOFS);
  60. return eb;
  61. }
  62. struct extent_map *btree_get_extent(struct inode *inode, struct page *page,
  63. size_t page_offset, u64 start, u64 len,
  64. int create)
  65. {
  66. struct extent_map_tree *em_tree = &BTRFS_I(inode)->extent_tree;
  67. struct extent_map *em;
  68. int ret;
  69. again:
  70. spin_lock(&em_tree->lock);
  71. em = lookup_extent_mapping(em_tree, start, len);
  72. spin_unlock(&em_tree->lock);
  73. if (em) {
  74. goto out;
  75. }
  76. em = alloc_extent_map(GFP_NOFS);
  77. if (!em) {
  78. em = ERR_PTR(-ENOMEM);
  79. goto out;
  80. }
  81. em->start = 0;
  82. em->len = i_size_read(inode);
  83. em->block_start = 0;
  84. em->bdev = inode->i_sb->s_bdev;
  85. spin_lock(&em_tree->lock);
  86. ret = add_extent_mapping(em_tree, em);
  87. spin_unlock(&em_tree->lock);
  88. if (ret == -EEXIST) {
  89. free_extent_map(em);
  90. em = NULL;
  91. goto again;
  92. } else if (ret) {
  93. em = ERR_PTR(ret);
  94. }
  95. out:
  96. return em;
  97. }
  98. u32 btrfs_csum_data(struct btrfs_root *root, char *data, u32 seed, size_t len)
  99. {
  100. return crc32c(seed, data, len);
  101. }
  102. void btrfs_csum_final(u32 crc, char *result)
  103. {
  104. *(__le32 *)result = ~cpu_to_le32(crc);
  105. }
  106. static int csum_tree_block(struct btrfs_root *root, struct extent_buffer *buf,
  107. int verify)
  108. {
  109. char result[BTRFS_CRC32_SIZE];
  110. unsigned long len;
  111. unsigned long cur_len;
  112. unsigned long offset = BTRFS_CSUM_SIZE;
  113. char *map_token = NULL;
  114. char *kaddr;
  115. unsigned long map_start;
  116. unsigned long map_len;
  117. int err;
  118. u32 crc = ~(u32)0;
  119. len = buf->len - offset;
  120. while(len > 0) {
  121. err = map_private_extent_buffer(buf, offset, 32,
  122. &map_token, &kaddr,
  123. &map_start, &map_len, KM_USER0);
  124. if (err) {
  125. printk("failed to map extent buffer! %lu\n",
  126. offset);
  127. return 1;
  128. }
  129. cur_len = min(len, map_len - (offset - map_start));
  130. crc = btrfs_csum_data(root, kaddr + offset - map_start,
  131. crc, cur_len);
  132. len -= cur_len;
  133. offset += cur_len;
  134. unmap_extent_buffer(buf, map_token, KM_USER0);
  135. }
  136. btrfs_csum_final(crc, result);
  137. if (verify) {
  138. int from_this_trans = 0;
  139. if (root->fs_info->running_transaction &&
  140. btrfs_header_generation(buf) ==
  141. root->fs_info->running_transaction->transid)
  142. from_this_trans = 1;
  143. /* FIXME, this is not good */
  144. if (from_this_trans == 0 &&
  145. memcmp_extent_buffer(buf, result, 0, BTRFS_CRC32_SIZE)) {
  146. u32 val;
  147. u32 found = 0;
  148. memcpy(&found, result, BTRFS_CRC32_SIZE);
  149. read_extent_buffer(buf, &val, 0, BTRFS_CRC32_SIZE);
  150. printk("btrfs: %s checksum verify failed on %llu "
  151. "wanted %X found %X from_this_trans %d\n",
  152. root->fs_info->sb->s_id,
  153. buf->start, val, found, from_this_trans);
  154. return 1;
  155. }
  156. } else {
  157. write_extent_buffer(buf, result, 0, BTRFS_CRC32_SIZE);
  158. }
  159. return 0;
  160. }
  161. int csum_dirty_buffer(struct btrfs_root *root, struct page *page)
  162. {
  163. struct extent_io_tree *tree;
  164. u64 start = (u64)page->index << PAGE_CACHE_SHIFT;
  165. u64 found_start;
  166. int found_level;
  167. unsigned long len;
  168. struct extent_buffer *eb;
  169. tree = &BTRFS_I(page->mapping->host)->io_tree;
  170. if (page->private == EXTENT_PAGE_PRIVATE)
  171. goto out;
  172. if (!page->private)
  173. goto out;
  174. len = page->private >> 2;
  175. if (len == 0) {
  176. WARN_ON(1);
  177. }
  178. eb = alloc_extent_buffer(tree, start, len, page, GFP_NOFS);
  179. read_extent_buffer_pages(tree, eb, start + PAGE_CACHE_SIZE, 1);
  180. btrfs_clear_buffer_defrag(eb);
  181. found_start = btrfs_header_bytenr(eb);
  182. if (found_start != start) {
  183. printk("warning: eb start incorrect %Lu buffer %Lu len %lu\n",
  184. start, found_start, len);
  185. WARN_ON(1);
  186. goto err;
  187. }
  188. if (eb->first_page != page) {
  189. printk("bad first page %lu %lu\n", eb->first_page->index,
  190. page->index);
  191. WARN_ON(1);
  192. goto err;
  193. }
  194. if (!PageUptodate(page)) {
  195. printk("csum not up to date page %lu\n", page->index);
  196. WARN_ON(1);
  197. goto err;
  198. }
  199. found_level = btrfs_header_level(eb);
  200. csum_tree_block(root, eb, 0);
  201. err:
  202. free_extent_buffer(eb);
  203. out:
  204. return 0;
  205. }
  206. static int btree_writepage_io_hook(struct page *page, u64 start, u64 end)
  207. {
  208. struct btrfs_root *root = BTRFS_I(page->mapping->host)->root;
  209. csum_dirty_buffer(root, page);
  210. return 0;
  211. }
  212. static int btree_writepage(struct page *page, struct writeback_control *wbc)
  213. {
  214. struct extent_io_tree *tree;
  215. tree = &BTRFS_I(page->mapping->host)->io_tree;
  216. return extent_write_full_page(tree, page, btree_get_extent, wbc);
  217. }
  218. static int btree_writepages(struct address_space *mapping,
  219. struct writeback_control *wbc)
  220. {
  221. struct extent_io_tree *tree;
  222. tree = &BTRFS_I(mapping->host)->io_tree;
  223. if (wbc->sync_mode == WB_SYNC_NONE) {
  224. u64 num_dirty;
  225. u64 start = 0;
  226. unsigned long thresh = 96 * 1024 * 1024;
  227. if (wbc->for_kupdate)
  228. return 0;
  229. if (current_is_pdflush()) {
  230. thresh = 96 * 1024 * 1024;
  231. } else {
  232. thresh = 8 * 1024 * 1024;
  233. }
  234. num_dirty = count_range_bits(tree, &start, (u64)-1,
  235. thresh, EXTENT_DIRTY);
  236. if (num_dirty < thresh) {
  237. return 0;
  238. }
  239. }
  240. return extent_writepages(tree, mapping, btree_get_extent, wbc);
  241. }
  242. int btree_readpage(struct file *file, struct page *page)
  243. {
  244. struct extent_io_tree *tree;
  245. tree = &BTRFS_I(page->mapping->host)->io_tree;
  246. return extent_read_full_page(tree, page, btree_get_extent);
  247. }
  248. static int btree_releasepage(struct page *page, gfp_t gfp_flags)
  249. {
  250. struct extent_io_tree *tree;
  251. struct extent_map_tree *map;
  252. int ret;
  253. tree = &BTRFS_I(page->mapping->host)->io_tree;
  254. map = &BTRFS_I(page->mapping->host)->extent_tree;
  255. ret = try_release_extent_mapping(map, tree, page, gfp_flags);
  256. if (ret == 1) {
  257. ClearPagePrivate(page);
  258. set_page_private(page, 0);
  259. page_cache_release(page);
  260. }
  261. return ret;
  262. }
  263. static void btree_invalidatepage(struct page *page, unsigned long offset)
  264. {
  265. struct extent_io_tree *tree;
  266. tree = &BTRFS_I(page->mapping->host)->io_tree;
  267. extent_invalidatepage(tree, page, offset);
  268. btree_releasepage(page, GFP_NOFS);
  269. }
  270. #if 0
  271. static int btree_writepage(struct page *page, struct writeback_control *wbc)
  272. {
  273. struct buffer_head *bh;
  274. struct btrfs_root *root = BTRFS_I(page->mapping->host)->root;
  275. struct buffer_head *head;
  276. if (!page_has_buffers(page)) {
  277. create_empty_buffers(page, root->fs_info->sb->s_blocksize,
  278. (1 << BH_Dirty)|(1 << BH_Uptodate));
  279. }
  280. head = page_buffers(page);
  281. bh = head;
  282. do {
  283. if (buffer_dirty(bh))
  284. csum_tree_block(root, bh, 0);
  285. bh = bh->b_this_page;
  286. } while (bh != head);
  287. return block_write_full_page(page, btree_get_block, wbc);
  288. }
  289. #endif
  290. static struct address_space_operations btree_aops = {
  291. .readpage = btree_readpage,
  292. .writepage = btree_writepage,
  293. .writepages = btree_writepages,
  294. .releasepage = btree_releasepage,
  295. .invalidatepage = btree_invalidatepage,
  296. .sync_page = block_sync_page,
  297. };
  298. int readahead_tree_block(struct btrfs_root *root, u64 bytenr, u32 blocksize)
  299. {
  300. struct extent_buffer *buf = NULL;
  301. struct inode *btree_inode = root->fs_info->btree_inode;
  302. int ret = 0;
  303. buf = btrfs_find_create_tree_block(root, bytenr, blocksize);
  304. if (!buf)
  305. return 0;
  306. read_extent_buffer_pages(&BTRFS_I(btree_inode)->io_tree,
  307. buf, 0, 0);
  308. free_extent_buffer(buf);
  309. return ret;
  310. }
  311. struct extent_buffer *read_tree_block(struct btrfs_root *root, u64 bytenr,
  312. u32 blocksize)
  313. {
  314. struct extent_buffer *buf = NULL;
  315. struct inode *btree_inode = root->fs_info->btree_inode;
  316. struct extent_io_tree *io_tree;
  317. u64 end;
  318. int ret;
  319. io_tree = &BTRFS_I(btree_inode)->io_tree;
  320. buf = btrfs_find_create_tree_block(root, bytenr, blocksize);
  321. if (!buf)
  322. return NULL;
  323. read_extent_buffer_pages(&BTRFS_I(btree_inode)->io_tree, buf, 0, 1);
  324. if (buf->flags & EXTENT_CSUM)
  325. return buf;
  326. end = buf->start + PAGE_CACHE_SIZE - 1;
  327. if (test_range_bit(io_tree, buf->start, end, EXTENT_CSUM, 1)) {
  328. buf->flags |= EXTENT_CSUM;
  329. return buf;
  330. }
  331. lock_extent(io_tree, buf->start, end, GFP_NOFS);
  332. if (test_range_bit(io_tree, buf->start, end, EXTENT_CSUM, 1)) {
  333. buf->flags |= EXTENT_CSUM;
  334. goto out_unlock;
  335. }
  336. ret = csum_tree_block(root, buf, 1);
  337. set_extent_bits(io_tree, buf->start, end, EXTENT_CSUM, GFP_NOFS);
  338. buf->flags |= EXTENT_CSUM;
  339. out_unlock:
  340. unlock_extent(io_tree, buf->start, end, GFP_NOFS);
  341. return buf;
  342. }
  343. int clean_tree_block(struct btrfs_trans_handle *trans, struct btrfs_root *root,
  344. struct extent_buffer *buf)
  345. {
  346. struct inode *btree_inode = root->fs_info->btree_inode;
  347. if (btrfs_header_generation(buf) ==
  348. root->fs_info->running_transaction->transid)
  349. clear_extent_buffer_dirty(&BTRFS_I(btree_inode)->io_tree,
  350. buf);
  351. return 0;
  352. }
  353. int wait_on_tree_block_writeback(struct btrfs_root *root,
  354. struct extent_buffer *buf)
  355. {
  356. struct inode *btree_inode = root->fs_info->btree_inode;
  357. wait_on_extent_buffer_writeback(&BTRFS_I(btree_inode)->io_tree,
  358. buf);
  359. return 0;
  360. }
  361. static int __setup_root(u32 nodesize, u32 leafsize, u32 sectorsize,
  362. u32 stripesize, struct btrfs_root *root,
  363. struct btrfs_fs_info *fs_info,
  364. u64 objectid)
  365. {
  366. root->node = NULL;
  367. root->inode = NULL;
  368. root->commit_root = NULL;
  369. root->sectorsize = sectorsize;
  370. root->nodesize = nodesize;
  371. root->leafsize = leafsize;
  372. root->stripesize = stripesize;
  373. root->ref_cows = 0;
  374. root->fs_info = fs_info;
  375. root->objectid = objectid;
  376. root->last_trans = 0;
  377. root->highest_inode = 0;
  378. root->last_inode_alloc = 0;
  379. root->name = NULL;
  380. root->in_sysfs = 0;
  381. memset(&root->root_key, 0, sizeof(root->root_key));
  382. memset(&root->root_item, 0, sizeof(root->root_item));
  383. memset(&root->defrag_progress, 0, sizeof(root->defrag_progress));
  384. memset(&root->root_kobj, 0, sizeof(root->root_kobj));
  385. init_completion(&root->kobj_unregister);
  386. root->defrag_running = 0;
  387. root->defrag_level = 0;
  388. root->root_key.objectid = objectid;
  389. return 0;
  390. }
  391. static int find_and_setup_root(struct btrfs_root *tree_root,
  392. struct btrfs_fs_info *fs_info,
  393. u64 objectid,
  394. struct btrfs_root *root)
  395. {
  396. int ret;
  397. u32 blocksize;
  398. __setup_root(tree_root->nodesize, tree_root->leafsize,
  399. tree_root->sectorsize, tree_root->stripesize,
  400. root, fs_info, objectid);
  401. ret = btrfs_find_last_root(tree_root, objectid,
  402. &root->root_item, &root->root_key);
  403. BUG_ON(ret);
  404. blocksize = btrfs_level_size(root, btrfs_root_level(&root->root_item));
  405. root->node = read_tree_block(root, btrfs_root_bytenr(&root->root_item),
  406. blocksize);
  407. BUG_ON(!root->node);
  408. return 0;
  409. }
  410. struct btrfs_root *btrfs_read_fs_root_no_radix(struct btrfs_fs_info *fs_info,
  411. struct btrfs_key *location)
  412. {
  413. struct btrfs_root *root;
  414. struct btrfs_root *tree_root = fs_info->tree_root;
  415. struct btrfs_path *path;
  416. struct extent_buffer *l;
  417. u64 highest_inode;
  418. u32 blocksize;
  419. int ret = 0;
  420. root = kzalloc(sizeof(*root), GFP_NOFS);
  421. if (!root)
  422. return ERR_PTR(-ENOMEM);
  423. if (location->offset == (u64)-1) {
  424. ret = find_and_setup_root(tree_root, fs_info,
  425. location->objectid, root);
  426. if (ret) {
  427. kfree(root);
  428. return ERR_PTR(ret);
  429. }
  430. goto insert;
  431. }
  432. __setup_root(tree_root->nodesize, tree_root->leafsize,
  433. tree_root->sectorsize, tree_root->stripesize,
  434. root, fs_info, location->objectid);
  435. path = btrfs_alloc_path();
  436. BUG_ON(!path);
  437. ret = btrfs_search_slot(NULL, tree_root, location, path, 0, 0);
  438. if (ret != 0) {
  439. if (ret > 0)
  440. ret = -ENOENT;
  441. goto out;
  442. }
  443. l = path->nodes[0];
  444. read_extent_buffer(l, &root->root_item,
  445. btrfs_item_ptr_offset(l, path->slots[0]),
  446. sizeof(root->root_item));
  447. memcpy(&root->root_key, location, sizeof(*location));
  448. ret = 0;
  449. out:
  450. btrfs_release_path(root, path);
  451. btrfs_free_path(path);
  452. if (ret) {
  453. kfree(root);
  454. return ERR_PTR(ret);
  455. }
  456. blocksize = btrfs_level_size(root, btrfs_root_level(&root->root_item));
  457. root->node = read_tree_block(root, btrfs_root_bytenr(&root->root_item),
  458. blocksize);
  459. BUG_ON(!root->node);
  460. insert:
  461. root->ref_cows = 1;
  462. ret = btrfs_find_highest_inode(root, &highest_inode);
  463. if (ret == 0) {
  464. root->highest_inode = highest_inode;
  465. root->last_inode_alloc = highest_inode;
  466. }
  467. return root;
  468. }
  469. struct btrfs_root *btrfs_lookup_fs_root(struct btrfs_fs_info *fs_info,
  470. u64 root_objectid)
  471. {
  472. struct btrfs_root *root;
  473. if (root_objectid == BTRFS_ROOT_TREE_OBJECTID)
  474. return fs_info->tree_root;
  475. if (root_objectid == BTRFS_EXTENT_TREE_OBJECTID)
  476. return fs_info->extent_root;
  477. root = radix_tree_lookup(&fs_info->fs_roots_radix,
  478. (unsigned long)root_objectid);
  479. return root;
  480. }
  481. struct btrfs_root *btrfs_read_fs_root_no_name(struct btrfs_fs_info *fs_info,
  482. struct btrfs_key *location)
  483. {
  484. struct btrfs_root *root;
  485. int ret;
  486. if (location->objectid == BTRFS_ROOT_TREE_OBJECTID)
  487. return fs_info->tree_root;
  488. if (location->objectid == BTRFS_EXTENT_TREE_OBJECTID)
  489. return fs_info->extent_root;
  490. root = radix_tree_lookup(&fs_info->fs_roots_radix,
  491. (unsigned long)location->objectid);
  492. if (root)
  493. return root;
  494. root = btrfs_read_fs_root_no_radix(fs_info, location);
  495. if (IS_ERR(root))
  496. return root;
  497. ret = radix_tree_insert(&fs_info->fs_roots_radix,
  498. (unsigned long)root->root_key.objectid,
  499. root);
  500. if (ret) {
  501. free_extent_buffer(root->node);
  502. kfree(root);
  503. return ERR_PTR(ret);
  504. }
  505. ret = btrfs_find_dead_roots(fs_info->tree_root,
  506. root->root_key.objectid, root);
  507. BUG_ON(ret);
  508. return root;
  509. }
  510. struct btrfs_root *btrfs_read_fs_root(struct btrfs_fs_info *fs_info,
  511. struct btrfs_key *location,
  512. const char *name, int namelen)
  513. {
  514. struct btrfs_root *root;
  515. int ret;
  516. root = btrfs_read_fs_root_no_name(fs_info, location);
  517. if (!root)
  518. return NULL;
  519. if (root->in_sysfs)
  520. return root;
  521. ret = btrfs_set_root_name(root, name, namelen);
  522. if (ret) {
  523. free_extent_buffer(root->node);
  524. kfree(root);
  525. return ERR_PTR(ret);
  526. }
  527. ret = btrfs_sysfs_add_root(root);
  528. if (ret) {
  529. free_extent_buffer(root->node);
  530. kfree(root->name);
  531. kfree(root);
  532. return ERR_PTR(ret);
  533. }
  534. root->in_sysfs = 1;
  535. return root;
  536. }
  537. #if 0
  538. static int add_hasher(struct btrfs_fs_info *info, char *type) {
  539. struct btrfs_hasher *hasher;
  540. hasher = kmalloc(sizeof(*hasher), GFP_NOFS);
  541. if (!hasher)
  542. return -ENOMEM;
  543. hasher->hash_tfm = crypto_alloc_hash(type, 0, CRYPTO_ALG_ASYNC);
  544. if (!hasher->hash_tfm) {
  545. kfree(hasher);
  546. return -EINVAL;
  547. }
  548. spin_lock(&info->hash_lock);
  549. list_add(&hasher->list, &info->hashers);
  550. spin_unlock(&info->hash_lock);
  551. return 0;
  552. }
  553. #endif
  554. struct btrfs_root *open_ctree(struct super_block *sb)
  555. {
  556. u32 sectorsize;
  557. u32 nodesize;
  558. u32 leafsize;
  559. u32 blocksize;
  560. u32 stripesize;
  561. struct btrfs_root *extent_root = kmalloc(sizeof(struct btrfs_root),
  562. GFP_NOFS);
  563. struct btrfs_root *tree_root = kmalloc(sizeof(struct btrfs_root),
  564. GFP_NOFS);
  565. struct btrfs_fs_info *fs_info = kmalloc(sizeof(*fs_info),
  566. GFP_NOFS);
  567. int ret;
  568. int err = -EIO;
  569. struct btrfs_super_block *disk_super;
  570. if (!extent_root || !tree_root || !fs_info) {
  571. err = -ENOMEM;
  572. goto fail;
  573. }
  574. INIT_RADIX_TREE(&fs_info->fs_roots_radix, GFP_NOFS);
  575. INIT_LIST_HEAD(&fs_info->trans_list);
  576. INIT_LIST_HEAD(&fs_info->dead_roots);
  577. INIT_LIST_HEAD(&fs_info->hashers);
  578. spin_lock_init(&fs_info->hash_lock);
  579. spin_lock_init(&fs_info->delalloc_lock);
  580. spin_lock_init(&fs_info->new_trans_lock);
  581. memset(&fs_info->super_kobj, 0, sizeof(fs_info->super_kobj));
  582. init_completion(&fs_info->kobj_unregister);
  583. sb_set_blocksize(sb, 4096);
  584. fs_info->running_transaction = NULL;
  585. fs_info->last_trans_committed = 0;
  586. fs_info->tree_root = tree_root;
  587. fs_info->extent_root = extent_root;
  588. fs_info->sb = sb;
  589. fs_info->throttles = 0;
  590. fs_info->mount_opt = 0;
  591. fs_info->max_extent = (u64)-1;
  592. fs_info->max_inline = 8192 * 1024;
  593. fs_info->delalloc_bytes = 0;
  594. fs_info->btree_inode = new_inode(sb);
  595. fs_info->btree_inode->i_ino = 1;
  596. fs_info->btree_inode->i_nlink = 1;
  597. fs_info->btree_inode->i_size = sb->s_bdev->bd_inode->i_size;
  598. fs_info->btree_inode->i_mapping->a_ops = &btree_aops;
  599. extent_io_tree_init(&BTRFS_I(fs_info->btree_inode)->io_tree,
  600. fs_info->btree_inode->i_mapping,
  601. GFP_NOFS);
  602. extent_map_tree_init(&BTRFS_I(fs_info->btree_inode)->extent_tree,
  603. GFP_NOFS);
  604. BTRFS_I(fs_info->btree_inode)->io_tree.ops = &btree_extent_io_ops;
  605. extent_io_tree_init(&fs_info->free_space_cache,
  606. fs_info->btree_inode->i_mapping, GFP_NOFS);
  607. extent_io_tree_init(&fs_info->block_group_cache,
  608. fs_info->btree_inode->i_mapping, GFP_NOFS);
  609. extent_io_tree_init(&fs_info->pinned_extents,
  610. fs_info->btree_inode->i_mapping, GFP_NOFS);
  611. extent_io_tree_init(&fs_info->pending_del,
  612. fs_info->btree_inode->i_mapping, GFP_NOFS);
  613. extent_io_tree_init(&fs_info->extent_ins,
  614. fs_info->btree_inode->i_mapping, GFP_NOFS);
  615. fs_info->do_barriers = 1;
  616. fs_info->closing = 0;
  617. fs_info->total_pinned = 0;
  618. fs_info->last_alloc = 0;
  619. #if LINUX_VERSION_CODE <= KERNEL_VERSION(2,6,18)
  620. INIT_WORK(&fs_info->trans_work, btrfs_transaction_cleaner, fs_info);
  621. #else
  622. INIT_DELAYED_WORK(&fs_info->trans_work, btrfs_transaction_cleaner);
  623. #endif
  624. BTRFS_I(fs_info->btree_inode)->root = tree_root;
  625. memset(&BTRFS_I(fs_info->btree_inode)->location, 0,
  626. sizeof(struct btrfs_key));
  627. insert_inode_hash(fs_info->btree_inode);
  628. mapping_set_gfp_mask(fs_info->btree_inode->i_mapping, GFP_NOFS);
  629. mutex_init(&fs_info->trans_mutex);
  630. mutex_init(&fs_info->fs_mutex);
  631. #if 0
  632. ret = add_hasher(fs_info, "crc32c");
  633. if (ret) {
  634. printk("btrfs: failed hash setup, modprobe cryptomgr?\n");
  635. err = -ENOMEM;
  636. goto fail_iput;
  637. }
  638. #endif
  639. __setup_root(512, 512, 512, 512, tree_root,
  640. fs_info, BTRFS_ROOT_TREE_OBJECTID);
  641. fs_info->sb_buffer = read_tree_block(tree_root,
  642. BTRFS_SUPER_INFO_OFFSET,
  643. 512);
  644. if (!fs_info->sb_buffer)
  645. goto fail_iput;
  646. read_extent_buffer(fs_info->sb_buffer, &fs_info->super_copy, 0,
  647. sizeof(fs_info->super_copy));
  648. read_extent_buffer(fs_info->sb_buffer, fs_info->fsid,
  649. (unsigned long)btrfs_super_fsid(fs_info->sb_buffer),
  650. BTRFS_FSID_SIZE);
  651. disk_super = &fs_info->super_copy;
  652. if (!btrfs_super_root(disk_super))
  653. goto fail_sb_buffer;
  654. nodesize = btrfs_super_nodesize(disk_super);
  655. leafsize = btrfs_super_leafsize(disk_super);
  656. sectorsize = btrfs_super_sectorsize(disk_super);
  657. stripesize = btrfs_super_stripesize(disk_super);
  658. tree_root->nodesize = nodesize;
  659. tree_root->leafsize = leafsize;
  660. tree_root->sectorsize = sectorsize;
  661. tree_root->stripesize = stripesize;
  662. sb_set_blocksize(sb, sectorsize);
  663. i_size_write(fs_info->btree_inode,
  664. btrfs_super_total_bytes(disk_super));
  665. if (strncmp((char *)(&disk_super->magic), BTRFS_MAGIC,
  666. sizeof(disk_super->magic))) {
  667. printk("btrfs: valid FS not found on %s\n", sb->s_id);
  668. goto fail_sb_buffer;
  669. }
  670. blocksize = btrfs_level_size(tree_root,
  671. btrfs_super_root_level(disk_super));
  672. tree_root->node = read_tree_block(tree_root,
  673. btrfs_super_root(disk_super),
  674. blocksize);
  675. if (!tree_root->node)
  676. goto fail_sb_buffer;
  677. mutex_lock(&fs_info->fs_mutex);
  678. ret = find_and_setup_root(tree_root, fs_info,
  679. BTRFS_EXTENT_TREE_OBJECTID, extent_root);
  680. if (ret) {
  681. mutex_unlock(&fs_info->fs_mutex);
  682. goto fail_tree_root;
  683. }
  684. btrfs_read_block_groups(extent_root);
  685. fs_info->generation = btrfs_super_generation(disk_super) + 1;
  686. mutex_unlock(&fs_info->fs_mutex);
  687. return tree_root;
  688. fail_tree_root:
  689. free_extent_buffer(tree_root->node);
  690. fail_sb_buffer:
  691. free_extent_buffer(fs_info->sb_buffer);
  692. fail_iput:
  693. iput(fs_info->btree_inode);
  694. fail:
  695. kfree(extent_root);
  696. kfree(tree_root);
  697. kfree(fs_info);
  698. return ERR_PTR(err);
  699. }
  700. int write_ctree_super(struct btrfs_trans_handle *trans, struct btrfs_root
  701. *root)
  702. {
  703. int ret;
  704. struct extent_buffer *super = root->fs_info->sb_buffer;
  705. struct inode *btree_inode = root->fs_info->btree_inode;
  706. struct super_block *sb = root->fs_info->sb;
  707. if (!btrfs_test_opt(root, NOBARRIER))
  708. blkdev_issue_flush(sb->s_bdev, NULL);
  709. set_extent_buffer_dirty(&BTRFS_I(btree_inode)->io_tree, super);
  710. ret = sync_page_range_nolock(btree_inode, btree_inode->i_mapping,
  711. super->start, super->len);
  712. if (!btrfs_test_opt(root, NOBARRIER))
  713. blkdev_issue_flush(sb->s_bdev, NULL);
  714. return ret;
  715. }
  716. int btrfs_free_fs_root(struct btrfs_fs_info *fs_info, struct btrfs_root *root)
  717. {
  718. radix_tree_delete(&fs_info->fs_roots_radix,
  719. (unsigned long)root->root_key.objectid);
  720. if (root->in_sysfs)
  721. btrfs_sysfs_del_root(root);
  722. if (root->inode)
  723. iput(root->inode);
  724. if (root->node)
  725. free_extent_buffer(root->node);
  726. if (root->commit_root)
  727. free_extent_buffer(root->commit_root);
  728. if (root->name)
  729. kfree(root->name);
  730. kfree(root);
  731. return 0;
  732. }
  733. static int del_fs_roots(struct btrfs_fs_info *fs_info)
  734. {
  735. int ret;
  736. struct btrfs_root *gang[8];
  737. int i;
  738. while(1) {
  739. ret = radix_tree_gang_lookup(&fs_info->fs_roots_radix,
  740. (void **)gang, 0,
  741. ARRAY_SIZE(gang));
  742. if (!ret)
  743. break;
  744. for (i = 0; i < ret; i++)
  745. btrfs_free_fs_root(fs_info, gang[i]);
  746. }
  747. return 0;
  748. }
  749. int close_ctree(struct btrfs_root *root)
  750. {
  751. int ret;
  752. struct btrfs_trans_handle *trans;
  753. struct btrfs_fs_info *fs_info = root->fs_info;
  754. fs_info->closing = 1;
  755. btrfs_transaction_flush_work(root);
  756. mutex_lock(&fs_info->fs_mutex);
  757. btrfs_defrag_dirty_roots(root->fs_info);
  758. trans = btrfs_start_transaction(root, 1);
  759. ret = btrfs_commit_transaction(trans, root);
  760. /* run commit again to drop the original snapshot */
  761. trans = btrfs_start_transaction(root, 1);
  762. btrfs_commit_transaction(trans, root);
  763. ret = btrfs_write_and_wait_transaction(NULL, root);
  764. BUG_ON(ret);
  765. write_ctree_super(NULL, root);
  766. mutex_unlock(&fs_info->fs_mutex);
  767. if (fs_info->extent_root->node)
  768. free_extent_buffer(fs_info->extent_root->node);
  769. if (fs_info->tree_root->node)
  770. free_extent_buffer(fs_info->tree_root->node);
  771. free_extent_buffer(fs_info->sb_buffer);
  772. btrfs_free_block_groups(root->fs_info);
  773. del_fs_roots(fs_info);
  774. filemap_write_and_wait(fs_info->btree_inode->i_mapping);
  775. extent_io_tree_empty_lru(&fs_info->free_space_cache);
  776. extent_io_tree_empty_lru(&fs_info->block_group_cache);
  777. extent_io_tree_empty_lru(&fs_info->pinned_extents);
  778. extent_io_tree_empty_lru(&fs_info->pending_del);
  779. extent_io_tree_empty_lru(&fs_info->extent_ins);
  780. extent_io_tree_empty_lru(&BTRFS_I(fs_info->btree_inode)->io_tree);
  781. truncate_inode_pages(fs_info->btree_inode->i_mapping, 0);
  782. iput(fs_info->btree_inode);
  783. #if 0
  784. while(!list_empty(&fs_info->hashers)) {
  785. struct btrfs_hasher *hasher;
  786. hasher = list_entry(fs_info->hashers.next, struct btrfs_hasher,
  787. hashers);
  788. list_del(&hasher->hashers);
  789. crypto_free_hash(&fs_info->hash_tfm);
  790. kfree(hasher);
  791. }
  792. #endif
  793. kfree(fs_info->extent_root);
  794. kfree(fs_info->tree_root);
  795. return 0;
  796. }
  797. int btrfs_buffer_uptodate(struct extent_buffer *buf)
  798. {
  799. struct inode *btree_inode = buf->first_page->mapping->host;
  800. return extent_buffer_uptodate(&BTRFS_I(btree_inode)->io_tree, buf);
  801. }
  802. int btrfs_set_buffer_uptodate(struct extent_buffer *buf)
  803. {
  804. struct inode *btree_inode = buf->first_page->mapping->host;
  805. return set_extent_buffer_uptodate(&BTRFS_I(btree_inode)->io_tree,
  806. buf);
  807. }
  808. void btrfs_mark_buffer_dirty(struct extent_buffer *buf)
  809. {
  810. struct btrfs_root *root = BTRFS_I(buf->first_page->mapping->host)->root;
  811. u64 transid = btrfs_header_generation(buf);
  812. struct inode *btree_inode = root->fs_info->btree_inode;
  813. if (transid != root->fs_info->generation) {
  814. printk(KERN_CRIT "transid mismatch buffer %llu, found %Lu running %Lu\n",
  815. (unsigned long long)buf->start,
  816. transid, root->fs_info->generation);
  817. WARN_ON(1);
  818. }
  819. set_extent_buffer_dirty(&BTRFS_I(btree_inode)->io_tree, buf);
  820. }
  821. void btrfs_throttle(struct btrfs_root *root)
  822. {
  823. struct backing_dev_info *bdi;
  824. bdi = root->fs_info->sb->s_bdev->bd_inode->i_mapping->backing_dev_info;
  825. if (root->fs_info->throttles && bdi_write_congested(bdi)) {
  826. #if LINUX_VERSION_CODE > KERNEL_VERSION(2,6,18)
  827. congestion_wait(WRITE, HZ/20);
  828. #else
  829. blk_congestion_wait(WRITE, HZ/20);
  830. #endif
  831. }
  832. }
  833. void btrfs_btree_balance_dirty(struct btrfs_root *root, unsigned long nr)
  834. {
  835. balance_dirty_pages_ratelimited_nr(
  836. root->fs_info->btree_inode->i_mapping, 1);
  837. }
  838. void btrfs_set_buffer_defrag(struct extent_buffer *buf)
  839. {
  840. struct btrfs_root *root = BTRFS_I(buf->first_page->mapping->host)->root;
  841. struct inode *btree_inode = root->fs_info->btree_inode;
  842. set_extent_bits(&BTRFS_I(btree_inode)->io_tree, buf->start,
  843. buf->start + buf->len - 1, EXTENT_DEFRAG, GFP_NOFS);
  844. }
  845. void btrfs_set_buffer_defrag_done(struct extent_buffer *buf)
  846. {
  847. struct btrfs_root *root = BTRFS_I(buf->first_page->mapping->host)->root;
  848. struct inode *btree_inode = root->fs_info->btree_inode;
  849. set_extent_bits(&BTRFS_I(btree_inode)->io_tree, buf->start,
  850. buf->start + buf->len - 1, EXTENT_DEFRAG_DONE,
  851. GFP_NOFS);
  852. }
  853. int btrfs_buffer_defrag(struct extent_buffer *buf)
  854. {
  855. struct btrfs_root *root = BTRFS_I(buf->first_page->mapping->host)->root;
  856. struct inode *btree_inode = root->fs_info->btree_inode;
  857. return test_range_bit(&BTRFS_I(btree_inode)->io_tree,
  858. buf->start, buf->start + buf->len - 1, EXTENT_DEFRAG, 0);
  859. }
  860. int btrfs_buffer_defrag_done(struct extent_buffer *buf)
  861. {
  862. struct btrfs_root *root = BTRFS_I(buf->first_page->mapping->host)->root;
  863. struct inode *btree_inode = root->fs_info->btree_inode;
  864. return test_range_bit(&BTRFS_I(btree_inode)->io_tree,
  865. buf->start, buf->start + buf->len - 1,
  866. EXTENT_DEFRAG_DONE, 0);
  867. }
  868. int btrfs_clear_buffer_defrag_done(struct extent_buffer *buf)
  869. {
  870. struct btrfs_root *root = BTRFS_I(buf->first_page->mapping->host)->root;
  871. struct inode *btree_inode = root->fs_info->btree_inode;
  872. return clear_extent_bits(&BTRFS_I(btree_inode)->io_tree,
  873. buf->start, buf->start + buf->len - 1,
  874. EXTENT_DEFRAG_DONE, GFP_NOFS);
  875. }
  876. int btrfs_clear_buffer_defrag(struct extent_buffer *buf)
  877. {
  878. struct btrfs_root *root = BTRFS_I(buf->first_page->mapping->host)->root;
  879. struct inode *btree_inode = root->fs_info->btree_inode;
  880. return clear_extent_bits(&BTRFS_I(btree_inode)->io_tree,
  881. buf->start, buf->start + buf->len - 1,
  882. EXTENT_DEFRAG, GFP_NOFS);
  883. }
  884. int btrfs_read_buffer(struct extent_buffer *buf)
  885. {
  886. struct btrfs_root *root = BTRFS_I(buf->first_page->mapping->host)->root;
  887. struct inode *btree_inode = root->fs_info->btree_inode;
  888. return read_extent_buffer_pages(&BTRFS_I(btree_inode)->io_tree,
  889. buf, 0, 1);
  890. }
  891. static struct extent_io_ops btree_extent_io_ops = {
  892. .writepage_io_hook = btree_writepage_io_hook,
  893. };