super.c 22 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905906907908909910911912913914915916917918919920921922923924925926927928929930931932933934935936937938939940941942943944945946947948949950951952953954955956957958959960961962963964965966967968969970971972973974975976977978979980981982983984985986
  1. /*
  2. * Copyright (C) Sistina Software, Inc. 1997-2003 All rights reserved.
  3. * Copyright (C) 2004-2006 Red Hat, Inc. All rights reserved.
  4. *
  5. * This copyrighted material is made available to anyone wishing to use,
  6. * modify, copy, or redistribute it subject to the terms and conditions
  7. * of the GNU General Public License version 2.
  8. */
  9. #include <linux/sched.h>
  10. #include <linux/slab.h>
  11. #include <linux/spinlock.h>
  12. #include <linux/completion.h>
  13. #include <linux/buffer_head.h>
  14. #include <linux/crc32.h>
  15. #include <linux/gfs2_ondisk.h>
  16. #include <linux/bio.h>
  17. #include <linux/lm_interface.h>
  18. #include "gfs2.h"
  19. #include "incore.h"
  20. #include "bmap.h"
  21. #include "dir.h"
  22. #include "glock.h"
  23. #include "glops.h"
  24. #include "inode.h"
  25. #include "log.h"
  26. #include "meta_io.h"
  27. #include "quota.h"
  28. #include "recovery.h"
  29. #include "rgrp.h"
  30. #include "super.h"
  31. #include "trans.h"
  32. #include "util.h"
  33. static const u32 gfs2_old_fs_formats[] = {
  34. 0
  35. };
  36. static const u32 gfs2_old_multihost_formats[] = {
  37. 0
  38. };
  39. /**
  40. * gfs2_tune_init - Fill a gfs2_tune structure with default values
  41. * @gt: tune
  42. *
  43. */
  44. void gfs2_tune_init(struct gfs2_tune *gt)
  45. {
  46. spin_lock_init(&gt->gt_spin);
  47. gt->gt_ilimit = 100;
  48. gt->gt_ilimit_tries = 3;
  49. gt->gt_ilimit_min = 1;
  50. gt->gt_demote_secs = 300;
  51. gt->gt_incore_log_blocks = 1024;
  52. gt->gt_log_flush_secs = 60;
  53. gt->gt_jindex_refresh_secs = 60;
  54. gt->gt_scand_secs = 15;
  55. gt->gt_recoverd_secs = 60;
  56. gt->gt_logd_secs = 1;
  57. gt->gt_quotad_secs = 5;
  58. gt->gt_quota_simul_sync = 64;
  59. gt->gt_quota_warn_period = 10;
  60. gt->gt_quota_scale_num = 1;
  61. gt->gt_quota_scale_den = 1;
  62. gt->gt_quota_cache_secs = 300;
  63. gt->gt_quota_quantum = 60;
  64. gt->gt_atime_quantum = 3600;
  65. gt->gt_new_files_jdata = 0;
  66. gt->gt_new_files_directio = 0;
  67. gt->gt_max_readahead = 1 << 18;
  68. gt->gt_lockdump_size = 131072;
  69. gt->gt_stall_secs = 600;
  70. gt->gt_complain_secs = 10;
  71. gt->gt_reclaim_limit = 5000;
  72. gt->gt_entries_per_readdir = 32;
  73. gt->gt_statfs_quantum = 30;
  74. gt->gt_statfs_slow = 0;
  75. }
  76. /**
  77. * gfs2_check_sb - Check superblock
  78. * @sdp: the filesystem
  79. * @sb: The superblock
  80. * @silent: Don't print a message if the check fails
  81. *
  82. * Checks the version code of the FS is one that we understand how to
  83. * read and that the sizes of the various on-disk structures have not
  84. * changed.
  85. */
  86. int gfs2_check_sb(struct gfs2_sbd *sdp, struct gfs2_sb_host *sb, int silent)
  87. {
  88. unsigned int x;
  89. if (sb->sb_header.mh_magic != GFS2_MAGIC ||
  90. sb->sb_header.mh_type != GFS2_METATYPE_SB) {
  91. if (!silent)
  92. printk(KERN_WARNING "GFS2: not a GFS2 filesystem\n");
  93. return -EINVAL;
  94. }
  95. /* If format numbers match exactly, we're done. */
  96. if (sb->sb_fs_format == GFS2_FORMAT_FS &&
  97. sb->sb_multihost_format == GFS2_FORMAT_MULTI)
  98. return 0;
  99. if (sb->sb_fs_format != GFS2_FORMAT_FS) {
  100. for (x = 0; gfs2_old_fs_formats[x]; x++)
  101. if (gfs2_old_fs_formats[x] == sb->sb_fs_format)
  102. break;
  103. if (!gfs2_old_fs_formats[x]) {
  104. printk(KERN_WARNING
  105. "GFS2: code version (%u, %u) is incompatible "
  106. "with ondisk format (%u, %u)\n",
  107. GFS2_FORMAT_FS, GFS2_FORMAT_MULTI,
  108. sb->sb_fs_format, sb->sb_multihost_format);
  109. printk(KERN_WARNING
  110. "GFS2: I don't know how to upgrade this FS\n");
  111. return -EINVAL;
  112. }
  113. }
  114. if (sb->sb_multihost_format != GFS2_FORMAT_MULTI) {
  115. for (x = 0; gfs2_old_multihost_formats[x]; x++)
  116. if (gfs2_old_multihost_formats[x] ==
  117. sb->sb_multihost_format)
  118. break;
  119. if (!gfs2_old_multihost_formats[x]) {
  120. printk(KERN_WARNING
  121. "GFS2: code version (%u, %u) is incompatible "
  122. "with ondisk format (%u, %u)\n",
  123. GFS2_FORMAT_FS, GFS2_FORMAT_MULTI,
  124. sb->sb_fs_format, sb->sb_multihost_format);
  125. printk(KERN_WARNING
  126. "GFS2: I don't know how to upgrade this FS\n");
  127. return -EINVAL;
  128. }
  129. }
  130. if (!sdp->sd_args.ar_upgrade) {
  131. printk(KERN_WARNING
  132. "GFS2: code version (%u, %u) is incompatible "
  133. "with ondisk format (%u, %u)\n",
  134. GFS2_FORMAT_FS, GFS2_FORMAT_MULTI,
  135. sb->sb_fs_format, sb->sb_multihost_format);
  136. printk(KERN_INFO
  137. "GFS2: Use the \"upgrade\" mount option to upgrade "
  138. "the FS\n");
  139. printk(KERN_INFO "GFS2: See the manual for more details\n");
  140. return -EINVAL;
  141. }
  142. return 0;
  143. }
  144. static int end_bio_io_page(struct bio *bio, unsigned int bytes_done, int error)
  145. {
  146. struct page *page = bio->bi_private;
  147. if (bio->bi_size)
  148. return 1;
  149. if (!error)
  150. SetPageUptodate(page);
  151. else
  152. printk(KERN_WARNING "gfs2: error %d reading superblock\n", error);
  153. unlock_page(page);
  154. return 0;
  155. }
  156. /**
  157. * gfs2_read_super - Read the gfs2 super block from disk
  158. * @sb: The VFS super block
  159. * @sector: The location of the super block
  160. *
  161. * This uses the bio functions to read the super block from disk
  162. * because we want to be 100% sure that we never read cached data.
  163. * A super block is read twice only during each GFS2 mount and is
  164. * never written to by the filesystem. The first time its read no
  165. * locks are held, and the only details which are looked at are those
  166. * relating to the locking protocol. Once locking is up and working,
  167. * the sb is read again under the lock to establish the location of
  168. * the master directory (contains pointers to journals etc) and the
  169. * root directory.
  170. *
  171. * Returns: A page containing the sb or NULL
  172. */
  173. struct page *gfs2_read_super(struct super_block *sb, sector_t sector)
  174. {
  175. struct page *page;
  176. struct bio *bio;
  177. page = alloc_page(GFP_KERNEL);
  178. if (unlikely(!page))
  179. return NULL;
  180. ClearPageUptodate(page);
  181. ClearPageDirty(page);
  182. lock_page(page);
  183. bio = bio_alloc(GFP_KERNEL, 1);
  184. if (unlikely(!bio)) {
  185. __free_page(page);
  186. return NULL;
  187. }
  188. bio->bi_sector = sector * (sb->s_blocksize >> 9);
  189. bio->bi_bdev = sb->s_bdev;
  190. bio_add_page(bio, page, PAGE_SIZE, 0);
  191. bio->bi_end_io = end_bio_io_page;
  192. bio->bi_private = page;
  193. submit_bio(READ_SYNC | (1 << BIO_RW_META), bio);
  194. wait_on_page_locked(page);
  195. bio_put(bio);
  196. if (!PageUptodate(page)) {
  197. __free_page(page);
  198. return NULL;
  199. }
  200. return page;
  201. }
  202. /**
  203. * gfs2_read_sb - Read super block
  204. * @sdp: The GFS2 superblock
  205. * @gl: the glock for the superblock (assumed to be held)
  206. * @silent: Don't print message if mount fails
  207. *
  208. */
  209. int gfs2_read_sb(struct gfs2_sbd *sdp, struct gfs2_glock *gl, int silent)
  210. {
  211. u32 hash_blocks, ind_blocks, leaf_blocks;
  212. u32 tmp_blocks;
  213. unsigned int x;
  214. int error;
  215. struct page *page;
  216. char *sb;
  217. page = gfs2_read_super(sdp->sd_vfs, GFS2_SB_ADDR >> sdp->sd_fsb2bb_shift);
  218. if (!page) {
  219. if (!silent)
  220. fs_err(sdp, "can't read superblock\n");
  221. return -EIO;
  222. }
  223. sb = kmap(page);
  224. gfs2_sb_in(&sdp->sd_sb, sb);
  225. kunmap(page);
  226. __free_page(page);
  227. error = gfs2_check_sb(sdp, &sdp->sd_sb, silent);
  228. if (error)
  229. return error;
  230. sdp->sd_fsb2bb_shift = sdp->sd_sb.sb_bsize_shift -
  231. GFS2_BASIC_BLOCK_SHIFT;
  232. sdp->sd_fsb2bb = 1 << sdp->sd_fsb2bb_shift;
  233. sdp->sd_diptrs = (sdp->sd_sb.sb_bsize -
  234. sizeof(struct gfs2_dinode)) / sizeof(u64);
  235. sdp->sd_inptrs = (sdp->sd_sb.sb_bsize -
  236. sizeof(struct gfs2_meta_header)) / sizeof(u64);
  237. sdp->sd_jbsize = sdp->sd_sb.sb_bsize - sizeof(struct gfs2_meta_header);
  238. sdp->sd_hash_bsize = sdp->sd_sb.sb_bsize / 2;
  239. sdp->sd_hash_bsize_shift = sdp->sd_sb.sb_bsize_shift - 1;
  240. sdp->sd_hash_ptrs = sdp->sd_hash_bsize / sizeof(u64);
  241. sdp->sd_qc_per_block = (sdp->sd_sb.sb_bsize -
  242. sizeof(struct gfs2_meta_header)) /
  243. sizeof(struct gfs2_quota_change);
  244. /* Compute maximum reservation required to add a entry to a directory */
  245. hash_blocks = DIV_ROUND_UP(sizeof(u64) * (1 << GFS2_DIR_MAX_DEPTH),
  246. sdp->sd_jbsize);
  247. ind_blocks = 0;
  248. for (tmp_blocks = hash_blocks; tmp_blocks > sdp->sd_diptrs;) {
  249. tmp_blocks = DIV_ROUND_UP(tmp_blocks, sdp->sd_inptrs);
  250. ind_blocks += tmp_blocks;
  251. }
  252. leaf_blocks = 2 + GFS2_DIR_MAX_DEPTH;
  253. sdp->sd_max_dirres = hash_blocks + ind_blocks + leaf_blocks;
  254. sdp->sd_heightsize[0] = sdp->sd_sb.sb_bsize -
  255. sizeof(struct gfs2_dinode);
  256. sdp->sd_heightsize[1] = sdp->sd_sb.sb_bsize * sdp->sd_diptrs;
  257. for (x = 2;; x++) {
  258. u64 space, d;
  259. u32 m;
  260. space = sdp->sd_heightsize[x - 1] * sdp->sd_inptrs;
  261. d = space;
  262. m = do_div(d, sdp->sd_inptrs);
  263. if (d != sdp->sd_heightsize[x - 1] || m)
  264. break;
  265. sdp->sd_heightsize[x] = space;
  266. }
  267. sdp->sd_max_height = x;
  268. gfs2_assert(sdp, sdp->sd_max_height <= GFS2_MAX_META_HEIGHT);
  269. sdp->sd_jheightsize[0] = sdp->sd_sb.sb_bsize -
  270. sizeof(struct gfs2_dinode);
  271. sdp->sd_jheightsize[1] = sdp->sd_jbsize * sdp->sd_diptrs;
  272. for (x = 2;; x++) {
  273. u64 space, d;
  274. u32 m;
  275. space = sdp->sd_jheightsize[x - 1] * sdp->sd_inptrs;
  276. d = space;
  277. m = do_div(d, sdp->sd_inptrs);
  278. if (d != sdp->sd_jheightsize[x - 1] || m)
  279. break;
  280. sdp->sd_jheightsize[x] = space;
  281. }
  282. sdp->sd_max_jheight = x;
  283. gfs2_assert(sdp, sdp->sd_max_jheight <= GFS2_MAX_META_HEIGHT);
  284. return 0;
  285. }
  286. /**
  287. * gfs2_jindex_hold - Grab a lock on the jindex
  288. * @sdp: The GFS2 superblock
  289. * @ji_gh: the holder for the jindex glock
  290. *
  291. * This is very similar to the gfs2_rindex_hold() function, except that
  292. * in general we hold the jindex lock for longer periods of time and
  293. * we grab it far less frequently (in general) then the rgrp lock.
  294. *
  295. * Returns: errno
  296. */
  297. int gfs2_jindex_hold(struct gfs2_sbd *sdp, struct gfs2_holder *ji_gh)
  298. {
  299. struct gfs2_inode *dip = GFS2_I(sdp->sd_jindex);
  300. struct qstr name;
  301. char buf[20];
  302. struct gfs2_jdesc *jd;
  303. int error;
  304. name.name = buf;
  305. mutex_lock(&sdp->sd_jindex_mutex);
  306. for (;;) {
  307. error = gfs2_glock_nq_init(dip->i_gl, LM_ST_SHARED, 0, ji_gh);
  308. if (error)
  309. break;
  310. name.len = sprintf(buf, "journal%u", sdp->sd_journals);
  311. name.hash = gfs2_disk_hash(name.name, name.len);
  312. error = gfs2_dir_search(sdp->sd_jindex, &name, NULL, NULL);
  313. if (error == -ENOENT) {
  314. error = 0;
  315. break;
  316. }
  317. gfs2_glock_dq_uninit(ji_gh);
  318. if (error)
  319. break;
  320. error = -ENOMEM;
  321. jd = kzalloc(sizeof(struct gfs2_jdesc), GFP_KERNEL);
  322. if (!jd)
  323. break;
  324. jd->jd_inode = gfs2_lookupi(sdp->sd_jindex, &name, 1, NULL);
  325. if (!jd->jd_inode || IS_ERR(jd->jd_inode)) {
  326. if (!jd->jd_inode)
  327. error = -ENOENT;
  328. else
  329. error = PTR_ERR(jd->jd_inode);
  330. kfree(jd);
  331. break;
  332. }
  333. spin_lock(&sdp->sd_jindex_spin);
  334. jd->jd_jid = sdp->sd_journals++;
  335. list_add_tail(&jd->jd_list, &sdp->sd_jindex_list);
  336. spin_unlock(&sdp->sd_jindex_spin);
  337. }
  338. mutex_unlock(&sdp->sd_jindex_mutex);
  339. return error;
  340. }
  341. /**
  342. * gfs2_jindex_free - Clear all the journal index information
  343. * @sdp: The GFS2 superblock
  344. *
  345. */
  346. void gfs2_jindex_free(struct gfs2_sbd *sdp)
  347. {
  348. struct list_head list;
  349. struct gfs2_jdesc *jd;
  350. spin_lock(&sdp->sd_jindex_spin);
  351. list_add(&list, &sdp->sd_jindex_list);
  352. list_del_init(&sdp->sd_jindex_list);
  353. sdp->sd_journals = 0;
  354. spin_unlock(&sdp->sd_jindex_spin);
  355. while (!list_empty(&list)) {
  356. jd = list_entry(list.next, struct gfs2_jdesc, jd_list);
  357. list_del(&jd->jd_list);
  358. iput(jd->jd_inode);
  359. kfree(jd);
  360. }
  361. }
  362. static struct gfs2_jdesc *jdesc_find_i(struct list_head *head, unsigned int jid)
  363. {
  364. struct gfs2_jdesc *jd;
  365. int found = 0;
  366. list_for_each_entry(jd, head, jd_list) {
  367. if (jd->jd_jid == jid) {
  368. found = 1;
  369. break;
  370. }
  371. }
  372. if (!found)
  373. jd = NULL;
  374. return jd;
  375. }
  376. struct gfs2_jdesc *gfs2_jdesc_find(struct gfs2_sbd *sdp, unsigned int jid)
  377. {
  378. struct gfs2_jdesc *jd;
  379. spin_lock(&sdp->sd_jindex_spin);
  380. jd = jdesc_find_i(&sdp->sd_jindex_list, jid);
  381. spin_unlock(&sdp->sd_jindex_spin);
  382. return jd;
  383. }
  384. void gfs2_jdesc_make_dirty(struct gfs2_sbd *sdp, unsigned int jid)
  385. {
  386. struct gfs2_jdesc *jd;
  387. spin_lock(&sdp->sd_jindex_spin);
  388. jd = jdesc_find_i(&sdp->sd_jindex_list, jid);
  389. if (jd)
  390. jd->jd_dirty = 1;
  391. spin_unlock(&sdp->sd_jindex_spin);
  392. }
  393. struct gfs2_jdesc *gfs2_jdesc_find_dirty(struct gfs2_sbd *sdp)
  394. {
  395. struct gfs2_jdesc *jd;
  396. int found = 0;
  397. spin_lock(&sdp->sd_jindex_spin);
  398. list_for_each_entry(jd, &sdp->sd_jindex_list, jd_list) {
  399. if (jd->jd_dirty) {
  400. jd->jd_dirty = 0;
  401. found = 1;
  402. break;
  403. }
  404. }
  405. spin_unlock(&sdp->sd_jindex_spin);
  406. if (!found)
  407. jd = NULL;
  408. return jd;
  409. }
  410. int gfs2_jdesc_check(struct gfs2_jdesc *jd)
  411. {
  412. struct gfs2_inode *ip = GFS2_I(jd->jd_inode);
  413. struct gfs2_sbd *sdp = GFS2_SB(jd->jd_inode);
  414. int ar;
  415. int error;
  416. if (ip->i_di.di_size < (8 << 20) || ip->i_di.di_size > (1 << 30) ||
  417. (ip->i_di.di_size & (sdp->sd_sb.sb_bsize - 1))) {
  418. gfs2_consist_inode(ip);
  419. return -EIO;
  420. }
  421. jd->jd_blocks = ip->i_di.di_size >> sdp->sd_sb.sb_bsize_shift;
  422. error = gfs2_write_alloc_required(ip, 0, ip->i_di.di_size, &ar);
  423. if (!error && ar) {
  424. gfs2_consist_inode(ip);
  425. error = -EIO;
  426. }
  427. return error;
  428. }
  429. /**
  430. * gfs2_make_fs_rw - Turn a Read-Only FS into a Read-Write one
  431. * @sdp: the filesystem
  432. *
  433. * Returns: errno
  434. */
  435. int gfs2_make_fs_rw(struct gfs2_sbd *sdp)
  436. {
  437. struct gfs2_inode *ip = GFS2_I(sdp->sd_jdesc->jd_inode);
  438. struct gfs2_glock *j_gl = ip->i_gl;
  439. struct gfs2_holder t_gh;
  440. struct gfs2_log_header_host head;
  441. int error;
  442. error = gfs2_glock_nq_init(sdp->sd_trans_gl, LM_ST_SHARED, 0, &t_gh);
  443. if (error)
  444. return error;
  445. gfs2_meta_cache_flush(ip);
  446. j_gl->gl_ops->go_inval(j_gl, DIO_METADATA);
  447. error = gfs2_find_jhead(sdp->sd_jdesc, &head);
  448. if (error)
  449. goto fail;
  450. if (!(head.lh_flags & GFS2_LOG_HEAD_UNMOUNT)) {
  451. gfs2_consist(sdp);
  452. error = -EIO;
  453. goto fail;
  454. }
  455. /* Initialize some head of the log stuff */
  456. sdp->sd_log_sequence = head.lh_sequence + 1;
  457. gfs2_log_pointers_init(sdp, head.lh_blkno);
  458. error = gfs2_quota_init(sdp);
  459. if (error)
  460. goto fail;
  461. set_bit(SDF_JOURNAL_LIVE, &sdp->sd_flags);
  462. gfs2_glock_dq_uninit(&t_gh);
  463. return 0;
  464. fail:
  465. t_gh.gh_flags |= GL_NOCACHE;
  466. gfs2_glock_dq_uninit(&t_gh);
  467. return error;
  468. }
  469. /**
  470. * gfs2_make_fs_ro - Turn a Read-Write FS into a Read-Only one
  471. * @sdp: the filesystem
  472. *
  473. * Returns: errno
  474. */
  475. int gfs2_make_fs_ro(struct gfs2_sbd *sdp)
  476. {
  477. struct gfs2_holder t_gh;
  478. int error;
  479. gfs2_quota_sync(sdp);
  480. gfs2_statfs_sync(sdp);
  481. error = gfs2_glock_nq_init(sdp->sd_trans_gl, LM_ST_SHARED, GL_NOCACHE,
  482. &t_gh);
  483. if (error && !test_bit(SDF_SHUTDOWN, &sdp->sd_flags))
  484. return error;
  485. gfs2_meta_syncfs(sdp);
  486. gfs2_log_shutdown(sdp);
  487. clear_bit(SDF_JOURNAL_LIVE, &sdp->sd_flags);
  488. if (t_gh.gh_gl)
  489. gfs2_glock_dq_uninit(&t_gh);
  490. gfs2_quota_cleanup(sdp);
  491. return error;
  492. }
  493. int gfs2_statfs_init(struct gfs2_sbd *sdp)
  494. {
  495. struct gfs2_inode *m_ip = GFS2_I(sdp->sd_statfs_inode);
  496. struct gfs2_statfs_change_host *m_sc = &sdp->sd_statfs_master;
  497. struct gfs2_inode *l_ip = GFS2_I(sdp->sd_sc_inode);
  498. struct gfs2_statfs_change_host *l_sc = &sdp->sd_statfs_local;
  499. struct buffer_head *m_bh, *l_bh;
  500. struct gfs2_holder gh;
  501. int error;
  502. error = gfs2_glock_nq_init(m_ip->i_gl, LM_ST_EXCLUSIVE, GL_NOCACHE,
  503. &gh);
  504. if (error)
  505. return error;
  506. error = gfs2_meta_inode_buffer(m_ip, &m_bh);
  507. if (error)
  508. goto out;
  509. if (sdp->sd_args.ar_spectator) {
  510. spin_lock(&sdp->sd_statfs_spin);
  511. gfs2_statfs_change_in(m_sc, m_bh->b_data +
  512. sizeof(struct gfs2_dinode));
  513. spin_unlock(&sdp->sd_statfs_spin);
  514. } else {
  515. error = gfs2_meta_inode_buffer(l_ip, &l_bh);
  516. if (error)
  517. goto out_m_bh;
  518. spin_lock(&sdp->sd_statfs_spin);
  519. gfs2_statfs_change_in(m_sc, m_bh->b_data +
  520. sizeof(struct gfs2_dinode));
  521. gfs2_statfs_change_in(l_sc, l_bh->b_data +
  522. sizeof(struct gfs2_dinode));
  523. spin_unlock(&sdp->sd_statfs_spin);
  524. brelse(l_bh);
  525. }
  526. out_m_bh:
  527. brelse(m_bh);
  528. out:
  529. gfs2_glock_dq_uninit(&gh);
  530. return 0;
  531. }
  532. void gfs2_statfs_change(struct gfs2_sbd *sdp, s64 total, s64 free,
  533. s64 dinodes)
  534. {
  535. struct gfs2_inode *l_ip = GFS2_I(sdp->sd_sc_inode);
  536. struct gfs2_statfs_change_host *l_sc = &sdp->sd_statfs_local;
  537. struct buffer_head *l_bh;
  538. int error;
  539. error = gfs2_meta_inode_buffer(l_ip, &l_bh);
  540. if (error)
  541. return;
  542. mutex_lock(&sdp->sd_statfs_mutex);
  543. gfs2_trans_add_bh(l_ip->i_gl, l_bh, 1);
  544. mutex_unlock(&sdp->sd_statfs_mutex);
  545. spin_lock(&sdp->sd_statfs_spin);
  546. l_sc->sc_total += total;
  547. l_sc->sc_free += free;
  548. l_sc->sc_dinodes += dinodes;
  549. gfs2_statfs_change_out(l_sc, l_bh->b_data + sizeof(struct gfs2_dinode));
  550. spin_unlock(&sdp->sd_statfs_spin);
  551. brelse(l_bh);
  552. }
  553. int gfs2_statfs_sync(struct gfs2_sbd *sdp)
  554. {
  555. struct gfs2_inode *m_ip = GFS2_I(sdp->sd_statfs_inode);
  556. struct gfs2_inode *l_ip = GFS2_I(sdp->sd_sc_inode);
  557. struct gfs2_statfs_change_host *m_sc = &sdp->sd_statfs_master;
  558. struct gfs2_statfs_change_host *l_sc = &sdp->sd_statfs_local;
  559. struct gfs2_holder gh;
  560. struct buffer_head *m_bh, *l_bh;
  561. int error;
  562. error = gfs2_glock_nq_init(m_ip->i_gl, LM_ST_EXCLUSIVE, GL_NOCACHE,
  563. &gh);
  564. if (error)
  565. return error;
  566. error = gfs2_meta_inode_buffer(m_ip, &m_bh);
  567. if (error)
  568. goto out;
  569. spin_lock(&sdp->sd_statfs_spin);
  570. gfs2_statfs_change_in(m_sc, m_bh->b_data +
  571. sizeof(struct gfs2_dinode));
  572. if (!l_sc->sc_total && !l_sc->sc_free && !l_sc->sc_dinodes) {
  573. spin_unlock(&sdp->sd_statfs_spin);
  574. goto out_bh;
  575. }
  576. spin_unlock(&sdp->sd_statfs_spin);
  577. error = gfs2_meta_inode_buffer(l_ip, &l_bh);
  578. if (error)
  579. goto out_bh;
  580. error = gfs2_trans_begin(sdp, 2 * RES_DINODE, 0);
  581. if (error)
  582. goto out_bh2;
  583. mutex_lock(&sdp->sd_statfs_mutex);
  584. gfs2_trans_add_bh(l_ip->i_gl, l_bh, 1);
  585. mutex_unlock(&sdp->sd_statfs_mutex);
  586. spin_lock(&sdp->sd_statfs_spin);
  587. m_sc->sc_total += l_sc->sc_total;
  588. m_sc->sc_free += l_sc->sc_free;
  589. m_sc->sc_dinodes += l_sc->sc_dinodes;
  590. memset(l_sc, 0, sizeof(struct gfs2_statfs_change));
  591. memset(l_bh->b_data + sizeof(struct gfs2_dinode),
  592. 0, sizeof(struct gfs2_statfs_change));
  593. spin_unlock(&sdp->sd_statfs_spin);
  594. gfs2_trans_add_bh(m_ip->i_gl, m_bh, 1);
  595. gfs2_statfs_change_out(m_sc, m_bh->b_data + sizeof(struct gfs2_dinode));
  596. gfs2_trans_end(sdp);
  597. out_bh2:
  598. brelse(l_bh);
  599. out_bh:
  600. brelse(m_bh);
  601. out:
  602. gfs2_glock_dq_uninit(&gh);
  603. return error;
  604. }
  605. /**
  606. * gfs2_statfs_i - Do a statfs
  607. * @sdp: the filesystem
  608. * @sg: the sg structure
  609. *
  610. * Returns: errno
  611. */
  612. int gfs2_statfs_i(struct gfs2_sbd *sdp, struct gfs2_statfs_change_host *sc)
  613. {
  614. struct gfs2_statfs_change_host *m_sc = &sdp->sd_statfs_master;
  615. struct gfs2_statfs_change_host *l_sc = &sdp->sd_statfs_local;
  616. spin_lock(&sdp->sd_statfs_spin);
  617. *sc = *m_sc;
  618. sc->sc_total += l_sc->sc_total;
  619. sc->sc_free += l_sc->sc_free;
  620. sc->sc_dinodes += l_sc->sc_dinodes;
  621. spin_unlock(&sdp->sd_statfs_spin);
  622. if (sc->sc_free < 0)
  623. sc->sc_free = 0;
  624. if (sc->sc_free > sc->sc_total)
  625. sc->sc_free = sc->sc_total;
  626. if (sc->sc_dinodes < 0)
  627. sc->sc_dinodes = 0;
  628. return 0;
  629. }
  630. /**
  631. * statfs_fill - fill in the sg for a given RG
  632. * @rgd: the RG
  633. * @sc: the sc structure
  634. *
  635. * Returns: 0 on success, -ESTALE if the LVB is invalid
  636. */
  637. static int statfs_slow_fill(struct gfs2_rgrpd *rgd,
  638. struct gfs2_statfs_change_host *sc)
  639. {
  640. gfs2_rgrp_verify(rgd);
  641. sc->sc_total += rgd->rd_ri.ri_data;
  642. sc->sc_free += rgd->rd_rg.rg_free;
  643. sc->sc_dinodes += rgd->rd_rg.rg_dinodes;
  644. return 0;
  645. }
  646. /**
  647. * gfs2_statfs_slow - Stat a filesystem using asynchronous locking
  648. * @sdp: the filesystem
  649. * @sc: the sc info that will be returned
  650. *
  651. * Any error (other than a signal) will cause this routine to fall back
  652. * to the synchronous version.
  653. *
  654. * FIXME: This really shouldn't busy wait like this.
  655. *
  656. * Returns: errno
  657. */
  658. int gfs2_statfs_slow(struct gfs2_sbd *sdp, struct gfs2_statfs_change_host *sc)
  659. {
  660. struct gfs2_holder ri_gh;
  661. struct gfs2_rgrpd *rgd_next;
  662. struct gfs2_holder *gha, *gh;
  663. unsigned int slots = 64;
  664. unsigned int x;
  665. int done;
  666. int error = 0, err;
  667. memset(sc, 0, sizeof(struct gfs2_statfs_change_host));
  668. gha = kcalloc(slots, sizeof(struct gfs2_holder), GFP_KERNEL);
  669. if (!gha)
  670. return -ENOMEM;
  671. error = gfs2_rindex_hold(sdp, &ri_gh);
  672. if (error)
  673. goto out;
  674. rgd_next = gfs2_rgrpd_get_first(sdp);
  675. for (;;) {
  676. done = 1;
  677. for (x = 0; x < slots; x++) {
  678. gh = gha + x;
  679. if (gh->gh_gl && gfs2_glock_poll(gh)) {
  680. err = gfs2_glock_wait(gh);
  681. if (err) {
  682. gfs2_holder_uninit(gh);
  683. error = err;
  684. } else {
  685. if (!error)
  686. error = statfs_slow_fill(
  687. gh->gh_gl->gl_object, sc);
  688. gfs2_glock_dq_uninit(gh);
  689. }
  690. }
  691. if (gh->gh_gl)
  692. done = 0;
  693. else if (rgd_next && !error) {
  694. error = gfs2_glock_nq_init(rgd_next->rd_gl,
  695. LM_ST_SHARED,
  696. GL_ASYNC,
  697. gh);
  698. rgd_next = gfs2_rgrpd_get_next(rgd_next);
  699. done = 0;
  700. }
  701. if (signal_pending(current))
  702. error = -ERESTARTSYS;
  703. }
  704. if (done)
  705. break;
  706. yield();
  707. }
  708. gfs2_glock_dq_uninit(&ri_gh);
  709. out:
  710. kfree(gha);
  711. return error;
  712. }
  713. struct lfcc {
  714. struct list_head list;
  715. struct gfs2_holder gh;
  716. };
  717. /**
  718. * gfs2_lock_fs_check_clean - Stop all writes to the FS and check that all
  719. * journals are clean
  720. * @sdp: the file system
  721. * @state: the state to put the transaction lock into
  722. * @t_gh: the hold on the transaction lock
  723. *
  724. * Returns: errno
  725. */
  726. static int gfs2_lock_fs_check_clean(struct gfs2_sbd *sdp,
  727. struct gfs2_holder *t_gh)
  728. {
  729. struct gfs2_inode *ip;
  730. struct gfs2_holder ji_gh;
  731. struct gfs2_jdesc *jd;
  732. struct lfcc *lfcc;
  733. LIST_HEAD(list);
  734. struct gfs2_log_header_host lh;
  735. int error;
  736. error = gfs2_jindex_hold(sdp, &ji_gh);
  737. if (error)
  738. return error;
  739. list_for_each_entry(jd, &sdp->sd_jindex_list, jd_list) {
  740. lfcc = kmalloc(sizeof(struct lfcc), GFP_KERNEL);
  741. if (!lfcc) {
  742. error = -ENOMEM;
  743. goto out;
  744. }
  745. ip = GFS2_I(jd->jd_inode);
  746. error = gfs2_glock_nq_init(ip->i_gl, LM_ST_SHARED, 0, &lfcc->gh);
  747. if (error) {
  748. kfree(lfcc);
  749. goto out;
  750. }
  751. list_add(&lfcc->list, &list);
  752. }
  753. error = gfs2_glock_nq_init(sdp->sd_trans_gl, LM_ST_DEFERRED,
  754. LM_FLAG_PRIORITY | GL_NOCACHE,
  755. t_gh);
  756. list_for_each_entry(jd, &sdp->sd_jindex_list, jd_list) {
  757. error = gfs2_jdesc_check(jd);
  758. if (error)
  759. break;
  760. error = gfs2_find_jhead(jd, &lh);
  761. if (error)
  762. break;
  763. if (!(lh.lh_flags & GFS2_LOG_HEAD_UNMOUNT)) {
  764. error = -EBUSY;
  765. break;
  766. }
  767. }
  768. if (error)
  769. gfs2_glock_dq_uninit(t_gh);
  770. out:
  771. while (!list_empty(&list)) {
  772. lfcc = list_entry(list.next, struct lfcc, list);
  773. list_del(&lfcc->list);
  774. gfs2_glock_dq_uninit(&lfcc->gh);
  775. kfree(lfcc);
  776. }
  777. gfs2_glock_dq_uninit(&ji_gh);
  778. return error;
  779. }
  780. /**
  781. * gfs2_freeze_fs - freezes the file system
  782. * @sdp: the file system
  783. *
  784. * This function flushes data and meta data for all machines by
  785. * aquiring the transaction log exclusively. All journals are
  786. * ensured to be in a clean state as well.
  787. *
  788. * Returns: errno
  789. */
  790. int gfs2_freeze_fs(struct gfs2_sbd *sdp)
  791. {
  792. int error = 0;
  793. mutex_lock(&sdp->sd_freeze_lock);
  794. if (!sdp->sd_freeze_count++) {
  795. error = gfs2_lock_fs_check_clean(sdp, &sdp->sd_freeze_gh);
  796. if (error)
  797. sdp->sd_freeze_count--;
  798. }
  799. mutex_unlock(&sdp->sd_freeze_lock);
  800. return error;
  801. }
  802. /**
  803. * gfs2_unfreeze_fs - unfreezes the file system
  804. * @sdp: the file system
  805. *
  806. * This function allows the file system to proceed by unlocking
  807. * the exclusively held transaction lock. Other GFS2 nodes are
  808. * now free to acquire the lock shared and go on with their lives.
  809. *
  810. */
  811. void gfs2_unfreeze_fs(struct gfs2_sbd *sdp)
  812. {
  813. mutex_lock(&sdp->sd_freeze_lock);
  814. if (sdp->sd_freeze_count && !--sdp->sd_freeze_count)
  815. gfs2_glock_dq_uninit(&sdp->sd_freeze_gh);
  816. mutex_unlock(&sdp->sd_freeze_lock);
  817. }