xfs_trans_ail.c 22 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
3704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810
  1. /*
  2. * Copyright (c) 2000-2002,2005 Silicon Graphics, Inc.
  3. * Copyright (c) 2008 Dave Chinner
  4. * All Rights Reserved.
  5. *
  6. * This program is free software; you can redistribute it and/or
  7. * modify it under the terms of the GNU General Public License as
  8. * published by the Free Software Foundation.
  9. *
  10. * This program is distributed in the hope that it would be useful,
  11. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  12. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
  13. * GNU General Public License for more details.
  14. *
  15. * You should have received a copy of the GNU General Public License
  16. * along with this program; if not, write the Free Software Foundation,
  17. * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA
  18. */
  19. #include "xfs.h"
  20. #include "xfs_fs.h"
  21. #include "xfs_types.h"
  22. #include "xfs_log.h"
  23. #include "xfs_inum.h"
  24. #include "xfs_trans.h"
  25. #include "xfs_sb.h"
  26. #include "xfs_ag.h"
  27. #include "xfs_mount.h"
  28. #include "xfs_trans_priv.h"
  29. #include "xfs_error.h"
  30. struct workqueue_struct *xfs_ail_wq; /* AIL workqueue pointer; NOTE(review): the AIL work visible in this file is queued on xfs_syncd_wq, not on this pointer - confirm where it is set up and used */
  #ifdef DEBUG
  /*
   * Debug-only sanity check of the AIL ordering around @lip.
   *
   * Nothing is checked when the AIL is empty. Otherwise @lip must carry
   * XFS_LI_IN_AIL, and each immediate neighbour that is a real item (i.e.
   * not the list head) must respect ascending LSN order relative to @lip.
   *
   * With XFS_TRANS_DEBUG also defined, the entire list is walked to verify
   * the ordering and the XFS_LI_IN_AIL flag of every entry. That walk is
   * expensive, so it is only enabled when debugging the transaction
   * subsystem.
   */
  STATIC void
  xfs_ail_check(
      struct xfs_ail  *ailp,
      xfs_log_item_t  *lip)
  {
      struct list_head    *head = &ailp->xa_ail;
      xfs_log_item_t      *before;
      xfs_log_item_t      *after;
  #ifdef XFS_TRANS_DEBUG
      xfs_log_item_t      *pos;
      xfs_log_item_t      *last = NULL;
  #endif

      if (list_empty(head))
          return;

      ASSERT((lip->li_flags & XFS_LI_IN_AIL) != 0);

      /* A real predecessor must not have a larger LSN than @lip. */
      before = list_entry(lip->li_ail.prev, xfs_log_item_t, li_ail);
      if (&before->li_ail != head) {
          ASSERT(XFS_LSN_CMP(before->li_lsn, lip->li_lsn) <= 0);
      }

      /* A real successor must not have a smaller LSN than @lip. */
      after = list_entry(lip->li_ail.next, xfs_log_item_t, li_ail);
      if (&after->li_ail != head) {
          ASSERT(XFS_LSN_CMP(after->li_lsn, lip->li_lsn) >= 0);
      }

  #ifdef XFS_TRANS_DEBUG
      /* Full walk: every adjacent pair is ordered, every entry is flagged. */
      list_for_each_entry(pos, head, li_ail) {
          if (last) {
              ASSERT(XFS_LSN_CMP(last->li_lsn, pos->li_lsn) <= 0);
          }
          ASSERT((pos->li_flags & XFS_LI_IN_AIL) != 0);
          last = pos;
      }
  #endif /* XFS_TRANS_DEBUG */
  }
  #else /* !DEBUG */
  #define xfs_ail_check(a,l)
  #endif /* DEBUG */
  71. /*
  72. * Return a pointer to the first item in the AIL. If the AIL is empty, then
  73. * return NULL.
  74. */
  75. static xfs_log_item_t *
  76. xfs_ail_min(
  77. struct xfs_ail *ailp)
  78. {
  79. if (list_empty(&ailp->xa_ail))
  80. return NULL;
  81. return list_first_entry(&ailp->xa_ail, xfs_log_item_t, li_ail);
  82. }
  83. /*
  84. * Return a pointer to the last item in the AIL. If the AIL is empty, then
  85. * return NULL.
  86. */
  87. static xfs_log_item_t *
  88. xfs_ail_max(
  89. struct xfs_ail *ailp)
  90. {
  91. if (list_empty(&ailp->xa_ail))
  92. return NULL;
  93. return list_entry(ailp->xa_ail.prev, xfs_log_item_t, li_ail);
  94. }
  95. /*
  96. * Return a pointer to the item which follows the given item in the AIL. If
  97. * the given item is the last item in the list, then return NULL.
  98. */
  99. static xfs_log_item_t *
  100. xfs_ail_next(
  101. struct xfs_ail *ailp,
  102. xfs_log_item_t *lip)
  103. {
  104. if (lip->li_ail.next == &ailp->xa_ail)
  105. return NULL;
  106. return list_first_entry(&lip->li_ail, xfs_log_item_t, li_ail);
  107. }
  108. /*
  109. * This is called by the log manager code to determine the LSN of the tail of
  110. * the log. This is exactly the LSN of the first item in the AIL. If the AIL
  111. * is empty, then this function returns 0.
  112. *
  113. * We need the AIL lock in order to get a coherent read of the lsn of the last
  114. * item in the AIL.
  115. */
  116. xfs_lsn_t
  117. xfs_ail_min_lsn(
  118. struct xfs_ail *ailp)
  119. {
  120. xfs_lsn_t lsn = 0;
  121. xfs_log_item_t *lip;
  122. spin_lock(&ailp->xa_lock);
  123. lip = xfs_ail_min(ailp);
  124. if (lip)
  125. lsn = lip->li_lsn;
  126. spin_unlock(&ailp->xa_lock);
  127. return lsn;
  128. }
  129. /*
  130. * Return the maximum lsn held in the AIL, or zero if the AIL is empty.
  131. */
  132. static xfs_lsn_t
  133. xfs_ail_max_lsn(
  134. struct xfs_ail *ailp)
  135. {
  136. xfs_lsn_t lsn = 0;
  137. xfs_log_item_t *lip;
  138. spin_lock(&ailp->xa_lock);
  139. lip = xfs_ail_max(ailp);
  140. if (lip)
  141. lsn = lip->li_lsn;
  142. spin_unlock(&ailp->xa_lock);
  143. return lsn;
  144. }
  145. /*
  146. * AIL traversal cursor initialisation.
  147. *
  148. * The cursor keeps track of where our current traversal is up
  149. * to by tracking the next ƣtem in the list for us. However, for
  150. * this to be safe, removing an object from the AIL needs to invalidate
  151. * any cursor that points to it. hence the traversal cursor needs to
  152. * be linked to the struct xfs_ail so that deletion can search all the
  153. * active cursors for invalidation.
  154. *
  155. * We don't link the push cursor because it is embedded in the struct
  156. * xfs_ail and hence easily findable.
  157. */
  158. STATIC void
  159. xfs_trans_ail_cursor_init(
  160. struct xfs_ail *ailp,
  161. struct xfs_ail_cursor *cur)
  162. {
  163. cur->item = NULL;
  164. if (cur == &ailp->xa_cursors)
  165. return;
  166. cur->next = ailp->xa_cursors.next;
  167. ailp->xa_cursors.next = cur;
  168. }
  169. /*
  170. * Set the cursor to the next item, because when we look
  171. * up the cursor the current item may have been freed.
  172. */
  173. STATIC void
  174. xfs_trans_ail_cursor_set(
  175. struct xfs_ail *ailp,
  176. struct xfs_ail_cursor *cur,
  177. struct xfs_log_item *lip)
  178. {
  179. if (lip)
  180. cur->item = xfs_ail_next(ailp, lip);
  181. }
  182. /*
  183. * Get the next item in the traversal and advance the cursor.
  184. * If the cursor was invalidated (inidicated by a lip of 1),
  185. * restart the traversal.
  186. */
  187. struct xfs_log_item *
  188. xfs_trans_ail_cursor_next(
  189. struct xfs_ail *ailp,
  190. struct xfs_ail_cursor *cur)
  191. {
  192. struct xfs_log_item *lip = cur->item;
  193. if ((__psint_t)lip & 1)
  194. lip = xfs_ail_min(ailp);
  195. xfs_trans_ail_cursor_set(ailp, cur, lip);
  196. return lip;
  197. }
  198. /*
  199. * Now that the traversal is complete, we need to remove the cursor
  200. * from the list of traversing cursors. Avoid removing the embedded
  201. * push cursor, but use the fact it is always present to make the
  202. * list deletion simple.
  203. */
  204. void
  205. xfs_trans_ail_cursor_done(
  206. struct xfs_ail *ailp,
  207. struct xfs_ail_cursor *done)
  208. {
  209. struct xfs_ail_cursor *prev = NULL;
  210. struct xfs_ail_cursor *cur;
  211. done->item = NULL;
  212. if (done == &ailp->xa_cursors)
  213. return;
  214. prev = &ailp->xa_cursors;
  215. for (cur = prev->next; cur; prev = cur, cur = prev->next) {
  216. if (cur == done) {
  217. prev->next = cur->next;
  218. break;
  219. }
  220. }
  221. ASSERT(cur);
  222. }
  223. /*
  224. * Invalidate any cursor that is pointing to this item. This is
  225. * called when an item is removed from the AIL. Any cursor pointing
  226. * to this object is now invalid and the traversal needs to be
  227. * terminated so it doesn't reference a freed object. We set the
  228. * cursor item to a value of 1 so we can distinguish between an
  229. * invalidation and the end of the list when getting the next item
  230. * from the cursor.
  231. */
  232. STATIC void
  233. xfs_trans_ail_cursor_clear(
  234. struct xfs_ail *ailp,
  235. struct xfs_log_item *lip)
  236. {
  237. struct xfs_ail_cursor *cur;
  238. /* need to search all cursors */
  239. for (cur = &ailp->xa_cursors; cur; cur = cur->next) {
  240. if (cur->item == lip)
  241. cur->item = (struct xfs_log_item *)
  242. ((__psint_t)cur->item | 1);
  243. }
  244. }
  245. /*
  246. * Return the item in the AIL with the current lsn.
  247. * Return the current tree generation number for use
  248. * in calls to xfs_trans_next_ail().
  249. */
  250. xfs_log_item_t *
  251. xfs_trans_ail_cursor_first(
  252. struct xfs_ail *ailp,
  253. struct xfs_ail_cursor *cur,
  254. xfs_lsn_t lsn)
  255. {
  256. xfs_log_item_t *lip;
  257. xfs_trans_ail_cursor_init(ailp, cur);
  258. lip = xfs_ail_min(ailp);
  259. if (lsn == 0)
  260. goto out;
  261. list_for_each_entry(lip, &ailp->xa_ail, li_ail) {
  262. if (XFS_LSN_CMP(lip->li_lsn, lsn) >= 0)
  263. goto out;
  264. }
  265. lip = NULL;
  266. out:
  267. xfs_trans_ail_cursor_set(ailp, cur, lip);
  268. return lip;
  269. }
  270. /*
  271. * splice the log item list into the AIL at the given LSN.
  272. */
  273. static void
  274. xfs_ail_splice(
  275. struct xfs_ail *ailp,
  276. struct list_head *list,
  277. xfs_lsn_t lsn)
  278. {
  279. xfs_log_item_t *next_lip;
  280. /* If the list is empty, just insert the item. */
  281. if (list_empty(&ailp->xa_ail)) {
  282. list_splice(list, &ailp->xa_ail);
  283. return;
  284. }
  285. list_for_each_entry_reverse(next_lip, &ailp->xa_ail, li_ail) {
  286. if (XFS_LSN_CMP(next_lip->li_lsn, lsn) <= 0)
  287. break;
  288. }
  289. ASSERT(&next_lip->li_ail == &ailp->xa_ail ||
  290. XFS_LSN_CMP(next_lip->li_lsn, lsn) <= 0);
  291. list_splice_init(list, &next_lip->li_ail);
  292. }
  293. /*
  294. * Delete the given item from the AIL. Return a pointer to the item.
  295. */
  296. static void
  297. xfs_ail_delete(
  298. struct xfs_ail *ailp,
  299. xfs_log_item_t *lip)
  300. {
  301. xfs_ail_check(ailp, lip);
  302. list_del(&lip->li_ail);
  303. xfs_trans_ail_cursor_clear(ailp, lip);
  304. }
  305. /*
  306. * xfs_ail_worker does the work of pushing on the AIL. It will requeue itself
  307. * to run at a later time if there is more work to do to complete the push.
  308. */
  309. STATIC void
  310. xfs_ail_worker(
  311. struct work_struct *work)
  312. {
  313. struct xfs_ail *ailp = container_of(to_delayed_work(work),
  314. struct xfs_ail, xa_work);
  315. xfs_mount_t *mp = ailp->xa_mount;
  316. struct xfs_ail_cursor *cur = &ailp->xa_cursors; /* the embedded push cursor */
  317. xfs_log_item_t *lip;
  318. xfs_lsn_t lsn; /* LSN of the item currently being looked at */
  319. xfs_lsn_t target; /* snapshot of xa_target taken under xa_lock */
  320. long tout = 10; /* requeue delay in milliseconds (see msecs_to_jiffies() below) */
  321. int flush_log = 0; /* set when a pinned item was seen */
  322. int stuck = 0; /* number of items found pinned or locked */
  323. int count = 0; /* number of items examined in this pass */
  324. int push_xfsbufd = 0; /* set when an item was pushed via IOP_PUSHBUF */
  325. spin_lock(&ailp->xa_lock);
  326. target = ailp->xa_target;
  327. xfs_trans_ail_cursor_init(ailp, cur);
  328. lip = xfs_trans_ail_cursor_first(ailp, cur, ailp->xa_last_pushed_lsn);
  329. if (!lip || XFS_FORCED_SHUTDOWN(mp)) {
  330. /*
  331. * AIL is empty, our push has reached the end, or the filesystem
  332. * has been shut down.
  333. */
  333. xfs_trans_ail_cursor_done(ailp, cur);
  334. spin_unlock(&ailp->xa_lock);
  335. goto out_done;
  336. }
  337. XFS_STATS_INC(xs_push_ail);
  338. /*
  339. * While the item we are looking at is below the given threshold
  340. * try to flush it out. We'd like not to stop until we've at least
  341. * tried to push on everything in the AIL with an LSN less than
  342. * the given threshold.
  343. *
  344. * However, we will stop after a certain number of pushes and wait
  345. * for a reduced timeout to fire before pushing further. This
  346. * prevents us from spinning when we can't do anything or there is
  347. * lots of contention on the AIL lists.
  348. */
  349. lsn = lip->li_lsn;
  350. while ((XFS_LSN_CMP(lip->li_lsn, target) <= 0)) {
  351. int lock_result;
  352. /*
  353. * If we can lock the item without sleeping, unlock the AIL
  354. * lock and flush the item. Then re-grab the AIL lock so we
  355. * can look for the next item on the AIL. List changes are
  356. * handled by the AIL lookup functions internally
  357. *
  358. * If we can't lock the item, either its holder will flush it
  359. * or it is already being flushed or it is being relogged. In
  360. * any of these cases it is being taken care of and we can just
  361. * skip to the next item in the list.
  362. */
  363. lock_result = IOP_TRYLOCK(lip);
  364. spin_unlock(&ailp->xa_lock);
  365. switch (lock_result) {
  366. case XFS_ITEM_SUCCESS:
  367. XFS_STATS_INC(xs_push_ail_success);
  368. IOP_PUSH(lip);
  369. ailp->xa_last_pushed_lsn = lsn;
  370. break;
  371. case XFS_ITEM_PUSHBUF:
  372. XFS_STATS_INC(xs_push_ail_pushbuf);
  373. IOP_PUSHBUF(lip);
  374. ailp->xa_last_pushed_lsn = lsn;
  375. push_xfsbufd = 1;
  376. break;
  377. case XFS_ITEM_PINNED:
  378. XFS_STATS_INC(xs_push_ail_pinned);
  379. stuck++;
  380. flush_log = 1;
  381. break;
  382. case XFS_ITEM_LOCKED:
  383. XFS_STATS_INC(xs_push_ail_locked);
  384. ailp->xa_last_pushed_lsn = lsn;
  385. stuck++;
  386. break;
  387. default:
  388. ASSERT(0);
  389. break;
  390. }
  391. spin_lock(&ailp->xa_lock);
  392. /* should we bother continuing? */
  393. if (XFS_FORCED_SHUTDOWN(mp))
  394. break;
  395. ASSERT(mp->m_log);
  396. count++;
  397. /*
  398. * Are there too many items we can't do anything with?
  399. * If we are skipping too many items because we can't flush
  400. * them or they are already being flushed, we back off and
  401. * give them time to complete whatever operation is being
  402. * done. i.e. remove pressure from the AIL while we can't make
  403. * progress so traversals don't slow down further inserts and
  404. * removals to/from the AIL.
  405. *
  406. * The value of 100 is an arbitrary magic number based on
  407. * observation.
  408. */
  409. if (stuck > 100)
  410. break;
  411. lip = xfs_trans_ail_cursor_next(ailp, cur);
  412. if (lip == NULL)
  413. break;
  414. lsn = lip->li_lsn;
  415. }
  416. xfs_trans_ail_cursor_done(ailp, cur);
  417. spin_unlock(&ailp->xa_lock);
  418. if (flush_log) {
  419. /*
  420. * If something we need to push out was pinned, then
  421. * push out the log so it will become unpinned and
  422. * move forward in the AIL.
  423. */
  424. XFS_STATS_INC(xs_push_ail_flush);
  425. xfs_log_force(mp, 0);
  426. }
  427. if (push_xfsbufd) {
  428. /* we've got delayed write buffers to flush */
  429. wake_up_process(mp->m_ddev_targp->bt_task);
  430. }
  431. /* assume we have more work to do in a short while */
  432. out_done:
  433. if (!count) {
  434. /* We're past our target or empty, so idle */
  435. ailp->xa_last_pushed_lsn = 0;
  436. /*
  437. * We clear the XFS_AIL_PUSHING_BIT first before checking
  438. * whether the target has changed. If the target has changed,
  439. * this pushes the requeue race directly onto the result of the
  440. * atomic test/set bit, so we are guaranteed that either the
  441. * pusher that changed the target or ourselves will requeue
  442. * the work (but not both).
  443. */
  444. clear_bit(XFS_AIL_PUSHING_BIT, &ailp->xa_flags);
  445. smp_rmb();
  446. if (XFS_LSN_CMP(ailp->xa_target, target) == 0 ||
  447. test_and_set_bit(XFS_AIL_PUSHING_BIT, &ailp->xa_flags))
  448. return;
  449. tout = 50;
  450. } else if (XFS_LSN_CMP(lsn, target) >= 0) {
  451. /*
  452. * We reached the target so wait a bit longer for I/O to
  453. * complete and remove pushed items from the AIL before we
  454. * start the next scan from the start of the AIL.
  455. */
  456. tout = 50;
  457. ailp->xa_last_pushed_lsn = 0;
  458. } else if ((stuck * 100) / count > 90) {
  459. /*
  460. * Either there is a lot of contention on the AIL or we
  461. * are stuck due to operations in progress. "Stuck" in this
  462. * case is defined as >90% of the items we tried to push
  463. * were stuck.
  464. *
  465. * Backoff a bit more to allow some I/O to complete before
  466. * continuing from where we were.
  467. */
  468. tout = 20;
  469. }
  470. /* There is more to do, requeue us. */
  471. queue_delayed_work(xfs_syncd_wq, &ailp->xa_work,
  472. msecs_to_jiffies(tout));
  473. }
  474. /*
  475. * This routine is called to move the tail of the AIL forward. It does this by
  476. * trying to flush items in the AIL whose lsns are below the given
  477. * threshold_lsn.
  478. *
  479. * The push is run asynchronously in a workqueue, which means the caller needs
  480. * to handle waiting on the async flush for space to become available.
  481. * We don't want to interrupt any push that is in progress, hence we only queue
  482. * work if we set the pushing bit approriately.
  483. *
  484. * We do this unlocked - we only need to know whether there is anything in the
  485. * AIL at the time we are called. We don't need to access the contents of
  486. * any of the objects, so the lock is not needed.
  487. */
  488. void
  489. xfs_ail_push(
  490. struct xfs_ail *ailp,
  491. xfs_lsn_t threshold_lsn)
  492. {
  493. xfs_log_item_t *lip;
  494. lip = xfs_ail_min(ailp);
  495. if (!lip || XFS_FORCED_SHUTDOWN(ailp->xa_mount) ||
  496. XFS_LSN_CMP(threshold_lsn, ailp->xa_target) <= 0)
  497. return;
  498. /*
  499. * Ensure that the new target is noticed in push code before it clears
  500. * the XFS_AIL_PUSHING_BIT.
  501. */
  502. smp_wmb();
  503. xfs_trans_ail_copy_lsn(ailp, &ailp->xa_target, &threshold_lsn);
  504. if (!test_and_set_bit(XFS_AIL_PUSHING_BIT, &ailp->xa_flags))
  505. queue_delayed_work(xfs_syncd_wq, &ailp->xa_work, 0);
  506. }
  507. /*
  508. * Push out all items in the AIL immediately
  509. */
  510. void
  511. xfs_ail_push_all(
  512. struct xfs_ail *ailp)
  513. {
  514. xfs_lsn_t threshold_lsn = xfs_ail_max_lsn(ailp);
  515. if (threshold_lsn)
  516. xfs_ail_push(ailp, threshold_lsn);
  517. }
  518. /*
  519. * This is to be called when an item is unlocked that may have
  520. * been in the AIL. It will wake up the first member of the AIL
  521. * wait list if this item's unlocking might allow it to progress.
  522. * If the item is in the AIL, then we need to get the AIL lock
  523. * while doing our checking so we don't race with someone going
  524. * to sleep waiting for this event in xfs_trans_push_ail().
  525. */
  526. void
  527. xfs_trans_unlocked_item(
  528. struct xfs_ail *ailp,
  529. xfs_log_item_t *lip)
  530. {
  531. xfs_log_item_t *min_lip;
  532. /*
  533. * If we're forcibly shutting down, we may have
  534. * unlocked log items arbitrarily. The last thing
  535. * we want to do is to move the tail of the log
  536. * over some potentially valid data.
  537. */
  538. if (!(lip->li_flags & XFS_LI_IN_AIL) ||
  539. XFS_FORCED_SHUTDOWN(ailp->xa_mount)) {
  540. return;
  541. }
  542. /*
  543. * This is the one case where we can call into xfs_ail_min()
  544. * without holding the AIL lock because we only care about the
  545. * case where we are at the tail of the AIL. If the object isn't
  546. * at the tail, it doesn't matter what result we get back. This
  547. * is slightly racy because since we were just unlocked, we could
  548. * go to sleep between the call to xfs_ail_min and the call to
  549. * xfs_log_move_tail, have someone else lock us, commit to us disk,
  550. * move us out of the tail of the AIL, and then we wake up. However,
  551. * the call to xfs_log_move_tail() doesn't do anything if there's
  552. * not enough free space to wake people up so we're safe calling it.
  553. */
  554. min_lip = xfs_ail_min(ailp);
  555. if (min_lip == lip)
  556. xfs_log_move_tail(ailp->xa_mount, 1);
  557. } /* xfs_trans_unlocked_item */
  558. /*
  559. * xfs_trans_ail_update - bulk AIL insertion operation.
  560. *
  561. * @xfs_trans_ail_update takes an array of log items that all need to be
  562. * positioned at the same LSN in the AIL. If an item is not in the AIL, it will
  563. * be added. Otherwise, it will be repositioned by removing it and re-adding
  564. * it to the AIL. If we move the first item in the AIL, update the log tail to
  565. * match the new minimum LSN in the AIL.
  566. *
  567. * This function takes the AIL lock once to execute the update operations on
  568. * all the items in the array, and as such should not be called with the AIL
  569. * lock held. As a result, once we have the AIL lock, we need to check each log
  570. * item LSN to confirm it needs to be moved forward in the AIL.
  571. *
  572. * To optimise the insert operation, we delete all the items from the AIL in
  573. * the first pass, moving them into a temporary list, then splice the temporary
  574. * list into the correct position in the AIL. This avoids needing to do an
  575. * insert operation on every item.
  576. *
  577. * This function must be called with the AIL lock held. The lock is dropped
  578. * before returning.
  579. */
  580. void
  581. xfs_trans_ail_update_bulk(
  582. struct xfs_ail *ailp,
  583. struct xfs_log_item **log_items,
  584. int nr_items,
  585. xfs_lsn_t lsn) __releases(ailp->xa_lock)
  586. {
  587. xfs_log_item_t *mlip;
  588. xfs_lsn_t tail_lsn;
  589. int mlip_changed = 0;
  590. int i;
  591. LIST_HEAD(tmp);
  592. mlip = xfs_ail_min(ailp);
  593. for (i = 0; i < nr_items; i++) {
  594. struct xfs_log_item *lip = log_items[i];
  595. if (lip->li_flags & XFS_LI_IN_AIL) {
  596. /* check if we really need to move the item */
  597. if (XFS_LSN_CMP(lsn, lip->li_lsn) <= 0)
  598. continue;
  599. xfs_ail_delete(ailp, lip);
  600. if (mlip == lip)
  601. mlip_changed = 1;
  602. } else {
  603. lip->li_flags |= XFS_LI_IN_AIL;
  604. }
  605. lip->li_lsn = lsn;
  606. list_add(&lip->li_ail, &tmp);
  607. }
  608. xfs_ail_splice(ailp, &tmp, lsn);
  609. if (!mlip_changed) {
  610. spin_unlock(&ailp->xa_lock);
  611. return;
  612. }
  613. /*
  614. * It is not safe to access mlip after the AIL lock is dropped, so we
  615. * must get a copy of li_lsn before we do so. This is especially
  616. * important on 32-bit platforms where accessing and updating 64-bit
  617. * values like li_lsn is not atomic.
  618. */
  619. mlip = xfs_ail_min(ailp);
  620. tail_lsn = mlip->li_lsn;
  621. spin_unlock(&ailp->xa_lock);
  622. xfs_log_move_tail(ailp->xa_mount, tail_lsn);
  623. }
  624. /*
  625. * xfs_trans_ail_delete_bulk - remove multiple log items from the AIL
  626. *
  627. * @xfs_trans_ail_delete_bulk takes an array of log items that all need to
  628. * removed from the AIL. The caller is already holding the AIL lock, and done
  629. * all the checks necessary to ensure the items passed in via @log_items are
  630. * ready for deletion. This includes checking that the items are in the AIL.
  631. *
  632. * For each log item to be removed, unlink it from the AIL, clear the IN_AIL
  633. * flag from the item and reset the item's lsn to 0. If we remove the first
  634. * item in the AIL, update the log tail to match the new minimum LSN in the
  635. * AIL.
  636. *
  637. * This function will not drop the AIL lock until all items are removed from
  638. * the AIL to minimise the amount of lock traffic on the AIL. This does not
  639. * greatly increase the AIL hold time, but does significantly reduce the amount
  640. * of traffic on the lock, especially during IO completion.
  641. *
  642. * This function must be called with the AIL lock held. The lock is dropped
  643. * before returning.
  644. */
  645. void
  646. xfs_trans_ail_delete_bulk(
  647. struct xfs_ail *ailp,
  648. struct xfs_log_item **log_items,
  649. int nr_items) __releases(ailp->xa_lock)
  650. {
  651. xfs_log_item_t *mlip;
  652. xfs_lsn_t tail_lsn;
  653. int mlip_changed = 0;
  654. int i;
  655. mlip = xfs_ail_min(ailp);
  656. for (i = 0; i < nr_items; i++) {
  657. struct xfs_log_item *lip = log_items[i];
  658. if (!(lip->li_flags & XFS_LI_IN_AIL)) {
  659. struct xfs_mount *mp = ailp->xa_mount;
  660. spin_unlock(&ailp->xa_lock);
  661. if (!XFS_FORCED_SHUTDOWN(mp)) {
  662. xfs_alert_tag(mp, XFS_PTAG_AILDELETE,
  663. "%s: attempting to delete a log item that is not in the AIL",
  664. __func__);
  665. xfs_force_shutdown(mp, SHUTDOWN_CORRUPT_INCORE);
  666. }
  667. return;
  668. }
  669. xfs_ail_delete(ailp, lip);
  670. lip->li_flags &= ~XFS_LI_IN_AIL;
  671. lip->li_lsn = 0;
  672. if (mlip == lip)
  673. mlip_changed = 1;
  674. }
  675. if (!mlip_changed) {
  676. spin_unlock(&ailp->xa_lock);
  677. return;
  678. }
  679. /*
  680. * It is not safe to access mlip after the AIL lock is dropped, so we
  681. * must get a copy of li_lsn before we do so. This is especially
  682. * important on 32-bit platforms where accessing and updating 64-bit
  683. * values like li_lsn is not atomic. It is possible we've emptied the
  684. * AIL here, so if that is the case, pass an LSN of 0 to the tail move.
  685. */
  686. mlip = xfs_ail_min(ailp);
  687. tail_lsn = mlip ? mlip->li_lsn : 0;
  688. spin_unlock(&ailp->xa_lock);
  689. xfs_log_move_tail(ailp->xa_mount, tail_lsn);
  690. }
  691. /*
  692. * The active item list (AIL) is a doubly linked list of log
  693. * items sorted by ascending lsn. The base of the list is
  694. * a forw/back pointer pair embedded in the struct xfs_ail that
  695. * the xfs mount structure points to. The base is initialized with
  696. * both pointers pointing to the base. This case always needs to be
  697. * distinguished, because the base has no lsn to look at. We almost
  698. * always insert at the end of the list, so on inserts we search
  699. * from the end of the list to find where the new item belongs.
  700. */
  701. /*
  702. * Initialize the doubly linked list to point only to itself.
  703. */
  704. int
  705. xfs_trans_ail_init(
  706. xfs_mount_t *mp)
  707. {
  708. struct xfs_ail *ailp;
  709. ailp = kmem_zalloc(sizeof(struct xfs_ail), KM_MAYFAIL);
  710. if (!ailp)
  711. return ENOMEM;
  712. ailp->xa_mount = mp;
  713. INIT_LIST_HEAD(&ailp->xa_ail);
  714. spin_lock_init(&ailp->xa_lock);
  715. INIT_DELAYED_WORK(&ailp->xa_work, xfs_ail_worker);
  716. mp->m_ail = ailp;
  717. return 0;
  718. }
  719. void
  720. xfs_trans_ail_destroy(
  721. xfs_mount_t *mp)
  722. {
  723. struct xfs_ail *ailp = mp->m_ail;
  724. cancel_delayed_work_sync(&ailp->xa_work);
  725. kmem_free(ailp);
  726. }