glock.c 50 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127
71278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320132113221323132413251326132713281329133013311332133313341335133613371338133913401341134213431344134513461347134813491350135113521353135413551356135713581359136013611362136313641365136613671368136913701371137213731374137513761377137813791380138113821383138413851386138713881389139013911392139313941395139613971398139914001401140214031404140514061407140814091410141114121413141414151416141714181419142014211422142314241425142614271428142914301431143214331434143514361437143814391440144114421443144414451446144714481449145014511452145314541455145614571458145914601461146214631464146514661467146814691470147114721473147414751476147714781479148014811482148314841485148614871488148914901491149214931494149514961497149814991500150115021503150415051506150715081509151015111512151315141515151615171518151915201521152215231524152515261527152815291530153115321533153415351536153715381539154015411542154315441545154615471548154915501551155215531554155515561557155815591560156115621563156415651566156715681569157015711572157315741575157615771578157915801581158215831584158515861587158815891590159115921593159415951596159715981599160016011602160316041605160616071608160916101611161216131614161516161617161816191620162116221623162416251626162716281629163016311632163316341635163616371638163916401641164216431644164516461647164816491650165116521653165416551656165716581659166016611662166316641665166616671668166916701671167216731674167516761677167816791680168116821683168416851686168716881689169016911692169316941695169616971698169917001701170217031704170517061707170817091710171117121713171417151716171717181719172017211722172317241725172617271728172917301731173217331734173517361737173817391740174117421743174417451746174717481749175017511752175317541755175617571758175917601761176217631764176517661767176817691770177117721773177417751776177
7177817791780178117821783178417851786178717881789179017911792179317941795179617971798179918001801180218031804180518061807180818091810181118121813181418151816181718181819182018211822182318241825182618271828182918301831183218331834183518361837183818391840184118421843184418451846184718481849185018511852185318541855185618571858185918601861186218631864186518661867186818691870187118721873187418751876187718781879188018811882188318841885188618871888188918901891189218931894189518961897189818991900190119021903190419051906190719081909191019111912191319141915191619171918191919201921192219231924192519261927192819291930193119321933193419351936193719381939194019411942194319441945194619471948194919501951195219531954195519561957195819591960196119621963196419651966196719681969197019711972197319741975197619771978197919801981198219831984198519861987198819891990199119921993199419951996199719981999200020012002200320042005200620072008200920102011201220132014201520162017201820192020202120222023202420252026202720282029203020312032203320342035203620372038203920402041204220432044204520462047204820492050205120522053205420552056205720582059206020612062206320642065206620672068206920702071207220732074207520762077207820792080208120822083208420852086208720882089209020912092209320942095209620972098209921002101210221032104210521062107210821092110211121122113211421152116211721182119212021212122212321242125212621272128212921302131213221332134213521362137213821392140214121422143214421452146214721482149215021512152215321542155215621572158215921602161216221632164216521662167216821692170217121722173217421752176217721782179218021812182218321842185218621872188218921902191219221932194219521962197219821992200220122022203220422052206220722082209221022112212221322142215221622172218221922202221222222232224222522262227222822292230223122322233223422352236223722382239224022412242224322442245224622472248224922502251225222532254
  1. /*
  2. * Copyright (C) Sistina Software, Inc. 1997-2003 All rights reserved.
  3. * Copyright (C) 2004-2006 Red Hat, Inc. All rights reserved.
  4. *
  5. * This copyrighted material is made available to anyone wishing to use,
  6. * modify, copy, or redistribute it subject to the terms and conditions
  7. * of the GNU General Public License v.2.
  8. */
  9. #include <linux/sched.h>
  10. #include <linux/slab.h>
  11. #include <linux/spinlock.h>
  12. #include <linux/completion.h>
  13. #include <linux/buffer_head.h>
  14. #include <linux/delay.h>
  15. #include <linux/sort.h>
  16. #include <linux/jhash.h>
  17. #include <linux/kref.h>
  18. #include <linux/kallsyms.h>
  19. #include <linux/gfs2_ondisk.h>
  20. #include <asm/uaccess.h>
  21. #include "gfs2.h"
  22. #include "lm_interface.h"
  23. #include "incore.h"
  24. #include "glock.h"
  25. #include "glops.h"
  26. #include "inode.h"
  27. #include "lm.h"
  28. #include "lops.h"
  29. #include "meta_io.h"
  30. #include "quota.h"
  31. #include "super.h"
  32. #include "util.h"
/*
 * Minimal stand-in for a glock: only the list linkage and the flags word.
 * Must be kept in sync with the beginning of struct gfs2_glock.
 * search_bucket() skips any list entry whose gl_flags has GLF_PLUG set.
 * NOTE(review): presumably linked into a hash bucket list as a position
 * marker by code outside this view -- confirm.
 */
struct glock_plug {
	struct list_head gl_list;	/* list linkage, same name as in struct gfs2_glock */
	unsigned long gl_flags;		/* flag bits, tested with test_bit(GLF_PLUG, ...) */
};
/*
 * Wrapper around a holder used for "greedy" requests.  rq_greedy() recovers
 * the wrapper from its embedded holder with container_of() and kfree()s it.
 */
struct greedy {
	struct gfs2_holder gr_gh;	/* the holder that gets queued on the glock */
	struct work_struct gr_work;	/* NOTE(review): users of this member are outside this view */
};
/* Callback type: a function that is handed a single glock. */
typedef void (*glock_examiner) (struct gfs2_glock * gl);
/* Forward declarations (the definitions are not in this part of the file). */
static int gfs2_dump_lockstate(struct gfs2_sbd *sdp);
static int dump_glock(struct gfs2_glock *gl);
  45. /**
  46. * relaxed_state_ok - is a requested lock compatible with the current lock mode?
  47. * @actual: the current state of the lock
  48. * @requested: the lock state that was requested by the caller
  49. * @flags: the modifier flags passed in by the caller
  50. *
  51. * Returns: 1 if the locks are compatible, 0 otherwise
  52. */
  53. static inline int relaxed_state_ok(unsigned int actual, unsigned requested,
  54. int flags)
  55. {
  56. if (actual == requested)
  57. return 1;
  58. if (flags & GL_EXACT)
  59. return 0;
  60. if (actual == LM_ST_EXCLUSIVE && requested == LM_ST_SHARED)
  61. return 1;
  62. if (actual != LM_ST_UNLOCKED && (flags & LM_FLAG_ANY))
  63. return 1;
  64. return 0;
  65. }
  66. /**
  67. * gl_hash() - Turn glock number into hash bucket number
  68. * @lock: The glock number
  69. *
  70. * Returns: The number of the corresponding hash bucket
  71. */
  72. static unsigned int gl_hash(const struct lm_lockname *name)
  73. {
  74. unsigned int h;
  75. h = jhash(&name->ln_number, sizeof(uint64_t), 0);
  76. h = jhash(&name->ln_type, sizeof(unsigned int), h);
  77. h &= GFS2_GL_HASH_MASK;
  78. return h;
  79. }
  80. /**
  81. * glock_free() - Perform a few checks and then release struct gfs2_glock
  82. * @gl: The glock to release
  83. *
  84. * Also calls lock module to release its internal structure for this glock.
  85. *
  86. */
  87. static void glock_free(struct gfs2_glock *gl)
  88. {
  89. struct gfs2_sbd *sdp = gl->gl_sbd;
  90. struct inode *aspace = gl->gl_aspace;
  91. gfs2_lm_put_lock(sdp, gl->gl_lock);
  92. if (aspace)
  93. gfs2_aspace_put(aspace);
  94. kmem_cache_free(gfs2_glock_cachep, gl);
  95. }
  96. /**
  97. * gfs2_glock_hold() - increment reference count on glock
  98. * @gl: The glock to hold
  99. *
  100. */
  101. void gfs2_glock_hold(struct gfs2_glock *gl)
  102. {
  103. kref_get(&gl->gl_ref);
  104. }
  105. /* All work is done after the return from kref_put() so we
  106. can release the write_lock before the free. */
  107. static void kill_glock(struct kref *kref)
  108. {
  109. struct gfs2_glock *gl = container_of(kref, struct gfs2_glock, gl_ref);
  110. struct gfs2_sbd *sdp = gl->gl_sbd;
  111. gfs2_assert(sdp, gl->gl_state == LM_ST_UNLOCKED);
  112. gfs2_assert(sdp, list_empty(&gl->gl_reclaim));
  113. gfs2_assert(sdp, list_empty(&gl->gl_holders));
  114. gfs2_assert(sdp, list_empty(&gl->gl_waiters1));
  115. gfs2_assert(sdp, list_empty(&gl->gl_waiters2));
  116. gfs2_assert(sdp, list_empty(&gl->gl_waiters3));
  117. }
  118. /**
  119. * gfs2_glock_put() - Decrement reference count on glock
  120. * @gl: The glock to put
  121. *
  122. */
  123. int gfs2_glock_put(struct gfs2_glock *gl)
  124. {
  125. struct gfs2_gl_hash_bucket *bucket = gl->gl_bucket;
  126. int rv = 0;
  127. write_lock(&bucket->hb_lock);
  128. if (kref_put(&gl->gl_ref, kill_glock)) {
  129. list_del_init(&gl->gl_list);
  130. write_unlock(&bucket->hb_lock);
  131. BUG_ON(spin_is_locked(&gl->gl_spin));
  132. glock_free(gl);
  133. rv = 1;
  134. goto out;
  135. }
  136. write_unlock(&bucket->hb_lock);
  137. out:
  138. return rv;
  139. }
  140. /**
  141. * queue_empty - check to see if a glock's queue is empty
  142. * @gl: the glock
  143. * @head: the head of the queue to check
  144. *
  145. * This function protects the list in the event that a process already
  146. * has a holder on the list and is adding a second holder for itself.
  147. * The glmutex lock is what generally prevents processes from working
  148. * on the same glock at once, but the special case of adding a second
  149. * holder for yourself ("recursive" locking) doesn't involve locking
  150. * glmutex, making the spin lock necessary.
  151. *
  152. * Returns: 1 if the queue is empty
  153. */
  154. static inline int queue_empty(struct gfs2_glock *gl, struct list_head *head)
  155. {
  156. int empty;
  157. spin_lock(&gl->gl_spin);
  158. empty = list_empty(head);
  159. spin_unlock(&gl->gl_spin);
  160. return empty;
  161. }
  162. /**
  163. * search_bucket() - Find struct gfs2_glock by lock number
  164. * @bucket: the bucket to search
  165. * @name: The lock name
  166. *
  167. * Returns: NULL, or the struct gfs2_glock with the requested number
  168. */
  169. static struct gfs2_glock *search_bucket(struct gfs2_gl_hash_bucket *bucket,
  170. const struct gfs2_sbd *sdp,
  171. const struct lm_lockname *name)
  172. {
  173. struct gfs2_glock *gl;
  174. list_for_each_entry(gl, &bucket->hb_list, gl_list) {
  175. if (test_bit(GLF_PLUG, &gl->gl_flags))
  176. continue;
  177. if (!lm_name_equal(&gl->gl_name, name))
  178. continue;
  179. if (gl->gl_sbd != sdp)
  180. continue;
  181. kref_get(&gl->gl_ref);
  182. return gl;
  183. }
  184. return NULL;
  185. }
  186. /**
  187. * gfs2_glock_find() - Find glock by lock number
  188. * @sdp: The GFS2 superblock
  189. * @name: The lock name
  190. *
  191. * Returns: NULL, or the struct gfs2_glock with the requested number
  192. */
  193. static struct gfs2_glock *gfs2_glock_find(struct gfs2_sbd *sdp,
  194. const struct lm_lockname *name)
  195. {
  196. struct gfs2_gl_hash_bucket *bucket = &sdp->sd_gl_hash[gl_hash(name)];
  197. struct gfs2_glock *gl;
  198. read_lock(&bucket->hb_lock);
  199. gl = search_bucket(bucket, sdp, name);
  200. read_unlock(&bucket->hb_lock);
  201. return gl;
  202. }
  203. /**
  204. * gfs2_glock_get() - Get a glock, or create one if one doesn't exist
  205. * @sdp: The GFS2 superblock
  206. * @number: the lock number
  207. * @glops: The glock_operations to use
  208. * @create: If 0, don't create the glock if it doesn't exist
  209. * @glp: the glock is returned here
  210. *
  211. * This does not lock a glock, just finds/creates structures for one.
  212. *
  213. * Returns: errno
  214. */
  215. int gfs2_glock_get(struct gfs2_sbd *sdp, uint64_t number,
  216. const struct gfs2_glock_operations *glops, int create,
  217. struct gfs2_glock **glp)
  218. {
  219. struct lm_lockname name;
  220. struct gfs2_glock *gl, *tmp;
  221. struct gfs2_gl_hash_bucket *bucket;
  222. int error;
  223. name.ln_number = number;
  224. name.ln_type = glops->go_type;
  225. bucket = &sdp->sd_gl_hash[gl_hash(&name)];
  226. read_lock(&bucket->hb_lock);
  227. gl = search_bucket(bucket, sdp, &name);
  228. read_unlock(&bucket->hb_lock);
  229. if (gl || !create) {
  230. *glp = gl;
  231. return 0;
  232. }
  233. gl = kmem_cache_alloc(gfs2_glock_cachep, GFP_KERNEL);
  234. if (!gl)
  235. return -ENOMEM;
  236. gl->gl_flags = 0;
  237. gl->gl_name = name;
  238. kref_init(&gl->gl_ref);
  239. gl->gl_state = LM_ST_UNLOCKED;
  240. gl->gl_owner = NULL;
  241. gl->gl_ip = 0;
  242. gl->gl_ops = glops;
  243. gl->gl_req_gh = NULL;
  244. gl->gl_req_bh = NULL;
  245. gl->gl_vn = 0;
  246. gl->gl_stamp = jiffies;
  247. gl->gl_object = NULL;
  248. gl->gl_bucket = bucket;
  249. gl->gl_sbd = sdp;
  250. gl->gl_aspace = NULL;
  251. lops_init_le(&gl->gl_le, &gfs2_glock_lops);
  252. /* If this glock protects actual on-disk data or metadata blocks,
  253. create a VFS inode to manage the pages/buffers holding them. */
  254. if (glops == &gfs2_inode_glops ||
  255. glops == &gfs2_rgrp_glops) {
  256. gl->gl_aspace = gfs2_aspace_get(sdp);
  257. if (!gl->gl_aspace) {
  258. error = -ENOMEM;
  259. goto fail;
  260. }
  261. }
  262. error = gfs2_lm_get_lock(sdp, &name, &gl->gl_lock);
  263. if (error)
  264. goto fail_aspace;
  265. write_lock(&bucket->hb_lock);
  266. tmp = search_bucket(bucket, sdp, &name);
  267. if (tmp) {
  268. write_unlock(&bucket->hb_lock);
  269. glock_free(gl);
  270. gl = tmp;
  271. } else {
  272. list_add_tail(&gl->gl_list, &bucket->hb_list);
  273. write_unlock(&bucket->hb_lock);
  274. }
  275. *glp = gl;
  276. return 0;
  277. fail_aspace:
  278. if (gl->gl_aspace)
  279. gfs2_aspace_put(gl->gl_aspace);
  280. fail:
  281. kmem_cache_free(gfs2_glock_cachep, gl);
  282. return error;
  283. }
  284. /**
  285. * gfs2_holder_init - initialize a struct gfs2_holder in the default way
  286. * @gl: the glock
  287. * @state: the state we're requesting
  288. * @flags: the modifier flags
  289. * @gh: the holder structure
  290. *
  291. */
  292. void gfs2_holder_init(struct gfs2_glock *gl, unsigned int state, unsigned flags,
  293. struct gfs2_holder *gh)
  294. {
  295. INIT_LIST_HEAD(&gh->gh_list);
  296. gh->gh_gl = gl;
  297. gh->gh_ip = (unsigned long)__builtin_return_address(0);
  298. gh->gh_owner = current;
  299. gh->gh_state = state;
  300. gh->gh_flags = flags;
  301. gh->gh_error = 0;
  302. gh->gh_iflags = 0;
  303. init_completion(&gh->gh_wait);
  304. if (gh->gh_state == LM_ST_EXCLUSIVE)
  305. gh->gh_flags |= GL_LOCAL_EXCL;
  306. gfs2_glock_hold(gl);
  307. }
  308. /**
  309. * gfs2_holder_reinit - reinitialize a struct gfs2_holder so we can requeue it
  310. * @state: the state we're requesting
  311. * @flags: the modifier flags
  312. * @gh: the holder structure
  313. *
  314. * Don't mess with the glock.
  315. *
  316. */
  317. void gfs2_holder_reinit(unsigned int state, unsigned flags, struct gfs2_holder *gh)
  318. {
  319. gh->gh_state = state;
  320. gh->gh_flags = flags;
  321. if (gh->gh_state == LM_ST_EXCLUSIVE)
  322. gh->gh_flags |= GL_LOCAL_EXCL;
  323. gh->gh_iflags &= 1 << HIF_ALLOCED;
  324. gh->gh_ip = (unsigned long)__builtin_return_address(0);
  325. }
  326. /**
  327. * gfs2_holder_uninit - uninitialize a holder structure (drop glock reference)
  328. * @gh: the holder structure
  329. *
  330. */
  331. void gfs2_holder_uninit(struct gfs2_holder *gh)
  332. {
  333. gfs2_glock_put(gh->gh_gl);
  334. gh->gh_gl = NULL;
  335. gh->gh_ip = 0;
  336. }
  337. /**
  338. * gfs2_holder_get - get a struct gfs2_holder structure
  339. * @gl: the glock
  340. * @state: the state we're requesting
  341. * @flags: the modifier flags
  342. * @gfp_flags:
  343. *
  344. * Figure out how big an impact this function has. Either:
  345. * 1) Replace it with a cache of structures hanging off the struct gfs2_sbd
  346. * 2) Leave it like it is
  347. *
  348. * Returns: the holder structure, NULL on ENOMEM
  349. */
  350. static struct gfs2_holder *gfs2_holder_get(struct gfs2_glock *gl,
  351. unsigned int state,
  352. int flags, gfp_t gfp_flags)
  353. {
  354. struct gfs2_holder *gh;
  355. gh = kmalloc(sizeof(struct gfs2_holder), gfp_flags);
  356. if (!gh)
  357. return NULL;
  358. gfs2_holder_init(gl, state, flags, gh);
  359. set_bit(HIF_ALLOCED, &gh->gh_iflags);
  360. gh->gh_ip = (unsigned long)__builtin_return_address(0);
  361. return gh;
  362. }
  363. /**
  364. * gfs2_holder_put - get rid of a struct gfs2_holder structure
  365. * @gh: the holder structure
  366. *
  367. */
  368. static void gfs2_holder_put(struct gfs2_holder *gh)
  369. {
  370. gfs2_holder_uninit(gh);
  371. kfree(gh);
  372. }
  373. /**
  374. * rq_mutex - process a mutex request in the queue
  375. * @gh: the glock holder
  376. *
  377. * Returns: 1 if the queue is blocked
  378. */
  379. static int rq_mutex(struct gfs2_holder *gh)
  380. {
  381. struct gfs2_glock *gl = gh->gh_gl;
  382. list_del_init(&gh->gh_list);
  383. /* gh->gh_error never examined. */
  384. set_bit(GLF_LOCK, &gl->gl_flags);
  385. complete(&gh->gh_wait);
  386. return 1;
  387. }
/**
 * rq_promote - process a promote request in the queue
 * @gh: the glock holder
 *
 * Acquire a new inter-node lock, or change a lock state to more restrictive.
 *
 * Expects gl->gl_spin to be held on entry; it is dropped and retaken
 * around the reclaim and go_xmote_th() calls.
 *
 * Returns: 1 if the queue is blocked
 */
static int rq_promote(struct gfs2_holder *gh)
{
	struct gfs2_glock *gl = gh->gh_gl;
	struct gfs2_sbd *sdp = gl->gl_sbd;
	const struct gfs2_glock_operations *glops = gl->gl_ops;
	/* The current lock state cannot satisfy this request. */
	if (!relaxed_state_ok(gl->gl_state, gh->gh_state, gh->gh_flags)) {
		/* A state change is only started once there are no holders. */
		if (list_empty(&gl->gl_holders)) {
			gl->gl_req_gh = gh;
			set_bit(GLF_LOCK, &gl->gl_flags);
			spin_unlock(&gl->gl_spin);
			/* Over the reclaim limit and not a priority request:
			   call gfs2_reclaim_glock() twice before asking for
			   the new state. */
			if (atomic_read(&sdp->sd_reclaim_count) >
			    gfs2_tune_get(sdp, gt_reclaim_limit) &&
			    !(gh->gh_flags & LM_FLAG_PRIORITY)) {
				gfs2_reclaim_glock(sdp);
				gfs2_reclaim_glock(sdp);
			}
			glops->go_xmote_th(gl, gh->gh_state, gh->gh_flags);
			spin_lock(&gl->gl_spin);
		}
		/* Blocked either way: waiting for holders or for the state change. */
		return 1;
	}
	/* The state is already compatible, so the request can be granted locally. */
	if (list_empty(&gl->gl_holders)) {
		/* First holder: flag it and set GLF_LOCK on the glock. */
		set_bit(HIF_FIRST, &gh->gh_iflags);
		set_bit(GLF_LOCK, &gl->gl_flags);
	} else {
		struct gfs2_holder *next_gh;
		/* This request wants local exclusivity but others hold the glock. */
		if (gh->gh_flags & GL_LOCAL_EXCL)
			return 1;
		next_gh = list_entry(gl->gl_holders.next, struct gfs2_holder,
				     gh_list);
		/* The first existing holder has local exclusivity. */
		if (next_gh->gh_flags & GL_LOCAL_EXCL)
			return 1;
	}
	/* Grant: move to the holders list, mark as holder and wake the waiter. */
	list_move_tail(&gh->gh_list, &gl->gl_holders);
	gh->gh_error = 0;
	set_bit(HIF_HOLDER, &gh->gh_iflags);
	complete(&gh->gh_wait);
	return 0;
}
/**
 * rq_demote - process a demote request in the queue
 * @gh: the glock holder
 *
 * Expects gl->gl_spin to be held on entry; it is dropped and retaken
 * around completing/freeing the holder and around the glops calls.
 *
 * Returns: 1 if the queue is blocked (the glock still has holders),
 *          0 otherwise
 */
static int rq_demote(struct gfs2_holder *gh)
{
	struct gfs2_glock *gl = gh->gh_gl;
	const struct gfs2_glock_operations *glops = gl->gl_ops;
	/* Nothing can be demoted while the glock is held. */
	if (!list_empty(&gl->gl_holders))
		return 1;
	if (gl->gl_state == gh->gh_state || gl->gl_state == LM_ST_UNLOCKED) {
		/* Already in the target state (or unlocked): the request
		   is finished without any state change. */
		list_del_init(&gh->gh_list);
		gh->gh_error = 0;
		spin_unlock(&gl->gl_spin);
		/* HIF_DEALLOC holders have no waiter and are freed here;
		   all others get their waiter woken. */
		if (test_bit(HIF_DEALLOC, &gh->gh_iflags))
			gfs2_holder_put(gh);
		else
			complete(&gh->gh_wait);
		spin_lock(&gl->gl_spin);
	} else {
		/* A state change is required: record the request and set
		   GLF_LOCK before calling the glops with the spinlock dropped. */
		gl->gl_req_gh = gh;
		set_bit(GLF_LOCK, &gl->gl_flags);
		spin_unlock(&gl->gl_spin);
		/* go_drop_th() is used when the target is unlocked or the
		   glock is not exclusive; otherwise go_xmote_th() changes
		   the exclusive lock to the requested state. */
		if (gh->gh_state == LM_ST_UNLOCKED ||
		    gl->gl_state != LM_ST_EXCLUSIVE)
			glops->go_drop_th(gl);
		else
			glops->go_xmote_th(gl, gh->gh_state, gh->gh_flags);
		spin_lock(&gl->gl_spin);
	}
	return 0;
}
  469. /**
  470. * rq_greedy - process a queued request to drop greedy status
  471. * @gh: the glock holder
  472. *
  473. * Returns: 1 if the queue is blocked
  474. */
  475. static int rq_greedy(struct gfs2_holder *gh)
  476. {
  477. struct gfs2_glock *gl = gh->gh_gl;
  478. list_del_init(&gh->gh_list);
  479. /* gh->gh_error never examined. */
  480. clear_bit(GLF_GREEDY, &gl->gl_flags);
  481. spin_unlock(&gl->gl_spin);
  482. gfs2_holder_uninit(gh);
  483. kfree(container_of(gh, struct greedy, gr_gh));
  484. spin_lock(&gl->gl_spin);
  485. return 0;
  486. }
  487. /**
  488. * run_queue - process holder structures on a glock
  489. * @gl: the glock
  490. *
  491. */
  492. static void run_queue(struct gfs2_glock *gl)
  493. {
  494. struct gfs2_holder *gh;
  495. int blocked = 1;
  496. for (;;) {
  497. if (test_bit(GLF_LOCK, &gl->gl_flags))
  498. break;
  499. if (!list_empty(&gl->gl_waiters1)) {
  500. gh = list_entry(gl->gl_waiters1.next,
  501. struct gfs2_holder, gh_list);
  502. if (test_bit(HIF_MUTEX, &gh->gh_iflags))
  503. blocked = rq_mutex(gh);
  504. else
  505. gfs2_assert_warn(gl->gl_sbd, 0);
  506. } else if (!list_empty(&gl->gl_waiters2) &&
  507. !test_bit(GLF_SKIP_WAITERS2, &gl->gl_flags)) {
  508. gh = list_entry(gl->gl_waiters2.next,
  509. struct gfs2_holder, gh_list);
  510. if (test_bit(HIF_DEMOTE, &gh->gh_iflags))
  511. blocked = rq_demote(gh);
  512. else if (test_bit(HIF_GREEDY, &gh->gh_iflags))
  513. blocked = rq_greedy(gh);
  514. else
  515. gfs2_assert_warn(gl->gl_sbd, 0);
  516. } else if (!list_empty(&gl->gl_waiters3)) {
  517. gh = list_entry(gl->gl_waiters3.next,
  518. struct gfs2_holder, gh_list);
  519. if (test_bit(HIF_PROMOTE, &gh->gh_iflags))
  520. blocked = rq_promote(gh);
  521. else
  522. gfs2_assert_warn(gl->gl_sbd, 0);
  523. } else
  524. break;
  525. if (blocked)
  526. break;
  527. }
  528. }
  529. /**
  530. * gfs2_glmutex_lock - acquire a local lock on a glock
  531. * @gl: the glock
  532. *
  533. * Gives caller exclusive access to manipulate a glock structure.
  534. */
  535. static void gfs2_glmutex_lock(struct gfs2_glock *gl)
  536. {
  537. struct gfs2_holder gh;
  538. gfs2_holder_init(gl, 0, 0, &gh);
  539. set_bit(HIF_MUTEX, &gh.gh_iflags);
  540. spin_lock(&gl->gl_spin);
  541. if (test_and_set_bit(GLF_LOCK, &gl->gl_flags))
  542. list_add_tail(&gh.gh_list, &gl->gl_waiters1);
  543. else {
  544. gl->gl_owner = current;
  545. gl->gl_ip = (unsigned long)__builtin_return_address(0);
  546. complete(&gh.gh_wait);
  547. }
  548. spin_unlock(&gl->gl_spin);
  549. wait_for_completion(&gh.gh_wait);
  550. gfs2_holder_uninit(&gh);
  551. }
  552. /**
  553. * gfs2_glmutex_trylock - try to acquire a local lock on a glock
  554. * @gl: the glock
  555. *
  556. * Returns: 1 if the glock is acquired
  557. */
  558. static int gfs2_glmutex_trylock(struct gfs2_glock *gl)
  559. {
  560. int acquired = 1;
  561. spin_lock(&gl->gl_spin);
  562. if (test_and_set_bit(GLF_LOCK, &gl->gl_flags))
  563. acquired = 0;
  564. else {
  565. gl->gl_owner = current;
  566. gl->gl_ip = (unsigned long)__builtin_return_address(0);
  567. }
  568. spin_unlock(&gl->gl_spin);
  569. return acquired;
  570. }
  571. /**
  572. * gfs2_glmutex_unlock - release a local lock on a glock
  573. * @gl: the glock
  574. *
  575. */
  576. static void gfs2_glmutex_unlock(struct gfs2_glock *gl)
  577. {
  578. spin_lock(&gl->gl_spin);
  579. clear_bit(GLF_LOCK, &gl->gl_flags);
  580. gl->gl_owner = NULL;
  581. gl->gl_ip = 0;
  582. run_queue(gl);
  583. BUG_ON(!spin_is_locked(&gl->gl_spin));
  584. spin_unlock(&gl->gl_spin);
  585. }
/**
 * handle_callback - add a demote request to a lock's queue
 * @gl: the glock
 * @state: the state the caller wants us to change to
 *
 * If a demote request is already queued on gl_waiters2 (and is not the
 * one currently being processed) it is reused; when its target state
 * differs from @state it is changed to LM_ST_UNLOCKED.  Otherwise a new
 * holder flagged HIF_DEMOTE | HIF_DEALLOC is allocated and queued.
 *
 * Note: This may fail silently if we are out of memory.
 */
static void handle_callback(struct gfs2_glock *gl, unsigned int state)
{
	struct gfs2_holder *gh, *new_gh = NULL;
restart:
	spin_lock(&gl->gl_spin);
	/* Look for a queued demote request that is not in flight. */
	list_for_each_entry(gh, &gl->gl_waiters2, gh_list) {
		if (test_bit(HIF_DEMOTE, &gh->gh_iflags) &&
		    gl->gl_req_gh != gh) {
			/* Two different targets were requested: settle on unlocked. */
			if (gh->gh_state != state)
				gh->gh_state = LM_ST_UNLOCKED;
			goto out;
		}
	}
	if (new_gh) {
		/* Second pass: still nothing queued, so add the holder we allocated. */
		list_add_tail(&new_gh->gh_list, &gl->gl_waiters2);
		new_gh = NULL;
	} else {
		/* First pass: allocate with the spinlock dropped, then rescan,
		   since the queue may have changed while it was unlocked. */
		spin_unlock(&gl->gl_spin);
		new_gh = gfs2_holder_get(gl, state, LM_FLAG_TRY, GFP_KERNEL);
		if (!new_gh)
			return;
		set_bit(HIF_DEMOTE, &new_gh->gh_iflags);
		set_bit(HIF_DEALLOC, &new_gh->gh_iflags);
		goto restart;
	}
out:
	spin_unlock(&gl->gl_spin);
	/* An existing request turned up on the second pass: ours is not needed. */
	if (new_gh)
		gfs2_holder_put(new_gh);
}
  623. void gfs2_glock_inode_squish(struct inode *inode)
  624. {
  625. struct gfs2_holder gh;
  626. struct gfs2_glock *gl = GFS2_I(inode)->i_gl;
  627. gfs2_holder_init(gl, LM_ST_UNLOCKED, 0, &gh);
  628. set_bit(HIF_DEMOTE, &gh.gh_iflags);
  629. spin_lock(&gl->gl_spin);
  630. gfs2_assert(inode->i_sb->s_fs_info, list_empty(&gl->gl_holders));
  631. list_add_tail(&gh.gh_list, &gl->gl_waiters2);
  632. run_queue(gl);
  633. spin_unlock(&gl->gl_spin);
  634. wait_for_completion(&gh.gh_wait);
  635. gfs2_holder_uninit(&gh);
  636. }
  637. /**
  638. * state_change - record that the glock is now in a different state
  639. * @gl: the glock
  640. * @new_state the new state
  641. *
  642. */
  643. static void state_change(struct gfs2_glock *gl, unsigned int new_state)
  644. {
  645. int held1, held2;
  646. held1 = (gl->gl_state != LM_ST_UNLOCKED);
  647. held2 = (new_state != LM_ST_UNLOCKED);
  648. if (held1 != held2) {
  649. if (held2)
  650. gfs2_glock_hold(gl);
  651. else
  652. gfs2_glock_put(gl);
  653. }
  654. gl->gl_state = new_state;
  655. }
/**
 * xmote_bh - Called after the lock module is done acquiring a lock
 * @gl: The glock in question
 * @ret: the int returned from the lock module
 *
 * Records the new lock state, invalidates cached data where required and
 * then resolves the request in gl->gl_req_gh (if any): it is failed,
 * completed, or moved onto the holders list.  Finally drops the glock
 * reference that gfs2_glock_xmote_th() took before starting the request.
 */
static void xmote_bh(struct gfs2_glock *gl, unsigned int ret)
{
	struct gfs2_sbd *sdp = gl->gl_sbd;
	const struct gfs2_glock_operations *glops = gl->gl_ops;
	struct gfs2_holder *gh = gl->gl_req_gh;
	int prev_state = gl->gl_state;
	/* Cleared only when gh becomes a holder; see the end of the function. */
	int op_done = 1;
	gfs2_assert_warn(sdp, test_bit(GLF_LOCK, &gl->gl_flags));
	gfs2_assert_warn(sdp, queue_empty(gl, &gl->gl_holders));
	gfs2_assert_warn(sdp, !(ret & LM_OUT_ASYNC));
	state_change(gl, ret & LM_OUT_ST_MASK);
	/* We held the lock before and the lock module did not flag the
	   result cacheable: invalidate both metadata and data. */
	if (prev_state != LM_ST_UNLOCKED && !(ret & LM_OUT_CACHEABLE)) {
		if (glops->go_inval)
			glops->go_inval(gl, DIO_METADATA | DIO_DATA);
	} else if (gl->gl_state == LM_ST_DEFERRED) {
		/* We might not want to do this here.
		   Look at moving to the inode glops. */
		if (glops->go_inval)
			glops->go_inval(gl, DIO_DATA);
	}
	/* Deal with each possible exit condition */
	if (!gh)
		/* No request was attached: just refresh the timestamp. */
		gl->gl_stamp = jiffies;
	else if (unlikely(test_bit(SDF_SHUTDOWN, &sdp->sd_flags))) {
		/* Filesystem is shut down: fail the request with -EIO. */
		spin_lock(&gl->gl_spin);
		list_del_init(&gh->gh_list);
		gh->gh_error = -EIO;
		spin_unlock(&gl->gl_spin);
	} else if (test_bit(HIF_DEMOTE, &gh->gh_iflags)) {
		/* Demote request: succeeds if we reached the target state
		   or ended up unlocked. */
		spin_lock(&gl->gl_spin);
		list_del_init(&gh->gh_list);
		if (gl->gl_state == gh->gh_state ||
		    gl->gl_state == LM_ST_UNLOCKED)
			gh->gh_error = 0;
		else {
			/* Only a "try" request is expected to miss its target. */
			if (gfs2_assert_warn(sdp, gh->gh_flags &
					(LM_FLAG_TRY | LM_FLAG_TRY_1CB)) == -1)
				fs_warn(sdp, "ret = 0x%.8X\n", ret);
			gh->gh_error = GLR_TRYFAILED;
		}
		spin_unlock(&gl->gl_spin);
		/* The demote was canceled: queue a fresh one to unlocked. */
		if (ret & LM_OUT_CANCELED)
			handle_callback(gl, LM_ST_UNLOCKED); /* Lame */
	} else if (ret & LM_OUT_CANCELED) {
		/* Promote request that was canceled. */
		spin_lock(&gl->gl_spin);
		list_del_init(&gh->gh_list);
		gh->gh_error = GLR_CANCELED;
		spin_unlock(&gl->gl_spin);
	} else if (relaxed_state_ok(gl->gl_state, gh->gh_state, gh->gh_flags)) {
		/* The new state satisfies the request: gh becomes the first
		   holder.  op_done is cleared so GLF_LOCK and gl_req_gh are
		   left as they are below. */
		spin_lock(&gl->gl_spin);
		list_move_tail(&gh->gh_list, &gl->gl_holders);
		gh->gh_error = 0;
		set_bit(HIF_HOLDER, &gh->gh_iflags);
		spin_unlock(&gl->gl_spin);
		set_bit(HIF_FIRST, &gh->gh_iflags);
		op_done = 0;
	} else if (gh->gh_flags & (LM_FLAG_TRY | LM_FLAG_TRY_1CB)) {
		/* A "try" request that did not get a usable state. */
		spin_lock(&gl->gl_spin);
		list_del_init(&gh->gh_list);
		gh->gh_error = GLR_TRYFAILED;
		spin_unlock(&gl->gl_spin);
	} else {
		/* No other outcome is expected: withdraw the filesystem. */
		if (gfs2_assert_withdraw(sdp, 0) == -1)
			fs_err(sdp, "ret = 0x%.8X\n", ret);
	}
	if (glops->go_xmote_bh)
		glops->go_xmote_bh(gl);
	if (op_done) {
		/* Request finished: clear the in-flight state, release
		   GLF_LOCK and let the next queued request run. */
		spin_lock(&gl->gl_spin);
		gl->gl_req_gh = NULL;
		gl->gl_req_bh = NULL;
		clear_bit(GLF_LOCK, &gl->gl_flags);
		run_queue(gl);
		spin_unlock(&gl->gl_spin);
	}
	/* Drop the reference gfs2_glock_xmote_th() took for this request. */
	gfs2_glock_put(gl);
	if (gh) {
		/* HIF_DEALLOC holders have no waiter and are freed here;
		   all others get their waiter woken. */
		if (test_bit(HIF_DEALLOC, &gh->gh_iflags))
			gfs2_holder_put(gh);
		else
			complete(&gh->gh_wait);
	}
}
  745. /**
  746. * gfs2_glock_xmote_th - Call into the lock module to acquire or change a glock
  747. * @gl: The glock in question
  748. * @state: the requested state
  749. * @flags: modifier flags to the lock call
  750. *
  751. */
  752. void gfs2_glock_xmote_th(struct gfs2_glock *gl, unsigned int state, int flags)
  753. {
  754. struct gfs2_sbd *sdp = gl->gl_sbd;
  755. const struct gfs2_glock_operations *glops = gl->gl_ops;
  756. int lck_flags = flags & (LM_FLAG_TRY | LM_FLAG_TRY_1CB |
  757. LM_FLAG_NOEXP | LM_FLAG_ANY |
  758. LM_FLAG_PRIORITY);
  759. unsigned int lck_ret;
  760. gfs2_assert_warn(sdp, test_bit(GLF_LOCK, &gl->gl_flags));
  761. gfs2_assert_warn(sdp, queue_empty(gl, &gl->gl_holders));
  762. gfs2_assert_warn(sdp, state != LM_ST_UNLOCKED);
  763. gfs2_assert_warn(sdp, state != gl->gl_state);
  764. if (gl->gl_state == LM_ST_EXCLUSIVE) {
  765. if (glops->go_sync)
  766. glops->go_sync(gl,
  767. DIO_METADATA | DIO_DATA | DIO_RELEASE);
  768. }
  769. gfs2_glock_hold(gl);
  770. gl->gl_req_bh = xmote_bh;
  771. lck_ret = gfs2_lm_lock(sdp, gl->gl_lock, gl->gl_state, state, lck_flags);
  772. if (gfs2_assert_withdraw(sdp, !(lck_ret & LM_OUT_ERROR)))
  773. return;
  774. if (lck_ret & LM_OUT_ASYNC)
  775. gfs2_assert_warn(sdp, lck_ret == LM_OUT_ASYNC);
  776. else
  777. xmote_bh(gl, lck_ret);
  778. }
  779. /**
  780. * drop_bh - Called after a lock module unlock completes
  781. * @gl: the glock
  782. * @ret: the return status
  783. *
  784. * Doesn't wake up the process waiting on the struct gfs2_holder (if any)
  785. * Doesn't drop the reference on the glock the top half took out
  786. *
  787. */
  788. static void drop_bh(struct gfs2_glock *gl, unsigned int ret)
  789. {
  790. struct gfs2_sbd *sdp = gl->gl_sbd;
  791. const struct gfs2_glock_operations *glops = gl->gl_ops;
  792. struct gfs2_holder *gh = gl->gl_req_gh;
  793. clear_bit(GLF_PREFETCH, &gl->gl_flags);
  794. gfs2_assert_warn(sdp, test_bit(GLF_LOCK, &gl->gl_flags));
  795. gfs2_assert_warn(sdp, queue_empty(gl, &gl->gl_holders));
  796. gfs2_assert_warn(sdp, !ret);
  797. state_change(gl, LM_ST_UNLOCKED);
  798. if (glops->go_inval)
  799. glops->go_inval(gl, DIO_METADATA | DIO_DATA);
  800. if (gh) {
  801. spin_lock(&gl->gl_spin);
  802. list_del_init(&gh->gh_list);
  803. gh->gh_error = 0;
  804. spin_unlock(&gl->gl_spin);
  805. }
  806. if (glops->go_drop_bh)
  807. glops->go_drop_bh(gl);
  808. spin_lock(&gl->gl_spin);
  809. gl->gl_req_gh = NULL;
  810. gl->gl_req_bh = NULL;
  811. clear_bit(GLF_LOCK, &gl->gl_flags);
  812. run_queue(gl);
  813. spin_unlock(&gl->gl_spin);
  814. gfs2_glock_put(gl);
  815. if (gh) {
  816. if (test_bit(HIF_DEALLOC, &gh->gh_iflags))
  817. gfs2_holder_put(gh);
  818. else
  819. complete(&gh->gh_wait);
  820. }
  821. }
  822. /**
  823. * gfs2_glock_drop_th - call into the lock module to unlock a lock
  824. * @gl: the glock
  825. *
  826. */
  827. void gfs2_glock_drop_th(struct gfs2_glock *gl)
  828. {
  829. struct gfs2_sbd *sdp = gl->gl_sbd;
  830. const struct gfs2_glock_operations *glops = gl->gl_ops;
  831. unsigned int ret;
  832. gfs2_assert_warn(sdp, test_bit(GLF_LOCK, &gl->gl_flags));
  833. gfs2_assert_warn(sdp, queue_empty(gl, &gl->gl_holders));
  834. gfs2_assert_warn(sdp, gl->gl_state != LM_ST_UNLOCKED);
  835. if (gl->gl_state == LM_ST_EXCLUSIVE) {
  836. if (glops->go_sync)
  837. glops->go_sync(gl, DIO_METADATA | DIO_DATA | DIO_RELEASE);
  838. }
  839. gfs2_glock_hold(gl);
  840. gl->gl_req_bh = drop_bh;
  841. ret = gfs2_lm_unlock(sdp, gl->gl_lock, gl->gl_state);
  842. if (gfs2_assert_withdraw(sdp, !(ret & LM_OUT_ERROR)))
  843. return;
  844. if (!ret)
  845. drop_bh(gl, ret);
  846. else
  847. gfs2_assert_warn(sdp, ret == LM_OUT_ASYNC);
  848. }
  849. /**
  850. * do_cancels - cancel requests for locks stuck waiting on an expire flag
  851. * @gh: the LM_FLAG_PRIORITY holder waiting to acquire the lock
  852. *
  853. * Don't cancel GL_NOCANCEL requests.
  854. */
  855. static void do_cancels(struct gfs2_holder *gh)
  856. {
  857. struct gfs2_glock *gl = gh->gh_gl;
  858. spin_lock(&gl->gl_spin);
  859. while (gl->gl_req_gh != gh &&
  860. !test_bit(HIF_HOLDER, &gh->gh_iflags) &&
  861. !list_empty(&gh->gh_list)) {
  862. if (gl->gl_req_bh &&
  863. !(gl->gl_req_gh &&
  864. (gl->gl_req_gh->gh_flags & GL_NOCANCEL))) {
  865. spin_unlock(&gl->gl_spin);
  866. gfs2_lm_cancel(gl->gl_sbd, gl->gl_lock);
  867. msleep(100);
  868. spin_lock(&gl->gl_spin);
  869. } else {
  870. spin_unlock(&gl->gl_spin);
  871. msleep(100);
  872. spin_lock(&gl->gl_spin);
  873. }
  874. }
  875. spin_unlock(&gl->gl_spin);
  876. }
  877. /**
  878. * glock_wait_internal - wait on a glock acquisition
  879. * @gh: the glock holder
  880. *
  881. * Returns: 0 on success
  882. */
  883. static int glock_wait_internal(struct gfs2_holder *gh)
  884. {
  885. struct gfs2_glock *gl = gh->gh_gl;
  886. struct gfs2_sbd *sdp = gl->gl_sbd;
  887. const struct gfs2_glock_operations *glops = gl->gl_ops;
  888. if (test_bit(HIF_ABORTED, &gh->gh_iflags))
  889. return -EIO;
  890. if (gh->gh_flags & (LM_FLAG_TRY | LM_FLAG_TRY_1CB)) {
  891. spin_lock(&gl->gl_spin);
  892. if (gl->gl_req_gh != gh &&
  893. !test_bit(HIF_HOLDER, &gh->gh_iflags) &&
  894. !list_empty(&gh->gh_list)) {
  895. list_del_init(&gh->gh_list);
  896. gh->gh_error = GLR_TRYFAILED;
  897. run_queue(gl);
  898. spin_unlock(&gl->gl_spin);
  899. return gh->gh_error;
  900. }
  901. spin_unlock(&gl->gl_spin);
  902. }
  903. if (gh->gh_flags & LM_FLAG_PRIORITY)
  904. do_cancels(gh);
  905. wait_for_completion(&gh->gh_wait);
  906. if (gh->gh_error)
  907. return gh->gh_error;
  908. gfs2_assert_withdraw(sdp, test_bit(HIF_HOLDER, &gh->gh_iflags));
  909. gfs2_assert_withdraw(sdp, relaxed_state_ok(gl->gl_state,
  910. gh->gh_state,
  911. gh->gh_flags));
  912. if (test_bit(HIF_FIRST, &gh->gh_iflags)) {
  913. gfs2_assert_warn(sdp, test_bit(GLF_LOCK, &gl->gl_flags));
  914. if (glops->go_lock) {
  915. gh->gh_error = glops->go_lock(gh);
  916. if (gh->gh_error) {
  917. spin_lock(&gl->gl_spin);
  918. list_del_init(&gh->gh_list);
  919. spin_unlock(&gl->gl_spin);
  920. }
  921. }
  922. spin_lock(&gl->gl_spin);
  923. gl->gl_req_gh = NULL;
  924. gl->gl_req_bh = NULL;
  925. clear_bit(GLF_LOCK, &gl->gl_flags);
  926. run_queue(gl);
  927. spin_unlock(&gl->gl_spin);
  928. }
  929. return gh->gh_error;
  930. }
  931. static inline struct gfs2_holder *
  932. find_holder_by_owner(struct list_head *head, struct task_struct *owner)
  933. {
  934. struct gfs2_holder *gh;
  935. list_for_each_entry(gh, head, gh_list) {
  936. if (gh->gh_owner == owner)
  937. return gh;
  938. }
  939. return NULL;
  940. }
  941. /**
  942. * add_to_queue - Add a holder to the wait queue (but look for recursion)
  943. * @gh: the holder structure to add
  944. *
  945. */
  946. static void add_to_queue(struct gfs2_holder *gh)
  947. {
  948. struct gfs2_glock *gl = gh->gh_gl;
  949. struct gfs2_holder *existing;
  950. BUG_ON(!gh->gh_owner);
  951. existing = find_holder_by_owner(&gl->gl_holders, gh->gh_owner);
  952. if (existing) {
  953. print_symbol(KERN_WARNING "original: %s\n", existing->gh_ip);
  954. printk(KERN_INFO "pid : %d\n", existing->gh_owner->pid);
  955. printk(KERN_INFO "lock type : %d lock state : %d\n",
  956. existing->gh_gl->gl_name.ln_type, existing->gh_gl->gl_state);
  957. print_symbol(KERN_WARNING "new: %s\n", gh->gh_ip);
  958. printk(KERN_INFO "pid : %d\n", gh->gh_owner->pid);
  959. printk(KERN_INFO "lock type : %d lock state : %d\n",
  960. gl->gl_name.ln_type, gl->gl_state);
  961. BUG();
  962. }
  963. existing = find_holder_by_owner(&gl->gl_waiters3, gh->gh_owner);
  964. if (existing) {
  965. print_symbol(KERN_WARNING "original: %s\n", existing->gh_ip);
  966. print_symbol(KERN_WARNING "new: %s\n", gh->gh_ip);
  967. BUG();
  968. }
  969. if (gh->gh_flags & LM_FLAG_PRIORITY)
  970. list_add(&gh->gh_list, &gl->gl_waiters3);
  971. else
  972. list_add_tail(&gh->gh_list, &gl->gl_waiters3);
  973. }
  974. /**
  975. * gfs2_glock_nq - enqueue a struct gfs2_holder onto a glock (acquire a glock)
  976. * @gh: the holder structure
  977. *
  978. * if (gh->gh_flags & GL_ASYNC), this never returns an error
  979. *
  980. * Returns: 0, GLR_TRYFAILED, or errno on failure
  981. */
  982. int gfs2_glock_nq(struct gfs2_holder *gh)
  983. {
  984. struct gfs2_glock *gl = gh->gh_gl;
  985. struct gfs2_sbd *sdp = gl->gl_sbd;
  986. int error = 0;
  987. restart:
  988. if (unlikely(test_bit(SDF_SHUTDOWN, &sdp->sd_flags))) {
  989. set_bit(HIF_ABORTED, &gh->gh_iflags);
  990. return -EIO;
  991. }
  992. set_bit(HIF_PROMOTE, &gh->gh_iflags);
  993. spin_lock(&gl->gl_spin);
  994. add_to_queue(gh);
  995. run_queue(gl);
  996. spin_unlock(&gl->gl_spin);
  997. if (!(gh->gh_flags & GL_ASYNC)) {
  998. error = glock_wait_internal(gh);
  999. if (error == GLR_CANCELED) {
  1000. msleep(100);
  1001. goto restart;
  1002. }
  1003. }
  1004. clear_bit(GLF_PREFETCH, &gl->gl_flags);
  1005. if (error == GLR_TRYFAILED && (gh->gh_flags & GL_DUMP))
  1006. dump_glock(gl);
  1007. return error;
  1008. }
  1009. /**
  1010. * gfs2_glock_poll - poll to see if an async request has been completed
  1011. * @gh: the holder
  1012. *
  1013. * Returns: 1 if the request is ready to be gfs2_glock_wait()ed on
  1014. */
  1015. int gfs2_glock_poll(struct gfs2_holder *gh)
  1016. {
  1017. struct gfs2_glock *gl = gh->gh_gl;
  1018. int ready = 0;
  1019. spin_lock(&gl->gl_spin);
  1020. if (test_bit(HIF_HOLDER, &gh->gh_iflags))
  1021. ready = 1;
  1022. else if (list_empty(&gh->gh_list)) {
  1023. if (gh->gh_error == GLR_CANCELED) {
  1024. spin_unlock(&gl->gl_spin);
  1025. msleep(100);
  1026. if (gfs2_glock_nq(gh))
  1027. return 1;
  1028. return 0;
  1029. } else
  1030. ready = 1;
  1031. }
  1032. spin_unlock(&gl->gl_spin);
  1033. return ready;
  1034. }
  1035. /**
  1036. * gfs2_glock_wait - wait for a lock acquisition that ended in a GLR_ASYNC
  1037. * @gh: the holder structure
  1038. *
  1039. * Returns: 0, GLR_TRYFAILED, or errno on failure
  1040. */
  1041. int gfs2_glock_wait(struct gfs2_holder *gh)
  1042. {
  1043. int error;
  1044. error = glock_wait_internal(gh);
  1045. if (error == GLR_CANCELED) {
  1046. msleep(100);
  1047. gh->gh_flags &= ~GL_ASYNC;
  1048. error = gfs2_glock_nq(gh);
  1049. }
  1050. return error;
  1051. }
  1052. /**
  1053. * gfs2_glock_dq - dequeue a struct gfs2_holder from a glock (release a glock)
  1054. * @gh: the glock holder
  1055. *
  1056. */
  1057. void gfs2_glock_dq(struct gfs2_holder *gh)
  1058. {
  1059. struct gfs2_glock *gl = gh->gh_gl;
  1060. const struct gfs2_glock_operations *glops = gl->gl_ops;
  1061. if (gh->gh_flags & GL_NOCACHE)
  1062. handle_callback(gl, LM_ST_UNLOCKED);
  1063. gfs2_glmutex_lock(gl);
  1064. spin_lock(&gl->gl_spin);
  1065. list_del_init(&gh->gh_list);
  1066. if (list_empty(&gl->gl_holders)) {
  1067. spin_unlock(&gl->gl_spin);
  1068. if (glops->go_unlock)
  1069. glops->go_unlock(gh);
  1070. gl->gl_stamp = jiffies;
  1071. spin_lock(&gl->gl_spin);
  1072. }
  1073. clear_bit(GLF_LOCK, &gl->gl_flags);
  1074. run_queue(gl);
  1075. spin_unlock(&gl->gl_spin);
  1076. }
  1077. /**
  1078. * gfs2_glock_prefetch - Try to prefetch a glock
  1079. * @gl: the glock
  1080. * @state: the state to prefetch in
  1081. * @flags: flags passed to go_xmote_th()
  1082. *
  1083. */
  1084. static void gfs2_glock_prefetch(struct gfs2_glock *gl, unsigned int state,
  1085. int flags)
  1086. {
  1087. const struct gfs2_glock_operations *glops = gl->gl_ops;
  1088. spin_lock(&gl->gl_spin);
  1089. if (test_bit(GLF_LOCK, &gl->gl_flags) ||
  1090. !list_empty(&gl->gl_holders) ||
  1091. !list_empty(&gl->gl_waiters1) ||
  1092. !list_empty(&gl->gl_waiters2) ||
  1093. !list_empty(&gl->gl_waiters3) ||
  1094. relaxed_state_ok(gl->gl_state, state, flags)) {
  1095. spin_unlock(&gl->gl_spin);
  1096. return;
  1097. }
  1098. set_bit(GLF_PREFETCH, &gl->gl_flags);
  1099. set_bit(GLF_LOCK, &gl->gl_flags);
  1100. spin_unlock(&gl->gl_spin);
  1101. glops->go_xmote_th(gl, state, flags);
  1102. }
  1103. static void greedy_work(void *data)
  1104. {
  1105. struct greedy *gr = data;
  1106. struct gfs2_holder *gh = &gr->gr_gh;
  1107. struct gfs2_glock *gl = gh->gh_gl;
  1108. const struct gfs2_glock_operations *glops = gl->gl_ops;
  1109. clear_bit(GLF_SKIP_WAITERS2, &gl->gl_flags);
  1110. if (glops->go_greedy)
  1111. glops->go_greedy(gl);
  1112. spin_lock(&gl->gl_spin);
  1113. if (list_empty(&gl->gl_waiters2)) {
  1114. clear_bit(GLF_GREEDY, &gl->gl_flags);
  1115. spin_unlock(&gl->gl_spin);
  1116. gfs2_holder_uninit(gh);
  1117. kfree(gr);
  1118. } else {
  1119. gfs2_glock_hold(gl);
  1120. list_add_tail(&gh->gh_list, &gl->gl_waiters2);
  1121. run_queue(gl);
  1122. spin_unlock(&gl->gl_spin);
  1123. gfs2_glock_put(gl);
  1124. }
  1125. }
  1126. /**
  1127. * gfs2_glock_be_greedy -
  1128. * @gl:
  1129. * @time:
  1130. *
  1131. * Returns: 0 if go_greedy will be called, 1 otherwise
  1132. */
  1133. int gfs2_glock_be_greedy(struct gfs2_glock *gl, unsigned int time)
  1134. {
  1135. struct greedy *gr;
  1136. struct gfs2_holder *gh;
  1137. if (!time || gl->gl_sbd->sd_args.ar_localcaching ||
  1138. test_and_set_bit(GLF_GREEDY, &gl->gl_flags))
  1139. return 1;
  1140. gr = kmalloc(sizeof(struct greedy), GFP_KERNEL);
  1141. if (!gr) {
  1142. clear_bit(GLF_GREEDY, &gl->gl_flags);
  1143. return 1;
  1144. }
  1145. gh = &gr->gr_gh;
  1146. gfs2_holder_init(gl, 0, 0, gh);
  1147. set_bit(HIF_GREEDY, &gh->gh_iflags);
  1148. INIT_WORK(&gr->gr_work, greedy_work, gr);
  1149. set_bit(GLF_SKIP_WAITERS2, &gl->gl_flags);
  1150. schedule_delayed_work(&gr->gr_work, time);
  1151. return 0;
  1152. }
  1153. /**
  1154. * gfs2_glock_dq_uninit - dequeue a holder from a glock and initialize it
  1155. * @gh: the holder structure
  1156. *
  1157. */
  1158. void gfs2_glock_dq_uninit(struct gfs2_holder *gh)
  1159. {
  1160. gfs2_glock_dq(gh);
  1161. gfs2_holder_uninit(gh);
  1162. }
  1163. /**
  1164. * gfs2_glock_nq_num - acquire a glock based on lock number
  1165. * @sdp: the filesystem
  1166. * @number: the lock number
  1167. * @glops: the glock operations for the type of glock
  1168. * @state: the state to acquire the glock in
  1169. * @flags: modifier flags for the aquisition
  1170. * @gh: the struct gfs2_holder
  1171. *
  1172. * Returns: errno
  1173. */
  1174. int gfs2_glock_nq_num(struct gfs2_sbd *sdp, uint64_t number,
  1175. const struct gfs2_glock_operations *glops,
  1176. unsigned int state, int flags, struct gfs2_holder *gh)
  1177. {
  1178. struct gfs2_glock *gl;
  1179. int error;
  1180. error = gfs2_glock_get(sdp, number, glops, CREATE, &gl);
  1181. if (!error) {
  1182. error = gfs2_glock_nq_init(gl, state, flags, gh);
  1183. gfs2_glock_put(gl);
  1184. }
  1185. return error;
  1186. }
  1187. /**
  1188. * glock_compare - Compare two struct gfs2_glock structures for sorting
  1189. * @arg_a: the first structure
  1190. * @arg_b: the second structure
  1191. *
  1192. */
  1193. static int glock_compare(const void *arg_a, const void *arg_b)
  1194. {
  1195. struct gfs2_holder *gh_a = *(struct gfs2_holder **)arg_a;
  1196. struct gfs2_holder *gh_b = *(struct gfs2_holder **)arg_b;
  1197. struct lm_lockname *a = &gh_a->gh_gl->gl_name;
  1198. struct lm_lockname *b = &gh_b->gh_gl->gl_name;
  1199. int ret = 0;
  1200. if (a->ln_number > b->ln_number)
  1201. ret = 1;
  1202. else if (a->ln_number < b->ln_number)
  1203. ret = -1;
  1204. else {
  1205. if (gh_a->gh_state == LM_ST_SHARED &&
  1206. gh_b->gh_state == LM_ST_EXCLUSIVE)
  1207. ret = 1;
  1208. else if (!(gh_a->gh_flags & GL_LOCAL_EXCL) &&
  1209. (gh_b->gh_flags & GL_LOCAL_EXCL))
  1210. ret = 1;
  1211. }
  1212. return ret;
  1213. }
  1214. /**
  1215. * nq_m_sync - synchonously acquire more than one glock in deadlock free order
  1216. * @num_gh: the number of structures
  1217. * @ghs: an array of struct gfs2_holder structures
  1218. *
  1219. * Returns: 0 on success (all glocks acquired),
  1220. * errno on failure (no glocks acquired)
  1221. */
  1222. static int nq_m_sync(unsigned int num_gh, struct gfs2_holder *ghs,
  1223. struct gfs2_holder **p)
  1224. {
  1225. unsigned int x;
  1226. int error = 0;
  1227. for (x = 0; x < num_gh; x++)
  1228. p[x] = &ghs[x];
  1229. sort(p, num_gh, sizeof(struct gfs2_holder *), glock_compare, NULL);
  1230. for (x = 0; x < num_gh; x++) {
  1231. p[x]->gh_flags &= ~(LM_FLAG_TRY | GL_ASYNC);
  1232. error = gfs2_glock_nq(p[x]);
  1233. if (error) {
  1234. while (x--)
  1235. gfs2_glock_dq(p[x]);
  1236. break;
  1237. }
  1238. }
  1239. return error;
  1240. }
  1241. /**
  1242. * gfs2_glock_nq_m - acquire multiple glocks
  1243. * @num_gh: the number of structures
  1244. * @ghs: an array of struct gfs2_holder structures
  1245. *
  1246. * Figure out how big an impact this function has. Either:
  1247. * 1) Replace this code with code that calls gfs2_glock_prefetch()
  1248. * 2) Forget async stuff and just call nq_m_sync()
  1249. * 3) Leave it like it is
  1250. *
  1251. * Returns: 0 on success (all glocks acquired),
  1252. * errno on failure (no glocks acquired)
  1253. */
  1254. int gfs2_glock_nq_m(unsigned int num_gh, struct gfs2_holder *ghs)
  1255. {
  1256. int *e;
  1257. unsigned int x;
  1258. int borked = 0, serious = 0;
  1259. int error = 0;
  1260. if (!num_gh)
  1261. return 0;
  1262. if (num_gh == 1) {
  1263. ghs->gh_flags &= ~(LM_FLAG_TRY | GL_ASYNC);
  1264. return gfs2_glock_nq(ghs);
  1265. }
  1266. e = kcalloc(num_gh, sizeof(struct gfs2_holder *), GFP_KERNEL);
  1267. if (!e)
  1268. return -ENOMEM;
  1269. for (x = 0; x < num_gh; x++) {
  1270. ghs[x].gh_flags |= LM_FLAG_TRY | GL_ASYNC;
  1271. error = gfs2_glock_nq(&ghs[x]);
  1272. if (error) {
  1273. borked = 1;
  1274. serious = error;
  1275. num_gh = x;
  1276. break;
  1277. }
  1278. }
  1279. for (x = 0; x < num_gh; x++) {
  1280. error = e[x] = glock_wait_internal(&ghs[x]);
  1281. if (error) {
  1282. borked = 1;
  1283. if (error != GLR_TRYFAILED && error != GLR_CANCELED)
  1284. serious = error;
  1285. }
  1286. }
  1287. if (!borked) {
  1288. kfree(e);
  1289. return 0;
  1290. }
  1291. for (x = 0; x < num_gh; x++)
  1292. if (!e[x])
  1293. gfs2_glock_dq(&ghs[x]);
  1294. if (serious)
  1295. error = serious;
  1296. else {
  1297. for (x = 0; x < num_gh; x++)
  1298. gfs2_holder_reinit(ghs[x].gh_state, ghs[x].gh_flags,
  1299. &ghs[x]);
  1300. error = nq_m_sync(num_gh, ghs, (struct gfs2_holder **)e);
  1301. }
  1302. kfree(e);
  1303. return error;
  1304. }
  1305. /**
  1306. * gfs2_glock_dq_m - release multiple glocks
  1307. * @num_gh: the number of structures
  1308. * @ghs: an array of struct gfs2_holder structures
  1309. *
  1310. */
  1311. void gfs2_glock_dq_m(unsigned int num_gh, struct gfs2_holder *ghs)
  1312. {
  1313. unsigned int x;
  1314. for (x = 0; x < num_gh; x++)
  1315. gfs2_glock_dq(&ghs[x]);
  1316. }
  1317. /**
  1318. * gfs2_glock_dq_uninit_m - release multiple glocks
  1319. * @num_gh: the number of structures
  1320. * @ghs: an array of struct gfs2_holder structures
  1321. *
  1322. */
  1323. void gfs2_glock_dq_uninit_m(unsigned int num_gh, struct gfs2_holder *ghs)
  1324. {
  1325. unsigned int x;
  1326. for (x = 0; x < num_gh; x++)
  1327. gfs2_glock_dq_uninit(&ghs[x]);
  1328. }
  1329. /**
  1330. * gfs2_glock_prefetch_num - prefetch a glock based on lock number
  1331. * @sdp: the filesystem
  1332. * @number: the lock number
  1333. * @glops: the glock operations for the type of glock
  1334. * @state: the state to acquire the glock in
  1335. * @flags: modifier flags for the aquisition
  1336. *
  1337. * Returns: errno
  1338. */
  1339. void gfs2_glock_prefetch_num(struct gfs2_sbd *sdp, uint64_t number,
  1340. const struct gfs2_glock_operations *glops,
  1341. unsigned int state, int flags)
  1342. {
  1343. struct gfs2_glock *gl;
  1344. int error;
  1345. if (atomic_read(&sdp->sd_reclaim_count) <
  1346. gfs2_tune_get(sdp, gt_reclaim_limit)) {
  1347. error = gfs2_glock_get(sdp, number, glops, CREATE, &gl);
  1348. if (!error) {
  1349. gfs2_glock_prefetch(gl, state, flags);
  1350. gfs2_glock_put(gl);
  1351. }
  1352. }
  1353. }
  1354. /**
  1355. * gfs2_lvb_hold - attach a LVB from a glock
  1356. * @gl: The glock in question
  1357. *
  1358. */
  1359. int gfs2_lvb_hold(struct gfs2_glock *gl)
  1360. {
  1361. int error;
  1362. gfs2_glmutex_lock(gl);
  1363. if (!atomic_read(&gl->gl_lvb_count)) {
  1364. error = gfs2_lm_hold_lvb(gl->gl_sbd, gl->gl_lock, &gl->gl_lvb);
  1365. if (error) {
  1366. gfs2_glmutex_unlock(gl);
  1367. return error;
  1368. }
  1369. gfs2_glock_hold(gl);
  1370. }
  1371. atomic_inc(&gl->gl_lvb_count);
  1372. gfs2_glmutex_unlock(gl);
  1373. return 0;
  1374. }
  1375. /**
  1376. * gfs2_lvb_unhold - detach a LVB from a glock
  1377. * @gl: The glock in question
  1378. *
  1379. */
  1380. void gfs2_lvb_unhold(struct gfs2_glock *gl)
  1381. {
  1382. gfs2_glock_hold(gl);
  1383. gfs2_glmutex_lock(gl);
  1384. gfs2_assert(gl->gl_sbd, atomic_read(&gl->gl_lvb_count) > 0);
  1385. if (atomic_dec_and_test(&gl->gl_lvb_count)) {
  1386. gfs2_lm_unhold_lvb(gl->gl_sbd, gl->gl_lock, gl->gl_lvb);
  1387. gl->gl_lvb = NULL;
  1388. gfs2_glock_put(gl);
  1389. }
  1390. gfs2_glmutex_unlock(gl);
  1391. gfs2_glock_put(gl);
  1392. }
  1393. #if 0
  1394. void gfs2_lvb_sync(struct gfs2_glock *gl)
  1395. {
  1396. gfs2_glmutex_lock(gl);
  1397. gfs2_assert(gl->gl_sbd, atomic_read(&gl->gl_lvb_count));
  1398. if (!gfs2_assert_warn(gl->gl_sbd, gfs2_glock_is_held_excl(gl)))
  1399. gfs2_lm_sync_lvb(gl->gl_sbd, gl->gl_lock, gl->gl_lvb);
  1400. gfs2_glmutex_unlock(gl);
  1401. }
  1402. #endif /* 0 */
  1403. static void blocking_cb(struct gfs2_sbd *sdp, struct lm_lockname *name,
  1404. unsigned int state)
  1405. {
  1406. struct gfs2_glock *gl;
  1407. gl = gfs2_glock_find(sdp, name);
  1408. if (!gl)
  1409. return;
  1410. if (gl->gl_ops->go_callback)
  1411. gl->gl_ops->go_callback(gl, state);
  1412. handle_callback(gl, state);
  1413. spin_lock(&gl->gl_spin);
  1414. run_queue(gl);
  1415. spin_unlock(&gl->gl_spin);
  1416. gfs2_glock_put(gl);
  1417. }
  1418. /**
  1419. * gfs2_glock_cb - Callback used by locking module
  1420. * @fsdata: Pointer to the superblock
  1421. * @type: Type of callback
  1422. * @data: Type dependent data pointer
  1423. *
  1424. * Called by the locking module when it wants to tell us something.
  1425. * Either we need to drop a lock, one of our ASYNC requests completed, or
  1426. * a journal from another client needs to be recovered.
  1427. */
  1428. void gfs2_glock_cb(lm_fsdata_t *fsdata, unsigned int type, void *data)
  1429. {
  1430. struct gfs2_sbd *sdp = (struct gfs2_sbd *)fsdata;
  1431. switch (type) {
  1432. case LM_CB_NEED_E:
  1433. blocking_cb(sdp, data, LM_ST_UNLOCKED);
  1434. return;
  1435. case LM_CB_NEED_D:
  1436. blocking_cb(sdp, data, LM_ST_DEFERRED);
  1437. return;
  1438. case LM_CB_NEED_S:
  1439. blocking_cb(sdp, data, LM_ST_SHARED);
  1440. return;
  1441. case LM_CB_ASYNC: {
  1442. struct lm_async_cb *async = data;
  1443. struct gfs2_glock *gl;
  1444. gl = gfs2_glock_find(sdp, &async->lc_name);
  1445. if (gfs2_assert_warn(sdp, gl))
  1446. return;
  1447. if (!gfs2_assert_warn(sdp, gl->gl_req_bh))
  1448. gl->gl_req_bh(gl, async->lc_ret);
  1449. gfs2_glock_put(gl);
  1450. return;
  1451. }
  1452. case LM_CB_NEED_RECOVERY:
  1453. gfs2_jdesc_make_dirty(sdp, *(unsigned int *)data);
  1454. if (sdp->sd_recoverd_process)
  1455. wake_up_process(sdp->sd_recoverd_process);
  1456. return;
  1457. case LM_CB_DROPLOCKS:
  1458. gfs2_gl_hash_clear(sdp, NO_WAIT);
  1459. gfs2_quota_scan(sdp);
  1460. return;
  1461. default:
  1462. gfs2_assert_warn(sdp, 0);
  1463. return;
  1464. }
  1465. }
  1466. /**
  1467. * gfs2_iopen_go_callback - Try to kick the inode/vnode associated with an
  1468. * iopen glock from memory
  1469. * @io_gl: the iopen glock
  1470. * @state: the state into which the glock should be put
  1471. *
  1472. */
  1473. void gfs2_iopen_go_callback(struct gfs2_glock *io_gl, unsigned int state)
  1474. {
  1475. if (state != LM_ST_UNLOCKED)
  1476. return;
  1477. /* FIXME: remove this? */
  1478. }
  1479. /**
  1480. * demote_ok - Check to see if it's ok to unlock a glock
  1481. * @gl: the glock
  1482. *
  1483. * Returns: 1 if it's ok
  1484. */
  1485. static int demote_ok(struct gfs2_glock *gl)
  1486. {
  1487. struct gfs2_sbd *sdp = gl->gl_sbd;
  1488. const struct gfs2_glock_operations *glops = gl->gl_ops;
  1489. int demote = 1;
  1490. if (test_bit(GLF_STICKY, &gl->gl_flags))
  1491. demote = 0;
  1492. else if (test_bit(GLF_PREFETCH, &gl->gl_flags))
  1493. demote = time_after_eq(jiffies,
  1494. gl->gl_stamp +
  1495. gfs2_tune_get(sdp, gt_prefetch_secs) * HZ);
  1496. else if (glops->go_demote_ok)
  1497. demote = glops->go_demote_ok(gl);
  1498. return demote;
  1499. }
  1500. /**
  1501. * gfs2_glock_schedule_for_reclaim - Add a glock to the reclaim list
  1502. * @gl: the glock
  1503. *
  1504. */
  1505. void gfs2_glock_schedule_for_reclaim(struct gfs2_glock *gl)
  1506. {
  1507. struct gfs2_sbd *sdp = gl->gl_sbd;
  1508. spin_lock(&sdp->sd_reclaim_lock);
  1509. if (list_empty(&gl->gl_reclaim)) {
  1510. gfs2_glock_hold(gl);
  1511. list_add(&gl->gl_reclaim, &sdp->sd_reclaim_list);
  1512. atomic_inc(&sdp->sd_reclaim_count);
  1513. }
  1514. spin_unlock(&sdp->sd_reclaim_lock);
  1515. wake_up(&sdp->sd_reclaim_wq);
  1516. }
  1517. /**
  1518. * gfs2_reclaim_glock - process the next glock on the filesystem's reclaim list
  1519. * @sdp: the filesystem
  1520. *
  1521. * Called from gfs2_glockd() glock reclaim daemon, or when promoting a
  1522. * different glock and we notice that there are a lot of glocks in the
  1523. * reclaim list.
  1524. *
  1525. */
  1526. void gfs2_reclaim_glock(struct gfs2_sbd *sdp)
  1527. {
  1528. struct gfs2_glock *gl;
  1529. spin_lock(&sdp->sd_reclaim_lock);
  1530. if (list_empty(&sdp->sd_reclaim_list)) {
  1531. spin_unlock(&sdp->sd_reclaim_lock);
  1532. return;
  1533. }
  1534. gl = list_entry(sdp->sd_reclaim_list.next,
  1535. struct gfs2_glock, gl_reclaim);
  1536. list_del_init(&gl->gl_reclaim);
  1537. spin_unlock(&sdp->sd_reclaim_lock);
  1538. atomic_dec(&sdp->sd_reclaim_count);
  1539. atomic_inc(&sdp->sd_reclaimed);
  1540. if (gfs2_glmutex_trylock(gl)) {
  1541. if (queue_empty(gl, &gl->gl_holders) &&
  1542. gl->gl_state != LM_ST_UNLOCKED &&
  1543. demote_ok(gl))
  1544. handle_callback(gl, LM_ST_UNLOCKED);
  1545. gfs2_glmutex_unlock(gl);
  1546. }
  1547. gfs2_glock_put(gl);
  1548. }
  1549. /**
  1550. * examine_bucket - Call a function for glock in a hash bucket
  1551. * @examiner: the function
  1552. * @sdp: the filesystem
  1553. * @bucket: the bucket
  1554. *
  1555. * Returns: 1 if the bucket has entries
  1556. */
  1557. static int examine_bucket(glock_examiner examiner, struct gfs2_sbd *sdp,
  1558. struct gfs2_gl_hash_bucket *bucket)
  1559. {
  1560. struct glock_plug plug;
  1561. struct list_head *tmp;
  1562. struct gfs2_glock *gl;
  1563. int entries;
  1564. /* Add "plug" to end of bucket list, work back up list from there */
  1565. memset(&plug.gl_flags, 0, sizeof(unsigned long));
  1566. set_bit(GLF_PLUG, &plug.gl_flags);
  1567. write_lock(&bucket->hb_lock);
  1568. list_add(&plug.gl_list, &bucket->hb_list);
  1569. write_unlock(&bucket->hb_lock);
  1570. for (;;) {
  1571. write_lock(&bucket->hb_lock);
  1572. for (;;) {
  1573. tmp = plug.gl_list.next;
  1574. if (tmp == &bucket->hb_list) {
  1575. list_del(&plug.gl_list);
  1576. entries = !list_empty(&bucket->hb_list);
  1577. write_unlock(&bucket->hb_lock);
  1578. return entries;
  1579. }
  1580. gl = list_entry(tmp, struct gfs2_glock, gl_list);
  1581. /* Move plug up list */
  1582. list_move(&plug.gl_list, &gl->gl_list);
  1583. if (test_bit(GLF_PLUG, &gl->gl_flags))
  1584. continue;
  1585. /* examiner() must glock_put() */
  1586. gfs2_glock_hold(gl);
  1587. break;
  1588. }
  1589. write_unlock(&bucket->hb_lock);
  1590. examiner(gl);
  1591. }
  1592. }
  1593. /**
  1594. * scan_glock - look at a glock and see if we can reclaim it
  1595. * @gl: the glock to look at
  1596. *
  1597. */
  1598. static void scan_glock(struct gfs2_glock *gl)
  1599. {
  1600. if (gl->gl_ops == &gfs2_inode_glops)
  1601. goto out;
  1602. if (gfs2_glmutex_trylock(gl)) {
  1603. if (queue_empty(gl, &gl->gl_holders) &&
  1604. gl->gl_state != LM_ST_UNLOCKED &&
  1605. demote_ok(gl))
  1606. goto out_schedule;
  1607. gfs2_glmutex_unlock(gl);
  1608. }
  1609. out:
  1610. gfs2_glock_put(gl);
  1611. return;
  1612. out_schedule:
  1613. gfs2_glmutex_unlock(gl);
  1614. gfs2_glock_schedule_for_reclaim(gl);
  1615. gfs2_glock_put(gl);
  1616. }
  1617. /**
  1618. * gfs2_scand_internal - Look for glocks and inodes to toss from memory
  1619. * @sdp: the filesystem
  1620. *
  1621. */
  1622. void gfs2_scand_internal(struct gfs2_sbd *sdp)
  1623. {
  1624. unsigned int x;
  1625. for (x = 0; x < GFS2_GL_HASH_SIZE; x++) {
  1626. examine_bucket(scan_glock, sdp, &sdp->sd_gl_hash[x]);
  1627. cond_resched();
  1628. }
  1629. }
  1630. /**
  1631. * clear_glock - look at a glock and see if we can free it from glock cache
  1632. * @gl: the glock to look at
  1633. *
  1634. */
  1635. static void clear_glock(struct gfs2_glock *gl)
  1636. {
  1637. struct gfs2_sbd *sdp = gl->gl_sbd;
  1638. int released;
  1639. spin_lock(&sdp->sd_reclaim_lock);
  1640. if (!list_empty(&gl->gl_reclaim)) {
  1641. list_del_init(&gl->gl_reclaim);
  1642. atomic_dec(&sdp->sd_reclaim_count);
  1643. spin_unlock(&sdp->sd_reclaim_lock);
  1644. released = gfs2_glock_put(gl);
  1645. gfs2_assert(sdp, !released);
  1646. } else {
  1647. spin_unlock(&sdp->sd_reclaim_lock);
  1648. }
  1649. if (gfs2_glmutex_trylock(gl)) {
  1650. if (queue_empty(gl, &gl->gl_holders) &&
  1651. gl->gl_state != LM_ST_UNLOCKED)
  1652. handle_callback(gl, LM_ST_UNLOCKED);
  1653. gfs2_glmutex_unlock(gl);
  1654. }
  1655. gfs2_glock_put(gl);
  1656. }
  1657. /**
  1658. * gfs2_gl_hash_clear - Empty out the glock hash table
  1659. * @sdp: the filesystem
  1660. * @wait: wait until it's all gone
  1661. *
  1662. * Called when unmounting the filesystem, or when inter-node lock manager
  1663. * requests DROPLOCKS because it is running out of capacity.
  1664. */
  1665. void gfs2_gl_hash_clear(struct gfs2_sbd *sdp, int wait)
  1666. {
  1667. unsigned long t;
  1668. unsigned int x;
  1669. int cont;
  1670. t = jiffies;
  1671. for (;;) {
  1672. cont = 0;
  1673. for (x = 0; x < GFS2_GL_HASH_SIZE; x++)
  1674. if (examine_bucket(clear_glock, sdp,
  1675. &sdp->sd_gl_hash[x]))
  1676. cont = 1;
  1677. if (!wait || !cont)
  1678. break;
  1679. if (time_after_eq(jiffies,
  1680. t + gfs2_tune_get(sdp, gt_stall_secs) * HZ)) {
  1681. fs_warn(sdp, "Unmount seems to be stalled. "
  1682. "Dumping lock state...\n");
  1683. gfs2_dump_lockstate(sdp);
  1684. t = jiffies;
  1685. }
  1686. invalidate_inodes(sdp->sd_vfs);
  1687. msleep(10);
  1688. }
  1689. }
  1690. /*
  1691. * Diagnostic routines to help debug distributed deadlock
  1692. */
  1693. /**
  1694. * dump_holder - print information about a glock holder
  1695. * @str: a string naming the type of holder
  1696. * @gh: the glock holder
  1697. *
  1698. * Returns: 0 on success, -ENOBUFS when we run out of space
  1699. */
  1700. static int dump_holder(char *str, struct gfs2_holder *gh)
  1701. {
  1702. unsigned int x;
  1703. int error = -ENOBUFS;
  1704. printk(KERN_INFO " %s\n", str);
  1705. printk(KERN_INFO " owner = %ld\n",
  1706. (gh->gh_owner) ? (long)gh->gh_owner->pid : -1);
  1707. printk(KERN_INFO " gh_state = %u\n", gh->gh_state);
  1708. printk(KERN_INFO " gh_flags =");
  1709. for (x = 0; x < 32; x++)
  1710. if (gh->gh_flags & (1 << x))
  1711. printk(" %u", x);
  1712. printk(" \n");
  1713. printk(KERN_INFO " error = %d\n", gh->gh_error);
  1714. printk(KERN_INFO " gh_iflags =");
  1715. for (x = 0; x < 32; x++)
  1716. if (test_bit(x, &gh->gh_iflags))
  1717. printk(" %u", x);
  1718. printk(" \n");
  1719. print_symbol(KERN_INFO " initialized at: %s\n", gh->gh_ip);
  1720. error = 0;
  1721. return error;
  1722. }
  1723. /**
  1724. * dump_inode - print information about an inode
  1725. * @ip: the inode
  1726. *
  1727. * Returns: 0 on success, -ENOBUFS when we run out of space
  1728. */
  1729. static int dump_inode(struct gfs2_inode *ip)
  1730. {
  1731. unsigned int x;
  1732. int error = -ENOBUFS;
  1733. printk(KERN_INFO " Inode:\n");
  1734. printk(KERN_INFO " num = %llu %llu\n",
  1735. (unsigned long long)ip->i_num.no_formal_ino,
  1736. (unsigned long long)ip->i_num.no_addr);
  1737. printk(KERN_INFO " type = %u\n", IF2DT(ip->i_di.di_mode));
  1738. printk(KERN_INFO " i_flags =");
  1739. for (x = 0; x < 32; x++)
  1740. if (test_bit(x, &ip->i_flags))
  1741. printk(" %u", x);
  1742. printk(" \n");
  1743. error = 0;
  1744. return error;
  1745. }
  1746. /**
  1747. * dump_glock - print information about a glock
  1748. * @gl: the glock
  1749. * @count: where we are in the buffer
  1750. *
  1751. * Returns: 0 on success, -ENOBUFS when we run out of space
  1752. */
  1753. static int dump_glock(struct gfs2_glock *gl)
  1754. {
  1755. struct gfs2_holder *gh;
  1756. unsigned int x;
  1757. int error = -ENOBUFS;
  1758. spin_lock(&gl->gl_spin);
  1759. printk(KERN_INFO "Glock 0x%p (%u, %llu)\n",
  1760. gl,
  1761. gl->gl_name.ln_type,
  1762. (unsigned long long)gl->gl_name.ln_number);
  1763. printk(KERN_INFO " gl_flags =");
  1764. for (x = 0; x < 32; x++)
  1765. if (test_bit(x, &gl->gl_flags))
  1766. printk(" %u", x);
  1767. printk(" \n");
  1768. printk(KERN_INFO " gl_ref = %d\n", atomic_read(&gl->gl_ref.refcount));
  1769. printk(KERN_INFO " gl_state = %u\n", gl->gl_state);
  1770. printk(KERN_INFO " gl_owner = %s\n", gl->gl_owner->comm);
  1771. print_symbol(KERN_INFO " gl_ip = %s\n", gl->gl_ip);
  1772. printk(KERN_INFO " req_gh = %s\n", (gl->gl_req_gh) ? "yes" : "no");
  1773. printk(KERN_INFO " req_bh = %s\n", (gl->gl_req_bh) ? "yes" : "no");
  1774. printk(KERN_INFO " lvb_count = %d\n", atomic_read(&gl->gl_lvb_count));
  1775. printk(KERN_INFO " object = %s\n", (gl->gl_object) ? "yes" : "no");
  1776. printk(KERN_INFO " le = %s\n",
  1777. (list_empty(&gl->gl_le.le_list)) ? "no" : "yes");
  1778. printk(KERN_INFO " reclaim = %s\n",
  1779. (list_empty(&gl->gl_reclaim)) ? "no" : "yes");
  1780. if (gl->gl_aspace)
  1781. printk(KERN_INFO " aspace = 0x%p nrpages = %lu\n",
  1782. gl->gl_aspace,
  1783. gl->gl_aspace->i_mapping->nrpages);
  1784. else
  1785. printk(KERN_INFO " aspace = no\n");
  1786. printk(KERN_INFO " ail = %d\n", atomic_read(&gl->gl_ail_count));
  1787. if (gl->gl_req_gh) {
  1788. error = dump_holder("Request", gl->gl_req_gh);
  1789. if (error)
  1790. goto out;
  1791. }
  1792. list_for_each_entry(gh, &gl->gl_holders, gh_list) {
  1793. error = dump_holder("Holder", gh);
  1794. if (error)
  1795. goto out;
  1796. }
  1797. list_for_each_entry(gh, &gl->gl_waiters1, gh_list) {
  1798. error = dump_holder("Waiter1", gh);
  1799. if (error)
  1800. goto out;
  1801. }
  1802. list_for_each_entry(gh, &gl->gl_waiters2, gh_list) {
  1803. error = dump_holder("Waiter2", gh);
  1804. if (error)
  1805. goto out;
  1806. }
  1807. list_for_each_entry(gh, &gl->gl_waiters3, gh_list) {
  1808. error = dump_holder("Waiter3", gh);
  1809. if (error)
  1810. goto out;
  1811. }
  1812. if (gl->gl_ops == &gfs2_inode_glops && gl->gl_object) {
  1813. if (!test_bit(GLF_LOCK, &gl->gl_flags) &&
  1814. list_empty(&gl->gl_holders)) {
  1815. error = dump_inode(gl->gl_object);
  1816. if (error)
  1817. goto out;
  1818. } else {
  1819. error = -ENOBUFS;
  1820. printk(KERN_INFO " Inode: busy\n");
  1821. }
  1822. }
  1823. error = 0;
  1824. out:
  1825. spin_unlock(&gl->gl_spin);
  1826. return error;
  1827. }
  1828. /**
  1829. * gfs2_dump_lockstate - print out the current lockstate
  1830. * @sdp: the filesystem
  1831. * @ub: the buffer to copy the information into
  1832. *
  1833. * If @ub is NULL, dump the lockstate to the console.
  1834. *
  1835. */
  1836. static int gfs2_dump_lockstate(struct gfs2_sbd *sdp)
  1837. {
  1838. struct gfs2_gl_hash_bucket *bucket;
  1839. struct gfs2_glock *gl;
  1840. unsigned int x;
  1841. int error = 0;
  1842. for (x = 0; x < GFS2_GL_HASH_SIZE; x++) {
  1843. bucket = &sdp->sd_gl_hash[x];
  1844. read_lock(&bucket->hb_lock);
  1845. list_for_each_entry(gl, &bucket->hb_list, gl_list) {
  1846. if (test_bit(GLF_PLUG, &gl->gl_flags))
  1847. continue;
  1848. error = dump_glock(gl);
  1849. if (error)
  1850. break;
  1851. }
  1852. read_unlock(&bucket->hb_lock);
  1853. if (error)
  1854. break;
  1855. }
  1856. return error;
  1857. }