nfs4state.c 58 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127
71278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320132113221323132413251326132713281329133013311332133313341335133613371338133913401341134213431344134513461347134813491350135113521353135413551356135713581359136013611362136313641365136613671368136913701371137213731374137513761377137813791380138113821383138413851386138713881389139013911392139313941395139613971398139914001401140214031404140514061407140814091410141114121413141414151416141714181419142014211422142314241425142614271428142914301431143214331434143514361437143814391440144114421443144414451446144714481449145014511452145314541455145614571458145914601461146214631464146514661467146814691470147114721473147414751476147714781479148014811482148314841485148614871488148914901491149214931494149514961497149814991500150115021503150415051506150715081509151015111512151315141515151615171518151915201521152215231524152515261527152815291530153115321533153415351536153715381539154015411542154315441545154615471548154915501551155215531554155515561557155815591560156115621563156415651566156715681569157015711572157315741575157615771578157915801581158215831584158515861587158815891590159115921593159415951596159715981599160016011602160316041605160616071608160916101611161216131614161516161617161816191620162116221623162416251626162716281629163016311632163316341635163616371638163916401641164216431644164516461647164816491650165116521653165416551656165716581659166016611662166316641665166616671668166916701671167216731674167516761677167816791680168116821683168416851686168716881689169016911692169316941695169616971698169917001701170217031704170517061707170817091710171117121713171417151716171717181719172017211722172317241725172617271728172917301731173217331734173517361737173817391740174117421743174417451746174717481749175017511752175317541755175617571758175917601761176217631764176517661767176817691770177117721773177417751776177
71778177917801781178217831784178517861787178817891790179117921793179417951796179717981799180018011802180318041805180618071808180918101811181218131814181518161817181818191820182118221823182418251826182718281829183018311832183318341835183618371838183918401841184218431844184518461847184818491850185118521853185418551856185718581859186018611862186318641865186618671868186918701871187218731874187518761877187818791880188118821883188418851886188718881889189018911892189318941895189618971898189919001901190219031904190519061907190819091910191119121913191419151916191719181919192019211922192319241925192619271928192919301931193219331934193519361937193819391940194119421943194419451946194719481949195019511952195319541955195619571958195919601961196219631964196519661967196819691970197119721973197419751976197719781979198019811982198319841985198619871988198919901991199219931994199519961997199819992000200120022003200420052006200720082009201020112012201320142015201620172018201920202021202220232024202520262027202820292030203120322033203420352036203720382039204020412042204320442045204620472048204920502051205220532054205520562057205820592060206120622063206420652066206720682069207020712072207320742075207620772078207920802081208220832084208520862087208820892090209120922093209420952096209720982099210021012102210321042105210621072108210921102111211221132114211521162117211821192120212121222123212421252126212721282129213021312132213321342135213621372138213921402141214221432144214521462147214821492150215121522153215421552156215721582159216021612162216321642165216621672168216921702171217221732174217521762177217821792180218121822183218421852186218721882189219021912192219321942195219621972198219922002201220222032204220522062207220822092210221122122213221422152216221722182219222022212222222322242225222622272228222922302231
  1. /*
  2. * fs/nfs/nfs4state.c
  3. *
  4. * Client-side state management for NFSv4.
  5. *
  6. * Copyright (c) 2002 The Regents of the University of Michigan.
  7. * All rights reserved.
  8. *
  9. * Kendrick Smith <kmsmith@umich.edu>
  10. *
  11. * Redistribution and use in source and binary forms, with or without
  12. * modification, are permitted provided that the following conditions
  13. * are met:
  14. *
  15. * 1. Redistributions of source code must retain the above copyright
  16. * notice, this list of conditions and the following disclaimer.
  17. * 2. Redistributions in binary form must reproduce the above copyright
  18. * notice, this list of conditions and the following disclaimer in the
  19. * documentation and/or other materials provided with the distribution.
  20. * 3. Neither the name of the University nor the names of its
  21. * contributors may be used to endorse or promote products derived
  22. * from this software without specific prior written permission.
  23. *
  24. * THIS SOFTWARE IS PROVIDED ``AS IS'' AND ANY EXPRESS OR IMPLIED
  25. * WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
  26. * MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
  27. * DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
  28. * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
  29. * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
  30. * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
  31. * BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
  32. * LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
  33. * NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
  34. * SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
  35. *
  36. * Implementation of the NFSv4 state model. For the time being,
  37. * this is minimal, but will be made much more complex in a
  38. * subsequent patch.
  39. */
  40. #include <linux/kernel.h>
  41. #include <linux/slab.h>
  42. #include <linux/fs.h>
  43. #include <linux/nfs_fs.h>
  44. #include <linux/nfs_idmap.h>
  45. #include <linux/kthread.h>
  46. #include <linux/module.h>
  47. #include <linux/random.h>
  48. #include <linux/ratelimit.h>
  49. #include <linux/workqueue.h>
  50. #include <linux/bitops.h>
  51. #include <linux/jiffies.h>
  52. #include <linux/sunrpc/clnt.h>
  53. #include "nfs4_fs.h"
  54. #include "callback.h"
  55. #include "delegation.h"
  56. #include "internal.h"
  57. #include "nfs4session.h"
  58. #include "pnfs.h"
  59. #include "netns.h"
  60. #define NFSDBG_FACILITY NFSDBG_STATE /* presumably selects the debug facility for this file's debug output -- TODO confirm */
  61. #define OPENOWNER_POOL_SIZE 8 /* NOTE(review): not referenced in the visible part of this file -- confirm it is still used */
  62. const nfs4_stateid zero_stateid; /* file-scope object with no initializer, hence zero-initialized */
  63. static DEFINE_MUTEX(nfs_clid_init_mutex); /* NOTE(review): no user visible in this part of the file -- confirm */
  64. int nfs4_init_clientid(struct nfs_client *clp, struct rpc_cred *cred)
  65. {
  66. struct nfs4_setclientid_res clid = {
  67. .clientid = clp->cl_clientid,
  68. .confirm = clp->cl_confirm,
  69. };
  70. unsigned short port;
  71. int status;
  72. struct nfs_net *nn = net_generic(clp->cl_net, nfs_net_id);
  73. if (test_bit(NFS4CLNT_LEASE_CONFIRM, &clp->cl_state))
  74. goto do_confirm;
  75. port = nn->nfs_callback_tcpport;
  76. if (clp->cl_addr.ss_family == AF_INET6)
  77. port = nn->nfs_callback_tcpport6;
  78. status = nfs4_proc_setclientid(clp, NFS4_CALLBACK, port, cred, &clid);
  79. if (status != 0)
  80. goto out;
  81. clp->cl_clientid = clid.clientid;
  82. clp->cl_confirm = clid.confirm;
  83. set_bit(NFS4CLNT_LEASE_CONFIRM, &clp->cl_state);
  84. do_confirm:
  85. status = nfs4_proc_setclientid_confirm(clp, &clid, cred);
  86. if (status != 0)
  87. goto out;
  88. clear_bit(NFS4CLNT_LEASE_CONFIRM, &clp->cl_state);
  89. nfs4_schedule_state_renewal(clp);
  90. out:
  91. return status;
  92. }
  93. /**
  94. * nfs40_discover_server_trunking - Detect server IP address trunking (mv0)
  95. *
  96. * @clp: nfs_client under test
  97. * @result: OUT: found nfs_client, or clp
  98. * @cred: credential to use for trunking test
  99. *
  100. * Returns zero, a negative errno, or a negative NFS4ERR status.
  101. * If zero is returned, an nfs_client pointer is planted in
  102. * "result".
  103. *
  104. * Note: The returned client may not yet be marked ready.
  105. */
  106. int nfs40_discover_server_trunking(struct nfs_client *clp,
  107. struct nfs_client **result,
  108. struct rpc_cred *cred)
  109. {
  110. struct nfs4_setclientid_res clid = {
  111. .clientid = clp->cl_clientid,
  112. .confirm = clp->cl_confirm,
  113. };
  114. struct nfs_net *nn = net_generic(clp->cl_net, nfs_net_id);
  115. unsigned short port;
  116. int status;
  117. port = nn->nfs_callback_tcpport;
  118. if (clp->cl_addr.ss_family == AF_INET6)
  119. port = nn->nfs_callback_tcpport6;
  120. status = nfs4_proc_setclientid(clp, NFS4_CALLBACK, port, cred, &clid);
  121. if (status != 0)
  122. goto out;
  123. clp->cl_clientid = clid.clientid;
  124. clp->cl_confirm = clid.confirm;
  125. status = nfs40_walk_client_list(clp, result, cred);
  126. if (status == 0) {
  127. /* Sustain the lease, even if it's empty. If the clientid4
  128. * goes stale it's of no use for trunking discovery. */
  129. nfs4_schedule_state_renewal(*result);
  130. }
  131. out:
  132. return status;
  133. }
  134. struct rpc_cred *nfs4_get_machine_cred_locked(struct nfs_client *clp)
  135. {
  136. struct rpc_cred *cred = NULL;
  137. if (clp->cl_machine_cred != NULL)
  138. cred = get_rpccred(clp->cl_machine_cred);
  139. return cred;
  140. }
  141. static void nfs4_root_machine_cred(struct nfs_client *clp)
  142. {
  143. struct rpc_cred *cred, *new;
  144. new = rpc_lookup_machine_cred(NULL);
  145. spin_lock(&clp->cl_lock);
  146. cred = clp->cl_machine_cred;
  147. clp->cl_machine_cred = new;
  148. spin_unlock(&clp->cl_lock);
  149. if (cred != NULL)
  150. put_rpccred(cred);
  151. }
  152. static struct rpc_cred *
  153. nfs4_get_renew_cred_server_locked(struct nfs_server *server)
  154. {
  155. struct rpc_cred *cred = NULL;
  156. struct nfs4_state_owner *sp;
  157. struct rb_node *pos;
  158. for (pos = rb_first(&server->state_owners);
  159. pos != NULL;
  160. pos = rb_next(pos)) {
  161. sp = rb_entry(pos, struct nfs4_state_owner, so_server_node);
  162. if (list_empty(&sp->so_states))
  163. continue;
  164. cred = get_rpccred(sp->so_cred);
  165. break;
  166. }
  167. return cred;
  168. }
  169. /**
  170. * nfs4_get_renew_cred_locked - Acquire credential for a renew operation
  171. * @clp: client state handle
  172. *
  173. * Returns an rpc_cred with reference count bumped, or NULL.
  174. * Caller must hold clp->cl_lock.
  175. */
  176. struct rpc_cred *nfs4_get_renew_cred_locked(struct nfs_client *clp)
  177. {
  178. struct rpc_cred *cred = NULL;
  179. struct nfs_server *server;
  180. /* Use machine credentials if available */
  181. cred = nfs4_get_machine_cred_locked(clp);
  182. if (cred != NULL)
  183. goto out;
  184. rcu_read_lock();
  185. list_for_each_entry_rcu(server, &clp->cl_superblocks, client_link) {
  186. cred = nfs4_get_renew_cred_server_locked(server);
  187. if (cred != NULL)
  188. break;
  189. }
  190. rcu_read_unlock();
  191. out:
  192. return cred;
  193. }
  194. static void nfs4_end_drain_slot_table(struct nfs4_slot_table *tbl)
  195. {
  196. if (test_and_clear_bit(NFS4_SLOT_TBL_DRAINING, &tbl->slot_tbl_state)) {
  197. spin_lock(&tbl->slot_tbl_lock);
  198. nfs41_wake_slot_table(tbl);
  199. spin_unlock(&tbl->slot_tbl_lock);
  200. }
  201. }
  202. static void nfs4_end_drain_session(struct nfs_client *clp)
  203. {
  204. struct nfs4_session *ses = clp->cl_session;
  205. if (clp->cl_slot_tbl) {
  206. nfs4_end_drain_slot_table(clp->cl_slot_tbl);
  207. return;
  208. }
  209. if (ses != NULL) {
  210. nfs4_end_drain_slot_table(&ses->bc_slot_table);
  211. nfs4_end_drain_slot_table(&ses->fc_slot_table);
  212. }
  213. }
  214. #if defined(CONFIG_NFS_V4_1)
  215. static int nfs4_drain_slot_tbl(struct nfs4_slot_table *tbl)
  216. {
  217. set_bit(NFS4_SLOT_TBL_DRAINING, &tbl->slot_tbl_state);
  218. spin_lock(&tbl->slot_tbl_lock);
  219. if (tbl->highest_used_slotid != NFS4_NO_SLOT) {
  220. INIT_COMPLETION(tbl->complete);
  221. spin_unlock(&tbl->slot_tbl_lock);
  222. return wait_for_completion_interruptible(&tbl->complete);
  223. }
  224. spin_unlock(&tbl->slot_tbl_lock);
  225. return 0;
  226. }
  227. static int nfs4_begin_drain_session(struct nfs_client *clp)
  228. {
  229. struct nfs4_session *ses = clp->cl_session;
  230. int ret = 0;
  231. if (clp->cl_slot_tbl)
  232. return nfs4_drain_slot_tbl(clp->cl_slot_tbl);
  233. /* back channel */
  234. ret = nfs4_drain_slot_tbl(&ses->bc_slot_table);
  235. if (ret)
  236. return ret;
  237. /* fore channel */
  238. return nfs4_drain_slot_tbl(&ses->fc_slot_table);
  239. }
  240. static int nfs41_setup_state_renewal(struct nfs_client *clp)
  241. {
  242. int status;
  243. struct nfs_fsinfo fsinfo;
  244. if (!test_bit(NFS_CS_CHECK_LEASE_TIME, &clp->cl_res_state)) {
  245. nfs4_schedule_state_renewal(clp);
  246. return 0;
  247. }
  248. status = nfs4_proc_get_lease_time(clp, &fsinfo);
  249. if (status == 0) {
  250. /* Update lease time and schedule renewal */
  251. spin_lock(&clp->cl_lock);
  252. clp->cl_lease_time = fsinfo.lease_time * HZ;
  253. clp->cl_last_renewal = jiffies;
  254. spin_unlock(&clp->cl_lock);
  255. nfs4_schedule_state_renewal(clp);
  256. }
  257. return status;
  258. }
  259. static void nfs41_finish_session_reset(struct nfs_client *clp)
  260. {
  261. clear_bit(NFS4CLNT_LEASE_CONFIRM, &clp->cl_state);
  262. clear_bit(NFS4CLNT_SESSION_RESET, &clp->cl_state);
  263. /* create_session negotiated new slot table */
  264. clear_bit(NFS4CLNT_BIND_CONN_TO_SESSION, &clp->cl_state);
  265. nfs41_setup_state_renewal(clp);
  266. }
  267. int nfs41_init_clientid(struct nfs_client *clp, struct rpc_cred *cred)
  268. {
  269. int status;
  270. if (test_bit(NFS4CLNT_LEASE_CONFIRM, &clp->cl_state))
  271. goto do_confirm;
  272. nfs4_begin_drain_session(clp);
  273. status = nfs4_proc_exchange_id(clp, cred);
  274. if (status != 0)
  275. goto out;
  276. set_bit(NFS4CLNT_LEASE_CONFIRM, &clp->cl_state);
  277. do_confirm:
  278. status = nfs4_proc_create_session(clp, cred);
  279. if (status != 0)
  280. goto out;
  281. nfs41_finish_session_reset(clp);
  282. nfs_mark_client_ready(clp, NFS_CS_READY);
  283. out:
  284. return status;
  285. }
  286. /**
  287. * nfs41_discover_server_trunking - Detect server IP address trunking (mv1)
  288. *
  289. * @clp: nfs_client under test
  290. * @result: OUT: found nfs_client, or clp
  291. * @cred: credential to use for trunking test
  292. *
  293. * Returns NFS4_OK, a negative errno, or a negative NFS4ERR status.
  294. * If NFS4_OK is returned, an nfs_client pointer is planted in
  295. * "result".
  296. *
  297. * Note: The returned client may not yet be marked ready.
  298. */
  299. int nfs41_discover_server_trunking(struct nfs_client *clp,
  300. struct nfs_client **result,
  301. struct rpc_cred *cred)
  302. {
  303. int status;
  304. status = nfs4_proc_exchange_id(clp, cred);
  305. if (status != NFS4_OK)
  306. return status;
  307. set_bit(NFS4CLNT_LEASE_CONFIRM, &clp->cl_state);
  308. return nfs41_walk_client_list(clp, result, cred);
  309. }
  310. #endif /* CONFIG_NFS_V4_1 */
  311. /**
  312. * nfs4_get_clid_cred - Acquire credential for a setclientid operation
  313. * @clp: client state handle
  314. *
  315. * Returns an rpc_cred with reference count bumped, or NULL.
  316. */
  317. struct rpc_cred *nfs4_get_clid_cred(struct nfs_client *clp)
  318. {
  319. struct rpc_cred *cred;
  320. spin_lock(&clp->cl_lock);
  321. cred = nfs4_get_machine_cred_locked(clp);
  322. spin_unlock(&clp->cl_lock);
  323. return cred;
  324. }
  325. static struct nfs4_state_owner *
  326. nfs4_find_state_owner_locked(struct nfs_server *server, struct rpc_cred *cred)
  327. {
  328. struct rb_node **p = &server->state_owners.rb_node,
  329. *parent = NULL;
  330. struct nfs4_state_owner *sp;
  331. while (*p != NULL) {
  332. parent = *p;
  333. sp = rb_entry(parent, struct nfs4_state_owner, so_server_node);
  334. if (cred < sp->so_cred)
  335. p = &parent->rb_left;
  336. else if (cred > sp->so_cred)
  337. p = &parent->rb_right;
  338. else {
  339. if (!list_empty(&sp->so_lru))
  340. list_del_init(&sp->so_lru);
  341. atomic_inc(&sp->so_count);
  342. return sp;
  343. }
  344. }
  345. return NULL;
  346. }
  347. static struct nfs4_state_owner *
  348. nfs4_insert_state_owner_locked(struct nfs4_state_owner *new)
  349. {
  350. struct nfs_server *server = new->so_server;
  351. struct rb_node **p = &server->state_owners.rb_node,
  352. *parent = NULL;
  353. struct nfs4_state_owner *sp;
  354. int err;
  355. while (*p != NULL) {
  356. parent = *p;
  357. sp = rb_entry(parent, struct nfs4_state_owner, so_server_node);
  358. if (new->so_cred < sp->so_cred)
  359. p = &parent->rb_left;
  360. else if (new->so_cred > sp->so_cred)
  361. p = &parent->rb_right;
  362. else {
  363. if (!list_empty(&sp->so_lru))
  364. list_del_init(&sp->so_lru);
  365. atomic_inc(&sp->so_count);
  366. return sp;
  367. }
  368. }
  369. err = ida_get_new(&server->openowner_id, &new->so_seqid.owner_id);
  370. if (err)
  371. return ERR_PTR(err);
  372. rb_link_node(&new->so_server_node, parent, p);
  373. rb_insert_color(&new->so_server_node, &server->state_owners);
  374. return new;
  375. }
  376. static void
  377. nfs4_remove_state_owner_locked(struct nfs4_state_owner *sp)
  378. {
  379. struct nfs_server *server = sp->so_server;
  380. if (!RB_EMPTY_NODE(&sp->so_server_node))
  381. rb_erase(&sp->so_server_node, &server->state_owners);
  382. ida_remove(&server->openowner_id, sp->so_seqid.owner_id);
  383. }
  384. static void
  385. nfs4_init_seqid_counter(struct nfs_seqid_counter *sc)
  386. {
  387. sc->create_time = ktime_get();
  388. sc->flags = 0;
  389. sc->counter = 0;
  390. spin_lock_init(&sc->lock);
  391. INIT_LIST_HEAD(&sc->list);
  392. rpc_init_wait_queue(&sc->wait, "Seqid_waitqueue");
  393. }
  394. static void
  395. nfs4_destroy_seqid_counter(struct nfs_seqid_counter *sc)
  396. {
  397. rpc_destroy_wait_queue(&sc->wait);
  398. }
  399. /*
  400. * nfs4_alloc_state_owner(): this is called on the OPEN or CREATE path to
  401. * create a new state_owner.
  402. *
  403. */
  404. static struct nfs4_state_owner *
  405. nfs4_alloc_state_owner(struct nfs_server *server,
  406. struct rpc_cred *cred,
  407. gfp_t gfp_flags)
  408. {
  409. struct nfs4_state_owner *sp;
  410. sp = kzalloc(sizeof(*sp), gfp_flags);
  411. if (!sp)
  412. return NULL;
  413. sp->so_server = server;
  414. sp->so_cred = get_rpccred(cred);
  415. spin_lock_init(&sp->so_lock);
  416. INIT_LIST_HEAD(&sp->so_states);
  417. nfs4_init_seqid_counter(&sp->so_seqid);
  418. atomic_set(&sp->so_count, 1);
  419. INIT_LIST_HEAD(&sp->so_lru);
  420. seqcount_init(&sp->so_reclaim_seqcount);
  421. mutex_init(&sp->so_delegreturn_mutex);
  422. return sp;
  423. }
  424. static void
  425. nfs4_drop_state_owner(struct nfs4_state_owner *sp)
  426. {
  427. struct rb_node *rb_node = &sp->so_server_node;
  428. if (!RB_EMPTY_NODE(rb_node)) {
  429. struct nfs_server *server = sp->so_server;
  430. struct nfs_client *clp = server->nfs_client;
  431. spin_lock(&clp->cl_lock);
  432. if (!RB_EMPTY_NODE(rb_node)) {
  433. rb_erase(rb_node, &server->state_owners);
  434. RB_CLEAR_NODE(rb_node);
  435. }
  436. spin_unlock(&clp->cl_lock);
  437. }
  438. }
  439. static void nfs4_free_state_owner(struct nfs4_state_owner *sp)
  440. {
  441. nfs4_destroy_seqid_counter(&sp->so_seqid);
  442. put_rpccred(sp->so_cred);
  443. kfree(sp);
  444. }
  445. static void nfs4_gc_state_owners(struct nfs_server *server)
  446. {
  447. struct nfs_client *clp = server->nfs_client;
  448. struct nfs4_state_owner *sp, *tmp;
  449. unsigned long time_min, time_max;
  450. LIST_HEAD(doomed);
  451. spin_lock(&clp->cl_lock);
  452. time_max = jiffies;
  453. time_min = (long)time_max - (long)clp->cl_lease_time;
  454. list_for_each_entry_safe(sp, tmp, &server->state_owners_lru, so_lru) {
  455. /* NB: LRU is sorted so that oldest is at the head */
  456. if (time_in_range(sp->so_expires, time_min, time_max))
  457. break;
  458. list_move(&sp->so_lru, &doomed);
  459. nfs4_remove_state_owner_locked(sp);
  460. }
  461. spin_unlock(&clp->cl_lock);
  462. list_for_each_entry_safe(sp, tmp, &doomed, so_lru) {
  463. list_del(&sp->so_lru);
  464. nfs4_free_state_owner(sp);
  465. }
  466. }
  467. /**
  468. * nfs4_get_state_owner - Look up a state owner given a credential
  469. * @server: nfs_server to search
  470. * @cred: RPC credential to match
  471. *
  472. * Returns a pointer to an instantiated nfs4_state_owner struct, or NULL.
  473. */
  474. struct nfs4_state_owner *nfs4_get_state_owner(struct nfs_server *server,
  475. struct rpc_cred *cred,
  476. gfp_t gfp_flags)
  477. {
  478. struct nfs_client *clp = server->nfs_client;
  479. struct nfs4_state_owner *sp, *new;
  480. spin_lock(&clp->cl_lock);
  481. sp = nfs4_find_state_owner_locked(server, cred);
  482. spin_unlock(&clp->cl_lock);
  483. if (sp != NULL)
  484. goto out;
  485. new = nfs4_alloc_state_owner(server, cred, gfp_flags);
  486. if (new == NULL)
  487. goto out;
  488. do {
  489. if (ida_pre_get(&server->openowner_id, gfp_flags) == 0)
  490. break;
  491. spin_lock(&clp->cl_lock);
  492. sp = nfs4_insert_state_owner_locked(new);
  493. spin_unlock(&clp->cl_lock);
  494. } while (sp == ERR_PTR(-EAGAIN));
  495. if (sp != new)
  496. nfs4_free_state_owner(new);
  497. out:
  498. nfs4_gc_state_owners(server);
  499. return sp;
  500. }
  501. /**
  502. * nfs4_put_state_owner - Release a nfs4_state_owner
  503. * @sp: state owner data to release
  504. *
  505. * Note that we keep released state owners on an LRU
  506. * list.
  507. * This caches valid state owners so that they can be
  508. * reused, to avoid the OPEN_CONFIRM on minor version 0.
  509. * It also pins the uniquifier of dropped state owners for
  510. * a while, to ensure that those state owner names are
  511. * never reused.
  512. */
  513. void nfs4_put_state_owner(struct nfs4_state_owner *sp)
  514. {
  515. struct nfs_server *server = sp->so_server;
  516. struct nfs_client *clp = server->nfs_client;
  517. if (!atomic_dec_and_lock(&sp->so_count, &clp->cl_lock))
  518. return;
  519. sp->so_expires = jiffies;
  520. list_add_tail(&sp->so_lru, &server->state_owners_lru);
  521. spin_unlock(&clp->cl_lock);
  522. }
  523. /**
  524. * nfs4_purge_state_owners - Release all cached state owners
  525. * @server: nfs_server with cached state owners to release
  526. *
  527. * Called at umount time. Remaining state owners will be on
  528. * the LRU with ref count of zero.
  529. */
  530. void nfs4_purge_state_owners(struct nfs_server *server)
  531. {
  532. struct nfs_client *clp = server->nfs_client;
  533. struct nfs4_state_owner *sp, *tmp;
  534. LIST_HEAD(doomed);
  535. spin_lock(&clp->cl_lock);
  536. list_for_each_entry_safe(sp, tmp, &server->state_owners_lru, so_lru) {
  537. list_move(&sp->so_lru, &doomed);
  538. nfs4_remove_state_owner_locked(sp);
  539. }
  540. spin_unlock(&clp->cl_lock);
  541. list_for_each_entry_safe(sp, tmp, &doomed, so_lru) {
  542. list_del(&sp->so_lru);
  543. nfs4_free_state_owner(sp);
  544. }
  545. }
  546. static struct nfs4_state *
  547. nfs4_alloc_open_state(void)
  548. {
  549. struct nfs4_state *state;
  550. state = kzalloc(sizeof(*state), GFP_NOFS);
  551. if (!state)
  552. return NULL;
  553. atomic_set(&state->count, 1);
  554. INIT_LIST_HEAD(&state->lock_states);
  555. spin_lock_init(&state->state_lock);
  556. seqlock_init(&state->seqlock);
  557. return state;
  558. }
  559. void
  560. nfs4_state_set_mode_locked(struct nfs4_state *state, fmode_t fmode)
  561. {
  562. if (state->state == fmode)
  563. return;
  564. /* NB! List reordering - see the reclaim code for why. */
  565. if ((fmode & FMODE_WRITE) != (state->state & FMODE_WRITE)) {
  566. if (fmode & FMODE_WRITE)
  567. list_move(&state->open_states, &state->owner->so_states);
  568. else
  569. list_move_tail(&state->open_states, &state->owner->so_states);
  570. }
  571. state->state = fmode;
  572. }
  573. static struct nfs4_state *
  574. __nfs4_find_state_byowner(struct inode *inode, struct nfs4_state_owner *owner)
  575. {
  576. struct nfs_inode *nfsi = NFS_I(inode);
  577. struct nfs4_state *state;
  578. list_for_each_entry(state, &nfsi->open_states, inode_states) {
  579. if (state->owner != owner)
  580. continue;
  581. if (!nfs4_valid_open_stateid(state))
  582. continue;
  583. if (atomic_inc_not_zero(&state->count))
  584. return state;
  585. }
  586. return NULL;
  587. }
  /* Free the memory of an open state; nothing else is released here. */
  static void
  nfs4_free_open_state(struct nfs4_state *state)
  {
      kfree(state);
  }
  593. struct nfs4_state *
  594. nfs4_get_open_state(struct inode *inode, struct nfs4_state_owner *owner)
  595. {
  596. struct nfs4_state *state, *new;
  597. struct nfs_inode *nfsi = NFS_I(inode);
  598. spin_lock(&inode->i_lock);
  599. state = __nfs4_find_state_byowner(inode, owner);
  600. spin_unlock(&inode->i_lock);
  601. if (state)
  602. goto out;
  603. new = nfs4_alloc_open_state();
  604. spin_lock(&owner->so_lock);
  605. spin_lock(&inode->i_lock);
  606. state = __nfs4_find_state_byowner(inode, owner);
  607. if (state == NULL && new != NULL) {
  608. state = new;
  609. state->owner = owner;
  610. atomic_inc(&owner->so_count);
  611. list_add(&state->inode_states, &nfsi->open_states);
  612. ihold(inode);
  613. state->inode = inode;
  614. spin_unlock(&inode->i_lock);
  615. /* Note: The reclaim code dictates that we add stateless
  616. * and read-only stateids to the end of the list */
  617. list_add_tail(&state->open_states, &owner->so_states);
  618. spin_unlock(&owner->so_lock);
  619. } else {
  620. spin_unlock(&inode->i_lock);
  621. spin_unlock(&owner->so_lock);
  622. if (new)
  623. nfs4_free_open_state(new);
  624. }
  625. out:
  626. return state;
  627. }
  628. void nfs4_put_open_state(struct nfs4_state *state)
  629. {
  630. struct inode *inode = state->inode;
  631. struct nfs4_state_owner *owner = state->owner;
  632. if (!atomic_dec_and_lock(&state->count, &owner->so_lock))
  633. return;
  634. spin_lock(&inode->i_lock);
  635. list_del(&state->inode_states);
  636. list_del(&state->open_states);
  637. spin_unlock(&inode->i_lock);
  638. spin_unlock(&owner->so_lock);
  639. iput(inode);
  640. nfs4_free_open_state(state);
  641. nfs4_put_state_owner(owner);
  642. }
  643. /*
  644. * Close the current file.
  645. */
  646. static void __nfs4_close(struct nfs4_state *state,
  647. fmode_t fmode, gfp_t gfp_mask, int wait)
  648. {
  649. struct nfs4_state_owner *owner = state->owner;
  650. int call_close = 0;
  651. fmode_t newstate;
  652. atomic_inc(&owner->so_count);
  653. /* Protect against nfs4_find_state() */
  654. spin_lock(&owner->so_lock);
  655. switch (fmode & (FMODE_READ | FMODE_WRITE)) {
  656. case FMODE_READ:
  657. state->n_rdonly--;
  658. break;
  659. case FMODE_WRITE:
  660. state->n_wronly--;
  661. break;
  662. case FMODE_READ|FMODE_WRITE:
  663. state->n_rdwr--;
  664. }
  665. newstate = FMODE_READ|FMODE_WRITE;
  666. if (state->n_rdwr == 0) {
  667. if (state->n_rdonly == 0) {
  668. newstate &= ~FMODE_READ;
  669. call_close |= test_bit(NFS_O_RDONLY_STATE, &state->flags);
  670. call_close |= test_bit(NFS_O_RDWR_STATE, &state->flags);
  671. }
  672. if (state->n_wronly == 0) {
  673. newstate &= ~FMODE_WRITE;
  674. call_close |= test_bit(NFS_O_WRONLY_STATE, &state->flags);
  675. call_close |= test_bit(NFS_O_RDWR_STATE, &state->flags);
  676. }
  677. if (newstate == 0)
  678. clear_bit(NFS_DELEGATED_STATE, &state->flags);
  679. }
  680. nfs4_state_set_mode_locked(state, newstate);
  681. spin_unlock(&owner->so_lock);
  682. if (!call_close) {
  683. nfs4_put_open_state(state);
  684. nfs4_put_state_owner(owner);
  685. } else
  686. nfs4_do_close(state, gfp_mask, wait);
  687. }
  688. void nfs4_close_state(struct nfs4_state *state, fmode_t fmode)
  689. {
  690. __nfs4_close(state, fmode, GFP_NOFS, 0);
  691. }
  692. void nfs4_close_sync(struct nfs4_state *state, fmode_t fmode)
  693. {
  694. __nfs4_close(state, fmode, GFP_KERNEL, 1);
  695. }
  696. /*
  697. * Search the state->lock_states for an existing lock_owner
  698. * that is compatible with current->files
  699. */
  700. static struct nfs4_lock_state *
  701. __nfs4_find_lock_state(struct nfs4_state *state, fl_owner_t fl_owner, pid_t fl_pid, unsigned int type)
  702. {
  703. struct nfs4_lock_state *pos;
  704. list_for_each_entry(pos, &state->lock_states, ls_locks) {
  705. if (type != NFS4_ANY_LOCK_TYPE && pos->ls_owner.lo_type != type)
  706. continue;
  707. switch (pos->ls_owner.lo_type) {
  708. case NFS4_POSIX_LOCK_TYPE:
  709. if (pos->ls_owner.lo_u.posix_owner != fl_owner)
  710. continue;
  711. break;
  712. case NFS4_FLOCK_LOCK_TYPE:
  713. if (pos->ls_owner.lo_u.flock_owner != fl_pid)
  714. continue;
  715. }
  716. atomic_inc(&pos->ls_count);
  717. return pos;
  718. }
  719. return NULL;
  720. }
  721. /*
  722. * Return a compatible lock_state. If no initialized lock_state structure
  723. * exists, return an uninitialized one.
  724. *
  725. */
  726. static struct nfs4_lock_state *nfs4_alloc_lock_state(struct nfs4_state *state, fl_owner_t fl_owner, pid_t fl_pid, unsigned int type)
  727. {
  728. struct nfs4_lock_state *lsp;
  729. struct nfs_server *server = state->owner->so_server;
  730. lsp = kzalloc(sizeof(*lsp), GFP_NOFS);
  731. if (lsp == NULL)
  732. return NULL;
  733. nfs4_init_seqid_counter(&lsp->ls_seqid);
  734. atomic_set(&lsp->ls_count, 1);
  735. lsp->ls_state = state;
  736. lsp->ls_owner.lo_type = type;
  737. switch (lsp->ls_owner.lo_type) {
  738. case NFS4_FLOCK_LOCK_TYPE:
  739. lsp->ls_owner.lo_u.flock_owner = fl_pid;
  740. break;
  741. case NFS4_POSIX_LOCK_TYPE:
  742. lsp->ls_owner.lo_u.posix_owner = fl_owner;
  743. break;
  744. default:
  745. goto out_free;
  746. }
  747. lsp->ls_seqid.owner_id = ida_simple_get(&server->lockowner_id, 0, 0, GFP_NOFS);
  748. if (lsp->ls_seqid.owner_id < 0)
  749. goto out_free;
  750. INIT_LIST_HEAD(&lsp->ls_locks);
  751. return lsp;
  752. out_free:
  753. kfree(lsp);
  754. return NULL;
  755. }
  756. void nfs4_free_lock_state(struct nfs_server *server, struct nfs4_lock_state *lsp)
  757. {
  758. ida_simple_remove(&server->lockowner_id, lsp->ls_seqid.owner_id);
  759. nfs4_destroy_seqid_counter(&lsp->ls_seqid);
  760. kfree(lsp);
  761. }
  762. /*
  763. * Return a compatible lock_state. If no initialized lock_state structure
  764. * exists, return an uninitialized one.
  765. *
  766. */
  767. static struct nfs4_lock_state *nfs4_get_lock_state(struct nfs4_state *state, fl_owner_t owner, pid_t pid, unsigned int type)
  768. {
  769. struct nfs4_lock_state *lsp, *new = NULL;
  770. for(;;) {
  771. spin_lock(&state->state_lock);
  772. lsp = __nfs4_find_lock_state(state, owner, pid, type);
  773. if (lsp != NULL)
  774. break;
  775. if (new != NULL) {
  776. list_add(&new->ls_locks, &state->lock_states);
  777. set_bit(LK_STATE_IN_USE, &state->flags);
  778. lsp = new;
  779. new = NULL;
  780. break;
  781. }
  782. spin_unlock(&state->state_lock);
  783. new = nfs4_alloc_lock_state(state, owner, pid, type);
  784. if (new == NULL)
  785. return NULL;
  786. }
  787. spin_unlock(&state->state_lock);
  788. if (new != NULL)
  789. nfs4_free_lock_state(state->owner->so_server, new);
  790. return lsp;
  791. }
  792. /*
  793. * Release reference to lock_state, and free it if we see that
  794. * it is no longer in use
  795. */
  796. void nfs4_put_lock_state(struct nfs4_lock_state *lsp)
  797. {
  798. struct nfs_server *server;
  799. struct nfs4_state *state;
  800. if (lsp == NULL)
  801. return;
  802. state = lsp->ls_state;
  803. if (!atomic_dec_and_lock(&lsp->ls_count, &state->state_lock))
  804. return;
  805. list_del(&lsp->ls_locks);
  806. if (list_empty(&state->lock_states))
  807. clear_bit(LK_STATE_IN_USE, &state->flags);
  808. spin_unlock(&state->state_lock);
  809. server = state->owner->so_server;
  810. if (test_bit(NFS_LOCK_INITIALIZED, &lsp->ls_flags)) {
  811. struct nfs_client *clp = server->nfs_client;
  812. clp->cl_mvops->free_lock_state(server, lsp);
  813. } else
  814. nfs4_free_lock_state(server, lsp);
  815. }
  816. static void nfs4_fl_copy_lock(struct file_lock *dst, struct file_lock *src)
  817. {
  818. struct nfs4_lock_state *lsp = src->fl_u.nfs4_fl.owner;
  819. dst->fl_u.nfs4_fl.owner = lsp;
  820. atomic_inc(&lsp->ls_count);
  821. }
  822. static void nfs4_fl_release_lock(struct file_lock *fl)
  823. {
  824. nfs4_put_lock_state(fl->fl_u.nfs4_fl.owner);
  825. }
  826. static const struct file_lock_operations nfs4_fl_lock_ops = {
  827. .fl_copy_lock = nfs4_fl_copy_lock,
  828. .fl_release_private = nfs4_fl_release_lock,
  829. };
  830. int nfs4_set_lock_state(struct nfs4_state *state, struct file_lock *fl)
  831. {
  832. struct nfs4_lock_state *lsp;
  833. if (fl->fl_ops != NULL)
  834. return 0;
  835. if (fl->fl_flags & FL_POSIX)
  836. lsp = nfs4_get_lock_state(state, fl->fl_owner, 0, NFS4_POSIX_LOCK_TYPE);
  837. else if (fl->fl_flags & FL_FLOCK)
  838. lsp = nfs4_get_lock_state(state, NULL, fl->fl_pid,
  839. NFS4_FLOCK_LOCK_TYPE);
  840. else
  841. return -EINVAL;
  842. if (lsp == NULL)
  843. return -ENOMEM;
  844. fl->fl_u.nfs4_fl.owner = lsp;
  845. fl->fl_ops = &nfs4_fl_lock_ops;
  846. return 0;
  847. }
  848. static int nfs4_copy_lock_stateid(nfs4_stateid *dst,
  849. struct nfs4_state *state,
  850. const struct nfs_lockowner *lockowner)
  851. {
  852. struct nfs4_lock_state *lsp;
  853. fl_owner_t fl_owner;
  854. pid_t fl_pid;
  855. int ret = -ENOENT;
  856. if (lockowner == NULL)
  857. goto out;
  858. if (test_bit(LK_STATE_IN_USE, &state->flags) == 0)
  859. goto out;
  860. fl_owner = lockowner->l_owner;
  861. fl_pid = lockowner->l_pid;
  862. spin_lock(&state->state_lock);
  863. lsp = __nfs4_find_lock_state(state, fl_owner, fl_pid, NFS4_ANY_LOCK_TYPE);
  864. if (lsp && test_bit(NFS_LOCK_LOST, &lsp->ls_flags))
  865. ret = -EIO;
  866. else if (lsp != NULL && test_bit(NFS_LOCK_INITIALIZED, &lsp->ls_flags) != 0) {
  867. nfs4_stateid_copy(dst, &lsp->ls_stateid);
  868. ret = 0;
  869. smp_rmb();
  870. if (!list_empty(&lsp->ls_seqid.list))
  871. ret = -EWOULDBLOCK;
  872. }
  873. spin_unlock(&state->state_lock);
  874. nfs4_put_lock_state(lsp);
  875. out:
  876. return ret;
  877. }
  878. static int nfs4_copy_open_stateid(nfs4_stateid *dst, struct nfs4_state *state)
  879. {
  880. const nfs4_stateid *src;
  881. int ret;
  882. int seq;
  883. do {
  884. src = &zero_stateid;
  885. seq = read_seqbegin(&state->seqlock);
  886. if (test_bit(NFS_OPEN_STATE, &state->flags))
  887. src = &state->open_stateid;
  888. nfs4_stateid_copy(dst, src);
  889. ret = 0;
  890. smp_rmb();
  891. if (!list_empty(&state->owner->so_seqid.list))
  892. ret = -EWOULDBLOCK;
  893. } while (read_seqretry(&state->seqlock, seq));
  894. return ret;
  895. }
  896. /*
  897. * Byte-range lock aware utility to initialize the stateid of read/write
  898. * requests.
  899. */
  900. int nfs4_select_rw_stateid(nfs4_stateid *dst, struct nfs4_state *state,
  901. fmode_t fmode, const struct nfs_lockowner *lockowner)
  902. {
  903. int ret = nfs4_copy_lock_stateid(dst, state, lockowner);
  904. if (ret == -EIO)
  905. /* A lost lock - don't even consider delegations */
  906. goto out;
  907. if (nfs4_copy_delegation_stateid(dst, state->inode, fmode))
  908. goto out;
  909. if (ret != -ENOENT)
  910. /* nfs4_copy_delegation_stateid() didn't over-write
  911. * dst, so it still has the lock stateid which we now
  912. * choose to use.
  913. */
  914. goto out;
  915. ret = nfs4_copy_open_stateid(dst, state);
  916. out:
  917. if (nfs_server_capable(state->inode, NFS_CAP_STATEID_NFSV41))
  918. dst->seqid = 0;
  919. return ret;
  920. }
  921. struct nfs_seqid *nfs_alloc_seqid(struct nfs_seqid_counter *counter, gfp_t gfp_mask)
  922. {
  923. struct nfs_seqid *new;
  924. new = kmalloc(sizeof(*new), gfp_mask);
  925. if (new != NULL) {
  926. new->sequence = counter;
  927. INIT_LIST_HEAD(&new->list);
  928. new->task = NULL;
  929. }
  930. return new;
  931. }
  932. void nfs_release_seqid(struct nfs_seqid *seqid)
  933. {
  934. struct nfs_seqid_counter *sequence;
  935. if (list_empty(&seqid->list))
  936. return;
  937. sequence = seqid->sequence;
  938. spin_lock(&sequence->lock);
  939. list_del_init(&seqid->list);
  940. if (!list_empty(&sequence->list)) {
  941. struct nfs_seqid *next;
  942. next = list_first_entry(&sequence->list,
  943. struct nfs_seqid, list);
  944. rpc_wake_up_queued_task(&sequence->wait, next->task);
  945. }
  946. spin_unlock(&sequence->lock);
  947. }
  /*
   * Dequeue @seqid (waking the next waiter, if any) and free it.
   */
  void nfs_free_seqid(struct nfs_seqid *seqid)
  {
  	nfs_release_seqid(seqid);
  	kfree(seqid);
  }
  953. /*
  954. * Increment the seqid if the OPEN/OPEN_DOWNGRADE/CLOSE succeeded, or
  955. * failed with a seqid incrementing error -
  956. * see comments nfs_fs.h:seqid_mutating_error()
  957. */
  958. static void nfs_increment_seqid(int status, struct nfs_seqid *seqid)
  959. {
  960. switch (status) {
  961. case 0:
  962. break;
  963. case -NFS4ERR_BAD_SEQID:
  964. if (seqid->sequence->flags & NFS_SEQID_CONFIRMED)
  965. return;
  966. pr_warn_ratelimited("NFS: v4 server returned a bad"
  967. " sequence-id error on an"
  968. " unconfirmed sequence %p!\n",
  969. seqid->sequence);
  970. case -NFS4ERR_STALE_CLIENTID:
  971. case -NFS4ERR_STALE_STATEID:
  972. case -NFS4ERR_BAD_STATEID:
  973. case -NFS4ERR_BADXDR:
  974. case -NFS4ERR_RESOURCE:
  975. case -NFS4ERR_NOFILEHANDLE:
  976. /* Non-seqid mutating errors */
  977. return;
  978. };
  979. /*
  980. * Note: no locking needed as we are guaranteed to be first
  981. * on the sequence list
  982. */
  983. seqid->sequence->counter++;
  984. }
  985. void nfs_increment_open_seqid(int status, struct nfs_seqid *seqid)
  986. {
  987. struct nfs4_state_owner *sp = container_of(seqid->sequence,
  988. struct nfs4_state_owner, so_seqid);
  989. struct nfs_server *server = sp->so_server;
  990. if (status == -NFS4ERR_BAD_SEQID)
  991. nfs4_drop_state_owner(sp);
  992. if (!nfs4_has_session(server->nfs_client))
  993. nfs_increment_seqid(status, seqid);
  994. }
  /*
   * Bump the lock-owner seqid if the LOCK/LOCKU succeeded, or failed
   * with an error that still advances the seqid - see the comments at
   * nfs_fs.h:seqid_mutating_error().
   */
  void nfs_increment_lock_seqid(int status, struct nfs_seqid *seqid)
  {
  	/* Lock owners need no extra handling beyond the common path */
  	nfs_increment_seqid(status, seqid);
  }
  1004. int nfs_wait_on_sequence(struct nfs_seqid *seqid, struct rpc_task *task)
  1005. {
  1006. struct nfs_seqid_counter *sequence = seqid->sequence;
  1007. int status = 0;
  1008. spin_lock(&sequence->lock);
  1009. seqid->task = task;
  1010. if (list_empty(&seqid->list))
  1011. list_add_tail(&seqid->list, &sequence->list);
  1012. if (list_first_entry(&sequence->list, struct nfs_seqid, list) == seqid)
  1013. goto unlock;
  1014. rpc_sleep_on(&sequence->wait, task, NULL);
  1015. status = -EAGAIN;
  1016. unlock:
  1017. spin_unlock(&sequence->lock);
  1018. return status;
  1019. }
  /* Thread function handed to kthread_run() by nfs4_schedule_state_manager() */
  static int nfs4_run_state_manager(void *ptr);
  1021. static void nfs4_clear_state_manager_bit(struct nfs_client *clp)
  1022. {
  1023. smp_mb__before_clear_bit();
  1024. clear_bit(NFS4CLNT_MANAGER_RUNNING, &clp->cl_state);
  1025. smp_mb__after_clear_bit();
  1026. wake_up_bit(&clp->cl_state, NFS4CLNT_MANAGER_RUNNING);
  1027. rpc_wake_up(&clp->cl_rpcwaitq);
  1028. }
  1029. /*
  1030. * Schedule the nfs_client asynchronous state management routine
  1031. */
  1032. void nfs4_schedule_state_manager(struct nfs_client *clp)
  1033. {
  1034. struct task_struct *task;
  1035. char buf[INET6_ADDRSTRLEN + sizeof("-manager") + 1];
  1036. if (test_and_set_bit(NFS4CLNT_MANAGER_RUNNING, &clp->cl_state) != 0)
  1037. return;
  1038. __module_get(THIS_MODULE);
  1039. atomic_inc(&clp->cl_count);
  1040. /* The rcu_read_lock() is not strictly necessary, as the state
  1041. * manager is the only thread that ever changes the rpc_xprt
  1042. * after it's initialized. At this point, we're single threaded. */
  1043. rcu_read_lock();
  1044. snprintf(buf, sizeof(buf), "%s-manager",
  1045. rpc_peeraddr2str(clp->cl_rpcclient, RPC_DISPLAY_ADDR));
  1046. rcu_read_unlock();
  1047. task = kthread_run(nfs4_run_state_manager, clp, "%s", buf);
  1048. if (IS_ERR(task)) {
  1049. printk(KERN_ERR "%s: kthread_run: %ld\n",
  1050. __func__, PTR_ERR(task));
  1051. nfs4_clear_state_manager_bit(clp);
  1052. nfs_put_client(clp);
  1053. module_put(THIS_MODULE);
  1054. }
  1055. }
  1056. /*
  1057. * Schedule a lease recovery attempt
  1058. */
  1059. void nfs4_schedule_lease_recovery(struct nfs_client *clp)
  1060. {
  1061. if (!clp)
  1062. return;
  1063. if (!test_bit(NFS4CLNT_LEASE_EXPIRED, &clp->cl_state))
  1064. set_bit(NFS4CLNT_CHECK_LEASE, &clp->cl_state);
  1065. dprintk("%s: scheduling lease recovery for server %s\n", __func__,
  1066. clp->cl_hostname);
  1067. nfs4_schedule_state_manager(clp);
  1068. }
  1069. EXPORT_SYMBOL_GPL(nfs4_schedule_lease_recovery);
  1070. int nfs4_wait_clnt_recover(struct nfs_client *clp)
  1071. {
  1072. int res;
  1073. might_sleep();
  1074. res = wait_on_bit(&clp->cl_state, NFS4CLNT_MANAGER_RUNNING,
  1075. nfs_wait_bit_killable, TASK_KILLABLE);
  1076. if (res)
  1077. return res;
  1078. if (clp->cl_cons_state < 0)
  1079. return clp->cl_cons_state;
  1080. return 0;
  1081. }
  1082. int nfs4_client_recover_expired_lease(struct nfs_client *clp)
  1083. {
  1084. unsigned int loop;
  1085. int ret;
  1086. for (loop = NFS4_MAX_LOOP_ON_RECOVER; loop != 0; loop--) {
  1087. ret = nfs4_wait_clnt_recover(clp);
  1088. if (ret != 0)
  1089. break;
  1090. if (!test_bit(NFS4CLNT_LEASE_EXPIRED, &clp->cl_state) &&
  1091. !test_bit(NFS4CLNT_CHECK_LEASE,&clp->cl_state))
  1092. break;
  1093. nfs4_schedule_state_manager(clp);
  1094. ret = -EIO;
  1095. }
  1096. return ret;
  1097. }
  1098. /*
  1099. * nfs40_handle_cb_pathdown - return all delegations after NFS4ERR_CB_PATH_DOWN
  1100. * @clp: client to process
  1101. *
  1102. * Set the NFS4CLNT_LEASE_EXPIRED state in order to force a
  1103. * resend of the SETCLIENTID and hence re-establish the
  1104. * callback channel. Then return all existing delegations.
  1105. */
  1106. static void nfs40_handle_cb_pathdown(struct nfs_client *clp)
  1107. {
  1108. set_bit(NFS4CLNT_LEASE_EXPIRED, &clp->cl_state);
  1109. nfs_expire_all_delegations(clp);
  1110. dprintk("%s: handling CB_PATHDOWN recovery for server %s\n", __func__,
  1111. clp->cl_hostname);
  1112. }
  /*
   * Run the callback-path-down handling for @clp and kick the state
   * manager.
   */
  void nfs4_schedule_path_down_recovery(struct nfs_client *clp)
  {
  	nfs40_handle_cb_pathdown(clp);
  	nfs4_schedule_state_manager(clp);
  }
  1118. static int nfs4_state_mark_reclaim_reboot(struct nfs_client *clp, struct nfs4_state *state)
  1119. {
  1120. set_bit(NFS_STATE_RECLAIM_REBOOT, &state->flags);
  1121. /* Don't recover state that expired before the reboot */
  1122. if (test_bit(NFS_STATE_RECLAIM_NOGRACE, &state->flags)) {
  1123. clear_bit(NFS_STATE_RECLAIM_REBOOT, &state->flags);
  1124. return 0;
  1125. }
  1126. set_bit(NFS_OWNER_RECLAIM_REBOOT, &state->owner->so_flags);
  1127. set_bit(NFS4CLNT_RECLAIM_REBOOT, &clp->cl_state);
  1128. return 1;
  1129. }
  1130. static int nfs4_state_mark_reclaim_nograce(struct nfs_client *clp, struct nfs4_state *state)
  1131. {
  1132. set_bit(NFS_STATE_RECLAIM_NOGRACE, &state->flags);
  1133. clear_bit(NFS_STATE_RECLAIM_REBOOT, &state->flags);
  1134. set_bit(NFS_OWNER_RECLAIM_NOGRACE, &state->owner->so_flags);
  1135. set_bit(NFS4CLNT_RECLAIM_NOGRACE, &clp->cl_state);
  1136. return 1;
  1137. }
  1138. int nfs4_schedule_stateid_recovery(const struct nfs_server *server, struct nfs4_state *state)
  1139. {
  1140. struct nfs_client *clp = server->nfs_client;
  1141. if (!nfs4_valid_open_stateid(state))
  1142. return -EBADF;
  1143. nfs4_state_mark_reclaim_nograce(clp, state);
  1144. dprintk("%s: scheduling stateid recovery for server %s\n", __func__,
  1145. clp->cl_hostname);
  1146. nfs4_schedule_state_manager(clp);
  1147. return 0;
  1148. }
  1149. EXPORT_SYMBOL_GPL(nfs4_schedule_stateid_recovery);
  1150. void nfs_inode_find_state_and_recover(struct inode *inode,
  1151. const nfs4_stateid *stateid)
  1152. {
  1153. struct nfs_client *clp = NFS_SERVER(inode)->nfs_client;
  1154. struct nfs_inode *nfsi = NFS_I(inode);
  1155. struct nfs_open_context *ctx;
  1156. struct nfs4_state *state;
  1157. bool found = false;
  1158. spin_lock(&inode->i_lock);
  1159. list_for_each_entry(ctx, &nfsi->open_files, list) {
  1160. state = ctx->state;
  1161. if (state == NULL)
  1162. continue;
  1163. if (!test_bit(NFS_DELEGATED_STATE, &state->flags))
  1164. continue;
  1165. if (!nfs4_stateid_match(&state->stateid, stateid))
  1166. continue;
  1167. nfs4_state_mark_reclaim_nograce(clp, state);
  1168. found = true;
  1169. }
  1170. spin_unlock(&inode->i_lock);
  1171. if (found)
  1172. nfs4_schedule_state_manager(clp);
  1173. }
  1174. static void nfs4_state_mark_open_context_bad(struct nfs4_state *state)
  1175. {
  1176. struct inode *inode = state->inode;
  1177. struct nfs_inode *nfsi = NFS_I(inode);
  1178. struct nfs_open_context *ctx;
  1179. spin_lock(&inode->i_lock);
  1180. list_for_each_entry(ctx, &nfsi->open_files, list) {
  1181. if (ctx->state != state)
  1182. continue;
  1183. set_bit(NFS_CONTEXT_BAD, &ctx->flags);
  1184. }
  1185. spin_unlock(&inode->i_lock);
  1186. }
  1187. static void nfs4_state_mark_recovery_failed(struct nfs4_state *state, int error)
  1188. {
  1189. set_bit(NFS_STATE_RECOVERY_FAILED, &state->flags);
  1190. nfs4_state_mark_open_context_bad(state);
  1191. }
  1192. static int nfs4_reclaim_locks(struct nfs4_state *state, const struct nfs4_state_recovery_ops *ops)
  1193. {
  1194. struct inode *inode = state->inode;
  1195. struct nfs_inode *nfsi = NFS_I(inode);
  1196. struct file_lock *fl;
  1197. int status = 0;
  1198. if (inode->i_flock == NULL)
  1199. return 0;
  1200. /* Guard against delegation returns and new lock/unlock calls */
  1201. down_write(&nfsi->rwsem);
  1202. /* Protect inode->i_flock using the BKL */
  1203. spin_lock(&inode->i_lock);
  1204. for (fl = inode->i_flock; fl != NULL; fl = fl->fl_next) {
  1205. if (!(fl->fl_flags & (FL_POSIX|FL_FLOCK)))
  1206. continue;
  1207. if (nfs_file_open_context(fl->fl_file)->state != state)
  1208. continue;
  1209. spin_unlock(&inode->i_lock);
  1210. status = ops->recover_lock(state, fl);
  1211. switch (status) {
  1212. case 0:
  1213. break;
  1214. case -ESTALE:
  1215. case -NFS4ERR_ADMIN_REVOKED:
  1216. case -NFS4ERR_STALE_STATEID:
  1217. case -NFS4ERR_BAD_STATEID:
  1218. case -NFS4ERR_EXPIRED:
  1219. case -NFS4ERR_NO_GRACE:
  1220. case -NFS4ERR_STALE_CLIENTID:
  1221. case -NFS4ERR_BADSESSION:
  1222. case -NFS4ERR_BADSLOT:
  1223. case -NFS4ERR_BAD_HIGH_SLOT:
  1224. case -NFS4ERR_CONN_NOT_BOUND_TO_SESSION:
  1225. goto out;
  1226. default:
  1227. printk(KERN_ERR "NFS: %s: unhandled error %d. "
  1228. "Zeroing state\n", __func__, status);
  1229. case -ENOMEM:
  1230. case -NFS4ERR_DENIED:
  1231. case -NFS4ERR_RECLAIM_BAD:
  1232. case -NFS4ERR_RECLAIM_CONFLICT:
  1233. /* kill_proc(fl->fl_pid, SIGLOST, 1); */
  1234. status = 0;
  1235. }
  1236. spin_lock(&inode->i_lock);
  1237. }
  1238. spin_unlock(&inode->i_lock);
  1239. out:
  1240. up_write(&nfsi->rwsem);
  1241. return status;
  1242. }
  1243. static int nfs4_reclaim_open_state(struct nfs4_state_owner *sp, const struct nfs4_state_recovery_ops *ops)
  1244. {
  1245. struct nfs4_state *state;
  1246. struct nfs4_lock_state *lock;
  1247. int status = 0;
  1248. /* Note: we rely on the sp->so_states list being ordered
  1249. * so that we always reclaim open(O_RDWR) and/or open(O_WRITE)
  1250. * states first.
  1251. * This is needed to ensure that the server won't give us any
  1252. * read delegations that we have to return if, say, we are
  1253. * recovering after a network partition or a reboot from a
  1254. * server that doesn't support a grace period.
  1255. */
  1256. spin_lock(&sp->so_lock);
  1257. write_seqcount_begin(&sp->so_reclaim_seqcount);
  1258. restart:
  1259. list_for_each_entry(state, &sp->so_states, open_states) {
  1260. if (!test_and_clear_bit(ops->state_flag_bit, &state->flags))
  1261. continue;
  1262. if (!nfs4_valid_open_stateid(state))
  1263. continue;
  1264. if (state->state == 0)
  1265. continue;
  1266. atomic_inc(&state->count);
  1267. spin_unlock(&sp->so_lock);
  1268. status = ops->recover_open(sp, state);
  1269. if (status >= 0) {
  1270. status = nfs4_reclaim_locks(state, ops);
  1271. if (status >= 0) {
  1272. if (test_bit(NFS_DELEGATED_STATE, &state->flags) != 0) {
  1273. spin_lock(&state->state_lock);
  1274. list_for_each_entry(lock, &state->lock_states, ls_locks) {
  1275. if (!test_bit(NFS_LOCK_INITIALIZED, &lock->ls_flags))
  1276. pr_warn_ratelimited("NFS: "
  1277. "%s: Lock reclaim "
  1278. "failed!\n", __func__);
  1279. }
  1280. spin_unlock(&state->state_lock);
  1281. }
  1282. nfs4_put_open_state(state);
  1283. spin_lock(&sp->so_lock);
  1284. goto restart;
  1285. }
  1286. }
  1287. switch (status) {
  1288. default:
  1289. printk(KERN_ERR "NFS: %s: unhandled error %d. "
  1290. "Zeroing state\n", __func__, status);
  1291. case -ENOENT:
  1292. case -ENOMEM:
  1293. case -ESTALE:
  1294. /*
  1295. * Open state on this file cannot be recovered
  1296. * All we can do is revert to using the zero stateid.
  1297. */
  1298. nfs4_state_mark_recovery_failed(state, status);
  1299. break;
  1300. case -EAGAIN:
  1301. ssleep(1);
  1302. case -NFS4ERR_ADMIN_REVOKED:
  1303. case -NFS4ERR_STALE_STATEID:
  1304. case -NFS4ERR_BAD_STATEID:
  1305. case -NFS4ERR_RECLAIM_BAD:
  1306. case -NFS4ERR_RECLAIM_CONFLICT:
  1307. nfs4_state_mark_reclaim_nograce(sp->so_server->nfs_client, state);
  1308. break;
  1309. case -NFS4ERR_EXPIRED:
  1310. case -NFS4ERR_NO_GRACE:
  1311. nfs4_state_mark_reclaim_nograce(sp->so_server->nfs_client, state);
  1312. case -NFS4ERR_STALE_CLIENTID:
  1313. case -NFS4ERR_BADSESSION:
  1314. case -NFS4ERR_BADSLOT:
  1315. case -NFS4ERR_BAD_HIGH_SLOT:
  1316. case -NFS4ERR_CONN_NOT_BOUND_TO_SESSION:
  1317. goto out_err;
  1318. }
  1319. nfs4_put_open_state(state);
  1320. spin_lock(&sp->so_lock);
  1321. goto restart;
  1322. }
  1323. write_seqcount_end(&sp->so_reclaim_seqcount);
  1324. spin_unlock(&sp->so_lock);
  1325. return 0;
  1326. out_err:
  1327. nfs4_put_open_state(state);
  1328. spin_lock(&sp->so_lock);
  1329. write_seqcount_end(&sp->so_reclaim_seqcount);
  1330. spin_unlock(&sp->so_lock);
  1331. return status;
  1332. }
  1333. static void nfs4_clear_open_state(struct nfs4_state *state)
  1334. {
  1335. struct nfs4_lock_state *lock;
  1336. clear_bit(NFS_DELEGATED_STATE, &state->flags);
  1337. clear_bit(NFS_O_RDONLY_STATE, &state->flags);
  1338. clear_bit(NFS_O_WRONLY_STATE, &state->flags);
  1339. clear_bit(NFS_O_RDWR_STATE, &state->flags);
  1340. spin_lock(&state->state_lock);
  1341. list_for_each_entry(lock, &state->lock_states, ls_locks) {
  1342. lock->ls_seqid.flags = 0;
  1343. clear_bit(NFS_LOCK_INITIALIZED, &lock->ls_flags);
  1344. }
  1345. spin_unlock(&state->state_lock);
  1346. }
  1347. static void nfs4_reset_seqids(struct nfs_server *server,
  1348. int (*mark_reclaim)(struct nfs_client *clp, struct nfs4_state *state))
  1349. {
  1350. struct nfs_client *clp = server->nfs_client;
  1351. struct nfs4_state_owner *sp;
  1352. struct rb_node *pos;
  1353. struct nfs4_state *state;
  1354. spin_lock(&clp->cl_lock);
  1355. for (pos = rb_first(&server->state_owners);
  1356. pos != NULL;
  1357. pos = rb_next(pos)) {
  1358. sp = rb_entry(pos, struct nfs4_state_owner, so_server_node);
  1359. sp->so_seqid.flags = 0;
  1360. spin_lock(&sp->so_lock);
  1361. list_for_each_entry(state, &sp->so_states, open_states) {
  1362. if (mark_reclaim(clp, state))
  1363. nfs4_clear_open_state(state);
  1364. }
  1365. spin_unlock(&sp->so_lock);
  1366. }
  1367. spin_unlock(&clp->cl_lock);
  1368. }
  1369. static void nfs4_state_mark_reclaim_helper(struct nfs_client *clp,
  1370. int (*mark_reclaim)(struct nfs_client *clp, struct nfs4_state *state))
  1371. {
  1372. struct nfs_server *server;
  1373. rcu_read_lock();
  1374. list_for_each_entry_rcu(server, &clp->cl_superblocks, client_link)
  1375. nfs4_reset_seqids(server, mark_reclaim);
  1376. rcu_read_unlock();
  1377. }
  1378. static void nfs4_state_start_reclaim_reboot(struct nfs_client *clp)
  1379. {
  1380. /* Mark all delegations for reclaim */
  1381. nfs_delegation_mark_reclaim(clp);
  1382. nfs4_state_mark_reclaim_helper(clp, nfs4_state_mark_reclaim_reboot);
  1383. }
  1384. static void nfs4_reclaim_complete(struct nfs_client *clp,
  1385. const struct nfs4_state_recovery_ops *ops,
  1386. struct rpc_cred *cred)
  1387. {
  1388. /* Notify the server we're done reclaiming our state */
  1389. if (ops->reclaim_complete)
  1390. (void)ops->reclaim_complete(clp, cred);
  1391. }
  1392. static void nfs4_clear_reclaim_server(struct nfs_server *server)
  1393. {
  1394. struct nfs_client *clp = server->nfs_client;
  1395. struct nfs4_state_owner *sp;
  1396. struct rb_node *pos;
  1397. struct nfs4_state *state;
  1398. spin_lock(&clp->cl_lock);
  1399. for (pos = rb_first(&server->state_owners);
  1400. pos != NULL;
  1401. pos = rb_next(pos)) {
  1402. sp = rb_entry(pos, struct nfs4_state_owner, so_server_node);
  1403. spin_lock(&sp->so_lock);
  1404. list_for_each_entry(state, &sp->so_states, open_states) {
  1405. if (!test_and_clear_bit(NFS_STATE_RECLAIM_REBOOT,
  1406. &state->flags))
  1407. continue;
  1408. nfs4_state_mark_reclaim_nograce(clp, state);
  1409. }
  1410. spin_unlock(&sp->so_lock);
  1411. }
  1412. spin_unlock(&clp->cl_lock);
  1413. }
  1414. static int nfs4_state_clear_reclaim_reboot(struct nfs_client *clp)
  1415. {
  1416. struct nfs_server *server;
  1417. if (!test_and_clear_bit(NFS4CLNT_RECLAIM_REBOOT, &clp->cl_state))
  1418. return 0;
  1419. rcu_read_lock();
  1420. list_for_each_entry_rcu(server, &clp->cl_superblocks, client_link)
  1421. nfs4_clear_reclaim_server(server);
  1422. rcu_read_unlock();
  1423. nfs_delegation_reap_unclaimed(clp);
  1424. return 1;
  1425. }
  1426. static void nfs4_state_end_reclaim_reboot(struct nfs_client *clp)
  1427. {
  1428. const struct nfs4_state_recovery_ops *ops;
  1429. struct rpc_cred *cred;
  1430. if (!nfs4_state_clear_reclaim_reboot(clp))
  1431. return;
  1432. ops = clp->cl_mvops->reboot_recovery_ops;
  1433. cred = nfs4_get_clid_cred(clp);
  1434. nfs4_reclaim_complete(clp, ops, cred);
  1435. put_rpccred(cred);
  1436. }
  /*
   * Mark every delegation of @clp for reclaim, then immediately reap the
   * unclaimed ones.
   */
  static void nfs_delegation_clear_all(struct nfs_client *clp)
  {
  	nfs_delegation_mark_reclaim(clp);
  	nfs_delegation_reap_unclaimed(clp);
  }
  1442. static void nfs4_state_start_reclaim_nograce(struct nfs_client *clp)
  1443. {
  1444. nfs_delegation_clear_all(clp);
  1445. nfs4_state_mark_reclaim_helper(clp, nfs4_state_mark_reclaim_nograce);
  1446. }
  1447. static int nfs4_recovery_handle_error(struct nfs_client *clp, int error)
  1448. {
  1449. switch (error) {
  1450. case 0:
  1451. break;
  1452. case -NFS4ERR_CB_PATH_DOWN:
  1453. nfs40_handle_cb_pathdown(clp);
  1454. break;
  1455. case -NFS4ERR_NO_GRACE:
  1456. nfs4_state_end_reclaim_reboot(clp);
  1457. break;
  1458. case -NFS4ERR_STALE_CLIENTID:
  1459. case -NFS4ERR_LEASE_MOVED:
  1460. set_bit(NFS4CLNT_LEASE_EXPIRED, &clp->cl_state);
  1461. nfs4_state_clear_reclaim_reboot(clp);
  1462. nfs4_state_start_reclaim_reboot(clp);
  1463. break;
  1464. case -NFS4ERR_EXPIRED:
  1465. set_bit(NFS4CLNT_LEASE_EXPIRED, &clp->cl_state);
  1466. nfs4_state_start_reclaim_nograce(clp);
  1467. break;
  1468. case -NFS4ERR_BADSESSION:
  1469. case -NFS4ERR_BADSLOT:
  1470. case -NFS4ERR_BAD_HIGH_SLOT:
  1471. case -NFS4ERR_DEADSESSION:
  1472. case -NFS4ERR_SEQ_FALSE_RETRY:
  1473. case -NFS4ERR_SEQ_MISORDERED:
  1474. set_bit(NFS4CLNT_SESSION_RESET, &clp->cl_state);
  1475. /* Zero session reset errors */
  1476. break;
  1477. case -NFS4ERR_CONN_NOT_BOUND_TO_SESSION:
  1478. set_bit(NFS4CLNT_BIND_CONN_TO_SESSION, &clp->cl_state);
  1479. break;
  1480. default:
  1481. dprintk("%s: failed to handle error %d for server %s\n",
  1482. __func__, error, clp->cl_hostname);
  1483. return error;
  1484. }
  1485. dprintk("%s: handled error %d for server %s\n", __func__, error,
  1486. clp->cl_hostname);
  1487. return 0;
  1488. }
  1489. static int nfs4_do_reclaim(struct nfs_client *clp, const struct nfs4_state_recovery_ops *ops)
  1490. {
  1491. struct nfs4_state_owner *sp;
  1492. struct nfs_server *server;
  1493. struct rb_node *pos;
  1494. int status = 0;
  1495. restart:
  1496. rcu_read_lock();
  1497. list_for_each_entry_rcu(server, &clp->cl_superblocks, client_link) {
  1498. nfs4_purge_state_owners(server);
  1499. spin_lock(&clp->cl_lock);
  1500. for (pos = rb_first(&server->state_owners);
  1501. pos != NULL;
  1502. pos = rb_next(pos)) {
  1503. sp = rb_entry(pos,
  1504. struct nfs4_state_owner, so_server_node);
  1505. if (!test_and_clear_bit(ops->owner_flag_bit,
  1506. &sp->so_flags))
  1507. continue;
  1508. atomic_inc(&sp->so_count);
  1509. spin_unlock(&clp->cl_lock);
  1510. rcu_read_unlock();
  1511. status = nfs4_reclaim_open_state(sp, ops);
  1512. if (status < 0) {
  1513. set_bit(ops->owner_flag_bit, &sp->so_flags);
  1514. nfs4_put_state_owner(sp);
  1515. return nfs4_recovery_handle_error(clp, status);
  1516. }
  1517. nfs4_put_state_owner(sp);
  1518. goto restart;
  1519. }
  1520. spin_unlock(&clp->cl_lock);
  1521. }
  1522. rcu_read_unlock();
  1523. return status;
  1524. }
  1525. static int nfs4_check_lease(struct nfs_client *clp)
  1526. {
  1527. struct rpc_cred *cred;
  1528. const struct nfs4_state_maintenance_ops *ops =
  1529. clp->cl_mvops->state_renewal_ops;
  1530. int status;
  1531. /* Is the client already known to have an expired lease? */
  1532. if (test_bit(NFS4CLNT_LEASE_EXPIRED, &clp->cl_state))
  1533. return 0;
  1534. spin_lock(&clp->cl_lock);
  1535. cred = ops->get_state_renewal_cred_locked(clp);
  1536. spin_unlock(&clp->cl_lock);
  1537. if (cred == NULL) {
  1538. cred = nfs4_get_clid_cred(clp);
  1539. status = -ENOKEY;
  1540. if (cred == NULL)
  1541. goto out;
  1542. }
  1543. status = ops->renew_lease(clp, cred);
  1544. put_rpccred(cred);
  1545. if (status == -ETIMEDOUT) {
  1546. set_bit(NFS4CLNT_CHECK_LEASE, &clp->cl_state);
  1547. return 0;
  1548. }
  1549. out:
  1550. return nfs4_recovery_handle_error(clp, status);
  1551. }
  1552. /* Set NFS4CLNT_LEASE_EXPIRED and reclaim reboot state for all v4.0 errors
  1553. * and for recoverable errors on EXCHANGE_ID for v4.1
  1554. */
  1555. static int nfs4_handle_reclaim_lease_error(struct nfs_client *clp, int status)
  1556. {
  1557. switch (status) {
  1558. case -NFS4ERR_SEQ_MISORDERED:
  1559. if (test_and_set_bit(NFS4CLNT_PURGE_STATE, &clp->cl_state))
  1560. return -ESERVERFAULT;
  1561. /* Lease confirmation error: retry after purging the lease */
  1562. ssleep(1);
  1563. clear_bit(NFS4CLNT_LEASE_CONFIRM, &clp->cl_state);
  1564. break;
  1565. case -NFS4ERR_STALE_CLIENTID:
  1566. clear_bit(NFS4CLNT_LEASE_CONFIRM, &clp->cl_state);
  1567. nfs4_state_clear_reclaim_reboot(clp);
  1568. nfs4_state_start_reclaim_reboot(clp);
  1569. break;
  1570. case -NFS4ERR_CLID_INUSE:
  1571. pr_err("NFS: Server %s reports our clientid is in use\n",
  1572. clp->cl_hostname);
  1573. nfs_mark_client_ready(clp, -EPERM);
  1574. clear_bit(NFS4CLNT_LEASE_CONFIRM, &clp->cl_state);
  1575. return -EPERM;
  1576. case -EACCES:
  1577. case -NFS4ERR_DELAY:
  1578. case -ETIMEDOUT:
  1579. case -EAGAIN:
  1580. ssleep(1);
  1581. break;
  1582. case -NFS4ERR_MINOR_VERS_MISMATCH:
  1583. if (clp->cl_cons_state == NFS_CS_SESSION_INITING)
  1584. nfs_mark_client_ready(clp, -EPROTONOSUPPORT);
  1585. dprintk("%s: exit with error %d for server %s\n",
  1586. __func__, -EPROTONOSUPPORT, clp->cl_hostname);
  1587. return -EPROTONOSUPPORT;
  1588. case -NFS4ERR_NOT_SAME: /* FixMe: implement recovery
  1589. * in nfs4_exchange_id */
  1590. default:
  1591. dprintk("%s: exit with error %d for server %s\n", __func__,
  1592. status, clp->cl_hostname);
  1593. return status;
  1594. }
  1595. set_bit(NFS4CLNT_LEASE_EXPIRED, &clp->cl_state);
  1596. dprintk("%s: handled error %d for server %s\n", __func__, status,
  1597. clp->cl_hostname);
  1598. return 0;
  1599. }
  1600. static int nfs4_establish_lease(struct nfs_client *clp)
  1601. {
  1602. struct rpc_cred *cred;
  1603. const struct nfs4_state_recovery_ops *ops =
  1604. clp->cl_mvops->reboot_recovery_ops;
  1605. int status;
  1606. cred = nfs4_get_clid_cred(clp);
  1607. if (cred == NULL)
  1608. return -ENOENT;
  1609. status = ops->establish_clid(clp, cred);
  1610. put_rpccred(cred);
  1611. if (status != 0)
  1612. return status;
  1613. pnfs_destroy_all_layouts(clp);
  1614. return 0;
  1615. }
  1616. /*
  1617. * Returns zero or a negative errno. NFS4ERR values are converted
  1618. * to local errno values.
  1619. */
  1620. static int nfs4_reclaim_lease(struct nfs_client *clp)
  1621. {
  1622. int status;
  1623. status = nfs4_establish_lease(clp);
  1624. if (status < 0)
  1625. return nfs4_handle_reclaim_lease_error(clp, status);
  1626. if (test_and_clear_bit(NFS4CLNT_SERVER_SCOPE_MISMATCH, &clp->cl_state))
  1627. nfs4_state_start_reclaim_nograce(clp);
  1628. if (!test_bit(NFS4CLNT_RECLAIM_NOGRACE, &clp->cl_state))
  1629. set_bit(NFS4CLNT_RECLAIM_REBOOT, &clp->cl_state);
  1630. clear_bit(NFS4CLNT_CHECK_LEASE, &clp->cl_state);
  1631. clear_bit(NFS4CLNT_LEASE_EXPIRED, &clp->cl_state);
  1632. return 0;
  1633. }
  1634. static int nfs4_purge_lease(struct nfs_client *clp)
  1635. {
  1636. int status;
  1637. status = nfs4_establish_lease(clp);
  1638. if (status < 0)
  1639. return nfs4_handle_reclaim_lease_error(clp, status);
  1640. clear_bit(NFS4CLNT_PURGE_STATE, &clp->cl_state);
  1641. set_bit(NFS4CLNT_LEASE_EXPIRED, &clp->cl_state);
  1642. nfs4_state_start_reclaim_nograce(clp);
  1643. return 0;
  1644. }
  1645. /**
  1646. * nfs4_discover_server_trunking - Detect server IP address trunking
  1647. *
  1648. * @clp: nfs_client under test
  1649. * @result: OUT: found nfs_client, or clp
  1650. *
  1651. * Returns zero or a negative errno. If zero is returned,
  1652. * an nfs_client pointer is planted in "result".
  1653. *
  1654. * Note: since we are invoked in process context, and
  1655. * not from inside the state manager, we cannot use
  1656. * nfs4_handle_reclaim_lease_error().
  1657. */
  1658. int nfs4_discover_server_trunking(struct nfs_client *clp,
  1659. struct nfs_client **result)
  1660. {
  1661. const struct nfs4_state_recovery_ops *ops =
  1662. clp->cl_mvops->reboot_recovery_ops;
  1663. struct rpc_clnt *clnt;
  1664. struct rpc_cred *cred;
  1665. int i, status;
  1666. dprintk("NFS: %s: testing '%s'\n", __func__, clp->cl_hostname);
  1667. clnt = clp->cl_rpcclient;
  1668. i = 0;
  1669. mutex_lock(&nfs_clid_init_mutex);
  1670. again:
  1671. status = -ENOENT;
  1672. cred = nfs4_get_clid_cred(clp);
  1673. if (cred == NULL)
  1674. goto out_unlock;
  1675. status = ops->detect_trunking(clp, result, cred);
  1676. put_rpccred(cred);
  1677. switch (status) {
  1678. case 0:
  1679. break;
  1680. case -NFS4ERR_DELAY:
  1681. case -ETIMEDOUT:
  1682. case -EAGAIN:
  1683. ssleep(1);
  1684. case -NFS4ERR_STALE_CLIENTID:
  1685. dprintk("NFS: %s after status %d, retrying\n",
  1686. __func__, status);
  1687. goto again;
  1688. case -EACCES:
  1689. if (i++ == 0) {
  1690. nfs4_root_machine_cred(clp);
  1691. goto again;
  1692. }
  1693. if (i > 2)
  1694. break;
  1695. case -NFS4ERR_CLID_INUSE:
  1696. case -NFS4ERR_WRONGSEC:
  1697. clnt = rpc_clone_client_set_auth(clnt, RPC_AUTH_UNIX);
  1698. if (IS_ERR(clnt)) {
  1699. status = PTR_ERR(clnt);
  1700. break;
  1701. }
  1702. /* Note: this is safe because we haven't yet marked the
  1703. * client as ready, so we are the only user of
  1704. * clp->cl_rpcclient
  1705. */
  1706. clnt = xchg(&clp->cl_rpcclient, clnt);
  1707. rpc_shutdown_client(clnt);
  1708. clnt = clp->cl_rpcclient;
  1709. goto again;
  1710. case -NFS4ERR_MINOR_VERS_MISMATCH:
  1711. status = -EPROTONOSUPPORT;
  1712. break;
  1713. case -EKEYEXPIRED:
  1714. case -NFS4ERR_NOT_SAME: /* FixMe: implement recovery
  1715. * in nfs4_exchange_id */
  1716. status = -EKEYEXPIRED;
  1717. break;
  1718. default:
  1719. pr_warn("NFS: %s unhandled error %d. Exiting with error EIO\n",
  1720. __func__, status);
  1721. status = -EIO;
  1722. }
  1723. out_unlock:
  1724. mutex_unlock(&nfs_clid_init_mutex);
  1725. dprintk("NFS: %s: status = %d\n", __func__, status);
  1726. return status;
  1727. }
  1728. #ifdef CONFIG_NFS_V4_1
  1729. void nfs4_schedule_session_recovery(struct nfs4_session *session, int err)
  1730. {
  1731. struct nfs_client *clp = session->clp;
  1732. switch (err) {
  1733. default:
  1734. set_bit(NFS4CLNT_SESSION_RESET, &clp->cl_state);
  1735. break;
  1736. case -NFS4ERR_CONN_NOT_BOUND_TO_SESSION:
  1737. set_bit(NFS4CLNT_BIND_CONN_TO_SESSION, &clp->cl_state);
  1738. }
  1739. nfs4_schedule_lease_recovery(clp);
  1740. }
  1741. EXPORT_SYMBOL_GPL(nfs4_schedule_session_recovery);
  1742. static void nfs41_ping_server(struct nfs_client *clp)
  1743. {
  1744. /* Use CHECK_LEASE to ping the server with a SEQUENCE */
  1745. set_bit(NFS4CLNT_CHECK_LEASE, &clp->cl_state);
  1746. nfs4_schedule_state_manager(clp);
  1747. }
  /* Target slotid update notification: responds by pinging the server. */
  void nfs41_server_notify_target_slotid_update(struct nfs_client *clp)
  {
  	nfs41_ping_server(clp);
  }
  /* Highest slotid update notification: responds by pinging the server. */
  void nfs41_server_notify_highest_slotid_update(struct nfs_client *clp)
  {
  	nfs41_ping_server(clp);
  }
  1756. static void nfs4_reset_all_state(struct nfs_client *clp)
  1757. {
  1758. if (test_and_set_bit(NFS4CLNT_LEASE_EXPIRED, &clp->cl_state) == 0) {
  1759. set_bit(NFS4CLNT_PURGE_STATE, &clp->cl_state);
  1760. clear_bit(NFS4CLNT_LEASE_CONFIRM, &clp->cl_state);
  1761. nfs4_state_start_reclaim_nograce(clp);
  1762. dprintk("%s: scheduling reset of all state for server %s!\n",
  1763. __func__, clp->cl_hostname);
  1764. nfs4_schedule_state_manager(clp);
  1765. }
  1766. }
  1767. static void nfs41_handle_server_reboot(struct nfs_client *clp)
  1768. {
  1769. if (test_and_set_bit(NFS4CLNT_LEASE_EXPIRED, &clp->cl_state) == 0) {
  1770. nfs4_state_start_reclaim_reboot(clp);
  1771. dprintk("%s: server %s rebooted!\n", __func__,
  1772. clp->cl_hostname);
  1773. nfs4_schedule_state_manager(clp);
  1774. }
  1775. }
  1776. static void nfs41_handle_state_revoked(struct nfs_client *clp)
  1777. {
  1778. nfs4_reset_all_state(clp);
  1779. dprintk("%s: state revoked on server %s\n", __func__, clp->cl_hostname);
  1780. }
  1781. static void nfs41_handle_recallable_state_revoked(struct nfs_client *clp)
  1782. {
  1783. /* This will need to handle layouts too */
  1784. nfs_expire_all_delegations(clp);
  1785. dprintk("%s: Recallable state revoked on server %s!\n", __func__,
  1786. clp->cl_hostname);
  1787. }
  1788. static void nfs41_handle_backchannel_fault(struct nfs_client *clp)
  1789. {
  1790. nfs_expire_all_delegations(clp);
  1791. if (test_and_set_bit(NFS4CLNT_SESSION_RESET, &clp->cl_state) == 0)
  1792. nfs4_schedule_state_manager(clp);
  1793. dprintk("%s: server %s declared a backchannel fault\n", __func__,
  1794. clp->cl_hostname);
  1795. }
  1796. static void nfs41_handle_cb_path_down(struct nfs_client *clp)
  1797. {
  1798. if (test_and_set_bit(NFS4CLNT_BIND_CONN_TO_SESSION,
  1799. &clp->cl_state) == 0)
  1800. nfs4_schedule_state_manager(clp);
  1801. }
  1802. void nfs41_handle_sequence_flag_errors(struct nfs_client *clp, u32 flags)
  1803. {
  1804. if (!flags)
  1805. return;
  1806. dprintk("%s: \"%s\" (client ID %llx) flags=0x%08x\n",
  1807. __func__, clp->cl_hostname, clp->cl_clientid, flags);
  1808. if (flags & SEQ4_STATUS_RESTART_RECLAIM_NEEDED)
  1809. nfs41_handle_server_reboot(clp);
  1810. if (flags & (SEQ4_STATUS_EXPIRED_ALL_STATE_REVOKED |
  1811. SEQ4_STATUS_EXPIRED_SOME_STATE_REVOKED |
  1812. SEQ4_STATUS_ADMIN_STATE_REVOKED |
  1813. SEQ4_STATUS_LEASE_MOVED))
  1814. nfs41_handle_state_revoked(clp);
  1815. if (flags & SEQ4_STATUS_RECALLABLE_STATE_REVOKED)
  1816. nfs41_handle_recallable_state_revoked(clp);
  1817. if (flags & SEQ4_STATUS_BACKCHANNEL_FAULT)
  1818. nfs41_handle_backchannel_fault(clp);
  1819. else if (flags & (SEQ4_STATUS_CB_PATH_DOWN |
  1820. SEQ4_STATUS_CB_PATH_DOWN_SESSION))
  1821. nfs41_handle_cb_path_down(clp);
  1822. }
  1823. static int nfs4_reset_session(struct nfs_client *clp)
  1824. {
  1825. struct rpc_cred *cred;
  1826. int status;
  1827. if (!nfs4_has_session(clp))
  1828. return 0;
  1829. nfs4_begin_drain_session(clp);
  1830. cred = nfs4_get_clid_cred(clp);
  1831. status = nfs4_proc_destroy_session(clp->cl_session, cred);
  1832. switch (status) {
  1833. case 0:
  1834. case -NFS4ERR_BADSESSION:
  1835. case -NFS4ERR_DEADSESSION:
  1836. break;
  1837. case -NFS4ERR_BACK_CHAN_BUSY:
  1838. case -NFS4ERR_DELAY:
  1839. set_bit(NFS4CLNT_SESSION_RESET, &clp->cl_state);
  1840. status = 0;
  1841. ssleep(1);
  1842. goto out;
  1843. default:
  1844. status = nfs4_recovery_handle_error(clp, status);
  1845. goto out;
  1846. }
  1847. memset(clp->cl_session->sess_id.data, 0, NFS4_MAX_SESSIONID_LEN);
  1848. status = nfs4_proc_create_session(clp, cred);
  1849. if (status) {
  1850. dprintk("%s: session reset failed with status %d for server %s!\n",
  1851. __func__, status, clp->cl_hostname);
  1852. status = nfs4_handle_reclaim_lease_error(clp, status);
  1853. goto out;
  1854. }
  1855. nfs41_finish_session_reset(clp);
  1856. dprintk("%s: session reset was successful for server %s!\n",
  1857. __func__, clp->cl_hostname);
  1858. out:
  1859. if (cred)
  1860. put_rpccred(cred);
  1861. return status;
  1862. }
  1863. static int nfs4_bind_conn_to_session(struct nfs_client *clp)
  1864. {
  1865. struct rpc_cred *cred;
  1866. int ret;
  1867. if (!nfs4_has_session(clp))
  1868. return 0;
  1869. nfs4_begin_drain_session(clp);
  1870. cred = nfs4_get_clid_cred(clp);
  1871. ret = nfs4_proc_bind_conn_to_session(clp, cred);
  1872. if (cred)
  1873. put_rpccred(cred);
  1874. clear_bit(NFS4CLNT_BIND_CONN_TO_SESSION, &clp->cl_state);
  1875. switch (ret) {
  1876. case 0:
  1877. dprintk("%s: bind_conn_to_session was successful for server %s!\n",
  1878. __func__, clp->cl_hostname);
  1879. break;
  1880. case -NFS4ERR_DELAY:
  1881. ssleep(1);
  1882. set_bit(NFS4CLNT_BIND_CONN_TO_SESSION, &clp->cl_state);
  1883. break;
  1884. default:
  1885. return nfs4_recovery_handle_error(clp, ret);
  1886. }
  1887. return 0;
  1888. }
  1889. #else /* CONFIG_NFS_V4_1 */
  /* Stub used when CONFIG_NFS_V4_1 is not set: always reports success. */
  static int nfs4_reset_session(struct nfs_client *clp)
  {
  	return 0;
  }
  /* Stub used when CONFIG_NFS_V4_1 is not set: always reports success. */
  static int nfs4_bind_conn_to_session(struct nfs_client *clp)
  {
  	return 0;
  }
  1895. #endif /* CONFIG_NFS_V4_1 */
  1896. static void nfs4_state_manager(struct nfs_client *clp)
  1897. {
  1898. int status = 0;
  1899. const char *section = "", *section_sep = "";
  1900. /* Ensure exclusive access to NFSv4 state */
  1901. do {
  1902. if (test_bit(NFS4CLNT_PURGE_STATE, &clp->cl_state)) {
  1903. section = "purge state";
  1904. status = nfs4_purge_lease(clp);
  1905. if (status < 0)
  1906. goto out_error;
  1907. continue;
  1908. }
  1909. if (test_bit(NFS4CLNT_LEASE_EXPIRED, &clp->cl_state)) {
  1910. section = "lease expired";
  1911. /* We're going to have to re-establish a clientid */
  1912. status = nfs4_reclaim_lease(clp);
  1913. if (status < 0)
  1914. goto out_error;
  1915. continue;
  1916. }
  1917. /* Initialize or reset the session */
  1918. if (test_and_clear_bit(NFS4CLNT_SESSION_RESET, &clp->cl_state)) {
  1919. section = "reset session";
  1920. status = nfs4_reset_session(clp);
  1921. if (test_bit(NFS4CLNT_LEASE_EXPIRED, &clp->cl_state))
  1922. continue;
  1923. if (status < 0)
  1924. goto out_error;
  1925. }
  1926. /* Send BIND_CONN_TO_SESSION */
  1927. if (test_and_clear_bit(NFS4CLNT_BIND_CONN_TO_SESSION,
  1928. &clp->cl_state)) {
  1929. section = "bind conn to session";
  1930. status = nfs4_bind_conn_to_session(clp);
  1931. if (status < 0)
  1932. goto out_error;
  1933. continue;
  1934. }
  1935. if (test_and_clear_bit(NFS4CLNT_CHECK_LEASE, &clp->cl_state)) {
  1936. section = "check lease";
  1937. status = nfs4_check_lease(clp);
  1938. if (status < 0)
  1939. goto out_error;
  1940. continue;
  1941. }
  1942. /* First recover reboot state... */
  1943. if (test_bit(NFS4CLNT_RECLAIM_REBOOT, &clp->cl_state)) {
  1944. section = "reclaim reboot";
  1945. status = nfs4_do_reclaim(clp,
  1946. clp->cl_mvops->reboot_recovery_ops);
  1947. if (test_bit(NFS4CLNT_LEASE_EXPIRED, &clp->cl_state) ||
  1948. test_bit(NFS4CLNT_SESSION_RESET, &clp->cl_state))
  1949. continue;
  1950. nfs4_state_end_reclaim_reboot(clp);
  1951. if (test_bit(NFS4CLNT_RECLAIM_NOGRACE, &clp->cl_state))
  1952. continue;
  1953. if (status < 0)
  1954. goto out_error;
  1955. }
  1956. /* Now recover expired state... */
  1957. if (test_and_clear_bit(NFS4CLNT_RECLAIM_NOGRACE, &clp->cl_state)) {
  1958. section = "reclaim nograce";
  1959. status = nfs4_do_reclaim(clp,
  1960. clp->cl_mvops->nograce_recovery_ops);
  1961. if (test_bit(NFS4CLNT_LEASE_EXPIRED, &clp->cl_state) ||
  1962. test_bit(NFS4CLNT_SESSION_RESET, &clp->cl_state) ||
  1963. test_bit(NFS4CLNT_RECLAIM_REBOOT, &clp->cl_state))
  1964. continue;
  1965. if (status < 0)
  1966. goto out_error;
  1967. }
  1968. nfs4_end_drain_session(clp);
  1969. if (test_and_clear_bit(NFS4CLNT_DELEGRETURN, &clp->cl_state)) {
  1970. nfs_client_return_marked_delegations(clp);
  1971. continue;
  1972. }
  1973. nfs4_clear_state_manager_bit(clp);
  1974. /* Did we race with an attempt to give us more work? */
  1975. if (clp->cl_state == 0)
  1976. break;
  1977. if (test_and_set_bit(NFS4CLNT_MANAGER_RUNNING, &clp->cl_state) != 0)
  1978. break;
  1979. } while (atomic_read(&clp->cl_count) > 1);
  1980. return;
  1981. out_error:
  1982. if (strlen(section))
  1983. section_sep = ": ";
  1984. pr_warn_ratelimited("NFS: state manager%s%s failed on NFSv4 server %s"
  1985. " with error %d\n", section_sep, section,
  1986. clp->cl_hostname, -status);
  1987. ssleep(1);
  1988. nfs4_end_drain_session(clp);
  1989. nfs4_clear_state_manager_bit(clp);
  1990. }
  1991. static int nfs4_run_state_manager(void *ptr)
  1992. {
  1993. struct nfs_client *clp = ptr;
  1994. allow_signal(SIGKILL);
  1995. nfs4_state_manager(clp);
  1996. nfs_put_client(clp);
  1997. module_put_and_exit(0);
  1998. return 0;
  1999. }
  2000. /*
  2001. * Local variables:
  2002. * c-basic-offset: 8
  2003. * End:
  2004. */