inode.c 40 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127
7127812791280128112821283128412851286128712881289129012911292129312941295129612971298129913001301130213031304130513061307130813091310131113121313131413151316131713181319132013211322132313241325132613271328132913301331133213331334133513361337133813391340134113421343134413451346134713481349135013511352135313541355135613571358135913601361136213631364136513661367136813691370137113721373137413751376137713781379138013811382138313841385138613871388138913901391139213931394139513961397139813991400140114021403140414051406140714081409141014111412141314141415141614171418141914201421142214231424142514261427142814291430143114321433143414351436143714381439144014411442144314441445144614471448144914501451145214531454145514561457
  1. /*
  2. * linux/fs/nfs/inode.c
  3. *
  4. * Copyright (C) 1992 Rick Sladkey
  5. *
  6. * nfs inode and superblock handling functions
  7. *
  8. * Modularised by Alan Cox <Alan.Cox@linux.org>, while hacking some
  9. * experimental NFS changes. Modularisation taken straight from SYS5 fs.
  10. *
  11. * Change to nfs_read_super() to permit NFS mounts to multi-homed hosts.
  12. * J.S.Peatfield@damtp.cam.ac.uk
  13. *
  14. */
  15. #include <linux/module.h>
  16. #include <linux/init.h>
  17. #include <linux/sched.h>
  18. #include <linux/time.h>
  19. #include <linux/kernel.h>
  20. #include <linux/mm.h>
  21. #include <linux/string.h>
  22. #include <linux/stat.h>
  23. #include <linux/errno.h>
  24. #include <linux/unistd.h>
  25. #include <linux/sunrpc/clnt.h>
  26. #include <linux/sunrpc/stats.h>
  27. #include <linux/sunrpc/metrics.h>
  28. #include <linux/nfs_fs.h>
  29. #include <linux/nfs_mount.h>
  30. #include <linux/nfs4_mount.h>
  31. #include <linux/lockd/bind.h>
  32. #include <linux/smp_lock.h>
  33. #include <linux/seq_file.h>
  34. #include <linux/mount.h>
  35. #include <linux/nfs_idmap.h>
  36. #include <linux/vfs.h>
  37. #include <linux/inet.h>
  38. #include <linux/nfs_xdr.h>
  39. #include <asm/system.h>
  40. #include <asm/uaccess.h>
  41. #include "nfs4_fs.h"
  42. #include "callback.h"
  43. #include "delegation.h"
  44. #include "iostat.h"
  45. #include "internal.h"
  46. #define NFSDBG_FACILITY NFSDBG_VFS
  47. #define NFS_64_BIT_INODE_NUMBERS_ENABLED 1
  48. /* Default is to see 64-bit inode numbers */
  49. static int enable_ino64 = NFS_64_BIT_INODE_NUMBERS_ENABLED;
  50. static void nfs_invalidate_inode(struct inode *);
  51. static int nfs_update_inode(struct inode *, struct nfs_fattr *);
  52. static struct kmem_cache * nfs_inode_cachep;
  53. static inline unsigned long
  54. nfs_fattr_to_ino_t(struct nfs_fattr *fattr)
  55. {
  56. return nfs_fileid_to_ino_t(fattr->fileid);
  57. }
  58. /**
  59. * nfs_compat_user_ino64 - returns the user-visible inode number
  60. * @fileid: 64-bit fileid
  61. *
  62. * This function returns a 32-bit inode number if the boot parameter
  63. * nfs.enable_ino64 is zero.
  64. */
  65. u64 nfs_compat_user_ino64(u64 fileid)
  66. {
  67. int ino;
  68. if (enable_ino64)
  69. return fileid;
  70. ino = fileid;
  71. if (sizeof(ino) < sizeof(fileid))
  72. ino ^= fileid >> (sizeof(fileid)-sizeof(ino)) * 8;
  73. return ino;
  74. }
  75. int nfs_write_inode(struct inode *inode, int sync)
  76. {
  77. int ret;
  78. if (sync) {
  79. ret = filemap_fdatawait(inode->i_mapping);
  80. if (ret == 0)
  81. ret = nfs_commit_inode(inode, FLUSH_SYNC);
  82. } else
  83. ret = nfs_commit_inode(inode, 0);
  84. if (ret >= 0)
  85. return 0;
  86. __mark_inode_dirty(inode, I_DIRTY_DATASYNC);
  87. return ret;
  88. }
  89. void nfs_clear_inode(struct inode *inode)
  90. {
  91. /*
  92. * The following should never happen...
  93. */
  94. BUG_ON(nfs_have_writebacks(inode));
  95. BUG_ON(!list_empty(&NFS_I(inode)->open_files));
  96. nfs_zap_acl_cache(inode);
  97. nfs_access_zap_cache(inode);
  98. }
  99. /**
  100. * nfs_sync_mapping - helper to flush all mmapped dirty data to disk
  101. */
  102. int nfs_sync_mapping(struct address_space *mapping)
  103. {
  104. int ret;
  105. if (mapping->nrpages == 0)
  106. return 0;
  107. unmap_mapping_range(mapping, 0, 0, 0);
  108. ret = filemap_write_and_wait(mapping);
  109. if (ret != 0)
  110. goto out;
  111. ret = nfs_wb_all(mapping->host);
  112. out:
  113. return ret;
  114. }
  115. /*
  116. * Invalidate the local caches
  117. */
  118. static void nfs_zap_caches_locked(struct inode *inode)
  119. {
  120. struct nfs_inode *nfsi = NFS_I(inode);
  121. int mode = inode->i_mode;
  122. nfs_inc_stats(inode, NFSIOS_ATTRINVALIDATE);
  123. nfsi->attrtimeo = NFS_MINATTRTIMEO(inode);
  124. nfsi->attrtimeo_timestamp = jiffies;
  125. memset(NFS_COOKIEVERF(inode), 0, sizeof(NFS_COOKIEVERF(inode)));
  126. if (S_ISREG(mode) || S_ISDIR(mode) || S_ISLNK(mode))
  127. nfsi->cache_validity |= NFS_INO_INVALID_ATTR|NFS_INO_INVALID_DATA|NFS_INO_INVALID_ACCESS|NFS_INO_INVALID_ACL|NFS_INO_REVAL_PAGECACHE;
  128. else
  129. nfsi->cache_validity |= NFS_INO_INVALID_ATTR|NFS_INO_INVALID_ACCESS|NFS_INO_INVALID_ACL|NFS_INO_REVAL_PAGECACHE;
  130. }
  131. void nfs_zap_caches(struct inode *inode)
  132. {
  133. spin_lock(&inode->i_lock);
  134. nfs_zap_caches_locked(inode);
  135. spin_unlock(&inode->i_lock);
  136. }
  137. void nfs_zap_mapping(struct inode *inode, struct address_space *mapping)
  138. {
  139. if (mapping->nrpages != 0) {
  140. spin_lock(&inode->i_lock);
  141. NFS_I(inode)->cache_validity |= NFS_INO_INVALID_DATA;
  142. spin_unlock(&inode->i_lock);
  143. }
  144. }
  145. void nfs_zap_acl_cache(struct inode *inode)
  146. {
  147. void (*clear_acl_cache)(struct inode *);
  148. clear_acl_cache = NFS_PROTO(inode)->clear_acl_cache;
  149. if (clear_acl_cache != NULL)
  150. clear_acl_cache(inode);
  151. spin_lock(&inode->i_lock);
  152. NFS_I(inode)->cache_validity &= ~NFS_INO_INVALID_ACL;
  153. spin_unlock(&inode->i_lock);
  154. }
  155. void nfs_invalidate_atime(struct inode *inode)
  156. {
  157. spin_lock(&inode->i_lock);
  158. NFS_I(inode)->cache_validity |= NFS_INO_INVALID_ATIME;
  159. spin_unlock(&inode->i_lock);
  160. }
  161. /*
  162. * Invalidate, but do not unhash, the inode.
  163. * NB: must be called with inode->i_lock held!
  164. */
  165. static void nfs_invalidate_inode(struct inode *inode)
  166. {
  167. set_bit(NFS_INO_STALE, &NFS_I(inode)->flags);
  168. nfs_zap_caches_locked(inode);
  169. }
  170. struct nfs_find_desc {
  171. struct nfs_fh *fh;
  172. struct nfs_fattr *fattr;
  173. };
  174. /*
  175. * In NFSv3 we can have 64bit inode numbers. In order to support
  176. * this, and re-exported directories (also seen in NFSv2)
  177. * we are forced to allow 2 different inodes to have the same
  178. * i_ino.
  179. */
  180. static int
  181. nfs_find_actor(struct inode *inode, void *opaque)
  182. {
  183. struct nfs_find_desc *desc = (struct nfs_find_desc *)opaque;
  184. struct nfs_fh *fh = desc->fh;
  185. struct nfs_fattr *fattr = desc->fattr;
  186. if (NFS_FILEID(inode) != fattr->fileid)
  187. return 0;
  188. if (nfs_compare_fh(NFS_FH(inode), fh))
  189. return 0;
  190. if (is_bad_inode(inode) || NFS_STALE(inode))
  191. return 0;
  192. return 1;
  193. }
  194. static int
  195. nfs_init_locked(struct inode *inode, void *opaque)
  196. {
  197. struct nfs_find_desc *desc = (struct nfs_find_desc *)opaque;
  198. struct nfs_fattr *fattr = desc->fattr;
  199. set_nfs_fileid(inode, fattr->fileid);
  200. nfs_copy_fh(NFS_FH(inode), desc->fh);
  201. return 0;
  202. }
  203. /* Don't use READDIRPLUS on directories that we believe are too large */
  204. #define NFS_LIMIT_READDIRPLUS (8*PAGE_SIZE)
  205. /*
  206. * This is our front-end to iget that looks up inodes by file handle
  207. * instead of inode number.
  208. */
  209. struct inode *
  210. nfs_fhget(struct super_block *sb, struct nfs_fh *fh, struct nfs_fattr *fattr)
  211. {
  212. struct nfs_find_desc desc = {
  213. .fh = fh,
  214. .fattr = fattr
  215. };
  216. struct inode *inode = ERR_PTR(-ENOENT);
  217. unsigned long hash;
  218. if ((fattr->valid & NFS_ATTR_FATTR) == 0)
  219. goto out_no_inode;
  220. if (!fattr->nlink) {
  221. printk("NFS: Buggy server - nlink == 0!\n");
  222. goto out_no_inode;
  223. }
  224. hash = nfs_fattr_to_ino_t(fattr);
  225. inode = iget5_locked(sb, hash, nfs_find_actor, nfs_init_locked, &desc);
  226. if (inode == NULL) {
  227. inode = ERR_PTR(-ENOMEM);
  228. goto out_no_inode;
  229. }
  230. if (inode->i_state & I_NEW) {
  231. struct nfs_inode *nfsi = NFS_I(inode);
  232. unsigned long now = jiffies;
  233. /* We set i_ino for the few things that still rely on it,
  234. * such as stat(2) */
  235. inode->i_ino = hash;
  236. /* We can't support update_atime(), since the server will reset it */
  237. inode->i_flags |= S_NOATIME|S_NOCMTIME;
  238. inode->i_mode = fattr->mode;
  239. /* Why so? Because we want revalidate for devices/FIFOs, and
  240. * that's precisely what we have in nfs_file_inode_operations.
  241. */
  242. inode->i_op = NFS_SB(sb)->nfs_client->rpc_ops->file_inode_ops;
  243. if (S_ISREG(inode->i_mode)) {
  244. inode->i_fop = &nfs_file_operations;
  245. inode->i_data.a_ops = &nfs_file_aops;
  246. inode->i_data.backing_dev_info = &NFS_SB(sb)->backing_dev_info;
  247. } else if (S_ISDIR(inode->i_mode)) {
  248. inode->i_op = NFS_SB(sb)->nfs_client->rpc_ops->dir_inode_ops;
  249. inode->i_fop = &nfs_dir_operations;
  250. if (nfs_server_capable(inode, NFS_CAP_READDIRPLUS)
  251. && fattr->size <= NFS_LIMIT_READDIRPLUS)
  252. set_bit(NFS_INO_ADVISE_RDPLUS, &NFS_I(inode)->flags);
  253. /* Deal with crossing mountpoints */
  254. if (!nfs_fsid_equal(&NFS_SB(sb)->fsid, &fattr->fsid)) {
  255. if (fattr->valid & NFS_ATTR_FATTR_V4_REFERRAL)
  256. inode->i_op = &nfs_referral_inode_operations;
  257. else
  258. inode->i_op = &nfs_mountpoint_inode_operations;
  259. inode->i_fop = NULL;
  260. set_bit(NFS_INO_MOUNTPOINT, &nfsi->flags);
  261. }
  262. } else if (S_ISLNK(inode->i_mode))
  263. inode->i_op = &nfs_symlink_inode_operations;
  264. else
  265. init_special_inode(inode, inode->i_mode, fattr->rdev);
  266. nfsi->read_cache_jiffies = fattr->time_start;
  267. nfsi->last_updated = now;
  268. nfsi->cache_change_attribute = now;
  269. inode->i_atime = fattr->atime;
  270. inode->i_mtime = fattr->mtime;
  271. inode->i_ctime = fattr->ctime;
  272. if (fattr->valid & NFS_ATTR_FATTR_V4)
  273. nfsi->change_attr = fattr->change_attr;
  274. inode->i_size = nfs_size_to_loff_t(fattr->size);
  275. inode->i_nlink = fattr->nlink;
  276. inode->i_uid = fattr->uid;
  277. inode->i_gid = fattr->gid;
  278. if (fattr->valid & (NFS_ATTR_FATTR_V3 | NFS_ATTR_FATTR_V4)) {
  279. /*
  280. * report the blocks in 512byte units
  281. */
  282. inode->i_blocks = nfs_calc_block_size(fattr->du.nfs3.used);
  283. } else {
  284. inode->i_blocks = fattr->du.nfs2.blocks;
  285. }
  286. nfsi->attrtimeo = NFS_MINATTRTIMEO(inode);
  287. nfsi->attrtimeo_timestamp = now;
  288. memset(nfsi->cookieverf, 0, sizeof(nfsi->cookieverf));
  289. nfsi->access_cache = RB_ROOT;
  290. unlock_new_inode(inode);
  291. } else
  292. nfs_refresh_inode(inode, fattr);
  293. dprintk("NFS: nfs_fhget(%s/%Ld ct=%d)\n",
  294. inode->i_sb->s_id,
  295. (long long)NFS_FILEID(inode),
  296. atomic_read(&inode->i_count));
  297. out:
  298. return inode;
  299. out_no_inode:
  300. dprintk("nfs_fhget: iget failed with error %ld\n", PTR_ERR(inode));
  301. goto out;
  302. }
  303. #define NFS_VALID_ATTRS (ATTR_MODE|ATTR_UID|ATTR_GID|ATTR_SIZE|ATTR_ATIME|ATTR_ATIME_SET|ATTR_MTIME|ATTR_MTIME_SET|ATTR_FILE)
  304. int
  305. nfs_setattr(struct dentry *dentry, struct iattr *attr)
  306. {
  307. struct inode *inode = dentry->d_inode;
  308. struct nfs_fattr fattr;
  309. int error;
  310. nfs_inc_stats(inode, NFSIOS_VFSSETATTR);
  311. /* skip mode change if it's just for clearing setuid/setgid */
  312. if (attr->ia_valid & (ATTR_KILL_SUID | ATTR_KILL_SGID))
  313. attr->ia_valid &= ~ATTR_MODE;
  314. if (attr->ia_valid & ATTR_SIZE) {
  315. if (!S_ISREG(inode->i_mode) || attr->ia_size == i_size_read(inode))
  316. attr->ia_valid &= ~ATTR_SIZE;
  317. }
  318. /* Optimization: if the end result is no change, don't RPC */
  319. attr->ia_valid &= NFS_VALID_ATTRS;
  320. if ((attr->ia_valid & ~ATTR_FILE) == 0)
  321. return 0;
  322. /* Write all dirty data */
  323. if (S_ISREG(inode->i_mode)) {
  324. filemap_write_and_wait(inode->i_mapping);
  325. nfs_wb_all(inode);
  326. }
  327. /*
  328. * Return any delegations if we're going to change ACLs
  329. */
  330. if ((attr->ia_valid & (ATTR_MODE|ATTR_UID|ATTR_GID)) != 0)
  331. nfs_inode_return_delegation(inode);
  332. error = NFS_PROTO(inode)->setattr(dentry, &fattr, attr);
  333. if (error == 0)
  334. nfs_refresh_inode(inode, &fattr);
  335. return error;
  336. }
  337. /**
  338. * nfs_vmtruncate - unmap mappings "freed" by truncate() syscall
  339. * @inode: inode of the file used
  340. * @offset: file offset to start truncating
  341. *
  342. * This is a copy of the common vmtruncate, but with the locking
  343. * corrected to take into account the fact that NFS requires
  344. * inode->i_size to be updated under the inode->i_lock.
  345. */
  346. static int nfs_vmtruncate(struct inode * inode, loff_t offset)
  347. {
  348. if (i_size_read(inode) < offset) {
  349. unsigned long limit;
  350. limit = current->signal->rlim[RLIMIT_FSIZE].rlim_cur;
  351. if (limit != RLIM_INFINITY && offset > limit)
  352. goto out_sig;
  353. if (offset > inode->i_sb->s_maxbytes)
  354. goto out_big;
  355. spin_lock(&inode->i_lock);
  356. i_size_write(inode, offset);
  357. spin_unlock(&inode->i_lock);
  358. } else {
  359. struct address_space *mapping = inode->i_mapping;
  360. /*
  361. * truncation of in-use swapfiles is disallowed - it would
  362. * cause subsequent swapout to scribble on the now-freed
  363. * blocks.
  364. */
  365. if (IS_SWAPFILE(inode))
  366. return -ETXTBSY;
  367. spin_lock(&inode->i_lock);
  368. i_size_write(inode, offset);
  369. spin_unlock(&inode->i_lock);
  370. /*
  371. * unmap_mapping_range is called twice, first simply for
  372. * efficiency so that truncate_inode_pages does fewer
  373. * single-page unmaps. However after this first call, and
  374. * before truncate_inode_pages finishes, it is possible for
  375. * private pages to be COWed, which remain after
  376. * truncate_inode_pages finishes, hence the second
  377. * unmap_mapping_range call must be made for correctness.
  378. */
  379. unmap_mapping_range(mapping, offset + PAGE_SIZE - 1, 0, 1);
  380. truncate_inode_pages(mapping, offset);
  381. unmap_mapping_range(mapping, offset + PAGE_SIZE - 1, 0, 1);
  382. }
  383. return 0;
  384. out_sig:
  385. send_sig(SIGXFSZ, current, 0);
  386. out_big:
  387. return -EFBIG;
  388. }
  389. /**
  390. * nfs_setattr_update_inode - Update inode metadata after a setattr call.
  391. * @inode: pointer to struct inode
  392. * @attr: pointer to struct iattr
  393. *
  394. * Note: we do this in the *proc.c in order to ensure that
  395. * it works for things like exclusive creates too.
  396. */
  397. void nfs_setattr_update_inode(struct inode *inode, struct iattr *attr)
  398. {
  399. if ((attr->ia_valid & (ATTR_MODE|ATTR_UID|ATTR_GID)) != 0) {
  400. if ((attr->ia_valid & ATTR_MODE) != 0) {
  401. int mode = attr->ia_mode & S_IALLUGO;
  402. mode |= inode->i_mode & ~S_IALLUGO;
  403. inode->i_mode = mode;
  404. }
  405. if ((attr->ia_valid & ATTR_UID) != 0)
  406. inode->i_uid = attr->ia_uid;
  407. if ((attr->ia_valid & ATTR_GID) != 0)
  408. inode->i_gid = attr->ia_gid;
  409. spin_lock(&inode->i_lock);
  410. NFS_I(inode)->cache_validity |= NFS_INO_INVALID_ACCESS|NFS_INO_INVALID_ACL;
  411. spin_unlock(&inode->i_lock);
  412. }
  413. if ((attr->ia_valid & ATTR_SIZE) != 0) {
  414. nfs_inc_stats(inode, NFSIOS_SETATTRTRUNC);
  415. nfs_vmtruncate(inode, attr->ia_size);
  416. }
  417. }
  418. static int nfs_wait_schedule(void *word)
  419. {
  420. if (signal_pending(current))
  421. return -ERESTARTSYS;
  422. schedule();
  423. return 0;
  424. }
  425. /*
  426. * Wait for the inode to get unlocked.
  427. */
  428. static int nfs_wait_on_inode(struct inode *inode)
  429. {
  430. struct nfs_inode *nfsi = NFS_I(inode);
  431. int error;
  432. error = wait_on_bit_lock(&nfsi->flags, NFS_INO_REVALIDATING,
  433. nfs_wait_schedule, TASK_KILLABLE);
  434. return error;
  435. }
  436. static void nfs_wake_up_inode(struct inode *inode)
  437. {
  438. struct nfs_inode *nfsi = NFS_I(inode);
  439. clear_bit(NFS_INO_REVALIDATING, &nfsi->flags);
  440. smp_mb__after_clear_bit();
  441. wake_up_bit(&nfsi->flags, NFS_INO_REVALIDATING);
  442. }
  443. int nfs_getattr(struct vfsmount *mnt, struct dentry *dentry, struct kstat *stat)
  444. {
  445. struct inode *inode = dentry->d_inode;
  446. int need_atime = NFS_I(inode)->cache_validity & NFS_INO_INVALID_ATIME;
  447. int err;
  448. /*
  449. * Flush out writes to the server in order to update c/mtime.
  450. *
  451. * Hold the i_mutex to suspend application writes temporarily;
  452. * this prevents long-running writing applications from blocking
  453. * nfs_wb_nocommit.
  454. */
  455. if (S_ISREG(inode->i_mode)) {
  456. mutex_lock(&inode->i_mutex);
  457. nfs_wb_nocommit(inode);
  458. mutex_unlock(&inode->i_mutex);
  459. }
  460. /*
  461. * We may force a getattr if the user cares about atime.
  462. *
  463. * Note that we only have to check the vfsmount flags here:
  464. * - NFS always sets S_NOATIME by so checking it would give a
  465. * bogus result
  466. * - NFS never sets MS_NOATIME or MS_NODIRATIME so there is
  467. * no point in checking those.
  468. */
  469. if ((mnt->mnt_flags & MNT_NOATIME) ||
  470. ((mnt->mnt_flags & MNT_NODIRATIME) && S_ISDIR(inode->i_mode)))
  471. need_atime = 0;
  472. if (need_atime)
  473. err = __nfs_revalidate_inode(NFS_SERVER(inode), inode);
  474. else
  475. err = nfs_revalidate_inode(NFS_SERVER(inode), inode);
  476. if (!err) {
  477. generic_fillattr(inode, stat);
  478. stat->ino = nfs_compat_user_ino64(NFS_FILEID(inode));
  479. }
  480. return err;
  481. }
  482. static struct nfs_open_context *alloc_nfs_open_context(struct vfsmount *mnt, struct dentry *dentry, struct rpc_cred *cred)
  483. {
  484. struct nfs_open_context *ctx;
  485. ctx = kmalloc(sizeof(*ctx), GFP_KERNEL);
  486. if (ctx != NULL) {
  487. ctx->path.dentry = dget(dentry);
  488. ctx->path.mnt = mntget(mnt);
  489. ctx->cred = get_rpccred(cred);
  490. ctx->state = NULL;
  491. ctx->lockowner = current->files;
  492. ctx->flags = 0;
  493. ctx->error = 0;
  494. ctx->dir_cookie = 0;
  495. atomic_set(&ctx->count, 1);
  496. }
  497. return ctx;
  498. }
  499. struct nfs_open_context *get_nfs_open_context(struct nfs_open_context *ctx)
  500. {
  501. if (ctx != NULL)
  502. atomic_inc(&ctx->count);
  503. return ctx;
  504. }
  505. static void __put_nfs_open_context(struct nfs_open_context *ctx, int wait)
  506. {
  507. struct inode *inode;
  508. if (ctx == NULL)
  509. return;
  510. inode = ctx->path.dentry->d_inode;
  511. if (!atomic_dec_and_lock(&ctx->count, &inode->i_lock))
  512. return;
  513. list_del(&ctx->list);
  514. spin_unlock(&inode->i_lock);
  515. if (ctx->state != NULL) {
  516. if (wait)
  517. nfs4_close_sync(&ctx->path, ctx->state, ctx->mode);
  518. else
  519. nfs4_close_state(&ctx->path, ctx->state, ctx->mode);
  520. }
  521. if (ctx->cred != NULL)
  522. put_rpccred(ctx->cred);
  523. path_put(&ctx->path);
  524. kfree(ctx);
  525. }
  526. void put_nfs_open_context(struct nfs_open_context *ctx)
  527. {
  528. __put_nfs_open_context(ctx, 0);
  529. }
  530. static void put_nfs_open_context_sync(struct nfs_open_context *ctx)
  531. {
  532. __put_nfs_open_context(ctx, 1);
  533. }
  534. /*
  535. * Ensure that mmap has a recent RPC credential for use when writing out
  536. * shared pages
  537. */
  538. static void nfs_file_set_open_context(struct file *filp, struct nfs_open_context *ctx)
  539. {
  540. struct inode *inode = filp->f_path.dentry->d_inode;
  541. struct nfs_inode *nfsi = NFS_I(inode);
  542. filp->private_data = get_nfs_open_context(ctx);
  543. spin_lock(&inode->i_lock);
  544. list_add(&ctx->list, &nfsi->open_files);
  545. spin_unlock(&inode->i_lock);
  546. }
  547. /*
  548. * Given an inode, search for an open context with the desired characteristics
  549. */
  550. struct nfs_open_context *nfs_find_open_context(struct inode *inode, struct rpc_cred *cred, int mode)
  551. {
  552. struct nfs_inode *nfsi = NFS_I(inode);
  553. struct nfs_open_context *pos, *ctx = NULL;
  554. spin_lock(&inode->i_lock);
  555. list_for_each_entry(pos, &nfsi->open_files, list) {
  556. if (cred != NULL && pos->cred != cred)
  557. continue;
  558. if ((pos->mode & mode) == mode) {
  559. ctx = get_nfs_open_context(pos);
  560. break;
  561. }
  562. }
  563. spin_unlock(&inode->i_lock);
  564. return ctx;
  565. }
  566. static void nfs_file_clear_open_context(struct file *filp)
  567. {
  568. struct inode *inode = filp->f_path.dentry->d_inode;
  569. struct nfs_open_context *ctx = nfs_file_open_context(filp);
  570. if (ctx) {
  571. filp->private_data = NULL;
  572. spin_lock(&inode->i_lock);
  573. list_move_tail(&ctx->list, &NFS_I(inode)->open_files);
  574. spin_unlock(&inode->i_lock);
  575. put_nfs_open_context_sync(ctx);
  576. }
  577. }
  578. /*
  579. * These allocate and release file read/write context information.
  580. */
  581. int nfs_open(struct inode *inode, struct file *filp)
  582. {
  583. struct nfs_open_context *ctx;
  584. struct rpc_cred *cred;
  585. cred = rpc_lookup_cred();
  586. if (IS_ERR(cred))
  587. return PTR_ERR(cred);
  588. ctx = alloc_nfs_open_context(filp->f_path.mnt, filp->f_path.dentry, cred);
  589. put_rpccred(cred);
  590. if (ctx == NULL)
  591. return -ENOMEM;
  592. ctx->mode = filp->f_mode;
  593. nfs_file_set_open_context(filp, ctx);
  594. put_nfs_open_context(ctx);
  595. return 0;
  596. }
  597. int nfs_release(struct inode *inode, struct file *filp)
  598. {
  599. nfs_file_clear_open_context(filp);
  600. return 0;
  601. }
  602. /*
  603. * This function is called whenever some part of NFS notices that
  604. * the cached attributes have to be refreshed.
  605. */
  606. int
  607. __nfs_revalidate_inode(struct nfs_server *server, struct inode *inode)
  608. {
  609. int status = -ESTALE;
  610. struct nfs_fattr fattr;
  611. struct nfs_inode *nfsi = NFS_I(inode);
  612. dfprintk(PAGECACHE, "NFS: revalidating (%s/%Ld)\n",
  613. inode->i_sb->s_id, (long long)NFS_FILEID(inode));
  614. nfs_inc_stats(inode, NFSIOS_INODEREVALIDATE);
  615. if (is_bad_inode(inode))
  616. goto out_nowait;
  617. if (NFS_STALE(inode))
  618. goto out_nowait;
  619. status = nfs_wait_on_inode(inode);
  620. if (status < 0)
  621. goto out;
  622. status = -ESTALE;
  623. if (NFS_STALE(inode))
  624. goto out;
  625. status = NFS_PROTO(inode)->getattr(server, NFS_FH(inode), &fattr);
  626. if (status != 0) {
  627. dfprintk(PAGECACHE, "nfs_revalidate_inode: (%s/%Ld) getattr failed, error=%d\n",
  628. inode->i_sb->s_id,
  629. (long long)NFS_FILEID(inode), status);
  630. if (status == -ESTALE) {
  631. nfs_zap_caches(inode);
  632. if (!S_ISDIR(inode->i_mode))
  633. set_bit(NFS_INO_STALE, &NFS_I(inode)->flags);
  634. }
  635. goto out;
  636. }
  637. spin_lock(&inode->i_lock);
  638. status = nfs_update_inode(inode, &fattr);
  639. if (status) {
  640. spin_unlock(&inode->i_lock);
  641. dfprintk(PAGECACHE, "nfs_revalidate_inode: (%s/%Ld) refresh failed, error=%d\n",
  642. inode->i_sb->s_id,
  643. (long long)NFS_FILEID(inode), status);
  644. goto out;
  645. }
  646. spin_unlock(&inode->i_lock);
  647. if (nfsi->cache_validity & NFS_INO_INVALID_ACL)
  648. nfs_zap_acl_cache(inode);
  649. dfprintk(PAGECACHE, "NFS: (%s/%Ld) revalidation complete\n",
  650. inode->i_sb->s_id,
  651. (long long)NFS_FILEID(inode));
  652. out:
  653. nfs_wake_up_inode(inode);
  654. out_nowait:
  655. return status;
  656. }
  657. int nfs_attribute_timeout(struct inode *inode)
  658. {
  659. struct nfs_inode *nfsi = NFS_I(inode);
  660. if (nfs_have_delegation(inode, FMODE_READ))
  661. return 0;
  662. /*
  663. * Special case: if the attribute timeout is set to 0, then always
  664. * treat the cache as having expired (unless holding
  665. * a delegation).
  666. */
  667. if (nfsi->attrtimeo == 0)
  668. return 1;
  669. return !time_in_range(jiffies, nfsi->read_cache_jiffies, nfsi->read_cache_jiffies + nfsi->attrtimeo);
  670. }
  671. /**
  672. * nfs_revalidate_inode - Revalidate the inode attributes
  673. * @server - pointer to nfs_server struct
  674. * @inode - pointer to inode struct
  675. *
  676. * Updates inode attribute information by retrieving the data from the server.
  677. */
  678. int nfs_revalidate_inode(struct nfs_server *server, struct inode *inode)
  679. {
  680. if (!(NFS_I(inode)->cache_validity & NFS_INO_INVALID_ATTR)
  681. && !nfs_attribute_timeout(inode))
  682. return NFS_STALE(inode) ? -ESTALE : 0;
  683. return __nfs_revalidate_inode(server, inode);
  684. }
  685. static int nfs_invalidate_mapping_nolock(struct inode *inode, struct address_space *mapping)
  686. {
  687. struct nfs_inode *nfsi = NFS_I(inode);
  688. if (mapping->nrpages != 0) {
  689. int ret = invalidate_inode_pages2(mapping);
  690. if (ret < 0)
  691. return ret;
  692. }
  693. spin_lock(&inode->i_lock);
  694. nfsi->cache_validity &= ~NFS_INO_INVALID_DATA;
  695. if (S_ISDIR(inode->i_mode))
  696. memset(nfsi->cookieverf, 0, sizeof(nfsi->cookieverf));
  697. spin_unlock(&inode->i_lock);
  698. nfs_inc_stats(inode, NFSIOS_DATAINVALIDATE);
  699. dfprintk(PAGECACHE, "NFS: (%s/%Ld) data cache invalidated\n",
  700. inode->i_sb->s_id, (long long)NFS_FILEID(inode));
  701. return 0;
  702. }
  703. static int nfs_invalidate_mapping(struct inode *inode, struct address_space *mapping)
  704. {
  705. int ret = 0;
  706. mutex_lock(&inode->i_mutex);
  707. if (NFS_I(inode)->cache_validity & NFS_INO_INVALID_DATA) {
  708. ret = nfs_sync_mapping(mapping);
  709. if (ret == 0)
  710. ret = nfs_invalidate_mapping_nolock(inode, mapping);
  711. }
  712. mutex_unlock(&inode->i_mutex);
  713. return ret;
  714. }
  715. /**
  716. * nfs_revalidate_mapping_nolock - Revalidate the pagecache
  717. * @inode - pointer to host inode
  718. * @mapping - pointer to mapping
  719. */
  720. int nfs_revalidate_mapping_nolock(struct inode *inode, struct address_space *mapping)
  721. {
  722. struct nfs_inode *nfsi = NFS_I(inode);
  723. int ret = 0;
  724. if ((nfsi->cache_validity & NFS_INO_REVAL_PAGECACHE)
  725. || nfs_attribute_timeout(inode) || NFS_STALE(inode)) {
  726. ret = __nfs_revalidate_inode(NFS_SERVER(inode), inode);
  727. if (ret < 0)
  728. goto out;
  729. }
  730. if (nfsi->cache_validity & NFS_INO_INVALID_DATA)
  731. ret = nfs_invalidate_mapping_nolock(inode, mapping);
  732. out:
  733. return ret;
  734. }
  735. /**
  736. * nfs_revalidate_mapping - Revalidate the pagecache
  737. * @inode - pointer to host inode
  738. * @mapping - pointer to mapping
  739. *
  740. * This version of the function will take the inode->i_mutex and attempt to
  741. * flush out all dirty data if it needs to invalidate the page cache.
  742. */
  743. int nfs_revalidate_mapping(struct inode *inode, struct address_space *mapping)
  744. {
  745. struct nfs_inode *nfsi = NFS_I(inode);
  746. int ret = 0;
  747. if ((nfsi->cache_validity & NFS_INO_REVAL_PAGECACHE)
  748. || nfs_attribute_timeout(inode) || NFS_STALE(inode)) {
  749. ret = __nfs_revalidate_inode(NFS_SERVER(inode), inode);
  750. if (ret < 0)
  751. goto out;
  752. }
  753. if (nfsi->cache_validity & NFS_INO_INVALID_DATA)
  754. ret = nfs_invalidate_mapping(inode, mapping);
  755. out:
  756. return ret;
  757. }
  758. static void nfs_wcc_update_inode(struct inode *inode, struct nfs_fattr *fattr)
  759. {
  760. struct nfs_inode *nfsi = NFS_I(inode);
  761. if ((fattr->valid & NFS_ATTR_WCC_V4) != 0 &&
  762. nfsi->change_attr == fattr->pre_change_attr) {
  763. nfsi->change_attr = fattr->change_attr;
  764. if (S_ISDIR(inode->i_mode))
  765. nfsi->cache_validity |= NFS_INO_INVALID_DATA;
  766. }
  767. /* If we have atomic WCC data, we may update some attributes */
  768. if ((fattr->valid & NFS_ATTR_WCC) != 0) {
  769. if (timespec_equal(&inode->i_ctime, &fattr->pre_ctime))
  770. memcpy(&inode->i_ctime, &fattr->ctime, sizeof(inode->i_ctime));
  771. if (timespec_equal(&inode->i_mtime, &fattr->pre_mtime)) {
  772. memcpy(&inode->i_mtime, &fattr->mtime, sizeof(inode->i_mtime));
  773. if (S_ISDIR(inode->i_mode))
  774. nfsi->cache_validity |= NFS_INO_INVALID_DATA;
  775. }
  776. if (i_size_read(inode) == nfs_size_to_loff_t(fattr->pre_size) &&
  777. nfsi->npages == 0)
  778. i_size_write(inode, nfs_size_to_loff_t(fattr->size));
  779. }
  780. }
  781. /**
  782. * nfs_check_inode_attributes - verify consistency of the inode attribute cache
  783. * @inode - pointer to inode
  784. * @fattr - updated attributes
  785. *
  786. * Verifies the attribute cache. If we have just changed the attributes,
  787. * so that fattr carries weak cache consistency data, then it may
  788. * also update the ctime/mtime/change_attribute.
  789. */
  790. static int nfs_check_inode_attributes(struct inode *inode, struct nfs_fattr *fattr)
  791. {
  792. struct nfs_inode *nfsi = NFS_I(inode);
  793. loff_t cur_size, new_isize;
  794. unsigned long invalid = 0;
  795. /* Has the inode gone and changed behind our back? */
  796. if (nfsi->fileid != fattr->fileid
  797. || (inode->i_mode & S_IFMT) != (fattr->mode & S_IFMT)) {
  798. return -EIO;
  799. }
  800. /* Do atomic weak cache consistency updates */
  801. nfs_wcc_update_inode(inode, fattr);
  802. if ((fattr->valid & NFS_ATTR_FATTR_V4) != 0 &&
  803. nfsi->change_attr != fattr->change_attr)
  804. invalid |= NFS_INO_INVALID_ATTR|NFS_INO_REVAL_PAGECACHE;
  805. /* Verify a few of the more important attributes */
  806. if (!timespec_equal(&inode->i_mtime, &fattr->mtime))
  807. invalid |= NFS_INO_INVALID_ATTR|NFS_INO_REVAL_PAGECACHE;
  808. cur_size = i_size_read(inode);
  809. new_isize = nfs_size_to_loff_t(fattr->size);
  810. if (cur_size != new_isize && nfsi->npages == 0)
  811. invalid |= NFS_INO_INVALID_ATTR|NFS_INO_REVAL_PAGECACHE;
  812. /* Have any file permissions changed? */
  813. if ((inode->i_mode & S_IALLUGO) != (fattr->mode & S_IALLUGO)
  814. || inode->i_uid != fattr->uid
  815. || inode->i_gid != fattr->gid)
  816. invalid |= NFS_INO_INVALID_ATTR | NFS_INO_INVALID_ACCESS | NFS_INO_INVALID_ACL;
  817. /* Has the link count changed? */
  818. if (inode->i_nlink != fattr->nlink)
  819. invalid |= NFS_INO_INVALID_ATTR;
  820. if (!timespec_equal(&inode->i_atime, &fattr->atime))
  821. invalid |= NFS_INO_INVALID_ATIME;
  822. if (invalid != 0)
  823. nfsi->cache_validity |= invalid;
  824. else
  825. nfsi->cache_validity &= ~(NFS_INO_INVALID_ATTR
  826. | NFS_INO_INVALID_ATIME
  827. | NFS_INO_REVAL_PAGECACHE);
  828. nfsi->read_cache_jiffies = fattr->time_start;
  829. return 0;
  830. }
  831. static int nfs_ctime_need_update(const struct inode *inode, const struct nfs_fattr *fattr)
  832. {
  833. return timespec_compare(&fattr->ctime, &inode->i_ctime) > 0;
  834. }
  835. static int nfs_size_need_update(const struct inode *inode, const struct nfs_fattr *fattr)
  836. {
  837. return nfs_size_to_loff_t(fattr->size) > i_size_read(inode);
  838. }
  839. /**
  840. * nfs_inode_attrs_need_update - check if the inode attributes need updating
  841. * @inode - pointer to inode
  842. * @fattr - attributes
  843. *
  844. * Attempt to divine whether or not an RPC call reply carrying stale
  845. * attributes got scheduled after another call carrying updated ones.
  846. *
  847. * To do so, the function first assumes that a more recent ctime means
  848. * that the attributes in fattr are newer, however it also attempt to
  849. * catch the case where ctime either didn't change, or went backwards
  850. * (if someone reset the clock on the server) by looking at whether
  851. * or not this RPC call was started after the inode was last updated.
  852. * Note also the check for jiffy wraparound if the last_updated timestamp
  853. * is later than 'jiffies'.
  854. *
  855. * The function returns 'true' if it thinks the attributes in 'fattr' are
  856. * more recent than the ones cached in the inode.
  857. *
  858. */
  859. static int nfs_inode_attrs_need_update(const struct inode *inode, const struct nfs_fattr *fattr)
  860. {
  861. const struct nfs_inode *nfsi = NFS_I(inode);
  862. return nfs_ctime_need_update(inode, fattr) ||
  863. nfs_size_need_update(inode, fattr) ||
  864. time_after(fattr->time_start, nfsi->last_updated) ||
  865. time_after(nfsi->last_updated, jiffies);
  866. }
  867. static int nfs_refresh_inode_locked(struct inode *inode, struct nfs_fattr *fattr)
  868. {
  869. if (nfs_inode_attrs_need_update(inode, fattr))
  870. return nfs_update_inode(inode, fattr);
  871. return nfs_check_inode_attributes(inode, fattr);
  872. }
  873. /**
  874. * nfs_refresh_inode - try to update the inode attribute cache
  875. * @inode - pointer to inode
  876. * @fattr - updated attributes
  877. *
  878. * Check that an RPC call that returned attributes has not overlapped with
  879. * other recent updates of the inode metadata, then decide whether it is
  880. * safe to do a full update of the inode attributes, or whether just to
  881. * call nfs_check_inode_attributes.
  882. */
  883. int nfs_refresh_inode(struct inode *inode, struct nfs_fattr *fattr)
  884. {
  885. int status;
  886. if ((fattr->valid & NFS_ATTR_FATTR) == 0)
  887. return 0;
  888. spin_lock(&inode->i_lock);
  889. status = nfs_refresh_inode_locked(inode, fattr);
  890. spin_unlock(&inode->i_lock);
  891. return status;
  892. }
  893. static int nfs_post_op_update_inode_locked(struct inode *inode, struct nfs_fattr *fattr)
  894. {
  895. struct nfs_inode *nfsi = NFS_I(inode);
  896. nfsi->cache_validity |= NFS_INO_INVALID_ATTR|NFS_INO_REVAL_PAGECACHE;
  897. if (S_ISDIR(inode->i_mode))
  898. nfsi->cache_validity |= NFS_INO_INVALID_DATA;
  899. if ((fattr->valid & NFS_ATTR_FATTR) == 0)
  900. return 0;
  901. return nfs_refresh_inode_locked(inode, fattr);
  902. }
  903. /**
  904. * nfs_post_op_update_inode - try to update the inode attribute cache
  905. * @inode - pointer to inode
  906. * @fattr - updated attributes
  907. *
  908. * After an operation that has changed the inode metadata, mark the
  909. * attribute cache as being invalid, then try to update it.
  910. *
  911. * NB: if the server didn't return any post op attributes, this
  912. * function will force the retrieval of attributes before the next
  913. * NFS request. Thus it should be used only for operations that
  914. * are expected to change one or more attributes, to avoid
  915. * unnecessary NFS requests and trips through nfs_update_inode().
  916. */
  917. int nfs_post_op_update_inode(struct inode *inode, struct nfs_fattr *fattr)
  918. {
  919. int status;
  920. spin_lock(&inode->i_lock);
  921. status = nfs_post_op_update_inode_locked(inode, fattr);
  922. spin_unlock(&inode->i_lock);
  923. return status;
  924. }
  925. /**
  926. * nfs_post_op_update_inode_force_wcc - try to update the inode attribute cache
  927. * @inode - pointer to inode
  928. * @fattr - updated attributes
  929. *
  930. * After an operation that has changed the inode metadata, mark the
  931. * attribute cache as being invalid, then try to update it. Fake up
  932. * weak cache consistency data, if none exist.
  933. *
  934. * This function is mainly designed to be used by the ->write_done() functions.
  935. */
  936. int nfs_post_op_update_inode_force_wcc(struct inode *inode, struct nfs_fattr *fattr)
  937. {
  938. int status;
  939. spin_lock(&inode->i_lock);
  940. /* Don't do a WCC update if these attributes are already stale */
  941. if ((fattr->valid & NFS_ATTR_FATTR) == 0 ||
  942. !nfs_inode_attrs_need_update(inode, fattr)) {
  943. fattr->valid &= ~(NFS_ATTR_WCC_V4|NFS_ATTR_WCC);
  944. goto out_noforce;
  945. }
  946. if ((fattr->valid & NFS_ATTR_FATTR_V4) != 0 &&
  947. (fattr->valid & NFS_ATTR_WCC_V4) == 0) {
  948. fattr->pre_change_attr = NFS_I(inode)->change_attr;
  949. fattr->valid |= NFS_ATTR_WCC_V4;
  950. }
  951. if ((fattr->valid & NFS_ATTR_FATTR) != 0 &&
  952. (fattr->valid & NFS_ATTR_WCC) == 0) {
  953. memcpy(&fattr->pre_ctime, &inode->i_ctime, sizeof(fattr->pre_ctime));
  954. memcpy(&fattr->pre_mtime, &inode->i_mtime, sizeof(fattr->pre_mtime));
  955. fattr->pre_size = i_size_read(inode);
  956. fattr->valid |= NFS_ATTR_WCC;
  957. }
  958. out_noforce:
  959. status = nfs_post_op_update_inode_locked(inode, fattr);
  960. spin_unlock(&inode->i_lock);
  961. return status;
  962. }
  963. /*
  964. * Many nfs protocol calls return the new file attributes after
  965. * an operation. Here we update the inode to reflect the state
  966. * of the server's inode.
  967. *
  968. * This is a bit tricky because we have to make sure all dirty pages
  969. * have been sent off to the server before calling invalidate_inode_pages.
  970. * To make sure no other process adds more write requests while we try
  971. * our best to flush them, we make them sleep during the attribute refresh.
  972. *
  973. * A very similar scenario holds for the dir cache.
  974. */
  975. static int nfs_update_inode(struct inode *inode, struct nfs_fattr *fattr)
  976. {
  977. struct nfs_server *server;
  978. struct nfs_inode *nfsi = NFS_I(inode);
  979. loff_t cur_isize, new_isize;
  980. unsigned long invalid = 0;
  981. unsigned long now = jiffies;
  982. dfprintk(VFS, "NFS: %s(%s/%ld ct=%d info=0x%x)\n",
  983. __func__, inode->i_sb->s_id, inode->i_ino,
  984. atomic_read(&inode->i_count), fattr->valid);
  985. if (nfsi->fileid != fattr->fileid)
  986. goto out_fileid;
  987. /*
  988. * Make sure the inode's type hasn't changed.
  989. */
  990. if ((inode->i_mode & S_IFMT) != (fattr->mode & S_IFMT))
  991. goto out_changed;
  992. server = NFS_SERVER(inode);
  993. /* Update the fsid? */
  994. if (S_ISDIR(inode->i_mode) &&
  995. !nfs_fsid_equal(&server->fsid, &fattr->fsid) &&
  996. !test_bit(NFS_INO_MOUNTPOINT, &nfsi->flags))
  997. server->fsid = fattr->fsid;
  998. /*
  999. * Update the read time so we don't revalidate too often.
  1000. */
  1001. nfsi->read_cache_jiffies = fattr->time_start;
  1002. nfsi->cache_validity &= ~(NFS_INO_INVALID_ATTR | NFS_INO_INVALID_ATIME
  1003. | NFS_INO_REVAL_PAGECACHE);
  1004. /* Do atomic weak cache consistency updates */
  1005. nfs_wcc_update_inode(inode, fattr);
  1006. /* More cache consistency checks */
  1007. if (!(fattr->valid & NFS_ATTR_FATTR_V4)) {
  1008. /* NFSv2/v3: Check if the mtime agrees */
  1009. if (!timespec_equal(&inode->i_mtime, &fattr->mtime)) {
  1010. dprintk("NFS: mtime change on server for file %s/%ld\n",
  1011. inode->i_sb->s_id, inode->i_ino);
  1012. invalid |= NFS_INO_INVALID_ATTR|NFS_INO_INVALID_DATA;
  1013. if (S_ISDIR(inode->i_mode))
  1014. nfs_force_lookup_revalidate(inode);
  1015. }
  1016. /* If ctime has changed we should definitely clear access+acl caches */
  1017. if (!timespec_equal(&inode->i_ctime, &fattr->ctime))
  1018. invalid |= NFS_INO_INVALID_ACCESS|NFS_INO_INVALID_ACL;
  1019. } else if (nfsi->change_attr != fattr->change_attr) {
  1020. dprintk("NFS: change_attr change on server for file %s/%ld\n",
  1021. inode->i_sb->s_id, inode->i_ino);
  1022. invalid |= NFS_INO_INVALID_ATTR|NFS_INO_INVALID_DATA|NFS_INO_INVALID_ACCESS|NFS_INO_INVALID_ACL;
  1023. if (S_ISDIR(inode->i_mode))
  1024. nfs_force_lookup_revalidate(inode);
  1025. }
  1026. /* Check if our cached file size is stale */
  1027. new_isize = nfs_size_to_loff_t(fattr->size);
  1028. cur_isize = i_size_read(inode);
  1029. if (new_isize != cur_isize) {
  1030. /* Do we perhaps have any outstanding writes, or has
  1031. * the file grown beyond our last write? */
  1032. if (nfsi->npages == 0 || new_isize > cur_isize) {
  1033. i_size_write(inode, new_isize);
  1034. invalid |= NFS_INO_INVALID_ATTR|NFS_INO_INVALID_DATA;
  1035. }
  1036. dprintk("NFS: isize change on server for file %s/%ld\n",
  1037. inode->i_sb->s_id, inode->i_ino);
  1038. }
  1039. memcpy(&inode->i_mtime, &fattr->mtime, sizeof(inode->i_mtime));
  1040. memcpy(&inode->i_ctime, &fattr->ctime, sizeof(inode->i_ctime));
  1041. memcpy(&inode->i_atime, &fattr->atime, sizeof(inode->i_atime));
  1042. nfsi->change_attr = fattr->change_attr;
  1043. if ((inode->i_mode & S_IALLUGO) != (fattr->mode & S_IALLUGO) ||
  1044. inode->i_uid != fattr->uid ||
  1045. inode->i_gid != fattr->gid)
  1046. invalid |= NFS_INO_INVALID_ATTR|NFS_INO_INVALID_ACCESS|NFS_INO_INVALID_ACL;
  1047. inode->i_mode = fattr->mode;
  1048. inode->i_nlink = fattr->nlink;
  1049. inode->i_uid = fattr->uid;
  1050. inode->i_gid = fattr->gid;
  1051. if (fattr->valid & (NFS_ATTR_FATTR_V3 | NFS_ATTR_FATTR_V4)) {
  1052. /*
  1053. * report the blocks in 512byte units
  1054. */
  1055. inode->i_blocks = nfs_calc_block_size(fattr->du.nfs3.used);
  1056. } else {
  1057. inode->i_blocks = fattr->du.nfs2.blocks;
  1058. }
  1059. /* Update attrtimeo value if we're out of the unstable period */
  1060. if (invalid & NFS_INO_INVALID_ATTR) {
  1061. nfs_inc_stats(inode, NFSIOS_ATTRINVALIDATE);
  1062. nfsi->attrtimeo = NFS_MINATTRTIMEO(inode);
  1063. nfsi->attrtimeo_timestamp = now;
  1064. nfsi->last_updated = now;
  1065. } else {
  1066. if (!time_in_range(now, nfsi->attrtimeo_timestamp, nfsi->attrtimeo_timestamp + nfsi->attrtimeo)) {
  1067. if ((nfsi->attrtimeo <<= 1) > NFS_MAXATTRTIMEO(inode))
  1068. nfsi->attrtimeo = NFS_MAXATTRTIMEO(inode);
  1069. nfsi->attrtimeo_timestamp = now;
  1070. }
  1071. /*
  1072. * Avoid jiffy wraparound issues with nfsi->last_updated
  1073. */
  1074. if (!time_in_range(nfsi->last_updated, nfsi->read_cache_jiffies, now))
  1075. nfsi->last_updated = nfsi->read_cache_jiffies;
  1076. }
  1077. invalid &= ~NFS_INO_INVALID_ATTR;
  1078. /* Don't invalidate the data if we were to blame */
  1079. if (!(S_ISREG(inode->i_mode) || S_ISDIR(inode->i_mode)
  1080. || S_ISLNK(inode->i_mode)))
  1081. invalid &= ~NFS_INO_INVALID_DATA;
  1082. if (!nfs_have_delegation(inode, FMODE_READ) ||
  1083. (nfsi->cache_validity & NFS_INO_REVAL_FORCED))
  1084. nfsi->cache_validity |= invalid;
  1085. nfsi->cache_validity &= ~NFS_INO_REVAL_FORCED;
  1086. return 0;
  1087. out_changed:
  1088. /*
  1089. * Big trouble! The inode has become a different object.
  1090. */
  1091. printk(KERN_DEBUG "%s: inode %ld mode changed, %07o to %07o\n",
  1092. __func__, inode->i_ino, inode->i_mode, fattr->mode);
  1093. out_err:
  1094. /*
  1095. * No need to worry about unhashing the dentry, as the
  1096. * lookup validation will know that the inode is bad.
  1097. * (But we fall through to invalidate the caches.)
  1098. */
  1099. nfs_invalidate_inode(inode);
  1100. return -ESTALE;
  1101. out_fileid:
  1102. printk(KERN_ERR "NFS: server %s error: fileid changed\n"
  1103. "fsid %s: expected fileid 0x%Lx, got 0x%Lx\n",
  1104. NFS_SERVER(inode)->nfs_client->cl_hostname, inode->i_sb->s_id,
  1105. (long long)nfsi->fileid, (long long)fattr->fileid);
  1106. goto out_err;
  1107. }
  1108. #ifdef CONFIG_NFS_V4
  1109. /*
  1110. * Clean out any remaining NFSv4 state that might be left over due
  1111. * to open() calls that passed nfs_atomic_lookup, but failed to call
  1112. * nfs_open().
  1113. */
  1114. void nfs4_clear_inode(struct inode *inode)
  1115. {
  1116. /* If we are holding a delegation, return it! */
  1117. nfs_inode_return_delegation_noreclaim(inode);
  1118. /* First call standard NFS clear_inode() code */
  1119. nfs_clear_inode(inode);
  1120. }
  1121. #endif
  1122. struct inode *nfs_alloc_inode(struct super_block *sb)
  1123. {
  1124. struct nfs_inode *nfsi;
  1125. nfsi = (struct nfs_inode *)kmem_cache_alloc(nfs_inode_cachep, GFP_KERNEL);
  1126. if (!nfsi)
  1127. return NULL;
  1128. nfsi->flags = 0UL;
  1129. nfsi->cache_validity = 0UL;
  1130. #ifdef CONFIG_NFS_V3_ACL
  1131. nfsi->acl_access = ERR_PTR(-EAGAIN);
  1132. nfsi->acl_default = ERR_PTR(-EAGAIN);
  1133. #endif
  1134. #ifdef CONFIG_NFS_V4
  1135. nfsi->nfs4_acl = NULL;
  1136. #endif /* CONFIG_NFS_V4 */
  1137. return &nfsi->vfs_inode;
  1138. }
  1139. void nfs_destroy_inode(struct inode *inode)
  1140. {
  1141. kmem_cache_free(nfs_inode_cachep, NFS_I(inode));
  1142. }
  1143. static inline void nfs4_init_once(struct nfs_inode *nfsi)
  1144. {
  1145. #ifdef CONFIG_NFS_V4
  1146. INIT_LIST_HEAD(&nfsi->open_states);
  1147. nfsi->delegation = NULL;
  1148. nfsi->delegation_state = 0;
  1149. init_rwsem(&nfsi->rwsem);
  1150. #endif
  1151. }
  1152. static void init_once(void *foo)
  1153. {
  1154. struct nfs_inode *nfsi = (struct nfs_inode *) foo;
  1155. inode_init_once(&nfsi->vfs_inode);
  1156. INIT_LIST_HEAD(&nfsi->open_files);
  1157. INIT_LIST_HEAD(&nfsi->access_cache_entry_lru);
  1158. INIT_LIST_HEAD(&nfsi->access_cache_inode_lru);
  1159. INIT_RADIX_TREE(&nfsi->nfs_page_tree, GFP_ATOMIC);
  1160. nfsi->ncommit = 0;
  1161. nfsi->npages = 0;
  1162. atomic_set(&nfsi->silly_count, 1);
  1163. INIT_HLIST_HEAD(&nfsi->silly_list);
  1164. init_waitqueue_head(&nfsi->waitqueue);
  1165. nfs4_init_once(nfsi);
  1166. }
  1167. static int __init nfs_init_inodecache(void)
  1168. {
  1169. nfs_inode_cachep = kmem_cache_create("nfs_inode_cache",
  1170. sizeof(struct nfs_inode),
  1171. 0, (SLAB_RECLAIM_ACCOUNT|
  1172. SLAB_MEM_SPREAD),
  1173. init_once);
  1174. if (nfs_inode_cachep == NULL)
  1175. return -ENOMEM;
  1176. return 0;
  1177. }
  1178. static void nfs_destroy_inodecache(void)
  1179. {
  1180. kmem_cache_destroy(nfs_inode_cachep);
  1181. }
  1182. struct workqueue_struct *nfsiod_workqueue;
  1183. /*
  1184. * start up the nfsiod workqueue
  1185. */
  1186. static int nfsiod_start(void)
  1187. {
  1188. struct workqueue_struct *wq;
  1189. dprintk("RPC: creating workqueue nfsiod\n");
  1190. wq = create_singlethread_workqueue("nfsiod");
  1191. if (wq == NULL)
  1192. return -ENOMEM;
  1193. nfsiod_workqueue = wq;
  1194. return 0;
  1195. }
  1196. /*
  1197. * Destroy the nfsiod workqueue
  1198. */
  1199. static void nfsiod_stop(void)
  1200. {
  1201. struct workqueue_struct *wq;
  1202. wq = nfsiod_workqueue;
  1203. if (wq == NULL)
  1204. return;
  1205. nfsiod_workqueue = NULL;
  1206. destroy_workqueue(wq);
  1207. }
  1208. /*
  1209. * Initialize NFS
  1210. */
  1211. static int __init init_nfs_fs(void)
  1212. {
  1213. int err;
  1214. err = nfsiod_start();
  1215. if (err)
  1216. goto out6;
  1217. err = nfs_fs_proc_init();
  1218. if (err)
  1219. goto out5;
  1220. err = nfs_init_nfspagecache();
  1221. if (err)
  1222. goto out4;
  1223. err = nfs_init_inodecache();
  1224. if (err)
  1225. goto out3;
  1226. err = nfs_init_readpagecache();
  1227. if (err)
  1228. goto out2;
  1229. err = nfs_init_writepagecache();
  1230. if (err)
  1231. goto out1;
  1232. err = nfs_init_directcache();
  1233. if (err)
  1234. goto out0;
  1235. #ifdef CONFIG_PROC_FS
  1236. rpc_proc_register(&nfs_rpcstat);
  1237. #endif
  1238. if ((err = register_nfs_fs()) != 0)
  1239. goto out;
  1240. return 0;
  1241. out:
  1242. #ifdef CONFIG_PROC_FS
  1243. rpc_proc_unregister("nfs");
  1244. #endif
  1245. nfs_destroy_directcache();
  1246. out0:
  1247. nfs_destroy_writepagecache();
  1248. out1:
  1249. nfs_destroy_readpagecache();
  1250. out2:
  1251. nfs_destroy_inodecache();
  1252. out3:
  1253. nfs_destroy_nfspagecache();
  1254. out4:
  1255. nfs_fs_proc_exit();
  1256. out5:
  1257. nfsiod_stop();
  1258. out6:
  1259. return err;
  1260. }
  1261. static void __exit exit_nfs_fs(void)
  1262. {
  1263. nfs_destroy_directcache();
  1264. nfs_destroy_writepagecache();
  1265. nfs_destroy_readpagecache();
  1266. nfs_destroy_inodecache();
  1267. nfs_destroy_nfspagecache();
  1268. #ifdef CONFIG_PROC_FS
  1269. rpc_proc_unregister("nfs");
  1270. #endif
  1271. unregister_nfs_fs();
  1272. nfs_fs_proc_exit();
  1273. nfsiod_stop();
  1274. }
/* The MODULE_AUTHOR entry below is not quite true; the person named there just maintains this code. */
  1276. MODULE_AUTHOR("Olaf Kirch <okir@monad.swb.de>");
  1277. MODULE_LICENSE("GPL");
  1278. module_param(enable_ino64, bool, 0644);
  1279. module_init(init_nfs_fs)
  1280. module_exit(exit_nfs_fs)