dquot.c 59 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127
71278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320132113221323132413251326132713281329133013311332133313341335133613371338133913401341134213431344134513461347134813491350135113521353135413551356135713581359136013611362136313641365136613671368136913701371137213731374137513761377137813791380138113821383138413851386138713881389139013911392139313941395139613971398139914001401140214031404140514061407140814091410141114121413141414151416141714181419142014211422142314241425142614271428142914301431143214331434143514361437143814391440144114421443144414451446144714481449145014511452145314541455145614571458145914601461146214631464146514661467146814691470147114721473147414751476147714781479148014811482148314841485148614871488148914901491149214931494149514961497149814991500150115021503150415051506150715081509151015111512151315141515151615171518151915201521152215231524152515261527152815291530153115321533153415351536153715381539154015411542154315441545154615471548154915501551155215531554155515561557155815591560156115621563156415651566156715681569157015711572157315741575157615771578157915801581158215831584158515861587158815891590159115921593159415951596159715981599160016011602160316041605160616071608160916101611161216131614161516161617161816191620162116221623162416251626162716281629163016311632163316341635163616371638163916401641164216431644164516461647164816491650165116521653165416551656165716581659166016611662166316641665166616671668166916701671167216731674167516761677167816791680168116821683168416851686168716881689169016911692169316941695169616971698169917001701170217031704170517061707170817091710171117121713171417151716171717181719172017211722172317241725172617271728172917301731173217331734173517361737173817391740174117421743174417451746174717481749175017511752175317541755175617571758175917601761176217631764176517661767176817691770177117721773177417751776177
71778177917801781178217831784178517861787178817891790179117921793179417951796179717981799180018011802180318041805180618071808180918101811181218131814181518161817181818191820182118221823182418251826182718281829183018311832183318341835183618371838183918401841184218431844184518461847184818491850185118521853185418551856185718581859186018611862186318641865186618671868186918701871187218731874187518761877187818791880188118821883188418851886188718881889189018911892189318941895189618971898189919001901190219031904190519061907190819091910191119121913191419151916191719181919192019211922192319241925192619271928192919301931193219331934193519361937193819391940194119421943194419451946194719481949195019511952195319541955195619571958195919601961196219631964196519661967196819691970197119721973197419751976197719781979198019811982198319841985198619871988198919901991199219931994199519961997199819992000200120022003200420052006200720082009201020112012201320142015201620172018201920202021202220232024202520262027202820292030203120322033203420352036203720382039204020412042204320442045204620472048204920502051205220532054205520562057205820592060206120622063206420652066206720682069207020712072207320742075207620772078207920802081208220832084208520862087208820892090209120922093209420952096209720982099210021012102210321042105210621072108
  1. /*
  2. * Implementation of the diskquota system for the LINUX operating system. QUOTA
  3. * is implemented using the BSD system call interface as the means of
  4. * communication with the user level. This file contains the generic routines
  5. * called by the different filesystems on allocation of an inode or block.
  6. * These routines take care of the administration needed to have a consistent
  7. * diskquota tracking system. The ideas of both user and group quotas are based
  8. * on the Melbourne quota system as used on BSD derived systems. The internal
  9. * implementation is based on one of the several variants of the LINUX
  10. * inode-subsystem with added complexity of the diskquota system.
  11. *
  12. * Version: $Id: dquot.c,v 6.3 1996/11/17 18:35:34 mvw Exp mvw $
  13. *
  14. * Author: Marco van Wieringen <mvw@planets.elm.net>
  15. *
  16. * Fixes: Dmitry Gorodchanin <pgmdsg@ibi.com>, 11 Feb 96
  17. *
  18. * Revised list management to avoid races
  19. * -- Bill Hawes, <whawes@star.net>, 9/98
  20. *
  21. * Fixed races in dquot_transfer(), dqget() and dquot_alloc_...().
  22. * As the consequence the locking was moved from dquot_decr_...(),
  23. * dquot_incr_...() to calling functions.
  24. * invalidate_dquots() now writes modified dquots.
  25. * Serialized quota_off() and quota_on() for mount point.
  26. * Fixed a few bugs in grow_dquots().
  27. * Fixed deadlock in write_dquot() - we no longer account quotas on
  28. * quota files
  29. * remove_dquot_ref() moved to inode.c - it now traverses through inodes
  30. * add_dquot_ref() restarts after blocking
  31. * Added check for bogus uid and fixed check for group in quotactl.
  32. * Jan Kara, <jack@suse.cz>, sponsored by SuSE CR, 10-11/99
  33. *
  34. * Used struct list_head instead of own list struct
  35. * Invalidation of referenced dquots is no longer possible
  36. * Improved free_dquots list management
  37. * Quota and i_blocks are now updated in one place to avoid races
  38. * Warnings are now delayed so we won't block in critical section
  39. * Write updated not to require dquot lock
  40. * Jan Kara, <jack@suse.cz>, 9/2000
  41. *
  42. * Added dynamic quota structure allocation
  43. * Jan Kara <jack@suse.cz> 12/2000
  44. *
  45. * Rewritten quota interface. Implemented new quota format and
  46. * formats registering.
  47. * Jan Kara, <jack@suse.cz>, 2001,2002
  48. *
  49. * New SMP locking.
  50. * Jan Kara, <jack@suse.cz>, 10/2002
  51. *
  52. * Added journalled quota support, fix lock inversion problems
  53. * Jan Kara, <jack@suse.cz>, 2003,2004
  54. *
  55. * (C) Copyright 1994 - 1997 Marco van Wieringen
  56. */
  57. #include <linux/errno.h>
  58. #include <linux/kernel.h>
  59. #include <linux/fs.h>
  60. #include <linux/mount.h>
  61. #include <linux/mm.h>
  62. #include <linux/time.h>
  63. #include <linux/types.h>
  64. #include <linux/string.h>
  65. #include <linux/fcntl.h>
  66. #include <linux/stat.h>
  67. #include <linux/tty.h>
  68. #include <linux/file.h>
  69. #include <linux/slab.h>
  70. #include <linux/sysctl.h>
  71. #include <linux/init.h>
  72. #include <linux/module.h>
  73. #include <linux/proc_fs.h>
  74. #include <linux/security.h>
  75. #include <linux/kmod.h>
  76. #include <linux/namei.h>
  77. #include <linux/buffer_head.h>
  78. #include <linux/capability.h>
  79. #include <linux/quotaops.h>
  80. #include <linux/writeback.h> /* for inode_lock, oddly enough.. */
  81. #ifdef CONFIG_QUOTA_NETLINK_INTERFACE
  82. #include <net/netlink.h>
  83. #include <net/genetlink.h>
  84. #endif
  85. #include <asm/uaccess.h>
  86. #define __DQUOT_PARANOIA
  87. /*
  88. * There are two quota SMP locks. dq_list_lock protects all lists with quotas
  89. * and quota formats and also dqstats structure containing statistics about the
  90. * lists. dq_data_lock protects data from dq_dqb and also mem_dqinfo structures
  91. * and also guards consistency of dquot->dq_dqb with inode->i_blocks, i_bytes.
  92. * i_blocks and i_bytes updates itself are guarded by i_lock acquired directly
  93. * in inode_add_bytes() and inode_sub_bytes().
  94. *
  95. * The spinlock ordering is hence: dq_data_lock > dq_list_lock > i_lock
  96. *
 * Note that some things (e.g. sb pointer, type, id) don't change during
 * the life of the dquot structure and so needn't be protected by a lock.
  99. *
  100. * Any operation working on dquots via inode pointers must hold dqptr_sem. If
  101. * operation is just reading pointers from inode (or not using them at all) the
  102. * read lock is enough. If pointers are altered function must hold write lock
  103. * (these locking rules also apply for S_NOQUOTA flag in the inode - note that
  104. * for altering the flag i_mutex is also needed). If operation is holding
  105. * reference to dquot in other way (e.g. quotactl ops) it must be guarded by
  106. * dqonoff_mutex.
  107. * This locking assures that:
  108. * a) update/access to dquot pointers in inode is serialized
  109. * b) everyone is guarded against invalidate_dquots()
  110. *
  111. * Each dquot has its dq_lock mutex. Locked dquots might not be referenced
  112. * from inodes (dquot_alloc_space() and such don't check the dq_lock).
  113. * Currently dquot is locked only when it is being read to memory (or space for
  114. * it is being allocated) on the first dqget() and when it is being released on
 * the last dqput(). The allocation and release operations are serialized by
  116. * the dq_lock and by checking the use count in dquot_release(). Write
  117. * operations on dquots don't hold dq_lock as they copy data under dq_data_lock
  118. * spinlock to internal buffers before writing.
  119. *
  120. * Lock ordering (including related VFS locks) is the following:
 * i_mutex > dqonoff_mutex > journal_lock > dqptr_sem > dquot->dq_lock >
  122. * dqio_mutex
  123. * i_mutex on quota files is special (it's below dqio_mutex)
  124. */
/* Protects all dquot lists, the quota format list and dqstats */
static DEFINE_SPINLOCK(dq_list_lock);
/* Protects dq_dqb data and mem_dqinfo structures (see locking notes above) */
DEFINE_SPINLOCK(dq_data_lock);
/* Names of the quota types, indexed by dq_type; used in diagnostics */
static char *quotatypes[] = INITQFNAMES;
static struct quota_format_type *quota_formats;	/* List of registered formats */
/* Format id -> module name table consulted by find_quota_format();
 * the table ends at the first entry whose qm_fmt_id is 0 */
static struct quota_module_name module_names[] = INIT_QUOTA_MODULE_NAMES;
/* SLAB cache for dquot structures */
static struct kmem_cache *dquot_cachep;
  132. int register_quota_format(struct quota_format_type *fmt)
  133. {
  134. spin_lock(&dq_list_lock);
  135. fmt->qf_next = quota_formats;
  136. quota_formats = fmt;
  137. spin_unlock(&dq_list_lock);
  138. return 0;
  139. }
  140. void unregister_quota_format(struct quota_format_type *fmt)
  141. {
  142. struct quota_format_type **actqf;
  143. spin_lock(&dq_list_lock);
  144. for (actqf = &quota_formats; *actqf && *actqf != fmt; actqf = &(*actqf)->qf_next);
  145. if (*actqf)
  146. *actqf = (*actqf)->qf_next;
  147. spin_unlock(&dq_list_lock);
  148. }
  149. static struct quota_format_type *find_quota_format(int id)
  150. {
  151. struct quota_format_type *actqf;
  152. spin_lock(&dq_list_lock);
  153. for (actqf = quota_formats; actqf && actqf->qf_fmt_id != id; actqf = actqf->qf_next);
  154. if (!actqf || !try_module_get(actqf->qf_owner)) {
  155. int qm;
  156. spin_unlock(&dq_list_lock);
  157. for (qm = 0; module_names[qm].qm_fmt_id && module_names[qm].qm_fmt_id != id; qm++);
  158. if (!module_names[qm].qm_fmt_id || request_module(module_names[qm].qm_mod_name))
  159. return NULL;
  160. spin_lock(&dq_list_lock);
  161. for (actqf = quota_formats; actqf && actqf->qf_fmt_id != id; actqf = actqf->qf_next);
  162. if (actqf && !try_module_get(actqf->qf_owner))
  163. actqf = NULL;
  164. }
  165. spin_unlock(&dq_list_lock);
  166. return actqf;
  167. }
  168. static void put_quota_format(struct quota_format_type *fmt)
  169. {
  170. module_put(fmt->qf_owner);
  171. }
  172. /*
  173. * Dquot List Management:
  174. * The quota code uses three lists for dquot management: the inuse_list,
  175. * free_dquots, and dquot_hash[] array. A single dquot structure may be
  176. * on all three lists, depending on its current state.
  177. *
  178. * All dquots are placed to the end of inuse_list when first created, and this
  179. * list is used for invalidate operation, which must look at every dquot.
  180. *
  181. * Unused dquots (dq_count == 0) are added to the free_dquots list when freed,
  182. * and this list is searched whenever we need an available dquot. Dquots are
  183. * removed from the list as soon as they are used again, and
  184. * dqstats.free_dquots gives the number of dquots on the list. When
  185. * dquot is invalidated it's completely released from memory.
  186. *
  187. * Dquots with a specific identity (device, type and id) are placed on
 * one of the dquot_hash[] hash chains. This provides an efficient search
  189. * mechanism to locate a specific dquot.
  190. */
/* Every allocated dquot; new dquots are appended at the tail (put_inuse()) */
static LIST_HEAD(inuse_list);
/* Dquots with no users; dqstats.free_dquots counts the entries */
static LIST_HEAD(free_dquots);
/* Shift and mask used by hashfn() to pick a dquot_hash[] bucket */
static unsigned int dq_hash_bits, dq_hash_mask;
/* Hash table of dquots, indexed by hashfn(sb, id, type) */
static struct hlist_head *dquot_hash;
/* Global quota statistics; updated under dq_list_lock */
struct dqstats dqstats;
/* Forward declaration: invalidate_dquots() and vfs_quota_sync() call dqput()
 * before its definition */
static void dqput(struct dquot *dquot);
  197. static inline unsigned int
  198. hashfn(const struct super_block *sb, unsigned int id, int type)
  199. {
  200. unsigned long tmp;
  201. tmp = (((unsigned long)sb>>L1_CACHE_SHIFT) ^ id) * (MAXQUOTAS - type);
  202. return (tmp + (tmp >> dq_hash_bits)) & dq_hash_mask;
  203. }
  204. /*
  205. * Following list functions expect dq_list_lock to be held
  206. */
  207. static inline void insert_dquot_hash(struct dquot *dquot)
  208. {
  209. struct hlist_head *head = dquot_hash + hashfn(dquot->dq_sb, dquot->dq_id, dquot->dq_type);
  210. hlist_add_head(&dquot->dq_hash, head);
  211. }
  212. static inline void remove_dquot_hash(struct dquot *dquot)
  213. {
  214. hlist_del_init(&dquot->dq_hash);
  215. }
  216. static inline struct dquot *find_dquot(unsigned int hashent, struct super_block *sb, unsigned int id, int type)
  217. {
  218. struct hlist_node *node;
  219. struct dquot *dquot;
  220. hlist_for_each (node, dquot_hash+hashent) {
  221. dquot = hlist_entry(node, struct dquot, dq_hash);
  222. if (dquot->dq_sb == sb && dquot->dq_id == id && dquot->dq_type == type)
  223. return dquot;
  224. }
  225. return NODQUOT;
  226. }
  227. /* Add a dquot to the tail of the free list */
  228. static inline void put_dquot_last(struct dquot *dquot)
  229. {
  230. list_add_tail(&dquot->dq_free, &free_dquots);
  231. dqstats.free_dquots++;
  232. }
  233. static inline void remove_free_dquot(struct dquot *dquot)
  234. {
  235. if (list_empty(&dquot->dq_free))
  236. return;
  237. list_del_init(&dquot->dq_free);
  238. dqstats.free_dquots--;
  239. }
  240. static inline void put_inuse(struct dquot *dquot)
  241. {
  242. /* We add to the back of inuse list so we don't have to restart
  243. * when traversing this list and we block */
  244. list_add_tail(&dquot->dq_inuse, &inuse_list);
  245. dqstats.allocated_dquots++;
  246. }
  247. static inline void remove_inuse(struct dquot *dquot)
  248. {
  249. dqstats.allocated_dquots--;
  250. list_del(&dquot->dq_inuse);
  251. }
  252. /*
  253. * End of list functions needing dq_list_lock
  254. */
  255. static void wait_on_dquot(struct dquot *dquot)
  256. {
  257. mutex_lock(&dquot->dq_lock);
  258. mutex_unlock(&dquot->dq_lock);
  259. }
  260. static inline int dquot_dirty(struct dquot *dquot)
  261. {
  262. return test_bit(DQ_MOD_B, &dquot->dq_flags);
  263. }
  264. static inline int mark_dquot_dirty(struct dquot *dquot)
  265. {
  266. return dquot->dq_sb->dq_op->mark_dirty(dquot);
  267. }
  268. int dquot_mark_dquot_dirty(struct dquot *dquot)
  269. {
  270. spin_lock(&dq_list_lock);
  271. if (!test_and_set_bit(DQ_MOD_B, &dquot->dq_flags))
  272. list_add(&dquot->dq_dirty, &sb_dqopt(dquot->dq_sb)->
  273. info[dquot->dq_type].dqi_dirty_list);
  274. spin_unlock(&dq_list_lock);
  275. return 0;
  276. }
  277. /* This function needs dq_list_lock */
  278. static inline int clear_dquot_dirty(struct dquot *dquot)
  279. {
  280. if (!test_and_clear_bit(DQ_MOD_B, &dquot->dq_flags))
  281. return 0;
  282. list_del_init(&dquot->dq_dirty);
  283. return 1;
  284. }
  285. void mark_info_dirty(struct super_block *sb, int type)
  286. {
  287. set_bit(DQF_INFO_DIRTY_B, &sb_dqopt(sb)->info[type].dqi_flags);
  288. }
  289. EXPORT_SYMBOL(mark_info_dirty);
  290. /*
  291. * Read dquot from disk and alloc space for it
  292. */
  293. int dquot_acquire(struct dquot *dquot)
  294. {
  295. int ret = 0, ret2 = 0;
  296. struct quota_info *dqopt = sb_dqopt(dquot->dq_sb);
  297. mutex_lock(&dquot->dq_lock);
  298. mutex_lock(&dqopt->dqio_mutex);
  299. if (!test_bit(DQ_READ_B, &dquot->dq_flags))
  300. ret = dqopt->ops[dquot->dq_type]->read_dqblk(dquot);
  301. if (ret < 0)
  302. goto out_iolock;
  303. set_bit(DQ_READ_B, &dquot->dq_flags);
  304. /* Instantiate dquot if needed */
  305. if (!test_bit(DQ_ACTIVE_B, &dquot->dq_flags) && !dquot->dq_off) {
  306. ret = dqopt->ops[dquot->dq_type]->commit_dqblk(dquot);
  307. /* Write the info if needed */
  308. if (info_dirty(&dqopt->info[dquot->dq_type]))
  309. ret2 = dqopt->ops[dquot->dq_type]->write_file_info(dquot->dq_sb, dquot->dq_type);
  310. if (ret < 0)
  311. goto out_iolock;
  312. if (ret2 < 0) {
  313. ret = ret2;
  314. goto out_iolock;
  315. }
  316. }
  317. set_bit(DQ_ACTIVE_B, &dquot->dq_flags);
  318. out_iolock:
  319. mutex_unlock(&dqopt->dqio_mutex);
  320. mutex_unlock(&dquot->dq_lock);
  321. return ret;
  322. }
  323. /*
  324. * Write dquot to disk
  325. */
  326. int dquot_commit(struct dquot *dquot)
  327. {
  328. int ret = 0, ret2 = 0;
  329. struct quota_info *dqopt = sb_dqopt(dquot->dq_sb);
  330. mutex_lock(&dqopt->dqio_mutex);
  331. spin_lock(&dq_list_lock);
  332. if (!clear_dquot_dirty(dquot)) {
  333. spin_unlock(&dq_list_lock);
  334. goto out_sem;
  335. }
  336. spin_unlock(&dq_list_lock);
  337. /* Inactive dquot can be only if there was error during read/init
  338. * => we have better not writing it */
  339. if (test_bit(DQ_ACTIVE_B, &dquot->dq_flags)) {
  340. ret = dqopt->ops[dquot->dq_type]->commit_dqblk(dquot);
  341. if (info_dirty(&dqopt->info[dquot->dq_type]))
  342. ret2 = dqopt->ops[dquot->dq_type]->write_file_info(dquot->dq_sb, dquot->dq_type);
  343. if (ret >= 0)
  344. ret = ret2;
  345. }
  346. out_sem:
  347. mutex_unlock(&dqopt->dqio_mutex);
  348. return ret;
  349. }
  350. /*
  351. * Release dquot
  352. */
  353. int dquot_release(struct dquot *dquot)
  354. {
  355. int ret = 0, ret2 = 0;
  356. struct quota_info *dqopt = sb_dqopt(dquot->dq_sb);
  357. mutex_lock(&dquot->dq_lock);
  358. /* Check whether we are not racing with some other dqget() */
  359. if (atomic_read(&dquot->dq_count) > 1)
  360. goto out_dqlock;
  361. mutex_lock(&dqopt->dqio_mutex);
  362. if (dqopt->ops[dquot->dq_type]->release_dqblk) {
  363. ret = dqopt->ops[dquot->dq_type]->release_dqblk(dquot);
  364. /* Write the info */
  365. if (info_dirty(&dqopt->info[dquot->dq_type]))
  366. ret2 = dqopt->ops[dquot->dq_type]->write_file_info(dquot->dq_sb, dquot->dq_type);
  367. if (ret >= 0)
  368. ret = ret2;
  369. }
  370. clear_bit(DQ_ACTIVE_B, &dquot->dq_flags);
  371. mutex_unlock(&dqopt->dqio_mutex);
  372. out_dqlock:
  373. mutex_unlock(&dquot->dq_lock);
  374. return ret;
  375. }
/* Invalidate all dquots on the list. Note that this function is called after
 * quota is disabled and pointers from inodes removed so there cannot be new
 * quota users. There can still be some users of quotas due to inodes being
 * just deleted or pruned by prune_icache() (those are not attached to any
 * list). We have to wait for such users.
 *
 * Walks inuse_list under dq_list_lock. Every dquot that belongs to @sb and
 * has quota type @type is unhashed, removed from the free and inuse lists
 * and returned to dquot_cachep. A dquot that still has users is waited for
 * first; after each such wait the whole walk starts over.
 */
static void invalidate_dquots(struct super_block *sb, int type)
{
	struct dquot *dquot, *tmp;

restart:
	spin_lock(&dq_list_lock);
	list_for_each_entry_safe(dquot, tmp, &inuse_list, dq_inuse) {
		if (dquot->dq_sb != sb)
			continue;
		if (dquot->dq_type != type)
			continue;
		/* Wait for dquot users */
		if (atomic_read(&dquot->dq_count)) {
			DEFINE_WAIT(wait);

			/* Take a reference of our own before dropping
			 * dq_list_lock; it is given back by the dqput()
			 * below. */
			atomic_inc(&dquot->dq_count);
			/* Queue on dq_wait_unused while still under the list
			 * lock; dqput() issues its wake_up() on this queue
			 * under the same lock. */
			prepare_to_wait(&dquot->dq_wait_unused, &wait,
					TASK_UNINTERRUPTIBLE);
			spin_unlock(&dq_list_lock);
			/* Once dqput() wakes us up, we know it's time to free
			 * the dquot.
			 * IMPORTANT: we rely on the fact that there is always
			 * at most one process waiting for dquot to free.
			 * Otherwise dq_count would be > 1 and we would never
			 * wake up.
			 */
			/* Sleep only if someone besides us still holds a
			 * reference */
			if (atomic_read(&dquot->dq_count) > 1)
				schedule();
			finish_wait(&dquot->dq_wait_unused, &wait);
			dqput(dquot);
			/* At this moment the dquot need not exist (it could
			 * have been reclaimed by prune_dqcache()). Hence we
			 * must restart. */
			goto restart;
		}
		/*
		 * Quota now has no users and it has been written on last
		 * dqput()
		 */
		remove_dquot_hash(dquot);
		remove_free_dquot(dquot);
		remove_inuse(dquot);
		kmem_cache_free(dquot_cachep, dquot);
	}
	spin_unlock(&dq_list_lock);
}
/*
 * Write out dirty dquots and dirty quota info of @sb.
 *
 * @type selects a single quota type, or -1 for every type. Types that are
 * not enabled on @sb are skipped. The whole operation runs under
 * dqonoff_mutex. The return values of ->write_dquot() and ->write_info()
 * are not checked; the function always returns 0.
 */
int vfs_quota_sync(struct super_block *sb, int type)
{
	struct list_head *dirty;
	struct dquot *dquot;
	struct quota_info *dqopt = sb_dqopt(sb);
	int cnt;

	mutex_lock(&dqopt->dqonoff_mutex);
	for (cnt = 0; cnt < MAXQUOTAS; cnt++) {
		if (type != -1 && cnt != type)
			continue;
		if (!sb_has_quota_enabled(sb, cnt))
			continue;
		spin_lock(&dq_list_lock);
		dirty = &dqopt->info[cnt].dqi_dirty_list;
		/* Always look at the first entry: the list can change while
		 * dq_list_lock is dropped for the write below */
		while (!list_empty(dirty)) {
			dquot = list_first_entry(dirty, struct dquot, dq_dirty);
			/* Dirty and inactive can be only bad dquot... */
			if (!test_bit(DQ_ACTIVE_B, &dquot->dq_flags)) {
				/* Takes the dquot off the dirty list without
				 * writing it */
				clear_dquot_dirty(dquot);
				continue;
			}
			/* Now we have active dquot from which someone is
			 * holding reference so we can safely just increase
			 * use count */
			atomic_inc(&dquot->dq_count);
			dqstats.lookups++;
			spin_unlock(&dq_list_lock);
			sb->dq_op->write_dquot(dquot);
			dqput(dquot);
			spin_lock(&dq_list_lock);
		}
		spin_unlock(&dq_list_lock);
	}
	/* Second pass: write the info of every selected, enabled type whose
	 * info is dirty */
	for (cnt = 0; cnt < MAXQUOTAS; cnt++)
		if ((cnt == type || type == -1) && sb_has_quota_enabled(sb, cnt)
		    && info_dirty(&dqopt->info[cnt]))
			sb->dq_op->write_info(sb, cnt);
	spin_lock(&dq_list_lock);
	dqstats.syncs++;
	spin_unlock(&dq_list_lock);
	mutex_unlock(&dqopt->dqonoff_mutex);
	return 0;
}
  469. /* Free unused dquots from cache */
  470. static void prune_dqcache(int count)
  471. {
  472. struct list_head *head;
  473. struct dquot *dquot;
  474. head = free_dquots.prev;
  475. while (head != &free_dquots && count) {
  476. dquot = list_entry(head, struct dquot, dq_free);
  477. remove_dquot_hash(dquot);
  478. remove_free_dquot(dquot);
  479. remove_inuse(dquot);
  480. kmem_cache_free(dquot_cachep, dquot);
  481. count--;
  482. head = free_dquots.prev;
  483. }
  484. }
  485. /*
  486. * This is called from kswapd when we think we need some
  487. * more memory
  488. */
  489. static int shrink_dqcache_memory(int nr, gfp_t gfp_mask)
  490. {
  491. if (nr) {
  492. spin_lock(&dq_list_lock);
  493. prune_dqcache(nr);
  494. spin_unlock(&dq_list_lock);
  495. }
  496. return (dqstats.free_dquots / 100) * sysctl_vfs_cache_pressure;
  497. }
/* Shrinker descriptor that uses shrink_dqcache_memory() as its callback
 * for the dquot cache */
static struct shrinker dqcache_shrinker = {
	.shrink = shrink_dqcache_memory,
	.seeks = DEFAULT_SEEKS,
};
  502. /*
  503. * Put reference to dquot
  504. * NOTE: If you change this function please check whether dqput_blocks() works right...
  505. * MUST be called with either dqptr_sem or dqonoff_mutex held
  506. */
  507. static void dqput(struct dquot *dquot)
  508. {
  509. int ret;
  510. if (!dquot)
  511. return;
  512. #ifdef __DQUOT_PARANOIA
  513. if (!atomic_read(&dquot->dq_count)) {
  514. printk("VFS: dqput: trying to free free dquot\n");
  515. printk("VFS: device %s, dquot of %s %d\n",
  516. dquot->dq_sb->s_id,
  517. quotatypes[dquot->dq_type],
  518. dquot->dq_id);
  519. BUG();
  520. }
  521. #endif
  522. spin_lock(&dq_list_lock);
  523. dqstats.drops++;
  524. spin_unlock(&dq_list_lock);
  525. we_slept:
  526. spin_lock(&dq_list_lock);
  527. if (atomic_read(&dquot->dq_count) > 1) {
  528. /* We have more than one user... nothing to do */
  529. atomic_dec(&dquot->dq_count);
  530. /* Releasing dquot during quotaoff phase? */
  531. if (!sb_has_quota_enabled(dquot->dq_sb, dquot->dq_type) &&
  532. atomic_read(&dquot->dq_count) == 1)
  533. wake_up(&dquot->dq_wait_unused);
  534. spin_unlock(&dq_list_lock);
  535. return;
  536. }
  537. /* Need to release dquot? */
  538. if (test_bit(DQ_ACTIVE_B, &dquot->dq_flags) && dquot_dirty(dquot)) {
  539. spin_unlock(&dq_list_lock);
  540. /* Commit dquot before releasing */
  541. ret = dquot->dq_sb->dq_op->write_dquot(dquot);
  542. if (ret < 0) {
  543. printk(KERN_ERR "VFS: cannot write quota structure on "
  544. "device %s (error %d). Quota may get out of "
  545. "sync!\n", dquot->dq_sb->s_id, ret);
  546. /*
  547. * We clear dirty bit anyway, so that we avoid
  548. * infinite loop here
  549. */
  550. spin_lock(&dq_list_lock);
  551. clear_dquot_dirty(dquot);
  552. spin_unlock(&dq_list_lock);
  553. }
  554. goto we_slept;
  555. }
  556. /* Clear flag in case dquot was inactive (something bad happened) */
  557. clear_dquot_dirty(dquot);
  558. if (test_bit(DQ_ACTIVE_B, &dquot->dq_flags)) {
  559. spin_unlock(&dq_list_lock);
  560. dquot->dq_sb->dq_op->release_dquot(dquot);
  561. goto we_slept;
  562. }
  563. atomic_dec(&dquot->dq_count);
  564. #ifdef __DQUOT_PARANOIA
  565. /* sanity check */
  566. BUG_ON(!list_empty(&dquot->dq_free));
  567. #endif
  568. put_dquot_last(dquot);
  569. spin_unlock(&dq_list_lock);
  570. }
  571. static struct dquot *get_empty_dquot(struct super_block *sb, int type)
  572. {
  573. struct dquot *dquot;
  574. dquot = kmem_cache_zalloc(dquot_cachep, GFP_NOFS);
  575. if(!dquot)
  576. return NODQUOT;
  577. mutex_init(&dquot->dq_lock);
  578. INIT_LIST_HEAD(&dquot->dq_free);
  579. INIT_LIST_HEAD(&dquot->dq_inuse);
  580. INIT_HLIST_NODE(&dquot->dq_hash);
  581. INIT_LIST_HEAD(&dquot->dq_dirty);
  582. init_waitqueue_head(&dquot->dq_wait_unused);
  583. dquot->dq_sb = sb;
  584. dquot->dq_type = type;
  585. atomic_set(&dquot->dq_count, 1);
  586. return dquot;
  587. }
/*
 * Get reference to dquot
 * MUST be called with either dqptr_sem or dqonoff_mutex held
 *
 * Returns the dquot for (@sb, @id, @type) with its use count raised, or
 * NODQUOT when quota of @type is not enabled on @sb or the dquot cannot be
 * acquired. A dquot found in the hash is reused; otherwise a new one is
 * allocated, put on inuse_list and hashed. The reference is dropped with
 * dqput().
 */
static struct dquot *dqget(struct super_block *sb, unsigned int id, int type)
{
	unsigned int hashent = hashfn(sb, id, type);
	struct dquot *dquot, *empty = NODQUOT;

	if (!sb_has_quota_enabled(sb, type))
		return NODQUOT;
we_slept:
	spin_lock(&dq_list_lock);
	if ((dquot = find_dquot(hashent, sb, id, type)) == NODQUOT) {
		if (empty == NODQUOT) {
			/* Allocate outside the spinlock, then repeat the
			 * lookup from the top. If the allocation failed,
			 * 'empty' is still NODQUOT and we come back here. */
			spin_unlock(&dq_list_lock);
			if ((empty = get_empty_dquot(sb, type)) == NODQUOT)
				schedule();	/* Try to wait for a moment... */
			goto we_slept;
		}
		/* Still not hashed: install the preallocated dquot, which
		 * already carries a use count of 1 */
		dquot = empty;
		dquot->dq_id = id;
		/* all dquots go on the inuse_list */
		put_inuse(dquot);
		/* hash it first so it can be found */
		insert_dquot_hash(dquot);
		dqstats.lookups++;
		spin_unlock(&dq_list_lock);
	} else {
		/* An unused dquot sits on the free list; take it off before
		 * handing out a reference */
		if (!atomic_read(&dquot->dq_count))
			remove_free_dquot(dquot);
		atomic_inc(&dquot->dq_count);
		dqstats.cache_hits++;
		dqstats.lookups++;
		spin_unlock(&dq_list_lock);
		/* The dquot got hashed while we were allocating, so the
		 * spare is not needed */
		if (empty)
			kmem_cache_free(dquot_cachep, empty);
	}
	/* Wait for dq_lock - after this we know that either dquot_release() is already
	 * finished or it will be canceled due to dq_count > 1 test */
	wait_on_dquot(dquot);
	/* Read the dquot and instantiate it (everything done only if needed) */
	if (!test_bit(DQ_ACTIVE_B, &dquot->dq_flags) && sb->dq_op->acquire_dquot(dquot) < 0) {
		/* Acquire failed: give the reference back and report failure */
		dqput(dquot);
		return NODQUOT;
	}
#ifdef __DQUOT_PARANOIA
	BUG_ON(!dquot->dq_sb);	/* Has somebody invalidated entry under us? */
#endif

	return dquot;
}
  638. static int dqinit_needed(struct inode *inode, int type)
  639. {
  640. int cnt;
  641. if (IS_NOQUOTA(inode))
  642. return 0;
  643. if (type != -1)
  644. return inode->i_dquot[type] == NODQUOT;
  645. for (cnt = 0; cnt < MAXQUOTAS; cnt++)
  646. if (inode->i_dquot[cnt] == NODQUOT)
  647. return 1;
  648. return 0;
  649. }
  650. /* This routine is guarded by dqonoff_mutex mutex */
  651. static void add_dquot_ref(struct super_block *sb, int type)
  652. {
  653. struct inode *inode, *old_inode = NULL;
  654. spin_lock(&inode_lock);
  655. list_for_each_entry(inode, &sb->s_inodes, i_sb_list) {
  656. if (!atomic_read(&inode->i_writecount))
  657. continue;
  658. if (!dqinit_needed(inode, type))
  659. continue;
  660. if (inode->i_state & (I_FREEING|I_WILL_FREE))
  661. continue;
  662. __iget(inode);
  663. spin_unlock(&inode_lock);
  664. iput(old_inode);
  665. sb->dq_op->initialize(inode, type);
  666. /* We hold a reference to 'inode' so it couldn't have been
  667. * removed from s_inodes list while we dropped the inode_lock.
  668. * We cannot iput the inode now as we can be holding the last
  669. * reference and we cannot iput it under inode_lock. So we
  670. * keep the reference and iput it later. */
  671. old_inode = inode;
  672. spin_lock(&inode_lock);
  673. }
  674. spin_unlock(&inode_lock);
  675. iput(old_inode);
  676. }
  677. /* Return 0 if dqput() won't block (note that 1 doesn't necessarily mean blocking) */
  678. static inline int dqput_blocks(struct dquot *dquot)
  679. {
  680. if (atomic_read(&dquot->dq_count) <= 1)
  681. return 1;
  682. return 0;
  683. }
  684. /* Remove references to dquots from inode - add dquot to list for freeing if needed */
  685. /* We can't race with anybody because we hold dqptr_sem for writing... */
  686. static int remove_inode_dquot_ref(struct inode *inode, int type,
  687. struct list_head *tofree_head)
  688. {
  689. struct dquot *dquot = inode->i_dquot[type];
  690. inode->i_dquot[type] = NODQUOT;
  691. if (dquot != NODQUOT) {
  692. if (dqput_blocks(dquot)) {
  693. #ifdef __DQUOT_PARANOIA
  694. if (atomic_read(&dquot->dq_count) != 1)
  695. printk(KERN_WARNING "VFS: Adding dquot with dq_count %d to dispose list.\n", atomic_read(&dquot->dq_count));
  696. #endif
  697. spin_lock(&dq_list_lock);
  698. list_add(&dquot->dq_free, tofree_head); /* As dquot must have currently users it can't be on the free list... */
  699. spin_unlock(&dq_list_lock);
  700. return 1;
  701. }
  702. else
  703. dqput(dquot); /* We have guaranteed we won't block */
  704. }
  705. return 0;
  706. }
  707. /* Free list of dquots - called from inode.c */
  708. /* dquots are removed from inodes, no new references can be got so we are the only ones holding reference */
  709. static void put_dquot_list(struct list_head *tofree_head)
  710. {
  711. struct list_head *act_head;
  712. struct dquot *dquot;
  713. act_head = tofree_head->next;
  714. /* So now we have dquots on the list... Just free them */
  715. while (act_head != tofree_head) {
  716. dquot = list_entry(act_head, struct dquot, dq_free);
  717. act_head = act_head->next;
  718. list_del_init(&dquot->dq_free); /* Remove dquot from the list so we won't have problems... */
  719. dqput(dquot);
  720. }
  721. }
  722. static void remove_dquot_ref(struct super_block *sb, int type,
  723. struct list_head *tofree_head)
  724. {
  725. struct inode *inode;
  726. spin_lock(&inode_lock);
  727. list_for_each_entry(inode, &sb->s_inodes, i_sb_list) {
  728. if (!IS_NOQUOTA(inode))
  729. remove_inode_dquot_ref(inode, type, tofree_head);
  730. }
  731. spin_unlock(&inode_lock);
  732. }
  733. /* Gather all references from inodes and drop them */
  734. static void drop_dquot_ref(struct super_block *sb, int type)
  735. {
  736. LIST_HEAD(tofree_head);
  737. if (sb->dq_op) {
  738. down_write(&sb_dqopt(sb)->dqptr_sem);
  739. remove_dquot_ref(sb, type, &tofree_head);
  740. up_write(&sb_dqopt(sb)->dqptr_sem);
  741. put_dquot_list(&tofree_head);
  742. }
  743. }
  744. static inline void dquot_incr_inodes(struct dquot *dquot, unsigned long number)
  745. {
  746. dquot->dq_dqb.dqb_curinodes += number;
  747. }
  748. static inline void dquot_incr_space(struct dquot *dquot, qsize_t number)
  749. {
  750. dquot->dq_dqb.dqb_curspace += number;
  751. }
  752. static inline void dquot_decr_inodes(struct dquot *dquot, unsigned long number)
  753. {
  754. if (dquot->dq_dqb.dqb_curinodes > number)
  755. dquot->dq_dqb.dqb_curinodes -= number;
  756. else
  757. dquot->dq_dqb.dqb_curinodes = 0;
  758. if (dquot->dq_dqb.dqb_curinodes <= dquot->dq_dqb.dqb_isoftlimit)
  759. dquot->dq_dqb.dqb_itime = (time_t) 0;
  760. clear_bit(DQ_INODES_B, &dquot->dq_flags);
  761. }
  762. static inline void dquot_decr_space(struct dquot *dquot, qsize_t number)
  763. {
  764. if (dquot->dq_dqb.dqb_curspace > number)
  765. dquot->dq_dqb.dqb_curspace -= number;
  766. else
  767. dquot->dq_dqb.dqb_curspace = 0;
  768. if (toqb(dquot->dq_dqb.dqb_curspace) <= dquot->dq_dqb.dqb_bsoftlimit)
  769. dquot->dq_dqb.dqb_btime = (time_t) 0;
  770. clear_bit(DQ_BLKS_B, &dquot->dq_flags);
  771. }
  772. static int warning_issued(struct dquot *dquot, const int warntype)
  773. {
  774. int flag = (warntype == QUOTA_NL_BHARDWARN ||
  775. warntype == QUOTA_NL_BSOFTLONGWARN) ? DQ_BLKS_B :
  776. ((warntype == QUOTA_NL_IHARDWARN ||
  777. warntype == QUOTA_NL_ISOFTLONGWARN) ? DQ_INODES_B : 0);
  778. if (!flag)
  779. return 0;
  780. return test_and_set_bit(flag, &dquot->dq_flags);
  781. }
  782. #ifdef CONFIG_PRINT_QUOTA_WARNING
  783. static int flag_print_warnings = 1;
  784. static inline int need_print_warning(struct dquot *dquot)
  785. {
  786. if (!flag_print_warnings)
  787. return 0;
  788. switch (dquot->dq_type) {
  789. case USRQUOTA:
  790. return current->fsuid == dquot->dq_id;
  791. case GRPQUOTA:
  792. return in_group_p(dquot->dq_id);
  793. }
  794. return 0;
  795. }
  796. /* Print warning to user which exceeded quota */
  797. static void print_warning(struct dquot *dquot, const int warntype)
  798. {
  799. char *msg = NULL;
  800. struct tty_struct *tty;
  801. if (!need_print_warning(dquot))
  802. return;
  803. mutex_lock(&tty_mutex);
  804. tty = get_current_tty();
  805. if (!tty)
  806. goto out_lock;
  807. tty_write_message(tty, dquot->dq_sb->s_id);
  808. if (warntype == QUOTA_NL_ISOFTWARN || warntype == QUOTA_NL_BSOFTWARN)
  809. tty_write_message(tty, ": warning, ");
  810. else
  811. tty_write_message(tty, ": write failed, ");
  812. tty_write_message(tty, quotatypes[dquot->dq_type]);
  813. switch (warntype) {
  814. case QUOTA_NL_IHARDWARN:
  815. msg = " file limit reached.\r\n";
  816. break;
  817. case QUOTA_NL_ISOFTLONGWARN:
  818. msg = " file quota exceeded too long.\r\n";
  819. break;
  820. case QUOTA_NL_ISOFTWARN:
  821. msg = " file quota exceeded.\r\n";
  822. break;
  823. case QUOTA_NL_BHARDWARN:
  824. msg = " block limit reached.\r\n";
  825. break;
  826. case QUOTA_NL_BSOFTLONGWARN:
  827. msg = " block quota exceeded too long.\r\n";
  828. break;
  829. case QUOTA_NL_BSOFTWARN:
  830. msg = " block quota exceeded.\r\n";
  831. break;
  832. }
  833. tty_write_message(tty, msg);
  834. out_lock:
  835. mutex_unlock(&tty_mutex);
  836. }
  837. #endif
  838. #ifdef CONFIG_QUOTA_NETLINK_INTERFACE
  839. /* Netlink family structure for quota */
  840. static struct genl_family quota_genl_family = {
  841. .id = GENL_ID_GENERATE,
  842. .hdrsize = 0,
  843. .name = "VFS_DQUOT",
  844. .version = 1,
  845. .maxattr = QUOTA_NL_A_MAX,
  846. };
  847. /* Send warning to userspace about user which exceeded quota */
  848. static void send_warning(const struct dquot *dquot, const char warntype)
  849. {
  850. static atomic_t seq;
  851. struct sk_buff *skb;
  852. void *msg_head;
  853. int ret;
  854. int msg_size = 4 * nla_total_size(sizeof(u32)) +
  855. 2 * nla_total_size(sizeof(u64));
  856. /* We have to allocate using GFP_NOFS as we are called from a
  857. * filesystem performing write and thus further recursion into
  858. * the fs to free some data could cause deadlocks. */
  859. skb = genlmsg_new(msg_size, GFP_NOFS);
  860. if (!skb) {
  861. printk(KERN_ERR
  862. "VFS: Not enough memory to send quota warning.\n");
  863. return;
  864. }
  865. msg_head = genlmsg_put(skb, 0, atomic_add_return(1, &seq),
  866. &quota_genl_family, 0, QUOTA_NL_C_WARNING);
  867. if (!msg_head) {
  868. printk(KERN_ERR
  869. "VFS: Cannot store netlink header in quota warning.\n");
  870. goto err_out;
  871. }
  872. ret = nla_put_u32(skb, QUOTA_NL_A_QTYPE, dquot->dq_type);
  873. if (ret)
  874. goto attr_err_out;
  875. ret = nla_put_u64(skb, QUOTA_NL_A_EXCESS_ID, dquot->dq_id);
  876. if (ret)
  877. goto attr_err_out;
  878. ret = nla_put_u32(skb, QUOTA_NL_A_WARNING, warntype);
  879. if (ret)
  880. goto attr_err_out;
  881. ret = nla_put_u32(skb, QUOTA_NL_A_DEV_MAJOR,
  882. MAJOR(dquot->dq_sb->s_dev));
  883. if (ret)
  884. goto attr_err_out;
  885. ret = nla_put_u32(skb, QUOTA_NL_A_DEV_MINOR,
  886. MINOR(dquot->dq_sb->s_dev));
  887. if (ret)
  888. goto attr_err_out;
  889. ret = nla_put_u64(skb, QUOTA_NL_A_CAUSED_ID, current->user->uid);
  890. if (ret)
  891. goto attr_err_out;
  892. genlmsg_end(skb, msg_head);
  893. ret = genlmsg_multicast(skb, 0, quota_genl_family.id, GFP_NOFS);
  894. if (ret < 0 && ret != -ESRCH)
  895. printk(KERN_ERR
  896. "VFS: Failed to send notification message: %d\n", ret);
  897. return;
  898. attr_err_out:
  899. printk(KERN_ERR "VFS: Not enough space to compose quota message!\n");
  900. err_out:
  901. kfree_skb(skb);
  902. }
  903. #endif
  904. static inline void flush_warnings(struct dquot * const *dquots, char *warntype)
  905. {
  906. int i;
  907. for (i = 0; i < MAXQUOTAS; i++)
  908. if (dquots[i] != NODQUOT && warntype[i] != QUOTA_NL_NOWARN &&
  909. !warning_issued(dquots[i], warntype[i])) {
  910. #ifdef CONFIG_PRINT_QUOTA_WARNING
  911. print_warning(dquots[i], warntype[i]);
  912. #endif
  913. #ifdef CONFIG_QUOTA_NETLINK_INTERFACE
  914. send_warning(dquots[i], warntype[i]);
  915. #endif
  916. }
  917. }
  918. static inline char ignore_hardlimit(struct dquot *dquot)
  919. {
  920. struct mem_dqinfo *info = &sb_dqopt(dquot->dq_sb)->info[dquot->dq_type];
  921. return capable(CAP_SYS_RESOURCE) &&
  922. (info->dqi_format->qf_fmt_id != QFMT_VFS_OLD || !(info->dqi_flags & V1_DQF_RSQUASH));
  923. }
  924. /* needs dq_data_lock */
  925. static int check_idq(struct dquot *dquot, ulong inodes, char *warntype)
  926. {
  927. *warntype = QUOTA_NL_NOWARN;
  928. if (inodes <= 0 || test_bit(DQ_FAKE_B, &dquot->dq_flags))
  929. return QUOTA_OK;
  930. if (dquot->dq_dqb.dqb_ihardlimit &&
  931. (dquot->dq_dqb.dqb_curinodes + inodes) > dquot->dq_dqb.dqb_ihardlimit &&
  932. !ignore_hardlimit(dquot)) {
  933. *warntype = QUOTA_NL_IHARDWARN;
  934. return NO_QUOTA;
  935. }
  936. if (dquot->dq_dqb.dqb_isoftlimit &&
  937. (dquot->dq_dqb.dqb_curinodes + inodes) > dquot->dq_dqb.dqb_isoftlimit &&
  938. dquot->dq_dqb.dqb_itime && get_seconds() >= dquot->dq_dqb.dqb_itime &&
  939. !ignore_hardlimit(dquot)) {
  940. *warntype = QUOTA_NL_ISOFTLONGWARN;
  941. return NO_QUOTA;
  942. }
  943. if (dquot->dq_dqb.dqb_isoftlimit &&
  944. (dquot->dq_dqb.dqb_curinodes + inodes) > dquot->dq_dqb.dqb_isoftlimit &&
  945. dquot->dq_dqb.dqb_itime == 0) {
  946. *warntype = QUOTA_NL_ISOFTWARN;
  947. dquot->dq_dqb.dqb_itime = get_seconds() + sb_dqopt(dquot->dq_sb)->info[dquot->dq_type].dqi_igrace;
  948. }
  949. return QUOTA_OK;
  950. }
  951. /* needs dq_data_lock */
  952. static int check_bdq(struct dquot *dquot, qsize_t space, int prealloc, char *warntype)
  953. {
  954. *warntype = QUOTA_NL_NOWARN;
  955. if (space <= 0 || test_bit(DQ_FAKE_B, &dquot->dq_flags))
  956. return QUOTA_OK;
  957. if (dquot->dq_dqb.dqb_bhardlimit &&
  958. toqb(dquot->dq_dqb.dqb_curspace + space) > dquot->dq_dqb.dqb_bhardlimit &&
  959. !ignore_hardlimit(dquot)) {
  960. if (!prealloc)
  961. *warntype = QUOTA_NL_BHARDWARN;
  962. return NO_QUOTA;
  963. }
  964. if (dquot->dq_dqb.dqb_bsoftlimit &&
  965. toqb(dquot->dq_dqb.dqb_curspace + space) > dquot->dq_dqb.dqb_bsoftlimit &&
  966. dquot->dq_dqb.dqb_btime && get_seconds() >= dquot->dq_dqb.dqb_btime &&
  967. !ignore_hardlimit(dquot)) {
  968. if (!prealloc)
  969. *warntype = QUOTA_NL_BSOFTLONGWARN;
  970. return NO_QUOTA;
  971. }
  972. if (dquot->dq_dqb.dqb_bsoftlimit &&
  973. toqb(dquot->dq_dqb.dqb_curspace + space) > dquot->dq_dqb.dqb_bsoftlimit &&
  974. dquot->dq_dqb.dqb_btime == 0) {
  975. if (!prealloc) {
  976. *warntype = QUOTA_NL_BSOFTWARN;
  977. dquot->dq_dqb.dqb_btime = get_seconds() + sb_dqopt(dquot->dq_sb)->info[dquot->dq_type].dqi_bgrace;
  978. }
  979. else
  980. /*
  981. * We don't allow preallocation to exceed softlimit so exceeding will
  982. * be always printed
  983. */
  984. return NO_QUOTA;
  985. }
  986. return QUOTA_OK;
  987. }
  988. /*
  989. * Initialize quota pointers in inode
  990. * Transaction must be started at entry
  991. */
  992. int dquot_initialize(struct inode *inode, int type)
  993. {
  994. unsigned int id = 0;
  995. int cnt, ret = 0;
  996. /* First test before acquiring mutex - solves deadlocks when we
  997. * re-enter the quota code and are already holding the mutex */
  998. if (IS_NOQUOTA(inode))
  999. return 0;
  1000. down_write(&sb_dqopt(inode->i_sb)->dqptr_sem);
  1001. /* Having dqptr_sem we know NOQUOTA flags can't be altered... */
  1002. if (IS_NOQUOTA(inode))
  1003. goto out_err;
  1004. for (cnt = 0; cnt < MAXQUOTAS; cnt++) {
  1005. if (type != -1 && cnt != type)
  1006. continue;
  1007. if (inode->i_dquot[cnt] == NODQUOT) {
  1008. switch (cnt) {
  1009. case USRQUOTA:
  1010. id = inode->i_uid;
  1011. break;
  1012. case GRPQUOTA:
  1013. id = inode->i_gid;
  1014. break;
  1015. }
  1016. inode->i_dquot[cnt] = dqget(inode->i_sb, id, cnt);
  1017. }
  1018. }
  1019. out_err:
  1020. up_write(&sb_dqopt(inode->i_sb)->dqptr_sem);
  1021. return ret;
  1022. }
  1023. /*
  1024. * Release all quotas referenced by inode
  1025. * Transaction must be started at an entry
  1026. */
  1027. int dquot_drop(struct inode *inode)
  1028. {
  1029. int cnt;
  1030. down_write(&sb_dqopt(inode->i_sb)->dqptr_sem);
  1031. for (cnt = 0; cnt < MAXQUOTAS; cnt++) {
  1032. if (inode->i_dquot[cnt] != NODQUOT) {
  1033. dqput(inode->i_dquot[cnt]);
  1034. inode->i_dquot[cnt] = NODQUOT;
  1035. }
  1036. }
  1037. up_write(&sb_dqopt(inode->i_sb)->dqptr_sem);
  1038. return 0;
  1039. }
  1040. /*
  1041. * Following four functions update i_blocks+i_bytes fields and
  1042. * quota information (together with appropriate checks)
  1043. * NOTE: We absolutely rely on the fact that caller dirties
  1044. * the inode (usually macros in quotaops.h care about this) and
  1045. * holds a handle for the current transaction so that dquot write and
  1046. * inode write go into the same transaction.
  1047. */
  1048. /*
  1049. * This operation can block, but only after everything is updated
  1050. */
  1051. int dquot_alloc_space(struct inode *inode, qsize_t number, int warn)
  1052. {
  1053. int cnt, ret = NO_QUOTA;
  1054. char warntype[MAXQUOTAS];
  1055. /* First test before acquiring mutex - solves deadlocks when we
  1056. * re-enter the quota code and are already holding the mutex */
  1057. if (IS_NOQUOTA(inode)) {
  1058. out_add:
  1059. inode_add_bytes(inode, number);
  1060. return QUOTA_OK;
  1061. }
  1062. for (cnt = 0; cnt < MAXQUOTAS; cnt++)
  1063. warntype[cnt] = QUOTA_NL_NOWARN;
  1064. down_read(&sb_dqopt(inode->i_sb)->dqptr_sem);
  1065. if (IS_NOQUOTA(inode)) { /* Now we can do reliable test... */
  1066. up_read(&sb_dqopt(inode->i_sb)->dqptr_sem);
  1067. goto out_add;
  1068. }
  1069. spin_lock(&dq_data_lock);
  1070. for (cnt = 0; cnt < MAXQUOTAS; cnt++) {
  1071. if (inode->i_dquot[cnt] == NODQUOT)
  1072. continue;
  1073. if (check_bdq(inode->i_dquot[cnt], number, warn, warntype+cnt) == NO_QUOTA)
  1074. goto warn_put_all;
  1075. }
  1076. for (cnt = 0; cnt < MAXQUOTAS; cnt++) {
  1077. if (inode->i_dquot[cnt] == NODQUOT)
  1078. continue;
  1079. dquot_incr_space(inode->i_dquot[cnt], number);
  1080. }
  1081. inode_add_bytes(inode, number);
  1082. ret = QUOTA_OK;
  1083. warn_put_all:
  1084. spin_unlock(&dq_data_lock);
  1085. if (ret == QUOTA_OK)
  1086. /* Dirtify all the dquots - this can block when journalling */
  1087. for (cnt = 0; cnt < MAXQUOTAS; cnt++)
  1088. if (inode->i_dquot[cnt])
  1089. mark_dquot_dirty(inode->i_dquot[cnt]);
  1090. flush_warnings(inode->i_dquot, warntype);
  1091. up_read(&sb_dqopt(inode->i_sb)->dqptr_sem);
  1092. return ret;
  1093. }
  1094. /*
  1095. * This operation can block, but only after everything is updated
  1096. */
  1097. int dquot_alloc_inode(const struct inode *inode, unsigned long number)
  1098. {
  1099. int cnt, ret = NO_QUOTA;
  1100. char warntype[MAXQUOTAS];
  1101. /* First test before acquiring mutex - solves deadlocks when we
  1102. * re-enter the quota code and are already holding the mutex */
  1103. if (IS_NOQUOTA(inode))
  1104. return QUOTA_OK;
  1105. for (cnt = 0; cnt < MAXQUOTAS; cnt++)
  1106. warntype[cnt] = QUOTA_NL_NOWARN;
  1107. down_read(&sb_dqopt(inode->i_sb)->dqptr_sem);
  1108. if (IS_NOQUOTA(inode)) {
  1109. up_read(&sb_dqopt(inode->i_sb)->dqptr_sem);
  1110. return QUOTA_OK;
  1111. }
  1112. spin_lock(&dq_data_lock);
  1113. for (cnt = 0; cnt < MAXQUOTAS; cnt++) {
  1114. if (inode->i_dquot[cnt] == NODQUOT)
  1115. continue;
  1116. if (check_idq(inode->i_dquot[cnt], number, warntype+cnt) == NO_QUOTA)
  1117. goto warn_put_all;
  1118. }
  1119. for (cnt = 0; cnt < MAXQUOTAS; cnt++) {
  1120. if (inode->i_dquot[cnt] == NODQUOT)
  1121. continue;
  1122. dquot_incr_inodes(inode->i_dquot[cnt], number);
  1123. }
  1124. ret = QUOTA_OK;
  1125. warn_put_all:
  1126. spin_unlock(&dq_data_lock);
  1127. if (ret == QUOTA_OK)
  1128. /* Dirtify all the dquots - this can block when journalling */
  1129. for (cnt = 0; cnt < MAXQUOTAS; cnt++)
  1130. if (inode->i_dquot[cnt])
  1131. mark_dquot_dirty(inode->i_dquot[cnt]);
  1132. flush_warnings(inode->i_dquot, warntype);
  1133. up_read(&sb_dqopt(inode->i_sb)->dqptr_sem);
  1134. return ret;
  1135. }
  1136. /*
  1137. * This operation can block, but only after everything is updated
  1138. */
  1139. int dquot_free_space(struct inode *inode, qsize_t number)
  1140. {
  1141. unsigned int cnt;
  1142. /* First test before acquiring mutex - solves deadlocks when we
  1143. * re-enter the quota code and are already holding the mutex */
  1144. if (IS_NOQUOTA(inode)) {
  1145. out_sub:
  1146. inode_sub_bytes(inode, number);
  1147. return QUOTA_OK;
  1148. }
  1149. down_read(&sb_dqopt(inode->i_sb)->dqptr_sem);
  1150. /* Now recheck reliably when holding dqptr_sem */
  1151. if (IS_NOQUOTA(inode)) {
  1152. up_read(&sb_dqopt(inode->i_sb)->dqptr_sem);
  1153. goto out_sub;
  1154. }
  1155. spin_lock(&dq_data_lock);
  1156. for (cnt = 0; cnt < MAXQUOTAS; cnt++) {
  1157. if (inode->i_dquot[cnt] == NODQUOT)
  1158. continue;
  1159. dquot_decr_space(inode->i_dquot[cnt], number);
  1160. }
  1161. inode_sub_bytes(inode, number);
  1162. spin_unlock(&dq_data_lock);
  1163. /* Dirtify all the dquots - this can block when journalling */
  1164. for (cnt = 0; cnt < MAXQUOTAS; cnt++)
  1165. if (inode->i_dquot[cnt])
  1166. mark_dquot_dirty(inode->i_dquot[cnt]);
  1167. up_read(&sb_dqopt(inode->i_sb)->dqptr_sem);
  1168. return QUOTA_OK;
  1169. }
  1170. /*
  1171. * This operation can block, but only after everything is updated
  1172. */
  1173. int dquot_free_inode(const struct inode *inode, unsigned long number)
  1174. {
  1175. unsigned int cnt;
  1176. /* First test before acquiring mutex - solves deadlocks when we
  1177. * re-enter the quota code and are already holding the mutex */
  1178. if (IS_NOQUOTA(inode))
  1179. return QUOTA_OK;
  1180. down_read(&sb_dqopt(inode->i_sb)->dqptr_sem);
  1181. /* Now recheck reliably when holding dqptr_sem */
  1182. if (IS_NOQUOTA(inode)) {
  1183. up_read(&sb_dqopt(inode->i_sb)->dqptr_sem);
  1184. return QUOTA_OK;
  1185. }
  1186. spin_lock(&dq_data_lock);
  1187. for (cnt = 0; cnt < MAXQUOTAS; cnt++) {
  1188. if (inode->i_dquot[cnt] == NODQUOT)
  1189. continue;
  1190. dquot_decr_inodes(inode->i_dquot[cnt], number);
  1191. }
  1192. spin_unlock(&dq_data_lock);
  1193. /* Dirtify all the dquots - this can block when journalling */
  1194. for (cnt = 0; cnt < MAXQUOTAS; cnt++)
  1195. if (inode->i_dquot[cnt])
  1196. mark_dquot_dirty(inode->i_dquot[cnt]);
  1197. up_read(&sb_dqopt(inode->i_sb)->dqptr_sem);
  1198. return QUOTA_OK;
  1199. }
  1200. /*
  1201. * Transfer the number of inode and blocks from one diskquota to an other.
  1202. *
  1203. * This operation can block, but only after everything is updated
  1204. * A transaction must be started when entering this function.
  1205. */
  1206. int dquot_transfer(struct inode *inode, struct iattr *iattr)
  1207. {
  1208. qsize_t space;
  1209. struct dquot *transfer_from[MAXQUOTAS];
  1210. struct dquot *transfer_to[MAXQUOTAS];
  1211. int cnt, ret = NO_QUOTA, chuid = (iattr->ia_valid & ATTR_UID) && inode->i_uid != iattr->ia_uid,
  1212. chgid = (iattr->ia_valid & ATTR_GID) && inode->i_gid != iattr->ia_gid;
  1213. char warntype[MAXQUOTAS];
  1214. /* First test before acquiring mutex - solves deadlocks when we
  1215. * re-enter the quota code and are already holding the mutex */
  1216. if (IS_NOQUOTA(inode))
  1217. return QUOTA_OK;
  1218. /* Clear the arrays */
  1219. for (cnt = 0; cnt < MAXQUOTAS; cnt++) {
  1220. transfer_to[cnt] = transfer_from[cnt] = NODQUOT;
  1221. warntype[cnt] = QUOTA_NL_NOWARN;
  1222. }
  1223. down_write(&sb_dqopt(inode->i_sb)->dqptr_sem);
  1224. /* Now recheck reliably when holding dqptr_sem */
  1225. if (IS_NOQUOTA(inode)) { /* File without quota accounting? */
  1226. up_write(&sb_dqopt(inode->i_sb)->dqptr_sem);
  1227. return QUOTA_OK;
  1228. }
  1229. /* First build the transfer_to list - here we can block on
  1230. * reading/instantiating of dquots. We know that the transaction for
  1231. * us was already started so we don't violate lock ranking here */
  1232. for (cnt = 0; cnt < MAXQUOTAS; cnt++) {
  1233. switch (cnt) {
  1234. case USRQUOTA:
  1235. if (!chuid)
  1236. continue;
  1237. transfer_to[cnt] = dqget(inode->i_sb, iattr->ia_uid, cnt);
  1238. break;
  1239. case GRPQUOTA:
  1240. if (!chgid)
  1241. continue;
  1242. transfer_to[cnt] = dqget(inode->i_sb, iattr->ia_gid, cnt);
  1243. break;
  1244. }
  1245. }
  1246. spin_lock(&dq_data_lock);
  1247. space = inode_get_bytes(inode);
  1248. /* Build the transfer_from list and check the limits */
  1249. for (cnt = 0; cnt < MAXQUOTAS; cnt++) {
  1250. if (transfer_to[cnt] == NODQUOT)
  1251. continue;
  1252. transfer_from[cnt] = inode->i_dquot[cnt];
  1253. if (check_idq(transfer_to[cnt], 1, warntype+cnt) == NO_QUOTA ||
  1254. check_bdq(transfer_to[cnt], space, 0, warntype+cnt) == NO_QUOTA)
  1255. goto warn_put_all;
  1256. }
  1257. /*
  1258. * Finally perform the needed transfer from transfer_from to transfer_to
  1259. */
  1260. for (cnt = 0; cnt < MAXQUOTAS; cnt++) {
  1261. /*
  1262. * Skip changes for same uid or gid or for turned off quota-type.
  1263. */
  1264. if (transfer_to[cnt] == NODQUOT)
  1265. continue;
  1266. /* Due to IO error we might not have transfer_from[] structure */
  1267. if (transfer_from[cnt]) {
  1268. dquot_decr_inodes(transfer_from[cnt], 1);
  1269. dquot_decr_space(transfer_from[cnt], space);
  1270. }
  1271. dquot_incr_inodes(transfer_to[cnt], 1);
  1272. dquot_incr_space(transfer_to[cnt], space);
  1273. inode->i_dquot[cnt] = transfer_to[cnt];
  1274. }
  1275. ret = QUOTA_OK;
  1276. warn_put_all:
  1277. spin_unlock(&dq_data_lock);
  1278. /* Dirtify all the dquots - this can block when journalling */
  1279. for (cnt = 0; cnt < MAXQUOTAS; cnt++) {
  1280. if (transfer_from[cnt])
  1281. mark_dquot_dirty(transfer_from[cnt]);
  1282. if (transfer_to[cnt])
  1283. mark_dquot_dirty(transfer_to[cnt]);
  1284. }
  1285. flush_warnings(transfer_to, warntype);
  1286. for (cnt = 0; cnt < MAXQUOTAS; cnt++) {
  1287. if (ret == QUOTA_OK && transfer_from[cnt] != NODQUOT)
  1288. dqput(transfer_from[cnt]);
  1289. if (ret == NO_QUOTA && transfer_to[cnt] != NODQUOT)
  1290. dqput(transfer_to[cnt]);
  1291. }
  1292. up_write(&sb_dqopt(inode->i_sb)->dqptr_sem);
  1293. return ret;
  1294. }
  1295. /*
  1296. * Write info of quota file to disk
  1297. */
  1298. int dquot_commit_info(struct super_block *sb, int type)
  1299. {
  1300. int ret;
  1301. struct quota_info *dqopt = sb_dqopt(sb);
  1302. mutex_lock(&dqopt->dqio_mutex);
  1303. ret = dqopt->ops[type]->write_file_info(sb, type);
  1304. mutex_unlock(&dqopt->dqio_mutex);
  1305. return ret;
  1306. }
  1307. /*
  1308. * Definitions of diskquota operations.
  1309. */
  1310. struct dquot_operations dquot_operations = {
  1311. .initialize = dquot_initialize,
  1312. .drop = dquot_drop,
  1313. .alloc_space = dquot_alloc_space,
  1314. .alloc_inode = dquot_alloc_inode,
  1315. .free_space = dquot_free_space,
  1316. .free_inode = dquot_free_inode,
  1317. .transfer = dquot_transfer,
  1318. .write_dquot = dquot_commit,
  1319. .acquire_dquot = dquot_acquire,
  1320. .release_dquot = dquot_release,
  1321. .mark_dirty = dquot_mark_dquot_dirty,
  1322. .write_info = dquot_commit_info
  1323. };
  1324. static inline void set_enable_flags(struct quota_info *dqopt, int type)
  1325. {
  1326. switch (type) {
  1327. case USRQUOTA:
  1328. dqopt->flags |= DQUOT_USR_ENABLED;
  1329. dqopt->flags &= ~DQUOT_USR_SUSPENDED;
  1330. break;
  1331. case GRPQUOTA:
  1332. dqopt->flags |= DQUOT_GRP_ENABLED;
  1333. dqopt->flags &= ~DQUOT_GRP_SUSPENDED;
  1334. break;
  1335. }
  1336. }
  1337. static inline void reset_enable_flags(struct quota_info *dqopt, int type,
  1338. int remount)
  1339. {
  1340. switch (type) {
  1341. case USRQUOTA:
  1342. dqopt->flags &= ~DQUOT_USR_ENABLED;
  1343. if (remount)
  1344. dqopt->flags |= DQUOT_USR_SUSPENDED;
  1345. else
  1346. dqopt->flags &= ~DQUOT_USR_SUSPENDED;
  1347. break;
  1348. case GRPQUOTA:
  1349. dqopt->flags &= ~DQUOT_GRP_ENABLED;
  1350. if (remount)
  1351. dqopt->flags |= DQUOT_GRP_SUSPENDED;
  1352. else
  1353. dqopt->flags &= ~DQUOT_GRP_SUSPENDED;
  1354. break;
  1355. }
  1356. }
  1357. /*
  1358. * Turn quota off on a device. type == -1 ==> quotaoff for all types (umount)
  1359. */
  1360. int vfs_quota_off(struct super_block *sb, int type, int remount)
  1361. {
  1362. int cnt, ret = 0;
  1363. struct quota_info *dqopt = sb_dqopt(sb);
  1364. struct inode *toputinode[MAXQUOTAS];
  1365. /* We need to serialize quota_off() for device */
  1366. mutex_lock(&dqopt->dqonoff_mutex);
  1367. /*
  1368. * Skip everything if there's nothing to do. We have to do this because
  1369. * sometimes we are called when fill_super() failed and calling
  1370. * sync_fs() in such cases does no good.
  1371. */
  1372. if (!sb_any_quota_enabled(sb) && !sb_any_quota_suspended(sb)) {
  1373. mutex_unlock(&dqopt->dqonoff_mutex);
  1374. return 0;
  1375. }
  1376. for (cnt = 0; cnt < MAXQUOTAS; cnt++) {
  1377. toputinode[cnt] = NULL;
  1378. if (type != -1 && cnt != type)
  1379. continue;
  1380. /* If we keep inodes of quota files after remount and quotaoff
  1381. * is called, drop kept inodes. */
  1382. if (!remount && sb_has_quota_suspended(sb, cnt)) {
  1383. iput(dqopt->files[cnt]);
  1384. dqopt->files[cnt] = NULL;
  1385. reset_enable_flags(dqopt, cnt, 0);
  1386. continue;
  1387. }
  1388. if (!sb_has_quota_enabled(sb, cnt))
  1389. continue;
  1390. reset_enable_flags(dqopt, cnt, remount);
  1391. /* Note: these are blocking operations */
  1392. drop_dquot_ref(sb, cnt);
  1393. invalidate_dquots(sb, cnt);
  1394. /*
  1395. * Now all dquots should be invalidated, all writes done so we should be only
  1396. * users of the info. No locks needed.
  1397. */
  1398. if (info_dirty(&dqopt->info[cnt]))
  1399. sb->dq_op->write_info(sb, cnt);
  1400. if (dqopt->ops[cnt]->free_file_info)
  1401. dqopt->ops[cnt]->free_file_info(sb, cnt);
  1402. put_quota_format(dqopt->info[cnt].dqi_format);
  1403. toputinode[cnt] = dqopt->files[cnt];
  1404. if (!remount)
  1405. dqopt->files[cnt] = NULL;
  1406. dqopt->info[cnt].dqi_flags = 0;
  1407. dqopt->info[cnt].dqi_igrace = 0;
  1408. dqopt->info[cnt].dqi_bgrace = 0;
  1409. dqopt->ops[cnt] = NULL;
  1410. }
  1411. mutex_unlock(&dqopt->dqonoff_mutex);
  1412. /* Sync the superblock so that buffers with quota data are written to
  1413. * disk (and so userspace sees correct data afterwards). */
  1414. if (sb->s_op->sync_fs)
  1415. sb->s_op->sync_fs(sb, 1);
  1416. sync_blockdev(sb->s_bdev);
  1417. /* Now the quota files are just ordinary files and we can set the
  1418. * inode flags back. Moreover we discard the pagecache so that
  1419. * userspace sees the writes we did bypassing the pagecache. We
  1420. * must also discard the blockdev buffers so that we see the
  1421. * changes done by userspace on the next quotaon() */
  1422. for (cnt = 0; cnt < MAXQUOTAS; cnt++)
  1423. if (toputinode[cnt]) {
  1424. mutex_lock(&dqopt->dqonoff_mutex);
  1425. /* If quota was reenabled in the meantime, we have
  1426. * nothing to do */
  1427. if (!sb_has_quota_enabled(sb, cnt)) {
  1428. mutex_lock_nested(&toputinode[cnt]->i_mutex, I_MUTEX_QUOTA);
  1429. toputinode[cnt]->i_flags &= ~(S_IMMUTABLE |
  1430. S_NOATIME | S_NOQUOTA);
  1431. truncate_inode_pages(&toputinode[cnt]->i_data, 0);
  1432. mutex_unlock(&toputinode[cnt]->i_mutex);
  1433. mark_inode_dirty(toputinode[cnt]);
  1434. }
  1435. mutex_unlock(&dqopt->dqonoff_mutex);
  1436. /* On remount RO, we keep the inode pointer so that we
  1437. * can reenable quota on the subsequent remount RW.
  1438. * But we have better not keep inode pointer when there
  1439. * is pending delete on the quota file... */
  1440. if (!remount)
  1441. iput(toputinode[cnt]);
  1442. else if (!toputinode[cnt]->i_nlink)
  1443. ret = -EBUSY;
  1444. }
  1445. if (sb->s_bdev)
  1446. invalidate_bdev(sb->s_bdev);
  1447. return ret;
  1448. }
  1449. /*
  1450. * Turn quotas on on a device
  1451. */
  1452. /* Helper function when we already have the inode */
  1453. static int vfs_quota_on_inode(struct inode *inode, int type, int format_id)
  1454. {
  1455. struct quota_format_type *fmt = find_quota_format(format_id);
  1456. struct super_block *sb = inode->i_sb;
  1457. struct quota_info *dqopt = sb_dqopt(sb);
  1458. int error;
  1459. int oldflags = -1;
  1460. if (!fmt)
  1461. return -ESRCH;
  1462. if (!S_ISREG(inode->i_mode)) {
  1463. error = -EACCES;
  1464. goto out_fmt;
  1465. }
  1466. if (IS_RDONLY(inode)) {
  1467. error = -EROFS;
  1468. goto out_fmt;
  1469. }
  1470. if (!sb->s_op->quota_write || !sb->s_op->quota_read) {
  1471. error = -EINVAL;
  1472. goto out_fmt;
  1473. }
  1474. /* As we bypass the pagecache we must now flush the inode so that
  1475. * we see all the changes from userspace... */
  1476. write_inode_now(inode, 1);
  1477. /* And now flush the block cache so that kernel sees the changes */
  1478. invalidate_bdev(sb->s_bdev);
  1479. mutex_lock(&inode->i_mutex);
  1480. mutex_lock(&dqopt->dqonoff_mutex);
  1481. if (sb_has_quota_enabled(sb, type) ||
  1482. sb_has_quota_suspended(sb, type)) {
  1483. error = -EBUSY;
  1484. goto out_lock;
  1485. }
  1486. /* We don't want quota and atime on quota files (deadlocks possible)
  1487. * Also nobody should write to the file - we use special IO operations
  1488. * which ignore the immutable bit. */
  1489. down_write(&dqopt->dqptr_sem);
  1490. oldflags = inode->i_flags & (S_NOATIME | S_IMMUTABLE | S_NOQUOTA);
  1491. inode->i_flags |= S_NOQUOTA | S_NOATIME | S_IMMUTABLE;
  1492. up_write(&dqopt->dqptr_sem);
  1493. sb->dq_op->drop(inode);
  1494. error = -EIO;
  1495. dqopt->files[type] = igrab(inode);
  1496. if (!dqopt->files[type])
  1497. goto out_lock;
  1498. error = -EINVAL;
  1499. if (!fmt->qf_ops->check_quota_file(sb, type))
  1500. goto out_file_init;
  1501. dqopt->ops[type] = fmt->qf_ops;
  1502. dqopt->info[type].dqi_format = fmt;
  1503. dqopt->info[type].dqi_fmt_id = format_id;
  1504. INIT_LIST_HEAD(&dqopt->info[type].dqi_dirty_list);
  1505. mutex_lock(&dqopt->dqio_mutex);
  1506. if ((error = dqopt->ops[type]->read_file_info(sb, type)) < 0) {
  1507. mutex_unlock(&dqopt->dqio_mutex);
  1508. goto out_file_init;
  1509. }
  1510. mutex_unlock(&dqopt->dqio_mutex);
  1511. mutex_unlock(&inode->i_mutex);
  1512. set_enable_flags(dqopt, type);
  1513. add_dquot_ref(sb, type);
  1514. mutex_unlock(&dqopt->dqonoff_mutex);
  1515. return 0;
  1516. out_file_init:
  1517. dqopt->files[type] = NULL;
  1518. iput(inode);
  1519. out_lock:
  1520. mutex_unlock(&dqopt->dqonoff_mutex);
  1521. if (oldflags != -1) {
  1522. down_write(&dqopt->dqptr_sem);
  1523. /* Set the flags back (in the case of accidental quotaon()
  1524. * on a wrong file we don't want to mess up the flags) */
  1525. inode->i_flags &= ~(S_NOATIME | S_NOQUOTA | S_IMMUTABLE);
  1526. inode->i_flags |= oldflags;
  1527. up_write(&dqopt->dqptr_sem);
  1528. }
  1529. mutex_unlock(&inode->i_mutex);
  1530. out_fmt:
  1531. put_quota_format(fmt);
  1532. return error;
  1533. }
  1534. /* Reenable quotas on remount RW */
  1535. static int vfs_quota_on_remount(struct super_block *sb, int type)
  1536. {
  1537. struct quota_info *dqopt = sb_dqopt(sb);
  1538. struct inode *inode;
  1539. int ret;
  1540. mutex_lock(&dqopt->dqonoff_mutex);
  1541. if (!sb_has_quota_suspended(sb, type)) {
  1542. mutex_unlock(&dqopt->dqonoff_mutex);
  1543. return 0;
  1544. }
  1545. BUG_ON(sb_has_quota_enabled(sb, type));
  1546. inode = dqopt->files[type];
  1547. dqopt->files[type] = NULL;
  1548. reset_enable_flags(dqopt, type, 0);
  1549. mutex_unlock(&dqopt->dqonoff_mutex);
  1550. ret = vfs_quota_on_inode(inode, type, dqopt->info[type].dqi_fmt_id);
  1551. iput(inode);
  1552. return ret;
  1553. }
  1554. /* Actual function called from quotactl() */
  1555. int vfs_quota_on(struct super_block *sb, int type, int format_id, char *path,
  1556. int remount)
  1557. {
  1558. struct nameidata nd;
  1559. int error;
  1560. if (remount)
  1561. return vfs_quota_on_remount(sb, type);
  1562. error = path_lookup(path, LOOKUP_FOLLOW, &nd);
  1563. if (error < 0)
  1564. return error;
  1565. error = security_quota_on(nd.path.dentry);
  1566. if (error)
  1567. goto out_path;
  1568. /* Quota file not on the same filesystem? */
  1569. if (nd.path.mnt->mnt_sb != sb)
  1570. error = -EXDEV;
  1571. else
  1572. error = vfs_quota_on_inode(nd.path.dentry->d_inode, type,
  1573. format_id);
  1574. out_path:
  1575. path_put(&nd.path);
  1576. return error;
  1577. }
  1578. /*
  1579. * This function is used when filesystem needs to initialize quotas
  1580. * during mount time.
  1581. */
  1582. int vfs_quota_on_mount(struct super_block *sb, char *qf_name,
  1583. int format_id, int type)
  1584. {
  1585. struct dentry *dentry;
  1586. int error;
  1587. dentry = lookup_one_len(qf_name, sb->s_root, strlen(qf_name));
  1588. if (IS_ERR(dentry))
  1589. return PTR_ERR(dentry);
  1590. if (!dentry->d_inode) {
  1591. error = -ENOENT;
  1592. goto out;
  1593. }
  1594. error = security_quota_on(dentry);
  1595. if (!error)
  1596. error = vfs_quota_on_inode(dentry->d_inode, type, format_id);
  1597. out:
  1598. dput(dentry);
  1599. return error;
  1600. }
  1601. /* Generic routine for getting common part of quota structure */
  1602. static void do_get_dqblk(struct dquot *dquot, struct if_dqblk *di)
  1603. {
  1604. struct mem_dqblk *dm = &dquot->dq_dqb;
  1605. spin_lock(&dq_data_lock);
  1606. di->dqb_bhardlimit = dm->dqb_bhardlimit;
  1607. di->dqb_bsoftlimit = dm->dqb_bsoftlimit;
  1608. di->dqb_curspace = dm->dqb_curspace;
  1609. di->dqb_ihardlimit = dm->dqb_ihardlimit;
  1610. di->dqb_isoftlimit = dm->dqb_isoftlimit;
  1611. di->dqb_curinodes = dm->dqb_curinodes;
  1612. di->dqb_btime = dm->dqb_btime;
  1613. di->dqb_itime = dm->dqb_itime;
  1614. di->dqb_valid = QIF_ALL;
  1615. spin_unlock(&dq_data_lock);
  1616. }
  1617. int vfs_get_dqblk(struct super_block *sb, int type, qid_t id, struct if_dqblk *di)
  1618. {
  1619. struct dquot *dquot;
  1620. mutex_lock(&sb_dqopt(sb)->dqonoff_mutex);
  1621. if (!(dquot = dqget(sb, id, type))) {
  1622. mutex_unlock(&sb_dqopt(sb)->dqonoff_mutex);
  1623. return -ESRCH;
  1624. }
  1625. do_get_dqblk(dquot, di);
  1626. dqput(dquot);
  1627. mutex_unlock(&sb_dqopt(sb)->dqonoff_mutex);
  1628. return 0;
  1629. }
  1630. /* Generic routine for setting common part of quota structure */
  1631. static int do_set_dqblk(struct dquot *dquot, struct if_dqblk *di)
  1632. {
  1633. struct mem_dqblk *dm = &dquot->dq_dqb;
  1634. int check_blim = 0, check_ilim = 0;
  1635. struct mem_dqinfo *dqi = &sb_dqopt(dquot->dq_sb)->info[dquot->dq_type];
  1636. if ((di->dqb_valid & QIF_BLIMITS &&
  1637. (di->dqb_bhardlimit > dqi->dqi_maxblimit ||
  1638. di->dqb_bsoftlimit > dqi->dqi_maxblimit)) ||
  1639. (di->dqb_valid & QIF_ILIMITS &&
  1640. (di->dqb_ihardlimit > dqi->dqi_maxilimit ||
  1641. di->dqb_isoftlimit > dqi->dqi_maxilimit)))
  1642. return -ERANGE;
  1643. spin_lock(&dq_data_lock);
  1644. if (di->dqb_valid & QIF_SPACE) {
  1645. dm->dqb_curspace = di->dqb_curspace;
  1646. check_blim = 1;
  1647. }
  1648. if (di->dqb_valid & QIF_BLIMITS) {
  1649. dm->dqb_bsoftlimit = di->dqb_bsoftlimit;
  1650. dm->dqb_bhardlimit = di->dqb_bhardlimit;
  1651. check_blim = 1;
  1652. }
  1653. if (di->dqb_valid & QIF_INODES) {
  1654. dm->dqb_curinodes = di->dqb_curinodes;
  1655. check_ilim = 1;
  1656. }
  1657. if (di->dqb_valid & QIF_ILIMITS) {
  1658. dm->dqb_isoftlimit = di->dqb_isoftlimit;
  1659. dm->dqb_ihardlimit = di->dqb_ihardlimit;
  1660. check_ilim = 1;
  1661. }
  1662. if (di->dqb_valid & QIF_BTIME)
  1663. dm->dqb_btime = di->dqb_btime;
  1664. if (di->dqb_valid & QIF_ITIME)
  1665. dm->dqb_itime = di->dqb_itime;
  1666. if (check_blim) {
  1667. if (!dm->dqb_bsoftlimit || toqb(dm->dqb_curspace) < dm->dqb_bsoftlimit) {
  1668. dm->dqb_btime = 0;
  1669. clear_bit(DQ_BLKS_B, &dquot->dq_flags);
  1670. }
  1671. else if (!(di->dqb_valid & QIF_BTIME)) /* Set grace only if user hasn't provided his own... */
  1672. dm->dqb_btime = get_seconds() + dqi->dqi_bgrace;
  1673. }
  1674. if (check_ilim) {
  1675. if (!dm->dqb_isoftlimit || dm->dqb_curinodes < dm->dqb_isoftlimit) {
  1676. dm->dqb_itime = 0;
  1677. clear_bit(DQ_INODES_B, &dquot->dq_flags);
  1678. }
  1679. else if (!(di->dqb_valid & QIF_ITIME)) /* Set grace only if user hasn't provided his own... */
  1680. dm->dqb_itime = get_seconds() + dqi->dqi_igrace;
  1681. }
  1682. if (dm->dqb_bhardlimit || dm->dqb_bsoftlimit || dm->dqb_ihardlimit || dm->dqb_isoftlimit)
  1683. clear_bit(DQ_FAKE_B, &dquot->dq_flags);
  1684. else
  1685. set_bit(DQ_FAKE_B, &dquot->dq_flags);
  1686. spin_unlock(&dq_data_lock);
  1687. mark_dquot_dirty(dquot);
  1688. return 0;
  1689. }
  1690. int vfs_set_dqblk(struct super_block *sb, int type, qid_t id, struct if_dqblk *di)
  1691. {
  1692. struct dquot *dquot;
  1693. int rc;
  1694. mutex_lock(&sb_dqopt(sb)->dqonoff_mutex);
  1695. if (!(dquot = dqget(sb, id, type))) {
  1696. mutex_unlock(&sb_dqopt(sb)->dqonoff_mutex);
  1697. return -ESRCH;
  1698. }
  1699. rc = do_set_dqblk(dquot, di);
  1700. dqput(dquot);
  1701. mutex_unlock(&sb_dqopt(sb)->dqonoff_mutex);
  1702. return rc;
  1703. }
  1704. /* Generic routine for getting common part of quota file information */
  1705. int vfs_get_dqinfo(struct super_block *sb, int type, struct if_dqinfo *ii)
  1706. {
  1707. struct mem_dqinfo *mi;
  1708. mutex_lock(&sb_dqopt(sb)->dqonoff_mutex);
  1709. if (!sb_has_quota_enabled(sb, type)) {
  1710. mutex_unlock(&sb_dqopt(sb)->dqonoff_mutex);
  1711. return -ESRCH;
  1712. }
  1713. mi = sb_dqopt(sb)->info + type;
  1714. spin_lock(&dq_data_lock);
  1715. ii->dqi_bgrace = mi->dqi_bgrace;
  1716. ii->dqi_igrace = mi->dqi_igrace;
  1717. ii->dqi_flags = mi->dqi_flags & DQF_MASK;
  1718. ii->dqi_valid = IIF_ALL;
  1719. spin_unlock(&dq_data_lock);
  1720. mutex_unlock(&sb_dqopt(sb)->dqonoff_mutex);
  1721. return 0;
  1722. }
  1723. /* Generic routine for setting common part of quota file information */
  1724. int vfs_set_dqinfo(struct super_block *sb, int type, struct if_dqinfo *ii)
  1725. {
  1726. struct mem_dqinfo *mi;
  1727. mutex_lock(&sb_dqopt(sb)->dqonoff_mutex);
  1728. if (!sb_has_quota_enabled(sb, type)) {
  1729. mutex_unlock(&sb_dqopt(sb)->dqonoff_mutex);
  1730. return -ESRCH;
  1731. }
  1732. mi = sb_dqopt(sb)->info + type;
  1733. spin_lock(&dq_data_lock);
  1734. if (ii->dqi_valid & IIF_BGRACE)
  1735. mi->dqi_bgrace = ii->dqi_bgrace;
  1736. if (ii->dqi_valid & IIF_IGRACE)
  1737. mi->dqi_igrace = ii->dqi_igrace;
  1738. if (ii->dqi_valid & IIF_FLAGS)
  1739. mi->dqi_flags = (mi->dqi_flags & ~DQF_MASK) | (ii->dqi_flags & DQF_MASK);
  1740. spin_unlock(&dq_data_lock);
  1741. mark_info_dirty(sb, type);
  1742. /* Force write to disk */
  1743. sb->dq_op->write_info(sb, type);
  1744. mutex_unlock(&sb_dqopt(sb)->dqonoff_mutex);
  1745. return 0;
  1746. }
  1747. struct quotactl_ops vfs_quotactl_ops = {
  1748. .quota_on = vfs_quota_on,
  1749. .quota_off = vfs_quota_off,
  1750. .quota_sync = vfs_quota_sync,
  1751. .get_info = vfs_get_dqinfo,
  1752. .set_info = vfs_set_dqinfo,
  1753. .get_dqblk = vfs_get_dqblk,
  1754. .set_dqblk = vfs_set_dqblk
  1755. };
  1756. static ctl_table fs_dqstats_table[] = {
  1757. {
  1758. .ctl_name = FS_DQ_LOOKUPS,
  1759. .procname = "lookups",
  1760. .data = &dqstats.lookups,
  1761. .maxlen = sizeof(int),
  1762. .mode = 0444,
  1763. .proc_handler = &proc_dointvec,
  1764. },
  1765. {
  1766. .ctl_name = FS_DQ_DROPS,
  1767. .procname = "drops",
  1768. .data = &dqstats.drops,
  1769. .maxlen = sizeof(int),
  1770. .mode = 0444,
  1771. .proc_handler = &proc_dointvec,
  1772. },
  1773. {
  1774. .ctl_name = FS_DQ_READS,
  1775. .procname = "reads",
  1776. .data = &dqstats.reads,
  1777. .maxlen = sizeof(int),
  1778. .mode = 0444,
  1779. .proc_handler = &proc_dointvec,
  1780. },
  1781. {
  1782. .ctl_name = FS_DQ_WRITES,
  1783. .procname = "writes",
  1784. .data = &dqstats.writes,
  1785. .maxlen = sizeof(int),
  1786. .mode = 0444,
  1787. .proc_handler = &proc_dointvec,
  1788. },
  1789. {
  1790. .ctl_name = FS_DQ_CACHE_HITS,
  1791. .procname = "cache_hits",
  1792. .data = &dqstats.cache_hits,
  1793. .maxlen = sizeof(int),
  1794. .mode = 0444,
  1795. .proc_handler = &proc_dointvec,
  1796. },
  1797. {
  1798. .ctl_name = FS_DQ_ALLOCATED,
  1799. .procname = "allocated_dquots",
  1800. .data = &dqstats.allocated_dquots,
  1801. .maxlen = sizeof(int),
  1802. .mode = 0444,
  1803. .proc_handler = &proc_dointvec,
  1804. },
  1805. {
  1806. .ctl_name = FS_DQ_FREE,
  1807. .procname = "free_dquots",
  1808. .data = &dqstats.free_dquots,
  1809. .maxlen = sizeof(int),
  1810. .mode = 0444,
  1811. .proc_handler = &proc_dointvec,
  1812. },
  1813. {
  1814. .ctl_name = FS_DQ_SYNCS,
  1815. .procname = "syncs",
  1816. .data = &dqstats.syncs,
  1817. .maxlen = sizeof(int),
  1818. .mode = 0444,
  1819. .proc_handler = &proc_dointvec,
  1820. },
  1821. #ifdef CONFIG_PRINT_QUOTA_WARNING
  1822. {
  1823. .ctl_name = FS_DQ_WARNINGS,
  1824. .procname = "warnings",
  1825. .data = &flag_print_warnings,
  1826. .maxlen = sizeof(int),
  1827. .mode = 0644,
  1828. .proc_handler = &proc_dointvec,
  1829. },
  1830. #endif
  1831. { .ctl_name = 0 },
  1832. };
  1833. static ctl_table fs_table[] = {
  1834. {
  1835. .ctl_name = FS_DQSTATS,
  1836. .procname = "quota",
  1837. .mode = 0555,
  1838. .child = fs_dqstats_table,
  1839. },
  1840. { .ctl_name = 0 },
  1841. };
  1842. static ctl_table sys_table[] = {
  1843. {
  1844. .ctl_name = CTL_FS,
  1845. .procname = "fs",
  1846. .mode = 0555,
  1847. .child = fs_table,
  1848. },
  1849. { .ctl_name = 0 },
  1850. };
  1851. static int __init dquot_init(void)
  1852. {
  1853. int i;
  1854. unsigned long nr_hash, order;
  1855. printk(KERN_NOTICE "VFS: Disk quotas %s\n", __DQUOT_VERSION__);
  1856. register_sysctl_table(sys_table);
  1857. dquot_cachep = kmem_cache_create("dquot",
  1858. sizeof(struct dquot), sizeof(unsigned long) * 4,
  1859. (SLAB_HWCACHE_ALIGN|SLAB_RECLAIM_ACCOUNT|
  1860. SLAB_MEM_SPREAD|SLAB_PANIC),
  1861. NULL);
  1862. order = 0;
  1863. dquot_hash = (struct hlist_head *)__get_free_pages(GFP_ATOMIC, order);
  1864. if (!dquot_hash)
  1865. panic("Cannot create dquot hash table");
  1866. /* Find power-of-two hlist_heads which can fit into allocation */
  1867. nr_hash = (1UL << order) * PAGE_SIZE / sizeof(struct hlist_head);
  1868. dq_hash_bits = 0;
  1869. do {
  1870. dq_hash_bits++;
  1871. } while (nr_hash >> dq_hash_bits);
  1872. dq_hash_bits--;
  1873. nr_hash = 1UL << dq_hash_bits;
  1874. dq_hash_mask = nr_hash - 1;
  1875. for (i = 0; i < nr_hash; i++)
  1876. INIT_HLIST_HEAD(dquot_hash + i);
  1877. printk("Dquot-cache hash table entries: %ld (order %ld, %ld bytes)\n",
  1878. nr_hash, order, (PAGE_SIZE << order));
  1879. register_shrinker(&dqcache_shrinker);
  1880. #ifdef CONFIG_QUOTA_NETLINK_INTERFACE
  1881. if (genl_register_family(&quota_genl_family) != 0)
  1882. printk(KERN_ERR "VFS: Failed to create quota netlink interface.\n");
  1883. #endif
  1884. return 0;
  1885. }
/* Run dquot_init() through the module_init() hook */
module_init(dquot_init);

/* Quota format registration, statistics and the shared data lock */
EXPORT_SYMBOL(register_quota_format);
EXPORT_SYMBOL(unregister_quota_format);
EXPORT_SYMBOL(dqstats);
EXPORT_SYMBOL(dq_data_lock);
/* Generic quotactl routines (see vfs_quotactl_ops) and the mount-time helper */
EXPORT_SYMBOL(vfs_quota_on);
EXPORT_SYMBOL(vfs_quota_on_mount);
EXPORT_SYMBOL(vfs_quota_off);
EXPORT_SYMBOL(vfs_quota_sync);
EXPORT_SYMBOL(vfs_get_dqinfo);
EXPORT_SYMBOL(vfs_set_dqinfo);
EXPORT_SYMBOL(vfs_get_dqblk);
EXPORT_SYMBOL(vfs_set_dqblk);
/* Generic dquot_* routines */
EXPORT_SYMBOL(dquot_commit);
EXPORT_SYMBOL(dquot_commit_info);
EXPORT_SYMBOL(dquot_acquire);
EXPORT_SYMBOL(dquot_release);
EXPORT_SYMBOL(dquot_mark_dquot_dirty);
EXPORT_SYMBOL(dquot_initialize);
EXPORT_SYMBOL(dquot_drop);
EXPORT_SYMBOL(dquot_alloc_space);
EXPORT_SYMBOL(dquot_alloc_inode);
EXPORT_SYMBOL(dquot_free_space);
EXPORT_SYMBOL(dquot_free_inode);
EXPORT_SYMBOL(dquot_transfer);