fs.h 83 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127
71278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320132113221323132413251326132713281329133013311332133313341335133613371338133913401341134213431344134513461347134813491350135113521353135413551356135713581359136013611362136313641365136613671368136913701371137213731374137513761377137813791380138113821383138413851386138713881389139013911392139313941395139613971398139914001401140214031404140514061407140814091410141114121413141414151416141714181419142014211422142314241425142614271428142914301431143214331434143514361437143814391440144114421443144414451446144714481449145014511452145314541455145614571458145914601461146214631464146514661467146814691470147114721473147414751476147714781479148014811482148314841485148614871488148914901491149214931494149514961497149814991500150115021503150415051506150715081509151015111512151315141515151615171518151915201521152215231524152515261527152815291530153115321533153415351536153715381539154015411542154315441545154615471548154915501551155215531554155515561557155815591560156115621563156415651566156715681569157015711572157315741575157615771578157915801581158215831584158515861587158815891590159115921593159415951596159715981599160016011602160316041605160616071608160916101611161216131614161516161617161816191620162116221623162416251626162716281629163016311632163316341635163616371638163916401641164216431644164516461647164816491650165116521653165416551656165716581659166016611662166316641665166616671668166916701671167216731674167516761677167816791680168116821683168416851686168716881689169016911692169316941695169616971698169917001701170217031704170517061707170817091710171117121713171417151716171717181719172017211722172317241725172617271728172917301731173217331734173517361737173817391740174117421743174417451746174717481749175017511752175317541755175617571758175917601761176217631764176517661767176817691770177117721773177417751776177
71778177917801781178217831784178517861787178817891790179117921793179417951796179717981799180018011802180318041805180618071808180918101811181218131814181518161817181818191820182118221823182418251826182718281829183018311832183318341835183618371838183918401841184218431844184518461847184818491850185118521853185418551856185718581859186018611862186318641865186618671868186918701871187218731874187518761877187818791880188118821883188418851886188718881889189018911892189318941895189618971898189919001901190219031904190519061907190819091910191119121913191419151916191719181919192019211922192319241925192619271928192919301931193219331934193519361937193819391940194119421943194419451946194719481949195019511952195319541955195619571958195919601961196219631964196519661967196819691970197119721973197419751976197719781979198019811982198319841985198619871988198919901991199219931994199519961997199819992000200120022003200420052006200720082009201020112012201320142015201620172018201920202021202220232024202520262027202820292030203120322033203420352036203720382039204020412042204320442045204620472048204920502051205220532054205520562057205820592060206120622063206420652066206720682069207020712072207320742075207620772078207920802081208220832084208520862087208820892090209120922093209420952096209720982099210021012102210321042105210621072108210921102111211221132114211521162117211821192120212121222123212421252126212721282129213021312132213321342135213621372138213921402141214221432144214521462147214821492150215121522153215421552156215721582159216021612162216321642165216621672168216921702171217221732174217521762177217821792180218121822183218421852186218721882189219021912192219321942195219621972198219922002201220222032204220522062207220822092210221122122213221422152216221722182219222022212222222322242225222622272228222922302231223222332234223522362237223822392240224122422243224422452246224722482249225022512252225322542255225622572258225922602261226222632264226522662267226822692270227122722273227422752276227
72278227922802281228222832284228522862287228822892290229122922293229422952296229722982299230023012302230323042305230623072308230923102311231223132314231523162317231823192320232123222323232423252326232723282329233023312332233323342335233623372338233923402341234223432344234523462347234823492350235123522353235423552356235723582359236023612362236323642365236623672368236923702371237223732374237523762377237823792380238123822383238423852386238723882389239023912392239323942395239623972398239924002401240224032404240524062407240824092410241124122413241424152416241724182419242024212422242324242425242624272428242924302431243224332434243524362437243824392440244124422443244424452446244724482449
  1. #ifndef _LINUX_FS_H
  2. #define _LINUX_FS_H
  3. /*
  4. * This file has definitions for some important file table
  5. * structures etc.
  6. */
  7. #include <linux/limits.h>
  8. #include <linux/ioctl.h>
  9. /*
  10. * It's silly to have NR_OPEN bigger than NR_FILE, but you can change
  11. * the file limit at runtime and only root can increase the per-process
  12. * nr_file rlimit, so it's safe to set up a ridiculously high absolute
  13. * upper limit on files-per-process.
  14. *
  15. * Some programs (notably those using select()) may have to be
  16. * recompiled to take full advantage of the new limits..
  17. */
  /* Fixed constants first: */
  #undef NR_OPEN
  #define INR_OPEN 1024 /* Initial setting for nfile rlimits */

  /* BLOCK_SIZE is derived from BLOCK_SIZE_BITS: 1 << 10 == 1024. */
  #define BLOCK_SIZE_BITS 10
  #define BLOCK_SIZE (1<<BLOCK_SIZE_BITS)

  /* Seek origins. SEEK_MAX names the largest origin value defined here. */
  #define SEEK_SET 0 /* seek relative to beginning of file */
  #define SEEK_CUR 1 /* seek relative to current file position */
  #define SEEK_END 2 /* seek relative to end of file */
  #define SEEK_MAX SEEK_END
  /* And dynamically-tunable limits and defaults: */

  /*
   * File table counters. The first two fields are marked read only and
   * max_files is marked tunable; the field order is kept exactly as
   * declared.
   */
  struct files_stat_struct {
      int nr_files;       /* read only */
      int nr_free_files;  /* read only */
      int max_files;      /* tunable */
  };
  /*
   * Inode counters. The trailing dummy[] array only pads the structure
   * for sysctl ABI compatibility, so its size must not change.
   */
  struct inodes_stat_t {
      int nr_inodes;
      int nr_unused;
      int dummy[5];  /* padding for sysctl ABI compatibility */
  };
  #define NR_FILE 8192 /* this can well be larger on a larger system */

  /*
   * MAY_* values are distinct single bits, so they can be or-ed together
   * into one mask.
   */
  #define MAY_EXEC 1
  #define MAY_WRITE 2
  #define MAY_READ 4
  #define MAY_APPEND 8
  #define MAY_ACCESS 16
  #define MAY_OPEN 32
  /*
   * flags in file.f_mode. Note that FMODE_READ and FMODE_WRITE must correspond
   * to O_WRONLY and O_RDWR via the strange trick in __dentry_open()
   *
   * Every value is a single bit cast to fmode_t with __force; both names
   * come from outside this block.
   */

  /* file is open for reading */
  #define FMODE_READ ((__force fmode_t)1)
  /* file is open for writing */
  #define FMODE_WRITE ((__force fmode_t)2)
  /* file is seekable */
  #define FMODE_LSEEK ((__force fmode_t)4)
  /* file can be accessed using pread */
  #define FMODE_PREAD ((__force fmode_t)8)
  /* file can be accessed using pwrite */
  #define FMODE_PWRITE ((__force fmode_t)16)
  /* File is opened for execution with sys_execve / sys_uselib */
  #define FMODE_EXEC ((__force fmode_t)32)
  /* File is opened with O_NDELAY (only set for block devices) */
  #define FMODE_NDELAY ((__force fmode_t)64)
  /* File is opened with O_EXCL (only set for block devices) */
  #define FMODE_EXCL ((__force fmode_t)128)
  /*
   * File is opened using open(.., 3, ..) and is writeable only for ioctls
   * (special hack for floppy.c)
   */
  #define FMODE_WRITE_IOCTL ((__force fmode_t)256)

  /*
   * Don't update ctime and mtime.
   *
   * Currently a special hack for the XFS open_by_handle ioctl, but we'll
   * hopefully graduate it to a proper O_CMTIME flag supported by open(2) soon.
   */
  #define FMODE_NOCMTIME ((__force fmode_t)2048)
  /*
   * The below are the various read and write types that we support. Some of
   * them include behavioral modifiers that send information down to the
   * block layer and IO scheduler. Terminology:
   *
   *  The block layer uses device plugging to defer IO a little bit, in
   *  the hope that we will see more IO very shortly. This increases
   *  coalescing of adjacent IO and thus reduces the number of IOs we
   *  have to send to the device. It also allows for better queuing,
   *  if the IO isn't mergeable. If the caller is going to be waiting
   *  for the IO, then he must ensure that the device is unplugged so
   *  that the IO is dispatched to the driver.
   *
   *  All IO is handled async in Linux. This is fine for background
   *  writes, but for reads or writes that someone waits for completion
   *  on, we want to notify the block layer and IO scheduler so that they
   *  know about it. That allows them to make better scheduling
   *  decisions. So when the below references 'sync' and 'async', it
   *  is referencing this priority hint.
   *
   * With that in mind, the available types are:
   *
   * READ              A normal read operation. Device will be plugged.
   * READ_SYNC         A synchronous read. Device is not plugged, caller can
   *                   immediately wait on this read without caring about
   *                   unplugging.
   * READA             Used for read-ahead operations. Lower priority, and the
   *                   block layer could (in theory) choose to ignore this
   *                   request if it runs into resource problems.
   * WRITE             A normal async write. Device will be plugged.
   * SWRITE            Like WRITE, but a special case for ll_rw_block() that
   *                   tells it to lock the buffer first. Normally a buffer
   *                   must be locked before doing IO.
   * WRITE_SYNC_PLUG   Synchronous write. Identical to WRITE, but passes down
   *                   the hint that someone will be waiting on this IO
   *                   shortly. The device must still be unplugged explicitly,
   *                   WRITE_SYNC_PLUG does not do this as we could be
   *                   submitting more writes before we actually wait on any
   *                   of them.
   * WRITE_SYNC        Like WRITE_SYNC_PLUG, but also unplugs the device
   *                   immediately after submission. The write equivalent
   *                   of READ_SYNC.
   * WRITE_ODIRECT     Special case write for O_DIRECT only.
   * SWRITE_SYNC
   * SWRITE_SYNC_PLUG  Like WRITE_SYNC/WRITE_SYNC_PLUG, but locks the buffer.
   *                   See SWRITE.
   * WRITE_BARRIER     Like WRITE, but tells the block layer that all
   *                   previously submitted writes must be safely on storage
   *                   before this one is started. Also guarantees that when
   *                   this write is complete, it itself is also safely on
   *                   storage. Prevents reordering of writes on both sides
   *                   of this IO.
   *
   */
  #define RW_MASK 1
  #define RWA_MASK 2

  /* Base request types. The BIO_RW_* bit numbers used below come from elsewhere. */
  #define READ 0
  #define WRITE 1
  #define READA 2 /* read-ahead - don't block if no resources */
  #define SWRITE 3 /* for ll_rw_block() - wait for buffer lock */

  /* Base type or-ed with modifier bits. */
  #define READ_SYNC (READ | (1 << BIO_RW_SYNCIO) | (1 << BIO_RW_UNPLUG))
  #define READ_META (READ | (1 << BIO_RW_META))
  #define WRITE_SYNC_PLUG (WRITE | (1 << BIO_RW_SYNCIO) | (1 << BIO_RW_NOIDLE))
  #define WRITE_SYNC (WRITE_SYNC_PLUG | (1 << BIO_RW_UNPLUG))
  #define WRITE_ODIRECT (WRITE | (1 << BIO_RW_SYNCIO) | (1 << BIO_RW_UNPLUG))
  #define SWRITE_SYNC_PLUG \
      (SWRITE | (1 << BIO_RW_SYNCIO) | (1 << BIO_RW_NOIDLE))
  #define SWRITE_SYNC (SWRITE_SYNC_PLUG | (1 << BIO_RW_UNPLUG))
  #define WRITE_BARRIER (WRITE | (1 << BIO_RW_BARRIER))

  /*
   * These aren't really reads or writes, they pass down information about
   * parts of device that are now unused by the file system.
   */
  #define DISCARD_NOBARRIER (1 << BIO_RW_DISCARD)
  #define DISCARD_BARRIER ((1 << BIO_RW_DISCARD) | (1 << BIO_RW_BARRIER))
  /* SEL_* values are distinct single bits. */
  #define SEL_IN 1
  #define SEL_OUT 2
  #define SEL_EX 4

  /* public flags for file_system_type */
  #define FS_REQUIRES_DEV 1
  #define FS_BINARY_MOUNTDATA 2
  #define FS_HAS_SUBTYPE 4
  #define FS_REVAL_DOT 16384 /* Check the paths ".", ".." for staleness */
  #define FS_RENAME_DOES_D_MOVE 32768 /* FS will handle d_move()
                                       * during rename() internally.
                                       */
  /*
   * These are the fs-independent mount-flags: up to 32 flags are supported
   */
  #define MS_RDONLY 1 /* Mount read-only */
  #define MS_NOSUID 2 /* Ignore suid and sgid bits */
  #define MS_NODEV 4 /* Disallow access to device special files */
  #define MS_NOEXEC 8 /* Disallow program execution */
  #define MS_SYNCHRONOUS 16 /* Writes are synced at once */
  #define MS_REMOUNT 32 /* Alter flags of a mounted FS */
  #define MS_MANDLOCK 64 /* Allow mandatory locks on an FS */
  #define MS_DIRSYNC 128 /* Directory modifications are synchronous */
  #define MS_NOATIME 1024 /* Do not update access times. */
  #define MS_NODIRATIME 2048 /* Do not update directory access times */
  #define MS_BIND 4096
  #define MS_MOVE 8192
  #define MS_REC 16384
  #define MS_VERBOSE 32768 /* War is peace. Verbosity is silence.
                              MS_VERBOSE is deprecated. */
  #define MS_SILENT 32768 /* same bit as MS_VERBOSE */
  #define MS_POSIXACL (1<<16) /* VFS does not apply the umask */
  #define MS_UNBINDABLE (1<<17) /* change to unbindable */
  #define MS_PRIVATE (1<<18) /* change to private */
  #define MS_SLAVE (1<<19) /* change to slave */
  #define MS_SHARED (1<<20) /* change to shared */
  #define MS_RELATIME (1<<21) /* Update atime relative to mtime/ctime. */
  #define MS_KERNMOUNT (1<<22) /* this is a kern_mount call */
  #define MS_I_VERSION (1<<23) /* Update inode I_version field */
  #define MS_STRICTATIME (1<<24) /* Always perform atime updates */
  #define MS_ACTIVE (1<<30)
  /*
   * NOTE(review): 1<<31 shifts into the sign bit of a 32-bit int. The
   * spelling is left untouched because the expression's type is visible to
   * every user of the macro; confirm before changing it to an unsigned shift.
   */
  #define MS_NOUSER (1<<31)

  /*
   * Superblock flags that can be altered by MS_REMOUNT
   */
  #define MS_RMT_MASK (MS_RDONLY|MS_SYNCHRONOUS|MS_MANDLOCK|MS_I_VERSION)

  /*
   * Old magic mount flag and mask
   */
  #define MS_MGC_VAL 0xC0ED0000
  #define MS_MGC_MSK 0xffff0000
  /* Inode flags - they have nothing to do with superblock flags now */
  #define S_SYNC 1 /* Writes are synced at once */
  #define S_NOATIME 2 /* Do not update access times */
  #define S_APPEND 4 /* Append-only file */
  #define S_IMMUTABLE 8 /* Immutable file */
  #define S_DEAD 16 /* removed, but still open directory */
  #define S_NOQUOTA 32 /* Inode is not counted to quota */
  #define S_DIRSYNC 64 /* Directory modifications are synchronous */
  #define S_NOCMTIME 128 /* Do not update file c/mtime */
  #define S_SWAPFILE 256 /* Do not truncate: swapon got its bmaps */
  #define S_PRIVATE 512 /* Inode is fs-internal */

  /*
   * Note that nosuid etc flags are inode-specific: setting some file-system
   * flags just means all the inodes inherit those flags by default. It might be
   * possible to override it selectively if you really wanted to with some
   * ioctl() that is not currently implemented.
   *
   * Exception: MS_RDONLY is always applied to the entire file system.
   *
   * Unfortunately, it is possible to change a filesystems flags with it mounted
   * with files in use. This means that all of the inodes will not have their
   * i_flags updated. Hence, i_flags no longer inherit the superblock mount
   * flags, so these have to be checked separately. -- rmk@arm.uk.linux.org
   */

  /* Tests superblock flag(s) through inode->i_sb->s_flags. */
  #define __IS_FLG(inode,flg) ((inode)->i_sb->s_flags & (flg))

  /*
   * Predicates on an inode pointer. Each expands to a bit-and (or a logical
   * or of two such tests), so the result is zero/non-zero, not strictly 0/1.
   */
  #define IS_RDONLY(inode) ((inode)->i_sb->s_flags & MS_RDONLY)
  #define IS_SYNC(inode) (__IS_FLG(inode, MS_SYNCHRONOUS) || \
      ((inode)->i_flags & S_SYNC))
  #define IS_DIRSYNC(inode) (__IS_FLG(inode, MS_SYNCHRONOUS|MS_DIRSYNC) || \
      ((inode)->i_flags & (S_SYNC|S_DIRSYNC)))
  #define IS_MANDLOCK(inode) __IS_FLG(inode, MS_MANDLOCK)
  #define IS_NOATIME(inode) __IS_FLG(inode, MS_RDONLY|MS_NOATIME)
  #define IS_I_VERSION(inode) __IS_FLG(inode, MS_I_VERSION)

  #define IS_NOQUOTA(inode) ((inode)->i_flags & S_NOQUOTA)
  #define IS_APPEND(inode) ((inode)->i_flags & S_APPEND)
  #define IS_IMMUTABLE(inode) ((inode)->i_flags & S_IMMUTABLE)
  #define IS_POSIXACL(inode) __IS_FLG(inode, MS_POSIXACL)

  #define IS_DEADDIR(inode) ((inode)->i_flags & S_DEAD)
  #define IS_NOCMTIME(inode) ((inode)->i_flags & S_NOCMTIME)
  #define IS_SWAPFILE(inode) ((inode)->i_flags & S_SWAPFILE)
  #define IS_PRIVATE(inode) ((inode)->i_flags & S_PRIVATE)
  /* the read-only stuff doesn't really belong here, but any other place is
     probably as bad and I don't want to create yet another include file. */

  /* Block device ioctls, all in the 0x12 group. */
  #define BLKROSET _IO(0x12,93) /* set device read-only (0 = read-write) */
  #define BLKROGET _IO(0x12,94) /* get read-only status (0 = read_write) */
  #define BLKRRPART _IO(0x12,95) /* re-read partition table */
  #define BLKGETSIZE _IO(0x12,96) /* return device size /512 (long *arg) */
  #define BLKFLSBUF _IO(0x12,97) /* flush buffer cache */
  #define BLKRASET _IO(0x12,98) /* set read ahead for block device */
  #define BLKRAGET _IO(0x12,99) /* get current read ahead setting */
  #define BLKFRASET _IO(0x12,100)/* set filesystem (mm/filemap.c) read-ahead */
  #define BLKFRAGET _IO(0x12,101)/* get filesystem (mm/filemap.c) read-ahead */
  #define BLKSECTSET _IO(0x12,102)/* set max sectors per request (ll_rw_blk.c) */
  #define BLKSECTGET _IO(0x12,103)/* get max sectors per request (ll_rw_blk.c) */
  #define BLKSSZGET _IO(0x12,104)/* get block device sector size */
  #if 0
  #define BLKPG _IO(0x12,105)/* See blkpg.h */

  /* Some people are morons. Do not use sizeof! */

  #define BLKELVGET _IOR(0x12,106,size_t)/* elevator get */
  #define BLKELVSET _IOW(0x12,107,size_t)/* elevator set */
  /* This was here just to show that the number is taken -
     probably all these _IO(0x12,*) ioctls should be moved to blkpg.h. */
  #endif
  /* A jump here: 108-111 have been used for various private purposes. */
  #define BLKBSZGET _IOR(0x12,112,size_t)
  #define BLKBSZSET _IOW(0x12,113,size_t)
  /*
   * NOTE(review): encoded with size_t although the argument is documented
   * as u64 *. The encoding is deliberately left exactly as found.
   */
  #define BLKGETSIZE64 _IOR(0x12,114,size_t) /* return device size in bytes (u64 *arg) */
  #define BLKTRACESETUP _IOWR(0x12,115,struct blk_user_trace_setup)
  #define BLKTRACESTART _IO(0x12,116)
  #define BLKTRACESTOP _IO(0x12,117)
  #define BLKTRACETEARDOWN _IO(0x12,118)
  #define BLKDISCARD _IO(0x12,119)

  #define BMAP_IOCTL 1 /* obsolete - kept for compatibility */
  #define FIBMAP _IO(0x00,1) /* bmap access */
  #define FIGETBSZ _IO(0x00,2) /* get the block size used for bmap */
  #define FIFREEZE _IOWR('X', 119, int) /* Freeze */
  #define FITHAW _IOWR('X', 120, int) /* Thaw */

  /* The FS_IOC_* forms are encoded with long; the FS_IOC32_* forms use int. */
  #define FS_IOC_GETFLAGS _IOR('f', 1, long)
  #define FS_IOC_SETFLAGS _IOW('f', 2, long)
  #define FS_IOC_GETVERSION _IOR('v', 1, long)
  #define FS_IOC_SETVERSION _IOW('v', 2, long)
  #define FS_IOC_FIEMAP _IOWR('f', 11, struct fiemap)
  #define FS_IOC32_GETFLAGS _IOR('f', 1, int)
  #define FS_IOC32_SETFLAGS _IOW('f', 2, int)
  #define FS_IOC32_GETVERSION _IOR('v', 1, int)
  #define FS_IOC32_SETVERSION _IOW('v', 2, int)
  /*
   * Inode flags (FS_IOC_GETFLAGS / FS_IOC_SETFLAGS)
   */
  #define FS_SECRM_FL 0x00000001 /* Secure deletion */
  #define FS_UNRM_FL 0x00000002 /* Undelete */
  #define FS_COMPR_FL 0x00000004 /* Compress file */
  #define FS_SYNC_FL 0x00000008 /* Synchronous updates */
  #define FS_IMMUTABLE_FL 0x00000010 /* Immutable file */
  #define FS_APPEND_FL 0x00000020 /* writes to file may only append */
  #define FS_NODUMP_FL 0x00000040 /* do not dump file */
  #define FS_NOATIME_FL 0x00000080 /* do not update atime */
  /* Reserved for compression usage... */
  #define FS_DIRTY_FL 0x00000100
  #define FS_COMPRBLK_FL 0x00000200 /* One or more compressed clusters */
  #define FS_NOCOMP_FL 0x00000400 /* Don't compress */
  #define FS_ECOMPR_FL 0x00000800 /* Compression error */
  /* End compression flags --- maybe not all used */
  /* FS_BTREE_FL and FS_INDEX_FL share the same bit (0x1000). */
  #define FS_BTREE_FL 0x00001000 /* btree format dir */
  #define FS_INDEX_FL 0x00001000 /* hash-indexed directory */
  #define FS_IMAGIC_FL 0x00002000 /* AFS directory */
  #define FS_JOURNAL_DATA_FL 0x00004000 /* Reserved for ext3 */
  #define FS_NOTAIL_FL 0x00008000 /* file tail should not be merged */
  #define FS_DIRSYNC_FL 0x00010000 /* dirsync behaviour (directories only) */
  #define FS_TOPDIR_FL 0x00020000 /* Top of directory hierarchies*/
  #define FS_EXTENT_FL 0x00080000 /* Extents */
  #define FS_DIRECTIO_FL 0x00100000 /* Use direct i/o */
  #define FS_RESERVED_FL 0x80000000 /* reserved for ext2 lib */

  /* The modifiable mask is a subset of the visible mask. */
  #define FS_FL_USER_VISIBLE 0x0003DFFF /* User visible flags */
  #define FS_FL_USER_MODIFIABLE 0x000380FF /* User modifiable flags */

  /* SYNC_FILE_RANGE_* values are distinct single bits. */
  #define SYNC_FILE_RANGE_WAIT_BEFORE 1
  #define SYNC_FILE_RANGE_WRITE 2
  #define SYNC_FILE_RANGE_WAIT_AFTER 4
  318. #ifdef __KERNEL__
  319. #include <linux/linkage.h>
  320. #include <linux/wait.h>
  321. #include <linux/types.h>
  322. #include <linux/kdev_t.h>
  323. #include <linux/dcache.h>
  324. #include <linux/path.h>
  325. #include <linux/stat.h>
  326. #include <linux/cache.h>
  327. #include <linux/kobject.h>
  328. #include <linux/list.h>
  329. #include <linux/radix-tree.h>
  330. #include <linux/prio_tree.h>
  331. #include <linux/init.h>
  332. #include <linux/pid.h>
  333. #include <linux/mutex.h>
  334. #include <linux/capability.h>
  335. #include <linux/semaphore.h>
  336. #include <linux/fiemap.h>
  337. #include <asm/atomic.h>
  338. #include <asm/byteorder.h>
  339. struct export_operations;
  340. struct hd_geometry;
  341. struct iovec;
  342. struct nameidata;
  343. struct kiocb;
  344. struct pipe_inode_info;
  345. struct poll_table_struct;
  346. struct kstatfs;
  347. struct vm_area_struct;
  348. struct vfsmount;
  349. struct cred;
  350. extern void __init inode_init(void);
  351. extern void __init inode_init_early(void);
  352. extern void __init files_init(unsigned long);
  353. extern struct files_stat_struct files_stat;
  354. extern int get_max_files(void);
  355. extern int sysctl_nr_open;
  356. extern struct inodes_stat_t inodes_stat;
  357. extern int leases_enable, lease_break_time;
  358. #ifdef CONFIG_DNOTIFY
  359. extern int dir_notify_enable;
  360. #endif
  361. struct buffer_head;
  362. typedef int (get_block_t)(struct inode *inode, sector_t iblock,
  363. struct buffer_head *bh_result, int create);
  364. typedef void (dio_iodone_t)(struct kiocb *iocb, loff_t offset,
  365. ssize_t bytes, void *private);
  /*
   * Attribute flags. These should be or-ed together to figure out what
   * has been changed!
   */
  #define ATTR_MODE (1 << 0)
  #define ATTR_UID (1 << 1)
  #define ATTR_GID (1 << 2)
  #define ATTR_SIZE (1 << 3)
  #define ATTR_ATIME (1 << 4)
  #define ATTR_MTIME (1 << 5)
  #define ATTR_CTIME (1 << 6)
  #define ATTR_ATIME_SET (1 << 7)
  #define ATTR_MTIME_SET (1 << 8)
  #define ATTR_FORCE (1 << 9) /* Not a change, but a change it */
  #define ATTR_ATTR_FLAG (1 << 10)
  #define ATTR_KILL_SUID (1 << 11)
  #define ATTR_KILL_SGID (1 << 12)
  #define ATTR_FILE (1 << 13)
  #define ATTR_KILL_PRIV (1 << 14)
  #define ATTR_OPEN (1 << 15) /* Truncating from open(O_TRUNC) */
  #define ATTR_TIMES_SET (1 << 16)
  387. /*
  388. * This is the Inode Attributes structure, used for notify_change(). It
  389. * uses the above definitions as flags, to know which values have changed.
  390. * Also, in this manner, a Filesystem can look at only the values it cares
  391. * about. Basically, these are the attributes that the VFS layer can
  392. * request to change from the FS layer.
  393. *
  394. * Derek Atkins <warlord@MIT.EDU> 94-10-20
  395. */
  396. struct iattr {
  397. unsigned int ia_valid;
  398. umode_t ia_mode;
  399. uid_t ia_uid;
  400. gid_t ia_gid;
  401. loff_t ia_size;
  402. struct timespec ia_atime;
  403. struct timespec ia_mtime;
  404. struct timespec ia_ctime;
  405. /*
  406. * Not an attribute, but an auxilary info for filesystems wanting to
  407. * implement an ftruncate() like method. NOTE: filesystem should
  408. * check for (ia_valid & ATTR_FILE), and not for (ia_file != NULL).
  409. */
  410. struct file *ia_file;
  411. };
  412. /*
  413. * Includes for diskquotas.
  414. */
  415. #include <linux/quota.h>
  /**
   * enum positive_aop_returns - aop return codes with specific semantics
   *
   * @AOP_WRITEPAGE_ACTIVATE: Informs the caller that page writeback has
   *                          completed, that the page is still locked, and
   *                          should be considered active. The VM uses this hint
   *                          to return the page to the active list -- it won't
   *                          be a candidate for writeback again in the near
   *                          future. Other callers must be careful to unlock
   *                          the page if they get this return. Returned by
   *                          writepage();
   *
   * @AOP_TRUNCATED_PAGE: The AOP method that was handed a locked page has
   *                      unlocked it and the page might have been truncated.
   *                      The caller should back up to acquiring a new page and
   *                      trying again. The aop will be taking reasonable
   *                      precautions not to livelock. If the caller held a page
   *                      reference, it should drop it before retrying. Returned
   *                      by readpage().
   *
   * address_space_operation functions return these large constants to indicate
   * special semantics to the caller. These are much larger than the bytes in a
   * page to allow for functions that return the number of bytes operated on in a
   * given page.
   */
  enum positive_aop_returns {
      AOP_WRITEPAGE_ACTIVATE = 0x80000,
      AOP_TRUNCATED_PAGE = 0x80001,
  };
  /* AOP_FLAG_* values are distinct single bits. */
  #define AOP_FLAG_UNINTERRUPTIBLE 0x0001 /* will not do a short write */
  #define AOP_FLAG_CONT_EXPAND 0x0002 /* called from cont_expand */
  #define AOP_FLAG_NOFS 0x0004 /* used by filesystem to direct
                                * helper code (eg buffer layer)
                                * to clear GFP_FS from alloc */
  /*
   * oh the beauties of C type declarations.
   */
  struct page;
  struct address_space;
  struct writeback_control;

  /*
   * Iterator state over an array of iovec segments.
   */
  struct iov_iter {
      const struct iovec *iov;   /* segment array supplied by the caller */
      unsigned long nr_segs;     /* number of entries in iov */
      size_t iov_offset;         /* presumably the offset into the current
                                  * segment - confirm against iov_iter_advance() */
      size_t count;              /* value reported by iov_iter_count() */
  };

  /* Implemented elsewhere; only the prototypes are visible here. */
  size_t iov_iter_copy_from_user_atomic(struct page *page,
          struct iov_iter *i, unsigned long offset, size_t bytes);
  size_t iov_iter_copy_from_user(struct page *page,
          struct iov_iter *i, unsigned long offset, size_t bytes);
  void iov_iter_advance(struct iov_iter *i, size_t bytes);
  int iov_iter_fault_in_readable(struct iov_iter *i, size_t bytes);
  size_t iov_iter_single_seg_count(struct iov_iter *i);

  /*
   * iov_iter_init - set up @i over @iov / @nr_segs.
   *
   * The iterator starts at offset 0 with a count of @count + @written and is
   * then advanced by @written via iov_iter_advance(), so the order of the
   * last two statements matters.
   */
  static inline void iov_iter_init(struct iov_iter *i,
          const struct iovec *iov, unsigned long nr_segs,
          size_t count, size_t written)
  {
      i->iov = iov;
      i->nr_segs = nr_segs;
      i->iov_offset = 0;
      i->count = count + written;

      iov_iter_advance(i, written);
  }

  /* iov_iter_count - return the count field of @i. */
  static inline size_t iov_iter_count(struct iov_iter *i)
  {
      return i->count;
  }
  483. /*
  484. * "descriptor" for what we're up to with a read.
  485. * This allows us to use the same read code yet
  486. * have multiple different users of the data that
  487. * we read from a file.
  488. *
  489. * The simplest case just copies the data to user
  490. * mode.
  491. */
typedef struct {
	size_t written;		/* NOTE(review): presumably bytes handed out so far - confirm */
	size_t count;		/* NOTE(review): presumably bytes still wanted - confirm */
	union {
		char __user *buf;	/* destination when it is a user-space buffer */
		void *data;		/* opaque destination for other users */
	} arg;
	int error;		/* NOTE(review): presumably 0 or a -errno - confirm */
} read_descriptor_t;

/*
 * Callback type that receives a read descriptor, a page and two unsigned
 * long values, and returns an int.
 * NOTE(review): the two unsigned longs look like an offset and a size
 * within the page - confirm against the callers.
 */
typedef int (*read_actor_t)(read_descriptor_t *, struct page *,
		unsigned long, unsigned long);
/*
 * Method table of an address_space; struct address_space points at one
 * of these through its a_ops member.
 */
struct address_space_operations {
	int (*writepage)(struct page *page, struct writeback_control *wbc);
	int (*readpage)(struct file *, struct page *);
	void (*sync_page)(struct page *);

	/* Write back some dirty pages from this mapping. */
	int (*writepages)(struct address_space *, struct writeback_control *);

	/* Set a page dirty.  Return true if this dirtied it */
	int (*set_page_dirty)(struct page *page);

	int (*readpages)(struct file *filp, struct address_space *mapping,
			struct list_head *pages, unsigned nr_pages);

	/*
	 * Paired write hooks; general code reaches them through
	 * pagecache_write_begin()/pagecache_write_end(), which take the
	 * same argument lists.
	 */
	int (*write_begin)(struct file *, struct address_space *mapping,
				loff_t pos, unsigned len, unsigned flags,
				struct page **pagep, void **fsdata);
	int (*write_end)(struct file *, struct address_space *mapping,
				loff_t pos, unsigned len, unsigned copied,
				struct page *page, void *fsdata);

	/* Unfortunately this kludge is needed for FIBMAP. Don't use it */
	sector_t (*bmap)(struct address_space *, sector_t);
	void (*invalidatepage) (struct page *, unsigned long);
	int (*releasepage) (struct page *, gfp_t);
	ssize_t (*direct_IO)(int, struct kiocb *, const struct iovec *iov,
			loff_t offset, unsigned long nr_segs);
	int (*get_xip_mem)(struct address_space *, pgoff_t, int,
						void **, unsigned long *);
	/* migrate the contents of a page to the specified target */
	int (*migratepage) (struct address_space *,
			struct page *, struct page *);
	int (*launder_page) (struct page *);
	int (*is_partially_uptodate) (struct page *, read_descriptor_t *,
					unsigned long);
};
  534. /*
  535. * pagecache_write_begin/pagecache_write_end must be used by general code
  536. * to write into the pagecache.
  537. */
  538. int pagecache_write_begin(struct file *, struct address_space *mapping,
  539. loff_t pos, unsigned len, unsigned flags,
  540. struct page **pagep, void **fsdata);
  541. int pagecache_write_end(struct file *, struct address_space *mapping,
  542. loff_t pos, unsigned len, unsigned copied,
  543. struct page *page, void *fsdata);
  544. struct backing_dev_info;
/*
 * Page-cache bookkeeping for one object (see @host).  The structure is
 * explicitly aligned to sizeof(long).
 */
struct address_space {
	struct inode		*host;		/* owner: inode, block_device */
	struct radix_tree_root	page_tree;	/* radix tree of all pages */
	spinlock_t		tree_lock;	/* and lock protecting it */
	unsigned int		i_mmap_writable;/* count VM_SHARED mappings */
	struct prio_tree_root	i_mmap;		/* tree of private and shared mappings */
	struct list_head	i_mmap_nonlinear;/*list VM_NONLINEAR mappings */
	spinlock_t		i_mmap_lock;	/* protect tree, count, list */
	unsigned int		truncate_count;	/* Cover race condition with truncate */
	unsigned long		nrpages;	/* number of total pages */
	pgoff_t			writeback_index;/* writeback starts here */
	const struct address_space_operations *a_ops;	/* methods */
	unsigned long		flags;		/* error bits/gfp mask */
	struct backing_dev_info *backing_dev_info; /* device readahead, etc */
	spinlock_t		private_lock;	/* for use by the address_space */
	struct list_head	private_list;	/* ditto */
	struct address_space	*assoc_mapping;	/* ditto */
} __attribute__((aligned(sizeof(long))));
	/*
	 * On most architectures that alignment is already the case; but
	 * must be enforced here for CRIS, to let the least significant bit
	 * of struct page's "mapping" pointer be used for PAGE_MAPPING_ANON.
	 */
/* In-kernel description of a block device. */
struct block_device {
	dev_t			bd_dev;  /* not a kdev_t - it's a search key */
	struct inode *		bd_inode;	/* will die */
	struct super_block *	bd_super;
	int			bd_openers;
	struct mutex		bd_mutex;	/* open/close mutex */
	struct semaphore	bd_mount_sem;
	struct list_head	bd_inodes;
	void *			bd_holder;
	int			bd_holders;
#ifdef CONFIG_SYSFS
	/* Only present when sysfs support is configured in. */
	struct list_head	bd_holder_list;
#endif
	struct block_device *	bd_contains;
	unsigned		bd_block_size;
	struct hd_struct *	bd_part;
	/* number of times partitions within this device have been opened. */
	unsigned		bd_part_count;
	int			bd_invalidated;
	struct gendisk *	bd_disk;
	struct list_head	bd_list;
	struct backing_dev_info *bd_inode_backing_dev_info;
	/*
	 * Private data.  You must have bd_claim'ed the block_device
	 * to use this.  NOTE:  bd_claim allows an owner to claim
	 * the same device multiple times, the owner must take special
	 * care to not mess up bd_private for that case.
	 */
	unsigned long		bd_private;

	/* The counter of freeze processes */
	int			bd_fsfreeze_count;
	/* Mutex for freeze */
	struct mutex		bd_fsfreeze_mutex;
};
  602. /*
  603. * Radix-tree tags, for tagging dirty and writeback pages within the pagecache
  604. * radix trees
  605. */
  606. #define PAGECACHE_TAG_DIRTY 0
  607. #define PAGECACHE_TAG_WRITEBACK 1
  608. int mapping_tagged(struct address_space *mapping, int tag);
  609. /*
  610. * Might pages of this file be mapped into userspace?
  611. */
  612. static inline int mapping_mapped(struct address_space *mapping)
  613. {
  614. return !prio_tree_empty(&mapping->i_mmap) ||
  615. !list_empty(&mapping->i_mmap_nonlinear);
  616. }
  617. /*
  618. * Might pages of this file have been modified in userspace?
  619. * Note that i_mmap_writable counts all VM_SHARED vmas: do_mmap_pgoff
  620. * marks vma as VM_SHARED if it is shared, and the file was opened for
  621. * writing i.e. vma may be mprotected writable even if now readonly.
  622. */
  623. static inline int mapping_writably_mapped(struct address_space *mapping)
  624. {
  625. return mapping->i_mmap_writable != 0;
  626. }
  627. /*
  628. * Use sequence counter to get consistent i_size on 32-bit processors.
  629. */
  630. #if BITS_PER_LONG==32 && defined(CONFIG_SMP)
  631. #include <linux/seqlock.h>
  632. #define __NEED_I_SIZE_ORDERED
  633. #define i_size_ordered_init(inode) seqcount_init(&inode->i_size_seqcount)
  634. #else
  635. #define i_size_ordered_init(inode) do { } while (0)
  636. #endif
/* In-memory inode, the VFS view of one filesystem object. */
struct inode {
	struct hlist_node	i_hash;
	struct list_head	i_list;
	struct list_head	i_sb_list;
	struct list_head	i_dentry;
	unsigned long		i_ino;
	atomic_t		i_count;
	unsigned int		i_nlink;
	uid_t			i_uid;
	gid_t			i_gid;
	dev_t			i_rdev;		/* decoded by iminor()/imajor() */
	u64			i_version;
	loff_t			i_size;		/* use i_size_read()/i_size_write() */
#ifdef __NEED_I_SIZE_ORDERED
	seqcount_t		i_size_seqcount; /* makes i_size reads consistent on 32-bit SMP */
#endif
	struct timespec		i_atime;
	struct timespec		i_mtime;
	struct timespec		i_ctime;
	blkcnt_t		i_blocks;
	unsigned int		i_blkbits;
	unsigned short          i_bytes;
	umode_t			i_mode;
	spinlock_t		i_lock;	/* i_blocks, i_bytes, maybe i_size */
	struct mutex		i_mutex; /* nesting classes: enum inode_i_mutex_lock_class */
	struct rw_semaphore	i_alloc_sem;
	const struct inode_operations	*i_op;
	const struct file_operations	*i_fop;	/* former ->i_op->default_file_ops */
	struct super_block	*i_sb;
	struct file_lock	*i_flock;
	struct address_space	*i_mapping;
	struct address_space	i_data;
#ifdef CONFIG_QUOTA
	struct dquot		*i_dquot[MAXQUOTAS];
#endif
	struct list_head	i_devices;
	/* Anonymous union: the three pointers share storage. */
	union {
		struct pipe_inode_info	*i_pipe;
		struct block_device	*i_bdev;
		struct cdev		*i_cdev;
	};

	__u32			i_generation;

#ifdef CONFIG_FSNOTIFY
	__u32			i_fsnotify_mask; /* all events this inode cares about */
	struct hlist_head	i_fsnotify_mark_entries; /* fsnotify mark entries */
#endif

#ifdef CONFIG_INOTIFY
	struct list_head	inotify_watches; /* watches on this inode */
	struct mutex		inotify_mutex;	/* protects the watches list */
#endif

	unsigned long		i_state;
	unsigned long		dirtied_when;	/* jiffies of first dirtying */

	unsigned int		i_flags;

	atomic_t		i_writecount;
#ifdef CONFIG_SECURITY
	void			*i_security;
#endif
	void			*i_private; /* fs or device private pointer */
};
/*
 * inode->i_mutex nesting subclasses for the lock validator:
 *
 * 0: the object of the current VFS operation
 * 1: parent
 * 2: child/target
 * 3: xattr
 * 4: quota file
 *
 * The locking order between these classes is
 * parent -> child -> normal -> xattr -> quota
 */
  707. enum inode_i_mutex_lock_class
  708. {
  709. I_MUTEX_NORMAL,
  710. I_MUTEX_PARENT,
  711. I_MUTEX_CHILD,
  712. I_MUTEX_XATTR,
  713. I_MUTEX_QUOTA
  714. };
/*
 * NOTE: in a 32bit arch with a preemptable kernel and
 * an UP compile the i_size_read/write must be atomic
 * with respect to the local cpu (unlike with preempt disabled),
 * but they don't need to be atomic with respect to other cpus like in
 * true SMP (so they need either to locally disable irq around
 * the read or, for example on x86, they can still be implemented as a
 * cmpxchg8b without the need of the lock prefix). For SMP compiles
 * and 64bit archs it makes no difference if preempt is enabled or not.
 */
  725. static inline loff_t i_size_read(const struct inode *inode)
  726. {
  727. #if BITS_PER_LONG==32 && defined(CONFIG_SMP)
  728. loff_t i_size;
  729. unsigned int seq;
  730. do {
  731. seq = read_seqcount_begin(&inode->i_size_seqcount);
  732. i_size = inode->i_size;
  733. } while (read_seqcount_retry(&inode->i_size_seqcount, seq));
  734. return i_size;
  735. #elif BITS_PER_LONG==32 && defined(CONFIG_PREEMPT)
  736. loff_t i_size;
  737. preempt_disable();
  738. i_size = inode->i_size;
  739. preempt_enable();
  740. return i_size;
  741. #else
  742. return inode->i_size;
  743. #endif
  744. }
  745. /*
  746. * NOTE: unlike i_size_read(), i_size_write() does need locking around it
  747. * (normally i_mutex), otherwise on 32bit/SMP an update of i_size_seqcount
  748. * can be lost, resulting in subsequent i_size_read() calls spinning forever.
  749. */
  750. static inline void i_size_write(struct inode *inode, loff_t i_size)
  751. {
  752. #if BITS_PER_LONG==32 && defined(CONFIG_SMP)
  753. write_seqcount_begin(&inode->i_size_seqcount);
  754. inode->i_size = i_size;
  755. write_seqcount_end(&inode->i_size_seqcount);
  756. #elif BITS_PER_LONG==32 && defined(CONFIG_PREEMPT)
  757. preempt_disable();
  758. inode->i_size = i_size;
  759. preempt_enable();
  760. #else
  761. inode->i_size = i_size;
  762. #endif
  763. }
  764. static inline unsigned iminor(const struct inode *inode)
  765. {
  766. return MINOR(inode->i_rdev);
  767. }
  768. static inline unsigned imajor(const struct inode *inode)
  769. {
  770. return MAJOR(inode->i_rdev);
  771. }
  772. extern struct block_device *I_BDEV(struct inode *inode);
/* Owner information used when delivering I/O signals for a file. */
struct fown_struct {
	rwlock_t lock;          /* protects pid, uid, euid fields */
	struct pid *pid;	/* pid or -pgrp where SIGIO should be sent */
	enum pid_type pid_type;	/* Kind of process group SIGIO should be sent to */
	uid_t uid, euid;	/* uid/euid of process setting the owner */
	int signum;		/* posix.1b rt signal to be delivered on IO */
};
  780. /*
  781. * Track a single file's readahead state
  782. */
/*
 * The window tested by ra_has_index() is the half-open page range
 * [start, start + size).
 */
struct file_ra_state {
	pgoff_t start;			/* where readahead started */
	unsigned int size;		/* # of readahead pages */
	unsigned int async_size;	/* do asynchronous readahead when
					   there are only # of pages ahead */

	unsigned int ra_pages;		/* Maximum readahead window */
	int mmap_miss;			/* Cache miss stat for mmap accesses */
	loff_t prev_pos;		/* Cache last read() position */
};
  792. /*
  793. * Check if @index falls in the readahead windows.
  794. */
  795. static inline int ra_has_index(struct file_ra_state *ra, pgoff_t index)
  796. {
  797. return (index >= ra->start &&
  798. index < ra->start + ra->size);
  799. }
  800. #define FILE_MNT_WRITE_TAKEN 1
  801. #define FILE_MNT_WRITE_RELEASED 2
/* One open file as seen by the VFS. */
struct file {
	/*
	 * fu_list becomes invalid after file_free is called and queued via
	 * fu_rcuhead for RCU freeing
	 */
	union {
		struct list_head	fu_list;
		struct rcu_head 	fu_rcuhead;
	} f_u;
	struct path		f_path;
	/* Shorthand accessors for the two members of f_path. */
#define f_dentry	f_path.dentry
#define f_vfsmnt	f_path.mnt
	const struct file_operations	*f_op;
	spinlock_t		f_lock;  /* f_ep_links, f_flags, no IRQ */
	atomic_long_t		f_count; /* accessed through get_file()/file_count() */
	unsigned int 		f_flags;
	fmode_t			f_mode;
	loff_t			f_pos;
	struct fown_struct	f_owner;
	const struct cred	*f_cred;
	struct file_ra_state	f_ra;

	u64			f_version;
#ifdef CONFIG_SECURITY
	void			*f_security;
#endif
	/* needed for tty driver, and maybe others */
	void			*private_data;

#ifdef CONFIG_EPOLL
	/* Used by fs/eventpoll.c to link all the hooks to this file */
	struct list_head	f_ep_links;
#endif /* #ifdef CONFIG_EPOLL */
	struct address_space	*f_mapping;
#ifdef CONFIG_DEBUG_WRITECOUNT
	/* Holds FILE_MNT_WRITE_* bits; driven by the file_*_write() helpers. */
	unsigned long f_mnt_write_state;
#endif
};
  838. extern spinlock_t files_lock;
  839. #define file_list_lock() spin_lock(&files_lock);
  840. #define file_list_unlock() spin_unlock(&files_lock);
/* get_file(x): atomically increment (x)->f_count. */
#define get_file(x)	atomic_long_inc(&(x)->f_count)
/* file_count(x): atomically read (x)->f_count. */
#define file_count(x)	atomic_long_read(&(x)->f_count)
  843. #ifdef CONFIG_DEBUG_WRITECOUNT
  844. static inline void file_take_write(struct file *f)
  845. {
  846. WARN_ON(f->f_mnt_write_state != 0);
  847. f->f_mnt_write_state = FILE_MNT_WRITE_TAKEN;
  848. }
  849. static inline void file_release_write(struct file *f)
  850. {
  851. f->f_mnt_write_state |= FILE_MNT_WRITE_RELEASED;
  852. }
  853. static inline void file_reset_write(struct file *f)
  854. {
  855. f->f_mnt_write_state = 0;
  856. }
  857. static inline void file_check_state(struct file *f)
  858. {
  859. /*
  860. * At this point, either both or neither of these bits
  861. * should be set.
  862. */
  863. WARN_ON(f->f_mnt_write_state == FILE_MNT_WRITE_TAKEN);
  864. WARN_ON(f->f_mnt_write_state == FILE_MNT_WRITE_RELEASED);
  865. }
  866. static inline int file_check_writeable(struct file *f)
  867. {
  868. if (f->f_mnt_write_state == FILE_MNT_WRITE_TAKEN)
  869. return 0;
  870. printk(KERN_WARNING "writeable file with no "
  871. "mnt_want_write()\n");
  872. WARN_ON(1);
  873. return -EINVAL;
  874. }
  875. #else /* !CONFIG_DEBUG_WRITECOUNT */
  876. static inline void file_take_write(struct file *filp) {}
  877. static inline void file_release_write(struct file *filp) {}
  878. static inline void file_reset_write(struct file *filp) {}
  879. static inline void file_check_state(struct file *filp) {}
  880. static inline int file_check_writeable(struct file *filp)
  881. {
  882. return 0;
  883. }
  884. #endif /* CONFIG_DEBUG_WRITECOUNT */
  885. #define MAX_NON_LFS ((1UL<<31) - 1)
  886. /* Page cache limit. The filesystems should put that into their s_maxbytes
  887. limits, otherwise bad things can happen in VM. */
  888. #if BITS_PER_LONG==32
  889. #define MAX_LFS_FILESIZE (((u64)PAGE_CACHE_SIZE << (BITS_PER_LONG-1))-1)
  890. #elif BITS_PER_LONG==64
  891. #define MAX_LFS_FILESIZE 0x7fffffffffffffffUL
  892. #endif
  893. #define FL_POSIX 1
  894. #define FL_FLOCK 2
  895. #define FL_ACCESS 8 /* not trying to lock, just looking */
  896. #define FL_EXISTS 16 /* when unlocking, test for existence */
  897. #define FL_LEASE 32 /* lease held on this file */
  898. #define FL_CLOSE 64 /* unlock on close */
  899. #define FL_SLEEP 128 /* A blocking lock */
  900. /*
  901. * Special return value from posix_lock_file() and vfs_lock_file() for
  902. * asynchronous locking.
  903. */
  904. #define FILE_LOCK_DEFERRED 1
  905. /*
  906. * The POSIX file lock owner is determined by
  907. * the "struct files_struct" in the thread group
  908. * (or NULL for no owner - BSD locks).
  909. *
  910. * Lockd stuffs a "host" pointer into this.
  911. */
  912. typedef struct files_struct *fl_owner_t;
/* Callbacks for filesystems; struct file_lock refers to them via fl_ops. */
struct file_lock_operations {
	void (*fl_copy_lock)(struct file_lock *, struct file_lock *);
	void (*fl_release_private)(struct file_lock *);
};
/* Callbacks for lock managers; struct file_lock refers to them via fl_lmops. */
struct lock_manager_operations {
	int (*fl_compare_owner)(struct file_lock *, struct file_lock *);
	void (*fl_notify)(struct file_lock *);	/* unblock callback */
	int (*fl_grant)(struct file_lock *, struct file_lock *, int);
	void (*fl_copy_lock)(struct file_lock *, struct file_lock *);
	void (*fl_release_private)(struct file_lock *);
	void (*fl_break)(struct file_lock *);
	int (*fl_mylease)(struct file_lock *, struct file_lock *);
	int (*fl_change)(struct file_lock **, int);
};
/* Handle passed to locks_start_grace()/locks_end_grace(). */
struct lock_manager {
	struct list_head list;	/* list linkage */
};
  930. void locks_start_grace(struct lock_manager *);
  931. void locks_end_grace(struct lock_manager *);
  932. int locks_in_grace(void);
  933. /* that will die - we need it for nfs_lock_info */
  934. #include <linux/nfs_fs_i.h>
/* One file lock or lease. */
struct file_lock {
	struct file_lock *fl_next;	/* singly linked list for this inode  */
	struct list_head fl_link;	/* doubly linked list of all locks */
	struct list_head fl_block;	/* circular list of blocked processes */
	fl_owner_t fl_owner;
	unsigned char fl_flags;		/* FL_* bits; all of them fit in 8 bits */
	unsigned char fl_type;
	unsigned int fl_pid;
	struct pid *fl_nspid;
	wait_queue_head_t fl_wait;
	struct file *fl_file;
	loff_t fl_start;
	loff_t fl_end;

	struct fasync_struct *	fl_fasync; /* for lease break notifications */
	unsigned long fl_break_time;	/* for nonblocking lease breaks */

	struct file_lock_operations *fl_ops;	/* Callbacks for filesystems */
	struct lock_manager_operations *fl_lmops;	/* Callbacks for lockmanagers */
	/* Per-user private area; the members share storage. */
	union {
		struct nfs_lock_info	nfs_fl;
		struct nfs4_lock_info	nfs4_fl;
		struct {
			struct list_head link;	/* link in AFS vnode's pending_locks list */
			int state;		/* state of grant or error if -ve */
		} afs;
	} fl_u;
};
  961. /* The following constant reflects the upper bound of the file/locking space */
  962. #ifndef OFFSET_MAX
  963. #define INT_LIMIT(x) (~((x)1 << (sizeof(x)*8 - 1)))
  964. #define OFFSET_MAX INT_LIMIT(loff_t)
  965. #define OFFT_OFFSET_MAX INT_LIMIT(off_t)
  966. #endif
  967. #include <linux/fcntl.h>
  968. extern void send_sigio(struct fown_struct *fown, int fd, int band);
  969. /* fs/sync.c */
  970. extern int do_sync_mapping_range(struct address_space *mapping, loff_t offset,
  971. loff_t endbyte, unsigned int flags);
  972. #ifdef CONFIG_FILE_LOCKING
  973. extern int fcntl_getlk(struct file *, struct flock __user *);
  974. extern int fcntl_setlk(unsigned int, struct file *, unsigned int,
  975. struct flock __user *);
  976. #if BITS_PER_LONG == 32
  977. extern int fcntl_getlk64(struct file *, struct flock64 __user *);
  978. extern int fcntl_setlk64(unsigned int, struct file *, unsigned int,
  979. struct flock64 __user *);
  980. #endif
  981. extern int fcntl_setlease(unsigned int fd, struct file *filp, long arg);
  982. extern int fcntl_getlease(struct file *filp);
  983. /* fs/locks.c */
  984. extern void locks_init_lock(struct file_lock *);
  985. extern void locks_copy_lock(struct file_lock *, struct file_lock *);
  986. extern void __locks_copy_lock(struct file_lock *, const struct file_lock *);
  987. extern void locks_remove_posix(struct file *, fl_owner_t);
  988. extern void locks_remove_flock(struct file *);
  989. extern void posix_test_lock(struct file *, struct file_lock *);
  990. extern int posix_lock_file(struct file *, struct file_lock *, struct file_lock *);
  991. extern int posix_lock_file_wait(struct file *, struct file_lock *);
  992. extern int posix_unblock_lock(struct file *, struct file_lock *);
  993. extern int vfs_test_lock(struct file *, struct file_lock *);
  994. extern int vfs_lock_file(struct file *, unsigned int, struct file_lock *, struct file_lock *);
  995. extern int vfs_cancel_lock(struct file *filp, struct file_lock *fl);
  996. extern int flock_lock_file_wait(struct file *filp, struct file_lock *fl);
  997. extern int __break_lease(struct inode *inode, unsigned int flags);
  998. extern void lease_get_mtime(struct inode *, struct timespec *time);
  999. extern int generic_setlease(struct file *, long, struct file_lock **);
  1000. extern int vfs_setlease(struct file *, long, struct file_lock **);
  1001. extern int lease_modify(struct file_lock **, int);
  1002. extern int lock_may_read(struct inode *, loff_t start, unsigned long count);
  1003. extern int lock_may_write(struct inode *, loff_t start, unsigned long count);
  1004. #else /* !CONFIG_FILE_LOCKING */
  1005. static inline int fcntl_getlk(struct file *file, struct flock __user *user)
  1006. {
  1007. return -EINVAL;
  1008. }
  1009. static inline int fcntl_setlk(unsigned int fd, struct file *file,
  1010. unsigned int cmd, struct flock __user *user)
  1011. {
  1012. return -EACCES;
  1013. }
  1014. #if BITS_PER_LONG == 32
  1015. static inline int fcntl_getlk64(struct file *file, struct flock64 __user *user)
  1016. {
  1017. return -EINVAL;
  1018. }
  1019. static inline int fcntl_setlk64(unsigned int fd, struct file *file,
  1020. unsigned int cmd, struct flock64 __user *user)
  1021. {
  1022. return -EACCES;
  1023. }
  1024. #endif
  1025. static inline int fcntl_setlease(unsigned int fd, struct file *filp, long arg)
  1026. {
  1027. return 0;
  1028. }
  1029. static inline int fcntl_getlease(struct file *filp)
  1030. {
  1031. return 0;
  1032. }
  1033. static inline void locks_init_lock(struct file_lock *fl)
  1034. {
  1035. return;
  1036. }
  1037. static inline void __locks_copy_lock(struct file_lock *new, struct file_lock *fl)
  1038. {
  1039. return;
  1040. }
  1041. static inline void locks_copy_lock(struct file_lock *new, struct file_lock *fl)
  1042. {
  1043. return;
  1044. }
  1045. static inline void locks_remove_posix(struct file *filp, fl_owner_t owner)
  1046. {
  1047. return;
  1048. }
  1049. static inline void locks_remove_flock(struct file *filp)
  1050. {
  1051. return;
  1052. }
  1053. static inline void posix_test_lock(struct file *filp, struct file_lock *fl)
  1054. {
  1055. return;
  1056. }
  1057. static inline int posix_lock_file(struct file *filp, struct file_lock *fl,
  1058. struct file_lock *conflock)
  1059. {
  1060. return -ENOLCK;
  1061. }
  1062. static inline int posix_lock_file_wait(struct file *filp, struct file_lock *fl)
  1063. {
  1064. return -ENOLCK;
  1065. }
  1066. static inline int posix_unblock_lock(struct file *filp,
  1067. struct file_lock *waiter)
  1068. {
  1069. return -ENOENT;
  1070. }
  1071. static inline int vfs_test_lock(struct file *filp, struct file_lock *fl)
  1072. {
  1073. return 0;
  1074. }
  1075. static inline int vfs_lock_file(struct file *filp, unsigned int cmd,
  1076. struct file_lock *fl, struct file_lock *conf)
  1077. {
  1078. return -ENOLCK;
  1079. }
  1080. static inline int vfs_cancel_lock(struct file *filp, struct file_lock *fl)
  1081. {
  1082. return 0;
  1083. }
  1084. static inline int flock_lock_file_wait(struct file *filp,
  1085. struct file_lock *request)
  1086. {
  1087. return -ENOLCK;
  1088. }
  1089. static inline int __break_lease(struct inode *inode, unsigned int mode)
  1090. {
  1091. return 0;
  1092. }
  1093. static inline void lease_get_mtime(struct inode *inode, struct timespec *time)
  1094. {
  1095. return;
  1096. }
  1097. static inline int generic_setlease(struct file *filp, long arg,
  1098. struct file_lock **flp)
  1099. {
  1100. return -EINVAL;
  1101. }
  1102. static inline int vfs_setlease(struct file *filp, long arg,
  1103. struct file_lock **lease)
  1104. {
  1105. return -EINVAL;
  1106. }
  1107. static inline int lease_modify(struct file_lock **before, int arg)
  1108. {
  1109. return -EINVAL;
  1110. }
  1111. static inline int lock_may_read(struct inode *inode, loff_t start,
  1112. unsigned long len)
  1113. {
  1114. return 1;
  1115. }
  1116. static inline int lock_may_write(struct inode *inode, loff_t start,
  1117. unsigned long len)
  1118. {
  1119. return 1;
  1120. }
  1121. #endif /* !CONFIG_FILE_LOCKING */
/* One node of a singly linked fasync list (chained through fa_next). */
struct fasync_struct {
	int	magic;		/* NOTE(review): presumably holds FASYNC_MAGIC - confirm */
	int	fa_fd;
	struct	fasync_struct	*fa_next; /* singly linked list */
	struct	file 		*fa_file;
};

#define FASYNC_MAGIC 0x4601
  1129. /* SMP safe fasync helpers: */
  1130. extern int fasync_helper(int, struct file *, int, struct fasync_struct **);
  1131. /* can be called from interrupts */
  1132. extern void kill_fasync(struct fasync_struct **, int, int);
  1133. /* only for net: no internal synchronization */
  1134. extern void __kill_fasync(struct fasync_struct *, int, int);
  1135. extern int __f_setown(struct file *filp, struct pid *, enum pid_type, int force);
  1136. extern int f_setown(struct file *filp, unsigned long arg, int force);
  1137. extern void f_delown(struct file *filp);
  1138. extern pid_t f_getown(struct file *filp);
  1139. extern int send_sigurg(struct fown_struct *fown);
  1140. /*
  1141. * Umount options
  1142. */
  1143. #define MNT_FORCE 0x00000001 /* Attempt to forcibily umount */
  1144. #define MNT_DETACH 0x00000002 /* Just detach from the tree */
  1145. #define MNT_EXPIRE 0x00000004 /* Mark for expiry */
  1146. extern struct list_head super_blocks;
  1147. extern spinlock_t sb_lock;
  1148. #define sb_entry(list) list_entry((list), struct super_block, s_list)
  1149. #define S_BIAS (1<<30)
/* In-memory superblock: one per mounted filesystem instance. */
struct super_block {
	struct list_head	s_list;		/* Keep this first */
	dev_t			s_dev;		/* search index; _not_ kdev_t */
	unsigned long		s_blocksize;
	unsigned char		s_blocksize_bits;
	unsigned char		s_dirt;
	unsigned long long	s_maxbytes;	/* Max file size */
	struct file_system_type	*s_type;
	const struct super_operations	*s_op;
	struct dquot_operations	*dq_op;
	struct quotactl_ops	*s_qcop;
	const struct export_operations *s_export_op;
	unsigned long		s_flags;
	unsigned long		s_magic;
	struct dentry		*s_root;
	struct rw_semaphore	s_umount;
	struct mutex		s_lock;
	int			s_count;
	int			s_need_sync;
	atomic_t		s_active;
#ifdef CONFIG_SECURITY
	void                    *s_security;
#endif
	struct xattr_handler	**s_xattr;

	struct list_head	s_inodes;	/* all inodes */
	struct list_head	s_dirty;	/* dirty inodes */
	struct list_head	s_io;		/* parked for writeback */
	struct list_head	s_more_io;	/* parked for more writeback */
	struct hlist_head	s_anon;		/* anonymous dentries for (nfs) exporting */
	struct list_head	s_files;
	/* s_dentry_lru and s_nr_dentry_unused are protected by dcache_lock */
	struct list_head	s_dentry_lru;	/* unused dentry lru */
	int			s_nr_dentry_unused;	/* # of dentry on lru */

	struct block_device	*s_bdev;
	struct mtd_info		*s_mtd;
	struct list_head	s_instances;
	struct quota_info	s_dquot;	/* Diskquota specific options */

	int			s_frozen;	/* compared against a level by vfs_check_frozen() */
	wait_queue_head_t	s_wait_unfrozen; /* vfs_check_frozen() sleeps here */

	char s_id[32];				/* Informational name */

	void 			*s_fs_info;	/* Filesystem private info */
	fmode_t			s_mode;

	/*
	 * The next field is for VFS *only*. No filesystems have any business
	 * even looking at it. You had been warned.
	 */
	struct mutex s_vfs_rename_mutex;	/* Kludge */

	/* Granularity of c/m/atime in ns.
	   Cannot be worse than a second */
	u32		   s_time_gran;

	/*
	 * Filesystem subtype.  If non-empty the filesystem type field
	 * in /proc/mounts will be "type.subtype"
	 */
	char *s_subtype;

	/*
	 * Saved mount options for lazy filesystems using
	 * generic_show_options()
	 */
	char *s_options;
};
  1211. extern struct timespec current_fs_time(struct super_block *sb);
  1212. /*
  1213. * Snapshotting support.
  1214. */
  1215. enum {
  1216. SB_UNFROZEN = 0,
  1217. SB_FREEZE_WRITE = 1,
  1218. SB_FREEZE_TRANS = 2,
  1219. };
/* Sleep on sb->s_wait_unfrozen until sb->s_frozen drops below @level. */
#define vfs_check_frozen(sb, level) \
	wait_event((sb)->s_wait_unfrozen, ((sb)->s_frozen < (level)))

/* Increment, decrement and read the current task's fs_excl counter. */
#define get_fs_excl() atomic_inc(&current->fs_excl)
#define put_fs_excl() atomic_dec(&current->fs_excl)
#define has_fs_excl() atomic_read(&current->fs_excl)

/*
 * True when the caller's fsuid equals the inode's i_uid, or when the
 * caller has CAP_FOWNER.
 */
#define is_owner_or_cap(inode)	\
	((current_fsuid() == (inode)->i_uid) || capable(CAP_FOWNER))
  1227. /* not quite ready to be deprecated, but... */
  1228. extern void lock_super(struct super_block *);
  1229. extern void unlock_super(struct super_block *);
  1230. /*
  1231. * VFS helper functions..
  1232. */
  1233. extern int vfs_create(struct inode *, struct dentry *, int, struct nameidata *);
  1234. extern int vfs_mkdir(struct inode *, struct dentry *, int);
  1235. extern int vfs_mknod(struct inode *, struct dentry *, int, dev_t);
  1236. extern int vfs_symlink(struct inode *, struct dentry *, const char *);
  1237. extern int vfs_link(struct dentry *, struct inode *, struct dentry *);
  1238. extern int vfs_rmdir(struct inode *, struct dentry *);
  1239. extern int vfs_unlink(struct inode *, struct dentry *);
  1240. extern int vfs_rename(struct inode *, struct dentry *, struct inode *, struct dentry *);
  1241. /*
  1242. * VFS dentry helper functions.
  1243. */
  1244. extern void dentry_unhash(struct dentry *dentry);
  1245. /*
  1246. * VFS file helper functions.
  1247. */
  1248. extern int file_permission(struct file *, int);
  1249. /*
  1250. * VFS FS_IOC_FIEMAP helper definitions.
  1251. */
/* State handed to fiemap_fill_next_extent() and fiemap_check_flags(). */
struct fiemap_extent_info {
	unsigned int fi_flags;		/* Flags as passed from user */
	unsigned int fi_extents_mapped;	/* Number of mapped extents */
	unsigned int fi_extents_max;	/* Size of fiemap_extent array */
	struct fiemap_extent *fi_extents_start; /* Start of fiemap_extent
						 * array */
};
  1259. int fiemap_fill_next_extent(struct fiemap_extent_info *info, u64 logical,
  1260. u64 phys, u64 len, u32 flags);
  1261. int fiemap_check_flags(struct fiemap_extent_info *fieinfo, u32 fs_flags);
  1262. /*
  1263. * File types
  1264. *
  1265. * NOTE! These match bits 12..15 of stat.st_mode
  1266. * (ie "(i_mode >> 12) & 15").
  1267. */
  1268. #define DT_UNKNOWN 0
  1269. #define DT_FIFO 1
  1270. #define DT_CHR 2
  1271. #define DT_DIR 4
  1272. #define DT_BLK 6
  1273. #define DT_REG 8
  1274. #define DT_LNK 10
  1275. #define DT_SOCK 12
  1276. #define DT_WHT 14
  1277. #define OSYNC_METADATA (1<<0)
  1278. #define OSYNC_DATA (1<<1)
  1279. #define OSYNC_INODE (1<<2)
  1280. int generic_osync_inode(struct inode *, struct address_space *, int);
  1281. /*
  1282. * This is the "filldir" function type, used by readdir() to let
  1283. * the kernel specify what kind of dirent layout it wants to have.
  1284. * This allows the kernel to read directories into kernel space or
  1285. * to have different dirent layouts depending on the binary type.
  1286. */
  /*
   * Callback type described in the comment above; it is the third parameter
   * of file_operations.readdir. Argument meanings are not visible from this
   * declaration alone.
   */
  1287. typedef int (*filldir_t)(void *, const char *, int, loff_t, u64, unsigned);
  /* Forward declaration so the tag can be used before its definition. */
  1288. struct block_device_operations;
  1289. /* These macros are for out of kernel modules to test that
  1290. * the kernel supports the unlocked_ioctl and compat_ioctl
  1291. * fields in struct file_operations. */
  1292. #define HAVE_COMPAT_IOCTL 1
  1293. #define HAVE_UNLOCKED_IOCTL 1
  1294. /*
  1295. * NOTE:
  1296. * read, write, poll, fsync, readv, writev, unlocked_ioctl and compat_ioctl
  1297. * can be called without the big kernel lock held in all filesystems.
  1298. */
  /*
   * Per-file operations table: one function pointer per operation plus the
   * owning module. The fops_get()/fops_put() macros in this header take and
   * drop a module reference through ->owner. See the NOTE above for which
   * callbacks may run without the big kernel lock.
   */
  1299. struct file_operations {
  1300. struct module *owner;
  /* Positioning and data transfer, synchronous and kiocb-based variants. */
  1301. loff_t (*llseek) (struct file *, loff_t, int);
  1302. ssize_t (*read) (struct file *, char __user *, size_t, loff_t *);
  1303. ssize_t (*write) (struct file *, const char __user *, size_t, loff_t *);
  1304. ssize_t (*aio_read) (struct kiocb *, const struct iovec *, unsigned long, loff_t);
  1305. ssize_t (*aio_write) (struct kiocb *, const struct iovec *, unsigned long, loff_t);
  /* Receives a filldir_t callback (typedef earlier in this header). */
  1306. int (*readdir) (struct file *, void *, filldir_t);
  1307. unsigned int (*poll) (struct file *, struct poll_table_struct *);
  /* Three ioctl entry points; only the first also receives the inode. */
  1308. int (*ioctl) (struct inode *, struct file *, unsigned int, unsigned long);
  1309. long (*unlocked_ioctl) (struct file *, unsigned int, unsigned long);
  1310. long (*compat_ioctl) (struct file *, unsigned int, unsigned long);
  1311. int (*mmap) (struct file *, struct vm_area_struct *);
  1312. int (*open) (struct inode *, struct file *);
  1313. int (*flush) (struct file *, fl_owner_t id);
  1314. int (*release) (struct inode *, struct file *);
  1315. int (*fsync) (struct file *, struct dentry *, int datasync);
  1316. int (*aio_fsync) (struct kiocb *, int datasync);
  1317. int (*fasync) (int, struct file *, int);
  1318. int (*lock) (struct file *, int, struct file_lock *);
  1319. ssize_t (*sendpage) (struct file *, struct page *, int, size_t, loff_t *, int);
  1320. unsigned long (*get_unmapped_area)(struct file *, unsigned long, unsigned long, unsigned long, unsigned long);
  1321. int (*check_flags)(int);
  1322. int (*flock) (struct file *, int, struct file_lock *);
  /* Splice hooks: note the pipe is the first argument for write, third for read. */
  1323. ssize_t (*splice_write)(struct pipe_inode_info *, struct file *, loff_t *, size_t, unsigned int);
  1324. ssize_t (*splice_read)(struct file *, loff_t *, struct pipe_inode_info *, size_t, unsigned int);
  1325. int (*setlease)(struct file *, long, struct file_lock **);
  1326. };
  /*
   * Per-inode operations table. Most callbacks take the inode and/or dentry
   * they act on; all return int, ssize_t, long, a pointer, or void as
   * declared below.
   */
  1327. struct inode_operations {
  1328. int (*create) (struct inode *,struct dentry *,int, struct nameidata *);
  1329. struct dentry * (*lookup) (struct inode *,struct dentry *, struct nameidata *);
  1330. int (*link) (struct dentry *,struct inode *,struct dentry *);
  1331. int (*unlink) (struct inode *,struct dentry *);
  1332. int (*symlink) (struct inode *,struct dentry *,const char *);
  1333. int (*mkdir) (struct inode *,struct dentry *,int);
  1334. int (*rmdir) (struct inode *,struct dentry *);
  1335. int (*mknod) (struct inode *,struct dentry *,int,dev_t);
  /* Takes two inode/dentry pairs. NOTE(review): presumably old then new - confirm. */
  1336. int (*rename) (struct inode *, struct dentry *,
  1337. struct inode *, struct dentry *);
  1338. int (*readlink) (struct dentry *, char __user *,int);
  /*
   * follow_link returns a void *, and put_link accepts a void * as its last
   * argument. NOTE(review): presumably the same cookie - confirm with callers.
   */
  1339. void * (*follow_link) (struct dentry *, struct nameidata *);
  1340. void (*put_link) (struct dentry *, struct nameidata *, void *);
  1341. void (*truncate) (struct inode *);
  1342. int (*permission) (struct inode *, int);
  1343. int (*setattr) (struct dentry *, struct iattr *);
  1344. int (*getattr) (struct vfsmount *mnt, struct dentry *, struct kstat *);
  /* Extended-attribute callbacks, all keyed by dentry. */
  1345. int (*setxattr) (struct dentry *, const char *,const void *,size_t,int);
  1346. ssize_t (*getxattr) (struct dentry *, const char *, void *, size_t);
  1347. ssize_t (*listxattr) (struct dentry *, char *, size_t);
  1348. int (*removexattr) (struct dentry *, const char *);
  1349. void (*truncate_range)(struct inode *, loff_t, loff_t);
  1350. long (*fallocate)(struct inode *inode, int mode, loff_t offset,
  1351. loff_t len);
  /* Receives the struct fiemap_extent_info defined earlier in this header. */
  1352. int (*fiemap)(struct inode *, struct fiemap_extent_info *, u64 start,
  1353. u64 len);
  1354. };
  /* Forward declaration; used by pointer in later prototypes (e.g. show_options). */
  1355. struct seq_file;
  /*
   * Takes a user-space iovec array (@uvector, @nr_segs entries), a
   * caller-provided iovec buffer (@fast_pointer, sized by @fast_segs) and
   * returns an iovec pointer through @ret_pointer.
   * NOTE(review): copy/validation semantics are inferred from the name only.
   */
  1356. ssize_t rw_copy_check_uvector(int type, const struct iovec __user * uvector,
  1357. unsigned long nr_segs, unsigned long fast_segs,
  1358. struct iovec *fast_pointer,
  1359. struct iovec **ret_pointer);
  /*
   * Read/write entry points on a struct file, in single-buffer and iovec
   * forms. Each takes a user-space buffer (or iovec array) and a loff_t
   * pointer, and returns ssize_t.
   */
  1360. extern ssize_t vfs_read(struct file *, char __user *, size_t, loff_t *);
  1361. extern ssize_t vfs_write(struct file *, const char __user *, size_t, loff_t *);
  1362. extern ssize_t vfs_readv(struct file *, const struct iovec __user *,
  1363. unsigned long, loff_t *);
  1364. extern ssize_t vfs_writev(struct file *, const struct iovec __user *,
  1365. unsigned long, loff_t *);
  /*
   * Per-superblock operations table. The callbacks cover inodes,
   * the superblock itself, and mount-time reporting via seq_file.
   */
  1366. struct super_operations {
  /* alloc_inode returns a new inode for @sb; destroy_inode takes one back. */
  1367. struct inode *(*alloc_inode)(struct super_block *sb);
  1368. void (*destroy_inode)(struct inode *);
  1369. void (*dirty_inode) (struct inode *);
  1370. int (*write_inode) (struct inode *, int);
  1371. void (*drop_inode) (struct inode *);
  1372. void (*delete_inode) (struct inode *);
  1373. void (*put_super) (struct super_block *);
  1374. void (*write_super) (struct super_block *);
  1375. int (*sync_fs)(struct super_block *sb, int wait);
  1376. int (*freeze_fs) (struct super_block *);
  1377. int (*unfreeze_fs) (struct super_block *);
  1378. int (*statfs) (struct dentry *, struct kstatfs *);
  1379. int (*remount_fs) (struct super_block *, int *, char *);
  1380. void (*clear_inode) (struct inode *);
  1381. void (*umount_begin) (struct super_block *);
  1382. int (*show_options)(struct seq_file *, struct vfsmount *);
  1383. int (*show_stats)(struct seq_file *, struct vfsmount *);
  /* These two members exist only when CONFIG_QUOTA is set, so the struct layout depends on it. */
  1384. #ifdef CONFIG_QUOTA
  1385. ssize_t (*quota_read)(struct super_block *, int, char *, size_t, loff_t);
  1386. ssize_t (*quota_write)(struct super_block *, int, const char *, size_t, loff_t);
  1387. #endif
  1388. int (*bdev_try_to_free_page)(struct super_block*, struct page*, gfp_t);
  1389. };
  1390. /*
  1391. * Inode state bits. Protected by inode_lock.
  1392. *
  1393. * Three bits determine the dirty state of the inode, I_DIRTY_SYNC,
  1394. * I_DIRTY_DATASYNC and I_DIRTY_PAGES.
  1395. *
  1396. * Four bits define the lifetime of an inode. Initially, inodes are I_NEW,
  1397. * until that flag is cleared. I_WILL_FREE, I_FREEING and I_CLEAR are set at
  1398. * various stages of removing an inode.
  1399. *
  1400. * Two bits are used for locking and completion notification, I_LOCK and I_SYNC.
  1401. *
  1402. * I_DIRTY_SYNC Inode is dirty, but doesn't have to be written on
  1403. * fdatasync(). i_atime is the usual cause.
  1404. * I_DIRTY_DATASYNC Data-related inode changes pending. We keep track of
  1405. * these changes separately from I_DIRTY_SYNC so that we
  1406. * don't have to write inode on fdatasync() when only
  1407. * mtime has changed in it.
  1408. * I_DIRTY_PAGES Inode has dirty pages. Inode itself may be clean.
  1409. * I_NEW get_new_inode() sets i_state to I_LOCK|I_NEW. Both
  1410. * are cleared by unlock_new_inode(), called from iget().
  1411. * I_WILL_FREE Must be set when calling write_inode_now() if i_count
  1412. * is zero. I_FREEING must be set when I_WILL_FREE is
  1413. * cleared.
  1414. * I_FREEING Set when inode is about to be freed but still has dirty
  1415. * pages or buffers attached or the inode itself is still
  1416. * dirty.
  1417. * I_CLEAR Set by clear_inode(). In this state the inode is clean
  1418. * and can be destroyed.
  1419. *
  1420. * Inodes that are I_WILL_FREE, I_FREEING or I_CLEAR are
  1421. * prohibited for many purposes. iget() must wait for
  1422. * the inode to be completely released, then create it
  1423. * anew. Other functions will just ignore such inodes,
  1424. * if appropriate. I_LOCK is used for waiting.
  1425. *
  1426. * I_LOCK Serves as both a mutex and completion notification.
  1427. * New inodes set I_LOCK. If two processes both create
  1428. * the same inode, one of them will release its inode and
  1429. * wait for I_LOCK to be released before returning.
  1430. * Inodes in I_WILL_FREE, I_FREEING or I_CLEAR state can
  1431. * also cause waiting on I_LOCK, without I_LOCK actually
  1432. * being set. find_inode() uses this to prevent returning
  1433. * nearly-dead inodes.
  1434. * I_SYNC Similar to I_LOCK, but limited in scope to writeback
  1435. * of inode dirty data. Having a separate lock for this
  1436. * purpose reduces latency and prevents some filesystem-
  1437. * specific deadlocks.
  1438. *
  1439. * Q: What is the difference between I_WILL_FREE and I_FREEING?
  1440. * Q: igrab() only checks on (I_FREEING|I_WILL_FREE). Should it also check on
  1441. * I_CLEAR? If not, why?
  1442. */
  /*
   * Inode state flag values; meanings are given in the comment block above.
   * The first seven are literal powers of two (1..64).
   */
  1443. #define I_DIRTY_SYNC 1
  1444. #define I_DIRTY_DATASYNC 2
  1445. #define I_DIRTY_PAGES 4
  1446. #define I_NEW 8
  1447. #define I_WILL_FREE 16
  1448. #define I_FREEING 32
  1449. #define I_CLEAR 64
  /* I_LOCK and I_SYNC are built from bit numbers: bit 7 (128) and bit 8 (256). */
  1450. #define __I_LOCK 7
  1451. #define I_LOCK (1 << __I_LOCK)
  1452. #define __I_SYNC 8
  1453. #define I_SYNC (1 << __I_SYNC)
  /* Union of the three dirty bits. */
  1454. #define I_DIRTY (I_DIRTY_SYNC | I_DIRTY_DATASYNC | I_DIRTY_PAGES)
  /* Called by the mark_inode_dirty*() wrappers with one of the masks above. */
  1455. extern void __mark_inode_dirty(struct inode *, int);
  1456. static inline void mark_inode_dirty(struct inode *inode)
  1457. {
  1458. __mark_inode_dirty(inode, I_DIRTY);
  1459. }
  1460. static inline void mark_inode_dirty_sync(struct inode *inode)
  1461. {
  1462. __mark_inode_dirty(inode, I_DIRTY_SYNC);
  1463. }
  1464. /**
  1465. * inc_nlink - directly increment an inode's link count
  1466. * @inode: inode
  1467. *
  1468. * This is a low-level filesystem helper to replace any
  1469. * direct filesystem manipulation of i_nlink. Currently,
  1470. * it is only here for parity with dec_nlink().
  1471. */
  1472. static inline void inc_nlink(struct inode *inode)
  1473. {
  1474. inode->i_nlink++;
  1475. }
  /*
   * Raise @inode's link count by one through inc_nlink(), then flag the
   * inode dirty with mark_inode_dirty().
   */
  static inline void inode_inc_link_count(struct inode *inode)
  {
      inc_nlink(inode);        /* i_nlink + 1 */
      mark_inode_dirty(inode); /* flag the inode dirty */
  }
  1481. /**
  1482. * drop_nlink - directly drop an inode's link count
  1483. * @inode: inode
  1484. *
  1485. * This is a low-level filesystem helper to replace any
  1486. * direct filesystem manipulation of i_nlink. In cases
  1487. * where we are attempting to track writes to the
  1488. * filesystem, a decrement to zero means an imminent
  1489. * write when the file is truncated and actually unlinked
  1490. * on the filesystem.
  1491. */
  1492. static inline void drop_nlink(struct inode *inode)
  1493. {
  1494. inode->i_nlink--;
  1495. }
  1496. /**
  1497. * clear_nlink - directly zero an inode's link count
  1498. * @inode: inode
  1499. *
  1500. * This is a low-level filesystem helper to replace any
  1501. * direct filesystem manipulation of i_nlink. See
  1502. * drop_nlink() for why we care about i_nlink hitting zero.
  1503. */
  1504. static inline void clear_nlink(struct inode *inode)
  1505. {
  1506. inode->i_nlink = 0;
  1507. }
  /*
   * Lower @inode's link count by one through drop_nlink(), then flag the
   * inode dirty with mark_inode_dirty().
   */
  static inline void inode_dec_link_count(struct inode *inode)
  {
      drop_nlink(inode);       /* i_nlink - 1 */
      mark_inode_dirty(inode); /* flag the inode dirty */
  }
  1513. /**
  1514. * inode_inc_iversion - increments i_version
  1515. * @inode: inode that need to be updated
  1516. *
  1517. * Every time the inode is modified, the i_version field will be incremented.
  1518. * The filesystem has to be mounted with i_version flag
  1519. */
  1520. static inline void inode_inc_iversion(struct inode *inode)
  1521. {
  1522. spin_lock(&inode->i_lock);
  1523. inode->i_version++;
  1524. spin_unlock(&inode->i_lock);
  1525. }
  1526. extern void touch_atime(struct vfsmount *mnt, struct dentry *dentry);
  1527. static inline void file_accessed(struct file *file)
  1528. {
  1529. if (!(file->f_flags & O_NOATIME))
  1530. touch_atime(file->f_path.mnt, file->f_path.dentry);
  1531. }
  /* Declaration only: takes an inode and a writeback_control, returns int. */
  1532. int sync_inode(struct inode *inode, struct writeback_control *wbc);
  /*
   * Describes one filesystem type: its name, flags, the callbacks that
   * obtain (get_sb) and tear down (kill_sb) a superblock, and the owning
   * module. register_filesystem()/unregister_filesystem() take a pointer
   * to this struct.
   */
  1533. struct file_system_type {
  1534. const char *name;
  1535. int fs_flags;
  /*
   * Same leading and trailing parameters as the get_sb_*() helpers declared
   * after this struct, which additionally take a fill_super callback.
   */
  1536. int (*get_sb) (struct file_system_type *, int,
  1537. const char *, void *, struct vfsmount *);
  1538. void (*kill_sb) (struct super_block *);
  1539. struct module *owner;
  /* NOTE(review): presumably links registered types into a singly linked list - confirm. */
  1540. struct file_system_type * next;
  1541. struct list_head fs_supers;
  /*
   * One lock_class_key per lock named in the member.
   * NOTE(review): presumably lockdep classes keyed per filesystem type - confirm.
   */
  1542. struct lock_class_key s_lock_key;
  1543. struct lock_class_key s_umount_key;
  1544. struct lock_class_key i_lock_key;
  1545. struct lock_class_key i_mutex_key;
  1546. struct lock_class_key i_mutex_dir_key;
  1547. struct lock_class_key i_alloc_sem_key;
  1548. };
  /*
   * get_sb_*() helpers: each takes the filesystem type, mount flags, opaque
   * data, a fill_super callback and the vfsmount, and returns int.
   * get_sb_bdev() additionally takes a device name.
   */
  1549. extern int get_sb_ns(struct file_system_type *fs_type, int flags, void *data,
  1550. int (*fill_super)(struct super_block *, void *, int),
  1551. struct vfsmount *mnt);
  1552. extern int get_sb_bdev(struct file_system_type *fs_type,
  1553. int flags, const char *dev_name, void *data,
  1554. int (*fill_super)(struct super_block *, void *, int),
  1555. struct vfsmount *mnt);
  1556. extern int get_sb_single(struct file_system_type *fs_type,
  1557. int flags, void *data,
  1558. int (*fill_super)(struct super_block *, void *, int),
  1559. struct vfsmount *mnt);
  1560. extern int get_sb_nodev(struct file_system_type *fs_type,
  1561. int flags, void *data,
  1562. int (*fill_super)(struct super_block *, void *, int),
  1563. struct vfsmount *mnt);
  /* Superblock teardown helpers; the kill_*() ones match the kill_sb callback signature. */
  1564. void generic_shutdown_super(struct super_block *sb);
  1565. void kill_block_super(struct super_block *sb);
  1566. void kill_anon_super(struct super_block *sb);
  1567. void kill_litter_super(struct super_block *sb);
  1568. void deactivate_super(struct super_block *sb);
  1569. void deactivate_locked_super(struct super_block *sb);
  /* Signature matches the "set" callback accepted by sget() below. */
  1570. int set_anon_super(struct super_block *s, void *data);
  /* Takes caller-supplied test and set callbacks, each invoked with a super_block and @data. */
  1571. struct super_block *sget(struct file_system_type *type,
  1572. int (*test)(struct super_block *,void *),
  1573. int (*set)(struct super_block *,void *),
  1574. void *data);
  1575. extern int get_sb_pseudo(struct file_system_type *, char *,
  1576. const struct super_operations *ops, unsigned long,
  1577. struct vfsmount *mnt);
  1578. extern void simple_set_mnt(struct vfsmount *mnt, struct super_block *sb);
  1579. int __put_super_and_need_restart(struct super_block *sb);
  /* Alas, no aliases. Too much hassle with bringing module.h everywhere */

  /*
   * fops_get(fops): evaluates to @fops when it is non-NULL and
   * try_module_get() succeeds on its owner, otherwise to NULL.
   * The argument is evaluated more than once.
   */
  #define fops_get(fops) \
      (((fops) != NULL && try_module_get((fops)->owner)) ? (fops) : NULL)

  /*
   * fops_put(fops): calls module_put() on the owner of a non-NULL @fops;
   * does nothing for NULL.
   */
  #define fops_put(fops) \
      do { \
          if ((fops) != NULL) \
              module_put((fops)->owner); \
      } while (0)
  /* Registration of a struct file_system_type; both return int. */
  1585. extern int register_filesystem(struct file_system_type *);
  1586. extern int unregister_filesystem(struct file_system_type *);
  1587. extern struct vfsmount *kern_mount_data(struct file_system_type *, void *data);
  /* Convenience form of kern_mount_data() that passes NULL data. */
  1588. #define kern_mount(type) kern_mount_data(type, NULL)
  1589. extern int may_umount_tree(struct vfsmount *);
  1590. extern int may_umount(struct vfsmount *);
  1591. extern long do_mount(char *, char *, char *, unsigned long, void *);
  /* collect_mounts() returns a vfsmount; drop_collected_mounts() accepts one. */
  1592. extern struct vfsmount *collect_mounts(struct path *);
  1593. extern void drop_collected_mounts(struct vfsmount *);
  1594. extern int vfs_statfs(struct dentry *, struct kstatfs *);
  1595. extern int current_umask(void);
  1596. /* /sys/fs */
  1597. extern struct kobject *fs_kobj;
  1598. extern int rw_verify_area(int, struct file *, loff_t *, size_t);
  /*
   * FLOCK_VERIFY_WRITE is passed as the first argument of
   * locks_mandatory_area() by locks_verify_truncate() in this header.
   */
  1599. #define FLOCK_VERIFY_READ 1
  1600. #define FLOCK_VERIFY_WRITE 2
  /* Real implementations are declared only when file locking is configured; stubs follow in the #else branch. */
  1601. #ifdef CONFIG_FILE_LOCKING
  /* Called by locks_verify_locked() and locks_verify_truncate() below once mandatory_lock() says the inode qualifies. */
  1602. extern int locks_mandatory_locked(struct inode *);
  1603. extern int locks_mandatory_area(int, struct inode *, struct file *, loff_t, size_t);
  1604. /*
  1605. * Candidates for mandatory locking have the setgid bit set
  1606. * but no group execute bit - an otherwise meaningless combination.
  1607. */
  1608. static inline int __mandatory_lock(struct inode *ino)
  1609. {
  1610. return (ino->i_mode & (S_ISGID | S_IXGRP)) == S_ISGID;
  1611. }
  /*
   * Candidates only get mandatory locking on a filesystem mounted with
   * MS_MANDLOCK; elsewhere their locks stay advisory.
   *
   * Returns 1 when IS_MANDLOCK() holds and the inode is a candidate per
   * __mandatory_lock(), 0 otherwise.
   */
  static inline int mandatory_lock(struct inode *ino)
  {
      if (!IS_MANDLOCK(ino))
          return 0;

      return __mandatory_lock(ino) != 0;
  }
  /*
   * For an inode subject to mandatory locking, return the result of
   * locks_mandatory_locked(); for any other inode return 0.
   */
  static inline int locks_verify_locked(struct inode *inode)
  {
      return mandatory_lock(inode) ? locks_mandatory_locked(inode) : 0;
  }
  1626. static inline int locks_verify_truncate(struct inode *inode,
  1627. struct file *filp,
  1628. loff_t size)
  1629. {
  1630. if (inode->i_flock && mandatory_lock(inode))
  1631. return locks_mandatory_area(
  1632. FLOCK_VERIFY_WRITE, inode, filp,
  1633. size < inode->i_size ? size : inode->i_size,
  1634. (size < inode->i_size ? inode->i_size - size
  1635. : size - inode->i_size)
  1636. );
  1637. return 0;
  1638. }
  1639. static inline int break_lease(struct inode *inode, unsigned int mode)
  1640. {
  1641. if (inode->i_flock)
  1642. return __break_lease(inode, mode);
  1643. return 0;
  1644. }
  1645. #else /* !CONFIG_FILE_LOCKING */
  1646. static inline int locks_mandatory_locked(struct inode *inode)
  1647. {
  1648. return 0;
  1649. }
  1650. static inline int locks_mandatory_area(int rw, struct inode *inode,
  1651. struct file *filp, loff_t offset,
  1652. size_t count)
  1653. {
  1654. return 0;
  1655. }
  1656. static inline int __mandatory_lock(struct inode *inode)
  1657. {
  1658. return 0;
  1659. }
  1660. static inline int mandatory_lock(struct inode *inode)
  1661. {
  1662. return 0;
  1663. }
  1664. static inline int locks_verify_locked(struct inode *inode)
  1665. {
  1666. return 0;
  1667. }
  1668. static inline int locks_verify_truncate(struct inode *inode, struct file *filp,
  1669. size_t size)
  1670. {
  1671. return 0;
  1672. }
  1673. static inline int break_lease(struct inode *inode, unsigned int mode)
  1674. {
  1675. return 0;
  1676. }
  1677. #endif /* CONFIG_FILE_LOCKING */
  1678. /* fs/open.c */
  1679. extern int do_truncate(struct dentry *, loff_t start, unsigned int time_attrs,
  1680. struct file *filp);
  /* Takes a user-space filename; filp_open() below takes a kernel pointer instead. */
  1681. extern long do_sys_open(int dfd, const char __user *filename, int flags,
  1682. int mode);
  1683. extern struct file *filp_open(const char *, int, int);
  1684. extern struct file * dentry_open(struct dentry *, struct vfsmount *, int,
  1685. const struct cred *);
  1686. extern int filp_close(struct file *, fl_owner_t id);
  /* Takes a user-space string pointer and returns a kernel char pointer. */
  1687. extern char * getname(const char __user *);
  1688. /* fs/dcache.c */
  1689. extern void __init vfs_caches_init_early(void);
  1690. extern void __init vfs_caches_init(unsigned long);
  /* Slab cache behind the __getname()/__putname() macros below. */
  1691. extern struct kmem_cache *names_cachep;
  1692. #define __getname() kmem_cache_alloc(names_cachep, GFP_KERNEL)
  1693. #define __putname(name) kmem_cache_free(names_cachep, (void *)(name))
  /* Without CONFIG_AUDITSYSCALL putname() is just __putname(); with it, putname() is an out-of-line function. */
  1694. #ifndef CONFIG_AUDITSYSCALL
  1695. #define putname(name) __putname(name)
  1696. #else
  1697. extern void putname(const char *name);
  1698. #endif
  /* Block-device API: real declarations with CONFIG_BLOCK, a handful of inline no-op stubs without it. */
  1699. #ifdef CONFIG_BLOCK
  1700. extern int register_blkdev(unsigned int, const char *);
  1701. extern void unregister_blkdev(unsigned int, const char *);
  1702. extern struct block_device *bdget(dev_t);
  1703. extern void bd_set_size(struct block_device *, loff_t size);
  1704. extern void bd_forget(struct inode *inode);
  1705. extern void bdput(struct block_device *);
  1706. extern struct block_device *open_by_devnum(dev_t, fmode_t);
  1707. extern void invalidate_bdev(struct block_device *);
  1708. extern int sync_blockdev(struct block_device *bdev);
  /* freeze_bdev() returns a super_block pointer; thaw_bdev() takes the device and a super_block. */
  1709. extern struct super_block *freeze_bdev(struct block_device *);
  1710. extern void emergency_thaw_all(void);
  1711. extern int thaw_bdev(struct block_device *bdev, struct super_block *sb);
  1712. extern int fsync_bdev(struct block_device *);
  1713. #else
  /* Stubs are provided for only five of the functions above; each does nothing and returns 0/NULL where a value is required. */
  1714. static inline void bd_forget(struct inode *inode) {}
  1715. static inline int sync_blockdev(struct block_device *bdev) { return 0; }
  1716. static inline void invalidate_bdev(struct block_device *bdev) {}
  /* NOTE(review): the parameter is a block_device but is named "sb" - naming nit only, it is unused. */
  1717. static inline struct super_block *freeze_bdev(struct block_device *sb)
  1718. {
  1719. return NULL;
  1720. }
  1721. static inline int thaw_bdev(struct block_device *bdev, struct super_block *sb)
  1722. {
  1723. return 0;
  1724. }
  1725. #endif
  1726. extern int sync_filesystem(struct super_block *);
  /* Shared file_operations tables defined elsewhere. */
  1727. extern const struct file_operations def_blk_fops;
  1728. extern const struct file_operations def_chr_fops;
  1729. extern const struct file_operations bad_sock_fops;
  1730. extern const struct file_operations def_fifo_fops;
  1731. #ifdef CONFIG_BLOCK
  1732. extern int ioctl_by_bdev(struct block_device *, unsigned, unsigned long);
  1733. extern int blkdev_ioctl(struct block_device *, fmode_t, unsigned, unsigned long);
  /* Same signature as file_operations.compat_ioctl. */
  1734. extern long compat_blkdev_ioctl(struct file *, unsigned, unsigned long);
  1735. extern int blkdev_get(struct block_device *, fmode_t);
  1736. extern int blkdev_put(struct block_device *, fmode_t);
  /* bd_claim() takes a void * argument, named "holder" in the fallback macros below. */
  1737. extern int bd_claim(struct block_device *, void *);
  1738. extern void bd_release(struct block_device *);
  /* Without CONFIG_SYSFS the *_disk variants drop the gendisk argument and forward to bd_claim()/bd_release(). */
  1739. #ifdef CONFIG_SYSFS
  1740. extern int bd_claim_by_disk(struct block_device *, void *, struct gendisk *);
  1741. extern void bd_release_from_disk(struct block_device *, struct gendisk *);
  1742. #else
  1743. #define bd_claim_by_disk(bdev, holder, disk) bd_claim(bdev, holder)
  1744. #define bd_release_from_disk(bdev, disk) bd_release(bdev)
  1745. #endif
  1746. #endif
  1747. /* fs/char_dev.c */
  1748. #define CHRDEV_MAJOR_HASH_SIZE 255
  /* Character-device number registration; the *_region variants work on dev_t ranges. */
  1749. extern int alloc_chrdev_region(dev_t *, unsigned, unsigned, const char *);
  1750. extern int register_chrdev_region(dev_t, unsigned, const char *);
  1751. extern int register_chrdev(unsigned int, const char *,
  1752. const struct file_operations *);
  1753. extern void unregister_chrdev(unsigned int, const char *);
  1754. extern void unregister_chrdev_region(dev_t, unsigned);
  1755. extern void chrdev_show(struct seq_file *,off_t);
  1756. /* fs/block_dev.c */
  1757. #define BDEVNAME_SIZE 32 /* Largest string for a blockdev identifier */
  1758. #define BDEVT_SIZE 10 /* Largest string for MAJ:MIN for blkdev */
  /* BLKDEV_MAJOR_HASH_SIZE is 255 with CONFIG_BLOCK and 0 without it. */
  1759. #ifdef CONFIG_BLOCK
  1760. #define BLKDEV_MAJOR_HASH_SIZE 255
  /* NOTE(review): @buffer is presumably at least BDEVNAME_SIZE bytes - confirm. */
  1761. extern const char *__bdevname(dev_t, char *buffer);
  1762. extern const char *bdevname(struct block_device *bdev, char *buffer);
  1763. extern struct block_device *lookup_bdev(const char *);
  1764. extern struct block_device *open_bdev_exclusive(const char *, fmode_t, void *);
  1765. extern void close_bdev_exclusive(struct block_device *, fmode_t);
  1766. extern void blkdev_show(struct seq_file *,off_t);
  1767. #else
  1768. #define BLKDEV_MAJOR_HASH_SIZE 0
  1769. #endif
  1770. extern void init_special_inode(struct inode *, umode_t, dev_t);
  1771. /* Invalid inode operations -- fs/bad_inode.c */
  1772. extern void make_bad_inode(struct inode *);
  1773. extern int is_bad_inode(struct inode *);
  /* Three file_operations tables for pipes/FIFOs, one per open mode in the name. */
  1774. extern const struct file_operations read_pipefifo_fops;
  1775. extern const struct file_operations write_pipefifo_fops;
  1776. extern const struct file_operations rdwr_pipefifo_fops;
  1777. extern int fs_may_remount_ro(struct super_block *);
  1778. #ifdef CONFIG_BLOCK
  1779. /*
  1780. * return READ, READA, or WRITE
  1781. */
  /* Masks bi_rw with RW_MASK | RWA_MASK (both defined outside this section). */
  1782. #define bio_rw(bio) ((bio)->bi_rw & (RW_MASK | RWA_MASK))
  1783. /*
  1784. * return data direction, READ or WRITE
  1785. */
  /* Keeps only bit 0 of bi_rw. */
  1786. #define bio_data_dir(bio) ((bio)->bi_rw & 1)
  /* Disk change, revalidation and invalidation entry points; definitions live elsewhere. */
  1787. extern void check_disk_size_change(struct gendisk *disk,
  1788. struct block_device *bdev);
  1789. extern int revalidate_disk(struct gendisk *);
  1790. extern int check_disk_change(struct block_device *);
  1791. extern int __invalidate_device(struct block_device *);
  1792. extern int invalidate_partition(struct gendisk *, int);
  1793. #endif
  1794. extern int invalidate_inodes(struct super_block *);
  /*
   * Both take an address_space and a page-index range [start, end] and
   * return unsigned long; the __ variant adds a be_atomic flag.
   * NOTE(review): the return value is presumably a page count - confirm.
   */
  1795. unsigned long __invalidate_mapping_pages(struct address_space *mapping,
  1796. pgoff_t start, pgoff_t end,
  1797. bool be_atomic);
  1798. unsigned long invalidate_mapping_pages(struct address_space *mapping,
  1799. pgoff_t start, pgoff_t end);
  1800. static inline unsigned long __deprecated
  1801. invalidate_inode_pages(struct address_space *mapping)
  1802. {
  1803. return invalidate_mapping_pages(mapping, 0, ~0UL);
  1804. }
  1805. static inline void invalidate_remote_inode(struct inode *inode)
  1806. {
  1807. if (S_ISREG(inode->i_mode) || S_ISDIR(inode->i_mode) ||
  1808. S_ISLNK(inode->i_mode))
  1809. invalidate_mapping_pages(inode->i_mapping, 0, -1);
  1810. }
  /* Like the invalidate_mapping_pages() family above but returning int; the _range form takes page indices. */
  1811. extern int invalidate_inode_pages2(struct address_space *mapping);
  1812. extern int invalidate_inode_pages2_range(struct address_space *mapping,
  1813. pgoff_t start, pgoff_t end);
  1814. extern void generic_sync_sb_inodes(struct super_block *sb,
  1815. struct writeback_control *wbc);
  1816. extern int write_inode_now(struct inode *, int);
  /*
   * filemap_*() helpers on an address_space. Note the units: the *_range
   * write helpers take byte offsets (loff_t) while
   * wait_on_page_writeback_range() takes page indices (pgoff_t).
   */
  1817. extern int filemap_fdatawrite(struct address_space *);
  1818. extern int filemap_flush(struct address_space *);
  1819. extern int filemap_fdatawait(struct address_space *);
  1820. extern int filemap_write_and_wait(struct address_space *mapping);
  1821. extern int filemap_write_and_wait_range(struct address_space *mapping,
  1822. loff_t lstart, loff_t lend);
  1823. extern int wait_on_page_writeback_range(struct address_space *mapping,
  1824. pgoff_t start, pgoff_t end);
  1825. extern int __filemap_fdatawrite_range(struct address_space *mapping,
  1826. loff_t start, loff_t end, int sync_mode);
  1827. extern int filemap_fdatawrite_range(struct address_space *mapping,
  1828. loff_t start, loff_t end);
  /* Same parameter list as file_operations.fsync. */
  1829. extern int vfs_fsync(struct file *file, struct dentry *dentry, int datasync);
  1830. extern void sync_supers(void);
  1831. extern void emergency_sync(void);
  1832. extern void emergency_remount(void);
  1833. #ifdef CONFIG_BLOCK
  1834. extern sector_t bmap(struct inode *, sector_t);
  1835. #endif
  1836. extern int notify_change(struct dentry *, struct iattr *);
  1837. extern int inode_permission(struct inode *, int);
  /* Takes an optional-looking check_acl callback. NOTE(review): whether NULL is accepted is not visible here. */
  1838. extern int generic_permission(struct inode *, int,
  1839. int (*check_acl)(struct inode *, int));
  1840. static inline bool execute_ok(struct inode *inode)
  1841. {
  1842. return (inode->i_mode & S_IXUGO) || S_ISDIR(inode->i_mode);
  1843. }
  1844. extern int get_write_access(struct inode *);
  1845. extern int deny_write_access(struct file *);
  1846. static inline void put_write_access(struct inode * inode)
  1847. {
  1848. atomic_dec(&inode->i_writecount);
  1849. }
  1850. static inline void allow_write_access(struct file *file)
  1851. {
  1852. if (file)
  1853. atomic_inc(&file->f_path.dentry->d_inode->i_writecount);
  1854. }
  /* Pipe creation helpers. */
  1855. extern int do_pipe_flags(int *, int);
  1856. extern struct file *create_read_pipe(struct file *f, int flags);
  1857. extern struct file *create_write_pipe(int flags);
  1858. extern void free_write_pipe(struct file *);
  1859. extern struct file *do_filp_open(int dfd, const char *pathname,
  1860. int open_flag, int mode, int acc_mode);
  1861. extern int may_open(struct path *, int, int);
  1862. extern int kernel_read(struct file *, unsigned long, char *, unsigned long);
  1863. extern struct file * open_exec(const char *);
  1864. /* fs/dcache.c -- generic fs support functions */
  1865. extern int is_subdir(struct dentry *, struct dentry *);
  1866. extern ino_t find_inode_number(struct dentry *, struct qstr *);
  1867. #include <linux/err.h>
  1868. /* needed for stackable file system support */
  1869. extern loff_t default_llseek(struct file *file, loff_t offset, int origin);
  1870. extern loff_t vfs_llseek(struct file *file, loff_t offset, int origin);
  /* Inode lifetime and reference helpers. */
  1871. extern struct inode * inode_init_always(struct super_block *, struct inode *);
  1872. extern void inode_init_once(struct inode *);
  1873. extern void inode_add_to_lists(struct super_block *, struct inode *);
  1874. extern void iput(struct inode *);
  1875. extern struct inode * igrab(struct inode *);
  1876. extern ino_t iunique(struct super_block *, ino_t);
  1877. extern int inode_needs_sync(struct inode *inode);
  /* Both take a single inode, as super_operations.drop_inode does. */
  1878. extern void generic_delete_inode(struct inode *inode);
  1879. extern void generic_drop_inode(struct inode *inode);
  /*
   * Inode lookup helpers. The "5" variants take a hash value plus a
   * caller-supplied test callback and opaque data; the plain variants take
   * only an inode number.
   */
  1880. extern struct inode *ilookup5_nowait(struct super_block *sb,
  1881. unsigned long hashval, int (*test)(struct inode *, void *),
  1882. void *data);
  1883. extern struct inode *ilookup5(struct super_block *sb, unsigned long hashval,
  1884. int (*test)(struct inode *, void *), void *data);
  1885. extern struct inode *ilookup(struct super_block *sb, unsigned long ino);
  1886. extern struct inode * iget5_locked(struct super_block *, unsigned long, int (*test)(struct inode *, void *), int (*set)(struct inode *, void *), void *);
  1887. extern struct inode * iget_locked(struct super_block *, unsigned long);
  1888. extern int insert_inode_locked4(struct inode *, unsigned long, int (*test)(struct inode *, void *), void *);
  1889. extern int insert_inode_locked(struct inode *);
  /* Per the I_NEW description in the inode state comment, this clears I_LOCK and I_NEW. */
  1890. extern void unlock_new_inode(struct inode *);
  1891. extern void __iget(struct inode * inode);
  1892. extern void iget_failed(struct inode *);
  1893. extern void clear_inode(struct inode *);
  1894. extern void destroy_inode(struct inode *);
  1895. extern struct inode *new_inode(struct super_block *);
  1896. extern int should_remove_suid(struct dentry *);
  1897. extern int file_remove_suid(struct file *);
  /* insert_inode_hash() in this header calls __insert_inode_hash() with i_ino as the hash value. */
  1898. extern void __insert_inode_hash(struct inode *, unsigned long hashval);
  1899. extern void remove_inode_hash(struct inode *);
  1900. static inline void insert_inode_hash(struct inode *inode) {
  1901. __insert_inode_hash(inode, inode->i_ino);
  1902. }
  /* struct file allocation and list management. */
  1903. extern struct file * get_empty_filp(void);
  1904. extern void file_move(struct file *f, struct list_head *list);
  1905. extern void file_kill(struct file *f);
  1906. #ifdef CONFIG_BLOCK
  1907. struct bio;
  1908. extern void submit_bio(int, struct bio *);
  1909. extern int bdev_read_only(struct block_device *);
  1910. #endif
  /* Block size helpers; note set_blocksize() is declared even without CONFIG_BLOCK. */
  1911. extern int set_blocksize(struct block_device *, int);
  1912. extern int sb_set_blocksize(struct super_block *, int);
  1913. extern int sb_min_blocksize(struct super_block *, int);
  1914. extern int sb_has_dirty_inodes(struct super_block *);
  /* Generic implementations whose signatures match file_operations.mmap. */
  1915. extern int generic_file_mmap(struct file *, struct vm_area_struct *);
  1916. extern int generic_file_readonly_mmap(struct file *, struct vm_area_struct *);
  1917. extern int file_read_actor(read_descriptor_t * desc, struct page *page, unsigned long offset, unsigned long size);
  /* @pos and @count are pointers. NOTE(review): presumably adjusted in place - confirm. */
  1918. int generic_write_checks(struct file *file, loff_t *pos, size_t *count, int isblk);
  /* Generic implementations whose signatures match file_operations.aio_read / aio_write. */
  1919. extern ssize_t generic_file_aio_read(struct kiocb *, const struct iovec *, unsigned long, loff_t);
  1920. extern ssize_t generic_file_aio_write(struct kiocb *, const struct iovec *, unsigned long, loff_t);
  1921. extern ssize_t generic_file_aio_write_nolock(struct kiocb *, const struct iovec *,
  1922. unsigned long, loff_t);
  /* The direct variant takes a pointer to the segment count; the buffered one takes it by value. */
  1923. extern ssize_t generic_file_direct_write(struct kiocb *, const struct iovec *,
  1924. unsigned long *, loff_t, loff_t *, size_t, size_t);
  1925. extern ssize_t generic_file_buffered_write(struct kiocb *, const struct iovec *,
  1926. unsigned long, loff_t, loff_t *, size_t, ssize_t);
  /* Signatures match file_operations.read / write. */
  1927. extern ssize_t do_sync_read(struct file *filp, char __user *buf, size_t len, loff_t *ppos);
  1928. extern ssize_t do_sync_write(struct file *filp, const char __user *buf, size_t len, loff_t *ppos);
  1929. extern int generic_segment_checks(const struct iovec *iov,
  1930. unsigned long *nr_segs, size_t *count, int access_flags);
  1931. /* fs/splice.c */
  /* Signatures match file_operations.splice_read / splice_write. */
  1932. extern ssize_t generic_file_splice_read(struct file *, loff_t *,
  1933. struct pipe_inode_info *, size_t, unsigned int);
  1934. extern ssize_t default_file_splice_read(struct file *, loff_t *,
  1935. struct pipe_inode_info *, size_t, unsigned int);
  1936. extern ssize_t generic_file_splice_write(struct pipe_inode_info *,
  1937. struct file *, loff_t *, size_t, unsigned int);
  1938. extern ssize_t generic_splice_sendpage(struct pipe_inode_info *pipe,
  1939. struct file *out, loff_t *, size_t len, unsigned int flags);
  1940. extern long do_splice_direct(struct file *in, loff_t *ppos, struct file *out,
  1941. size_t len, unsigned int flags);
  1942. extern void
  1943. file_ra_state_init(struct file_ra_state *ra, struct address_space *mapping);
  /* Signatures match file_operations.llseek. */
  1944. extern loff_t no_llseek(struct file *file, loff_t offset, int origin);
  1945. extern loff_t generic_file_llseek(struct file *file, loff_t offset, int origin);
  1946. extern loff_t generic_file_llseek_unlocked(struct file *file, loff_t offset,
  1947. int origin);
  /* Signatures match file_operations.open. */
  1948. extern int generic_file_open(struct inode * inode, struct file * filp);
  1949. extern int nonseekable_open(struct inode * inode, struct file * filp);
  1950. #ifdef CONFIG_FS_XIP
  1951. extern ssize_t xip_file_read(struct file *filp, char __user *buf, size_t len,
  1952. loff_t *ppos);
  1953. extern int xip_file_mmap(struct file * file, struct vm_area_struct * vma);
  1954. extern ssize_t xip_file_write(struct file *filp, const char __user *buf,
  1955. size_t len, loff_t *ppos);
  1956. extern int xip_truncate_page(struct address_space *mapping, loff_t from);
  1957. #else
  1958. static inline int xip_truncate_page(struct address_space *mapping, loff_t from)
  1959. {
  1960. return 0;
  1961. }
  1962. #endif
  1963. #ifdef CONFIG_BLOCK
  1964. ssize_t __blockdev_direct_IO(int rw, struct kiocb *iocb, struct inode *inode,
  1965. struct block_device *bdev, const struct iovec *iov, loff_t offset,
  1966. unsigned long nr_segs, get_block_t get_block, dio_iodone_t end_io,
  1967. int lock_type);
  /* Values passed as the lock_type argument of __blockdev_direct_IO(). */
  enum {
          /* need locking between buffered and direct access */
          DIO_LOCKING = 1,
          /* bdev; no locking at all between buffered/direct */
          DIO_NO_LOCKING = 2,
          /* filesystem locks buffered and direct internally */
          DIO_OWN_LOCKING = 3,
  };
  1973. static inline ssize_t blockdev_direct_IO(int rw, struct kiocb *iocb,
  1974. struct inode *inode, struct block_device *bdev, const struct iovec *iov,
  1975. loff_t offset, unsigned long nr_segs, get_block_t get_block,
  1976. dio_iodone_t end_io)
  1977. {
  1978. return __blockdev_direct_IO(rw, iocb, inode, bdev, iov, offset,
  1979. nr_segs, get_block, end_io, DIO_LOCKING);
  1980. }
  1981. static inline ssize_t blockdev_direct_IO_no_locking(int rw, struct kiocb *iocb,
  1982. struct inode *inode, struct block_device *bdev, const struct iovec *iov,
  1983. loff_t offset, unsigned long nr_segs, get_block_t get_block,
  1984. dio_iodone_t end_io)
  1985. {
  1986. return __blockdev_direct_IO(rw, iocb, inode, bdev, iov, offset,
  1987. nr_segs, get_block, end_io, DIO_NO_LOCKING);
  1988. }
  1989. static inline ssize_t blockdev_direct_IO_own_locking(int rw, struct kiocb *iocb,
  1990. struct inode *inode, struct block_device *bdev, const struct iovec *iov,
  1991. loff_t offset, unsigned long nr_segs, get_block_t get_block,
  1992. dio_iodone_t end_io)
  1993. {
  1994. return __blockdev_direct_IO(rw, iocb, inode, bdev, iov, offset,
  1995. nr_segs, get_block, end_io, DIO_OWN_LOCKING);
  1996. }
  1997. #endif
  extern const struct file_operations generic_ro_fops;

  /* Non-zero when mode @m passes any of S_ISCHR, S_ISBLK, S_ISFIFO, S_ISSOCK. */
  #define special_file(m) \
          (S_ISCHR(m) || S_ISBLK(m) || S_ISFIFO(m) || S_ISSOCK(m))
  2000. extern int vfs_readlink(struct dentry *, char __user *, int, const char *);
  2001. extern int vfs_follow_link(struct nameidata *, const char *);
  2002. extern int page_readlink(struct dentry *, char __user *, int);
  2003. extern void *page_follow_link_light(struct dentry *, struct nameidata *);
  2004. extern void page_put_link(struct dentry *, struct nameidata *, void *);
  2005. extern int __page_symlink(struct inode *inode, const char *symname, int len,
  2006. int nofs);
  2007. extern int page_symlink(struct inode *inode, const char *symname, int len);
  2008. extern const struct inode_operations page_symlink_inode_operations;
  2009. extern int generic_readlink(struct dentry *, char __user *, int);
  2010. extern void generic_fillattr(struct inode *, struct kstat *);
  2011. extern int vfs_getattr(struct vfsmount *, struct dentry *, struct kstat *);
  2012. void inode_add_bytes(struct inode *inode, loff_t bytes);
  2013. void inode_sub_bytes(struct inode *inode, loff_t bytes);
  2014. loff_t inode_get_bytes(struct inode *inode);
  2015. void inode_set_bytes(struct inode *inode, loff_t bytes);
  2016. extern int vfs_readdir(struct file *, filldir_t, void *);
  2017. extern int vfs_stat(char __user *, struct kstat *);
  2018. extern int vfs_lstat(char __user *, struct kstat *);
  2019. extern int vfs_fstat(unsigned int, struct kstat *);
  2020. extern int vfs_fstatat(int , char __user *, struct kstat *, int);
  2021. extern int do_vfs_ioctl(struct file *filp, unsigned int fd, unsigned int cmd,
  2022. unsigned long arg);
  2023. extern int __generic_block_fiemap(struct inode *inode,
  2024. struct fiemap_extent_info *fieinfo, u64 start,
  2025. u64 len, get_block_t *get_block);
  2026. extern int generic_block_fiemap(struct inode *inode,
  2027. struct fiemap_extent_info *fieinfo, u64 start,
  2028. u64 len, get_block_t *get_block);
  /* file_system_type and super_block lookup / release prototypes. */
  void get_filesystem(struct file_system_type *fs);
  void put_filesystem(struct file_system_type *fs);
  struct file_system_type *get_fs_type(const char *name);
  struct super_block *get_super(struct block_device *);
  struct super_block *user_get_super(dev_t);
  void drop_super(struct super_block *sb);
  2035. extern int dcache_dir_open(struct inode *, struct file *);
  2036. extern int dcache_dir_close(struct inode *, struct file *);
  2037. extern loff_t dcache_dir_lseek(struct file *, loff_t, int);
  2038. extern int dcache_readdir(struct file *, void *, filldir_t);
  2039. extern int simple_getattr(struct vfsmount *, struct dentry *, struct kstat *);
  2040. extern int simple_statfs(struct dentry *, struct kstatfs *);
  2041. extern int simple_link(struct dentry *, struct inode *, struct dentry *);
  2042. extern int simple_unlink(struct inode *, struct dentry *);
  2043. extern int simple_rmdir(struct inode *, struct dentry *);
  2044. extern int simple_rename(struct inode *, struct dentry *, struct inode *, struct dentry *);
  2045. extern int simple_sync_file(struct file *, struct dentry *, int);
  2046. extern int simple_empty(struct dentry *);
  2047. extern int simple_readpage(struct file *file, struct page *page);
  2048. extern int simple_prepare_write(struct file *file, struct page *page,
  2049. unsigned offset, unsigned to);
  2050. extern int simple_write_begin(struct file *file, struct address_space *mapping,
  2051. loff_t pos, unsigned len, unsigned flags,
  2052. struct page **pagep, void **fsdata);
  2053. extern int simple_write_end(struct file *file, struct address_space *mapping,
  2054. loff_t pos, unsigned len, unsigned copied,
  2055. struct page *page, void *fsdata);
  2056. extern struct dentry *simple_lookup(struct inode *, struct dentry *, struct nameidata *);
  2057. extern ssize_t generic_read_dir(struct file *, char __user *, size_t, loff_t *);
  2058. extern const struct file_operations simple_dir_operations;
  2059. extern const struct inode_operations simple_dir_inode_operations;
  2060. struct tree_descr { char *name; const struct file_operations *ops; int mode; };
  2061. struct dentry *d_alloc_name(struct dentry *, const char *);
  2062. extern int simple_fill_super(struct super_block *, int, struct tree_descr *);
  2063. extern int simple_pin_fs(struct file_system_type *, struct vfsmount **mount, int *count);
  2064. extern void simple_release_fs(struct vfsmount **mount, int *count);
  2065. extern ssize_t simple_read_from_buffer(void __user *to, size_t count,
  2066. loff_t *ppos, const void *from, size_t available);
  2067. extern int simple_fsync(struct file *, struct dentry *, int);
  #ifdef CONFIG_MIGRATION
  int buffer_migrate_page(struct address_space *, struct page *, struct page *);
  #else /* !CONFIG_MIGRATION */
  /* Without CONFIG_MIGRATION the name simply expands to NULL. */
  #define buffer_migrate_page NULL
  #endif /* CONFIG_MIGRATION */
  2074. extern int inode_change_ok(struct inode *, struct iattr *);
  2075. extern int __must_check inode_setattr(struct inode *, struct iattr *);
  2076. extern void file_update_time(struct file *file);
  2077. extern int generic_show_options(struct seq_file *m, struct vfsmount *mnt);
  2078. extern void save_mount_options(struct super_block *sb, char *options);
  2079. extern void replace_mount_options(struct super_block *sb, char *options);
  2080. static inline ino_t parent_ino(struct dentry *dentry)
  2081. {
  2082. ino_t res;
  2083. spin_lock(&dentry->d_lock);
  2084. res = dentry->d_parent->d_inode->i_ino;
  2085. spin_unlock(&dentry->d_lock);
  2086. return res;
  2087. }
  2088. /* Transaction based IO helpers */
  /*
   * An argresp is stored in an allocated page and holds the size of the
   * argument or response, along with its content.
   *
   * @size: size of the argument or response
   * @data: the content itself; declared as a C99 flexible array member
   *        (rather than the GNU zero-length "data[0]" form), so it adds
   *        nothing to sizeof(struct simple_transaction_argresp)
   */
  struct simple_transaction_argresp {
          ssize_t size;
          char data[];
  };
  2097. #define SIMPLE_TRANSACTION_LIMIT (PAGE_SIZE - sizeof(struct simple_transaction_argresp))
  2098. char *simple_transaction_get(struct file *file, const char __user *buf,
  2099. size_t size);
  2100. ssize_t simple_transaction_read(struct file *file, char __user *buf,
  2101. size_t size, loff_t *pos);
  2102. int simple_transaction_release(struct inode *inode, struct file *file);
  2103. void simple_transaction_set(struct file *file, size_t n);
  /*
   * Simple attribute files
   *
   * These attributes behave similarly to those in sysfs:
   *
   * - Writing to an attribute sets a value immediately; an open file can
   *   be written to multiple times.
   *
   * - Reading from an attribute creates a buffer from the value, which may
   *   be consumed by several read calls.  Once the attribute has been read
   *   completely, no further reads are possible until the file is opened
   *   again.
   *
   * Every attribute is a text representation of a numeric value that is
   * accessed through the get() and set() functions.
   *
   * DEFINE_SIMPLE_ATTRIBUTE(__fops, __get, __set, __fmt) emits:
   *   - a static <__fops>_open() that passes __fmt with a 0ull argument to
   *     __simple_attr_check_format() and then returns the result of
   *     simple_attr_open(inode, file, __get, __set, __fmt);
   *   - a static struct file_operations named __fops that uses that open
   *     routine together with the simple_attr_release/read/write handlers.
   */
  #define DEFINE_SIMPLE_ATTRIBUTE(__fops, __get, __set, __fmt) \
  static int __fops ## _open(struct inode *inode, struct file *file) \
  { \
          __simple_attr_check_format(__fmt, 0ull); \
          return simple_attr_open(inode, file, __get, __set, __fmt); \
  } \
  static struct file_operations __fops = { \
          .owner   = THIS_MODULE, \
          .open    = __fops ## _open, \
          .read    = simple_attr_read, \
          .write   = simple_attr_write, \
          .release = simple_attr_release, \
  };
  /*
   * Empty function carrying a printf format attribute (format string is
   * argument 1, variadic arguments start at 2), so the compiler checks the
   * arguments against @fmt.  It does nothing at run time.
   */
  static inline __attribute__((format(printf, 1, 2)))
  void __simple_attr_check_format(const char *fmt, ...)
  {
          /* intentionally empty: only the compile-time format check matters */
  }
  2138. int simple_attr_open(struct inode *inode, struct file *file,
  2139. int (*get)(void *, u64 *), int (*set)(void *, u64),
  2140. const char *fmt);
  2141. int simple_attr_release(struct inode *inode, struct file *file);
  2142. ssize_t simple_attr_read(struct file *file, char __user *buf,
  2143. size_t len, loff_t *ppos);
  2144. ssize_t simple_attr_write(struct file *file, const char __user *buf,
  2145. size_t len, loff_t *ppos);
  2146. struct ctl_table;
  2147. int proc_nr_files(struct ctl_table *table, int write, struct file *filp,
  2148. void __user *buffer, size_t *lenp, loff_t *ppos);
  2149. int __init get_filesystem_list(char *buf);
  2150. #endif /* __KERNEL__ */
  2151. #endif /* _LINUX_FS_H */