namei.c 45 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127
71278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320132113221323132413251326132713281329133013311332133313341335133613371338133913401341134213431344134513461347134813491350135113521353135413551356135713581359136013611362136313641365136613671368136913701371137213731374137513761377137813791380138113821383138413851386138713881389139013911392139313941395139613971398139914001401140214031404140514061407140814091410141114121413141414151416141714181419142014211422142314241425142614271428142914301431143214331434143514361437143814391440144114421443144414451446144714481449145014511452145314541455145614571458145914601461146214631464146514661467146814691470147114721473147414751476147714781479148014811482148314841485148614871488148914901491149214931494149514961497149814991500150115021503150415051506150715081509151015111512151315141515151615171518151915201521152215231524152515261527152815291530153115321533153415351536153715381539154015411542154315441545154615471548154915501551155215531554155515561557155815591560156115621563156415651566156715681569157015711572157315741575157615771578157915801581158215831584158515861587158815891590159115921593159415951596159715981599160016011602160316041605160616071608160916101611161216131614161516161617161816191620162116221623162416251626162716281629163016311632163316341635163616371638163916401641164216431644164516461647164816491650165116521653165416551656165716581659166016611662166316641665166616671668166916701671167216731674167516761677167816791680168116821683168416851686168716881689169016911692169316941695169616971698169917001701170217031704170517061707170817091710171117121713171417151716171717181719172017211722172317241725172617271728172917301731173217331734173517361737173817391740174117421743174417451746174717481749175017511752175317541755175617571758175917601761176217631764176517661767176817691770177117721773177417751776177
717781779178017811782178317841785178617871788178917901791179217931794179517961797179817991800180118021803180418051806180718081809181018111812181318141815181618171818181918201821182218231824182518261827182818291830183118321833183418351836183718381839184018411842184318441845184618471848184918501851185218531854185518561857185818591860186118621863186418651866186718681869187018711872187318741875187618771878187918801881188218831884188518861887188818891890189118921893189418951896189718981899190019011902190319041905190619071908190919101911191219131914
  1. /* -*- mode: c; c-basic-offset: 8; -*-
  2. * vim: noexpandtab sw=8 ts=8 sts=0:
  3. *
  4. * namei.c
  5. *
  6. * Create and rename file, directory, symlinks
  7. *
  8. * Copyright (C) 2002, 2004 Oracle. All rights reserved.
  9. *
  10. * Portions of this code from linux/fs/ext3/dir.c
  11. *
  12. * Copyright (C) 1992, 1993, 1994, 1995
  13. * Remy Card (card@masi.ibp.fr)
  14. * Laboratoire MASI - Institut Blaise pascal
  15. * Universite Pierre et Marie Curie (Paris VI)
  16. *
  17. * from
  18. *
  19. * linux/fs/minix/dir.c
  20. *
  21. * Copyright (C) 1991, 1992 Linus Torvalds
  22. *
  23. * This program is free software; you can redistribute it and/or
  24. * modify it under the terms of the GNU General Public
  25. * License as published by the Free Software Foundation; either
  26. * version 2 of the License, or (at your option) any later version.
  27. *
  28. * This program is distributed in the hope that it will be useful,
  29. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  30. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  31. * General Public License for more details.
  32. *
  33. * You should have received a copy of the GNU General Public
  34. * License along with this program; if not, write to the
  35. * Free Software Foundation, Inc., 59 Temple Place - Suite 330,
  36. * Boston, MA 02111-1307, USA.
  37. */
  38. #include <linux/fs.h>
  39. #include <linux/types.h>
  40. #include <linux/slab.h>
  41. #include <linux/highmem.h>
  42. #define MLOG_MASK_PREFIX ML_NAMEI
  43. #include <cluster/masklog.h>
  44. #include "ocfs2.h"
  45. #include "alloc.h"
  46. #include "dcache.h"
  47. #include "dir.h"
  48. #include "dlmglue.h"
  49. #include "extent_map.h"
  50. #include "file.h"
  51. #include "inode.h"
  52. #include "journal.h"
  53. #include "namei.h"
  54. #include "suballoc.h"
  55. #include "super.h"
  56. #include "symlink.h"
  57. #include "sysfile.h"
  58. #include "uptodate.h"
  59. #include "vote.h"
  60. #include "buffer_head_io.h"
  /*
   * Forward declarations of static helpers, so that they can be called
   * in this file before their definitions appear.
   */
  61. static int ocfs2_mknod_locked(struct ocfs2_super *osb,
  62. struct inode *dir,
  63. struct dentry *dentry, int mode,
  64. dev_t dev,
  65. struct buffer_head **new_fe_bh,
  66. struct buffer_head *parent_fe_bh,
  67. handle_t *handle,
  68. struct inode **ret_inode,
  69. struct ocfs2_alloc_context *inode_ac);
  70. static int ocfs2_prepare_orphan_dir(struct ocfs2_super *osb,
  71. struct inode **ret_orphan_dir,
  72. struct inode *inode,
  73. char *name,
  74. struct buffer_head **de_bh);
  75. static int ocfs2_orphan_add(struct ocfs2_super *osb,
  76. handle_t *handle,
  77. struct inode *inode,
  78. struct ocfs2_dinode *fe,
  79. char *name,
  80. struct buffer_head *de_bh,
  81. struct inode *orphan_dir_inode);
  82. static int ocfs2_create_symlink_data(struct ocfs2_super *osb,
  83. handle_t *handle,
  84. struct inode *inode,
  85. const char *symname);
  86. /* An orphan dir name is an 8 byte value, printed as a hex string */
  /*
   * That is two hex characters per byte of a u64.  The macro does not
   * count a terminating NUL: name buffers in this file are declared as
   * OCFS2_ORPHAN_NAMELEN + 1 bytes.
   */
  87. #define OCFS2_ORPHAN_NAMELEN ((int)(2 * sizeof(u64)))
  /*
   * ocfs2_lookup() - look up the name held in @dentry inside directory @dir.
   *
   * The metadata cluster lock on @dir is taken with ocfs2_meta_lock() and
   * is held across both the name lookup and the d_splice_alias() call.
   * @nd is not used by this function.
   *
   * Returns the value produced by d_splice_alias() on the normal path, or
   * an ERR_PTR():
   *   -ENAMETOOLONG  the name is longer than OCFS2_MAX_FILENAME_LEN
   *   <lock error>   ocfs2_meta_lock() failed
   *   -EACCES        ocfs2_iget() returned an error pointer
   *   <lock error>   ocfs2_dentry_attach_lock() failed
   */
  88. static struct dentry *ocfs2_lookup(struct inode *dir, struct dentry *dentry,
  89. struct nameidata *nd)
  90. {
  91. int status;
  92. u64 blkno;
  93. struct inode *inode = NULL;
  94. struct dentry *ret;
  95. struct ocfs2_inode_info *oi;
  96. mlog_entry("(0x%p, 0x%p, '%.*s')\n", dir, dentry,
  97. dentry->d_name.len, dentry->d_name.name);
  98. if (dentry->d_name.len > OCFS2_MAX_FILENAME_LEN) {
  99. ret = ERR_PTR(-ENAMETOOLONG);
  100. goto bail;
  101. }
  102. mlog(0, "find name %.*s in directory %llu\n", dentry->d_name.len,
  103. dentry->d_name.name, (unsigned long long)OCFS2_I(dir)->ip_blkno);
  104. status = ocfs2_meta_lock(dir, NULL, 0);
  105. if (status < 0) {
  106. if (status != -ENOENT)
  107. mlog_errno(status);
  108. ret = ERR_PTR(status);
  109. goto bail;
  110. }
  111. status = ocfs2_lookup_ino_from_name(dir, dentry->d_name.name,
  112. dentry->d_name.len, &blkno);
  /* Name lookup failed: inode is still NULL and is handed to
   * d_splice_alias() as such; the lookup error itself is not returned. */
  113. if (status < 0)
  114. goto bail_add;
  115. inode = ocfs2_iget(OCFS2_SB(dir->i_sb), blkno, 0);
  /* Any ocfs2_iget() failure is reported to the caller as -EACCES. */
  116. if (IS_ERR(inode)) {
  117. ret = ERR_PTR(-EACCES);
  118. goto bail_unlock;
  119. }
  120. oi = OCFS2_I(inode);
  121. /* Clear any orphaned state... If we were able to look up the
  122. * inode from a directory, it certainly can't be orphaned. We
  123. * might have the bad state from a node which intended to
  124. * orphan this inode but crashed before it could commit the
  125. * unlink. */
  126. spin_lock(&oi->ip_lock);
  127. oi->ip_flags &= ~OCFS2_INODE_MAYBE_ORPHANED;
  128. spin_unlock(&oi->ip_lock);
  129. bail_add:
  130. dentry->d_op = &ocfs2_dentry_ops;
  131. ret = d_splice_alias(inode, dentry);
  132. if (inode) {
  133. /*
  134. * If d_splice_alias() finds a DCACHE_DISCONNECTED
  135. * dentry, it will d_move() it on top of ourselves. The
  136. * return value will indicate this however, so in
  137. * those cases, we switch them around for the locking
  138. * code.
  139. *
  140. * NOTE: This dentry already has ->d_op set from
  141. * ocfs2_get_parent() and ocfs2_get_dentry()
  142. */
  143. if (ret)
  144. dentry = ret;
  145. status = ocfs2_dentry_attach_lock(dentry, inode,
  146. OCFS2_I(dir)->ip_blkno);
  147. if (status) {
  148. mlog_errno(status);
  149. ret = ERR_PTR(status);
  150. goto bail_unlock;
  151. }
  152. }
  153. bail_unlock:
  154. /* Don't drop the cluster lock until *after* the d_add --
  155. * unlink on another node will message us to remove that
  156. * dentry under this lock so otherwise we can race this with
  157. * the vote thread and have a stale dentry. */
  158. ocfs2_meta_unlock(dir, 0);
  159. bail:
  160. mlog_exit_ptr(ret);
  161. return ret;
  162. }
  /*
   * ocfs2_mknod() - create a new inode of type @mode named by @dentry in @dir.
   *
   * Sequence, all under the metadata lock on @dir (taken with the last
   * argument 1 -- presumably exclusive):
   *   1. reject a new directory when @dir already has OCFS2_LINK_MAX links
   *      (-EMLINK) and any create in a directory whose on-disk link count
   *      is zero (-ENOENT);
   *   2. ocfs2_check_dir_for_entry() on the name, then reserve a directory
   *      slot, an inode and -- for directories when inline data is not
   *      supported -- one cluster;
   *   3. start a transaction and create the inode with ocfs2_mknod_locked();
   *   4. for directories, fill the new directory and bump the parent's link
   *      count both on disk and in memory;
   *   5. add the directory entry, attach the dentry lock, hash the inode
   *      and instantiate the dentry.
   *
   * @dev is passed through to ocfs2_mknod_locked().
   *
   * Returns 0 on success or a negative errno.
   */
  163. static int ocfs2_mknod(struct inode *dir,
  164. struct dentry *dentry,
  165. int mode,
  166. dev_t dev)
  167. {
  168. int status = 0;
  169. struct buffer_head *parent_fe_bh = NULL;
  170. handle_t *handle = NULL;
  171. struct ocfs2_super *osb;
  172. struct ocfs2_dinode *dirfe;
  173. struct buffer_head *new_fe_bh = NULL;
  174. struct buffer_head *de_bh = NULL;
  175. struct inode *inode = NULL;
  176. struct ocfs2_alloc_context *inode_ac = NULL;
  177. struct ocfs2_alloc_context *data_ac = NULL;
  178. mlog_entry("(0x%p, 0x%p, %d, %lu, '%.*s')\n", dir, dentry, mode,
  179. (unsigned long)dev, dentry->d_name.len,
  180. dentry->d_name.name);
  181. /* get our super block */
  182. osb = OCFS2_SB(dir->i_sb);
  183. status = ocfs2_meta_lock(dir, &parent_fe_bh, 1);
  184. if (status < 0) {
  185. if (status != -ENOENT)
  186. mlog_errno(status);
  /* The lock was not obtained, so the "leave" cleanup (which
   * unlocks @dir) must be bypassed.  NOTE(review): this return
   * has no matching mlog_exit() for the mlog_entry() above. */
  187. return status;
  188. }
  189. if (S_ISDIR(mode) && (dir->i_nlink >= OCFS2_LINK_MAX)) {
  190. status = -EMLINK;
  191. goto leave;
  192. }
  193. dirfe = (struct ocfs2_dinode *) parent_fe_bh->b_data;
  194. if (!dirfe->i_links_count) {
  195. /* can't make a file in a deleted directory. */
  196. status = -ENOENT;
  197. goto leave;
  198. }
  199. status = ocfs2_check_dir_for_entry(dir, dentry->d_name.name,
  200. dentry->d_name.len);
  201. if (status)
  202. goto leave;
  203. /* get a spot inside the dir. */
  204. status = ocfs2_prepare_dir_for_insert(osb, dir, parent_fe_bh,
  205. dentry->d_name.name,
  206. dentry->d_name.len, &de_bh);
  207. if (status < 0) {
  208. mlog_errno(status);
  209. goto leave;
  210. }
  211. /* reserve an inode spot */
  212. status = ocfs2_reserve_new_inode(osb, &inode_ac);
  213. if (status < 0) {
  214. if (status != -ENOSPC)
  215. mlog_errno(status);
  216. goto leave;
  217. }
  218. /* Reserve a cluster if creating an extent based directory. */
  219. if (S_ISDIR(mode) && !ocfs2_supports_inline_data(osb)) {
  220. status = ocfs2_reserve_clusters(osb, 1, &data_ac);
  221. if (status < 0) {
  222. if (status != -ENOSPC)
  223. mlog_errno(status);
  224. goto leave;
  225. }
  226. }
  227. handle = ocfs2_start_trans(osb, OCFS2_MKNOD_CREDITS);
  228. if (IS_ERR(handle)) {
  229. status = PTR_ERR(handle);
  /* Reset to NULL so "leave" does not try to commit an error pointer. */
  230. handle = NULL;
  231. mlog_errno(status);
  232. goto leave;
  233. }
  234. /* do the real work now. */
  235. status = ocfs2_mknod_locked(osb, dir, dentry, mode, dev,
  236. &new_fe_bh, parent_fe_bh, handle,
  237. &inode, inode_ac);
  238. if (status < 0) {
  239. mlog_errno(status);
  240. goto leave;
  241. }
  242. if (S_ISDIR(mode)) {
  243. status = ocfs2_fill_new_dir(osb, handle, dir, inode,
  244. new_fe_bh, data_ac);
  245. if (status < 0) {
  246. mlog_errno(status);
  247. goto leave;
  248. }
  249. status = ocfs2_journal_access(handle, dir, parent_fe_bh,
  250. OCFS2_JOURNAL_ACCESS_WRITE);
  251. if (status < 0) {
  252. mlog_errno(status);
  253. goto leave;
  254. }
  /* A new subdirectory adds one link to the parent: on disk first,
   * then (only once the buffer is journalled) in the VFS inode. */
  255. le16_add_cpu(&dirfe->i_links_count, 1);
  256. status = ocfs2_journal_dirty(handle, parent_fe_bh);
  257. if (status < 0) {
  258. mlog_errno(status);
  259. goto leave;
  260. }
  261. inc_nlink(dir);
  262. }
  263. status = ocfs2_add_entry(handle, dentry, inode,
  264. OCFS2_I(inode)->ip_blkno, parent_fe_bh,
  265. de_bh);
  266. if (status < 0) {
  267. mlog_errno(status);
  268. goto leave;
  269. }
  270. status = ocfs2_dentry_attach_lock(dentry, inode,
  271. OCFS2_I(dir)->ip_blkno);
  272. if (status) {
  273. mlog_errno(status);
  274. goto leave;
  275. }
  276. insert_inode_hash(inode);
  277. dentry->d_op = &ocfs2_dentry_ops;
  278. d_instantiate(dentry, inode);
  279. status = 0;
  280. leave:
  /* The transaction is committed on the error paths as well. */
  281. if (handle)
  282. ocfs2_commit_trans(osb, handle);
  283. ocfs2_meta_unlock(dir, 1);
  284. if (status == -ENOSPC)
  285. mlog(0, "Disk is full\n");
  286. if (new_fe_bh)
  287. brelse(new_fe_bh);
  288. if (de_bh)
  289. brelse(de_bh);
  290. if (parent_fe_bh)
  291. brelse(parent_fe_bh);
  /* Only a failed create drops the new inode here; on success it was
   * passed to d_instantiate() above. */
  292. if ((status < 0) && inode)
  293. iput(inode);
  294. if (inode_ac)
  295. ocfs2_free_alloc_context(inode_ac);
  296. if (data_ac)
  297. ocfs2_free_alloc_context(data_ac);
  298. mlog_exit(status);
  299. return status;
  300. }
  301. static int ocfs2_mknod_locked(struct ocfs2_super *osb,
  302. struct inode *dir,
  303. struct dentry *dentry, int mode,
  304. dev_t dev,
  305. struct buffer_head **new_fe_bh,
  306. struct buffer_head *parent_fe_bh,
  307. handle_t *handle,
  308. struct inode **ret_inode,
  309. struct ocfs2_alloc_context *inode_ac)
  310. {
  311. int status = 0;
  312. struct ocfs2_dinode *fe = NULL;
  313. struct ocfs2_extent_list *fel;
  314. u64 fe_blkno = 0;
  315. u16 suballoc_bit;
  316. struct inode *inode = NULL;
  317. mlog_entry("(0x%p, 0x%p, %d, %lu, '%.*s')\n", dir, dentry, mode,
  318. (unsigned long)dev, dentry->d_name.len,
  319. dentry->d_name.name);
  320. *new_fe_bh = NULL;
  321. *ret_inode = NULL;
  322. status = ocfs2_claim_new_inode(osb, handle, inode_ac, &suballoc_bit,
  323. &fe_blkno);
  324. if (status < 0) {
  325. mlog_errno(status);
  326. goto leave;
  327. }
  328. inode = new_inode(dir->i_sb);
  329. if (IS_ERR(inode)) {
  330. status = PTR_ERR(inode);
  331. mlog(ML_ERROR, "new_inode failed!\n");
  332. goto leave;
  333. }
  334. /* populate as many fields early on as possible - many of
  335. * these are used by the support functions here and in
  336. * callers. */
  337. inode->i_ino = ino_from_blkno(osb->sb, fe_blkno);
  338. OCFS2_I(inode)->ip_blkno = fe_blkno;
  339. if (S_ISDIR(mode))
  340. inode->i_nlink = 2;
  341. else
  342. inode->i_nlink = 1;
  343. inode->i_mode = mode;
  344. spin_lock(&osb->osb_lock);
  345. inode->i_generation = osb->s_next_generation++;
  346. spin_unlock(&osb->osb_lock);
  347. *new_fe_bh = sb_getblk(osb->sb, fe_blkno);
  348. if (!*new_fe_bh) {
  349. status = -EIO;
  350. mlog_errno(status);
  351. goto leave;
  352. }
  353. ocfs2_set_new_buffer_uptodate(inode, *new_fe_bh);
  354. status = ocfs2_journal_access(handle, inode, *new_fe_bh,
  355. OCFS2_JOURNAL_ACCESS_CREATE);
  356. if (status < 0) {
  357. mlog_errno(status);
  358. goto leave;
  359. }
  360. fe = (struct ocfs2_dinode *) (*new_fe_bh)->b_data;
  361. memset(fe, 0, osb->sb->s_blocksize);
  362. fe->i_generation = cpu_to_le32(inode->i_generation);
  363. fe->i_fs_generation = cpu_to_le32(osb->fs_generation);
  364. fe->i_blkno = cpu_to_le64(fe_blkno);
  365. fe->i_suballoc_bit = cpu_to_le16(suballoc_bit);
  366. fe->i_suballoc_slot = cpu_to_le16(osb->slot_num);
  367. fe->i_uid = cpu_to_le32(current->fsuid);
  368. if (dir->i_mode & S_ISGID) {
  369. fe->i_gid = cpu_to_le32(dir->i_gid);
  370. if (S_ISDIR(mode))
  371. mode |= S_ISGID;
  372. } else
  373. fe->i_gid = cpu_to_le32(current->fsgid);
  374. fe->i_mode = cpu_to_le16(mode);
  375. if (S_ISCHR(mode) || S_ISBLK(mode))
  376. fe->id1.dev1.i_rdev = cpu_to_le64(huge_encode_dev(dev));
  377. fe->i_links_count = cpu_to_le16(inode->i_nlink);
  378. fe->i_last_eb_blk = 0;
  379. strcpy(fe->i_signature, OCFS2_INODE_SIGNATURE);
  380. le32_add_cpu(&fe->i_flags, OCFS2_VALID_FL);
  381. fe->i_atime = fe->i_ctime = fe->i_mtime =
  382. cpu_to_le64(CURRENT_TIME.tv_sec);
  383. fe->i_mtime_nsec = fe->i_ctime_nsec = fe->i_atime_nsec =
  384. cpu_to_le32(CURRENT_TIME.tv_nsec);
  385. fe->i_dtime = 0;
  386. /*
  387. * If supported, directories start with inline data.
  388. */
  389. if (S_ISDIR(mode) && ocfs2_supports_inline_data(osb)) {
  390. u16 feat = le16_to_cpu(fe->i_dyn_features);
  391. fe->i_dyn_features = cpu_to_le16(feat | OCFS2_INLINE_DATA_FL);
  392. fe->id2.i_data.id_count = cpu_to_le16(ocfs2_max_inline_data(osb->sb));
  393. } else {
  394. fel = &fe->id2.i_list;
  395. fel->l_tree_depth = 0;
  396. fel->l_next_free_rec = 0;
  397. fel->l_count = cpu_to_le16(ocfs2_extent_recs_per_inode(osb->sb));
  398. }
  399. status = ocfs2_journal_dirty(handle, *new_fe_bh);
  400. if (status < 0) {
  401. mlog_errno(status);
  402. goto leave;
  403. }
  404. if (ocfs2_populate_inode(inode, fe, 1) < 0) {
  405. mlog(ML_ERROR, "populate inode failed! bh->b_blocknr=%llu, "
  406. "i_blkno=%llu, i_ino=%lu\n",
  407. (unsigned long long)(*new_fe_bh)->b_blocknr,
  408. (unsigned long long)le64_to_cpu(fe->i_blkno),
  409. inode->i_ino);
  410. BUG();
  411. }
  412. ocfs2_inode_set_new(osb, inode);
  413. if (!ocfs2_mount_local(osb)) {
  414. status = ocfs2_create_new_inode_locks(inode);
  415. if (status < 0)
  416. mlog_errno(status);
  417. }
  418. status = 0; /* error in ocfs2_create_new_inode_locks is not
  419. * critical */
  420. *ret_inode = inode;
  421. leave:
  422. if (status < 0) {
  423. if (*new_fe_bh) {
  424. brelse(*new_fe_bh);
  425. *new_fe_bh = NULL;
  426. }
  427. if (inode)
  428. iput(inode);
  429. }
  430. mlog_exit(status);
  431. return status;
  432. }
  433. static int ocfs2_mkdir(struct inode *dir,
  434. struct dentry *dentry,
  435. int mode)
  436. {
  437. int ret;
  438. mlog_entry("(0x%p, 0x%p, %d, '%.*s')\n", dir, dentry, mode,
  439. dentry->d_name.len, dentry->d_name.name);
  440. ret = ocfs2_mknod(dir, dentry, mode | S_IFDIR, 0);
  441. mlog_exit(ret);
  442. return ret;
  443. }
  444. static int ocfs2_create(struct inode *dir,
  445. struct dentry *dentry,
  446. int mode,
  447. struct nameidata *nd)
  448. {
  449. int ret;
  450. mlog_entry("(0x%p, 0x%p, %d, '%.*s')\n", dir, dentry, mode,
  451. dentry->d_name.len, dentry->d_name.name);
  452. ret = ocfs2_mknod(dir, dentry, mode | S_IFREG, 0);
  453. mlog_exit(ret);
  454. return ret;
  455. }
  /*
   * ocfs2_link() - add a hard link @dentry in @dir to the inode behind
   * @old_dentry.
   *
   * Directories cannot be linked (-EPERM).  The metadata lock is taken on
   * @dir first and on the inode second; the inode's link count and ctime
   * are updated in memory and on disk inside one transaction, then the
   * new directory entry is added and the dentry is instantiated.
   *
   * Returns 0 on success or a negative errno: -ENOENT when @dir has no
   * links left, -EMLINK when the inode already has OCFS2_LINK_MAX links,
   * otherwise the error of the failing helper.
   */
  456. static int ocfs2_link(struct dentry *old_dentry,
  457. struct inode *dir,
  458. struct dentry *dentry)
  459. {
  460. handle_t *handle;
  461. struct inode *inode = old_dentry->d_inode;
  462. int err;
  463. struct buffer_head *fe_bh = NULL;
  464. struct buffer_head *parent_fe_bh = NULL;
  465. struct buffer_head *de_bh = NULL;
  466. struct ocfs2_dinode *fe = NULL;
  467. struct ocfs2_super *osb = OCFS2_SB(dir->i_sb);
  468. mlog_entry("(inode=%lu, old='%.*s' new='%.*s')\n", inode->i_ino,
  469. old_dentry->d_name.len, old_dentry->d_name.name,
  470. dentry->d_name.len, dentry->d_name.name);
  /* NOTE(review): the two early returns below have no matching
   * mlog_exit() for the mlog_entry() above. */
  471. if (S_ISDIR(inode->i_mode))
  472. return -EPERM;
  473. err = ocfs2_meta_lock(dir, &parent_fe_bh, 1);
  474. if (err < 0) {
  475. if (err != -ENOENT)
  476. mlog_errno(err);
  477. return err;
  478. }
  479. if (!dir->i_nlink) {
  480. err = -ENOENT;
  481. goto out;
  482. }
  483. err = ocfs2_check_dir_for_entry(dir, dentry->d_name.name,
  484. dentry->d_name.len);
  485. if (err)
  486. goto out;
  487. err = ocfs2_prepare_dir_for_insert(osb, dir, parent_fe_bh,
  488. dentry->d_name.name,
  489. dentry->d_name.len, &de_bh);
  490. if (err < 0) {
  491. mlog_errno(err);
  492. goto out;
  493. }
  494. err = ocfs2_meta_lock(inode, &fe_bh, 1);
  495. if (err < 0) {
  496. if (err != -ENOENT)
  497. mlog_errno(err);
  498. goto out;
  499. }
  500. fe = (struct ocfs2_dinode *) fe_bh->b_data;
  501. if (le16_to_cpu(fe->i_links_count) >= OCFS2_LINK_MAX) {
  502. err = -EMLINK;
  503. goto out_unlock_inode;
  504. }
  505. handle = ocfs2_start_trans(osb, OCFS2_LINK_CREDITS);
  506. if (IS_ERR(handle)) {
  507. err = PTR_ERR(handle);
  508. handle = NULL;
  509. mlog_errno(err);
  /* Skips out_commit, so the failed handle is never committed. */
  510. goto out_unlock_inode;
  511. }
  512. err = ocfs2_journal_access(handle, inode, fe_bh,
  513. OCFS2_JOURNAL_ACCESS_WRITE);
  514. if (err < 0) {
  515. mlog_errno(err);
  516. goto out_commit;
  517. }
  /* Bump the in-memory link count first, then mirror it to disk. */
  518. inc_nlink(inode);
  519. inode->i_ctime = CURRENT_TIME;
  520. fe->i_links_count = cpu_to_le16(inode->i_nlink);
  521. fe->i_ctime = cpu_to_le64(inode->i_ctime.tv_sec);
  522. fe->i_ctime_nsec = cpu_to_le32(inode->i_ctime.tv_nsec);
  523. err = ocfs2_journal_dirty(handle, fe_bh);
  524. if (err < 0) {
  /* Undo the link count bump in both copies. */
  525. le16_add_cpu(&fe->i_links_count, -1);
  526. drop_nlink(inode);
  527. mlog_errno(err);
  528. goto out_commit;
  529. }
  530. err = ocfs2_add_entry(handle, dentry, inode,
  531. OCFS2_I(inode)->ip_blkno,
  532. parent_fe_bh, de_bh);
  533. if (err) {
  /* Undo the link count bump in both copies. */
  534. le16_add_cpu(&fe->i_links_count, -1);
  535. drop_nlink(inode);
  536. mlog_errno(err);
  537. goto out_commit;
  538. }
  539. err = ocfs2_dentry_attach_lock(dentry, inode, OCFS2_I(dir)->ip_blkno);
  /* NOTE(review): unlike the two failure paths above, this one does
   * not roll the link count back, and the directory entry has
   * already been added -- confirm this is intended. */
  540. if (err) {
  541. mlog_errno(err);
  542. goto out_commit;
  543. }
  /* Presumably the extra inode reference that the new dentry will own. */
  544. atomic_inc(&inode->i_count);
  545. dentry->d_op = &ocfs2_dentry_ops;
  546. d_instantiate(dentry, inode);
  547. out_commit:
  548. ocfs2_commit_trans(osb, handle);
  549. out_unlock_inode:
  550. ocfs2_meta_unlock(inode, 1);
  551. out:
  552. ocfs2_meta_unlock(dir, 1);
  553. if (de_bh)
  554. brelse(de_bh);
  555. if (fe_bh)
  556. brelse(fe_bh);
  557. if (parent_fe_bh)
  558. brelse(parent_fe_bh);
  559. mlog_exit(err);
  560. return err;
  561. }
  /*
   * Acquire the dentry lock on @dentry exclusively and release it again
   * straight away; doing so forces other nodes to drop the dentry.
   *
   * Returns 0 on success.  If the lock cannot be taken the error is
   * logged and returned, and no unlock is attempted.
   */
  static int ocfs2_remote_dentry_delete(struct dentry *dentry)
  {
  	int status = ocfs2_dentry_lock(dentry, 1);

  	if (status) {
  		mlog_errno(status);
  		return status;
  	}

  	ocfs2_dentry_unlock(dentry, 1);
  	return status;
  }
  576. static inline int inode_is_unlinkable(struct inode *inode)
  577. {
  578. if (S_ISDIR(inode->i_mode)) {
  579. if (inode->i_nlink == 2)
  580. return 1;
  581. return 0;
  582. }
  583. if (inode->i_nlink == 1)
  584. return 1;
  585. return 0;
  586. }
  /*
   * ocfs2_unlink() - remove the directory entry @dentry from @dir.
   *
   * Lock order: metadata lock on @dir, then on the victim inode, then (if
   * the inode is on its last link, see inode_is_unlinkable()) the orphan
   * directory prepared by ocfs2_prepare_orphan_dir().  Inside a single
   * transaction the inode is added to the orphan directory when
   * applicable, the name is deleted from @dir and the link counts are
   * updated.
   *
   * Returns 0 on success or a negative errno: -EPERM for the root inode,
   * -ENOENT when the on-disk entry does not point at this inode,
   * -ENOTEMPTY for a directory that is not empty or whose link count is
   * not 2, otherwise the error of the failing helper.
   */
  587. static int ocfs2_unlink(struct inode *dir,
  588. struct dentry *dentry)
  589. {
  590. int status;
  591. int child_locked = 0;
  592. struct inode *inode = dentry->d_inode;
  593. struct inode *orphan_dir = NULL;
  594. struct ocfs2_super *osb = OCFS2_SB(dir->i_sb);
  595. u64 blkno;
  596. struct ocfs2_dinode *fe = NULL;
  597. struct buffer_head *fe_bh = NULL;
  598. struct buffer_head *parent_node_bh = NULL;
  599. handle_t *handle = NULL;
  600. struct ocfs2_dir_entry *dirent = NULL;
  601. struct buffer_head *dirent_bh = NULL;
  602. char orphan_name[OCFS2_ORPHAN_NAMELEN + 1];
  603. struct buffer_head *orphan_entry_bh = NULL;
  604. mlog_entry("(0x%p, 0x%p, '%.*s')\n", dir, dentry,
  605. dentry->d_name.len, dentry->d_name.name);
  606. BUG_ON(dentry->d_parent->d_inode != dir);
  607. mlog(0, "ino = %llu\n", (unsigned long long)OCFS2_I(inode)->ip_blkno);
  /* NOTE(review): the two early returns below have no matching
   * mlog_exit() for the mlog_entry() above. */
  608. if (inode == osb->root_inode) {
  609. mlog(0, "Cannot delete the root directory\n");
  610. return -EPERM;
  611. }
  612. status = ocfs2_meta_lock(dir, &parent_node_bh, 1);
  613. if (status < 0) {
  614. if (status != -ENOENT)
  615. mlog_errno(status);
  616. return status;
  617. }
  618. status = ocfs2_find_files_on_disk(dentry->d_name.name,
  619. dentry->d_name.len, &blkno,
  620. dir, &dirent_bh, &dirent);
  621. if (status < 0) {
  622. if (status != -ENOENT)
  623. mlog_errno(status);
  624. goto leave;
  625. }
  /* The entry found on disk must still refer to the inode the
   * dentry points at. */
  626. if (OCFS2_I(inode)->ip_blkno != blkno) {
  627. status = -ENOENT;
  628. mlog(0, "ip_blkno %llu != dirent blkno %llu ip_flags = %x\n",
  629. (unsigned long long)OCFS2_I(inode)->ip_blkno,
  630. (unsigned long long)blkno, OCFS2_I(inode)->ip_flags);
  631. goto leave;
  632. }
  633. status = ocfs2_meta_lock(inode, &fe_bh, 1);
  634. if (status < 0) {
  635. if (status != -ENOENT)
  636. mlog_errno(status);
  637. goto leave;
  638. }
  /* Tells "leave" that the inode lock has to be dropped. */
  639. child_locked = 1;
  640. if (S_ISDIR(inode->i_mode)) {
  641. if (!ocfs2_empty_dir(inode)) {
  642. status = -ENOTEMPTY;
  643. goto leave;
  644. } else if (inode->i_nlink != 2) {
  645. status = -ENOTEMPTY;
  646. goto leave;
  647. }
  648. }
  649. status = ocfs2_remote_dentry_delete(dentry);
  650. if (status < 0) {
  651. /* This vote should succeed under all normal
  652. * circumstances. */
  653. mlog_errno(status);
  654. goto leave;
  655. }
  /* Last link: get the orphan directory ready before the
   * transaction is started. */
  656. if (inode_is_unlinkable(inode)) {
  657. status = ocfs2_prepare_orphan_dir(osb, &orphan_dir, inode,
  658. orphan_name,
  659. &orphan_entry_bh);
  660. if (status < 0) {
  661. mlog_errno(status);
  662. goto leave;
  663. }
  664. }
  665. handle = ocfs2_start_trans(osb, OCFS2_UNLINK_CREDITS);
  666. if (IS_ERR(handle)) {
  667. status = PTR_ERR(handle);
  668. handle = NULL;
  669. mlog_errno(status);
  670. goto leave;
  671. }
  672. status = ocfs2_journal_access(handle, inode, fe_bh,
  673. OCFS2_JOURNAL_ACCESS_WRITE);
  674. if (status < 0) {
  675. mlog_errno(status);
  676. goto leave;
  677. }
  678. fe = (struct ocfs2_dinode *) fe_bh->b_data;
  679. if (inode_is_unlinkable(inode)) {
  680. status = ocfs2_orphan_add(osb, handle, inode, fe, orphan_name,
  681. orphan_entry_bh, orphan_dir);
  682. if (status < 0) {
  683. mlog_errno(status);
  684. goto leave;
  685. }
  686. }
  687. /* delete the name from the parent dir */
  688. status = ocfs2_delete_entry(handle, dir, dirent, dirent_bh);
  689. if (status < 0) {
  690. mlog_errno(status);
  691. goto leave;
  692. }
  /* A directory reaching this point has i_nlink == 2 (checked above),
   * so the two drops take it to 0; other inodes lose one link. */
  693. if (S_ISDIR(inode->i_mode))
  694. drop_nlink(inode);
  695. drop_nlink(inode);
  696. fe->i_links_count = cpu_to_le16(inode->i_nlink);
  697. status = ocfs2_journal_dirty(handle, fe_bh);
  698. if (status < 0) {
  699. mlog_errno(status);
  700. goto leave;
  701. }
  702. dir->i_ctime = dir->i_mtime = CURRENT_TIME;
  /* Removing a subdirectory takes one link away from the parent. */
  703. if (S_ISDIR(inode->i_mode))
  704. drop_nlink(dir);
  705. status = ocfs2_mark_inode_dirty(handle, dir, parent_node_bh);
  706. if (status < 0) {
  707. mlog_errno(status);
  /* Restore the parent's in-memory link count on failure. */
  708. if (S_ISDIR(inode->i_mode))
  709. inc_nlink(dir);
  710. }
  711. leave:
  712. if (handle)
  713. ocfs2_commit_trans(osb, handle);
  714. if (child_locked)
  715. ocfs2_meta_unlock(inode, 1);
  716. ocfs2_meta_unlock(dir, 1);
  717. if (orphan_dir) {
  718. /* This was locked for us in ocfs2_prepare_orphan_dir() */
  719. ocfs2_meta_unlock(orphan_dir, 1);
  720. mutex_unlock(&orphan_dir->i_mutex);
  721. iput(orphan_dir);
  722. }
  723. if (fe_bh)
  724. brelse(fe_bh);
  725. if (dirent_bh)
  726. brelse(dirent_bh);
  727. if (parent_node_bh)
  728. brelse(parent_node_bh);
  729. if (orphan_entry_bh)
  730. brelse(orphan_entry_bh);
  731. mlog_exit(status);
  732. return status;
  733. }
  734. /*
  735. * The only place this should be used is rename!
  736. * if they have the same id, then the 1st one is the only one locked.
  *
  * Takes the metadata lock (last argument 1) on both inodes, the one
  * with the lower ip_blkno first.  *bh1 and *bh2 are set to NULL on
  * entry if they were non-NULL (nothing is released here) and are then
  * passed to ocfs2_meta_lock() for the matching inode.
  *
  * Returns 0 on success or the negative error from ocfs2_meta_lock().
  * If the second lock fails, the first lock is dropped again before
  * returning.
  737. */
  738. static int ocfs2_double_lock(struct ocfs2_super *osb,
  739. struct buffer_head **bh1,
  740. struct inode *inode1,
  741. struct buffer_head **bh2,
  742. struct inode *inode2)
  743. {
  744. int status;
  745. struct ocfs2_inode_info *oi1 = OCFS2_I(inode1);
  746. struct ocfs2_inode_info *oi2 = OCFS2_I(inode2);
  747. struct buffer_head **tmpbh;
  748. struct inode *tmpinode;
  749. mlog_entry("(inode1 = %llu, inode2 = %llu)\n",
  750. (unsigned long long)oi1->ip_blkno,
  751. (unsigned long long)oi2->ip_blkno);
  752. if (*bh1)
  753. *bh1 = NULL;
  754. if (*bh2)
  755. *bh2 = NULL;
  756. /* we always want to lock the one with the lower lockid first. */
  757. if (oi1->ip_blkno != oi2->ip_blkno) {
  758. if (oi1->ip_blkno < oi2->ip_blkno) {
  759. /* switch id1 and id2 around */
  /* After the swap inode2/bh2 name the lower block number, which is
   * the one locked first below.  oi1 and oi2 are NOT swapped and
   * keep referring to the caller's original inodes. */
  760. mlog(0, "switching them around...\n");
  761. tmpbh = bh2;
  762. bh2 = bh1;
  763. bh1 = tmpbh;
  764. tmpinode = inode2;
  765. inode2 = inode1;
  766. inode1 = tmpinode;
  767. }
  768. /* lock id2 */
  769. status = ocfs2_meta_lock(inode2, bh2, 1);
  770. if (status < 0) {
  771. if (status != -ENOENT)
  772. mlog_errno(status);
  773. goto bail;
  774. }
  775. }
  776. /* lock id1 */
  777. status = ocfs2_meta_lock(inode1, bh1, 1);
  778. if (status < 0) {
  779. /*
  780. * An error return must mean that no cluster locks
  781. * were held on function exit.
  782. */
  /* NOTE(review): only the lock is dropped here; the buffer head that
   * the first ocfs2_meta_lock() stored in *bh2 is not released in
   * this function -- presumably the caller does that. */
  783. if (oi1->ip_blkno != oi2->ip_blkno)
  784. ocfs2_meta_unlock(inode2, 1);
  785. if (status != -ENOENT)
  786. mlog_errno(status);
  787. }
  788. bail:
  789. mlog_exit(status);
  790. return status;
  791. }
  792. static void ocfs2_double_unlock(struct inode *inode1, struct inode *inode2)
  793. {
  794. ocfs2_meta_unlock(inode1, 1);
  795. if (inode1 != inode2)
  796. ocfs2_meta_unlock(inode2, 1);
  797. }
  798. static int ocfs2_rename(struct inode *old_dir,
  799. struct dentry *old_dentry,
  800. struct inode *new_dir,
  801. struct dentry *new_dentry)
  802. {
  803. int status = 0, rename_lock = 0, parents_locked = 0;
  804. int old_child_locked = 0, new_child_locked = 0;
  805. struct inode *old_inode = old_dentry->d_inode;
  806. struct inode *new_inode = new_dentry->d_inode;
  807. struct inode *orphan_dir = NULL;
  808. struct ocfs2_dinode *newfe = NULL;
  809. char orphan_name[OCFS2_ORPHAN_NAMELEN + 1];
  810. struct buffer_head *orphan_entry_bh = NULL;
  811. struct buffer_head *newfe_bh = NULL;
  812. struct buffer_head *old_inode_bh = NULL;
  813. struct buffer_head *insert_entry_bh = NULL;
  814. struct ocfs2_super *osb = NULL;
  815. u64 newfe_blkno, old_de_ino;
  816. handle_t *handle = NULL;
  817. struct buffer_head *old_dir_bh = NULL;
  818. struct buffer_head *new_dir_bh = NULL;
  819. struct ocfs2_dir_entry *old_inode_dot_dot_de = NULL, *old_de = NULL,
  820. *new_de = NULL;
  821. struct buffer_head *new_de_bh = NULL, *old_de_bh = NULL; // bhs for above
  822. struct buffer_head *old_inode_de_bh = NULL; // if old_dentry is a dir,
  823. // this is the 1st dirent bh
  824. nlink_t old_dir_nlink = old_dir->i_nlink;
  825. struct ocfs2_dinode *old_di;
  826. /* At some point it might be nice to break this function up a
  827. * bit. */
  828. mlog_entry("(0x%p, 0x%p, 0x%p, 0x%p, from='%.*s' to='%.*s')\n",
  829. old_dir, old_dentry, new_dir, new_dentry,
  830. old_dentry->d_name.len, old_dentry->d_name.name,
  831. new_dentry->d_name.len, new_dentry->d_name.name);
  832. osb = OCFS2_SB(old_dir->i_sb);
  833. if (new_inode) {
  834. if (!igrab(new_inode))
  835. BUG();
  836. }
  837. /* Assume a directory hierarchy thusly:
  838. * a/b/c
  839. * a/d
  840. * a,b,c, and d are all directories.
  841. *
  842. * from cwd of 'a' on both nodes:
  843. * node1: mv b/c d
  844. * node2: mv d b/c
  845. *
  846. * And that's why, just like the VFS, we need a file system
  847. * rename lock. */
  848. if (old_dentry != new_dentry) {
  849. status = ocfs2_rename_lock(osb);
  850. if (status < 0) {
  851. mlog_errno(status);
  852. goto bail;
  853. }
  854. rename_lock = 1;
  855. }
  856. /* if old and new are the same, this'll just do one lock. */
  857. status = ocfs2_double_lock(osb, &old_dir_bh, old_dir,
  858. &new_dir_bh, new_dir);
  859. if (status < 0) {
  860. mlog_errno(status);
  861. goto bail;
  862. }
  863. parents_locked = 1;
  864. /* make sure both dirs have bhs
  865. * get an extra ref on old_dir_bh if old==new */
  866. if (!new_dir_bh) {
  867. if (old_dir_bh) {
  868. new_dir_bh = old_dir_bh;
  869. get_bh(new_dir_bh);
  870. } else {
  871. mlog(ML_ERROR, "no old_dir_bh!\n");
  872. status = -EIO;
  873. goto bail;
  874. }
  875. }
  876. /*
  877. * Aside from allowing a meta data update, the locking here
  878. * also ensures that the vote thread on other nodes won't have
  879. * to concurrently downconvert the inode and the dentry locks.
  880. */
  881. status = ocfs2_meta_lock(old_inode, &old_inode_bh, 1);
  882. if (status < 0) {
  883. if (status != -ENOENT)
  884. mlog_errno(status);
  885. goto bail;
  886. }
  887. old_child_locked = 1;
  888. status = ocfs2_remote_dentry_delete(old_dentry);
  889. if (status < 0) {
  890. mlog_errno(status);
  891. goto bail;
  892. }
  893. if (S_ISDIR(old_inode->i_mode)) {
  894. u64 old_inode_parent;
  895. status = ocfs2_find_files_on_disk("..", 2, &old_inode_parent,
  896. old_inode, &old_inode_de_bh,
  897. &old_inode_dot_dot_de);
  898. if (status) {
  899. status = -EIO;
  900. goto bail;
  901. }
  902. if (old_inode_parent != OCFS2_I(old_dir)->ip_blkno) {
  903. status = -EIO;
  904. goto bail;
  905. }
  906. if (!new_inode && new_dir != old_dir &&
  907. new_dir->i_nlink >= OCFS2_LINK_MAX) {
  908. status = -EMLINK;
  909. goto bail;
  910. }
  911. }
  912. status = ocfs2_lookup_ino_from_name(old_dir, old_dentry->d_name.name,
  913. old_dentry->d_name.len,
  914. &old_de_ino);
  915. if (status) {
  916. status = -ENOENT;
  917. goto bail;
  918. }
  919. /*
  920. * Check for inode number is _not_ due to possible IO errors.
  921. * We might rmdir the source, keep it as pwd of some process
  922. * and merrily kill the link to whatever was created under the
  923. * same name. Goodbye sticky bit ;-<
  924. */
  925. if (old_de_ino != OCFS2_I(old_inode)->ip_blkno) {
  926. status = -ENOENT;
  927. goto bail;
  928. }
  929. /* check if the target already exists (in which case we need
  930. * to delete it */
  931. status = ocfs2_find_files_on_disk(new_dentry->d_name.name,
  932. new_dentry->d_name.len,
  933. &newfe_blkno, new_dir, &new_de_bh,
  934. &new_de);
  935. /* The only error we allow here is -ENOENT because the new
  936. * file not existing is perfectly valid. */
  937. if ((status < 0) && (status != -ENOENT)) {
  938. /* If we cannot find the file specified we should just */
  939. /* return the error... */
  940. mlog_errno(status);
  941. goto bail;
  942. }
  943. if (!new_de && new_inode)
  944. mlog(ML_ERROR, "inode %lu does not exist in it's parent "
  945. "directory!", new_inode->i_ino);
  946. /* In case we need to overwrite an existing file, we blow it
  947. * away first */
  948. if (new_de) {
  949. /* VFS didn't think there existed an inode here, but
  950. * someone else in the cluster must have raced our
  951. * rename to create one. Today we error cleanly, in
  952. * the future we should consider calling iget to build
  953. * a new struct inode for this entry. */
  954. if (!new_inode) {
  955. status = -EACCES;
  956. mlog(0, "We found an inode for name %.*s but VFS "
  957. "didn't give us one.\n", new_dentry->d_name.len,
  958. new_dentry->d_name.name);
  959. goto bail;
  960. }
  961. if (OCFS2_I(new_inode)->ip_blkno != newfe_blkno) {
  962. status = -EACCES;
  963. mlog(0, "Inode %llu and dir %llu disagree. flags = %x\n",
  964. (unsigned long long)OCFS2_I(new_inode)->ip_blkno,
  965. (unsigned long long)newfe_blkno,
  966. OCFS2_I(new_inode)->ip_flags);
  967. goto bail;
  968. }
  969. status = ocfs2_meta_lock(new_inode, &newfe_bh, 1);
  970. if (status < 0) {
  971. if (status != -ENOENT)
  972. mlog_errno(status);
  973. goto bail;
  974. }
  975. new_child_locked = 1;
  976. status = ocfs2_remote_dentry_delete(new_dentry);
  977. if (status < 0) {
  978. mlog_errno(status);
  979. goto bail;
  980. }
  981. newfe = (struct ocfs2_dinode *) newfe_bh->b_data;
  982. mlog(0, "aha rename over existing... new_de=%p new_blkno=%llu "
  983. "newfebh=%p bhblocknr=%llu\n", new_de,
  984. (unsigned long long)newfe_blkno, newfe_bh, newfe_bh ?
  985. (unsigned long long)newfe_bh->b_blocknr : 0ULL);
  986. if (S_ISDIR(new_inode->i_mode) || (new_inode->i_nlink == 1)) {
  987. status = ocfs2_prepare_orphan_dir(osb, &orphan_dir,
  988. new_inode,
  989. orphan_name,
  990. &orphan_entry_bh);
  991. if (status < 0) {
  992. mlog_errno(status);
  993. goto bail;
  994. }
  995. }
  996. } else {
  997. BUG_ON(new_dentry->d_parent->d_inode != new_dir);
  998. status = ocfs2_check_dir_for_entry(new_dir,
  999. new_dentry->d_name.name,
  1000. new_dentry->d_name.len);
  1001. if (status)
  1002. goto bail;
  1003. status = ocfs2_prepare_dir_for_insert(osb, new_dir, new_dir_bh,
  1004. new_dentry->d_name.name,
  1005. new_dentry->d_name.len,
  1006. &insert_entry_bh);
  1007. if (status < 0) {
  1008. mlog_errno(status);
  1009. goto bail;
  1010. }
  1011. }
  1012. handle = ocfs2_start_trans(osb, OCFS2_RENAME_CREDITS);
  1013. if (IS_ERR(handle)) {
  1014. status = PTR_ERR(handle);
  1015. handle = NULL;
  1016. mlog_errno(status);
  1017. goto bail;
  1018. }
  1019. if (new_de) {
  1020. if (S_ISDIR(new_inode->i_mode)) {
  1021. if (!ocfs2_empty_dir(new_inode) ||
  1022. new_inode->i_nlink != 2) {
  1023. status = -ENOTEMPTY;
  1024. goto bail;
  1025. }
  1026. }
  1027. status = ocfs2_journal_access(handle, new_inode, newfe_bh,
  1028. OCFS2_JOURNAL_ACCESS_WRITE);
  1029. if (status < 0) {
  1030. mlog_errno(status);
  1031. goto bail;
  1032. }
  1033. if (S_ISDIR(new_inode->i_mode) ||
  1034. (newfe->i_links_count == cpu_to_le16(1))){
  1035. status = ocfs2_orphan_add(osb, handle, new_inode,
  1036. newfe, orphan_name,
  1037. orphan_entry_bh, orphan_dir);
  1038. if (status < 0) {
  1039. mlog_errno(status);
  1040. goto bail;
  1041. }
  1042. }
  1043. /* change the dirent to point to the correct inode */
  1044. status = ocfs2_update_entry(new_dir, handle, new_de_bh,
  1045. new_de, old_inode);
  1046. if (status < 0) {
  1047. mlog_errno(status);
  1048. goto bail;
  1049. }
  1050. new_dir->i_version++;
  1051. if (S_ISDIR(new_inode->i_mode))
  1052. newfe->i_links_count = 0;
  1053. else
  1054. le16_add_cpu(&newfe->i_links_count, -1);
  1055. status = ocfs2_journal_dirty(handle, newfe_bh);
  1056. if (status < 0) {
  1057. mlog_errno(status);
  1058. goto bail;
  1059. }
  1060. } else {
  1061. /* if the name was not found in new_dir, add it now */
  1062. status = ocfs2_add_entry(handle, new_dentry, old_inode,
  1063. OCFS2_I(old_inode)->ip_blkno,
  1064. new_dir_bh, insert_entry_bh);
  1065. }
  1066. old_inode->i_ctime = CURRENT_TIME;
  1067. mark_inode_dirty(old_inode);
  1068. status = ocfs2_journal_access(handle, old_inode, old_inode_bh,
  1069. OCFS2_JOURNAL_ACCESS_WRITE);
  1070. if (status >= 0) {
  1071. old_di = (struct ocfs2_dinode *) old_inode_bh->b_data;
  1072. old_di->i_ctime = cpu_to_le64(old_inode->i_ctime.tv_sec);
  1073. old_di->i_ctime_nsec = cpu_to_le32(old_inode->i_ctime.tv_nsec);
  1074. status = ocfs2_journal_dirty(handle, old_inode_bh);
  1075. if (status < 0)
  1076. mlog_errno(status);
  1077. } else
  1078. mlog_errno(status);
  1079. /*
  1080. * Now that the name has been added to new_dir, remove the old name.
  1081. *
  1082. * We don't keep any directory entry context around until now
  1083. * because the insert might have changed the type of directory
  1084. * we're dealing with.
  1085. */
  1086. old_de_bh = ocfs2_find_entry(old_dentry->d_name.name,
  1087. old_dentry->d_name.len,
  1088. old_dir, &old_de);
  1089. if (!old_de_bh) {
  1090. status = -EIO;
  1091. goto bail;
  1092. }
  1093. status = ocfs2_delete_entry(handle, old_dir, old_de, old_de_bh);
  1094. if (status < 0) {
  1095. mlog_errno(status);
  1096. goto bail;
  1097. }
  1098. if (new_inode) {
  1099. new_inode->i_nlink--;
  1100. new_inode->i_ctime = CURRENT_TIME;
  1101. }
  1102. old_dir->i_ctime = old_dir->i_mtime = CURRENT_TIME;
  1103. if (old_inode_de_bh) {
  1104. status = ocfs2_update_entry(old_inode, handle, old_inode_de_bh,
  1105. old_inode_dot_dot_de, new_dir);
  1106. old_dir->i_nlink--;
  1107. if (new_inode) {
  1108. new_inode->i_nlink--;
  1109. } else {
  1110. inc_nlink(new_dir);
  1111. mark_inode_dirty(new_dir);
  1112. }
  1113. }
  1114. mark_inode_dirty(old_dir);
  1115. ocfs2_mark_inode_dirty(handle, old_dir, old_dir_bh);
  1116. if (new_inode) {
  1117. mark_inode_dirty(new_inode);
  1118. ocfs2_mark_inode_dirty(handle, new_inode, newfe_bh);
  1119. }
  1120. if (old_dir != new_dir) {
  1121. /* Keep the same times on both directories.*/
  1122. new_dir->i_ctime = new_dir->i_mtime = old_dir->i_ctime;
  1123. /*
  1124. * This will also pick up the i_nlink change from the
  1125. * block above.
  1126. */
  1127. ocfs2_mark_inode_dirty(handle, new_dir, new_dir_bh);
  1128. }
  1129. if (old_dir_nlink != old_dir->i_nlink) {
  1130. if (!old_dir_bh) {
  1131. mlog(ML_ERROR, "need to change nlink for old dir "
  1132. "%llu from %d to %d but bh is NULL!\n",
  1133. (unsigned long long)OCFS2_I(old_dir)->ip_blkno,
  1134. (int)old_dir_nlink, old_dir->i_nlink);
  1135. } else {
  1136. struct ocfs2_dinode *fe;
  1137. status = ocfs2_journal_access(handle, old_dir,
  1138. old_dir_bh,
  1139. OCFS2_JOURNAL_ACCESS_WRITE);
  1140. fe = (struct ocfs2_dinode *) old_dir_bh->b_data;
  1141. fe->i_links_count = cpu_to_le16(old_dir->i_nlink);
  1142. status = ocfs2_journal_dirty(handle, old_dir_bh);
  1143. }
  1144. }
  1145. ocfs2_dentry_move(old_dentry, new_dentry, old_dir, new_dir);
  1146. status = 0;
  1147. bail:
  1148. if (rename_lock)
  1149. ocfs2_rename_unlock(osb);
  1150. if (handle)
  1151. ocfs2_commit_trans(osb, handle);
  1152. if (parents_locked)
  1153. ocfs2_double_unlock(old_dir, new_dir);
  1154. if (old_child_locked)
  1155. ocfs2_meta_unlock(old_inode, 1);
  1156. if (new_child_locked)
  1157. ocfs2_meta_unlock(new_inode, 1);
  1158. if (orphan_dir) {
  1159. /* This was locked for us in ocfs2_prepare_orphan_dir() */
  1160. ocfs2_meta_unlock(orphan_dir, 1);
  1161. mutex_unlock(&orphan_dir->i_mutex);
  1162. iput(orphan_dir);
  1163. }
  1164. if (new_inode)
  1165. sync_mapping_buffers(old_inode->i_mapping);
  1166. if (new_inode)
  1167. iput(new_inode);
  1168. if (newfe_bh)
  1169. brelse(newfe_bh);
  1170. if (old_inode_bh)
  1171. brelse(old_inode_bh);
  1172. if (old_dir_bh)
  1173. brelse(old_dir_bh);
  1174. if (new_dir_bh)
  1175. brelse(new_dir_bh);
  1176. if (new_de_bh)
  1177. brelse(new_de_bh);
  1178. if (old_de_bh)
  1179. brelse(old_de_bh);
  1180. if (old_inode_de_bh)
  1181. brelse(old_inode_de_bh);
  1182. if (orphan_entry_bh)
  1183. brelse(orphan_entry_bh);
  1184. if (insert_entry_bh)
  1185. brelse(insert_entry_bh);
  1186. mlog_exit(status);
  1187. return status;
  1188. }
  1189. /*
  1190. * we expect i_size = strlen(symname). Copy symname into the file
  1191. * data, including the null terminator.
  1192. */
  1193. static int ocfs2_create_symlink_data(struct ocfs2_super *osb,
  1194. handle_t *handle,
  1195. struct inode *inode,
  1196. const char *symname)
  1197. {
  1198. struct buffer_head **bhs = NULL;
  1199. const char *c;
  1200. struct super_block *sb = osb->sb;
  1201. u64 p_blkno, p_blocks;
  1202. int virtual, blocks, status, i, bytes_left;
  1203. bytes_left = i_size_read(inode) + 1;
  1204. /* we can't trust i_blocks because we're actually going to
  1205. * write i_size + 1 bytes. */
  1206. blocks = (bytes_left + sb->s_blocksize - 1) >> sb->s_blocksize_bits;
  1207. mlog_entry("i_blocks = %llu, i_size = %llu, blocks = %d\n",
  1208. (unsigned long long)inode->i_blocks,
  1209. i_size_read(inode), blocks);
  1210. /* Sanity check -- make sure we're going to fit. */
  1211. if (bytes_left >
  1212. ocfs2_clusters_to_bytes(sb, OCFS2_I(inode)->ip_clusters)) {
  1213. status = -EIO;
  1214. mlog_errno(status);
  1215. goto bail;
  1216. }
  1217. bhs = kcalloc(blocks, sizeof(struct buffer_head *), GFP_KERNEL);
  1218. if (!bhs) {
  1219. status = -ENOMEM;
  1220. mlog_errno(status);
  1221. goto bail;
  1222. }
  1223. status = ocfs2_extent_map_get_blocks(inode, 0, &p_blkno, &p_blocks,
  1224. NULL);
  1225. if (status < 0) {
  1226. mlog_errno(status);
  1227. goto bail;
  1228. }
  1229. /* links can never be larger than one cluster so we know this
  1230. * is all going to be contiguous, but do a sanity check
  1231. * anyway. */
  1232. if ((p_blocks << sb->s_blocksize_bits) < bytes_left) {
  1233. status = -EIO;
  1234. mlog_errno(status);
  1235. goto bail;
  1236. }
  1237. virtual = 0;
  1238. while(bytes_left > 0) {
  1239. c = &symname[virtual * sb->s_blocksize];
  1240. bhs[virtual] = sb_getblk(sb, p_blkno);
  1241. if (!bhs[virtual]) {
  1242. status = -ENOMEM;
  1243. mlog_errno(status);
  1244. goto bail;
  1245. }
  1246. ocfs2_set_new_buffer_uptodate(inode, bhs[virtual]);
  1247. status = ocfs2_journal_access(handle, inode, bhs[virtual],
  1248. OCFS2_JOURNAL_ACCESS_CREATE);
  1249. if (status < 0) {
  1250. mlog_errno(status);
  1251. goto bail;
  1252. }
  1253. memset(bhs[virtual]->b_data, 0, sb->s_blocksize);
  1254. memcpy(bhs[virtual]->b_data, c,
  1255. (bytes_left > sb->s_blocksize) ? sb->s_blocksize :
  1256. bytes_left);
  1257. status = ocfs2_journal_dirty(handle, bhs[virtual]);
  1258. if (status < 0) {
  1259. mlog_errno(status);
  1260. goto bail;
  1261. }
  1262. virtual++;
  1263. p_blkno++;
  1264. bytes_left -= sb->s_blocksize;
  1265. }
  1266. status = 0;
  1267. bail:
  1268. if (bhs) {
  1269. for(i = 0; i < blocks; i++)
  1270. if (bhs[i])
  1271. brelse(bhs[i]);
  1272. kfree(bhs);
  1273. }
  1274. mlog_exit(status);
  1275. return status;
  1276. }
  1277. static int ocfs2_symlink(struct inode *dir,
  1278. struct dentry *dentry,
  1279. const char *symname)
  1280. {
  1281. int status, l, credits;
  1282. u64 newsize;
  1283. struct ocfs2_super *osb = NULL;
  1284. struct inode *inode = NULL;
  1285. struct super_block *sb;
  1286. struct buffer_head *new_fe_bh = NULL;
  1287. struct buffer_head *de_bh = NULL;
  1288. struct buffer_head *parent_fe_bh = NULL;
  1289. struct ocfs2_dinode *fe = NULL;
  1290. struct ocfs2_dinode *dirfe;
  1291. handle_t *handle = NULL;
  1292. struct ocfs2_alloc_context *inode_ac = NULL;
  1293. struct ocfs2_alloc_context *data_ac = NULL;
  1294. mlog_entry("(0x%p, 0x%p, symname='%s' actual='%.*s')\n", dir,
  1295. dentry, symname, dentry->d_name.len, dentry->d_name.name);
  1296. sb = dir->i_sb;
  1297. osb = OCFS2_SB(sb);
  1298. l = strlen(symname) + 1;
  1299. credits = ocfs2_calc_symlink_credits(sb);
  1300. /* lock the parent directory */
  1301. status = ocfs2_meta_lock(dir, &parent_fe_bh, 1);
  1302. if (status < 0) {
  1303. if (status != -ENOENT)
  1304. mlog_errno(status);
  1305. return status;
  1306. }
  1307. dirfe = (struct ocfs2_dinode *) parent_fe_bh->b_data;
  1308. if (!dirfe->i_links_count) {
  1309. /* can't make a file in a deleted directory. */
  1310. status = -ENOENT;
  1311. goto bail;
  1312. }
  1313. status = ocfs2_check_dir_for_entry(dir, dentry->d_name.name,
  1314. dentry->d_name.len);
  1315. if (status)
  1316. goto bail;
  1317. status = ocfs2_prepare_dir_for_insert(osb, dir, parent_fe_bh,
  1318. dentry->d_name.name,
  1319. dentry->d_name.len, &de_bh);
  1320. if (status < 0) {
  1321. mlog_errno(status);
  1322. goto bail;
  1323. }
  1324. status = ocfs2_reserve_new_inode(osb, &inode_ac);
  1325. if (status < 0) {
  1326. if (status != -ENOSPC)
  1327. mlog_errno(status);
  1328. goto bail;
  1329. }
  1330. /* don't reserve bitmap space for fast symlinks. */
  1331. if (l > ocfs2_fast_symlink_chars(sb)) {
  1332. status = ocfs2_reserve_clusters(osb, 1, &data_ac);
  1333. if (status < 0) {
  1334. if (status != -ENOSPC)
  1335. mlog_errno(status);
  1336. goto bail;
  1337. }
  1338. }
  1339. handle = ocfs2_start_trans(osb, credits);
  1340. if (IS_ERR(handle)) {
  1341. status = PTR_ERR(handle);
  1342. handle = NULL;
  1343. mlog_errno(status);
  1344. goto bail;
  1345. }
  1346. status = ocfs2_mknod_locked(osb, dir, dentry,
  1347. S_IFLNK | S_IRWXUGO, 0,
  1348. &new_fe_bh, parent_fe_bh, handle,
  1349. &inode, inode_ac);
  1350. if (status < 0) {
  1351. mlog_errno(status);
  1352. goto bail;
  1353. }
  1354. fe = (struct ocfs2_dinode *) new_fe_bh->b_data;
  1355. inode->i_rdev = 0;
  1356. newsize = l - 1;
  1357. if (l > ocfs2_fast_symlink_chars(sb)) {
  1358. u32 offset = 0;
  1359. inode->i_op = &ocfs2_symlink_inode_operations;
  1360. status = ocfs2_do_extend_allocation(osb, inode, &offset, 1, 0,
  1361. new_fe_bh,
  1362. handle, data_ac, NULL,
  1363. NULL);
  1364. if (status < 0) {
  1365. if (status != -ENOSPC && status != -EINTR) {
  1366. mlog(ML_ERROR,
  1367. "Failed to extend file to %llu\n",
  1368. (unsigned long long)newsize);
  1369. mlog_errno(status);
  1370. status = -ENOSPC;
  1371. }
  1372. goto bail;
  1373. }
  1374. i_size_write(inode, newsize);
  1375. inode->i_blocks = ocfs2_inode_sector_count(inode);
  1376. } else {
  1377. inode->i_op = &ocfs2_fast_symlink_inode_operations;
  1378. memcpy((char *) fe->id2.i_symlink, symname, l);
  1379. i_size_write(inode, newsize);
  1380. inode->i_blocks = 0;
  1381. }
  1382. status = ocfs2_mark_inode_dirty(handle, inode, new_fe_bh);
  1383. if (status < 0) {
  1384. mlog_errno(status);
  1385. goto bail;
  1386. }
  1387. if (!ocfs2_inode_is_fast_symlink(inode)) {
  1388. status = ocfs2_create_symlink_data(osb, handle, inode,
  1389. symname);
  1390. if (status < 0) {
  1391. mlog_errno(status);
  1392. goto bail;
  1393. }
  1394. }
  1395. status = ocfs2_add_entry(handle, dentry, inode,
  1396. le64_to_cpu(fe->i_blkno), parent_fe_bh,
  1397. de_bh);
  1398. if (status < 0) {
  1399. mlog_errno(status);
  1400. goto bail;
  1401. }
  1402. status = ocfs2_dentry_attach_lock(dentry, inode, OCFS2_I(dir)->ip_blkno);
  1403. if (status) {
  1404. mlog_errno(status);
  1405. goto bail;
  1406. }
  1407. insert_inode_hash(inode);
  1408. dentry->d_op = &ocfs2_dentry_ops;
  1409. d_instantiate(dentry, inode);
  1410. bail:
  1411. if (handle)
  1412. ocfs2_commit_trans(osb, handle);
  1413. ocfs2_meta_unlock(dir, 1);
  1414. if (new_fe_bh)
  1415. brelse(new_fe_bh);
  1416. if (parent_fe_bh)
  1417. brelse(parent_fe_bh);
  1418. if (de_bh)
  1419. brelse(de_bh);
  1420. if (inode_ac)
  1421. ocfs2_free_alloc_context(inode_ac);
  1422. if (data_ac)
  1423. ocfs2_free_alloc_context(data_ac);
  1424. if ((status < 0) && inode)
  1425. iput(inode);
  1426. mlog_exit(status);
  1427. return status;
  1428. }
  1429. static int ocfs2_blkno_stringify(u64 blkno, char *name)
  1430. {
  1431. int status, namelen;
  1432. mlog_entry_void();
  1433. namelen = snprintf(name, OCFS2_ORPHAN_NAMELEN + 1, "%016llx",
  1434. (long long)blkno);
  1435. if (namelen <= 0) {
  1436. if (namelen)
  1437. status = namelen;
  1438. else
  1439. status = -EINVAL;
  1440. mlog_errno(status);
  1441. goto bail;
  1442. }
  1443. if (namelen != OCFS2_ORPHAN_NAMELEN) {
  1444. status = -EINVAL;
  1445. mlog_errno(status);
  1446. goto bail;
  1447. }
  1448. mlog(0, "built filename '%s' for orphan dir (len=%d)\n", name,
  1449. namelen);
  1450. status = 0;
  1451. bail:
  1452. mlog_exit(status);
  1453. return status;
  1454. }
  1455. static int ocfs2_prepare_orphan_dir(struct ocfs2_super *osb,
  1456. struct inode **ret_orphan_dir,
  1457. struct inode *inode,
  1458. char *name,
  1459. struct buffer_head **de_bh)
  1460. {
  1461. struct inode *orphan_dir_inode;
  1462. struct buffer_head *orphan_dir_bh = NULL;
  1463. int status = 0;
  1464. status = ocfs2_blkno_stringify(OCFS2_I(inode)->ip_blkno, name);
  1465. if (status < 0) {
  1466. mlog_errno(status);
  1467. return status;
  1468. }
  1469. orphan_dir_inode = ocfs2_get_system_file_inode(osb,
  1470. ORPHAN_DIR_SYSTEM_INODE,
  1471. osb->slot_num);
  1472. if (!orphan_dir_inode) {
  1473. status = -ENOENT;
  1474. mlog_errno(status);
  1475. return status;
  1476. }
  1477. mutex_lock(&orphan_dir_inode->i_mutex);
  1478. status = ocfs2_meta_lock(orphan_dir_inode, &orphan_dir_bh, 1);
  1479. if (status < 0) {
  1480. mlog_errno(status);
  1481. goto leave;
  1482. }
  1483. status = ocfs2_prepare_dir_for_insert(osb, orphan_dir_inode,
  1484. orphan_dir_bh, name,
  1485. OCFS2_ORPHAN_NAMELEN, de_bh);
  1486. if (status < 0) {
  1487. ocfs2_meta_unlock(orphan_dir_inode, 1);
  1488. mlog_errno(status);
  1489. goto leave;
  1490. }
  1491. *ret_orphan_dir = orphan_dir_inode;
  1492. leave:
  1493. if (status) {
  1494. mutex_unlock(&orphan_dir_inode->i_mutex);
  1495. iput(orphan_dir_inode);
  1496. }
  1497. if (orphan_dir_bh)
  1498. brelse(orphan_dir_bh);
  1499. mlog_exit(status);
  1500. return status;
  1501. }
  1502. static int ocfs2_orphan_add(struct ocfs2_super *osb,
  1503. handle_t *handle,
  1504. struct inode *inode,
  1505. struct ocfs2_dinode *fe,
  1506. char *name,
  1507. struct buffer_head *de_bh,
  1508. struct inode *orphan_dir_inode)
  1509. {
  1510. struct buffer_head *orphan_dir_bh = NULL;
  1511. int status = 0;
  1512. struct ocfs2_dinode *orphan_fe;
  1513. mlog_entry("(inode->i_ino = %lu)\n", inode->i_ino);
  1514. status = ocfs2_read_block(osb,
  1515. OCFS2_I(orphan_dir_inode)->ip_blkno,
  1516. &orphan_dir_bh, OCFS2_BH_CACHED,
  1517. orphan_dir_inode);
  1518. if (status < 0) {
  1519. mlog_errno(status);
  1520. goto leave;
  1521. }
  1522. status = ocfs2_journal_access(handle, orphan_dir_inode, orphan_dir_bh,
  1523. OCFS2_JOURNAL_ACCESS_WRITE);
  1524. if (status < 0) {
  1525. mlog_errno(status);
  1526. goto leave;
  1527. }
  1528. /* we're a cluster, and nlink can change on disk from
  1529. * underneath us... */
  1530. orphan_fe = (struct ocfs2_dinode *) orphan_dir_bh->b_data;
  1531. if (S_ISDIR(inode->i_mode))
  1532. le16_add_cpu(&orphan_fe->i_links_count, 1);
  1533. orphan_dir_inode->i_nlink = le16_to_cpu(orphan_fe->i_links_count);
  1534. status = ocfs2_journal_dirty(handle, orphan_dir_bh);
  1535. if (status < 0) {
  1536. mlog_errno(status);
  1537. goto leave;
  1538. }
  1539. status = __ocfs2_add_entry(handle, orphan_dir_inode, name,
  1540. OCFS2_ORPHAN_NAMELEN, inode,
  1541. OCFS2_I(inode)->ip_blkno,
  1542. orphan_dir_bh, de_bh);
  1543. if (status < 0) {
  1544. mlog_errno(status);
  1545. goto leave;
  1546. }
  1547. le32_add_cpu(&fe->i_flags, OCFS2_ORPHANED_FL);
  1548. /* Record which orphan dir our inode now resides
  1549. * in. delete_inode will use this to determine which orphan
  1550. * dir to lock. */
  1551. fe->i_orphaned_slot = cpu_to_le16(osb->slot_num);
  1552. mlog(0, "Inode %llu orphaned in slot %d\n",
  1553. (unsigned long long)OCFS2_I(inode)->ip_blkno, osb->slot_num);
  1554. leave:
  1555. if (orphan_dir_bh)
  1556. brelse(orphan_dir_bh);
  1557. mlog_exit(status);
  1558. return status;
  1559. }
  1560. /* unlike orphan_add, we expect the orphan dir to already be locked here. */
  1561. int ocfs2_orphan_del(struct ocfs2_super *osb,
  1562. handle_t *handle,
  1563. struct inode *orphan_dir_inode,
  1564. struct inode *inode,
  1565. struct buffer_head *orphan_dir_bh)
  1566. {
  1567. char name[OCFS2_ORPHAN_NAMELEN + 1];
  1568. struct ocfs2_dinode *orphan_fe;
  1569. int status = 0;
  1570. struct buffer_head *target_de_bh = NULL;
  1571. struct ocfs2_dir_entry *target_de = NULL;
  1572. mlog_entry_void();
  1573. status = ocfs2_blkno_stringify(OCFS2_I(inode)->ip_blkno, name);
  1574. if (status < 0) {
  1575. mlog_errno(status);
  1576. goto leave;
  1577. }
  1578. mlog(0, "removing '%s' from orphan dir %llu (namelen=%d)\n",
  1579. name, (unsigned long long)OCFS2_I(orphan_dir_inode)->ip_blkno,
  1580. OCFS2_ORPHAN_NAMELEN);
  1581. /* find it's spot in the orphan directory */
  1582. target_de_bh = ocfs2_find_entry(name, OCFS2_ORPHAN_NAMELEN,
  1583. orphan_dir_inode, &target_de);
  1584. if (!target_de_bh) {
  1585. status = -ENOENT;
  1586. mlog_errno(status);
  1587. goto leave;
  1588. }
  1589. /* remove it from the orphan directory */
  1590. status = ocfs2_delete_entry(handle, orphan_dir_inode, target_de,
  1591. target_de_bh);
  1592. if (status < 0) {
  1593. mlog_errno(status);
  1594. goto leave;
  1595. }
  1596. status = ocfs2_journal_access(handle,orphan_dir_inode, orphan_dir_bh,
  1597. OCFS2_JOURNAL_ACCESS_WRITE);
  1598. if (status < 0) {
  1599. mlog_errno(status);
  1600. goto leave;
  1601. }
  1602. /* do the i_nlink dance! :) */
  1603. orphan_fe = (struct ocfs2_dinode *) orphan_dir_bh->b_data;
  1604. if (S_ISDIR(inode->i_mode))
  1605. le16_add_cpu(&orphan_fe->i_links_count, -1);
  1606. orphan_dir_inode->i_nlink = le16_to_cpu(orphan_fe->i_links_count);
  1607. status = ocfs2_journal_dirty(handle, orphan_dir_bh);
  1608. if (status < 0) {
  1609. mlog_errno(status);
  1610. goto leave;
  1611. }
  1612. leave:
  1613. if (target_de_bh)
  1614. brelse(target_de_bh);
  1615. mlog_exit(status);
  1616. return status;
  1617. }
  1618. const struct inode_operations ocfs2_dir_iops = {
  1619. .create = ocfs2_create,
  1620. .lookup = ocfs2_lookup,
  1621. .link = ocfs2_link,
  1622. .unlink = ocfs2_unlink,
  1623. .rmdir = ocfs2_unlink,
  1624. .symlink = ocfs2_symlink,
  1625. .mkdir = ocfs2_mkdir,
  1626. .mknod = ocfs2_mknod,
  1627. .rename = ocfs2_rename,
  1628. .setattr = ocfs2_setattr,
  1629. .getattr = ocfs2_getattr,
  1630. .permission = ocfs2_permission,
  1631. };