file.c 16 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657
  1. /*
  2. FUSE: Filesystem in Userspace
  3. Copyright (C) 2001-2006 Miklos Szeredi <miklos@szeredi.hu>
  4. This program can be distributed under the terms of the GNU GPL.
  5. See the file COPYING.
  6. */
  7. #include "fuse_i.h"
  8. #include <linux/pagemap.h>
  9. #include <linux/slab.h>
  10. #include <linux/kernel.h>
  11. static const struct file_operations fuse_direct_io_file_operations;
  12. static int fuse_send_open(struct inode *inode, struct file *file, int isdir,
  13. struct fuse_open_out *outargp)
  14. {
  15. struct fuse_conn *fc = get_fuse_conn(inode);
  16. struct fuse_open_in inarg;
  17. struct fuse_req *req;
  18. int err;
  19. req = fuse_get_req(fc);
  20. if (IS_ERR(req))
  21. return PTR_ERR(req);
  22. memset(&inarg, 0, sizeof(inarg));
  23. inarg.flags = file->f_flags & ~(O_CREAT | O_EXCL | O_NOCTTY | O_TRUNC);
  24. req->in.h.opcode = isdir ? FUSE_OPENDIR : FUSE_OPEN;
  25. req->in.h.nodeid = get_node_id(inode);
  26. req->inode = inode;
  27. req->in.numargs = 1;
  28. req->in.args[0].size = sizeof(inarg);
  29. req->in.args[0].value = &inarg;
  30. req->out.numargs = 1;
  31. req->out.args[0].size = sizeof(*outargp);
  32. req->out.args[0].value = outargp;
  33. request_send(fc, req);
  34. err = req->out.h.error;
  35. fuse_put_request(fc, req);
  36. return err;
  37. }
  38. struct fuse_file *fuse_file_alloc(void)
  39. {
  40. struct fuse_file *ff;
  41. ff = kmalloc(sizeof(struct fuse_file), GFP_KERNEL);
  42. if (ff) {
  43. ff->release_req = fuse_request_alloc();
  44. if (!ff->release_req) {
  45. kfree(ff);
  46. ff = NULL;
  47. }
  48. }
  49. return ff;
  50. }
  51. void fuse_file_free(struct fuse_file *ff)
  52. {
  53. fuse_request_free(ff->release_req);
  54. kfree(ff);
  55. }
  56. void fuse_finish_open(struct inode *inode, struct file *file,
  57. struct fuse_file *ff, struct fuse_open_out *outarg)
  58. {
  59. if (outarg->open_flags & FOPEN_DIRECT_IO)
  60. file->f_op = &fuse_direct_io_file_operations;
  61. if (!(outarg->open_flags & FOPEN_KEEP_CACHE))
  62. invalidate_inode_pages(inode->i_mapping);
  63. ff->fh = outarg->fh;
  64. file->private_data = ff;
  65. }
  66. int fuse_open_common(struct inode *inode, struct file *file, int isdir)
  67. {
  68. struct fuse_open_out outarg;
  69. struct fuse_file *ff;
  70. int err;
  71. /* VFS checks this, but only _after_ ->open() */
  72. if (file->f_flags & O_DIRECT)
  73. return -EINVAL;
  74. err = generic_file_open(inode, file);
  75. if (err)
  76. return err;
  77. /* If opening the root node, no lookup has been performed on
  78. it, so the attributes must be refreshed */
  79. if (get_node_id(inode) == FUSE_ROOT_ID) {
  80. err = fuse_do_getattr(inode);
  81. if (err)
  82. return err;
  83. }
  84. ff = fuse_file_alloc();
  85. if (!ff)
  86. return -ENOMEM;
  87. err = fuse_send_open(inode, file, isdir, &outarg);
  88. if (err)
  89. fuse_file_free(ff);
  90. else {
  91. if (isdir)
  92. outarg.open_flags &= ~FOPEN_DIRECT_IO;
  93. fuse_finish_open(inode, file, ff, &outarg);
  94. }
  95. return err;
  96. }
  97. /* Special case for failed iget in CREATE */
  98. static void fuse_release_end(struct fuse_conn *fc, struct fuse_req *req)
  99. {
  100. /* If called from end_io_requests(), req has more than one
  101. reference and fuse_reset_request() cannot work */
  102. if (fc->connected) {
  103. u64 nodeid = req->in.h.nodeid;
  104. fuse_reset_request(req);
  105. fuse_send_forget(fc, req, nodeid, 1);
  106. } else
  107. fuse_put_request(fc, req);
  108. }
  109. void fuse_send_release(struct fuse_conn *fc, struct fuse_file *ff,
  110. u64 nodeid, struct inode *inode, int flags, int isdir)
  111. {
  112. struct fuse_req * req = ff->release_req;
  113. struct fuse_release_in *inarg = &req->misc.release_in;
  114. inarg->fh = ff->fh;
  115. inarg->flags = flags;
  116. req->in.h.opcode = isdir ? FUSE_RELEASEDIR : FUSE_RELEASE;
  117. req->in.h.nodeid = nodeid;
  118. req->inode = inode;
  119. req->in.numargs = 1;
  120. req->in.args[0].size = sizeof(struct fuse_release_in);
  121. req->in.args[0].value = inarg;
  122. request_send_background(fc, req);
  123. if (!inode)
  124. req->end = fuse_release_end;
  125. kfree(ff);
  126. }
  127. int fuse_release_common(struct inode *inode, struct file *file, int isdir)
  128. {
  129. struct fuse_file *ff = file->private_data;
  130. if (ff) {
  131. struct fuse_conn *fc = get_fuse_conn(inode);
  132. u64 nodeid = get_node_id(inode);
  133. fuse_send_release(fc, ff, nodeid, inode, file->f_flags, isdir);
  134. }
  135. /* Return value is ignored by VFS */
  136. return 0;
  137. }
  138. static int fuse_open(struct inode *inode, struct file *file)
  139. {
  140. return fuse_open_common(inode, file, 0);
  141. }
  142. static int fuse_release(struct inode *inode, struct file *file)
  143. {
  144. return fuse_release_common(inode, file, 0);
  145. }
  146. static int fuse_flush(struct file *file)
  147. {
  148. struct inode *inode = file->f_dentry->d_inode;
  149. struct fuse_conn *fc = get_fuse_conn(inode);
  150. struct fuse_file *ff = file->private_data;
  151. struct fuse_req *req;
  152. struct fuse_flush_in inarg;
  153. int err;
  154. if (is_bad_inode(inode))
  155. return -EIO;
  156. if (fc->no_flush)
  157. return 0;
  158. req = fuse_get_req(fc);
  159. if (IS_ERR(req))
  160. return PTR_ERR(req);
  161. memset(&inarg, 0, sizeof(inarg));
  162. inarg.fh = ff->fh;
  163. req->in.h.opcode = FUSE_FLUSH;
  164. req->in.h.nodeid = get_node_id(inode);
  165. req->inode = inode;
  166. req->file = file;
  167. req->in.numargs = 1;
  168. req->in.args[0].size = sizeof(inarg);
  169. req->in.args[0].value = &inarg;
  170. request_send(fc, req);
  171. err = req->out.h.error;
  172. fuse_put_request(fc, req);
  173. if (err == -ENOSYS) {
  174. fc->no_flush = 1;
  175. err = 0;
  176. }
  177. return err;
  178. }
  179. int fuse_fsync_common(struct file *file, struct dentry *de, int datasync,
  180. int isdir)
  181. {
  182. struct inode *inode = de->d_inode;
  183. struct fuse_conn *fc = get_fuse_conn(inode);
  184. struct fuse_file *ff = file->private_data;
  185. struct fuse_req *req;
  186. struct fuse_fsync_in inarg;
  187. int err;
  188. if (is_bad_inode(inode))
  189. return -EIO;
  190. if ((!isdir && fc->no_fsync) || (isdir && fc->no_fsyncdir))
  191. return 0;
  192. req = fuse_get_req(fc);
  193. if (IS_ERR(req))
  194. return PTR_ERR(req);
  195. memset(&inarg, 0, sizeof(inarg));
  196. inarg.fh = ff->fh;
  197. inarg.fsync_flags = datasync ? 1 : 0;
  198. req->in.h.opcode = isdir ? FUSE_FSYNCDIR : FUSE_FSYNC;
  199. req->in.h.nodeid = get_node_id(inode);
  200. req->inode = inode;
  201. req->file = file;
  202. req->in.numargs = 1;
  203. req->in.args[0].size = sizeof(inarg);
  204. req->in.args[0].value = &inarg;
  205. request_send(fc, req);
  206. err = req->out.h.error;
  207. fuse_put_request(fc, req);
  208. if (err == -ENOSYS) {
  209. if (isdir)
  210. fc->no_fsyncdir = 1;
  211. else
  212. fc->no_fsync = 1;
  213. err = 0;
  214. }
  215. return err;
  216. }
  217. static int fuse_fsync(struct file *file, struct dentry *de, int datasync)
  218. {
  219. return fuse_fsync_common(file, de, datasync, 0);
  220. }
  221. void fuse_read_fill(struct fuse_req *req, struct file *file,
  222. struct inode *inode, loff_t pos, size_t count, int opcode)
  223. {
  224. struct fuse_file *ff = file->private_data;
  225. struct fuse_read_in *inarg = &req->misc.read_in;
  226. inarg->fh = ff->fh;
  227. inarg->offset = pos;
  228. inarg->size = count;
  229. req->in.h.opcode = opcode;
  230. req->in.h.nodeid = get_node_id(inode);
  231. req->inode = inode;
  232. req->file = file;
  233. req->in.numargs = 1;
  234. req->in.args[0].size = sizeof(struct fuse_read_in);
  235. req->in.args[0].value = inarg;
  236. req->out.argpages = 1;
  237. req->out.argvar = 1;
  238. req->out.numargs = 1;
  239. req->out.args[0].size = count;
  240. }
  241. static size_t fuse_send_read(struct fuse_req *req, struct file *file,
  242. struct inode *inode, loff_t pos, size_t count)
  243. {
  244. struct fuse_conn *fc = get_fuse_conn(inode);
  245. fuse_read_fill(req, file, inode, pos, count, FUSE_READ);
  246. request_send(fc, req);
  247. return req->out.args[0].size;
  248. }
  249. static int fuse_readpage(struct file *file, struct page *page)
  250. {
  251. struct inode *inode = page->mapping->host;
  252. struct fuse_conn *fc = get_fuse_conn(inode);
  253. struct fuse_req *req;
  254. int err;
  255. err = -EIO;
  256. if (is_bad_inode(inode))
  257. goto out;
  258. req = fuse_get_req(fc);
  259. err = PTR_ERR(req);
  260. if (IS_ERR(req))
  261. goto out;
  262. req->out.page_zeroing = 1;
  263. req->num_pages = 1;
  264. req->pages[0] = page;
  265. fuse_send_read(req, file, inode, page_offset(page), PAGE_CACHE_SIZE);
  266. err = req->out.h.error;
  267. fuse_put_request(fc, req);
  268. if (!err)
  269. SetPageUptodate(page);
  270. fuse_invalidate_attr(inode); /* atime changed */
  271. out:
  272. unlock_page(page);
  273. return err;
  274. }
  275. static void fuse_readpages_end(struct fuse_conn *fc, struct fuse_req *req)
  276. {
  277. int i;
  278. fuse_invalidate_attr(req->pages[0]->mapping->host); /* atime changed */
  279. for (i = 0; i < req->num_pages; i++) {
  280. struct page *page = req->pages[i];
  281. if (!req->out.h.error)
  282. SetPageUptodate(page);
  283. else
  284. SetPageError(page);
  285. unlock_page(page);
  286. }
  287. fuse_put_request(fc, req);
  288. }
  289. static void fuse_send_readpages(struct fuse_req *req, struct file *file,
  290. struct inode *inode)
  291. {
  292. struct fuse_conn *fc = get_fuse_conn(inode);
  293. loff_t pos = page_offset(req->pages[0]);
  294. size_t count = req->num_pages << PAGE_CACHE_SHIFT;
  295. req->out.page_zeroing = 1;
  296. fuse_read_fill(req, file, inode, pos, count, FUSE_READ);
  297. if (fc->async_read) {
  298. req->end = fuse_readpages_end;
  299. request_send_background(fc, req);
  300. } else {
  301. request_send(fc, req);
  302. fuse_readpages_end(fc, req);
  303. }
  304. }
  305. struct fuse_readpages_data {
  306. struct fuse_req *req;
  307. struct file *file;
  308. struct inode *inode;
  309. };
  310. static int fuse_readpages_fill(void *_data, struct page *page)
  311. {
  312. struct fuse_readpages_data *data = _data;
  313. struct fuse_req *req = data->req;
  314. struct inode *inode = data->inode;
  315. struct fuse_conn *fc = get_fuse_conn(inode);
  316. if (req->num_pages &&
  317. (req->num_pages == FUSE_MAX_PAGES_PER_REQ ||
  318. (req->num_pages + 1) * PAGE_CACHE_SIZE > fc->max_read ||
  319. req->pages[req->num_pages - 1]->index + 1 != page->index)) {
  320. fuse_send_readpages(req, data->file, inode);
  321. data->req = req = fuse_get_req(fc);
  322. if (IS_ERR(req)) {
  323. unlock_page(page);
  324. return PTR_ERR(req);
  325. }
  326. }
  327. req->pages[req->num_pages] = page;
  328. req->num_pages ++;
  329. return 0;
  330. }
  331. static int fuse_readpages(struct file *file, struct address_space *mapping,
  332. struct list_head *pages, unsigned nr_pages)
  333. {
  334. struct inode *inode = mapping->host;
  335. struct fuse_conn *fc = get_fuse_conn(inode);
  336. struct fuse_readpages_data data;
  337. int err;
  338. if (is_bad_inode(inode))
  339. return -EIO;
  340. data.file = file;
  341. data.inode = inode;
  342. data.req = fuse_get_req(fc);
  343. if (IS_ERR(data.req))
  344. return PTR_ERR(data.req);
  345. err = read_cache_pages(mapping, pages, fuse_readpages_fill, &data);
  346. if (!err) {
  347. if (data.req->num_pages)
  348. fuse_send_readpages(data.req, file, inode);
  349. else
  350. fuse_put_request(fc, data.req);
  351. }
  352. return err;
  353. }
  354. static size_t fuse_send_write(struct fuse_req *req, struct file *file,
  355. struct inode *inode, loff_t pos, size_t count)
  356. {
  357. struct fuse_conn *fc = get_fuse_conn(inode);
  358. struct fuse_file *ff = file->private_data;
  359. struct fuse_write_in inarg;
  360. struct fuse_write_out outarg;
  361. memset(&inarg, 0, sizeof(struct fuse_write_in));
  362. inarg.fh = ff->fh;
  363. inarg.offset = pos;
  364. inarg.size = count;
  365. req->in.h.opcode = FUSE_WRITE;
  366. req->in.h.nodeid = get_node_id(inode);
  367. req->inode = inode;
  368. req->file = file;
  369. req->in.argpages = 1;
  370. req->in.numargs = 2;
  371. req->in.args[0].size = sizeof(struct fuse_write_in);
  372. req->in.args[0].value = &inarg;
  373. req->in.args[1].size = count;
  374. req->out.numargs = 1;
  375. req->out.args[0].size = sizeof(struct fuse_write_out);
  376. req->out.args[0].value = &outarg;
  377. request_send(fc, req);
  378. return outarg.size;
  379. }
  380. static int fuse_prepare_write(struct file *file, struct page *page,
  381. unsigned offset, unsigned to)
  382. {
  383. /* No op */
  384. return 0;
  385. }
  386. static int fuse_commit_write(struct file *file, struct page *page,
  387. unsigned offset, unsigned to)
  388. {
  389. int err;
  390. size_t nres;
  391. unsigned count = to - offset;
  392. struct inode *inode = page->mapping->host;
  393. struct fuse_conn *fc = get_fuse_conn(inode);
  394. loff_t pos = page_offset(page) + offset;
  395. struct fuse_req *req;
  396. if (is_bad_inode(inode))
  397. return -EIO;
  398. req = fuse_get_req(fc);
  399. if (IS_ERR(req))
  400. return PTR_ERR(req);
  401. req->num_pages = 1;
  402. req->pages[0] = page;
  403. req->page_offset = offset;
  404. nres = fuse_send_write(req, file, inode, pos, count);
  405. err = req->out.h.error;
  406. fuse_put_request(fc, req);
  407. if (!err && nres != count)
  408. err = -EIO;
  409. if (!err) {
  410. pos += count;
  411. if (pos > i_size_read(inode))
  412. i_size_write(inode, pos);
  413. if (offset == 0 && to == PAGE_CACHE_SIZE) {
  414. clear_page_dirty(page);
  415. SetPageUptodate(page);
  416. }
  417. }
  418. fuse_invalidate_attr(inode);
  419. return err;
  420. }
  421. static void fuse_release_user_pages(struct fuse_req *req, int write)
  422. {
  423. unsigned i;
  424. for (i = 0; i < req->num_pages; i++) {
  425. struct page *page = req->pages[i];
  426. if (write)
  427. set_page_dirty_lock(page);
  428. put_page(page);
  429. }
  430. }
  431. static int fuse_get_user_pages(struct fuse_req *req, const char __user *buf,
  432. unsigned nbytes, int write)
  433. {
  434. unsigned long user_addr = (unsigned long) buf;
  435. unsigned offset = user_addr & ~PAGE_MASK;
  436. int npages;
  437. /* This doesn't work with nfsd */
  438. if (!current->mm)
  439. return -EPERM;
  440. nbytes = min(nbytes, (unsigned) FUSE_MAX_PAGES_PER_REQ << PAGE_SHIFT);
  441. npages = (nbytes + offset + PAGE_SIZE - 1) >> PAGE_SHIFT;
  442. npages = min(max(npages, 1), FUSE_MAX_PAGES_PER_REQ);
  443. down_read(&current->mm->mmap_sem);
  444. npages = get_user_pages(current, current->mm, user_addr, npages, write,
  445. 0, req->pages, NULL);
  446. up_read(&current->mm->mmap_sem);
  447. if (npages < 0)
  448. return npages;
  449. req->num_pages = npages;
  450. req->page_offset = offset;
  451. return 0;
  452. }
  453. static ssize_t fuse_direct_io(struct file *file, const char __user *buf,
  454. size_t count, loff_t *ppos, int write)
  455. {
  456. struct inode *inode = file->f_dentry->d_inode;
  457. struct fuse_conn *fc = get_fuse_conn(inode);
  458. size_t nmax = write ? fc->max_write : fc->max_read;
  459. loff_t pos = *ppos;
  460. ssize_t res = 0;
  461. struct fuse_req *req;
  462. if (is_bad_inode(inode))
  463. return -EIO;
  464. req = fuse_get_req(fc);
  465. if (IS_ERR(req))
  466. return PTR_ERR(req);
  467. while (count) {
  468. size_t nres;
  469. size_t nbytes = min(count, nmax);
  470. int err = fuse_get_user_pages(req, buf, nbytes, !write);
  471. if (err) {
  472. res = err;
  473. break;
  474. }
  475. nbytes = (req->num_pages << PAGE_SHIFT) - req->page_offset;
  476. nbytes = min(count, nbytes);
  477. if (write)
  478. nres = fuse_send_write(req, file, inode, pos, nbytes);
  479. else
  480. nres = fuse_send_read(req, file, inode, pos, nbytes);
  481. fuse_release_user_pages(req, !write);
  482. if (req->out.h.error) {
  483. if (!res)
  484. res = req->out.h.error;
  485. break;
  486. } else if (nres > nbytes) {
  487. res = -EIO;
  488. break;
  489. }
  490. count -= nres;
  491. res += nres;
  492. pos += nres;
  493. buf += nres;
  494. if (nres != nbytes)
  495. break;
  496. if (count) {
  497. fuse_put_request(fc, req);
  498. req = fuse_get_req(fc);
  499. if (IS_ERR(req))
  500. break;
  501. }
  502. }
  503. fuse_put_request(fc, req);
  504. if (res > 0) {
  505. if (write && pos > i_size_read(inode))
  506. i_size_write(inode, pos);
  507. *ppos = pos;
  508. }
  509. fuse_invalidate_attr(inode);
  510. return res;
  511. }
  512. static ssize_t fuse_direct_read(struct file *file, char __user *buf,
  513. size_t count, loff_t *ppos)
  514. {
  515. return fuse_direct_io(file, buf, count, ppos, 0);
  516. }
  517. static ssize_t fuse_direct_write(struct file *file, const char __user *buf,
  518. size_t count, loff_t *ppos)
  519. {
  520. struct inode *inode = file->f_dentry->d_inode;
  521. ssize_t res;
  522. /* Don't allow parallel writes to the same file */
  523. mutex_lock(&inode->i_mutex);
  524. res = fuse_direct_io(file, buf, count, ppos, 1);
  525. mutex_unlock(&inode->i_mutex);
  526. return res;
  527. }
  528. static int fuse_file_mmap(struct file *file, struct vm_area_struct *vma)
  529. {
  530. if ((vma->vm_flags & VM_SHARED)) {
  531. if ((vma->vm_flags & VM_WRITE))
  532. return -ENODEV;
  533. else
  534. vma->vm_flags &= ~VM_MAYWRITE;
  535. }
  536. return generic_file_mmap(file, vma);
  537. }
  538. static int fuse_set_page_dirty(struct page *page)
  539. {
  540. printk("fuse_set_page_dirty: should not happen\n");
  541. dump_stack();
  542. return 0;
  543. }
  544. static const struct file_operations fuse_file_operations = {
  545. .llseek = generic_file_llseek,
  546. .read = generic_file_read,
  547. .write = generic_file_write,
  548. .mmap = fuse_file_mmap,
  549. .open = fuse_open,
  550. .flush = fuse_flush,
  551. .release = fuse_release,
  552. .fsync = fuse_fsync,
  553. .sendfile = generic_file_sendfile,
  554. };
  555. static const struct file_operations fuse_direct_io_file_operations = {
  556. .llseek = generic_file_llseek,
  557. .read = fuse_direct_read,
  558. .write = fuse_direct_write,
  559. .open = fuse_open,
  560. .flush = fuse_flush,
  561. .release = fuse_release,
  562. .fsync = fuse_fsync,
  563. /* no mmap and sendfile */
  564. };
  565. static struct address_space_operations fuse_file_aops = {
  566. .readpage = fuse_readpage,
  567. .prepare_write = fuse_prepare_write,
  568. .commit_write = fuse_commit_write,
  569. .readpages = fuse_readpages,
  570. .set_page_dirty = fuse_set_page_dirty,
  571. };
  572. void fuse_init_file_inode(struct inode *inode)
  573. {
  574. inode->i_fop = &fuse_file_operations;
  575. inode->i_data.a_ops = &fuse_file_aops;
  576. }