
/*
 * linux/ipc/shm.c
 * Copyright (C) 1992, 1993 Krishna Balasubramanian
 *	 Many improvements/fixes by Bruno Haible.
 * Replaced `struct shm_desc' by `struct vm_area_struct', July 1994.
 * Fixed the shm swap deallocation (shm_unuse()), August 1998 Andrea Arcangeli.
 *
 * /proc/sysvipc/shm support (c) 1999 Dragos Acostachioaie <dragos@iname.com>
 * BIGMEM support, Andrea Arcangeli <andrea@suse.de>
 * SMP thread shm, Jean-Luc Boyard <jean-luc.boyard@siemens.fr>
 * HIGHMEM support, Ingo Molnar <mingo@redhat.com>
 * Make shmmax, shmall, shmmni sysctl'able, Christoph Rohland <cr@sap.com>
 * Shared /dev/zero support, Kanoj Sarcar <kanoj@sgi.com>
 * Move the mm functionality over to mm/shmem.c, Christoph Rohland <cr@sap.com>
 *
 */
#include <linux/config.h>
#include <linux/slab.h>
#include <linux/mm.h>
#include <linux/hugetlb.h>
#include <linux/shm.h>
#include <linux/init.h>
#include <linux/file.h>
#include <linux/mman.h>
#include <linux/proc_fs.h>
#include <linux/shmem_fs.h>
#include <linux/security.h>
#include <linux/syscalls.h>
#include <linux/audit.h>
#include <linux/ptrace.h>
#include <asm/uaccess.h>

#include "util.h"

#define shm_flags	shm_perm.mode

static struct file_operations shm_file_operations;
static struct vm_operations_struct shm_vm_ops;

static struct ipc_ids shm_ids;

#define shm_lock(id)	((struct shmid_kernel*)ipc_lock(&shm_ids,id))
#define shm_unlock(shp)	ipc_unlock(&(shp)->shm_perm)
#define shm_get(id)	((struct shmid_kernel*)ipc_get(&shm_ids,id))
#define shm_buildid(id, seq) \
	ipc_buildid(&shm_ids, id, seq)
static int newseg (key_t key, int shmflg, size_t size);
static void shm_open (struct vm_area_struct *shmd);
static void shm_close (struct vm_area_struct *shmd);
#ifdef CONFIG_PROC_FS
static int sysvipc_shm_read_proc(char *buffer, char **start, off_t offset, int length, int *eof, void *data);
#endif

size_t shm_ctlmax = SHMMAX;
size_t shm_ctlall = SHMALL;
int shm_ctlmni = SHMMNI;

static int shm_tot; /* total number of shared memory pages */
void __init shm_init (void)
{
	ipc_init_ids(&shm_ids, 1);
#ifdef CONFIG_PROC_FS
	create_proc_read_entry("sysvipc/shm", 0, NULL, sysvipc_shm_read_proc, NULL);
#endif
}
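
/*
 * Thin wrappers around the generic SysV id management in ipc/util.c:
 * shm_checkid() verifies that an id still refers to this segment,
 * shm_rmid() drops the segment from the id array, and shm_addid()
 * registers a new segment subject to the shm_ctlmni limit.
 */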
static inline int shm_checkid(struct shmid_kernel *s, int id)
{
	if (ipc_checkid(&shm_ids,&s->shm_perm,id))
		return -EIDRM;
	return 0;
}

static inline struct shmid_kernel *shm_rmid(int id)
{
	return (struct shmid_kernel *)ipc_rmid(&shm_ids,id);
}

static inline int shm_addid(struct shmid_kernel *shp)
{
	return ipc_addid(&shm_ids, &shp->shm_perm, shm_ctlmni);
}
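
/*
 * Account one more attach of the segment whose id is @id: update the
 * attach time and last-pid fields and bump shm_nattch.  The id comes
 * from the backing file's inode number, so it must exist (hence BUG()).
 */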
static inline void shm_inc (int id) {
	struct shmid_kernel *shp;

	if(!(shp = shm_lock(id)))
		BUG();
	shp->shm_atim = get_seconds();
	shp->shm_lprid = current->tgid;
	shp->shm_nattch++;
	shm_unlock(shp);
}
/* This is called by fork, once for every shm attach. */
static void shm_open (struct vm_area_struct *shmd)
{
	shm_inc (shmd->vm_file->f_dentry->d_inode->i_ino);
}

/*
 * shm_destroy - free the struct shmid_kernel
 *
 * @shp: struct to free
 *
 * It has to be called with shp and shm_ids.sem locked,
 * but returns with shp unlocked and freed.
 */
static void shm_destroy (struct shmid_kernel *shp)
{
	shm_tot -= (shp->shm_segsz + PAGE_SIZE - 1) >> PAGE_SHIFT;
	shm_rmid (shp->id);
	shm_unlock(shp);
	if (!is_file_hugepages(shp->shm_file))
		shmem_lock(shp->shm_file, 0, shp->mlock_user);
	else
		user_shm_unlock(shp->shm_file->f_dentry->d_inode->i_size,
				shp->mlock_user);
	fput (shp->shm_file);
	security_shm_free(shp);
	ipc_rcu_putref(shp);
}
/*
 * remove the attach descriptor shmd.
 * free memory for segment if it is marked destroyed.
 * The descriptor has already been removed from the current->mm->mmap list
 * and will later be kfree()d.
 */
static void shm_close (struct vm_area_struct *shmd)
{
	struct file * file = shmd->vm_file;
	int id = file->f_dentry->d_inode->i_ino;
	struct shmid_kernel *shp;

	down (&shm_ids.sem);
	/* remove from the list of attaches of the shm segment */
	if(!(shp = shm_lock(id)))
		BUG();
	shp->shm_lprid = current->tgid;
	shp->shm_dtim = get_seconds();
	shp->shm_nattch--;
	if(shp->shm_nattch == 0 &&
	   shp->shm_flags & SHM_DEST)
		shm_destroy (shp);
	else
		shm_unlock(shp);
	up (&shm_ids.sem);
}
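
/*
 * mmap callback of the shm backing file: install shm_vm_ops so that
 * vm_area open/close keep the attach count in sync, then record the
 * new attach via shm_inc().
 */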
static int shm_mmap(struct file * file, struct vm_area_struct * vma)
{
	file_accessed(file);
	vma->vm_ops = &shm_vm_ops;
	shm_inc(file->f_dentry->d_inode->i_ino);
	return 0;
}

static struct file_operations shm_file_operations = {
	.mmap	= shm_mmap
};

static struct vm_operations_struct shm_vm_ops = {
	.open	= shm_open,	/* callback for a new vm-area open */
	.close	= shm_close,	/* callback for when the vm-area is released */
	.nopage	= shmem_nopage,
#ifdef CONFIG_NUMA
	.set_policy = shmem_set_policy,
	.get_policy = shmem_get_policy,
#endif
};
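
/*
 * Create a new segment of @size bytes: check it against the shmmax and
 * shmall limits, set up the backing shmem (or hugetlb) file, and register
 * the segment.  Returns the new shm id or a negative error.
 * Called with shm_ids.sem held.
 */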
static int newseg (key_t key, int shmflg, size_t size)
{
	int error;
	struct shmid_kernel *shp;
	int numpages = (size + PAGE_SIZE -1) >> PAGE_SHIFT;
	struct file * file;
	char name[13];
	int id;

	if (size < SHMMIN || size > shm_ctlmax)
		return -EINVAL;

	if (shm_tot + numpages >= shm_ctlall)
		return -ENOSPC;

	shp = ipc_rcu_alloc(sizeof(*shp));
	if (!shp)
		return -ENOMEM;

	shp->shm_perm.key = key;
	shp->shm_flags = (shmflg & S_IRWXUGO);
	shp->mlock_user = NULL;

	shp->shm_perm.security = NULL;
	error = security_shm_alloc(shp);
	if (error) {
		ipc_rcu_putref(shp);
		return error;
	}

	if (shmflg & SHM_HUGETLB) {
		/* hugetlb_zero_setup takes care of mlock user accounting */
		file = hugetlb_zero_setup(size);
		shp->mlock_user = current->user;
	} else {
		sprintf (name, "SYSV%08x", key);
		file = shmem_file_setup(name, size, VM_ACCOUNT);
	}
	error = PTR_ERR(file);
	if (IS_ERR(file))
		goto no_file;

	error = -ENOSPC;
	id = shm_addid(shp);
	if(id == -1)
		goto no_id;

	shp->shm_cprid = current->tgid;
	shp->shm_lprid = 0;
	shp->shm_atim = shp->shm_dtim = 0;
	shp->shm_ctim = get_seconds();
	shp->shm_segsz = size;
	shp->shm_nattch = 0;
	shp->id = shm_buildid(id,shp->shm_perm.seq);
	shp->shm_file = file;
	file->f_dentry->d_inode->i_ino = shp->id;
	if (shmflg & SHM_HUGETLB)
		set_file_hugepages(file);
	else
		file->f_op = &shm_file_operations;
	shm_tot += numpages;
	shm_unlock(shp);
	return shp->id;

no_id:
	fput(file);
no_file:
	security_shm_free(shp);
	ipc_rcu_putref(shp);
	return error;
}
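
/*
 * shmget(2): create a new segment for IPC_PRIVATE or for a key that does
 * not exist yet (if IPC_CREAT is set); otherwise look up the existing
 * segment, verify size and permissions, and return its id.
 */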
asmlinkage long sys_shmget (key_t key, size_t size, int shmflg)
{
	struct shmid_kernel *shp;
	int err, id = 0;

	down(&shm_ids.sem);
	if (key == IPC_PRIVATE) {
		err = newseg(key, shmflg, size);
	} else if ((id = ipc_findkey(&shm_ids, key)) == -1) {
		if (!(shmflg & IPC_CREAT))
			err = -ENOENT;
		else
			err = newseg(key, shmflg, size);
	} else if ((shmflg & IPC_CREAT) && (shmflg & IPC_EXCL)) {
		err = -EEXIST;
	} else {
		shp = shm_lock(id);
		if(shp==NULL)
			BUG();
		if (shp->shm_segsz < size)
			err = -EINVAL;
		else if (ipcperms(&shp->shm_perm, shmflg))
			err = -EACCES;
		else {
			int shmid = shm_buildid(id, shp->shm_perm.seq);
			err = security_shm_associate(shp, shmflg);
			if (!err)
				err = shmid;
		}
		shm_unlock(shp);
	}
	up(&shm_ids.sem);
	return err;
}
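
/*
 * The copy_* helpers below translate between the new shmid64_ds/shminfo64
 * layouts and the old shmid_ds/shminfo ones, depending on whether the
 * caller used the IPC_64 or IPC_OLD interface.
 */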
static inline unsigned long copy_shmid_to_user(void __user *buf, struct shmid64_ds *in, int version)
{
	switch(version) {
	case IPC_64:
		return copy_to_user(buf, in, sizeof(*in));
	case IPC_OLD:
	    {
		struct shmid_ds out;

		ipc64_perm_to_ipc_perm(&in->shm_perm, &out.shm_perm);
		out.shm_segsz	= in->shm_segsz;
		out.shm_atime	= in->shm_atime;
		out.shm_dtime	= in->shm_dtime;
		out.shm_ctime	= in->shm_ctime;
		out.shm_cpid	= in->shm_cpid;
		out.shm_lpid	= in->shm_lpid;
		out.shm_nattch	= in->shm_nattch;

		return copy_to_user(buf, &out, sizeof(out));
	    }
	default:
		return -EINVAL;
	}
}

struct shm_setbuf {
	uid_t	uid;
	gid_t	gid;
	mode_t	mode;
};

static inline unsigned long copy_shmid_from_user(struct shm_setbuf *out, void __user *buf, int version)
{
	switch(version) {
	case IPC_64:
	    {
		struct shmid64_ds tbuf;

		if (copy_from_user(&tbuf, buf, sizeof(tbuf)))
			return -EFAULT;

		out->uid	= tbuf.shm_perm.uid;
		out->gid	= tbuf.shm_perm.gid;
		out->mode	= tbuf.shm_flags;

		return 0;
	    }
	case IPC_OLD:
	    {
		struct shmid_ds tbuf_old;

		if (copy_from_user(&tbuf_old, buf, sizeof(tbuf_old)))
			return -EFAULT;

		out->uid	= tbuf_old.shm_perm.uid;
		out->gid	= tbuf_old.shm_perm.gid;
		out->mode	= tbuf_old.shm_flags;

		return 0;
	    }
	default:
		return -EINVAL;
	}
}

static inline unsigned long copy_shminfo_to_user(void __user *buf, struct shminfo64 *in, int version)
{
	switch(version) {
	case IPC_64:
		return copy_to_user(buf, in, sizeof(*in));
	case IPC_OLD:
	    {
		struct shminfo out;

		if(in->shmmax > INT_MAX)
			out.shmmax = INT_MAX;
		else
			out.shmmax = (int)in->shmmax;

		out.shmmin	= in->shmmin;
		out.shmmni	= in->shmmni;
		out.shmseg	= in->shmseg;
		out.shmall	= in->shmall;

		return copy_to_user(buf, &out, sizeof(out));
	    }
	default:
		return -EINVAL;
	}
}
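
/*
 * Sum the resident and swapped-out page counts of all segments for
 * SHM_INFO.  Expects shm_ids.sem to be held by the caller.
 */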
static void shm_get_stat(unsigned long *rss, unsigned long *swp)
{
	int i;

	*rss = 0;
	*swp = 0;

	for (i = 0; i <= shm_ids.max_id; i++) {
		struct shmid_kernel *shp;
		struct inode *inode;

		shp = shm_get(i);
		if(!shp)
			continue;

		inode = shp->shm_file->f_dentry->d_inode;

		if (is_file_hugepages(shp->shm_file)) {
			struct address_space *mapping = inode->i_mapping;
			*rss += (HPAGE_SIZE/PAGE_SIZE)*mapping->nrpages;
		} else {
			struct shmem_inode_info *info = SHMEM_I(inode);
			spin_lock(&info->lock);
			*rss += inode->i_mapping->nrpages;
			*swp += info->swapped;
			spin_unlock(&info->lock);
		}
	}
}
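
/*
 * shmctl(2): system-wide queries (IPC_INFO, SHM_INFO), per-segment status
 * (IPC_STAT, SHM_STAT), locking (SHM_LOCK, SHM_UNLOCK), removal (IPC_RMID)
 * and owner/permission updates (IPC_SET).
 */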
asmlinkage long sys_shmctl (int shmid, int cmd, struct shmid_ds __user *buf)
{
	struct shm_setbuf setbuf;
	struct shmid_kernel *shp;
	int err, version;

	if (cmd < 0 || shmid < 0) {
		err = -EINVAL;
		goto out;
	}

	version = ipc_parse_version(&cmd);

	switch (cmd) { /* replace with proc interface ? */
	case IPC_INFO:
	{
		struct shminfo64 shminfo;

		err = security_shm_shmctl(NULL, cmd);
		if (err)
			return err;

		memset(&shminfo,0,sizeof(shminfo));
		shminfo.shmmni = shminfo.shmseg = shm_ctlmni;
		shminfo.shmmax = shm_ctlmax;
		shminfo.shmall = shm_ctlall;

		shminfo.shmmin = SHMMIN;
		if(copy_shminfo_to_user (buf, &shminfo, version))
			return -EFAULT;
		/* reading an integer is always atomic */
		err = shm_ids.max_id;
		if(err<0)
			err = 0;
		goto out;
	}
	case SHM_INFO:
	{
		struct shm_info shm_info;

		err = security_shm_shmctl(NULL, cmd);
		if (err)
			return err;

		memset(&shm_info,0,sizeof(shm_info));
		down(&shm_ids.sem);
		shm_info.used_ids = shm_ids.in_use;
		shm_get_stat (&shm_info.shm_rss, &shm_info.shm_swp);
		shm_info.shm_tot = shm_tot;
		shm_info.swap_attempts = 0;
		shm_info.swap_successes = 0;
		err = shm_ids.max_id;
		up(&shm_ids.sem);
		if(copy_to_user (buf, &shm_info, sizeof(shm_info))) {
			err = -EFAULT;
			goto out;
		}

		err = err < 0 ? 0 : err;
		goto out;
	}
	case SHM_STAT:
	case IPC_STAT:
	{
		struct shmid64_ds tbuf;
		int result;
		memset(&tbuf, 0, sizeof(tbuf));
		shp = shm_lock(shmid);
		if(shp==NULL) {
			err = -EINVAL;
			goto out;
		} else if(cmd==SHM_STAT) {
			err = -EINVAL;
			if (shmid > shm_ids.max_id)
				goto out_unlock;
			result = shm_buildid(shmid, shp->shm_perm.seq);
		} else {
			err = shm_checkid(shp,shmid);
			if(err)
				goto out_unlock;
			result = 0;
		}
		err = -EACCES;
		if (ipcperms (&shp->shm_perm, S_IRUGO))
			goto out_unlock;
		err = security_shm_shmctl(shp, cmd);
		if (err)
			goto out_unlock;
		kernel_to_ipc64_perm(&shp->shm_perm, &tbuf.shm_perm);
		tbuf.shm_segsz	= shp->shm_segsz;
		tbuf.shm_atime	= shp->shm_atim;
		tbuf.shm_dtime	= shp->shm_dtim;
		tbuf.shm_ctime	= shp->shm_ctim;
		tbuf.shm_cpid	= shp->shm_cprid;
		tbuf.shm_lpid	= shp->shm_lprid;
		if (!is_file_hugepages(shp->shm_file))
			tbuf.shm_nattch	= shp->shm_nattch;
		else
			tbuf.shm_nattch = file_count(shp->shm_file) - 1;
		shm_unlock(shp);
		if(copy_shmid_to_user (buf, &tbuf, version))
			err = -EFAULT;
		else
			err = result;
		goto out;
	}
	case SHM_LOCK:
	case SHM_UNLOCK:
	{
		shp = shm_lock(shmid);
		if(shp==NULL) {
			err = -EINVAL;
			goto out;
		}
		err = shm_checkid(shp,shmid);
		if(err)
			goto out_unlock;

		if (!capable(CAP_IPC_LOCK)) {
			err = -EPERM;
			if (current->euid != shp->shm_perm.uid &&
			    current->euid != shp->shm_perm.cuid)
				goto out_unlock;
			if (cmd == SHM_LOCK &&
			    !current->signal->rlim[RLIMIT_MEMLOCK].rlim_cur)
				goto out_unlock;
		}

		err = security_shm_shmctl(shp, cmd);
		if (err)
			goto out_unlock;

		if(cmd==SHM_LOCK) {
			struct user_struct * user = current->user;
			if (!is_file_hugepages(shp->shm_file)) {
				err = shmem_lock(shp->shm_file, 1, user);
				if (!err) {
					shp->shm_flags |= SHM_LOCKED;
					shp->mlock_user = user;
				}
			}
		} else if (!is_file_hugepages(shp->shm_file)) {
			shmem_lock(shp->shm_file, 0, shp->mlock_user);
			shp->shm_flags &= ~SHM_LOCKED;
			shp->mlock_user = NULL;
		}
		shm_unlock(shp);
		goto out;
	}
	case IPC_RMID:
	{
		/*
		 *	We cannot simply remove the file. The SVID states
		 *	that the block remains until the last person
		 *	detaches from it, then is deleted. A shmat() on
		 *	an RMID segment is legal in older Linux and if
		 *	we change it apps break...
		 *
		 *	Instead we set a destroyed flag, and then blow
		 *	the name away when the usage hits zero.
		 */
		down(&shm_ids.sem);
		shp = shm_lock(shmid);
		err = -EINVAL;
		if (shp == NULL)
			goto out_up;
		err = shm_checkid(shp, shmid);
		if(err)
			goto out_unlock_up;

		if (current->euid != shp->shm_perm.uid &&
		    current->euid != shp->shm_perm.cuid &&
		    !capable(CAP_SYS_ADMIN)) {
			err = -EPERM;
			goto out_unlock_up;
		}

		err = security_shm_shmctl(shp, cmd);
		if (err)
			goto out_unlock_up;

		if (shp->shm_nattch){
			shp->shm_flags |= SHM_DEST;
			/* Do not find it any more */
			shp->shm_perm.key = IPC_PRIVATE;
			shm_unlock(shp);
		} else
			shm_destroy (shp);
		up(&shm_ids.sem);
		goto out;
	}

	case IPC_SET:
	{
		if (copy_shmid_from_user (&setbuf, buf, version)) {
			err = -EFAULT;
			goto out;
		}
		if ((err = audit_ipc_perms(0, setbuf.uid, setbuf.gid, setbuf.mode)))
			return err;
		down(&shm_ids.sem);
		shp = shm_lock(shmid);
		err = -EINVAL;
		if(shp==NULL)
			goto out_up;
		err = shm_checkid(shp,shmid);
		if(err)
			goto out_unlock_up;
		err = -EPERM;
		if (current->euid != shp->shm_perm.uid &&
		    current->euid != shp->shm_perm.cuid &&
		    !capable(CAP_SYS_ADMIN)) {
			goto out_unlock_up;
		}

		err = security_shm_shmctl(shp, cmd);
		if (err)
			goto out_unlock_up;

		shp->shm_perm.uid = setbuf.uid;
		shp->shm_perm.gid = setbuf.gid;
		shp->shm_flags = (shp->shm_flags & ~S_IRWXUGO)
			| (setbuf.mode & S_IRWXUGO);
		shp->shm_ctim = get_seconds();
		break;
	}

	default:
		err = -EINVAL;
		goto out;
	}

	err = 0;
out_unlock_up:
	shm_unlock(shp);
out_up:
	up(&shm_ids.sem);
	goto out;
out_unlock:
	shm_unlock(shp);
out:
	return err;
}
/*
 * Fix shmaddr, allocate descriptor, map shm, add attach descriptor to lists.
 *
 * NOTE! Despite the name, this is NOT a direct system call entrypoint. The
 * "raddr" thing points to kernel space, and there has to be a wrapper around
 * this.
 */
long do_shmat(int shmid, char __user *shmaddr, int shmflg, ulong *raddr)
{
	struct shmid_kernel *shp;
	unsigned long addr;
	unsigned long size;
	struct file * file;
	int err;
	unsigned long flags;
	unsigned long prot;
	unsigned long o_flags;
	int acc_mode;
	void *user_addr;

	if (shmid < 0) {
		err = -EINVAL;
		goto out;
	} else if ((addr = (ulong)shmaddr)) {
		if (addr & (SHMLBA-1)) {
			if (shmflg & SHM_RND)
				addr &= ~(SHMLBA-1);	/* round down */
			else
#ifndef __ARCH_FORCE_SHMLBA
				if (addr & ~PAGE_MASK)
#endif
					return -EINVAL;
		}
		flags = MAP_SHARED | MAP_FIXED;
	} else {
		if ((shmflg & SHM_REMAP))
			return -EINVAL;

		flags = MAP_SHARED;
	}

	if (shmflg & SHM_RDONLY) {
		prot = PROT_READ;
		o_flags = O_RDONLY;
		acc_mode = S_IRUGO;
	} else {
		prot = PROT_READ | PROT_WRITE;
		o_flags = O_RDWR;
		acc_mode = S_IRUGO | S_IWUGO;
	}
	if (shmflg & SHM_EXEC) {
		prot |= PROT_EXEC;
		acc_mode |= S_IXUGO;
	}

	/*
	 * We cannot rely on the fs check since SYSV IPC does have an
	 * additional creator id...
	 */
	shp = shm_lock(shmid);
	if(shp == NULL) {
		err = -EINVAL;
		goto out;
	}
	err = shm_checkid(shp,shmid);
	if (err) {
		shm_unlock(shp);
		goto out;
	}
	if (ipcperms(&shp->shm_perm, acc_mode)) {
		shm_unlock(shp);
		err = -EACCES;
		goto out;
	}

	err = security_shm_shmat(shp, shmaddr, shmflg);
	if (err) {
		shm_unlock(shp);
		return err;
	}

	file = shp->shm_file;
	size = i_size_read(file->f_dentry->d_inode);
	shp->shm_nattch++;
	shm_unlock(shp);

	down_write(&current->mm->mmap_sem);
	if (addr && !(shmflg & SHM_REMAP)) {
		user_addr = ERR_PTR(-EINVAL);
		if (find_vma_intersection(current->mm, addr, addr + size))
			goto invalid;
		/*
		 * If shm segment goes below stack, make sure there is some
		 * space left for the stack to grow (at least 4 pages).
		 */
		if (addr < current->mm->start_stack &&
		    addr > current->mm->start_stack - size - PAGE_SIZE * 5)
			goto invalid;
	}

	user_addr = (void*) do_mmap (file, addr, size, prot, flags, 0);

invalid:
	up_write(&current->mm->mmap_sem);

	down (&shm_ids.sem);
	if(!(shp = shm_lock(shmid)))
		BUG();
	shp->shm_nattch--;
	if(shp->shm_nattch == 0 &&
	   shp->shm_flags & SHM_DEST)
		shm_destroy (shp);
	else
		shm_unlock(shp);
	up (&shm_ids.sem);

	*raddr = (unsigned long) user_addr;
	err = 0;
	if (IS_ERR(user_addr))
		err = PTR_ERR(user_addr);
out:
	return err;
}
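
/*
 * shmat(2) entry point: do_shmat() reports the attach address through a
 * kernel pointer; on success that address becomes the syscall return value.
 */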
asmlinkage long sys_shmat(int shmid, char __user *shmaddr, int shmflg)
{
	unsigned long ret;
	long err;

	err = do_shmat(shmid, shmaddr, shmflg, &ret);
	if (err)
		return err;
	force_successful_syscall_return();
	return (long)ret;
}
/*
 * detach and kill segment if marked destroyed.
 * The work is done in shm_close.
 */
asmlinkage long sys_shmdt(char __user *shmaddr)
{
	struct mm_struct *mm = current->mm;
	struct vm_area_struct *vma, *next;
	unsigned long addr = (unsigned long)shmaddr;
	loff_t size = 0;
	int retval = -EINVAL;

	down_write(&mm->mmap_sem);

	/*
	 * This function tries to be smart and unmap shm segments that
	 * were modified by partial mlock or munmap calls:
	 * - It first determines the size of the shm segment that should be
	 *   unmapped: It searches for a vma that is backed by shm and that
	 *   started at address shmaddr. It records its size and then unmaps
	 *   it.
	 * - Then it unmaps all shm vmas that started at shmaddr and that
	 *   are within the initially determined size.
	 * Errors from do_munmap are ignored: the function only fails if
	 * it's called with invalid parameters or if it's called to unmap
	 * a part of a vma. Both calls in this function are for full vmas,
	 * the parameters are directly copied from the vma itself and always
	 * valid - therefore do_munmap cannot fail. (famous last words?)
	 */
	/*
	 * If it had been mremap()'d, the starting address would not
	 * match the usual checks anyway. So assume all vma's are
	 * above the starting address given.
	 */
	vma = find_vma(mm, addr);

	while (vma) {
		next = vma->vm_next;

		/*
		 * Check if the starting address would match, i.e. it's
		 * a fragment created by mprotect() and/or munmap(), or
		 * otherwise it starts at this address with no hassles.
		 */
		if ((vma->vm_ops == &shm_vm_ops || is_vm_hugetlb_page(vma)) &&
			(vma->vm_start - addr)/PAGE_SIZE == vma->vm_pgoff) {

			size = vma->vm_file->f_dentry->d_inode->i_size;
			do_munmap(mm, vma->vm_start, vma->vm_end - vma->vm_start);
			/*
			 * We discovered the size of the shm segment, so
			 * break out of here and fall through to the next
			 * loop that uses the size information to stop
			 * searching for matching vma's.
			 */
			retval = 0;
			vma = next;
			break;
		}
		vma = next;
	}

	/*
	 * We need look no further than the maximum address a fragment
	 * could possibly have landed at. Also cast things to loff_t to
	 * prevent overflows and make comparisons vs. equal-width types.
	 */
	while (vma && (loff_t)(vma->vm_end - addr) <= size) {
		next = vma->vm_next;

		/* finding a matching vma now does not alter retval */
		if ((vma->vm_ops == &shm_vm_ops || is_vm_hugetlb_page(vma)) &&
			(vma->vm_start - addr)/PAGE_SIZE == vma->vm_pgoff)

			do_munmap(mm, vma->vm_start, vma->vm_end - vma->vm_start);
		vma = next;
	}

	up_write(&mm->mmap_sem);
	return retval;
}

#ifdef CONFIG_PROC_FS
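/*
 * /proc/sysvipc/shm: print one line per existing segment, using the wider
 * size column when size_t is larger than int.
 */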
static int sysvipc_shm_read_proc(char *buffer, char **start, off_t offset, int length, int *eof, void *data)
{
	off_t pos = 0;
	off_t begin = 0;
	int i, len = 0;

	down(&shm_ids.sem);
	len += sprintf(buffer, "       key      shmid perms       size  cpid  lpid nattch   uid   gid  cuid  cgid      atime      dtime      ctime\n");

	for(i = 0; i <= shm_ids.max_id; i++) {
		struct shmid_kernel* shp;

		shp = shm_lock(i);
		if(shp!=NULL) {
#define SMALL_STRING "%10d %10d  %4o %10u %5u %5u  %5d %5u %5u %5u %5u %10lu %10lu %10lu\n"
#define BIG_STRING   "%10d %10d  %4o %21u %5u %5u  %5d %5u %5u %5u %5u %10lu %10lu %10lu\n"
			char *format;

			if (sizeof(size_t) <= sizeof(int))
				format = SMALL_STRING;
			else
				format = BIG_STRING;
			len += sprintf(buffer + len, format,
				shp->shm_perm.key,
				shm_buildid(i, shp->shm_perm.seq),
				shp->shm_flags,
				shp->shm_segsz,
				shp->shm_cprid,
				shp->shm_lprid,
				is_file_hugepages(shp->shm_file) ? (file_count(shp->shm_file) - 1) : shp->shm_nattch,
				shp->shm_perm.uid,
				shp->shm_perm.gid,
				shp->shm_perm.cuid,
				shp->shm_perm.cgid,
				shp->shm_atim,
				shp->shm_dtim,
				shp->shm_ctim);
			shm_unlock(shp);
			pos += len;
			if(pos < offset) {
				len = 0;
				begin = pos;
			}
			if(pos > offset + length)
				goto done;
		}
	}
	*eof = 1;
done:
	up(&shm_ids.sem);
	*start = buffer + (offset - begin);
	len -= (offset - begin);
	if(len > length)
		len = length;
	if(len < 0)
		len = 0;
	return len;
}
#endif