vmalloc.c

/*
 *  linux/mm/vmalloc.c
 *
 *  Copyright (C) 1993  Linus Torvalds
 *  Support of BIGMEM added by Gerhard Wichert, Siemens AG, July 1999
 *  SMP-safe vmalloc/vfree/ioremap, Tigran Aivazian <tigran@veritas.com>, May 2000
 *  Major rework to support vmap/vunmap, Christoph Hellwig, SGI, August 2002
 *  Numa awareness, Christoph Lameter, SGI, June 2005
 */

#include <linux/mm.h>
#include <linux/module.h>
#include <linux/highmem.h>
#include <linux/slab.h>
#include <linux/spinlock.h>
#include <linux/interrupt.h>

#include <linux/vmalloc.h>

#include <asm/uaccess.h>
#include <asm/tlbflush.h>

DEFINE_RWLOCK(vmlist_lock);
struct vm_struct *vmlist;

static void *__vmalloc_node(unsigned long size, gfp_t gfp_mask, pgprot_t prot,
			    int node);
static void vunmap_pte_range(pmd_t *pmd, unsigned long addr, unsigned long end)
{
	pte_t *pte;

	pte = pte_offset_kernel(pmd, addr);
	do {
		pte_t ptent = ptep_get_and_clear(&init_mm, addr, pte);
		WARN_ON(!pte_none(ptent) && !pte_present(ptent));
	} while (pte++, addr += PAGE_SIZE, addr != end);
}

static inline void vunmap_pmd_range(pud_t *pud, unsigned long addr,
				    unsigned long end)
{
	pmd_t *pmd;
	unsigned long next;

	pmd = pmd_offset(pud, addr);
	do {
		next = pmd_addr_end(addr, end);
		if (pmd_none_or_clear_bad(pmd))
			continue;
		vunmap_pte_range(pmd, addr, next);
	} while (pmd++, addr = next, addr != end);
}

static inline void vunmap_pud_range(pgd_t *pgd, unsigned long addr,
				    unsigned long end)
{
	pud_t *pud;
	unsigned long next;

	pud = pud_offset(pgd, addr);
	do {
		next = pud_addr_end(addr, end);
		if (pud_none_or_clear_bad(pud))
			continue;
		vunmap_pmd_range(pud, addr, next);
	} while (pud++, addr = next, addr != end);
}

void unmap_vm_area(struct vm_struct *area)
{
	pgd_t *pgd;
	unsigned long next;
	unsigned long addr = (unsigned long) area->addr;
	unsigned long end = addr + area->size;

	BUG_ON(addr >= end);
	pgd = pgd_offset_k(addr);
	flush_cache_vunmap(addr, end);
	do {
		next = pgd_addr_end(addr, end);
		if (pgd_none_or_clear_bad(pgd))
			continue;
		vunmap_pud_range(pgd, addr, next);
	} while (pgd++, addr = next, addr != end);
	flush_tlb_kernel_range((unsigned long) area->addr, end);
}
static int vmap_pte_range(pmd_t *pmd, unsigned long addr,
			  unsigned long end, pgprot_t prot, struct page ***pages)
{
	pte_t *pte;

	pte = pte_alloc_kernel(pmd, addr);
	if (!pte)
		return -ENOMEM;
	do {
		struct page *page = **pages;
		WARN_ON(!pte_none(*pte));
		if (!page)
			return -ENOMEM;
		set_pte_at(&init_mm, addr, pte, mk_pte(page, prot));
		(*pages)++;
	} while (pte++, addr += PAGE_SIZE, addr != end);
	return 0;
}

static inline int vmap_pmd_range(pud_t *pud, unsigned long addr,
				 unsigned long end, pgprot_t prot, struct page ***pages)
{
	pmd_t *pmd;
	unsigned long next;

	pmd = pmd_alloc(&init_mm, pud, addr);
	if (!pmd)
		return -ENOMEM;
	do {
		next = pmd_addr_end(addr, end);
		if (vmap_pte_range(pmd, addr, next, prot, pages))
			return -ENOMEM;
	} while (pmd++, addr = next, addr != end);
	return 0;
}

static inline int vmap_pud_range(pgd_t *pgd, unsigned long addr,
				 unsigned long end, pgprot_t prot, struct page ***pages)
{
	pud_t *pud;
	unsigned long next;

	pud = pud_alloc(&init_mm, pgd, addr);
	if (!pud)
		return -ENOMEM;
	do {
		next = pud_addr_end(addr, end);
		if (vmap_pmd_range(pud, addr, next, prot, pages))
			return -ENOMEM;
	} while (pud++, addr = next, addr != end);
	return 0;
}

int map_vm_area(struct vm_struct *area, pgprot_t prot, struct page ***pages)
{
	pgd_t *pgd;
	unsigned long next;
	unsigned long addr = (unsigned long) area->addr;
	unsigned long end = addr + area->size - PAGE_SIZE;
	int err;

	BUG_ON(addr >= end);
	pgd = pgd_offset_k(addr);
	do {
		next = pgd_addr_end(addr, end);
		err = vmap_pud_range(pgd, addr, next, prot, pages);
		if (err)
			break;
	} while (pgd++, addr = next, addr != end);
	flush_cache_vmap((unsigned long) area->addr, end);
	return err;
}
static struct vm_struct *__get_vm_area_node(unsigned long size, unsigned long flags,
					    unsigned long start, unsigned long end,
					    int node, gfp_t gfp_mask)
{
	struct vm_struct **p, *tmp, *area;
	unsigned long align = 1;
	unsigned long addr;

	BUG_ON(in_interrupt());
	if (flags & VM_IOREMAP) {
		int bit = fls(size);

		if (bit > IOREMAP_MAX_ORDER)
			bit = IOREMAP_MAX_ORDER;
		else if (bit < PAGE_SHIFT)
			bit = PAGE_SHIFT;

		align = 1ul << bit;
	}
	addr = ALIGN(start, align);
	size = PAGE_ALIGN(size);

	area = kmalloc_node(sizeof(*area), gfp_mask & GFP_LEVEL_MASK, node);
	if (unlikely(!area))
		return NULL;

	if (unlikely(!size)) {
		kfree(area);
		return NULL;
	}

	/*
	 * We always allocate a guard page.
	 */
	size += PAGE_SIZE;

	write_lock(&vmlist_lock);
	for (p = &vmlist; (tmp = *p) != NULL; p = &tmp->next) {
		if ((unsigned long)tmp->addr < addr) {
			if ((unsigned long)tmp->addr + tmp->size >= addr)
				addr = ALIGN(tmp->size +
					     (unsigned long)tmp->addr, align);
			continue;
		}
		if ((size + addr) < addr)
			goto out;
		if (size + addr <= (unsigned long)tmp->addr)
			goto found;
		addr = ALIGN(tmp->size + (unsigned long)tmp->addr, align);
		if (addr > end - size)
			goto out;
	}

found:
	area->next = *p;
	*p = area;

	area->flags = flags;
	area->addr = (void *)addr;
	area->size = size;
	area->pages = NULL;
	area->nr_pages = 0;
	area->phys_addr = 0;
	write_unlock(&vmlist_lock);

	return area;

out:
	write_unlock(&vmlist_lock);
	kfree(area);
	if (printk_ratelimit())
		printk(KERN_WARNING "allocation failed: out of vmalloc space - use vmalloc=<size> to increase size.\n");
	return NULL;
}

struct vm_struct *__get_vm_area(unsigned long size, unsigned long flags,
				unsigned long start, unsigned long end)
{
	return __get_vm_area_node(size, flags, start, end, -1, GFP_KERNEL);
}
/**
 * get_vm_area - reserve a contiguous kernel virtual area
 * @size: size of the area
 * @flags: %VM_IOREMAP for I/O mappings or VM_ALLOC
 *
 * Search an area of @size in the kernel virtual mapping area,
 * and reserve it for our purposes.  Returns the area descriptor
 * on success or %NULL on failure.
 */
struct vm_struct *get_vm_area(unsigned long size, unsigned long flags)
{
	return __get_vm_area(size, flags, VMALLOC_START, VMALLOC_END);
}

struct vm_struct *get_vm_area_node(unsigned long size, unsigned long flags,
				   int node, gfp_t gfp_mask)
{
	return __get_vm_area_node(size, flags, VMALLOC_START, VMALLOC_END, node,
				  gfp_mask);
}
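
/*
 * Illustrative sketch (not part of the original file): a typical consumer
 * of get_vm_area() is an ioremap()-style primitive, which reserves a
 * VM_IOREMAP area here and releases it again with remove_vm_area() plus
 * kfree() on its error path.  The helper name below is hypothetical and
 * only shows the reserve/release bracket under that assumption.
 */
static inline void *example_reserve_io_window(unsigned long size)
{
	struct vm_struct *area;

	area = get_vm_area(size, VM_IOREMAP);	/* reserve virtual space only */
	if (!area)
		return NULL;

	/*
	 * A real caller would now install page table entries covering
	 * area->addr (e.g. via map_vm_area() or arch helpers) and, on
	 * failure, undo the reservation:
	 *
	 *	remove_vm_area(area->addr);
	 *	kfree(area);
	 */
	return area->addr;
}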
/* Caller must hold vmlist_lock */
static struct vm_struct *__find_vm_area(void *addr)
{
	struct vm_struct *tmp;

	for (tmp = vmlist; tmp != NULL; tmp = tmp->next) {
		if (tmp->addr == addr)
			break;
	}

	return tmp;
}

/* Caller must hold vmlist_lock */
static struct vm_struct *__remove_vm_area(void *addr)
{
	struct vm_struct **p, *tmp;

	for (p = &vmlist; (tmp = *p) != NULL; p = &tmp->next) {
		if (tmp->addr == addr)
			goto found;
	}
	return NULL;

found:
	unmap_vm_area(tmp);
	*p = tmp->next;

	/*
	 * Remove the guard page.
	 */
	tmp->size -= PAGE_SIZE;
	return tmp;
}
/**
 * remove_vm_area - find and remove a contiguous kernel virtual area
 * @addr: base address
 *
 * Search for the kernel VM area starting at @addr, and remove it.
 * This function returns the found VM area, but using it is NOT safe
 * on SMP machines, except for its size or flags.
 */
struct vm_struct *remove_vm_area(void *addr)
{
	struct vm_struct *v;

	write_lock(&vmlist_lock);
	v = __remove_vm_area(addr);
	write_unlock(&vmlist_lock);
	return v;
}

void __vunmap(void *addr, int deallocate_pages)
{
	struct vm_struct *area;

	if (!addr)
		return;

	if ((PAGE_SIZE-1) & (unsigned long)addr) {
		printk(KERN_ERR "Trying to vfree() bad address (%p)\n", addr);
		WARN_ON(1);
		return;
	}

	area = remove_vm_area(addr);
	if (unlikely(!area)) {
		printk(KERN_ERR "Trying to vfree() nonexistent vm area (%p)\n",
				addr);
		WARN_ON(1);
		return;
	}

	debug_check_no_locks_freed(addr, area->size);

	if (deallocate_pages) {
		int i;

		for (i = 0; i < area->nr_pages; i++) {
			BUG_ON(!area->pages[i]);
			__free_page(area->pages[i]);
		}

		if (area->flags & VM_VPAGES)
			vfree(area->pages);
		else
			kfree(area->pages);
	}

	kfree(area);
	return;
}
/**
 * vfree - release memory allocated by vmalloc()
 * @addr: memory base address
 *
 * Free the virtually contiguous memory area starting at @addr, as
 * obtained from vmalloc(), vmalloc_32() or __vmalloc().  If @addr is
 * NULL, no operation is performed.
 *
 * Must not be called in interrupt context.
 */
void vfree(void *addr)
{
	BUG_ON(in_interrupt());
	__vunmap(addr, 1);
}
EXPORT_SYMBOL(vfree);

/**
 * vunmap - release virtual mapping obtained by vmap()
 * @addr: memory base address
 *
 * Free the virtually contiguous memory area starting at @addr,
 * which was created from the page array passed to vmap().
 *
 * Must not be called in interrupt context.
 */
void vunmap(void *addr)
{
	BUG_ON(in_interrupt());
	__vunmap(addr, 0);
}
EXPORT_SYMBOL(vunmap);
/**
 * vmap - map an array of pages into virtually contiguous space
 * @pages: array of page pointers
 * @count: number of pages to map
 * @flags: vm_area->flags
 * @prot: page protection for the mapping
 *
 * Maps @count pages from @pages into contiguous kernel virtual
 * space.
 */
void *vmap(struct page **pages, unsigned int count,
	   unsigned long flags, pgprot_t prot)
{
	struct vm_struct *area;

	if (count > num_physpages)
		return NULL;

	area = get_vm_area((count << PAGE_SHIFT), flags);
	if (!area)
		return NULL;
	if (map_vm_area(area, prot, &pages)) {
		vunmap(area->addr);
		return NULL;
	}

	return area->addr;
}
EXPORT_SYMBOL(vmap);
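
/*
 * Illustrative sketch (not part of the original file): mapping a page
 * array the caller already owns with vmap() and tearing the mapping
 * down again with vunmap().  The helper names are hypothetical; VM_MAP
 * simply marks the area as a plain vmap()ed region.
 */
static inline void *example_map_buffer(struct page **pages, unsigned int count)
{
	/* Map the caller's pages read/write in kernel space. */
	return vmap(pages, count, VM_MAP, PAGE_KERNEL);
}

static inline void example_unmap_buffer(void *vaddr)
{
	/* Releases only the virtual mapping; the pages stay allocated. */
	vunmap(vaddr);
}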
void *__vmalloc_area_node(struct vm_struct *area, gfp_t gfp_mask,
			  pgprot_t prot, int node)
{
	struct page **pages;
	unsigned int nr_pages, array_size, i;

	nr_pages = (area->size - PAGE_SIZE) >> PAGE_SHIFT;
	array_size = (nr_pages * sizeof(struct page *));

	area->nr_pages = nr_pages;
	/* Please note that the recursion is strictly bounded. */
	if (array_size > PAGE_SIZE) {
		pages = __vmalloc_node(array_size, gfp_mask, PAGE_KERNEL, node);
		area->flags |= VM_VPAGES;
	} else {
		pages = kmalloc_node(array_size,
				     (gfp_mask & ~(__GFP_HIGHMEM | __GFP_ZERO)),
				     node);
	}
	area->pages = pages;
	if (!area->pages) {
		remove_vm_area(area->addr);
		kfree(area);
		return NULL;
	}
	memset(area->pages, 0, array_size);

	for (i = 0; i < area->nr_pages; i++) {
		if (node < 0)
			area->pages[i] = alloc_page(gfp_mask);
		else
			area->pages[i] = alloc_pages_node(node, gfp_mask, 0);
		if (unlikely(!area->pages[i])) {
			/* Successfully allocated i pages, free them in __vunmap() */
			area->nr_pages = i;
			goto fail;
		}
	}

	if (map_vm_area(area, prot, &pages))
		goto fail;
	return area->addr;

fail:
	vfree(area->addr);
	return NULL;
}

void *__vmalloc_area(struct vm_struct *area, gfp_t gfp_mask, pgprot_t prot)
{
	return __vmalloc_area_node(area, gfp_mask, prot, -1);
}

/**
 * __vmalloc_node - allocate virtually contiguous memory
 * @size: allocation size
 * @gfp_mask: flags for the page level allocator
 * @prot: protection mask for the allocated pages
 * @node: node to use for allocation or -1
 *
 * Allocate enough pages to cover @size from the page level
 * allocator with @gfp_mask flags.  Map them into contiguous
 * kernel virtual space, using a pagetable protection of @prot.
 */
static void *__vmalloc_node(unsigned long size, gfp_t gfp_mask, pgprot_t prot,
			    int node)
{
	struct vm_struct *area;

	size = PAGE_ALIGN(size);
	if (!size || (size >> PAGE_SHIFT) > num_physpages)
		return NULL;

	area = get_vm_area_node(size, VM_ALLOC, node, gfp_mask);
	if (!area)
		return NULL;

	return __vmalloc_area_node(area, gfp_mask, prot, node);
}

void *__vmalloc(unsigned long size, gfp_t gfp_mask, pgprot_t prot)
{
	return __vmalloc_node(size, gfp_mask, prot, -1);
}
EXPORT_SYMBOL(__vmalloc);
/**
 * vmalloc - allocate virtually contiguous memory
 * @size: allocation size
 *
 * Allocate enough pages to cover @size from the page level
 * allocator and map them into contiguous kernel virtual space.
 *
 * For tight control over page level allocator and protection flags
 * use __vmalloc() instead.
 */
void *vmalloc(unsigned long size)
{
	return __vmalloc(size, GFP_KERNEL | __GFP_HIGHMEM, PAGE_KERNEL);
}
EXPORT_SYMBOL(vmalloc);
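
/*
 * Illustrative sketch (not part of the original file): vmalloc() is the
 * usual choice for a large, virtually contiguous buffer that need not be
 * physically contiguous; vfree() later releases both the pages and the
 * virtual area.  The helper name is hypothetical.
 */
static inline int *example_alloc_table(unsigned long nr_entries)
{
	int *table;

	table = vmalloc(nr_entries * sizeof(*table));
	if (!table)
		return NULL;
	memset(table, 0, nr_entries * sizeof(*table));
	/* ... the owner uses the table and eventually calls vfree(table). */
	return table;
}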
/**
 * vmalloc_user - allocate zeroed virtually contiguous memory for userspace
 * @size: allocation size
 *
 * The resulting memory area is zeroed so it can be mapped to userspace
 * without leaking data.
 */
void *vmalloc_user(unsigned long size)
{
	struct vm_struct *area;
	void *ret;

	ret = __vmalloc(size, GFP_KERNEL | __GFP_HIGHMEM | __GFP_ZERO, PAGE_KERNEL);
	write_lock(&vmlist_lock);
	area = __find_vm_area(ret);
	area->flags |= VM_USERMAP;
	write_unlock(&vmlist_lock);

	return ret;
}
EXPORT_SYMBOL(vmalloc_user);

/**
 * vmalloc_node - allocate memory on a specific node
 * @size: allocation size
 * @node: numa node
 *
 * Allocate enough pages to cover @size from the page level
 * allocator and map them into contiguous kernel virtual space.
 *
 * For tight control over page level allocator and protection flags
 * use __vmalloc() instead.
 */
void *vmalloc_node(unsigned long size, int node)
{
	return __vmalloc_node(size, GFP_KERNEL | __GFP_HIGHMEM, PAGE_KERNEL, node);
}
EXPORT_SYMBOL(vmalloc_node);
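
/*
 * Illustrative sketch (not part of the original file): vmalloc_node()
 * lets per-node data live in memory local to that node.  The loop and
 * helper name below are hypothetical and simply allocate one buffer per
 * online node.
 */
static inline void example_alloc_per_node(void *buf[], unsigned long size)
{
	int node;

	for_each_online_node(node)
		buf[node] = vmalloc_node(size, node);
}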
#ifndef PAGE_KERNEL_EXEC
# define PAGE_KERNEL_EXEC PAGE_KERNEL
#endif
/**
 * vmalloc_exec - allocate virtually contiguous, executable memory
 * @size: allocation size
 *
 * Kernel-internal function to allocate enough pages to cover @size
 * from the page level allocator and map them into contiguous and
 * executable kernel virtual space.
 *
 * For tight control over page level allocator and protection flags
 * use __vmalloc() instead.
 */
void *vmalloc_exec(unsigned long size)
{
	return __vmalloc(size, GFP_KERNEL | __GFP_HIGHMEM, PAGE_KERNEL_EXEC);
}

/**
 * vmalloc_32 - allocate virtually contiguous memory (32bit addressable)
 * @size: allocation size
 *
 * Allocate enough 32bit PA addressable pages to cover @size from the
 * page level allocator and map them into contiguous kernel virtual space.
 */
void *vmalloc_32(unsigned long size)
{
	return __vmalloc(size, GFP_KERNEL, PAGE_KERNEL);
}
EXPORT_SYMBOL(vmalloc_32);

/**
 * vmalloc_32_user - allocate zeroed virtually contiguous 32bit memory
 * @size: allocation size
 *
 * The resulting memory area is 32bit addressable and zeroed so it can be
 * mapped to userspace without leaking data.
 */
void *vmalloc_32_user(unsigned long size)
{
	struct vm_struct *area;
	void *ret;

	ret = __vmalloc(size, GFP_KERNEL | __GFP_ZERO, PAGE_KERNEL);
	write_lock(&vmlist_lock);
	area = __find_vm_area(ret);
	area->flags |= VM_USERMAP;
	write_unlock(&vmlist_lock);

	return ret;
}
EXPORT_SYMBOL(vmalloc_32_user);
long vread(char *buf, char *addr, unsigned long count)
{
	struct vm_struct *tmp;
	char *vaddr, *buf_start = buf;
	unsigned long n;

	/* Don't allow overflow */
	if ((unsigned long) addr + count < count)
		count = -(unsigned long) addr;

	read_lock(&vmlist_lock);
	for (tmp = vmlist; tmp; tmp = tmp->next) {
		vaddr = (char *) tmp->addr;
		if (addr >= vaddr + tmp->size - PAGE_SIZE)
			continue;
		while (addr < vaddr) {
			if (count == 0)
				goto finished;
			*buf = '\0';
			buf++;
			addr++;
			count--;
		}
		n = vaddr + tmp->size - PAGE_SIZE - addr;
		do {
			if (count == 0)
				goto finished;
			*buf = *addr;
			buf++;
			addr++;
			count--;
		} while (--n > 0);
	}
finished:
	read_unlock(&vmlist_lock);
	return buf - buf_start;
}

long vwrite(char *buf, char *addr, unsigned long count)
{
	struct vm_struct *tmp;
	char *vaddr, *buf_start = buf;
	unsigned long n;

	/* Don't allow overflow */
	if ((unsigned long) addr + count < count)
		count = -(unsigned long) addr;

	read_lock(&vmlist_lock);
	for (tmp = vmlist; tmp; tmp = tmp->next) {
		vaddr = (char *) tmp->addr;
		if (addr >= vaddr + tmp->size - PAGE_SIZE)
			continue;
		while (addr < vaddr) {
			if (count == 0)
				goto finished;
			buf++;
			addr++;
			count--;
		}
		n = vaddr + tmp->size - PAGE_SIZE - addr;
		do {
			if (count == 0)
				goto finished;
			*addr = *buf;
			buf++;
			addr++;
			count--;
		} while (--n > 0);
	}
finished:
	read_unlock(&vmlist_lock);
	return buf - buf_start;
}
/**
 * remap_vmalloc_range - map vmalloc pages to userspace
 * @vma: vma to cover (map full range of vma)
 * @addr: vmalloc memory
 * @pgoff: number of pages into addr before first page to map
 * @returns: 0 for success, -Exxx on failure
 *
 * This function checks that addr is a valid vmalloc'ed area, and
 * that it is big enough to cover the vma.  Will return failure if
 * those criteria aren't met.
 *
 * Similar to remap_pfn_range() (see mm/memory.c)
 */
int remap_vmalloc_range(struct vm_area_struct *vma, void *addr,
			unsigned long pgoff)
{
	struct vm_struct *area;
	unsigned long uaddr = vma->vm_start;
	unsigned long usize = vma->vm_end - vma->vm_start;
	int ret;

	if ((PAGE_SIZE-1) & (unsigned long)addr)
		return -EINVAL;

	read_lock(&vmlist_lock);
	area = __find_vm_area(addr);
	if (!area)
		goto out_einval_locked;

	if (!(area->flags & VM_USERMAP))
		goto out_einval_locked;

	if (usize + (pgoff << PAGE_SHIFT) > area->size - PAGE_SIZE)
		goto out_einval_locked;
	read_unlock(&vmlist_lock);

	addr += pgoff << PAGE_SHIFT;
	do {
		struct page *page = vmalloc_to_page(addr);
		ret = vm_insert_page(vma, uaddr, page);
		if (ret)
			return ret;

		uaddr += PAGE_SIZE;
		addr += PAGE_SIZE;
		usize -= PAGE_SIZE;
	} while (usize > 0);

	/* Prevent "things" like memory migration? VM_flags need a cleanup... */
	vma->vm_flags |= VM_RESERVED;

	return ret;

out_einval_locked:
	read_unlock(&vmlist_lock);
	return -EINVAL;
}
EXPORT_SYMBOL(remap_vmalloc_range);
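
/*
 * Illustrative sketch (not part of the original file): the intended
 * pairing for remap_vmalloc_range() is a buffer obtained from
 * vmalloc_user() (or vmalloc_32_user()), which is zeroed and flagged
 * VM_USERMAP, exported to userspace through a driver's ->mmap() handler.
 * The structure and function names below are hypothetical.
 */
struct example_dev {
	void *ring;			/* from vmalloc_user() */
	unsigned long ring_size;	/* multiple of PAGE_SIZE */
};

static inline int example_mmap(struct example_dev *dev,
			       struct vm_area_struct *vma)
{
	/* Map the whole buffer starting at page offset 0 of the vma. */
	return remap_vmalloc_range(vma, dev->ring, 0);
}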