dmapool.c 10 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422
  1. #include <linux/device.h>
  2. #include <linux/mm.h>
  3. #include <asm/io.h> /* Needed for i386 to build */
  4. #include <asm/scatterlist.h> /* Needed for i386 to build */
  5. #include <linux/dma-mapping.h>
  6. #include <linux/dmapool.h>
  7. #include <linux/slab.h>
  8. #include <linux/module.h>
  9. #include <linux/poison.h>
  10. /*
  11. * Pool allocator ... wraps the dma_alloc_coherent page allocator, so
  12. * small blocks are easily used by drivers for bus mastering controllers.
  13. * This should probably be sharing the guts of the slab allocator.
  14. */
  15. struct dma_pool { /* the pool */
  16. struct list_head page_list;
  17. spinlock_t lock;
  18. size_t blocks_per_page;
  19. size_t size;
  20. struct device *dev;
  21. size_t allocation;
  22. char name [32];
  23. wait_queue_head_t waitq;
  24. struct list_head pools;
  25. };
  26. struct dma_page { /* cacheable header for 'allocation' bytes */
  27. struct list_head page_list;
  28. void *vaddr;
  29. dma_addr_t dma;
  30. unsigned in_use;
  31. unsigned long bitmap [0];
  32. };
  33. #define POOL_TIMEOUT_JIFFIES ((100 /* msec */ * HZ) / 1000)
  34. static DECLARE_MUTEX (pools_lock);
  35. static ssize_t
  36. show_pools (struct device *dev, struct device_attribute *attr, char *buf)
  37. {
  38. unsigned temp;
  39. unsigned size;
  40. char *next;
  41. struct dma_page *page;
  42. struct dma_pool *pool;
  43. next = buf;
  44. size = PAGE_SIZE;
  45. temp = scnprintf(next, size, "poolinfo - 0.1\n");
  46. size -= temp;
  47. next += temp;
  48. down (&pools_lock);
  49. list_for_each_entry(pool, &dev->dma_pools, pools) {
  50. unsigned pages = 0;
  51. unsigned blocks = 0;
  52. list_for_each_entry(page, &pool->page_list, page_list) {
  53. pages++;
  54. blocks += page->in_use;
  55. }
  56. /* per-pool info, no real statistics yet */
  57. temp = scnprintf(next, size, "%-16s %4u %4Zu %4Zu %2u\n",
  58. pool->name,
  59. blocks, pages * pool->blocks_per_page,
  60. pool->size, pages);
  61. size -= temp;
  62. next += temp;
  63. }
  64. up (&pools_lock);
  65. return PAGE_SIZE - size;
  66. }
  67. static DEVICE_ATTR (pools, S_IRUGO, show_pools, NULL);
  68. /**
  69. * dma_pool_create - Creates a pool of consistent memory blocks, for dma.
  70. * @name: name of pool, for diagnostics
  71. * @dev: device that will be doing the DMA
  72. * @size: size of the blocks in this pool.
  73. * @align: alignment requirement for blocks; must be a power of two
  74. * @allocation: returned blocks won't cross this boundary (or zero)
  75. * Context: !in_interrupt()
  76. *
  77. * Returns a dma allocation pool with the requested characteristics, or
  78. * null if one can't be created. Given one of these pools, dma_pool_alloc()
  79. * may be used to allocate memory. Such memory will all have "consistent"
  80. * DMA mappings, accessible by the device and its driver without using
  81. * cache flushing primitives. The actual size of blocks allocated may be
  82. * larger than requested because of alignment.
  83. *
  84. * If allocation is nonzero, objects returned from dma_pool_alloc() won't
  85. * cross that size boundary. This is useful for devices which have
  86. * addressing restrictions on individual DMA transfers, such as not crossing
  87. * boundaries of 4KBytes.
  88. */
  89. struct dma_pool *
  90. dma_pool_create (const char *name, struct device *dev,
  91. size_t size, size_t align, size_t allocation)
  92. {
  93. struct dma_pool *retval;
  94. if (align == 0)
  95. align = 1;
  96. if (size == 0)
  97. return NULL;
  98. else if (size < align)
  99. size = align;
  100. else if ((size % align) != 0) {
  101. size += align + 1;
  102. size &= ~(align - 1);
  103. }
  104. if (allocation == 0) {
  105. if (PAGE_SIZE < size)
  106. allocation = size;
  107. else
  108. allocation = PAGE_SIZE;
  109. // FIXME: round up for less fragmentation
  110. } else if (allocation < size)
  111. return NULL;
  112. if (!(retval = kmalloc (sizeof *retval, SLAB_KERNEL)))
  113. return retval;
  114. strlcpy (retval->name, name, sizeof retval->name);
  115. retval->dev = dev;
  116. INIT_LIST_HEAD (&retval->page_list);
  117. spin_lock_init (&retval->lock);
  118. retval->size = size;
  119. retval->allocation = allocation;
  120. retval->blocks_per_page = allocation / size;
  121. init_waitqueue_head (&retval->waitq);
  122. if (dev) {
  123. int ret;
  124. down (&pools_lock);
  125. if (list_empty (&dev->dma_pools))
  126. ret = device_create_file (dev, &dev_attr_pools);
  127. else
  128. ret = 0;
  129. /* note: not currently insisting "name" be unique */
  130. if (!ret)
  131. list_add (&retval->pools, &dev->dma_pools);
  132. else {
  133. kfree(retval);
  134. retval = NULL;
  135. }
  136. up (&pools_lock);
  137. } else
  138. INIT_LIST_HEAD (&retval->pools);
  139. return retval;
  140. }
  141. static struct dma_page *
  142. pool_alloc_page (struct dma_pool *pool, gfp_t mem_flags)
  143. {
  144. struct dma_page *page;
  145. int mapsize;
  146. mapsize = pool->blocks_per_page;
  147. mapsize = (mapsize + BITS_PER_LONG - 1) / BITS_PER_LONG;
  148. mapsize *= sizeof (long);
  149. page = (struct dma_page *) kmalloc (mapsize + sizeof *page, mem_flags);
  150. if (!page)
  151. return NULL;
  152. page->vaddr = dma_alloc_coherent (pool->dev,
  153. pool->allocation,
  154. &page->dma,
  155. mem_flags);
  156. if (page->vaddr) {
  157. memset (page->bitmap, 0xff, mapsize); // bit set == free
  158. #ifdef CONFIG_DEBUG_SLAB
  159. memset (page->vaddr, POOL_POISON_FREED, pool->allocation);
  160. #endif
  161. list_add (&page->page_list, &pool->page_list);
  162. page->in_use = 0;
  163. } else {
  164. kfree (page);
  165. page = NULL;
  166. }
  167. return page;
  168. }
  169. static inline int
  170. is_page_busy (int blocks, unsigned long *bitmap)
  171. {
  172. while (blocks > 0) {
  173. if (*bitmap++ != ~0UL)
  174. return 1;
  175. blocks -= BITS_PER_LONG;
  176. }
  177. return 0;
  178. }
  179. static void
  180. pool_free_page (struct dma_pool *pool, struct dma_page *page)
  181. {
  182. dma_addr_t dma = page->dma;
  183. #ifdef CONFIG_DEBUG_SLAB
  184. memset (page->vaddr, POOL_POISON_FREED, pool->allocation);
  185. #endif
  186. dma_free_coherent (pool->dev, pool->allocation, page->vaddr, dma);
  187. list_del (&page->page_list);
  188. kfree (page);
  189. }
  190. /**
  191. * dma_pool_destroy - destroys a pool of dma memory blocks.
  192. * @pool: dma pool that will be destroyed
  193. * Context: !in_interrupt()
  194. *
  195. * Caller guarantees that no more memory from the pool is in use,
  196. * and that nothing will try to use the pool after this call.
  197. */
  198. void
  199. dma_pool_destroy (struct dma_pool *pool)
  200. {
  201. down (&pools_lock);
  202. list_del (&pool->pools);
  203. if (pool->dev && list_empty (&pool->dev->dma_pools))
  204. device_remove_file (pool->dev, &dev_attr_pools);
  205. up (&pools_lock);
  206. while (!list_empty (&pool->page_list)) {
  207. struct dma_page *page;
  208. page = list_entry (pool->page_list.next,
  209. struct dma_page, page_list);
  210. if (is_page_busy (pool->blocks_per_page, page->bitmap)) {
  211. if (pool->dev)
  212. dev_err(pool->dev, "dma_pool_destroy %s, %p busy\n",
  213. pool->name, page->vaddr);
  214. else
  215. printk (KERN_ERR "dma_pool_destroy %s, %p busy\n",
  216. pool->name, page->vaddr);
  217. /* leak the still-in-use consistent memory */
  218. list_del (&page->page_list);
  219. kfree (page);
  220. } else
  221. pool_free_page (pool, page);
  222. }
  223. kfree (pool);
  224. }
  225. /**
  226. * dma_pool_alloc - get a block of consistent memory
  227. * @pool: dma pool that will produce the block
  228. * @mem_flags: GFP_* bitmask
  229. * @handle: pointer to dma address of block
  230. *
  231. * This returns the kernel virtual address of a currently unused block,
  232. * and reports its dma address through the handle.
  233. * If such a memory block can't be allocated, null is returned.
  234. */
  235. void *
  236. dma_pool_alloc (struct dma_pool *pool, gfp_t mem_flags, dma_addr_t *handle)
  237. {
  238. unsigned long flags;
  239. struct dma_page *page;
  240. int map, block;
  241. size_t offset;
  242. void *retval;
  243. restart:
  244. spin_lock_irqsave (&pool->lock, flags);
  245. list_for_each_entry(page, &pool->page_list, page_list) {
  246. int i;
  247. /* only cachable accesses here ... */
  248. for (map = 0, i = 0;
  249. i < pool->blocks_per_page;
  250. i += BITS_PER_LONG, map++) {
  251. if (page->bitmap [map] == 0)
  252. continue;
  253. block = ffz (~ page->bitmap [map]);
  254. if ((i + block) < pool->blocks_per_page) {
  255. clear_bit (block, &page->bitmap [map]);
  256. offset = (BITS_PER_LONG * map) + block;
  257. offset *= pool->size;
  258. goto ready;
  259. }
  260. }
  261. }
  262. if (!(page = pool_alloc_page (pool, SLAB_ATOMIC))) {
  263. if (mem_flags & __GFP_WAIT) {
  264. DECLARE_WAITQUEUE (wait, current);
  265. current->state = TASK_INTERRUPTIBLE;
  266. add_wait_queue (&pool->waitq, &wait);
  267. spin_unlock_irqrestore (&pool->lock, flags);
  268. schedule_timeout (POOL_TIMEOUT_JIFFIES);
  269. remove_wait_queue (&pool->waitq, &wait);
  270. goto restart;
  271. }
  272. retval = NULL;
  273. goto done;
  274. }
  275. clear_bit (0, &page->bitmap [0]);
  276. offset = 0;
  277. ready:
  278. page->in_use++;
  279. retval = offset + page->vaddr;
  280. *handle = offset + page->dma;
  281. #ifdef CONFIG_DEBUG_SLAB
  282. memset (retval, POOL_POISON_ALLOCATED, pool->size);
  283. #endif
  284. done:
  285. spin_unlock_irqrestore (&pool->lock, flags);
  286. return retval;
  287. }
  288. static struct dma_page *
  289. pool_find_page (struct dma_pool *pool, dma_addr_t dma)
  290. {
  291. unsigned long flags;
  292. struct dma_page *page;
  293. spin_lock_irqsave (&pool->lock, flags);
  294. list_for_each_entry(page, &pool->page_list, page_list) {
  295. if (dma < page->dma)
  296. continue;
  297. if (dma < (page->dma + pool->allocation))
  298. goto done;
  299. }
  300. page = NULL;
  301. done:
  302. spin_unlock_irqrestore (&pool->lock, flags);
  303. return page;
  304. }
  305. /**
  306. * dma_pool_free - put block back into dma pool
  307. * @pool: the dma pool holding the block
  308. * @vaddr: virtual address of block
  309. * @dma: dma address of block
  310. *
  311. * Caller promises neither device nor driver will again touch this block
  312. * unless it is first re-allocated.
  313. */
  314. void
  315. dma_pool_free (struct dma_pool *pool, void *vaddr, dma_addr_t dma)
  316. {
  317. struct dma_page *page;
  318. unsigned long flags;
  319. int map, block;
  320. if ((page = pool_find_page (pool, dma)) == 0) {
  321. if (pool->dev)
  322. dev_err(pool->dev, "dma_pool_free %s, %p/%lx (bad dma)\n",
  323. pool->name, vaddr, (unsigned long) dma);
  324. else
  325. printk (KERN_ERR "dma_pool_free %s, %p/%lx (bad dma)\n",
  326. pool->name, vaddr, (unsigned long) dma);
  327. return;
  328. }
  329. block = dma - page->dma;
  330. block /= pool->size;
  331. map = block / BITS_PER_LONG;
  332. block %= BITS_PER_LONG;
  333. #ifdef CONFIG_DEBUG_SLAB
  334. if (((dma - page->dma) + (void *)page->vaddr) != vaddr) {
  335. if (pool->dev)
  336. dev_err(pool->dev, "dma_pool_free %s, %p (bad vaddr)/%Lx\n",
  337. pool->name, vaddr, (unsigned long long) dma);
  338. else
  339. printk (KERN_ERR "dma_pool_free %s, %p (bad vaddr)/%Lx\n",
  340. pool->name, vaddr, (unsigned long long) dma);
  341. return;
  342. }
  343. if (page->bitmap [map] & (1UL << block)) {
  344. if (pool->dev)
  345. dev_err(pool->dev, "dma_pool_free %s, dma %Lx already free\n",
  346. pool->name, (unsigned long long)dma);
  347. else
  348. printk (KERN_ERR "dma_pool_free %s, dma %Lx already free\n",
  349. pool->name, (unsigned long long)dma);
  350. return;
  351. }
  352. memset (vaddr, POOL_POISON_FREED, pool->size);
  353. #endif
  354. spin_lock_irqsave (&pool->lock, flags);
  355. page->in_use--;
  356. set_bit (block, &page->bitmap [map]);
  357. if (waitqueue_active (&pool->waitq))
  358. wake_up (&pool->waitq);
  359. /*
  360. * Resist a temptation to do
  361. * if (!is_page_busy(bpp, page->bitmap)) pool_free_page(pool, page);
  362. * Better have a few empty pages hang around.
  363. */
  364. spin_unlock_irqrestore (&pool->lock, flags);
  365. }
  366. EXPORT_SYMBOL (dma_pool_create);
  367. EXPORT_SYMBOL (dma_pool_destroy);
  368. EXPORT_SYMBOL (dma_pool_alloc);
  369. EXPORT_SYMBOL (dma_pool_free);