ttm_bo_util.c 14 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560
  1. /**************************************************************************
  2. *
  3. * Copyright (c) 2007-2009 VMware, Inc., Palo Alto, CA., USA
  4. * All Rights Reserved.
  5. *
  6. * Permission is hereby granted, free of charge, to any person obtaining a
  7. * copy of this software and associated documentation files (the
  8. * "Software"), to deal in the Software without restriction, including
  9. * without limitation the rights to use, copy, modify, merge, publish,
  10. * distribute, sub license, and/or sell copies of the Software, and to
  11. * permit persons to whom the Software is furnished to do so, subject to
  12. * the following conditions:
  13. *
  14. * The above copyright notice and this permission notice (including the
  15. * next paragraph) shall be included in all copies or substantial portions
  16. * of the Software.
  17. *
  18. * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
  19. * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
  20. * FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL
  21. * THE COPYRIGHT HOLDERS, AUTHORS AND/OR ITS SUPPLIERS BE LIABLE FOR ANY CLAIM,
  22. * DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR
  23. * OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE
  24. * USE OR OTHER DEALINGS IN THE SOFTWARE.
  25. *
  26. **************************************************************************/
  27. /*
  28. * Authors: Thomas Hellstrom <thellstrom-at-vmware-dot-com>
  29. */
  30. #include "ttm/ttm_bo_driver.h"
  31. #include "ttm/ttm_placement.h"
  32. #include <linux/io.h>
  33. #include <linux/highmem.h>
  34. #include <linux/wait.h>
  35. #include <linux/vmalloc.h>
  36. #include <linux/module.h>
  37. void ttm_bo_free_old_node(struct ttm_buffer_object *bo)
  38. {
  39. struct ttm_mem_reg *old_mem = &bo->mem;
  40. if (old_mem->mm_node) {
  41. spin_lock(&bo->bdev->lru_lock);
  42. drm_mm_put_block(old_mem->mm_node);
  43. spin_unlock(&bo->bdev->lru_lock);
  44. }
  45. old_mem->mm_node = NULL;
  46. }
  47. int ttm_bo_move_ttm(struct ttm_buffer_object *bo,
  48. bool evict, bool no_wait, struct ttm_mem_reg *new_mem)
  49. {
  50. struct ttm_tt *ttm = bo->ttm;
  51. struct ttm_mem_reg *old_mem = &bo->mem;
  52. uint32_t save_flags = old_mem->placement;
  53. int ret;
  54. if (old_mem->mem_type != TTM_PL_SYSTEM) {
  55. ttm_tt_unbind(ttm);
  56. ttm_bo_free_old_node(bo);
  57. ttm_flag_masked(&old_mem->placement, TTM_PL_FLAG_SYSTEM,
  58. TTM_PL_MASK_MEM);
  59. old_mem->mem_type = TTM_PL_SYSTEM;
  60. save_flags = old_mem->placement;
  61. }
  62. ret = ttm_tt_set_placement_caching(ttm, new_mem->placement);
  63. if (unlikely(ret != 0))
  64. return ret;
  65. if (new_mem->mem_type != TTM_PL_SYSTEM) {
  66. ret = ttm_tt_bind(ttm, new_mem);
  67. if (unlikely(ret != 0))
  68. return ret;
  69. }
  70. *old_mem = *new_mem;
  71. new_mem->mm_node = NULL;
  72. ttm_flag_masked(&save_flags, new_mem->placement, TTM_PL_MASK_MEMTYPE);
  73. return 0;
  74. }
  75. EXPORT_SYMBOL(ttm_bo_move_ttm);
  76. int ttm_mem_reg_ioremap(struct ttm_bo_device *bdev, struct ttm_mem_reg *mem,
  77. void **virtual)
  78. {
  79. struct ttm_mem_type_manager *man = &bdev->man[mem->mem_type];
  80. unsigned long bus_offset;
  81. unsigned long bus_size;
  82. unsigned long bus_base;
  83. int ret;
  84. void *addr;
  85. *virtual = NULL;
  86. ret = ttm_bo_pci_offset(bdev, mem, &bus_base, &bus_offset, &bus_size);
  87. if (ret || bus_size == 0)
  88. return ret;
  89. if (!(man->flags & TTM_MEMTYPE_FLAG_NEEDS_IOREMAP))
  90. addr = (void *)(((u8 *) man->io_addr) + bus_offset);
  91. else {
  92. if (mem->placement & TTM_PL_FLAG_WC)
  93. addr = ioremap_wc(bus_base + bus_offset, bus_size);
  94. else
  95. addr = ioremap_nocache(bus_base + bus_offset, bus_size);
  96. if (!addr)
  97. return -ENOMEM;
  98. }
  99. *virtual = addr;
  100. return 0;
  101. }
  102. void ttm_mem_reg_iounmap(struct ttm_bo_device *bdev, struct ttm_mem_reg *mem,
  103. void *virtual)
  104. {
  105. struct ttm_mem_type_manager *man;
  106. man = &bdev->man[mem->mem_type];
  107. if (virtual && (man->flags & TTM_MEMTYPE_FLAG_NEEDS_IOREMAP))
  108. iounmap(virtual);
  109. }
  110. static int ttm_copy_io_page(void *dst, void *src, unsigned long page)
  111. {
  112. uint32_t *dstP =
  113. (uint32_t *) ((unsigned long)dst + (page << PAGE_SHIFT));
  114. uint32_t *srcP =
  115. (uint32_t *) ((unsigned long)src + (page << PAGE_SHIFT));
  116. int i;
  117. for (i = 0; i < PAGE_SIZE / sizeof(uint32_t); ++i)
  118. iowrite32(ioread32(srcP++), dstP++);
  119. return 0;
  120. }
  121. static int ttm_copy_io_ttm_page(struct ttm_tt *ttm, void *src,
  122. unsigned long page)
  123. {
  124. struct page *d = ttm_tt_get_page(ttm, page);
  125. void *dst;
  126. if (!d)
  127. return -ENOMEM;
  128. src = (void *)((unsigned long)src + (page << PAGE_SHIFT));
  129. dst = kmap(d);
  130. if (!dst)
  131. return -ENOMEM;
  132. memcpy_fromio(dst, src, PAGE_SIZE);
  133. kunmap(d);
  134. return 0;
  135. }
  136. static int ttm_copy_ttm_io_page(struct ttm_tt *ttm, void *dst,
  137. unsigned long page)
  138. {
  139. struct page *s = ttm_tt_get_page(ttm, page);
  140. void *src;
  141. if (!s)
  142. return -ENOMEM;
  143. dst = (void *)((unsigned long)dst + (page << PAGE_SHIFT));
  144. src = kmap(s);
  145. if (!src)
  146. return -ENOMEM;
  147. memcpy_toio(dst, src, PAGE_SIZE);
  148. kunmap(s);
  149. return 0;
  150. }
  151. int ttm_bo_move_memcpy(struct ttm_buffer_object *bo,
  152. bool evict, bool no_wait, struct ttm_mem_reg *new_mem)
  153. {
  154. struct ttm_bo_device *bdev = bo->bdev;
  155. struct ttm_mem_type_manager *man = &bdev->man[new_mem->mem_type];
  156. struct ttm_tt *ttm = bo->ttm;
  157. struct ttm_mem_reg *old_mem = &bo->mem;
  158. struct ttm_mem_reg old_copy = *old_mem;
  159. void *old_iomap;
  160. void *new_iomap;
  161. int ret;
  162. uint32_t save_flags = old_mem->placement;
  163. unsigned long i;
  164. unsigned long page;
  165. unsigned long add = 0;
  166. int dir;
  167. ret = ttm_mem_reg_ioremap(bdev, old_mem, &old_iomap);
  168. if (ret)
  169. return ret;
  170. ret = ttm_mem_reg_ioremap(bdev, new_mem, &new_iomap);
  171. if (ret)
  172. goto out;
  173. if (old_iomap == NULL && new_iomap == NULL)
  174. goto out2;
  175. if (old_iomap == NULL && ttm == NULL)
  176. goto out2;
  177. add = 0;
  178. dir = 1;
  179. if ((old_mem->mem_type == new_mem->mem_type) &&
  180. (new_mem->mm_node->start <
  181. old_mem->mm_node->start + old_mem->mm_node->size)) {
  182. dir = -1;
  183. add = new_mem->num_pages - 1;
  184. }
  185. for (i = 0; i < new_mem->num_pages; ++i) {
  186. page = i * dir + add;
  187. if (old_iomap == NULL)
  188. ret = ttm_copy_ttm_io_page(ttm, new_iomap, page);
  189. else if (new_iomap == NULL)
  190. ret = ttm_copy_io_ttm_page(ttm, old_iomap, page);
  191. else
  192. ret = ttm_copy_io_page(new_iomap, old_iomap, page);
  193. if (ret)
  194. goto out1;
  195. }
  196. mb();
  197. out2:
  198. ttm_bo_free_old_node(bo);
  199. *old_mem = *new_mem;
  200. new_mem->mm_node = NULL;
  201. ttm_flag_masked(&save_flags, new_mem->placement, TTM_PL_MASK_MEMTYPE);
  202. if ((man->flags & TTM_MEMTYPE_FLAG_FIXED) && (ttm != NULL)) {
  203. ttm_tt_unbind(ttm);
  204. ttm_tt_destroy(ttm);
  205. bo->ttm = NULL;
  206. }
  207. out1:
  208. ttm_mem_reg_iounmap(bdev, new_mem, new_iomap);
  209. out:
  210. ttm_mem_reg_iounmap(bdev, &old_copy, old_iomap);
  211. return ret;
  212. }
  213. EXPORT_SYMBOL(ttm_bo_move_memcpy);
  214. static void ttm_transfered_destroy(struct ttm_buffer_object *bo)
  215. {
  216. kfree(bo);
  217. }
  218. /**
  219. * ttm_buffer_object_transfer
  220. *
  221. * @bo: A pointer to a struct ttm_buffer_object.
  222. * @new_obj: A pointer to a pointer to a newly created ttm_buffer_object,
  223. * holding the data of @bo with the old placement.
  224. *
  225. * This is a utility function that may be called after an accelerated move
  226. * has been scheduled. A new buffer object is created as a placeholder for
  227. * the old data while it's being copied. When that buffer object is idle,
  228. * it can be destroyed, releasing the space of the old placement.
  229. * Returns:
  230. * !0: Failure.
  231. */
  232. static int ttm_buffer_object_transfer(struct ttm_buffer_object *bo,
  233. struct ttm_buffer_object **new_obj)
  234. {
  235. struct ttm_buffer_object *fbo;
  236. struct ttm_bo_device *bdev = bo->bdev;
  237. struct ttm_bo_driver *driver = bdev->driver;
  238. fbo = kzalloc(sizeof(*fbo), GFP_KERNEL);
  239. if (!fbo)
  240. return -ENOMEM;
  241. *fbo = *bo;
  242. /**
  243. * Fix up members that we shouldn't copy directly:
  244. * TODO: Explicit member copy would probably be better here.
  245. */
  246. spin_lock_init(&fbo->lock);
  247. init_waitqueue_head(&fbo->event_queue);
  248. INIT_LIST_HEAD(&fbo->ddestroy);
  249. INIT_LIST_HEAD(&fbo->lru);
  250. INIT_LIST_HEAD(&fbo->swap);
  251. fbo->vm_node = NULL;
  252. fbo->sync_obj = driver->sync_obj_ref(bo->sync_obj);
  253. if (fbo->mem.mm_node)
  254. fbo->mem.mm_node->private = (void *)fbo;
  255. kref_init(&fbo->list_kref);
  256. kref_init(&fbo->kref);
  257. fbo->destroy = &ttm_transfered_destroy;
  258. *new_obj = fbo;
  259. return 0;
  260. }
  261. pgprot_t ttm_io_prot(uint32_t caching_flags, pgprot_t tmp)
  262. {
  263. #if defined(__i386__) || defined(__x86_64__)
  264. if (caching_flags & TTM_PL_FLAG_WC)
  265. tmp = pgprot_writecombine(tmp);
  266. else if (boot_cpu_data.x86 > 3)
  267. tmp = pgprot_noncached(tmp);
  268. #elif defined(__powerpc__)
  269. if (!(caching_flags & TTM_PL_FLAG_CACHED)) {
  270. pgprot_val(tmp) |= _PAGE_NO_CACHE;
  271. if (caching_flags & TTM_PL_FLAG_UNCACHED)
  272. pgprot_val(tmp) |= _PAGE_GUARDED;
  273. }
  274. #endif
  275. #if defined(__ia64__)
  276. if (caching_flags & TTM_PL_FLAG_WC)
  277. tmp = pgprot_writecombine(tmp);
  278. else
  279. tmp = pgprot_noncached(tmp);
  280. #endif
  281. #if defined(__sparc__)
  282. if (!(caching_flags & TTM_PL_FLAG_CACHED))
  283. tmp = pgprot_noncached(tmp);
  284. #endif
  285. return tmp;
  286. }
  287. static int ttm_bo_ioremap(struct ttm_buffer_object *bo,
  288. unsigned long bus_base,
  289. unsigned long bus_offset,
  290. unsigned long bus_size,
  291. struct ttm_bo_kmap_obj *map)
  292. {
  293. struct ttm_bo_device *bdev = bo->bdev;
  294. struct ttm_mem_reg *mem = &bo->mem;
  295. struct ttm_mem_type_manager *man = &bdev->man[mem->mem_type];
  296. if (!(man->flags & TTM_MEMTYPE_FLAG_NEEDS_IOREMAP)) {
  297. map->bo_kmap_type = ttm_bo_map_premapped;
  298. map->virtual = (void *)(((u8 *) man->io_addr) + bus_offset);
  299. } else {
  300. map->bo_kmap_type = ttm_bo_map_iomap;
  301. if (mem->placement & TTM_PL_FLAG_WC)
  302. map->virtual = ioremap_wc(bus_base + bus_offset,
  303. bus_size);
  304. else
  305. map->virtual = ioremap_nocache(bus_base + bus_offset,
  306. bus_size);
  307. }
  308. return (!map->virtual) ? -ENOMEM : 0;
  309. }
  310. static int ttm_bo_kmap_ttm(struct ttm_buffer_object *bo,
  311. unsigned long start_page,
  312. unsigned long num_pages,
  313. struct ttm_bo_kmap_obj *map)
  314. {
  315. struct ttm_mem_reg *mem = &bo->mem; pgprot_t prot;
  316. struct ttm_tt *ttm = bo->ttm;
  317. struct page *d;
  318. int i;
  319. BUG_ON(!ttm);
  320. if (num_pages == 1 && (mem->placement & TTM_PL_FLAG_CACHED)) {
  321. /*
  322. * We're mapping a single page, and the desired
  323. * page protection is consistent with the bo.
  324. */
  325. map->bo_kmap_type = ttm_bo_map_kmap;
  326. map->page = ttm_tt_get_page(ttm, start_page);
  327. map->virtual = kmap(map->page);
  328. } else {
  329. /*
  330. * Populate the part we're mapping;
  331. */
  332. for (i = start_page; i < start_page + num_pages; ++i) {
  333. d = ttm_tt_get_page(ttm, i);
  334. if (!d)
  335. return -ENOMEM;
  336. }
  337. /*
  338. * We need to use vmap to get the desired page protection
  339. * or to make the buffer object look contigous.
  340. */
  341. prot = (mem->placement & TTM_PL_FLAG_CACHED) ?
  342. PAGE_KERNEL :
  343. ttm_io_prot(mem->placement, PAGE_KERNEL);
  344. map->bo_kmap_type = ttm_bo_map_vmap;
  345. map->virtual = vmap(ttm->pages + start_page, num_pages,
  346. 0, prot);
  347. }
  348. return (!map->virtual) ? -ENOMEM : 0;
  349. }
  350. int ttm_bo_kmap(struct ttm_buffer_object *bo,
  351. unsigned long start_page, unsigned long num_pages,
  352. struct ttm_bo_kmap_obj *map)
  353. {
  354. int ret;
  355. unsigned long bus_base;
  356. unsigned long bus_offset;
  357. unsigned long bus_size;
  358. BUG_ON(!list_empty(&bo->swap));
  359. map->virtual = NULL;
  360. if (num_pages > bo->num_pages)
  361. return -EINVAL;
  362. if (start_page > bo->num_pages)
  363. return -EINVAL;
  364. #if 0
  365. if (num_pages > 1 && !DRM_SUSER(DRM_CURPROC))
  366. return -EPERM;
  367. #endif
  368. ret = ttm_bo_pci_offset(bo->bdev, &bo->mem, &bus_base,
  369. &bus_offset, &bus_size);
  370. if (ret)
  371. return ret;
  372. if (bus_size == 0) {
  373. return ttm_bo_kmap_ttm(bo, start_page, num_pages, map);
  374. } else {
  375. bus_offset += start_page << PAGE_SHIFT;
  376. bus_size = num_pages << PAGE_SHIFT;
  377. return ttm_bo_ioremap(bo, bus_base, bus_offset, bus_size, map);
  378. }
  379. }
  380. EXPORT_SYMBOL(ttm_bo_kmap);
  381. void ttm_bo_kunmap(struct ttm_bo_kmap_obj *map)
  382. {
  383. if (!map->virtual)
  384. return;
  385. switch (map->bo_kmap_type) {
  386. case ttm_bo_map_iomap:
  387. iounmap(map->virtual);
  388. break;
  389. case ttm_bo_map_vmap:
  390. vunmap(map->virtual);
  391. break;
  392. case ttm_bo_map_kmap:
  393. kunmap(map->page);
  394. break;
  395. case ttm_bo_map_premapped:
  396. break;
  397. default:
  398. BUG();
  399. }
  400. map->virtual = NULL;
  401. map->page = NULL;
  402. }
  403. EXPORT_SYMBOL(ttm_bo_kunmap);
  404. int ttm_bo_pfn_prot(struct ttm_buffer_object *bo,
  405. unsigned long dst_offset,
  406. unsigned long *pfn, pgprot_t *prot)
  407. {
  408. struct ttm_mem_reg *mem = &bo->mem;
  409. struct ttm_bo_device *bdev = bo->bdev;
  410. unsigned long bus_offset;
  411. unsigned long bus_size;
  412. unsigned long bus_base;
  413. int ret;
  414. ret = ttm_bo_pci_offset(bdev, mem, &bus_base, &bus_offset,
  415. &bus_size);
  416. if (ret)
  417. return -EINVAL;
  418. if (bus_size != 0)
  419. *pfn = (bus_base + bus_offset + dst_offset) >> PAGE_SHIFT;
  420. else
  421. if (!bo->ttm)
  422. return -EINVAL;
  423. else
  424. *pfn = page_to_pfn(ttm_tt_get_page(bo->ttm,
  425. dst_offset >>
  426. PAGE_SHIFT));
  427. *prot = (mem->placement & TTM_PL_FLAG_CACHED) ?
  428. PAGE_KERNEL : ttm_io_prot(mem->placement, PAGE_KERNEL);
  429. return 0;
  430. }
  431. int ttm_bo_move_accel_cleanup(struct ttm_buffer_object *bo,
  432. void *sync_obj,
  433. void *sync_obj_arg,
  434. bool evict, bool no_wait,
  435. struct ttm_mem_reg *new_mem)
  436. {
  437. struct ttm_bo_device *bdev = bo->bdev;
  438. struct ttm_bo_driver *driver = bdev->driver;
  439. struct ttm_mem_type_manager *man = &bdev->man[new_mem->mem_type];
  440. struct ttm_mem_reg *old_mem = &bo->mem;
  441. int ret;
  442. uint32_t save_flags = old_mem->placement;
  443. struct ttm_buffer_object *ghost_obj;
  444. void *tmp_obj = NULL;
  445. spin_lock(&bo->lock);
  446. if (bo->sync_obj) {
  447. tmp_obj = bo->sync_obj;
  448. bo->sync_obj = NULL;
  449. }
  450. bo->sync_obj = driver->sync_obj_ref(sync_obj);
  451. bo->sync_obj_arg = sync_obj_arg;
  452. if (evict) {
  453. ret = ttm_bo_wait(bo, false, false, false);
  454. spin_unlock(&bo->lock);
  455. driver->sync_obj_unref(&bo->sync_obj);
  456. if (ret)
  457. return ret;
  458. ttm_bo_free_old_node(bo);
  459. if ((man->flags & TTM_MEMTYPE_FLAG_FIXED) &&
  460. (bo->ttm != NULL)) {
  461. ttm_tt_unbind(bo->ttm);
  462. ttm_tt_destroy(bo->ttm);
  463. bo->ttm = NULL;
  464. }
  465. } else {
  466. /**
  467. * This should help pipeline ordinary buffer moves.
  468. *
  469. * Hang old buffer memory on a new buffer object,
  470. * and leave it to be released when the GPU
  471. * operation has completed.
  472. */
  473. set_bit(TTM_BO_PRIV_FLAG_MOVING, &bo->priv_flags);
  474. spin_unlock(&bo->lock);
  475. ret = ttm_buffer_object_transfer(bo, &ghost_obj);
  476. if (ret)
  477. return ret;
  478. /**
  479. * If we're not moving to fixed memory, the TTM object
  480. * needs to stay alive. Otherwhise hang it on the ghost
  481. * bo to be unbound and destroyed.
  482. */
  483. if (!(man->flags & TTM_MEMTYPE_FLAG_FIXED))
  484. ghost_obj->ttm = NULL;
  485. else
  486. bo->ttm = NULL;
  487. ttm_bo_unreserve(ghost_obj);
  488. ttm_bo_unref(&ghost_obj);
  489. }
  490. *old_mem = *new_mem;
  491. new_mem->mm_node = NULL;
  492. ttm_flag_masked(&save_flags, new_mem->placement, TTM_PL_MASK_MEMTYPE);
  493. return 0;
  494. }
  495. EXPORT_SYMBOL(ttm_bo_move_accel_cleanup);