/**************************************************************************
 *
 * Copyright (c) 2007-2009 VMware, Inc., Palo Alto, CA., USA
 * All Rights Reserved.
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the
 * "Software"), to deal in the Software without restriction, including
 * without limitation the rights to use, copy, modify, merge, publish,
 * distribute, sub license, and/or sell copies of the Software, and to
 * permit persons to whom the Software is furnished to do so, subject to
 * the following conditions:
 *
 * The above copyright notice and this permission notice (including the
 * next paragraph) shall be included in all copies or substantial portions
 * of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL
 * THE COPYRIGHT HOLDERS, AUTHORS AND/OR ITS SUPPLIERS BE LIABLE FOR ANY CLAIM,
 * DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR
 * OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE
 * USE OR OTHER DEALINGS IN THE SOFTWARE.
 *
 **************************************************************************/
/*
 * Authors: Thomas Hellstrom <thellstrom-at-vmware-dot-com>
 */
#include "ttm/ttm_bo_driver.h"
#include "ttm/ttm_placement.h"
#include <linux/io.h>
#include <linux/highmem.h>
#include <linux/wait.h>
#include <linux/vmalloc.h>
#include <linux/version.h>
#include <linux/module.h>
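
/*
 * ttm_bo_free_old_node - release the drm_mm node backing @bo's current
 * placement, if any. The device lru_lock protects the drm_mm manager
 * here, so it is taken around drm_mm_put_block().
 */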
void ttm_bo_free_old_node(struct ttm_buffer_object *bo)
{
	struct ttm_mem_reg *old_mem = &bo->mem;

	if (old_mem->mm_node) {
		spin_lock(&bo->bdev->lru_lock);
		drm_mm_put_block(old_mem->mm_node);
		spin_unlock(&bo->bdev->lru_lock);
	}
	old_mem->mm_node = NULL;
}
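
/*
 * ttm_bo_move_ttm - move a buffer object by rebinding its TTM.
 *
 * If the old placement was outside system memory, the ttm is unbound
 * and the old node freed first. The ttm's caching state is then
 * adjusted to the new placement, and the ttm is bound to the new
 * region unless that region is plain system memory. No data copy is
 * needed since the backing pages themselves never move.
 */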
int ttm_bo_move_ttm(struct ttm_buffer_object *bo,
		    bool evict, bool no_wait, struct ttm_mem_reg *new_mem)
{
	struct ttm_tt *ttm = bo->ttm;
	struct ttm_mem_reg *old_mem = &bo->mem;
	uint32_t save_flags = old_mem->placement;
	int ret;

	if (old_mem->mem_type != TTM_PL_SYSTEM) {
		ttm_tt_unbind(ttm);
		ttm_bo_free_old_node(bo);
		ttm_flag_masked(&old_mem->placement, TTM_PL_FLAG_SYSTEM,
				TTM_PL_MASK_MEM);
		old_mem->mem_type = TTM_PL_SYSTEM;
		save_flags = old_mem->placement;
	}

	ret = ttm_tt_set_placement_caching(ttm, new_mem->placement);
	if (unlikely(ret != 0))
		return ret;

	if (new_mem->mem_type != TTM_PL_SYSTEM) {
		ret = ttm_tt_bind(ttm, new_mem);
		if (unlikely(ret != 0))
			return ret;
	}

	*old_mem = *new_mem;
	new_mem->mm_node = NULL;
	ttm_flag_masked(&save_flags, new_mem->placement, TTM_PL_MASK_MEMTYPE);
	return 0;
}
EXPORT_SYMBOL(ttm_bo_move_ttm);
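
/*
 * ttm_mem_reg_ioremap - obtain a kernel virtual address for a memory
 * region. Regions whose memory type is permanently mapped (no
 * TTM_MEMTYPE_FLAG_NEEDS_IOREMAP) are addressed by offsetting into
 * man->io_addr; others get a fresh ioremap, write-combined when the
 * placement requests it. *virtual stays NULL for regions with no PCI
 * aperture presence (bus_size == 0).
 */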
int ttm_mem_reg_ioremap(struct ttm_bo_device *bdev, struct ttm_mem_reg *mem,
			void **virtual)
{
	struct ttm_mem_type_manager *man = &bdev->man[mem->mem_type];
	unsigned long bus_offset;
	unsigned long bus_size;
	unsigned long bus_base;
	int ret;
	void *addr;

	*virtual = NULL;
	ret = ttm_bo_pci_offset(bdev, mem, &bus_base, &bus_offset, &bus_size);
	if (ret || bus_size == 0)
		return ret;

	if (!(man->flags & TTM_MEMTYPE_FLAG_NEEDS_IOREMAP))
		addr = (void *)(((u8 *) man->io_addr) + bus_offset);
	else {
		if (mem->placement & TTM_PL_FLAG_WC)
			addr = ioremap_wc(bus_base + bus_offset, bus_size);
		else
			addr = ioremap_nocache(bus_base + bus_offset, bus_size);
		if (!addr)
			return -ENOMEM;
	}
	*virtual = addr;
	return 0;
}
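
/*
 * ttm_mem_reg_iounmap - undo ttm_mem_reg_ioremap. Only regions that
 * were actually ioremapped need an iounmap; premapped regions are
 * left untouched.
 */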
void ttm_mem_reg_iounmap(struct ttm_bo_device *bdev, struct ttm_mem_reg *mem,
			 void *virtual)
{
	struct ttm_mem_type_manager *man;

	man = &bdev->man[mem->mem_type];

	if (virtual && (man->flags & TTM_MEMTYPE_FLAG_NEEDS_IOREMAP))
		iounmap(virtual);
}
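
/*
 * Per-page copy helpers for ttm_bo_move_memcpy. A page is copied
 * io-to-io, io-to-ttm or ttm-to-io depending on which side of the
 * move is backed by io memory; the ttm side is accessed via kmap().
 */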
static int ttm_copy_io_page(void *dst, void *src, unsigned long page)
{
	uint32_t *dstP =
	    (uint32_t *) ((unsigned long)dst + (page << PAGE_SHIFT));
	uint32_t *srcP =
	    (uint32_t *) ((unsigned long)src + (page << PAGE_SHIFT));
	int i;

	for (i = 0; i < PAGE_SIZE / sizeof(uint32_t); ++i)
		iowrite32(ioread32(srcP++), dstP++);
	return 0;
}

static int ttm_copy_io_ttm_page(struct ttm_tt *ttm, void *src,
				unsigned long page)
{
	struct page *d = ttm_tt_get_page(ttm, page);
	void *dst;

	if (!d)
		return -ENOMEM;

	src = (void *)((unsigned long)src + (page << PAGE_SHIFT));
	dst = kmap(d);
	if (!dst)
		return -ENOMEM;

	memcpy_fromio(dst, src, PAGE_SIZE);
	kunmap(d);
	return 0;
}

static int ttm_copy_ttm_io_page(struct ttm_tt *ttm, void *dst,
				unsigned long page)
{
	struct page *s = ttm_tt_get_page(ttm, page);
	void *src;

	if (!s)
		return -ENOMEM;

	dst = (void *)((unsigned long)dst + (page << PAGE_SHIFT));
	src = kmap(s);
	if (!src)
		return -ENOMEM;

	memcpy_toio(dst, src, PAGE_SIZE);
	kunmap(s);
	return 0;
}
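
/*
 * ttm_bo_move_memcpy - fallback move implemented with the CPU.
 *
 * Both regions are mapped and the contents are copied page by page.
 * When source and destination overlap within the same memory type,
 * the copy runs backwards so that pages are read before they are
 * overwritten.
 */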
int ttm_bo_move_memcpy(struct ttm_buffer_object *bo,
		       bool evict, bool no_wait, struct ttm_mem_reg *new_mem)
{
	struct ttm_bo_device *bdev = bo->bdev;
	struct ttm_mem_type_manager *man = &bdev->man[new_mem->mem_type];
	struct ttm_tt *ttm = bo->ttm;
	struct ttm_mem_reg *old_mem = &bo->mem;
	struct ttm_mem_reg old_copy = *old_mem;
	void *old_iomap;
	void *new_iomap;
	int ret;
	uint32_t save_flags = old_mem->placement;
	unsigned long i;
	unsigned long page;
	unsigned long add = 0;
	int dir;

	ret = ttm_mem_reg_ioremap(bdev, old_mem, &old_iomap);
	if (ret)
		return ret;
	ret = ttm_mem_reg_ioremap(bdev, new_mem, &new_iomap);
	if (ret)
		goto out;

	if (old_iomap == NULL && new_iomap == NULL)
		goto out2;
	if (old_iomap == NULL && ttm == NULL)
		goto out2;

	add = 0;
	dir = 1;

	if ((old_mem->mem_type == new_mem->mem_type) &&
	    (new_mem->mm_node->start <
	     old_mem->mm_node->start + old_mem->mm_node->size)) {
		dir = -1;
		add = new_mem->num_pages - 1;
	}

	for (i = 0; i < new_mem->num_pages; ++i) {
		page = i * dir + add;
		if (old_iomap == NULL)
			ret = ttm_copy_ttm_io_page(ttm, new_iomap, page);
		else if (new_iomap == NULL)
			ret = ttm_copy_io_ttm_page(ttm, old_iomap, page);
		else
			ret = ttm_copy_io_page(new_iomap, old_iomap, page);
		if (ret)
			goto out1;
	}
	mb();
out2:
	ttm_bo_free_old_node(bo);

	*old_mem = *new_mem;
	new_mem->mm_node = NULL;
	ttm_flag_masked(&save_flags, new_mem->placement, TTM_PL_MASK_MEMTYPE);

	if ((man->flags & TTM_MEMTYPE_FLAG_FIXED) && (ttm != NULL)) {
		ttm_tt_unbind(ttm);
		ttm_tt_destroy(ttm);
		bo->ttm = NULL;
	}

out1:
	ttm_mem_reg_iounmap(bdev, new_mem, new_iomap);
out:
	ttm_mem_reg_iounmap(bdev, &old_copy, old_iomap);
	return ret;
}
EXPORT_SYMBOL(ttm_bo_move_memcpy);
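
/*
 * Drivers without an accelerated blit path typically point the move
 * hook in their ttm_bo_driver at the helpers above. An illustrative
 * sketch only (the driver function name is hypothetical; the
 * signature matches this TTM version's move callback), falling back
 * to a CPU copy for every move:
 *
 *	static int mydrv_bo_move(struct ttm_buffer_object *bo,
 *				 bool evict, bool no_wait,
 *				 struct ttm_mem_reg *new_mem)
 *	{
 *		return ttm_bo_move_memcpy(bo, evict, no_wait, new_mem);
 *	}
 */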
static void ttm_transfered_destroy(struct ttm_buffer_object *bo)
{
	kfree(bo);
}

/**
 * ttm_buffer_object_transfer
 *
 * @bo: A pointer to a struct ttm_buffer_object.
 * @new_obj: A pointer to a pointer to a newly created ttm_buffer_object,
 * holding the data of @bo with the old placement.
 *
 * This is a utility function that may be called after an accelerated move
 * has been scheduled. A new buffer object is created as a placeholder for
 * the old data while it's being copied. When that buffer object is idle,
 * it can be destroyed, releasing the space of the old placement.
 * Returns:
 * !0: Failure.
 */

static int ttm_buffer_object_transfer(struct ttm_buffer_object *bo,
				      struct ttm_buffer_object **new_obj)
{
	struct ttm_buffer_object *fbo;
	struct ttm_bo_device *bdev = bo->bdev;
	struct ttm_bo_driver *driver = bdev->driver;

	fbo = kzalloc(sizeof(*fbo), GFP_KERNEL);
	if (!fbo)
		return -ENOMEM;

	*fbo = *bo;

	/**
	 * Fix up members that we shouldn't copy directly:
	 * TODO: Explicit member copy would probably be better here.
	 */

	spin_lock_init(&fbo->lock);
	init_waitqueue_head(&fbo->event_queue);
	INIT_LIST_HEAD(&fbo->ddestroy);
	INIT_LIST_HEAD(&fbo->lru);
	INIT_LIST_HEAD(&fbo->swap);
	fbo->vm_node = NULL;

	fbo->sync_obj = driver->sync_obj_ref(bo->sync_obj);
	if (fbo->mem.mm_node)
		fbo->mem.mm_node->private = (void *)fbo;
	kref_init(&fbo->list_kref);
	kref_init(&fbo->kref);
	fbo->destroy = &ttm_transfered_destroy;

	*new_obj = fbo;
	return 0;
}
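
/*
 * ttm_io_prot - derive a pgprot_t from TTM caching flags, mapping
 * TTM_PL_FLAG_WC and uncached placements onto whatever the
 * architecture provides for write-combined or noncached pages.
 */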
pgprot_t ttm_io_prot(uint32_t caching_flags, pgprot_t tmp)
{
#if defined(__i386__) || defined(__x86_64__)
	if (caching_flags & TTM_PL_FLAG_WC)
		tmp = pgprot_writecombine(tmp);
	else if (boot_cpu_data.x86 > 3)
		tmp = pgprot_noncached(tmp);
#elif defined(__powerpc__)
	if (!(caching_flags & TTM_PL_FLAG_CACHED)) {
		pgprot_val(tmp) |= _PAGE_NO_CACHE;
		if (caching_flags & TTM_PL_FLAG_UNCACHED)
			pgprot_val(tmp) |= _PAGE_GUARDED;
	}
#endif
#if defined(__ia64__)
	if (caching_flags & TTM_PL_FLAG_WC)
		tmp = pgprot_writecombine(tmp);
	else
		tmp = pgprot_noncached(tmp);
#endif
#if defined(__sparc__)
	if (!(caching_flags & TTM_PL_FLAG_CACHED))
		tmp = pgprot_noncached(tmp);
#endif
	return tmp;
}
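
/*
 * ttm_bo_ioremap - kmap helper for io memory: fills in @map with
 * either a pointer into the premapped aperture or a fresh ioremap of
 * the requested range.
 */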
static int ttm_bo_ioremap(struct ttm_buffer_object *bo,
			  unsigned long bus_base,
			  unsigned long bus_offset,
			  unsigned long bus_size,
			  struct ttm_bo_kmap_obj *map)
{
	struct ttm_bo_device *bdev = bo->bdev;
	struct ttm_mem_reg *mem = &bo->mem;
	struct ttm_mem_type_manager *man = &bdev->man[mem->mem_type];

	if (!(man->flags & TTM_MEMTYPE_FLAG_NEEDS_IOREMAP)) {
		map->bo_kmap_type = ttm_bo_map_premapped;
		map->virtual = (void *)(((u8 *) man->io_addr) + bus_offset);
	} else {
		map->bo_kmap_type = ttm_bo_map_iomap;
		if (mem->placement & TTM_PL_FLAG_WC)
			map->virtual = ioremap_wc(bus_base + bus_offset,
						  bus_size);
		else
			map->virtual = ioremap_nocache(bus_base + bus_offset,
						       bus_size);
	}
	return (!map->virtual) ? -ENOMEM : 0;
}
static int ttm_bo_kmap_ttm(struct ttm_buffer_object *bo,
			   unsigned long start_page,
			   unsigned long num_pages,
			   struct ttm_bo_kmap_obj *map)
{
	struct ttm_mem_reg *mem = &bo->mem;
	pgprot_t prot;
	struct ttm_tt *ttm = bo->ttm;
	struct page *d;
	int i;

	BUG_ON(!ttm);
	if (num_pages == 1 && (mem->placement & TTM_PL_FLAG_CACHED)) {
		/*
		 * We're mapping a single page, and the desired
		 * page protection is consistent with the bo.
		 */
		map->bo_kmap_type = ttm_bo_map_kmap;
		map->page = ttm_tt_get_page(ttm, start_page);
		map->virtual = kmap(map->page);
	} else {
		/*
		 * Populate the part we're mapping.
		 */
		for (i = start_page; i < start_page + num_pages; ++i) {
			d = ttm_tt_get_page(ttm, i);
			if (!d)
				return -ENOMEM;
		}

		/*
		 * We need to use vmap to get the desired page protection
		 * or to make the buffer object look contiguous.
		 */
		prot = (mem->placement & TTM_PL_FLAG_CACHED) ?
			PAGE_KERNEL :
			ttm_io_prot(mem->placement, PAGE_KERNEL);
		map->bo_kmap_type = ttm_bo_map_vmap;
		map->virtual = vmap(ttm->pages + start_page, num_pages,
				    0, prot);
	}
	return (!map->virtual) ? -ENOMEM : 0;
}
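
/*
 * ttm_bo_kmap - map part of a buffer object into kernel address space.
 *
 * Picks the io path (ttm_bo_ioremap) or the system page path
 * (ttm_bo_kmap_ttm) depending on whether the bo currently lives in a
 * PCI aperture. The mapping must be released with ttm_bo_kunmap().
 */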
int ttm_bo_kmap(struct ttm_buffer_object *bo,
		unsigned long start_page, unsigned long num_pages,
		struct ttm_bo_kmap_obj *map)
{
	int ret;
	unsigned long bus_base;
	unsigned long bus_offset;
	unsigned long bus_size;

	BUG_ON(!list_empty(&bo->swap));
	map->virtual = NULL;
	if (num_pages > bo->num_pages)
		return -EINVAL;
	if (start_page > bo->num_pages)
		return -EINVAL;
#if 0
	if (num_pages > 1 && !DRM_SUSER(DRM_CURPROC))
		return -EPERM;
#endif
	ret = ttm_bo_pci_offset(bo->bdev, &bo->mem, &bus_base,
				&bus_offset, &bus_size);
	if (ret)
		return ret;
	if (bus_size == 0) {
		return ttm_bo_kmap_ttm(bo, start_page, num_pages, map);
	} else {
		bus_offset += start_page << PAGE_SHIFT;
		bus_size = num_pages << PAGE_SHIFT;
		return ttm_bo_ioremap(bo, bus_base, bus_offset, bus_size, map);
	}
}
EXPORT_SYMBOL(ttm_bo_kmap);
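
/*
 * Illustrative usage sketch (not part of this file): map and clear the
 * first page of a bo. Assumes "bo" is a valid, reserved and idle
 * ttm_buffer_object.
 *
 *	struct ttm_bo_kmap_obj map;
 *	int ret;
 *
 *	ret = ttm_bo_kmap(bo, 0, 1, &map);
 *	if (unlikely(ret != 0))
 *		return ret;
 *	memset(map.virtual, 0, PAGE_SIZE);
 *	ttm_bo_kunmap(&map);
 */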
void ttm_bo_kunmap(struct ttm_bo_kmap_obj *map)
{
	if (!map->virtual)
		return;
	switch (map->bo_kmap_type) {
	case ttm_bo_map_iomap:
		iounmap(map->virtual);
		break;
	case ttm_bo_map_vmap:
		vunmap(map->virtual);
		break;
	case ttm_bo_map_kmap:
		kunmap(map->page);
		break;
	case ttm_bo_map_premapped:
		break;
	default:
		BUG();
	}
	map->virtual = NULL;
	map->page = NULL;
}
EXPORT_SYMBOL(ttm_bo_kunmap);
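
/*
 * ttm_bo_pfn_prot - look up the page frame number and page protection
 * for an offset into a buffer object, e.g. for inserting single pages
 * into a user-space mapping from a fault handler.
 */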
int ttm_bo_pfn_prot(struct ttm_buffer_object *bo,
		    unsigned long dst_offset,
		    unsigned long *pfn, pgprot_t *prot)
{
	struct ttm_mem_reg *mem = &bo->mem;
	struct ttm_bo_device *bdev = bo->bdev;
	unsigned long bus_offset;
	unsigned long bus_size;
	unsigned long bus_base;
	int ret;

	ret = ttm_bo_pci_offset(bdev, mem, &bus_base, &bus_offset,
				&bus_size);
	if (ret)
		return -EINVAL;
	if (bus_size != 0)
		*pfn = (bus_base + bus_offset + dst_offset) >> PAGE_SHIFT;
	else if (!bo->ttm)
		return -EINVAL;
	else
		*pfn = page_to_pfn(ttm_tt_get_page(bo->ttm,
						   dst_offset >>
						   PAGE_SHIFT));
	*prot = (mem->placement & TTM_PL_FLAG_CACHED) ?
		PAGE_KERNEL : ttm_io_prot(mem->placement, PAGE_KERNEL);
	return 0;
}
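
/*
 * ttm_bo_move_accel_cleanup - finish an accelerated (GPU) move.
 *
 * Attaches @sync_obj to the bo so that subsequent waits cover the
 * move. On eviction the bo is waited for and the old node released
 * synchronously; otherwise the old placement is handed over to a
 * ghost object (ttm_buffer_object_transfer) that releases it once the
 * GPU has finished, allowing the move to be pipelined.
 */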
int ttm_bo_move_accel_cleanup(struct ttm_buffer_object *bo,
			      void *sync_obj,
			      void *sync_obj_arg,
			      bool evict, bool no_wait,
			      struct ttm_mem_reg *new_mem)
{
	struct ttm_bo_device *bdev = bo->bdev;
	struct ttm_bo_driver *driver = bdev->driver;
	struct ttm_mem_type_manager *man = &bdev->man[new_mem->mem_type];
	struct ttm_mem_reg *old_mem = &bo->mem;
	int ret;
	uint32_t save_flags = old_mem->placement;
	struct ttm_buffer_object *ghost_obj;
	void *tmp_obj = NULL;

	spin_lock(&bo->lock);
	if (bo->sync_obj) {
		tmp_obj = bo->sync_obj;
		bo->sync_obj = NULL;
	}
	bo->sync_obj = driver->sync_obj_ref(sync_obj);
	bo->sync_obj_arg = sync_obj_arg;
	if (evict) {
		ret = ttm_bo_wait(bo, false, false, false);
		spin_unlock(&bo->lock);
		driver->sync_obj_unref(&bo->sync_obj);

		if (ret)
			return ret;

		ttm_bo_free_old_node(bo);
		if ((man->flags & TTM_MEMTYPE_FLAG_FIXED) &&
		    (bo->ttm != NULL)) {
			ttm_tt_unbind(bo->ttm);
			ttm_tt_destroy(bo->ttm);
			bo->ttm = NULL;
		}
	} else {
		/**
		 * This should help pipeline ordinary buffer moves.
		 *
		 * Hang old buffer memory on a new buffer object,
		 * and leave it to be released when the GPU
		 * operation has completed.
		 */

		set_bit(TTM_BO_PRIV_FLAG_MOVING, &bo->priv_flags);
		spin_unlock(&bo->lock);

		ret = ttm_buffer_object_transfer(bo, &ghost_obj);
		if (ret)
			return ret;

		/**
		 * If we're not moving to fixed memory, the TTM object
		 * needs to stay alive. Otherwise hang it on the ghost
		 * bo to be unbound and destroyed.
		 */

		if (!(man->flags & TTM_MEMTYPE_FLAG_FIXED))
			ghost_obj->ttm = NULL;
		else
			bo->ttm = NULL;

		ttm_bo_unreserve(ghost_obj);
		ttm_bo_unref(&ghost_obj);
	}

	*old_mem = *new_mem;
	new_mem->mm_node = NULL;
	ttm_flag_masked(&save_flags, new_mem->placement, TTM_PL_MASK_MEMTYPE);
	return 0;
}
EXPORT_SYMBOL(ttm_bo_move_accel_cleanup);