msm_gem.c 15 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608
  1. /*
  2. * Copyright (C) 2013 Red Hat
  3. * Author: Rob Clark <robdclark@gmail.com>
  4. *
  5. * This program is free software; you can redistribute it and/or modify it
  6. * under the terms of the GNU General Public License version 2 as published by
  7. * the Free Software Foundation.
  8. *
  9. * This program is distributed in the hope that it will be useful, but WITHOUT
  10. * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
  11. * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
  12. * more details.
  13. *
  14. * You should have received a copy of the GNU General Public License along with
  15. * this program. If not, see <http://www.gnu.org/licenses/>.
  16. */
  17. #include <linux/spinlock.h>
  18. #include <linux/shmem_fs.h>
  19. #include "msm_drv.h"
  20. #include "msm_gem.h"
  21. #include "msm_gpu.h"
  22. /* called with dev->struct_mutex held */
  23. static struct page **get_pages(struct drm_gem_object *obj)
  24. {
  25. struct msm_gem_object *msm_obj = to_msm_bo(obj);
  26. if (!msm_obj->pages) {
  27. struct drm_device *dev = obj->dev;
  28. struct page **p = drm_gem_get_pages(obj, 0);
  29. int npages = obj->size >> PAGE_SHIFT;
  30. if (IS_ERR(p)) {
  31. dev_err(dev->dev, "could not get pages: %ld\n",
  32. PTR_ERR(p));
  33. return p;
  34. }
  35. msm_obj->sgt = drm_prime_pages_to_sg(p, npages);
  36. if (IS_ERR(msm_obj->sgt)) {
  37. dev_err(dev->dev, "failed to allocate sgt\n");
  38. return ERR_CAST(msm_obj->sgt);
  39. }
  40. msm_obj->pages = p;
  41. /* For non-cached buffers, ensure the new pages are clean
  42. * because display controller, GPU, etc. are not coherent:
  43. */
  44. if (msm_obj->flags & (MSM_BO_WC|MSM_BO_UNCACHED))
  45. dma_map_sg(dev->dev, msm_obj->sgt->sgl,
  46. msm_obj->sgt->nents, DMA_BIDIRECTIONAL);
  47. }
  48. return msm_obj->pages;
  49. }
  50. static void put_pages(struct drm_gem_object *obj)
  51. {
  52. struct msm_gem_object *msm_obj = to_msm_bo(obj);
  53. if (msm_obj->pages) {
  54. /* For non-cached buffers, ensure the new pages are clean
  55. * because display controller, GPU, etc. are not coherent:
  56. */
  57. if (msm_obj->flags & (MSM_BO_WC|MSM_BO_UNCACHED))
  58. dma_unmap_sg(obj->dev->dev, msm_obj->sgt->sgl,
  59. msm_obj->sgt->nents, DMA_BIDIRECTIONAL);
  60. sg_free_table(msm_obj->sgt);
  61. kfree(msm_obj->sgt);
  62. drm_gem_put_pages(obj, msm_obj->pages, true, false);
  63. msm_obj->pages = NULL;
  64. }
  65. }
  66. int msm_gem_mmap_obj(struct drm_gem_object *obj,
  67. struct vm_area_struct *vma)
  68. {
  69. struct msm_gem_object *msm_obj = to_msm_bo(obj);
  70. vma->vm_flags &= ~VM_PFNMAP;
  71. vma->vm_flags |= VM_MIXEDMAP;
  72. if (msm_obj->flags & MSM_BO_WC) {
  73. vma->vm_page_prot = pgprot_writecombine(vm_get_page_prot(vma->vm_flags));
  74. } else if (msm_obj->flags & MSM_BO_UNCACHED) {
  75. vma->vm_page_prot = pgprot_noncached(vm_get_page_prot(vma->vm_flags));
  76. } else {
  77. /*
  78. * Shunt off cached objs to shmem file so they have their own
  79. * address_space (so unmap_mapping_range does what we want,
  80. * in particular in the case of mmap'd dmabufs)
  81. */
  82. fput(vma->vm_file);
  83. get_file(obj->filp);
  84. vma->vm_pgoff = 0;
  85. vma->vm_file = obj->filp;
  86. vma->vm_page_prot = vm_get_page_prot(vma->vm_flags);
  87. }
  88. return 0;
  89. }
  90. int msm_gem_mmap(struct file *filp, struct vm_area_struct *vma)
  91. {
  92. int ret;
  93. ret = drm_gem_mmap(filp, vma);
  94. if (ret) {
  95. DBG("mmap failed: %d", ret);
  96. return ret;
  97. }
  98. return msm_gem_mmap_obj(vma->vm_private_data, vma);
  99. }
  100. int msm_gem_fault(struct vm_area_struct *vma, struct vm_fault *vmf)
  101. {
  102. struct drm_gem_object *obj = vma->vm_private_data;
  103. struct msm_gem_object *msm_obj = to_msm_bo(obj);
  104. struct drm_device *dev = obj->dev;
  105. struct page **pages;
  106. unsigned long pfn;
  107. pgoff_t pgoff;
  108. int ret;
  109. /* Make sure we don't parallel update on a fault, nor move or remove
  110. * something from beneath our feet
  111. */
  112. ret = mutex_lock_interruptible(&dev->struct_mutex);
  113. if (ret)
  114. goto out;
  115. /* make sure we have pages attached now */
  116. pages = get_pages(obj);
  117. if (IS_ERR(pages)) {
  118. ret = PTR_ERR(pages);
  119. goto out_unlock;
  120. }
  121. /* We don't use vmf->pgoff since that has the fake offset: */
  122. pgoff = ((unsigned long)vmf->virtual_address -
  123. vma->vm_start) >> PAGE_SHIFT;
  124. pfn = page_to_pfn(msm_obj->pages[pgoff]);
  125. VERB("Inserting %p pfn %lx, pa %lx", vmf->virtual_address,
  126. pfn, pfn << PAGE_SHIFT);
  127. ret = vm_insert_mixed(vma, (unsigned long)vmf->virtual_address, pfn);
  128. out_unlock:
  129. mutex_unlock(&dev->struct_mutex);
  130. out:
  131. switch (ret) {
  132. case -EAGAIN:
  133. set_need_resched();
  134. case 0:
  135. case -ERESTARTSYS:
  136. case -EINTR:
  137. return VM_FAULT_NOPAGE;
  138. case -ENOMEM:
  139. return VM_FAULT_OOM;
  140. default:
  141. return VM_FAULT_SIGBUS;
  142. }
  143. }
  144. /** get mmap offset */
  145. static uint64_t mmap_offset(struct drm_gem_object *obj)
  146. {
  147. struct drm_device *dev = obj->dev;
  148. int ret;
  149. WARN_ON(!mutex_is_locked(&dev->struct_mutex));
  150. /* Make it mmapable */
  151. ret = drm_gem_create_mmap_offset(obj);
  152. if (ret) {
  153. dev_err(dev->dev, "could not allocate mmap offset\n");
  154. return 0;
  155. }
  156. return drm_vma_node_offset_addr(&obj->vma_node);
  157. }
  158. uint64_t msm_gem_mmap_offset(struct drm_gem_object *obj)
  159. {
  160. uint64_t offset;
  161. mutex_lock(&obj->dev->struct_mutex);
  162. offset = mmap_offset(obj);
  163. mutex_unlock(&obj->dev->struct_mutex);
  164. return offset;
  165. }
  166. /* helpers for dealing w/ iommu: */
  167. static int map_range(struct iommu_domain *domain, unsigned int iova,
  168. struct sg_table *sgt, unsigned int len, int prot)
  169. {
  170. struct scatterlist *sg;
  171. unsigned int da = iova;
  172. unsigned int i, j;
  173. int ret;
  174. if (!domain || !sgt)
  175. return -EINVAL;
  176. for_each_sg(sgt->sgl, sg, sgt->nents, i) {
  177. u32 pa = sg_phys(sg) - sg->offset;
  178. size_t bytes = sg->length + sg->offset;
  179. VERB("map[%d]: %08x %08x(%x)", i, iova, pa, bytes);
  180. ret = iommu_map(domain, da, pa, bytes, prot);
  181. if (ret)
  182. goto fail;
  183. da += bytes;
  184. }
  185. return 0;
  186. fail:
  187. da = iova;
  188. for_each_sg(sgt->sgl, sg, i, j) {
  189. size_t bytes = sg->length + sg->offset;
  190. iommu_unmap(domain, da, bytes);
  191. da += bytes;
  192. }
  193. return ret;
  194. }
  195. static void unmap_range(struct iommu_domain *domain, unsigned int iova,
  196. struct sg_table *sgt, unsigned int len)
  197. {
  198. struct scatterlist *sg;
  199. unsigned int da = iova;
  200. int i;
  201. for_each_sg(sgt->sgl, sg, sgt->nents, i) {
  202. size_t bytes = sg->length + sg->offset;
  203. size_t unmapped;
  204. unmapped = iommu_unmap(domain, da, bytes);
  205. if (unmapped < bytes)
  206. break;
  207. VERB("unmap[%d]: %08x(%x)", i, iova, bytes);
  208. BUG_ON(!IS_ALIGNED(bytes, PAGE_SIZE));
  209. da += bytes;
  210. }
  211. }
  212. /* should be called under struct_mutex.. although it can be called
  213. * from atomic context without struct_mutex to acquire an extra
  214. * iova ref if you know one is already held.
  215. *
  216. * That means when I do eventually need to add support for unpinning
  217. * the refcnt counter needs to be atomic_t.
  218. */
  219. int msm_gem_get_iova_locked(struct drm_gem_object *obj, int id,
  220. uint32_t *iova)
  221. {
  222. struct msm_gem_object *msm_obj = to_msm_bo(obj);
  223. int ret = 0;
  224. if (!msm_obj->domain[id].iova) {
  225. struct msm_drm_private *priv = obj->dev->dev_private;
  226. uint32_t offset = (uint32_t)mmap_offset(obj);
  227. struct page **pages;
  228. pages = get_pages(obj);
  229. if (IS_ERR(pages))
  230. return PTR_ERR(pages);
  231. // XXX ideally we would not map buffers writable when not needed...
  232. ret = map_range(priv->iommus[id], offset, msm_obj->sgt,
  233. obj->size, IOMMU_READ | IOMMU_WRITE);
  234. msm_obj->domain[id].iova = offset;
  235. }
  236. if (!ret)
  237. *iova = msm_obj->domain[id].iova;
  238. return ret;
  239. }
  240. int msm_gem_get_iova(struct drm_gem_object *obj, int id, uint32_t *iova)
  241. {
  242. int ret;
  243. mutex_lock(&obj->dev->struct_mutex);
  244. ret = msm_gem_get_iova_locked(obj, id, iova);
  245. mutex_unlock(&obj->dev->struct_mutex);
  246. return ret;
  247. }
  /*
   * Counterpart of msm_gem_get_iova(); currently a no-op.
   */
  void msm_gem_put_iova(struct drm_gem_object *obj, int id)
  {
      /*
       * XXX TODO ..
       *
       * NOTE: a _locked() variant is probably not needed.  The idea is
       * not to unmap here, but only to mark the mapping as unmappable
       * once the iova refcnt drops to zero; a later failing
       * _get_iova_locked() could then start unmapping things that are
       * no longer needed.
       */
  }
  257. int msm_gem_dumb_create(struct drm_file *file, struct drm_device *dev,
  258. struct drm_mode_create_dumb *args)
  259. {
  260. args->pitch = align_pitch(args->width, args->bpp);
  261. args->size = PAGE_ALIGN(args->pitch * args->height);
  262. return msm_gem_new_handle(dev, file, args->size,
  263. MSM_BO_SCANOUT | MSM_BO_WC, &args->handle);
  264. }
  265. int msm_gem_dumb_destroy(struct drm_file *file, struct drm_device *dev,
  266. uint32_t handle)
  267. {
  268. /* No special work needed, drop the reference and see what falls out */
  269. return drm_gem_handle_delete(file, handle);
  270. }
  271. int msm_gem_dumb_map_offset(struct drm_file *file, struct drm_device *dev,
  272. uint32_t handle, uint64_t *offset)
  273. {
  274. struct drm_gem_object *obj;
  275. int ret = 0;
  276. /* GEM does all our handle to object mapping */
  277. obj = drm_gem_object_lookup(dev, file, handle);
  278. if (obj == NULL) {
  279. ret = -ENOENT;
  280. goto fail;
  281. }
  282. *offset = msm_gem_mmap_offset(obj);
  283. drm_gem_object_unreference_unlocked(obj);
  284. fail:
  285. return ret;
  286. }
  287. void *msm_gem_vaddr_locked(struct drm_gem_object *obj)
  288. {
  289. struct msm_gem_object *msm_obj = to_msm_bo(obj);
  290. WARN_ON(!mutex_is_locked(&obj->dev->struct_mutex));
  291. if (!msm_obj->vaddr) {
  292. struct page **pages = get_pages(obj);
  293. if (IS_ERR(pages))
  294. return ERR_CAST(pages);
  295. msm_obj->vaddr = vmap(pages, obj->size >> PAGE_SHIFT,
  296. VM_MAP, pgprot_writecombine(PAGE_KERNEL));
  297. }
  298. return msm_obj->vaddr;
  299. }
  300. void *msm_gem_vaddr(struct drm_gem_object *obj)
  301. {
  302. void *ret;
  303. mutex_lock(&obj->dev->struct_mutex);
  304. ret = msm_gem_vaddr_locked(obj);
  305. mutex_unlock(&obj->dev->struct_mutex);
  306. return ret;
  307. }
  308. int msm_gem_queue_inactive_work(struct drm_gem_object *obj,
  309. struct work_struct *work)
  310. {
  311. struct drm_device *dev = obj->dev;
  312. struct msm_drm_private *priv = dev->dev_private;
  313. struct msm_gem_object *msm_obj = to_msm_bo(obj);
  314. int ret = 0;
  315. mutex_lock(&dev->struct_mutex);
  316. if (!list_empty(&work->entry)) {
  317. ret = -EINVAL;
  318. } else if (is_active(msm_obj)) {
  319. list_add_tail(&work->entry, &msm_obj->inactive_work);
  320. } else {
  321. queue_work(priv->wq, work);
  322. }
  323. mutex_unlock(&dev->struct_mutex);
  324. return ret;
  325. }
  326. void msm_gem_move_to_active(struct drm_gem_object *obj,
  327. struct msm_gpu *gpu, bool write, uint32_t fence)
  328. {
  329. struct msm_gem_object *msm_obj = to_msm_bo(obj);
  330. msm_obj->gpu = gpu;
  331. if (write)
  332. msm_obj->write_fence = fence;
  333. else
  334. msm_obj->read_fence = fence;
  335. list_del_init(&msm_obj->mm_list);
  336. list_add_tail(&msm_obj->mm_list, &gpu->active_list);
  337. }
  338. void msm_gem_move_to_inactive(struct drm_gem_object *obj)
  339. {
  340. struct drm_device *dev = obj->dev;
  341. struct msm_drm_private *priv = dev->dev_private;
  342. struct msm_gem_object *msm_obj = to_msm_bo(obj);
  343. WARN_ON(!mutex_is_locked(&dev->struct_mutex));
  344. msm_obj->gpu = NULL;
  345. msm_obj->read_fence = 0;
  346. msm_obj->write_fence = 0;
  347. list_del_init(&msm_obj->mm_list);
  348. list_add_tail(&msm_obj->mm_list, &priv->inactive_list);
  349. while (!list_empty(&msm_obj->inactive_work)) {
  350. struct work_struct *work;
  351. work = list_first_entry(&msm_obj->inactive_work,
  352. struct work_struct, entry);
  353. list_del_init(&work->entry);
  354. queue_work(priv->wq, work);
  355. }
  356. }
  357. int msm_gem_cpu_prep(struct drm_gem_object *obj, uint32_t op,
  358. struct timespec *timeout)
  359. {
  360. struct drm_device *dev = obj->dev;
  361. struct msm_gem_object *msm_obj = to_msm_bo(obj);
  362. int ret = 0;
  363. if (is_active(msm_obj) && !(op & MSM_PREP_NOSYNC)) {
  364. uint32_t fence = 0;
  365. if (op & MSM_PREP_READ)
  366. fence = msm_obj->write_fence;
  367. if (op & MSM_PREP_WRITE)
  368. fence = max(fence, msm_obj->read_fence);
  369. ret = msm_wait_fence_interruptable(dev, fence, timeout);
  370. }
  371. /* TODO cache maintenance */
  372. return ret;
  373. }
  /*
   * Counterpart of msm_gem_cpu_prep(); currently does nothing and always
   * returns 0.
   */
  int msm_gem_cpu_fini(struct drm_gem_object *obj)
  {
      const int ret = 0;

      /* TODO cache maintenance */

      return ret;
  }
  379. #ifdef CONFIG_DEBUG_FS
  380. void msm_gem_describe(struct drm_gem_object *obj, struct seq_file *m)
  381. {
  382. struct drm_device *dev = obj->dev;
  383. struct msm_gem_object *msm_obj = to_msm_bo(obj);
  384. uint64_t off = drm_vma_node_start(&obj->vma_node);
  385. WARN_ON(!mutex_is_locked(&dev->struct_mutex));
  386. seq_printf(m, "%08x: %c(r=%u,w=%u) %2d (%2d) %08llx %p %d\n",
  387. msm_obj->flags, is_active(msm_obj) ? 'A' : 'I',
  388. msm_obj->read_fence, msm_obj->write_fence,
  389. obj->name, obj->refcount.refcount.counter,
  390. off, msm_obj->vaddr, obj->size);
  391. }
  392. void msm_gem_describe_objects(struct list_head *list, struct seq_file *m)
  393. {
  394. struct msm_gem_object *msm_obj;
  395. int count = 0;
  396. size_t size = 0;
  397. list_for_each_entry(msm_obj, list, mm_list) {
  398. struct drm_gem_object *obj = &msm_obj->base;
  399. seq_printf(m, " ");
  400. msm_gem_describe(obj, m);
  401. count++;
  402. size += obj->size;
  403. }
  404. seq_printf(m, "Total %d objects, %zu bytes\n", count, size);
  405. }
  406. #endif
  407. void msm_gem_free_object(struct drm_gem_object *obj)
  408. {
  409. struct drm_device *dev = obj->dev;
  410. struct msm_gem_object *msm_obj = to_msm_bo(obj);
  411. int id;
  412. WARN_ON(!mutex_is_locked(&dev->struct_mutex));
  413. /* object should not be on active list: */
  414. WARN_ON(is_active(msm_obj));
  415. list_del(&msm_obj->mm_list);
  416. for (id = 0; id < ARRAY_SIZE(msm_obj->domain); id++) {
  417. if (msm_obj->domain[id].iova) {
  418. struct msm_drm_private *priv = obj->dev->dev_private;
  419. uint32_t offset = (uint32_t)mmap_offset(obj);
  420. unmap_range(priv->iommus[id], offset,
  421. msm_obj->sgt, obj->size);
  422. }
  423. }
  424. drm_gem_free_mmap_offset(obj);
  425. if (msm_obj->vaddr)
  426. vunmap(msm_obj->vaddr);
  427. put_pages(obj);
  428. if (msm_obj->resv == &msm_obj->_resv)
  429. reservation_object_fini(msm_obj->resv);
  430. drm_gem_object_release(obj);
  431. kfree(msm_obj);
  432. }
  433. /* convenience method to construct a GEM buffer object, and userspace handle */
  434. int msm_gem_new_handle(struct drm_device *dev, struct drm_file *file,
  435. uint32_t size, uint32_t flags, uint32_t *handle)
  436. {
  437. struct drm_gem_object *obj;
  438. int ret;
  439. ret = mutex_lock_interruptible(&dev->struct_mutex);
  440. if (ret)
  441. return ret;
  442. obj = msm_gem_new(dev, size, flags);
  443. mutex_unlock(&dev->struct_mutex);
  444. if (IS_ERR(obj))
  445. return PTR_ERR(obj);
  446. ret = drm_gem_handle_create(file, obj, handle);
  447. /* drop reference from allocate - handle holds it now */
  448. drm_gem_object_unreference_unlocked(obj);
  449. return ret;
  450. }
  451. struct drm_gem_object *msm_gem_new(struct drm_device *dev,
  452. uint32_t size, uint32_t flags)
  453. {
  454. struct msm_drm_private *priv = dev->dev_private;
  455. struct msm_gem_object *msm_obj;
  456. struct drm_gem_object *obj = NULL;
  457. int ret;
  458. WARN_ON(!mutex_is_locked(&dev->struct_mutex));
  459. size = PAGE_ALIGN(size);
  460. switch (flags & MSM_BO_CACHE_MASK) {
  461. case MSM_BO_UNCACHED:
  462. case MSM_BO_CACHED:
  463. case MSM_BO_WC:
  464. break;
  465. default:
  466. dev_err(dev->dev, "invalid cache flag: %x\n",
  467. (flags & MSM_BO_CACHE_MASK));
  468. ret = -EINVAL;
  469. goto fail;
  470. }
  471. msm_obj = kzalloc(sizeof(*msm_obj), GFP_KERNEL);
  472. if (!msm_obj) {
  473. ret = -ENOMEM;
  474. goto fail;
  475. }
  476. obj = &msm_obj->base;
  477. ret = drm_gem_object_init(dev, obj, size);
  478. if (ret)
  479. goto fail;
  480. msm_obj->flags = flags;
  481. msm_obj->resv = &msm_obj->_resv;
  482. reservation_object_init(msm_obj->resv);
  483. INIT_LIST_HEAD(&msm_obj->submit_entry);
  484. INIT_LIST_HEAD(&msm_obj->inactive_work);
  485. list_add_tail(&msm_obj->mm_list, &priv->inactive_list);
  486. return obj;
  487. fail:
  488. if (obj)
  489. drm_gem_object_unreference_unlocked(obj);
  490. return ERR_PTR(ret);
  491. }