msm_gem.c 15 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611
  1. /*
  2. * Copyright (C) 2013 Red Hat
  3. * Author: Rob Clark <robdclark@gmail.com>
  4. *
  5. * This program is free software; you can redistribute it and/or modify it
  6. * under the terms of the GNU General Public License version 2 as published by
  7. * the Free Software Foundation.
  8. *
  9. * This program is distributed in the hope that it will be useful, but WITHOUT
  10. * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
  11. * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
  12. * more details.
  13. *
  14. * You should have received a copy of the GNU General Public License along with
  15. * this program. If not, see <http://www.gnu.org/licenses/>.
  16. */
  17. #include <linux/spinlock.h>
  18. #include <linux/shmem_fs.h>
  19. #include "msm_drv.h"
  20. #include "msm_gem.h"
  21. #include "msm_gpu.h"
  22. /* called with dev->struct_mutex held */
  23. static struct page **get_pages(struct drm_gem_object *obj)
  24. {
  25. struct msm_gem_object *msm_obj = to_msm_bo(obj);
  26. if (!msm_obj->pages) {
  27. struct drm_device *dev = obj->dev;
  28. struct page **p = drm_gem_get_pages(obj, 0);
  29. int npages = obj->size >> PAGE_SHIFT;
  30. if (IS_ERR(p)) {
  31. dev_err(dev->dev, "could not get pages: %ld\n",
  32. PTR_ERR(p));
  33. return p;
  34. }
  35. msm_obj->sgt = drm_prime_pages_to_sg(p, npages);
  36. if (IS_ERR(msm_obj->sgt)) {
  37. dev_err(dev->dev, "failed to allocate sgt\n");
  38. return ERR_CAST(msm_obj->sgt);
  39. }
  40. msm_obj->pages = p;
  41. /* For non-cached buffers, ensure the new pages are clean
  42. * because display controller, GPU, etc. are not coherent:
  43. */
  44. if (msm_obj->flags & (MSM_BO_WC|MSM_BO_UNCACHED))
  45. dma_map_sg(dev->dev, msm_obj->sgt->sgl,
  46. msm_obj->sgt->nents, DMA_BIDIRECTIONAL);
  47. }
  48. return msm_obj->pages;
  49. }
  50. static void put_pages(struct drm_gem_object *obj)
  51. {
  52. struct msm_gem_object *msm_obj = to_msm_bo(obj);
  53. if (msm_obj->pages) {
  54. /* For non-cached buffers, ensure the new pages are clean
  55. * because display controller, GPU, etc. are not coherent:
  56. */
  57. if (msm_obj->flags & (MSM_BO_WC|MSM_BO_UNCACHED))
  58. dma_unmap_sg(obj->dev->dev, msm_obj->sgt->sgl,
  59. msm_obj->sgt->nents, DMA_BIDIRECTIONAL);
  60. sg_free_table(msm_obj->sgt);
  61. kfree(msm_obj->sgt);
  62. drm_gem_put_pages(obj, msm_obj->pages, true, false);
  63. msm_obj->pages = NULL;
  64. }
  65. }
  66. int msm_gem_mmap_obj(struct drm_gem_object *obj,
  67. struct vm_area_struct *vma)
  68. {
  69. struct msm_gem_object *msm_obj = to_msm_bo(obj);
  70. vma->vm_flags &= ~VM_PFNMAP;
  71. vma->vm_flags |= VM_MIXEDMAP;
  72. if (msm_obj->flags & MSM_BO_WC) {
  73. vma->vm_page_prot = pgprot_writecombine(vm_get_page_prot(vma->vm_flags));
  74. } else if (msm_obj->flags & MSM_BO_UNCACHED) {
  75. vma->vm_page_prot = pgprot_noncached(vm_get_page_prot(vma->vm_flags));
  76. } else {
  77. /*
  78. * Shunt off cached objs to shmem file so they have their own
  79. * address_space (so unmap_mapping_range does what we want,
  80. * in particular in the case of mmap'd dmabufs)
  81. */
  82. fput(vma->vm_file);
  83. get_file(obj->filp);
  84. vma->vm_pgoff = 0;
  85. vma->vm_file = obj->filp;
  86. vma->vm_page_prot = vm_get_page_prot(vma->vm_flags);
  87. }
  88. return 0;
  89. }
  90. int msm_gem_mmap(struct file *filp, struct vm_area_struct *vma)
  91. {
  92. int ret;
  93. ret = drm_gem_mmap(filp, vma);
  94. if (ret) {
  95. DBG("mmap failed: %d", ret);
  96. return ret;
  97. }
  98. return msm_gem_mmap_obj(vma->vm_private_data, vma);
  99. }
  100. int msm_gem_fault(struct vm_area_struct *vma, struct vm_fault *vmf)
  101. {
  102. struct drm_gem_object *obj = vma->vm_private_data;
  103. struct msm_gem_object *msm_obj = to_msm_bo(obj);
  104. struct drm_device *dev = obj->dev;
  105. struct page **pages;
  106. unsigned long pfn;
  107. pgoff_t pgoff;
  108. int ret;
  109. /* Make sure we don't parallel update on a fault, nor move or remove
  110. * something from beneath our feet
  111. */
  112. ret = mutex_lock_interruptible(&dev->struct_mutex);
  113. if (ret)
  114. goto out;
  115. /* make sure we have pages attached now */
  116. pages = get_pages(obj);
  117. if (IS_ERR(pages)) {
  118. ret = PTR_ERR(pages);
  119. goto out_unlock;
  120. }
  121. /* We don't use vmf->pgoff since that has the fake offset: */
  122. pgoff = ((unsigned long)vmf->virtual_address -
  123. vma->vm_start) >> PAGE_SHIFT;
  124. pfn = page_to_pfn(msm_obj->pages[pgoff]);
  125. VERB("Inserting %p pfn %lx, pa %lx", vmf->virtual_address,
  126. pfn, pfn << PAGE_SHIFT);
  127. ret = vm_insert_mixed(vma, (unsigned long)vmf->virtual_address, pfn);
  128. out_unlock:
  129. mutex_unlock(&dev->struct_mutex);
  130. out:
  131. switch (ret) {
  132. case -EAGAIN:
  133. case 0:
  134. case -ERESTARTSYS:
  135. case -EINTR:
  136. return VM_FAULT_NOPAGE;
  137. case -ENOMEM:
  138. return VM_FAULT_OOM;
  139. default:
  140. return VM_FAULT_SIGBUS;
  141. }
  142. }
  143. /** get mmap offset */
  144. static uint64_t mmap_offset(struct drm_gem_object *obj)
  145. {
  146. struct drm_device *dev = obj->dev;
  147. int ret;
  148. WARN_ON(!mutex_is_locked(&dev->struct_mutex));
  149. /* Make it mmapable */
  150. ret = drm_gem_create_mmap_offset(obj);
  151. if (ret) {
  152. dev_err(dev->dev, "could not allocate mmap offset\n");
  153. return 0;
  154. }
  155. return drm_vma_node_offset_addr(&obj->vma_node);
  156. }
  157. uint64_t msm_gem_mmap_offset(struct drm_gem_object *obj)
  158. {
  159. uint64_t offset;
  160. mutex_lock(&obj->dev->struct_mutex);
  161. offset = mmap_offset(obj);
  162. mutex_unlock(&obj->dev->struct_mutex);
  163. return offset;
  164. }
  165. /* helpers for dealing w/ iommu: */
  166. static int map_range(struct iommu_domain *domain, unsigned int iova,
  167. struct sg_table *sgt, unsigned int len, int prot)
  168. {
  169. struct scatterlist *sg;
  170. unsigned int da = iova;
  171. unsigned int i, j;
  172. int ret;
  173. if (!domain || !sgt)
  174. return -EINVAL;
  175. for_each_sg(sgt->sgl, sg, sgt->nents, i) {
  176. u32 pa = sg_phys(sg) - sg->offset;
  177. size_t bytes = sg->length + sg->offset;
  178. VERB("map[%d]: %08x %08x(%x)", i, iova, pa, bytes);
  179. ret = iommu_map(domain, da, pa, bytes, prot);
  180. if (ret)
  181. goto fail;
  182. da += bytes;
  183. }
  184. return 0;
  185. fail:
  186. da = iova;
  187. for_each_sg(sgt->sgl, sg, i, j) {
  188. size_t bytes = sg->length + sg->offset;
  189. iommu_unmap(domain, da, bytes);
  190. da += bytes;
  191. }
  192. return ret;
  193. }
  194. static void unmap_range(struct iommu_domain *domain, unsigned int iova,
  195. struct sg_table *sgt, unsigned int len)
  196. {
  197. struct scatterlist *sg;
  198. unsigned int da = iova;
  199. int i;
  200. for_each_sg(sgt->sgl, sg, sgt->nents, i) {
  201. size_t bytes = sg->length + sg->offset;
  202. size_t unmapped;
  203. unmapped = iommu_unmap(domain, da, bytes);
  204. if (unmapped < bytes)
  205. break;
  206. VERB("unmap[%d]: %08x(%x)", i, iova, bytes);
  207. BUG_ON(!IS_ALIGNED(bytes, PAGE_SIZE));
  208. da += bytes;
  209. }
  210. }
  211. /* should be called under struct_mutex.. although it can be called
  212. * from atomic context without struct_mutex to acquire an extra
  213. * iova ref if you know one is already held.
  214. *
  215. * That means when I do eventually need to add support for unpinning
  216. * the refcnt counter needs to be atomic_t.
  217. */
  218. int msm_gem_get_iova_locked(struct drm_gem_object *obj, int id,
  219. uint32_t *iova)
  220. {
  221. struct msm_gem_object *msm_obj = to_msm_bo(obj);
  222. int ret = 0;
  223. if (!msm_obj->domain[id].iova) {
  224. struct msm_drm_private *priv = obj->dev->dev_private;
  225. uint32_t offset = (uint32_t)mmap_offset(obj);
  226. struct page **pages;
  227. pages = get_pages(obj);
  228. if (IS_ERR(pages))
  229. return PTR_ERR(pages);
  230. // XXX ideally we would not map buffers writable when not needed...
  231. ret = map_range(priv->iommus[id], offset, msm_obj->sgt,
  232. obj->size, IOMMU_READ | IOMMU_WRITE);
  233. msm_obj->domain[id].iova = offset;
  234. }
  235. if (!ret)
  236. *iova = msm_obj->domain[id].iova;
  237. return ret;
  238. }
  239. int msm_gem_get_iova(struct drm_gem_object *obj, int id, uint32_t *iova)
  240. {
  241. int ret;
  242. mutex_lock(&obj->dev->struct_mutex);
  243. ret = msm_gem_get_iova_locked(obj, id, iova);
  244. mutex_unlock(&obj->dev->struct_mutex);
  245. return ret;
  246. }
  /*
   * msm_gem_put_iova() - release an iova reference.
   *
   * Currently a stub that does nothing.
   */
  void msm_gem_put_iova(struct drm_gem_object *obj, int id)
  {
  	/*
  	 * XXX TODO ..
  	 * NOTE: probably don't need a _locked() version.. we wouldn't
  	 * normally unmap here, but instead just mark that it could be
  	 * unmapped (if the iova refcnt drops to zero), but then later
  	 * if another _get_iova_locked() fails we can start unmapping
  	 * things that are no longer needed..
  	 */
  }
  256. int msm_gem_dumb_create(struct drm_file *file, struct drm_device *dev,
  257. struct drm_mode_create_dumb *args)
  258. {
  259. args->pitch = align_pitch(args->width, args->bpp);
  260. args->size = PAGE_ALIGN(args->pitch * args->height);
  261. return msm_gem_new_handle(dev, file, args->size,
  262. MSM_BO_SCANOUT | MSM_BO_WC, &args->handle);
  263. }
  264. int msm_gem_dumb_destroy(struct drm_file *file, struct drm_device *dev,
  265. uint32_t handle)
  266. {
  267. /* No special work needed, drop the reference and see what falls out */
  268. return drm_gem_handle_delete(file, handle);
  269. }
  270. int msm_gem_dumb_map_offset(struct drm_file *file, struct drm_device *dev,
  271. uint32_t handle, uint64_t *offset)
  272. {
  273. struct drm_gem_object *obj;
  274. int ret = 0;
  275. /* GEM does all our handle to object mapping */
  276. obj = drm_gem_object_lookup(dev, file, handle);
  277. if (obj == NULL) {
  278. ret = -ENOENT;
  279. goto fail;
  280. }
  281. *offset = msm_gem_mmap_offset(obj);
  282. drm_gem_object_unreference_unlocked(obj);
  283. fail:
  284. return ret;
  285. }
  286. void *msm_gem_vaddr_locked(struct drm_gem_object *obj)
  287. {
  288. struct msm_gem_object *msm_obj = to_msm_bo(obj);
  289. WARN_ON(!mutex_is_locked(&obj->dev->struct_mutex));
  290. if (!msm_obj->vaddr) {
  291. struct page **pages = get_pages(obj);
  292. if (IS_ERR(pages))
  293. return ERR_CAST(pages);
  294. msm_obj->vaddr = vmap(pages, obj->size >> PAGE_SHIFT,
  295. VM_MAP, pgprot_writecombine(PAGE_KERNEL));
  296. }
  297. return msm_obj->vaddr;
  298. }
  299. void *msm_gem_vaddr(struct drm_gem_object *obj)
  300. {
  301. void *ret;
  302. mutex_lock(&obj->dev->struct_mutex);
  303. ret = msm_gem_vaddr_locked(obj);
  304. mutex_unlock(&obj->dev->struct_mutex);
  305. return ret;
  306. }
  307. int msm_gem_queue_inactive_work(struct drm_gem_object *obj,
  308. struct work_struct *work)
  309. {
  310. struct drm_device *dev = obj->dev;
  311. struct msm_drm_private *priv = dev->dev_private;
  312. struct msm_gem_object *msm_obj = to_msm_bo(obj);
  313. int ret = 0;
  314. mutex_lock(&dev->struct_mutex);
  315. if (!list_empty(&work->entry)) {
  316. ret = -EINVAL;
  317. } else if (is_active(msm_obj)) {
  318. list_add_tail(&work->entry, &msm_obj->inactive_work);
  319. } else {
  320. queue_work(priv->wq, work);
  321. }
  322. mutex_unlock(&dev->struct_mutex);
  323. return ret;
  324. }
  325. void msm_gem_move_to_active(struct drm_gem_object *obj,
  326. struct msm_gpu *gpu, bool write, uint32_t fence)
  327. {
  328. struct msm_gem_object *msm_obj = to_msm_bo(obj);
  329. msm_obj->gpu = gpu;
  330. if (write)
  331. msm_obj->write_fence = fence;
  332. else
  333. msm_obj->read_fence = fence;
  334. list_del_init(&msm_obj->mm_list);
  335. list_add_tail(&msm_obj->mm_list, &gpu->active_list);
  336. }
  337. void msm_gem_move_to_inactive(struct drm_gem_object *obj)
  338. {
  339. struct drm_device *dev = obj->dev;
  340. struct msm_drm_private *priv = dev->dev_private;
  341. struct msm_gem_object *msm_obj = to_msm_bo(obj);
  342. WARN_ON(!mutex_is_locked(&dev->struct_mutex));
  343. msm_obj->gpu = NULL;
  344. msm_obj->read_fence = 0;
  345. msm_obj->write_fence = 0;
  346. list_del_init(&msm_obj->mm_list);
  347. list_add_tail(&msm_obj->mm_list, &priv->inactive_list);
  348. while (!list_empty(&msm_obj->inactive_work)) {
  349. struct work_struct *work;
  350. work = list_first_entry(&msm_obj->inactive_work,
  351. struct work_struct, entry);
  352. list_del_init(&work->entry);
  353. queue_work(priv->wq, work);
  354. }
  355. }
  356. int msm_gem_cpu_prep(struct drm_gem_object *obj, uint32_t op,
  357. struct timespec *timeout)
  358. {
  359. struct drm_device *dev = obj->dev;
  360. struct msm_gem_object *msm_obj = to_msm_bo(obj);
  361. int ret = 0;
  362. if (is_active(msm_obj)) {
  363. uint32_t fence = 0;
  364. if (op & MSM_PREP_READ)
  365. fence = msm_obj->write_fence;
  366. if (op & MSM_PREP_WRITE)
  367. fence = max(fence, msm_obj->read_fence);
  368. if (op & MSM_PREP_NOSYNC)
  369. timeout = NULL;
  370. ret = msm_wait_fence_interruptable(dev, fence, timeout);
  371. }
  372. /* TODO cache maintenance */
  373. return ret;
  374. }
  /*
   * msm_gem_cpu_fini() - finish CPU access to an object.
   *
   * Currently a stub: does nothing and always returns 0.
   */
  int msm_gem_cpu_fini(struct drm_gem_object *obj)
  {
  	/* TODO cache maintenance */
  	return 0;
  }
  380. #ifdef CONFIG_DEBUG_FS
  381. void msm_gem_describe(struct drm_gem_object *obj, struct seq_file *m)
  382. {
  383. struct drm_device *dev = obj->dev;
  384. struct msm_gem_object *msm_obj = to_msm_bo(obj);
  385. uint64_t off = drm_vma_node_start(&obj->vma_node);
  386. WARN_ON(!mutex_is_locked(&dev->struct_mutex));
  387. seq_printf(m, "%08x: %c(r=%u,w=%u) %2d (%2d) %08llx %p %d\n",
  388. msm_obj->flags, is_active(msm_obj) ? 'A' : 'I',
  389. msm_obj->read_fence, msm_obj->write_fence,
  390. obj->name, obj->refcount.refcount.counter,
  391. off, msm_obj->vaddr, obj->size);
  392. }
  393. void msm_gem_describe_objects(struct list_head *list, struct seq_file *m)
  394. {
  395. struct msm_gem_object *msm_obj;
  396. int count = 0;
  397. size_t size = 0;
  398. list_for_each_entry(msm_obj, list, mm_list) {
  399. struct drm_gem_object *obj = &msm_obj->base;
  400. seq_printf(m, " ");
  401. msm_gem_describe(obj, m);
  402. count++;
  403. size += obj->size;
  404. }
  405. seq_printf(m, "Total %d objects, %zu bytes\n", count, size);
  406. }
  407. #endif
  408. void msm_gem_free_object(struct drm_gem_object *obj)
  409. {
  410. struct drm_device *dev = obj->dev;
  411. struct msm_gem_object *msm_obj = to_msm_bo(obj);
  412. int id;
  413. WARN_ON(!mutex_is_locked(&dev->struct_mutex));
  414. /* object should not be on active list: */
  415. WARN_ON(is_active(msm_obj));
  416. list_del(&msm_obj->mm_list);
  417. for (id = 0; id < ARRAY_SIZE(msm_obj->domain); id++) {
  418. if (msm_obj->domain[id].iova) {
  419. struct msm_drm_private *priv = obj->dev->dev_private;
  420. uint32_t offset = (uint32_t)mmap_offset(obj);
  421. unmap_range(priv->iommus[id], offset,
  422. msm_obj->sgt, obj->size);
  423. }
  424. }
  425. drm_gem_free_mmap_offset(obj);
  426. if (msm_obj->vaddr)
  427. vunmap(msm_obj->vaddr);
  428. put_pages(obj);
  429. if (msm_obj->resv == &msm_obj->_resv)
  430. reservation_object_fini(msm_obj->resv);
  431. drm_gem_object_release(obj);
  432. kfree(msm_obj);
  433. }
  434. /* convenience method to construct a GEM buffer object, and userspace handle */
  435. int msm_gem_new_handle(struct drm_device *dev, struct drm_file *file,
  436. uint32_t size, uint32_t flags, uint32_t *handle)
  437. {
  438. struct drm_gem_object *obj;
  439. int ret;
  440. ret = mutex_lock_interruptible(&dev->struct_mutex);
  441. if (ret)
  442. return ret;
  443. obj = msm_gem_new(dev, size, flags);
  444. mutex_unlock(&dev->struct_mutex);
  445. if (IS_ERR(obj))
  446. return PTR_ERR(obj);
  447. ret = drm_gem_handle_create(file, obj, handle);
  448. /* drop reference from allocate - handle holds it now */
  449. drm_gem_object_unreference_unlocked(obj);
  450. return ret;
  451. }
  452. struct drm_gem_object *msm_gem_new(struct drm_device *dev,
  453. uint32_t size, uint32_t flags)
  454. {
  455. struct msm_drm_private *priv = dev->dev_private;
  456. struct msm_gem_object *msm_obj;
  457. struct drm_gem_object *obj = NULL;
  458. int ret;
  459. WARN_ON(!mutex_is_locked(&dev->struct_mutex));
  460. size = PAGE_ALIGN(size);
  461. switch (flags & MSM_BO_CACHE_MASK) {
  462. case MSM_BO_UNCACHED:
  463. case MSM_BO_CACHED:
  464. case MSM_BO_WC:
  465. break;
  466. default:
  467. dev_err(dev->dev, "invalid cache flag: %x\n",
  468. (flags & MSM_BO_CACHE_MASK));
  469. ret = -EINVAL;
  470. goto fail;
  471. }
  472. msm_obj = kzalloc(sizeof(*msm_obj), GFP_KERNEL);
  473. if (!msm_obj) {
  474. ret = -ENOMEM;
  475. goto fail;
  476. }
  477. obj = &msm_obj->base;
  478. ret = drm_gem_object_init(dev, obj, size);
  479. if (ret)
  480. goto fail;
  481. msm_obj->flags = flags;
  482. msm_obj->resv = &msm_obj->_resv;
  483. reservation_object_init(msm_obj->resv);
  484. INIT_LIST_HEAD(&msm_obj->submit_entry);
  485. INIT_LIST_HEAD(&msm_obj->inactive_work);
  486. list_add_tail(&msm_obj->mm_list, &priv->inactive_list);
  487. return obj;
  488. fail:
  489. if (obj)
  490. drm_gem_object_unreference_unlocked(obj);
  491. return ERR_PTR(ret);
  492. }