vmwgfx_fifo.c 15 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537
  1. /**************************************************************************
  2. *
  3. * Copyright © 2009 VMware, Inc., Palo Alto, CA., USA
  4. * All Rights Reserved.
  5. *
  6. * Permission is hereby granted, free of charge, to any person obtaining a
  7. * copy of this software and associated documentation files (the
  8. * "Software"), to deal in the Software without restriction, including
  9. * without limitation the rights to use, copy, modify, merge, publish,
  10. * distribute, sub license, and/or sell copies of the Software, and to
  11. * permit persons to whom the Software is furnished to do so, subject to
  12. * the following conditions:
  13. *
  14. * The above copyright notice and this permission notice (including the
  15. * next paragraph) shall be included in all copies or substantial portions
  16. * of the Software.
  17. *
  18. * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
  19. * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
  20. * FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL
  21. * THE COPYRIGHT HOLDERS, AUTHORS AND/OR ITS SUPPLIERS BE LIABLE FOR ANY CLAIM,
  22. * DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR
  23. * OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE
  24. * USE OR OTHER DEALINGS IN THE SOFTWARE.
  25. *
  26. **************************************************************************/
  27. #include "vmwgfx_drv.h"
  28. #include "drmP.h"
  29. #include "ttm/ttm_placement.h"
  30. bool vmw_fifo_have_3d(struct vmw_private *dev_priv)
  31. {
  32. __le32 __iomem *fifo_mem = dev_priv->mmio_virt;
  33. uint32_t fifo_min, hwversion;
  34. fifo_min = ioread32(fifo_mem + SVGA_FIFO_MIN);
  35. if (fifo_min <= SVGA_FIFO_3D_HWVERSION * sizeof(unsigned int))
  36. return false;
  37. hwversion = ioread32(fifo_mem + SVGA_FIFO_3D_HWVERSION);
  38. if (hwversion == 0)
  39. return false;
  40. if (hwversion < SVGA3D_HWVERSION_WS65_B1)
  41. return false;
  42. return true;
  43. }
  44. int vmw_fifo_init(struct vmw_private *dev_priv, struct vmw_fifo_state *fifo)
  45. {
  46. __le32 __iomem *fifo_mem = dev_priv->mmio_virt;
  47. uint32_t max;
  48. uint32_t min;
  49. uint32_t dummy;
  50. int ret;
  51. fifo->static_buffer_size = VMWGFX_FIFO_STATIC_SIZE;
  52. fifo->static_buffer = vmalloc(fifo->static_buffer_size);
  53. if (unlikely(fifo->static_buffer == NULL))
  54. return -ENOMEM;
  55. fifo->last_buffer_size = VMWGFX_FIFO_STATIC_SIZE;
  56. fifo->last_data_size = 0;
  57. fifo->last_buffer_add = false;
  58. fifo->last_buffer = vmalloc(fifo->last_buffer_size);
  59. if (unlikely(fifo->last_buffer == NULL)) {
  60. ret = -ENOMEM;
  61. goto out_err;
  62. }
  63. fifo->dynamic_buffer = NULL;
  64. fifo->reserved_size = 0;
  65. fifo->using_bounce_buffer = false;
  66. init_rwsem(&fifo->rwsem);
  67. /*
  68. * Allow mapping the first page read-only to user-space.
  69. */
  70. DRM_INFO("width %d\n", vmw_read(dev_priv, SVGA_REG_WIDTH));
  71. DRM_INFO("height %d\n", vmw_read(dev_priv, SVGA_REG_HEIGHT));
  72. DRM_INFO("bpp %d\n", vmw_read(dev_priv, SVGA_REG_BITS_PER_PIXEL));
  73. mutex_lock(&dev_priv->hw_mutex);
  74. dev_priv->enable_state = vmw_read(dev_priv, SVGA_REG_ENABLE);
  75. dev_priv->config_done_state = vmw_read(dev_priv, SVGA_REG_CONFIG_DONE);
  76. vmw_write(dev_priv, SVGA_REG_ENABLE, 1);
  77. min = 4;
  78. if (dev_priv->capabilities & SVGA_CAP_EXTENDED_FIFO)
  79. min = vmw_read(dev_priv, SVGA_REG_MEM_REGS);
  80. min <<= 2;
  81. if (min < PAGE_SIZE)
  82. min = PAGE_SIZE;
  83. iowrite32(min, fifo_mem + SVGA_FIFO_MIN);
  84. iowrite32(dev_priv->mmio_size, fifo_mem + SVGA_FIFO_MAX);
  85. wmb();
  86. iowrite32(min, fifo_mem + SVGA_FIFO_NEXT_CMD);
  87. iowrite32(min, fifo_mem + SVGA_FIFO_STOP);
  88. iowrite32(0, fifo_mem + SVGA_FIFO_BUSY);
  89. mb();
  90. vmw_write(dev_priv, SVGA_REG_CONFIG_DONE, 1);
  91. mutex_unlock(&dev_priv->hw_mutex);
  92. max = ioread32(fifo_mem + SVGA_FIFO_MAX);
  93. min = ioread32(fifo_mem + SVGA_FIFO_MIN);
  94. fifo->capabilities = ioread32(fifo_mem + SVGA_FIFO_CAPABILITIES);
  95. DRM_INFO("Fifo max 0x%08x min 0x%08x cap 0x%08x\n",
  96. (unsigned int) max,
  97. (unsigned int) min,
  98. (unsigned int) fifo->capabilities);
  99. dev_priv->fence_seq = dev_priv->last_read_sequence;
  100. iowrite32(dev_priv->last_read_sequence, fifo_mem + SVGA_FIFO_FENCE);
  101. return vmw_fifo_send_fence(dev_priv, &dummy);
  102. out_err:
  103. vfree(fifo->static_buffer);
  104. fifo->static_buffer = NULL;
  105. return ret;
  106. }
  107. void vmw_fifo_ping_host(struct vmw_private *dev_priv, uint32_t reason)
  108. {
  109. __le32 __iomem *fifo_mem = dev_priv->mmio_virt;
  110. mutex_lock(&dev_priv->hw_mutex);
  111. if (unlikely(ioread32(fifo_mem + SVGA_FIFO_BUSY) == 0)) {
  112. iowrite32(1, fifo_mem + SVGA_FIFO_BUSY);
  113. vmw_write(dev_priv, SVGA_REG_SYNC, reason);
  114. }
  115. mutex_unlock(&dev_priv->hw_mutex);
  116. }
  117. void vmw_fifo_release(struct vmw_private *dev_priv, struct vmw_fifo_state *fifo)
  118. {
  119. __le32 __iomem *fifo_mem = dev_priv->mmio_virt;
  120. mutex_lock(&dev_priv->hw_mutex);
  121. while (vmw_read(dev_priv, SVGA_REG_BUSY) != 0)
  122. vmw_write(dev_priv, SVGA_REG_SYNC, SVGA_SYNC_GENERIC);
  123. dev_priv->last_read_sequence = ioread32(fifo_mem + SVGA_FIFO_FENCE);
  124. vmw_write(dev_priv, SVGA_REG_CONFIG_DONE,
  125. dev_priv->config_done_state);
  126. vmw_write(dev_priv, SVGA_REG_ENABLE,
  127. dev_priv->enable_state);
  128. mutex_unlock(&dev_priv->hw_mutex);
  129. if (likely(fifo->last_buffer != NULL)) {
  130. vfree(fifo->last_buffer);
  131. fifo->last_buffer = NULL;
  132. }
  133. if (likely(fifo->static_buffer != NULL)) {
  134. vfree(fifo->static_buffer);
  135. fifo->static_buffer = NULL;
  136. }
  137. if (likely(fifo->dynamic_buffer != NULL)) {
  138. vfree(fifo->dynamic_buffer);
  139. fifo->dynamic_buffer = NULL;
  140. }
  141. }
  142. static bool vmw_fifo_is_full(struct vmw_private *dev_priv, uint32_t bytes)
  143. {
  144. __le32 __iomem *fifo_mem = dev_priv->mmio_virt;
  145. uint32_t max = ioread32(fifo_mem + SVGA_FIFO_MAX);
  146. uint32_t next_cmd = ioread32(fifo_mem + SVGA_FIFO_NEXT_CMD);
  147. uint32_t min = ioread32(fifo_mem + SVGA_FIFO_MIN);
  148. uint32_t stop = ioread32(fifo_mem + SVGA_FIFO_STOP);
  149. return ((max - next_cmd) + (stop - min) <= bytes);
  150. }
  151. static int vmw_fifo_wait_noirq(struct vmw_private *dev_priv,
  152. uint32_t bytes, bool interruptible,
  153. unsigned long timeout)
  154. {
  155. int ret = 0;
  156. unsigned long end_jiffies = jiffies + timeout;
  157. DEFINE_WAIT(__wait);
  158. DRM_INFO("Fifo wait noirq.\n");
  159. for (;;) {
  160. prepare_to_wait(&dev_priv->fifo_queue, &__wait,
  161. (interruptible) ?
  162. TASK_INTERRUPTIBLE : TASK_UNINTERRUPTIBLE);
  163. if (!vmw_fifo_is_full(dev_priv, bytes))
  164. break;
  165. if (time_after_eq(jiffies, end_jiffies)) {
  166. ret = -EBUSY;
  167. DRM_ERROR("SVGA device lockup.\n");
  168. break;
  169. }
  170. schedule_timeout(1);
  171. if (interruptible && signal_pending(current)) {
  172. ret = -ERESTARTSYS;
  173. break;
  174. }
  175. }
  176. finish_wait(&dev_priv->fifo_queue, &__wait);
  177. wake_up_all(&dev_priv->fifo_queue);
  178. DRM_INFO("Fifo noirq exit.\n");
  179. return ret;
  180. }
  181. static int vmw_fifo_wait(struct vmw_private *dev_priv,
  182. uint32_t bytes, bool interruptible,
  183. unsigned long timeout)
  184. {
  185. long ret = 1L;
  186. unsigned long irq_flags;
  187. if (likely(!vmw_fifo_is_full(dev_priv, bytes)))
  188. return 0;
  189. vmw_fifo_ping_host(dev_priv, SVGA_SYNC_FIFOFULL);
  190. if (!(dev_priv->capabilities & SVGA_CAP_IRQMASK))
  191. return vmw_fifo_wait_noirq(dev_priv, bytes,
  192. interruptible, timeout);
  193. mutex_lock(&dev_priv->hw_mutex);
  194. if (atomic_add_return(1, &dev_priv->fifo_queue_waiters) > 0) {
  195. spin_lock_irqsave(&dev_priv->irq_lock, irq_flags);
  196. outl(SVGA_IRQFLAG_FIFO_PROGRESS,
  197. dev_priv->io_start + VMWGFX_IRQSTATUS_PORT);
  198. vmw_write(dev_priv, SVGA_REG_IRQMASK,
  199. vmw_read(dev_priv, SVGA_REG_IRQMASK) |
  200. SVGA_IRQFLAG_FIFO_PROGRESS);
  201. spin_unlock_irqrestore(&dev_priv->irq_lock, irq_flags);
  202. }
  203. mutex_unlock(&dev_priv->hw_mutex);
  204. if (interruptible)
  205. ret = wait_event_interruptible_timeout
  206. (dev_priv->fifo_queue,
  207. !vmw_fifo_is_full(dev_priv, bytes), timeout);
  208. else
  209. ret = wait_event_timeout
  210. (dev_priv->fifo_queue,
  211. !vmw_fifo_is_full(dev_priv, bytes), timeout);
  212. if (unlikely(ret == 0))
  213. ret = -EBUSY;
  214. else if (likely(ret > 0))
  215. ret = 0;
  216. mutex_lock(&dev_priv->hw_mutex);
  217. if (atomic_dec_and_test(&dev_priv->fifo_queue_waiters)) {
  218. spin_lock_irqsave(&dev_priv->irq_lock, irq_flags);
  219. vmw_write(dev_priv, SVGA_REG_IRQMASK,
  220. vmw_read(dev_priv, SVGA_REG_IRQMASK) &
  221. ~SVGA_IRQFLAG_FIFO_PROGRESS);
  222. spin_unlock_irqrestore(&dev_priv->irq_lock, irq_flags);
  223. }
  224. mutex_unlock(&dev_priv->hw_mutex);
  225. return ret;
  226. }
  227. void *vmw_fifo_reserve(struct vmw_private *dev_priv, uint32_t bytes)
  228. {
  229. struct vmw_fifo_state *fifo_state = &dev_priv->fifo;
  230. __le32 __iomem *fifo_mem = dev_priv->mmio_virt;
  231. uint32_t max;
  232. uint32_t min;
  233. uint32_t next_cmd;
  234. uint32_t reserveable = fifo_state->capabilities & SVGA_FIFO_CAP_RESERVE;
  235. int ret;
  236. down_write(&fifo_state->rwsem);
  237. max = ioread32(fifo_mem + SVGA_FIFO_MAX);
  238. min = ioread32(fifo_mem + SVGA_FIFO_MIN);
  239. next_cmd = ioread32(fifo_mem + SVGA_FIFO_NEXT_CMD);
  240. if (unlikely(bytes >= (max - min)))
  241. goto out_err;
  242. BUG_ON(fifo_state->reserved_size != 0);
  243. BUG_ON(fifo_state->dynamic_buffer != NULL);
  244. fifo_state->reserved_size = bytes;
  245. while (1) {
  246. uint32_t stop = ioread32(fifo_mem + SVGA_FIFO_STOP);
  247. bool need_bounce = false;
  248. bool reserve_in_place = false;
  249. if (next_cmd >= stop) {
  250. if (likely((next_cmd + bytes < max ||
  251. (next_cmd + bytes == max && stop > min))))
  252. reserve_in_place = true;
  253. else if (vmw_fifo_is_full(dev_priv, bytes)) {
  254. ret = vmw_fifo_wait(dev_priv, bytes,
  255. false, 3 * HZ);
  256. if (unlikely(ret != 0))
  257. goto out_err;
  258. } else
  259. need_bounce = true;
  260. } else {
  261. if (likely((next_cmd + bytes < stop)))
  262. reserve_in_place = true;
  263. else {
  264. ret = vmw_fifo_wait(dev_priv, bytes,
  265. false, 3 * HZ);
  266. if (unlikely(ret != 0))
  267. goto out_err;
  268. }
  269. }
  270. if (reserve_in_place) {
  271. if (reserveable || bytes <= sizeof(uint32_t)) {
  272. fifo_state->using_bounce_buffer = false;
  273. if (reserveable)
  274. iowrite32(bytes, fifo_mem +
  275. SVGA_FIFO_RESERVED);
  276. return fifo_mem + (next_cmd >> 2);
  277. } else {
  278. need_bounce = true;
  279. }
  280. }
  281. if (need_bounce) {
  282. fifo_state->using_bounce_buffer = true;
  283. if (bytes < fifo_state->static_buffer_size)
  284. return fifo_state->static_buffer;
  285. else {
  286. fifo_state->dynamic_buffer = vmalloc(bytes);
  287. return fifo_state->dynamic_buffer;
  288. }
  289. }
  290. }
  291. out_err:
  292. fifo_state->reserved_size = 0;
  293. up_write(&fifo_state->rwsem);
  294. return NULL;
  295. }
  296. static void vmw_fifo_res_copy(struct vmw_fifo_state *fifo_state,
  297. __le32 __iomem *fifo_mem,
  298. uint32_t next_cmd,
  299. uint32_t max, uint32_t min, uint32_t bytes)
  300. {
  301. uint32_t chunk_size = max - next_cmd;
  302. uint32_t rest;
  303. uint32_t *buffer = (fifo_state->dynamic_buffer != NULL) ?
  304. fifo_state->dynamic_buffer : fifo_state->static_buffer;
  305. if (bytes < chunk_size)
  306. chunk_size = bytes;
  307. iowrite32(bytes, fifo_mem + SVGA_FIFO_RESERVED);
  308. mb();
  309. memcpy_toio(fifo_mem + (next_cmd >> 2), buffer, chunk_size);
  310. rest = bytes - chunk_size;
  311. if (rest)
  312. memcpy_toio(fifo_mem + (min >> 2), buffer + (chunk_size >> 2),
  313. rest);
  314. }
  315. static void vmw_fifo_slow_copy(struct vmw_fifo_state *fifo_state,
  316. __le32 __iomem *fifo_mem,
  317. uint32_t next_cmd,
  318. uint32_t max, uint32_t min, uint32_t bytes)
  319. {
  320. uint32_t *buffer = (fifo_state->dynamic_buffer != NULL) ?
  321. fifo_state->dynamic_buffer : fifo_state->static_buffer;
  322. while (bytes > 0) {
  323. iowrite32(*buffer++, fifo_mem + (next_cmd >> 2));
  324. next_cmd += sizeof(uint32_t);
  325. if (unlikely(next_cmd == max))
  326. next_cmd = min;
  327. mb();
  328. iowrite32(next_cmd, fifo_mem + SVGA_FIFO_NEXT_CMD);
  329. mb();
  330. bytes -= sizeof(uint32_t);
  331. }
  332. }
  333. void vmw_fifo_commit(struct vmw_private *dev_priv, uint32_t bytes)
  334. {
  335. struct vmw_fifo_state *fifo_state = &dev_priv->fifo;
  336. __le32 __iomem *fifo_mem = dev_priv->mmio_virt;
  337. uint32_t next_cmd = ioread32(fifo_mem + SVGA_FIFO_NEXT_CMD);
  338. uint32_t max = ioread32(fifo_mem + SVGA_FIFO_MAX);
  339. uint32_t min = ioread32(fifo_mem + SVGA_FIFO_MIN);
  340. bool reserveable = fifo_state->capabilities & SVGA_FIFO_CAP_RESERVE;
  341. BUG_ON((bytes & 3) != 0);
  342. BUG_ON(bytes > fifo_state->reserved_size);
  343. fifo_state->reserved_size = 0;
  344. if (fifo_state->using_bounce_buffer) {
  345. if (reserveable)
  346. vmw_fifo_res_copy(fifo_state, fifo_mem,
  347. next_cmd, max, min, bytes);
  348. else
  349. vmw_fifo_slow_copy(fifo_state, fifo_mem,
  350. next_cmd, max, min, bytes);
  351. if (fifo_state->dynamic_buffer) {
  352. vfree(fifo_state->dynamic_buffer);
  353. fifo_state->dynamic_buffer = NULL;
  354. }
  355. }
  356. if (fifo_state->using_bounce_buffer || reserveable) {
  357. next_cmd += bytes;
  358. if (next_cmd >= max)
  359. next_cmd -= max - min;
  360. mb();
  361. iowrite32(next_cmd, fifo_mem + SVGA_FIFO_NEXT_CMD);
  362. }
  363. if (reserveable)
  364. iowrite32(0, fifo_mem + SVGA_FIFO_RESERVED);
  365. mb();
  366. vmw_fifo_ping_host(dev_priv, SVGA_SYNC_GENERIC);
  367. up_write(&fifo_state->rwsem);
  368. }
  369. int vmw_fifo_send_fence(struct vmw_private *dev_priv, uint32_t *sequence)
  370. {
  371. struct vmw_fifo_state *fifo_state = &dev_priv->fifo;
  372. struct svga_fifo_cmd_fence *cmd_fence;
  373. void *fm;
  374. int ret = 0;
  375. uint32_t bytes = sizeof(__le32) + sizeof(*cmd_fence);
  376. fm = vmw_fifo_reserve(dev_priv, bytes);
  377. if (unlikely(fm == NULL)) {
  378. down_write(&fifo_state->rwsem);
  379. *sequence = dev_priv->fence_seq;
  380. up_write(&fifo_state->rwsem);
  381. ret = -ENOMEM;
  382. (void)vmw_fallback_wait(dev_priv, false, true, *sequence,
  383. false, 3*HZ);
  384. goto out_err;
  385. }
  386. do {
  387. *sequence = dev_priv->fence_seq++;
  388. } while (*sequence == 0);
  389. if (!(fifo_state->capabilities & SVGA_FIFO_CAP_FENCE)) {
  390. /*
  391. * Don't request hardware to send a fence. The
  392. * waiting code in vmwgfx_irq.c will emulate this.
  393. */
  394. vmw_fifo_commit(dev_priv, 0);
  395. return 0;
  396. }
  397. *(__le32 *) fm = cpu_to_le32(SVGA_CMD_FENCE);
  398. cmd_fence = (struct svga_fifo_cmd_fence *)
  399. ((unsigned long)fm + sizeof(__le32));
  400. iowrite32(*sequence, &cmd_fence->fence);
  401. fifo_state->last_buffer_add = true;
  402. vmw_fifo_commit(dev_priv, bytes);
  403. fifo_state->last_buffer_add = false;
  404. out_err:
  405. return ret;
  406. }
  407. /**
  408. * Map the first page of the FIFO read-only to user-space.
  409. */
  410. static int vmw_fifo_vm_fault(struct vm_area_struct *vma, struct vm_fault *vmf)
  411. {
  412. int ret;
  413. unsigned long address = (unsigned long)vmf->virtual_address;
  414. if (address != vma->vm_start)
  415. return VM_FAULT_SIGBUS;
  416. ret = vm_insert_pfn(vma, address, vma->vm_pgoff);
  417. if (likely(ret == -EBUSY || ret == 0))
  418. return VM_FAULT_NOPAGE;
  419. else if (ret == -ENOMEM)
  420. return VM_FAULT_OOM;
  421. return VM_FAULT_SIGBUS;
  422. }
  423. static struct vm_operations_struct vmw_fifo_vm_ops = {
  424. .fault = vmw_fifo_vm_fault,
  425. .open = NULL,
  426. .close = NULL
  427. };
  428. int vmw_fifo_mmap(struct file *filp, struct vm_area_struct *vma)
  429. {
  430. struct drm_file *file_priv;
  431. struct vmw_private *dev_priv;
  432. file_priv = (struct drm_file *)filp->private_data;
  433. dev_priv = vmw_priv(file_priv->minor->dev);
  434. if (vma->vm_pgoff != (dev_priv->mmio_start >> PAGE_SHIFT) ||
  435. (vma->vm_end - vma->vm_start) != PAGE_SIZE)
  436. return -EINVAL;
  437. vma->vm_flags &= ~(VM_WRITE | VM_MAYWRITE);
  438. vma->vm_flags |= VM_IO | VM_PFNMAP | VM_DONTEXPAND | VM_SHARED;
  439. vma->vm_page_prot = vm_get_page_prot(vma->vm_flags);
  440. vma->vm_page_prot = ttm_io_prot(TTM_PL_FLAG_UNCACHED,
  441. vma->vm_page_prot);
  442. vma->vm_ops = &vmw_fifo_vm_ops;
  443. return 0;
  444. }