intel_ringbuffer.c 15 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568
  1. /*
  2. * Copyright © 2008-2010 Intel Corporation
  3. *
  4. * Permission is hereby granted, free of charge, to any person obtaining a
  5. * copy of this software and associated documentation files (the "Software"),
  6. * to deal in the Software without restriction, including without limitation
  7. * the rights to use, copy, modify, merge, publish, distribute, sublicense,
  8. * and/or sell copies of the Software, and to permit persons to whom the
  9. * Software is furnished to do so, subject to the following conditions:
  10. *
  11. * The above copyright notice and this permission notice (including the next
  12. * paragraph) shall be included in all copies or substantial portions of the
  13. * Software.
  14. *
  15. * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
  16. * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
  17. * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
  18. * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
  19. * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
  20. * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
  21. * IN THE SOFTWARE.
  22. *
  23. * Authors:
  24. * Eric Anholt <eric@anholt.net>
  25. * Zou Nan hai <nanhai.zou@intel.com>
  26. * Xiang Hai hao<haihao.xiang@intel.com>
  27. *
  28. */
  29. #include "drmP.h"
  30. #include "drm.h"
  31. #include "i915_drm.h"
  32. #include "i915_drv.h"
  33. #include "i915_trace.h"
  34. #include "intel_drv.h"
  35. void
  36. i915_gem_flush(struct drm_device *dev,
  37. uint32_t invalidate_domains,
  38. uint32_t flush_domains)
  39. {
  40. drm_i915_private_t *dev_priv = dev->dev_private;
  41. uint32_t cmd;
  42. RING_LOCALS;
  43. #if WATCH_EXEC
  44. DRM_INFO("%s: invalidate %08x flush %08x\n", __func__,
  45. invalidate_domains, flush_domains);
  46. #endif
  47. trace_i915_gem_request_flush(dev, dev_priv->mm.next_gem_seqno,
  48. invalidate_domains, flush_domains);
  49. if (flush_domains & I915_GEM_DOMAIN_CPU)
  50. drm_agp_chipset_flush(dev);
  51. if ((invalidate_domains | flush_domains) & I915_GEM_GPU_DOMAINS) {
  52. /*
  53. * read/write caches:
  54. *
  55. * I915_GEM_DOMAIN_RENDER is always invalidated, but is
  56. * only flushed if MI_NO_WRITE_FLUSH is unset. On 965, it is
  57. * also flushed at 2d versus 3d pipeline switches.
  58. *
  59. * read-only caches:
  60. *
  61. * I915_GEM_DOMAIN_SAMPLER is flushed on pre-965 if
  62. * MI_READ_FLUSH is set, and is always flushed on 965.
  63. *
  64. * I915_GEM_DOMAIN_COMMAND may not exist?
  65. *
  66. * I915_GEM_DOMAIN_INSTRUCTION, which exists on 965, is
  67. * invalidated when MI_EXE_FLUSH is set.
  68. *
  69. * I915_GEM_DOMAIN_VERTEX, which exists on 965, is
  70. * invalidated with every MI_FLUSH.
  71. *
  72. * TLBs:
  73. *
  74. * On 965, TLBs associated with I915_GEM_DOMAIN_COMMAND
  75. * and I915_GEM_DOMAIN_CPU in are invalidated at PTE write and
  76. * I915_GEM_DOMAIN_RENDER and I915_GEM_DOMAIN_SAMPLER
  77. * are flushed at any MI_FLUSH.
  78. */
  79. cmd = MI_FLUSH | MI_NO_WRITE_FLUSH;
  80. if ((invalidate_domains|flush_domains) &
  81. I915_GEM_DOMAIN_RENDER)
  82. cmd &= ~MI_NO_WRITE_FLUSH;
  83. if (!IS_I965G(dev)) {
  84. /*
  85. * On the 965, the sampler cache always gets flushed
  86. * and this bit is reserved.
  87. */
  88. if (invalidate_domains & I915_GEM_DOMAIN_SAMPLER)
  89. cmd |= MI_READ_FLUSH;
  90. }
  91. if (invalidate_domains & I915_GEM_DOMAIN_INSTRUCTION)
  92. cmd |= MI_EXE_FLUSH;
  93. #if WATCH_EXEC
  94. DRM_INFO("%s: queue flush %08x to ring\n", __func__, cmd);
  95. #endif
  96. BEGIN_LP_RING(2);
  97. OUT_RING(cmd);
  98. OUT_RING(MI_NOOP);
  99. ADVANCE_LP_RING();
  100. }
  101. }
  102. #define PIPE_CONTROL_FLUSH(addr) \
  103. OUT_RING(GFX_OP_PIPE_CONTROL | PIPE_CONTROL_QW_WRITE | \
  104. PIPE_CONTROL_DEPTH_STALL); \
  105. OUT_RING(addr | PIPE_CONTROL_GLOBAL_GTT); \
  106. OUT_RING(0); \
  107. OUT_RING(0); \
  108. /**
  109. * Creates a new sequence number, emitting a write of it to the status page
  110. * plus an interrupt, which will trigger i915_user_interrupt_handler.
  111. *
  112. * Must be called with struct_lock held.
  113. *
  114. * Returned sequence numbers are nonzero on success.
  115. */
  116. uint32_t
  117. i915_ring_add_request(struct drm_device *dev)
  118. {
  119. drm_i915_private_t *dev_priv = dev->dev_private;
  120. uint32_t seqno;
  121. RING_LOCALS;
  122. /* Grab the seqno we're going to make this request be, and bump the
  123. * next (skipping 0 so it can be the reserved no-seqno value).
  124. */
  125. seqno = dev_priv->mm.next_gem_seqno;
  126. dev_priv->mm.next_gem_seqno++;
  127. if (dev_priv->mm.next_gem_seqno == 0)
  128. dev_priv->mm.next_gem_seqno++;
  129. if (HAS_PIPE_CONTROL(dev)) {
  130. u32 scratch_addr = dev_priv->seqno_gfx_addr + 128;
  131. /*
  132. * Workaround qword write incoherence by flushing the
  133. * PIPE_NOTIFY buffers out to memory before requesting
  134. * an interrupt.
  135. */
  136. BEGIN_LP_RING(32);
  137. OUT_RING(GFX_OP_PIPE_CONTROL | PIPE_CONTROL_QW_WRITE |
  138. PIPE_CONTROL_WC_FLUSH | PIPE_CONTROL_TC_FLUSH);
  139. OUT_RING(dev_priv->seqno_gfx_addr | PIPE_CONTROL_GLOBAL_GTT);
  140. OUT_RING(seqno);
  141. OUT_RING(0);
  142. PIPE_CONTROL_FLUSH(scratch_addr);
  143. scratch_addr += 128; /* write to separate cachelines */
  144. PIPE_CONTROL_FLUSH(scratch_addr);
  145. scratch_addr += 128;
  146. PIPE_CONTROL_FLUSH(scratch_addr);
  147. scratch_addr += 128;
  148. PIPE_CONTROL_FLUSH(scratch_addr);
  149. scratch_addr += 128;
  150. PIPE_CONTROL_FLUSH(scratch_addr);
  151. scratch_addr += 128;
  152. PIPE_CONTROL_FLUSH(scratch_addr);
  153. OUT_RING(GFX_OP_PIPE_CONTROL | PIPE_CONTROL_QW_WRITE |
  154. PIPE_CONTROL_WC_FLUSH | PIPE_CONTROL_TC_FLUSH |
  155. PIPE_CONTROL_NOTIFY);
  156. OUT_RING(dev_priv->seqno_gfx_addr | PIPE_CONTROL_GLOBAL_GTT);
  157. OUT_RING(seqno);
  158. OUT_RING(0);
  159. ADVANCE_LP_RING();
  160. } else {
  161. BEGIN_LP_RING(4);
  162. OUT_RING(MI_STORE_DWORD_INDEX);
  163. OUT_RING(I915_GEM_HWS_INDEX << MI_STORE_DWORD_INDEX_SHIFT);
  164. OUT_RING(seqno);
  165. OUT_RING(MI_USER_INTERRUPT);
  166. ADVANCE_LP_RING();
  167. }
  168. return seqno;
  169. }
  170. void i915_user_irq_get(struct drm_device *dev)
  171. {
  172. drm_i915_private_t *dev_priv = (drm_i915_private_t *) dev->dev_private;
  173. unsigned long irqflags;
  174. spin_lock_irqsave(&dev_priv->user_irq_lock, irqflags);
  175. if (dev->irq_enabled && (++dev_priv->user_irq_refcount == 1)) {
  176. if (HAS_PCH_SPLIT(dev))
  177. ironlake_enable_graphics_irq(dev_priv, GT_PIPE_NOTIFY);
  178. else
  179. i915_enable_irq(dev_priv, I915_USER_INTERRUPT);
  180. }
  181. spin_unlock_irqrestore(&dev_priv->user_irq_lock, irqflags);
  182. }
  183. void i915_user_irq_put(struct drm_device *dev)
  184. {
  185. drm_i915_private_t *dev_priv = (drm_i915_private_t *) dev->dev_private;
  186. unsigned long irqflags;
  187. spin_lock_irqsave(&dev_priv->user_irq_lock, irqflags);
  188. BUG_ON(dev->irq_enabled && dev_priv->user_irq_refcount <= 0);
  189. if (dev->irq_enabled && (--dev_priv->user_irq_refcount == 0)) {
  190. if (HAS_PCH_SPLIT(dev))
  191. ironlake_disable_graphics_irq(dev_priv, GT_PIPE_NOTIFY);
  192. else
  193. i915_disable_irq(dev_priv, I915_USER_INTERRUPT);
  194. }
  195. spin_unlock_irqrestore(&dev_priv->user_irq_lock, irqflags);
  196. }
  197. /** Dispatch a batchbuffer to the ring
  198. */
  199. int
  200. i915_dispatch_gem_execbuffer(struct drm_device *dev,
  201. struct drm_i915_gem_execbuffer2 *exec,
  202. struct drm_clip_rect *cliprects,
  203. uint64_t exec_offset)
  204. {
  205. drm_i915_private_t *dev_priv = dev->dev_private;
  206. int nbox = exec->num_cliprects;
  207. int i = 0, count;
  208. uint32_t exec_start, exec_len;
  209. RING_LOCALS;
  210. exec_start = (uint32_t) exec_offset + exec->batch_start_offset;
  211. exec_len = (uint32_t) exec->batch_len;
  212. trace_i915_gem_request_submit(dev, dev_priv->mm.next_gem_seqno + 1);
  213. count = nbox ? nbox : 1;
  214. for (i = 0; i < count; i++) {
  215. if (i < nbox) {
  216. int ret = i915_emit_box(dev, cliprects, i,
  217. exec->DR1, exec->DR4);
  218. if (ret)
  219. return ret;
  220. }
  221. if (IS_I830(dev) || IS_845G(dev)) {
  222. BEGIN_LP_RING(4);
  223. OUT_RING(MI_BATCH_BUFFER);
  224. OUT_RING(exec_start | MI_BATCH_NON_SECURE);
  225. OUT_RING(exec_start + exec_len - 4);
  226. OUT_RING(0);
  227. ADVANCE_LP_RING();
  228. } else {
  229. BEGIN_LP_RING(2);
  230. if (IS_I965G(dev)) {
  231. OUT_RING(MI_BATCH_BUFFER_START |
  232. (2 << 6) |
  233. MI_BATCH_NON_SECURE_I965);
  234. OUT_RING(exec_start);
  235. } else {
  236. OUT_RING(MI_BATCH_BUFFER_START |
  237. (2 << 6));
  238. OUT_RING(exec_start | MI_BATCH_NON_SECURE);
  239. }
  240. ADVANCE_LP_RING();
  241. }
  242. }
  243. /* XXX breadcrumb */
  244. return 0;
  245. }
  246. static void
  247. i915_gem_cleanup_hws(struct drm_device *dev)
  248. {
  249. drm_i915_private_t *dev_priv = dev->dev_private;
  250. struct drm_gem_object *obj;
  251. struct drm_i915_gem_object *obj_priv;
  252. if (dev_priv->hws_obj == NULL)
  253. return;
  254. obj = dev_priv->hws_obj;
  255. obj_priv = to_intel_bo(obj);
  256. kunmap(obj_priv->pages[0]);
  257. i915_gem_object_unpin(obj);
  258. drm_gem_object_unreference(obj);
  259. dev_priv->hws_obj = NULL;
  260. memset(&dev_priv->hws_map, 0, sizeof(dev_priv->hws_map));
  261. dev_priv->hw_status_page = NULL;
  262. if (HAS_PIPE_CONTROL(dev))
  263. i915_gem_cleanup_pipe_control(dev);
  264. /* Write high address into HWS_PGA when disabling. */
  265. I915_WRITE(HWS_PGA, 0x1ffff000);
  266. }
  267. static int
  268. i915_gem_init_hws(struct drm_device *dev)
  269. {
  270. drm_i915_private_t *dev_priv = dev->dev_private;
  271. struct drm_gem_object *obj;
  272. struct drm_i915_gem_object *obj_priv;
  273. int ret;
  274. /* If we need a physical address for the status page, it's already
  275. * initialized at driver load time.
  276. */
  277. if (!I915_NEED_GFX_HWS(dev))
  278. return 0;
  279. obj = i915_gem_alloc_object(dev, 4096);
  280. if (obj == NULL) {
  281. DRM_ERROR("Failed to allocate status page\n");
  282. ret = -ENOMEM;
  283. goto err;
  284. }
  285. obj_priv = to_intel_bo(obj);
  286. obj_priv->agp_type = AGP_USER_CACHED_MEMORY;
  287. ret = i915_gem_object_pin(obj, 4096);
  288. if (ret != 0) {
  289. drm_gem_object_unreference(obj);
  290. goto err_unref;
  291. }
  292. dev_priv->status_gfx_addr = obj_priv->gtt_offset;
  293. dev_priv->hw_status_page = kmap(obj_priv->pages[0]);
  294. if (dev_priv->hw_status_page == NULL) {
  295. DRM_ERROR("Failed to map status page.\n");
  296. memset(&dev_priv->hws_map, 0, sizeof(dev_priv->hws_map));
  297. ret = -EINVAL;
  298. goto err_unpin;
  299. }
  300. if (HAS_PIPE_CONTROL(dev)) {
  301. ret = i915_gem_init_pipe_control(dev);
  302. if (ret)
  303. goto err_unpin;
  304. }
  305. dev_priv->hws_obj = obj;
  306. memset(dev_priv->hw_status_page, 0, PAGE_SIZE);
  307. if (IS_GEN6(dev)) {
  308. I915_WRITE(HWS_PGA_GEN6, dev_priv->status_gfx_addr);
  309. I915_READ(HWS_PGA_GEN6); /* posting read */
  310. } else {
  311. I915_WRITE(HWS_PGA, dev_priv->status_gfx_addr);
  312. I915_READ(HWS_PGA); /* posting read */
  313. }
  314. DRM_DEBUG_DRIVER("hws offset: 0x%08x\n", dev_priv->status_gfx_addr);
  315. return 0;
  316. err_unpin:
  317. i915_gem_object_unpin(obj);
  318. err_unref:
  319. drm_gem_object_unreference(obj);
  320. err:
  321. return 0;
  322. }
  323. int
  324. i915_gem_init_ringbuffer(struct drm_device *dev)
  325. {
  326. drm_i915_private_t *dev_priv = dev->dev_private;
  327. struct drm_gem_object *obj;
  328. struct drm_i915_gem_object *obj_priv;
  329. drm_i915_ring_buffer_t *ring = &dev_priv->ring;
  330. int ret;
  331. u32 head;
  332. ret = i915_gem_init_hws(dev);
  333. if (ret != 0)
  334. return ret;
  335. obj = i915_gem_alloc_object(dev, 128 * 1024);
  336. if (obj == NULL) {
  337. DRM_ERROR("Failed to allocate ringbuffer\n");
  338. i915_gem_cleanup_hws(dev);
  339. return -ENOMEM;
  340. }
  341. obj_priv = to_intel_bo(obj);
  342. ret = i915_gem_object_pin(obj, 4096);
  343. if (ret != 0) {
  344. drm_gem_object_unreference(obj);
  345. i915_gem_cleanup_hws(dev);
  346. return ret;
  347. }
  348. /* Set up the kernel mapping for the ring. */
  349. ring->Size = obj->size;
  350. ring->map.offset = dev->agp->base + obj_priv->gtt_offset;
  351. ring->map.size = obj->size;
  352. ring->map.type = 0;
  353. ring->map.flags = 0;
  354. ring->map.mtrr = 0;
  355. drm_core_ioremap_wc(&ring->map, dev);
  356. if (ring->map.handle == NULL) {
  357. DRM_ERROR("Failed to map ringbuffer.\n");
  358. memset(&dev_priv->ring, 0, sizeof(dev_priv->ring));
  359. i915_gem_object_unpin(obj);
  360. drm_gem_object_unreference(obj);
  361. i915_gem_cleanup_hws(dev);
  362. return -EINVAL;
  363. }
  364. ring->ring_obj = obj;
  365. ring->virtual_start = ring->map.handle;
  366. /* Stop the ring if it's running. */
  367. I915_WRITE(PRB0_CTL, 0);
  368. I915_WRITE(PRB0_TAIL, 0);
  369. I915_WRITE(PRB0_HEAD, 0);
  370. /* Initialize the ring. */
  371. I915_WRITE(PRB0_START, obj_priv->gtt_offset);
  372. head = I915_READ(PRB0_HEAD) & HEAD_ADDR;
  373. /* G45 ring initialization fails to reset head to zero */
  374. if (head != 0) {
  375. DRM_ERROR("Ring head not reset to zero "
  376. "ctl %08x head %08x tail %08x start %08x\n",
  377. I915_READ(PRB0_CTL),
  378. I915_READ(PRB0_HEAD),
  379. I915_READ(PRB0_TAIL),
  380. I915_READ(PRB0_START));
  381. I915_WRITE(PRB0_HEAD, 0);
  382. DRM_ERROR("Ring head forced to zero "
  383. "ctl %08x head %08x tail %08x start %08x\n",
  384. I915_READ(PRB0_CTL),
  385. I915_READ(PRB0_HEAD),
  386. I915_READ(PRB0_TAIL),
  387. I915_READ(PRB0_START));
  388. }
  389. I915_WRITE(PRB0_CTL,
  390. ((obj->size - 4096) & RING_NR_PAGES) |
  391. RING_NO_REPORT |
  392. RING_VALID);
  393. head = I915_READ(PRB0_HEAD) & HEAD_ADDR;
  394. /* If the head is still not zero, the ring is dead */
  395. if (head != 0) {
  396. DRM_ERROR("Ring initialization failed "
  397. "ctl %08x head %08x tail %08x start %08x\n",
  398. I915_READ(PRB0_CTL),
  399. I915_READ(PRB0_HEAD),
  400. I915_READ(PRB0_TAIL),
  401. I915_READ(PRB0_START));
  402. return -EIO;
  403. }
  404. /* Update our cache of the ring state */
  405. if (!drm_core_check_feature(dev, DRIVER_MODESET))
  406. i915_kernel_lost_context(dev);
  407. else {
  408. ring->head = I915_READ(PRB0_HEAD) & HEAD_ADDR;
  409. ring->tail = I915_READ(PRB0_TAIL) & TAIL_ADDR;
  410. ring->space = ring->head - (ring->tail + 8);
  411. if (ring->space < 0)
  412. ring->space += ring->Size;
  413. }
  414. if (IS_I9XX(dev) && !IS_GEN3(dev)) {
  415. I915_WRITE(MI_MODE,
  416. (VS_TIMER_DISPATCH) << 16 | VS_TIMER_DISPATCH);
  417. }
  418. return 0;
  419. }
  420. void
  421. i915_gem_cleanup_ringbuffer(struct drm_device *dev)
  422. {
  423. drm_i915_private_t *dev_priv = dev->dev_private;
  424. if (dev_priv->ring.ring_obj == NULL)
  425. return;
  426. drm_core_ioremapfree(&dev_priv->ring.map, dev);
  427. i915_gem_object_unpin(dev_priv->ring.ring_obj);
  428. drm_gem_object_unreference(dev_priv->ring.ring_obj);
  429. dev_priv->ring.ring_obj = NULL;
  430. memset(&dev_priv->ring, 0, sizeof(dev_priv->ring));
  431. i915_gem_cleanup_hws(dev);
  432. }
  433. /* As a ringbuffer is only allowed to wrap between instructions, fill
  434. * the tail with NOOPs.
  435. */
  436. int i915_wrap_ring(struct drm_device *dev)
  437. {
  438. drm_i915_private_t *dev_priv = dev->dev_private;
  439. volatile unsigned int *virt;
  440. int rem;
  441. rem = dev_priv->ring.Size - dev_priv->ring.tail;
  442. if (dev_priv->ring.space < rem) {
  443. int ret = i915_wait_ring(dev, rem, __func__);
  444. if (ret)
  445. return ret;
  446. }
  447. dev_priv->ring.space -= rem;
  448. virt = (unsigned int *)
  449. (dev_priv->ring.virtual_start + dev_priv->ring.tail);
  450. rem /= 4;
  451. while (rem--)
  452. *virt++ = MI_NOOP;
  453. dev_priv->ring.tail = 0;
  454. return 0;
  455. }
  456. int i915_wait_ring(struct drm_device * dev, int n, const char *caller)
  457. {
  458. drm_i915_private_t *dev_priv = dev->dev_private;
  459. drm_i915_ring_buffer_t *ring = &(dev_priv->ring);
  460. u32 acthd_reg = IS_I965G(dev) ? ACTHD_I965 : ACTHD;
  461. u32 last_acthd = I915_READ(acthd_reg);
  462. u32 acthd;
  463. u32 last_head = I915_READ(PRB0_HEAD) & HEAD_ADDR;
  464. int i;
  465. trace_i915_ring_wait_begin (dev);
  466. for (i = 0; i < 100000; i++) {
  467. ring->head = I915_READ(PRB0_HEAD) & HEAD_ADDR;
  468. acthd = I915_READ(acthd_reg);
  469. ring->space = ring->head - (ring->tail + 8);
  470. if (ring->space < 0)
  471. ring->space += ring->Size;
  472. if (ring->space >= n) {
  473. trace_i915_ring_wait_end (dev);
  474. return 0;
  475. }
  476. if (dev->primary->master) {
  477. struct drm_i915_master_private *master_priv = dev->primary->master->driver_priv;
  478. if (master_priv->sarea_priv)
  479. master_priv->sarea_priv->perf_boxes |= I915_BOX_WAIT;
  480. }
  481. if (ring->head != last_head)
  482. i = 0;
  483. if (acthd != last_acthd)
  484. i = 0;
  485. last_head = ring->head;
  486. last_acthd = acthd;
  487. msleep_interruptible(10);
  488. }
  489. trace_i915_ring_wait_end (dev);
  490. return -EBUSY;
  491. }