intel_ringbuffer.c 27 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270370470570670770870971071171271371471571671771871972072172272372472572672772872973073173273373473573673773873974074174274374474574674774874975075175275375475575675775875976076176276376476576676776876977077177277377477577677777877978078178278378478578678778878979079179279379479579679779879980080180280380480580680780880981081181281381481581681781881982082182282382482582682782882983083183283383483583683783883984084184284384484584684784884985085185285385485585685785885986086186286386486586686786886987087187287387487587687787887988088188288388488588688788888989089189289389489589689789889990090190290390490590690790890991091191291391491591691791891992092192292392492592692792892993093193293393493593693793893994094194294394494594694794894995095195295395495595695795895996096196296396496596696796896997097197297397497597697797897998098198298398498598698798898999099199299399499599699799899910001001100210031004100510061007100810091010101110121013101410151016101710181019102010211022102310241025102610271028
  1. /*
  2. * Copyright © 2008-2010 Intel Corporation
  3. *
  4. * Permission is hereby granted, free of charge, to any person obtaining a
  5. * copy of this software and associated documentation files (the "Software"),
  6. * to deal in the Software without restriction, including without limitation
  7. * the rights to use, copy, modify, merge, publish, distribute, sublicense,
  8. * and/or sell copies of the Software, and to permit persons to whom the
  9. * Software is furnished to do so, subject to the following conditions:
  10. *
  11. * The above copyright notice and this permission notice (including the next
  12. * paragraph) shall be included in all copies or substantial portions of the
  13. * Software.
  14. *
  15. * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
  16. * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
  17. * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
  18. * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
  19. * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
  20. * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
  21. * IN THE SOFTWARE.
  22. *
  23. * Authors:
  24. * Eric Anholt <eric@anholt.net>
  25. * Zou Nan hai <nanhai.zou@intel.com>
  26. * Xiang Hai hao<haihao.xiang@intel.com>
  27. *
  28. */
  29. #include "drmP.h"
  30. #include "drm.h"
  31. #include "i915_drv.h"
  32. #include "i915_drm.h"
  33. #include "i915_trace.h"
  34. #include "intel_drv.h"
  35. static u32 i915_gem_get_seqno(struct drm_device *dev)
  36. {
  37. drm_i915_private_t *dev_priv = dev->dev_private;
  38. u32 seqno;
  39. seqno = dev_priv->next_seqno;
  40. /* reserve 0 for non-seqno */
  41. if (++dev_priv->next_seqno == 0)
  42. dev_priv->next_seqno = 1;
  43. return seqno;
  44. }
  45. static void
  46. render_ring_flush(struct drm_device *dev,
  47. struct intel_ring_buffer *ring,
  48. u32 invalidate_domains,
  49. u32 flush_domains)
  50. {
  51. drm_i915_private_t *dev_priv = dev->dev_private;
  52. u32 cmd;
  53. #if WATCH_EXEC
  54. DRM_INFO("%s: invalidate %08x flush %08x\n", __func__,
  55. invalidate_domains, flush_domains);
  56. #endif
  57. trace_i915_gem_request_flush(dev, dev_priv->next_seqno,
  58. invalidate_domains, flush_domains);
  59. if ((invalidate_domains | flush_domains) & I915_GEM_GPU_DOMAINS) {
  60. /*
  61. * read/write caches:
  62. *
  63. * I915_GEM_DOMAIN_RENDER is always invalidated, but is
  64. * only flushed if MI_NO_WRITE_FLUSH is unset. On 965, it is
  65. * also flushed at 2d versus 3d pipeline switches.
  66. *
  67. * read-only caches:
  68. *
  69. * I915_GEM_DOMAIN_SAMPLER is flushed on pre-965 if
  70. * MI_READ_FLUSH is set, and is always flushed on 965.
  71. *
  72. * I915_GEM_DOMAIN_COMMAND may not exist?
  73. *
  74. * I915_GEM_DOMAIN_INSTRUCTION, which exists on 965, is
  75. * invalidated when MI_EXE_FLUSH is set.
  76. *
  77. * I915_GEM_DOMAIN_VERTEX, which exists on 965, is
  78. * invalidated with every MI_FLUSH.
  79. *
  80. * TLBs:
  81. *
  82. * On 965, TLBs associated with I915_GEM_DOMAIN_COMMAND
  83. * and I915_GEM_DOMAIN_CPU in are invalidated at PTE write and
  84. * I915_GEM_DOMAIN_RENDER and I915_GEM_DOMAIN_SAMPLER
  85. * are flushed at any MI_FLUSH.
  86. */
  87. cmd = MI_FLUSH | MI_NO_WRITE_FLUSH;
  88. if ((invalidate_domains|flush_domains) &
  89. I915_GEM_DOMAIN_RENDER)
  90. cmd &= ~MI_NO_WRITE_FLUSH;
  91. if (INTEL_INFO(dev)->gen < 4) {
  92. /*
  93. * On the 965, the sampler cache always gets flushed
  94. * and this bit is reserved.
  95. */
  96. if (invalidate_domains & I915_GEM_DOMAIN_SAMPLER)
  97. cmd |= MI_READ_FLUSH;
  98. }
  99. if (invalidate_domains & I915_GEM_DOMAIN_INSTRUCTION)
  100. cmd |= MI_EXE_FLUSH;
  101. #if WATCH_EXEC
  102. DRM_INFO("%s: queue flush %08x to ring\n", __func__, cmd);
  103. #endif
  104. intel_ring_begin(dev, ring, 2);
  105. intel_ring_emit(dev, ring, cmd);
  106. intel_ring_emit(dev, ring, MI_NOOP);
  107. intel_ring_advance(dev, ring);
  108. }
  109. }
  110. static void ring_write_tail(struct drm_device *dev,
  111. struct intel_ring_buffer *ring,
  112. u32 value)
  113. {
  114. drm_i915_private_t *dev_priv = dev->dev_private;
  115. I915_WRITE_TAIL(ring, value);
  116. }
  117. u32 intel_ring_get_active_head(struct drm_device *dev,
  118. struct intel_ring_buffer *ring)
  119. {
  120. drm_i915_private_t *dev_priv = dev->dev_private;
  121. u32 acthd_reg = INTEL_INFO(dev)->gen >= 4 ?
  122. RING_ACTHD(ring->mmio_base) : ACTHD;
  123. return I915_READ(acthd_reg);
  124. }
  125. static int init_ring_common(struct drm_device *dev,
  126. struct intel_ring_buffer *ring)
  127. {
  128. u32 head;
  129. drm_i915_private_t *dev_priv = dev->dev_private;
  130. struct drm_i915_gem_object *obj_priv;
  131. obj_priv = to_intel_bo(ring->gem_object);
  132. /* Stop the ring if it's running. */
  133. I915_WRITE_CTL(ring, 0);
  134. I915_WRITE_HEAD(ring, 0);
  135. ring->write_tail(dev, ring, 0);
  136. /* Initialize the ring. */
  137. I915_WRITE_START(ring, obj_priv->gtt_offset);
  138. head = I915_READ_HEAD(ring) & HEAD_ADDR;
  139. /* G45 ring initialization fails to reset head to zero */
  140. if (head != 0) {
  141. DRM_ERROR("%s head not reset to zero "
  142. "ctl %08x head %08x tail %08x start %08x\n",
  143. ring->name,
  144. I915_READ_CTL(ring),
  145. I915_READ_HEAD(ring),
  146. I915_READ_TAIL(ring),
  147. I915_READ_START(ring));
  148. I915_WRITE_HEAD(ring, 0);
  149. DRM_ERROR("%s head forced to zero "
  150. "ctl %08x head %08x tail %08x start %08x\n",
  151. ring->name,
  152. I915_READ_CTL(ring),
  153. I915_READ_HEAD(ring),
  154. I915_READ_TAIL(ring),
  155. I915_READ_START(ring));
  156. }
  157. I915_WRITE_CTL(ring,
  158. ((ring->gem_object->size - PAGE_SIZE) & RING_NR_PAGES)
  159. | RING_REPORT_64K | RING_VALID);
  160. head = I915_READ_HEAD(ring) & HEAD_ADDR;
  161. /* If the head is still not zero, the ring is dead */
  162. if (head != 0) {
  163. DRM_ERROR("%s initialization failed "
  164. "ctl %08x head %08x tail %08x start %08x\n",
  165. ring->name,
  166. I915_READ_CTL(ring),
  167. I915_READ_HEAD(ring),
  168. I915_READ_TAIL(ring),
  169. I915_READ_START(ring));
  170. return -EIO;
  171. }
  172. if (!drm_core_check_feature(dev, DRIVER_MODESET))
  173. i915_kernel_lost_context(dev);
  174. else {
  175. ring->head = I915_READ_HEAD(ring) & HEAD_ADDR;
  176. ring->tail = I915_READ_TAIL(ring) & TAIL_ADDR;
  177. ring->space = ring->head - (ring->tail + 8);
  178. if (ring->space < 0)
  179. ring->space += ring->size;
  180. }
  181. return 0;
  182. }
  183. static int init_render_ring(struct drm_device *dev,
  184. struct intel_ring_buffer *ring)
  185. {
  186. drm_i915_private_t *dev_priv = dev->dev_private;
  187. int ret = init_ring_common(dev, ring);
  188. int mode;
  189. if (INTEL_INFO(dev)->gen > 3) {
  190. mode = VS_TIMER_DISPATCH << 16 | VS_TIMER_DISPATCH;
  191. if (IS_GEN6(dev))
  192. mode |= MI_FLUSH_ENABLE << 16 | MI_FLUSH_ENABLE;
  193. I915_WRITE(MI_MODE, mode);
  194. }
  195. return ret;
  196. }
  197. #define PIPE_CONTROL_FLUSH(addr) \
  198. do { \
  199. OUT_RING(GFX_OP_PIPE_CONTROL | PIPE_CONTROL_QW_WRITE | \
  200. PIPE_CONTROL_DEPTH_STALL | 2); \
  201. OUT_RING(addr | PIPE_CONTROL_GLOBAL_GTT); \
  202. OUT_RING(0); \
  203. OUT_RING(0); \
  204. } while (0)
  205. /**
  206. * Creates a new sequence number, emitting a write of it to the status page
  207. * plus an interrupt, which will trigger i915_user_interrupt_handler.
  208. *
  209. * Must be called with struct_lock held.
  210. *
  211. * Returned sequence numbers are nonzero on success.
  212. */
  213. static u32
  214. render_ring_add_request(struct drm_device *dev,
  215. struct intel_ring_buffer *ring,
  216. u32 flush_domains)
  217. {
  218. drm_i915_private_t *dev_priv = dev->dev_private;
  219. u32 seqno;
  220. seqno = i915_gem_get_seqno(dev);
  221. if (IS_GEN6(dev)) {
  222. BEGIN_LP_RING(6);
  223. OUT_RING(GFX_OP_PIPE_CONTROL | 3);
  224. OUT_RING(PIPE_CONTROL_QW_WRITE |
  225. PIPE_CONTROL_WC_FLUSH | PIPE_CONTROL_IS_FLUSH |
  226. PIPE_CONTROL_NOTIFY);
  227. OUT_RING(dev_priv->seqno_gfx_addr | PIPE_CONTROL_GLOBAL_GTT);
  228. OUT_RING(seqno);
  229. OUT_RING(0);
  230. OUT_RING(0);
  231. ADVANCE_LP_RING();
  232. } else if (HAS_PIPE_CONTROL(dev)) {
  233. u32 scratch_addr = dev_priv->seqno_gfx_addr + 128;
  234. /*
  235. * Workaround qword write incoherence by flushing the
  236. * PIPE_NOTIFY buffers out to memory before requesting
  237. * an interrupt.
  238. */
  239. BEGIN_LP_RING(32);
  240. OUT_RING(GFX_OP_PIPE_CONTROL | PIPE_CONTROL_QW_WRITE |
  241. PIPE_CONTROL_WC_FLUSH | PIPE_CONTROL_TC_FLUSH);
  242. OUT_RING(dev_priv->seqno_gfx_addr | PIPE_CONTROL_GLOBAL_GTT);
  243. OUT_RING(seqno);
  244. OUT_RING(0);
  245. PIPE_CONTROL_FLUSH(scratch_addr);
  246. scratch_addr += 128; /* write to separate cachelines */
  247. PIPE_CONTROL_FLUSH(scratch_addr);
  248. scratch_addr += 128;
  249. PIPE_CONTROL_FLUSH(scratch_addr);
  250. scratch_addr += 128;
  251. PIPE_CONTROL_FLUSH(scratch_addr);
  252. scratch_addr += 128;
  253. PIPE_CONTROL_FLUSH(scratch_addr);
  254. scratch_addr += 128;
  255. PIPE_CONTROL_FLUSH(scratch_addr);
  256. OUT_RING(GFX_OP_PIPE_CONTROL | PIPE_CONTROL_QW_WRITE |
  257. PIPE_CONTROL_WC_FLUSH | PIPE_CONTROL_TC_FLUSH |
  258. PIPE_CONTROL_NOTIFY);
  259. OUT_RING(dev_priv->seqno_gfx_addr | PIPE_CONTROL_GLOBAL_GTT);
  260. OUT_RING(seqno);
  261. OUT_RING(0);
  262. ADVANCE_LP_RING();
  263. } else {
  264. BEGIN_LP_RING(4);
  265. OUT_RING(MI_STORE_DWORD_INDEX);
  266. OUT_RING(I915_GEM_HWS_INDEX << MI_STORE_DWORD_INDEX_SHIFT);
  267. OUT_RING(seqno);
  268. OUT_RING(MI_USER_INTERRUPT);
  269. ADVANCE_LP_RING();
  270. }
  271. return seqno;
  272. }
  273. static u32
  274. render_ring_get_seqno(struct drm_device *dev,
  275. struct intel_ring_buffer *ring)
  276. {
  277. drm_i915_private_t *dev_priv = (drm_i915_private_t *) dev->dev_private;
  278. if (HAS_PIPE_CONTROL(dev))
  279. return ((volatile u32 *)(dev_priv->seqno_page))[0];
  280. else
  281. return intel_read_status_page(ring, I915_GEM_HWS_INDEX);
  282. }
  283. static void
  284. render_ring_get_user_irq(struct drm_device *dev,
  285. struct intel_ring_buffer *ring)
  286. {
  287. drm_i915_private_t *dev_priv = (drm_i915_private_t *) dev->dev_private;
  288. unsigned long irqflags;
  289. spin_lock_irqsave(&dev_priv->user_irq_lock, irqflags);
  290. if (dev->irq_enabled && (++ring->user_irq_refcount == 1)) {
  291. if (HAS_PCH_SPLIT(dev))
  292. ironlake_enable_graphics_irq(dev_priv, GT_PIPE_NOTIFY);
  293. else
  294. i915_enable_irq(dev_priv, I915_USER_INTERRUPT);
  295. }
  296. spin_unlock_irqrestore(&dev_priv->user_irq_lock, irqflags);
  297. }
  298. static void
  299. render_ring_put_user_irq(struct drm_device *dev,
  300. struct intel_ring_buffer *ring)
  301. {
  302. drm_i915_private_t *dev_priv = (drm_i915_private_t *) dev->dev_private;
  303. unsigned long irqflags;
  304. spin_lock_irqsave(&dev_priv->user_irq_lock, irqflags);
  305. BUG_ON(dev->irq_enabled && ring->user_irq_refcount <= 0);
  306. if (dev->irq_enabled && (--ring->user_irq_refcount == 0)) {
  307. if (HAS_PCH_SPLIT(dev))
  308. ironlake_disable_graphics_irq(dev_priv, GT_PIPE_NOTIFY);
  309. else
  310. i915_disable_irq(dev_priv, I915_USER_INTERRUPT);
  311. }
  312. spin_unlock_irqrestore(&dev_priv->user_irq_lock, irqflags);
  313. }
  314. void intel_ring_setup_status_page(struct drm_device *dev,
  315. struct intel_ring_buffer *ring)
  316. {
  317. drm_i915_private_t *dev_priv = dev->dev_private;
  318. if (IS_GEN6(dev)) {
  319. I915_WRITE(RING_HWS_PGA_GEN6(ring->mmio_base),
  320. ring->status_page.gfx_addr);
  321. I915_READ(RING_HWS_PGA_GEN6(ring->mmio_base)); /* posting read */
  322. } else {
  323. I915_WRITE(RING_HWS_PGA(ring->mmio_base),
  324. ring->status_page.gfx_addr);
  325. I915_READ(RING_HWS_PGA(ring->mmio_base)); /* posting read */
  326. }
  327. }
  328. static void
  329. bsd_ring_flush(struct drm_device *dev,
  330. struct intel_ring_buffer *ring,
  331. u32 invalidate_domains,
  332. u32 flush_domains)
  333. {
  334. intel_ring_begin(dev, ring, 2);
  335. intel_ring_emit(dev, ring, MI_FLUSH);
  336. intel_ring_emit(dev, ring, MI_NOOP);
  337. intel_ring_advance(dev, ring);
  338. }
  339. static int init_bsd_ring(struct drm_device *dev,
  340. struct intel_ring_buffer *ring)
  341. {
  342. return init_ring_common(dev, ring);
  343. }
  344. static u32
  345. ring_add_request(struct drm_device *dev,
  346. struct intel_ring_buffer *ring,
  347. u32 flush_domains)
  348. {
  349. u32 seqno;
  350. seqno = i915_gem_get_seqno(dev);
  351. intel_ring_begin(dev, ring, 4);
  352. intel_ring_emit(dev, ring, MI_STORE_DWORD_INDEX);
  353. intel_ring_emit(dev, ring,
  354. I915_GEM_HWS_INDEX << MI_STORE_DWORD_INDEX_SHIFT);
  355. intel_ring_emit(dev, ring, seqno);
  356. intel_ring_emit(dev, ring, MI_USER_INTERRUPT);
  357. intel_ring_advance(dev, ring);
  358. DRM_DEBUG_DRIVER("%s %d\n", ring->name, seqno);
  359. return seqno;
  360. }
  361. static void
  362. bsd_ring_get_user_irq(struct drm_device *dev,
  363. struct intel_ring_buffer *ring)
  364. {
  365. /* do nothing */
  366. }
  367. static void
  368. bsd_ring_put_user_irq(struct drm_device *dev,
  369. struct intel_ring_buffer *ring)
  370. {
  371. /* do nothing */
  372. }
  373. static u32
  374. ring_status_page_get_seqno(struct drm_device *dev,
  375. struct intel_ring_buffer *ring)
  376. {
  377. return intel_read_status_page(ring, I915_GEM_HWS_INDEX);
  378. }
  379. static int
  380. ring_dispatch_gem_execbuffer(struct drm_device *dev,
  381. struct intel_ring_buffer *ring,
  382. struct drm_i915_gem_execbuffer2 *exec,
  383. struct drm_clip_rect *cliprects,
  384. uint64_t exec_offset)
  385. {
  386. uint32_t exec_start;
  387. exec_start = (uint32_t) exec_offset + exec->batch_start_offset;
  388. intel_ring_begin(dev, ring, 2);
  389. intel_ring_emit(dev, ring, MI_BATCH_BUFFER_START |
  390. (2 << 6) | MI_BATCH_NON_SECURE_I965);
  391. intel_ring_emit(dev, ring, exec_start);
  392. intel_ring_advance(dev, ring);
  393. return 0;
  394. }
  395. static int
  396. render_ring_dispatch_gem_execbuffer(struct drm_device *dev,
  397. struct intel_ring_buffer *ring,
  398. struct drm_i915_gem_execbuffer2 *exec,
  399. struct drm_clip_rect *cliprects,
  400. uint64_t exec_offset)
  401. {
  402. drm_i915_private_t *dev_priv = dev->dev_private;
  403. int nbox = exec->num_cliprects;
  404. int i = 0, count;
  405. uint32_t exec_start, exec_len;
  406. exec_start = (uint32_t) exec_offset + exec->batch_start_offset;
  407. exec_len = (uint32_t) exec->batch_len;
  408. trace_i915_gem_request_submit(dev, dev_priv->next_seqno + 1);
  409. count = nbox ? nbox : 1;
  410. for (i = 0; i < count; i++) {
  411. if (i < nbox) {
  412. int ret = i915_emit_box(dev, cliprects, i,
  413. exec->DR1, exec->DR4);
  414. if (ret)
  415. return ret;
  416. }
  417. if (IS_I830(dev) || IS_845G(dev)) {
  418. intel_ring_begin(dev, ring, 4);
  419. intel_ring_emit(dev, ring, MI_BATCH_BUFFER);
  420. intel_ring_emit(dev, ring,
  421. exec_start | MI_BATCH_NON_SECURE);
  422. intel_ring_emit(dev, ring, exec_start + exec_len - 4);
  423. intel_ring_emit(dev, ring, 0);
  424. } else {
  425. intel_ring_begin(dev, ring, 2);
  426. if (INTEL_INFO(dev)->gen >= 4) {
  427. intel_ring_emit(dev, ring,
  428. MI_BATCH_BUFFER_START | (2 << 6)
  429. | MI_BATCH_NON_SECURE_I965);
  430. intel_ring_emit(dev, ring, exec_start);
  431. } else {
  432. intel_ring_emit(dev, ring, MI_BATCH_BUFFER_START
  433. | (2 << 6));
  434. intel_ring_emit(dev, ring, exec_start |
  435. MI_BATCH_NON_SECURE);
  436. }
  437. }
  438. intel_ring_advance(dev, ring);
  439. }
  440. if (IS_G4X(dev) || IS_GEN5(dev)) {
  441. intel_ring_begin(dev, ring, 2);
  442. intel_ring_emit(dev, ring, MI_FLUSH |
  443. MI_NO_WRITE_FLUSH |
  444. MI_INVALIDATE_ISP );
  445. intel_ring_emit(dev, ring, MI_NOOP);
  446. intel_ring_advance(dev, ring);
  447. }
  448. /* XXX breadcrumb */
  449. return 0;
  450. }
  451. static void cleanup_status_page(struct drm_device *dev,
  452. struct intel_ring_buffer *ring)
  453. {
  454. drm_i915_private_t *dev_priv = dev->dev_private;
  455. struct drm_gem_object *obj;
  456. struct drm_i915_gem_object *obj_priv;
  457. obj = ring->status_page.obj;
  458. if (obj == NULL)
  459. return;
  460. obj_priv = to_intel_bo(obj);
  461. kunmap(obj_priv->pages[0]);
  462. i915_gem_object_unpin(obj);
  463. drm_gem_object_unreference(obj);
  464. ring->status_page.obj = NULL;
  465. memset(&dev_priv->hws_map, 0, sizeof(dev_priv->hws_map));
  466. }
  467. static int init_status_page(struct drm_device *dev,
  468. struct intel_ring_buffer *ring)
  469. {
  470. drm_i915_private_t *dev_priv = dev->dev_private;
  471. struct drm_gem_object *obj;
  472. struct drm_i915_gem_object *obj_priv;
  473. int ret;
  474. obj = i915_gem_alloc_object(dev, 4096);
  475. if (obj == NULL) {
  476. DRM_ERROR("Failed to allocate status page\n");
  477. ret = -ENOMEM;
  478. goto err;
  479. }
  480. obj_priv = to_intel_bo(obj);
  481. obj_priv->agp_type = AGP_USER_CACHED_MEMORY;
  482. ret = i915_gem_object_pin(obj, 4096);
  483. if (ret != 0) {
  484. goto err_unref;
  485. }
  486. ring->status_page.gfx_addr = obj_priv->gtt_offset;
  487. ring->status_page.page_addr = kmap(obj_priv->pages[0]);
  488. if (ring->status_page.page_addr == NULL) {
  489. memset(&dev_priv->hws_map, 0, sizeof(dev_priv->hws_map));
  490. goto err_unpin;
  491. }
  492. ring->status_page.obj = obj;
  493. memset(ring->status_page.page_addr, 0, PAGE_SIZE);
  494. intel_ring_setup_status_page(dev, ring);
  495. DRM_DEBUG_DRIVER("%s hws offset: 0x%08x\n",
  496. ring->name, ring->status_page.gfx_addr);
  497. return 0;
  498. err_unpin:
  499. i915_gem_object_unpin(obj);
  500. err_unref:
  501. drm_gem_object_unreference(obj);
  502. err:
  503. return ret;
  504. }
  505. int intel_init_ring_buffer(struct drm_device *dev,
  506. struct intel_ring_buffer *ring)
  507. {
  508. struct drm_i915_private *dev_priv = dev->dev_private;
  509. struct drm_i915_gem_object *obj_priv;
  510. struct drm_gem_object *obj;
  511. int ret;
  512. ring->dev = dev;
  513. INIT_LIST_HEAD(&ring->active_list);
  514. INIT_LIST_HEAD(&ring->request_list);
  515. INIT_LIST_HEAD(&ring->gpu_write_list);
  516. if (I915_NEED_GFX_HWS(dev)) {
  517. ret = init_status_page(dev, ring);
  518. if (ret)
  519. return ret;
  520. }
  521. obj = i915_gem_alloc_object(dev, ring->size);
  522. if (obj == NULL) {
  523. DRM_ERROR("Failed to allocate ringbuffer\n");
  524. ret = -ENOMEM;
  525. goto err_hws;
  526. }
  527. ring->gem_object = obj;
  528. ret = i915_gem_object_pin(obj, PAGE_SIZE);
  529. if (ret)
  530. goto err_unref;
  531. obj_priv = to_intel_bo(obj);
  532. ring->map.size = ring->size;
  533. ring->map.offset = dev->agp->base + obj_priv->gtt_offset;
  534. ring->map.type = 0;
  535. ring->map.flags = 0;
  536. ring->map.mtrr = 0;
  537. drm_core_ioremap_wc(&ring->map, dev);
  538. if (ring->map.handle == NULL) {
  539. DRM_ERROR("Failed to map ringbuffer.\n");
  540. ret = -EINVAL;
  541. goto err_unpin;
  542. }
  543. ring->virtual_start = ring->map.handle;
  544. ret = ring->init(dev, ring);
  545. if (ret)
  546. goto err_unmap;
  547. if (!drm_core_check_feature(dev, DRIVER_MODESET))
  548. i915_kernel_lost_context(dev);
  549. else {
  550. ring->head = I915_READ_HEAD(ring) & HEAD_ADDR;
  551. ring->tail = I915_READ_TAIL(ring) & TAIL_ADDR;
  552. ring->space = ring->head - (ring->tail + 8);
  553. if (ring->space < 0)
  554. ring->space += ring->size;
  555. }
  556. return ret;
  557. err_unmap:
  558. drm_core_ioremapfree(&ring->map, dev);
  559. err_unpin:
  560. i915_gem_object_unpin(obj);
  561. err_unref:
  562. drm_gem_object_unreference(obj);
  563. ring->gem_object = NULL;
  564. err_hws:
  565. cleanup_status_page(dev, ring);
  566. return ret;
  567. }
  568. void intel_cleanup_ring_buffer(struct drm_device *dev,
  569. struct intel_ring_buffer *ring)
  570. {
  571. if (ring->gem_object == NULL)
  572. return;
  573. drm_core_ioremapfree(&ring->map, dev);
  574. i915_gem_object_unpin(ring->gem_object);
  575. drm_gem_object_unreference(ring->gem_object);
  576. ring->gem_object = NULL;
  577. if (ring->cleanup)
  578. ring->cleanup(ring);
  579. cleanup_status_page(dev, ring);
  580. }
  581. static int intel_wrap_ring_buffer(struct drm_device *dev,
  582. struct intel_ring_buffer *ring)
  583. {
  584. unsigned int *virt;
  585. int rem;
  586. rem = ring->size - ring->tail;
  587. if (ring->space < rem) {
  588. int ret = intel_wait_ring_buffer(dev, ring, rem);
  589. if (ret)
  590. return ret;
  591. }
  592. virt = (unsigned int *)(ring->virtual_start + ring->tail);
  593. rem /= 8;
  594. while (rem--) {
  595. *virt++ = MI_NOOP;
  596. *virt++ = MI_NOOP;
  597. }
  598. ring->tail = 0;
  599. ring->space = ring->head - 8;
  600. return 0;
  601. }
  602. int intel_wait_ring_buffer(struct drm_device *dev,
  603. struct intel_ring_buffer *ring, int n)
  604. {
  605. unsigned long end;
  606. drm_i915_private_t *dev_priv = dev->dev_private;
  607. u32 head;
  608. head = intel_read_status_page(ring, 4);
  609. if (head) {
  610. ring->head = head & HEAD_ADDR;
  611. ring->space = ring->head - (ring->tail + 8);
  612. if (ring->space < 0)
  613. ring->space += ring->size;
  614. if (ring->space >= n)
  615. return 0;
  616. }
  617. trace_i915_ring_wait_begin (dev);
  618. end = jiffies + 3 * HZ;
  619. do {
  620. ring->head = I915_READ_HEAD(ring) & HEAD_ADDR;
  621. ring->space = ring->head - (ring->tail + 8);
  622. if (ring->space < 0)
  623. ring->space += ring->size;
  624. if (ring->space >= n) {
  625. trace_i915_ring_wait_end (dev);
  626. return 0;
  627. }
  628. if (dev->primary->master) {
  629. struct drm_i915_master_private *master_priv = dev->primary->master->driver_priv;
  630. if (master_priv->sarea_priv)
  631. master_priv->sarea_priv->perf_boxes |= I915_BOX_WAIT;
  632. }
  633. msleep(1);
  634. } while (!time_after(jiffies, end));
  635. trace_i915_ring_wait_end (dev);
  636. return -EBUSY;
  637. }
  638. void intel_ring_begin(struct drm_device *dev,
  639. struct intel_ring_buffer *ring,
  640. int num_dwords)
  641. {
  642. int n = 4*num_dwords;
  643. if (unlikely(ring->tail + n > ring->size))
  644. intel_wrap_ring_buffer(dev, ring);
  645. if (unlikely(ring->space < n))
  646. intel_wait_ring_buffer(dev, ring, n);
  647. ring->space -= n;
  648. }
  649. void intel_ring_advance(struct drm_device *dev,
  650. struct intel_ring_buffer *ring)
  651. {
  652. ring->tail &= ring->size - 1;
  653. ring->write_tail(dev, ring, ring->tail);
  654. }
  655. static const struct intel_ring_buffer render_ring = {
  656. .name = "render ring",
  657. .id = RING_RENDER,
  658. .mmio_base = RENDER_RING_BASE,
  659. .size = 32 * PAGE_SIZE,
  660. .init = init_render_ring,
  661. .write_tail = ring_write_tail,
  662. .flush = render_ring_flush,
  663. .add_request = render_ring_add_request,
  664. .get_seqno = render_ring_get_seqno,
  665. .user_irq_get = render_ring_get_user_irq,
  666. .user_irq_put = render_ring_put_user_irq,
  667. .dispatch_gem_execbuffer = render_ring_dispatch_gem_execbuffer,
  668. };
  669. /* ring buffer for bit-stream decoder */
  670. static const struct intel_ring_buffer bsd_ring = {
  671. .name = "bsd ring",
  672. .id = RING_BSD,
  673. .mmio_base = BSD_RING_BASE,
  674. .size = 32 * PAGE_SIZE,
  675. .init = init_bsd_ring,
  676. .write_tail = ring_write_tail,
  677. .flush = bsd_ring_flush,
  678. .add_request = ring_add_request,
  679. .get_seqno = ring_status_page_get_seqno,
  680. .user_irq_get = bsd_ring_get_user_irq,
  681. .user_irq_put = bsd_ring_put_user_irq,
  682. .dispatch_gem_execbuffer = ring_dispatch_gem_execbuffer,
  683. };
  684. static void gen6_bsd_ring_write_tail(struct drm_device *dev,
  685. struct intel_ring_buffer *ring,
  686. u32 value)
  687. {
  688. drm_i915_private_t *dev_priv = dev->dev_private;
  689. /* Every tail move must follow the sequence below */
  690. I915_WRITE(GEN6_BSD_SLEEP_PSMI_CONTROL,
  691. GEN6_BSD_SLEEP_PSMI_CONTROL_RC_ILDL_MESSAGE_MODIFY_MASK |
  692. GEN6_BSD_SLEEP_PSMI_CONTROL_RC_ILDL_MESSAGE_DISABLE);
  693. I915_WRITE(GEN6_BSD_RNCID, 0x0);
  694. if (wait_for((I915_READ(GEN6_BSD_SLEEP_PSMI_CONTROL) &
  695. GEN6_BSD_SLEEP_PSMI_CONTROL_IDLE_INDICATOR) == 0,
  696. 50))
  697. DRM_ERROR("timed out waiting for IDLE Indicator\n");
  698. I915_WRITE_TAIL(ring, value);
  699. I915_WRITE(GEN6_BSD_SLEEP_PSMI_CONTROL,
  700. GEN6_BSD_SLEEP_PSMI_CONTROL_RC_ILDL_MESSAGE_MODIFY_MASK |
  701. GEN6_BSD_SLEEP_PSMI_CONTROL_RC_ILDL_MESSAGE_ENABLE);
  702. }
  703. static void gen6_ring_flush(struct drm_device *dev,
  704. struct intel_ring_buffer *ring,
  705. u32 invalidate_domains,
  706. u32 flush_domains)
  707. {
  708. intel_ring_begin(dev, ring, 4);
  709. intel_ring_emit(dev, ring, MI_FLUSH_DW);
  710. intel_ring_emit(dev, ring, 0);
  711. intel_ring_emit(dev, ring, 0);
  712. intel_ring_emit(dev, ring, 0);
  713. intel_ring_advance(dev, ring);
  714. }
  715. static int
  716. gen6_ring_dispatch_gem_execbuffer(struct drm_device *dev,
  717. struct intel_ring_buffer *ring,
  718. struct drm_i915_gem_execbuffer2 *exec,
  719. struct drm_clip_rect *cliprects,
  720. uint64_t exec_offset)
  721. {
  722. uint32_t exec_start;
  723. exec_start = (uint32_t) exec_offset + exec->batch_start_offset;
  724. intel_ring_begin(dev, ring, 2);
  725. intel_ring_emit(dev, ring,
  726. MI_BATCH_BUFFER_START | MI_BATCH_NON_SECURE_I965);
  727. /* bit0-7 is the length on GEN6+ */
  728. intel_ring_emit(dev, ring, exec_start);
  729. intel_ring_advance(dev, ring);
  730. return 0;
  731. }
  732. /* ring buffer for Video Codec for Gen6+ */
  733. static const struct intel_ring_buffer gen6_bsd_ring = {
  734. .name = "gen6 bsd ring",
  735. .id = RING_BSD,
  736. .mmio_base = GEN6_BSD_RING_BASE,
  737. .size = 32 * PAGE_SIZE,
  738. .init = init_bsd_ring,
  739. .write_tail = gen6_bsd_ring_write_tail,
  740. .flush = gen6_ring_flush,
  741. .add_request = ring_add_request,
  742. .get_seqno = ring_status_page_get_seqno,
  743. .user_irq_get = bsd_ring_get_user_irq,
  744. .user_irq_put = bsd_ring_put_user_irq,
  745. .dispatch_gem_execbuffer = gen6_ring_dispatch_gem_execbuffer,
  746. };
  747. /* Blitter support (SandyBridge+) */
  748. static void
  749. blt_ring_get_user_irq(struct drm_device *dev,
  750. struct intel_ring_buffer *ring)
  751. {
  752. /* do nothing */
  753. }
  754. static void
  755. blt_ring_put_user_irq(struct drm_device *dev,
  756. struct intel_ring_buffer *ring)
  757. {
  758. /* do nothing */
  759. }
  760. /* Workaround for some stepping of SNB,
  761. * each time when BLT engine ring tail moved,
  762. * the first command in the ring to be parsed
  763. * should be MI_BATCH_BUFFER_START
  764. */
  765. #define NEED_BLT_WORKAROUND(dev) \
  766. (IS_GEN6(dev) && (dev->pdev->revision < 8))
  767. static inline struct drm_i915_gem_object *
  768. to_blt_workaround(struct intel_ring_buffer *ring)
  769. {
  770. return ring->private;
  771. }
  772. static int blt_ring_init(struct drm_device *dev,
  773. struct intel_ring_buffer *ring)
  774. {
  775. if (NEED_BLT_WORKAROUND(dev)) {
  776. struct drm_i915_gem_object *obj;
  777. u32 __iomem *ptr;
  778. int ret;
  779. obj = to_intel_bo(i915_gem_alloc_object(dev, 4096));
  780. if (obj == NULL)
  781. return -ENOMEM;
  782. ret = i915_gem_object_pin(&obj->base, 4096);
  783. if (ret) {
  784. drm_gem_object_unreference(&obj->base);
  785. return ret;
  786. }
  787. ptr = kmap(obj->pages[0]);
  788. iowrite32(MI_BATCH_BUFFER_END, ptr);
  789. iowrite32(MI_NOOP, ptr+1);
  790. kunmap(obj->pages[0]);
  791. ret = i915_gem_object_set_to_gtt_domain(&obj->base, false);
  792. if (ret) {
  793. i915_gem_object_unpin(&obj->base);
  794. drm_gem_object_unreference(&obj->base);
  795. return ret;
  796. }
  797. ring->private = obj;
  798. }
  799. return init_ring_common(dev, ring);
  800. }
  801. static void blt_ring_begin(struct drm_device *dev,
  802. struct intel_ring_buffer *ring,
  803. int num_dwords)
  804. {
  805. if (ring->private) {
  806. intel_ring_begin(dev, ring, num_dwords+2);
  807. intel_ring_emit(dev, ring, MI_BATCH_BUFFER_START);
  808. intel_ring_emit(dev, ring, to_blt_workaround(ring)->gtt_offset);
  809. } else
  810. intel_ring_begin(dev, ring, 4);
  811. }
  812. static void blt_ring_flush(struct drm_device *dev,
  813. struct intel_ring_buffer *ring,
  814. u32 invalidate_domains,
  815. u32 flush_domains)
  816. {
  817. blt_ring_begin(dev, ring, 4);
  818. intel_ring_emit(dev, ring, MI_FLUSH_DW);
  819. intel_ring_emit(dev, ring, 0);
  820. intel_ring_emit(dev, ring, 0);
  821. intel_ring_emit(dev, ring, 0);
  822. intel_ring_advance(dev, ring);
  823. }
  824. static u32
  825. blt_ring_add_request(struct drm_device *dev,
  826. struct intel_ring_buffer *ring,
  827. u32 flush_domains)
  828. {
  829. u32 seqno = i915_gem_get_seqno(dev);
  830. blt_ring_begin(dev, ring, 4);
  831. intel_ring_emit(dev, ring, MI_STORE_DWORD_INDEX);
  832. intel_ring_emit(dev, ring,
  833. I915_GEM_HWS_INDEX << MI_STORE_DWORD_INDEX_SHIFT);
  834. intel_ring_emit(dev, ring, seqno);
  835. intel_ring_emit(dev, ring, MI_USER_INTERRUPT);
  836. intel_ring_advance(dev, ring);
  837. DRM_DEBUG_DRIVER("%s %d\n", ring->name, seqno);
  838. return seqno;
  839. }
  840. static void blt_ring_cleanup(struct intel_ring_buffer *ring)
  841. {
  842. if (!ring->private)
  843. return;
  844. i915_gem_object_unpin(ring->private);
  845. drm_gem_object_unreference(ring->private);
  846. ring->private = NULL;
  847. }
  848. static const struct intel_ring_buffer gen6_blt_ring = {
  849. .name = "blt ring",
  850. .id = RING_BLT,
  851. .mmio_base = BLT_RING_BASE,
  852. .size = 32 * PAGE_SIZE,
  853. .init = blt_ring_init,
  854. .write_tail = ring_write_tail,
  855. .flush = blt_ring_flush,
  856. .add_request = blt_ring_add_request,
  857. .get_seqno = ring_status_page_get_seqno,
  858. .user_irq_get = blt_ring_get_user_irq,
  859. .user_irq_put = blt_ring_put_user_irq,
  860. .dispatch_gem_execbuffer = gen6_ring_dispatch_gem_execbuffer,
  861. .cleanup = blt_ring_cleanup,
  862. };
  863. int intel_init_render_ring_buffer(struct drm_device *dev)
  864. {
  865. drm_i915_private_t *dev_priv = dev->dev_private;
  866. dev_priv->render_ring = render_ring;
  867. if (!I915_NEED_GFX_HWS(dev)) {
  868. dev_priv->render_ring.status_page.page_addr
  869. = dev_priv->status_page_dmah->vaddr;
  870. memset(dev_priv->render_ring.status_page.page_addr,
  871. 0, PAGE_SIZE);
  872. }
  873. return intel_init_ring_buffer(dev, &dev_priv->render_ring);
  874. }
  875. int intel_init_bsd_ring_buffer(struct drm_device *dev)
  876. {
  877. drm_i915_private_t *dev_priv = dev->dev_private;
  878. if (IS_GEN6(dev))
  879. dev_priv->bsd_ring = gen6_bsd_ring;
  880. else
  881. dev_priv->bsd_ring = bsd_ring;
  882. return intel_init_ring_buffer(dev, &dev_priv->bsd_ring);
  883. }
  884. int intel_init_blt_ring_buffer(struct drm_device *dev)
  885. {
  886. drm_i915_private_t *dev_priv = dev->dev_private;
  887. dev_priv->blt_ring = gen6_blt_ring;
  888. return intel_init_ring_buffer(dev, &dev_priv->blt_ring);
  889. }