intel_ringbuffer.c 34 KB

1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253545556575859606162636465666768697071727374757677787980818283848586878889909192939495969798991001011021031041051061071081091101111121131141151161171181191201211221231241251261271281291301311321331341351361371381391401411421431441451461471481491501511521531541551561571581591601611621631641651661671681691701711721731741751761771781791801811821831841851861871881891901911921931941951961971981992002012022032042052062072082092102112122132142152162172182192202212222232242252262272282292302312322332342352362372382392402412422432442452462472482492502512522532542552562572582592602612622632642652662672682692702712722732742752762772782792802812822832842852862872882892902912922932942952962972982993003013023033043053063073083093103113123133143153163173183193203213223233243253263273283293303313323333343353363373383393403413423433443453463473483493503513523533543553563573583593603613623633643653663673683693703713723733743753763773783793803813823833843853863873883893903913923933943953963973983994004014024034044054064074084094104114124134144154164174184194204214224234244254264274284294304314324334344354364374384394404414424434444454464474484494504514524534544554564574584594604614624634644654664674684694704714724734744754764774784794804814824834844854864874884894904914924934944954964974984995005015025035045055065075085095105115125135145155165175185195205215225235245255265275285295305315325335345355365375385395405415425435445455465475485495505515525535545555565575585595605615625635645655665675685695705715725735745755765775785795805815825835845855865875885895905915925935945955965975985996006016026036046056066076086096106116126136146156166176186196206216226236246256266276286296306316326336346356366376386396406416426436446456466476486496506516526536546556566576586596606616626636646656666676686696706716726736746756766776786796806816826836846856866876886896906916926936946956966976986997007017027037047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127712781279128012811282128312841285128612871288128912901291129212931294129512961297129812991300130113021303130413051306130713081309131013111312131313141315131613171318131913201321132213231324132513261327132813291330133113321333133413351336133713381339134013411342134313441345134613471348134913501351135213531354135513561357135813591360136113621363136413651366136713681369137013711372137313741375137613771378137913801381138213831384138513861387138813891390139113921393139413951396139713981399140014011402140314041405140614071408140914101411141214131414141514161417141814191420142114221423142414251426142714281429143014311432143314341435143614371438143914401441144214431444
  1. /*
  2. * Copyright © 2008-2010 Intel Corporation
  3. *
  4. * Permission is hereby granted, free of charge, to any person obtaining a
  5. * copy of this software and associated documentation files (the "Software"),
  6. * to deal in the Software without restriction, including without limitation
  7. * the rights to use, copy, modify, merge, publish, distribute, sublicense,
  8. * and/or sell copies of the Software, and to permit persons to whom the
  9. * Software is furnished to do so, subject to the following conditions:
  10. *
  11. * The above copyright notice and this permission notice (including the next
  12. * paragraph) shall be included in all copies or substantial portions of the
  13. * Software.
  14. *
  15. * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
  16. * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
  17. * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
  18. * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
  19. * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
  20. * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
  21. * IN THE SOFTWARE.
  22. *
  23. * Authors:
  24. * Eric Anholt <eric@anholt.net>
  25. * Zou Nan hai <nanhai.zou@intel.com>
  26. * Xiang Hai hao<haihao.xiang@intel.com>
  27. *
  28. */
  29. #include "drmP.h"
  30. #include "drm.h"
  31. #include "i915_drv.h"
  32. #include "i915_drm.h"
  33. #include "i915_trace.h"
  34. #include "intel_drv.h"
  35. static inline int ring_space(struct intel_ring_buffer *ring)
  36. {
  37. int space = (ring->head & HEAD_ADDR) - (ring->tail + 8);
  38. if (space < 0)
  39. space += ring->size;
  40. return space;
  41. }
  42. static u32 i915_gem_get_seqno(struct drm_device *dev)
  43. {
  44. drm_i915_private_t *dev_priv = dev->dev_private;
  45. u32 seqno;
  46. seqno = dev_priv->next_seqno;
  47. /* reserve 0 for non-seqno */
  48. if (++dev_priv->next_seqno == 0)
  49. dev_priv->next_seqno = 1;
  50. return seqno;
  51. }
  52. static int
  53. render_ring_flush(struct intel_ring_buffer *ring,
  54. u32 invalidate_domains,
  55. u32 flush_domains)
  56. {
  57. struct drm_device *dev = ring->dev;
  58. u32 cmd;
  59. int ret;
  60. /*
  61. * read/write caches:
  62. *
  63. * I915_GEM_DOMAIN_RENDER is always invalidated, but is
  64. * only flushed if MI_NO_WRITE_FLUSH is unset. On 965, it is
  65. * also flushed at 2d versus 3d pipeline switches.
  66. *
  67. * read-only caches:
  68. *
  69. * I915_GEM_DOMAIN_SAMPLER is flushed on pre-965 if
  70. * MI_READ_FLUSH is set, and is always flushed on 965.
  71. *
  72. * I915_GEM_DOMAIN_COMMAND may not exist?
  73. *
  74. * I915_GEM_DOMAIN_INSTRUCTION, which exists on 965, is
  75. * invalidated when MI_EXE_FLUSH is set.
  76. *
  77. * I915_GEM_DOMAIN_VERTEX, which exists on 965, is
  78. * invalidated with every MI_FLUSH.
  79. *
  80. * TLBs:
  81. *
  82. * On 965, TLBs associated with I915_GEM_DOMAIN_COMMAND
  83. * and I915_GEM_DOMAIN_CPU in are invalidated at PTE write and
  84. * I915_GEM_DOMAIN_RENDER and I915_GEM_DOMAIN_SAMPLER
  85. * are flushed at any MI_FLUSH.
  86. */
  87. cmd = MI_FLUSH | MI_NO_WRITE_FLUSH;
  88. if ((invalidate_domains|flush_domains) &
  89. I915_GEM_DOMAIN_RENDER)
  90. cmd &= ~MI_NO_WRITE_FLUSH;
  91. if (INTEL_INFO(dev)->gen < 4) {
  92. /*
  93. * On the 965, the sampler cache always gets flushed
  94. * and this bit is reserved.
  95. */
  96. if (invalidate_domains & I915_GEM_DOMAIN_SAMPLER)
  97. cmd |= MI_READ_FLUSH;
  98. }
  99. if (invalidate_domains & I915_GEM_DOMAIN_INSTRUCTION)
  100. cmd |= MI_EXE_FLUSH;
  101. if (invalidate_domains & I915_GEM_DOMAIN_COMMAND &&
  102. (IS_G4X(dev) || IS_GEN5(dev)))
  103. cmd |= MI_INVALIDATE_ISP;
  104. ret = intel_ring_begin(ring, 2);
  105. if (ret)
  106. return ret;
  107. intel_ring_emit(ring, cmd);
  108. intel_ring_emit(ring, MI_NOOP);
  109. intel_ring_advance(ring);
  110. return 0;
  111. }
  112. static void ring_write_tail(struct intel_ring_buffer *ring,
  113. u32 value)
  114. {
  115. drm_i915_private_t *dev_priv = ring->dev->dev_private;
  116. I915_WRITE_TAIL(ring, value);
  117. }
  118. u32 intel_ring_get_active_head(struct intel_ring_buffer *ring)
  119. {
  120. drm_i915_private_t *dev_priv = ring->dev->dev_private;
  121. u32 acthd_reg = INTEL_INFO(ring->dev)->gen >= 4 ?
  122. RING_ACTHD(ring->mmio_base) : ACTHD;
  123. return I915_READ(acthd_reg);
  124. }
  125. static int init_ring_common(struct intel_ring_buffer *ring)
  126. {
  127. drm_i915_private_t *dev_priv = ring->dev->dev_private;
  128. struct drm_i915_gem_object *obj = ring->obj;
  129. u32 head;
  130. /* Stop the ring if it's running. */
  131. I915_WRITE_CTL(ring, 0);
  132. I915_WRITE_HEAD(ring, 0);
  133. ring->write_tail(ring, 0);
  134. /* Initialize the ring. */
  135. I915_WRITE_START(ring, obj->gtt_offset);
  136. head = I915_READ_HEAD(ring) & HEAD_ADDR;
  137. /* G45 ring initialization fails to reset head to zero */
  138. if (head != 0) {
  139. DRM_DEBUG_KMS("%s head not reset to zero "
  140. "ctl %08x head %08x tail %08x start %08x\n",
  141. ring->name,
  142. I915_READ_CTL(ring),
  143. I915_READ_HEAD(ring),
  144. I915_READ_TAIL(ring),
  145. I915_READ_START(ring));
  146. I915_WRITE_HEAD(ring, 0);
  147. if (I915_READ_HEAD(ring) & HEAD_ADDR) {
  148. DRM_ERROR("failed to set %s head to zero "
  149. "ctl %08x head %08x tail %08x start %08x\n",
  150. ring->name,
  151. I915_READ_CTL(ring),
  152. I915_READ_HEAD(ring),
  153. I915_READ_TAIL(ring),
  154. I915_READ_START(ring));
  155. }
  156. }
  157. I915_WRITE_CTL(ring,
  158. ((ring->size - PAGE_SIZE) & RING_NR_PAGES)
  159. | RING_REPORT_64K | RING_VALID);
  160. /* If the head is still not zero, the ring is dead */
  161. if ((I915_READ_CTL(ring) & RING_VALID) == 0 ||
  162. I915_READ_START(ring) != obj->gtt_offset ||
  163. (I915_READ_HEAD(ring) & HEAD_ADDR) != 0) {
  164. DRM_ERROR("%s initialization failed "
  165. "ctl %08x head %08x tail %08x start %08x\n",
  166. ring->name,
  167. I915_READ_CTL(ring),
  168. I915_READ_HEAD(ring),
  169. I915_READ_TAIL(ring),
  170. I915_READ_START(ring));
  171. return -EIO;
  172. }
  173. if (!drm_core_check_feature(ring->dev, DRIVER_MODESET))
  174. i915_kernel_lost_context(ring->dev);
  175. else {
  176. ring->head = I915_READ_HEAD(ring);
  177. ring->tail = I915_READ_TAIL(ring) & TAIL_ADDR;
  178. ring->space = ring_space(ring);
  179. }
  180. return 0;
  181. }
  182. /*
  183. * 965+ support PIPE_CONTROL commands, which provide finer grained control
  184. * over cache flushing.
  185. */
  186. struct pipe_control {
  187. struct drm_i915_gem_object *obj;
  188. volatile u32 *cpu_page;
  189. u32 gtt_offset;
  190. };
  191. static int
  192. init_pipe_control(struct intel_ring_buffer *ring)
  193. {
  194. struct pipe_control *pc;
  195. struct drm_i915_gem_object *obj;
  196. int ret;
  197. if (ring->private)
  198. return 0;
  199. pc = kmalloc(sizeof(*pc), GFP_KERNEL);
  200. if (!pc)
  201. return -ENOMEM;
  202. obj = i915_gem_alloc_object(ring->dev, 4096);
  203. if (obj == NULL) {
  204. DRM_ERROR("Failed to allocate seqno page\n");
  205. ret = -ENOMEM;
  206. goto err;
  207. }
  208. i915_gem_object_set_cache_level(obj, I915_CACHE_LLC);
  209. ret = i915_gem_object_pin(obj, 4096, true);
  210. if (ret)
  211. goto err_unref;
  212. pc->gtt_offset = obj->gtt_offset;
  213. pc->cpu_page = kmap(obj->pages[0]);
  214. if (pc->cpu_page == NULL)
  215. goto err_unpin;
  216. pc->obj = obj;
  217. ring->private = pc;
  218. return 0;
  219. err_unpin:
  220. i915_gem_object_unpin(obj);
  221. err_unref:
  222. drm_gem_object_unreference(&obj->base);
  223. err:
  224. kfree(pc);
  225. return ret;
  226. }
  227. static void
  228. cleanup_pipe_control(struct intel_ring_buffer *ring)
  229. {
  230. struct pipe_control *pc = ring->private;
  231. struct drm_i915_gem_object *obj;
  232. if (!ring->private)
  233. return;
  234. obj = pc->obj;
  235. kunmap(obj->pages[0]);
  236. i915_gem_object_unpin(obj);
  237. drm_gem_object_unreference(&obj->base);
  238. kfree(pc);
  239. ring->private = NULL;
  240. }
  241. static int init_render_ring(struct intel_ring_buffer *ring)
  242. {
  243. struct drm_device *dev = ring->dev;
  244. struct drm_i915_private *dev_priv = dev->dev_private;
  245. int ret = init_ring_common(ring);
  246. if (INTEL_INFO(dev)->gen > 3) {
  247. int mode = VS_TIMER_DISPATCH << 16 | VS_TIMER_DISPATCH;
  248. if (IS_GEN6(dev) || IS_GEN7(dev))
  249. mode |= MI_FLUSH_ENABLE << 16 | MI_FLUSH_ENABLE;
  250. I915_WRITE(MI_MODE, mode);
  251. if (IS_GEN7(dev))
  252. I915_WRITE(GFX_MODE_GEN7,
  253. GFX_MODE_DISABLE(GFX_TLB_INVALIDATE_ALWAYS) |
  254. GFX_MODE_ENABLE(GFX_REPLAY_MODE));
  255. }
  256. if (INTEL_INFO(dev)->gen >= 6) {
  257. } else if (IS_GEN5(dev)) {
  258. ret = init_pipe_control(ring);
  259. if (ret)
  260. return ret;
  261. }
  262. return ret;
  263. }
  264. static void render_ring_cleanup(struct intel_ring_buffer *ring)
  265. {
  266. if (!ring->private)
  267. return;
  268. cleanup_pipe_control(ring);
  269. }
  270. static void
  271. update_mboxes(struct intel_ring_buffer *ring,
  272. u32 seqno,
  273. u32 mmio_offset)
  274. {
  275. intel_ring_emit(ring, MI_SEMAPHORE_MBOX |
  276. MI_SEMAPHORE_GLOBAL_GTT |
  277. MI_SEMAPHORE_REGISTER |
  278. MI_SEMAPHORE_UPDATE);
  279. intel_ring_emit(ring, seqno);
  280. intel_ring_emit(ring, mmio_offset);
  281. }
  282. /**
  283. * gen6_add_request - Update the semaphore mailbox registers
  284. *
  285. * @ring - ring that is adding a request
  286. * @seqno - return seqno stuck into the ring
  287. *
  288. * Update the mailbox registers in the *other* rings with the current seqno.
  289. * This acts like a signal in the canonical semaphore.
  290. */
  291. static int
  292. gen6_add_request(struct intel_ring_buffer *ring,
  293. u32 *seqno)
  294. {
  295. u32 mbox1_reg;
  296. u32 mbox2_reg;
  297. int ret;
  298. ret = intel_ring_begin(ring, 10);
  299. if (ret)
  300. return ret;
  301. mbox1_reg = ring->signal_mbox[0];
  302. mbox2_reg = ring->signal_mbox[1];
  303. *seqno = i915_gem_get_seqno(ring->dev);
  304. update_mboxes(ring, *seqno, mbox1_reg);
  305. update_mboxes(ring, *seqno, mbox2_reg);
  306. intel_ring_emit(ring, MI_STORE_DWORD_INDEX);
  307. intel_ring_emit(ring, I915_GEM_HWS_INDEX << MI_STORE_DWORD_INDEX_SHIFT);
  308. intel_ring_emit(ring, *seqno);
  309. intel_ring_emit(ring, MI_USER_INTERRUPT);
  310. intel_ring_advance(ring);
  311. return 0;
  312. }
  313. /**
  314. * intel_ring_sync - sync the waiter to the signaller on seqno
  315. *
  316. * @waiter - ring that is waiting
  317. * @signaller - ring which has, or will signal
  318. * @seqno - seqno which the waiter will block on
  319. */
  320. static int
  321. intel_ring_sync(struct intel_ring_buffer *waiter,
  322. struct intel_ring_buffer *signaller,
  323. int ring,
  324. u32 seqno)
  325. {
  326. int ret;
  327. u32 dw1 = MI_SEMAPHORE_MBOX |
  328. MI_SEMAPHORE_COMPARE |
  329. MI_SEMAPHORE_REGISTER;
  330. ret = intel_ring_begin(waiter, 4);
  331. if (ret)
  332. return ret;
  333. intel_ring_emit(waiter, dw1 | signaller->semaphore_register[ring]);
  334. intel_ring_emit(waiter, seqno);
  335. intel_ring_emit(waiter, 0);
  336. intel_ring_emit(waiter, MI_NOOP);
  337. intel_ring_advance(waiter);
  338. return 0;
  339. }
  340. /* VCS->RCS (RVSYNC) or BCS->RCS (RBSYNC) */
  341. int
  342. render_ring_sync_to(struct intel_ring_buffer *waiter,
  343. struct intel_ring_buffer *signaller,
  344. u32 seqno)
  345. {
  346. WARN_ON(signaller->semaphore_register[RCS] == MI_SEMAPHORE_SYNC_INVALID);
  347. return intel_ring_sync(waiter,
  348. signaller,
  349. RCS,
  350. seqno);
  351. }
  352. /* RCS->VCS (VRSYNC) or BCS->VCS (VBSYNC) */
  353. int
  354. gen6_bsd_ring_sync_to(struct intel_ring_buffer *waiter,
  355. struct intel_ring_buffer *signaller,
  356. u32 seqno)
  357. {
  358. WARN_ON(signaller->semaphore_register[VCS] == MI_SEMAPHORE_SYNC_INVALID);
  359. return intel_ring_sync(waiter,
  360. signaller,
  361. VCS,
  362. seqno);
  363. }
  364. /* RCS->BCS (BRSYNC) or VCS->BCS (BVSYNC) */
  365. int
  366. gen6_blt_ring_sync_to(struct intel_ring_buffer *waiter,
  367. struct intel_ring_buffer *signaller,
  368. u32 seqno)
  369. {
  370. WARN_ON(signaller->semaphore_register[BCS] == MI_SEMAPHORE_SYNC_INVALID);
  371. return intel_ring_sync(waiter,
  372. signaller,
  373. BCS,
  374. seqno);
  375. }
  376. #define PIPE_CONTROL_FLUSH(ring__, addr__) \
  377. do { \
  378. intel_ring_emit(ring__, GFX_OP_PIPE_CONTROL(4) | PIPE_CONTROL_QW_WRITE | \
  379. PIPE_CONTROL_DEPTH_STALL); \
  380. intel_ring_emit(ring__, (addr__) | PIPE_CONTROL_GLOBAL_GTT); \
  381. intel_ring_emit(ring__, 0); \
  382. intel_ring_emit(ring__, 0); \
  383. } while (0)
  384. static int
  385. pc_render_add_request(struct intel_ring_buffer *ring,
  386. u32 *result)
  387. {
  388. struct drm_device *dev = ring->dev;
  389. u32 seqno = i915_gem_get_seqno(dev);
  390. struct pipe_control *pc = ring->private;
  391. u32 scratch_addr = pc->gtt_offset + 128;
  392. int ret;
  393. /* For Ironlake, MI_USER_INTERRUPT was deprecated and apparently
  394. * incoherent with writes to memory, i.e. completely fubar,
  395. * so we need to use PIPE_NOTIFY instead.
  396. *
  397. * However, we also need to workaround the qword write
  398. * incoherence by flushing the 6 PIPE_NOTIFY buffers out to
  399. * memory before requesting an interrupt.
  400. */
  401. ret = intel_ring_begin(ring, 32);
  402. if (ret)
  403. return ret;
  404. intel_ring_emit(ring, GFX_OP_PIPE_CONTROL(4) | PIPE_CONTROL_QW_WRITE |
  405. PIPE_CONTROL_WRITE_FLUSH |
  406. PIPE_CONTROL_TEXTURE_CACHE_INVALIDATE);
  407. intel_ring_emit(ring, pc->gtt_offset | PIPE_CONTROL_GLOBAL_GTT);
  408. intel_ring_emit(ring, seqno);
  409. intel_ring_emit(ring, 0);
  410. PIPE_CONTROL_FLUSH(ring, scratch_addr);
  411. scratch_addr += 128; /* write to separate cachelines */
  412. PIPE_CONTROL_FLUSH(ring, scratch_addr);
  413. scratch_addr += 128;
  414. PIPE_CONTROL_FLUSH(ring, scratch_addr);
  415. scratch_addr += 128;
  416. PIPE_CONTROL_FLUSH(ring, scratch_addr);
  417. scratch_addr += 128;
  418. PIPE_CONTROL_FLUSH(ring, scratch_addr);
  419. scratch_addr += 128;
  420. PIPE_CONTROL_FLUSH(ring, scratch_addr);
  421. intel_ring_emit(ring, GFX_OP_PIPE_CONTROL(4) | PIPE_CONTROL_QW_WRITE |
  422. PIPE_CONTROL_WRITE_FLUSH |
  423. PIPE_CONTROL_TEXTURE_CACHE_INVALIDATE |
  424. PIPE_CONTROL_NOTIFY);
  425. intel_ring_emit(ring, pc->gtt_offset | PIPE_CONTROL_GLOBAL_GTT);
  426. intel_ring_emit(ring, seqno);
  427. intel_ring_emit(ring, 0);
  428. intel_ring_advance(ring);
  429. *result = seqno;
  430. return 0;
  431. }
  432. static int
  433. render_ring_add_request(struct intel_ring_buffer *ring,
  434. u32 *result)
  435. {
  436. struct drm_device *dev = ring->dev;
  437. u32 seqno = i915_gem_get_seqno(dev);
  438. int ret;
  439. ret = intel_ring_begin(ring, 4);
  440. if (ret)
  441. return ret;
  442. intel_ring_emit(ring, MI_STORE_DWORD_INDEX);
  443. intel_ring_emit(ring, I915_GEM_HWS_INDEX << MI_STORE_DWORD_INDEX_SHIFT);
  444. intel_ring_emit(ring, seqno);
  445. intel_ring_emit(ring, MI_USER_INTERRUPT);
  446. intel_ring_advance(ring);
  447. *result = seqno;
  448. return 0;
  449. }
  450. static u32
  451. ring_get_seqno(struct intel_ring_buffer *ring)
  452. {
  453. return intel_read_status_page(ring, I915_GEM_HWS_INDEX);
  454. }
  455. static u32
  456. pc_render_get_seqno(struct intel_ring_buffer *ring)
  457. {
  458. struct pipe_control *pc = ring->private;
  459. return pc->cpu_page[0];
  460. }
  461. static void
  462. ironlake_enable_irq(drm_i915_private_t *dev_priv, u32 mask)
  463. {
  464. dev_priv->gt_irq_mask &= ~mask;
  465. I915_WRITE(GTIMR, dev_priv->gt_irq_mask);
  466. POSTING_READ(GTIMR);
  467. }
  468. static void
  469. ironlake_disable_irq(drm_i915_private_t *dev_priv, u32 mask)
  470. {
  471. dev_priv->gt_irq_mask |= mask;
  472. I915_WRITE(GTIMR, dev_priv->gt_irq_mask);
  473. POSTING_READ(GTIMR);
  474. }
  475. static void
  476. i915_enable_irq(drm_i915_private_t *dev_priv, u32 mask)
  477. {
  478. dev_priv->irq_mask &= ~mask;
  479. I915_WRITE(IMR, dev_priv->irq_mask);
  480. POSTING_READ(IMR);
  481. }
  482. static void
  483. i915_disable_irq(drm_i915_private_t *dev_priv, u32 mask)
  484. {
  485. dev_priv->irq_mask |= mask;
  486. I915_WRITE(IMR, dev_priv->irq_mask);
  487. POSTING_READ(IMR);
  488. }
  489. static bool
  490. render_ring_get_irq(struct intel_ring_buffer *ring)
  491. {
  492. struct drm_device *dev = ring->dev;
  493. drm_i915_private_t *dev_priv = dev->dev_private;
  494. if (!dev->irq_enabled)
  495. return false;
  496. spin_lock(&ring->irq_lock);
  497. if (ring->irq_refcount++ == 0) {
  498. if (HAS_PCH_SPLIT(dev))
  499. ironlake_enable_irq(dev_priv,
  500. GT_PIPE_NOTIFY | GT_USER_INTERRUPT);
  501. else
  502. i915_enable_irq(dev_priv, I915_USER_INTERRUPT);
  503. }
  504. spin_unlock(&ring->irq_lock);
  505. return true;
  506. }
  507. static void
  508. render_ring_put_irq(struct intel_ring_buffer *ring)
  509. {
  510. struct drm_device *dev = ring->dev;
  511. drm_i915_private_t *dev_priv = dev->dev_private;
  512. spin_lock(&ring->irq_lock);
  513. if (--ring->irq_refcount == 0) {
  514. if (HAS_PCH_SPLIT(dev))
  515. ironlake_disable_irq(dev_priv,
  516. GT_USER_INTERRUPT |
  517. GT_PIPE_NOTIFY);
  518. else
  519. i915_disable_irq(dev_priv, I915_USER_INTERRUPT);
  520. }
  521. spin_unlock(&ring->irq_lock);
  522. }
  523. void intel_ring_setup_status_page(struct intel_ring_buffer *ring)
  524. {
  525. struct drm_device *dev = ring->dev;
  526. drm_i915_private_t *dev_priv = ring->dev->dev_private;
  527. u32 mmio = 0;
  528. /* The ring status page addresses are no longer next to the rest of
  529. * the ring registers as of gen7.
  530. */
  531. if (IS_GEN7(dev)) {
  532. switch (ring->id) {
  533. case RING_RENDER:
  534. mmio = RENDER_HWS_PGA_GEN7;
  535. break;
  536. case RING_BLT:
  537. mmio = BLT_HWS_PGA_GEN7;
  538. break;
  539. case RING_BSD:
  540. mmio = BSD_HWS_PGA_GEN7;
  541. break;
  542. }
  543. } else if (IS_GEN6(ring->dev)) {
  544. mmio = RING_HWS_PGA_GEN6(ring->mmio_base);
  545. } else {
  546. mmio = RING_HWS_PGA(ring->mmio_base);
  547. }
  548. I915_WRITE(mmio, (u32)ring->status_page.gfx_addr);
  549. POSTING_READ(mmio);
  550. }
  551. static int
  552. bsd_ring_flush(struct intel_ring_buffer *ring,
  553. u32 invalidate_domains,
  554. u32 flush_domains)
  555. {
  556. int ret;
  557. ret = intel_ring_begin(ring, 2);
  558. if (ret)
  559. return ret;
  560. intel_ring_emit(ring, MI_FLUSH);
  561. intel_ring_emit(ring, MI_NOOP);
  562. intel_ring_advance(ring);
  563. return 0;
  564. }
  565. static int
  566. ring_add_request(struct intel_ring_buffer *ring,
  567. u32 *result)
  568. {
  569. u32 seqno;
  570. int ret;
  571. ret = intel_ring_begin(ring, 4);
  572. if (ret)
  573. return ret;
  574. seqno = i915_gem_get_seqno(ring->dev);
  575. intel_ring_emit(ring, MI_STORE_DWORD_INDEX);
  576. intel_ring_emit(ring, I915_GEM_HWS_INDEX << MI_STORE_DWORD_INDEX_SHIFT);
  577. intel_ring_emit(ring, seqno);
  578. intel_ring_emit(ring, MI_USER_INTERRUPT);
  579. intel_ring_advance(ring);
  580. *result = seqno;
  581. return 0;
  582. }
  583. static bool
  584. gen6_ring_get_irq(struct intel_ring_buffer *ring, u32 gflag, u32 rflag)
  585. {
  586. struct drm_device *dev = ring->dev;
  587. drm_i915_private_t *dev_priv = dev->dev_private;
  588. if (!dev->irq_enabled)
  589. return false;
  590. spin_lock(&ring->irq_lock);
  591. if (ring->irq_refcount++ == 0) {
  592. ring->irq_mask &= ~rflag;
  593. I915_WRITE_IMR(ring, ring->irq_mask);
  594. ironlake_enable_irq(dev_priv, gflag);
  595. }
  596. spin_unlock(&ring->irq_lock);
  597. return true;
  598. }
  599. static void
  600. gen6_ring_put_irq(struct intel_ring_buffer *ring, u32 gflag, u32 rflag)
  601. {
  602. struct drm_device *dev = ring->dev;
  603. drm_i915_private_t *dev_priv = dev->dev_private;
  604. spin_lock(&ring->irq_lock);
  605. if (--ring->irq_refcount == 0) {
  606. ring->irq_mask |= rflag;
  607. I915_WRITE_IMR(ring, ring->irq_mask);
  608. ironlake_disable_irq(dev_priv, gflag);
  609. }
  610. spin_unlock(&ring->irq_lock);
  611. }
  612. static bool
  613. bsd_ring_get_irq(struct intel_ring_buffer *ring)
  614. {
  615. struct drm_device *dev = ring->dev;
  616. drm_i915_private_t *dev_priv = dev->dev_private;
  617. if (!dev->irq_enabled)
  618. return false;
  619. spin_lock(&ring->irq_lock);
  620. if (ring->irq_refcount++ == 0) {
  621. if (IS_G4X(dev))
  622. i915_enable_irq(dev_priv, I915_BSD_USER_INTERRUPT);
  623. else
  624. ironlake_enable_irq(dev_priv, GT_BSD_USER_INTERRUPT);
  625. }
  626. spin_unlock(&ring->irq_lock);
  627. return true;
  628. }
  629. static void
  630. bsd_ring_put_irq(struct intel_ring_buffer *ring)
  631. {
  632. struct drm_device *dev = ring->dev;
  633. drm_i915_private_t *dev_priv = dev->dev_private;
  634. spin_lock(&ring->irq_lock);
  635. if (--ring->irq_refcount == 0) {
  636. if (IS_G4X(dev))
  637. i915_disable_irq(dev_priv, I915_BSD_USER_INTERRUPT);
  638. else
  639. ironlake_disable_irq(dev_priv, GT_BSD_USER_INTERRUPT);
  640. }
  641. spin_unlock(&ring->irq_lock);
  642. }
  643. static int
  644. ring_dispatch_execbuffer(struct intel_ring_buffer *ring, u32 offset, u32 length)
  645. {
  646. int ret;
  647. ret = intel_ring_begin(ring, 2);
  648. if (ret)
  649. return ret;
  650. intel_ring_emit(ring,
  651. MI_BATCH_BUFFER_START | (2 << 6) |
  652. MI_BATCH_NON_SECURE_I965);
  653. intel_ring_emit(ring, offset);
  654. intel_ring_advance(ring);
  655. return 0;
  656. }
  657. static int
  658. render_ring_dispatch_execbuffer(struct intel_ring_buffer *ring,
  659. u32 offset, u32 len)
  660. {
  661. struct drm_device *dev = ring->dev;
  662. int ret;
  663. if (IS_I830(dev) || IS_845G(dev)) {
  664. ret = intel_ring_begin(ring, 4);
  665. if (ret)
  666. return ret;
  667. intel_ring_emit(ring, MI_BATCH_BUFFER);
  668. intel_ring_emit(ring, offset | MI_BATCH_NON_SECURE);
  669. intel_ring_emit(ring, offset + len - 8);
  670. intel_ring_emit(ring, 0);
  671. } else {
  672. ret = intel_ring_begin(ring, 2);
  673. if (ret)
  674. return ret;
  675. if (INTEL_INFO(dev)->gen >= 4) {
  676. intel_ring_emit(ring,
  677. MI_BATCH_BUFFER_START | (2 << 6) |
  678. MI_BATCH_NON_SECURE_I965);
  679. intel_ring_emit(ring, offset);
  680. } else {
  681. intel_ring_emit(ring,
  682. MI_BATCH_BUFFER_START | (2 << 6));
  683. intel_ring_emit(ring, offset | MI_BATCH_NON_SECURE);
  684. }
  685. }
  686. intel_ring_advance(ring);
  687. return 0;
  688. }
  689. static void cleanup_status_page(struct intel_ring_buffer *ring)
  690. {
  691. drm_i915_private_t *dev_priv = ring->dev->dev_private;
  692. struct drm_i915_gem_object *obj;
  693. obj = ring->status_page.obj;
  694. if (obj == NULL)
  695. return;
  696. kunmap(obj->pages[0]);
  697. i915_gem_object_unpin(obj);
  698. drm_gem_object_unreference(&obj->base);
  699. ring->status_page.obj = NULL;
  700. memset(&dev_priv->hws_map, 0, sizeof(dev_priv->hws_map));
  701. }
  702. static int init_status_page(struct intel_ring_buffer *ring)
  703. {
  704. struct drm_device *dev = ring->dev;
  705. drm_i915_private_t *dev_priv = dev->dev_private;
  706. struct drm_i915_gem_object *obj;
  707. int ret;
  708. obj = i915_gem_alloc_object(dev, 4096);
  709. if (obj == NULL) {
  710. DRM_ERROR("Failed to allocate status page\n");
  711. ret = -ENOMEM;
  712. goto err;
  713. }
  714. i915_gem_object_set_cache_level(obj, I915_CACHE_LLC);
  715. ret = i915_gem_object_pin(obj, 4096, true);
  716. if (ret != 0) {
  717. goto err_unref;
  718. }
  719. ring->status_page.gfx_addr = obj->gtt_offset;
  720. ring->status_page.page_addr = kmap(obj->pages[0]);
  721. if (ring->status_page.page_addr == NULL) {
  722. memset(&dev_priv->hws_map, 0, sizeof(dev_priv->hws_map));
  723. goto err_unpin;
  724. }
  725. ring->status_page.obj = obj;
  726. memset(ring->status_page.page_addr, 0, PAGE_SIZE);
  727. intel_ring_setup_status_page(ring);
  728. DRM_DEBUG_DRIVER("%s hws offset: 0x%08x\n",
  729. ring->name, ring->status_page.gfx_addr);
  730. return 0;
  731. err_unpin:
  732. i915_gem_object_unpin(obj);
  733. err_unref:
  734. drm_gem_object_unreference(&obj->base);
  735. err:
  736. return ret;
  737. }
  738. int intel_init_ring_buffer(struct drm_device *dev,
  739. struct intel_ring_buffer *ring)
  740. {
  741. struct drm_i915_gem_object *obj;
  742. int ret;
  743. ring->dev = dev;
  744. INIT_LIST_HEAD(&ring->active_list);
  745. INIT_LIST_HEAD(&ring->request_list);
  746. INIT_LIST_HEAD(&ring->gpu_write_list);
  747. init_waitqueue_head(&ring->irq_queue);
  748. spin_lock_init(&ring->irq_lock);
  749. ring->irq_mask = ~0;
  750. if (I915_NEED_GFX_HWS(dev)) {
  751. ret = init_status_page(ring);
  752. if (ret)
  753. return ret;
  754. }
  755. obj = i915_gem_alloc_object(dev, ring->size);
  756. if (obj == NULL) {
  757. DRM_ERROR("Failed to allocate ringbuffer\n");
  758. ret = -ENOMEM;
  759. goto err_hws;
  760. }
  761. ring->obj = obj;
  762. ret = i915_gem_object_pin(obj, PAGE_SIZE, true);
  763. if (ret)
  764. goto err_unref;
  765. ring->map.size = ring->size;
  766. ring->map.offset = dev->agp->base + obj->gtt_offset;
  767. ring->map.type = 0;
  768. ring->map.flags = 0;
  769. ring->map.mtrr = 0;
  770. drm_core_ioremap_wc(&ring->map, dev);
  771. if (ring->map.handle == NULL) {
  772. DRM_ERROR("Failed to map ringbuffer.\n");
  773. ret = -EINVAL;
  774. goto err_unpin;
  775. }
  776. ring->virtual_start = ring->map.handle;
  777. ret = ring->init(ring);
  778. if (ret)
  779. goto err_unmap;
  780. /* Workaround an erratum on the i830 which causes a hang if
  781. * the TAIL pointer points to within the last 2 cachelines
  782. * of the buffer.
  783. */
  784. ring->effective_size = ring->size;
  785. if (IS_I830(ring->dev))
  786. ring->effective_size -= 128;
  787. return 0;
  788. err_unmap:
  789. drm_core_ioremapfree(&ring->map, dev);
  790. err_unpin:
  791. i915_gem_object_unpin(obj);
  792. err_unref:
  793. drm_gem_object_unreference(&obj->base);
  794. ring->obj = NULL;
  795. err_hws:
  796. cleanup_status_page(ring);
  797. return ret;
  798. }
  799. void intel_cleanup_ring_buffer(struct intel_ring_buffer *ring)
  800. {
  801. struct drm_i915_private *dev_priv;
  802. int ret;
  803. if (ring->obj == NULL)
  804. return;
  805. /* Disable the ring buffer. The ring must be idle at this point */
  806. dev_priv = ring->dev->dev_private;
  807. ret = intel_wait_ring_idle(ring);
  808. if (ret)
  809. DRM_ERROR("failed to quiesce %s whilst cleaning up: %d\n",
  810. ring->name, ret);
  811. I915_WRITE_CTL(ring, 0);
  812. drm_core_ioremapfree(&ring->map, ring->dev);
  813. i915_gem_object_unpin(ring->obj);
  814. drm_gem_object_unreference(&ring->obj->base);
  815. ring->obj = NULL;
  816. if (ring->cleanup)
  817. ring->cleanup(ring);
  818. cleanup_status_page(ring);
  819. }
  820. static int intel_wrap_ring_buffer(struct intel_ring_buffer *ring)
  821. {
  822. unsigned int *virt;
  823. int rem = ring->size - ring->tail;
  824. if (ring->space < rem) {
  825. int ret = intel_wait_ring_buffer(ring, rem);
  826. if (ret)
  827. return ret;
  828. }
  829. virt = (unsigned int *)(ring->virtual_start + ring->tail);
  830. rem /= 8;
  831. while (rem--) {
  832. *virt++ = MI_NOOP;
  833. *virt++ = MI_NOOP;
  834. }
  835. ring->tail = 0;
  836. ring->space = ring_space(ring);
  837. return 0;
  838. }
  839. int intel_wait_ring_buffer(struct intel_ring_buffer *ring, int n)
  840. {
  841. struct drm_device *dev = ring->dev;
  842. struct drm_i915_private *dev_priv = dev->dev_private;
  843. unsigned long end;
  844. u32 head;
  845. /* If the reported head position has wrapped or hasn't advanced,
  846. * fallback to the slow and accurate path.
  847. */
  848. head = intel_read_status_page(ring, 4);
  849. if (head > ring->head) {
  850. ring->head = head;
  851. ring->space = ring_space(ring);
  852. if (ring->space >= n)
  853. return 0;
  854. }
  855. trace_i915_ring_wait_begin(ring);
  856. end = jiffies + 3 * HZ;
  857. do {
  858. ring->head = I915_READ_HEAD(ring);
  859. ring->space = ring_space(ring);
  860. if (ring->space >= n) {
  861. trace_i915_ring_wait_end(ring);
  862. return 0;
  863. }
  864. if (dev->primary->master) {
  865. struct drm_i915_master_private *master_priv = dev->primary->master->driver_priv;
  866. if (master_priv->sarea_priv)
  867. master_priv->sarea_priv->perf_boxes |= I915_BOX_WAIT;
  868. }
  869. msleep(1);
  870. if (atomic_read(&dev_priv->mm.wedged))
  871. return -EAGAIN;
  872. } while (!time_after(jiffies, end));
  873. trace_i915_ring_wait_end(ring);
  874. return -EBUSY;
  875. }
  876. int intel_ring_begin(struct intel_ring_buffer *ring,
  877. int num_dwords)
  878. {
  879. struct drm_i915_private *dev_priv = ring->dev->dev_private;
  880. int n = 4*num_dwords;
  881. int ret;
  882. if (unlikely(atomic_read(&dev_priv->mm.wedged)))
  883. return -EIO;
  884. if (unlikely(ring->tail + n > ring->effective_size)) {
  885. ret = intel_wrap_ring_buffer(ring);
  886. if (unlikely(ret))
  887. return ret;
  888. }
  889. if (unlikely(ring->space < n)) {
  890. ret = intel_wait_ring_buffer(ring, n);
  891. if (unlikely(ret))
  892. return ret;
  893. }
  894. ring->space -= n;
  895. return 0;
  896. }
  897. void intel_ring_advance(struct intel_ring_buffer *ring)
  898. {
  899. ring->tail &= ring->size - 1;
  900. ring->write_tail(ring, ring->tail);
  901. }
  902. static const struct intel_ring_buffer render_ring = {
  903. .name = "render ring",
  904. .id = RING_RENDER,
  905. .mmio_base = RENDER_RING_BASE,
  906. .size = 32 * PAGE_SIZE,
  907. .init = init_render_ring,
  908. .write_tail = ring_write_tail,
  909. .flush = render_ring_flush,
  910. .add_request = render_ring_add_request,
  911. .get_seqno = ring_get_seqno,
  912. .irq_get = render_ring_get_irq,
  913. .irq_put = render_ring_put_irq,
  914. .dispatch_execbuffer = render_ring_dispatch_execbuffer,
  915. .cleanup = render_ring_cleanup,
  916. .sync_to = render_ring_sync_to,
  917. .semaphore_register = {MI_SEMAPHORE_SYNC_INVALID,
  918. MI_SEMAPHORE_SYNC_RV,
  919. MI_SEMAPHORE_SYNC_RB},
  920. .signal_mbox = {GEN6_VRSYNC, GEN6_BRSYNC},
  921. };
  922. /* ring buffer for bit-stream decoder */
  923. static const struct intel_ring_buffer bsd_ring = {
  924. .name = "bsd ring",
  925. .id = RING_BSD,
  926. .mmio_base = BSD_RING_BASE,
  927. .size = 32 * PAGE_SIZE,
  928. .init = init_ring_common,
  929. .write_tail = ring_write_tail,
  930. .flush = bsd_ring_flush,
  931. .add_request = ring_add_request,
  932. .get_seqno = ring_get_seqno,
  933. .irq_get = bsd_ring_get_irq,
  934. .irq_put = bsd_ring_put_irq,
  935. .dispatch_execbuffer = ring_dispatch_execbuffer,
  936. };
  937. static void gen6_bsd_ring_write_tail(struct intel_ring_buffer *ring,
  938. u32 value)
  939. {
  940. drm_i915_private_t *dev_priv = ring->dev->dev_private;
  941. /* Every tail move must follow the sequence below */
  942. I915_WRITE(GEN6_BSD_SLEEP_PSMI_CONTROL,
  943. GEN6_BSD_SLEEP_PSMI_CONTROL_RC_ILDL_MESSAGE_MODIFY_MASK |
  944. GEN6_BSD_SLEEP_PSMI_CONTROL_RC_ILDL_MESSAGE_DISABLE);
  945. I915_WRITE(GEN6_BSD_RNCID, 0x0);
  946. if (wait_for((I915_READ(GEN6_BSD_SLEEP_PSMI_CONTROL) &
  947. GEN6_BSD_SLEEP_PSMI_CONTROL_IDLE_INDICATOR) == 0,
  948. 50))
  949. DRM_ERROR("timed out waiting for IDLE Indicator\n");
  950. I915_WRITE_TAIL(ring, value);
  951. I915_WRITE(GEN6_BSD_SLEEP_PSMI_CONTROL,
  952. GEN6_BSD_SLEEP_PSMI_CONTROL_RC_ILDL_MESSAGE_MODIFY_MASK |
  953. GEN6_BSD_SLEEP_PSMI_CONTROL_RC_ILDL_MESSAGE_ENABLE);
  954. }
  955. static int gen6_ring_flush(struct intel_ring_buffer *ring,
  956. u32 invalidate, u32 flush)
  957. {
  958. uint32_t cmd;
  959. int ret;
  960. ret = intel_ring_begin(ring, 4);
  961. if (ret)
  962. return ret;
  963. cmd = MI_FLUSH_DW;
  964. if (invalidate & I915_GEM_GPU_DOMAINS)
  965. cmd |= MI_INVALIDATE_TLB | MI_INVALIDATE_BSD;
  966. intel_ring_emit(ring, cmd);
  967. intel_ring_emit(ring, 0);
  968. intel_ring_emit(ring, 0);
  969. intel_ring_emit(ring, MI_NOOP);
  970. intel_ring_advance(ring);
  971. return 0;
  972. }
  973. static int
  974. gen6_ring_dispatch_execbuffer(struct intel_ring_buffer *ring,
  975. u32 offset, u32 len)
  976. {
  977. int ret;
  978. ret = intel_ring_begin(ring, 2);
  979. if (ret)
  980. return ret;
  981. intel_ring_emit(ring, MI_BATCH_BUFFER_START | MI_BATCH_NON_SECURE_I965);
  982. /* bit0-7 is the length on GEN6+ */
  983. intel_ring_emit(ring, offset);
  984. intel_ring_advance(ring);
  985. return 0;
  986. }
  987. static bool
  988. gen6_render_ring_get_irq(struct intel_ring_buffer *ring)
  989. {
  990. return gen6_ring_get_irq(ring,
  991. GT_USER_INTERRUPT,
  992. GEN6_RENDER_USER_INTERRUPT);
  993. }
  994. static void
  995. gen6_render_ring_put_irq(struct intel_ring_buffer *ring)
  996. {
  997. return gen6_ring_put_irq(ring,
  998. GT_USER_INTERRUPT,
  999. GEN6_RENDER_USER_INTERRUPT);
  1000. }
  1001. static bool
  1002. gen6_bsd_ring_get_irq(struct intel_ring_buffer *ring)
  1003. {
  1004. return gen6_ring_get_irq(ring,
  1005. GT_GEN6_BSD_USER_INTERRUPT,
  1006. GEN6_BSD_USER_INTERRUPT);
  1007. }
  1008. static void
  1009. gen6_bsd_ring_put_irq(struct intel_ring_buffer *ring)
  1010. {
  1011. return gen6_ring_put_irq(ring,
  1012. GT_GEN6_BSD_USER_INTERRUPT,
  1013. GEN6_BSD_USER_INTERRUPT);
  1014. }
  1015. /* ring buffer for Video Codec for Gen6+ */
  1016. static const struct intel_ring_buffer gen6_bsd_ring = {
  1017. .name = "gen6 bsd ring",
  1018. .id = RING_BSD,
  1019. .mmio_base = GEN6_BSD_RING_BASE,
  1020. .size = 32 * PAGE_SIZE,
  1021. .init = init_ring_common,
  1022. .write_tail = gen6_bsd_ring_write_tail,
  1023. .flush = gen6_ring_flush,
  1024. .add_request = gen6_add_request,
  1025. .get_seqno = ring_get_seqno,
  1026. .irq_get = gen6_bsd_ring_get_irq,
  1027. .irq_put = gen6_bsd_ring_put_irq,
  1028. .dispatch_execbuffer = gen6_ring_dispatch_execbuffer,
  1029. .sync_to = gen6_bsd_ring_sync_to,
  1030. .semaphore_register = {MI_SEMAPHORE_SYNC_VR,
  1031. MI_SEMAPHORE_SYNC_INVALID,
  1032. MI_SEMAPHORE_SYNC_VB},
  1033. .signal_mbox = {GEN6_RVSYNC, GEN6_BVSYNC},
  1034. };
  1035. /* Blitter support (SandyBridge+) */
  1036. static bool
  1037. blt_ring_get_irq(struct intel_ring_buffer *ring)
  1038. {
  1039. return gen6_ring_get_irq(ring,
  1040. GT_BLT_USER_INTERRUPT,
  1041. GEN6_BLITTER_USER_INTERRUPT);
  1042. }
  1043. static void
  1044. blt_ring_put_irq(struct intel_ring_buffer *ring)
  1045. {
  1046. gen6_ring_put_irq(ring,
  1047. GT_BLT_USER_INTERRUPT,
  1048. GEN6_BLITTER_USER_INTERRUPT);
  1049. }
  1050. /* Workaround for some stepping of SNB,
  1051. * each time when BLT engine ring tail moved,
  1052. * the first command in the ring to be parsed
  1053. * should be MI_BATCH_BUFFER_START
  1054. */
  1055. #define NEED_BLT_WORKAROUND(dev) \
  1056. (IS_GEN6(dev) && (dev->pdev->revision < 8))
  1057. static inline struct drm_i915_gem_object *
  1058. to_blt_workaround(struct intel_ring_buffer *ring)
  1059. {
  1060. return ring->private;
  1061. }
  1062. static int blt_ring_init(struct intel_ring_buffer *ring)
  1063. {
  1064. if (NEED_BLT_WORKAROUND(ring->dev)) {
  1065. struct drm_i915_gem_object *obj;
  1066. u32 *ptr;
  1067. int ret;
  1068. obj = i915_gem_alloc_object(ring->dev, 4096);
  1069. if (obj == NULL)
  1070. return -ENOMEM;
  1071. ret = i915_gem_object_pin(obj, 4096, true);
  1072. if (ret) {
  1073. drm_gem_object_unreference(&obj->base);
  1074. return ret;
  1075. }
  1076. ptr = kmap(obj->pages[0]);
  1077. *ptr++ = MI_BATCH_BUFFER_END;
  1078. *ptr++ = MI_NOOP;
  1079. kunmap(obj->pages[0]);
  1080. ret = i915_gem_object_set_to_gtt_domain(obj, false);
  1081. if (ret) {
  1082. i915_gem_object_unpin(obj);
  1083. drm_gem_object_unreference(&obj->base);
  1084. return ret;
  1085. }
  1086. ring->private = obj;
  1087. }
  1088. return init_ring_common(ring);
  1089. }
  1090. static int blt_ring_begin(struct intel_ring_buffer *ring,
  1091. int num_dwords)
  1092. {
  1093. if (ring->private) {
  1094. int ret = intel_ring_begin(ring, num_dwords+2);
  1095. if (ret)
  1096. return ret;
  1097. intel_ring_emit(ring, MI_BATCH_BUFFER_START);
  1098. intel_ring_emit(ring, to_blt_workaround(ring)->gtt_offset);
  1099. return 0;
  1100. } else
  1101. return intel_ring_begin(ring, 4);
  1102. }
  1103. static int blt_ring_flush(struct intel_ring_buffer *ring,
  1104. u32 invalidate, u32 flush)
  1105. {
  1106. uint32_t cmd;
  1107. int ret;
  1108. ret = blt_ring_begin(ring, 4);
  1109. if (ret)
  1110. return ret;
  1111. cmd = MI_FLUSH_DW;
  1112. if (invalidate & I915_GEM_DOMAIN_RENDER)
  1113. cmd |= MI_INVALIDATE_TLB;
  1114. intel_ring_emit(ring, cmd);
  1115. intel_ring_emit(ring, 0);
  1116. intel_ring_emit(ring, 0);
  1117. intel_ring_emit(ring, MI_NOOP);
  1118. intel_ring_advance(ring);
  1119. return 0;
  1120. }
  1121. static void blt_ring_cleanup(struct intel_ring_buffer *ring)
  1122. {
  1123. if (!ring->private)
  1124. return;
  1125. i915_gem_object_unpin(ring->private);
  1126. drm_gem_object_unreference(ring->private);
  1127. ring->private = NULL;
  1128. }
  1129. static const struct intel_ring_buffer gen6_blt_ring = {
  1130. .name = "blt ring",
  1131. .id = RING_BLT,
  1132. .mmio_base = BLT_RING_BASE,
  1133. .size = 32 * PAGE_SIZE,
  1134. .init = blt_ring_init,
  1135. .write_tail = ring_write_tail,
  1136. .flush = blt_ring_flush,
  1137. .add_request = gen6_add_request,
  1138. .get_seqno = ring_get_seqno,
  1139. .irq_get = blt_ring_get_irq,
  1140. .irq_put = blt_ring_put_irq,
  1141. .dispatch_execbuffer = gen6_ring_dispatch_execbuffer,
  1142. .cleanup = blt_ring_cleanup,
  1143. .sync_to = gen6_blt_ring_sync_to,
  1144. .semaphore_register = {MI_SEMAPHORE_SYNC_BR,
  1145. MI_SEMAPHORE_SYNC_BV,
  1146. MI_SEMAPHORE_SYNC_INVALID},
  1147. .signal_mbox = {GEN6_RBSYNC, GEN6_VBSYNC},
  1148. };
  1149. int intel_init_render_ring_buffer(struct drm_device *dev)
  1150. {
  1151. drm_i915_private_t *dev_priv = dev->dev_private;
  1152. struct intel_ring_buffer *ring = &dev_priv->ring[RCS];
  1153. *ring = render_ring;
  1154. if (INTEL_INFO(dev)->gen >= 6) {
  1155. ring->add_request = gen6_add_request;
  1156. ring->irq_get = gen6_render_ring_get_irq;
  1157. ring->irq_put = gen6_render_ring_put_irq;
  1158. } else if (IS_GEN5(dev)) {
  1159. ring->add_request = pc_render_add_request;
  1160. ring->get_seqno = pc_render_get_seqno;
  1161. }
  1162. if (!I915_NEED_GFX_HWS(dev)) {
  1163. ring->status_page.page_addr = dev_priv->status_page_dmah->vaddr;
  1164. memset(ring->status_page.page_addr, 0, PAGE_SIZE);
  1165. }
  1166. return intel_init_ring_buffer(dev, ring);
  1167. }
  1168. int intel_render_ring_init_dri(struct drm_device *dev, u64 start, u32 size)
  1169. {
  1170. drm_i915_private_t *dev_priv = dev->dev_private;
  1171. struct intel_ring_buffer *ring = &dev_priv->ring[RCS];
  1172. *ring = render_ring;
  1173. if (INTEL_INFO(dev)->gen >= 6) {
  1174. ring->add_request = gen6_add_request;
  1175. ring->irq_get = gen6_render_ring_get_irq;
  1176. ring->irq_put = gen6_render_ring_put_irq;
  1177. } else if (IS_GEN5(dev)) {
  1178. ring->add_request = pc_render_add_request;
  1179. ring->get_seqno = pc_render_get_seqno;
  1180. }
  1181. if (!I915_NEED_GFX_HWS(dev))
  1182. ring->status_page.page_addr = dev_priv->status_page_dmah->vaddr;
  1183. ring->dev = dev;
  1184. INIT_LIST_HEAD(&ring->active_list);
  1185. INIT_LIST_HEAD(&ring->request_list);
  1186. INIT_LIST_HEAD(&ring->gpu_write_list);
  1187. ring->size = size;
  1188. ring->effective_size = ring->size;
  1189. if (IS_I830(ring->dev))
  1190. ring->effective_size -= 128;
  1191. ring->map.offset = start;
  1192. ring->map.size = size;
  1193. ring->map.type = 0;
  1194. ring->map.flags = 0;
  1195. ring->map.mtrr = 0;
  1196. drm_core_ioremap_wc(&ring->map, dev);
  1197. if (ring->map.handle == NULL) {
  1198. DRM_ERROR("can not ioremap virtual address for"
  1199. " ring buffer\n");
  1200. return -ENOMEM;
  1201. }
  1202. ring->virtual_start = (void __force __iomem *)ring->map.handle;
  1203. return 0;
  1204. }
  1205. int intel_init_bsd_ring_buffer(struct drm_device *dev)
  1206. {
  1207. drm_i915_private_t *dev_priv = dev->dev_private;
  1208. struct intel_ring_buffer *ring = &dev_priv->ring[VCS];
  1209. if (IS_GEN6(dev) || IS_GEN7(dev))
  1210. *ring = gen6_bsd_ring;
  1211. else
  1212. *ring = bsd_ring;
  1213. return intel_init_ring_buffer(dev, ring);
  1214. }
  1215. int intel_init_blt_ring_buffer(struct drm_device *dev)
  1216. {
  1217. drm_i915_private_t *dev_priv = dev->dev_private;
  1218. struct intel_ring_buffer *ring = &dev_priv->ring[BCS];
  1219. *ring = gen6_blt_ring;
  1220. return intel_init_ring_buffer(dev, ring);
  1221. }