intel_ringbuffer.c 34 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270370470570670770870971071171271371471571671771871972072172272372472572672772872973073173273373473573673773873974074174274374474574674774874975075175275375475575675775875976076176276376476576676776876977077177277377477577677777877978078178278378478578678778878979079179279379479579679779879980080180280380480580680780880981081181281381481581681781881982082182282382482582682782882983083183283383483583683783883984084184284384484584684784884985085185285385485585685785885986086186286386486586686786886987087187287387487587687787887988088188288388488588688788888989089189289389489589689789889990090190290390490590690790890991091191291391491591691791891992092192292392492592692792892993093193293393493593693793893994094194294394494594694794894995095195295395495595695795895996096196296396496596696796896997097197297397497597697797897998098198298398498598698798898999099199299399499599699799899910001001100210031004100510061007100810091010101110121013101410151016101710181019102010211022102310241025102610271028102910301031103210331034103510361037103810391040104110421043104410451046104710481049105010511052105310541055105610571058105910601061106210631064106510661067106810691070107110721073107410751076107710781079108010811082108310841085108610871088108910901091109210931094109510961097109810991100110111021103110411051106110711081109111011111112111311141115111611171118111911201121112211231124112511261127112811291130113111321133113411351136113711381139114011411142114311441145114611471148114911501151115211531154115511561157115811591160116111621163116411651166116711681169117011711172117311741175117611771178117911801181118211831184118511861187118811891190119111921193119411951196119711981199120012011202120312041205120612071208120912101211121212131214121512161217121812191220122112221223122412251226122712281229123012311232123312341235123612371238123912401241124212431244124512461247124812491250125112521253125412551256125712581259126012611262126312641265126612671268126912701271127212731274127512761277127812791280128112821283128412851286128712881289129012911292129312941295129612971298129913001301130213031304130513061307130813091310131113121313131413151316131713181319132013211322132313241325132613271328132913301331133213331334133513361337133813391340134113421343134413451346134713481349135013511352135313541355135613571358135913601361136213631364136513661367136813691370137113721373137413751376137713781379138013811382138313841385138613871388138913901391139213931394139513961397139813991400140114021403140414051406140714081409141014111412141314141415141614171418141914201421142214231424142514261427142814291430143114321433143414351436143714381439144014411442
  1. /*
  2. * Copyright © 2008-2010 Intel Corporation
  3. *
  4. * Permission is hereby granted, free of charge, to any person obtaining a
  5. * copy of this software and associated documentation files (the "Software"),
  6. * to deal in the Software without restriction, including without limitation
  7. * the rights to use, copy, modify, merge, publish, distribute, sublicense,
  8. * and/or sell copies of the Software, and to permit persons to whom the
  9. * Software is furnished to do so, subject to the following conditions:
  10. *
  11. * The above copyright notice and this permission notice (including the next
  12. * paragraph) shall be included in all copies or substantial portions of the
  13. * Software.
  14. *
  15. * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
  16. * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
  17. * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
  18. * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
  19. * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
  20. * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
  21. * IN THE SOFTWARE.
  22. *
  23. * Authors:
  24. * Eric Anholt <eric@anholt.net>
  25. * Zou Nan hai <nanhai.zou@intel.com>
  26. * Xiang Hai hao<haihao.xiang@intel.com>
  27. *
  28. */
  29. #include "drmP.h"
  30. #include "drm.h"
  31. #include "i915_drv.h"
  32. #include "i915_drm.h"
  33. #include "i915_trace.h"
  34. #include "intel_drv.h"
  35. static inline int ring_space(struct intel_ring_buffer *ring)
  36. {
  37. int space = (ring->head & HEAD_ADDR) - (ring->tail + 8);
  38. if (space < 0)
  39. space += ring->size;
  40. return space;
  41. }
  42. static u32 i915_gem_get_seqno(struct drm_device *dev)
  43. {
  44. drm_i915_private_t *dev_priv = dev->dev_private;
  45. u32 seqno;
  46. seqno = dev_priv->next_seqno;
  47. /* reserve 0 for non-seqno */
  48. if (++dev_priv->next_seqno == 0)
  49. dev_priv->next_seqno = 1;
  50. return seqno;
  51. }
  52. static int
  53. render_ring_flush(struct intel_ring_buffer *ring,
  54. u32 invalidate_domains,
  55. u32 flush_domains)
  56. {
  57. struct drm_device *dev = ring->dev;
  58. u32 cmd;
  59. int ret;
  60. /*
  61. * read/write caches:
  62. *
  63. * I915_GEM_DOMAIN_RENDER is always invalidated, but is
  64. * only flushed if MI_NO_WRITE_FLUSH is unset. On 965, it is
  65. * also flushed at 2d versus 3d pipeline switches.
  66. *
  67. * read-only caches:
  68. *
  69. * I915_GEM_DOMAIN_SAMPLER is flushed on pre-965 if
  70. * MI_READ_FLUSH is set, and is always flushed on 965.
  71. *
  72. * I915_GEM_DOMAIN_COMMAND may not exist?
  73. *
  74. * I915_GEM_DOMAIN_INSTRUCTION, which exists on 965, is
  75. * invalidated when MI_EXE_FLUSH is set.
  76. *
  77. * I915_GEM_DOMAIN_VERTEX, which exists on 965, is
  78. * invalidated with every MI_FLUSH.
  79. *
  80. * TLBs:
  81. *
  82. * On 965, TLBs associated with I915_GEM_DOMAIN_COMMAND
  83. * and I915_GEM_DOMAIN_CPU in are invalidated at PTE write and
  84. * I915_GEM_DOMAIN_RENDER and I915_GEM_DOMAIN_SAMPLER
  85. * are flushed at any MI_FLUSH.
  86. */
  87. cmd = MI_FLUSH | MI_NO_WRITE_FLUSH;
  88. if ((invalidate_domains|flush_domains) &
  89. I915_GEM_DOMAIN_RENDER)
  90. cmd &= ~MI_NO_WRITE_FLUSH;
  91. if (INTEL_INFO(dev)->gen < 4) {
  92. /*
  93. * On the 965, the sampler cache always gets flushed
  94. * and this bit is reserved.
  95. */
  96. if (invalidate_domains & I915_GEM_DOMAIN_SAMPLER)
  97. cmd |= MI_READ_FLUSH;
  98. }
  99. if (invalidate_domains & I915_GEM_DOMAIN_INSTRUCTION)
  100. cmd |= MI_EXE_FLUSH;
  101. if (invalidate_domains & I915_GEM_DOMAIN_COMMAND &&
  102. (IS_G4X(dev) || IS_GEN5(dev)))
  103. cmd |= MI_INVALIDATE_ISP;
  104. ret = intel_ring_begin(ring, 2);
  105. if (ret)
  106. return ret;
  107. intel_ring_emit(ring, cmd);
  108. intel_ring_emit(ring, MI_NOOP);
  109. intel_ring_advance(ring);
  110. return 0;
  111. }
  112. static void ring_write_tail(struct intel_ring_buffer *ring,
  113. u32 value)
  114. {
  115. drm_i915_private_t *dev_priv = ring->dev->dev_private;
  116. I915_WRITE_TAIL(ring, value);
  117. }
  118. u32 intel_ring_get_active_head(struct intel_ring_buffer *ring)
  119. {
  120. drm_i915_private_t *dev_priv = ring->dev->dev_private;
  121. u32 acthd_reg = INTEL_INFO(ring->dev)->gen >= 4 ?
  122. RING_ACTHD(ring->mmio_base) : ACTHD;
  123. return I915_READ(acthd_reg);
  124. }
  125. static int init_ring_common(struct intel_ring_buffer *ring)
  126. {
  127. drm_i915_private_t *dev_priv = ring->dev->dev_private;
  128. struct drm_i915_gem_object *obj = ring->obj;
  129. u32 head;
  130. /* Stop the ring if it's running. */
  131. I915_WRITE_CTL(ring, 0);
  132. I915_WRITE_HEAD(ring, 0);
  133. ring->write_tail(ring, 0);
  134. /* Initialize the ring. */
  135. I915_WRITE_START(ring, obj->gtt_offset);
  136. head = I915_READ_HEAD(ring) & HEAD_ADDR;
  137. /* G45 ring initialization fails to reset head to zero */
  138. if (head != 0) {
  139. DRM_DEBUG_KMS("%s head not reset to zero "
  140. "ctl %08x head %08x tail %08x start %08x\n",
  141. ring->name,
  142. I915_READ_CTL(ring),
  143. I915_READ_HEAD(ring),
  144. I915_READ_TAIL(ring),
  145. I915_READ_START(ring));
  146. I915_WRITE_HEAD(ring, 0);
  147. if (I915_READ_HEAD(ring) & HEAD_ADDR) {
  148. DRM_ERROR("failed to set %s head to zero "
  149. "ctl %08x head %08x tail %08x start %08x\n",
  150. ring->name,
  151. I915_READ_CTL(ring),
  152. I915_READ_HEAD(ring),
  153. I915_READ_TAIL(ring),
  154. I915_READ_START(ring));
  155. }
  156. }
  157. I915_WRITE_CTL(ring,
  158. ((ring->size - PAGE_SIZE) & RING_NR_PAGES)
  159. | RING_REPORT_64K | RING_VALID);
  160. /* If the head is still not zero, the ring is dead */
  161. if ((I915_READ_CTL(ring) & RING_VALID) == 0 ||
  162. I915_READ_START(ring) != obj->gtt_offset ||
  163. (I915_READ_HEAD(ring) & HEAD_ADDR) != 0) {
  164. DRM_ERROR("%s initialization failed "
  165. "ctl %08x head %08x tail %08x start %08x\n",
  166. ring->name,
  167. I915_READ_CTL(ring),
  168. I915_READ_HEAD(ring),
  169. I915_READ_TAIL(ring),
  170. I915_READ_START(ring));
  171. return -EIO;
  172. }
  173. if (!drm_core_check_feature(ring->dev, DRIVER_MODESET))
  174. i915_kernel_lost_context(ring->dev);
  175. else {
  176. ring->head = I915_READ_HEAD(ring);
  177. ring->tail = I915_READ_TAIL(ring) & TAIL_ADDR;
  178. ring->space = ring_space(ring);
  179. }
  180. return 0;
  181. }
  182. /*
  183. * 965+ support PIPE_CONTROL commands, which provide finer grained control
  184. * over cache flushing.
  185. */
  186. struct pipe_control {
  187. struct drm_i915_gem_object *obj;
  188. volatile u32 *cpu_page;
  189. u32 gtt_offset;
  190. };
  191. static int
  192. init_pipe_control(struct intel_ring_buffer *ring)
  193. {
  194. struct pipe_control *pc;
  195. struct drm_i915_gem_object *obj;
  196. int ret;
  197. if (ring->private)
  198. return 0;
  199. pc = kmalloc(sizeof(*pc), GFP_KERNEL);
  200. if (!pc)
  201. return -ENOMEM;
  202. obj = i915_gem_alloc_object(ring->dev, 4096);
  203. if (obj == NULL) {
  204. DRM_ERROR("Failed to allocate seqno page\n");
  205. ret = -ENOMEM;
  206. goto err;
  207. }
  208. i915_gem_object_set_cache_level(obj, I915_CACHE_LLC);
  209. ret = i915_gem_object_pin(obj, 4096, true);
  210. if (ret)
  211. goto err_unref;
  212. pc->gtt_offset = obj->gtt_offset;
  213. pc->cpu_page = kmap(obj->pages[0]);
  214. if (pc->cpu_page == NULL)
  215. goto err_unpin;
  216. pc->obj = obj;
  217. ring->private = pc;
  218. return 0;
  219. err_unpin:
  220. i915_gem_object_unpin(obj);
  221. err_unref:
  222. drm_gem_object_unreference(&obj->base);
  223. err:
  224. kfree(pc);
  225. return ret;
  226. }
  227. static void
  228. cleanup_pipe_control(struct intel_ring_buffer *ring)
  229. {
  230. struct pipe_control *pc = ring->private;
  231. struct drm_i915_gem_object *obj;
  232. if (!ring->private)
  233. return;
  234. obj = pc->obj;
  235. kunmap(obj->pages[0]);
  236. i915_gem_object_unpin(obj);
  237. drm_gem_object_unreference(&obj->base);
  238. kfree(pc);
  239. ring->private = NULL;
  240. }
  241. static int init_render_ring(struct intel_ring_buffer *ring)
  242. {
  243. struct drm_device *dev = ring->dev;
  244. struct drm_i915_private *dev_priv = dev->dev_private;
  245. int ret = init_ring_common(ring);
  246. if (INTEL_INFO(dev)->gen > 3) {
  247. int mode = VS_TIMER_DISPATCH << 16 | VS_TIMER_DISPATCH;
  248. if (IS_GEN6(dev) || IS_GEN7(dev))
  249. mode |= MI_FLUSH_ENABLE << 16 | MI_FLUSH_ENABLE;
  250. I915_WRITE(MI_MODE, mode);
  251. if (IS_GEN7(dev))
  252. I915_WRITE(GFX_MODE_GEN7,
  253. GFX_MODE_DISABLE(GFX_TLB_INVALIDATE_ALWAYS) |
  254. GFX_MODE_ENABLE(GFX_REPLAY_MODE));
  255. }
  256. if (INTEL_INFO(dev)->gen >= 6) {
  257. } else if (IS_GEN5(dev)) {
  258. ret = init_pipe_control(ring);
  259. if (ret)
  260. return ret;
  261. }
  262. return ret;
  263. }
  264. static void render_ring_cleanup(struct intel_ring_buffer *ring)
  265. {
  266. if (!ring->private)
  267. return;
  268. cleanup_pipe_control(ring);
  269. }
  270. static void
  271. update_mboxes(struct intel_ring_buffer *ring,
  272. u32 seqno,
  273. u32 mmio_offset)
  274. {
  275. intel_ring_emit(ring, MI_SEMAPHORE_MBOX |
  276. MI_SEMAPHORE_GLOBAL_GTT |
  277. MI_SEMAPHORE_REGISTER |
  278. MI_SEMAPHORE_UPDATE);
  279. intel_ring_emit(ring, seqno);
  280. intel_ring_emit(ring, mmio_offset);
  281. }
  282. /**
  283. * gen6_add_request - Update the semaphore mailbox registers
  284. *
  285. * @ring - ring that is adding a request
  286. * @seqno - return seqno stuck into the ring
  287. *
  288. * Update the mailbox registers in the *other* rings with the current seqno.
  289. * This acts like a signal in the canonical semaphore.
  290. */
  291. static int
  292. gen6_add_request(struct intel_ring_buffer *ring,
  293. u32 *seqno)
  294. {
  295. u32 mbox1_reg;
  296. u32 mbox2_reg;
  297. int ret;
  298. ret = intel_ring_begin(ring, 10);
  299. if (ret)
  300. return ret;
  301. mbox1_reg = ring->signal_mbox[0];
  302. mbox2_reg = ring->signal_mbox[1];
  303. *seqno = i915_gem_get_seqno(ring->dev);
  304. update_mboxes(ring, *seqno, mbox1_reg);
  305. update_mboxes(ring, *seqno, mbox2_reg);
  306. intel_ring_emit(ring, MI_STORE_DWORD_INDEX);
  307. intel_ring_emit(ring, I915_GEM_HWS_INDEX << MI_STORE_DWORD_INDEX_SHIFT);
  308. intel_ring_emit(ring, *seqno);
  309. intel_ring_emit(ring, MI_USER_INTERRUPT);
  310. intel_ring_advance(ring);
  311. return 0;
  312. }
  313. /**
  314. * intel_ring_sync - sync the waiter to the signaller on seqno
  315. *
  316. * @waiter - ring that is waiting
  317. * @signaller - ring which has, or will signal
  318. * @seqno - seqno which the waiter will block on
  319. */
  320. static int
  321. intel_ring_sync(struct intel_ring_buffer *waiter,
  322. struct intel_ring_buffer *signaller,
  323. int ring,
  324. u32 seqno)
  325. {
  326. int ret;
  327. u32 dw1 = MI_SEMAPHORE_MBOX |
  328. MI_SEMAPHORE_COMPARE |
  329. MI_SEMAPHORE_REGISTER;
  330. ret = intel_ring_begin(waiter, 4);
  331. if (ret)
  332. return ret;
  333. intel_ring_emit(waiter, dw1 | signaller->semaphore_register[ring]);
  334. intel_ring_emit(waiter, seqno);
  335. intel_ring_emit(waiter, 0);
  336. intel_ring_emit(waiter, MI_NOOP);
  337. intel_ring_advance(waiter);
  338. return 0;
  339. }
  340. /* VCS->RCS (RVSYNC) or BCS->RCS (RBSYNC) */
  341. int
  342. render_ring_sync_to(struct intel_ring_buffer *waiter,
  343. struct intel_ring_buffer *signaller,
  344. u32 seqno)
  345. {
  346. WARN_ON(signaller->semaphore_register[RCS] == MI_SEMAPHORE_SYNC_INVALID);
  347. return intel_ring_sync(waiter,
  348. signaller,
  349. RCS,
  350. seqno);
  351. }
  352. /* RCS->VCS (VRSYNC) or BCS->VCS (VBSYNC) */
  353. int
  354. gen6_bsd_ring_sync_to(struct intel_ring_buffer *waiter,
  355. struct intel_ring_buffer *signaller,
  356. u32 seqno)
  357. {
  358. WARN_ON(signaller->semaphore_register[VCS] == MI_SEMAPHORE_SYNC_INVALID);
  359. return intel_ring_sync(waiter,
  360. signaller,
  361. VCS,
  362. seqno);
  363. }
  364. /* RCS->BCS (BRSYNC) or VCS->BCS (BVSYNC) */
  365. int
  366. gen6_blt_ring_sync_to(struct intel_ring_buffer *waiter,
  367. struct intel_ring_buffer *signaller,
  368. u32 seqno)
  369. {
  370. WARN_ON(signaller->semaphore_register[BCS] == MI_SEMAPHORE_SYNC_INVALID);
  371. return intel_ring_sync(waiter,
  372. signaller,
  373. BCS,
  374. seqno);
  375. }
  376. #define PIPE_CONTROL_FLUSH(ring__, addr__) \
  377. do { \
  378. intel_ring_emit(ring__, GFX_OP_PIPE_CONTROL | PIPE_CONTROL_QW_WRITE | \
  379. PIPE_CONTROL_DEPTH_STALL | 2); \
  380. intel_ring_emit(ring__, (addr__) | PIPE_CONTROL_GLOBAL_GTT); \
  381. intel_ring_emit(ring__, 0); \
  382. intel_ring_emit(ring__, 0); \
  383. } while (0)
  384. static int
  385. pc_render_add_request(struct intel_ring_buffer *ring,
  386. u32 *result)
  387. {
  388. struct drm_device *dev = ring->dev;
  389. u32 seqno = i915_gem_get_seqno(dev);
  390. struct pipe_control *pc = ring->private;
  391. u32 scratch_addr = pc->gtt_offset + 128;
  392. int ret;
  393. /* For Ironlake, MI_USER_INTERRUPT was deprecated and apparently
  394. * incoherent with writes to memory, i.e. completely fubar,
  395. * so we need to use PIPE_NOTIFY instead.
  396. *
  397. * However, we also need to workaround the qword write
  398. * incoherence by flushing the 6 PIPE_NOTIFY buffers out to
  399. * memory before requesting an interrupt.
  400. */
  401. ret = intel_ring_begin(ring, 32);
  402. if (ret)
  403. return ret;
  404. intel_ring_emit(ring, GFX_OP_PIPE_CONTROL | PIPE_CONTROL_QW_WRITE |
  405. PIPE_CONTROL_WC_FLUSH | PIPE_CONTROL_TC_FLUSH);
  406. intel_ring_emit(ring, pc->gtt_offset | PIPE_CONTROL_GLOBAL_GTT);
  407. intel_ring_emit(ring, seqno);
  408. intel_ring_emit(ring, 0);
  409. PIPE_CONTROL_FLUSH(ring, scratch_addr);
  410. scratch_addr += 128; /* write to separate cachelines */
  411. PIPE_CONTROL_FLUSH(ring, scratch_addr);
  412. scratch_addr += 128;
  413. PIPE_CONTROL_FLUSH(ring, scratch_addr);
  414. scratch_addr += 128;
  415. PIPE_CONTROL_FLUSH(ring, scratch_addr);
  416. scratch_addr += 128;
  417. PIPE_CONTROL_FLUSH(ring, scratch_addr);
  418. scratch_addr += 128;
  419. PIPE_CONTROL_FLUSH(ring, scratch_addr);
  420. intel_ring_emit(ring, GFX_OP_PIPE_CONTROL | PIPE_CONTROL_QW_WRITE |
  421. PIPE_CONTROL_WC_FLUSH | PIPE_CONTROL_TC_FLUSH |
  422. PIPE_CONTROL_NOTIFY);
  423. intel_ring_emit(ring, pc->gtt_offset | PIPE_CONTROL_GLOBAL_GTT);
  424. intel_ring_emit(ring, seqno);
  425. intel_ring_emit(ring, 0);
  426. intel_ring_advance(ring);
  427. *result = seqno;
  428. return 0;
  429. }
  430. static int
  431. render_ring_add_request(struct intel_ring_buffer *ring,
  432. u32 *result)
  433. {
  434. struct drm_device *dev = ring->dev;
  435. u32 seqno = i915_gem_get_seqno(dev);
  436. int ret;
  437. ret = intel_ring_begin(ring, 4);
  438. if (ret)
  439. return ret;
  440. intel_ring_emit(ring, MI_STORE_DWORD_INDEX);
  441. intel_ring_emit(ring, I915_GEM_HWS_INDEX << MI_STORE_DWORD_INDEX_SHIFT);
  442. intel_ring_emit(ring, seqno);
  443. intel_ring_emit(ring, MI_USER_INTERRUPT);
  444. intel_ring_advance(ring);
  445. *result = seqno;
  446. return 0;
  447. }
  448. static u32
  449. ring_get_seqno(struct intel_ring_buffer *ring)
  450. {
  451. return intel_read_status_page(ring, I915_GEM_HWS_INDEX);
  452. }
  453. static u32
  454. pc_render_get_seqno(struct intel_ring_buffer *ring)
  455. {
  456. struct pipe_control *pc = ring->private;
  457. return pc->cpu_page[0];
  458. }
  459. static void
  460. ironlake_enable_irq(drm_i915_private_t *dev_priv, u32 mask)
  461. {
  462. dev_priv->gt_irq_mask &= ~mask;
  463. I915_WRITE(GTIMR, dev_priv->gt_irq_mask);
  464. POSTING_READ(GTIMR);
  465. }
  466. static void
  467. ironlake_disable_irq(drm_i915_private_t *dev_priv, u32 mask)
  468. {
  469. dev_priv->gt_irq_mask |= mask;
  470. I915_WRITE(GTIMR, dev_priv->gt_irq_mask);
  471. POSTING_READ(GTIMR);
  472. }
  473. static void
  474. i915_enable_irq(drm_i915_private_t *dev_priv, u32 mask)
  475. {
  476. dev_priv->irq_mask &= ~mask;
  477. I915_WRITE(IMR, dev_priv->irq_mask);
  478. POSTING_READ(IMR);
  479. }
  480. static void
  481. i915_disable_irq(drm_i915_private_t *dev_priv, u32 mask)
  482. {
  483. dev_priv->irq_mask |= mask;
  484. I915_WRITE(IMR, dev_priv->irq_mask);
  485. POSTING_READ(IMR);
  486. }
  487. static bool
  488. render_ring_get_irq(struct intel_ring_buffer *ring)
  489. {
  490. struct drm_device *dev = ring->dev;
  491. drm_i915_private_t *dev_priv = dev->dev_private;
  492. if (!dev->irq_enabled)
  493. return false;
  494. spin_lock(&ring->irq_lock);
  495. if (ring->irq_refcount++ == 0) {
  496. if (HAS_PCH_SPLIT(dev))
  497. ironlake_enable_irq(dev_priv,
  498. GT_PIPE_NOTIFY | GT_USER_INTERRUPT);
  499. else
  500. i915_enable_irq(dev_priv, I915_USER_INTERRUPT);
  501. }
  502. spin_unlock(&ring->irq_lock);
  503. return true;
  504. }
  505. static void
  506. render_ring_put_irq(struct intel_ring_buffer *ring)
  507. {
  508. struct drm_device *dev = ring->dev;
  509. drm_i915_private_t *dev_priv = dev->dev_private;
  510. spin_lock(&ring->irq_lock);
  511. if (--ring->irq_refcount == 0) {
  512. if (HAS_PCH_SPLIT(dev))
  513. ironlake_disable_irq(dev_priv,
  514. GT_USER_INTERRUPT |
  515. GT_PIPE_NOTIFY);
  516. else
  517. i915_disable_irq(dev_priv, I915_USER_INTERRUPT);
  518. }
  519. spin_unlock(&ring->irq_lock);
  520. }
  521. void intel_ring_setup_status_page(struct intel_ring_buffer *ring)
  522. {
  523. struct drm_device *dev = ring->dev;
  524. drm_i915_private_t *dev_priv = ring->dev->dev_private;
  525. u32 mmio = 0;
  526. /* The ring status page addresses are no longer next to the rest of
  527. * the ring registers as of gen7.
  528. */
  529. if (IS_GEN7(dev)) {
  530. switch (ring->id) {
  531. case RING_RENDER:
  532. mmio = RENDER_HWS_PGA_GEN7;
  533. break;
  534. case RING_BLT:
  535. mmio = BLT_HWS_PGA_GEN7;
  536. break;
  537. case RING_BSD:
  538. mmio = BSD_HWS_PGA_GEN7;
  539. break;
  540. }
  541. } else if (IS_GEN6(ring->dev)) {
  542. mmio = RING_HWS_PGA_GEN6(ring->mmio_base);
  543. } else {
  544. mmio = RING_HWS_PGA(ring->mmio_base);
  545. }
  546. I915_WRITE(mmio, (u32)ring->status_page.gfx_addr);
  547. POSTING_READ(mmio);
  548. }
  549. static int
  550. bsd_ring_flush(struct intel_ring_buffer *ring,
  551. u32 invalidate_domains,
  552. u32 flush_domains)
  553. {
  554. int ret;
  555. ret = intel_ring_begin(ring, 2);
  556. if (ret)
  557. return ret;
  558. intel_ring_emit(ring, MI_FLUSH);
  559. intel_ring_emit(ring, MI_NOOP);
  560. intel_ring_advance(ring);
  561. return 0;
  562. }
  563. static int
  564. ring_add_request(struct intel_ring_buffer *ring,
  565. u32 *result)
  566. {
  567. u32 seqno;
  568. int ret;
  569. ret = intel_ring_begin(ring, 4);
  570. if (ret)
  571. return ret;
  572. seqno = i915_gem_get_seqno(ring->dev);
  573. intel_ring_emit(ring, MI_STORE_DWORD_INDEX);
  574. intel_ring_emit(ring, I915_GEM_HWS_INDEX << MI_STORE_DWORD_INDEX_SHIFT);
  575. intel_ring_emit(ring, seqno);
  576. intel_ring_emit(ring, MI_USER_INTERRUPT);
  577. intel_ring_advance(ring);
  578. *result = seqno;
  579. return 0;
  580. }
  581. static bool
  582. gen6_ring_get_irq(struct intel_ring_buffer *ring, u32 gflag, u32 rflag)
  583. {
  584. struct drm_device *dev = ring->dev;
  585. drm_i915_private_t *dev_priv = dev->dev_private;
  586. if (!dev->irq_enabled)
  587. return false;
  588. spin_lock(&ring->irq_lock);
  589. if (ring->irq_refcount++ == 0) {
  590. ring->irq_mask &= ~rflag;
  591. I915_WRITE_IMR(ring, ring->irq_mask);
  592. ironlake_enable_irq(dev_priv, gflag);
  593. }
  594. spin_unlock(&ring->irq_lock);
  595. return true;
  596. }
  597. static void
  598. gen6_ring_put_irq(struct intel_ring_buffer *ring, u32 gflag, u32 rflag)
  599. {
  600. struct drm_device *dev = ring->dev;
  601. drm_i915_private_t *dev_priv = dev->dev_private;
  602. spin_lock(&ring->irq_lock);
  603. if (--ring->irq_refcount == 0) {
  604. ring->irq_mask |= rflag;
  605. I915_WRITE_IMR(ring, ring->irq_mask);
  606. ironlake_disable_irq(dev_priv, gflag);
  607. }
  608. spin_unlock(&ring->irq_lock);
  609. }
  610. static bool
  611. bsd_ring_get_irq(struct intel_ring_buffer *ring)
  612. {
  613. struct drm_device *dev = ring->dev;
  614. drm_i915_private_t *dev_priv = dev->dev_private;
  615. if (!dev->irq_enabled)
  616. return false;
  617. spin_lock(&ring->irq_lock);
  618. if (ring->irq_refcount++ == 0) {
  619. if (IS_G4X(dev))
  620. i915_enable_irq(dev_priv, I915_BSD_USER_INTERRUPT);
  621. else
  622. ironlake_enable_irq(dev_priv, GT_BSD_USER_INTERRUPT);
  623. }
  624. spin_unlock(&ring->irq_lock);
  625. return true;
  626. }
  627. static void
  628. bsd_ring_put_irq(struct intel_ring_buffer *ring)
  629. {
  630. struct drm_device *dev = ring->dev;
  631. drm_i915_private_t *dev_priv = dev->dev_private;
  632. spin_lock(&ring->irq_lock);
  633. if (--ring->irq_refcount == 0) {
  634. if (IS_G4X(dev))
  635. i915_disable_irq(dev_priv, I915_BSD_USER_INTERRUPT);
  636. else
  637. ironlake_disable_irq(dev_priv, GT_BSD_USER_INTERRUPT);
  638. }
  639. spin_unlock(&ring->irq_lock);
  640. }
  641. static int
  642. ring_dispatch_execbuffer(struct intel_ring_buffer *ring, u32 offset, u32 length)
  643. {
  644. int ret;
  645. ret = intel_ring_begin(ring, 2);
  646. if (ret)
  647. return ret;
  648. intel_ring_emit(ring,
  649. MI_BATCH_BUFFER_START | (2 << 6) |
  650. MI_BATCH_NON_SECURE_I965);
  651. intel_ring_emit(ring, offset);
  652. intel_ring_advance(ring);
  653. return 0;
  654. }
  655. static int
  656. render_ring_dispatch_execbuffer(struct intel_ring_buffer *ring,
  657. u32 offset, u32 len)
  658. {
  659. struct drm_device *dev = ring->dev;
  660. int ret;
  661. if (IS_I830(dev) || IS_845G(dev)) {
  662. ret = intel_ring_begin(ring, 4);
  663. if (ret)
  664. return ret;
  665. intel_ring_emit(ring, MI_BATCH_BUFFER);
  666. intel_ring_emit(ring, offset | MI_BATCH_NON_SECURE);
  667. intel_ring_emit(ring, offset + len - 8);
  668. intel_ring_emit(ring, 0);
  669. } else {
  670. ret = intel_ring_begin(ring, 2);
  671. if (ret)
  672. return ret;
  673. if (INTEL_INFO(dev)->gen >= 4) {
  674. intel_ring_emit(ring,
  675. MI_BATCH_BUFFER_START | (2 << 6) |
  676. MI_BATCH_NON_SECURE_I965);
  677. intel_ring_emit(ring, offset);
  678. } else {
  679. intel_ring_emit(ring,
  680. MI_BATCH_BUFFER_START | (2 << 6));
  681. intel_ring_emit(ring, offset | MI_BATCH_NON_SECURE);
  682. }
  683. }
  684. intel_ring_advance(ring);
  685. return 0;
  686. }
  687. static void cleanup_status_page(struct intel_ring_buffer *ring)
  688. {
  689. drm_i915_private_t *dev_priv = ring->dev->dev_private;
  690. struct drm_i915_gem_object *obj;
  691. obj = ring->status_page.obj;
  692. if (obj == NULL)
  693. return;
  694. kunmap(obj->pages[0]);
  695. i915_gem_object_unpin(obj);
  696. drm_gem_object_unreference(&obj->base);
  697. ring->status_page.obj = NULL;
  698. memset(&dev_priv->hws_map, 0, sizeof(dev_priv->hws_map));
  699. }
  700. static int init_status_page(struct intel_ring_buffer *ring)
  701. {
  702. struct drm_device *dev = ring->dev;
  703. drm_i915_private_t *dev_priv = dev->dev_private;
  704. struct drm_i915_gem_object *obj;
  705. int ret;
  706. obj = i915_gem_alloc_object(dev, 4096);
  707. if (obj == NULL) {
  708. DRM_ERROR("Failed to allocate status page\n");
  709. ret = -ENOMEM;
  710. goto err;
  711. }
  712. i915_gem_object_set_cache_level(obj, I915_CACHE_LLC);
  713. ret = i915_gem_object_pin(obj, 4096, true);
  714. if (ret != 0) {
  715. goto err_unref;
  716. }
  717. ring->status_page.gfx_addr = obj->gtt_offset;
  718. ring->status_page.page_addr = kmap(obj->pages[0]);
  719. if (ring->status_page.page_addr == NULL) {
  720. memset(&dev_priv->hws_map, 0, sizeof(dev_priv->hws_map));
  721. goto err_unpin;
  722. }
  723. ring->status_page.obj = obj;
  724. memset(ring->status_page.page_addr, 0, PAGE_SIZE);
  725. intel_ring_setup_status_page(ring);
  726. DRM_DEBUG_DRIVER("%s hws offset: 0x%08x\n",
  727. ring->name, ring->status_page.gfx_addr);
  728. return 0;
  729. err_unpin:
  730. i915_gem_object_unpin(obj);
  731. err_unref:
  732. drm_gem_object_unreference(&obj->base);
  733. err:
  734. return ret;
  735. }
  736. int intel_init_ring_buffer(struct drm_device *dev,
  737. struct intel_ring_buffer *ring)
  738. {
  739. struct drm_i915_gem_object *obj;
  740. int ret;
  741. ring->dev = dev;
  742. INIT_LIST_HEAD(&ring->active_list);
  743. INIT_LIST_HEAD(&ring->request_list);
  744. INIT_LIST_HEAD(&ring->gpu_write_list);
  745. init_waitqueue_head(&ring->irq_queue);
  746. spin_lock_init(&ring->irq_lock);
  747. ring->irq_mask = ~0;
  748. if (I915_NEED_GFX_HWS(dev)) {
  749. ret = init_status_page(ring);
  750. if (ret)
  751. return ret;
  752. }
  753. obj = i915_gem_alloc_object(dev, ring->size);
  754. if (obj == NULL) {
  755. DRM_ERROR("Failed to allocate ringbuffer\n");
  756. ret = -ENOMEM;
  757. goto err_hws;
  758. }
  759. ring->obj = obj;
  760. ret = i915_gem_object_pin(obj, PAGE_SIZE, true);
  761. if (ret)
  762. goto err_unref;
  763. ring->map.size = ring->size;
  764. ring->map.offset = dev->agp->base + obj->gtt_offset;
  765. ring->map.type = 0;
  766. ring->map.flags = 0;
  767. ring->map.mtrr = 0;
  768. drm_core_ioremap_wc(&ring->map, dev);
  769. if (ring->map.handle == NULL) {
  770. DRM_ERROR("Failed to map ringbuffer.\n");
  771. ret = -EINVAL;
  772. goto err_unpin;
  773. }
  774. ring->virtual_start = ring->map.handle;
  775. ret = ring->init(ring);
  776. if (ret)
  777. goto err_unmap;
  778. /* Workaround an erratum on the i830 which causes a hang if
  779. * the TAIL pointer points to within the last 2 cachelines
  780. * of the buffer.
  781. */
  782. ring->effective_size = ring->size;
  783. if (IS_I830(ring->dev))
  784. ring->effective_size -= 128;
  785. return 0;
  786. err_unmap:
  787. drm_core_ioremapfree(&ring->map, dev);
  788. err_unpin:
  789. i915_gem_object_unpin(obj);
  790. err_unref:
  791. drm_gem_object_unreference(&obj->base);
  792. ring->obj = NULL;
  793. err_hws:
  794. cleanup_status_page(ring);
  795. return ret;
  796. }
  797. void intel_cleanup_ring_buffer(struct intel_ring_buffer *ring)
  798. {
  799. struct drm_i915_private *dev_priv;
  800. int ret;
  801. if (ring->obj == NULL)
  802. return;
  803. /* Disable the ring buffer. The ring must be idle at this point */
  804. dev_priv = ring->dev->dev_private;
  805. ret = intel_wait_ring_idle(ring);
  806. if (ret)
  807. DRM_ERROR("failed to quiesce %s whilst cleaning up: %d\n",
  808. ring->name, ret);
  809. I915_WRITE_CTL(ring, 0);
  810. drm_core_ioremapfree(&ring->map, ring->dev);
  811. i915_gem_object_unpin(ring->obj);
  812. drm_gem_object_unreference(&ring->obj->base);
  813. ring->obj = NULL;
  814. if (ring->cleanup)
  815. ring->cleanup(ring);
  816. cleanup_status_page(ring);
  817. }
  818. static int intel_wrap_ring_buffer(struct intel_ring_buffer *ring)
  819. {
  820. unsigned int *virt;
  821. int rem = ring->size - ring->tail;
  822. if (ring->space < rem) {
  823. int ret = intel_wait_ring_buffer(ring, rem);
  824. if (ret)
  825. return ret;
  826. }
  827. virt = (unsigned int *)(ring->virtual_start + ring->tail);
  828. rem /= 8;
  829. while (rem--) {
  830. *virt++ = MI_NOOP;
  831. *virt++ = MI_NOOP;
  832. }
  833. ring->tail = 0;
  834. ring->space = ring_space(ring);
  835. return 0;
  836. }
  837. int intel_wait_ring_buffer(struct intel_ring_buffer *ring, int n)
  838. {
  839. struct drm_device *dev = ring->dev;
  840. struct drm_i915_private *dev_priv = dev->dev_private;
  841. unsigned long end;
  842. u32 head;
  843. /* If the reported head position has wrapped or hasn't advanced,
  844. * fallback to the slow and accurate path.
  845. */
  846. head = intel_read_status_page(ring, 4);
  847. if (head > ring->head) {
  848. ring->head = head;
  849. ring->space = ring_space(ring);
  850. if (ring->space >= n)
  851. return 0;
  852. }
  853. trace_i915_ring_wait_begin(ring);
  854. end = jiffies + 3 * HZ;
  855. do {
  856. ring->head = I915_READ_HEAD(ring);
  857. ring->space = ring_space(ring);
  858. if (ring->space >= n) {
  859. trace_i915_ring_wait_end(ring);
  860. return 0;
  861. }
  862. if (dev->primary->master) {
  863. struct drm_i915_master_private *master_priv = dev->primary->master->driver_priv;
  864. if (master_priv->sarea_priv)
  865. master_priv->sarea_priv->perf_boxes |= I915_BOX_WAIT;
  866. }
  867. msleep(1);
  868. if (atomic_read(&dev_priv->mm.wedged))
  869. return -EAGAIN;
  870. } while (!time_after(jiffies, end));
  871. trace_i915_ring_wait_end(ring);
  872. return -EBUSY;
  873. }
  874. int intel_ring_begin(struct intel_ring_buffer *ring,
  875. int num_dwords)
  876. {
  877. struct drm_i915_private *dev_priv = ring->dev->dev_private;
  878. int n = 4*num_dwords;
  879. int ret;
  880. if (unlikely(atomic_read(&dev_priv->mm.wedged)))
  881. return -EIO;
  882. if (unlikely(ring->tail + n > ring->effective_size)) {
  883. ret = intel_wrap_ring_buffer(ring);
  884. if (unlikely(ret))
  885. return ret;
  886. }
  887. if (unlikely(ring->space < n)) {
  888. ret = intel_wait_ring_buffer(ring, n);
  889. if (unlikely(ret))
  890. return ret;
  891. }
  892. ring->space -= n;
  893. return 0;
  894. }
  895. void intel_ring_advance(struct intel_ring_buffer *ring)
  896. {
  897. ring->tail &= ring->size - 1;
  898. ring->write_tail(ring, ring->tail);
  899. }
  900. static const struct intel_ring_buffer render_ring = {
  901. .name = "render ring",
  902. .id = RING_RENDER,
  903. .mmio_base = RENDER_RING_BASE,
  904. .size = 32 * PAGE_SIZE,
  905. .init = init_render_ring,
  906. .write_tail = ring_write_tail,
  907. .flush = render_ring_flush,
  908. .add_request = render_ring_add_request,
  909. .get_seqno = ring_get_seqno,
  910. .irq_get = render_ring_get_irq,
  911. .irq_put = render_ring_put_irq,
  912. .dispatch_execbuffer = render_ring_dispatch_execbuffer,
  913. .cleanup = render_ring_cleanup,
  914. .sync_to = render_ring_sync_to,
  915. .semaphore_register = {MI_SEMAPHORE_SYNC_INVALID,
  916. MI_SEMAPHORE_SYNC_RV,
  917. MI_SEMAPHORE_SYNC_RB},
  918. .signal_mbox = {GEN6_VRSYNC, GEN6_BRSYNC},
  919. };
  920. /* ring buffer for bit-stream decoder */
  921. static const struct intel_ring_buffer bsd_ring = {
  922. .name = "bsd ring",
  923. .id = RING_BSD,
  924. .mmio_base = BSD_RING_BASE,
  925. .size = 32 * PAGE_SIZE,
  926. .init = init_ring_common,
  927. .write_tail = ring_write_tail,
  928. .flush = bsd_ring_flush,
  929. .add_request = ring_add_request,
  930. .get_seqno = ring_get_seqno,
  931. .irq_get = bsd_ring_get_irq,
  932. .irq_put = bsd_ring_put_irq,
  933. .dispatch_execbuffer = ring_dispatch_execbuffer,
  934. };
  935. static void gen6_bsd_ring_write_tail(struct intel_ring_buffer *ring,
  936. u32 value)
  937. {
  938. drm_i915_private_t *dev_priv = ring->dev->dev_private;
  939. /* Every tail move must follow the sequence below */
  940. I915_WRITE(GEN6_BSD_SLEEP_PSMI_CONTROL,
  941. GEN6_BSD_SLEEP_PSMI_CONTROL_RC_ILDL_MESSAGE_MODIFY_MASK |
  942. GEN6_BSD_SLEEP_PSMI_CONTROL_RC_ILDL_MESSAGE_DISABLE);
  943. I915_WRITE(GEN6_BSD_RNCID, 0x0);
  944. if (wait_for((I915_READ(GEN6_BSD_SLEEP_PSMI_CONTROL) &
  945. GEN6_BSD_SLEEP_PSMI_CONTROL_IDLE_INDICATOR) == 0,
  946. 50))
  947. DRM_ERROR("timed out waiting for IDLE Indicator\n");
  948. I915_WRITE_TAIL(ring, value);
  949. I915_WRITE(GEN6_BSD_SLEEP_PSMI_CONTROL,
  950. GEN6_BSD_SLEEP_PSMI_CONTROL_RC_ILDL_MESSAGE_MODIFY_MASK |
  951. GEN6_BSD_SLEEP_PSMI_CONTROL_RC_ILDL_MESSAGE_ENABLE);
  952. }
  953. static int gen6_ring_flush(struct intel_ring_buffer *ring,
  954. u32 invalidate, u32 flush)
  955. {
  956. uint32_t cmd;
  957. int ret;
  958. ret = intel_ring_begin(ring, 4);
  959. if (ret)
  960. return ret;
  961. cmd = MI_FLUSH_DW;
  962. if (invalidate & I915_GEM_GPU_DOMAINS)
  963. cmd |= MI_INVALIDATE_TLB | MI_INVALIDATE_BSD;
  964. intel_ring_emit(ring, cmd);
  965. intel_ring_emit(ring, 0);
  966. intel_ring_emit(ring, 0);
  967. intel_ring_emit(ring, MI_NOOP);
  968. intel_ring_advance(ring);
  969. return 0;
  970. }
  971. static int
  972. gen6_ring_dispatch_execbuffer(struct intel_ring_buffer *ring,
  973. u32 offset, u32 len)
  974. {
  975. int ret;
  976. ret = intel_ring_begin(ring, 2);
  977. if (ret)
  978. return ret;
  979. intel_ring_emit(ring, MI_BATCH_BUFFER_START | MI_BATCH_NON_SECURE_I965);
  980. /* bit0-7 is the length on GEN6+ */
  981. intel_ring_emit(ring, offset);
  982. intel_ring_advance(ring);
  983. return 0;
  984. }
  985. static bool
  986. gen6_render_ring_get_irq(struct intel_ring_buffer *ring)
  987. {
  988. return gen6_ring_get_irq(ring,
  989. GT_USER_INTERRUPT,
  990. GEN6_RENDER_USER_INTERRUPT);
  991. }
  992. static void
  993. gen6_render_ring_put_irq(struct intel_ring_buffer *ring)
  994. {
  995. return gen6_ring_put_irq(ring,
  996. GT_USER_INTERRUPT,
  997. GEN6_RENDER_USER_INTERRUPT);
  998. }
  999. static bool
  1000. gen6_bsd_ring_get_irq(struct intel_ring_buffer *ring)
  1001. {
  1002. return gen6_ring_get_irq(ring,
  1003. GT_GEN6_BSD_USER_INTERRUPT,
  1004. GEN6_BSD_USER_INTERRUPT);
  1005. }
  1006. static void
  1007. gen6_bsd_ring_put_irq(struct intel_ring_buffer *ring)
  1008. {
  1009. return gen6_ring_put_irq(ring,
  1010. GT_GEN6_BSD_USER_INTERRUPT,
  1011. GEN6_BSD_USER_INTERRUPT);
  1012. }
  1013. /* ring buffer for Video Codec for Gen6+ */
  1014. static const struct intel_ring_buffer gen6_bsd_ring = {
  1015. .name = "gen6 bsd ring",
  1016. .id = RING_BSD,
  1017. .mmio_base = GEN6_BSD_RING_BASE,
  1018. .size = 32 * PAGE_SIZE,
  1019. .init = init_ring_common,
  1020. .write_tail = gen6_bsd_ring_write_tail,
  1021. .flush = gen6_ring_flush,
  1022. .add_request = gen6_add_request,
  1023. .get_seqno = ring_get_seqno,
  1024. .irq_get = gen6_bsd_ring_get_irq,
  1025. .irq_put = gen6_bsd_ring_put_irq,
  1026. .dispatch_execbuffer = gen6_ring_dispatch_execbuffer,
  1027. .sync_to = gen6_bsd_ring_sync_to,
  1028. .semaphore_register = {MI_SEMAPHORE_SYNC_VR,
  1029. MI_SEMAPHORE_SYNC_INVALID,
  1030. MI_SEMAPHORE_SYNC_VB},
  1031. .signal_mbox = {GEN6_RVSYNC, GEN6_BVSYNC},
  1032. };
  1033. /* Blitter support (SandyBridge+) */
  1034. static bool
  1035. blt_ring_get_irq(struct intel_ring_buffer *ring)
  1036. {
  1037. return gen6_ring_get_irq(ring,
  1038. GT_BLT_USER_INTERRUPT,
  1039. GEN6_BLITTER_USER_INTERRUPT);
  1040. }
  1041. static void
  1042. blt_ring_put_irq(struct intel_ring_buffer *ring)
  1043. {
  1044. gen6_ring_put_irq(ring,
  1045. GT_BLT_USER_INTERRUPT,
  1046. GEN6_BLITTER_USER_INTERRUPT);
  1047. }
  1048. /* Workaround for some stepping of SNB,
  1049. * each time when BLT engine ring tail moved,
  1050. * the first command in the ring to be parsed
  1051. * should be MI_BATCH_BUFFER_START
  1052. */
  1053. #define NEED_BLT_WORKAROUND(dev) \
  1054. (IS_GEN6(dev) && (dev->pdev->revision < 8))
  1055. static inline struct drm_i915_gem_object *
  1056. to_blt_workaround(struct intel_ring_buffer *ring)
  1057. {
  1058. return ring->private;
  1059. }
  1060. static int blt_ring_init(struct intel_ring_buffer *ring)
  1061. {
  1062. if (NEED_BLT_WORKAROUND(ring->dev)) {
  1063. struct drm_i915_gem_object *obj;
  1064. u32 *ptr;
  1065. int ret;
  1066. obj = i915_gem_alloc_object(ring->dev, 4096);
  1067. if (obj == NULL)
  1068. return -ENOMEM;
  1069. ret = i915_gem_object_pin(obj, 4096, true);
  1070. if (ret) {
  1071. drm_gem_object_unreference(&obj->base);
  1072. return ret;
  1073. }
  1074. ptr = kmap(obj->pages[0]);
  1075. *ptr++ = MI_BATCH_BUFFER_END;
  1076. *ptr++ = MI_NOOP;
  1077. kunmap(obj->pages[0]);
  1078. ret = i915_gem_object_set_to_gtt_domain(obj, false);
  1079. if (ret) {
  1080. i915_gem_object_unpin(obj);
  1081. drm_gem_object_unreference(&obj->base);
  1082. return ret;
  1083. }
  1084. ring->private = obj;
  1085. }
  1086. return init_ring_common(ring);
  1087. }
  1088. static int blt_ring_begin(struct intel_ring_buffer *ring,
  1089. int num_dwords)
  1090. {
  1091. if (ring->private) {
  1092. int ret = intel_ring_begin(ring, num_dwords+2);
  1093. if (ret)
  1094. return ret;
  1095. intel_ring_emit(ring, MI_BATCH_BUFFER_START);
  1096. intel_ring_emit(ring, to_blt_workaround(ring)->gtt_offset);
  1097. return 0;
  1098. } else
  1099. return intel_ring_begin(ring, 4);
  1100. }
  1101. static int blt_ring_flush(struct intel_ring_buffer *ring,
  1102. u32 invalidate, u32 flush)
  1103. {
  1104. uint32_t cmd;
  1105. int ret;
  1106. ret = blt_ring_begin(ring, 4);
  1107. if (ret)
  1108. return ret;
  1109. cmd = MI_FLUSH_DW;
  1110. if (invalidate & I915_GEM_DOMAIN_RENDER)
  1111. cmd |= MI_INVALIDATE_TLB;
  1112. intel_ring_emit(ring, cmd);
  1113. intel_ring_emit(ring, 0);
  1114. intel_ring_emit(ring, 0);
  1115. intel_ring_emit(ring, MI_NOOP);
  1116. intel_ring_advance(ring);
  1117. return 0;
  1118. }
  1119. static void blt_ring_cleanup(struct intel_ring_buffer *ring)
  1120. {
  1121. if (!ring->private)
  1122. return;
  1123. i915_gem_object_unpin(ring->private);
  1124. drm_gem_object_unreference(ring->private);
  1125. ring->private = NULL;
  1126. }
  1127. static const struct intel_ring_buffer gen6_blt_ring = {
  1128. .name = "blt ring",
  1129. .id = RING_BLT,
  1130. .mmio_base = BLT_RING_BASE,
  1131. .size = 32 * PAGE_SIZE,
  1132. .init = blt_ring_init,
  1133. .write_tail = ring_write_tail,
  1134. .flush = blt_ring_flush,
  1135. .add_request = gen6_add_request,
  1136. .get_seqno = ring_get_seqno,
  1137. .irq_get = blt_ring_get_irq,
  1138. .irq_put = blt_ring_put_irq,
  1139. .dispatch_execbuffer = gen6_ring_dispatch_execbuffer,
  1140. .cleanup = blt_ring_cleanup,
  1141. .sync_to = gen6_blt_ring_sync_to,
  1142. .semaphore_register = {MI_SEMAPHORE_SYNC_BR,
  1143. MI_SEMAPHORE_SYNC_BV,
  1144. MI_SEMAPHORE_SYNC_INVALID},
  1145. .signal_mbox = {GEN6_RBSYNC, GEN6_VBSYNC},
  1146. };
  1147. int intel_init_render_ring_buffer(struct drm_device *dev)
  1148. {
  1149. drm_i915_private_t *dev_priv = dev->dev_private;
  1150. struct intel_ring_buffer *ring = &dev_priv->ring[RCS];
  1151. *ring = render_ring;
  1152. if (INTEL_INFO(dev)->gen >= 6) {
  1153. ring->add_request = gen6_add_request;
  1154. ring->irq_get = gen6_render_ring_get_irq;
  1155. ring->irq_put = gen6_render_ring_put_irq;
  1156. } else if (IS_GEN5(dev)) {
  1157. ring->add_request = pc_render_add_request;
  1158. ring->get_seqno = pc_render_get_seqno;
  1159. }
  1160. if (!I915_NEED_GFX_HWS(dev)) {
  1161. ring->status_page.page_addr = dev_priv->status_page_dmah->vaddr;
  1162. memset(ring->status_page.page_addr, 0, PAGE_SIZE);
  1163. }
  1164. return intel_init_ring_buffer(dev, ring);
  1165. }
  1166. int intel_render_ring_init_dri(struct drm_device *dev, u64 start, u32 size)
  1167. {
  1168. drm_i915_private_t *dev_priv = dev->dev_private;
  1169. struct intel_ring_buffer *ring = &dev_priv->ring[RCS];
  1170. *ring = render_ring;
  1171. if (INTEL_INFO(dev)->gen >= 6) {
  1172. ring->add_request = gen6_add_request;
  1173. ring->irq_get = gen6_render_ring_get_irq;
  1174. ring->irq_put = gen6_render_ring_put_irq;
  1175. } else if (IS_GEN5(dev)) {
  1176. ring->add_request = pc_render_add_request;
  1177. ring->get_seqno = pc_render_get_seqno;
  1178. }
  1179. if (!I915_NEED_GFX_HWS(dev))
  1180. ring->status_page.page_addr = dev_priv->status_page_dmah->vaddr;
  1181. ring->dev = dev;
  1182. INIT_LIST_HEAD(&ring->active_list);
  1183. INIT_LIST_HEAD(&ring->request_list);
  1184. INIT_LIST_HEAD(&ring->gpu_write_list);
  1185. ring->size = size;
  1186. ring->effective_size = ring->size;
  1187. if (IS_I830(ring->dev))
  1188. ring->effective_size -= 128;
  1189. ring->map.offset = start;
  1190. ring->map.size = size;
  1191. ring->map.type = 0;
  1192. ring->map.flags = 0;
  1193. ring->map.mtrr = 0;
  1194. drm_core_ioremap_wc(&ring->map, dev);
  1195. if (ring->map.handle == NULL) {
  1196. DRM_ERROR("can not ioremap virtual address for"
  1197. " ring buffer\n");
  1198. return -ENOMEM;
  1199. }
  1200. ring->virtual_start = (void __force __iomem *)ring->map.handle;
  1201. return 0;
  1202. }
  1203. int intel_init_bsd_ring_buffer(struct drm_device *dev)
  1204. {
  1205. drm_i915_private_t *dev_priv = dev->dev_private;
  1206. struct intel_ring_buffer *ring = &dev_priv->ring[VCS];
  1207. if (IS_GEN6(dev) || IS_GEN7(dev))
  1208. *ring = gen6_bsd_ring;
  1209. else
  1210. *ring = bsd_ring;
  1211. return intel_init_ring_buffer(dev, ring);
  1212. }
  1213. int intel_init_blt_ring_buffer(struct drm_device *dev)
  1214. {
  1215. drm_i915_private_t *dev_priv = dev->dev_private;
  1216. struct intel_ring_buffer *ring = &dev_priv->ring[BCS];
  1217. *ring = gen6_blt_ring;
  1218. return intel_init_ring_buffer(dev, ring);
  1219. }