r300.c 30 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905906907908909910911912913914915916917918919920921922923924925926927928929930931932933934935936937938939940941942943944945946947948949950951952953954955956957958959960961962963964965966967968969970971972973974975976977978979980981982983984985986987988989990991992993994995996997998999100010011002100310041005100610071008100910101011101210131014101510161017101810191020102110221023102410251026102710281029103010311032103310341035103610371038103910401041104210431044104510461047104810491050105110521053105410551056105710581059106010611062106310641065106610671068106910701071107210731074107510761077107810791080108110821083108410851086108710881089109010911092109310941095109610971098109911001101110211031104110511061107110811091110111111121113111411151116
  1. /*
  2. * Copyright 2008 Advanced Micro Devices, Inc.
  3. * Copyright 2008 Red Hat Inc.
  4. * Copyright 2009 Jerome Glisse.
  5. *
  6. * Permission is hereby granted, free of charge, to any person obtaining a
  7. * copy of this software and associated documentation files (the "Software"),
  8. * to deal in the Software without restriction, including without limitation
  9. * the rights to use, copy, modify, merge, publish, distribute, sublicense,
  10. * and/or sell copies of the Software, and to permit persons to whom the
  11. * Software is furnished to do so, subject to the following conditions:
  12. *
  13. * The above copyright notice and this permission notice shall be included in
  14. * all copies or substantial portions of the Software.
  15. *
  16. * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
  17. * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
  18. * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
  19. * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
  20. * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
  21. * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
  22. * OTHER DEALINGS IN THE SOFTWARE.
  23. *
  24. * Authors: Dave Airlie
  25. * Alex Deucher
  26. * Jerome Glisse
  27. */
  28. #include <linux/seq_file.h>
  29. #include "drmP.h"
  30. #include "drm.h"
  31. #include "radeon_reg.h"
  32. #include "radeon.h"
  33. /* r300,r350,rv350,rv370,rv380 depends on : */
  34. void r100_hdp_reset(struct radeon_device *rdev);
  35. int r100_cp_reset(struct radeon_device *rdev);
  36. int r100_rb2d_reset(struct radeon_device *rdev);
  37. int r100_cp_init(struct radeon_device *rdev, unsigned ring_size);
  38. int r100_pci_gart_enable(struct radeon_device *rdev);
  39. void r100_pci_gart_disable(struct radeon_device *rdev);
  40. void r100_mc_setup(struct radeon_device *rdev);
  41. void r100_mc_disable_clients(struct radeon_device *rdev);
  42. int r100_gui_wait_for_idle(struct radeon_device *rdev);
  43. int r100_cs_packet_parse(struct radeon_cs_parser *p,
  44. struct radeon_cs_packet *pkt,
  45. unsigned idx);
  46. int r100_cs_packet_next_reloc(struct radeon_cs_parser *p,
  47. struct radeon_cs_reloc **cs_reloc);
  48. int r100_cs_parse_packet0(struct radeon_cs_parser *p,
  49. struct radeon_cs_packet *pkt,
  50. unsigned *auth, unsigned n,
  51. radeon_packet0_check_t check);
  52. int r100_cs_parse_packet3(struct radeon_cs_parser *p,
  53. struct radeon_cs_packet *pkt,
  54. unsigned *auth, unsigned n,
  55. radeon_packet3_check_t check);
  56. void r100_cs_dump_packet(struct radeon_cs_parser *p,
  57. struct radeon_cs_packet *pkt);
  58. /* This files gather functions specifics to:
  59. * r300,r350,rv350,rv370,rv380
  60. *
  61. * Some of these functions might be used by newer ASICs.
  62. */
  63. void r300_gpu_init(struct radeon_device *rdev);
  64. int r300_mc_wait_for_idle(struct radeon_device *rdev);
  65. int rv370_debugfs_pcie_gart_info_init(struct radeon_device *rdev);
  66. /*
  67. * rv370,rv380 PCIE GART
  68. */
  69. void rv370_pcie_gart_tlb_flush(struct radeon_device *rdev)
  70. {
  71. uint32_t tmp;
  72. int i;
  73. /* Workaround HW bug do flush 2 times */
  74. for (i = 0; i < 2; i++) {
  75. tmp = RREG32_PCIE(RADEON_PCIE_TX_GART_CNTL);
  76. WREG32_PCIE(RADEON_PCIE_TX_GART_CNTL, tmp | RADEON_PCIE_TX_GART_INVALIDATE_TLB);
  77. (void)RREG32_PCIE(RADEON_PCIE_TX_GART_CNTL);
  78. WREG32_PCIE(RADEON_PCIE_TX_GART_CNTL, tmp);
  79. mb();
  80. }
  81. }
  82. int rv370_pcie_gart_enable(struct radeon_device *rdev)
  83. {
  84. uint32_t table_addr;
  85. uint32_t tmp;
  86. int r;
  87. /* Initialize common gart structure */
  88. r = radeon_gart_init(rdev);
  89. if (r) {
  90. return r;
  91. }
  92. r = rv370_debugfs_pcie_gart_info_init(rdev);
  93. if (r) {
  94. DRM_ERROR("Failed to register debugfs file for PCIE gart !\n");
  95. }
  96. rdev->gart.table_size = rdev->gart.num_gpu_pages * 4;
  97. r = radeon_gart_table_vram_alloc(rdev);
  98. if (r) {
  99. return r;
  100. }
  101. /* discard memory request outside of configured range */
  102. tmp = RADEON_PCIE_TX_GART_UNMAPPED_ACCESS_DISCARD;
  103. WREG32_PCIE(RADEON_PCIE_TX_GART_CNTL, tmp);
  104. WREG32_PCIE(RADEON_PCIE_TX_GART_START_LO, rdev->mc.gtt_location);
  105. tmp = rdev->mc.gtt_location + rdev->mc.gtt_size - 4096;
  106. WREG32_PCIE(RADEON_PCIE_TX_GART_END_LO, tmp);
  107. WREG32_PCIE(RADEON_PCIE_TX_GART_START_HI, 0);
  108. WREG32_PCIE(RADEON_PCIE_TX_GART_END_HI, 0);
  109. table_addr = rdev->gart.table_addr;
  110. WREG32_PCIE(RADEON_PCIE_TX_GART_BASE, table_addr);
  111. /* FIXME: setup default page */
  112. WREG32_PCIE(RADEON_PCIE_TX_DISCARD_RD_ADDR_LO, rdev->mc.vram_location);
  113. WREG32_PCIE(RADEON_PCIE_TX_DISCARD_RD_ADDR_HI, 0);
  114. /* Clear error */
  115. WREG32_PCIE(0x18, 0);
  116. tmp = RREG32_PCIE(RADEON_PCIE_TX_GART_CNTL);
  117. tmp |= RADEON_PCIE_TX_GART_EN;
  118. tmp |= RADEON_PCIE_TX_GART_UNMAPPED_ACCESS_DISCARD;
  119. WREG32_PCIE(RADEON_PCIE_TX_GART_CNTL, tmp);
  120. rv370_pcie_gart_tlb_flush(rdev);
  121. DRM_INFO("PCIE GART of %uM enabled (table at 0x%08X).\n",
  122. rdev->mc.gtt_size >> 20, table_addr);
  123. rdev->gart.ready = true;
  124. return 0;
  125. }
  126. void rv370_pcie_gart_disable(struct radeon_device *rdev)
  127. {
  128. uint32_t tmp;
  129. tmp = RREG32_PCIE(RADEON_PCIE_TX_GART_CNTL);
  130. tmp |= RADEON_PCIE_TX_GART_UNMAPPED_ACCESS_DISCARD;
  131. WREG32_PCIE(RADEON_PCIE_TX_GART_CNTL, tmp & ~RADEON_PCIE_TX_GART_EN);
  132. if (rdev->gart.table.vram.robj) {
  133. radeon_object_kunmap(rdev->gart.table.vram.robj);
  134. radeon_object_unpin(rdev->gart.table.vram.robj);
  135. }
  136. }
  137. int rv370_pcie_gart_set_page(struct radeon_device *rdev, int i, uint64_t addr)
  138. {
  139. void __iomem *ptr = (void *)rdev->gart.table.vram.ptr;
  140. if (i < 0 || i > rdev->gart.num_gpu_pages) {
  141. return -EINVAL;
  142. }
  143. addr = (((u32)addr) >> 8) | ((upper_32_bits(addr) & 0xff) << 4) | 0xC;
  144. writel(cpu_to_le32(addr), ((void __iomem *)ptr) + (i * 4));
  145. return 0;
  146. }
  147. int r300_gart_enable(struct radeon_device *rdev)
  148. {
  149. #if __OS_HAS_AGP
  150. if (rdev->flags & RADEON_IS_AGP) {
  151. if (rdev->family > CHIP_RV350) {
  152. rv370_pcie_gart_disable(rdev);
  153. } else {
  154. r100_pci_gart_disable(rdev);
  155. }
  156. return 0;
  157. }
  158. #endif
  159. if (rdev->flags & RADEON_IS_PCIE) {
  160. rdev->asic->gart_disable = &rv370_pcie_gart_disable;
  161. rdev->asic->gart_tlb_flush = &rv370_pcie_gart_tlb_flush;
  162. rdev->asic->gart_set_page = &rv370_pcie_gart_set_page;
  163. return rv370_pcie_gart_enable(rdev);
  164. }
  165. return r100_pci_gart_enable(rdev);
  166. }
  167. /*
  168. * MC
  169. */
  170. int r300_mc_init(struct radeon_device *rdev)
  171. {
  172. int r;
  173. if (r100_debugfs_rbbm_init(rdev)) {
  174. DRM_ERROR("Failed to register debugfs file for RBBM !\n");
  175. }
  176. r300_gpu_init(rdev);
  177. r100_pci_gart_disable(rdev);
  178. if (rdev->flags & RADEON_IS_PCIE) {
  179. rv370_pcie_gart_disable(rdev);
  180. }
  181. /* Setup GPU memory space */
  182. rdev->mc.vram_location = 0xFFFFFFFFUL;
  183. rdev->mc.gtt_location = 0xFFFFFFFFUL;
  184. if (rdev->flags & RADEON_IS_AGP) {
  185. r = radeon_agp_init(rdev);
  186. if (r) {
  187. printk(KERN_WARNING "[drm] Disabling AGP\n");
  188. rdev->flags &= ~RADEON_IS_AGP;
  189. rdev->mc.gtt_size = radeon_gart_size * 1024 * 1024;
  190. } else {
  191. rdev->mc.gtt_location = rdev->mc.agp_base;
  192. }
  193. }
  194. r = radeon_mc_setup(rdev);
  195. if (r) {
  196. return r;
  197. }
  198. /* Program GPU memory space */
  199. r100_mc_disable_clients(rdev);
  200. if (r300_mc_wait_for_idle(rdev)) {
  201. printk(KERN_WARNING "Failed to wait MC idle while "
  202. "programming pipes. Bad things might happen.\n");
  203. }
  204. r100_mc_setup(rdev);
  205. return 0;
  206. }
  207. void r300_mc_fini(struct radeon_device *rdev)
  208. {
  209. if (rdev->flags & RADEON_IS_PCIE) {
  210. rv370_pcie_gart_disable(rdev);
  211. radeon_gart_table_vram_free(rdev);
  212. } else {
  213. r100_pci_gart_disable(rdev);
  214. radeon_gart_table_ram_free(rdev);
  215. }
  216. radeon_gart_fini(rdev);
  217. }
  218. /*
  219. * Fence emission
  220. */
  221. void r300_fence_ring_emit(struct radeon_device *rdev,
  222. struct radeon_fence *fence)
  223. {
  224. /* Who ever call radeon_fence_emit should call ring_lock and ask
  225. * for enough space (today caller are ib schedule and buffer move) */
  226. /* Write SC register so SC & US assert idle */
  227. radeon_ring_write(rdev, PACKET0(0x43E0, 0));
  228. radeon_ring_write(rdev, 0);
  229. radeon_ring_write(rdev, PACKET0(0x43E4, 0));
  230. radeon_ring_write(rdev, 0);
  231. /* Flush 3D cache */
  232. radeon_ring_write(rdev, PACKET0(0x4E4C, 0));
  233. radeon_ring_write(rdev, (2 << 0));
  234. radeon_ring_write(rdev, PACKET0(0x4F18, 0));
  235. radeon_ring_write(rdev, (1 << 0));
  236. /* Wait until IDLE & CLEAN */
  237. radeon_ring_write(rdev, PACKET0(0x1720, 0));
  238. radeon_ring_write(rdev, (1 << 17) | (1 << 16) | (1 << 9));
  239. /* Emit fence sequence & fire IRQ */
  240. radeon_ring_write(rdev, PACKET0(rdev->fence_drv.scratch_reg, 0));
  241. radeon_ring_write(rdev, fence->seq);
  242. radeon_ring_write(rdev, PACKET0(RADEON_GEN_INT_STATUS, 0));
  243. radeon_ring_write(rdev, RADEON_SW_INT_FIRE);
  244. }
  245. /*
  246. * Global GPU functions
  247. */
  248. int r300_copy_dma(struct radeon_device *rdev,
  249. uint64_t src_offset,
  250. uint64_t dst_offset,
  251. unsigned num_pages,
  252. struct radeon_fence *fence)
  253. {
  254. uint32_t size;
  255. uint32_t cur_size;
  256. int i, num_loops;
  257. int r = 0;
  258. /* radeon pitch is /64 */
  259. size = num_pages << PAGE_SHIFT;
  260. num_loops = DIV_ROUND_UP(size, 0x1FFFFF);
  261. r = radeon_ring_lock(rdev, num_loops * 4 + 64);
  262. if (r) {
  263. DRM_ERROR("radeon: moving bo (%d).\n", r);
  264. return r;
  265. }
  266. /* Must wait for 2D idle & clean before DMA or hangs might happen */
  267. radeon_ring_write(rdev, PACKET0(RADEON_WAIT_UNTIL, 0));
  268. radeon_ring_write(rdev, (1 << 16));
  269. for (i = 0; i < num_loops; i++) {
  270. cur_size = size;
  271. if (cur_size > 0x1FFFFF) {
  272. cur_size = 0x1FFFFF;
  273. }
  274. size -= cur_size;
  275. radeon_ring_write(rdev, PACKET0(0x720, 2));
  276. radeon_ring_write(rdev, src_offset);
  277. radeon_ring_write(rdev, dst_offset);
  278. radeon_ring_write(rdev, cur_size | (1 << 31) | (1 << 30));
  279. src_offset += cur_size;
  280. dst_offset += cur_size;
  281. }
  282. radeon_ring_write(rdev, PACKET0(RADEON_WAIT_UNTIL, 0));
  283. radeon_ring_write(rdev, RADEON_WAIT_DMA_GUI_IDLE);
  284. if (fence) {
  285. r = radeon_fence_emit(rdev, fence);
  286. }
  287. radeon_ring_unlock_commit(rdev);
  288. return r;
  289. }
  290. void r300_ring_start(struct radeon_device *rdev)
  291. {
  292. unsigned gb_tile_config;
  293. int r;
  294. /* Sub pixel 1/12 so we can have 4K rendering according to doc */
  295. gb_tile_config = (R300_ENABLE_TILING | R300_TILE_SIZE_16);
  296. switch (rdev->num_gb_pipes) {
  297. case 2:
  298. gb_tile_config |= R300_PIPE_COUNT_R300;
  299. break;
  300. case 3:
  301. gb_tile_config |= R300_PIPE_COUNT_R420_3P;
  302. break;
  303. case 4:
  304. gb_tile_config |= R300_PIPE_COUNT_R420;
  305. break;
  306. case 1:
  307. default:
  308. gb_tile_config |= R300_PIPE_COUNT_RV350;
  309. break;
  310. }
  311. r = radeon_ring_lock(rdev, 64);
  312. if (r) {
  313. return;
  314. }
  315. radeon_ring_write(rdev, PACKET0(RADEON_ISYNC_CNTL, 0));
  316. radeon_ring_write(rdev,
  317. RADEON_ISYNC_ANY2D_IDLE3D |
  318. RADEON_ISYNC_ANY3D_IDLE2D |
  319. RADEON_ISYNC_WAIT_IDLEGUI |
  320. RADEON_ISYNC_CPSCRATCH_IDLEGUI);
  321. radeon_ring_write(rdev, PACKET0(R300_GB_TILE_CONFIG, 0));
  322. radeon_ring_write(rdev, gb_tile_config);
  323. radeon_ring_write(rdev, PACKET0(RADEON_WAIT_UNTIL, 0));
  324. radeon_ring_write(rdev,
  325. RADEON_WAIT_2D_IDLECLEAN |
  326. RADEON_WAIT_3D_IDLECLEAN);
  327. radeon_ring_write(rdev, PACKET0(0x170C, 0));
  328. radeon_ring_write(rdev, 1 << 31);
  329. radeon_ring_write(rdev, PACKET0(R300_GB_SELECT, 0));
  330. radeon_ring_write(rdev, 0);
  331. radeon_ring_write(rdev, PACKET0(R300_GB_ENABLE, 0));
  332. radeon_ring_write(rdev, 0);
  333. radeon_ring_write(rdev, PACKET0(R300_RB3D_DSTCACHE_CTLSTAT, 0));
  334. radeon_ring_write(rdev, R300_RB3D_DC_FLUSH | R300_RB3D_DC_FREE);
  335. radeon_ring_write(rdev, PACKET0(R300_RB3D_ZCACHE_CTLSTAT, 0));
  336. radeon_ring_write(rdev, R300_ZC_FLUSH | R300_ZC_FREE);
  337. radeon_ring_write(rdev, PACKET0(RADEON_WAIT_UNTIL, 0));
  338. radeon_ring_write(rdev,
  339. RADEON_WAIT_2D_IDLECLEAN |
  340. RADEON_WAIT_3D_IDLECLEAN);
  341. radeon_ring_write(rdev, PACKET0(R300_GB_AA_CONFIG, 0));
  342. radeon_ring_write(rdev, 0);
  343. radeon_ring_write(rdev, PACKET0(R300_RB3D_DSTCACHE_CTLSTAT, 0));
  344. radeon_ring_write(rdev, R300_RB3D_DC_FLUSH | R300_RB3D_DC_FREE);
  345. radeon_ring_write(rdev, PACKET0(R300_RB3D_ZCACHE_CTLSTAT, 0));
  346. radeon_ring_write(rdev, R300_ZC_FLUSH | R300_ZC_FREE);
  347. radeon_ring_write(rdev, PACKET0(R300_GB_MSPOS0, 0));
  348. radeon_ring_write(rdev,
  349. ((6 << R300_MS_X0_SHIFT) |
  350. (6 << R300_MS_Y0_SHIFT) |
  351. (6 << R300_MS_X1_SHIFT) |
  352. (6 << R300_MS_Y1_SHIFT) |
  353. (6 << R300_MS_X2_SHIFT) |
  354. (6 << R300_MS_Y2_SHIFT) |
  355. (6 << R300_MSBD0_Y_SHIFT) |
  356. (6 << R300_MSBD0_X_SHIFT)));
  357. radeon_ring_write(rdev, PACKET0(R300_GB_MSPOS1, 0));
  358. radeon_ring_write(rdev,
  359. ((6 << R300_MS_X3_SHIFT) |
  360. (6 << R300_MS_Y3_SHIFT) |
  361. (6 << R300_MS_X4_SHIFT) |
  362. (6 << R300_MS_Y4_SHIFT) |
  363. (6 << R300_MS_X5_SHIFT) |
  364. (6 << R300_MS_Y5_SHIFT) |
  365. (6 << R300_MSBD1_SHIFT)));
  366. radeon_ring_write(rdev, PACKET0(R300_GA_ENHANCE, 0));
  367. radeon_ring_write(rdev, R300_GA_DEADLOCK_CNTL | R300_GA_FASTSYNC_CNTL);
  368. radeon_ring_write(rdev, PACKET0(R300_GA_POLY_MODE, 0));
  369. radeon_ring_write(rdev,
  370. R300_FRONT_PTYPE_TRIANGE | R300_BACK_PTYPE_TRIANGE);
  371. radeon_ring_write(rdev, PACKET0(R300_GA_ROUND_MODE, 0));
  372. radeon_ring_write(rdev,
  373. R300_GEOMETRY_ROUND_NEAREST |
  374. R300_COLOR_ROUND_NEAREST);
  375. radeon_ring_unlock_commit(rdev);
  376. }
  377. void r300_errata(struct radeon_device *rdev)
  378. {
  379. rdev->pll_errata = 0;
  380. if (rdev->family == CHIP_R300 &&
  381. (RREG32(RADEON_CONFIG_CNTL) & RADEON_CFG_ATI_REV_ID_MASK) == RADEON_CFG_ATI_REV_A11) {
  382. rdev->pll_errata |= CHIP_ERRATA_R300_CG;
  383. }
  384. }
  385. int r300_mc_wait_for_idle(struct radeon_device *rdev)
  386. {
  387. unsigned i;
  388. uint32_t tmp;
  389. for (i = 0; i < rdev->usec_timeout; i++) {
  390. /* read MC_STATUS */
  391. tmp = RREG32(0x0150);
  392. if (tmp & (1 << 4)) {
  393. return 0;
  394. }
  395. DRM_UDELAY(1);
  396. }
  397. return -1;
  398. }
  399. void r300_gpu_init(struct radeon_device *rdev)
  400. {
  401. uint32_t gb_tile_config, tmp;
  402. r100_hdp_reset(rdev);
  403. /* FIXME: rv380 one pipes ? */
  404. if ((rdev->family == CHIP_R300) || (rdev->family == CHIP_R350)) {
  405. /* r300,r350 */
  406. rdev->num_gb_pipes = 2;
  407. } else {
  408. /* rv350,rv370,rv380 */
  409. rdev->num_gb_pipes = 1;
  410. }
  411. gb_tile_config = (R300_ENABLE_TILING | R300_TILE_SIZE_16);
  412. switch (rdev->num_gb_pipes) {
  413. case 2:
  414. gb_tile_config |= R300_PIPE_COUNT_R300;
  415. break;
  416. case 3:
  417. gb_tile_config |= R300_PIPE_COUNT_R420_3P;
  418. break;
  419. case 4:
  420. gb_tile_config |= R300_PIPE_COUNT_R420;
  421. break;
  422. case 1:
  423. default:
  424. gb_tile_config |= R300_PIPE_COUNT_RV350;
  425. break;
  426. }
  427. WREG32(R300_GB_TILE_CONFIG, gb_tile_config);
  428. if (r100_gui_wait_for_idle(rdev)) {
  429. printk(KERN_WARNING "Failed to wait GUI idle while "
  430. "programming pipes. Bad things might happen.\n");
  431. }
  432. tmp = RREG32(0x170C);
  433. WREG32(0x170C, tmp | (1 << 31));
  434. WREG32(R300_RB2D_DSTCACHE_MODE,
  435. R300_DC_AUTOFLUSH_ENABLE |
  436. R300_DC_DC_DISABLE_IGNORE_PE);
  437. if (r100_gui_wait_for_idle(rdev)) {
  438. printk(KERN_WARNING "Failed to wait GUI idle while "
  439. "programming pipes. Bad things might happen.\n");
  440. }
  441. if (r300_mc_wait_for_idle(rdev)) {
  442. printk(KERN_WARNING "Failed to wait MC idle while "
  443. "programming pipes. Bad things might happen.\n");
  444. }
  445. DRM_INFO("radeon: %d pipes initialized.\n", rdev->num_gb_pipes);
  446. }
  447. int r300_ga_reset(struct radeon_device *rdev)
  448. {
  449. uint32_t tmp;
  450. bool reinit_cp;
  451. int i;
  452. reinit_cp = rdev->cp.ready;
  453. rdev->cp.ready = false;
  454. for (i = 0; i < rdev->usec_timeout; i++) {
  455. WREG32(RADEON_CP_CSQ_MODE, 0);
  456. WREG32(RADEON_CP_CSQ_CNTL, 0);
  457. WREG32(RADEON_RBBM_SOFT_RESET, 0x32005);
  458. (void)RREG32(RADEON_RBBM_SOFT_RESET);
  459. udelay(200);
  460. WREG32(RADEON_RBBM_SOFT_RESET, 0);
  461. /* Wait to prevent race in RBBM_STATUS */
  462. mdelay(1);
  463. tmp = RREG32(RADEON_RBBM_STATUS);
  464. if (tmp & ((1 << 20) | (1 << 26))) {
  465. DRM_ERROR("VAP & CP still busy (RBBM_STATUS=0x%08X)", tmp);
  466. /* GA still busy soft reset it */
  467. WREG32(0x429C, 0x200);
  468. WREG32(R300_VAP_PVS_STATE_FLUSH_REG, 0);
  469. WREG32(0x43E0, 0);
  470. WREG32(0x43E4, 0);
  471. WREG32(0x24AC, 0);
  472. }
  473. /* Wait to prevent race in RBBM_STATUS */
  474. mdelay(1);
  475. tmp = RREG32(RADEON_RBBM_STATUS);
  476. if (!(tmp & ((1 << 20) | (1 << 26)))) {
  477. break;
  478. }
  479. }
  480. for (i = 0; i < rdev->usec_timeout; i++) {
  481. tmp = RREG32(RADEON_RBBM_STATUS);
  482. if (!(tmp & ((1 << 20) | (1 << 26)))) {
  483. DRM_INFO("GA reset succeed (RBBM_STATUS=0x%08X)\n",
  484. tmp);
  485. if (reinit_cp) {
  486. return r100_cp_init(rdev, rdev->cp.ring_size);
  487. }
  488. return 0;
  489. }
  490. DRM_UDELAY(1);
  491. }
  492. tmp = RREG32(RADEON_RBBM_STATUS);
  493. DRM_ERROR("Failed to reset GA ! (RBBM_STATUS=0x%08X)\n", tmp);
  494. return -1;
  495. }
  496. int r300_gpu_reset(struct radeon_device *rdev)
  497. {
  498. uint32_t status;
  499. /* reset order likely matter */
  500. status = RREG32(RADEON_RBBM_STATUS);
  501. /* reset HDP */
  502. r100_hdp_reset(rdev);
  503. /* reset rb2d */
  504. if (status & ((1 << 17) | (1 << 18) | (1 << 27))) {
  505. r100_rb2d_reset(rdev);
  506. }
  507. /* reset GA */
  508. if (status & ((1 << 20) | (1 << 26))) {
  509. r300_ga_reset(rdev);
  510. }
  511. /* reset CP */
  512. status = RREG32(RADEON_RBBM_STATUS);
  513. if (status & (1 << 16)) {
  514. r100_cp_reset(rdev);
  515. }
  516. /* Check if GPU is idle */
  517. status = RREG32(RADEON_RBBM_STATUS);
  518. if (status & (1 << 31)) {
  519. DRM_ERROR("Failed to reset GPU (RBBM_STATUS=0x%08X)\n", status);
  520. return -1;
  521. }
  522. DRM_INFO("GPU reset succeed (RBBM_STATUS=0x%08X)\n", status);
  523. return 0;
  524. }
  525. /*
  526. * r300,r350,rv350,rv380 VRAM info
  527. */
  528. void r300_vram_info(struct radeon_device *rdev)
  529. {
  530. uint32_t tmp;
  531. /* DDR for all card after R300 & IGP */
  532. rdev->mc.vram_is_ddr = true;
  533. tmp = RREG32(RADEON_MEM_CNTL);
  534. if (tmp & R300_MEM_NUM_CHANNELS_MASK) {
  535. rdev->mc.vram_width = 128;
  536. } else {
  537. rdev->mc.vram_width = 64;
  538. }
  539. rdev->mc.vram_size = RREG32(RADEON_CONFIG_MEMSIZE);
  540. rdev->mc.aper_base = drm_get_resource_start(rdev->ddev, 0);
  541. rdev->mc.aper_size = drm_get_resource_len(rdev->ddev, 0);
  542. }
  543. /*
  544. * Indirect registers accessor
  545. */
  546. uint32_t rv370_pcie_rreg(struct radeon_device *rdev, uint32_t reg)
  547. {
  548. uint32_t r;
  549. WREG8(RADEON_PCIE_INDEX, ((reg) & 0xff));
  550. (void)RREG32(RADEON_PCIE_INDEX);
  551. r = RREG32(RADEON_PCIE_DATA);
  552. return r;
  553. }
  554. void rv370_pcie_wreg(struct radeon_device *rdev, uint32_t reg, uint32_t v)
  555. {
  556. WREG8(RADEON_PCIE_INDEX, ((reg) & 0xff));
  557. (void)RREG32(RADEON_PCIE_INDEX);
  558. WREG32(RADEON_PCIE_DATA, (v));
  559. (void)RREG32(RADEON_PCIE_DATA);
  560. }
  561. /*
  562. * PCIE Lanes
  563. */
  564. void rv370_set_pcie_lanes(struct radeon_device *rdev, int lanes)
  565. {
  566. uint32_t link_width_cntl, mask;
  567. if (rdev->flags & RADEON_IS_IGP)
  568. return;
  569. if (!(rdev->flags & RADEON_IS_PCIE))
  570. return;
  571. /* FIXME wait for idle */
  572. switch (lanes) {
  573. case 0:
  574. mask = RADEON_PCIE_LC_LINK_WIDTH_X0;
  575. break;
  576. case 1:
  577. mask = RADEON_PCIE_LC_LINK_WIDTH_X1;
  578. break;
  579. case 2:
  580. mask = RADEON_PCIE_LC_LINK_WIDTH_X2;
  581. break;
  582. case 4:
  583. mask = RADEON_PCIE_LC_LINK_WIDTH_X4;
  584. break;
  585. case 8:
  586. mask = RADEON_PCIE_LC_LINK_WIDTH_X8;
  587. break;
  588. case 12:
  589. mask = RADEON_PCIE_LC_LINK_WIDTH_X12;
  590. break;
  591. case 16:
  592. default:
  593. mask = RADEON_PCIE_LC_LINK_WIDTH_X16;
  594. break;
  595. }
  596. link_width_cntl = RREG32_PCIE(RADEON_PCIE_LC_LINK_WIDTH_CNTL);
  597. if ((link_width_cntl & RADEON_PCIE_LC_LINK_WIDTH_RD_MASK) ==
  598. (mask << RADEON_PCIE_LC_LINK_WIDTH_RD_SHIFT))
  599. return;
  600. link_width_cntl &= ~(RADEON_PCIE_LC_LINK_WIDTH_MASK |
  601. RADEON_PCIE_LC_RECONFIG_NOW |
  602. RADEON_PCIE_LC_RECONFIG_LATER |
  603. RADEON_PCIE_LC_SHORT_RECONFIG_EN);
  604. link_width_cntl |= mask;
  605. WREG32_PCIE(RADEON_PCIE_LC_LINK_WIDTH_CNTL, link_width_cntl);
  606. WREG32_PCIE(RADEON_PCIE_LC_LINK_WIDTH_CNTL, (link_width_cntl |
  607. RADEON_PCIE_LC_RECONFIG_NOW));
  608. /* wait for lane set to complete */
  609. link_width_cntl = RREG32_PCIE(RADEON_PCIE_LC_LINK_WIDTH_CNTL);
  610. while (link_width_cntl == 0xffffffff)
  611. link_width_cntl = RREG32_PCIE(RADEON_PCIE_LC_LINK_WIDTH_CNTL);
  612. }
  613. /*
  614. * Debugfs info
  615. */
  616. #if defined(CONFIG_DEBUG_FS)
  617. static int rv370_debugfs_pcie_gart_info(struct seq_file *m, void *data)
  618. {
  619. struct drm_info_node *node = (struct drm_info_node *) m->private;
  620. struct drm_device *dev = node->minor->dev;
  621. struct radeon_device *rdev = dev->dev_private;
  622. uint32_t tmp;
  623. tmp = RREG32_PCIE(RADEON_PCIE_TX_GART_CNTL);
  624. seq_printf(m, "PCIE_TX_GART_CNTL 0x%08x\n", tmp);
  625. tmp = RREG32_PCIE(RADEON_PCIE_TX_GART_BASE);
  626. seq_printf(m, "PCIE_TX_GART_BASE 0x%08x\n", tmp);
  627. tmp = RREG32_PCIE(RADEON_PCIE_TX_GART_START_LO);
  628. seq_printf(m, "PCIE_TX_GART_START_LO 0x%08x\n", tmp);
  629. tmp = RREG32_PCIE(RADEON_PCIE_TX_GART_START_HI);
  630. seq_printf(m, "PCIE_TX_GART_START_HI 0x%08x\n", tmp);
  631. tmp = RREG32_PCIE(RADEON_PCIE_TX_GART_END_LO);
  632. seq_printf(m, "PCIE_TX_GART_END_LO 0x%08x\n", tmp);
  633. tmp = RREG32_PCIE(RADEON_PCIE_TX_GART_END_HI);
  634. seq_printf(m, "PCIE_TX_GART_END_HI 0x%08x\n", tmp);
  635. tmp = RREG32_PCIE(RADEON_PCIE_TX_GART_ERROR);
  636. seq_printf(m, "PCIE_TX_GART_ERROR 0x%08x\n", tmp);
  637. return 0;
  638. }
  639. static struct drm_info_list rv370_pcie_gart_info_list[] = {
  640. {"rv370_pcie_gart_info", rv370_debugfs_pcie_gart_info, 0, NULL},
  641. };
  642. #endif
  643. int rv370_debugfs_pcie_gart_info_init(struct radeon_device *rdev)
  644. {
  645. #if defined(CONFIG_DEBUG_FS)
  646. return radeon_debugfs_add_files(rdev, rv370_pcie_gart_info_list, 1);
  647. #else
  648. return 0;
  649. #endif
  650. }
  651. /*
  652. * CS functions
  653. */
  654. struct r300_cs_track_cb {
  655. struct radeon_object *robj;
  656. unsigned pitch;
  657. unsigned cpp;
  658. unsigned offset;
  659. };
  660. struct r300_cs_track {
  661. unsigned num_cb;
  662. unsigned maxy;
  663. struct r300_cs_track_cb cb[4];
  664. struct r300_cs_track_cb zb;
  665. bool z_enabled;
  666. };
  667. int r300_cs_track_check(struct radeon_device *rdev, struct r300_cs_track *track)
  668. {
  669. unsigned i;
  670. unsigned long size;
  671. for (i = 0; i < track->num_cb; i++) {
  672. if (track->cb[i].robj == NULL) {
  673. DRM_ERROR("[drm] No buffer for color buffer %d !\n", i);
  674. return -EINVAL;
  675. }
  676. size = track->cb[i].pitch * track->cb[i].cpp * track->maxy;
  677. size += track->cb[i].offset;
  678. if (size > radeon_object_size(track->cb[i].robj)) {
  679. DRM_ERROR("[drm] Buffer too small for color buffer %d "
  680. "(need %lu have %lu) !\n", i, size,
  681. radeon_object_size(track->cb[i].robj));
  682. DRM_ERROR("[drm] color buffer %d (%u %u %u %u)\n",
  683. i, track->cb[i].pitch, track->cb[i].cpp,
  684. track->cb[i].offset, track->maxy);
  685. return -EINVAL;
  686. }
  687. }
  688. if (track->z_enabled) {
  689. if (track->zb.robj == NULL) {
  690. DRM_ERROR("[drm] No buffer for z buffer !\n");
  691. return -EINVAL;
  692. }
  693. size = track->zb.pitch * track->zb.cpp * track->maxy;
  694. size += track->zb.offset;
  695. if (size > radeon_object_size(track->zb.robj)) {
  696. DRM_ERROR("[drm] Buffer too small for z buffer "
  697. "(need %lu have %lu) !\n", size,
  698. radeon_object_size(track->zb.robj));
  699. return -EINVAL;
  700. }
  701. }
  702. return 0;
  703. }
  704. static inline void r300_cs_track_clear(struct r300_cs_track *track)
  705. {
  706. unsigned i;
  707. track->num_cb = 4;
  708. track->maxy = 4096;
  709. for (i = 0; i < track->num_cb; i++) {
  710. track->cb[i].robj = NULL;
  711. track->cb[i].pitch = 8192;
  712. track->cb[i].cpp = 16;
  713. track->cb[i].offset = 0;
  714. }
  715. track->z_enabled = true;
  716. track->zb.robj = NULL;
  717. track->zb.pitch = 8192;
  718. track->zb.cpp = 4;
  719. track->zb.offset = 0;
  720. }
  721. static unsigned r300_auth_reg[] = {
  722. 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF,
  723. 0xFFFFFFBF, 0xFFFFFFFF, 0xFFFFFFBF, 0xFFFFFFFF,
  724. 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF,
  725. 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF,
  726. 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF,
  727. 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF,
  728. 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF,
  729. 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF,
  730. 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF,
  731. 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF,
  732. 0x17FF1FFF, 0xFFFFFFFC, 0xFFFFFFFF, 0xFF30FFBF,
  733. 0xFFFFFFF8, 0xC3E6FFFF, 0xFFFFF6DF, 0xFFFFFFFF,
  734. 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF,
  735. 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF,
  736. 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFF03F,
  737. 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF,
  738. 0xFFFFFFFF, 0xFFFFCFCC, 0xF00E9FFF, 0x007C0000,
  739. 0xF0000078, 0xFF000009, 0xFFFFFFFF, 0xFFFFFFFF,
  740. 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF,
  741. 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF,
  742. 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF,
  743. 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF,
  744. 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF,
  745. 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF,
  746. 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF,
  747. 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF,
  748. 0xFFFFF7FF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF,
  749. 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF,
  750. 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF,
  751. 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF,
  752. 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF,
  753. 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF, 0xFFFFFFFF,
  754. 0xFFFFFC78, 0xFFFFFFFF, 0xFFFFFFFC, 0xFFFFFFFF,
  755. 0x38FF8F50, 0xFFF88082, 0xF000000C, 0xFAE009FF,
  756. 0x00000000, 0x00000000, 0xFFFF0000, 0x00000000,
  757. 0x00000000, 0x0000C100, 0x00000000, 0x00000000,
  758. 0x00000000, 0x00000000, 0x00000000, 0x00000000,
  759. 0x00000000, 0xFFFF0000, 0xFFFFFFFF, 0xFF80FFFF,
  760. 0x00000000, 0x00000000, 0x00000000, 0x00000000,
  761. 0x0003FC01, 0xFFFFFFF8, 0xFE800B19,
  762. };
  763. static int r300_packet0_check(struct radeon_cs_parser *p,
  764. struct radeon_cs_packet *pkt,
  765. unsigned idx, unsigned reg)
  766. {
  767. struct radeon_cs_chunk *ib_chunk;
  768. struct radeon_cs_reloc *reloc;
  769. struct r300_cs_track *track;
  770. volatile uint32_t *ib;
  771. uint32_t tmp;
  772. unsigned i;
  773. int r;
  774. ib = p->ib->ptr;
  775. ib_chunk = &p->chunks[p->chunk_ib_idx];
  776. track = (struct r300_cs_track *)p->track;
  777. switch (reg) {
  778. case RADEON_DST_PITCH_OFFSET:
  779. case RADEON_SRC_PITCH_OFFSET:
  780. r = r100_cs_packet_next_reloc(p, &reloc);
  781. if (r) {
  782. DRM_ERROR("No reloc for ib[%d]=0x%04X\n",
  783. idx, reg);
  784. r100_cs_dump_packet(p, pkt);
  785. return r;
  786. }
  787. tmp = ib_chunk->kdata[idx] & 0x003fffff;
  788. tmp += (((u32)reloc->lobj.gpu_offset) >> 10);
  789. ib[idx] = (ib_chunk->kdata[idx] & 0xffc00000) | tmp;
  790. break;
  791. case R300_RB3D_COLOROFFSET0:
  792. case R300_RB3D_COLOROFFSET1:
  793. case R300_RB3D_COLOROFFSET2:
  794. case R300_RB3D_COLOROFFSET3:
  795. i = (reg - R300_RB3D_COLOROFFSET0) >> 2;
  796. r = r100_cs_packet_next_reloc(p, &reloc);
  797. if (r) {
  798. DRM_ERROR("No reloc for ib[%d]=0x%04X\n",
  799. idx, reg);
  800. r100_cs_dump_packet(p, pkt);
  801. return r;
  802. }
  803. track->cb[i].robj = reloc->robj;
  804. track->cb[i].offset = ib_chunk->kdata[idx];
  805. ib[idx] = ib_chunk->kdata[idx] + ((u32)reloc->lobj.gpu_offset);
  806. break;
  807. case R300_ZB_DEPTHOFFSET:
  808. r = r100_cs_packet_next_reloc(p, &reloc);
  809. if (r) {
  810. DRM_ERROR("No reloc for ib[%d]=0x%04X\n",
  811. idx, reg);
  812. r100_cs_dump_packet(p, pkt);
  813. return r;
  814. }
  815. track->zb.robj = reloc->robj;
  816. track->zb.offset = ib_chunk->kdata[idx];
  817. ib[idx] = ib_chunk->kdata[idx] + ((u32)reloc->lobj.gpu_offset);
  818. break;
  819. case R300_TX_OFFSET_0:
  820. case R300_TX_OFFSET_0+4:
  821. case R300_TX_OFFSET_0+8:
  822. case R300_TX_OFFSET_0+12:
  823. case R300_TX_OFFSET_0+16:
  824. case R300_TX_OFFSET_0+20:
  825. case R300_TX_OFFSET_0+24:
  826. case R300_TX_OFFSET_0+28:
  827. case R300_TX_OFFSET_0+32:
  828. case R300_TX_OFFSET_0+36:
  829. case R300_TX_OFFSET_0+40:
  830. case R300_TX_OFFSET_0+44:
  831. case R300_TX_OFFSET_0+48:
  832. case R300_TX_OFFSET_0+52:
  833. case R300_TX_OFFSET_0+56:
  834. case R300_TX_OFFSET_0+60:
  835. r = r100_cs_packet_next_reloc(p, &reloc);
  836. if (r) {
  837. DRM_ERROR("No reloc for ib[%d]=0x%04X\n",
  838. idx, reg);
  839. r100_cs_dump_packet(p, pkt);
  840. return r;
  841. }
  842. ib[idx] = ib_chunk->kdata[idx] + ((u32)reloc->lobj.gpu_offset);
  843. break;
  844. /* Tracked registers */
  845. case 0x43E4:
  846. /* SC_SCISSOR1 */
  847. track->maxy = ((ib_chunk->kdata[idx] >> 13) & 0x1FFF) + 1;
  848. if (p->rdev->family < CHIP_RV515) {
  849. track->maxy -= 1440;
  850. }
  851. break;
  852. case 0x4E00:
  853. /* RB3D_CCTL */
  854. track->num_cb = ((ib_chunk->kdata[idx] >> 5) & 0x3) + 1;
  855. break;
  856. case 0x4E38:
  857. case 0x4E3C:
  858. case 0x4E40:
  859. case 0x4E44:
  860. /* RB3D_COLORPITCH0 */
  861. /* RB3D_COLORPITCH1 */
  862. /* RB3D_COLORPITCH2 */
  863. /* RB3D_COLORPITCH3 */
  864. i = (reg - 0x4E38) >> 2;
  865. track->cb[i].pitch = ib_chunk->kdata[idx] & 0x3FFE;
  866. switch (((ib_chunk->kdata[idx] >> 21) & 0xF)) {
  867. case 9:
  868. case 11:
  869. case 12:
  870. track->cb[i].cpp = 1;
  871. break;
  872. case 3:
  873. case 4:
  874. case 13:
  875. case 15:
  876. track->cb[i].cpp = 2;
  877. break;
  878. case 6:
  879. track->cb[i].cpp = 4;
  880. break;
  881. case 10:
  882. track->cb[i].cpp = 8;
  883. break;
  884. case 7:
  885. track->cb[i].cpp = 16;
  886. break;
  887. default:
  888. DRM_ERROR("Invalid color buffer format (%d) !\n",
  889. ((ib_chunk->kdata[idx] >> 21) & 0xF));
  890. return -EINVAL;
  891. }
  892. break;
  893. case 0x4F00:
  894. /* ZB_CNTL */
  895. if (ib_chunk->kdata[idx] & 2) {
  896. track->z_enabled = true;
  897. } else {
  898. track->z_enabled = false;
  899. }
  900. break;
  901. case 0x4F10:
  902. /* ZB_FORMAT */
  903. switch ((ib_chunk->kdata[idx] & 0xF)) {
  904. case 0:
  905. case 1:
  906. track->zb.cpp = 2;
  907. break;
  908. case 2:
  909. track->zb.cpp = 4;
  910. break;
  911. default:
  912. DRM_ERROR("Invalid z buffer format (%d) !\n",
  913. (ib_chunk->kdata[idx] & 0xF));
  914. return -EINVAL;
  915. }
  916. break;
  917. case 0x4F24:
  918. /* ZB_DEPTHPITCH */
  919. track->zb.pitch = ib_chunk->kdata[idx] & 0x3FFC;
  920. break;
  921. default:
  922. printk(KERN_ERR "Forbidden register 0x%04X in cs at %d\n", reg, idx);
  923. return -EINVAL;
  924. }
  925. return 0;
  926. }
  927. static int r300_packet3_check(struct radeon_cs_parser *p,
  928. struct radeon_cs_packet *pkt)
  929. {
  930. struct radeon_cs_chunk *ib_chunk;
  931. struct radeon_cs_reloc *reloc;
  932. struct r300_cs_track *track;
  933. volatile uint32_t *ib;
  934. unsigned idx;
  935. unsigned i, c;
  936. int r;
  937. ib = p->ib->ptr;
  938. ib_chunk = &p->chunks[p->chunk_ib_idx];
  939. idx = pkt->idx + 1;
  940. track = (struct r300_cs_track *)p->track;
  941. switch (pkt->opcode) {
  942. case PACKET3_3D_LOAD_VBPNTR:
  943. c = ib_chunk->kdata[idx++];
  944. for (i = 0; i < (c - 1); i += 2, idx += 3) {
  945. r = r100_cs_packet_next_reloc(p, &reloc);
  946. if (r) {
  947. DRM_ERROR("No reloc for packet3 %d\n",
  948. pkt->opcode);
  949. r100_cs_dump_packet(p, pkt);
  950. return r;
  951. }
  952. ib[idx+1] = ib_chunk->kdata[idx+1] + ((u32)reloc->lobj.gpu_offset);
  953. r = r100_cs_packet_next_reloc(p, &reloc);
  954. if (r) {
  955. DRM_ERROR("No reloc for packet3 %d\n",
  956. pkt->opcode);
  957. r100_cs_dump_packet(p, pkt);
  958. return r;
  959. }
  960. ib[idx+2] = ib_chunk->kdata[idx+2] + ((u32)reloc->lobj.gpu_offset);
  961. }
  962. if (c & 1) {
  963. r = r100_cs_packet_next_reloc(p, &reloc);
  964. if (r) {
  965. DRM_ERROR("No reloc for packet3 %d\n",
  966. pkt->opcode);
  967. r100_cs_dump_packet(p, pkt);
  968. return r;
  969. }
  970. ib[idx+1] = ib_chunk->kdata[idx+1] + ((u32)reloc->lobj.gpu_offset);
  971. }
  972. break;
  973. case PACKET3_INDX_BUFFER:
  974. r = r100_cs_packet_next_reloc(p, &reloc);
  975. if (r) {
  976. DRM_ERROR("No reloc for packet3 %d\n", pkt->opcode);
  977. r100_cs_dump_packet(p, pkt);
  978. return r;
  979. }
  980. ib[idx+1] = ib_chunk->kdata[idx+1] + ((u32)reloc->lobj.gpu_offset);
  981. break;
  982. /* Draw packet */
  983. case PACKET3_3D_DRAW_VBUF:
  984. case PACKET3_3D_DRAW_IMMD:
  985. case PACKET3_3D_DRAW_INDX:
  986. case PACKET3_3D_DRAW_VBUF_2:
  987. case PACKET3_3D_DRAW_IMMD_2:
  988. case PACKET3_3D_DRAW_INDX_2:
  989. r = r300_cs_track_check(p->rdev, track);
  990. if (r) {
  991. return r;
  992. }
  993. break;
  994. case PACKET3_NOP:
  995. break;
  996. default:
  997. DRM_ERROR("Packet3 opcode %x not supported\n", pkt->opcode);
  998. return -EINVAL;
  999. }
  1000. return 0;
  1001. }
  1002. int r300_cs_parse(struct radeon_cs_parser *p)
  1003. {
  1004. struct radeon_cs_packet pkt;
  1005. struct r300_cs_track track;
  1006. int r;
  1007. r300_cs_track_clear(&track);
  1008. p->track = &track;
  1009. do {
  1010. r = r100_cs_packet_parse(p, &pkt, p->idx);
  1011. if (r) {
  1012. return r;
  1013. }
  1014. p->idx += pkt.count + 2;
  1015. switch (pkt.type) {
  1016. case PACKET_TYPE0:
  1017. r = r100_cs_parse_packet0(p, &pkt,
  1018. r300_auth_reg,
  1019. ARRAY_SIZE(r300_auth_reg),
  1020. &r300_packet0_check);
  1021. break;
  1022. case PACKET_TYPE2:
  1023. break;
  1024. case PACKET_TYPE3:
  1025. r = r300_packet3_check(p, &pkt);
  1026. break;
  1027. default:
  1028. DRM_ERROR("Unknown packet type %d !\n", pkt.type);
  1029. return -EINVAL;
  1030. }
  1031. if (r) {
  1032. return r;
  1033. }
  1034. } while (p->idx < p->chunks[p->chunk_ib_idx].length_dw);
  1035. return 0;
  1036. }