r600.c 49 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270370470570670770870971071171271371471571671771871972072172272372472572672772872973073173273373473573673773873974074174274374474574674774874975075175275375475575675775875976076176276376476576676776876977077177277377477577677777877978078178278378478578678778878979079179279379479579679779879980080180280380480580680780880981081181281381481581681781881982082182282382482582682782882983083183283383483583683783883984084184284384484584684784884985085185285385485585685785885986086186286386486586686786886987087187287387487587687787887988088188288388488588688788888989089189289389489589689789889990090190290390490590690790890991091191291391491591691791891992092192292392492592692792892993093193293393493593693793893994094194294394494594694794894995095195295395495595695795895996096196296396496596696796896997097197297397497597697797897998098198298398498598698798898999099199299399499599699799899910001001100210031004100510061007100810091010101110121013101410151016101710181019102010211022102310241025102610271028102910301031103210331034103510361037103810391040104110421043104410451046104710481049105010511052105310541055105610571058105910601061106210631064106510661067106810691070107110721073107410751076107710781079108010811082108310841085108610871088108910901091109210931094109510961097109810991100110111021103110411051106110711081109111011111112111311141115111611171118111911201121112211231124112511261127112811291130113111321133113411351136113711381139114011411142114311441145114611471148114911501151115211531154115511561157115811591160116111621163116411651166116711681169117011711172117311741175117611771178117911801181118211831184118511861187118811891190119111921193119411951196119711981199120012011202120312041205120612071208120912101211121212131214121512161217121812191220122112221223122412251226122712281229123012311232123312341235123612371238123912401241124212431244124512461247124812491250125112521253125412551256125712581259126012611262126312641265126612671268126912701271127212731274127512761277127812791280128112821283128412851286128712881289129012911292129312941295129612971298129913001301130213031304130513061307130813091310131113121313131413151316131713181319132013211322132313241325132613271328132913301331133213331334133513361337133813391340134113421343134413451346134713481349135013511352135313541355135613571358135913601361136213631364136513661367136813691370137113721373137413751376137713781379138013811382138313841385138613871388138913901391139213931394139513961397139813991400140114021403140414051406140714081409141014111412141314141415141614171418141914201421142214231424142514261427142814291430143114321433143414351436143714381439144014411442144314441445144614471448144914501451145214531454145514561457145814591460146114621463146414651466146714681469147014711472147314741475147614771478147914801481148214831484148514861487148814891490149114921493149414951496149714981499150015011502150315041505150615071508150915101511151215131514151515161517151815191520152115221523152415251526152715281529153015311532153315341535153615371538153915401541154215431544154515461547154815491550155115521553155415551556155715581559156015611562156315641565156615671568156915701571157215731574157515761577157815791580158115821583158415851586158715881589159015911592159315941595159615971598159916001601160216031604160516061607160816091610161116121613161416151616161716181619162016211622162316241625162616271628162916301631163216331634163516361637163816391640164116421643164416451646164716481649165016511652165316541655165616571658165916601661166216631664166516661667166816691670167116721673167416751676167716781679168016811682168316841685168616871688168916901691169216931694169516961697169816991700170117021703170417051706170717081709171017111712171317141715171617171718171917201721172217231724172517261727172817291730173117321733173417351736173717381739174017411742174317441745174617471748174917501751175217531754175517561757175817591760176117621763176417651766176717681769177017711772
  1. /*
  2. * Copyright 2008 Advanced Micro Devices, Inc.
  3. * Copyright 2008 Red Hat Inc.
  4. * Copyright 2009 Jerome Glisse.
  5. *
  6. * Permission is hereby granted, free of charge, to any person obtaining a
  7. * copy of this software and associated documentation files (the "Software"),
  8. * to deal in the Software without restriction, including without limitation
  9. * the rights to use, copy, modify, merge, publish, distribute, sublicense,
  10. * and/or sell copies of the Software, and to permit persons to whom the
  11. * Software is furnished to do so, subject to the following conditions:
  12. *
  13. * The above copyright notice and this permission notice shall be included in
  14. * all copies or substantial portions of the Software.
  15. *
  16. * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
  17. * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
  18. * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
  19. * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
  20. * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
  21. * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
  22. * OTHER DEALINGS IN THE SOFTWARE.
  23. *
  24. * Authors: Dave Airlie
  25. * Alex Deucher
  26. * Jerome Glisse
  27. */
  28. #include <linux/seq_file.h>
  29. #include <linux/firmware.h>
  30. #include <linux/platform_device.h>
  31. #include "drmP.h"
  32. #include "radeon_drm.h"
  33. #include "radeon.h"
  34. #include "radeon_mode.h"
  35. #include "r600d.h"
  36. #include "avivod.h"
  37. #include "atom.h"
  38. #define PFP_UCODE_SIZE 576
  39. #define PM4_UCODE_SIZE 1792
  40. #define R700_PFP_UCODE_SIZE 848
  41. #define R700_PM4_UCODE_SIZE 1360
  42. /* Firmware Names */
  43. MODULE_FIRMWARE("radeon/R600_pfp.bin");
  44. MODULE_FIRMWARE("radeon/R600_me.bin");
  45. MODULE_FIRMWARE("radeon/RV610_pfp.bin");
  46. MODULE_FIRMWARE("radeon/RV610_me.bin");
  47. MODULE_FIRMWARE("radeon/RV630_pfp.bin");
  48. MODULE_FIRMWARE("radeon/RV630_me.bin");
  49. MODULE_FIRMWARE("radeon/RV620_pfp.bin");
  50. MODULE_FIRMWARE("radeon/RV620_me.bin");
  51. MODULE_FIRMWARE("radeon/RV635_pfp.bin");
  52. MODULE_FIRMWARE("radeon/RV635_me.bin");
  53. MODULE_FIRMWARE("radeon/RV670_pfp.bin");
  54. MODULE_FIRMWARE("radeon/RV670_me.bin");
  55. MODULE_FIRMWARE("radeon/RS780_pfp.bin");
  56. MODULE_FIRMWARE("radeon/RS780_me.bin");
  57. MODULE_FIRMWARE("radeon/RV770_pfp.bin");
  58. MODULE_FIRMWARE("radeon/RV770_me.bin");
  59. MODULE_FIRMWARE("radeon/RV730_pfp.bin");
  60. MODULE_FIRMWARE("radeon/RV730_me.bin");
  61. MODULE_FIRMWARE("radeon/RV710_pfp.bin");
  62. MODULE_FIRMWARE("radeon/RV710_me.bin");
  63. int r600_debugfs_mc_info_init(struct radeon_device *rdev);
  64. /* This files gather functions specifics to:
  65. * r600,rv610,rv630,rv620,rv635,rv670
  66. *
  67. * Some of these functions might be used by newer ASICs.
  68. */
  69. int r600_mc_wait_for_idle(struct radeon_device *rdev);
  70. void r600_gpu_init(struct radeon_device *rdev);
  71. void r600_fini(struct radeon_device *rdev);
  72. /*
  73. * R600 PCIE GART
  74. */
  75. int r600_gart_clear_page(struct radeon_device *rdev, int i)
  76. {
  77. void __iomem *ptr = (void *)rdev->gart.table.vram.ptr;
  78. u64 pte;
  79. if (i < 0 || i > rdev->gart.num_gpu_pages)
  80. return -EINVAL;
  81. pte = 0;
  82. writeq(pte, ((void __iomem *)ptr) + (i * 8));
  83. return 0;
  84. }
  85. void r600_pcie_gart_tlb_flush(struct radeon_device *rdev)
  86. {
  87. unsigned i;
  88. u32 tmp;
  89. WREG32(VM_CONTEXT0_INVALIDATION_LOW_ADDR, rdev->mc.gtt_start >> 12);
  90. WREG32(VM_CONTEXT0_INVALIDATION_HIGH_ADDR, (rdev->mc.gtt_end - 1) >> 12);
  91. WREG32(VM_CONTEXT0_REQUEST_RESPONSE, REQUEST_TYPE(1));
  92. for (i = 0; i < rdev->usec_timeout; i++) {
  93. /* read MC_STATUS */
  94. tmp = RREG32(VM_CONTEXT0_REQUEST_RESPONSE);
  95. tmp = (tmp & RESPONSE_TYPE_MASK) >> RESPONSE_TYPE_SHIFT;
  96. if (tmp == 2) {
  97. printk(KERN_WARNING "[drm] r600 flush TLB failed\n");
  98. return;
  99. }
  100. if (tmp) {
  101. return;
  102. }
  103. udelay(1);
  104. }
  105. }
  106. int r600_pcie_gart_init(struct radeon_device *rdev)
  107. {
  108. int r;
  109. if (rdev->gart.table.vram.robj) {
  110. WARN(1, "R600 PCIE GART already initialized.\n");
  111. return 0;
  112. }
  113. /* Initialize common gart structure */
  114. r = radeon_gart_init(rdev);
  115. if (r)
  116. return r;
  117. rdev->gart.table_size = rdev->gart.num_gpu_pages * 8;
  118. return radeon_gart_table_vram_alloc(rdev);
  119. }
  120. int r600_pcie_gart_enable(struct radeon_device *rdev)
  121. {
  122. u32 tmp;
  123. int r, i;
  124. if (rdev->gart.table.vram.robj == NULL) {
  125. dev_err(rdev->dev, "No VRAM object for PCIE GART.\n");
  126. return -EINVAL;
  127. }
  128. r = radeon_gart_table_vram_pin(rdev);
  129. if (r)
  130. return r;
  131. for (i = 0; i < rdev->gart.num_gpu_pages; i++)
  132. r600_gart_clear_page(rdev, i);
  133. /* Setup L2 cache */
  134. WREG32(VM_L2_CNTL, ENABLE_L2_CACHE | ENABLE_L2_FRAGMENT_PROCESSING |
  135. ENABLE_L2_PTE_CACHE_LRU_UPDATE_BY_WRITE |
  136. EFFECTIVE_L2_QUEUE_SIZE(7));
  137. WREG32(VM_L2_CNTL2, 0);
  138. WREG32(VM_L2_CNTL3, BANK_SELECT_0(0) | BANK_SELECT_1(1));
  139. /* Setup TLB control */
  140. tmp = ENABLE_L1_TLB | ENABLE_L1_FRAGMENT_PROCESSING |
  141. SYSTEM_ACCESS_MODE_NOT_IN_SYS |
  142. EFFECTIVE_L1_TLB_SIZE(5) | EFFECTIVE_L1_QUEUE_SIZE(5) |
  143. ENABLE_WAIT_L2_QUERY;
  144. WREG32(MC_VM_L1_TLB_MCB_RD_SYS_CNTL, tmp);
  145. WREG32(MC_VM_L1_TLB_MCB_WR_SYS_CNTL, tmp);
  146. WREG32(MC_VM_L1_TLB_MCB_RD_HDP_CNTL, tmp | ENABLE_L1_STRICT_ORDERING);
  147. WREG32(MC_VM_L1_TLB_MCB_WR_HDP_CNTL, tmp);
  148. WREG32(MC_VM_L1_TLB_MCD_RD_A_CNTL, tmp);
  149. WREG32(MC_VM_L1_TLB_MCD_WR_A_CNTL, tmp);
  150. WREG32(MC_VM_L1_TLB_MCD_RD_B_CNTL, tmp);
  151. WREG32(MC_VM_L1_TLB_MCD_WR_B_CNTL, tmp);
  152. WREG32(MC_VM_L1_TLB_MCB_RD_GFX_CNTL, tmp);
  153. WREG32(MC_VM_L1_TLB_MCB_WR_GFX_CNTL, tmp);
  154. WREG32(MC_VM_L1_TLB_MCB_RD_PDMA_CNTL, tmp);
  155. WREG32(MC_VM_L1_TLB_MCB_WR_PDMA_CNTL, tmp);
  156. WREG32(MC_VM_L1_TLB_MCB_RD_SEM_CNTL, tmp | ENABLE_SEMAPHORE_MODE);
  157. WREG32(MC_VM_L1_TLB_MCB_WR_SEM_CNTL, tmp | ENABLE_SEMAPHORE_MODE);
  158. WREG32(VM_CONTEXT0_PAGE_TABLE_START_ADDR, rdev->mc.gtt_start >> 12);
  159. WREG32(VM_CONTEXT0_PAGE_TABLE_END_ADDR, (rdev->mc.gtt_end - 1) >> 12);
  160. WREG32(VM_CONTEXT0_PAGE_TABLE_BASE_ADDR, rdev->gart.table_addr >> 12);
  161. WREG32(VM_CONTEXT0_CNTL, ENABLE_CONTEXT | PAGE_TABLE_DEPTH(0) |
  162. RANGE_PROTECTION_FAULT_ENABLE_DEFAULT);
  163. WREG32(VM_CONTEXT0_PROTECTION_FAULT_DEFAULT_ADDR,
  164. (u32)(rdev->dummy_page.addr >> 12));
  165. for (i = 1; i < 7; i++)
  166. WREG32(VM_CONTEXT0_CNTL + (i * 4), 0);
  167. r600_pcie_gart_tlb_flush(rdev);
  168. rdev->gart.ready = true;
  169. return 0;
  170. }
  171. void r600_pcie_gart_disable(struct radeon_device *rdev)
  172. {
  173. u32 tmp;
  174. int i;
  175. /* Disable all tables */
  176. for (i = 0; i < 7; i++)
  177. WREG32(VM_CONTEXT0_CNTL + (i * 4), 0);
  178. /* Disable L2 cache */
  179. WREG32(VM_L2_CNTL, ENABLE_L2_FRAGMENT_PROCESSING |
  180. EFFECTIVE_L2_QUEUE_SIZE(7));
  181. WREG32(VM_L2_CNTL3, BANK_SELECT_0(0) | BANK_SELECT_1(1));
  182. /* Setup L1 TLB control */
  183. tmp = EFFECTIVE_L1_TLB_SIZE(5) | EFFECTIVE_L1_QUEUE_SIZE(5) |
  184. ENABLE_WAIT_L2_QUERY;
  185. WREG32(MC_VM_L1_TLB_MCD_RD_A_CNTL, tmp);
  186. WREG32(MC_VM_L1_TLB_MCD_WR_A_CNTL, tmp);
  187. WREG32(MC_VM_L1_TLB_MCD_RD_B_CNTL, tmp);
  188. WREG32(MC_VM_L1_TLB_MCD_WR_B_CNTL, tmp);
  189. WREG32(MC_VM_L1_TLB_MCB_RD_GFX_CNTL, tmp);
  190. WREG32(MC_VM_L1_TLB_MCB_WR_GFX_CNTL, tmp);
  191. WREG32(MC_VM_L1_TLB_MCB_RD_PDMA_CNTL, tmp);
  192. WREG32(MC_VM_L1_TLB_MCB_WR_PDMA_CNTL, tmp);
  193. WREG32(MC_VM_L1_TLB_MCB_RD_SEM_CNTL, tmp);
  194. WREG32(MC_VM_L1_TLB_MCB_WR_SEM_CNTL, tmp);
  195. WREG32(MC_VM_L1_TLB_MCB_RD_SYS_CNTL, tmp);
  196. WREG32(MC_VM_L1_TLB_MCB_WR_SYS_CNTL, tmp);
  197. WREG32(MC_VM_L1_TLB_MCB_RD_HDP_CNTL, tmp);
  198. WREG32(MC_VM_L1_TLB_MCB_WR_HDP_CNTL, tmp);
  199. if (rdev->gart.table.vram.robj) {
  200. radeon_object_kunmap(rdev->gart.table.vram.robj);
  201. radeon_object_unpin(rdev->gart.table.vram.robj);
  202. }
  203. }
  204. void r600_pcie_gart_fini(struct radeon_device *rdev)
  205. {
  206. r600_pcie_gart_disable(rdev);
  207. radeon_gart_table_vram_free(rdev);
  208. radeon_gart_fini(rdev);
  209. }
  210. int r600_mc_wait_for_idle(struct radeon_device *rdev)
  211. {
  212. unsigned i;
  213. u32 tmp;
  214. for (i = 0; i < rdev->usec_timeout; i++) {
  215. /* read MC_STATUS */
  216. tmp = RREG32(R_000E50_SRBM_STATUS) & 0x3F00;
  217. if (!tmp)
  218. return 0;
  219. udelay(1);
  220. }
  221. return -1;
  222. }
  223. static void r600_mc_resume(struct radeon_device *rdev)
  224. {
  225. u32 d1vga_control, d2vga_control;
  226. u32 vga_render_control, vga_hdp_control;
  227. u32 d1crtc_control, d2crtc_control;
  228. u32 new_d1grph_primary, new_d1grph_secondary;
  229. u32 new_d2grph_primary, new_d2grph_secondary;
  230. u64 old_vram_start;
  231. u32 tmp;
  232. int i, j;
  233. /* Initialize HDP */
  234. for (i = 0, j = 0; i < 32; i++, j += 0x18) {
  235. WREG32((0x2c14 + j), 0x00000000);
  236. WREG32((0x2c18 + j), 0x00000000);
  237. WREG32((0x2c1c + j), 0x00000000);
  238. WREG32((0x2c20 + j), 0x00000000);
  239. WREG32((0x2c24 + j), 0x00000000);
  240. }
  241. WREG32(HDP_REG_COHERENCY_FLUSH_CNTL, 0);
  242. d1vga_control = RREG32(D1VGA_CONTROL);
  243. d2vga_control = RREG32(D2VGA_CONTROL);
  244. vga_render_control = RREG32(VGA_RENDER_CONTROL);
  245. vga_hdp_control = RREG32(VGA_HDP_CONTROL);
  246. d1crtc_control = RREG32(D1CRTC_CONTROL);
  247. d2crtc_control = RREG32(D2CRTC_CONTROL);
  248. old_vram_start = (u64)(RREG32(MC_VM_FB_LOCATION) & 0xFFFF) << 24;
  249. new_d1grph_primary = RREG32(D1GRPH_PRIMARY_SURFACE_ADDRESS);
  250. new_d1grph_secondary = RREG32(D1GRPH_SECONDARY_SURFACE_ADDRESS);
  251. new_d1grph_primary += rdev->mc.vram_start - old_vram_start;
  252. new_d1grph_secondary += rdev->mc.vram_start - old_vram_start;
  253. new_d2grph_primary = RREG32(D2GRPH_PRIMARY_SURFACE_ADDRESS);
  254. new_d2grph_secondary = RREG32(D2GRPH_SECONDARY_SURFACE_ADDRESS);
  255. new_d2grph_primary += rdev->mc.vram_start - old_vram_start;
  256. new_d2grph_secondary += rdev->mc.vram_start - old_vram_start;
  257. /* Stop all video */
  258. WREG32(D1VGA_CONTROL, 0);
  259. WREG32(D2VGA_CONTROL, 0);
  260. WREG32(VGA_RENDER_CONTROL, 0);
  261. WREG32(D1CRTC_UPDATE_LOCK, 1);
  262. WREG32(D2CRTC_UPDATE_LOCK, 1);
  263. WREG32(D1CRTC_CONTROL, 0);
  264. WREG32(D2CRTC_CONTROL, 0);
  265. WREG32(D1CRTC_UPDATE_LOCK, 0);
  266. WREG32(D2CRTC_UPDATE_LOCK, 0);
  267. mdelay(1);
  268. if (r600_mc_wait_for_idle(rdev)) {
  269. printk(KERN_WARNING "[drm] MC not idle !\n");
  270. }
  271. /* Lockout access through VGA aperture*/
  272. WREG32(VGA_HDP_CONTROL, VGA_MEMORY_DISABLE);
  273. /* Update configuration */
  274. WREG32(MC_VM_SYSTEM_APERTURE_LOW_ADDR, rdev->mc.vram_start >> 12);
  275. WREG32(MC_VM_SYSTEM_APERTURE_HIGH_ADDR, (rdev->mc.vram_end - 1) >> 12);
  276. WREG32(MC_VM_SYSTEM_APERTURE_DEFAULT_ADDR, 0);
  277. tmp = (((rdev->mc.vram_end - 1) >> 24) & 0xFFFF) << 16;
  278. tmp |= ((rdev->mc.vram_start >> 24) & 0xFFFF);
  279. WREG32(MC_VM_FB_LOCATION, tmp);
  280. WREG32(HDP_NONSURFACE_BASE, (rdev->mc.vram_start >> 8));
  281. WREG32(HDP_NONSURFACE_INFO, (2 << 7));
  282. WREG32(HDP_NONSURFACE_SIZE, (rdev->mc.mc_vram_size - 1) | 0x3FF);
  283. if (rdev->flags & RADEON_IS_AGP) {
  284. WREG32(MC_VM_AGP_TOP, (rdev->mc.gtt_end - 1) >> 16);
  285. WREG32(MC_VM_AGP_BOT, rdev->mc.gtt_start >> 16);
  286. WREG32(MC_VM_AGP_BASE, rdev->mc.agp_base >> 22);
  287. } else {
  288. WREG32(MC_VM_AGP_BASE, 0);
  289. WREG32(MC_VM_AGP_TOP, 0x0FFFFFFF);
  290. WREG32(MC_VM_AGP_BOT, 0x0FFFFFFF);
  291. }
  292. WREG32(D1GRPH_PRIMARY_SURFACE_ADDRESS, new_d1grph_primary);
  293. WREG32(D1GRPH_SECONDARY_SURFACE_ADDRESS, new_d1grph_secondary);
  294. WREG32(D2GRPH_PRIMARY_SURFACE_ADDRESS, new_d2grph_primary);
  295. WREG32(D2GRPH_SECONDARY_SURFACE_ADDRESS, new_d2grph_secondary);
  296. WREG32(VGA_MEMORY_BASE_ADDRESS, rdev->mc.vram_start);
  297. /* Unlock host access */
  298. WREG32(VGA_HDP_CONTROL, vga_hdp_control);
  299. mdelay(1);
  300. if (r600_mc_wait_for_idle(rdev)) {
  301. printk(KERN_WARNING "[drm] MC not idle !\n");
  302. }
  303. /* Restore video state */
  304. WREG32(D1CRTC_UPDATE_LOCK, 1);
  305. WREG32(D2CRTC_UPDATE_LOCK, 1);
  306. WREG32(D1CRTC_CONTROL, d1crtc_control);
  307. WREG32(D2CRTC_CONTROL, d2crtc_control);
  308. WREG32(D1CRTC_UPDATE_LOCK, 0);
  309. WREG32(D2CRTC_UPDATE_LOCK, 0);
  310. WREG32(D1VGA_CONTROL, d1vga_control);
  311. WREG32(D2VGA_CONTROL, d2vga_control);
  312. WREG32(VGA_RENDER_CONTROL, vga_render_control);
  313. /* we need to own VRAM, so turn off the VGA renderer here
  314. * to stop it overwriting our objects */
  315. radeon_avivo_vga_render_disable(rdev);
  316. }
  317. int r600_mc_init(struct radeon_device *rdev)
  318. {
  319. fixed20_12 a;
  320. u32 tmp;
  321. int chansize;
  322. int r;
  323. /* Get VRAM informations */
  324. rdev->mc.vram_width = 128;
  325. rdev->mc.vram_is_ddr = true;
  326. tmp = RREG32(RAMCFG);
  327. if (tmp & CHANSIZE_OVERRIDE) {
  328. chansize = 16;
  329. } else if (tmp & CHANSIZE_MASK) {
  330. chansize = 64;
  331. } else {
  332. chansize = 32;
  333. }
  334. if (rdev->family == CHIP_R600) {
  335. rdev->mc.vram_width = 8 * chansize;
  336. } else if (rdev->family == CHIP_RV670) {
  337. rdev->mc.vram_width = 4 * chansize;
  338. } else if ((rdev->family == CHIP_RV610) ||
  339. (rdev->family == CHIP_RV620)) {
  340. rdev->mc.vram_width = chansize;
  341. } else if ((rdev->family == CHIP_RV630) ||
  342. (rdev->family == CHIP_RV635)) {
  343. rdev->mc.vram_width = 2 * chansize;
  344. }
  345. /* Could aper size report 0 ? */
  346. rdev->mc.aper_base = drm_get_resource_start(rdev->ddev, 0);
  347. rdev->mc.aper_size = drm_get_resource_len(rdev->ddev, 0);
  348. /* Setup GPU memory space */
  349. rdev->mc.mc_vram_size = RREG32(CONFIG_MEMSIZE);
  350. rdev->mc.real_vram_size = RREG32(CONFIG_MEMSIZE);
  351. if (rdev->flags & RADEON_IS_AGP) {
  352. r = radeon_agp_init(rdev);
  353. if (r)
  354. return r;
  355. /* gtt_size is setup by radeon_agp_init */
  356. rdev->mc.gtt_location = rdev->mc.agp_base;
  357. tmp = 0xFFFFFFFFUL - rdev->mc.agp_base - rdev->mc.gtt_size;
  358. /* Try to put vram before or after AGP because we
  359. * we want SYSTEM_APERTURE to cover both VRAM and
  360. * AGP so that GPU can catch out of VRAM/AGP access
  361. */
  362. if (rdev->mc.gtt_location > rdev->mc.mc_vram_size) {
  363. /* Enought place before */
  364. rdev->mc.vram_location = rdev->mc.gtt_location -
  365. rdev->mc.mc_vram_size;
  366. } else if (tmp > rdev->mc.mc_vram_size) {
  367. /* Enought place after */
  368. rdev->mc.vram_location = rdev->mc.gtt_location +
  369. rdev->mc.gtt_size;
  370. } else {
  371. /* Try to setup VRAM then AGP might not
  372. * not work on some card
  373. */
  374. rdev->mc.vram_location = 0x00000000UL;
  375. rdev->mc.gtt_location = rdev->mc.mc_vram_size;
  376. }
  377. } else {
  378. if (rdev->family == CHIP_RS780 || rdev->family == CHIP_RS880) {
  379. rdev->mc.vram_location = (RREG32(MC_VM_FB_LOCATION) &
  380. 0xFFFF) << 24;
  381. rdev->mc.gtt_size = radeon_gart_size * 1024 * 1024;
  382. tmp = rdev->mc.vram_location + rdev->mc.mc_vram_size;
  383. if ((0xFFFFFFFFUL - tmp) >= rdev->mc.gtt_size) {
  384. /* Enough place after vram */
  385. rdev->mc.gtt_location = tmp;
  386. } else if (rdev->mc.vram_location >= rdev->mc.gtt_size) {
  387. /* Enough place before vram */
  388. rdev->mc.gtt_location = 0;
  389. } else {
  390. /* Not enough place after or before shrink
  391. * gart size
  392. */
  393. if (rdev->mc.vram_location > (0xFFFFFFFFUL - tmp)) {
  394. rdev->mc.gtt_location = 0;
  395. rdev->mc.gtt_size = rdev->mc.vram_location;
  396. } else {
  397. rdev->mc.gtt_location = tmp;
  398. rdev->mc.gtt_size = 0xFFFFFFFFUL - tmp;
  399. }
  400. }
  401. rdev->mc.gtt_location = rdev->mc.mc_vram_size;
  402. } else {
  403. rdev->mc.vram_location = 0x00000000UL;
  404. rdev->mc.gtt_location = rdev->mc.mc_vram_size;
  405. rdev->mc.gtt_size = radeon_gart_size * 1024 * 1024;
  406. }
  407. }
  408. rdev->mc.vram_start = rdev->mc.vram_location;
  409. rdev->mc.vram_end = rdev->mc.vram_location + rdev->mc.mc_vram_size;
  410. rdev->mc.gtt_start = rdev->mc.gtt_location;
  411. rdev->mc.gtt_end = rdev->mc.gtt_location + rdev->mc.gtt_size;
  412. /* FIXME: we should enforce default clock in case GPU is not in
  413. * default setup
  414. */
  415. a.full = rfixed_const(100);
  416. rdev->pm.sclk.full = rfixed_const(rdev->clock.default_sclk);
  417. rdev->pm.sclk.full = rfixed_div(rdev->pm.sclk, a);
  418. return 0;
  419. }
  420. /* We doesn't check that the GPU really needs a reset we simply do the
  421. * reset, it's up to the caller to determine if the GPU needs one. We
  422. * might add an helper function to check that.
  423. */
  424. int r600_gpu_soft_reset(struct radeon_device *rdev)
  425. {
  426. u32 grbm_busy_mask = S_008010_VC_BUSY(1) | S_008010_VGT_BUSY_NO_DMA(1) |
  427. S_008010_VGT_BUSY(1) | S_008010_TA03_BUSY(1) |
  428. S_008010_TC_BUSY(1) | S_008010_SX_BUSY(1) |
  429. S_008010_SH_BUSY(1) | S_008010_SPI03_BUSY(1) |
  430. S_008010_SMX_BUSY(1) | S_008010_SC_BUSY(1) |
  431. S_008010_PA_BUSY(1) | S_008010_DB03_BUSY(1) |
  432. S_008010_CR_BUSY(1) | S_008010_CB03_BUSY(1) |
  433. S_008010_GUI_ACTIVE(1);
  434. u32 grbm2_busy_mask = S_008014_SPI0_BUSY(1) | S_008014_SPI1_BUSY(1) |
  435. S_008014_SPI2_BUSY(1) | S_008014_SPI3_BUSY(1) |
  436. S_008014_TA0_BUSY(1) | S_008014_TA1_BUSY(1) |
  437. S_008014_TA2_BUSY(1) | S_008014_TA3_BUSY(1) |
  438. S_008014_DB0_BUSY(1) | S_008014_DB1_BUSY(1) |
  439. S_008014_DB2_BUSY(1) | S_008014_DB3_BUSY(1) |
  440. S_008014_CB0_BUSY(1) | S_008014_CB1_BUSY(1) |
  441. S_008014_CB2_BUSY(1) | S_008014_CB3_BUSY(1);
  442. u32 srbm_reset = 0;
  443. /* Disable CP parsing/prefetching */
  444. WREG32(R_0086D8_CP_ME_CNTL, S_0086D8_CP_ME_HALT(0xff));
  445. /* Check if any of the rendering block is busy and reset it */
  446. if ((RREG32(R_008010_GRBM_STATUS) & grbm_busy_mask) ||
  447. (RREG32(R_008014_GRBM_STATUS2) & grbm2_busy_mask)) {
  448. WREG32(R_008020_GRBM_SOFT_RESET, S_008020_SOFT_RESET_CR(1) |
  449. S_008020_SOFT_RESET_DB(1) |
  450. S_008020_SOFT_RESET_CB(1) |
  451. S_008020_SOFT_RESET_PA(1) |
  452. S_008020_SOFT_RESET_SC(1) |
  453. S_008020_SOFT_RESET_SMX(1) |
  454. S_008020_SOFT_RESET_SPI(1) |
  455. S_008020_SOFT_RESET_SX(1) |
  456. S_008020_SOFT_RESET_SH(1) |
  457. S_008020_SOFT_RESET_TC(1) |
  458. S_008020_SOFT_RESET_TA(1) |
  459. S_008020_SOFT_RESET_VC(1) |
  460. S_008020_SOFT_RESET_VGT(1));
  461. (void)RREG32(R_008020_GRBM_SOFT_RESET);
  462. udelay(50);
  463. WREG32(R_008020_GRBM_SOFT_RESET, 0);
  464. (void)RREG32(R_008020_GRBM_SOFT_RESET);
  465. }
  466. /* Reset CP (we always reset CP) */
  467. WREG32(R_008020_GRBM_SOFT_RESET, S_008020_SOFT_RESET_CP(1));
  468. (void)RREG32(R_008020_GRBM_SOFT_RESET);
  469. udelay(50);
  470. WREG32(R_008020_GRBM_SOFT_RESET, 0);
  471. (void)RREG32(R_008020_GRBM_SOFT_RESET);
  472. /* Reset others GPU block if necessary */
  473. if (G_000E50_RLC_BUSY(RREG32(R_000E50_SRBM_STATUS)))
  474. srbm_reset |= S_000E60_SOFT_RESET_RLC(1);
  475. if (G_000E50_GRBM_RQ_PENDING(RREG32(R_000E50_SRBM_STATUS)))
  476. srbm_reset |= S_000E60_SOFT_RESET_GRBM(1);
  477. if (G_000E50_HI_RQ_PENDING(RREG32(R_000E50_SRBM_STATUS)))
  478. srbm_reset |= S_000E60_SOFT_RESET_IH(1);
  479. if (G_000E50_VMC_BUSY(RREG32(R_000E50_SRBM_STATUS)))
  480. srbm_reset |= S_000E60_SOFT_RESET_VMC(1);
  481. if (G_000E50_MCB_BUSY(RREG32(R_000E50_SRBM_STATUS)))
  482. srbm_reset |= S_000E60_SOFT_RESET_MC(1);
  483. if (G_000E50_MCDZ_BUSY(RREG32(R_000E50_SRBM_STATUS)))
  484. srbm_reset |= S_000E60_SOFT_RESET_MC(1);
  485. if (G_000E50_MCDY_BUSY(RREG32(R_000E50_SRBM_STATUS)))
  486. srbm_reset |= S_000E60_SOFT_RESET_MC(1);
  487. if (G_000E50_MCDX_BUSY(RREG32(R_000E50_SRBM_STATUS)))
  488. srbm_reset |= S_000E60_SOFT_RESET_MC(1);
  489. if (G_000E50_MCDW_BUSY(RREG32(R_000E50_SRBM_STATUS)))
  490. srbm_reset |= S_000E60_SOFT_RESET_MC(1);
  491. if (G_000E50_RLC_BUSY(RREG32(R_000E50_SRBM_STATUS)))
  492. srbm_reset |= S_000E60_SOFT_RESET_RLC(1);
  493. if (G_000E50_SEM_BUSY(RREG32(R_000E50_SRBM_STATUS)))
  494. srbm_reset |= S_000E60_SOFT_RESET_SEM(1);
  495. WREG32(R_000E60_SRBM_SOFT_RESET, srbm_reset);
  496. (void)RREG32(R_000E60_SRBM_SOFT_RESET);
  497. udelay(50);
  498. WREG32(R_000E60_SRBM_SOFT_RESET, 0);
  499. (void)RREG32(R_000E60_SRBM_SOFT_RESET);
  500. /* Wait a little for things to settle down */
  501. udelay(50);
  502. return 0;
  503. }
  504. int r600_gpu_reset(struct radeon_device *rdev)
  505. {
  506. return r600_gpu_soft_reset(rdev);
  507. }
  508. static u32 r600_get_tile_pipe_to_backend_map(u32 num_tile_pipes,
  509. u32 num_backends,
  510. u32 backend_disable_mask)
  511. {
  512. u32 backend_map = 0;
  513. u32 enabled_backends_mask;
  514. u32 enabled_backends_count;
  515. u32 cur_pipe;
  516. u32 swizzle_pipe[R6XX_MAX_PIPES];
  517. u32 cur_backend;
  518. u32 i;
  519. if (num_tile_pipes > R6XX_MAX_PIPES)
  520. num_tile_pipes = R6XX_MAX_PIPES;
  521. if (num_tile_pipes < 1)
  522. num_tile_pipes = 1;
  523. if (num_backends > R6XX_MAX_BACKENDS)
  524. num_backends = R6XX_MAX_BACKENDS;
  525. if (num_backends < 1)
  526. num_backends = 1;
  527. enabled_backends_mask = 0;
  528. enabled_backends_count = 0;
  529. for (i = 0; i < R6XX_MAX_BACKENDS; ++i) {
  530. if (((backend_disable_mask >> i) & 1) == 0) {
  531. enabled_backends_mask |= (1 << i);
  532. ++enabled_backends_count;
  533. }
  534. if (enabled_backends_count == num_backends)
  535. break;
  536. }
  537. if (enabled_backends_count == 0) {
  538. enabled_backends_mask = 1;
  539. enabled_backends_count = 1;
  540. }
  541. if (enabled_backends_count != num_backends)
  542. num_backends = enabled_backends_count;
  543. memset((uint8_t *)&swizzle_pipe[0], 0, sizeof(u32) * R6XX_MAX_PIPES);
  544. switch (num_tile_pipes) {
  545. case 1:
  546. swizzle_pipe[0] = 0;
  547. break;
  548. case 2:
  549. swizzle_pipe[0] = 0;
  550. swizzle_pipe[1] = 1;
  551. break;
  552. case 3:
  553. swizzle_pipe[0] = 0;
  554. swizzle_pipe[1] = 1;
  555. swizzle_pipe[2] = 2;
  556. break;
  557. case 4:
  558. swizzle_pipe[0] = 0;
  559. swizzle_pipe[1] = 1;
  560. swizzle_pipe[2] = 2;
  561. swizzle_pipe[3] = 3;
  562. break;
  563. case 5:
  564. swizzle_pipe[0] = 0;
  565. swizzle_pipe[1] = 1;
  566. swizzle_pipe[2] = 2;
  567. swizzle_pipe[3] = 3;
  568. swizzle_pipe[4] = 4;
  569. break;
  570. case 6:
  571. swizzle_pipe[0] = 0;
  572. swizzle_pipe[1] = 2;
  573. swizzle_pipe[2] = 4;
  574. swizzle_pipe[3] = 5;
  575. swizzle_pipe[4] = 1;
  576. swizzle_pipe[5] = 3;
  577. break;
  578. case 7:
  579. swizzle_pipe[0] = 0;
  580. swizzle_pipe[1] = 2;
  581. swizzle_pipe[2] = 4;
  582. swizzle_pipe[3] = 6;
  583. swizzle_pipe[4] = 1;
  584. swizzle_pipe[5] = 3;
  585. swizzle_pipe[6] = 5;
  586. break;
  587. case 8:
  588. swizzle_pipe[0] = 0;
  589. swizzle_pipe[1] = 2;
  590. swizzle_pipe[2] = 4;
  591. swizzle_pipe[3] = 6;
  592. swizzle_pipe[4] = 1;
  593. swizzle_pipe[5] = 3;
  594. swizzle_pipe[6] = 5;
  595. swizzle_pipe[7] = 7;
  596. break;
  597. }
  598. cur_backend = 0;
  599. for (cur_pipe = 0; cur_pipe < num_tile_pipes; ++cur_pipe) {
  600. while (((1 << cur_backend) & enabled_backends_mask) == 0)
  601. cur_backend = (cur_backend + 1) % R6XX_MAX_BACKENDS;
  602. backend_map |= (u32)(((cur_backend & 3) << (swizzle_pipe[cur_pipe] * 2)));
  603. cur_backend = (cur_backend + 1) % R6XX_MAX_BACKENDS;
  604. }
  605. return backend_map;
  606. }
  607. int r600_count_pipe_bits(uint32_t val)
  608. {
  609. int i, ret = 0;
  610. for (i = 0; i < 32; i++) {
  611. ret += val & 1;
  612. val >>= 1;
  613. }
  614. return ret;
  615. }
  616. void r600_gpu_init(struct radeon_device *rdev)
  617. {
  618. u32 tiling_config;
  619. u32 ramcfg;
  620. u32 tmp;
  621. int i, j;
  622. u32 sq_config;
  623. u32 sq_gpr_resource_mgmt_1 = 0;
  624. u32 sq_gpr_resource_mgmt_2 = 0;
  625. u32 sq_thread_resource_mgmt = 0;
  626. u32 sq_stack_resource_mgmt_1 = 0;
  627. u32 sq_stack_resource_mgmt_2 = 0;
  628. /* FIXME: implement */
  629. switch (rdev->family) {
  630. case CHIP_R600:
  631. rdev->config.r600.max_pipes = 4;
  632. rdev->config.r600.max_tile_pipes = 8;
  633. rdev->config.r600.max_simds = 4;
  634. rdev->config.r600.max_backends = 4;
  635. rdev->config.r600.max_gprs = 256;
  636. rdev->config.r600.max_threads = 192;
  637. rdev->config.r600.max_stack_entries = 256;
  638. rdev->config.r600.max_hw_contexts = 8;
  639. rdev->config.r600.max_gs_threads = 16;
  640. rdev->config.r600.sx_max_export_size = 128;
  641. rdev->config.r600.sx_max_export_pos_size = 16;
  642. rdev->config.r600.sx_max_export_smx_size = 128;
  643. rdev->config.r600.sq_num_cf_insts = 2;
  644. break;
  645. case CHIP_RV630:
  646. case CHIP_RV635:
  647. rdev->config.r600.max_pipes = 2;
  648. rdev->config.r600.max_tile_pipes = 2;
  649. rdev->config.r600.max_simds = 3;
  650. rdev->config.r600.max_backends = 1;
  651. rdev->config.r600.max_gprs = 128;
  652. rdev->config.r600.max_threads = 192;
  653. rdev->config.r600.max_stack_entries = 128;
  654. rdev->config.r600.max_hw_contexts = 8;
  655. rdev->config.r600.max_gs_threads = 4;
  656. rdev->config.r600.sx_max_export_size = 128;
  657. rdev->config.r600.sx_max_export_pos_size = 16;
  658. rdev->config.r600.sx_max_export_smx_size = 128;
  659. rdev->config.r600.sq_num_cf_insts = 2;
  660. break;
  661. case CHIP_RV610:
  662. case CHIP_RV620:
  663. case CHIP_RS780:
  664. case CHIP_RS880:
  665. rdev->config.r600.max_pipes = 1;
  666. rdev->config.r600.max_tile_pipes = 1;
  667. rdev->config.r600.max_simds = 2;
  668. rdev->config.r600.max_backends = 1;
  669. rdev->config.r600.max_gprs = 128;
  670. rdev->config.r600.max_threads = 192;
  671. rdev->config.r600.max_stack_entries = 128;
  672. rdev->config.r600.max_hw_contexts = 4;
  673. rdev->config.r600.max_gs_threads = 4;
  674. rdev->config.r600.sx_max_export_size = 128;
  675. rdev->config.r600.sx_max_export_pos_size = 16;
  676. rdev->config.r600.sx_max_export_smx_size = 128;
  677. rdev->config.r600.sq_num_cf_insts = 1;
  678. break;
  679. case CHIP_RV670:
  680. rdev->config.r600.max_pipes = 4;
  681. rdev->config.r600.max_tile_pipes = 4;
  682. rdev->config.r600.max_simds = 4;
  683. rdev->config.r600.max_backends = 4;
  684. rdev->config.r600.max_gprs = 192;
  685. rdev->config.r600.max_threads = 192;
  686. rdev->config.r600.max_stack_entries = 256;
  687. rdev->config.r600.max_hw_contexts = 8;
  688. rdev->config.r600.max_gs_threads = 16;
  689. rdev->config.r600.sx_max_export_size = 128;
  690. rdev->config.r600.sx_max_export_pos_size = 16;
  691. rdev->config.r600.sx_max_export_smx_size = 128;
  692. rdev->config.r600.sq_num_cf_insts = 2;
  693. break;
  694. default:
  695. break;
  696. }
  697. /* Initialize HDP */
  698. for (i = 0, j = 0; i < 32; i++, j += 0x18) {
  699. WREG32((0x2c14 + j), 0x00000000);
  700. WREG32((0x2c18 + j), 0x00000000);
  701. WREG32((0x2c1c + j), 0x00000000);
  702. WREG32((0x2c20 + j), 0x00000000);
  703. WREG32((0x2c24 + j), 0x00000000);
  704. }
  705. WREG32(GRBM_CNTL, GRBM_READ_TIMEOUT(0xff));
  706. /* Setup tiling */
  707. tiling_config = 0;
  708. ramcfg = RREG32(RAMCFG);
  709. switch (rdev->config.r600.max_tile_pipes) {
  710. case 1:
  711. tiling_config |= PIPE_TILING(0);
  712. break;
  713. case 2:
  714. tiling_config |= PIPE_TILING(1);
  715. break;
  716. case 4:
  717. tiling_config |= PIPE_TILING(2);
  718. break;
  719. case 8:
  720. tiling_config |= PIPE_TILING(3);
  721. break;
  722. default:
  723. break;
  724. }
  725. tiling_config |= BANK_TILING((ramcfg & NOOFBANK_MASK) >> NOOFBANK_SHIFT);
  726. tiling_config |= GROUP_SIZE(0);
  727. tmp = (ramcfg & NOOFROWS_MASK) >> NOOFROWS_SHIFT;
  728. if (tmp > 3) {
  729. tiling_config |= ROW_TILING(3);
  730. tiling_config |= SAMPLE_SPLIT(3);
  731. } else {
  732. tiling_config |= ROW_TILING(tmp);
  733. tiling_config |= SAMPLE_SPLIT(tmp);
  734. }
  735. tiling_config |= BANK_SWAPS(1);
  736. tmp = r600_get_tile_pipe_to_backend_map(rdev->config.r600.max_tile_pipes,
  737. rdev->config.r600.max_backends,
  738. (0xff << rdev->config.r600.max_backends) & 0xff);
  739. tiling_config |= BACKEND_MAP(tmp);
  740. WREG32(GB_TILING_CONFIG, tiling_config);
  741. WREG32(DCP_TILING_CONFIG, tiling_config & 0xffff);
  742. WREG32(HDP_TILING_CONFIG, tiling_config & 0xffff);
  743. tmp = BACKEND_DISABLE((R6XX_MAX_BACKENDS_MASK << rdev->config.r600.max_backends) & R6XX_MAX_BACKENDS_MASK);
  744. WREG32(CC_RB_BACKEND_DISABLE, tmp);
  745. /* Setup pipes */
  746. tmp = INACTIVE_QD_PIPES((R6XX_MAX_PIPES_MASK << rdev->config.r600.max_pipes) & R6XX_MAX_PIPES_MASK);
  747. tmp |= INACTIVE_SIMDS((R6XX_MAX_SIMDS_MASK << rdev->config.r600.max_simds) & R6XX_MAX_SIMDS_MASK);
  748. WREG32(CC_GC_SHADER_PIPE_CONFIG, tmp);
  749. WREG32(GC_USER_SHADER_PIPE_CONFIG, tmp);
  750. tmp = R6XX_MAX_BACKENDS - r600_count_pipe_bits(tmp & INACTIVE_QD_PIPES_MASK);
  751. WREG32(VGT_OUT_DEALLOC_CNTL, (tmp * 4) & DEALLOC_DIST_MASK);
  752. WREG32(VGT_VERTEX_REUSE_BLOCK_CNTL, ((tmp * 4) - 2) & VTX_REUSE_DEPTH_MASK);
  753. /* Setup some CP states */
  754. WREG32(CP_QUEUE_THRESHOLDS, (ROQ_IB1_START(0x16) | ROQ_IB2_START(0x2b)));
  755. WREG32(CP_MEQ_THRESHOLDS, (MEQ_END(0x40) | ROQ_END(0x40)));
  756. WREG32(TA_CNTL_AUX, (DISABLE_CUBE_ANISO | SYNC_GRADIENT |
  757. SYNC_WALKER | SYNC_ALIGNER));
  758. /* Setup various GPU states */
  759. if (rdev->family == CHIP_RV670)
  760. WREG32(ARB_GDEC_RD_CNTL, 0x00000021);
  761. tmp = RREG32(SX_DEBUG_1);
  762. tmp |= SMX_EVENT_RELEASE;
  763. if ((rdev->family > CHIP_R600))
  764. tmp |= ENABLE_NEW_SMX_ADDRESS;
  765. WREG32(SX_DEBUG_1, tmp);
  766. if (((rdev->family) == CHIP_R600) ||
  767. ((rdev->family) == CHIP_RV630) ||
  768. ((rdev->family) == CHIP_RV610) ||
  769. ((rdev->family) == CHIP_RV620) ||
  770. ((rdev->family) == CHIP_RS780)) {
  771. WREG32(DB_DEBUG, PREZ_MUST_WAIT_FOR_POSTZ_DONE);
  772. } else {
  773. WREG32(DB_DEBUG, 0);
  774. }
  775. WREG32(DB_WATERMARKS, (DEPTH_FREE(4) | DEPTH_CACHELINE_FREE(16) |
  776. DEPTH_FLUSH(16) | DEPTH_PENDING_FREE(4)));
  777. WREG32(PA_SC_MULTI_CHIP_CNTL, 0);
  778. WREG32(VGT_NUM_INSTANCES, 0);
  779. WREG32(SPI_CONFIG_CNTL, GPR_WRITE_PRIORITY(0));
  780. WREG32(SPI_CONFIG_CNTL_1, VTX_DONE_DELAY(0));
  781. tmp = RREG32(SQ_MS_FIFO_SIZES);
  782. if (((rdev->family) == CHIP_RV610) ||
  783. ((rdev->family) == CHIP_RV620) ||
  784. ((rdev->family) == CHIP_RS780)) {
  785. tmp = (CACHE_FIFO_SIZE(0xa) |
  786. FETCH_FIFO_HIWATER(0xa) |
  787. DONE_FIFO_HIWATER(0xe0) |
  788. ALU_UPDATE_FIFO_HIWATER(0x8));
  789. } else if (((rdev->family) == CHIP_R600) ||
  790. ((rdev->family) == CHIP_RV630)) {
  791. tmp &= ~DONE_FIFO_HIWATER(0xff);
  792. tmp |= DONE_FIFO_HIWATER(0x4);
  793. }
  794. WREG32(SQ_MS_FIFO_SIZES, tmp);
  795. /* SQ_CONFIG, SQ_GPR_RESOURCE_MGMT, SQ_THREAD_RESOURCE_MGMT, SQ_STACK_RESOURCE_MGMT
  796. * should be adjusted as needed by the 2D/3D drivers. This just sets default values
  797. */
  798. sq_config = RREG32(SQ_CONFIG);
  799. sq_config &= ~(PS_PRIO(3) |
  800. VS_PRIO(3) |
  801. GS_PRIO(3) |
  802. ES_PRIO(3));
  803. sq_config |= (DX9_CONSTS |
  804. VC_ENABLE |
  805. PS_PRIO(0) |
  806. VS_PRIO(1) |
  807. GS_PRIO(2) |
  808. ES_PRIO(3));
  809. if ((rdev->family) == CHIP_R600) {
  810. sq_gpr_resource_mgmt_1 = (NUM_PS_GPRS(124) |
  811. NUM_VS_GPRS(124) |
  812. NUM_CLAUSE_TEMP_GPRS(4));
  813. sq_gpr_resource_mgmt_2 = (NUM_GS_GPRS(0) |
  814. NUM_ES_GPRS(0));
  815. sq_thread_resource_mgmt = (NUM_PS_THREADS(136) |
  816. NUM_VS_THREADS(48) |
  817. NUM_GS_THREADS(4) |
  818. NUM_ES_THREADS(4));
  819. sq_stack_resource_mgmt_1 = (NUM_PS_STACK_ENTRIES(128) |
  820. NUM_VS_STACK_ENTRIES(128));
  821. sq_stack_resource_mgmt_2 = (NUM_GS_STACK_ENTRIES(0) |
  822. NUM_ES_STACK_ENTRIES(0));
  823. } else if (((rdev->family) == CHIP_RV610) ||
  824. ((rdev->family) == CHIP_RV620) ||
  825. ((rdev->family) == CHIP_RS780)) {
  826. /* no vertex cache */
  827. sq_config &= ~VC_ENABLE;
  828. sq_gpr_resource_mgmt_1 = (NUM_PS_GPRS(44) |
  829. NUM_VS_GPRS(44) |
  830. NUM_CLAUSE_TEMP_GPRS(2));
  831. sq_gpr_resource_mgmt_2 = (NUM_GS_GPRS(17) |
  832. NUM_ES_GPRS(17));
  833. sq_thread_resource_mgmt = (NUM_PS_THREADS(79) |
  834. NUM_VS_THREADS(78) |
  835. NUM_GS_THREADS(4) |
  836. NUM_ES_THREADS(31));
  837. sq_stack_resource_mgmt_1 = (NUM_PS_STACK_ENTRIES(40) |
  838. NUM_VS_STACK_ENTRIES(40));
  839. sq_stack_resource_mgmt_2 = (NUM_GS_STACK_ENTRIES(32) |
  840. NUM_ES_STACK_ENTRIES(16));
  841. } else if (((rdev->family) == CHIP_RV630) ||
  842. ((rdev->family) == CHIP_RV635)) {
  843. sq_gpr_resource_mgmt_1 = (NUM_PS_GPRS(44) |
  844. NUM_VS_GPRS(44) |
  845. NUM_CLAUSE_TEMP_GPRS(2));
  846. sq_gpr_resource_mgmt_2 = (NUM_GS_GPRS(18) |
  847. NUM_ES_GPRS(18));
  848. sq_thread_resource_mgmt = (NUM_PS_THREADS(79) |
  849. NUM_VS_THREADS(78) |
  850. NUM_GS_THREADS(4) |
  851. NUM_ES_THREADS(31));
  852. sq_stack_resource_mgmt_1 = (NUM_PS_STACK_ENTRIES(40) |
  853. NUM_VS_STACK_ENTRIES(40));
  854. sq_stack_resource_mgmt_2 = (NUM_GS_STACK_ENTRIES(32) |
  855. NUM_ES_STACK_ENTRIES(16));
  856. } else if ((rdev->family) == CHIP_RV670) {
  857. sq_gpr_resource_mgmt_1 = (NUM_PS_GPRS(44) |
  858. NUM_VS_GPRS(44) |
  859. NUM_CLAUSE_TEMP_GPRS(2));
  860. sq_gpr_resource_mgmt_2 = (NUM_GS_GPRS(17) |
  861. NUM_ES_GPRS(17));
  862. sq_thread_resource_mgmt = (NUM_PS_THREADS(79) |
  863. NUM_VS_THREADS(78) |
  864. NUM_GS_THREADS(4) |
  865. NUM_ES_THREADS(31));
  866. sq_stack_resource_mgmt_1 = (NUM_PS_STACK_ENTRIES(64) |
  867. NUM_VS_STACK_ENTRIES(64));
  868. sq_stack_resource_mgmt_2 = (NUM_GS_STACK_ENTRIES(64) |
  869. NUM_ES_STACK_ENTRIES(64));
  870. }
  871. WREG32(SQ_CONFIG, sq_config);
  872. WREG32(SQ_GPR_RESOURCE_MGMT_1, sq_gpr_resource_mgmt_1);
  873. WREG32(SQ_GPR_RESOURCE_MGMT_2, sq_gpr_resource_mgmt_2);
  874. WREG32(SQ_THREAD_RESOURCE_MGMT, sq_thread_resource_mgmt);
  875. WREG32(SQ_STACK_RESOURCE_MGMT_1, sq_stack_resource_mgmt_1);
  876. WREG32(SQ_STACK_RESOURCE_MGMT_2, sq_stack_resource_mgmt_2);
  877. if (((rdev->family) == CHIP_RV610) ||
  878. ((rdev->family) == CHIP_RV620) ||
  879. ((rdev->family) == CHIP_RS780)) {
  880. WREG32(VGT_CACHE_INVALIDATION, CACHE_INVALIDATION(TC_ONLY));
  881. } else {
  882. WREG32(VGT_CACHE_INVALIDATION, CACHE_INVALIDATION(VC_AND_TC));
  883. }
  884. /* More default values. 2D/3D driver should adjust as needed */
  885. WREG32(PA_SC_AA_SAMPLE_LOCS_2S, (S0_X(0xc) | S0_Y(0x4) |
  886. S1_X(0x4) | S1_Y(0xc)));
  887. WREG32(PA_SC_AA_SAMPLE_LOCS_4S, (S0_X(0xe) | S0_Y(0xe) |
  888. S1_X(0x2) | S1_Y(0x2) |
  889. S2_X(0xa) | S2_Y(0x6) |
  890. S3_X(0x6) | S3_Y(0xa)));
  891. WREG32(PA_SC_AA_SAMPLE_LOCS_8S_WD0, (S0_X(0xe) | S0_Y(0xb) |
  892. S1_X(0x4) | S1_Y(0xc) |
  893. S2_X(0x1) | S2_Y(0x6) |
  894. S3_X(0xa) | S3_Y(0xe)));
  895. WREG32(PA_SC_AA_SAMPLE_LOCS_8S_WD1, (S4_X(0x6) | S4_Y(0x1) |
  896. S5_X(0x0) | S5_Y(0x0) |
  897. S6_X(0xb) | S6_Y(0x4) |
  898. S7_X(0x7) | S7_Y(0x8)));
  899. WREG32(VGT_STRMOUT_EN, 0);
  900. tmp = rdev->config.r600.max_pipes * 16;
  901. switch (rdev->family) {
  902. case CHIP_RV610:
  903. case CHIP_RS780:
  904. case CHIP_RV620:
  905. tmp += 32;
  906. break;
  907. case CHIP_RV670:
  908. tmp += 128;
  909. break;
  910. default:
  911. break;
  912. }
  913. if (tmp > 256) {
  914. tmp = 256;
  915. }
  916. WREG32(VGT_ES_PER_GS, 128);
  917. WREG32(VGT_GS_PER_ES, tmp);
  918. WREG32(VGT_GS_PER_VS, 2);
  919. WREG32(VGT_GS_VERTEX_REUSE, 16);
  920. /* more default values. 2D/3D driver should adjust as needed */
  921. WREG32(PA_SC_LINE_STIPPLE_STATE, 0);
  922. WREG32(VGT_STRMOUT_EN, 0);
  923. WREG32(SX_MISC, 0);
  924. WREG32(PA_SC_MODE_CNTL, 0);
  925. WREG32(PA_SC_AA_CONFIG, 0);
  926. WREG32(PA_SC_LINE_STIPPLE, 0);
  927. WREG32(SPI_INPUT_Z, 0);
  928. WREG32(SPI_PS_IN_CONTROL_0, NUM_INTERP(2));
  929. WREG32(CB_COLOR7_FRAG, 0);
  930. /* Clear render buffer base addresses */
  931. WREG32(CB_COLOR0_BASE, 0);
  932. WREG32(CB_COLOR1_BASE, 0);
  933. WREG32(CB_COLOR2_BASE, 0);
  934. WREG32(CB_COLOR3_BASE, 0);
  935. WREG32(CB_COLOR4_BASE, 0);
  936. WREG32(CB_COLOR5_BASE, 0);
  937. WREG32(CB_COLOR6_BASE, 0);
  938. WREG32(CB_COLOR7_BASE, 0);
  939. WREG32(CB_COLOR7_FRAG, 0);
  940. switch (rdev->family) {
  941. case CHIP_RV610:
  942. case CHIP_RS780:
  943. case CHIP_RV620:
  944. tmp = TC_L2_SIZE(8);
  945. break;
  946. case CHIP_RV630:
  947. case CHIP_RV635:
  948. tmp = TC_L2_SIZE(4);
  949. break;
  950. case CHIP_R600:
  951. tmp = TC_L2_SIZE(0) | L2_DISABLE_LATE_HIT;
  952. break;
  953. default:
  954. tmp = TC_L2_SIZE(0);
  955. break;
  956. }
  957. WREG32(TC_CNTL, tmp);
  958. tmp = RREG32(HDP_HOST_PATH_CNTL);
  959. WREG32(HDP_HOST_PATH_CNTL, tmp);
  960. tmp = RREG32(ARB_POP);
  961. tmp |= ENABLE_TC128;
  962. WREG32(ARB_POP, tmp);
  963. WREG32(PA_SC_MULTI_CHIP_CNTL, 0);
  964. WREG32(PA_CL_ENHANCE, (CLIP_VTX_REORDER_ENA |
  965. NUM_CLIP_SEQ(3)));
  966. WREG32(PA_SC_ENHANCE, FORCE_EOV_MAX_CLK_CNT(4095));
  967. }
  968. /*
  969. * Indirect registers accessor
  970. */
  971. u32 r600_pciep_rreg(struct radeon_device *rdev, u32 reg)
  972. {
  973. u32 r;
  974. WREG32(PCIE_PORT_INDEX, ((reg) & 0xff));
  975. (void)RREG32(PCIE_PORT_INDEX);
  976. r = RREG32(PCIE_PORT_DATA);
  977. return r;
  978. }
  979. void r600_pciep_wreg(struct radeon_device *rdev, u32 reg, u32 v)
  980. {
  981. WREG32(PCIE_PORT_INDEX, ((reg) & 0xff));
  982. (void)RREG32(PCIE_PORT_INDEX);
  983. WREG32(PCIE_PORT_DATA, (v));
  984. (void)RREG32(PCIE_PORT_DATA);
  985. }
  986. /*
  987. * CP & Ring
  988. */
  989. void r600_cp_stop(struct radeon_device *rdev)
  990. {
  991. WREG32(R_0086D8_CP_ME_CNTL, S_0086D8_CP_ME_HALT(1));
  992. }
  993. int r600_cp_init_microcode(struct radeon_device *rdev)
  994. {
  995. struct platform_device *pdev;
  996. const char *chip_name;
  997. size_t pfp_req_size, me_req_size;
  998. char fw_name[30];
  999. int err;
  1000. DRM_DEBUG("\n");
  1001. pdev = platform_device_register_simple("radeon_cp", 0, NULL, 0);
  1002. err = IS_ERR(pdev);
  1003. if (err) {
  1004. printk(KERN_ERR "radeon_cp: Failed to register firmware\n");
  1005. return -EINVAL;
  1006. }
  1007. switch (rdev->family) {
  1008. case CHIP_R600: chip_name = "R600"; break;
  1009. case CHIP_RV610: chip_name = "RV610"; break;
  1010. case CHIP_RV630: chip_name = "RV630"; break;
  1011. case CHIP_RV620: chip_name = "RV620"; break;
  1012. case CHIP_RV635: chip_name = "RV635"; break;
  1013. case CHIP_RV670: chip_name = "RV670"; break;
  1014. case CHIP_RS780:
  1015. case CHIP_RS880: chip_name = "RS780"; break;
  1016. case CHIP_RV770: chip_name = "RV770"; break;
  1017. case CHIP_RV730:
  1018. case CHIP_RV740: chip_name = "RV730"; break;
  1019. case CHIP_RV710: chip_name = "RV710"; break;
  1020. default: BUG();
  1021. }
  1022. if (rdev->family >= CHIP_RV770) {
  1023. pfp_req_size = R700_PFP_UCODE_SIZE * 4;
  1024. me_req_size = R700_PM4_UCODE_SIZE * 4;
  1025. } else {
  1026. pfp_req_size = PFP_UCODE_SIZE * 4;
  1027. me_req_size = PM4_UCODE_SIZE * 12;
  1028. }
  1029. DRM_INFO("Loading %s CP Microcode\n", chip_name);
  1030. snprintf(fw_name, sizeof(fw_name), "radeon/%s_pfp.bin", chip_name);
  1031. err = request_firmware(&rdev->pfp_fw, fw_name, &pdev->dev);
  1032. if (err)
  1033. goto out;
  1034. if (rdev->pfp_fw->size != pfp_req_size) {
  1035. printk(KERN_ERR
  1036. "r600_cp: Bogus length %zu in firmware \"%s\"\n",
  1037. rdev->pfp_fw->size, fw_name);
  1038. err = -EINVAL;
  1039. goto out;
  1040. }
  1041. snprintf(fw_name, sizeof(fw_name), "radeon/%s_me.bin", chip_name);
  1042. err = request_firmware(&rdev->me_fw, fw_name, &pdev->dev);
  1043. if (err)
  1044. goto out;
  1045. if (rdev->me_fw->size != me_req_size) {
  1046. printk(KERN_ERR
  1047. "r600_cp: Bogus length %zu in firmware \"%s\"\n",
  1048. rdev->me_fw->size, fw_name);
  1049. err = -EINVAL;
  1050. }
  1051. out:
  1052. platform_device_unregister(pdev);
  1053. if (err) {
  1054. if (err != -EINVAL)
  1055. printk(KERN_ERR
  1056. "r600_cp: Failed to load firmware \"%s\"\n",
  1057. fw_name);
  1058. release_firmware(rdev->pfp_fw);
  1059. rdev->pfp_fw = NULL;
  1060. release_firmware(rdev->me_fw);
  1061. rdev->me_fw = NULL;
  1062. }
  1063. return err;
  1064. }
  1065. static int r600_cp_load_microcode(struct radeon_device *rdev)
  1066. {
  1067. const __be32 *fw_data;
  1068. int i;
  1069. if (!rdev->me_fw || !rdev->pfp_fw)
  1070. return -EINVAL;
  1071. r600_cp_stop(rdev);
  1072. WREG32(CP_RB_CNTL, RB_NO_UPDATE | RB_BLKSZ(15) | RB_BUFSZ(3));
  1073. /* Reset cp */
  1074. WREG32(GRBM_SOFT_RESET, SOFT_RESET_CP);
  1075. RREG32(GRBM_SOFT_RESET);
  1076. mdelay(15);
  1077. WREG32(GRBM_SOFT_RESET, 0);
  1078. WREG32(CP_ME_RAM_WADDR, 0);
  1079. fw_data = (const __be32 *)rdev->me_fw->data;
  1080. WREG32(CP_ME_RAM_WADDR, 0);
  1081. for (i = 0; i < PM4_UCODE_SIZE * 3; i++)
  1082. WREG32(CP_ME_RAM_DATA,
  1083. be32_to_cpup(fw_data++));
  1084. fw_data = (const __be32 *)rdev->pfp_fw->data;
  1085. WREG32(CP_PFP_UCODE_ADDR, 0);
  1086. for (i = 0; i < PFP_UCODE_SIZE; i++)
  1087. WREG32(CP_PFP_UCODE_DATA,
  1088. be32_to_cpup(fw_data++));
  1089. WREG32(CP_PFP_UCODE_ADDR, 0);
  1090. WREG32(CP_ME_RAM_WADDR, 0);
  1091. WREG32(CP_ME_RAM_RADDR, 0);
  1092. return 0;
  1093. }
  1094. int r600_cp_start(struct radeon_device *rdev)
  1095. {
  1096. int r;
  1097. uint32_t cp_me;
  1098. r = radeon_ring_lock(rdev, 7);
  1099. if (r) {
  1100. DRM_ERROR("radeon: cp failed to lock ring (%d).\n", r);
  1101. return r;
  1102. }
  1103. radeon_ring_write(rdev, PACKET3(PACKET3_ME_INITIALIZE, 5));
  1104. radeon_ring_write(rdev, 0x1);
  1105. if (rdev->family < CHIP_RV770) {
  1106. radeon_ring_write(rdev, 0x3);
  1107. radeon_ring_write(rdev, rdev->config.r600.max_hw_contexts - 1);
  1108. } else {
  1109. radeon_ring_write(rdev, 0x0);
  1110. radeon_ring_write(rdev, rdev->config.rv770.max_hw_contexts - 1);
  1111. }
  1112. radeon_ring_write(rdev, PACKET3_ME_INITIALIZE_DEVICE_ID(1));
  1113. radeon_ring_write(rdev, 0);
  1114. radeon_ring_write(rdev, 0);
  1115. radeon_ring_unlock_commit(rdev);
  1116. cp_me = 0xff;
  1117. WREG32(R_0086D8_CP_ME_CNTL, cp_me);
  1118. return 0;
  1119. }
  1120. int r600_cp_resume(struct radeon_device *rdev)
  1121. {
  1122. u32 tmp;
  1123. u32 rb_bufsz;
  1124. int r;
  1125. /* Reset cp */
  1126. WREG32(GRBM_SOFT_RESET, SOFT_RESET_CP);
  1127. RREG32(GRBM_SOFT_RESET);
  1128. mdelay(15);
  1129. WREG32(GRBM_SOFT_RESET, 0);
  1130. /* Set ring buffer size */
  1131. rb_bufsz = drm_order(rdev->cp.ring_size / 8);
  1132. #ifdef __BIG_ENDIAN
  1133. WREG32(CP_RB_CNTL, BUF_SWAP_32BIT | RB_NO_UPDATE |
  1134. (drm_order(4096/8) << 8) | rb_bufsz);
  1135. #else
  1136. WREG32(CP_RB_CNTL, RB_NO_UPDATE | (drm_order(4096/8) << 8) | rb_bufsz);
  1137. #endif
  1138. WREG32(CP_SEM_WAIT_TIMER, 0x4);
  1139. /* Set the write pointer delay */
  1140. WREG32(CP_RB_WPTR_DELAY, 0);
  1141. /* Initialize the ring buffer's read and write pointers */
  1142. tmp = RREG32(CP_RB_CNTL);
  1143. WREG32(CP_RB_CNTL, tmp | RB_RPTR_WR_ENA);
  1144. WREG32(CP_RB_RPTR_WR, 0);
  1145. WREG32(CP_RB_WPTR, 0);
  1146. WREG32(CP_RB_RPTR_ADDR, rdev->cp.gpu_addr & 0xFFFFFFFF);
  1147. WREG32(CP_RB_RPTR_ADDR_HI, upper_32_bits(rdev->cp.gpu_addr));
  1148. mdelay(1);
  1149. WREG32(CP_RB_CNTL, tmp);
  1150. WREG32(CP_RB_BASE, rdev->cp.gpu_addr >> 8);
  1151. WREG32(CP_DEBUG, (1 << 27) | (1 << 28));
  1152. rdev->cp.rptr = RREG32(CP_RB_RPTR);
  1153. rdev->cp.wptr = RREG32(CP_RB_WPTR);
  1154. r600_cp_start(rdev);
  1155. rdev->cp.ready = true;
  1156. r = radeon_ring_test(rdev);
  1157. if (r) {
  1158. rdev->cp.ready = false;
  1159. return r;
  1160. }
  1161. return 0;
  1162. }
  1163. void r600_cp_commit(struct radeon_device *rdev)
  1164. {
  1165. WREG32(CP_RB_WPTR, rdev->cp.wptr);
  1166. (void)RREG32(CP_RB_WPTR);
  1167. }
  1168. void r600_ring_init(struct radeon_device *rdev, unsigned ring_size)
  1169. {
  1170. u32 rb_bufsz;
  1171. /* Align ring size */
  1172. rb_bufsz = drm_order(ring_size / 8);
  1173. ring_size = (1 << (rb_bufsz + 1)) * 4;
  1174. rdev->cp.ring_size = ring_size;
  1175. rdev->cp.align_mask = 16 - 1;
  1176. }
  1177. /*
  1178. * GPU scratch registers helpers function.
  1179. */
  1180. void r600_scratch_init(struct radeon_device *rdev)
  1181. {
  1182. int i;
  1183. rdev->scratch.num_reg = 7;
  1184. for (i = 0; i < rdev->scratch.num_reg; i++) {
  1185. rdev->scratch.free[i] = true;
  1186. rdev->scratch.reg[i] = SCRATCH_REG0 + (i * 4);
  1187. }
  1188. }
  1189. int r600_ring_test(struct radeon_device *rdev)
  1190. {
  1191. uint32_t scratch;
  1192. uint32_t tmp = 0;
  1193. unsigned i;
  1194. int r;
  1195. r = radeon_scratch_get(rdev, &scratch);
  1196. if (r) {
  1197. DRM_ERROR("radeon: cp failed to get scratch reg (%d).\n", r);
  1198. return r;
  1199. }
  1200. WREG32(scratch, 0xCAFEDEAD);
  1201. r = radeon_ring_lock(rdev, 3);
  1202. if (r) {
  1203. DRM_ERROR("radeon: cp failed to lock ring (%d).\n", r);
  1204. radeon_scratch_free(rdev, scratch);
  1205. return r;
  1206. }
  1207. radeon_ring_write(rdev, PACKET3(PACKET3_SET_CONFIG_REG, 1));
  1208. radeon_ring_write(rdev, ((scratch - PACKET3_SET_CONFIG_REG_OFFSET) >> 2));
  1209. radeon_ring_write(rdev, 0xDEADBEEF);
  1210. radeon_ring_unlock_commit(rdev);
  1211. for (i = 0; i < rdev->usec_timeout; i++) {
  1212. tmp = RREG32(scratch);
  1213. if (tmp == 0xDEADBEEF)
  1214. break;
  1215. DRM_UDELAY(1);
  1216. }
  1217. if (i < rdev->usec_timeout) {
  1218. DRM_INFO("ring test succeeded in %d usecs\n", i);
  1219. } else {
  1220. DRM_ERROR("radeon: ring test failed (scratch(0x%04X)=0x%08X)\n",
  1221. scratch, tmp);
  1222. r = -EINVAL;
  1223. }
  1224. radeon_scratch_free(rdev, scratch);
  1225. return r;
  1226. }
  1227. /*
  1228. * Writeback
  1229. */
  1230. int r600_wb_init(struct radeon_device *rdev)
  1231. {
  1232. int r;
  1233. if (rdev->wb.wb_obj == NULL) {
  1234. r = radeon_object_create(rdev, NULL, 4096,
  1235. true,
  1236. RADEON_GEM_DOMAIN_GTT,
  1237. false, &rdev->wb.wb_obj);
  1238. if (r) {
  1239. DRM_ERROR("radeon: failed to create WB buffer (%d).\n", r);
  1240. return r;
  1241. }
  1242. r = radeon_object_pin(rdev->wb.wb_obj,
  1243. RADEON_GEM_DOMAIN_GTT,
  1244. &rdev->wb.gpu_addr);
  1245. if (r) {
  1246. DRM_ERROR("radeon: failed to pin WB buffer (%d).\n", r);
  1247. return r;
  1248. }
  1249. r = radeon_object_kmap(rdev->wb.wb_obj, (void **)&rdev->wb.wb);
  1250. if (r) {
  1251. DRM_ERROR("radeon: failed to map WB buffer (%d).\n", r);
  1252. return r;
  1253. }
  1254. }
  1255. WREG32(SCRATCH_ADDR, (rdev->wb.gpu_addr >> 8) & 0xFFFFFFFF);
  1256. WREG32(CP_RB_RPTR_ADDR, (rdev->wb.gpu_addr + 1024) & 0xFFFFFFFC);
  1257. WREG32(CP_RB_RPTR_ADDR_HI, upper_32_bits(rdev->wb.gpu_addr + 1024) & 0xFF);
  1258. WREG32(SCRATCH_UMSK, 0xff);
  1259. return 0;
  1260. }
  1261. void r600_wb_fini(struct radeon_device *rdev)
  1262. {
  1263. if (rdev->wb.wb_obj) {
  1264. radeon_object_kunmap(rdev->wb.wb_obj);
  1265. radeon_object_unpin(rdev->wb.wb_obj);
  1266. radeon_object_unref(&rdev->wb.wb_obj);
  1267. rdev->wb.wb = NULL;
  1268. rdev->wb.wb_obj = NULL;
  1269. }
  1270. }
  1271. /*
  1272. * CS
  1273. */
  1274. void r600_fence_ring_emit(struct radeon_device *rdev,
  1275. struct radeon_fence *fence)
  1276. {
  1277. /* Emit fence sequence & fire IRQ */
  1278. radeon_ring_write(rdev, PACKET3(PACKET3_SET_CONFIG_REG, 1));
  1279. radeon_ring_write(rdev, ((rdev->fence_drv.scratch_reg - PACKET3_SET_CONFIG_REG_OFFSET) >> 2));
  1280. radeon_ring_write(rdev, fence->seq);
  1281. }
  1282. int r600_copy_dma(struct radeon_device *rdev,
  1283. uint64_t src_offset,
  1284. uint64_t dst_offset,
  1285. unsigned num_pages,
  1286. struct radeon_fence *fence)
  1287. {
  1288. /* FIXME: implement */
  1289. return 0;
  1290. }
  1291. int r600_copy_blit(struct radeon_device *rdev,
  1292. uint64_t src_offset, uint64_t dst_offset,
  1293. unsigned num_pages, struct radeon_fence *fence)
  1294. {
  1295. r600_blit_prepare_copy(rdev, num_pages * 4096);
  1296. r600_kms_blit_copy(rdev, src_offset, dst_offset, num_pages * 4096);
  1297. r600_blit_done_copy(rdev, fence);
  1298. return 0;
  1299. }
  1300. int r600_irq_process(struct radeon_device *rdev)
  1301. {
  1302. /* FIXME: implement */
  1303. return 0;
  1304. }
  1305. int r600_irq_set(struct radeon_device *rdev)
  1306. {
  1307. /* FIXME: implement */
  1308. return 0;
  1309. }
  1310. int r600_set_surface_reg(struct radeon_device *rdev, int reg,
  1311. uint32_t tiling_flags, uint32_t pitch,
  1312. uint32_t offset, uint32_t obj_size)
  1313. {
  1314. /* FIXME: implement */
  1315. return 0;
  1316. }
  1317. void r600_clear_surface_reg(struct radeon_device *rdev, int reg)
  1318. {
  1319. /* FIXME: implement */
  1320. }
  1321. bool r600_card_posted(struct radeon_device *rdev)
  1322. {
  1323. uint32_t reg;
  1324. /* first check CRTCs */
  1325. reg = RREG32(D1CRTC_CONTROL) |
  1326. RREG32(D2CRTC_CONTROL);
  1327. if (reg & CRTC_EN)
  1328. return true;
  1329. /* then check MEM_SIZE, in case the crtcs are off */
  1330. if (RREG32(CONFIG_MEMSIZE))
  1331. return true;
  1332. return false;
  1333. }
  1334. int r600_resume(struct radeon_device *rdev)
  1335. {
  1336. int r;
  1337. r600_gpu_reset(rdev);
  1338. r600_mc_resume(rdev);
  1339. r = r600_pcie_gart_enable(rdev);
  1340. if (r)
  1341. return r;
  1342. r600_gpu_init(rdev);
  1343. r = radeon_ring_init(rdev, rdev->cp.ring_size);
  1344. if (r)
  1345. return r;
  1346. r = r600_cp_load_microcode(rdev);
  1347. if (r)
  1348. return r;
  1349. r = r600_cp_resume(rdev);
  1350. if (r)
  1351. return r;
  1352. r = r600_wb_init(rdev);
  1353. if (r)
  1354. return r;
  1355. return 0;
  1356. }
  1357. int r600_suspend(struct radeon_device *rdev)
  1358. {
  1359. /* FIXME: we should wait for ring to be empty */
  1360. r600_cp_stop(rdev);
  1361. r600_pcie_gart_disable(rdev);
  1362. return 0;
  1363. }
  1364. /* Plan is to move initialization in that function and use
  1365. * helper function so that radeon_device_init pretty much
  1366. * do nothing more than calling asic specific function. This
  1367. * should also allow to remove a bunch of callback function
  1368. * like vram_info.
  1369. */
  1370. int r600_init(struct radeon_device *rdev)
  1371. {
  1372. int r;
  1373. rdev->new_init_path = true;
  1374. r = radeon_dummy_page_init(rdev);
  1375. if (r)
  1376. return r;
  1377. if (r600_debugfs_mc_info_init(rdev)) {
  1378. DRM_ERROR("Failed to register debugfs file for mc !\n");
  1379. }
  1380. /* This don't do much */
  1381. r = radeon_gem_init(rdev);
  1382. if (r)
  1383. return r;
  1384. /* Read BIOS */
  1385. if (!radeon_get_bios(rdev)) {
  1386. if (ASIC_IS_AVIVO(rdev))
  1387. return -EINVAL;
  1388. }
  1389. /* Must be an ATOMBIOS */
  1390. if (!rdev->is_atom_bios)
  1391. return -EINVAL;
  1392. r = radeon_atombios_init(rdev);
  1393. if (r)
  1394. return r;
  1395. /* Post card if necessary */
  1396. if (!r600_card_posted(rdev) && rdev->bios) {
  1397. DRM_INFO("GPU not posted. posting now...\n");
  1398. atom_asic_init(rdev->mode_info.atom_context);
  1399. }
  1400. /* Initialize scratch registers */
  1401. r600_scratch_init(rdev);
  1402. /* Initialize surface registers */
  1403. radeon_surface_init(rdev);
  1404. radeon_get_clock_info(rdev->ddev);
  1405. r = radeon_clocks_init(rdev);
  1406. if (r)
  1407. return r;
  1408. /* Fence driver */
  1409. r = radeon_fence_driver_init(rdev);
  1410. if (r)
  1411. return r;
  1412. r = r600_mc_init(rdev);
  1413. if (r) {
  1414. if (rdev->flags & RADEON_IS_AGP) {
  1415. /* Retry with disabling AGP */
  1416. r600_fini(rdev);
  1417. rdev->flags &= ~RADEON_IS_AGP;
  1418. return r600_init(rdev);
  1419. }
  1420. return r;
  1421. }
  1422. /* Memory manager */
  1423. r = radeon_object_init(rdev);
  1424. if (r)
  1425. return r;
  1426. rdev->cp.ring_obj = NULL;
  1427. r600_ring_init(rdev, 1024 * 1024);
  1428. if (!rdev->me_fw || !rdev->pfp_fw) {
  1429. r = r600_cp_init_microcode(rdev);
  1430. if (r) {
  1431. DRM_ERROR("Failed to load firmware!\n");
  1432. return r;
  1433. }
  1434. }
  1435. r = r600_pcie_gart_init(rdev);
  1436. if (r)
  1437. return r;
  1438. rdev->accel_working = true;
  1439. r = r600_resume(rdev);
  1440. if (r) {
  1441. if (rdev->flags & RADEON_IS_AGP) {
  1442. /* Retry with disabling AGP */
  1443. r600_fini(rdev);
  1444. rdev->flags &= ~RADEON_IS_AGP;
  1445. return r600_init(rdev);
  1446. }
  1447. rdev->accel_working = false;
  1448. }
  1449. if (rdev->accel_working) {
  1450. r = radeon_ib_pool_init(rdev);
  1451. if (r) {
  1452. DRM_ERROR("radeon: failled initializing IB pool (%d).\n", r);
  1453. rdev->accel_working = false;
  1454. }
  1455. r = r600_blit_init(rdev);
  1456. if (r) {
  1457. DRM_ERROR("radeon: failled blitter (%d).\n", r);
  1458. rdev->accel_working = false;
  1459. }
  1460. r = radeon_ib_test(rdev);
  1461. if (r) {
  1462. DRM_ERROR("radeon: failled testing IB (%d).\n", r);
  1463. rdev->accel_working = false;
  1464. }
  1465. }
  1466. return 0;
  1467. }
  1468. void r600_fini(struct radeon_device *rdev)
  1469. {
  1470. /* Suspend operations */
  1471. r600_suspend(rdev);
  1472. r600_blit_fini(rdev);
  1473. radeon_ring_fini(rdev);
  1474. r600_pcie_gart_fini(rdev);
  1475. radeon_gem_fini(rdev);
  1476. radeon_fence_driver_fini(rdev);
  1477. radeon_clocks_fini(rdev);
  1478. #if __OS_HAS_AGP
  1479. if (rdev->flags & RADEON_IS_AGP)
  1480. radeon_agp_fini(rdev);
  1481. #endif
  1482. radeon_object_fini(rdev);
  1483. if (rdev->is_atom_bios)
  1484. radeon_atombios_fini(rdev);
  1485. else
  1486. radeon_combios_fini(rdev);
  1487. kfree(rdev->bios);
  1488. rdev->bios = NULL;
  1489. radeon_dummy_page_fini(rdev);
  1490. }
  1491. /*
  1492. * CS stuff
  1493. */
  1494. void r600_ring_ib_execute(struct radeon_device *rdev, struct radeon_ib *ib)
  1495. {
  1496. /* FIXME: implement */
  1497. radeon_ring_write(rdev, PACKET3(PACKET3_INDIRECT_BUFFER, 2));
  1498. radeon_ring_write(rdev, ib->gpu_addr & 0xFFFFFFFC);
  1499. radeon_ring_write(rdev, upper_32_bits(ib->gpu_addr) & 0xFF);
  1500. radeon_ring_write(rdev, ib->length_dw);
  1501. }
  1502. int r600_ib_test(struct radeon_device *rdev)
  1503. {
  1504. struct radeon_ib *ib;
  1505. uint32_t scratch;
  1506. uint32_t tmp = 0;
  1507. unsigned i;
  1508. int r;
  1509. r = radeon_scratch_get(rdev, &scratch);
  1510. if (r) {
  1511. DRM_ERROR("radeon: failed to get scratch reg (%d).\n", r);
  1512. return r;
  1513. }
  1514. WREG32(scratch, 0xCAFEDEAD);
  1515. r = radeon_ib_get(rdev, &ib);
  1516. if (r) {
  1517. DRM_ERROR("radeon: failed to get ib (%d).\n", r);
  1518. return r;
  1519. }
  1520. ib->ptr[0] = PACKET3(PACKET3_SET_CONFIG_REG, 1);
  1521. ib->ptr[1] = ((scratch - PACKET3_SET_CONFIG_REG_OFFSET) >> 2);
  1522. ib->ptr[2] = 0xDEADBEEF;
  1523. ib->ptr[3] = PACKET2(0);
  1524. ib->ptr[4] = PACKET2(0);
  1525. ib->ptr[5] = PACKET2(0);
  1526. ib->ptr[6] = PACKET2(0);
  1527. ib->ptr[7] = PACKET2(0);
  1528. ib->ptr[8] = PACKET2(0);
  1529. ib->ptr[9] = PACKET2(0);
  1530. ib->ptr[10] = PACKET2(0);
  1531. ib->ptr[11] = PACKET2(0);
  1532. ib->ptr[12] = PACKET2(0);
  1533. ib->ptr[13] = PACKET2(0);
  1534. ib->ptr[14] = PACKET2(0);
  1535. ib->ptr[15] = PACKET2(0);
  1536. ib->length_dw = 16;
  1537. r = radeon_ib_schedule(rdev, ib);
  1538. if (r) {
  1539. radeon_scratch_free(rdev, scratch);
  1540. radeon_ib_free(rdev, &ib);
  1541. DRM_ERROR("radeon: failed to schedule ib (%d).\n", r);
  1542. return r;
  1543. }
  1544. r = radeon_fence_wait(ib->fence, false);
  1545. if (r) {
  1546. DRM_ERROR("radeon: fence wait failed (%d).\n", r);
  1547. return r;
  1548. }
  1549. for (i = 0; i < rdev->usec_timeout; i++) {
  1550. tmp = RREG32(scratch);
  1551. if (tmp == 0xDEADBEEF)
  1552. break;
  1553. DRM_UDELAY(1);
  1554. }
  1555. if (i < rdev->usec_timeout) {
  1556. DRM_INFO("ib test succeeded in %u usecs\n", i);
  1557. } else {
  1558. DRM_ERROR("radeon: ib test failed (sracth(0x%04X)=0x%08X)\n",
  1559. scratch, tmp);
  1560. r = -EINVAL;
  1561. }
  1562. radeon_scratch_free(rdev, scratch);
  1563. radeon_ib_free(rdev, &ib);
  1564. return r;
  1565. }
  1566. /*
  1567. * Debugfs info
  1568. */
  1569. #if defined(CONFIG_DEBUG_FS)
  1570. static int r600_debugfs_cp_ring_info(struct seq_file *m, void *data)
  1571. {
  1572. struct drm_info_node *node = (struct drm_info_node *) m->private;
  1573. struct drm_device *dev = node->minor->dev;
  1574. struct radeon_device *rdev = dev->dev_private;
  1575. uint32_t rdp, wdp;
  1576. unsigned count, i, j;
  1577. radeon_ring_free_size(rdev);
  1578. rdp = RREG32(CP_RB_RPTR);
  1579. wdp = RREG32(CP_RB_WPTR);
  1580. count = (rdp + rdev->cp.ring_size - wdp) & rdev->cp.ptr_mask;
  1581. seq_printf(m, "CP_STAT 0x%08x\n", RREG32(CP_STAT));
  1582. seq_printf(m, "CP_RB_WPTR 0x%08x\n", wdp);
  1583. seq_printf(m, "CP_RB_RPTR 0x%08x\n", rdp);
  1584. seq_printf(m, "%u free dwords in ring\n", rdev->cp.ring_free_dw);
  1585. seq_printf(m, "%u dwords in ring\n", count);
  1586. for (j = 0; j <= count; j++) {
  1587. i = (rdp + j) & rdev->cp.ptr_mask;
  1588. seq_printf(m, "r[%04d]=0x%08x\n", i, rdev->cp.ring[i]);
  1589. }
  1590. return 0;
  1591. }
  1592. static int r600_debugfs_mc_info(struct seq_file *m, void *data)
  1593. {
  1594. struct drm_info_node *node = (struct drm_info_node *) m->private;
  1595. struct drm_device *dev = node->minor->dev;
  1596. struct radeon_device *rdev = dev->dev_private;
  1597. DREG32_SYS(m, rdev, R_000E50_SRBM_STATUS);
  1598. DREG32_SYS(m, rdev, VM_L2_STATUS);
  1599. return 0;
  1600. }
  1601. static struct drm_info_list r600_mc_info_list[] = {
  1602. {"r600_mc_info", r600_debugfs_mc_info, 0, NULL},
  1603. {"r600_ring_info", r600_debugfs_cp_ring_info, 0, NULL},
  1604. };
  1605. #endif
  1606. int r600_debugfs_mc_info_init(struct radeon_device *rdev)
  1607. {
  1608. #if defined(CONFIG_DEBUG_FS)
  1609. return radeon_debugfs_add_files(rdev, r600_mc_info_list, ARRAY_SIZE(r600_mc_info_list));
  1610. #else
  1611. return 0;
  1612. #endif
  1613. }