r600.c 50 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270370470570670770870971071171271371471571671771871972072172272372472572672772872973073173273373473573673773873974074174274374474574674774874975075175275375475575675775875976076176276376476576676776876977077177277377477577677777877978078178278378478578678778878979079179279379479579679779879980080180280380480580680780880981081181281381481581681781881982082182282382482582682782882983083183283383483583683783883984084184284384484584684784884985085185285385485585685785885986086186286386486586686786886987087187287387487587687787887988088188288388488588688788888989089189289389489589689789889990090190290390490590690790890991091191291391491591691791891992092192292392492592692792892993093193293393493593693793893994094194294394494594694794894995095195295395495595695795895996096196296396496596696796896997097197297397497597697797897998098198298398498598698798898999099199299399499599699799899910001001100210031004100510061007100810091010101110121013101410151016101710181019102010211022102310241025102610271028102910301031103210331034103510361037103810391040104110421043104410451046104710481049105010511052105310541055105610571058105910601061106210631064106510661067106810691070107110721073107410751076107710781079108010811082108310841085108610871088108910901091109210931094109510961097109810991100110111021103110411051106110711081109111011111112111311141115111611171118111911201121112211231124112511261127112811291130113111321133113411351136113711381139114011411142114311441145114611471148114911501151115211531154115511561157115811591160116111621163116411651166116711681169117011711172117311741175117611771178117911801181118211831184118511861187118811891190119111921193119411951196119711981199120012011202120312041205120612071208120912101211121212131214121512161217121812191220122112221223122412251226122712281229123012311232123312341235123612371238123912401241124212431244124512461247124812491250125112521253125412551256125712581259126012611262126312641265126612671268126912701271127212731274127512761277127812791280128112821283128412851286128712881289129012911292129312941295129612971298129913001301130213031304130513061307130813091310131113121313131413151316131713181319132013211322132313241325132613271328132913301331133213331334133513361337133813391340134113421343134413451346134713481349135013511352135313541355135613571358135913601361136213631364136513661367136813691370137113721373137413751376137713781379138013811382138313841385138613871388138913901391139213931394139513961397139813991400140114021403140414051406140714081409141014111412141314141415141614171418141914201421142214231424142514261427142814291430143114321433143414351436143714381439144014411442144314441445144614471448144914501451145214531454145514561457145814591460146114621463146414651466146714681469147014711472147314741475147614771478147914801481148214831484148514861487148814891490149114921493149414951496149714981499150015011502150315041505150615071508150915101511151215131514151515161517151815191520152115221523152415251526152715281529153015311532153315341535153615371538153915401541154215431544154515461547154815491550155115521553155415551556155715581559156015611562156315641565156615671568156915701571157215731574157515761577157815791580158115821583158415851586158715881589159015911592159315941595159615971598159916001601160216031604160516061607160816091610161116121613161416151616161716181619162016211622162316241625162616271628162916301631163216331634163516361637163816391640164116421643164416451646164716481649165016511652165316541655165616571658165916601661166216631664166516661667166816691670167116721673167416751676167716781679168016811682168316841685168616871688168916901691169216931694169516961697169816991700170117021703170417051706170717081709171017111712171317141715171617171718171917201721172217231724172517261727172817291730173117321733173417351736173717381739174017411742174317441745174617471748174917501751175217531754175517561757175817591760176117621763176417651766176717681769177017711772177317741775177617771778177917801781178217831784178517861787178817891790179117921793179417951796179717981799180018011802180318041805180618071808180918101811181218131814181518161817181818191820182118221823182418251826182718281829183018311832
  1. /*
  2. * Copyright 2008 Advanced Micro Devices, Inc.
  3. * Copyright 2008 Red Hat Inc.
  4. * Copyright 2009 Jerome Glisse.
  5. *
  6. * Permission is hereby granted, free of charge, to any person obtaining a
  7. * copy of this software and associated documentation files (the "Software"),
  8. * to deal in the Software without restriction, including without limitation
  9. * the rights to use, copy, modify, merge, publish, distribute, sublicense,
  10. * and/or sell copies of the Software, and to permit persons to whom the
  11. * Software is furnished to do so, subject to the following conditions:
  12. *
  13. * The above copyright notice and this permission notice shall be included in
  14. * all copies or substantial portions of the Software.
  15. *
  16. * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
  17. * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
  18. * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
  19. * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
  20. * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
  21. * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
  22. * OTHER DEALINGS IN THE SOFTWARE.
  23. *
  24. * Authors: Dave Airlie
  25. * Alex Deucher
  26. * Jerome Glisse
  27. */
  28. #include <linux/seq_file.h>
  29. #include <linux/firmware.h>
  30. #include <linux/platform_device.h>
  31. #include "drmP.h"
  32. #include "radeon_drm.h"
  33. #include "radeon.h"
  34. #include "radeon_mode.h"
  35. #include "r600d.h"
  36. #include "avivod.h"
  37. #include "atom.h"
  38. #define PFP_UCODE_SIZE 576
  39. #define PM4_UCODE_SIZE 1792
  40. #define R700_PFP_UCODE_SIZE 848
  41. #define R700_PM4_UCODE_SIZE 1360
  42. /* Firmware Names */
  43. MODULE_FIRMWARE("radeon/R600_pfp.bin");
  44. MODULE_FIRMWARE("radeon/R600_me.bin");
  45. MODULE_FIRMWARE("radeon/RV610_pfp.bin");
  46. MODULE_FIRMWARE("radeon/RV610_me.bin");
  47. MODULE_FIRMWARE("radeon/RV630_pfp.bin");
  48. MODULE_FIRMWARE("radeon/RV630_me.bin");
  49. MODULE_FIRMWARE("radeon/RV620_pfp.bin");
  50. MODULE_FIRMWARE("radeon/RV620_me.bin");
  51. MODULE_FIRMWARE("radeon/RV635_pfp.bin");
  52. MODULE_FIRMWARE("radeon/RV635_me.bin");
  53. MODULE_FIRMWARE("radeon/RV670_pfp.bin");
  54. MODULE_FIRMWARE("radeon/RV670_me.bin");
  55. MODULE_FIRMWARE("radeon/RS780_pfp.bin");
  56. MODULE_FIRMWARE("radeon/RS780_me.bin");
  57. MODULE_FIRMWARE("radeon/RV770_pfp.bin");
  58. MODULE_FIRMWARE("radeon/RV770_me.bin");
  59. MODULE_FIRMWARE("radeon/RV730_pfp.bin");
  60. MODULE_FIRMWARE("radeon/RV730_me.bin");
  61. MODULE_FIRMWARE("radeon/RV710_pfp.bin");
  62. MODULE_FIRMWARE("radeon/RV710_me.bin");
  63. int r600_debugfs_mc_info_init(struct radeon_device *rdev);
  64. /* This files gather functions specifics to:
  65. * r600,rv610,rv630,rv620,rv635,rv670
  66. *
  67. * Some of these functions might be used by newer ASICs.
  68. */
  69. int r600_mc_wait_for_idle(struct radeon_device *rdev);
  70. void r600_gpu_init(struct radeon_device *rdev);
  71. void r600_fini(struct radeon_device *rdev);
  72. /*
  73. * R600 PCIE GART
  74. */
  75. int r600_gart_clear_page(struct radeon_device *rdev, int i)
  76. {
  77. void __iomem *ptr = (void *)rdev->gart.table.vram.ptr;
  78. u64 pte;
  79. if (i < 0 || i > rdev->gart.num_gpu_pages)
  80. return -EINVAL;
  81. pte = 0;
  82. writeq(pte, ((void __iomem *)ptr) + (i * 8));
  83. return 0;
  84. }
  85. void r600_pcie_gart_tlb_flush(struct radeon_device *rdev)
  86. {
  87. unsigned i;
  88. u32 tmp;
  89. WREG32(VM_CONTEXT0_INVALIDATION_LOW_ADDR, rdev->mc.gtt_start >> 12);
  90. WREG32(VM_CONTEXT0_INVALIDATION_HIGH_ADDR, (rdev->mc.gtt_end - 1) >> 12);
  91. WREG32(VM_CONTEXT0_REQUEST_RESPONSE, REQUEST_TYPE(1));
  92. for (i = 0; i < rdev->usec_timeout; i++) {
  93. /* read MC_STATUS */
  94. tmp = RREG32(VM_CONTEXT0_REQUEST_RESPONSE);
  95. tmp = (tmp & RESPONSE_TYPE_MASK) >> RESPONSE_TYPE_SHIFT;
  96. if (tmp == 2) {
  97. printk(KERN_WARNING "[drm] r600 flush TLB failed\n");
  98. return;
  99. }
  100. if (tmp) {
  101. return;
  102. }
  103. udelay(1);
  104. }
  105. }
  106. int r600_pcie_gart_init(struct radeon_device *rdev)
  107. {
  108. int r;
  109. if (rdev->gart.table.vram.robj) {
  110. WARN(1, "R600 PCIE GART already initialized.\n");
  111. return 0;
  112. }
  113. /* Initialize common gart structure */
  114. r = radeon_gart_init(rdev);
  115. if (r)
  116. return r;
  117. rdev->gart.table_size = rdev->gart.num_gpu_pages * 8;
  118. return radeon_gart_table_vram_alloc(rdev);
  119. }
  120. int r600_pcie_gart_enable(struct radeon_device *rdev)
  121. {
  122. u32 tmp;
  123. int r, i;
  124. if (rdev->gart.table.vram.robj == NULL) {
  125. dev_err(rdev->dev, "No VRAM object for PCIE GART.\n");
  126. return -EINVAL;
  127. }
  128. r = radeon_gart_table_vram_pin(rdev);
  129. if (r)
  130. return r;
  131. /* Setup L2 cache */
  132. WREG32(VM_L2_CNTL, ENABLE_L2_CACHE | ENABLE_L2_FRAGMENT_PROCESSING |
  133. ENABLE_L2_PTE_CACHE_LRU_UPDATE_BY_WRITE |
  134. EFFECTIVE_L2_QUEUE_SIZE(7));
  135. WREG32(VM_L2_CNTL2, 0);
  136. WREG32(VM_L2_CNTL3, BANK_SELECT_0(0) | BANK_SELECT_1(1));
  137. /* Setup TLB control */
  138. tmp = ENABLE_L1_TLB | ENABLE_L1_FRAGMENT_PROCESSING |
  139. SYSTEM_ACCESS_MODE_NOT_IN_SYS |
  140. EFFECTIVE_L1_TLB_SIZE(5) | EFFECTIVE_L1_QUEUE_SIZE(5) |
  141. ENABLE_WAIT_L2_QUERY;
  142. WREG32(MC_VM_L1_TLB_MCB_RD_SYS_CNTL, tmp);
  143. WREG32(MC_VM_L1_TLB_MCB_WR_SYS_CNTL, tmp);
  144. WREG32(MC_VM_L1_TLB_MCB_RD_HDP_CNTL, tmp | ENABLE_L1_STRICT_ORDERING);
  145. WREG32(MC_VM_L1_TLB_MCB_WR_HDP_CNTL, tmp);
  146. WREG32(MC_VM_L1_TLB_MCD_RD_A_CNTL, tmp);
  147. WREG32(MC_VM_L1_TLB_MCD_WR_A_CNTL, tmp);
  148. WREG32(MC_VM_L1_TLB_MCD_RD_B_CNTL, tmp);
  149. WREG32(MC_VM_L1_TLB_MCD_WR_B_CNTL, tmp);
  150. WREG32(MC_VM_L1_TLB_MCB_RD_GFX_CNTL, tmp);
  151. WREG32(MC_VM_L1_TLB_MCB_WR_GFX_CNTL, tmp);
  152. WREG32(MC_VM_L1_TLB_MCB_RD_PDMA_CNTL, tmp);
  153. WREG32(MC_VM_L1_TLB_MCB_WR_PDMA_CNTL, tmp);
  154. WREG32(MC_VM_L1_TLB_MCB_RD_SEM_CNTL, tmp | ENABLE_SEMAPHORE_MODE);
  155. WREG32(MC_VM_L1_TLB_MCB_WR_SEM_CNTL, tmp | ENABLE_SEMAPHORE_MODE);
  156. WREG32(VM_CONTEXT0_PAGE_TABLE_START_ADDR, rdev->mc.gtt_start >> 12);
  157. WREG32(VM_CONTEXT0_PAGE_TABLE_END_ADDR, (rdev->mc.gtt_end - 1) >> 12);
  158. WREG32(VM_CONTEXT0_PAGE_TABLE_BASE_ADDR, rdev->gart.table_addr >> 12);
  159. WREG32(VM_CONTEXT0_CNTL, ENABLE_CONTEXT | PAGE_TABLE_DEPTH(0) |
  160. RANGE_PROTECTION_FAULT_ENABLE_DEFAULT);
  161. WREG32(VM_CONTEXT0_PROTECTION_FAULT_DEFAULT_ADDR,
  162. (u32)(rdev->dummy_page.addr >> 12));
  163. for (i = 1; i < 7; i++)
  164. WREG32(VM_CONTEXT0_CNTL + (i * 4), 0);
  165. r600_pcie_gart_tlb_flush(rdev);
  166. rdev->gart.ready = true;
  167. return 0;
  168. }
  169. void r600_pcie_gart_disable(struct radeon_device *rdev)
  170. {
  171. u32 tmp;
  172. int i;
  173. /* Disable all tables */
  174. for (i = 0; i < 7; i++)
  175. WREG32(VM_CONTEXT0_CNTL + (i * 4), 0);
  176. /* Disable L2 cache */
  177. WREG32(VM_L2_CNTL, ENABLE_L2_FRAGMENT_PROCESSING |
  178. EFFECTIVE_L2_QUEUE_SIZE(7));
  179. WREG32(VM_L2_CNTL3, BANK_SELECT_0(0) | BANK_SELECT_1(1));
  180. /* Setup L1 TLB control */
  181. tmp = EFFECTIVE_L1_TLB_SIZE(5) | EFFECTIVE_L1_QUEUE_SIZE(5) |
  182. ENABLE_WAIT_L2_QUERY;
  183. WREG32(MC_VM_L1_TLB_MCD_RD_A_CNTL, tmp);
  184. WREG32(MC_VM_L1_TLB_MCD_WR_A_CNTL, tmp);
  185. WREG32(MC_VM_L1_TLB_MCD_RD_B_CNTL, tmp);
  186. WREG32(MC_VM_L1_TLB_MCD_WR_B_CNTL, tmp);
  187. WREG32(MC_VM_L1_TLB_MCB_RD_GFX_CNTL, tmp);
  188. WREG32(MC_VM_L1_TLB_MCB_WR_GFX_CNTL, tmp);
  189. WREG32(MC_VM_L1_TLB_MCB_RD_PDMA_CNTL, tmp);
  190. WREG32(MC_VM_L1_TLB_MCB_WR_PDMA_CNTL, tmp);
  191. WREG32(MC_VM_L1_TLB_MCB_RD_SEM_CNTL, tmp);
  192. WREG32(MC_VM_L1_TLB_MCB_WR_SEM_CNTL, tmp);
  193. WREG32(MC_VM_L1_TLB_MCB_RD_SYS_CNTL, tmp);
  194. WREG32(MC_VM_L1_TLB_MCB_WR_SYS_CNTL, tmp);
  195. WREG32(MC_VM_L1_TLB_MCB_RD_HDP_CNTL, tmp);
  196. WREG32(MC_VM_L1_TLB_MCB_WR_HDP_CNTL, tmp);
  197. if (rdev->gart.table.vram.robj) {
  198. radeon_object_kunmap(rdev->gart.table.vram.robj);
  199. radeon_object_unpin(rdev->gart.table.vram.robj);
  200. }
  201. }
  202. void r600_pcie_gart_fini(struct radeon_device *rdev)
  203. {
  204. r600_pcie_gart_disable(rdev);
  205. radeon_gart_table_vram_free(rdev);
  206. radeon_gart_fini(rdev);
  207. }
  208. int r600_mc_wait_for_idle(struct radeon_device *rdev)
  209. {
  210. unsigned i;
  211. u32 tmp;
  212. for (i = 0; i < rdev->usec_timeout; i++) {
  213. /* read MC_STATUS */
  214. tmp = RREG32(R_000E50_SRBM_STATUS) & 0x3F00;
  215. if (!tmp)
  216. return 0;
  217. udelay(1);
  218. }
  219. return -1;
  220. }
  221. static void r600_mc_resume(struct radeon_device *rdev)
  222. {
  223. u32 d1vga_control, d2vga_control;
  224. u32 vga_render_control, vga_hdp_control;
  225. u32 d1crtc_control, d2crtc_control;
  226. u32 new_d1grph_primary, new_d1grph_secondary;
  227. u32 new_d2grph_primary, new_d2grph_secondary;
  228. u64 old_vram_start;
  229. u32 tmp;
  230. int i, j;
  231. /* Initialize HDP */
  232. for (i = 0, j = 0; i < 32; i++, j += 0x18) {
  233. WREG32((0x2c14 + j), 0x00000000);
  234. WREG32((0x2c18 + j), 0x00000000);
  235. WREG32((0x2c1c + j), 0x00000000);
  236. WREG32((0x2c20 + j), 0x00000000);
  237. WREG32((0x2c24 + j), 0x00000000);
  238. }
  239. WREG32(HDP_REG_COHERENCY_FLUSH_CNTL, 0);
  240. d1vga_control = RREG32(D1VGA_CONTROL);
  241. d2vga_control = RREG32(D2VGA_CONTROL);
  242. vga_render_control = RREG32(VGA_RENDER_CONTROL);
  243. vga_hdp_control = RREG32(VGA_HDP_CONTROL);
  244. d1crtc_control = RREG32(D1CRTC_CONTROL);
  245. d2crtc_control = RREG32(D2CRTC_CONTROL);
  246. old_vram_start = (u64)(RREG32(MC_VM_FB_LOCATION) & 0xFFFF) << 24;
  247. new_d1grph_primary = RREG32(D1GRPH_PRIMARY_SURFACE_ADDRESS);
  248. new_d1grph_secondary = RREG32(D1GRPH_SECONDARY_SURFACE_ADDRESS);
  249. new_d1grph_primary += rdev->mc.vram_start - old_vram_start;
  250. new_d1grph_secondary += rdev->mc.vram_start - old_vram_start;
  251. new_d2grph_primary = RREG32(D2GRPH_PRIMARY_SURFACE_ADDRESS);
  252. new_d2grph_secondary = RREG32(D2GRPH_SECONDARY_SURFACE_ADDRESS);
  253. new_d2grph_primary += rdev->mc.vram_start - old_vram_start;
  254. new_d2grph_secondary += rdev->mc.vram_start - old_vram_start;
  255. /* Stop all video */
  256. WREG32(D1VGA_CONTROL, 0);
  257. WREG32(D2VGA_CONTROL, 0);
  258. WREG32(VGA_RENDER_CONTROL, 0);
  259. WREG32(D1CRTC_UPDATE_LOCK, 1);
  260. WREG32(D2CRTC_UPDATE_LOCK, 1);
  261. WREG32(D1CRTC_CONTROL, 0);
  262. WREG32(D2CRTC_CONTROL, 0);
  263. WREG32(D1CRTC_UPDATE_LOCK, 0);
  264. WREG32(D2CRTC_UPDATE_LOCK, 0);
  265. mdelay(1);
  266. if (r600_mc_wait_for_idle(rdev)) {
  267. printk(KERN_WARNING "[drm] MC not idle !\n");
  268. }
  269. /* Lockout access through VGA aperture*/
  270. WREG32(VGA_HDP_CONTROL, VGA_MEMORY_DISABLE);
  271. /* Update configuration */
  272. WREG32(MC_VM_SYSTEM_APERTURE_LOW_ADDR, rdev->mc.vram_start >> 12);
  273. WREG32(MC_VM_SYSTEM_APERTURE_HIGH_ADDR, (rdev->mc.vram_end - 1) >> 12);
  274. WREG32(MC_VM_SYSTEM_APERTURE_DEFAULT_ADDR, 0);
  275. tmp = (((rdev->mc.vram_end - 1) >> 24) & 0xFFFF) << 16;
  276. tmp |= ((rdev->mc.vram_start >> 24) & 0xFFFF);
  277. WREG32(MC_VM_FB_LOCATION, tmp);
  278. WREG32(HDP_NONSURFACE_BASE, (rdev->mc.vram_start >> 8));
  279. WREG32(HDP_NONSURFACE_INFO, (2 << 7));
  280. WREG32(HDP_NONSURFACE_SIZE, (rdev->mc.mc_vram_size - 1) | 0x3FF);
  281. if (rdev->flags & RADEON_IS_AGP) {
  282. WREG32(MC_VM_AGP_TOP, (rdev->mc.gtt_end - 1) >> 16);
  283. WREG32(MC_VM_AGP_BOT, rdev->mc.gtt_start >> 16);
  284. WREG32(MC_VM_AGP_BASE, rdev->mc.agp_base >> 22);
  285. } else {
  286. WREG32(MC_VM_AGP_BASE, 0);
  287. WREG32(MC_VM_AGP_TOP, 0x0FFFFFFF);
  288. WREG32(MC_VM_AGP_BOT, 0x0FFFFFFF);
  289. }
  290. WREG32(D1GRPH_PRIMARY_SURFACE_ADDRESS, new_d1grph_primary);
  291. WREG32(D1GRPH_SECONDARY_SURFACE_ADDRESS, new_d1grph_secondary);
  292. WREG32(D2GRPH_PRIMARY_SURFACE_ADDRESS, new_d2grph_primary);
  293. WREG32(D2GRPH_SECONDARY_SURFACE_ADDRESS, new_d2grph_secondary);
  294. WREG32(VGA_MEMORY_BASE_ADDRESS, rdev->mc.vram_start);
  295. /* Unlock host access */
  296. WREG32(VGA_HDP_CONTROL, vga_hdp_control);
  297. mdelay(1);
  298. if (r600_mc_wait_for_idle(rdev)) {
  299. printk(KERN_WARNING "[drm] MC not idle !\n");
  300. }
  301. /* Restore video state */
  302. WREG32(D1CRTC_UPDATE_LOCK, 1);
  303. WREG32(D2CRTC_UPDATE_LOCK, 1);
  304. WREG32(D1CRTC_CONTROL, d1crtc_control);
  305. WREG32(D2CRTC_CONTROL, d2crtc_control);
  306. WREG32(D1CRTC_UPDATE_LOCK, 0);
  307. WREG32(D2CRTC_UPDATE_LOCK, 0);
  308. WREG32(D1VGA_CONTROL, d1vga_control);
  309. WREG32(D2VGA_CONTROL, d2vga_control);
  310. WREG32(VGA_RENDER_CONTROL, vga_render_control);
  311. /* we need to own VRAM, so turn off the VGA renderer here
  312. * to stop it overwriting our objects */
  313. radeon_avivo_vga_render_disable(rdev);
  314. }
  315. int r600_mc_init(struct radeon_device *rdev)
  316. {
  317. fixed20_12 a;
  318. u32 tmp;
  319. int chansize;
  320. int r;
  321. /* Get VRAM informations */
  322. rdev->mc.vram_width = 128;
  323. rdev->mc.vram_is_ddr = true;
  324. tmp = RREG32(RAMCFG);
  325. if (tmp & CHANSIZE_OVERRIDE) {
  326. chansize = 16;
  327. } else if (tmp & CHANSIZE_MASK) {
  328. chansize = 64;
  329. } else {
  330. chansize = 32;
  331. }
  332. if (rdev->family == CHIP_R600) {
  333. rdev->mc.vram_width = 8 * chansize;
  334. } else if (rdev->family == CHIP_RV670) {
  335. rdev->mc.vram_width = 4 * chansize;
  336. } else if ((rdev->family == CHIP_RV610) ||
  337. (rdev->family == CHIP_RV620)) {
  338. rdev->mc.vram_width = chansize;
  339. } else if ((rdev->family == CHIP_RV630) ||
  340. (rdev->family == CHIP_RV635)) {
  341. rdev->mc.vram_width = 2 * chansize;
  342. }
  343. /* Could aper size report 0 ? */
  344. rdev->mc.aper_base = drm_get_resource_start(rdev->ddev, 0);
  345. rdev->mc.aper_size = drm_get_resource_len(rdev->ddev, 0);
  346. /* Setup GPU memory space */
  347. rdev->mc.mc_vram_size = RREG32(CONFIG_MEMSIZE);
  348. rdev->mc.real_vram_size = RREG32(CONFIG_MEMSIZE);
  349. if (rdev->flags & RADEON_IS_AGP) {
  350. r = radeon_agp_init(rdev);
  351. if (r)
  352. return r;
  353. /* gtt_size is setup by radeon_agp_init */
  354. rdev->mc.gtt_location = rdev->mc.agp_base;
  355. tmp = 0xFFFFFFFFUL - rdev->mc.agp_base - rdev->mc.gtt_size;
  356. /* Try to put vram before or after AGP because we
  357. * we want SYSTEM_APERTURE to cover both VRAM and
  358. * AGP so that GPU can catch out of VRAM/AGP access
  359. */
  360. if (rdev->mc.gtt_location > rdev->mc.mc_vram_size) {
  361. /* Enought place before */
  362. rdev->mc.vram_location = rdev->mc.gtt_location -
  363. rdev->mc.mc_vram_size;
  364. } else if (tmp > rdev->mc.mc_vram_size) {
  365. /* Enought place after */
  366. rdev->mc.vram_location = rdev->mc.gtt_location +
  367. rdev->mc.gtt_size;
  368. } else {
  369. /* Try to setup VRAM then AGP might not
  370. * not work on some card
  371. */
  372. rdev->mc.vram_location = 0x00000000UL;
  373. rdev->mc.gtt_location = rdev->mc.mc_vram_size;
  374. }
  375. } else {
  376. if (rdev->family == CHIP_RS780 || rdev->family == CHIP_RS880) {
  377. rdev->mc.vram_location = (RREG32(MC_VM_FB_LOCATION) &
  378. 0xFFFF) << 24;
  379. rdev->mc.gtt_size = radeon_gart_size * 1024 * 1024;
  380. tmp = rdev->mc.vram_location + rdev->mc.mc_vram_size;
  381. if ((0xFFFFFFFFUL - tmp) >= rdev->mc.gtt_size) {
  382. /* Enough place after vram */
  383. rdev->mc.gtt_location = tmp;
  384. } else if (rdev->mc.vram_location >= rdev->mc.gtt_size) {
  385. /* Enough place before vram */
  386. rdev->mc.gtt_location = 0;
  387. } else {
  388. /* Not enough place after or before shrink
  389. * gart size
  390. */
  391. if (rdev->mc.vram_location > (0xFFFFFFFFUL - tmp)) {
  392. rdev->mc.gtt_location = 0;
  393. rdev->mc.gtt_size = rdev->mc.vram_location;
  394. } else {
  395. rdev->mc.gtt_location = tmp;
  396. rdev->mc.gtt_size = 0xFFFFFFFFUL - tmp;
  397. }
  398. }
  399. rdev->mc.gtt_location = rdev->mc.mc_vram_size;
  400. } else {
  401. rdev->mc.vram_location = 0x00000000UL;
  402. rdev->mc.gtt_location = rdev->mc.mc_vram_size;
  403. rdev->mc.gtt_size = radeon_gart_size * 1024 * 1024;
  404. }
  405. }
  406. rdev->mc.vram_start = rdev->mc.vram_location;
  407. rdev->mc.vram_end = rdev->mc.vram_location + rdev->mc.mc_vram_size;
  408. rdev->mc.gtt_start = rdev->mc.gtt_location;
  409. rdev->mc.gtt_end = rdev->mc.gtt_location + rdev->mc.gtt_size;
  410. /* FIXME: we should enforce default clock in case GPU is not in
  411. * default setup
  412. */
  413. a.full = rfixed_const(100);
  414. rdev->pm.sclk.full = rfixed_const(rdev->clock.default_sclk);
  415. rdev->pm.sclk.full = rfixed_div(rdev->pm.sclk, a);
  416. return 0;
  417. }
  418. /* We doesn't check that the GPU really needs a reset we simply do the
  419. * reset, it's up to the caller to determine if the GPU needs one. We
  420. * might add an helper function to check that.
  421. */
  422. int r600_gpu_soft_reset(struct radeon_device *rdev)
  423. {
  424. u32 grbm_busy_mask = S_008010_VC_BUSY(1) | S_008010_VGT_BUSY_NO_DMA(1) |
  425. S_008010_VGT_BUSY(1) | S_008010_TA03_BUSY(1) |
  426. S_008010_TC_BUSY(1) | S_008010_SX_BUSY(1) |
  427. S_008010_SH_BUSY(1) | S_008010_SPI03_BUSY(1) |
  428. S_008010_SMX_BUSY(1) | S_008010_SC_BUSY(1) |
  429. S_008010_PA_BUSY(1) | S_008010_DB03_BUSY(1) |
  430. S_008010_CR_BUSY(1) | S_008010_CB03_BUSY(1) |
  431. S_008010_GUI_ACTIVE(1);
  432. u32 grbm2_busy_mask = S_008014_SPI0_BUSY(1) | S_008014_SPI1_BUSY(1) |
  433. S_008014_SPI2_BUSY(1) | S_008014_SPI3_BUSY(1) |
  434. S_008014_TA0_BUSY(1) | S_008014_TA1_BUSY(1) |
  435. S_008014_TA2_BUSY(1) | S_008014_TA3_BUSY(1) |
  436. S_008014_DB0_BUSY(1) | S_008014_DB1_BUSY(1) |
  437. S_008014_DB2_BUSY(1) | S_008014_DB3_BUSY(1) |
  438. S_008014_CB0_BUSY(1) | S_008014_CB1_BUSY(1) |
  439. S_008014_CB2_BUSY(1) | S_008014_CB3_BUSY(1);
  440. u32 srbm_reset = 0;
  441. /* Disable CP parsing/prefetching */
  442. WREG32(R_0086D8_CP_ME_CNTL, S_0086D8_CP_ME_HALT(0xff));
  443. /* Check if any of the rendering block is busy and reset it */
  444. if ((RREG32(R_008010_GRBM_STATUS) & grbm_busy_mask) ||
  445. (RREG32(R_008014_GRBM_STATUS2) & grbm2_busy_mask)) {
  446. WREG32(R_008020_GRBM_SOFT_RESET, S_008020_SOFT_RESET_CR(1) |
  447. S_008020_SOFT_RESET_DB(1) |
  448. S_008020_SOFT_RESET_CB(1) |
  449. S_008020_SOFT_RESET_PA(1) |
  450. S_008020_SOFT_RESET_SC(1) |
  451. S_008020_SOFT_RESET_SMX(1) |
  452. S_008020_SOFT_RESET_SPI(1) |
  453. S_008020_SOFT_RESET_SX(1) |
  454. S_008020_SOFT_RESET_SH(1) |
  455. S_008020_SOFT_RESET_TC(1) |
  456. S_008020_SOFT_RESET_TA(1) |
  457. S_008020_SOFT_RESET_VC(1) |
  458. S_008020_SOFT_RESET_VGT(1));
  459. (void)RREG32(R_008020_GRBM_SOFT_RESET);
  460. udelay(50);
  461. WREG32(R_008020_GRBM_SOFT_RESET, 0);
  462. (void)RREG32(R_008020_GRBM_SOFT_RESET);
  463. }
  464. /* Reset CP (we always reset CP) */
  465. WREG32(R_008020_GRBM_SOFT_RESET, S_008020_SOFT_RESET_CP(1));
  466. (void)RREG32(R_008020_GRBM_SOFT_RESET);
  467. udelay(50);
  468. WREG32(R_008020_GRBM_SOFT_RESET, 0);
  469. (void)RREG32(R_008020_GRBM_SOFT_RESET);
  470. /* Reset others GPU block if necessary */
  471. if (G_000E50_RLC_BUSY(RREG32(R_000E50_SRBM_STATUS)))
  472. srbm_reset |= S_000E60_SOFT_RESET_RLC(1);
  473. if (G_000E50_GRBM_RQ_PENDING(RREG32(R_000E50_SRBM_STATUS)))
  474. srbm_reset |= S_000E60_SOFT_RESET_GRBM(1);
  475. if (G_000E50_HI_RQ_PENDING(RREG32(R_000E50_SRBM_STATUS)))
  476. srbm_reset |= S_000E60_SOFT_RESET_IH(1);
  477. if (G_000E50_VMC_BUSY(RREG32(R_000E50_SRBM_STATUS)))
  478. srbm_reset |= S_000E60_SOFT_RESET_VMC(1);
  479. if (G_000E50_MCB_BUSY(RREG32(R_000E50_SRBM_STATUS)))
  480. srbm_reset |= S_000E60_SOFT_RESET_MC(1);
  481. if (G_000E50_MCDZ_BUSY(RREG32(R_000E50_SRBM_STATUS)))
  482. srbm_reset |= S_000E60_SOFT_RESET_MC(1);
  483. if (G_000E50_MCDY_BUSY(RREG32(R_000E50_SRBM_STATUS)))
  484. srbm_reset |= S_000E60_SOFT_RESET_MC(1);
  485. if (G_000E50_MCDX_BUSY(RREG32(R_000E50_SRBM_STATUS)))
  486. srbm_reset |= S_000E60_SOFT_RESET_MC(1);
  487. if (G_000E50_MCDW_BUSY(RREG32(R_000E50_SRBM_STATUS)))
  488. srbm_reset |= S_000E60_SOFT_RESET_MC(1);
  489. if (G_000E50_RLC_BUSY(RREG32(R_000E50_SRBM_STATUS)))
  490. srbm_reset |= S_000E60_SOFT_RESET_RLC(1);
  491. if (G_000E50_SEM_BUSY(RREG32(R_000E50_SRBM_STATUS)))
  492. srbm_reset |= S_000E60_SOFT_RESET_SEM(1);
  493. WREG32(R_000E60_SRBM_SOFT_RESET, srbm_reset);
  494. (void)RREG32(R_000E60_SRBM_SOFT_RESET);
  495. udelay(50);
  496. WREG32(R_000E60_SRBM_SOFT_RESET, 0);
  497. (void)RREG32(R_000E60_SRBM_SOFT_RESET);
  498. /* Wait a little for things to settle down */
  499. udelay(50);
  500. return 0;
  501. }
  502. int r600_gpu_reset(struct radeon_device *rdev)
  503. {
  504. return r600_gpu_soft_reset(rdev);
  505. }
  506. static u32 r600_get_tile_pipe_to_backend_map(u32 num_tile_pipes,
  507. u32 num_backends,
  508. u32 backend_disable_mask)
  509. {
  510. u32 backend_map = 0;
  511. u32 enabled_backends_mask;
  512. u32 enabled_backends_count;
  513. u32 cur_pipe;
  514. u32 swizzle_pipe[R6XX_MAX_PIPES];
  515. u32 cur_backend;
  516. u32 i;
  517. if (num_tile_pipes > R6XX_MAX_PIPES)
  518. num_tile_pipes = R6XX_MAX_PIPES;
  519. if (num_tile_pipes < 1)
  520. num_tile_pipes = 1;
  521. if (num_backends > R6XX_MAX_BACKENDS)
  522. num_backends = R6XX_MAX_BACKENDS;
  523. if (num_backends < 1)
  524. num_backends = 1;
  525. enabled_backends_mask = 0;
  526. enabled_backends_count = 0;
  527. for (i = 0; i < R6XX_MAX_BACKENDS; ++i) {
  528. if (((backend_disable_mask >> i) & 1) == 0) {
  529. enabled_backends_mask |= (1 << i);
  530. ++enabled_backends_count;
  531. }
  532. if (enabled_backends_count == num_backends)
  533. break;
  534. }
  535. if (enabled_backends_count == 0) {
  536. enabled_backends_mask = 1;
  537. enabled_backends_count = 1;
  538. }
  539. if (enabled_backends_count != num_backends)
  540. num_backends = enabled_backends_count;
  541. memset((uint8_t *)&swizzle_pipe[0], 0, sizeof(u32) * R6XX_MAX_PIPES);
  542. switch (num_tile_pipes) {
  543. case 1:
  544. swizzle_pipe[0] = 0;
  545. break;
  546. case 2:
  547. swizzle_pipe[0] = 0;
  548. swizzle_pipe[1] = 1;
  549. break;
  550. case 3:
  551. swizzle_pipe[0] = 0;
  552. swizzle_pipe[1] = 1;
  553. swizzle_pipe[2] = 2;
  554. break;
  555. case 4:
  556. swizzle_pipe[0] = 0;
  557. swizzle_pipe[1] = 1;
  558. swizzle_pipe[2] = 2;
  559. swizzle_pipe[3] = 3;
  560. break;
  561. case 5:
  562. swizzle_pipe[0] = 0;
  563. swizzle_pipe[1] = 1;
  564. swizzle_pipe[2] = 2;
  565. swizzle_pipe[3] = 3;
  566. swizzle_pipe[4] = 4;
  567. break;
  568. case 6:
  569. swizzle_pipe[0] = 0;
  570. swizzle_pipe[1] = 2;
  571. swizzle_pipe[2] = 4;
  572. swizzle_pipe[3] = 5;
  573. swizzle_pipe[4] = 1;
  574. swizzle_pipe[5] = 3;
  575. break;
  576. case 7:
  577. swizzle_pipe[0] = 0;
  578. swizzle_pipe[1] = 2;
  579. swizzle_pipe[2] = 4;
  580. swizzle_pipe[3] = 6;
  581. swizzle_pipe[4] = 1;
  582. swizzle_pipe[5] = 3;
  583. swizzle_pipe[6] = 5;
  584. break;
  585. case 8:
  586. swizzle_pipe[0] = 0;
  587. swizzle_pipe[1] = 2;
  588. swizzle_pipe[2] = 4;
  589. swizzle_pipe[3] = 6;
  590. swizzle_pipe[4] = 1;
  591. swizzle_pipe[5] = 3;
  592. swizzle_pipe[6] = 5;
  593. swizzle_pipe[7] = 7;
  594. break;
  595. }
  596. cur_backend = 0;
  597. for (cur_pipe = 0; cur_pipe < num_tile_pipes; ++cur_pipe) {
  598. while (((1 << cur_backend) & enabled_backends_mask) == 0)
  599. cur_backend = (cur_backend + 1) % R6XX_MAX_BACKENDS;
  600. backend_map |= (u32)(((cur_backend & 3) << (swizzle_pipe[cur_pipe] * 2)));
  601. cur_backend = (cur_backend + 1) % R6XX_MAX_BACKENDS;
  602. }
  603. return backend_map;
  604. }
  605. int r600_count_pipe_bits(uint32_t val)
  606. {
  607. int i, ret = 0;
  608. for (i = 0; i < 32; i++) {
  609. ret += val & 1;
  610. val >>= 1;
  611. }
  612. return ret;
  613. }
  614. void r600_gpu_init(struct radeon_device *rdev)
  615. {
  616. u32 tiling_config;
  617. u32 ramcfg;
  618. u32 tmp;
  619. int i, j;
  620. u32 sq_config;
  621. u32 sq_gpr_resource_mgmt_1 = 0;
  622. u32 sq_gpr_resource_mgmt_2 = 0;
  623. u32 sq_thread_resource_mgmt = 0;
  624. u32 sq_stack_resource_mgmt_1 = 0;
  625. u32 sq_stack_resource_mgmt_2 = 0;
  626. /* FIXME: implement */
  627. switch (rdev->family) {
  628. case CHIP_R600:
  629. rdev->config.r600.max_pipes = 4;
  630. rdev->config.r600.max_tile_pipes = 8;
  631. rdev->config.r600.max_simds = 4;
  632. rdev->config.r600.max_backends = 4;
  633. rdev->config.r600.max_gprs = 256;
  634. rdev->config.r600.max_threads = 192;
  635. rdev->config.r600.max_stack_entries = 256;
  636. rdev->config.r600.max_hw_contexts = 8;
  637. rdev->config.r600.max_gs_threads = 16;
  638. rdev->config.r600.sx_max_export_size = 128;
  639. rdev->config.r600.sx_max_export_pos_size = 16;
  640. rdev->config.r600.sx_max_export_smx_size = 128;
  641. rdev->config.r600.sq_num_cf_insts = 2;
  642. break;
  643. case CHIP_RV630:
  644. case CHIP_RV635:
  645. rdev->config.r600.max_pipes = 2;
  646. rdev->config.r600.max_tile_pipes = 2;
  647. rdev->config.r600.max_simds = 3;
  648. rdev->config.r600.max_backends = 1;
  649. rdev->config.r600.max_gprs = 128;
  650. rdev->config.r600.max_threads = 192;
  651. rdev->config.r600.max_stack_entries = 128;
  652. rdev->config.r600.max_hw_contexts = 8;
  653. rdev->config.r600.max_gs_threads = 4;
  654. rdev->config.r600.sx_max_export_size = 128;
  655. rdev->config.r600.sx_max_export_pos_size = 16;
  656. rdev->config.r600.sx_max_export_smx_size = 128;
  657. rdev->config.r600.sq_num_cf_insts = 2;
  658. break;
  659. case CHIP_RV610:
  660. case CHIP_RV620:
  661. case CHIP_RS780:
  662. case CHIP_RS880:
  663. rdev->config.r600.max_pipes = 1;
  664. rdev->config.r600.max_tile_pipes = 1;
  665. rdev->config.r600.max_simds = 2;
  666. rdev->config.r600.max_backends = 1;
  667. rdev->config.r600.max_gprs = 128;
  668. rdev->config.r600.max_threads = 192;
  669. rdev->config.r600.max_stack_entries = 128;
  670. rdev->config.r600.max_hw_contexts = 4;
  671. rdev->config.r600.max_gs_threads = 4;
  672. rdev->config.r600.sx_max_export_size = 128;
  673. rdev->config.r600.sx_max_export_pos_size = 16;
  674. rdev->config.r600.sx_max_export_smx_size = 128;
  675. rdev->config.r600.sq_num_cf_insts = 1;
  676. break;
  677. case CHIP_RV670:
  678. rdev->config.r600.max_pipes = 4;
  679. rdev->config.r600.max_tile_pipes = 4;
  680. rdev->config.r600.max_simds = 4;
  681. rdev->config.r600.max_backends = 4;
  682. rdev->config.r600.max_gprs = 192;
  683. rdev->config.r600.max_threads = 192;
  684. rdev->config.r600.max_stack_entries = 256;
  685. rdev->config.r600.max_hw_contexts = 8;
  686. rdev->config.r600.max_gs_threads = 16;
  687. rdev->config.r600.sx_max_export_size = 128;
  688. rdev->config.r600.sx_max_export_pos_size = 16;
  689. rdev->config.r600.sx_max_export_smx_size = 128;
  690. rdev->config.r600.sq_num_cf_insts = 2;
  691. break;
  692. default:
  693. break;
  694. }
  695. /* Initialize HDP */
  696. for (i = 0, j = 0; i < 32; i++, j += 0x18) {
  697. WREG32((0x2c14 + j), 0x00000000);
  698. WREG32((0x2c18 + j), 0x00000000);
  699. WREG32((0x2c1c + j), 0x00000000);
  700. WREG32((0x2c20 + j), 0x00000000);
  701. WREG32((0x2c24 + j), 0x00000000);
  702. }
  703. WREG32(GRBM_CNTL, GRBM_READ_TIMEOUT(0xff));
  704. /* Setup tiling */
  705. tiling_config = 0;
  706. ramcfg = RREG32(RAMCFG);
  707. switch (rdev->config.r600.max_tile_pipes) {
  708. case 1:
  709. tiling_config |= PIPE_TILING(0);
  710. break;
  711. case 2:
  712. tiling_config |= PIPE_TILING(1);
  713. break;
  714. case 4:
  715. tiling_config |= PIPE_TILING(2);
  716. break;
  717. case 8:
  718. tiling_config |= PIPE_TILING(3);
  719. break;
  720. default:
  721. break;
  722. }
  723. tiling_config |= BANK_TILING((ramcfg & NOOFBANK_MASK) >> NOOFBANK_SHIFT);
  724. tiling_config |= GROUP_SIZE(0);
  725. tmp = (ramcfg & NOOFROWS_MASK) >> NOOFROWS_SHIFT;
  726. if (tmp > 3) {
  727. tiling_config |= ROW_TILING(3);
  728. tiling_config |= SAMPLE_SPLIT(3);
  729. } else {
  730. tiling_config |= ROW_TILING(tmp);
  731. tiling_config |= SAMPLE_SPLIT(tmp);
  732. }
  733. tiling_config |= BANK_SWAPS(1);
  734. tmp = r600_get_tile_pipe_to_backend_map(rdev->config.r600.max_tile_pipes,
  735. rdev->config.r600.max_backends,
  736. (0xff << rdev->config.r600.max_backends) & 0xff);
  737. tiling_config |= BACKEND_MAP(tmp);
  738. WREG32(GB_TILING_CONFIG, tiling_config);
  739. WREG32(DCP_TILING_CONFIG, tiling_config & 0xffff);
  740. WREG32(HDP_TILING_CONFIG, tiling_config & 0xffff);
  741. tmp = BACKEND_DISABLE((R6XX_MAX_BACKENDS_MASK << rdev->config.r600.max_backends) & R6XX_MAX_BACKENDS_MASK);
  742. WREG32(CC_RB_BACKEND_DISABLE, tmp);
  743. /* Setup pipes */
  744. tmp = INACTIVE_QD_PIPES((R6XX_MAX_PIPES_MASK << rdev->config.r600.max_pipes) & R6XX_MAX_PIPES_MASK);
  745. tmp |= INACTIVE_SIMDS((R6XX_MAX_SIMDS_MASK << rdev->config.r600.max_simds) & R6XX_MAX_SIMDS_MASK);
  746. WREG32(CC_GC_SHADER_PIPE_CONFIG, tmp);
  747. WREG32(GC_USER_SHADER_PIPE_CONFIG, tmp);
  748. tmp = R6XX_MAX_BACKENDS - r600_count_pipe_bits(tmp & INACTIVE_QD_PIPES_MASK);
  749. WREG32(VGT_OUT_DEALLOC_CNTL, (tmp * 4) & DEALLOC_DIST_MASK);
  750. WREG32(VGT_VERTEX_REUSE_BLOCK_CNTL, ((tmp * 4) - 2) & VTX_REUSE_DEPTH_MASK);
  751. /* Setup some CP states */
  752. WREG32(CP_QUEUE_THRESHOLDS, (ROQ_IB1_START(0x16) | ROQ_IB2_START(0x2b)));
  753. WREG32(CP_MEQ_THRESHOLDS, (MEQ_END(0x40) | ROQ_END(0x40)));
  754. WREG32(TA_CNTL_AUX, (DISABLE_CUBE_ANISO | SYNC_GRADIENT |
  755. SYNC_WALKER | SYNC_ALIGNER));
  756. /* Setup various GPU states */
  757. if (rdev->family == CHIP_RV670)
  758. WREG32(ARB_GDEC_RD_CNTL, 0x00000021);
  759. tmp = RREG32(SX_DEBUG_1);
  760. tmp |= SMX_EVENT_RELEASE;
  761. if ((rdev->family > CHIP_R600))
  762. tmp |= ENABLE_NEW_SMX_ADDRESS;
  763. WREG32(SX_DEBUG_1, tmp);
  764. if (((rdev->family) == CHIP_R600) ||
  765. ((rdev->family) == CHIP_RV630) ||
  766. ((rdev->family) == CHIP_RV610) ||
  767. ((rdev->family) == CHIP_RV620) ||
  768. ((rdev->family) == CHIP_RS780)) {
  769. WREG32(DB_DEBUG, PREZ_MUST_WAIT_FOR_POSTZ_DONE);
  770. } else {
  771. WREG32(DB_DEBUG, 0);
  772. }
  773. WREG32(DB_WATERMARKS, (DEPTH_FREE(4) | DEPTH_CACHELINE_FREE(16) |
  774. DEPTH_FLUSH(16) | DEPTH_PENDING_FREE(4)));
  775. WREG32(PA_SC_MULTI_CHIP_CNTL, 0);
  776. WREG32(VGT_NUM_INSTANCES, 0);
  777. WREG32(SPI_CONFIG_CNTL, GPR_WRITE_PRIORITY(0));
  778. WREG32(SPI_CONFIG_CNTL_1, VTX_DONE_DELAY(0));
  779. tmp = RREG32(SQ_MS_FIFO_SIZES);
  780. if (((rdev->family) == CHIP_RV610) ||
  781. ((rdev->family) == CHIP_RV620) ||
  782. ((rdev->family) == CHIP_RS780)) {
  783. tmp = (CACHE_FIFO_SIZE(0xa) |
  784. FETCH_FIFO_HIWATER(0xa) |
  785. DONE_FIFO_HIWATER(0xe0) |
  786. ALU_UPDATE_FIFO_HIWATER(0x8));
  787. } else if (((rdev->family) == CHIP_R600) ||
  788. ((rdev->family) == CHIP_RV630)) {
  789. tmp &= ~DONE_FIFO_HIWATER(0xff);
  790. tmp |= DONE_FIFO_HIWATER(0x4);
  791. }
  792. WREG32(SQ_MS_FIFO_SIZES, tmp);
  793. /* SQ_CONFIG, SQ_GPR_RESOURCE_MGMT, SQ_THREAD_RESOURCE_MGMT, SQ_STACK_RESOURCE_MGMT
  794. * should be adjusted as needed by the 2D/3D drivers. This just sets default values
  795. */
  796. sq_config = RREG32(SQ_CONFIG);
  797. sq_config &= ~(PS_PRIO(3) |
  798. VS_PRIO(3) |
  799. GS_PRIO(3) |
  800. ES_PRIO(3));
  801. sq_config |= (DX9_CONSTS |
  802. VC_ENABLE |
  803. PS_PRIO(0) |
  804. VS_PRIO(1) |
  805. GS_PRIO(2) |
  806. ES_PRIO(3));
  807. if ((rdev->family) == CHIP_R600) {
  808. sq_gpr_resource_mgmt_1 = (NUM_PS_GPRS(124) |
  809. NUM_VS_GPRS(124) |
  810. NUM_CLAUSE_TEMP_GPRS(4));
  811. sq_gpr_resource_mgmt_2 = (NUM_GS_GPRS(0) |
  812. NUM_ES_GPRS(0));
  813. sq_thread_resource_mgmt = (NUM_PS_THREADS(136) |
  814. NUM_VS_THREADS(48) |
  815. NUM_GS_THREADS(4) |
  816. NUM_ES_THREADS(4));
  817. sq_stack_resource_mgmt_1 = (NUM_PS_STACK_ENTRIES(128) |
  818. NUM_VS_STACK_ENTRIES(128));
  819. sq_stack_resource_mgmt_2 = (NUM_GS_STACK_ENTRIES(0) |
  820. NUM_ES_STACK_ENTRIES(0));
  821. } else if (((rdev->family) == CHIP_RV610) ||
  822. ((rdev->family) == CHIP_RV620) ||
  823. ((rdev->family) == CHIP_RS780)) {
  824. /* no vertex cache */
  825. sq_config &= ~VC_ENABLE;
  826. sq_gpr_resource_mgmt_1 = (NUM_PS_GPRS(44) |
  827. NUM_VS_GPRS(44) |
  828. NUM_CLAUSE_TEMP_GPRS(2));
  829. sq_gpr_resource_mgmt_2 = (NUM_GS_GPRS(17) |
  830. NUM_ES_GPRS(17));
  831. sq_thread_resource_mgmt = (NUM_PS_THREADS(79) |
  832. NUM_VS_THREADS(78) |
  833. NUM_GS_THREADS(4) |
  834. NUM_ES_THREADS(31));
  835. sq_stack_resource_mgmt_1 = (NUM_PS_STACK_ENTRIES(40) |
  836. NUM_VS_STACK_ENTRIES(40));
  837. sq_stack_resource_mgmt_2 = (NUM_GS_STACK_ENTRIES(32) |
  838. NUM_ES_STACK_ENTRIES(16));
  839. } else if (((rdev->family) == CHIP_RV630) ||
  840. ((rdev->family) == CHIP_RV635)) {
  841. sq_gpr_resource_mgmt_1 = (NUM_PS_GPRS(44) |
  842. NUM_VS_GPRS(44) |
  843. NUM_CLAUSE_TEMP_GPRS(2));
  844. sq_gpr_resource_mgmt_2 = (NUM_GS_GPRS(18) |
  845. NUM_ES_GPRS(18));
  846. sq_thread_resource_mgmt = (NUM_PS_THREADS(79) |
  847. NUM_VS_THREADS(78) |
  848. NUM_GS_THREADS(4) |
  849. NUM_ES_THREADS(31));
  850. sq_stack_resource_mgmt_1 = (NUM_PS_STACK_ENTRIES(40) |
  851. NUM_VS_STACK_ENTRIES(40));
  852. sq_stack_resource_mgmt_2 = (NUM_GS_STACK_ENTRIES(32) |
  853. NUM_ES_STACK_ENTRIES(16));
  854. } else if ((rdev->family) == CHIP_RV670) {
  855. sq_gpr_resource_mgmt_1 = (NUM_PS_GPRS(44) |
  856. NUM_VS_GPRS(44) |
  857. NUM_CLAUSE_TEMP_GPRS(2));
  858. sq_gpr_resource_mgmt_2 = (NUM_GS_GPRS(17) |
  859. NUM_ES_GPRS(17));
  860. sq_thread_resource_mgmt = (NUM_PS_THREADS(79) |
  861. NUM_VS_THREADS(78) |
  862. NUM_GS_THREADS(4) |
  863. NUM_ES_THREADS(31));
  864. sq_stack_resource_mgmt_1 = (NUM_PS_STACK_ENTRIES(64) |
  865. NUM_VS_STACK_ENTRIES(64));
  866. sq_stack_resource_mgmt_2 = (NUM_GS_STACK_ENTRIES(64) |
  867. NUM_ES_STACK_ENTRIES(64));
  868. }
  869. WREG32(SQ_CONFIG, sq_config);
  870. WREG32(SQ_GPR_RESOURCE_MGMT_1, sq_gpr_resource_mgmt_1);
  871. WREG32(SQ_GPR_RESOURCE_MGMT_2, sq_gpr_resource_mgmt_2);
  872. WREG32(SQ_THREAD_RESOURCE_MGMT, sq_thread_resource_mgmt);
  873. WREG32(SQ_STACK_RESOURCE_MGMT_1, sq_stack_resource_mgmt_1);
  874. WREG32(SQ_STACK_RESOURCE_MGMT_2, sq_stack_resource_mgmt_2);
  875. if (((rdev->family) == CHIP_RV610) ||
  876. ((rdev->family) == CHIP_RV620) ||
  877. ((rdev->family) == CHIP_RS780)) {
  878. WREG32(VGT_CACHE_INVALIDATION, CACHE_INVALIDATION(TC_ONLY));
  879. } else {
  880. WREG32(VGT_CACHE_INVALIDATION, CACHE_INVALIDATION(VC_AND_TC));
  881. }
  882. /* More default values. 2D/3D driver should adjust as needed */
  883. WREG32(PA_SC_AA_SAMPLE_LOCS_2S, (S0_X(0xc) | S0_Y(0x4) |
  884. S1_X(0x4) | S1_Y(0xc)));
  885. WREG32(PA_SC_AA_SAMPLE_LOCS_4S, (S0_X(0xe) | S0_Y(0xe) |
  886. S1_X(0x2) | S1_Y(0x2) |
  887. S2_X(0xa) | S2_Y(0x6) |
  888. S3_X(0x6) | S3_Y(0xa)));
  889. WREG32(PA_SC_AA_SAMPLE_LOCS_8S_WD0, (S0_X(0xe) | S0_Y(0xb) |
  890. S1_X(0x4) | S1_Y(0xc) |
  891. S2_X(0x1) | S2_Y(0x6) |
  892. S3_X(0xa) | S3_Y(0xe)));
  893. WREG32(PA_SC_AA_SAMPLE_LOCS_8S_WD1, (S4_X(0x6) | S4_Y(0x1) |
  894. S5_X(0x0) | S5_Y(0x0) |
  895. S6_X(0xb) | S6_Y(0x4) |
  896. S7_X(0x7) | S7_Y(0x8)));
  897. WREG32(VGT_STRMOUT_EN, 0);
  898. tmp = rdev->config.r600.max_pipes * 16;
  899. switch (rdev->family) {
  900. case CHIP_RV610:
  901. case CHIP_RS780:
  902. case CHIP_RV620:
  903. tmp += 32;
  904. break;
  905. case CHIP_RV670:
  906. tmp += 128;
  907. break;
  908. default:
  909. break;
  910. }
  911. if (tmp > 256) {
  912. tmp = 256;
  913. }
  914. WREG32(VGT_ES_PER_GS, 128);
  915. WREG32(VGT_GS_PER_ES, tmp);
  916. WREG32(VGT_GS_PER_VS, 2);
  917. WREG32(VGT_GS_VERTEX_REUSE, 16);
  918. /* more default values. 2D/3D driver should adjust as needed */
  919. WREG32(PA_SC_LINE_STIPPLE_STATE, 0);
  920. WREG32(VGT_STRMOUT_EN, 0);
  921. WREG32(SX_MISC, 0);
  922. WREG32(PA_SC_MODE_CNTL, 0);
  923. WREG32(PA_SC_AA_CONFIG, 0);
  924. WREG32(PA_SC_LINE_STIPPLE, 0);
  925. WREG32(SPI_INPUT_Z, 0);
  926. WREG32(SPI_PS_IN_CONTROL_0, NUM_INTERP(2));
  927. WREG32(CB_COLOR7_FRAG, 0);
  928. /* Clear render buffer base addresses */
  929. WREG32(CB_COLOR0_BASE, 0);
  930. WREG32(CB_COLOR1_BASE, 0);
  931. WREG32(CB_COLOR2_BASE, 0);
  932. WREG32(CB_COLOR3_BASE, 0);
  933. WREG32(CB_COLOR4_BASE, 0);
  934. WREG32(CB_COLOR5_BASE, 0);
  935. WREG32(CB_COLOR6_BASE, 0);
  936. WREG32(CB_COLOR7_BASE, 0);
  937. WREG32(CB_COLOR7_FRAG, 0);
  938. switch (rdev->family) {
  939. case CHIP_RV610:
  940. case CHIP_RS780:
  941. case CHIP_RV620:
  942. tmp = TC_L2_SIZE(8);
  943. break;
  944. case CHIP_RV630:
  945. case CHIP_RV635:
  946. tmp = TC_L2_SIZE(4);
  947. break;
  948. case CHIP_R600:
  949. tmp = TC_L2_SIZE(0) | L2_DISABLE_LATE_HIT;
  950. break;
  951. default:
  952. tmp = TC_L2_SIZE(0);
  953. break;
  954. }
  955. WREG32(TC_CNTL, tmp);
  956. tmp = RREG32(HDP_HOST_PATH_CNTL);
  957. WREG32(HDP_HOST_PATH_CNTL, tmp);
  958. tmp = RREG32(ARB_POP);
  959. tmp |= ENABLE_TC128;
  960. WREG32(ARB_POP, tmp);
  961. WREG32(PA_SC_MULTI_CHIP_CNTL, 0);
  962. WREG32(PA_CL_ENHANCE, (CLIP_VTX_REORDER_ENA |
  963. NUM_CLIP_SEQ(3)));
  964. WREG32(PA_SC_ENHANCE, FORCE_EOV_MAX_CLK_CNT(4095));
  965. }
  966. /*
  967. * Indirect registers accessor
  968. */
  969. u32 r600_pciep_rreg(struct radeon_device *rdev, u32 reg)
  970. {
  971. u32 r;
  972. WREG32(PCIE_PORT_INDEX, ((reg) & 0xff));
  973. (void)RREG32(PCIE_PORT_INDEX);
  974. r = RREG32(PCIE_PORT_DATA);
  975. return r;
  976. }
  977. void r600_pciep_wreg(struct radeon_device *rdev, u32 reg, u32 v)
  978. {
  979. WREG32(PCIE_PORT_INDEX, ((reg) & 0xff));
  980. (void)RREG32(PCIE_PORT_INDEX);
  981. WREG32(PCIE_PORT_DATA, (v));
  982. (void)RREG32(PCIE_PORT_DATA);
  983. }
  984. /*
  985. * CP & Ring
  986. */
  987. void r600_cp_stop(struct radeon_device *rdev)
  988. {
  989. WREG32(R_0086D8_CP_ME_CNTL, S_0086D8_CP_ME_HALT(1));
  990. }
  991. int r600_cp_init_microcode(struct radeon_device *rdev)
  992. {
  993. struct platform_device *pdev;
  994. const char *chip_name;
  995. size_t pfp_req_size, me_req_size;
  996. char fw_name[30];
  997. int err;
  998. DRM_DEBUG("\n");
  999. pdev = platform_device_register_simple("radeon_cp", 0, NULL, 0);
  1000. err = IS_ERR(pdev);
  1001. if (err) {
  1002. printk(KERN_ERR "radeon_cp: Failed to register firmware\n");
  1003. return -EINVAL;
  1004. }
  1005. switch (rdev->family) {
  1006. case CHIP_R600: chip_name = "R600"; break;
  1007. case CHIP_RV610: chip_name = "RV610"; break;
  1008. case CHIP_RV630: chip_name = "RV630"; break;
  1009. case CHIP_RV620: chip_name = "RV620"; break;
  1010. case CHIP_RV635: chip_name = "RV635"; break;
  1011. case CHIP_RV670: chip_name = "RV670"; break;
  1012. case CHIP_RS780:
  1013. case CHIP_RS880: chip_name = "RS780"; break;
  1014. case CHIP_RV770: chip_name = "RV770"; break;
  1015. case CHIP_RV730:
  1016. case CHIP_RV740: chip_name = "RV730"; break;
  1017. case CHIP_RV710: chip_name = "RV710"; break;
  1018. default: BUG();
  1019. }
  1020. if (rdev->family >= CHIP_RV770) {
  1021. pfp_req_size = R700_PFP_UCODE_SIZE * 4;
  1022. me_req_size = R700_PM4_UCODE_SIZE * 4;
  1023. } else {
  1024. pfp_req_size = PFP_UCODE_SIZE * 4;
  1025. me_req_size = PM4_UCODE_SIZE * 12;
  1026. }
  1027. DRM_INFO("Loading %s CP Microcode\n", chip_name);
  1028. snprintf(fw_name, sizeof(fw_name), "radeon/%s_pfp.bin", chip_name);
  1029. err = request_firmware(&rdev->pfp_fw, fw_name, &pdev->dev);
  1030. if (err)
  1031. goto out;
  1032. if (rdev->pfp_fw->size != pfp_req_size) {
  1033. printk(KERN_ERR
  1034. "r600_cp: Bogus length %zu in firmware \"%s\"\n",
  1035. rdev->pfp_fw->size, fw_name);
  1036. err = -EINVAL;
  1037. goto out;
  1038. }
  1039. snprintf(fw_name, sizeof(fw_name), "radeon/%s_me.bin", chip_name);
  1040. err = request_firmware(&rdev->me_fw, fw_name, &pdev->dev);
  1041. if (err)
  1042. goto out;
  1043. if (rdev->me_fw->size != me_req_size) {
  1044. printk(KERN_ERR
  1045. "r600_cp: Bogus length %zu in firmware \"%s\"\n",
  1046. rdev->me_fw->size, fw_name);
  1047. err = -EINVAL;
  1048. }
  1049. out:
  1050. platform_device_unregister(pdev);
  1051. if (err) {
  1052. if (err != -EINVAL)
  1053. printk(KERN_ERR
  1054. "r600_cp: Failed to load firmware \"%s\"\n",
  1055. fw_name);
  1056. release_firmware(rdev->pfp_fw);
  1057. rdev->pfp_fw = NULL;
  1058. release_firmware(rdev->me_fw);
  1059. rdev->me_fw = NULL;
  1060. }
  1061. return err;
  1062. }
  1063. static int r600_cp_load_microcode(struct radeon_device *rdev)
  1064. {
  1065. const __be32 *fw_data;
  1066. int i;
  1067. if (!rdev->me_fw || !rdev->pfp_fw)
  1068. return -EINVAL;
  1069. r600_cp_stop(rdev);
  1070. WREG32(CP_RB_CNTL, RB_NO_UPDATE | RB_BLKSZ(15) | RB_BUFSZ(3));
  1071. /* Reset cp */
  1072. WREG32(GRBM_SOFT_RESET, SOFT_RESET_CP);
  1073. RREG32(GRBM_SOFT_RESET);
  1074. mdelay(15);
  1075. WREG32(GRBM_SOFT_RESET, 0);
  1076. WREG32(CP_ME_RAM_WADDR, 0);
  1077. fw_data = (const __be32 *)rdev->me_fw->data;
  1078. WREG32(CP_ME_RAM_WADDR, 0);
  1079. for (i = 0; i < PM4_UCODE_SIZE * 3; i++)
  1080. WREG32(CP_ME_RAM_DATA,
  1081. be32_to_cpup(fw_data++));
  1082. fw_data = (const __be32 *)rdev->pfp_fw->data;
  1083. WREG32(CP_PFP_UCODE_ADDR, 0);
  1084. for (i = 0; i < PFP_UCODE_SIZE; i++)
  1085. WREG32(CP_PFP_UCODE_DATA,
  1086. be32_to_cpup(fw_data++));
  1087. WREG32(CP_PFP_UCODE_ADDR, 0);
  1088. WREG32(CP_ME_RAM_WADDR, 0);
  1089. WREG32(CP_ME_RAM_RADDR, 0);
  1090. return 0;
  1091. }
  1092. int r600_cp_start(struct radeon_device *rdev)
  1093. {
  1094. int r;
  1095. uint32_t cp_me;
  1096. r = radeon_ring_lock(rdev, 7);
  1097. if (r) {
  1098. DRM_ERROR("radeon: cp failed to lock ring (%d).\n", r);
  1099. return r;
  1100. }
  1101. radeon_ring_write(rdev, PACKET3(PACKET3_ME_INITIALIZE, 5));
  1102. radeon_ring_write(rdev, 0x1);
  1103. if (rdev->family < CHIP_RV770) {
  1104. radeon_ring_write(rdev, 0x3);
  1105. radeon_ring_write(rdev, rdev->config.r600.max_hw_contexts - 1);
  1106. } else {
  1107. radeon_ring_write(rdev, 0x0);
  1108. radeon_ring_write(rdev, rdev->config.rv770.max_hw_contexts - 1);
  1109. }
  1110. radeon_ring_write(rdev, PACKET3_ME_INITIALIZE_DEVICE_ID(1));
  1111. radeon_ring_write(rdev, 0);
  1112. radeon_ring_write(rdev, 0);
  1113. radeon_ring_unlock_commit(rdev);
  1114. cp_me = 0xff;
  1115. WREG32(R_0086D8_CP_ME_CNTL, cp_me);
  1116. return 0;
  1117. }
  1118. int r600_cp_resume(struct radeon_device *rdev)
  1119. {
  1120. u32 tmp;
  1121. u32 rb_bufsz;
  1122. int r;
  1123. /* Reset cp */
  1124. WREG32(GRBM_SOFT_RESET, SOFT_RESET_CP);
  1125. RREG32(GRBM_SOFT_RESET);
  1126. mdelay(15);
  1127. WREG32(GRBM_SOFT_RESET, 0);
  1128. /* Set ring buffer size */
  1129. rb_bufsz = drm_order(rdev->cp.ring_size / 8);
  1130. #ifdef __BIG_ENDIAN
  1131. WREG32(CP_RB_CNTL, BUF_SWAP_32BIT | RB_NO_UPDATE |
  1132. (drm_order(4096/8) << 8) | rb_bufsz);
  1133. #else
  1134. WREG32(CP_RB_CNTL, RB_NO_UPDATE | (drm_order(4096/8) << 8) | rb_bufsz);
  1135. #endif
  1136. WREG32(CP_SEM_WAIT_TIMER, 0x4);
  1137. /* Set the write pointer delay */
  1138. WREG32(CP_RB_WPTR_DELAY, 0);
  1139. /* Initialize the ring buffer's read and write pointers */
  1140. tmp = RREG32(CP_RB_CNTL);
  1141. WREG32(CP_RB_CNTL, tmp | RB_RPTR_WR_ENA);
  1142. WREG32(CP_RB_RPTR_WR, 0);
  1143. WREG32(CP_RB_WPTR, 0);
  1144. WREG32(CP_RB_RPTR_ADDR, rdev->cp.gpu_addr & 0xFFFFFFFF);
  1145. WREG32(CP_RB_RPTR_ADDR_HI, upper_32_bits(rdev->cp.gpu_addr));
  1146. mdelay(1);
  1147. WREG32(CP_RB_CNTL, tmp);
  1148. WREG32(CP_RB_BASE, rdev->cp.gpu_addr >> 8);
  1149. WREG32(CP_DEBUG, (1 << 27) | (1 << 28));
  1150. rdev->cp.rptr = RREG32(CP_RB_RPTR);
  1151. rdev->cp.wptr = RREG32(CP_RB_WPTR);
  1152. r600_cp_start(rdev);
  1153. rdev->cp.ready = true;
  1154. r = radeon_ring_test(rdev);
  1155. if (r) {
  1156. rdev->cp.ready = false;
  1157. return r;
  1158. }
  1159. return 0;
  1160. }
  1161. void r600_cp_commit(struct radeon_device *rdev)
  1162. {
  1163. WREG32(CP_RB_WPTR, rdev->cp.wptr);
  1164. (void)RREG32(CP_RB_WPTR);
  1165. }
  1166. void r600_ring_init(struct radeon_device *rdev, unsigned ring_size)
  1167. {
  1168. u32 rb_bufsz;
  1169. /* Align ring size */
  1170. rb_bufsz = drm_order(ring_size / 8);
  1171. ring_size = (1 << (rb_bufsz + 1)) * 4;
  1172. rdev->cp.ring_size = ring_size;
  1173. rdev->cp.align_mask = 16 - 1;
  1174. }
  1175. /*
  1176. * GPU scratch registers helpers function.
  1177. */
  1178. void r600_scratch_init(struct radeon_device *rdev)
  1179. {
  1180. int i;
  1181. rdev->scratch.num_reg = 7;
  1182. for (i = 0; i < rdev->scratch.num_reg; i++) {
  1183. rdev->scratch.free[i] = true;
  1184. rdev->scratch.reg[i] = SCRATCH_REG0 + (i * 4);
  1185. }
  1186. }
  1187. int r600_ring_test(struct radeon_device *rdev)
  1188. {
  1189. uint32_t scratch;
  1190. uint32_t tmp = 0;
  1191. unsigned i;
  1192. int r;
  1193. r = radeon_scratch_get(rdev, &scratch);
  1194. if (r) {
  1195. DRM_ERROR("radeon: cp failed to get scratch reg (%d).\n", r);
  1196. return r;
  1197. }
  1198. WREG32(scratch, 0xCAFEDEAD);
  1199. r = radeon_ring_lock(rdev, 3);
  1200. if (r) {
  1201. DRM_ERROR("radeon: cp failed to lock ring (%d).\n", r);
  1202. radeon_scratch_free(rdev, scratch);
  1203. return r;
  1204. }
  1205. radeon_ring_write(rdev, PACKET3(PACKET3_SET_CONFIG_REG, 1));
  1206. radeon_ring_write(rdev, ((scratch - PACKET3_SET_CONFIG_REG_OFFSET) >> 2));
  1207. radeon_ring_write(rdev, 0xDEADBEEF);
  1208. radeon_ring_unlock_commit(rdev);
  1209. for (i = 0; i < rdev->usec_timeout; i++) {
  1210. tmp = RREG32(scratch);
  1211. if (tmp == 0xDEADBEEF)
  1212. break;
  1213. DRM_UDELAY(1);
  1214. }
  1215. if (i < rdev->usec_timeout) {
  1216. DRM_INFO("ring test succeeded in %d usecs\n", i);
  1217. } else {
  1218. DRM_ERROR("radeon: ring test failed (scratch(0x%04X)=0x%08X)\n",
  1219. scratch, tmp);
  1220. r = -EINVAL;
  1221. }
  1222. radeon_scratch_free(rdev, scratch);
  1223. return r;
  1224. }
  1225. /*
  1226. * Writeback
  1227. */
  1228. int r600_wb_init(struct radeon_device *rdev)
  1229. {
  1230. int r;
  1231. if (rdev->wb.wb_obj == NULL) {
  1232. r = radeon_object_create(rdev, NULL, 4096,
  1233. true,
  1234. RADEON_GEM_DOMAIN_GTT,
  1235. false, &rdev->wb.wb_obj);
  1236. if (r) {
  1237. DRM_ERROR("radeon: failed to create WB buffer (%d).\n", r);
  1238. return r;
  1239. }
  1240. r = radeon_object_pin(rdev->wb.wb_obj,
  1241. RADEON_GEM_DOMAIN_GTT,
  1242. &rdev->wb.gpu_addr);
  1243. if (r) {
  1244. DRM_ERROR("radeon: failed to pin WB buffer (%d).\n", r);
  1245. return r;
  1246. }
  1247. r = radeon_object_kmap(rdev->wb.wb_obj, (void **)&rdev->wb.wb);
  1248. if (r) {
  1249. DRM_ERROR("radeon: failed to map WB buffer (%d).\n", r);
  1250. return r;
  1251. }
  1252. }
  1253. WREG32(SCRATCH_ADDR, (rdev->wb.gpu_addr >> 8) & 0xFFFFFFFF);
  1254. WREG32(CP_RB_RPTR_ADDR, (rdev->wb.gpu_addr + 1024) & 0xFFFFFFFC);
  1255. WREG32(CP_RB_RPTR_ADDR_HI, upper_32_bits(rdev->wb.gpu_addr + 1024) & 0xFF);
  1256. WREG32(SCRATCH_UMSK, 0xff);
  1257. return 0;
  1258. }
  1259. void r600_wb_fini(struct radeon_device *rdev)
  1260. {
  1261. if (rdev->wb.wb_obj) {
  1262. radeon_object_kunmap(rdev->wb.wb_obj);
  1263. radeon_object_unpin(rdev->wb.wb_obj);
  1264. radeon_object_unref(&rdev->wb.wb_obj);
  1265. rdev->wb.wb = NULL;
  1266. rdev->wb.wb_obj = NULL;
  1267. }
  1268. }
  1269. /*
  1270. * CS
  1271. */
  1272. void r600_fence_ring_emit(struct radeon_device *rdev,
  1273. struct radeon_fence *fence)
  1274. {
  1275. /* Emit fence sequence & fire IRQ */
  1276. radeon_ring_write(rdev, PACKET3(PACKET3_SET_CONFIG_REG, 1));
  1277. radeon_ring_write(rdev, ((rdev->fence_drv.scratch_reg - PACKET3_SET_CONFIG_REG_OFFSET) >> 2));
  1278. radeon_ring_write(rdev, fence->seq);
  1279. }
  1280. int r600_copy_dma(struct radeon_device *rdev,
  1281. uint64_t src_offset,
  1282. uint64_t dst_offset,
  1283. unsigned num_pages,
  1284. struct radeon_fence *fence)
  1285. {
  1286. /* FIXME: implement */
  1287. return 0;
  1288. }
  1289. int r600_copy_blit(struct radeon_device *rdev,
  1290. uint64_t src_offset, uint64_t dst_offset,
  1291. unsigned num_pages, struct radeon_fence *fence)
  1292. {
  1293. r600_blit_prepare_copy(rdev, num_pages * 4096);
  1294. r600_kms_blit_copy(rdev, src_offset, dst_offset, num_pages * 4096);
  1295. r600_blit_done_copy(rdev, fence);
  1296. return 0;
  1297. }
  1298. int r600_irq_process(struct radeon_device *rdev)
  1299. {
  1300. /* FIXME: implement */
  1301. return 0;
  1302. }
  1303. int r600_irq_set(struct radeon_device *rdev)
  1304. {
  1305. /* FIXME: implement */
  1306. return 0;
  1307. }
  1308. int r600_set_surface_reg(struct radeon_device *rdev, int reg,
  1309. uint32_t tiling_flags, uint32_t pitch,
  1310. uint32_t offset, uint32_t obj_size)
  1311. {
  1312. /* FIXME: implement */
  1313. return 0;
  1314. }
  1315. void r600_clear_surface_reg(struct radeon_device *rdev, int reg)
  1316. {
  1317. /* FIXME: implement */
  1318. }
  1319. bool r600_card_posted(struct radeon_device *rdev)
  1320. {
  1321. uint32_t reg;
  1322. /* first check CRTCs */
  1323. reg = RREG32(D1CRTC_CONTROL) |
  1324. RREG32(D2CRTC_CONTROL);
  1325. if (reg & CRTC_EN)
  1326. return true;
  1327. /* then check MEM_SIZE, in case the crtcs are off */
  1328. if (RREG32(CONFIG_MEMSIZE))
  1329. return true;
  1330. return false;
  1331. }
  1332. int r600_startup(struct radeon_device *rdev)
  1333. {
  1334. int r;
  1335. r600_gpu_reset(rdev);
  1336. r600_mc_resume(rdev);
  1337. r = r600_pcie_gart_enable(rdev);
  1338. if (r)
  1339. return r;
  1340. r600_gpu_init(rdev);
  1341. r = radeon_object_pin(rdev->r600_blit.shader_obj, RADEON_GEM_DOMAIN_VRAM,
  1342. &rdev->r600_blit.shader_gpu_addr);
  1343. if (r) {
  1344. DRM_ERROR("failed to pin blit object %d\n", r);
  1345. return r;
  1346. }
  1347. r = radeon_ring_init(rdev, rdev->cp.ring_size);
  1348. if (r)
  1349. return r;
  1350. r = r600_cp_load_microcode(rdev);
  1351. if (r)
  1352. return r;
  1353. r = r600_cp_resume(rdev);
  1354. if (r)
  1355. return r;
  1356. r = r600_wb_init(rdev);
  1357. if (r)
  1358. return r;
  1359. return 0;
  1360. }
  1361. void r600_vga_set_state(struct radeon_device *rdev, bool state)
  1362. {
  1363. uint32_t temp;
  1364. temp = RREG32(CONFIG_CNTL);
  1365. if (state == false) {
  1366. temp &= ~(1<<0);
  1367. temp |= (1<<1);
  1368. } else {
  1369. temp &= ~(1<<1);
  1370. }
  1371. WREG32(CONFIG_CNTL, temp);
  1372. }
  1373. int r600_resume(struct radeon_device *rdev)
  1374. {
  1375. int r;
  1376. if (radeon_gpu_reset(rdev)) {
  1377. /* FIXME: what do we want to do here ? */
  1378. }
  1379. /* post card */
  1380. if (rdev->is_atom_bios) {
  1381. atom_asic_init(rdev->mode_info.atom_context);
  1382. } else {
  1383. radeon_combios_asic_init(rdev->ddev);
  1384. }
  1385. /* Initialize clocks */
  1386. r = radeon_clocks_init(rdev);
  1387. if (r) {
  1388. return r;
  1389. }
  1390. r = r600_startup(rdev);
  1391. if (r) {
  1392. DRM_ERROR("r600 startup failed on resume\n");
  1393. return r;
  1394. }
  1395. r = radeon_ib_test(rdev);
  1396. if (r) {
  1397. DRM_ERROR("radeon: failled testing IB (%d).\n", r);
  1398. return r;
  1399. }
  1400. return r;
  1401. }
  1402. int r600_suspend(struct radeon_device *rdev)
  1403. {
  1404. /* FIXME: we should wait for ring to be empty */
  1405. r600_cp_stop(rdev);
  1406. rdev->cp.ready = false;
  1407. r600_pcie_gart_disable(rdev);
  1408. /* unpin shaders bo */
  1409. radeon_object_unpin(rdev->r600_blit.shader_obj);
  1410. return 0;
  1411. }
  1412. /* Plan is to move initialization in that function and use
  1413. * helper function so that radeon_device_init pretty much
  1414. * do nothing more than calling asic specific function. This
  1415. * should also allow to remove a bunch of callback function
  1416. * like vram_info.
  1417. */
  1418. int r600_init(struct radeon_device *rdev)
  1419. {
  1420. int r;
  1421. rdev->new_init_path = true;
  1422. r = radeon_dummy_page_init(rdev);
  1423. if (r)
  1424. return r;
  1425. if (r600_debugfs_mc_info_init(rdev)) {
  1426. DRM_ERROR("Failed to register debugfs file for mc !\n");
  1427. }
  1428. /* This don't do much */
  1429. r = radeon_gem_init(rdev);
  1430. if (r)
  1431. return r;
  1432. /* Read BIOS */
  1433. if (!radeon_get_bios(rdev)) {
  1434. if (ASIC_IS_AVIVO(rdev))
  1435. return -EINVAL;
  1436. }
  1437. /* Must be an ATOMBIOS */
  1438. if (!rdev->is_atom_bios)
  1439. return -EINVAL;
  1440. r = radeon_atombios_init(rdev);
  1441. if (r)
  1442. return r;
  1443. /* Post card if necessary */
  1444. if (!r600_card_posted(rdev) && rdev->bios) {
  1445. DRM_INFO("GPU not posted. posting now...\n");
  1446. atom_asic_init(rdev->mode_info.atom_context);
  1447. }
  1448. /* Initialize scratch registers */
  1449. r600_scratch_init(rdev);
  1450. /* Initialize surface registers */
  1451. radeon_surface_init(rdev);
  1452. radeon_get_clock_info(rdev->ddev);
  1453. r = radeon_clocks_init(rdev);
  1454. if (r)
  1455. return r;
  1456. /* Fence driver */
  1457. r = radeon_fence_driver_init(rdev);
  1458. if (r)
  1459. return r;
  1460. r = r600_mc_init(rdev);
  1461. if (r) {
  1462. if (rdev->flags & RADEON_IS_AGP) {
  1463. /* Retry with disabling AGP */
  1464. r600_fini(rdev);
  1465. rdev->flags &= ~RADEON_IS_AGP;
  1466. return r600_init(rdev);
  1467. }
  1468. return r;
  1469. }
  1470. /* Memory manager */
  1471. r = radeon_object_init(rdev);
  1472. if (r)
  1473. return r;
  1474. rdev->cp.ring_obj = NULL;
  1475. r600_ring_init(rdev, 1024 * 1024);
  1476. if (!rdev->me_fw || !rdev->pfp_fw) {
  1477. r = r600_cp_init_microcode(rdev);
  1478. if (r) {
  1479. DRM_ERROR("Failed to load firmware!\n");
  1480. return r;
  1481. }
  1482. }
  1483. r = r600_pcie_gart_init(rdev);
  1484. if (r)
  1485. return r;
  1486. rdev->accel_working = true;
  1487. r = r600_blit_init(rdev);
  1488. if (r) {
  1489. DRM_ERROR("radeon: failled blitter (%d).\n", r);
  1490. return r;
  1491. }
  1492. r = r600_startup(rdev);
  1493. if (r) {
  1494. if (rdev->flags & RADEON_IS_AGP) {
  1495. /* Retry with disabling AGP */
  1496. r600_fini(rdev);
  1497. rdev->flags &= ~RADEON_IS_AGP;
  1498. return r600_init(rdev);
  1499. }
  1500. rdev->accel_working = false;
  1501. }
  1502. if (rdev->accel_working) {
  1503. r = radeon_ib_pool_init(rdev);
  1504. if (r) {
  1505. DRM_ERROR("radeon: failled initializing IB pool (%d).\n", r);
  1506. rdev->accel_working = false;
  1507. }
  1508. r = radeon_ib_test(rdev);
  1509. if (r) {
  1510. DRM_ERROR("radeon: failled testing IB (%d).\n", r);
  1511. rdev->accel_working = false;
  1512. }
  1513. }
  1514. return 0;
  1515. }
  1516. void r600_fini(struct radeon_device *rdev)
  1517. {
  1518. /* Suspend operations */
  1519. r600_suspend(rdev);
  1520. r600_blit_fini(rdev);
  1521. radeon_ring_fini(rdev);
  1522. r600_pcie_gart_fini(rdev);
  1523. radeon_gem_fini(rdev);
  1524. radeon_fence_driver_fini(rdev);
  1525. radeon_clocks_fini(rdev);
  1526. #if __OS_HAS_AGP
  1527. if (rdev->flags & RADEON_IS_AGP)
  1528. radeon_agp_fini(rdev);
  1529. #endif
  1530. radeon_object_fini(rdev);
  1531. if (rdev->is_atom_bios)
  1532. radeon_atombios_fini(rdev);
  1533. else
  1534. radeon_combios_fini(rdev);
  1535. kfree(rdev->bios);
  1536. rdev->bios = NULL;
  1537. radeon_dummy_page_fini(rdev);
  1538. }
  1539. /*
  1540. * CS stuff
  1541. */
  1542. void r600_ring_ib_execute(struct radeon_device *rdev, struct radeon_ib *ib)
  1543. {
  1544. /* FIXME: implement */
  1545. radeon_ring_write(rdev, PACKET3(PACKET3_INDIRECT_BUFFER, 2));
  1546. radeon_ring_write(rdev, ib->gpu_addr & 0xFFFFFFFC);
  1547. radeon_ring_write(rdev, upper_32_bits(ib->gpu_addr) & 0xFF);
  1548. radeon_ring_write(rdev, ib->length_dw);
  1549. }
  1550. int r600_ib_test(struct radeon_device *rdev)
  1551. {
  1552. struct radeon_ib *ib;
  1553. uint32_t scratch;
  1554. uint32_t tmp = 0;
  1555. unsigned i;
  1556. int r;
  1557. r = radeon_scratch_get(rdev, &scratch);
  1558. if (r) {
  1559. DRM_ERROR("radeon: failed to get scratch reg (%d).\n", r);
  1560. return r;
  1561. }
  1562. WREG32(scratch, 0xCAFEDEAD);
  1563. r = radeon_ib_get(rdev, &ib);
  1564. if (r) {
  1565. DRM_ERROR("radeon: failed to get ib (%d).\n", r);
  1566. return r;
  1567. }
  1568. ib->ptr[0] = PACKET3(PACKET3_SET_CONFIG_REG, 1);
  1569. ib->ptr[1] = ((scratch - PACKET3_SET_CONFIG_REG_OFFSET) >> 2);
  1570. ib->ptr[2] = 0xDEADBEEF;
  1571. ib->ptr[3] = PACKET2(0);
  1572. ib->ptr[4] = PACKET2(0);
  1573. ib->ptr[5] = PACKET2(0);
  1574. ib->ptr[6] = PACKET2(0);
  1575. ib->ptr[7] = PACKET2(0);
  1576. ib->ptr[8] = PACKET2(0);
  1577. ib->ptr[9] = PACKET2(0);
  1578. ib->ptr[10] = PACKET2(0);
  1579. ib->ptr[11] = PACKET2(0);
  1580. ib->ptr[12] = PACKET2(0);
  1581. ib->ptr[13] = PACKET2(0);
  1582. ib->ptr[14] = PACKET2(0);
  1583. ib->ptr[15] = PACKET2(0);
  1584. ib->length_dw = 16;
  1585. r = radeon_ib_schedule(rdev, ib);
  1586. if (r) {
  1587. radeon_scratch_free(rdev, scratch);
  1588. radeon_ib_free(rdev, &ib);
  1589. DRM_ERROR("radeon: failed to schedule ib (%d).\n", r);
  1590. return r;
  1591. }
  1592. r = radeon_fence_wait(ib->fence, false);
  1593. if (r) {
  1594. DRM_ERROR("radeon: fence wait failed (%d).\n", r);
  1595. return r;
  1596. }
  1597. for (i = 0; i < rdev->usec_timeout; i++) {
  1598. tmp = RREG32(scratch);
  1599. if (tmp == 0xDEADBEEF)
  1600. break;
  1601. DRM_UDELAY(1);
  1602. }
  1603. if (i < rdev->usec_timeout) {
  1604. DRM_INFO("ib test succeeded in %u usecs\n", i);
  1605. } else {
  1606. DRM_ERROR("radeon: ib test failed (sracth(0x%04X)=0x%08X)\n",
  1607. scratch, tmp);
  1608. r = -EINVAL;
  1609. }
  1610. radeon_scratch_free(rdev, scratch);
  1611. radeon_ib_free(rdev, &ib);
  1612. return r;
  1613. }
  1614. /*
  1615. * Debugfs info
  1616. */
  1617. #if defined(CONFIG_DEBUG_FS)
  1618. static int r600_debugfs_cp_ring_info(struct seq_file *m, void *data)
  1619. {
  1620. struct drm_info_node *node = (struct drm_info_node *) m->private;
  1621. struct drm_device *dev = node->minor->dev;
  1622. struct radeon_device *rdev = dev->dev_private;
  1623. uint32_t rdp, wdp;
  1624. unsigned count, i, j;
  1625. radeon_ring_free_size(rdev);
  1626. rdp = RREG32(CP_RB_RPTR);
  1627. wdp = RREG32(CP_RB_WPTR);
  1628. count = (rdp + rdev->cp.ring_size - wdp) & rdev->cp.ptr_mask;
  1629. seq_printf(m, "CP_STAT 0x%08x\n", RREG32(CP_STAT));
  1630. seq_printf(m, "CP_RB_WPTR 0x%08x\n", wdp);
  1631. seq_printf(m, "CP_RB_RPTR 0x%08x\n", rdp);
  1632. seq_printf(m, "%u free dwords in ring\n", rdev->cp.ring_free_dw);
  1633. seq_printf(m, "%u dwords in ring\n", count);
  1634. for (j = 0; j <= count; j++) {
  1635. i = (rdp + j) & rdev->cp.ptr_mask;
  1636. seq_printf(m, "r[%04d]=0x%08x\n", i, rdev->cp.ring[i]);
  1637. }
  1638. return 0;
  1639. }
  1640. static int r600_debugfs_mc_info(struct seq_file *m, void *data)
  1641. {
  1642. struct drm_info_node *node = (struct drm_info_node *) m->private;
  1643. struct drm_device *dev = node->minor->dev;
  1644. struct radeon_device *rdev = dev->dev_private;
  1645. DREG32_SYS(m, rdev, R_000E50_SRBM_STATUS);
  1646. DREG32_SYS(m, rdev, VM_L2_STATUS);
  1647. return 0;
  1648. }
  1649. static struct drm_info_list r600_mc_info_list[] = {
  1650. {"r600_mc_info", r600_debugfs_mc_info, 0, NULL},
  1651. {"r600_ring_info", r600_debugfs_cp_ring_info, 0, NULL},
  1652. };
  1653. #endif
  1654. int r600_debugfs_mc_info_init(struct radeon_device *rdev)
  1655. {
  1656. #if defined(CONFIG_DEBUG_FS)
  1657. return radeon_debugfs_add_files(rdev, r600_mc_info_list, ARRAY_SIZE(r600_mc_info_list));
  1658. #else
  1659. return 0;
  1660. #endif
  1661. }