nouveau_mem.c 13 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533
  1. /*
  2. * Copyright (C) The Weather Channel, Inc. 2002. All Rights Reserved.
  3. * Copyright 2005 Stephane Marchesin
  4. *
  5. * The Weather Channel (TM) funded Tungsten Graphics to develop the
  6. * initial release of the Radeon 8500 driver under the XFree86 license.
  7. * This notice must be preserved.
  8. *
  9. * Permission is hereby granted, free of charge, to any person obtaining a
  10. * copy of this software and associated documentation files (the "Software"),
  11. * to deal in the Software without restriction, including without limitation
  12. * the rights to use, copy, modify, merge, publish, distribute, sublicense,
  13. * and/or sell copies of the Software, and to permit persons to whom the
  14. * Software is furnished to do so, subject to the following conditions:
  15. *
  16. * The above copyright notice and this permission notice (including the next
  17. * paragraph) shall be included in all copies or substantial portions of the
  18. * Software.
  19. *
  20. * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
  21. * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
  22. * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
  23. * THE AUTHORS AND/OR THEIR SUPPLIERS BE LIABLE FOR ANY CLAIM, DAMAGES OR
  24. * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
  25. * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
  26. * DEALINGS IN THE SOFTWARE.
  27. *
  28. * Authors:
  29. * Keith Whitwell <keith@tungstengraphics.com>
  30. */
  31. #include "drmP.h"
  32. #include "drm.h"
  33. #include "drm_sarea.h"
  34. #include "nouveau_drv.h"
  35. /*
  36. * NV10-NV40 tiling helpers
  37. */
  38. static void
  39. nv10_mem_set_region_tiling(struct drm_device *dev, int i, uint32_t addr,
  40. uint32_t size, uint32_t pitch)
  41. {
  42. struct drm_nouveau_private *dev_priv = dev->dev_private;
  43. struct nouveau_fifo_engine *pfifo = &dev_priv->engine.fifo;
  44. struct nouveau_fb_engine *pfb = &dev_priv->engine.fb;
  45. struct nouveau_pgraph_engine *pgraph = &dev_priv->engine.graph;
  46. struct nouveau_tile_reg *tile = &dev_priv->tile.reg[i];
  47. tile->addr = addr;
  48. tile->size = size;
  49. tile->used = !!pitch;
  50. nouveau_fence_unref((void **)&tile->fence);
  51. if (!pfifo->cache_flush(dev))
  52. return;
  53. pfifo->reassign(dev, false);
  54. pfifo->cache_flush(dev);
  55. pfifo->cache_pull(dev, false);
  56. nouveau_wait_for_idle(dev);
  57. pgraph->set_region_tiling(dev, i, addr, size, pitch);
  58. pfb->set_region_tiling(dev, i, addr, size, pitch);
  59. pfifo->cache_pull(dev, true);
  60. pfifo->reassign(dev, true);
  61. }
  62. struct nouveau_tile_reg *
  63. nv10_mem_set_tiling(struct drm_device *dev, uint32_t addr, uint32_t size,
  64. uint32_t pitch)
  65. {
  66. struct drm_nouveau_private *dev_priv = dev->dev_private;
  67. struct nouveau_fb_engine *pfb = &dev_priv->engine.fb;
  68. struct nouveau_tile_reg *tile = dev_priv->tile.reg, *found = NULL;
  69. int i;
  70. spin_lock(&dev_priv->tile.lock);
  71. for (i = 0; i < pfb->num_tiles; i++) {
  72. if (tile[i].used)
  73. /* Tile region in use. */
  74. continue;
  75. if (tile[i].fence &&
  76. !nouveau_fence_signalled(tile[i].fence, NULL))
  77. /* Pending tile region. */
  78. continue;
  79. if (max(tile[i].addr, addr) <
  80. min(tile[i].addr + tile[i].size, addr + size))
  81. /* Kill an intersecting tile region. */
  82. nv10_mem_set_region_tiling(dev, i, 0, 0, 0);
  83. if (pitch && !found) {
  84. /* Free tile region. */
  85. nv10_mem_set_region_tiling(dev, i, addr, size, pitch);
  86. found = &tile[i];
  87. }
  88. }
  89. spin_unlock(&dev_priv->tile.lock);
  90. return found;
  91. }
  92. void
  93. nv10_mem_expire_tiling(struct drm_device *dev, struct nouveau_tile_reg *tile,
  94. struct nouveau_fence *fence)
  95. {
  96. if (fence) {
  97. /* Mark it as pending. */
  98. tile->fence = fence;
  99. nouveau_fence_ref(fence);
  100. }
  101. tile->used = false;
  102. }
  103. /*
  104. * NV50 VM helpers
  105. */
  106. int
  107. nv50_mem_vm_bind_linear(struct drm_device *dev, uint64_t virt, uint32_t size,
  108. uint32_t flags, uint64_t phys)
  109. {
  110. struct drm_nouveau_private *dev_priv = dev->dev_private;
  111. struct nouveau_gpuobj *pgt;
  112. unsigned block;
  113. int i;
  114. virt = ((virt - dev_priv->vm_vram_base) >> 16) << 1;
  115. size = (size >> 16) << 1;
  116. phys |= ((uint64_t)flags << 32);
  117. phys |= 1;
  118. if (dev_priv->vram_sys_base) {
  119. phys += dev_priv->vram_sys_base;
  120. phys |= 0x30;
  121. }
  122. while (size) {
  123. unsigned offset_h = upper_32_bits(phys);
  124. unsigned offset_l = lower_32_bits(phys);
  125. unsigned pte, end;
  126. for (i = 7; i >= 0; i--) {
  127. block = 1 << (i + 1);
  128. if (size >= block && !(virt & (block - 1)))
  129. break;
  130. }
  131. offset_l |= (i << 7);
  132. phys += block << 15;
  133. size -= block;
  134. while (block) {
  135. pgt = dev_priv->vm_vram_pt[virt >> 14];
  136. pte = virt & 0x3ffe;
  137. end = pte + block;
  138. if (end > 16384)
  139. end = 16384;
  140. block -= (end - pte);
  141. virt += (end - pte);
  142. while (pte < end) {
  143. nv_wo32(dev, pgt, pte++, offset_l);
  144. nv_wo32(dev, pgt, pte++, offset_h);
  145. }
  146. }
  147. }
  148. dev_priv->engine.instmem.flush(dev);
  149. nv50_vm_flush(dev, 5);
  150. nv50_vm_flush(dev, 0);
  151. nv50_vm_flush(dev, 4);
  152. nv50_vm_flush(dev, 6);
  153. return 0;
  154. }
  155. void
  156. nv50_mem_vm_unbind(struct drm_device *dev, uint64_t virt, uint32_t size)
  157. {
  158. struct drm_nouveau_private *dev_priv = dev->dev_private;
  159. struct nouveau_gpuobj *pgt;
  160. unsigned pages, pte, end;
  161. virt -= dev_priv->vm_vram_base;
  162. pages = (size >> 16) << 1;
  163. while (pages) {
  164. pgt = dev_priv->vm_vram_pt[virt >> 29];
  165. pte = (virt & 0x1ffe0000ULL) >> 15;
  166. end = pte + pages;
  167. if (end > 16384)
  168. end = 16384;
  169. pages -= (end - pte);
  170. virt += (end - pte) << 15;
  171. while (pte < end)
  172. nv_wo32(dev, pgt, pte++, 0);
  173. }
  174. dev_priv->engine.instmem.flush(dev);
  175. nv50_vm_flush(dev, 5);
  176. nv50_vm_flush(dev, 0);
  177. nv50_vm_flush(dev, 4);
  178. nv50_vm_flush(dev, 6);
  179. }
  180. /*
  181. * Cleanup everything
  182. */
  183. void
  184. nouveau_mem_close(struct drm_device *dev)
  185. {
  186. struct drm_nouveau_private *dev_priv = dev->dev_private;
  187. nouveau_bo_unpin(dev_priv->vga_ram);
  188. nouveau_bo_ref(NULL, &dev_priv->vga_ram);
  189. ttm_bo_device_release(&dev_priv->ttm.bdev);
  190. nouveau_ttm_global_release(dev_priv);
  191. if (drm_core_has_AGP(dev) && dev->agp) {
  192. struct drm_agp_mem *entry, *tempe;
  193. /* Remove AGP resources, but leave dev->agp
  194. intact until drv_cleanup is called. */
  195. list_for_each_entry_safe(entry, tempe, &dev->agp->memory, head) {
  196. if (entry->bound)
  197. drm_unbind_agp(entry->memory);
  198. drm_free_agp(entry->memory, entry->pages);
  199. kfree(entry);
  200. }
  201. INIT_LIST_HEAD(&dev->agp->memory);
  202. if (dev->agp->acquired)
  203. drm_agp_release(dev);
  204. dev->agp->acquired = 0;
  205. dev->agp->enabled = 0;
  206. }
  207. if (dev_priv->fb_mtrr) {
  208. drm_mtrr_del(dev_priv->fb_mtrr,
  209. pci_resource_start(dev->pdev, 1),
  210. pci_resource_len(dev->pdev, 1), DRM_MTRR_WC);
  211. dev_priv->fb_mtrr = -1;
  212. }
  213. }
  214. static uint32_t
  215. nouveau_mem_detect_nv04(struct drm_device *dev)
  216. {
  217. uint32_t boot0 = nv_rd32(dev, NV04_PFB_BOOT_0);
  218. if (boot0 & 0x00000100)
  219. return (((boot0 >> 12) & 0xf) * 2 + 2) * 1024 * 1024;
  220. switch (boot0 & NV04_PFB_BOOT_0_RAM_AMOUNT) {
  221. case NV04_PFB_BOOT_0_RAM_AMOUNT_32MB:
  222. return 32 * 1024 * 1024;
  223. case NV04_PFB_BOOT_0_RAM_AMOUNT_16MB:
  224. return 16 * 1024 * 1024;
  225. case NV04_PFB_BOOT_0_RAM_AMOUNT_8MB:
  226. return 8 * 1024 * 1024;
  227. case NV04_PFB_BOOT_0_RAM_AMOUNT_4MB:
  228. return 4 * 1024 * 1024;
  229. }
  230. return 0;
  231. }
  232. static uint32_t
  233. nouveau_mem_detect_nforce(struct drm_device *dev)
  234. {
  235. struct drm_nouveau_private *dev_priv = dev->dev_private;
  236. struct pci_dev *bridge;
  237. uint32_t mem;
  238. bridge = pci_get_bus_and_slot(0, PCI_DEVFN(0, 1));
  239. if (!bridge) {
  240. NV_ERROR(dev, "no bridge device\n");
  241. return 0;
  242. }
  243. if (dev_priv->flags & NV_NFORCE) {
  244. pci_read_config_dword(bridge, 0x7C, &mem);
  245. return (uint64_t)(((mem >> 6) & 31) + 1)*1024*1024;
  246. } else
  247. if (dev_priv->flags & NV_NFORCE2) {
  248. pci_read_config_dword(bridge, 0x84, &mem);
  249. return (uint64_t)(((mem >> 4) & 127) + 1)*1024*1024;
  250. }
  251. NV_ERROR(dev, "impossible!\n");
  252. return 0;
  253. }
  254. /* returns the amount of FB ram in bytes */
  255. int
  256. nouveau_mem_detect(struct drm_device *dev)
  257. {
  258. struct drm_nouveau_private *dev_priv = dev->dev_private;
  259. if (dev_priv->card_type == NV_04) {
  260. dev_priv->vram_size = nouveau_mem_detect_nv04(dev);
  261. } else
  262. if (dev_priv->flags & (NV_NFORCE | NV_NFORCE2)) {
  263. dev_priv->vram_size = nouveau_mem_detect_nforce(dev);
  264. } else
  265. if (dev_priv->card_type < NV_50) {
  266. dev_priv->vram_size = nv_rd32(dev, NV04_PFB_FIFO_DATA);
  267. dev_priv->vram_size &= NV10_PFB_FIFO_DATA_RAM_AMOUNT_MB_MASK;
  268. } else
  269. if (dev_priv->card_type < NV_C0) {
  270. dev_priv->vram_size = nv_rd32(dev, NV04_PFB_FIFO_DATA);
  271. dev_priv->vram_size |= (dev_priv->vram_size & 0xff) << 32;
  272. dev_priv->vram_size &= 0xffffffff00ll;
  273. if (dev_priv->chipset == 0xaa || dev_priv->chipset == 0xac) {
  274. dev_priv->vram_sys_base = nv_rd32(dev, 0x100e10);
  275. dev_priv->vram_sys_base <<= 12;
  276. }
  277. } else {
  278. dev_priv->vram_size = nv_rd32(dev, 0x10f20c) << 20;
  279. dev_priv->vram_size *= nv_rd32(dev, 0x121c74);
  280. }
  281. NV_INFO(dev, "Detected %dMiB VRAM\n", (int)(dev_priv->vram_size >> 20));
  282. if (dev_priv->vram_sys_base) {
  283. NV_INFO(dev, "Stolen system memory at: 0x%010llx\n",
  284. dev_priv->vram_sys_base);
  285. }
  286. if (dev_priv->vram_size)
  287. return 0;
  288. return -ENOMEM;
  289. }
  290. int
  291. nouveau_mem_reset_agp(struct drm_device *dev)
  292. {
  293. #if __OS_HAS_AGP
  294. uint32_t saved_pci_nv_1, pmc_enable;
  295. int ret;
  296. /* First of all, disable fast writes, otherwise if it's
  297. * already enabled in the AGP bridge and we disable the card's
  298. * AGP controller we might be locking ourselves out of it. */
  299. if (nv_rd32(dev, NV04_PBUS_PCI_NV_19) & PCI_AGP_COMMAND_FW) {
  300. struct drm_agp_info info;
  301. struct drm_agp_mode mode;
  302. ret = drm_agp_info(dev, &info);
  303. if (ret)
  304. return ret;
  305. mode.mode = info.mode & ~PCI_AGP_COMMAND_FW;
  306. ret = drm_agp_enable(dev, mode);
  307. if (ret)
  308. return ret;
  309. }
  310. saved_pci_nv_1 = nv_rd32(dev, NV04_PBUS_PCI_NV_1);
  311. /* clear busmaster bit */
  312. nv_wr32(dev, NV04_PBUS_PCI_NV_1, saved_pci_nv_1 & ~0x4);
  313. /* disable AGP */
  314. nv_wr32(dev, NV04_PBUS_PCI_NV_19, 0);
  315. /* power cycle pgraph, if enabled */
  316. pmc_enable = nv_rd32(dev, NV03_PMC_ENABLE);
  317. if (pmc_enable & NV_PMC_ENABLE_PGRAPH) {
  318. nv_wr32(dev, NV03_PMC_ENABLE,
  319. pmc_enable & ~NV_PMC_ENABLE_PGRAPH);
  320. nv_wr32(dev, NV03_PMC_ENABLE, nv_rd32(dev, NV03_PMC_ENABLE) |
  321. NV_PMC_ENABLE_PGRAPH);
  322. }
  323. /* and restore (gives effect of resetting AGP) */
  324. nv_wr32(dev, NV04_PBUS_PCI_NV_1, saved_pci_nv_1);
  325. #endif
  326. return 0;
  327. }
  328. int
  329. nouveau_mem_init_agp(struct drm_device *dev)
  330. {
  331. #if __OS_HAS_AGP
  332. struct drm_nouveau_private *dev_priv = dev->dev_private;
  333. struct drm_agp_info info;
  334. struct drm_agp_mode mode;
  335. int ret;
  336. if (!dev->agp->acquired) {
  337. ret = drm_agp_acquire(dev);
  338. if (ret) {
  339. NV_ERROR(dev, "Unable to acquire AGP: %d\n", ret);
  340. return ret;
  341. }
  342. }
  343. nouveau_mem_reset_agp(dev);
  344. ret = drm_agp_info(dev, &info);
  345. if (ret) {
  346. NV_ERROR(dev, "Unable to get AGP info: %d\n", ret);
  347. return ret;
  348. }
  349. /* see agp.h for the AGPSTAT_* modes available */
  350. mode.mode = info.mode;
  351. ret = drm_agp_enable(dev, mode);
  352. if (ret) {
  353. NV_ERROR(dev, "Unable to enable AGP: %d\n", ret);
  354. return ret;
  355. }
  356. dev_priv->gart_info.type = NOUVEAU_GART_AGP;
  357. dev_priv->gart_info.aper_base = info.aperture_base;
  358. dev_priv->gart_info.aper_size = info.aperture_size;
  359. #endif
  360. return 0;
  361. }
  362. int
  363. nouveau_mem_init(struct drm_device *dev)
  364. {
  365. struct drm_nouveau_private *dev_priv = dev->dev_private;
  366. struct ttm_bo_device *bdev = &dev_priv->ttm.bdev;
  367. int ret, dma_bits = 32;
  368. dev_priv->fb_phys = pci_resource_start(dev->pdev, 1);
  369. dev_priv->gart_info.type = NOUVEAU_GART_NONE;
  370. if (dev_priv->card_type >= NV_50 &&
  371. pci_dma_supported(dev->pdev, DMA_BIT_MASK(40)))
  372. dma_bits = 40;
  373. ret = pci_set_dma_mask(dev->pdev, DMA_BIT_MASK(dma_bits));
  374. if (ret) {
  375. NV_ERROR(dev, "Error setting DMA mask: %d\n", ret);
  376. return ret;
  377. }
  378. ret = nouveau_ttm_global_init(dev_priv);
  379. if (ret)
  380. return ret;
  381. ret = ttm_bo_device_init(&dev_priv->ttm.bdev,
  382. dev_priv->ttm.bo_global_ref.ref.object,
  383. &nouveau_bo_driver, DRM_FILE_PAGE_OFFSET,
  384. dma_bits <= 32 ? true : false);
  385. if (ret) {
  386. NV_ERROR(dev, "Error initialising bo driver: %d\n", ret);
  387. return ret;
  388. }
  389. spin_lock_init(&dev_priv->tile.lock);
  390. dev_priv->fb_available_size = dev_priv->vram_size;
  391. dev_priv->fb_mappable_pages = dev_priv->fb_available_size;
  392. if (dev_priv->fb_mappable_pages > pci_resource_len(dev->pdev, 1))
  393. dev_priv->fb_mappable_pages =
  394. pci_resource_len(dev->pdev, 1);
  395. dev_priv->fb_mappable_pages >>= PAGE_SHIFT;
  396. /* remove reserved space at end of vram from available amount */
  397. dev_priv->fb_available_size -= dev_priv->ramin_rsvd_vram;
  398. dev_priv->fb_aper_free = dev_priv->fb_available_size;
  399. /* mappable vram */
  400. ret = ttm_bo_init_mm(bdev, TTM_PL_VRAM,
  401. dev_priv->fb_available_size >> PAGE_SHIFT);
  402. if (ret) {
  403. NV_ERROR(dev, "Failed VRAM mm init: %d\n", ret);
  404. return ret;
  405. }
  406. ret = nouveau_bo_new(dev, NULL, 256*1024, 0, TTM_PL_FLAG_VRAM,
  407. 0, 0, true, true, &dev_priv->vga_ram);
  408. if (ret == 0)
  409. ret = nouveau_bo_pin(dev_priv->vga_ram, TTM_PL_FLAG_VRAM);
  410. if (ret) {
  411. NV_WARN(dev, "failed to reserve VGA memory\n");
  412. nouveau_bo_ref(NULL, &dev_priv->vga_ram);
  413. }
  414. /* GART */
  415. #if !defined(__powerpc__) && !defined(__ia64__)
  416. if (drm_device_is_agp(dev) && dev->agp && !nouveau_noagp) {
  417. ret = nouveau_mem_init_agp(dev);
  418. if (ret)
  419. NV_ERROR(dev, "Error initialising AGP: %d\n", ret);
  420. }
  421. #endif
  422. if (dev_priv->gart_info.type == NOUVEAU_GART_NONE) {
  423. ret = nouveau_sgdma_init(dev);
  424. if (ret) {
  425. NV_ERROR(dev, "Error initialising PCI(E): %d\n", ret);
  426. return ret;
  427. }
  428. }
  429. NV_INFO(dev, "%d MiB GART (aperture)\n",
  430. (int)(dev_priv->gart_info.aper_size >> 20));
  431. dev_priv->gart_info.aper_free = dev_priv->gart_info.aper_size;
  432. ret = ttm_bo_init_mm(bdev, TTM_PL_TT,
  433. dev_priv->gart_info.aper_size >> PAGE_SHIFT);
  434. if (ret) {
  435. NV_ERROR(dev, "Failed TT mm init: %d\n", ret);
  436. return ret;
  437. }
  438. dev_priv->fb_mtrr = drm_mtrr_add(pci_resource_start(dev->pdev, 1),
  439. pci_resource_len(dev->pdev, 1),
  440. DRM_MTRR_WC);
  441. return 0;
  442. }