r600_cs.c

/*
 * Copyright 2008 Advanced Micro Devices, Inc.
 * Copyright 2008 Red Hat Inc.
 * Copyright 2009 Jerome Glisse.
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the "Software"),
 * to deal in the Software without restriction, including without limitation
 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
 * and/or sell copies of the Software, and to permit persons to whom the
 * Software is furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in
 * all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
 * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
 * OTHER DEALINGS IN THE SOFTWARE.
 *
 * Authors: Dave Airlie
 *          Alex Deucher
 *          Jerome Glisse
 */
#include "drmP.h"
#include "radeon.h"
#include "r600d.h"
#include "avivod.h"

static int r600_cs_packet_next_reloc_mm(struct radeon_cs_parser *p,
					struct radeon_cs_reloc **cs_reloc);
static int r600_cs_packet_next_reloc_nomm(struct radeon_cs_parser *p,
					   struct radeon_cs_reloc **cs_reloc);
typedef int (*next_reloc_t)(struct radeon_cs_parser*, struct radeon_cs_reloc**);
static next_reloc_t r600_cs_packet_next_reloc = &r600_cs_packet_next_reloc_mm;
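/*
 * The default is the memory-managed (mm) path, which returns relocs backed by
 * validated BOs; r600_cs_legacy_init() at the bottom of this file switches the
 * pointer to the nomm variant, which instead takes GPU offsets straight from
 * the relocation chunk.
 */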

/**
 * r600_cs_packet_parse() - parse cp packet and point ib index to next packet
 * @p: parser structure holding parsing context.
 * @pkt: where to store packet information
 * @idx: index in the ib at which to start parsing
 *
 * Assumes that chunk_ib_index is properly set. Returns -EINVAL
 * if the packet is bigger than the remaining ib size or if the packet type is unknown.
 **/
int r600_cs_packet_parse(struct radeon_cs_parser *p,
			 struct radeon_cs_packet *pkt,
			 unsigned idx)
{
	struct radeon_cs_chunk *ib_chunk = &p->chunks[p->chunk_ib_idx];
	uint32_t header;

	if (idx >= ib_chunk->length_dw) {
		DRM_ERROR("Can not parse packet at %d after CS end %d !\n",
			  idx, ib_chunk->length_dw);
		return -EINVAL;
	}
	header = radeon_get_ib_value(p, idx);
	pkt->idx = idx;
	pkt->type = CP_PACKET_GET_TYPE(header);
	pkt->count = CP_PACKET_GET_COUNT(header);
	pkt->one_reg_wr = 0;
	switch (pkt->type) {
	case PACKET_TYPE0:
		pkt->reg = CP_PACKET0_GET_REG(header);
		break;
	case PACKET_TYPE3:
		pkt->opcode = CP_PACKET3_GET_OPCODE(header);
		break;
	case PACKET_TYPE2:
		pkt->count = -1;
		break;
	default:
		DRM_ERROR("Unknown packet type %d at %d !\n", pkt->type, idx);
		return -EINVAL;
	}
	if ((pkt->count + 1 + pkt->idx) >= ib_chunk->length_dw) {
		DRM_ERROR("Packet (%d:%d:%d) end after CS buffer (%d) !\n",
			  pkt->idx, pkt->type, pkt->count, ib_chunk->length_dw);
		return -EINVAL;
	}
	return 0;
}

/**
 * r600_cs_packet_next_reloc_mm() - parse next packet which should be a reloc packet3
 * @p: parser structure holding parsing context.
 * @cs_reloc: where to store the resulting reloc information
 *
 * Check that the next packet is a relocation packet3 and look up the matching
 * reloc entry (backed by a validated bo) for the caller.
 **/
static int r600_cs_packet_next_reloc_mm(struct radeon_cs_parser *p,
					struct radeon_cs_reloc **cs_reloc)
{
	struct radeon_cs_chunk *relocs_chunk;
	struct radeon_cs_packet p3reloc;
	unsigned idx;
	int r;

	if (p->chunk_relocs_idx == -1) {
		DRM_ERROR("No relocation chunk !\n");
		return -EINVAL;
	}
	*cs_reloc = NULL;
	relocs_chunk = &p->chunks[p->chunk_relocs_idx];
	r = r600_cs_packet_parse(p, &p3reloc, p->idx);
	if (r) {
		return r;
	}
	p->idx += p3reloc.count + 2;
	if (p3reloc.type != PACKET_TYPE3 || p3reloc.opcode != PACKET3_NOP) {
		DRM_ERROR("No packet3 for relocation for packet at %d.\n",
			  p3reloc.idx);
		return -EINVAL;
	}
	idx = radeon_get_ib_value(p, p3reloc.idx + 1);
	if (idx >= relocs_chunk->length_dw) {
		DRM_ERROR("Relocs at %d after relocations chunk end %d !\n",
			  idx, relocs_chunk->length_dw);
		return -EINVAL;
	}
	/* FIXME: we assume reloc size is 4 dwords */
	*cs_reloc = p->relocs_ptr[(idx / 4)];
	return 0;
}

/**
 * r600_cs_packet_next_reloc_nomm() - parse next packet which should be a reloc packet3
 * @p: parser structure holding parsing context.
 * @cs_reloc: where to store the resulting reloc information
 *
 * Check that the next packet is a relocation packet3 and compute the GPU
 * offset directly from the relocation chunk (legacy, non-memory-managed path).
 **/
static int r600_cs_packet_next_reloc_nomm(struct radeon_cs_parser *p,
					  struct radeon_cs_reloc **cs_reloc)
{
	struct radeon_cs_chunk *relocs_chunk;
	struct radeon_cs_packet p3reloc;
	unsigned idx;
	int r;

	if (p->chunk_relocs_idx == -1) {
		DRM_ERROR("No relocation chunk !\n");
		return -EINVAL;
	}
	*cs_reloc = NULL;
	relocs_chunk = &p->chunks[p->chunk_relocs_idx];
	r = r600_cs_packet_parse(p, &p3reloc, p->idx);
	if (r) {
		return r;
	}
	p->idx += p3reloc.count + 2;
	if (p3reloc.type != PACKET_TYPE3 || p3reloc.opcode != PACKET3_NOP) {
		DRM_ERROR("No packet3 for relocation for packet at %d.\n",
			  p3reloc.idx);
		return -EINVAL;
	}
	idx = radeon_get_ib_value(p, p3reloc.idx + 1);
	if (idx >= relocs_chunk->length_dw) {
		DRM_ERROR("Relocs at %d after relocations chunk end %d !\n",
			  idx, relocs_chunk->length_dw);
		return -EINVAL;
	}
	*cs_reloc = &p->relocs[0];
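	/*
	 * Legacy path: no validated bo backs this reloc, so take the GPU
	 * offset straight from the relocation chunk.  Assuming the same
	 * 4-dword reloc layout as in the mm path above, dword 0 carries the
	 * low 32 bits of the offset and dword 3 the upper 32 bits.
	 */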
	(*cs_reloc)->lobj.gpu_offset = (u64)relocs_chunk->kdata[idx + 3] << 32;
	(*cs_reloc)->lobj.gpu_offset |= relocs_chunk->kdata[idx + 0];
	return 0;
}

/**
 * r600_cs_packet_parse_vline() - parse userspace VLINE packet
 * @p: parser structure holding parsing context.
 *
 * Userspace sends a special sequence for VLINE waits.
 * PACKET0 - VLINE_START_END + value
 * PACKET3 - WAIT_REG_MEM poll vline status reg
 * RELOC (P3) - crtc_id in reloc.
 *
 * This function parses this and relocates the VLINE START END
 * and WAIT_REG_MEM packets to the correct crtc.
 * It also detects a switched-off crtc and nops out the
 * wait in that case.
 */
static int r600_cs_packet_parse_vline(struct radeon_cs_parser *p)
{
	struct drm_mode_object *obj;
	struct drm_crtc *crtc;
	struct radeon_crtc *radeon_crtc;
	struct radeon_cs_packet p3reloc, wait_reg_mem;
	int crtc_id;
	int r;
	uint32_t header, h_idx, reg, wait_reg_mem_info;
	volatile uint32_t *ib;

	ib = p->ib->ptr;

	/* parse the WAIT_REG_MEM */
	r = r600_cs_packet_parse(p, &wait_reg_mem, p->idx);
	if (r)
		return r;

	/* check it's a WAIT_REG_MEM */
	if (wait_reg_mem.type != PACKET_TYPE3 ||
	    wait_reg_mem.opcode != PACKET3_WAIT_REG_MEM) {
		DRM_ERROR("vline wait missing WAIT_REG_MEM segment\n");
		r = -EINVAL;
		return r;
	}

	wait_reg_mem_info = radeon_get_ib_value(p, wait_reg_mem.idx + 1);
	/* bit 4 is reg (0) or mem (1) */
	if (wait_reg_mem_info & 0x10) {
		DRM_ERROR("vline WAIT_REG_MEM waiting on MEM rather than REG\n");
		r = -EINVAL;
		return r;
	}
	/* waiting for value to be equal */
	if ((wait_reg_mem_info & 0x7) != 0x3) {
		DRM_ERROR("vline WAIT_REG_MEM function not equal\n");
		r = -EINVAL;
		return r;
	}
	if ((radeon_get_ib_value(p, wait_reg_mem.idx + 2) << 2) != AVIVO_D1MODE_VLINE_STATUS) {
		DRM_ERROR("vline WAIT_REG_MEM bad reg\n");
		r = -EINVAL;
		return r;
	}
	if (radeon_get_ib_value(p, wait_reg_mem.idx + 5) != AVIVO_D1MODE_VLINE_STAT) {
		DRM_ERROR("vline WAIT_REG_MEM bad bit mask\n");
		r = -EINVAL;
		return r;
	}
	/* jump over the NOP */
	r = r600_cs_packet_parse(p, &p3reloc, p->idx + wait_reg_mem.count + 2);
	if (r)
		return r;
	h_idx = p->idx - 2;
	p->idx += wait_reg_mem.count + 2;
	p->idx += p3reloc.count + 2;

	header = radeon_get_ib_value(p, h_idx);
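	/*
	 * The crtc handle lives in the NOP/reloc packet that follows:
	 * 2 dwords of PACKET0 + 7 dwords of WAIT_REG_MEM + the NOP header,
	 * hence h_idx + 2 + 7 + 1.
	 */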
	crtc_id = radeon_get_ib_value(p, h_idx + 2 + 7 + 1);
	reg = header >> 2;
	mutex_lock(&p->rdev->ddev->mode_config.mutex);
	obj = drm_mode_object_find(p->rdev->ddev, crtc_id, DRM_MODE_OBJECT_CRTC);
	if (!obj) {
		DRM_ERROR("cannot find crtc %d\n", crtc_id);
		r = -EINVAL;
		goto out;
	}
	crtc = obj_to_crtc(obj);
	radeon_crtc = to_radeon_crtc(crtc);
	crtc_id = radeon_crtc->crtc_id;

	if (!crtc->enabled) {
		/* if the CRTC isn't enabled - we need to nop out the WAIT_REG_MEM */
		ib[h_idx + 2] = PACKET2(0);
		ib[h_idx + 3] = PACKET2(0);
		ib[h_idx + 4] = PACKET2(0);
		ib[h_idx + 5] = PACKET2(0);
		ib[h_idx + 6] = PACKET2(0);
		ib[h_idx + 7] = PACKET2(0);
		ib[h_idx + 8] = PACKET2(0);
	} else if (crtc_id == 1) {
		switch (reg) {
		case AVIVO_D1MODE_VLINE_START_END:
			header &= ~R600_CP_PACKET0_REG_MASK;
			header |= AVIVO_D2MODE_VLINE_START_END >> 2;
			break;
		default:
			DRM_ERROR("unknown crtc reloc\n");
			r = -EINVAL;
			goto out;
		}
		ib[h_idx] = header;
		ib[h_idx + 4] = AVIVO_D2MODE_VLINE_STATUS >> 2;
	}
out:
	mutex_unlock(&p->rdev->ddev->mode_config.mutex);
	return r;
}

static int r600_packet0_check(struct radeon_cs_parser *p,
			      struct radeon_cs_packet *pkt,
			      unsigned idx, unsigned reg)
{
	int r;

	switch (reg) {
	case AVIVO_D1MODE_VLINE_START_END:
		r = r600_cs_packet_parse_vline(p);
		if (r) {
			DRM_ERROR("No reloc for ib[%d]=0x%04X\n",
				  idx, reg);
			return r;
		}
		break;
	default:
		printk(KERN_ERR "Forbidden register 0x%04X in cs at %d\n",
		       reg, idx);
		return -EINVAL;
	}
	return 0;
}

static int r600_cs_parse_packet0(struct radeon_cs_parser *p,
				 struct radeon_cs_packet *pkt)
{
	unsigned reg, i;
	unsigned idx;
	int r;

	idx = pkt->idx + 1;
	reg = pkt->reg;
	for (i = 0; i <= pkt->count; i++, idx++, reg += 4) {
		r = r600_packet0_check(p, pkt, idx, reg);
		if (r) {
			return r;
		}
	}
	return 0;
}

static int r600_packet3_check(struct radeon_cs_parser *p,
			      struct radeon_cs_packet *pkt)
{
	struct radeon_cs_reloc *reloc;
	volatile u32 *ib;
	unsigned idx;
	unsigned i;
	unsigned start_reg, end_reg, reg;
	int r;
	u32 idx_value;

	ib = p->ib->ptr;
	idx = pkt->idx + 1;
	idx_value = radeon_get_ib_value(p, idx);

	switch (pkt->opcode) {
	case PACKET3_START_3D_CMDBUF:
		if (p->family >= CHIP_RV770 || pkt->count) {
			DRM_ERROR("bad START_3D\n");
			return -EINVAL;
		}
		break;
	case PACKET3_CONTEXT_CONTROL:
		if (pkt->count != 1) {
			DRM_ERROR("bad CONTEXT_CONTROL\n");
			return -EINVAL;
		}
		break;
	case PACKET3_INDEX_TYPE:
	case PACKET3_NUM_INSTANCES:
		if (pkt->count) {
			DRM_ERROR("bad INDEX_TYPE/NUM_INSTANCES\n");
			return -EINVAL;
		}
		break;
	case PACKET3_DRAW_INDEX:
		if (pkt->count != 3) {
			DRM_ERROR("bad DRAW_INDEX\n");
			return -EINVAL;
		}
		r = r600_cs_packet_next_reloc(p, &reloc);
		if (r) {
			DRM_ERROR("bad DRAW_INDEX\n");
			return -EINVAL;
		}
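		/* relocate the index buffer address: add the reloc's GPU offset,
		 * low 32 bits into the first dword, upper 8 bits into the second */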
		ib[idx+0] = idx_value + (u32)(reloc->lobj.gpu_offset & 0xffffffff);
		ib[idx+1] += upper_32_bits(reloc->lobj.gpu_offset) & 0xff;
		break;
	case PACKET3_DRAW_INDEX_AUTO:
		if (pkt->count != 1) {
			DRM_ERROR("bad DRAW_INDEX_AUTO\n");
			return -EINVAL;
		}
		break;
	case PACKET3_DRAW_INDEX_IMMD_BE:
	case PACKET3_DRAW_INDEX_IMMD:
		if (pkt->count < 2) {
			DRM_ERROR("bad DRAW_INDEX_IMMD\n");
			return -EINVAL;
		}
		break;
	case PACKET3_WAIT_REG_MEM:
		if (pkt->count != 5) {
			DRM_ERROR("bad WAIT_REG_MEM\n");
			return -EINVAL;
		}
		/* bit 4 is reg (0) or mem (1) */
		if (idx_value & 0x10) {
			r = r600_cs_packet_next_reloc(p, &reloc);
			if (r) {
				DRM_ERROR("bad WAIT_REG_MEM\n");
				return -EINVAL;
			}
			ib[idx+1] += (u32)(reloc->lobj.gpu_offset & 0xffffffff);
			ib[idx+2] += upper_32_bits(reloc->lobj.gpu_offset) & 0xff;
		}
		break;
	case PACKET3_SURFACE_SYNC:
		if (pkt->count != 3) {
			DRM_ERROR("bad SURFACE_SYNC\n");
			return -EINVAL;
		}
		/* 0xffffffff/0x0 is flush all cache flag */
		if (radeon_get_ib_value(p, idx + 1) != 0xffffffff ||
		    radeon_get_ib_value(p, idx + 2) != 0) {
			r = r600_cs_packet_next_reloc(p, &reloc);
			if (r) {
				DRM_ERROR("bad SURFACE_SYNC\n");
				return -EINVAL;
			}
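			/* the sync base address is programmed in 256-byte units,
			 * hence the >> 8 */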
			ib[idx+2] += (u32)((reloc->lobj.gpu_offset >> 8) & 0xffffffff);
		}
		break;
	case PACKET3_EVENT_WRITE:
		if (pkt->count != 2 && pkt->count != 0) {
			DRM_ERROR("bad EVENT_WRITE\n");
			return -EINVAL;
		}
		if (pkt->count) {
			r = r600_cs_packet_next_reloc(p, &reloc);
			if (r) {
				DRM_ERROR("bad EVENT_WRITE\n");
				return -EINVAL;
			}
			ib[idx+1] += (u32)(reloc->lobj.gpu_offset & 0xffffffff);
			ib[idx+2] += upper_32_bits(reloc->lobj.gpu_offset) & 0xff;
		}
		break;
	case PACKET3_EVENT_WRITE_EOP:
		if (pkt->count != 4) {
			DRM_ERROR("bad EVENT_WRITE_EOP\n");
			return -EINVAL;
		}
		r = r600_cs_packet_next_reloc(p, &reloc);
		if (r) {
			DRM_ERROR("bad EVENT_WRITE\n");
			return -EINVAL;
		}
		ib[idx+1] += (u32)(reloc->lobj.gpu_offset & 0xffffffff);
		ib[idx+2] += upper_32_bits(reloc->lobj.gpu_offset) & 0xff;
		break;
	case PACKET3_SET_CONFIG_REG:
		start_reg = (idx_value << 2) + PACKET3_SET_CONFIG_REG_OFFSET;
		end_reg = 4 * pkt->count + start_reg - 4;
		if ((start_reg < PACKET3_SET_CONFIG_REG_OFFSET) ||
		    (start_reg >= PACKET3_SET_CONFIG_REG_END) ||
		    (end_reg >= PACKET3_SET_CONFIG_REG_END)) {
			DRM_ERROR("bad PACKET3_SET_CONFIG_REG\n");
			return -EINVAL;
		}
		for (i = 0; i < pkt->count; i++) {
			reg = start_reg + (4 * i);
			switch (reg) {
			case CP_COHER_BASE:
				/* use PACKET3_SURFACE_SYNC */
				return -EINVAL;
			default:
				break;
			}
		}
		break;
	case PACKET3_SET_CONTEXT_REG:
		start_reg = (idx_value << 2) + PACKET3_SET_CONTEXT_REG_OFFSET;
		end_reg = 4 * pkt->count + start_reg - 4;
		if ((start_reg < PACKET3_SET_CONTEXT_REG_OFFSET) ||
		    (start_reg >= PACKET3_SET_CONTEXT_REG_END) ||
		    (end_reg >= PACKET3_SET_CONTEXT_REG_END)) {
			DRM_ERROR("bad PACKET3_SET_CONTEXT_REG\n");
			return -EINVAL;
		}
		for (i = 0; i < pkt->count; i++) {
			reg = start_reg + (4 * i);
			switch (reg) {
			case DB_DEPTH_BASE:
			case CB_COLOR0_BASE:
			case CB_COLOR1_BASE:
			case CB_COLOR2_BASE:
			case CB_COLOR3_BASE:
			case CB_COLOR4_BASE:
			case CB_COLOR5_BASE:
			case CB_COLOR6_BASE:
			case CB_COLOR7_BASE:
			case SQ_PGM_START_FS:
			case SQ_PGM_START_ES:
			case SQ_PGM_START_VS:
			case SQ_PGM_START_GS:
			case SQ_PGM_START_PS:
				r = r600_cs_packet_next_reloc(p, &reloc);
				if (r) {
					DRM_ERROR("bad SET_CONTEXT_REG "
						  "0x%04X\n", reg);
					return -EINVAL;
				}
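				/* depth/color/shader base registers hold
				 * 256-byte-aligned addresses, so program the
				 * GPU offset >> 8 */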
				ib[idx+1+i] += (u32)((reloc->lobj.gpu_offset >> 8) & 0xffffffff);
				break;
			case VGT_DMA_BASE:
			case VGT_DMA_BASE_HI:
				/* These should be handled by DRAW_INDEX packet 3 */
			case VGT_STRMOUT_BASE_OFFSET_0:
			case VGT_STRMOUT_BASE_OFFSET_1:
			case VGT_STRMOUT_BASE_OFFSET_2:
			case VGT_STRMOUT_BASE_OFFSET_3:
			case VGT_STRMOUT_BASE_OFFSET_HI_0:
			case VGT_STRMOUT_BASE_OFFSET_HI_1:
			case VGT_STRMOUT_BASE_OFFSET_HI_2:
			case VGT_STRMOUT_BASE_OFFSET_HI_3:
			case VGT_STRMOUT_BUFFER_BASE_0:
			case VGT_STRMOUT_BUFFER_BASE_1:
			case VGT_STRMOUT_BUFFER_BASE_2:
			case VGT_STRMOUT_BUFFER_BASE_3:
			case VGT_STRMOUT_BUFFER_OFFSET_0:
			case VGT_STRMOUT_BUFFER_OFFSET_1:
			case VGT_STRMOUT_BUFFER_OFFSET_2:
			case VGT_STRMOUT_BUFFER_OFFSET_3:
				/* These should be handled by STRMOUT_BUFFER packet 3 */
				DRM_ERROR("bad context reg: 0x%08x\n", reg);
				return -EINVAL;
			default:
				break;
			}
		}
		break;
	case PACKET3_SET_RESOURCE:
		if (pkt->count % 7) {
			DRM_ERROR("bad SET_RESOURCE\n");
			return -EINVAL;
		}
		start_reg = (idx_value << 2) + PACKET3_SET_RESOURCE_OFFSET;
		end_reg = 4 * pkt->count + start_reg - 4;
		if ((start_reg < PACKET3_SET_RESOURCE_OFFSET) ||
		    (start_reg >= PACKET3_SET_RESOURCE_END) ||
		    (end_reg >= PACKET3_SET_RESOURCE_END)) {
			DRM_ERROR("bad SET_RESOURCE\n");
			return -EINVAL;
		}
		for (i = 0; i < (pkt->count / 7); i++) {
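			/* each resource descriptor is 7 dwords; the type field in
			 * its last dword says whether it describes a texture or a
			 * vertex buffer */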
			switch (G__SQ_VTX_CONSTANT_TYPE(radeon_get_ib_value(p, idx+(i*7)+6+1))) {
			case SQ_TEX_VTX_VALID_TEXTURE:
				/* tex base */
				r = r600_cs_packet_next_reloc(p, &reloc);
				if (r) {
					DRM_ERROR("bad SET_RESOURCE\n");
					return -EINVAL;
				}
				ib[idx+1+(i*7)+2] += (u32)((reloc->lobj.gpu_offset >> 8) & 0xffffffff);
				/* tex mip base */
				r = r600_cs_packet_next_reloc(p, &reloc);
				if (r) {
					DRM_ERROR("bad SET_RESOURCE\n");
					return -EINVAL;
				}
				ib[idx+1+(i*7)+3] += (u32)((reloc->lobj.gpu_offset >> 8) & 0xffffffff);
				break;
			case SQ_TEX_VTX_VALID_BUFFER:
				/* vtx base */
				r = r600_cs_packet_next_reloc(p, &reloc);
				if (r) {
					DRM_ERROR("bad SET_RESOURCE\n");
					return -EINVAL;
				}
				ib[idx+1+(i*7)+0] += (u32)((reloc->lobj.gpu_offset) & 0xffffffff);
				ib[idx+1+(i*7)+2] += upper_32_bits(reloc->lobj.gpu_offset) & 0xff;
				break;
			case SQ_TEX_VTX_INVALID_TEXTURE:
			case SQ_TEX_VTX_INVALID_BUFFER:
			default:
				DRM_ERROR("bad SET_RESOURCE\n");
				return -EINVAL;
			}
		}
		break;
	case PACKET3_SET_ALU_CONST:
		start_reg = (idx_value << 2) + PACKET3_SET_ALU_CONST_OFFSET;
		end_reg = 4 * pkt->count + start_reg - 4;
		if ((start_reg < PACKET3_SET_ALU_CONST_OFFSET) ||
		    (start_reg >= PACKET3_SET_ALU_CONST_END) ||
		    (end_reg >= PACKET3_SET_ALU_CONST_END)) {
			DRM_ERROR("bad SET_ALU_CONST\n");
			return -EINVAL;
		}
		break;
	case PACKET3_SET_BOOL_CONST:
		start_reg = (idx_value << 2) + PACKET3_SET_BOOL_CONST_OFFSET;
		end_reg = 4 * pkt->count + start_reg - 4;
		if ((start_reg < PACKET3_SET_BOOL_CONST_OFFSET) ||
		    (start_reg >= PACKET3_SET_BOOL_CONST_END) ||
		    (end_reg >= PACKET3_SET_BOOL_CONST_END)) {
			DRM_ERROR("bad SET_BOOL_CONST\n");
			return -EINVAL;
		}
		break;
	case PACKET3_SET_LOOP_CONST:
		start_reg = (idx_value << 2) + PACKET3_SET_LOOP_CONST_OFFSET;
		end_reg = 4 * pkt->count + start_reg - 4;
		if ((start_reg < PACKET3_SET_LOOP_CONST_OFFSET) ||
		    (start_reg >= PACKET3_SET_LOOP_CONST_END) ||
		    (end_reg >= PACKET3_SET_LOOP_CONST_END)) {
			DRM_ERROR("bad SET_LOOP_CONST\n");
			return -EINVAL;
		}
		break;
	case PACKET3_SET_CTL_CONST:
		start_reg = (idx_value << 2) + PACKET3_SET_CTL_CONST_OFFSET;
		end_reg = 4 * pkt->count + start_reg - 4;
		if ((start_reg < PACKET3_SET_CTL_CONST_OFFSET) ||
		    (start_reg >= PACKET3_SET_CTL_CONST_END) ||
		    (end_reg >= PACKET3_SET_CTL_CONST_END)) {
			DRM_ERROR("bad SET_CTL_CONST\n");
			return -EINVAL;
		}
		break;
	case PACKET3_SET_SAMPLER:
		if (pkt->count % 3) {
			DRM_ERROR("bad SET_SAMPLER\n");
			return -EINVAL;
		}
		start_reg = (idx_value << 2) + PACKET3_SET_SAMPLER_OFFSET;
		end_reg = 4 * pkt->count + start_reg - 4;
		if ((start_reg < PACKET3_SET_SAMPLER_OFFSET) ||
		    (start_reg >= PACKET3_SET_SAMPLER_END) ||
		    (end_reg >= PACKET3_SET_SAMPLER_END)) {
			DRM_ERROR("bad SET_SAMPLER\n");
			return -EINVAL;
		}
		break;
	case PACKET3_SURFACE_BASE_UPDATE:
		if (p->family >= CHIP_RV770 || p->family == CHIP_R600) {
			DRM_ERROR("bad SURFACE_BASE_UPDATE\n");
			return -EINVAL;
		}
		if (pkt->count) {
			DRM_ERROR("bad SURFACE_BASE_UPDATE\n");
			return -EINVAL;
		}
		break;
	case PACKET3_NOP:
		break;
	default:
		DRM_ERROR("Packet3 opcode %x not supported\n", pkt->opcode);
		return -EINVAL;
	}
	return 0;
}

int r600_cs_parse(struct radeon_cs_parser *p)
{
	struct radeon_cs_packet pkt;
	int r;

	do {
		r = r600_cs_packet_parse(p, &pkt, p->idx);
		if (r) {
			return r;
		}
		p->idx += pkt.count + 2;
		switch (pkt.type) {
		case PACKET_TYPE0:
			r = r600_cs_parse_packet0(p, &pkt);
			break;
		case PACKET_TYPE2:
			break;
		case PACKET_TYPE3:
			r = r600_packet3_check(p, &pkt);
			break;
		default:
			DRM_ERROR("Unknown packet type %d !\n", pkt.type);
			return -EINVAL;
		}
		if (r) {
			return r;
		}
	} while (p->idx < p->chunks[p->chunk_ib_idx].length_dw);
#if 0
	for (r = 0; r < p->ib->length_dw; r++) {
		printk(KERN_INFO "%05d 0x%08X\n", r, p->ib->ptr[r]);
		mdelay(1);
	}
#endif
	return 0;
}

static int r600_cs_parser_relocs_legacy(struct radeon_cs_parser *p)
{
	if (p->chunk_relocs_idx == -1) {
		return 0;
	}
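	/*
	 * The legacy path never validates bos, so a single scratch reloc
	 * entry is enough: r600_cs_packet_next_reloc_nomm() rewrites it with
	 * the offsets found in the relocation chunk on every use.
	 */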
	p->relocs = kcalloc(1, sizeof(struct radeon_cs_reloc), GFP_KERNEL);
	if (p->relocs == NULL) {
		return -ENOMEM;
	}
	return 0;
}

/**
 * r600_cs_parser_fini() - clean parser states
 * @parser: parser structure holding parsing context.
 * @error: error number
 *
 * If error is set, then unvalidate the buffers, otherwise just free the memory
 * used by the parsing context.
 **/
static void r600_cs_parser_fini(struct radeon_cs_parser *parser, int error)
{
	unsigned i;

	kfree(parser->relocs);
	for (i = 0; i < parser->nchunks; i++) {
		kfree(parser->chunks[i].kdata);
	}
	kfree(parser->chunks);
	kfree(parser->chunks_array);
}

int r600_cs_legacy(struct drm_device *dev, void *data, struct drm_file *filp,
		   unsigned family, u32 *ib, int *l)
{
	struct radeon_cs_parser parser;
	struct radeon_cs_chunk *ib_chunk;
	struct radeon_ib fake_ib;
	int r;

	/* initialize parser */
	memset(&parser, 0, sizeof(struct radeon_cs_parser));
	parser.filp = filp;
	parser.rdev = NULL;
	parser.family = family;
	parser.ib = &fake_ib;
	fake_ib.ptr = ib;
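	/* wrap the caller-supplied buffer in a fake IB so the shared checker
	 * code above can patch relocations into it in place */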
	r = radeon_cs_parser_init(&parser, data);
	if (r) {
		DRM_ERROR("Failed to initialize parser !\n");
		r600_cs_parser_fini(&parser, r);
		return r;
	}
	r = r600_cs_parser_relocs_legacy(&parser);
	if (r) {
		DRM_ERROR("Failed to parse relocation !\n");
		r600_cs_parser_fini(&parser, r);
		return r;
	}
	/* Copy the packet into the IB, the parser will read from the
	 * input memory (cached) and write to the IB (which can be
	 * uncached). */
	ib_chunk = &parser.chunks[parser.chunk_ib_idx];
	parser.ib->length_dw = ib_chunk->length_dw;
	*l = parser.ib->length_dw;
	r = r600_cs_parse(&parser);
	if (r) {
		DRM_ERROR("Invalid command stream !\n");
		r600_cs_parser_fini(&parser, r);
		return r;
	}
	r = radeon_cs_finish_pages(&parser);
	if (r) {
		DRM_ERROR("Invalid command stream !\n");
		r600_cs_parser_fini(&parser, r);
		return r;
	}
	r600_cs_parser_fini(&parser, r);
	return r;
}

void r600_cs_legacy_init(void)
{
	r600_cs_packet_next_reloc = &r600_cs_packet_next_reloc_nomm;
}