r600_cs.c 18 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657
  1. /*
  2. * Copyright 2008 Advanced Micro Devices, Inc.
  3. * Copyright 2008 Red Hat Inc.
  4. * Copyright 2009 Jerome Glisse.
  5. *
  6. * Permission is hereby granted, free of charge, to any person obtaining a
  7. * copy of this software and associated documentation files (the "Software"),
  8. * to deal in the Software without restriction, including without limitation
  9. * the rights to use, copy, modify, merge, publish, distribute, sublicense,
  10. * and/or sell copies of the Software, and to permit persons to whom the
  11. * Software is furnished to do so, subject to the following conditions:
  12. *
  13. * The above copyright notice and this permission notice shall be included in
  14. * all copies or substantial portions of the Software.
  15. *
  16. * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
  17. * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
  18. * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
  19. * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
  20. * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
  21. * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
  22. * OTHER DEALINGS IN THE SOFTWARE.
  23. *
  24. * Authors: Dave Airlie
  25. * Alex Deucher
  26. * Jerome Glisse
  27. */
  28. #include "drmP.h"
  29. #include "radeon.h"
  30. #include "r600d.h"
  31. #include "avivod.h"
  32. static int r600_cs_packet_next_reloc_mm(struct radeon_cs_parser *p,
  33. struct radeon_cs_reloc **cs_reloc);
  34. static int r600_cs_packet_next_reloc_nomm(struct radeon_cs_parser *p,
  35. struct radeon_cs_reloc **cs_reloc);
  36. typedef int (*next_reloc_t)(struct radeon_cs_parser*, struct radeon_cs_reloc**);
  37. static next_reloc_t r600_cs_packet_next_reloc = &r600_cs_packet_next_reloc_mm;
  38. /**
  39. * r600_cs_packet_parse() - parse cp packet and point ib index to next packet
  40. * @parser: parser structure holding parsing context.
  41. * @pkt: where to store packet informations
  42. *
  43. * Assume that chunk_ib_index is properly set. Will return -EINVAL
  44. * if packet is bigger than remaining ib size. or if packets is unknown.
  45. **/
  46. int r600_cs_packet_parse(struct radeon_cs_parser *p,
  47. struct radeon_cs_packet *pkt,
  48. unsigned idx)
  49. {
  50. struct radeon_cs_chunk *ib_chunk = &p->chunks[p->chunk_ib_idx];
  51. uint32_t header;
  52. if (idx >= ib_chunk->length_dw) {
  53. DRM_ERROR("Can not parse packet at %d after CS end %d !\n",
  54. idx, ib_chunk->length_dw);
  55. return -EINVAL;
  56. }
  57. header = ib_chunk->kdata[idx];
  58. pkt->idx = idx;
  59. pkt->type = CP_PACKET_GET_TYPE(header);
  60. pkt->count = CP_PACKET_GET_COUNT(header);
  61. pkt->one_reg_wr = 0;
  62. switch (pkt->type) {
  63. case PACKET_TYPE0:
  64. pkt->reg = CP_PACKET0_GET_REG(header);
  65. break;
  66. case PACKET_TYPE3:
  67. pkt->opcode = CP_PACKET3_GET_OPCODE(header);
  68. break;
  69. case PACKET_TYPE2:
  70. pkt->count = -1;
  71. break;
  72. default:
  73. DRM_ERROR("Unknown packet type %d at %d !\n", pkt->type, idx);
  74. return -EINVAL;
  75. }
  76. if ((pkt->count + 1 + pkt->idx) >= ib_chunk->length_dw) {
  77. DRM_ERROR("Packet (%d:%d:%d) end after CS buffer (%d) !\n",
  78. pkt->idx, pkt->type, pkt->count, ib_chunk->length_dw);
  79. return -EINVAL;
  80. }
  81. return 0;
  82. }
  83. /**
  84. * r600_cs_packet_next_reloc_mm() - parse next packet which should be reloc packet3
  85. * @parser: parser structure holding parsing context.
  86. * @data: pointer to relocation data
  87. * @offset_start: starting offset
  88. * @offset_mask: offset mask (to align start offset on)
  89. * @reloc: reloc informations
  90. *
  91. * Check next packet is relocation packet3, do bo validation and compute
  92. * GPU offset using the provided start.
  93. **/
  94. static int r600_cs_packet_next_reloc_mm(struct radeon_cs_parser *p,
  95. struct radeon_cs_reloc **cs_reloc)
  96. {
  97. struct radeon_cs_chunk *ib_chunk;
  98. struct radeon_cs_chunk *relocs_chunk;
  99. struct radeon_cs_packet p3reloc;
  100. unsigned idx;
  101. int r;
  102. if (p->chunk_relocs_idx == -1) {
  103. DRM_ERROR("No relocation chunk !\n");
  104. return -EINVAL;
  105. }
  106. *cs_reloc = NULL;
  107. ib_chunk = &p->chunks[p->chunk_ib_idx];
  108. relocs_chunk = &p->chunks[p->chunk_relocs_idx];
  109. r = r600_cs_packet_parse(p, &p3reloc, p->idx);
  110. if (r) {
  111. return r;
  112. }
  113. p->idx += p3reloc.count + 2;
  114. if (p3reloc.type != PACKET_TYPE3 || p3reloc.opcode != PACKET3_NOP) {
  115. DRM_ERROR("No packet3 for relocation for packet at %d.\n",
  116. p3reloc.idx);
  117. return -EINVAL;
  118. }
  119. idx = ib_chunk->kdata[p3reloc.idx + 1];
  120. if (idx >= relocs_chunk->length_dw) {
  121. DRM_ERROR("Relocs at %d after relocations chunk end %d !\n",
  122. idx, relocs_chunk->length_dw);
  123. return -EINVAL;
  124. }
  125. /* FIXME: we assume reloc size is 4 dwords */
  126. *cs_reloc = p->relocs_ptr[(idx / 4)];
  127. return 0;
  128. }
  129. /**
  130. * r600_cs_packet_next_reloc_nomm() - parse next packet which should be reloc packet3
  131. * @parser: parser structure holding parsing context.
  132. * @data: pointer to relocation data
  133. * @offset_start: starting offset
  134. * @offset_mask: offset mask (to align start offset on)
  135. * @reloc: reloc informations
  136. *
  137. * Check next packet is relocation packet3, do bo validation and compute
  138. * GPU offset using the provided start.
  139. **/
  140. static int r600_cs_packet_next_reloc_nomm(struct radeon_cs_parser *p,
  141. struct radeon_cs_reloc **cs_reloc)
  142. {
  143. struct radeon_cs_chunk *ib_chunk;
  144. struct radeon_cs_chunk *relocs_chunk;
  145. struct radeon_cs_packet p3reloc;
  146. unsigned idx;
  147. int r;
  148. if (p->chunk_relocs_idx == -1) {
  149. DRM_ERROR("No relocation chunk !\n");
  150. return -EINVAL;
  151. }
  152. *cs_reloc = NULL;
  153. ib_chunk = &p->chunks[p->chunk_ib_idx];
  154. relocs_chunk = &p->chunks[p->chunk_relocs_idx];
  155. r = r600_cs_packet_parse(p, &p3reloc, p->idx);
  156. if (r) {
  157. return r;
  158. }
  159. p->idx += p3reloc.count + 2;
  160. if (p3reloc.type != PACKET_TYPE3 || p3reloc.opcode != PACKET3_NOP) {
  161. DRM_ERROR("No packet3 for relocation for packet at %d.\n",
  162. p3reloc.idx);
  163. return -EINVAL;
  164. }
  165. idx = ib_chunk->kdata[p3reloc.idx + 1];
  166. if (idx >= relocs_chunk->length_dw) {
  167. DRM_ERROR("Relocs at %d after relocations chunk end %d !\n",
  168. idx, relocs_chunk->length_dw);
  169. return -EINVAL;
  170. }
  171. *cs_reloc = &p->relocs[0];
  172. (*cs_reloc)->lobj.gpu_offset = (u64)relocs_chunk->kdata[idx + 3] << 32;
  173. (*cs_reloc)->lobj.gpu_offset |= relocs_chunk->kdata[idx + 0];
  174. return 0;
  175. }
  176. static int r600_packet0_check(struct radeon_cs_parser *p,
  177. struct radeon_cs_packet *pkt,
  178. unsigned idx, unsigned reg)
  179. {
  180. switch (reg) {
  181. case AVIVO_D1MODE_VLINE_START_END:
  182. case AVIVO_D2MODE_VLINE_START_END:
  183. break;
  184. default:
  185. printk(KERN_ERR "Forbidden register 0x%04X in cs at %d\n",
  186. reg, idx);
  187. return -EINVAL;
  188. }
  189. return 0;
  190. }
  191. static int r600_cs_parse_packet0(struct radeon_cs_parser *p,
  192. struct radeon_cs_packet *pkt)
  193. {
  194. unsigned reg, i;
  195. unsigned idx;
  196. int r;
  197. idx = pkt->idx + 1;
  198. reg = pkt->reg;
  199. for (i = 0; i <= pkt->count; i++, idx++, reg += 4) {
  200. r = r600_packet0_check(p, pkt, idx, reg);
  201. if (r) {
  202. return r;
  203. }
  204. }
  205. return 0;
  206. }
  207. static int r600_packet3_check(struct radeon_cs_parser *p,
  208. struct radeon_cs_packet *pkt)
  209. {
  210. struct radeon_cs_chunk *ib_chunk;
  211. struct radeon_cs_reloc *reloc;
  212. volatile u32 *ib;
  213. unsigned idx;
  214. unsigned i;
  215. unsigned start_reg, end_reg, reg;
  216. int r;
  217. ib = p->ib->ptr;
  218. ib_chunk = &p->chunks[p->chunk_ib_idx];
  219. idx = pkt->idx + 1;
  220. switch (pkt->opcode) {
  221. case PACKET3_START_3D_CMDBUF:
  222. if (p->family >= CHIP_RV770 || pkt->count) {
  223. DRM_ERROR("bad START_3D\n");
  224. return -EINVAL;
  225. }
  226. break;
  227. case PACKET3_CONTEXT_CONTROL:
  228. if (pkt->count != 1) {
  229. DRM_ERROR("bad CONTEXT_CONTROL\n");
  230. return -EINVAL;
  231. }
  232. break;
  233. case PACKET3_INDEX_TYPE:
  234. case PACKET3_NUM_INSTANCES:
  235. if (pkt->count) {
  236. DRM_ERROR("bad INDEX_TYPE/NUM_INSTANCES\n");
  237. return -EINVAL;
  238. }
  239. break;
  240. case PACKET3_DRAW_INDEX:
  241. if (pkt->count != 3) {
  242. DRM_ERROR("bad DRAW_INDEX\n");
  243. return -EINVAL;
  244. }
  245. r = r600_cs_packet_next_reloc(p, &reloc);
  246. if (r) {
  247. DRM_ERROR("bad DRAW_INDEX\n");
  248. return -EINVAL;
  249. }
  250. ib[idx+0] += (u32)(reloc->lobj.gpu_offset & 0xffffffff);
  251. ib[idx+1] = upper_32_bits(reloc->lobj.gpu_offset) & 0xff;
  252. break;
  253. case PACKET3_DRAW_INDEX_AUTO:
  254. if (pkt->count != 1) {
  255. DRM_ERROR("bad DRAW_INDEX_AUTO\n");
  256. return -EINVAL;
  257. }
  258. break;
  259. case PACKET3_DRAW_INDEX_IMMD_BE:
  260. case PACKET3_DRAW_INDEX_IMMD:
  261. if (pkt->count < 2) {
  262. DRM_ERROR("bad DRAW_INDEX_IMMD\n");
  263. return -EINVAL;
  264. }
  265. break;
  266. case PACKET3_WAIT_REG_MEM:
  267. if (pkt->count != 5) {
  268. DRM_ERROR("bad WAIT_REG_MEM\n");
  269. return -EINVAL;
  270. }
  271. /* bit 4 is reg (0) or mem (1) */
  272. if (ib_chunk->kdata[idx+0] & 0x10) {
  273. r = r600_cs_packet_next_reloc(p, &reloc);
  274. if (r) {
  275. DRM_ERROR("bad WAIT_REG_MEM\n");
  276. return -EINVAL;
  277. }
  278. ib[idx+1] += (u32)(reloc->lobj.gpu_offset & 0xffffffff);
  279. ib[idx+2] = upper_32_bits(reloc->lobj.gpu_offset) & 0xff;
  280. }
  281. break;
  282. case PACKET3_SURFACE_SYNC:
  283. if (pkt->count != 3) {
  284. DRM_ERROR("bad SURFACE_SYNC\n");
  285. return -EINVAL;
  286. }
  287. /* 0xffffffff/0x0 is flush all cache flag */
  288. if (ib_chunk->kdata[idx+1] != 0xffffffff ||
  289. ib_chunk->kdata[idx+2] != 0) {
  290. r = r600_cs_packet_next_reloc(p, &reloc);
  291. if (r) {
  292. DRM_ERROR("bad SURFACE_SYNC\n");
  293. return -EINVAL;
  294. }
  295. ib[idx+2] += (u32)((reloc->lobj.gpu_offset >> 8) & 0xffffffff);
  296. }
  297. break;
  298. case PACKET3_EVENT_WRITE:
  299. if (pkt->count != 2 && pkt->count != 0) {
  300. DRM_ERROR("bad EVENT_WRITE\n");
  301. return -EINVAL;
  302. }
  303. if (pkt->count) {
  304. r = r600_cs_packet_next_reloc(p, &reloc);
  305. if (r) {
  306. DRM_ERROR("bad EVENT_WRITE\n");
  307. return -EINVAL;
  308. }
  309. ib[idx+1] += (u32)(reloc->lobj.gpu_offset & 0xffffffff);
  310. ib[idx+2] |= upper_32_bits(reloc->lobj.gpu_offset) & 0xff;
  311. }
  312. break;
  313. case PACKET3_EVENT_WRITE_EOP:
  314. if (pkt->count != 4) {
  315. DRM_ERROR("bad EVENT_WRITE_EOP\n");
  316. return -EINVAL;
  317. }
  318. r = r600_cs_packet_next_reloc(p, &reloc);
  319. if (r) {
  320. DRM_ERROR("bad EVENT_WRITE\n");
  321. return -EINVAL;
  322. }
  323. ib[idx+1] += (u32)(reloc->lobj.gpu_offset & 0xffffffff);
  324. ib[idx+2] |= upper_32_bits(reloc->lobj.gpu_offset) & 0xff;
  325. break;
  326. case PACKET3_SET_CONFIG_REG:
  327. start_reg = (ib[idx+0] << 2) + PACKET3_SET_CONFIG_REG_OFFSET;
  328. end_reg = 4 * pkt->count + start_reg - 4;
  329. if ((start_reg < PACKET3_SET_CONFIG_REG_OFFSET) ||
  330. (start_reg >= PACKET3_SET_CONFIG_REG_END) ||
  331. (end_reg >= PACKET3_SET_CONFIG_REG_END)) {
  332. DRM_ERROR("bad PACKET3_SET_CONFIG_REG\n");
  333. return -EINVAL;
  334. }
  335. for (i = 0; i < pkt->count; i++) {
  336. reg = start_reg + (4 * i);
  337. switch (reg) {
  338. case CP_COHER_BASE:
  339. /* use PACKET3_SURFACE_SYNC */
  340. return -EINVAL;
  341. default:
  342. break;
  343. }
  344. }
  345. break;
  346. case PACKET3_SET_CONTEXT_REG:
  347. start_reg = (ib[idx+0] << 2) + PACKET3_SET_CONTEXT_REG_OFFSET;
  348. end_reg = 4 * pkt->count + start_reg - 4;
  349. if ((start_reg < PACKET3_SET_CONTEXT_REG_OFFSET) ||
  350. (start_reg >= PACKET3_SET_CONTEXT_REG_END) ||
  351. (end_reg >= PACKET3_SET_CONTEXT_REG_END)) {
  352. DRM_ERROR("bad PACKET3_SET_CONTEXT_REG\n");
  353. return -EINVAL;
  354. }
  355. for (i = 0; i < pkt->count; i++) {
  356. reg = start_reg + (4 * i);
  357. switch (reg) {
  358. case DB_DEPTH_BASE:
  359. case CB_COLOR0_BASE:
  360. case CB_COLOR1_BASE:
  361. case CB_COLOR2_BASE:
  362. case CB_COLOR3_BASE:
  363. case CB_COLOR4_BASE:
  364. case CB_COLOR5_BASE:
  365. case CB_COLOR6_BASE:
  366. case CB_COLOR7_BASE:
  367. case SQ_PGM_START_FS:
  368. case SQ_PGM_START_ES:
  369. case SQ_PGM_START_VS:
  370. case SQ_PGM_START_GS:
  371. case SQ_PGM_START_PS:
  372. r = r600_cs_packet_next_reloc(p, &reloc);
  373. if (r) {
  374. DRM_ERROR("bad SET_CONTEXT_REG "
  375. "0x%04X\n", reg);
  376. return -EINVAL;
  377. }
  378. ib[idx+1+i] += (u32)((reloc->lobj.gpu_offset >> 8) & 0xffffffff);
  379. break;
  380. case VGT_DMA_BASE:
  381. case VGT_DMA_BASE_HI:
  382. /* These should be handled by DRAW_INDEX packet 3 */
  383. case VGT_STRMOUT_BASE_OFFSET_0:
  384. case VGT_STRMOUT_BASE_OFFSET_1:
  385. case VGT_STRMOUT_BASE_OFFSET_2:
  386. case VGT_STRMOUT_BASE_OFFSET_3:
  387. case VGT_STRMOUT_BASE_OFFSET_HI_0:
  388. case VGT_STRMOUT_BASE_OFFSET_HI_1:
  389. case VGT_STRMOUT_BASE_OFFSET_HI_2:
  390. case VGT_STRMOUT_BASE_OFFSET_HI_3:
  391. case VGT_STRMOUT_BUFFER_BASE_0:
  392. case VGT_STRMOUT_BUFFER_BASE_1:
  393. case VGT_STRMOUT_BUFFER_BASE_2:
  394. case VGT_STRMOUT_BUFFER_BASE_3:
  395. case VGT_STRMOUT_BUFFER_OFFSET_0:
  396. case VGT_STRMOUT_BUFFER_OFFSET_1:
  397. case VGT_STRMOUT_BUFFER_OFFSET_2:
  398. case VGT_STRMOUT_BUFFER_OFFSET_3:
  399. /* These should be handled by STRMOUT_BUFFER packet 3 */
  400. DRM_ERROR("bad context reg: 0x%08x\n", reg);
  401. return -EINVAL;
  402. default:
  403. break;
  404. }
  405. }
  406. break;
  407. case PACKET3_SET_RESOURCE:
  408. if (pkt->count % 7) {
  409. DRM_ERROR("bad SET_RESOURCE\n");
  410. return -EINVAL;
  411. }
  412. start_reg = (ib[idx+0] << 2) + PACKET3_SET_RESOURCE_OFFSET;
  413. end_reg = 4 * pkt->count + start_reg - 4;
  414. if ((start_reg < PACKET3_SET_RESOURCE_OFFSET) ||
  415. (start_reg >= PACKET3_SET_RESOURCE_END) ||
  416. (end_reg >= PACKET3_SET_RESOURCE_END)) {
  417. DRM_ERROR("bad SET_RESOURCE\n");
  418. return -EINVAL;
  419. }
  420. for (i = 0; i < (pkt->count / 7); i++) {
  421. switch (G__SQ_VTX_CONSTANT_TYPE(ib[idx+(i*7)+6+1])) {
  422. case SQ_TEX_VTX_VALID_TEXTURE:
  423. /* tex base */
  424. r = r600_cs_packet_next_reloc(p, &reloc);
  425. if (r) {
  426. DRM_ERROR("bad SET_RESOURCE\n");
  427. return -EINVAL;
  428. }
  429. ib[idx+1+(i*7)+2] += (u32)((reloc->lobj.gpu_offset >> 8) & 0xffffffff);
  430. /* tex mip base */
  431. r = r600_cs_packet_next_reloc(p, &reloc);
  432. if (r) {
  433. DRM_ERROR("bad SET_RESOURCE\n");
  434. return -EINVAL;
  435. }
  436. ib[idx+1+(i*7)+3] += (u32)((reloc->lobj.gpu_offset >> 8) & 0xffffffff);
  437. break;
  438. case SQ_TEX_VTX_VALID_BUFFER:
  439. /* vtx base */
  440. r = r600_cs_packet_next_reloc(p, &reloc);
  441. if (r) {
  442. DRM_ERROR("bad SET_RESOURCE\n");
  443. return -EINVAL;
  444. }
  445. ib[idx+1+(i*7)+0] += (u32)((reloc->lobj.gpu_offset) & 0xffffffff);
  446. ib[idx+1+(i*7)+2] |= upper_32_bits(reloc->lobj.gpu_offset) & 0xff;
  447. break;
  448. case SQ_TEX_VTX_INVALID_TEXTURE:
  449. case SQ_TEX_VTX_INVALID_BUFFER:
  450. default:
  451. DRM_ERROR("bad SET_RESOURCE\n");
  452. return -EINVAL;
  453. }
  454. }
  455. break;
  456. case PACKET3_SET_ALU_CONST:
  457. start_reg = (ib[idx+0] << 2) + PACKET3_SET_ALU_CONST_OFFSET;
  458. end_reg = 4 * pkt->count + start_reg - 4;
  459. if ((start_reg < PACKET3_SET_ALU_CONST_OFFSET) ||
  460. (start_reg >= PACKET3_SET_ALU_CONST_END) ||
  461. (end_reg >= PACKET3_SET_ALU_CONST_END)) {
  462. DRM_ERROR("bad SET_ALU_CONST\n");
  463. return -EINVAL;
  464. }
  465. break;
  466. case PACKET3_SET_BOOL_CONST:
  467. start_reg = (ib[idx+0] << 2) + PACKET3_SET_BOOL_CONST_OFFSET;
  468. end_reg = 4 * pkt->count + start_reg - 4;
  469. if ((start_reg < PACKET3_SET_BOOL_CONST_OFFSET) ||
  470. (start_reg >= PACKET3_SET_BOOL_CONST_END) ||
  471. (end_reg >= PACKET3_SET_BOOL_CONST_END)) {
  472. DRM_ERROR("bad SET_BOOL_CONST\n");
  473. return -EINVAL;
  474. }
  475. break;
  476. case PACKET3_SET_LOOP_CONST:
  477. start_reg = (ib[idx+0] << 2) + PACKET3_SET_LOOP_CONST_OFFSET;
  478. end_reg = 4 * pkt->count + start_reg - 4;
  479. if ((start_reg < PACKET3_SET_LOOP_CONST_OFFSET) ||
  480. (start_reg >= PACKET3_SET_LOOP_CONST_END) ||
  481. (end_reg >= PACKET3_SET_LOOP_CONST_END)) {
  482. DRM_ERROR("bad SET_LOOP_CONST\n");
  483. return -EINVAL;
  484. }
  485. break;
  486. case PACKET3_SET_CTL_CONST:
  487. start_reg = (ib[idx+0] << 2) + PACKET3_SET_CTL_CONST_OFFSET;
  488. end_reg = 4 * pkt->count + start_reg - 4;
  489. if ((start_reg < PACKET3_SET_CTL_CONST_OFFSET) ||
  490. (start_reg >= PACKET3_SET_CTL_CONST_END) ||
  491. (end_reg >= PACKET3_SET_CTL_CONST_END)) {
  492. DRM_ERROR("bad SET_CTL_CONST\n");
  493. return -EINVAL;
  494. }
  495. break;
  496. case PACKET3_SET_SAMPLER:
  497. if (pkt->count % 3) {
  498. DRM_ERROR("bad SET_SAMPLER\n");
  499. return -EINVAL;
  500. }
  501. start_reg = (ib[idx+0] << 2) + PACKET3_SET_SAMPLER_OFFSET;
  502. end_reg = 4 * pkt->count + start_reg - 4;
  503. if ((start_reg < PACKET3_SET_SAMPLER_OFFSET) ||
  504. (start_reg >= PACKET3_SET_SAMPLER_END) ||
  505. (end_reg >= PACKET3_SET_SAMPLER_END)) {
  506. DRM_ERROR("bad SET_SAMPLER\n");
  507. return -EINVAL;
  508. }
  509. break;
  510. case PACKET3_SURFACE_BASE_UPDATE:
  511. if (p->family >= CHIP_RV770 || p->family == CHIP_R600) {
  512. DRM_ERROR("bad SURFACE_BASE_UPDATE\n");
  513. return -EINVAL;
  514. }
  515. if (pkt->count) {
  516. DRM_ERROR("bad SURFACE_BASE_UPDATE\n");
  517. return -EINVAL;
  518. }
  519. break;
  520. case PACKET3_NOP:
  521. break;
  522. default:
  523. DRM_ERROR("Packet3 opcode %x not supported\n", pkt->opcode);
  524. return -EINVAL;
  525. }
  526. return 0;
  527. }
  528. int r600_cs_parse(struct radeon_cs_parser *p)
  529. {
  530. struct radeon_cs_packet pkt;
  531. int r;
  532. do {
  533. r = r600_cs_packet_parse(p, &pkt, p->idx);
  534. if (r) {
  535. return r;
  536. }
  537. p->idx += pkt.count + 2;
  538. switch (pkt.type) {
  539. case PACKET_TYPE0:
  540. r = r600_cs_parse_packet0(p, &pkt);
  541. break;
  542. case PACKET_TYPE2:
  543. break;
  544. case PACKET_TYPE3:
  545. r = r600_packet3_check(p, &pkt);
  546. break;
  547. default:
  548. DRM_ERROR("Unknown packet type %d !\n", pkt.type);
  549. return -EINVAL;
  550. }
  551. if (r) {
  552. return r;
  553. }
  554. } while (p->idx < p->chunks[p->chunk_ib_idx].length_dw);
  555. #if 0
  556. for (r = 0; r < p->ib->length_dw; r++) {
  557. printk(KERN_INFO "%05d 0x%08X\n", r, p->ib->ptr[r]);
  558. mdelay(1);
  559. }
  560. #endif
  561. return 0;
  562. }
  563. static int r600_cs_parser_relocs_legacy(struct radeon_cs_parser *p)
  564. {
  565. if (p->chunk_relocs_idx == -1) {
  566. return 0;
  567. }
  568. p->relocs = kcalloc(1, sizeof(struct radeon_cs_reloc), GFP_KERNEL);
  569. if (p->relocs == NULL) {
  570. return -ENOMEM;
  571. }
  572. return 0;
  573. }
  574. /**
  575. * cs_parser_fini() - clean parser states
  576. * @parser: parser structure holding parsing context.
  577. * @error: error number
  578. *
  579. * If error is set than unvalidate buffer, otherwise just free memory
  580. * used by parsing context.
  581. **/
  582. static void r600_cs_parser_fini(struct radeon_cs_parser *parser, int error)
  583. {
  584. unsigned i;
  585. kfree(parser->relocs);
  586. for (i = 0; i < parser->nchunks; i++) {
  587. kfree(parser->chunks[i].kdata);
  588. }
  589. kfree(parser->chunks);
  590. kfree(parser->chunks_array);
  591. }
  592. int r600_cs_legacy(struct drm_device *dev, void *data, struct drm_file *filp,
  593. unsigned family, u32 *ib, int *l)
  594. {
  595. struct radeon_cs_parser parser;
  596. struct radeon_cs_chunk *ib_chunk;
  597. struct radeon_ib fake_ib;
  598. int r;
  599. /* initialize parser */
  600. memset(&parser, 0, sizeof(struct radeon_cs_parser));
  601. parser.filp = filp;
  602. parser.rdev = NULL;
  603. parser.family = family;
  604. parser.ib = &fake_ib;
  605. fake_ib.ptr = ib;
  606. r = radeon_cs_parser_init(&parser, data);
  607. if (r) {
  608. DRM_ERROR("Failed to initialize parser !\n");
  609. r600_cs_parser_fini(&parser, r);
  610. return r;
  611. }
  612. r = r600_cs_parser_relocs_legacy(&parser);
  613. if (r) {
  614. DRM_ERROR("Failed to parse relocation !\n");
  615. r600_cs_parser_fini(&parser, r);
  616. return r;
  617. }
  618. /* Copy the packet into the IB, the parser will read from the
  619. * input memory (cached) and write to the IB (which can be
  620. * uncached). */
  621. ib_chunk = &parser.chunks[parser.chunk_ib_idx];
  622. parser.ib->length_dw = ib_chunk->length_dw;
  623. memcpy((void *)parser.ib->ptr, ib_chunk->kdata, ib_chunk->length_dw*4);
  624. *l = parser.ib->length_dw;
  625. r = r600_cs_parse(&parser);
  626. if (r) {
  627. DRM_ERROR("Invalid command stream !\n");
  628. r600_cs_parser_fini(&parser, r);
  629. return r;
  630. }
  631. r600_cs_parser_fini(&parser, r);
  632. return r;
  633. }
  634. void r600_cs_legacy_init(void)
  635. {
  636. r600_cs_packet_next_reloc = &r600_cs_packet_next_reloc_nomm;
  637. }