spu.c 15 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635
  1. /*
  2. * PS3 Platform spu routines.
  3. *
  4. * Copyright (C) 2006 Sony Computer Entertainment Inc.
  5. * Copyright 2006 Sony Corp.
  6. *
  7. * This program is free software; you can redistribute it and/or modify
  8. * it under the terms of the GNU General Public License as published by
  9. * the Free Software Foundation; version 2 of the License.
  10. *
  11. * This program is distributed in the hope that it will be useful,
  12. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  13. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
  14. * GNU General Public License for more details.
  15. *
  16. * You should have received a copy of the GNU General Public License
  17. * along with this program; if not, write to the Free Software
  18. * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
  19. */
  20. #include <linux/kernel.h>
  21. #include <linux/init.h>
  22. #include <linux/slab.h>
  23. #include <linux/mmzone.h>
  24. #include <linux/io.h>
  25. #include <linux/mm.h>
  26. #include <asm/spu.h>
  27. #include <asm/spu_priv1.h>
  28. #include <asm/lv1call.h>
  29. #include <asm/ps3.h>
  30. #include "../cell/spufs/spufs.h"
  31. #include "platform.h"
  32. /* spu_management_ops */
  33. /**
  34. * enum spe_type - Type of spe to create.
  35. * @spe_type_logical: Standard logical spe.
  36. *
  37. * For use with lv1_construct_logical_spe(). The current HV does not support
  38. * any types other than those listed.
  39. */
  40. enum spe_type {
  41. SPE_TYPE_LOGICAL = 0,
  42. };
  43. /**
  44. * struct spe_shadow - logical spe shadow register area.
  45. *
  46. * Read-only shadow of spe registers.
  47. */
  48. struct spe_shadow {
  49. u8 padding_0140[0x0140];
  50. u64 int_status_class0_RW; /* 0x0140 */
  51. u64 int_status_class1_RW; /* 0x0148 */
  52. u64 int_status_class2_RW; /* 0x0150 */
  53. u8 padding_0158[0x0610-0x0158];
  54. u64 mfc_dsisr_RW; /* 0x0610 */
  55. u8 padding_0618[0x0620-0x0618];
  56. u64 mfc_dar_RW; /* 0x0620 */
  57. u8 padding_0628[0x0800-0x0628];
  58. u64 mfc_dsipr_R; /* 0x0800 */
  59. u8 padding_0808[0x0810-0x0808];
  60. u64 mfc_lscrr_R; /* 0x0810 */
  61. u8 padding_0818[0x0c00-0x0818];
  62. u64 mfc_cer_R; /* 0x0c00 */
  63. u8 padding_0c08[0x0f00-0x0c08];
  64. u64 spe_execution_status; /* 0x0f00 */
  65. u8 padding_0f08[0x1000-0x0f08];
  66. };
  67. /**
  68. * enum spe_ex_state - Logical spe execution state.
  69. * @spe_ex_state_unexecutable: Uninitialized.
  70. * @spe_ex_state_executable: Enabled, not ready.
  71. * @spe_ex_state_executed: Ready for use.
  72. *
  73. * The execution state (status) of the logical spe as reported in
  74. * struct spe_shadow:spe_execution_status.
  75. */
  76. enum spe_ex_state {
  77. SPE_EX_STATE_UNEXECUTABLE = 0,
  78. SPE_EX_STATE_EXECUTABLE = 2,
  79. SPE_EX_STATE_EXECUTED = 3,
  80. };
  81. /**
  82. * struct priv1_cache - Cached values of priv1 registers.
  83. * @masks[]: Array of cached spe interrupt masks, indexed by class.
  84. * @sr1: Cached mfc_sr1 register.
  85. * @tclass_id: Cached mfc_tclass_id register.
  86. */
  87. struct priv1_cache {
  88. u64 masks[3];
  89. u64 sr1;
  90. u64 tclass_id;
  91. };
  92. /**
  93. * struct spu_pdata - Platform state variables.
  94. * @spe_id: HV spe id returned by lv1_construct_logical_spe().
  95. * @resource_id: HV spe resource id returned by
  96. * ps3_repository_read_spe_resource_id().
  97. * @priv2_addr: lpar address of spe priv2 area returned by
  98. * lv1_construct_logical_spe().
  99. * @shadow_addr: lpar address of spe register shadow area returned by
  100. * lv1_construct_logical_spe().
  101. * @shadow: Virtual (ioremap) address of spe register shadow area.
  102. * @cache: Cached values of priv1 registers.
  103. */
  104. struct spu_pdata {
  105. u64 spe_id;
  106. u64 resource_id;
  107. u64 priv2_addr;
  108. u64 shadow_addr;
  109. struct spe_shadow __iomem *shadow;
  110. struct priv1_cache cache;
  111. };
  112. static struct spu_pdata *spu_pdata(struct spu *spu)
  113. {
  114. return spu->pdata;
  115. }
  116. #define dump_areas(_a, _b, _c, _d, _e) \
  117. _dump_areas(_a, _b, _c, _d, _e, __func__, __LINE__)
  118. static void _dump_areas(unsigned int spe_id, unsigned long priv2,
  119. unsigned long problem, unsigned long ls, unsigned long shadow,
  120. const char* func, int line)
  121. {
  122. pr_debug("%s:%d: spe_id: %xh (%u)\n", func, line, spe_id, spe_id);
  123. pr_debug("%s:%d: priv2: %lxh\n", func, line, priv2);
  124. pr_debug("%s:%d: problem: %lxh\n", func, line, problem);
  125. pr_debug("%s:%d: ls: %lxh\n", func, line, ls);
  126. pr_debug("%s:%d: shadow: %lxh\n", func, line, shadow);
  127. }
  128. inline u64 ps3_get_spe_id(void *arg)
  129. {
  130. return spu_pdata(arg)->spe_id;
  131. }
  132. EXPORT_SYMBOL_GPL(ps3_get_spe_id);
  133. static unsigned long get_vas_id(void)
  134. {
  135. u64 id;
  136. lv1_get_logical_ppe_id(&id);
  137. lv1_get_virtual_address_space_id_of_ppe(id, &id);
  138. return id;
  139. }
  140. static int __init construct_spu(struct spu *spu)
  141. {
  142. int result;
  143. u64 unused;
  144. u64 problem_phys;
  145. u64 local_store_phys;
  146. result = lv1_construct_logical_spe(PAGE_SHIFT, PAGE_SHIFT, PAGE_SHIFT,
  147. PAGE_SHIFT, PAGE_SHIFT, get_vas_id(), SPE_TYPE_LOGICAL,
  148. &spu_pdata(spu)->priv2_addr, &problem_phys,
  149. &local_store_phys, &unused,
  150. &spu_pdata(spu)->shadow_addr,
  151. &spu_pdata(spu)->spe_id);
  152. spu->problem_phys = problem_phys;
  153. spu->local_store_phys = local_store_phys;
  154. if (result) {
  155. pr_debug("%s:%d: lv1_construct_logical_spe failed: %s\n",
  156. __func__, __LINE__, ps3_result(result));
  157. return result;
  158. }
  159. return result;
  160. }
  161. static void spu_unmap(struct spu *spu)
  162. {
  163. iounmap(spu->priv2);
  164. iounmap(spu->problem);
  165. iounmap((__force u8 __iomem *)spu->local_store);
  166. iounmap(spu_pdata(spu)->shadow);
  167. }
  168. /**
  169. * setup_areas - Map the spu regions into the address space.
  170. *
  171. * The current HV requires the spu shadow regs to be mapped with the
  172. * PTE page protection bits set as read-only (PP=3). This implementation
  173. * uses the low level __ioremap() to bypass the page protection settings
  174. * inforced by ioremap_prot() to get the needed PTE bits set for the
  175. * shadow regs.
  176. */
  177. static int __init setup_areas(struct spu *spu)
  178. {
  179. struct table {char* name; unsigned long addr; unsigned long size;};
  180. static const unsigned long shadow_flags = _PAGE_NO_CACHE | 3;
  181. spu_pdata(spu)->shadow = __ioremap(spu_pdata(spu)->shadow_addr,
  182. sizeof(struct spe_shadow),
  183. shadow_flags);
  184. if (!spu_pdata(spu)->shadow) {
  185. pr_debug("%s:%d: ioremap shadow failed\n", __func__, __LINE__);
  186. goto fail_ioremap;
  187. }
  188. spu->local_store = (__force void *)ioremap_prot(spu->local_store_phys,
  189. LS_SIZE, _PAGE_NO_CACHE);
  190. if (!spu->local_store) {
  191. pr_debug("%s:%d: ioremap local_store failed\n",
  192. __func__, __LINE__);
  193. goto fail_ioremap;
  194. }
  195. spu->problem = ioremap(spu->problem_phys,
  196. sizeof(struct spu_problem));
  197. if (!spu->problem) {
  198. pr_debug("%s:%d: ioremap problem failed\n", __func__, __LINE__);
  199. goto fail_ioremap;
  200. }
  201. spu->priv2 = ioremap(spu_pdata(spu)->priv2_addr,
  202. sizeof(struct spu_priv2));
  203. if (!spu->priv2) {
  204. pr_debug("%s:%d: ioremap priv2 failed\n", __func__, __LINE__);
  205. goto fail_ioremap;
  206. }
  207. dump_areas(spu_pdata(spu)->spe_id, spu_pdata(spu)->priv2_addr,
  208. spu->problem_phys, spu->local_store_phys,
  209. spu_pdata(spu)->shadow_addr);
  210. dump_areas(spu_pdata(spu)->spe_id, (unsigned long)spu->priv2,
  211. (unsigned long)spu->problem, (unsigned long)spu->local_store,
  212. (unsigned long)spu_pdata(spu)->shadow);
  213. return 0;
  214. fail_ioremap:
  215. spu_unmap(spu);
  216. return -ENOMEM;
  217. }
  218. static int __init setup_interrupts(struct spu *spu)
  219. {
  220. int result;
  221. result = ps3_spe_irq_setup(PS3_BINDING_CPU_ANY, spu_pdata(spu)->spe_id,
  222. 0, &spu->irqs[0]);
  223. if (result)
  224. goto fail_alloc_0;
  225. result = ps3_spe_irq_setup(PS3_BINDING_CPU_ANY, spu_pdata(spu)->spe_id,
  226. 1, &spu->irqs[1]);
  227. if (result)
  228. goto fail_alloc_1;
  229. result = ps3_spe_irq_setup(PS3_BINDING_CPU_ANY, spu_pdata(spu)->spe_id,
  230. 2, &spu->irqs[2]);
  231. if (result)
  232. goto fail_alloc_2;
  233. return result;
  234. fail_alloc_2:
  235. ps3_spe_irq_destroy(spu->irqs[1]);
  236. fail_alloc_1:
  237. ps3_spe_irq_destroy(spu->irqs[0]);
  238. fail_alloc_0:
  239. spu->irqs[0] = spu->irqs[1] = spu->irqs[2] = NO_IRQ;
  240. return result;
  241. }
  242. static int __init enable_spu(struct spu *spu)
  243. {
  244. int result;
  245. result = lv1_enable_logical_spe(spu_pdata(spu)->spe_id,
  246. spu_pdata(spu)->resource_id);
  247. if (result) {
  248. pr_debug("%s:%d: lv1_enable_logical_spe failed: %s\n",
  249. __func__, __LINE__, ps3_result(result));
  250. goto fail_enable;
  251. }
  252. result = setup_areas(spu);
  253. if (result)
  254. goto fail_areas;
  255. result = setup_interrupts(spu);
  256. if (result)
  257. goto fail_interrupts;
  258. return 0;
  259. fail_interrupts:
  260. spu_unmap(spu);
  261. fail_areas:
  262. lv1_disable_logical_spe(spu_pdata(spu)->spe_id, 0);
  263. fail_enable:
  264. return result;
  265. }
  266. static int ps3_destroy_spu(struct spu *spu)
  267. {
  268. int result;
  269. pr_debug("%s:%d spu_%d\n", __func__, __LINE__, spu->number);
  270. result = lv1_disable_logical_spe(spu_pdata(spu)->spe_id, 0);
  271. BUG_ON(result);
  272. ps3_spe_irq_destroy(spu->irqs[2]);
  273. ps3_spe_irq_destroy(spu->irqs[1]);
  274. ps3_spe_irq_destroy(spu->irqs[0]);
  275. spu->irqs[0] = spu->irqs[1] = spu->irqs[2] = NO_IRQ;
  276. spu_unmap(spu);
  277. result = lv1_destruct_logical_spe(spu_pdata(spu)->spe_id);
  278. BUG_ON(result);
  279. kfree(spu->pdata);
  280. spu->pdata = NULL;
  281. return 0;
  282. }
  283. static int __init ps3_create_spu(struct spu *spu, void *data)
  284. {
  285. int result;
  286. pr_debug("%s:%d spu_%d\n", __func__, __LINE__, spu->number);
  287. spu->pdata = kzalloc(sizeof(struct spu_pdata),
  288. GFP_KERNEL);
  289. if (!spu->pdata) {
  290. result = -ENOMEM;
  291. goto fail_malloc;
  292. }
  293. spu_pdata(spu)->resource_id = (unsigned long)data;
  294. /* Init cached reg values to HV defaults. */
  295. spu_pdata(spu)->cache.sr1 = 0x33;
  296. result = construct_spu(spu);
  297. if (result)
  298. goto fail_construct;
  299. /* For now, just go ahead and enable it. */
  300. result = enable_spu(spu);
  301. if (result)
  302. goto fail_enable;
  303. /* Make sure the spu is in SPE_EX_STATE_EXECUTED. */
  304. /* need something better here!!! */
  305. while (in_be64(&spu_pdata(spu)->shadow->spe_execution_status)
  306. != SPE_EX_STATE_EXECUTED)
  307. (void)0;
  308. return result;
  309. fail_enable:
  310. fail_construct:
  311. ps3_destroy_spu(spu);
  312. fail_malloc:
  313. return result;
  314. }
  315. static int __init ps3_enumerate_spus(int (*fn)(void *data))
  316. {
  317. int result;
  318. unsigned int num_resource_id;
  319. unsigned int i;
  320. result = ps3_repository_read_num_spu_resource_id(&num_resource_id);
  321. pr_debug("%s:%d: num_resource_id %u\n", __func__, __LINE__,
  322. num_resource_id);
  323. /*
  324. * For now, just create logical spus equal to the number
  325. * of physical spus reserved for the partition.
  326. */
  327. for (i = 0; i < num_resource_id; i++) {
  328. enum ps3_spu_resource_type resource_type;
  329. unsigned int resource_id;
  330. result = ps3_repository_read_spu_resource_id(i,
  331. &resource_type, &resource_id);
  332. if (result)
  333. break;
  334. if (resource_type == PS3_SPU_RESOURCE_TYPE_EXCLUSIVE) {
  335. result = fn((void*)(unsigned long)resource_id);
  336. if (result)
  337. break;
  338. }
  339. }
  340. if (result) {
  341. printk(KERN_WARNING "%s:%d: Error initializing spus\n",
  342. __func__, __LINE__);
  343. return result;
  344. }
  345. return num_resource_id;
  346. }
  347. static int ps3_init_affinity(void)
  348. {
  349. return 0;
  350. }
  351. /**
  352. * ps3_enable_spu - Enable SPU run control.
  353. *
  354. * An outstanding enhancement for the PS3 would be to add a guard to check
  355. * for incorrect access to the spu problem state when the spu context is
  356. * disabled. This check could be implemented with a flag added to the spu
  357. * context that would inhibit mapping problem state pages, and a routine
  358. * to unmap spu problem state pages. When the spu is enabled with
  359. * ps3_enable_spu() the flag would be set allowing pages to be mapped,
  360. * and when the spu is disabled with ps3_disable_spu() the flag would be
  361. * cleared and the mapped problem state pages would be unmapped.
  362. */
  363. static void ps3_enable_spu(struct spu_context *ctx)
  364. {
  365. }
  366. static void ps3_disable_spu(struct spu_context *ctx)
  367. {
  368. ctx->ops->runcntl_stop(ctx);
  369. }
  370. const struct spu_management_ops spu_management_ps3_ops = {
  371. .enumerate_spus = ps3_enumerate_spus,
  372. .create_spu = ps3_create_spu,
  373. .destroy_spu = ps3_destroy_spu,
  374. .enable_spu = ps3_enable_spu,
  375. .disable_spu = ps3_disable_spu,
  376. .init_affinity = ps3_init_affinity,
  377. };
  378. /* spu_priv1_ops */
  379. static void int_mask_and(struct spu *spu, int class, u64 mask)
  380. {
  381. u64 old_mask;
  382. /* are these serialized by caller??? */
  383. old_mask = spu_int_mask_get(spu, class);
  384. spu_int_mask_set(spu, class, old_mask & mask);
  385. }
  386. static void int_mask_or(struct spu *spu, int class, u64 mask)
  387. {
  388. u64 old_mask;
  389. old_mask = spu_int_mask_get(spu, class);
  390. spu_int_mask_set(spu, class, old_mask | mask);
  391. }
  392. static void int_mask_set(struct spu *spu, int class, u64 mask)
  393. {
  394. spu_pdata(spu)->cache.masks[class] = mask;
  395. lv1_set_spe_interrupt_mask(spu_pdata(spu)->spe_id, class,
  396. spu_pdata(spu)->cache.masks[class]);
  397. }
  398. static u64 int_mask_get(struct spu *spu, int class)
  399. {
  400. return spu_pdata(spu)->cache.masks[class];
  401. }
  402. static void int_stat_clear(struct spu *spu, int class, u64 stat)
  403. {
  404. /* Note that MFC_DSISR will be cleared when class1[MF] is set. */
  405. lv1_clear_spe_interrupt_status(spu_pdata(spu)->spe_id, class,
  406. stat, 0);
  407. }
  408. static u64 int_stat_get(struct spu *spu, int class)
  409. {
  410. u64 stat;
  411. lv1_get_spe_interrupt_status(spu_pdata(spu)->spe_id, class, &stat);
  412. return stat;
  413. }
  414. static void cpu_affinity_set(struct spu *spu, int cpu)
  415. {
  416. /* No support. */
  417. }
  418. static u64 mfc_dar_get(struct spu *spu)
  419. {
  420. return in_be64(&spu_pdata(spu)->shadow->mfc_dar_RW);
  421. }
  422. static void mfc_dsisr_set(struct spu *spu, u64 dsisr)
  423. {
  424. /* Nothing to do, cleared in int_stat_clear(). */
  425. }
  426. static u64 mfc_dsisr_get(struct spu *spu)
  427. {
  428. return in_be64(&spu_pdata(spu)->shadow->mfc_dsisr_RW);
  429. }
  430. static void mfc_sdr_setup(struct spu *spu)
  431. {
  432. /* Nothing to do. */
  433. }
  434. static void mfc_sr1_set(struct spu *spu, u64 sr1)
  435. {
  436. /* Check bits allowed by HV. */
  437. static const u64 allowed = ~(MFC_STATE1_LOCAL_STORAGE_DECODE_MASK
  438. | MFC_STATE1_PROBLEM_STATE_MASK);
  439. BUG_ON((sr1 & allowed) != (spu_pdata(spu)->cache.sr1 & allowed));
  440. spu_pdata(spu)->cache.sr1 = sr1;
  441. lv1_set_spe_privilege_state_area_1_register(
  442. spu_pdata(spu)->spe_id,
  443. offsetof(struct spu_priv1, mfc_sr1_RW),
  444. spu_pdata(spu)->cache.sr1);
  445. }
  446. static u64 mfc_sr1_get(struct spu *spu)
  447. {
  448. return spu_pdata(spu)->cache.sr1;
  449. }
  450. static void mfc_tclass_id_set(struct spu *spu, u64 tclass_id)
  451. {
  452. spu_pdata(spu)->cache.tclass_id = tclass_id;
  453. lv1_set_spe_privilege_state_area_1_register(
  454. spu_pdata(spu)->spe_id,
  455. offsetof(struct spu_priv1, mfc_tclass_id_RW),
  456. spu_pdata(spu)->cache.tclass_id);
  457. }
  458. static u64 mfc_tclass_id_get(struct spu *spu)
  459. {
  460. return spu_pdata(spu)->cache.tclass_id;
  461. }
  462. static void tlb_invalidate(struct spu *spu)
  463. {
  464. /* Nothing to do. */
  465. }
  466. static void resource_allocation_groupID_set(struct spu *spu, u64 id)
  467. {
  468. /* No support. */
  469. }
  470. static u64 resource_allocation_groupID_get(struct spu *spu)
  471. {
  472. return 0; /* No support. */
  473. }
  474. static void resource_allocation_enable_set(struct spu *spu, u64 enable)
  475. {
  476. /* No support. */
  477. }
  478. static u64 resource_allocation_enable_get(struct spu *spu)
  479. {
  480. return 0; /* No support. */
  481. }
  482. const struct spu_priv1_ops spu_priv1_ps3_ops = {
  483. .int_mask_and = int_mask_and,
  484. .int_mask_or = int_mask_or,
  485. .int_mask_set = int_mask_set,
  486. .int_mask_get = int_mask_get,
  487. .int_stat_clear = int_stat_clear,
  488. .int_stat_get = int_stat_get,
  489. .cpu_affinity_set = cpu_affinity_set,
  490. .mfc_dar_get = mfc_dar_get,
  491. .mfc_dsisr_set = mfc_dsisr_set,
  492. .mfc_dsisr_get = mfc_dsisr_get,
  493. .mfc_sdr_setup = mfc_sdr_setup,
  494. .mfc_sr1_set = mfc_sr1_set,
  495. .mfc_sr1_get = mfc_sr1_get,
  496. .mfc_tclass_id_set = mfc_tclass_id_set,
  497. .mfc_tclass_id_get = mfc_tclass_id_get,
  498. .tlb_invalidate = tlb_invalidate,
  499. .resource_allocation_groupID_set = resource_allocation_groupID_set,
  500. .resource_allocation_groupID_get = resource_allocation_groupID_get,
  501. .resource_allocation_enable_set = resource_allocation_enable_set,
  502. .resource_allocation_enable_get = resource_allocation_enable_get,
  503. };
  504. void ps3_spu_set_platform(void)
  505. {
  506. spu_priv1_ops = &spu_priv1_ps3_ops;
  507. spu_management_ops = &spu_management_ps3_ops;
  508. }