prom.c 26 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905906907908909910911912913914915916917918919920921922923924925926927928929930931932933934935936937938939940941942943944945946947948949950951952953954955956957958959960961962963964965966967968969970971972973974
  1. /*
  2. * Procedures for creating, accessing and interpreting the device tree.
  3. *
  4. * Paul Mackerras August 1996.
  5. * Copyright (C) 1996-2005 Paul Mackerras.
  6. *
  7. * Adapted for 64bit PowerPC by Dave Engebretsen and Peter Bergner.
  8. * {engebret|bergner}@us.ibm.com
  9. *
  10. * This program is free software; you can redistribute it and/or
  11. * modify it under the terms of the GNU General Public License
  12. * as published by the Free Software Foundation; either version
  13. * 2 of the License, or (at your option) any later version.
  14. */
  15. #undef DEBUG
  16. #include <stdarg.h>
  17. #include <linux/kernel.h>
  18. #include <linux/string.h>
  19. #include <linux/init.h>
  20. #include <linux/threads.h>
  21. #include <linux/spinlock.h>
  22. #include <linux/types.h>
  23. #include <linux/pci.h>
  24. #include <linux/stringify.h>
  25. #include <linux/delay.h>
  26. #include <linux/initrd.h>
  27. #include <linux/bitops.h>
  28. #include <linux/export.h>
  29. #include <linux/kexec.h>
  30. #include <linux/debugfs.h>
  31. #include <linux/irq.h>
  32. #include <linux/memblock.h>
  33. #include <asm/prom.h>
  34. #include <asm/rtas.h>
  35. #include <asm/page.h>
  36. #include <asm/processor.h>
  37. #include <asm/irq.h>
  38. #include <asm/io.h>
  39. #include <asm/kdump.h>
  40. #include <asm/smp.h>
  41. #include <asm/system.h>
  42. #include <asm/mmu.h>
  43. #include <asm/paca.h>
  44. #include <asm/pgtable.h>
  45. #include <asm/pci.h>
  46. #include <asm/iommu.h>
  47. #include <asm/btext.h>
  48. #include <asm/sections.h>
  49. #include <asm/machdep.h>
  50. #include <asm/pSeries_reconfig.h>
  51. #include <asm/pci-bridge.h>
  52. #include <asm/phyp_dump.h>
  53. #include <asm/kexec.h>
  54. #include <asm/opal.h>
  55. #include <mm/mmu_decl.h>
  56. #ifdef DEBUG
  57. #define DBG(fmt...) printk(KERN_ERR fmt)
  58. #else
  59. #define DBG(fmt...)
  60. #endif
  61. #ifdef CONFIG_PPC64
  62. int __initdata iommu_is_off;
  63. int __initdata iommu_force_on;
  64. unsigned long tce_alloc_start, tce_alloc_end;
  65. u64 ppc64_rma_size;
  66. #endif
  67. static phys_addr_t first_memblock_size;
  68. static int __initdata boot_cpu_count;
  69. static int __init early_parse_mem(char *p)
  70. {
  71. if (!p)
  72. return 1;
  73. memory_limit = PAGE_ALIGN(memparse(p, &p));
  74. DBG("memory limit = 0x%llx\n", (unsigned long long)memory_limit);
  75. return 0;
  76. }
  77. early_param("mem", early_parse_mem);
  78. /*
  79. * overlaps_initrd - check for overlap with page aligned extension of
  80. * initrd.
  81. */
  82. static inline int overlaps_initrd(unsigned long start, unsigned long size)
  83. {
  84. #ifdef CONFIG_BLK_DEV_INITRD
  85. if (!initrd_start)
  86. return 0;
  87. return (start + size) > _ALIGN_DOWN(initrd_start, PAGE_SIZE) &&
  88. start <= _ALIGN_UP(initrd_end, PAGE_SIZE);
  89. #else
  90. return 0;
  91. #endif
  92. }
  93. /**
  94. * move_device_tree - move tree to an unused area, if needed.
  95. *
  96. * The device tree may be allocated beyond our memory limit, or inside the
  97. * crash kernel region for kdump, or within the page aligned range of initrd.
  98. * If so, move it out of the way.
  99. */
  100. static void __init move_device_tree(void)
  101. {
  102. unsigned long start, size;
  103. void *p;
  104. DBG("-> move_device_tree\n");
  105. start = __pa(initial_boot_params);
  106. size = be32_to_cpu(initial_boot_params->totalsize);
  107. if ((memory_limit && (start + size) > PHYSICAL_START + memory_limit) ||
  108. overlaps_crashkernel(start, size) ||
  109. overlaps_initrd(start, size)) {
  110. p = __va(memblock_alloc(size, PAGE_SIZE));
  111. memcpy(p, initial_boot_params, size);
  112. initial_boot_params = (struct boot_param_header *)p;
  113. DBG("Moved device tree to 0x%p\n", p);
  114. }
  115. DBG("<- move_device_tree\n");
  116. }
  117. /*
  118. * ibm,pa-features is a per-cpu property that contains a string of
  119. * attribute descriptors, each of which has a 2 byte header plus up
  120. * to 254 bytes worth of processor attribute bits. First header
  121. * byte specifies the number of bytes following the header.
  122. * Second header byte is an "attribute-specifier" type, of which
  123. * zero is the only currently-defined value.
  124. * Implementation: Pass in the byte and bit offset for the feature
  125. * that we are interested in. The function will return -1 if the
  126. * pa-features property is missing, or a 1/0 to indicate if the feature
  127. * is supported/not supported. Note that the bit numbers are
  128. * big-endian to match the definition in PAPR.
  129. */
  130. static struct ibm_pa_feature {
  131. unsigned long cpu_features; /* CPU_FTR_xxx bit */
  132. unsigned long mmu_features; /* MMU_FTR_xxx bit */
  133. unsigned int cpu_user_ftrs; /* PPC_FEATURE_xxx bit */
  134. unsigned char pabyte; /* byte number in ibm,pa-features */
  135. unsigned char pabit; /* bit number (big-endian) */
  136. unsigned char invert; /* if 1, pa bit set => clear feature */
  137. } ibm_pa_features[] __initdata = {
  138. {0, 0, PPC_FEATURE_HAS_MMU, 0, 0, 0},
  139. {0, 0, PPC_FEATURE_HAS_FPU, 0, 1, 0},
  140. {0, MMU_FTR_SLB, 0, 0, 2, 0},
  141. {CPU_FTR_CTRL, 0, 0, 0, 3, 0},
  142. {CPU_FTR_NOEXECUTE, 0, 0, 0, 6, 0},
  143. {CPU_FTR_NODSISRALIGN, 0, 0, 1, 1, 1},
  144. {0, MMU_FTR_CI_LARGE_PAGE, 0, 1, 2, 0},
  145. {CPU_FTR_REAL_LE, PPC_FEATURE_TRUE_LE, 5, 0, 0},
  146. };
  147. static void __init scan_features(unsigned long node, unsigned char *ftrs,
  148. unsigned long tablelen,
  149. struct ibm_pa_feature *fp,
  150. unsigned long ft_size)
  151. {
  152. unsigned long i, len, bit;
  153. /* find descriptor with type == 0 */
  154. for (;;) {
  155. if (tablelen < 3)
  156. return;
  157. len = 2 + ftrs[0];
  158. if (tablelen < len)
  159. return; /* descriptor 0 not found */
  160. if (ftrs[1] == 0)
  161. break;
  162. tablelen -= len;
  163. ftrs += len;
  164. }
  165. /* loop over bits we know about */
  166. for (i = 0; i < ft_size; ++i, ++fp) {
  167. if (fp->pabyte >= ftrs[0])
  168. continue;
  169. bit = (ftrs[2 + fp->pabyte] >> (7 - fp->pabit)) & 1;
  170. if (bit ^ fp->invert) {
  171. cur_cpu_spec->cpu_features |= fp->cpu_features;
  172. cur_cpu_spec->cpu_user_features |= fp->cpu_user_ftrs;
  173. cur_cpu_spec->mmu_features |= fp->mmu_features;
  174. } else {
  175. cur_cpu_spec->cpu_features &= ~fp->cpu_features;
  176. cur_cpu_spec->cpu_user_features &= ~fp->cpu_user_ftrs;
  177. cur_cpu_spec->mmu_features &= ~fp->mmu_features;
  178. }
  179. }
  180. }
  181. static void __init check_cpu_pa_features(unsigned long node)
  182. {
  183. unsigned char *pa_ftrs;
  184. unsigned long tablelen;
  185. pa_ftrs = of_get_flat_dt_prop(node, "ibm,pa-features", &tablelen);
  186. if (pa_ftrs == NULL)
  187. return;
  188. scan_features(node, pa_ftrs, tablelen,
  189. ibm_pa_features, ARRAY_SIZE(ibm_pa_features));
  190. }
  191. #ifdef CONFIG_PPC_STD_MMU_64
  192. static void __init check_cpu_slb_size(unsigned long node)
  193. {
  194. u32 *slb_size_ptr;
  195. slb_size_ptr = of_get_flat_dt_prop(node, "slb-size", NULL);
  196. if (slb_size_ptr != NULL) {
  197. mmu_slb_size = *slb_size_ptr;
  198. return;
  199. }
  200. slb_size_ptr = of_get_flat_dt_prop(node, "ibm,slb-size", NULL);
  201. if (slb_size_ptr != NULL) {
  202. mmu_slb_size = *slb_size_ptr;
  203. }
  204. }
  205. #else
  206. #define check_cpu_slb_size(node) do { } while(0)
  207. #endif
  208. static struct feature_property {
  209. const char *name;
  210. u32 min_value;
  211. unsigned long cpu_feature;
  212. unsigned long cpu_user_ftr;
  213. } feature_properties[] __initdata = {
  214. #ifdef CONFIG_ALTIVEC
  215. {"altivec", 0, CPU_FTR_ALTIVEC, PPC_FEATURE_HAS_ALTIVEC},
  216. {"ibm,vmx", 1, CPU_FTR_ALTIVEC, PPC_FEATURE_HAS_ALTIVEC},
  217. #endif /* CONFIG_ALTIVEC */
  218. #ifdef CONFIG_VSX
  219. /* Yes, this _really_ is ibm,vmx == 2 to enable VSX */
  220. {"ibm,vmx", 2, CPU_FTR_VSX, PPC_FEATURE_HAS_VSX},
  221. #endif /* CONFIG_VSX */
  222. #ifdef CONFIG_PPC64
  223. {"ibm,dfp", 1, 0, PPC_FEATURE_HAS_DFP},
  224. {"ibm,purr", 1, CPU_FTR_PURR, 0},
  225. {"ibm,spurr", 1, CPU_FTR_SPURR, 0},
  226. #endif /* CONFIG_PPC64 */
  227. };
  228. #if defined(CONFIG_44x) && defined(CONFIG_PPC_FPU)
  229. static inline void identical_pvr_fixup(unsigned long node)
  230. {
  231. unsigned int pvr;
  232. char *model = of_get_flat_dt_prop(node, "model", NULL);
  233. /*
  234. * Since 440GR(x)/440EP(x) processors have the same pvr,
  235. * we check the node path and set bit 28 in the cur_cpu_spec
  236. * pvr for EP(x) processor version. This bit is always 0 in
  237. * the "real" pvr. Then we call identify_cpu again with
  238. * the new logical pvr to enable FPU support.
  239. */
  240. if (model && strstr(model, "440EP")) {
  241. pvr = cur_cpu_spec->pvr_value | 0x8;
  242. identify_cpu(0, pvr);
  243. DBG("Using logical pvr %x for %s\n", pvr, model);
  244. }
  245. }
  246. #else
  247. #define identical_pvr_fixup(node) do { } while(0)
  248. #endif
  249. static void __init check_cpu_feature_properties(unsigned long node)
  250. {
  251. unsigned long i;
  252. struct feature_property *fp = feature_properties;
  253. const u32 *prop;
  254. for (i = 0; i < ARRAY_SIZE(feature_properties); ++i, ++fp) {
  255. prop = of_get_flat_dt_prop(node, fp->name, NULL);
  256. if (prop && *prop >= fp->min_value) {
  257. cur_cpu_spec->cpu_features |= fp->cpu_feature;
  258. cur_cpu_spec->cpu_user_features |= fp->cpu_user_ftr;
  259. }
  260. }
  261. }
  262. static int __init early_init_dt_scan_cpus(unsigned long node,
  263. const char *uname, int depth,
  264. void *data)
  265. {
  266. char *type = of_get_flat_dt_prop(node, "device_type", NULL);
  267. const u32 *prop;
  268. const u32 *intserv;
  269. int i, nthreads;
  270. unsigned long len;
  271. int found = -1;
  272. int found_thread = 0;
  273. /* We are scanning "cpu" nodes only */
  274. if (type == NULL || strcmp(type, "cpu") != 0)
  275. return 0;
  276. /* Get physical cpuid */
  277. intserv = of_get_flat_dt_prop(node, "ibm,ppc-interrupt-server#s", &len);
  278. if (intserv) {
  279. nthreads = len / sizeof(int);
  280. } else {
  281. intserv = of_get_flat_dt_prop(node, "reg", NULL);
  282. nthreads = 1;
  283. }
  284. /*
  285. * Now see if any of these threads match our boot cpu.
  286. * NOTE: This must match the parsing done in smp_setup_cpu_maps.
  287. */
  288. for (i = 0; i < nthreads; i++) {
  289. /*
  290. * version 2 of the kexec param format adds the phys cpuid of
  291. * booted proc.
  292. */
  293. if (initial_boot_params->version >= 2) {
  294. if (intserv[i] == initial_boot_params->boot_cpuid_phys) {
  295. found = boot_cpu_count;
  296. found_thread = i;
  297. }
  298. } else {
  299. /*
  300. * Check if it's the boot-cpu, set it's hw index now,
  301. * unfortunately this format did not support booting
  302. * off secondary threads.
  303. */
  304. if (of_get_flat_dt_prop(node,
  305. "linux,boot-cpu", NULL) != NULL)
  306. found = boot_cpu_count;
  307. }
  308. #ifdef CONFIG_SMP
  309. /* logical cpu id is always 0 on UP kernels */
  310. boot_cpu_count++;
  311. #endif
  312. }
  313. if (found >= 0) {
  314. DBG("boot cpu: logical %d physical %d\n", found,
  315. intserv[found_thread]);
  316. boot_cpuid = found;
  317. set_hard_smp_processor_id(found, intserv[found_thread]);
  318. /*
  319. * PAPR defines "logical" PVR values for cpus that
  320. * meet various levels of the architecture:
  321. * 0x0f000001 Architecture version 2.04
  322. * 0x0f000002 Architecture version 2.05
  323. * If the cpu-version property in the cpu node contains
  324. * such a value, we call identify_cpu again with the
  325. * logical PVR value in order to use the cpu feature
  326. * bits appropriate for the architecture level.
  327. *
  328. * A POWER6 partition in "POWER6 architected" mode
  329. * uses the 0x0f000002 PVR value; in POWER5+ mode
  330. * it uses 0x0f000001.
  331. */
  332. prop = of_get_flat_dt_prop(node, "cpu-version", NULL);
  333. if (prop && (*prop & 0xff000000) == 0x0f000000)
  334. identify_cpu(0, *prop);
  335. identical_pvr_fixup(node);
  336. }
  337. check_cpu_feature_properties(node);
  338. check_cpu_pa_features(node);
  339. check_cpu_slb_size(node);
  340. #ifdef CONFIG_PPC_PSERIES
  341. if (nthreads > 1)
  342. cur_cpu_spec->cpu_features |= CPU_FTR_SMT;
  343. else
  344. cur_cpu_spec->cpu_features &= ~CPU_FTR_SMT;
  345. #endif
  346. return 0;
  347. }
  348. int __init early_init_dt_scan_chosen_ppc(unsigned long node, const char *uname,
  349. int depth, void *data)
  350. {
  351. unsigned long *lprop;
  352. /* Use common scan routine to determine if this is the chosen node */
  353. if (early_init_dt_scan_chosen(node, uname, depth, data) == 0)
  354. return 0;
  355. #ifdef CONFIG_PPC64
  356. /* check if iommu is forced on or off */
  357. if (of_get_flat_dt_prop(node, "linux,iommu-off", NULL) != NULL)
  358. iommu_is_off = 1;
  359. if (of_get_flat_dt_prop(node, "linux,iommu-force-on", NULL) != NULL)
  360. iommu_force_on = 1;
  361. #endif
  362. /* mem=x on the command line is the preferred mechanism */
  363. lprop = of_get_flat_dt_prop(node, "linux,memory-limit", NULL);
  364. if (lprop)
  365. memory_limit = *lprop;
  366. #ifdef CONFIG_PPC64
  367. lprop = of_get_flat_dt_prop(node, "linux,tce-alloc-start", NULL);
  368. if (lprop)
  369. tce_alloc_start = *lprop;
  370. lprop = of_get_flat_dt_prop(node, "linux,tce-alloc-end", NULL);
  371. if (lprop)
  372. tce_alloc_end = *lprop;
  373. #endif
  374. #ifdef CONFIG_KEXEC
  375. lprop = of_get_flat_dt_prop(node, "linux,crashkernel-base", NULL);
  376. if (lprop)
  377. crashk_res.start = *lprop;
  378. lprop = of_get_flat_dt_prop(node, "linux,crashkernel-size", NULL);
  379. if (lprop)
  380. crashk_res.end = crashk_res.start + *lprop - 1;
  381. #endif
  382. /* break now */
  383. return 1;
  384. }
  385. #ifdef CONFIG_PPC_PSERIES
  386. /*
  387. * Interpret the ibm,dynamic-memory property in the
  388. * /ibm,dynamic-reconfiguration-memory node.
  389. * This contains a list of memory blocks along with NUMA affinity
  390. * information.
  391. */
  392. static int __init early_init_dt_scan_drconf_memory(unsigned long node)
  393. {
  394. __be32 *dm, *ls, *usm;
  395. unsigned long l, n, flags;
  396. u64 base, size, memblock_size;
  397. unsigned int is_kexec_kdump = 0, rngs;
  398. ls = of_get_flat_dt_prop(node, "ibm,lmb-size", &l);
  399. if (ls == NULL || l < dt_root_size_cells * sizeof(__be32))
  400. return 0;
  401. memblock_size = dt_mem_next_cell(dt_root_size_cells, &ls);
  402. dm = of_get_flat_dt_prop(node, "ibm,dynamic-memory", &l);
  403. if (dm == NULL || l < sizeof(__be32))
  404. return 0;
  405. n = *dm++; /* number of entries */
  406. if (l < (n * (dt_root_addr_cells + 4) + 1) * sizeof(__be32))
  407. return 0;
  408. /* check if this is a kexec/kdump kernel. */
  409. usm = of_get_flat_dt_prop(node, "linux,drconf-usable-memory",
  410. &l);
  411. if (usm != NULL)
  412. is_kexec_kdump = 1;
  413. for (; n != 0; --n) {
  414. base = dt_mem_next_cell(dt_root_addr_cells, &dm);
  415. flags = dm[3];
  416. /* skip DRC index, pad, assoc. list index, flags */
  417. dm += 4;
  418. /* skip this block if the reserved bit is set in flags (0x80)
  419. or if the block is not assigned to this partition (0x8) */
  420. if ((flags & 0x80) || !(flags & 0x8))
  421. continue;
  422. size = memblock_size;
  423. rngs = 1;
  424. if (is_kexec_kdump) {
  425. /*
  426. * For each memblock in ibm,dynamic-memory, a corresponding
  427. * entry in linux,drconf-usable-memory property contains
  428. * a counter 'p' followed by 'p' (base, size) duple.
  429. * Now read the counter from
  430. * linux,drconf-usable-memory property
  431. */
  432. rngs = dt_mem_next_cell(dt_root_size_cells, &usm);
  433. if (!rngs) /* there are no (base, size) duple */
  434. continue;
  435. }
  436. do {
  437. if (is_kexec_kdump) {
  438. base = dt_mem_next_cell(dt_root_addr_cells,
  439. &usm);
  440. size = dt_mem_next_cell(dt_root_size_cells,
  441. &usm);
  442. }
  443. if (iommu_is_off) {
  444. if (base >= 0x80000000ul)
  445. continue;
  446. if ((base + size) > 0x80000000ul)
  447. size = 0x80000000ul - base;
  448. }
  449. memblock_add(base, size);
  450. } while (--rngs);
  451. }
  452. memblock_dump_all();
  453. return 0;
  454. }
  455. #else
  456. #define early_init_dt_scan_drconf_memory(node) 0
  457. #endif /* CONFIG_PPC_PSERIES */
  458. static int __init early_init_dt_scan_memory_ppc(unsigned long node,
  459. const char *uname,
  460. int depth, void *data)
  461. {
  462. if (depth == 1 &&
  463. strcmp(uname, "ibm,dynamic-reconfiguration-memory") == 0)
  464. return early_init_dt_scan_drconf_memory(node);
  465. return early_init_dt_scan_memory(node, uname, depth, data);
  466. }
  467. void __init early_init_dt_add_memory_arch(u64 base, u64 size)
  468. {
  469. #ifdef CONFIG_PPC64
  470. if (iommu_is_off) {
  471. if (base >= 0x80000000ul)
  472. return;
  473. if ((base + size) > 0x80000000ul)
  474. size = 0x80000000ul - base;
  475. }
  476. #endif
  477. /* Keep track of the beginning of memory -and- the size of
  478. * the very first block in the device-tree as it represents
  479. * the RMA on ppc64 server
  480. */
  481. if (base < memstart_addr) {
  482. memstart_addr = base;
  483. first_memblock_size = size;
  484. }
  485. /* Add the chunk to the MEMBLOCK list */
  486. memblock_add(base, size);
  487. }
  488. void * __init early_init_dt_alloc_memory_arch(u64 size, u64 align)
  489. {
  490. return __va(memblock_alloc(size, align));
  491. }
  492. #ifdef CONFIG_BLK_DEV_INITRD
  493. void __init early_init_dt_setup_initrd_arch(unsigned long start,
  494. unsigned long end)
  495. {
  496. initrd_start = (unsigned long)__va(start);
  497. initrd_end = (unsigned long)__va(end);
  498. initrd_below_start_ok = 1;
  499. }
  500. #endif
  501. static void __init early_reserve_mem(void)
  502. {
  503. u64 base, size;
  504. u64 *reserve_map;
  505. unsigned long self_base;
  506. unsigned long self_size;
  507. reserve_map = (u64 *)(((unsigned long)initial_boot_params) +
  508. initial_boot_params->off_mem_rsvmap);
  509. /* before we do anything, lets reserve the dt blob */
  510. self_base = __pa((unsigned long)initial_boot_params);
  511. self_size = initial_boot_params->totalsize;
  512. memblock_reserve(self_base, self_size);
  513. #ifdef CONFIG_BLK_DEV_INITRD
  514. /* then reserve the initrd, if any */
  515. if (initrd_start && (initrd_end > initrd_start))
  516. memblock_reserve(_ALIGN_DOWN(__pa(initrd_start), PAGE_SIZE),
  517. _ALIGN_UP(initrd_end, PAGE_SIZE) -
  518. _ALIGN_DOWN(initrd_start, PAGE_SIZE));
  519. #endif /* CONFIG_BLK_DEV_INITRD */
  520. #ifdef CONFIG_PPC32
  521. /*
  522. * Handle the case where we might be booting from an old kexec
  523. * image that setup the mem_rsvmap as pairs of 32-bit values
  524. */
  525. if (*reserve_map > 0xffffffffull) {
  526. u32 base_32, size_32;
  527. u32 *reserve_map_32 = (u32 *)reserve_map;
  528. while (1) {
  529. base_32 = *(reserve_map_32++);
  530. size_32 = *(reserve_map_32++);
  531. if (size_32 == 0)
  532. break;
  533. /* skip if the reservation is for the blob */
  534. if (base_32 == self_base && size_32 == self_size)
  535. continue;
  536. DBG("reserving: %x -> %x\n", base_32, size_32);
  537. memblock_reserve(base_32, size_32);
  538. }
  539. return;
  540. }
  541. #endif
  542. while (1) {
  543. base = *(reserve_map++);
  544. size = *(reserve_map++);
  545. if (size == 0)
  546. break;
  547. DBG("reserving: %llx -> %llx\n", base, size);
  548. memblock_reserve(base, size);
  549. }
  550. }
  551. #ifdef CONFIG_PHYP_DUMP
  552. /**
  553. * phyp_dump_calculate_reserve_size() - reserve variable boot area 5% or arg
  554. *
  555. * Function to find the largest size we need to reserve
  556. * during early boot process.
  557. *
  558. * It either looks for boot param and returns that OR
  559. * returns larger of 256 or 5% rounded down to multiples of 256MB.
  560. *
  561. */
  562. static inline unsigned long phyp_dump_calculate_reserve_size(void)
  563. {
  564. unsigned long tmp;
  565. if (phyp_dump_info->reserve_bootvar)
  566. return phyp_dump_info->reserve_bootvar;
  567. /* divide by 20 to get 5% of value */
  568. tmp = memblock_end_of_DRAM();
  569. do_div(tmp, 20);
  570. /* round it down in multiples of 256 */
  571. tmp = tmp & ~0x0FFFFFFFUL;
  572. return (tmp > PHYP_DUMP_RMR_END ? tmp : PHYP_DUMP_RMR_END);
  573. }
  574. /**
  575. * phyp_dump_reserve_mem() - reserve all not-yet-dumped mmemory
  576. *
  577. * This routine may reserve memory regions in the kernel only
  578. * if the system is supported and a dump was taken in last
  579. * boot instance or if the hardware is supported and the
  580. * scratch area needs to be setup. In other instances it returns
  581. * without reserving anything. The memory in case of dump being
  582. * active is freed when the dump is collected (by userland tools).
  583. */
  584. static void __init phyp_dump_reserve_mem(void)
  585. {
  586. unsigned long base, size;
  587. unsigned long variable_reserve_size;
  588. if (!phyp_dump_info->phyp_dump_configured) {
  589. printk(KERN_ERR "Phyp-dump not supported on this hardware\n");
  590. return;
  591. }
  592. if (!phyp_dump_info->phyp_dump_at_boot) {
  593. printk(KERN_INFO "Phyp-dump disabled at boot time\n");
  594. return;
  595. }
  596. variable_reserve_size = phyp_dump_calculate_reserve_size();
  597. if (phyp_dump_info->phyp_dump_is_active) {
  598. /* Reserve *everything* above RMR.Area freed by userland tools*/
  599. base = variable_reserve_size;
  600. size = memblock_end_of_DRAM() - base;
  601. /* XXX crashed_ram_end is wrong, since it may be beyond
  602. * the memory_limit, it will need to be adjusted. */
  603. memblock_reserve(base, size);
  604. phyp_dump_info->init_reserve_start = base;
  605. phyp_dump_info->init_reserve_size = size;
  606. } else {
  607. size = phyp_dump_info->cpu_state_size +
  608. phyp_dump_info->hpte_region_size +
  609. variable_reserve_size;
  610. base = memblock_end_of_DRAM() - size;
  611. memblock_reserve(base, size);
  612. phyp_dump_info->init_reserve_start = base;
  613. phyp_dump_info->init_reserve_size = size;
  614. }
  615. }
  616. #else
  617. static inline void __init phyp_dump_reserve_mem(void) {}
  618. #endif /* CONFIG_PHYP_DUMP && CONFIG_PPC_RTAS */
  619. void __init early_init_devtree(void *params)
  620. {
  621. phys_addr_t limit;
  622. DBG(" -> early_init_devtree(%p)\n", params);
  623. /* Setup flat device-tree pointer */
  624. initial_boot_params = params;
  625. #ifdef CONFIG_PPC_RTAS
  626. /* Some machines might need RTAS info for debugging, grab it now. */
  627. of_scan_flat_dt(early_init_dt_scan_rtas, NULL);
  628. #endif
  629. #ifdef CONFIG_PPC_POWERNV
  630. /* Some machines might need OPAL info for debugging, grab it now. */
  631. of_scan_flat_dt(early_init_dt_scan_opal, NULL);
  632. #endif
  633. #ifdef CONFIG_PHYP_DUMP
  634. /* scan tree to see if dump occurred during last boot */
  635. of_scan_flat_dt(early_init_dt_scan_phyp_dump, NULL);
  636. #endif
  637. /* Pre-initialize the cmd_line with the content of boot_commmand_line,
  638. * which will be empty except when the content of the variable has
  639. * been overriden by a bootloading mechanism. This happens typically
  640. * with HAL takeover
  641. */
  642. strlcpy(cmd_line, boot_command_line, COMMAND_LINE_SIZE);
  643. /* Retrieve various informations from the /chosen node of the
  644. * device-tree, including the platform type, initrd location and
  645. * size, TCE reserve, and more ...
  646. */
  647. of_scan_flat_dt(early_init_dt_scan_chosen_ppc, cmd_line);
  648. /* Scan memory nodes and rebuild MEMBLOCKs */
  649. memblock_init();
  650. of_scan_flat_dt(early_init_dt_scan_root, NULL);
  651. of_scan_flat_dt(early_init_dt_scan_memory_ppc, NULL);
  652. /* Save command line for /proc/cmdline and then parse parameters */
  653. strlcpy(boot_command_line, cmd_line, COMMAND_LINE_SIZE);
  654. parse_early_param();
  655. /* make sure we've parsed cmdline for mem= before this */
  656. if (memory_limit)
  657. first_memblock_size = min(first_memblock_size, memory_limit);
  658. setup_initial_memory_limit(memstart_addr, first_memblock_size);
  659. /* Reserve MEMBLOCK regions used by kernel, initrd, dt, etc... */
  660. memblock_reserve(PHYSICAL_START, __pa(klimit) - PHYSICAL_START);
  661. /* If relocatable, reserve first 32k for interrupt vectors etc. */
  662. if (PHYSICAL_START > MEMORY_START)
  663. memblock_reserve(MEMORY_START, 0x8000);
  664. reserve_kdump_trampoline();
  665. reserve_crashkernel();
  666. early_reserve_mem();
  667. phyp_dump_reserve_mem();
  668. limit = memory_limit;
  669. if (! limit) {
  670. phys_addr_t memsize;
  671. /* Ensure that total memory size is page-aligned, because
  672. * otherwise mark_bootmem() gets upset. */
  673. memblock_analyze();
  674. memsize = memblock_phys_mem_size();
  675. if ((memsize & PAGE_MASK) != memsize)
  676. limit = memsize & PAGE_MASK;
  677. }
  678. memblock_enforce_memory_limit(limit);
  679. memblock_analyze();
  680. memblock_dump_all();
  681. DBG("Phys. mem: %llx\n", memblock_phys_mem_size());
  682. /* We may need to relocate the flat tree, do it now.
  683. * FIXME .. and the initrd too? */
  684. move_device_tree();
  685. allocate_pacas();
  686. DBG("Scanning CPUs ...\n");
  687. /* Retrieve CPU related informations from the flat tree
  688. * (altivec support, boot CPU ID, ...)
  689. */
  690. of_scan_flat_dt(early_init_dt_scan_cpus, NULL);
  691. #if defined(CONFIG_SMP) && defined(CONFIG_PPC64)
  692. /* We'll later wait for secondaries to check in; there are
  693. * NCPUS-1 non-boot CPUs :-)
  694. */
  695. spinning_secondaries = boot_cpu_count - 1;
  696. #endif
  697. DBG(" <- early_init_devtree()\n");
  698. }
  699. /*******
  700. *
  701. * New implementation of the OF "find" APIs, return a refcounted
  702. * object, call of_node_put() when done. The device tree and list
  703. * are protected by a rw_lock.
  704. *
  705. * Note that property management will need some locking as well,
  706. * this isn't dealt with yet.
  707. *
  708. *******/
  709. /**
  710. * of_find_next_cache_node - Find a node's subsidiary cache
  711. * @np: node of type "cpu" or "cache"
  712. *
  713. * Returns a node pointer with refcount incremented, use
  714. * of_node_put() on it when done. Caller should hold a reference
  715. * to np.
  716. */
  717. struct device_node *of_find_next_cache_node(struct device_node *np)
  718. {
  719. struct device_node *child;
  720. const phandle *handle;
  721. handle = of_get_property(np, "l2-cache", NULL);
  722. if (!handle)
  723. handle = of_get_property(np, "next-level-cache", NULL);
  724. if (handle)
  725. return of_find_node_by_phandle(*handle);
  726. /* OF on pmac has nodes instead of properties named "l2-cache"
  727. * beneath CPU nodes.
  728. */
  729. if (!strcmp(np->type, "cpu"))
  730. for_each_child_of_node(np, child)
  731. if (!strcmp(child->type, "cache"))
  732. return child;
  733. return NULL;
  734. }
  735. #ifdef CONFIG_PPC_PSERIES
  736. /*
  737. * Fix up the uninitialized fields in a new device node:
  738. * name, type and pci-specific fields
  739. */
  740. static int of_finish_dynamic_node(struct device_node *node)
  741. {
  742. struct device_node *parent = of_get_parent(node);
  743. int err = 0;
  744. const phandle *ibm_phandle;
  745. node->name = of_get_property(node, "name", NULL);
  746. node->type = of_get_property(node, "device_type", NULL);
  747. if (!node->name)
  748. node->name = "<NULL>";
  749. if (!node->type)
  750. node->type = "<NULL>";
  751. if (!parent) {
  752. err = -ENODEV;
  753. goto out;
  754. }
  755. /* We don't support that function on PowerMac, at least
  756. * not yet
  757. */
  758. if (machine_is(powermac))
  759. return -ENODEV;
  760. /* fix up new node's phandle field */
  761. if ((ibm_phandle = of_get_property(node, "ibm,phandle", NULL)))
  762. node->phandle = *ibm_phandle;
  763. out:
  764. of_node_put(parent);
  765. return err;
  766. }
  767. static int prom_reconfig_notifier(struct notifier_block *nb,
  768. unsigned long action, void *node)
  769. {
  770. int err;
  771. switch (action) {
  772. case PSERIES_RECONFIG_ADD:
  773. err = of_finish_dynamic_node(node);
  774. if (err < 0)
  775. printk(KERN_ERR "finish_node returned %d\n", err);
  776. break;
  777. default:
  778. err = 0;
  779. break;
  780. }
  781. return notifier_from_errno(err);
  782. }
  783. static struct notifier_block prom_reconfig_nb = {
  784. .notifier_call = prom_reconfig_notifier,
  785. .priority = 10, /* This one needs to run first */
  786. };
  787. static int __init prom_reconfig_setup(void)
  788. {
  789. return pSeries_reconfig_notifier_register(&prom_reconfig_nb);
  790. }
  791. __initcall(prom_reconfig_setup);
  792. #endif
  793. /* Find the device node for a given logical cpu number, also returns the cpu
  794. * local thread number (index in ibm,interrupt-server#s) if relevant and
  795. * asked for (non NULL)
  796. */
  797. struct device_node *of_get_cpu_node(int cpu, unsigned int *thread)
  798. {
  799. int hardid;
  800. struct device_node *np;
  801. hardid = get_hard_smp_processor_id(cpu);
  802. for_each_node_by_type(np, "cpu") {
  803. const u32 *intserv;
  804. unsigned int plen, t;
  805. /* Check for ibm,ppc-interrupt-server#s. If it doesn't exist
  806. * fallback to "reg" property and assume no threads
  807. */
  808. intserv = of_get_property(np, "ibm,ppc-interrupt-server#s",
  809. &plen);
  810. if (intserv == NULL) {
  811. const u32 *reg = of_get_property(np, "reg", NULL);
  812. if (reg == NULL)
  813. continue;
  814. if (*reg == hardid) {
  815. if (thread)
  816. *thread = 0;
  817. return np;
  818. }
  819. } else {
  820. plen /= sizeof(u32);
  821. for (t = 0; t < plen; t++) {
  822. if (hardid == intserv[t]) {
  823. if (thread)
  824. *thread = t;
  825. return np;
  826. }
  827. }
  828. }
  829. }
  830. return NULL;
  831. }
  832. EXPORT_SYMBOL(of_get_cpu_node);
  833. #if defined(CONFIG_DEBUG_FS) && defined(DEBUG)
  834. static struct debugfs_blob_wrapper flat_dt_blob;
  835. static int __init export_flat_device_tree(void)
  836. {
  837. struct dentry *d;
  838. flat_dt_blob.data = initial_boot_params;
  839. flat_dt_blob.size = initial_boot_params->totalsize;
  840. d = debugfs_create_blob("flat-device-tree", S_IFREG | S_IRUSR,
  841. powerpc_debugfs_root, &flat_dt_blob);
  842. if (!d)
  843. return 1;
  844. return 0;
  845. }
  846. __initcall(export_flat_device_tree);
  847. #endif