prom.c 28 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
3704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905906907908909910911912913914915916917918919920921922923924925926927928929930931932933934935936937938939940941942943944945946947948949950951952953954955956957958959960961962963964965966967968969970971972973974975976977978979980981982983984985986987988989990991992993994995996997998999100010011002100310041005100610071008100910101011101210131014101510161017101810191020102110221023102410251026102710281029103010311032103310341035103610371038103910401041104210431044104510461047104810491050105110521053105410551056105710581059106010611062106310641065106610671068106910701071107210731074107510761077107810791080108110821083108410851086
  1. /*
  2. * Procedures for creating, accessing and interpreting the device tree.
  3. *
  4. * Paul Mackerras August 1996.
  5. * Copyright (C) 1996-2005 Paul Mackerras.
  6. *
  7. * Adapted for 64bit PowerPC by Dave Engebretsen and Peter Bergner.
  8. * {engebret|bergner}@us.ibm.com
  9. *
  10. * This program is free software; you can redistribute it and/or
  11. * modify it under the terms of the GNU General Public License
  12. * as published by the Free Software Foundation; either version
  13. * 2 of the License, or (at your option) any later version.
  14. */
  15. #undef DEBUG
  16. #include <stdarg.h>
  17. #include <linux/kernel.h>
  18. #include <linux/string.h>
  19. #include <linux/init.h>
  20. #include <linux/threads.h>
  21. #include <linux/spinlock.h>
  22. #include <linux/types.h>
  23. #include <linux/pci.h>
  24. #include <linux/stringify.h>
  25. #include <linux/delay.h>
  26. #include <linux/initrd.h>
  27. #include <linux/bitops.h>
  28. #include <linux/module.h>
  29. #include <linux/kexec.h>
  30. #include <linux/debugfs.h>
  31. #include <linux/irq.h>
  32. #include <linux/lmb.h>
  33. #include <asm/prom.h>
  34. #include <asm/rtas.h>
  35. #include <asm/page.h>
  36. #include <asm/processor.h>
  37. #include <asm/irq.h>
  38. #include <asm/io.h>
  39. #include <asm/kdump.h>
  40. #include <asm/smp.h>
  41. #include <asm/system.h>
  42. #include <asm/mmu.h>
  43. #include <asm/pgtable.h>
  44. #include <asm/pci.h>
  45. #include <asm/iommu.h>
  46. #include <asm/btext.h>
  47. #include <asm/sections.h>
  48. #include <asm/machdep.h>
  49. #include <asm/pSeries_reconfig.h>
  50. #include <asm/pci-bridge.h>
  51. #include <asm/phyp_dump.h>
  52. #include <asm/kexec.h>
  53. #include <mm/mmu_decl.h>
  54. #ifdef DEBUG
  55. #define DBG(fmt...) printk(KERN_ERR fmt)
  56. #else
  57. #define DBG(fmt...)
  58. #endif
  59. #ifdef CONFIG_PPC64
  60. int __initdata iommu_is_off;
  61. int __initdata iommu_force_on;
  62. unsigned long tce_alloc_start, tce_alloc_end;
  63. #endif
  64. extern rwlock_t devtree_lock; /* temporary while merging */
  65. /* export that to outside world */
  66. struct device_node *of_chosen;
  67. static int __init early_parse_mem(char *p)
  68. {
  69. if (!p)
  70. return 1;
  71. memory_limit = PAGE_ALIGN(memparse(p, &p));
  72. DBG("memory limit = 0x%llx\n", (unsigned long long)memory_limit);
  73. return 0;
  74. }
  75. early_param("mem", early_parse_mem);
  76. /**
  77. * move_device_tree - move tree to an unused area, if needed.
  78. *
  79. * The device tree may be allocated beyond our memory limit, or inside the
  80. * crash kernel region for kdump. If so, move it out of the way.
  81. */
  82. static void __init move_device_tree(void)
  83. {
  84. unsigned long start, size;
  85. void *p;
  86. DBG("-> move_device_tree\n");
  87. start = __pa(initial_boot_params);
  88. size = initial_boot_params->totalsize;
  89. if ((memory_limit && (start + size) > memory_limit) ||
  90. overlaps_crashkernel(start, size)) {
  91. p = __va(lmb_alloc_base(size, PAGE_SIZE, lmb.rmo_size));
  92. memcpy(p, initial_boot_params, size);
  93. initial_boot_params = (struct boot_param_header *)p;
  94. DBG("Moved device tree to 0x%p\n", p);
  95. }
  96. DBG("<- move_device_tree\n");
  97. }
  /*
   * ibm,pa-features is a per-cpu property holding a string of attribute
   * descriptors.  Each descriptor has a 2 byte header followed by up to
   * 254 bytes of processor attribute bits.  The first header byte gives
   * the number of bytes following the header; the second is an
   * "attribute-specifier" type, of which zero is the only currently
   * defined value.
   *
   * Each table entry below names the byte and bit of the type-0
   * descriptor that controls a feature, and the kernel/user feature bits
   * to set or clear accordingly.  Bit numbers are big-endian to match the
   * definition in PAPR.
   */
  static struct ibm_pa_feature {
      unsigned long cpu_features;    /* CPU_FTR_xxx bit */
      unsigned int cpu_user_ftrs;    /* PPC_FEATURE_xxx bit */
      unsigned char pabyte;          /* byte number in ibm,pa-features */
      unsigned char pabit;           /* bit number (big-endian) */
      unsigned char invert;          /* if 1, pa bit set => clear feature */
  } ibm_pa_features[] __initdata = {
      { .cpu_user_ftrs = PPC_FEATURE_HAS_MMU,
        .pabyte = 0, .pabit = 0, .invert = 0 },
      { .cpu_user_ftrs = PPC_FEATURE_HAS_FPU,
        .pabyte = 0, .pabit = 1, .invert = 0 },
      { .cpu_features = CPU_FTR_SLB,
        .pabyte = 0, .pabit = 2, .invert = 0 },
      { .cpu_features = CPU_FTR_CTRL,
        .pabyte = 0, .pabit = 3, .invert = 0 },
      { .cpu_features = CPU_FTR_NOEXECUTE,
        .pabyte = 0, .pabit = 6, .invert = 0 },
      { .cpu_features = CPU_FTR_NODSISRALIGN,
        .pabyte = 1, .pabit = 1, .invert = 1 },
      { .cpu_features = CPU_FTR_CI_LARGE_PAGE,
        .pabyte = 1, .pabit = 2, .invert = 0 },
      { .cpu_features = CPU_FTR_REAL_LE,
        .cpu_user_ftrs = PPC_FEATURE_TRUE_LE,
        .pabyte = 5, .pabit = 0, .invert = 0 },
  };
  127. static void __init scan_features(unsigned long node, unsigned char *ftrs,
  128. unsigned long tablelen,
  129. struct ibm_pa_feature *fp,
  130. unsigned long ft_size)
  131. {
  132. unsigned long i, len, bit;
  133. /* find descriptor with type == 0 */
  134. for (;;) {
  135. if (tablelen < 3)
  136. return;
  137. len = 2 + ftrs[0];
  138. if (tablelen < len)
  139. return; /* descriptor 0 not found */
  140. if (ftrs[1] == 0)
  141. break;
  142. tablelen -= len;
  143. ftrs += len;
  144. }
  145. /* loop over bits we know about */
  146. for (i = 0; i < ft_size; ++i, ++fp) {
  147. if (fp->pabyte >= ftrs[0])
  148. continue;
  149. bit = (ftrs[2 + fp->pabyte] >> (7 - fp->pabit)) & 1;
  150. if (bit ^ fp->invert) {
  151. cur_cpu_spec->cpu_features |= fp->cpu_features;
  152. cur_cpu_spec->cpu_user_features |= fp->cpu_user_ftrs;
  153. } else {
  154. cur_cpu_spec->cpu_features &= ~fp->cpu_features;
  155. cur_cpu_spec->cpu_user_features &= ~fp->cpu_user_ftrs;
  156. }
  157. }
  158. }
  159. static void __init check_cpu_pa_features(unsigned long node)
  160. {
  161. unsigned char *pa_ftrs;
  162. unsigned long tablelen;
  163. pa_ftrs = of_get_flat_dt_prop(node, "ibm,pa-features", &tablelen);
  164. if (pa_ftrs == NULL)
  165. return;
  166. scan_features(node, pa_ftrs, tablelen,
  167. ibm_pa_features, ARRAY_SIZE(ibm_pa_features));
  168. }
  #ifdef CONFIG_PPC_STD_MMU_64
  /*
   * check_cpu_slb_size - pick up the SLB size advertised by a cpu node
   * @node: flat device tree node to inspect
   *
   * "slb-size" takes precedence over "ibm,slb-size".  mmu_slb_size is left
   * untouched when neither property exists.
   */
  static void __init check_cpu_slb_size(unsigned long node)
  {
      u32 *slb_size;

      slb_size = of_get_flat_dt_prop(node, "slb-size", NULL);
      if (slb_size == NULL)
          slb_size = of_get_flat_dt_prop(node, "ibm,slb-size", NULL);

      if (slb_size != NULL)
          mmu_slb_size = *slb_size;
  }
  #else
  #define check_cpu_slb_size(node) do { } while(0)
  #endif
  186. static struct feature_property {
  187. const char *name;
  188. u32 min_value;
  189. unsigned long cpu_feature;
  190. unsigned long cpu_user_ftr;
  191. } feature_properties[] __initdata = {
  192. #ifdef CONFIG_ALTIVEC
  193. {"altivec", 0, CPU_FTR_ALTIVEC, PPC_FEATURE_HAS_ALTIVEC},
  194. {"ibm,vmx", 1, CPU_FTR_ALTIVEC, PPC_FEATURE_HAS_ALTIVEC},
  195. #endif /* CONFIG_ALTIVEC */
  196. #ifdef CONFIG_VSX
  197. /* Yes, this _really_ is ibm,vmx == 2 to enable VSX */
  198. {"ibm,vmx", 2, CPU_FTR_VSX, PPC_FEATURE_HAS_VSX},
  199. #endif /* CONFIG_VSX */
  200. #ifdef CONFIG_PPC64
  201. {"ibm,dfp", 1, 0, PPC_FEATURE_HAS_DFP},
  202. {"ibm,purr", 1, CPU_FTR_PURR, 0},
  203. {"ibm,spurr", 1, CPU_FTR_SPURR, 0},
  204. #endif /* CONFIG_PPC64 */
  205. };
  #if defined(CONFIG_44x) && defined(CONFIG_PPC_FPU)
  /*
   * identical_pvr_fixup - tell 440EP(x) apart from 440GR(x)
   * @node: flat device tree cpu node
   *
   * Since 440GR(x)/440EP(x) processors have the same pvr, the "model"
   * property is examined instead.  For an EP(x) part, bit 28 (mask 0x8) is
   * set in a copy of the cur_cpu_spec pvr; this bit is always 0 in the
   * "real" pvr.  identify_cpu() is then called again with that logical pvr
   * to enable FPU support.
   */
  static inline void identical_pvr_fixup(unsigned long node)
  {
      char *model = of_get_flat_dt_prop(node, "model", NULL);
      unsigned int logical_pvr;

      if (!model || !strstr(model, "440EP"))
          return;

      logical_pvr = cur_cpu_spec->pvr_value | 0x8;
      identify_cpu(0, logical_pvr);
      DBG("Using logical pvr %x for %s\n", logical_pvr, model);
  }
  #else
  #define identical_pvr_fixup(node) do { } while(0)
  #endif
  227. static void __init check_cpu_feature_properties(unsigned long node)
  228. {
  229. unsigned long i;
  230. struct feature_property *fp = feature_properties;
  231. const u32 *prop;
  232. for (i = 0; i < ARRAY_SIZE(feature_properties); ++i, ++fp) {
  233. prop = of_get_flat_dt_prop(node, fp->name, NULL);
  234. if (prop && *prop >= fp->min_value) {
  235. cur_cpu_spec->cpu_features |= fp->cpu_feature;
  236. cur_cpu_spec->cpu_user_features |= fp->cpu_user_ftr;
  237. }
  238. }
  239. }
  240. static int __init early_init_dt_scan_cpus(unsigned long node,
  241. const char *uname, int depth,
  242. void *data)
  243. {
  244. static int logical_cpuid = 0;
  245. char *type = of_get_flat_dt_prop(node, "device_type", NULL);
  246. const u32 *prop;
  247. const u32 *intserv;
  248. int i, nthreads;
  249. unsigned long len;
  250. int found = 0;
  251. /* We are scanning "cpu" nodes only */
  252. if (type == NULL || strcmp(type, "cpu") != 0)
  253. return 0;
  254. /* Get physical cpuid */
  255. intserv = of_get_flat_dt_prop(node, "ibm,ppc-interrupt-server#s", &len);
  256. if (intserv) {
  257. nthreads = len / sizeof(int);
  258. } else {
  259. intserv = of_get_flat_dt_prop(node, "reg", NULL);
  260. nthreads = 1;
  261. }
  262. /*
  263. * Now see if any of these threads match our boot cpu.
  264. * NOTE: This must match the parsing done in smp_setup_cpu_maps.
  265. */
  266. for (i = 0; i < nthreads; i++) {
  267. /*
  268. * version 2 of the kexec param format adds the phys cpuid of
  269. * booted proc.
  270. */
  271. if (initial_boot_params && initial_boot_params->version >= 2) {
  272. if (intserv[i] ==
  273. initial_boot_params->boot_cpuid_phys) {
  274. found = 1;
  275. break;
  276. }
  277. } else {
  278. /*
  279. * Check if it's the boot-cpu, set it's hw index now,
  280. * unfortunately this format did not support booting
  281. * off secondary threads.
  282. */
  283. if (of_get_flat_dt_prop(node,
  284. "linux,boot-cpu", NULL) != NULL) {
  285. found = 1;
  286. break;
  287. }
  288. }
  289. #ifdef CONFIG_SMP
  290. /* logical cpu id is always 0 on UP kernels */
  291. logical_cpuid++;
  292. #endif
  293. }
  294. if (found) {
  295. DBG("boot cpu: logical %d physical %d\n", logical_cpuid,
  296. intserv[i]);
  297. boot_cpuid = logical_cpuid;
  298. set_hard_smp_processor_id(boot_cpuid, intserv[i]);
  299. /*
  300. * PAPR defines "logical" PVR values for cpus that
  301. * meet various levels of the architecture:
  302. * 0x0f000001 Architecture version 2.04
  303. * 0x0f000002 Architecture version 2.05
  304. * If the cpu-version property in the cpu node contains
  305. * such a value, we call identify_cpu again with the
  306. * logical PVR value in order to use the cpu feature
  307. * bits appropriate for the architecture level.
  308. *
  309. * A POWER6 partition in "POWER6 architected" mode
  310. * uses the 0x0f000002 PVR value; in POWER5+ mode
  311. * it uses 0x0f000001.
  312. */
  313. prop = of_get_flat_dt_prop(node, "cpu-version", NULL);
  314. if (prop && (*prop & 0xff000000) == 0x0f000000)
  315. identify_cpu(0, *prop);
  316. identical_pvr_fixup(node);
  317. }
  318. check_cpu_feature_properties(node);
  319. check_cpu_pa_features(node);
  320. check_cpu_slb_size(node);
  321. #ifdef CONFIG_PPC_PSERIES
  322. if (nthreads > 1)
  323. cur_cpu_spec->cpu_features |= CPU_FTR_SMT;
  324. else
  325. cur_cpu_spec->cpu_features &= ~CPU_FTR_SMT;
  326. #endif
  327. return 0;
  328. }
  329. void __init early_init_dt_scan_chosen_arch(unsigned long node)
  330. {
  331. unsigned long *lprop;
  332. #ifdef CONFIG_PPC64
  333. /* check if iommu is forced on or off */
  334. if (of_get_flat_dt_prop(node, "linux,iommu-off", NULL) != NULL)
  335. iommu_is_off = 1;
  336. if (of_get_flat_dt_prop(node, "linux,iommu-force-on", NULL) != NULL)
  337. iommu_force_on = 1;
  338. #endif
  339. /* mem=x on the command line is the preferred mechanism */
  340. lprop = of_get_flat_dt_prop(node, "linux,memory-limit", NULL);
  341. if (lprop)
  342. memory_limit = *lprop;
  343. #ifdef CONFIG_PPC64
  344. lprop = of_get_flat_dt_prop(node, "linux,tce-alloc-start", NULL);
  345. if (lprop)
  346. tce_alloc_start = *lprop;
  347. lprop = of_get_flat_dt_prop(node, "linux,tce-alloc-end", NULL);
  348. if (lprop)
  349. tce_alloc_end = *lprop;
  350. #endif
  351. #ifdef CONFIG_KEXEC
  352. lprop = of_get_flat_dt_prop(node, "linux,crashkernel-base", NULL);
  353. if (lprop)
  354. crashk_res.start = *lprop;
  355. lprop = of_get_flat_dt_prop(node, "linux,crashkernel-size", NULL);
  356. if (lprop)
  357. crashk_res.end = crashk_res.start + *lprop - 1;
  358. #endif
  359. }
  #ifdef CONFIG_PPC_PSERIES
  /*
   * Interpret the ibm,dynamic-memory property in the
   * /ibm,dynamic-reconfiguration-memory node.
   * This contains a list of memory blocks along with NUMA affinity
   * information.
   *
   * Every block that is assigned to this partition and not reserved is
   * handed to lmb_add().  When "linux,drconf-usable-memory" is present
   * (kexec/kdump kernel), the ranges listed there are added instead of the
   * whole block.
   *
   * Always returns 0.
   */
  static int __init early_init_dt_scan_drconf_memory(unsigned long node)
  {
      __be32 *dm, *ls, *usm;
      unsigned long prop_len, nr_blocks, blk, flags;
      u64 base, size, lmb_size;
      unsigned int is_kexec_kdump, rngs;

      ls = of_get_flat_dt_prop(node, "ibm,lmb-size", &prop_len);
      if (ls == NULL || prop_len < dt_root_size_cells * sizeof(__be32))
          return 0;
      lmb_size = dt_mem_next_cell(dt_root_size_cells, &ls);

      dm = of_get_flat_dt_prop(node, "ibm,dynamic-memory", &prop_len);
      if (dm == NULL || prop_len < sizeof(__be32))
          return 0;

      /* First cell is the number of entries; make sure they all fit. */
      nr_blocks = *dm++;
      if (prop_len <
          (nr_blocks * (dt_root_addr_cells + 4) + 1) * sizeof(__be32))
          return 0;

      /* check if this is a kexec/kdump kernel. */
      usm = of_get_flat_dt_prop(node, "linux,drconf-usable-memory",
                                &prop_len);
      is_kexec_kdump = (usm != NULL) ? 1 : 0;

      for (blk = 0; blk < nr_blocks; blk++) {
          base = dt_mem_next_cell(dt_root_addr_cells, &dm);
          flags = dm[3];
          /* skip DRC index, pad, assoc. list index, flags */
          dm += 4;

          /*
           * skip this block if the reserved bit is set in flags (0x80)
           * or if the block is not assigned to this partition (0x8)
           */
          if (flags & 0x80)
              continue;
          if (!(flags & 0x8))
              continue;

          size = lmb_size;
          rngs = 1;
          if (is_kexec_kdump) {
              /*
               * For each lmb in ibm,dynamic-memory, a corresponding
               * entry in linux,drconf-usable-memory property contains
               * a counter 'p' followed by 'p' (base, size) duple.
               * Now read the counter from
               * linux,drconf-usable-memory property
               */
              rngs = dt_mem_next_cell(dt_root_size_cells, &usm);
              if (rngs == 0)    /* there are no (base, size) duple */
                  continue;
          }

          do {
              if (is_kexec_kdump) {
                  base = dt_mem_next_cell(dt_root_addr_cells, &usm);
                  size = dt_mem_next_cell(dt_root_size_cells, &usm);
              }
              if (iommu_is_off) {
                  /* Drop or trim anything at or above 0x80000000. */
                  if (base >= 0x80000000ul)
                      continue;
                  if ((base + size) > 0x80000000ul)
                      size = 0x80000000ul - base;
              }
              lmb_add(base, size);
          } while (--rngs);
      }

      lmb_dump_all();
      return 0;
  }
  #else
  #define early_init_dt_scan_drconf_memory(node) 0
  #endif /* CONFIG_PPC_PSERIES */
  433. static int __init early_init_dt_scan_memory(unsigned long node,
  434. const char *uname, int depth, void *data)
  435. {
  436. char *type = of_get_flat_dt_prop(node, "device_type", NULL);
  437. __be32 *reg, *endp;
  438. unsigned long l;
  439. /* Look for the ibm,dynamic-reconfiguration-memory node */
  440. if (depth == 1 &&
  441. strcmp(uname, "ibm,dynamic-reconfiguration-memory") == 0)
  442. return early_init_dt_scan_drconf_memory(node);
  443. /* We are scanning "memory" nodes only */
  444. if (type == NULL) {
  445. /*
  446. * The longtrail doesn't have a device_type on the
  447. * /memory node, so look for the node called /memory@0.
  448. */
  449. if (depth != 1 || strcmp(uname, "memory@0") != 0)
  450. return 0;
  451. } else if (strcmp(type, "memory") != 0)
  452. return 0;
  453. reg = of_get_flat_dt_prop(node, "linux,usable-memory", &l);
  454. if (reg == NULL)
  455. reg = of_get_flat_dt_prop(node, "reg", &l);
  456. if (reg == NULL)
  457. return 0;
  458. endp = reg + (l / sizeof(__be32));
  459. DBG("memory scan node %s, reg size %ld, data: %x %x %x %x,\n",
  460. uname, l, reg[0], reg[1], reg[2], reg[3]);
  461. while ((endp - reg) >= (dt_root_addr_cells + dt_root_size_cells)) {
  462. u64 base, size;
  463. base = dt_mem_next_cell(dt_root_addr_cells, &reg);
  464. size = dt_mem_next_cell(dt_root_size_cells, &reg);
  465. if (size == 0)
  466. continue;
  467. DBG(" - %llx , %llx\n", (unsigned long long)base,
  468. (unsigned long long)size);
  469. #ifdef CONFIG_PPC64
  470. if (iommu_is_off) {
  471. if (base >= 0x80000000ul)
  472. continue;
  473. if ((base + size) > 0x80000000ul)
  474. size = 0x80000000ul - base;
  475. }
  476. #endif
  477. lmb_add(base, size);
  478. memstart_addr = min((u64)memstart_addr, base);
  479. }
  480. return 0;
  481. }
  482. static void __init early_reserve_mem(void)
  483. {
  484. u64 base, size;
  485. u64 *reserve_map;
  486. unsigned long self_base;
  487. unsigned long self_size;
  488. reserve_map = (u64 *)(((unsigned long)initial_boot_params) +
  489. initial_boot_params->off_mem_rsvmap);
  490. /* before we do anything, lets reserve the dt blob */
  491. self_base = __pa((unsigned long)initial_boot_params);
  492. self_size = initial_boot_params->totalsize;
  493. lmb_reserve(self_base, self_size);
  494. #ifdef CONFIG_BLK_DEV_INITRD
  495. /* then reserve the initrd, if any */
  496. if (initrd_start && (initrd_end > initrd_start))
  497. lmb_reserve(__pa(initrd_start), initrd_end - initrd_start);
  498. #endif /* CONFIG_BLK_DEV_INITRD */
  499. #ifdef CONFIG_PPC32
  500. /*
  501. * Handle the case where we might be booting from an old kexec
  502. * image that setup the mem_rsvmap as pairs of 32-bit values
  503. */
  504. if (*reserve_map > 0xffffffffull) {
  505. u32 base_32, size_32;
  506. u32 *reserve_map_32 = (u32 *)reserve_map;
  507. while (1) {
  508. base_32 = *(reserve_map_32++);
  509. size_32 = *(reserve_map_32++);
  510. if (size_32 == 0)
  511. break;
  512. /* skip if the reservation is for the blob */
  513. if (base_32 == self_base && size_32 == self_size)
  514. continue;
  515. DBG("reserving: %x -> %x\n", base_32, size_32);
  516. lmb_reserve(base_32, size_32);
  517. }
  518. return;
  519. }
  520. #endif
  521. while (1) {
  522. base = *(reserve_map++);
  523. size = *(reserve_map++);
  524. if (size == 0)
  525. break;
  526. DBG("reserving: %llx -> %llx\n", base, size);
  527. lmb_reserve(base, size);
  528. }
  529. }
  530. #ifdef CONFIG_PHYP_DUMP
  531. /**
  532. * phyp_dump_calculate_reserve_size() - reserve variable boot area 5% or arg
  533. *
  534. * Function to find the largest size we need to reserve
  535. * during early boot process.
  536. *
  537. * It either looks for boot param and returns that OR
  538. * returns larger of 256 or 5% rounded down to multiples of 256MB.
  539. *
  540. */
  541. static inline unsigned long phyp_dump_calculate_reserve_size(void)
  542. {
  543. unsigned long tmp;
  544. if (phyp_dump_info->reserve_bootvar)
  545. return phyp_dump_info->reserve_bootvar;
  546. /* divide by 20 to get 5% of value */
  547. tmp = lmb_end_of_DRAM();
  548. do_div(tmp, 20);
  549. /* round it down in multiples of 256 */
  550. tmp = tmp & ~0x0FFFFFFFUL;
  551. return (tmp > PHYP_DUMP_RMR_END ? tmp : PHYP_DUMP_RMR_END);
  552. }
  553. /**
  554. * phyp_dump_reserve_mem() - reserve all not-yet-dumped mmemory
  555. *
  556. * This routine may reserve memory regions in the kernel only
  557. * if the system is supported and a dump was taken in last
  558. * boot instance or if the hardware is supported and the
  559. * scratch area needs to be setup. In other instances it returns
  560. * without reserving anything. The memory in case of dump being
  561. * active is freed when the dump is collected (by userland tools).
  562. */
  563. static void __init phyp_dump_reserve_mem(void)
  564. {
  565. unsigned long base, size;
  566. unsigned long variable_reserve_size;
  567. if (!phyp_dump_info->phyp_dump_configured) {
  568. printk(KERN_ERR "Phyp-dump not supported on this hardware\n");
  569. return;
  570. }
  571. if (!phyp_dump_info->phyp_dump_at_boot) {
  572. printk(KERN_INFO "Phyp-dump disabled at boot time\n");
  573. return;
  574. }
  575. variable_reserve_size = phyp_dump_calculate_reserve_size();
  576. if (phyp_dump_info->phyp_dump_is_active) {
  577. /* Reserve *everything* above RMR.Area freed by userland tools*/
  578. base = variable_reserve_size;
  579. size = lmb_end_of_DRAM() - base;
  580. /* XXX crashed_ram_end is wrong, since it may be beyond
  581. * the memory_limit, it will need to be adjusted. */
  582. lmb_reserve(base, size);
  583. phyp_dump_info->init_reserve_start = base;
  584. phyp_dump_info->init_reserve_size = size;
  585. } else {
  586. size = phyp_dump_info->cpu_state_size +
  587. phyp_dump_info->hpte_region_size +
  588. variable_reserve_size;
  589. base = lmb_end_of_DRAM() - size;
  590. lmb_reserve(base, size);
  591. phyp_dump_info->init_reserve_start = base;
  592. phyp_dump_info->init_reserve_size = size;
  593. }
  594. }
  595. #else
  596. static inline void __init phyp_dump_reserve_mem(void) {}
  #endif /* CONFIG_PHYP_DUMP */
  598. void __init early_init_devtree(void *params)
  599. {
  600. phys_addr_t limit;
  601. DBG(" -> early_init_devtree(%p)\n", params);
  602. /* Setup flat device-tree pointer */
  603. initial_boot_params = params;
  604. #ifdef CONFIG_PPC_RTAS
  605. /* Some machines might need RTAS info for debugging, grab it now. */
  606. of_scan_flat_dt(early_init_dt_scan_rtas, NULL);
  607. #endif
  608. #ifdef CONFIG_PHYP_DUMP
  609. /* scan tree to see if dump occured during last boot */
  610. of_scan_flat_dt(early_init_dt_scan_phyp_dump, NULL);
  611. #endif
  612. /* Retrieve various informations from the /chosen node of the
  613. * device-tree, including the platform type, initrd location and
  614. * size, TCE reserve, and more ...
  615. */
  616. of_scan_flat_dt(early_init_dt_scan_chosen, NULL);
  617. /* Scan memory nodes and rebuild LMBs */
  618. lmb_init();
  619. of_scan_flat_dt(early_init_dt_scan_root, NULL);
  620. of_scan_flat_dt(early_init_dt_scan_memory, NULL);
  621. /* Save command line for /proc/cmdline and then parse parameters */
  622. strlcpy(boot_command_line, cmd_line, COMMAND_LINE_SIZE);
  623. parse_early_param();
  624. /* Reserve LMB regions used by kernel, initrd, dt, etc... */
  625. lmb_reserve(PHYSICAL_START, __pa(klimit) - PHYSICAL_START);
  626. /* If relocatable, reserve first 32k for interrupt vectors etc. */
  627. if (PHYSICAL_START > MEMORY_START)
  628. lmb_reserve(MEMORY_START, 0x8000);
  629. reserve_kdump_trampoline();
  630. reserve_crashkernel();
  631. early_reserve_mem();
  632. phyp_dump_reserve_mem();
  633. limit = memory_limit;
  634. if (! limit) {
  635. phys_addr_t memsize;
  636. /* Ensure that total memory size is page-aligned, because
  637. * otherwise mark_bootmem() gets upset. */
  638. lmb_analyze();
  639. memsize = lmb_phys_mem_size();
  640. if ((memsize & PAGE_MASK) != memsize)
  641. limit = memsize & PAGE_MASK;
  642. }
  643. lmb_enforce_memory_limit(limit);
  644. lmb_analyze();
  645. lmb_dump_all();
  646. DBG("Phys. mem: %llx\n", lmb_phys_mem_size());
  647. /* We may need to relocate the flat tree, do it now.
  648. * FIXME .. and the initrd too? */
  649. move_device_tree();
  650. DBG("Scanning CPUs ...\n");
  651. /* Retreive CPU related informations from the flat tree
  652. * (altivec support, boot CPU ID, ...)
  653. */
  654. of_scan_flat_dt(early_init_dt_scan_cpus, NULL);
  655. DBG(" <- early_init_devtree()\n");
  656. }
  657. /*******
  658. *
  659. * New implementation of the OF "find" APIs, return a refcounted
  660. * object, call of_node_put() when done. The device tree and list
  661. * are protected by a rw_lock.
  662. *
  663. * Note that property management will need some locking as well,
  664. * this isn't dealt with yet.
  665. *
  666. *******/
  667. /**
  668. * of_find_node_by_phandle - Find a node given a phandle
  669. * @handle: phandle of the node to find
  670. *
  671. * Returns a node pointer with refcount incremented, use
  672. * of_node_put() on it when done.
  673. */
  674. struct device_node *of_find_node_by_phandle(phandle handle)
  675. {
  676. struct device_node *np;
  677. read_lock(&devtree_lock);
  678. for (np = allnodes; np != 0; np = np->allnext)
  679. if (np->linux_phandle == handle)
  680. break;
  681. of_node_get(np);
  682. read_unlock(&devtree_lock);
  683. return np;
  684. }
  685. EXPORT_SYMBOL(of_find_node_by_phandle);
  686. /**
  687. * of_find_next_cache_node - Find a node's subsidiary cache
  688. * @np: node of type "cpu" or "cache"
  689. *
  690. * Returns a node pointer with refcount incremented, use
  691. * of_node_put() on it when done. Caller should hold a reference
  692. * to np.
  693. */
  694. struct device_node *of_find_next_cache_node(struct device_node *np)
  695. {
  696. struct device_node *child;
  697. const phandle *handle;
  698. handle = of_get_property(np, "l2-cache", NULL);
  699. if (!handle)
  700. handle = of_get_property(np, "next-level-cache", NULL);
  701. if (handle)
  702. return of_find_node_by_phandle(*handle);
  703. /* OF on pmac has nodes instead of properties named "l2-cache"
  704. * beneath CPU nodes.
  705. */
  706. if (!strcmp(np->type, "cpu"))
  707. for_each_child_of_node(np, child)
  708. if (!strcmp(child->type, "cache"))
  709. return child;
  710. return NULL;
  711. }
  712. /**
  713. * of_node_get - Increment refcount of a node
  714. * @node: Node to inc refcount, NULL is supported to
  715. * simplify writing of callers
  716. *
  717. * Returns node.
  718. */
  719. struct device_node *of_node_get(struct device_node *node)
  720. {
  721. if (node)
  722. kref_get(&node->kref);
  723. return node;
  724. }
  725. EXPORT_SYMBOL(of_node_get);
  726. static inline struct device_node * kref_to_device_node(struct kref *kref)
  727. {
  728. return container_of(kref, struct device_node, kref);
  729. }
  730. /**
  731. * of_node_release - release a dynamically allocated node
  732. * @kref: kref element of the node to be released
  733. *
  734. * In of_node_put() this function is passed to kref_put()
  735. * as the destructor.
  736. */
  737. static void of_node_release(struct kref *kref)
  738. {
  739. struct device_node *node = kref_to_device_node(kref);
  740. struct property *prop = node->properties;
  741. /* We should never be releasing nodes that haven't been detached. */
  742. if (!of_node_check_flag(node, OF_DETACHED)) {
  743. printk("WARNING: Bad of_node_put() on %s\n", node->full_name);
  744. dump_stack();
  745. kref_init(&node->kref);
  746. return;
  747. }
  748. if (!of_node_check_flag(node, OF_DYNAMIC))
  749. return;
  750. while (prop) {
  751. struct property *next = prop->next;
  752. kfree(prop->name);
  753. kfree(prop->value);
  754. kfree(prop);
  755. prop = next;
  756. if (!prop) {
  757. prop = node->deadprops;
  758. node->deadprops = NULL;
  759. }
  760. }
  761. kfree(node->full_name);
  762. kfree(node->data);
  763. kfree(node);
  764. }
  765. /**
  766. * of_node_put - Decrement refcount of a node
  767. * @node: Node to dec refcount, NULL is supported to
  768. * simplify writing of callers
  769. *
  770. */
  771. void of_node_put(struct device_node *node)
  772. {
  773. if (node)
  774. kref_put(&node->kref, of_node_release);
  775. }
  776. EXPORT_SYMBOL(of_node_put);
  777. /*
  778. * Plug a device node into the tree and global list.
  779. */
  780. void of_attach_node(struct device_node *np)
  781. {
  782. unsigned long flags;
  783. write_lock_irqsave(&devtree_lock, flags);
  784. np->sibling = np->parent->child;
  785. np->allnext = allnodes;
  786. np->parent->child = np;
  787. allnodes = np;
  788. write_unlock_irqrestore(&devtree_lock, flags);
  789. }
  790. /*
  791. * "Unplug" a node from the device tree. The caller must hold
  792. * a reference to the node. The memory associated with the node
  793. * is not freed until its refcount goes to zero.
  794. */
  795. void of_detach_node(struct device_node *np)
  796. {
  797. struct device_node *parent;
  798. unsigned long flags;
  799. write_lock_irqsave(&devtree_lock, flags);
  800. parent = np->parent;
  801. if (!parent)
  802. goto out_unlock;
  803. if (allnodes == np)
  804. allnodes = np->allnext;
  805. else {
  806. struct device_node *prev;
  807. for (prev = allnodes;
  808. prev->allnext != np;
  809. prev = prev->allnext)
  810. ;
  811. prev->allnext = np->allnext;
  812. }
  813. if (parent->child == np)
  814. parent->child = np->sibling;
  815. else {
  816. struct device_node *prevsib;
  817. for (prevsib = np->parent->child;
  818. prevsib->sibling != np;
  819. prevsib = prevsib->sibling)
  820. ;
  821. prevsib->sibling = np->sibling;
  822. }
  823. of_node_set_flag(np, OF_DETACHED);
  824. out_unlock:
  825. write_unlock_irqrestore(&devtree_lock, flags);
  826. }
  827. #ifdef CONFIG_PPC_PSERIES
  828. /*
  829. * Fix up the uninitialized fields in a new device node:
  830. * name, type and pci-specific fields
  831. */
  832. static int of_finish_dynamic_node(struct device_node *node)
  833. {
  834. struct device_node *parent = of_get_parent(node);
  835. int err = 0;
  836. const phandle *ibm_phandle;
  837. node->name = of_get_property(node, "name", NULL);
  838. node->type = of_get_property(node, "device_type", NULL);
  839. if (!node->name)
  840. node->name = "<NULL>";
  841. if (!node->type)
  842. node->type = "<NULL>";
  843. if (!parent) {
  844. err = -ENODEV;
  845. goto out;
  846. }
  847. /* We don't support that function on PowerMac, at least
  848. * not yet
  849. */
  850. if (machine_is(powermac))
  851. return -ENODEV;
  852. /* fix up new node's linux_phandle field */
  853. if ((ibm_phandle = of_get_property(node, "ibm,phandle", NULL)))
  854. node->linux_phandle = *ibm_phandle;
  855. out:
  856. of_node_put(parent);
  857. return err;
  858. }
  859. static int prom_reconfig_notifier(struct notifier_block *nb,
  860. unsigned long action, void *node)
  861. {
  862. int err;
  863. switch (action) {
  864. case PSERIES_RECONFIG_ADD:
  865. err = of_finish_dynamic_node(node);
  866. if (err < 0) {
  867. printk(KERN_ERR "finish_node returned %d\n", err);
  868. err = NOTIFY_BAD;
  869. }
  870. break;
  871. default:
  872. err = NOTIFY_DONE;
  873. break;
  874. }
  875. return err;
  876. }
  877. static struct notifier_block prom_reconfig_nb = {
  878. .notifier_call = prom_reconfig_notifier,
  879. .priority = 10, /* This one needs to run first */
  880. };
  881. static int __init prom_reconfig_setup(void)
  882. {
  883. return pSeries_reconfig_notifier_register(&prom_reconfig_nb);
  884. }
  885. __initcall(prom_reconfig_setup);
  886. #endif
  887. /* Find the device node for a given logical cpu number, also returns the cpu
  888. * local thread number (index in ibm,interrupt-server#s) if relevant and
  889. * asked for (non NULL)
  890. */
  891. struct device_node *of_get_cpu_node(int cpu, unsigned int *thread)
  892. {
  893. int hardid;
  894. struct device_node *np;
  895. hardid = get_hard_smp_processor_id(cpu);
  896. for_each_node_by_type(np, "cpu") {
  897. const u32 *intserv;
  898. unsigned int plen, t;
  899. /* Check for ibm,ppc-interrupt-server#s. If it doesn't exist
  900. * fallback to "reg" property and assume no threads
  901. */
  902. intserv = of_get_property(np, "ibm,ppc-interrupt-server#s",
  903. &plen);
  904. if (intserv == NULL) {
  905. const u32 *reg = of_get_property(np, "reg", NULL);
  906. if (reg == NULL)
  907. continue;
  908. if (*reg == hardid) {
  909. if (thread)
  910. *thread = 0;
  911. return np;
  912. }
  913. } else {
  914. plen /= sizeof(u32);
  915. for (t = 0; t < plen; t++) {
  916. if (hardid == intserv[t]) {
  917. if (thread)
  918. *thread = t;
  919. return np;
  920. }
  921. }
  922. }
  923. }
  924. return NULL;
  925. }
  926. EXPORT_SYMBOL(of_get_cpu_node);
  927. #if defined(CONFIG_DEBUG_FS) && defined(DEBUG)
  928. static struct debugfs_blob_wrapper flat_dt_blob;
  929. static int __init export_flat_device_tree(void)
  930. {
  931. struct dentry *d;
  932. flat_dt_blob.data = initial_boot_params;
  933. flat_dt_blob.size = initial_boot_params->totalsize;
  934. d = debugfs_create_blob("flat-device-tree", S_IFREG | S_IRUSR,
  935. powerpc_debugfs_root, &flat_dt_blob);
  936. if (!d)
  937. return 1;
  938. return 0;
  939. }
  940. __initcall(export_flat_device_tree);
  941. #endif