setup_64.c 16 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634
  1. /*
  2. *
  3. * Common boot and setup code.
  4. *
  5. * Copyright (C) 2001 PPC64 Team, IBM Corp
  6. *
  7. * This program is free software; you can redistribute it and/or
  8. * modify it under the terms of the GNU General Public License
  9. * as published by the Free Software Foundation; either version
  10. * 2 of the License, or (at your option) any later version.
  11. */
  12. #undef DEBUG
  13. #include <linux/config.h>
  14. #include <linux/module.h>
  15. #include <linux/string.h>
  16. #include <linux/sched.h>
  17. #include <linux/init.h>
  18. #include <linux/kernel.h>
  19. #include <linux/reboot.h>
  20. #include <linux/delay.h>
  21. #include <linux/initrd.h>
  22. #include <linux/ide.h>
  23. #include <linux/seq_file.h>
  24. #include <linux/ioport.h>
  25. #include <linux/console.h>
  26. #include <linux/utsname.h>
  27. #include <linux/tty.h>
  28. #include <linux/root_dev.h>
  29. #include <linux/notifier.h>
  30. #include <linux/cpu.h>
  31. #include <linux/unistd.h>
  32. #include <linux/serial.h>
  33. #include <linux/serial_8250.h>
  34. #include <linux/bootmem.h>
  35. #include <asm/io.h>
  36. #include <asm/kdump.h>
  37. #include <asm/prom.h>
  38. #include <asm/processor.h>
  39. #include <asm/pgtable.h>
  40. #include <asm/smp.h>
  41. #include <asm/elf.h>
  42. #include <asm/machdep.h>
  43. #include <asm/paca.h>
  44. #include <asm/time.h>
  45. #include <asm/cputable.h>
  46. #include <asm/sections.h>
  47. #include <asm/btext.h>
  48. #include <asm/nvram.h>
  49. #include <asm/setup.h>
  50. #include <asm/system.h>
  51. #include <asm/rtas.h>
  52. #include <asm/iommu.h>
  53. #include <asm/serial.h>
  54. #include <asm/cache.h>
  55. #include <asm/page.h>
  56. #include <asm/mmu.h>
  57. #include <asm/lmb.h>
  58. #include <asm/iseries/it_lp_naca.h>
  59. #include <asm/firmware.h>
  60. #include <asm/xmon.h>
  61. #include <asm/udbg.h>
  62. #include <asm/kexec.h>
  63. #include "setup.h"
  64. #ifdef DEBUG
  65. #define DBG(fmt...) udbg_printf(fmt)
  66. #else
  67. #define DBG(fmt...)
  68. #endif
  69. int have_of = 1;
  70. int boot_cpuid = 0;
  71. dev_t boot_dev;
  72. u64 ppc64_pft_size;
  73. /* Pick defaults since we might want to patch instructions
  74. * before we've read this from the device tree.
  75. */
  76. struct ppc64_caches ppc64_caches = {
  77. .dline_size = 0x80,
  78. .log_dline_size = 7,
  79. .iline_size = 0x80,
  80. .log_iline_size = 7
  81. };
  82. EXPORT_SYMBOL_GPL(ppc64_caches);
  83. /*
  84. * These are used in binfmt_elf.c to put aux entries on the stack
  85. * for each elf executable being started.
  86. */
  87. int dcache_bsize;
  88. int icache_bsize;
  89. int ucache_bsize;
  90. #ifdef CONFIG_MAGIC_SYSRQ
  91. unsigned long SYSRQ_KEY;
  92. #endif /* CONFIG_MAGIC_SYSRQ */
  93. static int ppc64_panic_event(struct notifier_block *, unsigned long, void *);
  94. static struct notifier_block ppc64_panic_block = {
  95. .notifier_call = ppc64_panic_event,
  96. .priority = INT_MIN /* may not return; must be done last */
  97. };
  98. #ifdef CONFIG_SMP
  99. static int smt_enabled_cmdline;
  100. /* Look for ibm,smt-enabled OF option */
  101. static void check_smt_enabled(void)
  102. {
  103. struct device_node *dn;
  104. char *smt_option;
  105. /* Allow the command line to overrule the OF option */
  106. if (smt_enabled_cmdline)
  107. return;
  108. dn = of_find_node_by_path("/options");
  109. if (dn) {
  110. smt_option = (char *)get_property(dn, "ibm,smt-enabled", NULL);
  111. if (smt_option) {
  112. if (!strcmp(smt_option, "on"))
  113. smt_enabled_at_boot = 1;
  114. else if (!strcmp(smt_option, "off"))
  115. smt_enabled_at_boot = 0;
  116. }
  117. }
  118. }
  119. /* Look for smt-enabled= cmdline option */
  120. static int __init early_smt_enabled(char *p)
  121. {
  122. smt_enabled_cmdline = 1;
  123. if (!p)
  124. return 0;
  125. if (!strcmp(p, "on") || !strcmp(p, "1"))
  126. smt_enabled_at_boot = 1;
  127. else if (!strcmp(p, "off") || !strcmp(p, "0"))
  128. smt_enabled_at_boot = 0;
  129. return 0;
  130. }
  131. early_param("smt-enabled", early_smt_enabled);
  132. #else
  133. #define check_smt_enabled()
  134. #endif /* CONFIG_SMP */
  135. /*
  136. * Early initialization entry point. This is called by head.S
  137. * with MMU translation disabled. We rely on the "feature" of
  138. * the CPU that ignores the top 2 bits of the address in real
  139. * mode so we can access kernel globals normally provided we
  140. * only toy with things in the RMO region. From here, we do
  141. * some early parsing of the device-tree to setup out LMB
  142. * data structures, and allocate & initialize the hash table
  143. * and segment tables so we can start running with translation
  144. * enabled.
  145. *
  146. * It is this function which will call the probe() callback of
  147. * the various platform types and copy the matching one to the
  148. * global ppc_md structure. Your platform can eventually do
  149. * some very early initializations from the probe() routine, but
  150. * this is not recommended, be very careful as, for example, the
  151. * device-tree is not accessible via normal means at this point.
  152. */
  153. void __init early_setup(unsigned long dt_ptr)
  154. {
  155. /* Enable early debugging if any specified (see udbg.h) */
  156. udbg_early_init();
  157. DBG(" -> early_setup(), dt_ptr: 0x%lx\n", dt_ptr);
  158. /*
  159. * Do early initializations using the flattened device
  160. * tree, like retreiving the physical memory map or
  161. * calculating/retreiving the hash table size
  162. */
  163. early_init_devtree(__va(dt_ptr));
  164. /* Now we know the logical id of our boot cpu, setup the paca. */
  165. setup_boot_paca();
  166. /* Fix up paca fields required for the boot cpu */
  167. get_paca()->cpu_start = 1;
  168. get_paca()->stab_real = __pa((u64)&initial_stab);
  169. get_paca()->stab_addr = (u64)&initial_stab;
  170. /* Probe the machine type */
  171. probe_machine();
  172. #ifdef CONFIG_CRASH_DUMP
  173. kdump_setup();
  174. #endif
  175. DBG("Found, Initializing memory management...\n");
  176. /*
  177. * Initialize the MMU Hash table and create the linear mapping
  178. * of memory. Has to be done before stab/slb initialization as
  179. * this is currently where the page size encoding is obtained
  180. */
  181. htab_initialize();
  182. /*
  183. * Initialize stab / SLB management except on iSeries
  184. */
  185. if (cpu_has_feature(CPU_FTR_SLB))
  186. slb_initialize();
  187. else if (!firmware_has_feature(FW_FEATURE_ISERIES))
  188. stab_initialize(get_paca()->stab_real);
  189. DBG(" <- early_setup()\n");
  190. }
  191. #ifdef CONFIG_SMP
  192. void early_setup_secondary(void)
  193. {
  194. struct paca_struct *lpaca = get_paca();
  195. /* Mark enabled in PACA */
  196. lpaca->proc_enabled = 0;
  197. /* Initialize hash table for that CPU */
  198. htab_initialize_secondary();
  199. /* Initialize STAB/SLB. We use a virtual address as it works
  200. * in real mode on pSeries and we want a virutal address on
  201. * iSeries anyway
  202. */
  203. if (cpu_has_feature(CPU_FTR_SLB))
  204. slb_initialize();
  205. else
  206. stab_initialize(lpaca->stab_addr);
  207. }
  208. #endif /* CONFIG_SMP */
  209. #if defined(CONFIG_SMP) || defined(CONFIG_KEXEC)
  210. void smp_release_cpus(void)
  211. {
  212. extern unsigned long __secondary_hold_spinloop;
  213. unsigned long *ptr;
  214. DBG(" -> smp_release_cpus()\n");
  215. /* All secondary cpus are spinning on a common spinloop, release them
  216. * all now so they can start to spin on their individual paca
  217. * spinloops. For non SMP kernels, the secondary cpus never get out
  218. * of the common spinloop.
  219. * This is useless but harmless on iSeries, secondaries are already
  220. * waiting on their paca spinloops. */
  221. ptr = (unsigned long *)((unsigned long)&__secondary_hold_spinloop
  222. - PHYSICAL_START);
  223. *ptr = 1;
  224. mb();
  225. DBG(" <- smp_release_cpus()\n");
  226. }
  227. #endif /* CONFIG_SMP || CONFIG_KEXEC */
  228. /*
  229. * Initialize some remaining members of the ppc64_caches and systemcfg
  230. * structures
  231. * (at least until we get rid of them completely). This is mostly some
  232. * cache informations about the CPU that will be used by cache flush
  233. * routines and/or provided to userland
  234. */
  235. static void __init initialize_cache_info(void)
  236. {
  237. struct device_node *np;
  238. unsigned long num_cpus = 0;
  239. DBG(" -> initialize_cache_info()\n");
  240. for (np = NULL; (np = of_find_node_by_type(np, "cpu"));) {
  241. num_cpus += 1;
  242. /* We're assuming *all* of the CPUs have the same
  243. * d-cache and i-cache sizes... -Peter
  244. */
  245. if ( num_cpus == 1 ) {
  246. u32 *sizep, *lsizep;
  247. u32 size, lsize;
  248. const char *dc, *ic;
  249. /* Then read cache informations */
  250. if (machine_is(powermac)) {
  251. dc = "d-cache-block-size";
  252. ic = "i-cache-block-size";
  253. } else {
  254. dc = "d-cache-line-size";
  255. ic = "i-cache-line-size";
  256. }
  257. size = 0;
  258. lsize = cur_cpu_spec->dcache_bsize;
  259. sizep = (u32 *)get_property(np, "d-cache-size", NULL);
  260. if (sizep != NULL)
  261. size = *sizep;
  262. lsizep = (u32 *) get_property(np, dc, NULL);
  263. if (lsizep != NULL)
  264. lsize = *lsizep;
  265. if (sizep == 0 || lsizep == 0)
  266. DBG("Argh, can't find dcache properties ! "
  267. "sizep: %p, lsizep: %p\n", sizep, lsizep);
  268. ppc64_caches.dsize = size;
  269. ppc64_caches.dline_size = lsize;
  270. ppc64_caches.log_dline_size = __ilog2(lsize);
  271. ppc64_caches.dlines_per_page = PAGE_SIZE / lsize;
  272. size = 0;
  273. lsize = cur_cpu_spec->icache_bsize;
  274. sizep = (u32 *)get_property(np, "i-cache-size", NULL);
  275. if (sizep != NULL)
  276. size = *sizep;
  277. lsizep = (u32 *)get_property(np, ic, NULL);
  278. if (lsizep != NULL)
  279. lsize = *lsizep;
  280. if (sizep == 0 || lsizep == 0)
  281. DBG("Argh, can't find icache properties ! "
  282. "sizep: %p, lsizep: %p\n", sizep, lsizep);
  283. ppc64_caches.isize = size;
  284. ppc64_caches.iline_size = lsize;
  285. ppc64_caches.log_iline_size = __ilog2(lsize);
  286. ppc64_caches.ilines_per_page = PAGE_SIZE / lsize;
  287. }
  288. }
  289. DBG(" <- initialize_cache_info()\n");
  290. }
  291. /*
  292. * Do some initial setup of the system. The parameters are those which
  293. * were passed in from the bootloader.
  294. */
  295. void __init setup_system(void)
  296. {
  297. DBG(" -> setup_system()\n");
  298. #ifdef CONFIG_KEXEC
  299. kdump_move_device_tree();
  300. #endif
  301. /*
  302. * Unflatten the device-tree passed by prom_init or kexec
  303. */
  304. unflatten_device_tree();
  305. #ifdef CONFIG_KEXEC
  306. kexec_setup(); /* requires unflattened device tree. */
  307. #endif
  308. /*
  309. * Fill the ppc64_caches & systemcfg structures with informations
  310. * retrieved from the device-tree. Need to be called before
  311. * finish_device_tree() since the later requires some of the
  312. * informations filled up here to properly parse the interrupt
  313. * tree.
  314. * It also sets up the cache line sizes which allows to call
  315. * routines like flush_icache_range (used by the hash init
  316. * later on).
  317. */
  318. initialize_cache_info();
  319. #ifdef CONFIG_PPC_RTAS
  320. /*
  321. * Initialize RTAS if available
  322. */
  323. rtas_initialize();
  324. #endif /* CONFIG_PPC_RTAS */
  325. /*
  326. * Check if we have an initrd provided via the device-tree
  327. */
  328. check_for_initrd();
  329. /*
  330. * Do some platform specific early initializations, that includes
  331. * setting up the hash table pointers. It also sets up some interrupt-mapping
  332. * related options that will be used by finish_device_tree()
  333. */
  334. ppc_md.init_early();
  335. /*
  336. * We can discover serial ports now since the above did setup the
  337. * hash table management for us, thus ioremap works. We do that early
  338. * so that further code can be debugged
  339. */
  340. find_legacy_serial_ports();
  341. /*
  342. * "Finish" the device-tree, that is do the actual parsing of
  343. * some of the properties like the interrupt map
  344. */
  345. finish_device_tree();
  346. /*
  347. * Initialize xmon
  348. */
  349. #ifdef CONFIG_XMON_DEFAULT
  350. xmon_init(1);
  351. #endif
  352. /*
  353. * Register early console
  354. */
  355. register_early_udbg_console();
  356. /* Save unparsed command line copy for /proc/cmdline */
  357. strlcpy(saved_command_line, cmd_line, COMMAND_LINE_SIZE);
  358. parse_early_param();
  359. check_smt_enabled();
  360. smp_setup_cpu_maps();
  361. #ifdef CONFIG_SMP
  362. /* Release secondary cpus out of their spinloops at 0x60 now that
  363. * we can map physical -> logical CPU ids
  364. */
  365. smp_release_cpus();
  366. #endif
  367. printk("Starting Linux PPC64 %s\n", system_utsname.version);
  368. printk("-----------------------------------------------------\n");
  369. printk("ppc64_pft_size = 0x%lx\n", ppc64_pft_size);
  370. printk("ppc64_interrupt_controller = 0x%ld\n",
  371. ppc64_interrupt_controller);
  372. printk("physicalMemorySize = 0x%lx\n", lmb_phys_mem_size());
  373. printk("ppc64_caches.dcache_line_size = 0x%x\n",
  374. ppc64_caches.dline_size);
  375. printk("ppc64_caches.icache_line_size = 0x%x\n",
  376. ppc64_caches.iline_size);
  377. printk("htab_address = 0x%p\n", htab_address);
  378. printk("htab_hash_mask = 0x%lx\n", htab_hash_mask);
  379. #if PHYSICAL_START > 0
  380. printk("physical_start = 0x%x\n", PHYSICAL_START);
  381. #endif
  382. printk("-----------------------------------------------------\n");
  383. DBG(" <- setup_system()\n");
  384. }
  385. static int ppc64_panic_event(struct notifier_block *this,
  386. unsigned long event, void *ptr)
  387. {
  388. ppc_md.panic((char *)ptr); /* May not return */
  389. return NOTIFY_DONE;
  390. }
  391. #ifdef CONFIG_IRQSTACKS
  392. static void __init irqstack_early_init(void)
  393. {
  394. unsigned int i;
  395. /*
  396. * interrupt stacks must be under 256MB, we cannot afford to take
  397. * SLB misses on them.
  398. */
  399. for_each_possible_cpu(i) {
  400. softirq_ctx[i] = (struct thread_info *)
  401. __va(lmb_alloc_base(THREAD_SIZE,
  402. THREAD_SIZE, 0x10000000));
  403. hardirq_ctx[i] = (struct thread_info *)
  404. __va(lmb_alloc_base(THREAD_SIZE,
  405. THREAD_SIZE, 0x10000000));
  406. }
  407. }
  408. #else
  409. #define irqstack_early_init()
  410. #endif
  411. /*
  412. * Stack space used when we detect a bad kernel stack pointer, and
  413. * early in SMP boots before relocation is enabled.
  414. */
  415. static void __init emergency_stack_init(void)
  416. {
  417. unsigned long limit;
  418. unsigned int i;
  419. /*
  420. * Emergency stacks must be under 256MB, we cannot afford to take
  421. * SLB misses on them. The ABI also requires them to be 128-byte
  422. * aligned.
  423. *
  424. * Since we use these as temporary stacks during secondary CPU
  425. * bringup, we need to get at them in real mode. This means they
  426. * must also be within the RMO region.
  427. */
  428. limit = min(0x10000000UL, lmb.rmo_size);
  429. for_each_possible_cpu(i)
  430. paca[i].emergency_sp =
  431. __va(lmb_alloc_base(HW_PAGE_SIZE, 128, limit)) + HW_PAGE_SIZE;
  432. }
  433. /*
  434. * Called into from start_kernel, after lock_kernel has been called.
  435. * Initializes bootmem, which is unsed to manage page allocation until
  436. * mem_init is called.
  437. */
  438. void __init setup_arch(char **cmdline_p)
  439. {
  440. extern void do_init_bootmem(void);
  441. ppc64_boot_msg(0x12, "Setup Arch");
  442. *cmdline_p = cmd_line;
  443. /*
  444. * Set cache line size based on type of cpu as a default.
  445. * Systems with OF can look in the properties on the cpu node(s)
  446. * for a possibly more accurate value.
  447. */
  448. dcache_bsize = ppc64_caches.dline_size;
  449. icache_bsize = ppc64_caches.iline_size;
  450. /* reboot on panic */
  451. panic_timeout = 180;
  452. if (ppc_md.panic)
  453. atomic_notifier_chain_register(&panic_notifier_list,
  454. &ppc64_panic_block);
  455. init_mm.start_code = PAGE_OFFSET;
  456. init_mm.end_code = (unsigned long) _etext;
  457. init_mm.end_data = (unsigned long) _edata;
  458. init_mm.brk = klimit;
  459. irqstack_early_init();
  460. emergency_stack_init();
  461. stabs_alloc();
  462. /* set up the bootmem stuff with available memory */
  463. do_init_bootmem();
  464. sparse_init();
  465. #ifdef CONFIG_DUMMY_CONSOLE
  466. conswitchp = &dummy_con;
  467. #endif
  468. ppc_md.setup_arch();
  469. paging_init();
  470. ppc64_boot_msg(0x15, "Setup Done");
  471. }
  472. /* ToDo: do something useful if ppc_md is not yet setup. */
  473. #define PPC64_LINUX_FUNCTION 0x0f000000
  474. #define PPC64_IPL_MESSAGE 0xc0000000
  475. #define PPC64_TERM_MESSAGE 0xb0000000
  476. static void ppc64_do_msg(unsigned int src, const char *msg)
  477. {
  478. if (ppc_md.progress) {
  479. char buf[128];
  480. sprintf(buf, "%08X\n", src);
  481. ppc_md.progress(buf, 0);
  482. snprintf(buf, 128, "%s", msg);
  483. ppc_md.progress(buf, 0);
  484. }
  485. }
  486. /* Print a boot progress message. */
  487. void ppc64_boot_msg(unsigned int src, const char *msg)
  488. {
  489. ppc64_do_msg(PPC64_LINUX_FUNCTION|PPC64_IPL_MESSAGE|src, msg);
  490. printk("[boot]%04x %s\n", src, msg);
  491. }
  492. /* Print a termination message (print only -- does not stop the kernel) */
  493. void ppc64_terminate_msg(unsigned int src, const char *msg)
  494. {
  495. ppc64_do_msg(PPC64_LINUX_FUNCTION|PPC64_TERM_MESSAGE|src, msg);
  496. printk("[terminate]%04x %s\n", src, msg);
  497. }
  498. int check_legacy_ioport(unsigned long base_port)
  499. {
  500. if (ppc_md.check_legacy_ioport == NULL)
  501. return 0;
  502. return ppc_md.check_legacy_ioport(base_port);
  503. }
  504. EXPORT_SYMBOL(check_legacy_ioport);
  505. void cpu_die(void)
  506. {
  507. if (ppc_md.cpu_die)
  508. ppc_md.cpu_die();
  509. }
  510. #ifdef CONFIG_SMP
  511. void __init setup_per_cpu_areas(void)
  512. {
  513. int i;
  514. unsigned long size;
  515. char *ptr;
  516. /* Copy section for each CPU (we discard the original) */
  517. size = ALIGN(__per_cpu_end - __per_cpu_start, SMP_CACHE_BYTES);
  518. #ifdef CONFIG_MODULES
  519. if (size < PERCPU_ENOUGH_ROOM)
  520. size = PERCPU_ENOUGH_ROOM;
  521. #endif
  522. for_each_possible_cpu(i) {
  523. ptr = alloc_bootmem_node(NODE_DATA(cpu_to_node(i)), size);
  524. if (!ptr)
  525. panic("Cannot allocate cpu data for CPU %d\n", i);
  526. paca[i].data_offset = ptr - __per_cpu_start;
  527. memcpy(ptr, __per_cpu_start, __per_cpu_end - __per_cpu_start);
  528. }
  529. }
  530. #endif