setup.c 42 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905906907908909910911912913914915916917918919920921922923924925926927928929930931932933934935936937938939940941942943944945946947948949950951952953954955956957958959960961962963964965966967968969970971972973974975976977978979980981982983984985986987988989990991992993994995996997998999100010011002100310041005100610071008100910101011101210131014101510161017101810191020102110221023102410251026102710281029103010311032103310341035103610371038103910401041104210431044104510461047104810491050105110521053105410551056105710581059106010611062106310641065106610671068106910701071107210731074107510761077107810791080108110821083108410851086108710881089109010911092109310941095109610971098109911001101110211031104110511061107110811091110111111121113111411151116111711181119112011211122112311241125112611271128112911301131113211331134113511361137113811391140114111421143114411451146114711481149115011511152115311541155115611571158115911601161116211631164116511661167116811691170117111721173117411751176117711781179118011811182118311841185118611871188118911901191119211931194119511961197119811991200120112021203120412051206120712081209121012111212121312141215121612171218121912201221122212231224122512261227122812291230123112321233123412351236123712381239124012411242124312441245124612471248124912501251125212531254125512561257125812591260126112621263126412651266126712681269127012711272127312741275127612771278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320132113221323132413251326132713281329133013311332133313341335133613371338133913401341134213431344134513461347134813491350135113521353135413551356135713581359136013611362136313641365136613671368136913701371137213731374137513761377137813791380138113821383138413851386138713881389139013911392139313941395139613971398139914001401140214031404140514061407140814091410141114121413141414151416141714181419142014211422142314241425142614271428142914301431143214331434143514361437143814391440144114421443144414451446144714481449145014511452145314541455145614571458145914601461146214631464146514661467146814691470147114721473147414751476147714781479148014811482148314841485148614871488148914901491149214931494149514961497149814991500150115021503150415051506150715081509151015111512151315141515151615171518151915201521152215231524152515261527152815291530153115321533153415351536153715381539154015411542154315441545154615471548154915501551155215531554155515561557155815591560156115621563156415651566156715681569157015711572157315741575157615771578157915801581158215831584158515861587158815891590159115921593159415951596159715981599160016011602160316041605160616071608160916101611161216131614161516161617161816191620
  1. /*
  2. * linux/arch/i386/kernel/setup.c
  3. *
  4. * Copyright (C) 1995 Linus Torvalds
  5. *
  6. * Support of BIGMEM added by Gerhard Wichert, Siemens AG, July 1999
  7. *
  8. * Memory region support
  9. * David Parsons <orc@pell.chi.il.us>, July-August 1999
  10. *
  11. * Added E820 sanitization routine (removes overlapping memory regions);
  12. * Brian Moyle <bmoyle@mvista.com>, February 2001
  13. *
  14. * Moved CPU detection code to cpu/${cpu}.c
  15. * Patrick Mochel <mochel@osdl.org>, March 2002
  16. *
  17. * Provisions for empty E820 memory regions (reported by certain BIOSes).
  18. * Alex Achenbach <xela@slit.de>, December 2002.
  19. *
  20. */
  21. /*
  22. * This file handles the architecture-dependent parts of initialization
  23. */
  24. #include <linux/config.h>
  25. #include <linux/sched.h>
  26. #include <linux/mm.h>
  27. #include <linux/mmzone.h>
  28. #include <linux/tty.h>
  29. #include <linux/ioport.h>
  30. #include <linux/acpi.h>
  31. #include <linux/apm_bios.h>
  32. #include <linux/initrd.h>
  33. #include <linux/bootmem.h>
  34. #include <linux/seq_file.h>
  35. #include <linux/console.h>
  36. #include <linux/mca.h>
  37. #include <linux/root_dev.h>
  38. #include <linux/highmem.h>
  39. #include <linux/module.h>
  40. #include <linux/efi.h>
  41. #include <linux/init.h>
  42. #include <linux/edd.h>
  43. #include <linux/nodemask.h>
  44. #include <linux/kexec.h>
  45. #include <linux/crash_dump.h>
  46. #include <video/edid.h>
  47. #include <asm/apic.h>
  48. #include <asm/e820.h>
  49. #include <asm/mpspec.h>
  50. #include <asm/setup.h>
  51. #include <asm/arch_hooks.h>
  52. #include <asm/sections.h>
  53. #include <asm/io_apic.h>
  54. #include <asm/ist.h>
  55. #include <asm/io.h>
  56. #include "setup_arch_pre.h"
  57. #include <bios_ebda.h>
  58. /* Forward Declaration. */
  59. void __init find_max_pfn(void);
  60. /* This value is set up by the early boot code to point to the value
  61. immediately after the boot time page tables. It contains a *physical*
  62. address, and must not be in the .bss segment! */
  63. unsigned long init_pg_tables_end __initdata = ~0UL;
  64. int disable_pse __devinitdata = 0;
  65. /*
  66. * Machine setup..
  67. */
  68. #ifdef CONFIG_EFI
  69. int efi_enabled = 0;
  70. EXPORT_SYMBOL(efi_enabled);
  71. #endif
  72. /* cpu data as detected by the assembly code in head.S */
  73. struct cpuinfo_x86 new_cpu_data __initdata = { 0, 0, 0, 0, -1, 1, 0, 0, -1 };
  74. /* common cpu data for all cpus */
  75. struct cpuinfo_x86 boot_cpu_data __read_mostly = { 0, 0, 0, 0, -1, 1, 0, 0, -1 };
  76. EXPORT_SYMBOL(boot_cpu_data);
  77. unsigned long mmu_cr4_features;
  78. #ifdef CONFIG_ACPI
  79. int acpi_disabled = 0;
  80. #else
  81. int acpi_disabled = 1;
  82. #endif
  83. EXPORT_SYMBOL(acpi_disabled);
  84. #ifdef CONFIG_ACPI
  85. int __initdata acpi_force = 0;
  86. extern acpi_interrupt_flags acpi_sci_flags;
  87. #endif
  88. /* for MCA, but anyone else can use it if they want */
  89. unsigned int machine_id;
  90. #ifdef CONFIG_MCA
  91. EXPORT_SYMBOL(machine_id);
  92. #endif
  93. unsigned int machine_submodel_id;
  94. unsigned int BIOS_revision;
  95. unsigned int mca_pentium_flag;
  96. /* For PCI or other memory-mapped resources */
  97. unsigned long pci_mem_start = 0x10000000;
  98. #ifdef CONFIG_PCI
  99. EXPORT_SYMBOL(pci_mem_start);
  100. #endif
  101. /* Boot loader ID as an integer, for the benefit of proc_dointvec */
  102. int bootloader_type;
  103. /* user-defined highmem size */
  104. static unsigned int highmem_pages = -1;
  105. /*
  106. * Setup options
  107. */
  108. struct drive_info_struct { char dummy[32]; } drive_info;
  109. #if defined(CONFIG_BLK_DEV_IDE) || defined(CONFIG_BLK_DEV_HD) || \
  110. defined(CONFIG_BLK_DEV_IDE_MODULE) || defined(CONFIG_BLK_DEV_HD_MODULE)
  111. EXPORT_SYMBOL(drive_info);
  112. #endif
  113. struct screen_info screen_info;
  114. #ifdef CONFIG_VT
  115. EXPORT_SYMBOL(screen_info);
  116. #endif
  117. struct apm_info apm_info;
  118. EXPORT_SYMBOL(apm_info);
  119. struct sys_desc_table_struct {
  120. unsigned short length;
  121. unsigned char table[0];
  122. };
  123. struct edid_info edid_info;
  124. struct ist_info ist_info;
  125. #if defined(CONFIG_X86_SPEEDSTEP_SMI) || \
  126. defined(CONFIG_X86_SPEEDSTEP_SMI_MODULE)
  127. EXPORT_SYMBOL(ist_info);
  128. #endif
  129. struct e820map e820;
  130. extern void early_cpu_init(void);
  131. extern void dmi_scan_machine(void);
  132. extern void generic_apic_probe(char *);
  133. extern int root_mountflags;
  134. unsigned long saved_videomode;
  135. #define RAMDISK_IMAGE_START_MASK 0x07FF
  136. #define RAMDISK_PROMPT_FLAG 0x8000
  137. #define RAMDISK_LOAD_FLAG 0x4000
  138. static char command_line[COMMAND_LINE_SIZE];
  139. unsigned char __initdata boot_params[PARAM_SIZE];
  140. static struct resource data_resource = {
  141. .name = "Kernel data",
  142. .start = 0,
  143. .end = 0,
  144. .flags = IORESOURCE_BUSY | IORESOURCE_MEM
  145. };
  146. static struct resource code_resource = {
  147. .name = "Kernel code",
  148. .start = 0,
  149. .end = 0,
  150. .flags = IORESOURCE_BUSY | IORESOURCE_MEM
  151. };
  152. static struct resource system_rom_resource = {
  153. .name = "System ROM",
  154. .start = 0xf0000,
  155. .end = 0xfffff,
  156. .flags = IORESOURCE_BUSY | IORESOURCE_READONLY | IORESOURCE_MEM
  157. };
  158. static struct resource extension_rom_resource = {
  159. .name = "Extension ROM",
  160. .start = 0xe0000,
  161. .end = 0xeffff,
  162. .flags = IORESOURCE_BUSY | IORESOURCE_READONLY | IORESOURCE_MEM
  163. };
  164. static struct resource adapter_rom_resources[] = { {
  165. .name = "Adapter ROM",
  166. .start = 0xc8000,
  167. .end = 0,
  168. .flags = IORESOURCE_BUSY | IORESOURCE_READONLY | IORESOURCE_MEM
  169. }, {
  170. .name = "Adapter ROM",
  171. .start = 0,
  172. .end = 0,
  173. .flags = IORESOURCE_BUSY | IORESOURCE_READONLY | IORESOURCE_MEM
  174. }, {
  175. .name = "Adapter ROM",
  176. .start = 0,
  177. .end = 0,
  178. .flags = IORESOURCE_BUSY | IORESOURCE_READONLY | IORESOURCE_MEM
  179. }, {
  180. .name = "Adapter ROM",
  181. .start = 0,
  182. .end = 0,
  183. .flags = IORESOURCE_BUSY | IORESOURCE_READONLY | IORESOURCE_MEM
  184. }, {
  185. .name = "Adapter ROM",
  186. .start = 0,
  187. .end = 0,
  188. .flags = IORESOURCE_BUSY | IORESOURCE_READONLY | IORESOURCE_MEM
  189. }, {
  190. .name = "Adapter ROM",
  191. .start = 0,
  192. .end = 0,
  193. .flags = IORESOURCE_BUSY | IORESOURCE_READONLY | IORESOURCE_MEM
  194. } };
  195. #define ADAPTER_ROM_RESOURCES \
  196. (sizeof adapter_rom_resources / sizeof adapter_rom_resources[0])
  197. static struct resource video_rom_resource = {
  198. .name = "Video ROM",
  199. .start = 0xc0000,
  200. .end = 0xc7fff,
  201. .flags = IORESOURCE_BUSY | IORESOURCE_READONLY | IORESOURCE_MEM
  202. };
  203. static struct resource video_ram_resource = {
  204. .name = "Video RAM area",
  205. .start = 0xa0000,
  206. .end = 0xbffff,
  207. .flags = IORESOURCE_BUSY | IORESOURCE_MEM
  208. };
  209. static struct resource standard_io_resources[] = { {
  210. .name = "dma1",
  211. .start = 0x0000,
  212. .end = 0x001f,
  213. .flags = IORESOURCE_BUSY | IORESOURCE_IO
  214. }, {
  215. .name = "pic1",
  216. .start = 0x0020,
  217. .end = 0x0021,
  218. .flags = IORESOURCE_BUSY | IORESOURCE_IO
  219. }, {
  220. .name = "timer0",
  221. .start = 0x0040,
  222. .end = 0x0043,
  223. .flags = IORESOURCE_BUSY | IORESOURCE_IO
  224. }, {
  225. .name = "timer1",
  226. .start = 0x0050,
  227. .end = 0x0053,
  228. .flags = IORESOURCE_BUSY | IORESOURCE_IO
  229. }, {
  230. .name = "keyboard",
  231. .start = 0x0060,
  232. .end = 0x006f,
  233. .flags = IORESOURCE_BUSY | IORESOURCE_IO
  234. }, {
  235. .name = "dma page reg",
  236. .start = 0x0080,
  237. .end = 0x008f,
  238. .flags = IORESOURCE_BUSY | IORESOURCE_IO
  239. }, {
  240. .name = "pic2",
  241. .start = 0x00a0,
  242. .end = 0x00a1,
  243. .flags = IORESOURCE_BUSY | IORESOURCE_IO
  244. }, {
  245. .name = "dma2",
  246. .start = 0x00c0,
  247. .end = 0x00df,
  248. .flags = IORESOURCE_BUSY | IORESOURCE_IO
  249. }, {
  250. .name = "fpu",
  251. .start = 0x00f0,
  252. .end = 0x00ff,
  253. .flags = IORESOURCE_BUSY | IORESOURCE_IO
  254. } };
  255. #define STANDARD_IO_RESOURCES \
  256. (sizeof standard_io_resources / sizeof standard_io_resources[0])
  257. #define romsignature(x) (*(unsigned short *)(x) == 0xaa55)
  258. static int __init romchecksum(unsigned char *rom, unsigned long length)
  259. {
  260. unsigned char *p, sum = 0;
  261. for (p = rom; p < rom + length; p++)
  262. sum += *p;
  263. return sum == 0;
  264. }
  265. static void __init probe_roms(void)
  266. {
  267. unsigned long start, length, upper;
  268. unsigned char *rom;
  269. int i;
  270. /* video rom */
  271. upper = adapter_rom_resources[0].start;
  272. for (start = video_rom_resource.start; start < upper; start += 2048) {
  273. rom = isa_bus_to_virt(start);
  274. if (!romsignature(rom))
  275. continue;
  276. video_rom_resource.start = start;
  277. /* 0 < length <= 0x7f * 512, historically */
  278. length = rom[2] * 512;
  279. /* if checksum okay, trust length byte */
  280. if (length && romchecksum(rom, length))
  281. video_rom_resource.end = start + length - 1;
  282. request_resource(&iomem_resource, &video_rom_resource);
  283. break;
  284. }
  285. start = (video_rom_resource.end + 1 + 2047) & ~2047UL;
  286. if (start < upper)
  287. start = upper;
  288. /* system rom */
  289. request_resource(&iomem_resource, &system_rom_resource);
  290. upper = system_rom_resource.start;
  291. /* check for extension rom (ignore length byte!) */
  292. rom = isa_bus_to_virt(extension_rom_resource.start);
  293. if (romsignature(rom)) {
  294. length = extension_rom_resource.end - extension_rom_resource.start + 1;
  295. if (romchecksum(rom, length)) {
  296. request_resource(&iomem_resource, &extension_rom_resource);
  297. upper = extension_rom_resource.start;
  298. }
  299. }
  300. /* check for adapter roms on 2k boundaries */
  301. for (i = 0; i < ADAPTER_ROM_RESOURCES && start < upper; start += 2048) {
  302. rom = isa_bus_to_virt(start);
  303. if (!romsignature(rom))
  304. continue;
  305. /* 0 < length <= 0x7f * 512, historically */
  306. length = rom[2] * 512;
  307. /* but accept any length that fits if checksum okay */
  308. if (!length || start + length > upper || !romchecksum(rom, length))
  309. continue;
  310. adapter_rom_resources[i].start = start;
  311. adapter_rom_resources[i].end = start + length - 1;
  312. request_resource(&iomem_resource, &adapter_rom_resources[i]);
  313. start = adapter_rom_resources[i++].end & ~2047UL;
  314. }
  315. }
  316. static void __init limit_regions(unsigned long long size)
  317. {
  318. unsigned long long current_addr = 0;
  319. int i;
  320. if (efi_enabled) {
  321. efi_memory_desc_t *md;
  322. void *p;
  323. for (p = memmap.map, i = 0; p < memmap.map_end;
  324. p += memmap.desc_size, i++) {
  325. md = p;
  326. current_addr = md->phys_addr + (md->num_pages << 12);
  327. if (md->type == EFI_CONVENTIONAL_MEMORY) {
  328. if (current_addr >= size) {
  329. md->num_pages -=
  330. (((current_addr-size) + PAGE_SIZE-1) >> PAGE_SHIFT);
  331. memmap.nr_map = i + 1;
  332. return;
  333. }
  334. }
  335. }
  336. }
  337. for (i = 0; i < e820.nr_map; i++) {
  338. if (e820.map[i].type == E820_RAM) {
  339. current_addr = e820.map[i].addr + e820.map[i].size;
  340. if (current_addr >= size) {
  341. e820.map[i].size -= current_addr-size;
  342. e820.nr_map = i + 1;
  343. return;
  344. }
  345. }
  346. }
  347. }
  348. static void __init add_memory_region(unsigned long long start,
  349. unsigned long long size, int type)
  350. {
  351. int x;
  352. if (!efi_enabled) {
  353. x = e820.nr_map;
  354. if (x == E820MAX) {
  355. printk(KERN_ERR "Ooops! Too many entries in the memory map!\n");
  356. return;
  357. }
  358. e820.map[x].addr = start;
  359. e820.map[x].size = size;
  360. e820.map[x].type = type;
  361. e820.nr_map++;
  362. }
  363. } /* add_memory_region */
  364. #define E820_DEBUG 1
  365. static void __init print_memory_map(char *who)
  366. {
  367. int i;
  368. for (i = 0; i < e820.nr_map; i++) {
  369. printk(" %s: %016Lx - %016Lx ", who,
  370. e820.map[i].addr,
  371. e820.map[i].addr + e820.map[i].size);
  372. switch (e820.map[i].type) {
  373. case E820_RAM: printk("(usable)\n");
  374. break;
  375. case E820_RESERVED:
  376. printk("(reserved)\n");
  377. break;
  378. case E820_ACPI:
  379. printk("(ACPI data)\n");
  380. break;
  381. case E820_NVS:
  382. printk("(ACPI NVS)\n");
  383. break;
  384. default: printk("type %lu\n", e820.map[i].type);
  385. break;
  386. }
  387. }
  388. }
  389. /*
  390. * Sanitize the BIOS e820 map.
  391. *
  392. * Some e820 responses include overlapping entries. The following
  393. * replaces the original e820 map with a new one, removing overlaps.
  394. *
  395. */
  396. struct change_member {
  397. struct e820entry *pbios; /* pointer to original bios entry */
  398. unsigned long long addr; /* address for this change point */
  399. };
  400. static struct change_member change_point_list[2*E820MAX] __initdata;
  401. static struct change_member *change_point[2*E820MAX] __initdata;
  402. static struct e820entry *overlap_list[E820MAX] __initdata;
  403. static struct e820entry new_bios[E820MAX] __initdata;
  404. static int __init sanitize_e820_map(struct e820entry * biosmap, char * pnr_map)
  405. {
  406. struct change_member *change_tmp;
  407. unsigned long current_type, last_type;
  408. unsigned long long last_addr;
  409. int chgidx, still_changing;
  410. int overlap_entries;
  411. int new_bios_entry;
  412. int old_nr, new_nr, chg_nr;
  413. int i;
  414. /*
  415. Visually we're performing the following (1,2,3,4 = memory types)...
  416. Sample memory map (w/overlaps):
  417. ____22__________________
  418. ______________________4_
  419. ____1111________________
  420. _44_____________________
  421. 11111111________________
  422. ____________________33__
  423. ___________44___________
  424. __________33333_________
  425. ______________22________
  426. ___________________2222_
  427. _________111111111______
  428. _____________________11_
  429. _________________4______
  430. Sanitized equivalent (no overlap):
  431. 1_______________________
  432. _44_____________________
  433. ___1____________________
  434. ____22__________________
  435. ______11________________
  436. _________1______________
  437. __________3_____________
  438. ___________44___________
  439. _____________33_________
  440. _______________2________
  441. ________________1_______
  442. _________________4______
  443. ___________________2____
  444. ____________________33__
  445. ______________________4_
  446. */
  447. /* if there's only one memory region, don't bother */
  448. if (*pnr_map < 2)
  449. return -1;
  450. old_nr = *pnr_map;
  451. /* bail out if we find any unreasonable addresses in bios map */
  452. for (i=0; i<old_nr; i++)
  453. if (biosmap[i].addr + biosmap[i].size < biosmap[i].addr)
  454. return -1;
  455. /* create pointers for initial change-point information (for sorting) */
  456. for (i=0; i < 2*old_nr; i++)
  457. change_point[i] = &change_point_list[i];
  458. /* record all known change-points (starting and ending addresses),
  459. omitting those that are for empty memory regions */
  460. chgidx = 0;
  461. for (i=0; i < old_nr; i++) {
  462. if (biosmap[i].size != 0) {
  463. change_point[chgidx]->addr = biosmap[i].addr;
  464. change_point[chgidx++]->pbios = &biosmap[i];
  465. change_point[chgidx]->addr = biosmap[i].addr + biosmap[i].size;
  466. change_point[chgidx++]->pbios = &biosmap[i];
  467. }
  468. }
  469. chg_nr = chgidx; /* true number of change-points */
  470. /* sort change-point list by memory addresses (low -> high) */
  471. still_changing = 1;
  472. while (still_changing) {
  473. still_changing = 0;
  474. for (i=1; i < chg_nr; i++) {
  475. /* if <current_addr> > <last_addr>, swap */
  476. /* or, if current=<start_addr> & last=<end_addr>, swap */
  477. if ((change_point[i]->addr < change_point[i-1]->addr) ||
  478. ((change_point[i]->addr == change_point[i-1]->addr) &&
  479. (change_point[i]->addr == change_point[i]->pbios->addr) &&
  480. (change_point[i-1]->addr != change_point[i-1]->pbios->addr))
  481. )
  482. {
  483. change_tmp = change_point[i];
  484. change_point[i] = change_point[i-1];
  485. change_point[i-1] = change_tmp;
  486. still_changing=1;
  487. }
  488. }
  489. }
  490. /* create a new bios memory map, removing overlaps */
  491. overlap_entries=0; /* number of entries in the overlap table */
  492. new_bios_entry=0; /* index for creating new bios map entries */
  493. last_type = 0; /* start with undefined memory type */
  494. last_addr = 0; /* start with 0 as last starting address */
  495. /* loop through change-points, determining affect on the new bios map */
  496. for (chgidx=0; chgidx < chg_nr; chgidx++)
  497. {
  498. /* keep track of all overlapping bios entries */
  499. if (change_point[chgidx]->addr == change_point[chgidx]->pbios->addr)
  500. {
  501. /* add map entry to overlap list (> 1 entry implies an overlap) */
  502. overlap_list[overlap_entries++]=change_point[chgidx]->pbios;
  503. }
  504. else
  505. {
  506. /* remove entry from list (order independent, so swap with last) */
  507. for (i=0; i<overlap_entries; i++)
  508. {
  509. if (overlap_list[i] == change_point[chgidx]->pbios)
  510. overlap_list[i] = overlap_list[overlap_entries-1];
  511. }
  512. overlap_entries--;
  513. }
  514. /* if there are overlapping entries, decide which "type" to use */
  515. /* (larger value takes precedence -- 1=usable, 2,3,4,4+=unusable) */
  516. current_type = 0;
  517. for (i=0; i<overlap_entries; i++)
  518. if (overlap_list[i]->type > current_type)
  519. current_type = overlap_list[i]->type;
  520. /* continue building up new bios map based on this information */
  521. if (current_type != last_type) {
  522. if (last_type != 0) {
  523. new_bios[new_bios_entry].size =
  524. change_point[chgidx]->addr - last_addr;
  525. /* move forward only if the new size was non-zero */
  526. if (new_bios[new_bios_entry].size != 0)
  527. if (++new_bios_entry >= E820MAX)
  528. break; /* no more space left for new bios entries */
  529. }
  530. if (current_type != 0) {
  531. new_bios[new_bios_entry].addr = change_point[chgidx]->addr;
  532. new_bios[new_bios_entry].type = current_type;
  533. last_addr=change_point[chgidx]->addr;
  534. }
  535. last_type = current_type;
  536. }
  537. }
  538. new_nr = new_bios_entry; /* retain count for new bios entries */
  539. /* copy new bios mapping into original location */
  540. memcpy(biosmap, new_bios, new_nr*sizeof(struct e820entry));
  541. *pnr_map = new_nr;
  542. return 0;
  543. }
  544. /*
  545. * Copy the BIOS e820 map into a safe place.
  546. *
  547. * Sanity-check it while we're at it..
  548. *
  549. * If we're lucky and live on a modern system, the setup code
  550. * will have given us a memory map that we can use to properly
  551. * set up memory. If we aren't, we'll fake a memory map.
  552. *
  553. * We check to see that the memory map contains at least 2 elements
  554. * before we'll use it, because the detection code in setup.S may
  555. * not be perfect and most every PC known to man has two memory
  556. * regions: one from 0 to 640k, and one from 1mb up. (The IBM
  557. * thinkpad 560x, for example, does not cooperate with the memory
  558. * detection code.)
  559. */
  560. static int __init copy_e820_map(struct e820entry * biosmap, int nr_map)
  561. {
  562. /* Only one memory region (or negative)? Ignore it */
  563. if (nr_map < 2)
  564. return -1;
  565. do {
  566. unsigned long long start = biosmap->addr;
  567. unsigned long long size = biosmap->size;
  568. unsigned long long end = start + size;
  569. unsigned long type = biosmap->type;
  570. /* Overflow in 64 bits? Ignore the memory map. */
  571. if (start > end)
  572. return -1;
  573. /*
  574. * Some BIOSes claim RAM in the 640k - 1M region.
  575. * Not right. Fix it up.
  576. */
  577. if (type == E820_RAM) {
  578. if (start < 0x100000ULL && end > 0xA0000ULL) {
  579. if (start < 0xA0000ULL)
  580. add_memory_region(start, 0xA0000ULL-start, type);
  581. if (end <= 0x100000ULL)
  582. continue;
  583. start = 0x100000ULL;
  584. size = end - start;
  585. }
  586. }
  587. add_memory_region(start, size, type);
  588. } while (biosmap++,--nr_map);
  589. return 0;
  590. }
  591. #if defined(CONFIG_EDD) || defined(CONFIG_EDD_MODULE)
  592. struct edd edd;
  593. #ifdef CONFIG_EDD_MODULE
  594. EXPORT_SYMBOL(edd);
  595. #endif
  596. /**
  597. * copy_edd() - Copy the BIOS EDD information
  598. * from boot_params into a safe place.
  599. *
  600. */
  601. static inline void copy_edd(void)
  602. {
  603. memcpy(edd.mbr_signature, EDD_MBR_SIGNATURE, sizeof(edd.mbr_signature));
  604. memcpy(edd.edd_info, EDD_BUF, sizeof(edd.edd_info));
  605. edd.mbr_signature_nr = EDD_MBR_SIG_NR;
  606. edd.edd_info_nr = EDD_NR;
  607. }
  608. #else
  609. static inline void copy_edd(void)
  610. {
  611. }
  612. #endif
  613. /*
  614. * Do NOT EVER look at the BIOS memory size location.
  615. * It does not work on many machines.
  616. */
  617. #define LOWMEMSIZE() (0x9f000)
  618. static void __init parse_cmdline_early (char ** cmdline_p)
  619. {
  620. char c = ' ', *to = command_line, *from = saved_command_line;
  621. int len = 0;
  622. int userdef = 0;
  623. /* Save unparsed command line copy for /proc/cmdline */
  624. saved_command_line[COMMAND_LINE_SIZE-1] = '\0';
  625. for (;;) {
  626. if (c != ' ')
  627. goto next_char;
  628. /*
  629. * "mem=nopentium" disables the 4MB page tables.
  630. * "mem=XXX[kKmM]" defines a memory region from HIGH_MEM
  631. * to <mem>, overriding the bios size.
  632. * "memmap=XXX[KkmM]@XXX[KkmM]" defines a memory region from
  633. * <start> to <start>+<mem>, overriding the bios size.
  634. *
  635. * HPA tells me bootloaders need to parse mem=, so no new
  636. * option should be mem= [also see Documentation/i386/boot.txt]
  637. */
  638. if (!memcmp(from, "mem=", 4)) {
  639. if (to != command_line)
  640. to--;
  641. if (!memcmp(from+4, "nopentium", 9)) {
  642. from += 9+4;
  643. clear_bit(X86_FEATURE_PSE, boot_cpu_data.x86_capability);
  644. disable_pse = 1;
  645. } else {
  646. /* If the user specifies memory size, we
  647. * limit the BIOS-provided memory map to
  648. * that size. exactmap can be used to specify
  649. * the exact map. mem=number can be used to
  650. * trim the existing memory map.
  651. */
  652. unsigned long long mem_size;
  653. mem_size = memparse(from+4, &from);
  654. limit_regions(mem_size);
  655. userdef=1;
  656. }
  657. }
  658. else if (!memcmp(from, "memmap=", 7)) {
  659. if (to != command_line)
  660. to--;
  661. if (!memcmp(from+7, "exactmap", 8)) {
  662. #ifdef CONFIG_CRASH_DUMP
  663. /* If we are doing a crash dump, we
  664. * still need to know the real mem
  665. * size before original memory map is
  666. * reset.
  667. */
  668. find_max_pfn();
  669. saved_max_pfn = max_pfn;
  670. #endif
  671. from += 8+7;
  672. e820.nr_map = 0;
  673. userdef = 1;
  674. } else {
  675. /* If the user specifies memory size, we
  676. * limit the BIOS-provided memory map to
  677. * that size. exactmap can be used to specify
  678. * the exact map. mem=number can be used to
  679. * trim the existing memory map.
  680. */
  681. unsigned long long start_at, mem_size;
  682. mem_size = memparse(from+7, &from);
  683. if (*from == '@') {
  684. start_at = memparse(from+1, &from);
  685. add_memory_region(start_at, mem_size, E820_RAM);
  686. } else if (*from == '#') {
  687. start_at = memparse(from+1, &from);
  688. add_memory_region(start_at, mem_size, E820_ACPI);
  689. } else if (*from == '$') {
  690. start_at = memparse(from+1, &from);
  691. add_memory_region(start_at, mem_size, E820_RESERVED);
  692. } else {
  693. limit_regions(mem_size);
  694. userdef=1;
  695. }
  696. }
  697. }
  698. else if (!memcmp(from, "noexec=", 7))
  699. noexec_setup(from + 7);
  700. #ifdef CONFIG_X86_SMP
  701. /*
  702. * If the BIOS enumerates physical processors before logical,
  703. * maxcpus=N at enumeration-time can be used to disable HT.
  704. */
  705. else if (!memcmp(from, "maxcpus=", 8)) {
  706. extern unsigned int maxcpus;
  707. maxcpus = simple_strtoul(from + 8, NULL, 0);
  708. }
  709. #endif
  710. #ifdef CONFIG_ACPI
  711. /* "acpi=off" disables both ACPI table parsing and interpreter */
  712. else if (!memcmp(from, "acpi=off", 8)) {
  713. disable_acpi();
  714. }
  715. /* acpi=force to over-ride black-list */
  716. else if (!memcmp(from, "acpi=force", 10)) {
  717. acpi_force = 1;
  718. acpi_ht = 1;
  719. acpi_disabled = 0;
  720. }
  721. /* acpi=strict disables out-of-spec workarounds */
  722. else if (!memcmp(from, "acpi=strict", 11)) {
  723. acpi_strict = 1;
  724. }
  725. /* Limit ACPI just to boot-time to enable HT */
  726. else if (!memcmp(from, "acpi=ht", 7)) {
  727. if (!acpi_force)
  728. disable_acpi();
  729. acpi_ht = 1;
  730. }
  731. /* "pci=noacpi" disable ACPI IRQ routing and PCI scan */
  732. else if (!memcmp(from, "pci=noacpi", 10)) {
  733. acpi_disable_pci();
  734. }
  735. /* "acpi=noirq" disables ACPI interrupt routing */
  736. else if (!memcmp(from, "acpi=noirq", 10)) {
  737. acpi_noirq_set();
  738. }
  739. else if (!memcmp(from, "acpi_sci=edge", 13))
  740. acpi_sci_flags.trigger = 1;
  741. else if (!memcmp(from, "acpi_sci=level", 14))
  742. acpi_sci_flags.trigger = 3;
  743. else if (!memcmp(from, "acpi_sci=high", 13))
  744. acpi_sci_flags.polarity = 1;
  745. else if (!memcmp(from, "acpi_sci=low", 12))
  746. acpi_sci_flags.polarity = 3;
  747. #ifdef CONFIG_X86_IO_APIC
  748. else if (!memcmp(from, "acpi_skip_timer_override", 24))
  749. acpi_skip_timer_override = 1;
  750. #endif
  751. #ifdef CONFIG_X86_LOCAL_APIC
  752. /* disable IO-APIC */
  753. else if (!memcmp(from, "noapic", 6))
  754. disable_ioapic_setup();
  755. #endif /* CONFIG_X86_LOCAL_APIC */
  756. #endif /* CONFIG_ACPI */
  757. #ifdef CONFIG_X86_LOCAL_APIC
  758. /* enable local APIC */
  759. else if (!memcmp(from, "lapic", 5))
  760. lapic_enable();
  761. /* disable local APIC */
  762. else if (!memcmp(from, "nolapic", 6))
  763. lapic_disable();
  764. #endif /* CONFIG_X86_LOCAL_APIC */
  765. #ifdef CONFIG_KEXEC
  766. /* crashkernel=size@addr specifies the location to reserve for
  767. * a crash kernel. By reserving this memory we guarantee
  768. * that linux never set's it up as a DMA target.
  769. * Useful for holding code to do something appropriate
  770. * after a kernel panic.
  771. */
  772. else if (!memcmp(from, "crashkernel=", 12)) {
  773. unsigned long size, base;
  774. size = memparse(from+12, &from);
  775. if (*from == '@') {
  776. base = memparse(from+1, &from);
  777. /* FIXME: Do I want a sanity check
  778. * to validate the memory range?
  779. */
  780. crashk_res.start = base;
  781. crashk_res.end = base + size - 1;
  782. }
  783. }
  784. #endif
  785. #ifdef CONFIG_CRASH_DUMP
  786. /* elfcorehdr= specifies the location of elf core header
  787. * stored by the crashed kernel.
  788. */
  789. else if (!memcmp(from, "elfcorehdr=", 11))
  790. elfcorehdr_addr = memparse(from+11, &from);
  791. #endif
  792. /*
  793. * highmem=size forces highmem to be exactly 'size' bytes.
  794. * This works even on boxes that have no highmem otherwise.
  795. * This also works to reduce highmem size on bigger boxes.
  796. */
  797. else if (!memcmp(from, "highmem=", 8))
  798. highmem_pages = memparse(from+8, &from) >> PAGE_SHIFT;
  799. /*
  800. * vmalloc=size forces the vmalloc area to be exactly 'size'
  801. * bytes. This can be used to increase (or decrease) the
  802. * vmalloc area - the default is 128m.
  803. */
  804. else if (!memcmp(from, "vmalloc=", 8))
  805. __VMALLOC_RESERVE = memparse(from+8, &from);
  806. next_char:
  807. c = *(from++);
  808. if (!c)
  809. break;
  810. if (COMMAND_LINE_SIZE <= ++len)
  811. break;
  812. *(to++) = c;
  813. }
  814. *to = '\0';
  815. *cmdline_p = command_line;
  816. if (userdef) {
  817. printk(KERN_INFO "user-defined physical RAM map:\n");
  818. print_memory_map("user");
  819. }
  820. }
  821. /*
  822. * Callback for efi_memory_walk.
  823. */
  824. static int __init
  825. efi_find_max_pfn(unsigned long start, unsigned long end, void *arg)
  826. {
  827. unsigned long *max_pfn = arg, pfn;
  828. if (start < end) {
  829. pfn = PFN_UP(end -1);
  830. if (pfn > *max_pfn)
  831. *max_pfn = pfn;
  832. }
  833. return 0;
  834. }
  835. /*
  836. * Find the highest page frame number we have available
  837. */
  838. void __init find_max_pfn(void)
  839. {
  840. int i;
  841. max_pfn = 0;
  842. if (efi_enabled) {
  843. efi_memmap_walk(efi_find_max_pfn, &max_pfn);
  844. return;
  845. }
  846. for (i = 0; i < e820.nr_map; i++) {
  847. unsigned long start, end;
  848. /* RAM? */
  849. if (e820.map[i].type != E820_RAM)
  850. continue;
  851. start = PFN_UP(e820.map[i].addr);
  852. end = PFN_DOWN(e820.map[i].addr + e820.map[i].size);
  853. if (start >= end)
  854. continue;
  855. if (end > max_pfn)
  856. max_pfn = end;
  857. }
  858. }
  859. /*
  860. * Determine low and high memory ranges:
  861. */
  862. unsigned long __init find_max_low_pfn(void)
  863. {
  864. unsigned long max_low_pfn;
  865. max_low_pfn = max_pfn;
  866. if (max_low_pfn > MAXMEM_PFN) {
  867. if (highmem_pages == -1)
  868. highmem_pages = max_pfn - MAXMEM_PFN;
  869. if (highmem_pages + MAXMEM_PFN < max_pfn)
  870. max_pfn = MAXMEM_PFN + highmem_pages;
  871. if (highmem_pages + MAXMEM_PFN > max_pfn) {
  872. printk("only %luMB highmem pages available, ignoring highmem size of %uMB.\n", pages_to_mb(max_pfn - MAXMEM_PFN), pages_to_mb(highmem_pages));
  873. highmem_pages = 0;
  874. }
  875. max_low_pfn = MAXMEM_PFN;
  876. #ifndef CONFIG_HIGHMEM
  877. /* Maximum memory usable is what is directly addressable */
  878. printk(KERN_WARNING "Warning only %ldMB will be used.\n",
  879. MAXMEM>>20);
  880. if (max_pfn > MAX_NONPAE_PFN)
  881. printk(KERN_WARNING "Use a PAE enabled kernel.\n");
  882. else
  883. printk(KERN_WARNING "Use a HIGHMEM enabled kernel.\n");
  884. max_pfn = MAXMEM_PFN;
  885. #else /* !CONFIG_HIGHMEM */
  886. #ifndef CONFIG_X86_PAE
  887. if (max_pfn > MAX_NONPAE_PFN) {
  888. max_pfn = MAX_NONPAE_PFN;
  889. printk(KERN_WARNING "Warning only 4GB will be used.\n");
  890. printk(KERN_WARNING "Use a PAE enabled kernel.\n");
  891. }
  892. #endif /* !CONFIG_X86_PAE */
  893. #endif /* !CONFIG_HIGHMEM */
  894. } else {
  895. if (highmem_pages == -1)
  896. highmem_pages = 0;
  897. #ifdef CONFIG_HIGHMEM
  898. if (highmem_pages >= max_pfn) {
  899. printk(KERN_ERR "highmem size specified (%uMB) is bigger than pages available (%luMB)!.\n", pages_to_mb(highmem_pages), pages_to_mb(max_pfn));
  900. highmem_pages = 0;
  901. }
  902. if (highmem_pages) {
  903. if (max_low_pfn-highmem_pages < 64*1024*1024/PAGE_SIZE){
  904. printk(KERN_ERR "highmem size %uMB results in smaller than 64MB lowmem, ignoring it.\n", pages_to_mb(highmem_pages));
  905. highmem_pages = 0;
  906. }
  907. max_low_pfn -= highmem_pages;
  908. }
  909. #else
  910. if (highmem_pages)
  911. printk(KERN_ERR "ignoring highmem size on non-highmem kernel!\n");
  912. #endif
  913. }
  914. return max_low_pfn;
  915. }
  916. /*
  917. * Free all available memory for boot time allocation. Used
  918. * as a callback function by efi_memory_walk()
  919. */
  920. static int __init
  921. free_available_memory(unsigned long start, unsigned long end, void *arg)
  922. {
  923. /* check max_low_pfn */
  924. if (start >= ((max_low_pfn + 1) << PAGE_SHIFT))
  925. return 0;
  926. if (end >= ((max_low_pfn + 1) << PAGE_SHIFT))
  927. end = (max_low_pfn + 1) << PAGE_SHIFT;
  928. if (start < end)
  929. free_bootmem(start, end - start);
  930. return 0;
  931. }
  932. /*
  933. * Register fully available low RAM pages with the bootmem allocator.
  934. */
  935. static void __init register_bootmem_low_pages(unsigned long max_low_pfn)
  936. {
  937. int i;
  938. if (efi_enabled) {
  939. efi_memmap_walk(free_available_memory, NULL);
  940. return;
  941. }
  942. for (i = 0; i < e820.nr_map; i++) {
  943. unsigned long curr_pfn, last_pfn, size;
  944. /*
  945. * Reserve usable low memory
  946. */
  947. if (e820.map[i].type != E820_RAM)
  948. continue;
  949. /*
  950. * We are rounding up the start address of usable memory:
  951. */
  952. curr_pfn = PFN_UP(e820.map[i].addr);
  953. if (curr_pfn >= max_low_pfn)
  954. continue;
  955. /*
  956. * ... and at the end of the usable range downwards:
  957. */
  958. last_pfn = PFN_DOWN(e820.map[i].addr + e820.map[i].size);
  959. if (last_pfn > max_low_pfn)
  960. last_pfn = max_low_pfn;
  961. /*
  962. * .. finally, did all the rounding and playing
  963. * around just make the area go away?
  964. */
  965. if (last_pfn <= curr_pfn)
  966. continue;
  967. size = last_pfn - curr_pfn;
  968. free_bootmem(PFN_PHYS(curr_pfn), PFN_PHYS(size));
  969. }
  970. }
  971. /*
  972. * workaround for Dell systems that neglect to reserve EBDA
  973. */
  974. static void __init reserve_ebda_region(void)
  975. {
  976. unsigned int addr;
  977. addr = get_bios_ebda();
  978. if (addr)
  979. reserve_bootmem(addr, PAGE_SIZE);
  980. }
  981. #ifndef CONFIG_NEED_MULTIPLE_NODES
  982. void __init setup_bootmem_allocator(void);
  983. static unsigned long __init setup_memory(void)
  984. {
  985. /*
  986. * partially used pages are not usable - thus
  987. * we are rounding upwards:
  988. */
  989. min_low_pfn = PFN_UP(init_pg_tables_end);
  990. find_max_pfn();
  991. max_low_pfn = find_max_low_pfn();
  992. #ifdef CONFIG_HIGHMEM
  993. highstart_pfn = highend_pfn = max_pfn;
  994. if (max_pfn > max_low_pfn) {
  995. highstart_pfn = max_low_pfn;
  996. }
  997. printk(KERN_NOTICE "%ldMB HIGHMEM available.\n",
  998. pages_to_mb(highend_pfn - highstart_pfn));
  999. #endif
  1000. printk(KERN_NOTICE "%ldMB LOWMEM available.\n",
  1001. pages_to_mb(max_low_pfn));
  1002. setup_bootmem_allocator();
  1003. return max_low_pfn;
  1004. }
  1005. void __init zone_sizes_init(void)
  1006. {
  1007. unsigned long zones_size[MAX_NR_ZONES] = {0, 0, 0};
  1008. unsigned int max_dma, low;
  1009. max_dma = virt_to_phys((char *)MAX_DMA_ADDRESS) >> PAGE_SHIFT;
  1010. low = max_low_pfn;
  1011. if (low < max_dma)
  1012. zones_size[ZONE_DMA] = low;
  1013. else {
  1014. zones_size[ZONE_DMA] = max_dma;
  1015. zones_size[ZONE_NORMAL] = low - max_dma;
  1016. #ifdef CONFIG_HIGHMEM
  1017. zones_size[ZONE_HIGHMEM] = highend_pfn - low;
  1018. #endif
  1019. }
  1020. free_area_init(zones_size);
  1021. }
  1022. #else
  1023. extern unsigned long __init setup_memory(void);
  1024. extern void zone_sizes_init(void);
  1025. #endif /* !CONFIG_NEED_MULTIPLE_NODES */
  1026. void __init setup_bootmem_allocator(void)
  1027. {
  1028. unsigned long bootmap_size;
  1029. /*
  1030. * Initialize the boot-time allocator (with low memory only):
  1031. */
  1032. bootmap_size = init_bootmem(min_low_pfn, max_low_pfn);
  1033. register_bootmem_low_pages(max_low_pfn);
  1034. /*
  1035. * Reserve the bootmem bitmap itself as well. We do this in two
  1036. * steps (first step was init_bootmem()) because this catches
  1037. * the (very unlikely) case of us accidentally initializing the
  1038. * bootmem allocator with an invalid RAM area.
  1039. */
  1040. reserve_bootmem(__PHYSICAL_START, (PFN_PHYS(min_low_pfn) +
  1041. bootmap_size + PAGE_SIZE-1) - (__PHYSICAL_START));
  1042. /*
  1043. * reserve physical page 0 - it's a special BIOS page on many boxes,
  1044. * enabling clean reboots, SMP operation, laptop functions.
  1045. */
  1046. reserve_bootmem(0, PAGE_SIZE);
  1047. /* reserve EBDA region, it's a 4K region */
  1048. reserve_ebda_region();
  1049. /* could be an AMD 768MPX chipset. Reserve a page before VGA to prevent
  1050. PCI prefetch into it (errata #56). Usually the page is reserved anyways,
  1051. unless you have no PS/2 mouse plugged in. */
  1052. if (boot_cpu_data.x86_vendor == X86_VENDOR_AMD &&
  1053. boot_cpu_data.x86 == 6)
  1054. reserve_bootmem(0xa0000 - 4096, 4096);
  1055. #ifdef CONFIG_SMP
  1056. /*
  1057. * But first pinch a few for the stack/trampoline stuff
  1058. * FIXME: Don't need the extra page at 4K, but need to fix
  1059. * trampoline before removing it. (see the GDT stuff)
  1060. */
  1061. reserve_bootmem(PAGE_SIZE, PAGE_SIZE);
  1062. #endif
  1063. #ifdef CONFIG_ACPI_SLEEP
  1064. /*
  1065. * Reserve low memory region for sleep support.
  1066. */
  1067. acpi_reserve_bootmem();
  1068. #endif
  1069. #ifdef CONFIG_X86_FIND_SMP_CONFIG
  1070. /*
  1071. * Find and reserve possible boot-time SMP configuration:
  1072. */
  1073. find_smp_config();
  1074. #endif
  1075. #ifdef CONFIG_BLK_DEV_INITRD
  1076. if (LOADER_TYPE && INITRD_START) {
  1077. if (INITRD_START + INITRD_SIZE <= (max_low_pfn << PAGE_SHIFT)) {
  1078. reserve_bootmem(INITRD_START, INITRD_SIZE);
  1079. initrd_start =
  1080. INITRD_START ? INITRD_START + PAGE_OFFSET : 0;
  1081. initrd_end = initrd_start+INITRD_SIZE;
  1082. }
  1083. else {
  1084. printk(KERN_ERR "initrd extends beyond end of memory "
  1085. "(0x%08lx > 0x%08lx)\ndisabling initrd\n",
  1086. INITRD_START + INITRD_SIZE,
  1087. max_low_pfn << PAGE_SHIFT);
  1088. initrd_start = 0;
  1089. }
  1090. }
  1091. #endif
  1092. #ifdef CONFIG_KEXEC
  1093. if (crashk_res.start != crashk_res.end)
  1094. reserve_bootmem(crashk_res.start,
  1095. crashk_res.end - crashk_res.start + 1);
  1096. #endif
  1097. }
  1098. /*
  1099. * The node 0 pgdat is initialized before all of these because
  1100. * it's needed for bootmem. node>0 pgdats have their virtual
  1101. * space allocated before the pagetables are in place to access
  1102. * them, so they can't be cleared then.
  1103. *
  1104. * This should all compile down to nothing when NUMA is off.
  1105. */
  1106. void __init remapped_pgdat_init(void)
  1107. {
  1108. int nid;
  1109. for_each_online_node(nid) {
  1110. if (nid != 0)
  1111. memset(NODE_DATA(nid), 0, sizeof(struct pglist_data));
  1112. }
  1113. }
  1114. /*
  1115. * Request address space for all standard RAM and ROM resources
  1116. * and also for regions reported as reserved by the e820.
  1117. */
  1118. static void __init
  1119. legacy_init_iomem_resources(struct resource *code_resource, struct resource *data_resource)
  1120. {
  1121. int i;
  1122. probe_roms();
  1123. for (i = 0; i < e820.nr_map; i++) {
  1124. struct resource *res;
  1125. if (e820.map[i].addr + e820.map[i].size > 0x100000000ULL)
  1126. continue;
  1127. res = alloc_bootmem_low(sizeof(struct resource));
  1128. switch (e820.map[i].type) {
  1129. case E820_RAM: res->name = "System RAM"; break;
  1130. case E820_ACPI: res->name = "ACPI Tables"; break;
  1131. case E820_NVS: res->name = "ACPI Non-volatile Storage"; break;
  1132. default: res->name = "reserved";
  1133. }
  1134. res->start = e820.map[i].addr;
  1135. res->end = res->start + e820.map[i].size - 1;
  1136. res->flags = IORESOURCE_MEM | IORESOURCE_BUSY;
  1137. request_resource(&iomem_resource, res);
  1138. if (e820.map[i].type == E820_RAM) {
  1139. /*
  1140. * We don't know which RAM region contains kernel data,
  1141. * so we try it repeatedly and let the resource manager
  1142. * test it.
  1143. */
  1144. request_resource(res, code_resource);
  1145. request_resource(res, data_resource);
  1146. #ifdef CONFIG_KEXEC
  1147. request_resource(res, &crashk_res);
  1148. #endif
  1149. }
  1150. }
  1151. }
  1152. /*
  1153. * Request address space for all standard resources
  1154. */
  1155. static void __init register_memory(void)
  1156. {
  1157. unsigned long gapstart, gapsize;
  1158. unsigned long long last;
  1159. int i;
  1160. if (efi_enabled)
  1161. efi_initialize_iomem_resources(&code_resource, &data_resource);
  1162. else
  1163. legacy_init_iomem_resources(&code_resource, &data_resource);
  1164. /* EFI systems may still have VGA */
  1165. request_resource(&iomem_resource, &video_ram_resource);
  1166. /* request I/O space for devices used on all i[345]86 PCs */
  1167. for (i = 0; i < STANDARD_IO_RESOURCES; i++)
  1168. request_resource(&ioport_resource, &standard_io_resources[i]);
  1169. /*
  1170. * Search for the bigest gap in the low 32 bits of the e820
  1171. * memory space.
  1172. */
  1173. last = 0x100000000ull;
  1174. gapstart = 0x10000000;
  1175. gapsize = 0x400000;
  1176. i = e820.nr_map;
  1177. while (--i >= 0) {
  1178. unsigned long long start = e820.map[i].addr;
  1179. unsigned long long end = start + e820.map[i].size;
  1180. /*
  1181. * Since "last" is at most 4GB, we know we'll
  1182. * fit in 32 bits if this condition is true
  1183. */
  1184. if (last > end) {
  1185. unsigned long gap = last - end;
  1186. if (gap > gapsize) {
  1187. gapsize = gap;
  1188. gapstart = end;
  1189. }
  1190. }
  1191. if (start < last)
  1192. last = start;
  1193. }
  1194. /*
  1195. * Start allocating dynamic PCI memory a bit into the gap,
  1196. * aligned up to the nearest megabyte.
  1197. *
  1198. * Question: should we try to pad it up a bit (do something
  1199. * like " + (gapsize >> 3)" in there too?). We now have the
  1200. * technology.
  1201. */
  1202. pci_mem_start = (gapstart + 0xfffff) & ~0xfffff;
  1203. printk("Allocating PCI resources starting at %08lx (gap: %08lx:%08lx)\n",
  1204. pci_mem_start, gapstart, gapsize);
  1205. }
  1206. /* Use inline assembly to define this because the nops are defined
  1207. as inline assembly strings in the include files and we cannot
  1208. get them easily into strings. */
  1209. asm("\t.data\nintelnops: "
  1210. GENERIC_NOP1 GENERIC_NOP2 GENERIC_NOP3 GENERIC_NOP4 GENERIC_NOP5 GENERIC_NOP6
  1211. GENERIC_NOP7 GENERIC_NOP8);
  1212. asm("\t.data\nk8nops: "
  1213. K8_NOP1 K8_NOP2 K8_NOP3 K8_NOP4 K8_NOP5 K8_NOP6
  1214. K8_NOP7 K8_NOP8);
  1215. asm("\t.data\nk7nops: "
  1216. K7_NOP1 K7_NOP2 K7_NOP3 K7_NOP4 K7_NOP5 K7_NOP6
  1217. K7_NOP7 K7_NOP8);
  1218. extern unsigned char intelnops[], k8nops[], k7nops[];
  1219. static unsigned char *intel_nops[ASM_NOP_MAX+1] = {
  1220. NULL,
  1221. intelnops,
  1222. intelnops + 1,
  1223. intelnops + 1 + 2,
  1224. intelnops + 1 + 2 + 3,
  1225. intelnops + 1 + 2 + 3 + 4,
  1226. intelnops + 1 + 2 + 3 + 4 + 5,
  1227. intelnops + 1 + 2 + 3 + 4 + 5 + 6,
  1228. intelnops + 1 + 2 + 3 + 4 + 5 + 6 + 7,
  1229. };
  1230. static unsigned char *k8_nops[ASM_NOP_MAX+1] = {
  1231. NULL,
  1232. k8nops,
  1233. k8nops + 1,
  1234. k8nops + 1 + 2,
  1235. k8nops + 1 + 2 + 3,
  1236. k8nops + 1 + 2 + 3 + 4,
  1237. k8nops + 1 + 2 + 3 + 4 + 5,
  1238. k8nops + 1 + 2 + 3 + 4 + 5 + 6,
  1239. k8nops + 1 + 2 + 3 + 4 + 5 + 6 + 7,
  1240. };
  1241. static unsigned char *k7_nops[ASM_NOP_MAX+1] = {
  1242. NULL,
  1243. k7nops,
  1244. k7nops + 1,
  1245. k7nops + 1 + 2,
  1246. k7nops + 1 + 2 + 3,
  1247. k7nops + 1 + 2 + 3 + 4,
  1248. k7nops + 1 + 2 + 3 + 4 + 5,
  1249. k7nops + 1 + 2 + 3 + 4 + 5 + 6,
  1250. k7nops + 1 + 2 + 3 + 4 + 5 + 6 + 7,
  1251. };
  1252. static struct nop {
  1253. int cpuid;
  1254. unsigned char **noptable;
  1255. } noptypes[] = {
  1256. { X86_FEATURE_K8, k8_nops },
  1257. { X86_FEATURE_K7, k7_nops },
  1258. { -1, NULL }
  1259. };
  1260. /* Replace instructions with better alternatives for this CPU type.
  1261. This runs before SMP is initialized to avoid SMP problems with
  1262. self modifying code. This implies that assymetric systems where
  1263. APs have less capabilities than the boot processor are not handled.
  1264. Tough. Make sure you disable such features by hand. */
  1265. void apply_alternatives(void *start, void *end)
  1266. {
  1267. struct alt_instr *a;
  1268. int diff, i, k;
  1269. unsigned char **noptable = intel_nops;
  1270. for (i = 0; noptypes[i].cpuid >= 0; i++) {
  1271. if (boot_cpu_has(noptypes[i].cpuid)) {
  1272. noptable = noptypes[i].noptable;
  1273. break;
  1274. }
  1275. }
  1276. for (a = start; (void *)a < end; a++) {
  1277. if (!boot_cpu_has(a->cpuid))
  1278. continue;
  1279. BUG_ON(a->replacementlen > a->instrlen);
  1280. memcpy(a->instr, a->replacement, a->replacementlen);
  1281. diff = a->instrlen - a->replacementlen;
  1282. /* Pad the rest with nops */
  1283. for (i = a->replacementlen; diff > 0; diff -= k, i += k) {
  1284. k = diff;
  1285. if (k > ASM_NOP_MAX)
  1286. k = ASM_NOP_MAX;
  1287. memcpy(a->instr + i, noptable[k], k);
  1288. }
  1289. }
  1290. }
  1291. void __init alternative_instructions(void)
  1292. {
  1293. extern struct alt_instr __alt_instructions[], __alt_instructions_end[];
  1294. apply_alternatives(__alt_instructions, __alt_instructions_end);
  1295. }
  1296. static char * __init machine_specific_memory_setup(void);
  1297. #ifdef CONFIG_MCA
  1298. static void set_mca_bus(int x)
  1299. {
  1300. MCA_bus = x;
  1301. }
  1302. #else
  1303. static void set_mca_bus(int x) { }
  1304. #endif
  1305. /*
  1306. * Determine if we were loaded by an EFI loader. If so, then we have also been
  1307. * passed the efi memmap, systab, etc., so we should use these data structures
  1308. * for initialization. Note, the efi init code path is determined by the
  1309. * global efi_enabled. This allows the same kernel image to be used on existing
  1310. * systems (with a traditional BIOS) as well as on EFI systems.
  1311. */
  1312. void __init setup_arch(char **cmdline_p)
  1313. {
  1314. unsigned long max_low_pfn;
  1315. memcpy(&boot_cpu_data, &new_cpu_data, sizeof(new_cpu_data));
  1316. pre_setup_arch_hook();
  1317. early_cpu_init();
  1318. /*
  1319. * FIXME: This isn't an official loader_type right
  1320. * now but does currently work with elilo.
  1321. * If we were configured as an EFI kernel, check to make
  1322. * sure that we were loaded correctly from elilo and that
  1323. * the system table is valid. If not, then initialize normally.
  1324. */
  1325. #ifdef CONFIG_EFI
  1326. if ((LOADER_TYPE == 0x50) && EFI_SYSTAB)
  1327. efi_enabled = 1;
  1328. #endif
  1329. ROOT_DEV = old_decode_dev(ORIG_ROOT_DEV);
  1330. drive_info = DRIVE_INFO;
  1331. screen_info = SCREEN_INFO;
  1332. edid_info = EDID_INFO;
  1333. apm_info.bios = APM_BIOS_INFO;
  1334. ist_info = IST_INFO;
  1335. saved_videomode = VIDEO_MODE;
  1336. if( SYS_DESC_TABLE.length != 0 ) {
  1337. set_mca_bus(SYS_DESC_TABLE.table[3] & 0x2);
  1338. machine_id = SYS_DESC_TABLE.table[0];
  1339. machine_submodel_id = SYS_DESC_TABLE.table[1];
  1340. BIOS_revision = SYS_DESC_TABLE.table[2];
  1341. }
  1342. bootloader_type = LOADER_TYPE;
  1343. #ifdef CONFIG_BLK_DEV_RAM
  1344. rd_image_start = RAMDISK_FLAGS & RAMDISK_IMAGE_START_MASK;
  1345. rd_prompt = ((RAMDISK_FLAGS & RAMDISK_PROMPT_FLAG) != 0);
  1346. rd_doload = ((RAMDISK_FLAGS & RAMDISK_LOAD_FLAG) != 0);
  1347. #endif
  1348. ARCH_SETUP
  1349. if (efi_enabled)
  1350. efi_init();
  1351. else {
  1352. printk(KERN_INFO "BIOS-provided physical RAM map:\n");
  1353. print_memory_map(machine_specific_memory_setup());
  1354. }
  1355. copy_edd();
  1356. if (!MOUNT_ROOT_RDONLY)
  1357. root_mountflags &= ~MS_RDONLY;
  1358. init_mm.start_code = (unsigned long) _text;
  1359. init_mm.end_code = (unsigned long) _etext;
  1360. init_mm.end_data = (unsigned long) _edata;
  1361. init_mm.brk = init_pg_tables_end + PAGE_OFFSET;
  1362. code_resource.start = virt_to_phys(_text);
  1363. code_resource.end = virt_to_phys(_etext)-1;
  1364. data_resource.start = virt_to_phys(_etext);
  1365. data_resource.end = virt_to_phys(_edata)-1;
  1366. parse_cmdline_early(cmdline_p);
  1367. max_low_pfn = setup_memory();
  1368. /*
  1369. * NOTE: before this point _nobody_ is allowed to allocate
  1370. * any memory using the bootmem allocator. Although the
  1371. * alloctor is now initialised only the first 8Mb of the kernel
  1372. * virtual address space has been mapped. All allocations before
  1373. * paging_init() has completed must use the alloc_bootmem_low_pages()
  1374. * variant (which allocates DMA'able memory) and care must be taken
  1375. * not to exceed the 8Mb limit.
  1376. */
  1377. #ifdef CONFIG_SMP
  1378. smp_alloc_memory(); /* AP processor realmode stacks in low memory*/
  1379. #endif
  1380. paging_init();
  1381. remapped_pgdat_init();
  1382. sparse_init();
  1383. zone_sizes_init();
  1384. /*
  1385. * NOTE: at this point the bootmem allocator is fully available.
  1386. */
  1387. #ifdef CONFIG_EARLY_PRINTK
  1388. {
  1389. char *s = strstr(*cmdline_p, "earlyprintk=");
  1390. if (s) {
  1391. extern void setup_early_printk(char *);
  1392. setup_early_printk(s);
  1393. printk("early console enabled\n");
  1394. }
  1395. }
  1396. #endif
  1397. dmi_scan_machine();
  1398. #ifdef CONFIG_X86_GENERICARCH
  1399. generic_apic_probe(*cmdline_p);
  1400. #endif
  1401. if (efi_enabled)
  1402. efi_map_memmap();
  1403. #ifdef CONFIG_ACPI
  1404. /*
  1405. * Parse the ACPI tables for possible boot-time SMP configuration.
  1406. */
  1407. acpi_boot_table_init();
  1408. acpi_boot_init();
  1409. #if defined(CONFIG_SMP) && defined(CONFIG_X86_PC)
  1410. if (def_to_bigsmp)
  1411. printk(KERN_WARNING "More than 8 CPUs detected and "
  1412. "CONFIG_X86_PC cannot handle it.\nUse "
  1413. "CONFIG_X86_GENERICARCH or CONFIG_X86_BIGSMP.\n");
  1414. #endif
  1415. #endif
  1416. #ifdef CONFIG_X86_LOCAL_APIC
  1417. if (smp_found_config)
  1418. get_smp_config();
  1419. #endif
  1420. register_memory();
  1421. #ifdef CONFIG_VT
  1422. #if defined(CONFIG_VGA_CONSOLE)
  1423. if (!efi_enabled || (efi_mem_type(0xa0000) != EFI_CONVENTIONAL_MEMORY))
  1424. conswitchp = &vga_con;
  1425. #elif defined(CONFIG_DUMMY_CONSOLE)
  1426. conswitchp = &dummy_con;
  1427. #endif
  1428. #endif
  1429. }
  1430. #include "setup_arch_post.h"
  1431. /*
  1432. * Local Variables:
  1433. * mode:c
  1434. * c-file-style:"k&r"
  1435. * c-basic-offset:8
  1436. * End:
  1437. */