common.c 27 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141
  1. #include <linux/init.h>
  2. #include <linux/kernel.h>
  3. #include <linux/sched.h>
  4. #include <linux/string.h>
  5. #include <linux/bootmem.h>
  6. #include <linux/bitops.h>
  7. #include <linux/module.h>
  8. #include <linux/kgdb.h>
  9. #include <linux/topology.h>
  10. #include <linux/delay.h>
  11. #include <linux/smp.h>
  12. #include <linux/percpu.h>
  13. #include <asm/i387.h>
  14. #include <asm/msr.h>
  15. #include <asm/io.h>
  16. #include <asm/linkage.h>
  17. #include <asm/mmu_context.h>
  18. #include <asm/mtrr.h>
  19. #include <asm/mce.h>
  20. #include <asm/pat.h>
  21. #include <asm/asm.h>
  22. #include <asm/numa.h>
  23. #ifdef CONFIG_X86_LOCAL_APIC
  24. #include <asm/mpspec.h>
  25. #include <asm/apic.h>
  26. #include <mach_apic.h>
  27. #include <asm/genapic.h>
  28. #endif
  29. #include <asm/pda.h>
  30. #include <asm/pgtable.h>
  31. #include <asm/processor.h>
  32. #include <asm/desc.h>
  33. #include <asm/atomic.h>
  34. #include <asm/proto.h>
  35. #include <asm/sections.h>
  36. #include <asm/setup.h>
  37. #include "cpu.h"
  /*
   * Vendor descriptor for the CPU being identified.  Assigned by
   * get_cpu_vendor(); stays NULL until that function has run.
   */
  static struct cpu_dev *this_cpu __cpuinitdata;
  #ifdef CONFIG_X86_64
  /* We need valid kernel segments for data and code in long mode too
   * IRET will check the segment types kkeil 2000/10/28
   * Also sysret mandates a special GDT layout
   */
  /* The TLS descriptors are currently at a different place compared to i386.
     Hopefully nobody expects them at a fixed place (Wine?) */
  /*
   * Per-CPU GDT page (64-bit build).  Each entry is initialised from a pair
   * of raw 32-bit descriptor words.
   */
  DEFINE_PER_CPU(struct gdt_page, gdt_page) = { .gdt = {
  [GDT_ENTRY_KERNEL32_CS] = { { { 0x0000ffff, 0x00cf9b00 } } },
  [GDT_ENTRY_KERNEL_CS] = { { { 0x0000ffff, 0x00af9b00 } } },
  [GDT_ENTRY_KERNEL_DS] = { { { 0x0000ffff, 0x00cf9300 } } },
  [GDT_ENTRY_DEFAULT_USER32_CS] = { { { 0x0000ffff, 0x00cffb00 } } },
  [GDT_ENTRY_DEFAULT_USER_DS] = { { { 0x0000ffff, 0x00cff300 } } },
  [GDT_ENTRY_DEFAULT_USER_CS] = { { { 0x0000ffff, 0x00affb00 } } },
  } };
  #else
  /*
   * Per-CPU, page-aligned GDT page (32-bit build).  Each entry is initialised
   * from a pair of raw 32-bit descriptor words.
   */
  DEFINE_PER_CPU_PAGE_ALIGNED(struct gdt_page, gdt_page) = { .gdt = {
  [GDT_ENTRY_KERNEL_CS] = { { { 0x0000ffff, 0x00cf9a00 } } },
  [GDT_ENTRY_KERNEL_DS] = { { { 0x0000ffff, 0x00cf9200 } } },
  [GDT_ENTRY_DEFAULT_USER_CS] = { { { 0x0000ffff, 0x00cffa00 } } },
  [GDT_ENTRY_DEFAULT_USER_DS] = { { { 0x0000ffff, 0x00cff200 } } },
  /*
   * Segments used for calling PnP BIOS have byte granularity.
   * The code segments and data segments have fixed 64k limits,
   * the transfer segment sizes are set at run time.
   */
  /* 32-bit code */
  [GDT_ENTRY_PNPBIOS_CS32] = { { { 0x0000ffff, 0x00409a00 } } },
  /* 16-bit code */
  [GDT_ENTRY_PNPBIOS_CS16] = { { { 0x0000ffff, 0x00009a00 } } },
  /* 16-bit data */
  [GDT_ENTRY_PNPBIOS_DS] = { { { 0x0000ffff, 0x00009200 } } },
  /* 16-bit data */
  [GDT_ENTRY_PNPBIOS_TS1] = { { { 0x00000000, 0x00009200 } } },
  /* 16-bit data */
  [GDT_ENTRY_PNPBIOS_TS2] = { { { 0x00000000, 0x00009200 } } },
  /*
   * The APM segments have byte granularity and their bases
   * are set at run time. All have 64k limits.
   */
  /* 32-bit code */
  [GDT_ENTRY_APMBIOS_BASE] = { { { 0x0000ffff, 0x00409a00 } } },
  /* 16-bit code */
  [GDT_ENTRY_APMBIOS_BASE+1] = { { { 0x0000ffff, 0x00009a00 } } },
  /* data */
  [GDT_ENTRY_APMBIOS_BASE+2] = { { { 0x0000ffff, 0x00409200 } } },
  [GDT_ENTRY_ESPFIX_SS] = { { { 0x00000000, 0x00c09200 } } },
  [GDT_ENTRY_PERCPU] = { { { 0x00000000, 0x00000000 } } },
  } };
  #endif
  /* Make the per-CPU gdt_page symbol available to GPL modules. */
  EXPORT_PER_CPU_SYMBOL_GPL(gdt_page);
  90. #ifdef CONFIG_X86_32
  91. static int cachesize_override __cpuinitdata = -1;
  92. static int disable_x86_serial_nr __cpuinitdata = 1;
  93. static int __init cachesize_setup(char *str)
  94. {
  95. get_option(&str, &cachesize_override);
  96. return 1;
  97. }
  98. __setup("cachesize=", cachesize_setup);
  99. static int __init x86_fxsr_setup(char *s)
  100. {
  101. setup_clear_cpu_cap(X86_FEATURE_FXSR);
  102. setup_clear_cpu_cap(X86_FEATURE_XMM);
  103. return 1;
  104. }
  105. __setup("nofxsr", x86_fxsr_setup);
  106. static int __init x86_sep_setup(char *s)
  107. {
  108. setup_clear_cpu_cap(X86_FEATURE_SEP);
  109. return 1;
  110. }
  111. __setup("nosep", x86_sep_setup);
  112. /* Standard macro to see if a specific flag is changeable */
  113. static inline int flag_is_changeable_p(u32 flag)
  114. {
  115. u32 f1, f2;
  116. asm("pushfl\n\t"
  117. "pushfl\n\t"
  118. "popl %0\n\t"
  119. "movl %0,%1\n\t"
  120. "xorl %2,%0\n\t"
  121. "pushl %0\n\t"
  122. "popfl\n\t"
  123. "pushfl\n\t"
  124. "popl %0\n\t"
  125. "popfl\n\t"
  126. : "=&r" (f1), "=&r" (f2)
  127. : "ir" (flag));
  128. return ((f1^f2) & flag) != 0;
  129. }
  130. /* Probe for the CPUID instruction */
  131. static int __cpuinit have_cpuid_p(void)
  132. {
  133. return flag_is_changeable_p(X86_EFLAGS_ID);
  134. }
  135. static void __cpuinit squash_the_stupid_serial_number(struct cpuinfo_x86 *c)
  136. {
  137. if (cpu_has(c, X86_FEATURE_PN) && disable_x86_serial_nr) {
  138. /* Disable processor serial number */
  139. unsigned long lo, hi;
  140. rdmsr(MSR_IA32_BBL_CR_CTL, lo, hi);
  141. lo |= 0x200000;
  142. wrmsr(MSR_IA32_BBL_CR_CTL, lo, hi);
  143. printk(KERN_NOTICE "CPU serial number disabled.\n");
  144. clear_cpu_cap(c, X86_FEATURE_PN);
  145. /* Disabling the serial number may affect the cpuid level */
  146. c->cpuid_level = cpuid_eax(0);
  147. }
  148. }
  149. static int __init x86_serial_nr_setup(char *s)
  150. {
  151. disable_x86_serial_nr = 0;
  152. return 1;
  153. }
  154. __setup("serialnumber", x86_serial_nr_setup);
  155. #else
  156. static inline int flag_is_changeable_p(u32 flag)
  157. {
  158. return 1;
  159. }
  160. /* Probe for the CPUID instruction */
  161. static inline int have_cpuid_p(void)
  162. {
  163. return 1;
  164. }
  165. static inline void squash_the_stupid_serial_number(struct cpuinfo_x86 *c)
  166. {
  167. }
  168. #endif
  /*
   * Naming convention should be: <Name> [(<Codename>)]
   * This table is only used if init_<vendor>() below doesn't set the name;
   * in particular, if CPUID levels 0x80000002..4 are supported, this isn't used.
   */
  175. /* Look up CPU names by table lookup. */
  176. static char __cpuinit *table_lookup_model(struct cpuinfo_x86 *c)
  177. {
  178. struct cpu_model_info *info;
  179. if (c->x86_model >= 16)
  180. return NULL; /* Range check */
  181. if (!this_cpu)
  182. return NULL;
  183. info = this_cpu->c_models;
  184. while (info && info->family) {
  185. if (info->family == c->x86)
  186. return info->model_names[c->x86_model];
  187. info++;
  188. }
  189. return NULL; /* Not found */
  190. }
  /*
   * Bitmap of capability bits that identify_cpu() masks out of every CPU's
   * x86_capability[] ("flags overridden by options").
   */
  __u32 cleared_cpu_caps[NCAPINTS] __cpuinitdata;
  192. /* Current gdt points %fs at the "master" per-cpu area: after this,
  193. * it's on the real one. */
  194. void switch_to_new_gdt(void)
  195. {
  196. struct desc_ptr gdt_descr;
  197. gdt_descr.address = (long)get_cpu_gdt_table(smp_processor_id());
  198. gdt_descr.size = GDT_SIZE - 1;
  199. load_gdt(&gdt_descr);
  200. #ifdef CONFIG_X86_32
  201. asm("mov %0, %%fs" : : "r" (__KERNEL_PERCPU) : "memory");
  202. #endif
  203. }
  /*
   * Vendor descriptors registered by early_cpu_init(), packed from index 0;
   * get_cpu_vendor() stops scanning at the first NULL slot.
   */
  static struct cpu_dev *cpu_devs[X86_VENDOR_NUM] = {};
  205. static void __cpuinit default_init(struct cpuinfo_x86 *c)
  206. {
  207. #ifdef CONFIG_X86_64
  208. display_cacheinfo(c);
  209. #else
  210. /* Not much we can do here... */
  211. /* Check if at least it has cpuid */
  212. if (c->cpuid_level == -1) {
  213. /* No cpuid. It must be an ancient CPU */
  214. if (c->x86 == 4)
  215. strcpy(c->x86_model_id, "486");
  216. else if (c->x86 == 3)
  217. strcpy(c->x86_model_id, "386");
  218. }
  219. #endif
  220. }
  /*
   * Fallback vendor descriptor; get_cpu_vendor() selects it when the vendor
   * string matches none of the registered cpu_devs[] entries.
   */
  static struct cpu_dev __cpuinitdata default_cpu = {
  .c_init = default_init,
  .c_vendor = "Unknown",
  .c_x86_vendor = X86_VENDOR_UNKNOWN,
  };
  226. static void __cpuinit get_model_name(struct cpuinfo_x86 *c)
  227. {
  228. unsigned int *v;
  229. char *p, *q;
  230. if (c->extended_cpuid_level < 0x80000004)
  231. return;
  232. v = (unsigned int *) c->x86_model_id;
  233. cpuid(0x80000002, &v[0], &v[1], &v[2], &v[3]);
  234. cpuid(0x80000003, &v[4], &v[5], &v[6], &v[7]);
  235. cpuid(0x80000004, &v[8], &v[9], &v[10], &v[11]);
  236. c->x86_model_id[48] = 0;
  237. /* Intel chips right-justify this string for some dumb reason;
  238. undo that brain damage */
  239. p = q = &c->x86_model_id[0];
  240. while (*p == ' ')
  241. p++;
  242. if (p != q) {
  243. while (*p)
  244. *q++ = *p++;
  245. while (q <= &c->x86_model_id[48])
  246. *q++ = '\0'; /* Zero-pad the rest */
  247. }
  248. }
  249. void __cpuinit display_cacheinfo(struct cpuinfo_x86 *c)
  250. {
  251. unsigned int n, dummy, ebx, ecx, edx, l2size;
  252. n = c->extended_cpuid_level;
  253. if (n >= 0x80000005) {
  254. cpuid(0x80000005, &dummy, &ebx, &ecx, &edx);
  255. printk(KERN_INFO "CPU: L1 I Cache: %dK (%d bytes/line), D cache %dK (%d bytes/line)\n",
  256. edx>>24, edx&0xFF, ecx>>24, ecx&0xFF);
  257. c->x86_cache_size = (ecx>>24) + (edx>>24);
  258. #ifdef CONFIG_X86_64
  259. /* On K8 L1 TLB is inclusive, so don't count it */
  260. c->x86_tlbsize = 0;
  261. #endif
  262. }
  263. if (n < 0x80000006) /* Some chips just has a large L1. */
  264. return;
  265. cpuid(0x80000006, &dummy, &ebx, &ecx, &edx);
  266. l2size = ecx >> 16;
  267. #ifdef CONFIG_X86_64
  268. c->x86_tlbsize += ((ebx >> 16) & 0xfff) + (ebx & 0xfff);
  269. #else
  270. /* do processor-specific cache resizing */
  271. if (this_cpu->c_size_cache)
  272. l2size = this_cpu->c_size_cache(c, l2size);
  273. /* Allow user to override all this if necessary. */
  274. if (cachesize_override != -1)
  275. l2size = cachesize_override;
  276. if (l2size == 0)
  277. return; /* Again, no L2 cache is possible */
  278. #endif
  279. c->x86_cache_size = l2size;
  280. printk(KERN_INFO "CPU: L2 Cache: %dK (%d bytes/line)\n",
  281. l2size, ecx & 0xFF);
  282. }
  283. void __cpuinit detect_ht(struct cpuinfo_x86 *c)
  284. {
  285. #ifdef CONFIG_X86_HT
  286. u32 eax, ebx, ecx, edx;
  287. int index_msb, core_bits;
  288. if (!cpu_has(c, X86_FEATURE_HT))
  289. return;
  290. if (cpu_has(c, X86_FEATURE_CMP_LEGACY))
  291. goto out;
  292. if (cpu_has(c, X86_FEATURE_XTOPOLOGY))
  293. return;
  294. cpuid(1, &eax, &ebx, &ecx, &edx);
  295. smp_num_siblings = (ebx & 0xff0000) >> 16;
  296. if (smp_num_siblings == 1) {
  297. printk(KERN_INFO "CPU: Hyper-Threading is disabled\n");
  298. } else if (smp_num_siblings > 1) {
  299. if (smp_num_siblings > NR_CPUS) {
  300. printk(KERN_WARNING "CPU: Unsupported number of siblings %d",
  301. smp_num_siblings);
  302. smp_num_siblings = 1;
  303. return;
  304. }
  305. index_msb = get_count_order(smp_num_siblings);
  306. #ifdef CONFIG_X86_64
  307. c->phys_proc_id = phys_pkg_id(index_msb);
  308. #else
  309. c->phys_proc_id = phys_pkg_id(c->initial_apicid, index_msb);
  310. #endif
  311. smp_num_siblings = smp_num_siblings / c->x86_max_cores;
  312. index_msb = get_count_order(smp_num_siblings);
  313. core_bits = get_count_order(c->x86_max_cores);
  314. #ifdef CONFIG_X86_64
  315. c->cpu_core_id = phys_pkg_id(index_msb) &
  316. ((1 << core_bits) - 1);
  317. #else
  318. c->cpu_core_id = phys_pkg_id(c->initial_apicid, index_msb) &
  319. ((1 << core_bits) - 1);
  320. #endif
  321. }
  322. out:
  323. if ((c->x86_max_cores * smp_num_siblings) > 1) {
  324. printk(KERN_INFO "CPU: Physical Processor ID: %d\n",
  325. c->phys_proc_id);
  326. printk(KERN_INFO "CPU: Processor Core ID: %d\n",
  327. c->cpu_core_id);
  328. }
  329. #endif
  330. }
  331. static void __cpuinit get_cpu_vendor(struct cpuinfo_x86 *c)
  332. {
  333. char *v = c->x86_vendor_id;
  334. int i;
  335. static int printed;
  336. for (i = 0; i < X86_VENDOR_NUM; i++) {
  337. if (!cpu_devs[i])
  338. break;
  339. if (!strcmp(v, cpu_devs[i]->c_ident[0]) ||
  340. (cpu_devs[i]->c_ident[1] &&
  341. !strcmp(v, cpu_devs[i]->c_ident[1]))) {
  342. this_cpu = cpu_devs[i];
  343. c->x86_vendor = this_cpu->c_x86_vendor;
  344. return;
  345. }
  346. }
  347. if (!printed) {
  348. printed++;
  349. printk(KERN_ERR "CPU: Vendor unknown, using generic init.\n");
  350. printk(KERN_ERR "CPU: Your system may be unstable.\n");
  351. }
  352. c->x86_vendor = X86_VENDOR_UNKNOWN;
  353. this_cpu = &default_cpu;
  354. }
  355. void __cpuinit cpu_detect(struct cpuinfo_x86 *c)
  356. {
  357. /* Get vendor name */
  358. cpuid(0x00000000, (unsigned int *)&c->cpuid_level,
  359. (unsigned int *)&c->x86_vendor_id[0],
  360. (unsigned int *)&c->x86_vendor_id[8],
  361. (unsigned int *)&c->x86_vendor_id[4]);
  362. c->x86 = 4;
  363. /* Intel-defined flags: level 0x00000001 */
  364. if (c->cpuid_level >= 0x00000001) {
  365. u32 junk, tfms, cap0, misc;
  366. cpuid(0x00000001, &tfms, &misc, &junk, &cap0);
  367. c->x86 = (tfms >> 8) & 0xf;
  368. c->x86_model = (tfms >> 4) & 0xf;
  369. c->x86_mask = tfms & 0xf;
  370. if (c->x86 == 0xf)
  371. c->x86 += (tfms >> 20) & 0xff;
  372. if (c->x86 >= 0x6)
  373. c->x86_model += ((tfms >> 16) & 0xf) << 4;
  374. if (cap0 & (1<<19)) {
  375. c->x86_clflush_size = ((misc >> 8) & 0xff) * 8;
  376. c->x86_cache_alignment = c->x86_clflush_size;
  377. }
  378. }
  379. }
  380. static void __cpuinit get_cpu_cap(struct cpuinfo_x86 *c)
  381. {
  382. u32 tfms, xlvl;
  383. u32 ebx;
  384. /* Intel-defined flags: level 0x00000001 */
  385. if (c->cpuid_level >= 0x00000001) {
  386. u32 capability, excap;
  387. cpuid(0x00000001, &tfms, &ebx, &excap, &capability);
  388. c->x86_capability[0] = capability;
  389. c->x86_capability[4] = excap;
  390. }
  391. /* AMD-defined flags: level 0x80000001 */
  392. xlvl = cpuid_eax(0x80000000);
  393. c->extended_cpuid_level = xlvl;
  394. if ((xlvl & 0xffff0000) == 0x80000000) {
  395. if (xlvl >= 0x80000001) {
  396. c->x86_capability[1] = cpuid_edx(0x80000001);
  397. c->x86_capability[6] = cpuid_ecx(0x80000001);
  398. }
  399. }
  400. #ifdef CONFIG_X86_64
  401. /* Transmeta-defined flags: level 0x80860001 */
  402. xlvl = cpuid_eax(0x80860000);
  403. if ((xlvl & 0xffff0000) == 0x80860000) {
  404. /* Don't set x86_cpuid_level here for now to not confuse. */
  405. if (xlvl >= 0x80860001)
  406. c->x86_capability[2] = cpuid_edx(0x80860001);
  407. }
  408. if (c->extended_cpuid_level >= 0x80000008) {
  409. u32 eax = cpuid_eax(0x80000008);
  410. c->x86_virt_bits = (eax >> 8) & 0xff;
  411. c->x86_phys_bits = eax & 0xff;
  412. }
  413. #endif
  414. if (c->extended_cpuid_level >= 0x80000007)
  415. c->x86_power = cpuid_edx(0x80000007);
  416. }
  417. /*
  418. * Do minimum CPU detection early.
  419. * Fields really needed: vendor, cpuid_level, family, model, mask,
  420. * cache alignment.
  421. * The others are not touched to avoid unwanted side effects.
  422. *
  423. * WARNING: this function is only called on the BP. Don't add code here
  424. * that is supposed to run on all CPUs.
  425. */
  426. static void __init early_identify_cpu(struct cpuinfo_x86 *c)
  427. {
  428. #ifdef CONFIG_X86_64
  429. c->x86_clflush_size = 64;
  430. #else
  431. c->x86_clflush_size = 32;
  432. #endif
  433. c->x86_cache_alignment = c->x86_clflush_size;
  434. if (!have_cpuid_p())
  435. return;
  436. memset(&c->x86_capability, 0, sizeof c->x86_capability);
  437. c->extended_cpuid_level = 0;
  438. cpu_detect(c);
  439. get_cpu_vendor(c);
  440. get_cpu_cap(c);
  441. if (this_cpu->c_early_init)
  442. this_cpu->c_early_init(c);
  443. validate_pat_support(c);
  444. }
  445. void __init early_cpu_init(void)
  446. {
  447. struct cpu_dev **cdev;
  448. int count = 0;
  449. printk("KERNEL supported cpus:\n");
  450. for (cdev = __x86_cpu_dev_start; cdev < __x86_cpu_dev_end; cdev++) {
  451. struct cpu_dev *cpudev = *cdev;
  452. unsigned int j;
  453. if (count >= X86_VENDOR_NUM)
  454. break;
  455. cpu_devs[count] = cpudev;
  456. count++;
  457. for (j = 0; j < 2; j++) {
  458. if (!cpudev->c_ident[j])
  459. continue;
  460. printk(" %s %s\n", cpudev->c_vendor,
  461. cpudev->c_ident[j]);
  462. }
  463. }
  464. early_identify_cpu(&boot_cpu_data);
  465. }
  466. /*
  467. * The NOPL instruction is supposed to exist on all CPUs with
  468. * family >= 6, unfortunately, that's not true in practice because
  469. * of early VIA chips and (more importantly) broken virtualizers that
  470. * are not easy to detect. Hence, probe for it based on first
  471. * principles.
  472. *
  473. * Note: no 64-bit chip is known to lack these, but put the code here
  474. * for consistency with 32 bits, and to make it utterly trivial to
  475. * diagnose the problem should it ever surface.
  476. */
  477. static void __cpuinit detect_nopl(struct cpuinfo_x86 *c)
  478. {
  479. const u32 nopl_signature = 0x888c53b1; /* Random number */
  480. u32 has_nopl = nopl_signature;
  481. clear_cpu_cap(c, X86_FEATURE_NOPL);
  482. if (c->x86 >= 6) {
  483. asm volatile("\n"
  484. "1: .byte 0x0f,0x1f,0xc0\n" /* nopl %eax */
  485. "2:\n"
  486. " .section .fixup,\"ax\"\n"
  487. "3: xor %0,%0\n"
  488. " jmp 2b\n"
  489. " .previous\n"
  490. _ASM_EXTABLE(1b,3b)
  491. : "+a" (has_nopl));
  492. if (has_nopl == nopl_signature)
  493. set_cpu_cap(c, X86_FEATURE_NOPL);
  494. }
  495. }
  496. static void __cpuinit generic_identify(struct cpuinfo_x86 *c)
  497. {
  498. if (!have_cpuid_p())
  499. return;
  500. c->extended_cpuid_level = 0;
  501. cpu_detect(c);
  502. get_cpu_vendor(c);
  503. get_cpu_cap(c);
  504. if (c->cpuid_level >= 0x00000001) {
  505. c->initial_apicid = (cpuid_ebx(1) >> 24) & 0xFF;
  506. #ifdef CONFIG_X86_32
  507. # ifdef CONFIG_X86_HT
  508. c->apicid = phys_pkg_id(c->initial_apicid, 0);
  509. # else
  510. c->apicid = c->initial_apicid;
  511. # endif
  512. #endif
  513. #ifdef CONFIG_X86_HT
  514. c->phys_proc_id = c->initial_apicid;
  515. #endif
  516. }
  517. get_model_name(c); /* Default name */
  518. init_scattered_cpuid_features(c);
  519. detect_nopl(c);
  520. }
  521. /*
  522. * This does the hard work of actually picking apart the CPU stuff...
  523. */
  524. static void __cpuinit identify_cpu(struct cpuinfo_x86 *c)
  525. {
  526. int i;
  527. c->loops_per_jiffy = loops_per_jiffy;
  528. c->x86_cache_size = -1;
  529. c->x86_vendor = X86_VENDOR_UNKNOWN;
  530. c->x86_model = c->x86_mask = 0; /* So far unknown... */
  531. c->x86_vendor_id[0] = '\0'; /* Unset */
  532. c->x86_model_id[0] = '\0'; /* Unset */
  533. c->x86_max_cores = 1;
  534. #ifdef CONFIG_X86_64
  535. c->x86_coreid_bits = 0;
  536. c->x86_clflush_size = 64;
  537. #else
  538. c->cpuid_level = -1; /* CPUID not detected */
  539. c->x86_clflush_size = 32;
  540. #endif
  541. c->x86_cache_alignment = c->x86_clflush_size;
  542. memset(&c->x86_capability, 0, sizeof c->x86_capability);
  543. if (!have_cpuid_p()) {
  544. /*
  545. * First of all, decide if this is a 486 or higher
  546. * It's a 486 if we can modify the AC flag
  547. */
  548. if (flag_is_changeable_p(X86_EFLAGS_AC))
  549. c->x86 = 4;
  550. else
  551. c->x86 = 3;
  552. }
  553. generic_identify(c);
  554. if (this_cpu->c_identify)
  555. this_cpu->c_identify(c);
  556. #ifdef CONFIG_X86_64
  557. c->apicid = phys_pkg_id(0);
  558. #endif
  559. /*
  560. * Vendor-specific initialization. In this section we
  561. * canonicalize the feature flags, meaning if there are
  562. * features a certain CPU supports which CPUID doesn't
  563. * tell us, CPUID claiming incorrect flags, or other bugs,
  564. * we handle them here.
  565. *
  566. * At the end of this section, c->x86_capability better
  567. * indicate the features this CPU genuinely supports!
  568. */
  569. if (this_cpu->c_init)
  570. this_cpu->c_init(c);
  571. /* Disable the PN if appropriate */
  572. squash_the_stupid_serial_number(c);
  573. /*
  574. * The vendor-specific functions might have changed features. Now
  575. * we do "generic changes."
  576. */
  577. /* If the model name is still unset, do table lookup. */
  578. if (!c->x86_model_id[0]) {
  579. char *p;
  580. p = table_lookup_model(c);
  581. if (p)
  582. strcpy(c->x86_model_id, p);
  583. else
  584. /* Last resort... */
  585. sprintf(c->x86_model_id, "%02x/%02x",
  586. c->x86, c->x86_model);
  587. }
  588. #ifdef CONFIG_X86_64
  589. detect_ht(c);
  590. #endif
  591. /*
  592. * On SMP, boot_cpu_data holds the common feature set between
  593. * all CPUs; so make sure that we indicate which features are
  594. * common between the CPUs. The first time this routine gets
  595. * executed, c == &boot_cpu_data.
  596. */
  597. if (c != &boot_cpu_data) {
  598. /* AND the already accumulated flags with these */
  599. for (i = 0; i < NCAPINTS; i++)
  600. boot_cpu_data.x86_capability[i] &= c->x86_capability[i];
  601. }
  602. /* Clear all flags overriden by options */
  603. for (i = 0; i < NCAPINTS; i++)
  604. c->x86_capability[i] &= ~cleared_cpu_caps[i];
  605. #ifdef CONFIG_X86_MCE
  606. /* Init Machine Check Exception if available. */
  607. mcheck_init(c);
  608. #endif
  609. select_idle_routine(c);
  610. #if defined(CONFIG_NUMA) && defined(CONFIG_X86_64)
  611. numa_add_cpu(smp_processor_id());
  612. #endif
  613. }
  614. void __init identify_boot_cpu(void)
  615. {
  616. identify_cpu(&boot_cpu_data);
  617. #ifdef CONFIG_X86_32
  618. sysenter_setup();
  619. enable_sep_cpu();
  620. #endif
  621. }
  622. void __cpuinit identify_secondary_cpu(struct cpuinfo_x86 *c)
  623. {
  624. BUG_ON(c == &boot_cpu_data);
  625. identify_cpu(c);
  626. #ifdef CONFIG_X86_32
  627. enable_sep_cpu();
  628. #endif
  629. mtrr_ap_init();
  630. }
  /* A range of MSR indices walked by print_cpu_msr(). */
  struct msr_range {
  unsigned min;
  unsigned max;
  };
  /*
   * MSR index ranges dumped by print_cpu_msr().  NOTE(review): the dump loop
   * stops before 'max', so the last index of each range is not read —
   * confirm whether 'max' was meant to be inclusive.
   */
  static struct msr_range msr_range_array[] __cpuinitdata = {
  { 0x00000000, 0x00000418},
  { 0xc0000000, 0xc000040b},
  { 0xc0010000, 0xc0010142},
  { 0xc0011000, 0xc001103b},
  };
  641. static void __cpuinit print_cpu_msr(void)
  642. {
  643. unsigned index;
  644. u64 val;
  645. int i;
  646. unsigned index_min, index_max;
  647. for (i = 0; i < ARRAY_SIZE(msr_range_array); i++) {
  648. index_min = msr_range_array[i].min;
  649. index_max = msr_range_array[i].max;
  650. for (index = index_min; index < index_max; index++) {
  651. if (rdmsrl_amd_safe(index, &val))
  652. continue;
  653. printk(KERN_INFO " MSR%08x: %016llx\n", index, val);
  654. }
  655. }
  656. }
  657. static int show_msr __cpuinitdata;
  658. static __init int setup_show_msr(char *arg)
  659. {
  660. int num;
  661. get_option(&arg, &num);
  662. if (num > 0)
  663. show_msr = num;
  664. return 1;
  665. }
  666. __setup("show_msr=", setup_show_msr);
  667. static __init int setup_noclflush(char *arg)
  668. {
  669. setup_clear_cpu_cap(X86_FEATURE_CLFLSH);
  670. return 1;
  671. }
  672. __setup("noclflush", setup_noclflush);
  673. void __cpuinit print_cpu_info(struct cpuinfo_x86 *c)
  674. {
  675. char *vendor = NULL;
  676. if (c->x86_vendor < X86_VENDOR_NUM)
  677. vendor = this_cpu->c_vendor;
  678. else if (c->cpuid_level >= 0)
  679. vendor = c->x86_vendor_id;
  680. if (vendor && strncmp(c->x86_model_id, vendor, strlen(vendor)))
  681. printk(KERN_CONT "%s ", vendor);
  682. if (c->x86_model_id[0])
  683. printk(KERN_CONT "%s", c->x86_model_id);
  684. else
  685. printk(KERN_CONT "%d86", c->x86);
  686. if (c->x86_mask || c->cpuid_level >= 0)
  687. printk(KERN_CONT " stepping %02x\n", c->x86_mask);
  688. else
  689. printk(KERN_CONT "\n");
  690. #ifdef CONFIG_SMP
  691. if (c->cpu_index < show_msr)
  692. print_cpu_msr();
  693. #else
  694. if (show_msr)
  695. print_cpu_msr();
  696. #endif
  697. }
  698. static __init int setup_disablecpuid(char *arg)
  699. {
  700. int bit;
  701. if (get_option(&arg, &bit) && bit < NCAPINTS*32)
  702. setup_clear_cpu_cap(bit);
  703. else
  704. return 0;
  705. return 1;
  706. }
  707. __setup("clearcpuid=", setup_disablecpuid);
  /* Mask of CPUs that have been through cpu_init(); starts out empty. */
  cpumask_t cpu_initialized __cpuinitdata = CPU_MASK_NONE;
  709. #ifdef CONFIG_X86_64
  /* Array of per-CPU PDA pointers (64-bit only), exported to modules. */
  struct x8664_pda **_cpu_pda __read_mostly;
  EXPORT_SYMBOL(_cpu_pda);
  /* IDT descriptor: limit of 256 entries of 16 bytes each, base at idt_table. */
  struct desc_ptr idt_descr = { 256 * 16 - 1, (unsigned long) idt_table };
  /* Interrupt stack that pda_init() assigns to CPU 0. */
  char boot_cpu_stack[IRQSTACKSIZE] __page_aligned_bss;
  714. void pda_init(int cpu)
  715. {
  716. struct x8664_pda *pda = cpu_pda(cpu);
  717. /* Setup up data that may be needed in __get_free_pages early */
  718. loadsegment(fs, 0);
  719. loadsegment(gs, 0);
  720. /* Memory clobbers used to order PDA accessed */
  721. mb();
  722. wrmsrl(MSR_GS_BASE, pda);
  723. mb();
  724. pda->cpunumber = cpu;
  725. pda->irqcount = -1;
  726. pda->kernelstack = (unsigned long)stack_thread_info() -
  727. PDA_STACKOFFSET + THREAD_SIZE;
  728. pda->active_mm = &init_mm;
  729. pda->mmu_state = 0;
  730. if (cpu == 0) {
  731. /* others are initialized in smpboot.c */
  732. pda->pcurrent = &init_task;
  733. pda->irqstackptr = boot_cpu_stack;
  734. pda->irqstackptr += IRQSTACKSIZE - 64;
  735. } else {
  736. if (!pda->irqstackptr) {
  737. pda->irqstackptr = (char *)
  738. __get_free_pages(GFP_ATOMIC, IRQSTACK_ORDER);
  739. if (!pda->irqstackptr)
  740. panic("cannot allocate irqstack for cpu %d",
  741. cpu);
  742. pda->irqstackptr += IRQSTACKSIZE - 64;
  743. }
  744. if (pda->nodenumber == 0 && cpu_to_node(cpu) != NUMA_NO_NODE)
  745. pda->nodenumber = cpu_to_node(cpu);
  746. }
  747. }
  /*
   * Static exception stacks used by cpu_init() for CPU 0: room for
   * N_EXCEPTION_STACKS - 1 regular stacks plus one debug stack.
   */
  char boot_exception_stacks[(N_EXCEPTION_STACKS - 1) * EXCEPTION_STKSZ +
  DEBUG_STKSZ] __page_aligned_bss;
  750. extern asmlinkage void ignore_sysret(void);
  751. /* May not be marked __init: used by software suspend */
  752. void syscall_init(void)
  753. {
  754. /*
  755. * LSTAR and STAR live in a bit strange symbiosis.
  756. * They both write to the same internal register. STAR allows to
  757. * set CS/DS but only a 32bit target. LSTAR sets the 64bit rip.
  758. */
  759. wrmsrl(MSR_STAR, ((u64)__USER32_CS)<<48 | ((u64)__KERNEL_CS)<<32);
  760. wrmsrl(MSR_LSTAR, system_call);
  761. wrmsrl(MSR_CSTAR, ignore_sysret);
  762. #ifdef CONFIG_IA32_EMULATION
  763. syscall32_cpu_init();
  764. #endif
  765. /* Flags to clear on syscall */
  766. wrmsrl(MSR_SYSCALL_MASK,
  767. X86_EFLAGS_TF|X86_EFLAGS_DF|X86_EFLAGS_IF|X86_EFLAGS_IOPL);
  768. }
  /* Flags value saved by cpu_init() via raw_local_save_flags(). */
  unsigned long kernel_eflags;
  /*
   * Copies of the original ist values from the tss are only accessed during
   * debugging, no special alignment required.
   */
  DEFINE_PER_CPU(struct orig_ist, orig_ist);
  775. #else
  776. /* Make sure %fs is initialized properly in idle threads */
  777. struct pt_regs * __cpuinit idle_regs(struct pt_regs *regs)
  778. {
  779. memset(regs, 0, sizeof(struct pt_regs));
  780. regs->fs = __KERNEL_PERCPU;
  781. return regs;
  782. }
  783. #endif
  784. /*
  785. * cpu_init() initializes state that is per-CPU. Some data is already
  786. * initialized (naturally) in the bootstrap process, such as the GDT
  787. * and IDT. We reload them nevertheless, this function acts as a
  788. * 'CPU state barrier', nothing should get across.
  789. * A lot of state is already set up in PDA init for 64 bit
  790. */
  791. #ifdef CONFIG_X86_64
  792. void __cpuinit cpu_init(void)
  793. {
  794. int cpu = stack_smp_processor_id();
  795. struct tss_struct *t = &per_cpu(init_tss, cpu);
  796. struct orig_ist *orig_ist = &per_cpu(orig_ist, cpu);
  797. unsigned long v;
  798. char *estacks = NULL;
  799. struct task_struct *me;
  800. int i;
  801. /* CPU 0 is initialised in head64.c */
  802. if (cpu != 0)
  803. pda_init(cpu);
  804. else
  805. estacks = boot_exception_stacks;
  806. me = current;
  807. if (cpu_test_and_set(cpu, cpu_initialized))
  808. panic("CPU#%d already initialized!\n", cpu);
  809. printk(KERN_INFO "Initializing CPU#%d\n", cpu);
  810. clear_in_cr4(X86_CR4_VME|X86_CR4_PVI|X86_CR4_TSD|X86_CR4_DE);
  811. /*
  812. * Initialize the per-CPU GDT with the boot GDT,
  813. * and set up the GDT descriptor:
  814. */
  815. switch_to_new_gdt();
  816. load_idt((const struct desc_ptr *)&idt_descr);
  817. memset(me->thread.tls_array, 0, GDT_ENTRY_TLS_ENTRIES * 8);
  818. syscall_init();
  819. wrmsrl(MSR_FS_BASE, 0);
  820. wrmsrl(MSR_KERNEL_GS_BASE, 0);
  821. barrier();
  822. check_efer();
  823. if (cpu != 0 && x2apic)
  824. enable_x2apic();
  825. /*
  826. * set up and load the per-CPU TSS
  827. */
  828. if (!orig_ist->ist[0]) {
  829. static const unsigned int order[N_EXCEPTION_STACKS] = {
  830. [0 ... N_EXCEPTION_STACKS - 1] = EXCEPTION_STACK_ORDER,
  831. [DEBUG_STACK - 1] = DEBUG_STACK_ORDER
  832. };
  833. for (v = 0; v < N_EXCEPTION_STACKS; v++) {
  834. if (cpu) {
  835. estacks = (char *)__get_free_pages(GFP_ATOMIC, order[v]);
  836. if (!estacks)
  837. panic("Cannot allocate exception "
  838. "stack %ld %d\n", v, cpu);
  839. }
  840. estacks += PAGE_SIZE << order[v];
  841. orig_ist->ist[v] = t->x86_tss.ist[v] =
  842. (unsigned long)estacks;
  843. }
  844. }
  845. t->x86_tss.io_bitmap_base = offsetof(struct tss_struct, io_bitmap);
  846. /*
  847. * <= is required because the CPU will access up to
  848. * 8 bits beyond the end of the IO permission bitmap.
  849. */
  850. for (i = 0; i <= IO_BITMAP_LONGS; i++)
  851. t->io_bitmap[i] = ~0UL;
  852. atomic_inc(&init_mm.mm_count);
  853. me->active_mm = &init_mm;
  854. if (me->mm)
  855. BUG();
  856. enter_lazy_tlb(&init_mm, me);
  857. load_sp0(t, &current->thread);
  858. set_tss_desc(cpu, t);
  859. load_TR_desc();
  860. load_LDT(&init_mm.context);
  861. #ifdef CONFIG_KGDB
  862. /*
  863. * If the kgdb is connected no debug regs should be altered. This
  864. * is only applicable when KGDB and a KGDB I/O module are built
  865. * into the kernel and you are using early debugging with
  866. * kgdbwait. KGDB will control the kernel HW breakpoint registers.
  867. */
  868. if (kgdb_connected && arch_kgdb_ops.correct_hw_break)
  869. arch_kgdb_ops.correct_hw_break();
  870. else {
  871. #endif
  872. /*
  873. * Clear all 6 debug registers:
  874. */
  875. set_debugreg(0UL, 0);
  876. set_debugreg(0UL, 1);
  877. set_debugreg(0UL, 2);
  878. set_debugreg(0UL, 3);
  879. set_debugreg(0UL, 6);
  880. set_debugreg(0UL, 7);
  881. #ifdef CONFIG_KGDB
  882. /* If the kgdb is connected no debug regs should be altered. */
  883. }
  884. #endif
  885. fpu_init();
  886. raw_local_save_flags(kernel_eflags);
  887. if (is_uv_system())
  888. uv_cpu_init();
  889. }
  890. #else
  891. void __cpuinit cpu_init(void)
  892. {
  893. int cpu = smp_processor_id();
  894. struct task_struct *curr = current;
  895. struct tss_struct *t = &per_cpu(init_tss, cpu);
  896. struct thread_struct *thread = &curr->thread;
  897. if (cpu_test_and_set(cpu, cpu_initialized)) {
  898. printk(KERN_WARNING "CPU#%d already initialized!\n", cpu);
  899. for (;;) local_irq_enable();
  900. }
  901. printk(KERN_INFO "Initializing CPU#%d\n", cpu);
  902. if (cpu_has_vme || cpu_has_tsc || cpu_has_de)
  903. clear_in_cr4(X86_CR4_VME|X86_CR4_PVI|X86_CR4_TSD|X86_CR4_DE);
  904. load_idt(&idt_descr);
  905. switch_to_new_gdt();
  906. /*
  907. * Set up and load the per-CPU TSS and LDT
  908. */
  909. atomic_inc(&init_mm.mm_count);
  910. curr->active_mm = &init_mm;
  911. if (curr->mm)
  912. BUG();
  913. enter_lazy_tlb(&init_mm, curr);
  914. load_sp0(t, thread);
  915. set_tss_desc(cpu, t);
  916. load_TR_desc();
  917. load_LDT(&init_mm.context);
  918. #ifdef CONFIG_DOUBLEFAULT
  919. /* Set up doublefault TSS pointer in the GDT */
  920. __set_tss_desc(cpu, GDT_ENTRY_DOUBLEFAULT_TSS, &doublefault_tss);
  921. #endif
  922. /* Clear %gs. */
  923. asm volatile ("mov %0, %%gs" : : "r" (0));
  924. /* Clear all 6 debug registers: */
  925. set_debugreg(0, 0);
  926. set_debugreg(0, 1);
  927. set_debugreg(0, 2);
  928. set_debugreg(0, 3);
  929. set_debugreg(0, 6);
  930. set_debugreg(0, 7);
  931. /*
  932. * Force FPU initialization:
  933. */
  934. if (cpu_has_xsave)
  935. current_thread_info()->status = TS_XSAVE;
  936. else
  937. current_thread_info()->status = 0;
  938. clear_used_math();
  939. mxcsr_feature_mask_init();
  940. /*
  941. * Boot processor to setup the FP and extended state context info.
  942. */
  943. if (!smp_processor_id())
  944. init_thread_xstate();
  945. xsave_init();
  946. }
  947. #ifdef CONFIG_HOTPLUG_CPU
  948. void __cpuinit cpu_uninit(void)
  949. {
  950. int cpu = raw_smp_processor_id();
  951. cpu_clear(cpu, cpu_initialized);
  952. /* lazy TLB state */
  953. per_cpu(cpu_tlbstate, cpu).state = 0;
  954. per_cpu(cpu_tlbstate, cpu).active_mm = &init_mm;
  955. }
  956. #endif
  957. #endif