trampoline.S 4.9 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211
  1. /*
  2. *
  3. * Trampoline.S Derived from Setup.S by Linus Torvalds
  4. *
  5. * 4 Jan 1997 Michael Chastain: changed to gnu as.
  6. * 15 Sept 2005 Eric Biederman: 64bit PIC support
  7. *
  8. * Entry: CS:IP point to the start of our code, we are
  9. * in real mode with no stack, but the rest of the
  10. * trampoline page to make our stack and everything else
  11. * is a mystery.
  12. *
  13. * In fact we don't actually need a stack so we don't
  14. * set one up.
  15. *
  16. * On entry to trampoline_data, the processor is in real mode
  17. * with 16-bit addressing and 16-bit data. CS has some value
  18. * and IP is zero. Thus, data addresses need to be absolute
  19. * (no relocation) and are taken with regard to r_base.
  20. *
  21. * With the addition of trampoline_level4_pgt this code can
  22. * now enter a 64bit kernel that lives at arbitrary 64bit
  23. * physical addresses.
  24. *
  25. * If you work on this file, check the object module with objdump
  26. * --full-contents --reloc to make sure there are no relocation
  27. * entries.
  28. */
  29. #include <linux/linkage.h>
  30. #include <asm/pgtable.h>
  31. #include <asm/page.h>
  32. #include <asm/msr.h>
  33. #include <asm/segment.h>
  34. .data
  35. .code16
  36. ENTRY(trampoline_data)
  37. r_base = .
  38. cli # We should be safe anyway
  39. wbinvd
  40. mov %cs, %ax # Code and data in the same place
  41. mov %ax, %ds
  42. mov %ax, %es
  43. mov %ax, %ss
  44. movl $0xA5A5A5A5, trampoline_data - r_base
  45. # write marker for master knows we're running
  46. # Setup stack
  47. movw $(trampoline_stack_end - r_base), %sp
  48. call verify_cpu # Verify the cpu supports long mode
  49. mov %cs, %ax
  50. movzx %ax, %esi # Find the 32bit trampoline location
  51. shll $4, %esi
  52. # Fixup the vectors
  53. addl %esi, startup_32_vector - r_base
  54. addl %esi, startup_64_vector - r_base
  55. addl %esi, tgdt + 2 - r_base # Fixup the gdt pointer
  56. /*
  57. * GDT tables in non default location kernel can be beyond 16MB and
  58. * lgdt will not be able to load the address as in real mode default
  59. * operand size is 16bit. Use lgdtl instead to force operand size
  60. * to 32 bit.
  61. */
  62. lidtl tidt - r_base # load idt with 0, 0
  63. lgdtl tgdt - r_base # load gdt with whatever is appropriate
  64. xor %ax, %ax
  65. inc %ax # protected mode (PE) bit
  66. lmsw %ax # into protected mode
  67. # flush prefetch and jump to startup_32
  68. ljmpl *(startup_32_vector - r_base)
  69. .code32
  70. .balign 4
  71. startup_32:
  72. movl $__KERNEL_DS, %eax # Initialize the %ds segment register
  73. movl %eax, %ds
  74. xorl %eax, %eax
  75. btsl $5, %eax # Enable PAE mode
  76. movl %eax, %cr4
  77. # Setup trampoline 4 level pagetables
  78. leal (trampoline_level4_pgt - r_base)(%esi), %eax
  79. movl %eax, %cr3
  80. movl $MSR_EFER, %ecx
  81. movl $(1 << _EFER_LME), %eax # Enable Long Mode
  82. xorl %edx, %edx
  83. wrmsr
  84. xorl %eax, %eax
  85. btsl $31, %eax # Enable paging and in turn activate Long Mode
  86. btsl $0, %eax # Enable protected mode
  87. movl %eax, %cr0
  88. /*
  89. * At this point we're in long mode but in 32bit compatibility mode
  90. * with EFER.LME = 1, CS.L = 0, CS.D = 1 (and in turn
  91. * EFER.LMA = 1). Now we want to jump in 64bit mode, to do that we use
  92. * the new gdt/idt that has __KERNEL_CS with CS.L = 1.
  93. */
  94. ljmp *(startup_64_vector - r_base)(%esi)
  95. .code64
  96. .balign 4
  97. startup_64:
  98. # Now jump into the kernel using virtual addresses
  99. movq $secondary_startup_64, %rax
  100. jmp *%rax
  101. .code16
  102. verify_cpu:
  103. pushl $0 # Kill any dangerous flags
  104. popfl
  105. /* minimum CPUID flags for x86-64 */
  106. /* see http://www.x86-64.org/lists/discuss/msg02971.html */
  107. #define REQUIRED_MASK1 ((1<<0)|(1<<3)|(1<<4)|(1<<5)|(1<<6)|(1<<8)|\
  108. (1<<13)|(1<<15)|(1<<24)|(1<<25)|(1<<26))
  109. #define REQUIRED_MASK2 (1<<29)
  110. pushfl # check for cpuid
  111. popl %eax
  112. movl %eax, %ebx
  113. xorl $0x200000,%eax
  114. pushl %eax
  115. popfl
  116. pushfl
  117. popl %eax
  118. pushl %ebx
  119. popfl
  120. cmpl %eax, %ebx
  121. jz no_longmode
  122. xorl %eax, %eax # See if cpuid 1 is implemented
  123. cpuid
  124. cmpl $0x1, %eax
  125. jb no_longmode
  126. movl $0x01, %eax # Does the cpu have what it takes?
  127. cpuid
  128. andl $REQUIRED_MASK1, %edx
  129. xorl $REQUIRED_MASK1, %edx
  130. jnz no_longmode
  131. movl $0x80000000, %eax # See if extended cpuid is implemented
  132. cpuid
  133. cmpl $0x80000001, %eax
  134. jb no_longmode
  135. movl $0x80000001, %eax # Does the cpu have what it takes?
  136. cpuid
  137. andl $REQUIRED_MASK2, %edx
  138. xorl $REQUIRED_MASK2, %edx
  139. jnz no_longmode
  140. ret # The cpu supports long mode
  141. no_longmode:
  142. hlt
  143. jmp no_longmode
  144. # Careful these need to be in the same 64K segment as the above;
  145. tidt:
  146. .word 0 # idt limit = 0
  147. .word 0, 0 # idt base = 0L
  148. # Duplicate the global descriptor table
  149. # so the kernel can live anywhere
  150. .balign 4
  151. tgdt:
  152. .short tgdt_end - tgdt # gdt limit
  153. .long tgdt - r_base
  154. .short 0
  155. .quad 0x00cf9b000000ffff # __KERNEL32_CS
  156. .quad 0x00af9b000000ffff # __KERNEL_CS
  157. .quad 0x00cf93000000ffff # __KERNEL_DS
  158. tgdt_end:
  159. .balign 4
  160. startup_32_vector:
  161. .long startup_32 - r_base
  162. .word __KERNEL32_CS, 0
  163. .balign 4
  164. startup_64_vector:
  165. .long startup_64 - r_base
  166. .word __KERNEL_CS, 0
  167. trampoline_stack:
  168. .org 0x1000
  169. trampoline_stack_end:
  170. ENTRY(trampoline_level4_pgt)
  171. .quad level3_ident_pgt - __START_KERNEL_map + _KERNPG_TABLE
  172. .fill 510,8,0
  173. .quad level3_kernel_pgt - __START_KERNEL_map + _KERNPG_TABLE
  174. ENTRY(trampoline_end)