head.S 14 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555
  1. /*
  2. * Low-level CPU initialisation
  3. * Based on arch/arm/kernel/head.S
  4. *
  5. * Copyright (C) 1994-2002 Russell King
  6. * Copyright (C) 2003-2012 ARM Ltd.
  7. * Authors: Catalin Marinas <catalin.marinas@arm.com>
  8. * Will Deacon <will.deacon@arm.com>
  9. *
  10. * This program is free software; you can redistribute it and/or modify
  11. * it under the terms of the GNU General Public License version 2 as
  12. * published by the Free Software Foundation.
  13. *
  14. * This program is distributed in the hope that it will be useful,
  15. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  16. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
  17. * GNU General Public License for more details.
  18. *
  19. * You should have received a copy of the GNU General Public License
  20. * along with this program. If not, see <http://www.gnu.org/licenses/>.
  21. */
  22. #include <linux/linkage.h>
  23. #include <linux/init.h>
  24. #include <asm/assembler.h>
  25. #include <asm/ptrace.h>
  26. #include <asm/asm-offsets.h>
  27. #include <asm/cputype.h>
  28. #include <asm/memory.h>
  29. #include <asm/thread_info.h>
  30. #include <asm/pgtable-hwdef.h>
  31. #include <asm/pgtable.h>
  32. #include <asm/page.h>
  33. #include <asm/virt.h>
  34. /*
  35. * swapper_pg_dir is the virtual address of the initial page table. We place
  36. * the page tables 3 * PAGE_SIZE below KERNEL_RAM_VADDR. The idmap_pg_dir has
  37. * 2 pages and is placed below swapper_pg_dir.
  38. */
  39. #define KERNEL_RAM_VADDR (PAGE_OFFSET + TEXT_OFFSET)
  40. #if (KERNEL_RAM_VADDR & 0xfffff) != 0x80000
  41. #error KERNEL_RAM_VADDR must start at 0xXXX80000
  42. #endif
  43. #define SWAPPER_DIR_SIZE (3 * PAGE_SIZE)
  44. #define IDMAP_DIR_SIZE (2 * PAGE_SIZE)
  45. .globl swapper_pg_dir
  46. .equ swapper_pg_dir, KERNEL_RAM_VADDR - SWAPPER_DIR_SIZE
  47. .globl idmap_pg_dir
  48. .equ idmap_pg_dir, swapper_pg_dir - IDMAP_DIR_SIZE
  49. .macro pgtbl, ttb0, ttb1, phys
  50. add \ttb1, \phys, #TEXT_OFFSET - SWAPPER_DIR_SIZE
  51. sub \ttb0, \ttb1, #IDMAP_DIR_SIZE
  52. .endm
  53. #ifdef CONFIG_ARM64_64K_PAGES
  54. #define BLOCK_SHIFT PAGE_SHIFT
  55. #define BLOCK_SIZE PAGE_SIZE
  56. #else
  57. #define BLOCK_SHIFT SECTION_SHIFT
  58. #define BLOCK_SIZE SECTION_SIZE
  59. #endif
  60. #define KERNEL_START KERNEL_RAM_VADDR
  61. #define KERNEL_END _end
  62. /*
  63. * Initial memory map attributes.
  64. */
  65. #ifndef CONFIG_SMP
  66. #define PTE_FLAGS PTE_TYPE_PAGE | PTE_AF
  67. #define PMD_FLAGS PMD_TYPE_SECT | PMD_SECT_AF
  68. #else
  69. #define PTE_FLAGS PTE_TYPE_PAGE | PTE_AF | PTE_SHARED
  70. #define PMD_FLAGS PMD_TYPE_SECT | PMD_SECT_AF | PMD_SECT_S
  71. #endif
  72. #ifdef CONFIG_ARM64_64K_PAGES
  73. #define MM_MMUFLAGS PTE_ATTRINDX(MT_NORMAL) | PTE_FLAGS
  74. #else
  75. #define MM_MMUFLAGS PMD_ATTRINDX(MT_NORMAL) | PMD_FLAGS
  76. #endif
  77. /*
  78. * Kernel startup entry point.
  79. * ---------------------------
  80. *
  81. * The requirements are:
  82. * MMU = off, D-cache = off, I-cache = on or off,
  83. * x0 = physical address to the FDT blob.
  84. *
  85. * This code is mostly position independent so you call this at
  86. * __pa(PAGE_OFFSET + TEXT_OFFSET).
  87. *
  88. * Note that the callee-saved registers are used for storing variables
  89. * that are useful before the MMU is enabled. The allocations are described
  90. * in the entry routines.
  91. */
  92. __HEAD
  93. /*
  94. * DO NOT MODIFY. Image header expected by Linux boot-loaders.
  95. */
  96. b stext // branch to kernel start, magic
  97. .long 0 // reserved
  98. .quad TEXT_OFFSET // Image load offset from start of RAM
  99. .quad 0 // reserved
  100. .quad 0 // reserved
  101. .quad 0 // reserved
  102. .quad 0 // reserved
  103. .quad 0 // reserved
  104. .byte 0x41 // Magic number, "ARM\x64"
  105. .byte 0x52
  106. .byte 0x4d
  107. .byte 0x64
  108. .word 0 // reserved
  109. ENTRY(stext)
  110. mov x21, x0 // x21=FDT
  111. bl __calc_phys_offset // x24=PHYS_OFFSET, x28=PHYS_OFFSET-PAGE_OFFSET
  112. bl el2_setup // Drop to EL1
  113. mrs x22, midr_el1 // x22=cpuid
  114. mov x0, x22
  115. bl lookup_processor_type
  116. mov x23, x0 // x23=current cpu_table
  117. cbz x23, __error_p // invalid processor (x23=0)?
  118. bl __vet_fdt
  119. bl __create_page_tables // x25=TTBR0, x26=TTBR1
  120. /*
  121. * The following calls CPU specific code in a position independent
  122. * manner. See arch/arm64/mm/proc.S for details. x23 = base of
  123. * cpu_info structure selected by lookup_processor_type above.
  124. * On return, the CPU will be ready for the MMU to be turned on and
  125. * the TCR will have been set.
  126. */
  127. ldr x27, __switch_data // address to jump to after
  128. // MMU has been enabled
  129. adr lr, __enable_mmu // return (PIC) address
  130. ldr x12, [x23, #CPU_INFO_SETUP]
  131. add x12, x12, x28 // __virt_to_phys
  132. br x12 // initialise processor
  133. ENDPROC(stext)
  134. /*
  135. * If we're fortunate enough to boot at EL2, ensure that the world is
  136. * sane before dropping to EL1.
  137. */
  138. ENTRY(el2_setup)
  139. mrs x0, CurrentEL
  140. cmp x0, #PSR_MODE_EL2t
  141. ccmp x0, #PSR_MODE_EL2h, #0x4, ne
  142. ldr x0, =__boot_cpu_mode // Compute __boot_cpu_mode
  143. add x0, x0, x28
  144. b.eq 1f
  145. str wzr, [x0] // Remember we don't have EL2...
  146. ret
  147. /* Hyp configuration. */
  148. 1: ldr w1, =BOOT_CPU_MODE_EL2
  149. str w1, [x0, #4] // This CPU has EL2
  150. mov x0, #(1 << 31) // 64-bit EL1
  151. msr hcr_el2, x0
  152. /* Generic timers. */
  153. mrs x0, cnthctl_el2
  154. orr x0, x0, #3 // Enable EL1 physical timers
  155. msr cnthctl_el2, x0
  156. msr cntvoff_el2, xzr // Clear virtual offset
  157. /* Populate ID registers. */
  158. mrs x0, midr_el1
  159. mrs x1, mpidr_el1
  160. msr vpidr_el2, x0
  161. msr vmpidr_el2, x1
  162. /* sctlr_el1 */
  163. mov x0, #0x0800 // Set/clear RES{1,0} bits
  164. movk x0, #0x30d0, lsl #16
  165. msr sctlr_el1, x0
  166. /* Coprocessor traps. */
  167. mov x0, #0x33ff
  168. msr cptr_el2, x0 // Disable copro. traps to EL2
  169. #ifdef CONFIG_COMPAT
  170. msr hstr_el2, xzr // Disable CP15 traps to EL2
  171. #endif
  172. /* Stage-2 translation */
  173. msr vttbr_el2, xzr
  174. /* Hypervisor stub */
  175. adr x0, __hyp_stub_vectors
  176. msr vbar_el2, x0
  177. /* spsr */
  178. mov x0, #(PSR_F_BIT | PSR_I_BIT | PSR_A_BIT | PSR_D_BIT |\
  179. PSR_MODE_EL1h)
  180. msr spsr_el2, x0
  181. msr elr_el2, lr
  182. eret
  183. ENDPROC(el2_setup)
  184. /*
  185. * We need to find out the CPU boot mode long after boot, so we need to
  186. * store it in a writable variable.
  187. *
  188. * This is not in .bss, because we set it sufficiently early that the boot-time
  189. * zeroing of .bss would clobber it.
  190. */
  191. .pushsection .data
  192. ENTRY(__boot_cpu_mode)
  193. .long BOOT_CPU_MODE_EL2
  194. .long 0
  195. .popsection
  196. .align 3
  197. 2: .quad .
  198. .quad PAGE_OFFSET
  199. #ifdef CONFIG_SMP
  200. .pushsection .smp.pen.text, "ax"
  201. .align 3
  202. 1: .quad .
  203. .quad secondary_holding_pen_release
  204. /*
  205. * This provides a "holding pen" for platforms to hold all secondary
  206. * cores are held until we're ready for them to initialise.
  207. */
  208. ENTRY(secondary_holding_pen)
  209. bl __calc_phys_offset // x24=phys offset
  210. bl el2_setup // Drop to EL1
  211. mrs x0, mpidr_el1
  212. ldr x1, =MPIDR_HWID_BITMASK
  213. and x0, x0, x1
  214. adr x1, 1b
  215. ldp x2, x3, [x1]
  216. sub x1, x1, x2
  217. add x3, x3, x1
  218. pen: ldr x4, [x3]
  219. cmp x4, x0
  220. b.eq secondary_startup
  221. wfe
  222. b pen
  223. ENDPROC(secondary_holding_pen)
  224. .popsection
  225. ENTRY(secondary_startup)
  226. /*
  227. * Common entry point for secondary CPUs.
  228. */
  229. mrs x22, midr_el1 // x22=cpuid
  230. mov x0, x22
  231. bl lookup_processor_type
  232. mov x23, x0 // x23=current cpu_table
  233. cbz x23, __error_p // invalid processor (x23=0)?
  234. pgtbl x25, x26, x24 // x25=TTBR0, x26=TTBR1
  235. ldr x12, [x23, #CPU_INFO_SETUP]
  236. add x12, x12, x28 // __virt_to_phys
  237. blr x12 // initialise processor
  238. ldr x21, =secondary_data
  239. ldr x27, =__secondary_switched // address to jump to after enabling the MMU
  240. b __enable_mmu
  241. ENDPROC(secondary_startup)
  242. ENTRY(__secondary_switched)
  243. ldr x0, [x21] // get secondary_data.stack
  244. mov sp, x0
  245. mov x29, #0
  246. b secondary_start_kernel
  247. ENDPROC(__secondary_switched)
  248. #endif /* CONFIG_SMP */
  249. /*
  250. * Setup common bits before finally enabling the MMU. Essentially this is just
  251. * loading the page table pointer and vector base registers.
  252. *
  253. * On entry to this code, x0 must contain the SCTLR_EL1 value for turning on
  254. * the MMU.
  255. */
  256. __enable_mmu:
  257. ldr x5, =vectors
  258. msr vbar_el1, x5
  259. msr ttbr0_el1, x25 // load TTBR0
  260. msr ttbr1_el1, x26 // load TTBR1
  261. isb
  262. b __turn_mmu_on
  263. ENDPROC(__enable_mmu)
  264. /*
  265. * Enable the MMU. This completely changes the structure of the visible memory
  266. * space. You will not be able to trace execution through this.
  267. *
  268. * x0 = system control register
  269. * x27 = *virtual* address to jump to upon completion
  270. *
  271. * other registers depend on the function called upon completion
  272. */
  273. .align 6
  274. __turn_mmu_on:
  275. msr sctlr_el1, x0
  276. isb
  277. br x27
  278. ENDPROC(__turn_mmu_on)
  279. /*
  280. * Calculate the start of physical memory.
  281. */
  282. __calc_phys_offset:
  283. adr x0, 1f
  284. ldp x1, x2, [x0]
  285. sub x28, x0, x1 // x28 = PHYS_OFFSET - PAGE_OFFSET
  286. add x24, x2, x28 // x24 = PHYS_OFFSET
  287. ret
  288. ENDPROC(__calc_phys_offset)
  289. .align 3
  290. 1: .quad .
  291. .quad PAGE_OFFSET
  292. /*
  293. * Macro to populate the PGD for the corresponding block entry in the next
  294. * level (tbl) for the given virtual address.
  295. *
  296. * Preserves: pgd, tbl, virt
  297. * Corrupts: tmp1, tmp2
  298. */
  299. .macro create_pgd_entry, pgd, tbl, virt, tmp1, tmp2
  300. lsr \tmp1, \virt, #PGDIR_SHIFT
  301. and \tmp1, \tmp1, #PTRS_PER_PGD - 1 // PGD index
  302. orr \tmp2, \tbl, #3 // PGD entry table type
  303. str \tmp2, [\pgd, \tmp1, lsl #3]
  304. .endm
  305. /*
  306. * Macro to populate block entries in the page table for the start..end
  307. * virtual range (inclusive).
  308. *
  309. * Preserves: tbl, flags
  310. * Corrupts: phys, start, end, pstate
  311. */
  312. .macro create_block_map, tbl, flags, phys, start, end, idmap=0
  313. lsr \phys, \phys, #BLOCK_SHIFT
  314. .if \idmap
  315. and \start, \phys, #PTRS_PER_PTE - 1 // table index
  316. .else
  317. lsr \start, \start, #BLOCK_SHIFT
  318. and \start, \start, #PTRS_PER_PTE - 1 // table index
  319. .endif
  320. orr \phys, \flags, \phys, lsl #BLOCK_SHIFT // table entry
  321. .ifnc \start,\end
  322. lsr \end, \end, #BLOCK_SHIFT
  323. and \end, \end, #PTRS_PER_PTE - 1 // table end index
  324. .endif
  325. 9999: str \phys, [\tbl, \start, lsl #3] // store the entry
  326. .ifnc \start,\end
  327. add \start, \start, #1 // next entry
  328. add \phys, \phys, #BLOCK_SIZE // next block
  329. cmp \start, \end
  330. b.ls 9999b
  331. .endif
  332. .endm
  333. /*
  334. * Setup the initial page tables. We only setup the barest amount which is
  335. * required to get the kernel running. The following sections are required:
  336. * - identity mapping to enable the MMU (low address, TTBR0)
  337. * - first few MB of the kernel linear mapping to jump to once the MMU has
  338. * been enabled, including the FDT blob (TTBR1)
  339. * - UART mapping if CONFIG_EARLY_PRINTK is enabled (TTBR1)
  340. */
  341. __create_page_tables:
  342. pgtbl x25, x26, x24 // idmap_pg_dir and swapper_pg_dir addresses
  343. /*
  344. * Clear the idmap and swapper page tables.
  345. */
  346. mov x0, x25
  347. add x6, x26, #SWAPPER_DIR_SIZE
  348. 1: stp xzr, xzr, [x0], #16
  349. stp xzr, xzr, [x0], #16
  350. stp xzr, xzr, [x0], #16
  351. stp xzr, xzr, [x0], #16
  352. cmp x0, x6
  353. b.lo 1b
  354. ldr x7, =MM_MMUFLAGS
  355. /*
  356. * Create the identity mapping.
  357. */
  358. add x0, x25, #PAGE_SIZE // section table address
  359. adr x3, __turn_mmu_on // virtual/physical address
  360. create_pgd_entry x25, x0, x3, x5, x6
  361. create_block_map x0, x7, x3, x5, x5, idmap=1
  362. /*
  363. * Map the kernel image (starting with PHYS_OFFSET).
  364. */
  365. add x0, x26, #PAGE_SIZE // section table address
  366. mov x5, #PAGE_OFFSET
  367. create_pgd_entry x26, x0, x5, x3, x6
  368. ldr x6, =KERNEL_END - 1
  369. mov x3, x24 // phys offset
  370. create_block_map x0, x7, x3, x5, x6
  371. /*
  372. * Map the FDT blob (maximum 2MB; must be within 512MB of
  373. * PHYS_OFFSET).
  374. */
  375. mov x3, x21 // FDT phys address
  376. and x3, x3, #~((1 << 21) - 1) // 2MB aligned
  377. mov x6, #PAGE_OFFSET
  378. sub x5, x3, x24 // subtract PHYS_OFFSET
  379. tst x5, #~((1 << 29) - 1) // within 512MB?
  380. csel x21, xzr, x21, ne // zero the FDT pointer
  381. b.ne 1f
  382. add x5, x5, x6 // __va(FDT blob)
  383. add x6, x5, #1 << 21 // 2MB for the FDT blob
  384. sub x6, x6, #1 // inclusive range
  385. create_block_map x0, x7, x3, x5, x6
  386. 1:
  387. #ifdef CONFIG_EARLY_PRINTK
  388. /*
  389. * Create the pgd entry for the UART mapping. The full mapping is done
  390. * later based earlyprintk kernel parameter.
  391. */
  392. ldr x5, =EARLYCON_IOBASE // UART virtual address
  393. add x0, x26, #2 * PAGE_SIZE // section table address
  394. create_pgd_entry x26, x0, x5, x6, x7
  395. #endif
  396. ret
  397. ENDPROC(__create_page_tables)
  398. .ltorg
  399. .align 3
  400. .type __switch_data, %object
  401. __switch_data:
  402. .quad __mmap_switched
  403. .quad __data_loc // x4
  404. .quad _data // x5
  405. .quad __bss_start // x6
  406. .quad _end // x7
  407. .quad processor_id // x4
  408. .quad __fdt_pointer // x5
  409. .quad memstart_addr // x6
  410. .quad init_thread_union + THREAD_START_SP // sp
  411. /*
  412. * The following fragment of code is executed with the MMU on in MMU mode, and
  413. * uses absolute addresses; this is not position independent.
  414. */
  415. __mmap_switched:
  416. adr x3, __switch_data + 8
  417. ldp x4, x5, [x3], #16
  418. ldp x6, x7, [x3], #16
  419. cmp x4, x5 // Copy data segment if needed
  420. 1: ccmp x5, x6, #4, ne
  421. b.eq 2f
  422. ldr x16, [x4], #8
  423. str x16, [x5], #8
  424. b 1b
  425. 2:
  426. 1: cmp x6, x7
  427. b.hs 2f
  428. str xzr, [x6], #8 // Clear BSS
  429. b 1b
  430. 2:
  431. ldp x4, x5, [x3], #16
  432. ldr x6, [x3], #8
  433. ldr x16, [x3]
  434. mov sp, x16
  435. str x22, [x4] // Save processor ID
  436. str x21, [x5] // Save FDT pointer
  437. str x24, [x6] // Save PHYS_OFFSET
  438. mov x29, #0
  439. b start_kernel
  440. ENDPROC(__mmap_switched)
  441. /*
  442. * Exception handling. Something went wrong and we can't proceed. We ought to
  443. * tell the user, but since we don't have any guarantee that we're even
  444. * running on the right architecture, we do virtually nothing.
  445. */
  446. __error_p:
  447. ENDPROC(__error_p)
  448. __error:
  449. 1: nop
  450. b 1b
  451. ENDPROC(__error)
  452. /*
  453. * This function gets the processor ID in w0 and searches the cpu_table[] for
  454. * a match. It returns a pointer to the struct cpu_info it found. The
  455. * cpu_table[] must end with an empty (all zeros) structure.
  456. *
  457. * This routine can be called via C code and it needs to work with the MMU
  458. * both disabled and enabled (the offset is calculated automatically).
  459. */
  460. ENTRY(lookup_processor_type)
  461. adr x1, __lookup_processor_type_data
  462. ldp x2, x3, [x1]
  463. sub x1, x1, x2 // get offset between VA and PA
  464. add x3, x3, x1 // convert VA to PA
  465. 1:
  466. ldp w5, w6, [x3] // load cpu_id_val and cpu_id_mask
  467. cbz w5, 2f // end of list?
  468. and w6, w6, w0
  469. cmp w5, w6
  470. b.eq 3f
  471. add x3, x3, #CPU_INFO_SZ
  472. b 1b
  473. 2:
  474. mov x3, #0 // unknown processor
  475. 3:
  476. mov x0, x3
  477. ret
  478. ENDPROC(lookup_processor_type)
  479. .align 3
  480. .type __lookup_processor_type_data, %object
  481. __lookup_processor_type_data:
  482. .quad .
  483. .quad cpu_table
  484. .size __lookup_processor_type_data, . - __lookup_processor_type_data
  485. /*
  486. * Determine validity of the x21 FDT pointer.
  487. * The dtb must be 8-byte aligned and live in the first 512M of memory.
  488. */
  489. __vet_fdt:
  490. tst x21, #0x7
  491. b.ne 1f
  492. cmp x21, x24
  493. b.lt 1f
  494. mov x0, #(1 << 29)
  495. add x0, x0, x24
  496. cmp x21, x0
  497. b.ge 1f
  498. ret
  499. 1:
  500. mov x21, #0
  501. ret
  502. ENDPROC(__vet_fdt)