vfphw.S 8.7 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319
  1. /*
  2. * linux/arch/arm/vfp/vfphw.S
  3. *
  4. * Copyright (C) 2004 ARM Limited.
  5. * Written by Deep Blue Solutions Limited.
  6. *
  7. * This program is free software; you can redistribute it and/or modify
  8. * it under the terms of the GNU General Public License version 2 as
  9. * published by the Free Software Foundation.
  10. *
  11. * This code is called from the kernel's undefined instruction trap.
  12. * r9 holds the return address for successful handling.
  13. * lr holds the return address for unrecognised instructions.
  14. * r10 points at the start of the private FP workspace in the thread structure
  15. * sp points to a struct pt_regs (as defined in include/asm/proc/ptrace.h)
  16. */
  17. #include <asm/thread_info.h>
  18. #include <asm/vfpmacros.h>
  19. #include <linux/kern_levels.h>
  20. #include "../kernel/entry-header.S"
  21. .macro DBGSTR, str
  22. #ifdef DEBUG
  23. stmfd sp!, {r0-r3, ip, lr}
  24. ldr r0, =1f
  25. bl printk
  26. ldmfd sp!, {r0-r3, ip, lr}
  27. .pushsection .rodata, "a"
  28. 1: .ascii KERN_DEBUG "VFP: \str\n"
  29. .byte 0
  30. .previous
  31. #endif
  32. .endm
  33. .macro DBGSTR1, str, arg
  34. #ifdef DEBUG
  35. stmfd sp!, {r0-r3, ip, lr}
  36. mov r1, \arg
  37. ldr r0, =1f
  38. bl printk
  39. ldmfd sp!, {r0-r3, ip, lr}
  40. .pushsection .rodata, "a"
  41. 1: .ascii KERN_DEBUG "VFP: \str\n"
  42. .byte 0
  43. .previous
  44. #endif
  45. .endm
  46. .macro DBGSTR3, str, arg1, arg2, arg3
  47. #ifdef DEBUG
  48. stmfd sp!, {r0-r3, ip, lr}
  49. mov r3, \arg3
  50. mov r2, \arg2
  51. mov r1, \arg1
  52. ldr r0, =1f
  53. bl printk
  54. ldmfd sp!, {r0-r3, ip, lr}
  55. .pushsection .rodata, "a"
  56. 1: .ascii KERN_DEBUG "VFP: \str\n"
  57. .byte 0
  58. .previous
  59. #endif
  60. .endm
  61. @ VFP hardware support entry point.
  62. @
  63. @ r0 = instruction opcode (32-bit ARM or two 16-bit Thumb)
  64. @ r2 = PC value to resume execution after successful emulation
  65. @ r9 = normal "successful" return address
  66. @ r10 = vfp_state union
  67. @ r11 = CPU number
  68. @ lr = unrecognised instruction return address
  69. @ IRQs enabled.
  70. ENTRY(vfp_support_entry)
  71. DBGSTR3 "instr %08x pc %08x state %p", r0, r2, r10
  72. VFPFMRX r1, FPEXC @ Is the VFP enabled?
  73. DBGSTR1 "fpexc %08x", r1
  74. tst r1, #FPEXC_EN
  75. bne look_for_VFP_exceptions @ VFP is already enabled
  76. DBGSTR1 "enable %x", r10
  77. ldr r3, vfp_current_hw_state_address
  78. orr r1, r1, #FPEXC_EN @ user FPEXC has the enable bit set
  79. ldr r4, [r3, r11, lsl #2] @ vfp_current_hw_state pointer
  80. bic r5, r1, #FPEXC_EX @ make sure exceptions are disabled
  81. cmp r4, r10 @ this thread owns the hw context?
  82. #ifndef CONFIG_SMP
  83. @ For UP, checking that this thread owns the hw context is
  84. @ sufficient to determine that the hardware state is valid.
  85. beq vfp_hw_state_valid
  86. @ On UP, we lazily save the VFP context. As a different
  87. @ thread wants ownership of the VFP hardware, save the old
  88. @ state if there was a previous (valid) owner.
  89. VFPFMXR FPEXC, r5 @ enable VFP, disable any pending
  90. @ exceptions, so we can get at the
  91. @ rest of it
  92. DBGSTR1 "save old state %p", r4
  93. cmp r4, #0 @ if the vfp_current_hw_state is NULL
  94. beq vfp_reload_hw @ then the hw state needs reloading
  95. VFPFSTMIA r4, r5 @ save the working registers
  96. VFPFMRX r5, FPSCR @ current status
  97. #ifndef CONFIG_CPU_FEROCEON
  98. tst r1, #FPEXC_EX @ is there additional state to save?
  99. beq 1f
  100. VFPFMRX r6, FPINST @ FPINST (only if FPEXC.EX is set)
  101. tst r1, #FPEXC_FP2V @ is there an FPINST2 to read?
  102. beq 1f
  103. VFPFMRX r8, FPINST2 @ FPINST2 if needed (and present)
  104. 1:
  105. #endif
  106. stmia r4, {r1, r5, r6, r8} @ save FPEXC, FPSCR, FPINST, FPINST2
  107. vfp_reload_hw:
  108. #else
  109. @ For SMP, if this thread does not own the hw context, then we
  110. @ need to reload it. No need to save the old state as on SMP,
  111. @ we always save the state when we switch away from a thread.
  112. bne vfp_reload_hw
  113. @ This thread has ownership of the current hardware context.
  114. @ However, it may have been migrated to another CPU, in which
  115. @ case the saved state is newer than the hardware context.
  116. @ Check this by looking at the CPU number which the state was
  117. @ last loaded onto.
  118. ldr ip, [r10, #VFP_CPU]
  119. teq ip, r11
  120. beq vfp_hw_state_valid
  121. vfp_reload_hw:
  122. @ We're loading this threads state into the VFP hardware. Update
  123. @ the CPU number which contains the most up to date VFP context.
  124. str r11, [r10, #VFP_CPU]
  125. VFPFMXR FPEXC, r5 @ enable VFP, disable any pending
  126. @ exceptions, so we can get at the
  127. @ rest of it
  128. #endif
  129. DBGSTR1 "load state %p", r10
  130. str r10, [r3, r11, lsl #2] @ update the vfp_current_hw_state pointer
  131. @ Load the saved state back into the VFP
  132. VFPFLDMIA r10, r5 @ reload the working registers while
  133. @ FPEXC is in a safe state
  134. ldmia r10, {r1, r5, r6, r8} @ load FPEXC, FPSCR, FPINST, FPINST2
  135. #ifndef CONFIG_CPU_FEROCEON
  136. tst r1, #FPEXC_EX @ is there additional state to restore?
  137. beq 1f
  138. VFPFMXR FPINST, r6 @ restore FPINST (only if FPEXC.EX is set)
  139. tst r1, #FPEXC_FP2V @ is there an FPINST2 to write?
  140. beq 1f
  141. VFPFMXR FPINST2, r8 @ FPINST2 if needed (and present)
  142. 1:
  143. #endif
  144. VFPFMXR FPSCR, r5 @ restore status
  145. @ The context stored in the VFP hardware is up to date with this thread
  146. vfp_hw_state_valid:
  147. tst r1, #FPEXC_EX
  148. bne process_exception @ might as well handle the pending
  149. @ exception before retrying branch
  150. @ out before setting an FPEXC that
  151. @ stops us reading stuff
  152. VFPFMXR FPEXC, r1 @ Restore FPEXC last
  153. sub r2, r2, #4 @ Retry current instruction - if Thumb
  154. str r2, [sp, #S_PC] @ mode it's two 16-bit instructions,
  155. @ else it's one 32-bit instruction, so
  156. @ always subtract 4 from the following
  157. @ instruction address.
  158. #ifdef CONFIG_PREEMPT_COUNT
  159. get_thread_info r10
  160. ldr r4, [r10, #TI_PREEMPT] @ get preempt count
  161. sub r11, r4, #1 @ decrement it
  162. str r11, [r10, #TI_PREEMPT]
  163. #endif
  164. mov pc, r9 @ we think we have handled things
  165. look_for_VFP_exceptions:
  166. @ Check for synchronous or asynchronous exception
  167. tst r1, #FPEXC_EX | FPEXC_DEX
  168. bne process_exception
  169. @ On some implementations of the VFP subarch 1, setting FPSCR.IXE
  170. @ causes all the CDP instructions to be bounced synchronously without
  171. @ setting the FPEXC.EX bit
  172. VFPFMRX r5, FPSCR
  173. tst r5, #FPSCR_IXE
  174. bne process_exception
  175. @ Fall into hand on to next handler - appropriate coproc instr
  176. @ not recognised by VFP
  177. DBGSTR "not VFP"
  178. #ifdef CONFIG_PREEMPT_COUNT
  179. get_thread_info r10
  180. ldr r4, [r10, #TI_PREEMPT] @ get preempt count
  181. sub r11, r4, #1 @ decrement it
  182. str r11, [r10, #TI_PREEMPT]
  183. #endif
  184. mov pc, lr
  185. process_exception:
  186. DBGSTR "bounce"
  187. mov r2, sp @ nothing stacked - regdump is at TOS
  188. mov lr, r9 @ setup for a return to the user code.
  189. @ Now call the C code to package up the bounce to the support code
  190. @ r0 holds the trigger instruction
  191. @ r1 holds the FPEXC value
  192. @ r2 pointer to register dump
  193. b VFP_bounce @ we have handled this - the support
  194. @ code will raise an exception if
  195. @ required. If not, the user code will
  196. @ retry the faulted instruction
  197. ENDPROC(vfp_support_entry)
  198. ENTRY(vfp_save_state)
  199. @ Save the current VFP state
  200. @ r0 - save location
  201. @ r1 - FPEXC
  202. DBGSTR1 "save VFP state %p", r0
  203. VFPFSTMIA r0, r2 @ save the working registers
  204. VFPFMRX r2, FPSCR @ current status
  205. tst r1, #FPEXC_EX @ is there additional state to save?
  206. beq 1f
  207. VFPFMRX r3, FPINST @ FPINST (only if FPEXC.EX is set)
  208. tst r1, #FPEXC_FP2V @ is there an FPINST2 to read?
  209. beq 1f
  210. VFPFMRX r12, FPINST2 @ FPINST2 if needed (and present)
  211. 1:
  212. stmia r0, {r1, r2, r3, r12} @ save FPEXC, FPSCR, FPINST, FPINST2
  213. mov pc, lr
  214. ENDPROC(vfp_save_state)
  215. .align
  216. vfp_current_hw_state_address:
  217. .word vfp_current_hw_state
  218. .macro tbl_branch, base, tmp, shift
  219. #ifdef CONFIG_THUMB2_KERNEL
  220. adr \tmp, 1f
  221. add \tmp, \tmp, \base, lsl \shift
  222. mov pc, \tmp
  223. #else
  224. add pc, pc, \base, lsl \shift
  225. mov r0, r0
  226. #endif
  227. 1:
  228. .endm
  229. ENTRY(vfp_get_float)
  230. tbl_branch r0, r3, #3
  231. .irp dr,0,1,2,3,4,5,6,7,8,9,10,11,12,13,14,15
  232. 1: mrc p10, 0, r0, c\dr, c0, 0 @ fmrs r0, s0
  233. mov pc, lr
  234. .org 1b + 8
  235. 1: mrc p10, 0, r0, c\dr, c0, 4 @ fmrs r0, s1
  236. mov pc, lr
  237. .org 1b + 8
  238. .endr
  239. ENDPROC(vfp_get_float)
  240. ENTRY(vfp_put_float)
  241. tbl_branch r1, r3, #3
  242. .irp dr,0,1,2,3,4,5,6,7,8,9,10,11,12,13,14,15
  243. 1: mcr p10, 0, r0, c\dr, c0, 0 @ fmsr r0, s0
  244. mov pc, lr
  245. .org 1b + 8
  246. 1: mcr p10, 0, r0, c\dr, c0, 4 @ fmsr r0, s1
  247. mov pc, lr
  248. .org 1b + 8
  249. .endr
  250. ENDPROC(vfp_put_float)
  251. ENTRY(vfp_get_double)
  252. tbl_branch r0, r3, #3
  253. .irp dr,0,1,2,3,4,5,6,7,8,9,10,11,12,13,14,15
  254. 1: fmrrd r0, r1, d\dr
  255. mov pc, lr
  256. .org 1b + 8
  257. .endr
  258. #ifdef CONFIG_VFPv3
  259. @ d16 - d31 registers
  260. .irp dr,0,1,2,3,4,5,6,7,8,9,10,11,12,13,14,15
  261. 1: mrrc p11, 3, r0, r1, c\dr @ fmrrd r0, r1, d\dr
  262. mov pc, lr
  263. .org 1b + 8
  264. .endr
  265. #endif
  266. @ virtual register 16 (or 32 if VFPv3) for compare with zero
  267. mov r0, #0
  268. mov r1, #0
  269. mov pc, lr
  270. ENDPROC(vfp_get_double)
  271. ENTRY(vfp_put_double)
  272. tbl_branch r2, r3, #3
  273. .irp dr,0,1,2,3,4,5,6,7,8,9,10,11,12,13,14,15
  274. 1: fmdrr d\dr, r0, r1
  275. mov pc, lr
  276. .org 1b + 8
  277. .endr
  278. #ifdef CONFIG_VFPv3
  279. @ d16 - d31 registers
  280. .irp dr,0,1,2,3,4,5,6,7,8,9,10,11,12,13,14,15
  281. 1: mcrr p11, 3, r0, r1, c\dr @ fmdrr r0, r1, d\dr
  282. mov pc, lr
  283. .org 1b + 8
  284. .endr
  285. #endif
  286. ENDPROC(vfp_put_double)