fpu.S 4.9 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191
  1. /*
  2. * FPU support code, moved here from head.S so that it can be used
  3. * by chips which use other head-whatever.S files.
  4. *
  5. * Copyright (C) 1995-1996 Gary Thomas (gdt@linuxppc.org)
  6. * Copyright (C) 1996 Cort Dougan <cort@cs.nmt.edu>
  7. * Copyright (C) 1996 Paul Mackerras.
  8. * Copyright (C) 1997 Dan Malek (dmalek@jlc.net).
  9. *
  10. * This program is free software; you can redistribute it and/or
  11. * modify it under the terms of the GNU General Public License
  12. * as published by the Free Software Foundation; either version
  13. * 2 of the License, or (at your option) any later version.
  14. *
  15. */
  16. #include <asm/reg.h>
  17. #include <asm/page.h>
  18. #include <asm/mmu.h>
  19. #include <asm/pgtable.h>
  20. #include <asm/cputable.h>
  21. #include <asm/cache.h>
  22. #include <asm/thread_info.h>
  23. #include <asm/ppc_asm.h>
  24. #include <asm/asm-offsets.h>
  25. #include <asm/ptrace.h>
  26. #ifdef CONFIG_VSX
  27. #define __REST_32FPVSRS(n,c,base) \
  28. BEGIN_FTR_SECTION \
  29. b 2f; \
  30. END_FTR_SECTION_IFSET(CPU_FTR_VSX); \
  31. REST_32FPRS(n,base); \
  32. b 3f; \
  33. 2: REST_32VSRS(n,c,base); \
  34. 3:
  35. #define __REST_32FPVSRS_TRANSACT(n,c,base) \
  36. BEGIN_FTR_SECTION \
  37. b 2f; \
  38. END_FTR_SECTION_IFSET(CPU_FTR_VSX); \
  39. REST_32FPRS_TRANSACT(n,base); \
  40. b 3f; \
  41. 2: REST_32VSRS_TRANSACT(n,c,base); \
  42. 3:
  43. #define __SAVE_32FPVSRS(n,c,base) \
  44. BEGIN_FTR_SECTION \
  45. b 2f; \
  46. END_FTR_SECTION_IFSET(CPU_FTR_VSX); \
  47. SAVE_32FPRS(n,base); \
  48. b 3f; \
  49. 2: SAVE_32VSRS(n,c,base); \
  50. 3:
  51. #else
  52. #define __REST_32FPVSRS(n,b,base) REST_32FPRS(n, base)
  53. #define __REST_32FPVSRS_TRANSACT(n,b,base) REST_32FPRS(n, base)
  54. #define __SAVE_32FPVSRS(n,b,base) SAVE_32FPRS(n, base)
  55. #endif
  56. #define REST_32FPVSRS(n,c,base) __REST_32FPVSRS(n,__REG_##c,__REG_##base)
  57. #define REST_32FPVSRS_TRANSACT(n,c,base) \
  58. __REST_32FPVSRS_TRANSACT(n,__REG_##c,__REG_##base)
  59. #define SAVE_32FPVSRS(n,c,base) __SAVE_32FPVSRS(n,__REG_##c,__REG_##base)
  60. /*
  61. * This task wants to use the FPU now.
  62. * On UP, disable FP for the task which had the FPU previously,
  63. * and save its floating-point registers in its thread_struct.
  64. * Load up this task's FP registers from its thread_struct,
  65. * enable the FPU for the current task and return to the task.
  66. */
  67. _GLOBAL(load_up_fpu)
  68. mfmsr r5
  69. ori r5,r5,MSR_FP
  70. #ifdef CONFIG_VSX
  71. BEGIN_FTR_SECTION
  72. oris r5,r5,MSR_VSX@h
  73. END_FTR_SECTION_IFSET(CPU_FTR_VSX)
  74. #endif
  75. SYNC
  76. MTMSRD(r5) /* enable use of fpu now */
  77. isync
  78. /*
  79. * For SMP, we don't do lazy FPU switching because it just gets too
  80. * horrendously complex, especially when a task switches from one CPU
  81. * to another. Instead we call giveup_fpu in switch_to.
  82. */
  83. #ifndef CONFIG_SMP
  84. LOAD_REG_ADDRBASE(r3, last_task_used_math)
  85. toreal(r3)
  86. PPC_LL r4,ADDROFF(last_task_used_math)(r3)
  87. PPC_LCMPI 0,r4,0
  88. beq 1f
  89. toreal(r4)
  90. addi r4,r4,THREAD /* want last_task_used_math->thread */
  91. SAVE_32FPVSRS(0, R5, R4)
  92. mffs fr0
  93. stfd fr0,THREAD_FPSCR(r4)
  94. PPC_LL r5,PT_REGS(r4)
  95. toreal(r5)
  96. PPC_LL r4,_MSR-STACK_FRAME_OVERHEAD(r5)
  97. li r10,MSR_FP|MSR_FE0|MSR_FE1
  98. andc r4,r4,r10 /* disable FP for previous task */
  99. PPC_STL r4,_MSR-STACK_FRAME_OVERHEAD(r5)
  100. 1:
  101. #endif /* CONFIG_SMP */
  102. /* enable use of FP after return */
  103. #ifdef CONFIG_PPC32
  104. mfspr r5,SPRN_SPRG_THREAD /* current task's THREAD (phys) */
  105. lwz r4,THREAD_FPEXC_MODE(r5)
  106. ori r9,r9,MSR_FP /* enable FP for current */
  107. or r9,r9,r4
  108. #else
  109. ld r4,PACACURRENT(r13)
  110. addi r5,r4,THREAD /* Get THREAD */
  111. lwz r4,THREAD_FPEXC_MODE(r5)
  112. ori r12,r12,MSR_FP
  113. or r12,r12,r4
  114. std r12,_MSR(r1)
  115. #endif
  116. lfd fr0,THREAD_FPSCR(r5)
  117. MTFSF_L(fr0)
  118. REST_32FPVSRS(0, R4, R5)
  119. #ifndef CONFIG_SMP
  120. subi r4,r5,THREAD
  121. fromreal(r4)
  122. PPC_STL r4,ADDROFF(last_task_used_math)(r3)
  123. #endif /* CONFIG_SMP */
  124. /* restore registers and return */
  125. /* we haven't used ctr or xer or lr */
  126. blr
  127. /*
  128. * giveup_fpu(tsk)
  129. * Disable FP for the task given as the argument,
  130. * and save the floating-point registers in its thread_struct.
  131. * Enables the FPU for use in the kernel on return.
  132. */
  133. _GLOBAL(giveup_fpu)
  134. mfmsr r5
  135. ori r5,r5,MSR_FP
  136. #ifdef CONFIG_VSX
  137. BEGIN_FTR_SECTION
  138. oris r5,r5,MSR_VSX@h
  139. END_FTR_SECTION_IFSET(CPU_FTR_VSX)
  140. #endif
  141. SYNC_601
  142. ISYNC_601
  143. MTMSRD(r5) /* enable use of fpu now */
  144. SYNC_601
  145. isync
  146. PPC_LCMPI 0,r3,0
  147. beqlr- /* if no previous owner, done */
  148. addi r3,r3,THREAD /* want THREAD of task */
  149. PPC_LL r5,PT_REGS(r3)
  150. PPC_LCMPI 0,r5,0
  151. SAVE_32FPVSRS(0, R4 ,R3)
  152. mffs fr0
  153. stfd fr0,THREAD_FPSCR(r3)
  154. beq 1f
  155. PPC_LL r4,_MSR-STACK_FRAME_OVERHEAD(r5)
  156. li r3,MSR_FP|MSR_FE0|MSR_FE1
  157. #ifdef CONFIG_VSX
  158. BEGIN_FTR_SECTION
  159. oris r3,r3,MSR_VSX@h
  160. END_FTR_SECTION_IFSET(CPU_FTR_VSX)
  161. #endif
  162. andc r4,r4,r3 /* disable FP for previous task */
  163. PPC_STL r4,_MSR-STACK_FRAME_OVERHEAD(r5)
  164. 1:
  165. #ifndef CONFIG_SMP
  166. li r5,0
  167. LOAD_REG_ADDRBASE(r4,last_task_used_math)
  168. PPC_STL r5,ADDROFF(last_task_used_math)(r4)
  169. #endif /* CONFIG_SMP */
  170. blr
  171. /*
  172. * These are used in the alignment trap handler when emulating
  173. * single-precision loads and stores.
  174. */
  175. _GLOBAL(cvt_fd)
  176. lfs 0,0(r3)
  177. stfd 0,0(r4)
  178. blr
  179. _GLOBAL(cvt_df)
  180. lfd 0,0(r3)
  181. stfs 0,0(r4)
  182. blr