fpu.S 4.9 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200
  1. /*
  2. * FPU support code, moved here from head.S so that it can be used
  3. * by chips which use other head-whatever.S files.
  4. *
  5. * Copyright (C) 1995-1996 Gary Thomas (gdt@linuxppc.org)
  6. * Copyright (C) 1996 Cort Dougan <cort@cs.nmt.edu>
  7. * Copyright (C) 1996 Paul Mackerras.
  8. * Copyright (C) 1997 Dan Malek (dmalek@jlc.net).
  9. *
  10. * This program is free software; you can redistribute it and/or
  11. * modify it under the terms of the GNU General Public License
  12. * as published by the Free Software Foundation; either version
  13. * 2 of the License, or (at your option) any later version.
  14. *
  15. */
  16. #include <asm/reg.h>
  17. #include <asm/page.h>
  18. #include <asm/mmu.h>
  19. #include <asm/pgtable.h>
  20. #include <asm/cputable.h>
  21. #include <asm/cache.h>
  22. #include <asm/thread_info.h>
  23. #include <asm/ppc_asm.h>
  24. #include <asm/asm-offsets.h>
  25. #include <asm/ptrace.h>
  26. #ifdef CONFIG_VSX
  27. #define __REST_32FPVSRS(n,c,base) \
  28. BEGIN_FTR_SECTION \
  29. b 2f; \
  30. END_FTR_SECTION_IFSET(CPU_FTR_VSX); \
  31. REST_32FPRS(n,base); \
  32. b 3f; \
  33. 2: REST_32VSRS(n,c,base); \
  34. 3:
  35. #define __SAVE_32FPVSRS(n,c,base) \
  36. BEGIN_FTR_SECTION \
  37. b 2f; \
  38. END_FTR_SECTION_IFSET(CPU_FTR_VSX); \
  39. SAVE_32FPRS(n,base); \
  40. b 3f; \
  41. 2: SAVE_32VSRS(n,c,base); \
  42. 3:
  43. #else
  44. #define __REST_32FPVSRS(n,b,base) REST_32FPRS(n, base)
  45. #define __SAVE_32FPVSRS(n,b,base) SAVE_32FPRS(n, base)
  46. #endif
  47. #define REST_32FPVSRS(n,c,base) __REST_32FPVSRS(n,__REG_##c,__REG_##base)
  48. #define SAVE_32FPVSRS(n,c,base) __SAVE_32FPVSRS(n,__REG_##c,__REG_##base)
  49. #ifdef CONFIG_PPC_TRANSACTIONAL_MEM
  50. /* void do_load_up_transact_fpu(struct thread_struct *thread)
  51. *
  52. * This is similar to load_up_fpu but for the transactional version of the FP
  53. * register set. It doesn't mess with the task MSR or valid flags.
  54. * Furthermore, we don't do lazy FP with TM currently.
  55. */
  56. _GLOBAL(do_load_up_transact_fpu)
  57. mfmsr r6
  58. ori r5,r6,MSR_FP
  59. #ifdef CONFIG_VSX
  60. BEGIN_FTR_SECTION
  61. oris r5,r5,MSR_VSX@h
  62. END_FTR_SECTION_IFSET(CPU_FTR_VSX)
  63. #endif
  64. SYNC
  65. MTMSRD(r5)
  66. addi r7,r3,THREAD_TRANSACT_FPSTATE
  67. lfd fr0,FPSTATE_FPSCR(r7)
  68. MTFSF_L(fr0)
  69. REST_32FPVSRS(0, R4, R7)
  70. blr
  71. #endif /* CONFIG_PPC_TRANSACTIONAL_MEM */
  72. /*
  73. * Enable use of the FPU, and VSX if possible, for the caller.
  74. */
  75. _GLOBAL(fp_enable)
  76. mfmsr r3
  77. ori r3,r3,MSR_FP
  78. #ifdef CONFIG_VSX
  79. BEGIN_FTR_SECTION
  80. oris r3,r3,MSR_VSX@h
  81. END_FTR_SECTION_IFSET(CPU_FTR_VSX)
  82. #endif
  83. SYNC
  84. MTMSRD(r3)
  85. isync /* (not necessary for arch 2.02 and later) */
  86. blr
  87. /*
  88. * Load state from memory into FP registers including FPSCR.
  89. * Assumes the caller has enabled FP in the MSR.
  90. */
  91. _GLOBAL(load_fp_state)
  92. lfd fr0,FPSTATE_FPSCR(r3)
  93. MTFSF_L(fr0)
  94. REST_32FPVSRS(0, R4, R3)
  95. blr
  96. /*
  97. * Store FP state into memory, including FPSCR
  98. * Assumes the caller has enabled FP in the MSR.
  99. */
  100. _GLOBAL(store_fp_state)
  101. SAVE_32FPVSRS(0, R4, R3)
  102. mffs fr0
  103. stfd fr0,FPSTATE_FPSCR(r3)
  104. blr
  105. /*
  106. * This task wants to use the FPU now.
  107. * On UP, disable FP for the task which had the FPU previously,
  108. * and save its floating-point registers in its thread_struct.
  109. * Load up this task's FP registers from its thread_struct,
  110. * enable the FPU for the current task and return to the task.
  111. * Note that on 32-bit this can only use registers that will be
  112. * restored by fast_exception_return, i.e. r3 - r6, r10 and r11.
  113. */
  114. _GLOBAL(load_up_fpu)
  115. mfmsr r5
  116. ori r5,r5,MSR_FP
  117. #ifdef CONFIG_VSX
  118. BEGIN_FTR_SECTION
  119. oris r5,r5,MSR_VSX@h
  120. END_FTR_SECTION_IFSET(CPU_FTR_VSX)
  121. #endif
  122. SYNC
  123. MTMSRD(r5) /* enable use of fpu now */
  124. isync
  125. /* enable use of FP after return */
  126. #ifdef CONFIG_PPC32
  127. mfspr r5,SPRN_SPRG_THREAD /* current task's THREAD (phys) */
  128. lwz r4,THREAD_FPEXC_MODE(r5)
  129. ori r9,r9,MSR_FP /* enable FP for current */
  130. or r9,r9,r4
  131. #else
  132. ld r4,PACACURRENT(r13)
  133. addi r5,r4,THREAD /* Get THREAD */
  134. lwz r4,THREAD_FPEXC_MODE(r5)
  135. ori r12,r12,MSR_FP
  136. or r12,r12,r4
  137. std r12,_MSR(r1)
  138. #endif
  139. addi r10,r5,THREAD_FPSTATE
  140. lfd fr0,FPSTATE_FPSCR(r10)
  141. MTFSF_L(fr0)
  142. REST_32FPVSRS(0, R4, R10)
  143. /* restore registers and return */
  144. /* we haven't used ctr or xer or lr */
  145. blr
  146. /*
  147. * __giveup_fpu(tsk)
  148. * Disable FP for the task given as the argument,
  149. * and save the floating-point registers in its thread_struct.
  150. * Enables the FPU for use in the kernel on return.
  151. */
  152. _GLOBAL(__giveup_fpu)
  153. addi r3,r3,THREAD /* want THREAD of task */
  154. PPC_LL r6,THREAD_FPSAVEAREA(r3)
  155. PPC_LL r5,PT_REGS(r3)
  156. PPC_LCMPI 0,r6,0
  157. bne 2f
  158. addi r6,r3,THREAD_FPSTATE
  159. 2: PPC_LCMPI 0,r5,0
  160. SAVE_32FPVSRS(0, R4, R6)
  161. mffs fr0
  162. stfd fr0,FPSTATE_FPSCR(r6)
  163. beq 1f
  164. PPC_LL r4,_MSR-STACK_FRAME_OVERHEAD(r5)
  165. li r3,MSR_FP|MSR_FE0|MSR_FE1
  166. #ifdef CONFIG_VSX
  167. BEGIN_FTR_SECTION
  168. oris r3,r3,MSR_VSX@h
  169. END_FTR_SECTION_IFSET(CPU_FTR_VSX)
  170. #endif
  171. andc r4,r4,r3 /* disable FP for previous task */
  172. PPC_STL r4,_MSR-STACK_FRAME_OVERHEAD(r5)
  173. 1:
  174. blr
  175. /*
  176. * These are used in the alignment trap handler when emulating
  177. * single-precision loads and stores.
  178. */
  179. _GLOBAL(cvt_fd)
  180. lfs 0,0(r3)
  181. stfd 0,0(r4)
  182. blr
  183. _GLOBAL(cvt_df)
  184. lfd 0,0(r3)
  185. stfs 0,0(r4)
  186. blr