octeon_switch.S 15 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603
  1. /*
  2. * This file is subject to the terms and conditions of the GNU General Public
  3. * License. See the file "COPYING" in the main directory of this archive
  4. * for more details.
  5. *
  6. * Copyright (C) 1994, 1995, 1996, 1998, 1999, 2002, 2003 Ralf Baechle
  7. * Copyright (C) 1996 David S. Miller (davem@davemloft.net)
  8. * Copyright (C) 1994, 1995, 1996, by Andreas Busse
  9. * Copyright (C) 1999 Silicon Graphics, Inc.
  10. * Copyright (C) 2000 MIPS Technologies, Inc.
  11. * written by Carsten Langgaard, carstenl@mips.com
  12. */
  13. #define USE_ALTERNATE_RESUME_IMPL 1
  14. .set push
  15. .set arch=mips64r2
  16. #include "r4k_switch.S"
  17. .set pop
  18. /*
  19. * task_struct *resume(task_struct *prev, task_struct *next,
  20. * struct thread_info *next_ti, int usedfpu)
  21. */
  22. .align 7
  23. LEAF(resume)
  24. .set arch=octeon
  25. mfc0 t1, CP0_STATUS
  26. LONG_S t1, THREAD_STATUS(a0)
  27. cpu_save_nonscratch a0
  28. LONG_S ra, THREAD_REG31(a0)
  29. /*
  30. * check if we need to save FPU registers
  31. */
  32. .set push
  33. .set noreorder
  34. beqz a3, 1f
  35. PTR_L t3, TASK_THREAD_INFO(a0)
  36. .set pop
  37. /*
  38. * clear saved user stack CU1 bit
  39. */
  40. LONG_L t0, ST_OFF(t3)
  41. li t1, ~ST0_CU1
  42. and t0, t0, t1
  43. LONG_S t0, ST_OFF(t3)
  44. .set push
  45. .set arch=mips64r2
  46. fpu_save_double a0 t0 t1 # c0_status passed in t0
  47. # clobbers t1
  48. .set pop
  49. 1:
  50. /* check if we need to save COP2 registers */
  51. LONG_L t0, ST_OFF(t3)
  52. bbit0 t0, 30, 1f
  53. /* Disable COP2 in the stored process state */
  54. li t1, ST0_CU2
  55. xor t0, t1
  56. LONG_S t0, ST_OFF(t3)
  57. /* Enable COP2 so we can save it */
  58. mfc0 t0, CP0_STATUS
  59. or t0, t1
  60. mtc0 t0, CP0_STATUS
  61. /* Save COP2 */
  62. daddu a0, THREAD_CP2
  63. jal octeon_cop2_save
  64. dsubu a0, THREAD_CP2
  65. /* Disable COP2 now that we are done */
  66. mfc0 t0, CP0_STATUS
  67. li t1, ST0_CU2
  68. xor t0, t1
  69. mtc0 t0, CP0_STATUS
  70. 1:
  71. #if CONFIG_CAVIUM_OCTEON_CVMSEG_SIZE > 0
  72. /* Check if we need to store CVMSEG state */
  73. dmfc0 t0, $11,7 /* CvmMemCtl */
  74. bbit0 t0, 6, 3f /* Is user access enabled? */
  75. /* Store the CVMSEG state */
  76. /* Extract the size of CVMSEG */
  77. andi t0, 0x3f
  78. /* Multiply * (cache line size/sizeof(long)/2) */
  79. sll t0, 7-LONGLOG-1
  80. li t1, -32768 /* Base address of CVMSEG */
  81. LONG_ADDI t2, a0, THREAD_CVMSEG /* Where to store CVMSEG to */
  82. synciobdma
  83. 2:
  84. .set noreorder
  85. LONG_L t8, 0(t1) /* Load from CVMSEG */
  86. subu t0, 1 /* Decrement loop var */
  87. LONG_L t9, LONGSIZE(t1)/* Load from CVMSEG */
  88. LONG_ADDU t1, LONGSIZE*2 /* Increment loc in CVMSEG */
  89. LONG_S t8, 0(t2) /* Store CVMSEG to thread storage */
  90. LONG_ADDU t2, LONGSIZE*2 /* Increment loc in thread storage */
  91. bnez t0, 2b /* Loop until we've copied it all */
  92. LONG_S t9, -LONGSIZE(t2)/* Store CVMSEG to thread storage */
  93. .set reorder
  94. /* Disable access to CVMSEG */
  95. dmfc0 t0, $11,7 /* CvmMemCtl */
  96. xori t0, t0, 0x40 /* Bit 6 is CVMSEG user enable */
  97. dmtc0 t0, $11,7 /* CvmMemCtl */
  98. #endif
  99. 3:
  100. #if defined(CONFIG_CC_STACKPROTECTOR) && !defined(CONFIG_SMP)
  101. PTR_LA t8, __stack_chk_guard
  102. LONG_L t9, TASK_STACK_CANARY(a1)
  103. LONG_S t9, 0(t8)
  104. #endif
  105. /*
  106. * The order of restoring the registers takes care of the race
  107. * updating $28, $29 and kernelsp without disabling ints.
  108. */
  109. move $28, a2
  110. cpu_restore_nonscratch a1
  111. PTR_ADDU t0, $28, _THREAD_SIZE - 32
  112. set_saved_sp t0, t1, t2
  113. mfc0 t1, CP0_STATUS /* Do we really need this? */
  114. li a3, 0xff01
  115. and t1, a3
  116. LONG_L a2, THREAD_STATUS(a1)
  117. nor a3, $0, a3
  118. and a2, a3
  119. or a2, t1
  120. mtc0 a2, CP0_STATUS
  121. move v0, a0
  122. jr ra
  123. END(resume)
  124. /*
  125. * void octeon_cop2_save(struct octeon_cop2_state *a0)
  126. */
  127. .align 7
  128. .set push
  129. .set noreorder
  130. LEAF(octeon_cop2_save)
  131. dmfc0 t9, $9,7 /* CvmCtl register. */
  132. /* Save the COP2 CRC state */
  133. dmfc2 t0, 0x0201
  134. dmfc2 t1, 0x0202
  135. dmfc2 t2, 0x0200
  136. sd t0, OCTEON_CP2_CRC_IV(a0)
  137. sd t1, OCTEON_CP2_CRC_LENGTH(a0)
  138. /* Skip next instructions if CvmCtl[NODFA_CP2] set */
  139. bbit1 t9, 28, 1f
  140. sd t2, OCTEON_CP2_CRC_POLY(a0)
  141. /* Save the LLM state */
  142. dmfc2 t0, 0x0402
  143. dmfc2 t1, 0x040A
  144. sd t0, OCTEON_CP2_LLM_DAT(a0)
  145. 1: bbit1 t9, 26, 3f /* done if CvmCtl[NOCRYPTO] set */
  146. sd t1, OCTEON_CP2_LLM_DAT+8(a0)
  147. /* Save the COP2 crypto state */
  148. /* this part is mostly common to both pass 1 and later revisions */
  149. dmfc2 t0, 0x0084
  150. dmfc2 t1, 0x0080
  151. dmfc2 t2, 0x0081
  152. dmfc2 t3, 0x0082
  153. sd t0, OCTEON_CP2_3DES_IV(a0)
  154. dmfc2 t0, 0x0088
  155. sd t1, OCTEON_CP2_3DES_KEY(a0)
  156. dmfc2 t1, 0x0111 /* only necessary for pass 1 */
  157. sd t2, OCTEON_CP2_3DES_KEY+8(a0)
  158. dmfc2 t2, 0x0102
  159. sd t3, OCTEON_CP2_3DES_KEY+16(a0)
  160. dmfc2 t3, 0x0103
  161. sd t0, OCTEON_CP2_3DES_RESULT(a0)
  162. dmfc2 t0, 0x0104
  163. sd t1, OCTEON_CP2_AES_INP0(a0) /* only necessary for pass 1 */
  164. dmfc2 t1, 0x0105
  165. sd t2, OCTEON_CP2_AES_IV(a0)
  166. dmfc2 t2, 0x0106
  167. sd t3, OCTEON_CP2_AES_IV+8(a0)
  168. dmfc2 t3, 0x0107
  169. sd t0, OCTEON_CP2_AES_KEY(a0)
  170. dmfc2 t0, 0x0110
  171. sd t1, OCTEON_CP2_AES_KEY+8(a0)
  172. dmfc2 t1, 0x0100
  173. sd t2, OCTEON_CP2_AES_KEY+16(a0)
  174. dmfc2 t2, 0x0101
  175. sd t3, OCTEON_CP2_AES_KEY+24(a0)
  176. mfc0 v0, $15,0 /* Get the processor ID register */
  177. sd t0, OCTEON_CP2_AES_KEYLEN(a0)
  178. li v1, 0x000d0000 /* This is the processor ID of Octeon Pass1 */
  179. sd t1, OCTEON_CP2_AES_RESULT(a0)
  180. /* Skip to the Pass1 version of the remainder of the COP2 state */
  181. beq v0, v1, 2f
  182. sd t2, OCTEON_CP2_AES_RESULT+8(a0)
  183. /* the non-pass1 state when !CvmCtl[NOCRYPTO] */
  184. dmfc2 t1, 0x0240
  185. dmfc2 t2, 0x0241
  186. ori v1, v1, 0x9500 /* lowest OCTEON III PrId*/
  187. dmfc2 t3, 0x0242
  188. subu v1, v0, v1 /* prid - lowest OCTEON III PrId */
  189. dmfc2 t0, 0x0243
  190. sd t1, OCTEON_CP2_HSH_DATW(a0)
  191. dmfc2 t1, 0x0244
  192. sd t2, OCTEON_CP2_HSH_DATW+8(a0)
  193. dmfc2 t2, 0x0245
  194. sd t3, OCTEON_CP2_HSH_DATW+16(a0)
  195. dmfc2 t3, 0x0246
  196. sd t0, OCTEON_CP2_HSH_DATW+24(a0)
  197. dmfc2 t0, 0x0247
  198. sd t1, OCTEON_CP2_HSH_DATW+32(a0)
  199. dmfc2 t1, 0x0248
  200. sd t2, OCTEON_CP2_HSH_DATW+40(a0)
  201. dmfc2 t2, 0x0249
  202. sd t3, OCTEON_CP2_HSH_DATW+48(a0)
  203. dmfc2 t3, 0x024A
  204. sd t0, OCTEON_CP2_HSH_DATW+56(a0)
  205. dmfc2 t0, 0x024B
  206. sd t1, OCTEON_CP2_HSH_DATW+64(a0)
  207. dmfc2 t1, 0x024C
  208. sd t2, OCTEON_CP2_HSH_DATW+72(a0)
  209. dmfc2 t2, 0x024D
  210. sd t3, OCTEON_CP2_HSH_DATW+80(a0)
  211. dmfc2 t3, 0x024E
  212. sd t0, OCTEON_CP2_HSH_DATW+88(a0)
  213. dmfc2 t0, 0x0250
  214. sd t1, OCTEON_CP2_HSH_DATW+96(a0)
  215. dmfc2 t1, 0x0251
  216. sd t2, OCTEON_CP2_HSH_DATW+104(a0)
  217. dmfc2 t2, 0x0252
  218. sd t3, OCTEON_CP2_HSH_DATW+112(a0)
  219. dmfc2 t3, 0x0253
  220. sd t0, OCTEON_CP2_HSH_IVW(a0)
  221. dmfc2 t0, 0x0254
  222. sd t1, OCTEON_CP2_HSH_IVW+8(a0)
  223. dmfc2 t1, 0x0255
  224. sd t2, OCTEON_CP2_HSH_IVW+16(a0)
  225. dmfc2 t2, 0x0256
  226. sd t3, OCTEON_CP2_HSH_IVW+24(a0)
  227. dmfc2 t3, 0x0257
  228. sd t0, OCTEON_CP2_HSH_IVW+32(a0)
  229. dmfc2 t0, 0x0258
  230. sd t1, OCTEON_CP2_HSH_IVW+40(a0)
  231. dmfc2 t1, 0x0259
  232. sd t2, OCTEON_CP2_HSH_IVW+48(a0)
  233. dmfc2 t2, 0x025E
  234. sd t3, OCTEON_CP2_HSH_IVW+56(a0)
  235. dmfc2 t3, 0x025A
  236. sd t0, OCTEON_CP2_GFM_MULT(a0)
  237. dmfc2 t0, 0x025B
  238. sd t1, OCTEON_CP2_GFM_MULT+8(a0)
  239. sd t2, OCTEON_CP2_GFM_POLY(a0)
  240. sd t3, OCTEON_CP2_GFM_RESULT(a0)
  241. bltz v1, 4f
  242. sd t0, OCTEON_CP2_GFM_RESULT+8(a0)
  243. /* OCTEON III things*/
  244. dmfc2 t0, 0x024F
  245. dmfc2 t1, 0x0050
  246. sd t0, OCTEON_CP2_SHA3(a0)
  247. sd t1, OCTEON_CP2_SHA3+8(a0)
  248. 4:
  249. jr ra
  250. nop
  251. 2: /* pass 1 special stuff when !CvmCtl[NOCRYPTO] */
  252. dmfc2 t3, 0x0040
  253. dmfc2 t0, 0x0041
  254. dmfc2 t1, 0x0042
  255. dmfc2 t2, 0x0043
  256. sd t3, OCTEON_CP2_HSH_DATW(a0)
  257. dmfc2 t3, 0x0044
  258. sd t0, OCTEON_CP2_HSH_DATW+8(a0)
  259. dmfc2 t0, 0x0045
  260. sd t1, OCTEON_CP2_HSH_DATW+16(a0)
  261. dmfc2 t1, 0x0046
  262. sd t2, OCTEON_CP2_HSH_DATW+24(a0)
  263. dmfc2 t2, 0x0048
  264. sd t3, OCTEON_CP2_HSH_DATW+32(a0)
  265. dmfc2 t3, 0x0049
  266. sd t0, OCTEON_CP2_HSH_DATW+40(a0)
  267. dmfc2 t0, 0x004A
  268. sd t1, OCTEON_CP2_HSH_DATW+48(a0)
  269. sd t2, OCTEON_CP2_HSH_IVW(a0)
  270. sd t3, OCTEON_CP2_HSH_IVW+8(a0)
  271. sd t0, OCTEON_CP2_HSH_IVW+16(a0)
  272. 3: /* pass 1 or CvmCtl[NOCRYPTO] set */
  273. jr ra
  274. nop
  275. END(octeon_cop2_save)
  276. .set pop
  277. /*
  278. * void octeon_cop2_restore(struct octeon_cop2_state *a0)
  279. */
  280. .align 7
  281. .set push
  282. .set noreorder
  283. LEAF(octeon_cop2_restore)
  284. /* First cache line was prefetched before the call */
  285. pref 4, 128(a0)
  286. dmfc0 t9, $9,7 /* CvmCtl register. */
  287. pref 4, 256(a0)
  288. ld t0, OCTEON_CP2_CRC_IV(a0)
  289. pref 4, 384(a0)
  290. ld t1, OCTEON_CP2_CRC_LENGTH(a0)
  291. ld t2, OCTEON_CP2_CRC_POLY(a0)
  292. /* Restore the COP2 CRC state */
  293. dmtc2 t0, 0x0201
  294. dmtc2 t1, 0x1202
  295. bbit1 t9, 28, 2f /* Skip LLM if CvmCtl[NODFA_CP2] is set */
  296. dmtc2 t2, 0x4200
  297. /* Restore the LLM state */
  298. ld t0, OCTEON_CP2_LLM_DAT(a0)
  299. ld t1, OCTEON_CP2_LLM_DAT+8(a0)
  300. dmtc2 t0, 0x0402
  301. dmtc2 t1, 0x040A
  302. 2:
  303. bbit1 t9, 26, done_restore /* done if CvmCtl[NOCRYPTO] set */
  304. nop
  305. /* Restore the COP2 crypto state common to pass 1 and pass 2 */
  306. ld t0, OCTEON_CP2_3DES_IV(a0)
  307. ld t1, OCTEON_CP2_3DES_KEY(a0)
  308. ld t2, OCTEON_CP2_3DES_KEY+8(a0)
  309. dmtc2 t0, 0x0084
  310. ld t0, OCTEON_CP2_3DES_KEY+16(a0)
  311. dmtc2 t1, 0x0080
  312. ld t1, OCTEON_CP2_3DES_RESULT(a0)
  313. dmtc2 t2, 0x0081
  314. ld t2, OCTEON_CP2_AES_INP0(a0) /* only really needed for pass 1 */
  315. dmtc2 t0, 0x0082
  316. ld t0, OCTEON_CP2_AES_IV(a0)
  317. dmtc2 t1, 0x0098
  318. ld t1, OCTEON_CP2_AES_IV+8(a0)
  319. dmtc2 t2, 0x010A /* only really needed for pass 1 */
  320. ld t2, OCTEON_CP2_AES_KEY(a0)
  321. dmtc2 t0, 0x0102
  322. ld t0, OCTEON_CP2_AES_KEY+8(a0)
  323. dmtc2 t1, 0x0103
  324. ld t1, OCTEON_CP2_AES_KEY+16(a0)
  325. dmtc2 t2, 0x0104
  326. ld t2, OCTEON_CP2_AES_KEY+24(a0)
  327. dmtc2 t0, 0x0105
  328. ld t0, OCTEON_CP2_AES_KEYLEN(a0)
  329. dmtc2 t1, 0x0106
  330. ld t1, OCTEON_CP2_AES_RESULT(a0)
  331. dmtc2 t2, 0x0107
  332. ld t2, OCTEON_CP2_AES_RESULT+8(a0)
  333. mfc0 t3, $15,0 /* Get the processor ID register */
  334. dmtc2 t0, 0x0110
  335. li v0, 0x000d0000 /* This is the processor ID of Octeon Pass1 */
  336. dmtc2 t1, 0x0100
  337. bne v0, t3, 3f /* Skip the next stuff for non-pass1 */
  338. dmtc2 t2, 0x0101
  339. /* this code is specific for pass 1 */
  340. ld t0, OCTEON_CP2_HSH_DATW(a0)
  341. ld t1, OCTEON_CP2_HSH_DATW+8(a0)
  342. ld t2, OCTEON_CP2_HSH_DATW+16(a0)
  343. dmtc2 t0, 0x0040
  344. ld t0, OCTEON_CP2_HSH_DATW+24(a0)
  345. dmtc2 t1, 0x0041
  346. ld t1, OCTEON_CP2_HSH_DATW+32(a0)
  347. dmtc2 t2, 0x0042
  348. ld t2, OCTEON_CP2_HSH_DATW+40(a0)
  349. dmtc2 t0, 0x0043
  350. ld t0, OCTEON_CP2_HSH_DATW+48(a0)
  351. dmtc2 t1, 0x0044
  352. ld t1, OCTEON_CP2_HSH_IVW(a0)
  353. dmtc2 t2, 0x0045
  354. ld t2, OCTEON_CP2_HSH_IVW+8(a0)
  355. dmtc2 t0, 0x0046
  356. ld t0, OCTEON_CP2_HSH_IVW+16(a0)
  357. dmtc2 t1, 0x0048
  358. dmtc2 t2, 0x0049
  359. b done_restore /* unconditional branch */
  360. dmtc2 t0, 0x004A
  361. 3: /* this is post-pass1 code */
  362. ld t2, OCTEON_CP2_HSH_DATW(a0)
  363. ori v0, v0, 0x9500 /* lowest OCTEON III PrId*/
  364. ld t0, OCTEON_CP2_HSH_DATW+8(a0)
  365. ld t1, OCTEON_CP2_HSH_DATW+16(a0)
  366. dmtc2 t2, 0x0240
  367. ld t2, OCTEON_CP2_HSH_DATW+24(a0)
  368. dmtc2 t0, 0x0241
  369. ld t0, OCTEON_CP2_HSH_DATW+32(a0)
  370. dmtc2 t1, 0x0242
  371. ld t1, OCTEON_CP2_HSH_DATW+40(a0)
  372. dmtc2 t2, 0x0243
  373. ld t2, OCTEON_CP2_HSH_DATW+48(a0)
  374. dmtc2 t0, 0x0244
  375. ld t0, OCTEON_CP2_HSH_DATW+56(a0)
  376. dmtc2 t1, 0x0245
  377. ld t1, OCTEON_CP2_HSH_DATW+64(a0)
  378. dmtc2 t2, 0x0246
  379. ld t2, OCTEON_CP2_HSH_DATW+72(a0)
  380. dmtc2 t0, 0x0247
  381. ld t0, OCTEON_CP2_HSH_DATW+80(a0)
  382. dmtc2 t1, 0x0248
  383. ld t1, OCTEON_CP2_HSH_DATW+88(a0)
  384. dmtc2 t2, 0x0249
  385. ld t2, OCTEON_CP2_HSH_DATW+96(a0)
  386. dmtc2 t0, 0x024A
  387. ld t0, OCTEON_CP2_HSH_DATW+104(a0)
  388. dmtc2 t1, 0x024B
  389. ld t1, OCTEON_CP2_HSH_DATW+112(a0)
  390. dmtc2 t2, 0x024C
  391. ld t2, OCTEON_CP2_HSH_IVW(a0)
  392. dmtc2 t0, 0x024D
  393. ld t0, OCTEON_CP2_HSH_IVW+8(a0)
  394. dmtc2 t1, 0x024E
  395. ld t1, OCTEON_CP2_HSH_IVW+16(a0)
  396. dmtc2 t2, 0x0250
  397. ld t2, OCTEON_CP2_HSH_IVW+24(a0)
  398. dmtc2 t0, 0x0251
  399. ld t0, OCTEON_CP2_HSH_IVW+32(a0)
  400. dmtc2 t1, 0x0252
  401. ld t1, OCTEON_CP2_HSH_IVW+40(a0)
  402. dmtc2 t2, 0x0253
  403. ld t2, OCTEON_CP2_HSH_IVW+48(a0)
  404. dmtc2 t0, 0x0254
  405. ld t0, OCTEON_CP2_HSH_IVW+56(a0)
  406. dmtc2 t1, 0x0255
  407. ld t1, OCTEON_CP2_GFM_MULT(a0)
  408. dmtc2 t2, 0x0256
  409. ld t2, OCTEON_CP2_GFM_MULT+8(a0)
  410. dmtc2 t0, 0x0257
  411. ld t0, OCTEON_CP2_GFM_POLY(a0)
  412. dmtc2 t1, 0x0258
  413. ld t1, OCTEON_CP2_GFM_RESULT(a0)
  414. dmtc2 t2, 0x0259
  415. ld t2, OCTEON_CP2_GFM_RESULT+8(a0)
  416. dmtc2 t0, 0x025E
  417. subu v0, t3, v0 /* prid - lowest OCTEON III PrId */
  418. dmtc2 t1, 0x025A
  419. bltz v0, done_restore
  420. dmtc2 t2, 0x025B
  421. /* OCTEON III things*/
  422. ld t0, OCTEON_CP2_SHA3(a0)
  423. ld t1, OCTEON_CP2_SHA3+8(a0)
  424. dmtc2 t0, 0x0051
  425. dmtc2 t1, 0x0050
  426. done_restore:
  427. jr ra
  428. nop
  429. END(octeon_cop2_restore)
  430. .set pop
  431. /*
  432. * void octeon_mult_save()
  433. * sp is assumed to point to a struct pt_regs
  434. *
  435. * NOTE: This is called in SAVE_TEMP in stackframe.h. It can
  436. * safely modify v1,k0, k1,$10-$15, and $24. It will
  437. * be overwritten with a processor specific version of the code.
  438. */
  439. .p2align 7
  440. .set push
  441. .set noreorder
  442. LEAF(octeon_mult_save)
  443. jr ra
  444. nop
  445. .space 30 * 4, 0
  446. octeon_mult_save_end:
  447. EXPORT(octeon_mult_save_end)
  448. END(octeon_mult_save)
  449. LEAF(octeon_mult_save2)
  450. /* Save the multiplier state OCTEON II and earlier*/
  451. v3mulu k0, $0, $0
  452. v3mulu k1, $0, $0
  453. sd k0, PT_MTP(sp) /* PT_MTP has P0 */
  454. v3mulu k0, $0, $0
  455. sd k1, PT_MTP+8(sp) /* PT_MTP+8 has P1 */
  456. ori k1, $0, 1
  457. v3mulu k1, k1, $0
  458. sd k0, PT_MTP+16(sp) /* PT_MTP+16 has P2 */
  459. v3mulu k0, $0, $0
  460. sd k1, PT_MPL(sp) /* PT_MPL has MPL0 */
  461. v3mulu k1, $0, $0
  462. sd k0, PT_MPL+8(sp) /* PT_MPL+8 has MPL1 */
  463. jr ra
  464. sd k1, PT_MPL+16(sp) /* PT_MPL+16 has MPL2 */
  465. octeon_mult_save2_end:
  466. EXPORT(octeon_mult_save2_end)
  467. END(octeon_mult_save2)
  468. LEAF(octeon_mult_save3)
  469. /* Save the multiplier state OCTEON III */
  470. v3mulu $10, $0, $0 /* read P0 */
  471. v3mulu $11, $0, $0 /* read P1 */
  472. v3mulu $12, $0, $0 /* read P2 */
  473. sd $10, PT_MTP+(0*8)(sp) /* store P0 */
  474. v3mulu $10, $0, $0 /* read P3 */
  475. sd $11, PT_MTP+(1*8)(sp) /* store P1 */
  476. v3mulu $11, $0, $0 /* read P4 */
  477. sd $12, PT_MTP+(2*8)(sp) /* store P2 */
  478. ori $13, $0, 1
  479. v3mulu $12, $0, $0 /* read P5 */
  480. sd $10, PT_MTP+(3*8)(sp) /* store P3 */
  481. v3mulu $13, $13, $0 /* P4-P0 = MPL5-MPL1, $13 = MPL0 */
  482. sd $11, PT_MTP+(4*8)(sp) /* store P4 */
  483. v3mulu $10, $0, $0 /* read MPL1 */
  484. sd $12, PT_MTP+(5*8)(sp) /* store P5 */
  485. v3mulu $11, $0, $0 /* read MPL2 */
  486. sd $13, PT_MPL+(0*8)(sp) /* store MPL0 */
  487. v3mulu $12, $0, $0 /* read MPL3 */
  488. sd $10, PT_MPL+(1*8)(sp) /* store MPL1 */
  489. v3mulu $10, $0, $0 /* read MPL4 */
  490. sd $11, PT_MPL+(2*8)(sp) /* store MPL2 */
  491. v3mulu $11, $0, $0 /* read MPL5 */
  492. sd $12, PT_MPL+(3*8)(sp) /* store MPL3 */
  493. sd $10, PT_MPL+(4*8)(sp) /* store MPL4 */
  494. jr ra
  495. sd $11, PT_MPL+(5*8)(sp) /* store MPL5 */
  496. octeon_mult_save3_end:
  497. EXPORT(octeon_mult_save3_end)
  498. END(octeon_mult_save3)
  499. .set pop
  500. /*
  501. * void octeon_mult_restore()
  502. * sp is assumed to point to a struct pt_regs
  503. *
  504. * NOTE: This is called in RESTORE_TEMP in stackframe.h.
  505. */
  506. .p2align 7
  507. .set push
  508. .set noreorder
  509. LEAF(octeon_mult_restore)
  510. jr ra
  511. nop
  512. .space 30 * 4, 0
  513. octeon_mult_restore_end:
  514. EXPORT(octeon_mult_restore_end)
  515. END(octeon_mult_restore)
  516. LEAF(octeon_mult_restore2)
  517. ld v0, PT_MPL(sp) /* MPL0 */
  518. ld v1, PT_MPL+8(sp) /* MPL1 */
  519. ld k0, PT_MPL+16(sp) /* MPL2 */
  520. /* Restore the multiplier state */
  521. ld k1, PT_MTP+16(sp) /* P2 */
  522. mtm0 v0 /* MPL0 */
  523. ld v0, PT_MTP+8(sp) /* P1 */
  524. mtm1 v1 /* MPL1 */
  525. ld v1, PT_MTP(sp) /* P0 */
  526. mtm2 k0 /* MPL2 */
  527. mtp2 k1 /* P2 */
  528. mtp1 v0 /* P1 */
  529. jr ra
  530. mtp0 v1 /* P0 */
  531. octeon_mult_restore2_end:
  532. EXPORT(octeon_mult_restore2_end)
  533. END(octeon_mult_restore2)
  534. LEAF(octeon_mult_restore3)
  535. ld $12, PT_MPL+(0*8)(sp) /* read MPL0 */
  536. ld $13, PT_MPL+(3*8)(sp) /* read MPL3 */
  537. ld $10, PT_MPL+(1*8)(sp) /* read MPL1 */
  538. ld $11, PT_MPL+(4*8)(sp) /* read MPL4 */
  539. .word 0x718d0008
  540. /* mtm0 $12, $13 restore MPL0 and MPL3 */
  541. ld $12, PT_MPL+(2*8)(sp) /* read MPL2 */
  542. .word 0x714b000c
  543. /* mtm1 $10, $11 restore MPL1 and MPL4 */
  544. ld $13, PT_MPL+(5*8)(sp) /* read MPL5 */
  545. ld $10, PT_MTP+(0*8)(sp) /* read P0 */
  546. ld $11, PT_MTP+(3*8)(sp) /* read P3 */
  547. .word 0x718d000d
  548. /* mtm2 $12, $13 restore MPL2 and MPL5 */
  549. ld $12, PT_MTP+(1*8)(sp) /* read P1 */
  550. .word 0x714b0009
  551. /* mtp0 $10, $11 restore P0 and P3 */
  552. ld $13, PT_MTP+(4*8)(sp) /* read P4 */
  553. ld $10, PT_MTP+(2*8)(sp) /* read P2 */
  554. ld $11, PT_MTP+(5*8)(sp) /* read P5 */
  555. .word 0x718d000a
  556. /* mtp1 $12, $13 restore P1 and P4 */
  557. jr ra
  558. .word 0x714b000b
  559. /* mtp2 $10, $11 restore P2 and P5 */
  560. octeon_mult_restore3_end:
  561. EXPORT(octeon_mult_restore3_end)
  562. END(octeon_mult_restore3)
  563. .set pop