octeon_switch.S 15 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554
  1. /*
  2. * This file is subject to the terms and conditions of the GNU General Public
  3. * License. See the file "COPYING" in the main directory of this archive
  4. * for more details.
  5. *
  6. * Copyright (C) 1994, 1995, 1996, 1998, 1999, 2002, 2003 Ralf Baechle
  7. * Copyright (C) 1996 David S. Miller ([email protected])
  8. * Copyright (C) 1994, 1995, 1996, by Andreas Busse
  9. * Copyright (C) 1999 Silicon Graphics, Inc.
  10. * Copyright (C) 2000 MIPS Technologies, Inc.
  11. * written by Carsten Langgaard, [email protected]
  12. */
  13. #include <asm/asm.h>
  14. #include <asm/export.h>
  15. #include <asm/asm-offsets.h>
  16. #include <asm/mipsregs.h>
  17. #include <asm/regdef.h>
  18. #include <asm/stackframe.h>
  19. /*
  20. * task_struct *resume(task_struct *prev, task_struct *next,
  21. * struct thread_info *next_ti)
  22. */
  23. .align 7
  24. LEAF(resume)
  25. .set arch=octeon
  26. mfc0 t1, CP0_STATUS
  27. LONG_S t1, THREAD_STATUS(a0)
  28. cpu_save_nonscratch a0
  29. LONG_S ra, THREAD_REG31(a0)
  30. #if CONFIG_CAVIUM_OCTEON_CVMSEG_SIZE > 0
  31. /* Check if we need to store CVMSEG state */
  32. dmfc0 t0, $11,7 /* CvmMemCtl */
  33. bbit0 t0, 6, 3f /* Is user access enabled? */
  34. /* Store the CVMSEG state */
  35. /* Extract the size of CVMSEG */
  36. andi t0, 0x3f
  37. /* Multiply * (cache line size/sizeof(long)/2) */
  38. sll t0, 7-LONGLOG-1
  39. li t1, -32768 /* Base address of CVMSEG */
  40. LONG_ADDI t2, a0, THREAD_CVMSEG /* Where to store CVMSEG to */
  41. synciobdma
  42. 2:
  43. .set noreorder
  44. LONG_L t8, 0(t1) /* Load from CVMSEG */
  45. subu t0, 1 /* Decrement loop var */
  46. LONG_L t9, LONGSIZE(t1)/* Load from CVMSEG */
  47. LONG_ADDU t1, LONGSIZE*2 /* Increment loc in CVMSEG */
  48. LONG_S t8, 0(t2) /* Store CVMSEG to thread storage */
  49. LONG_ADDU t2, LONGSIZE*2 /* Increment loc in thread storage */
  50. bnez t0, 2b /* Loop until we've copied it all */
  51. LONG_S t9, -LONGSIZE(t2)/* Store CVMSEG to thread storage */
  52. .set reorder
  53. /* Disable access to CVMSEG */
  54. dmfc0 t0, $11,7 /* CvmMemCtl */
  55. xori t0, t0, 0x40 /* Bit 6 is CVMSEG user enable */
  56. dmtc0 t0, $11,7 /* CvmMemCtl */
  57. #endif
  58. 3:
  59. #if defined(CONFIG_STACKPROTECTOR) && !defined(CONFIG_SMP)
  60. PTR_LA t8, __stack_chk_guard
  61. LONG_L t9, TASK_STACK_CANARY(a1)
  62. LONG_S t9, 0(t8)
  63. #endif
  64. /*
  65. * The order of restoring the registers takes care of the race
  66. * updating $28, $29 and kernelsp without disabling ints.
  67. */
  68. move $28, a2
  69. cpu_restore_nonscratch a1
  70. PTR_ADDU t0, $28, _THREAD_SIZE - 32
  71. set_saved_sp t0, t1, t2
  72. mfc0 t1, CP0_STATUS /* Do we really need this? */
  73. li a3, 0xff01
  74. and t1, a3
  75. LONG_L a2, THREAD_STATUS(a1)
  76. nor a3, $0, a3
  77. and a2, a3
  78. or a2, t1
  79. mtc0 a2, CP0_STATUS
  80. move v0, a0
  81. jr ra
  82. END(resume)
  83. /*
  84. * void octeon_cop2_save(struct octeon_cop2_state *a0)
  85. */
  86. .align 7
  87. .set push
  88. .set noreorder
  89. LEAF(octeon_cop2_save)
  90. dmfc0 t9, $9,7 /* CvmCtl register. */
  91. /* Save the COP2 CRC state */
  92. dmfc2 t0, 0x0201
  93. dmfc2 t1, 0x0202
  94. dmfc2 t2, 0x0200
  95. sd t0, OCTEON_CP2_CRC_IV(a0)
  96. sd t1, OCTEON_CP2_CRC_LENGTH(a0)
  97. /* Skip next instructions if CvmCtl[NODFA_CP2] set */
  98. bbit1 t9, 28, 1f
  99. sd t2, OCTEON_CP2_CRC_POLY(a0)
  100. /* Save the LLM state */
  101. dmfc2 t0, 0x0402
  102. dmfc2 t1, 0x040A
  103. sd t0, OCTEON_CP2_LLM_DAT(a0)
  104. 1: bbit1 t9, 26, 3f /* done if CvmCtl[NOCRYPTO] set */
  105. sd t1, OCTEON_CP2_LLM_DAT+8(a0)
  106. /* Save the COP2 crypto state */
  107. /* this part is mostly common to both pass 1 and later revisions */
  108. dmfc2 t0, 0x0084
  109. dmfc2 t1, 0x0080
  110. dmfc2 t2, 0x0081
  111. dmfc2 t3, 0x0082
  112. sd t0, OCTEON_CP2_3DES_IV(a0)
  113. dmfc2 t0, 0x0088
  114. sd t1, OCTEON_CP2_3DES_KEY(a0)
  115. dmfc2 t1, 0x0111 /* only necessary for pass 1 */
  116. sd t2, OCTEON_CP2_3DES_KEY+8(a0)
  117. dmfc2 t2, 0x0102
  118. sd t3, OCTEON_CP2_3DES_KEY+16(a0)
  119. dmfc2 t3, 0x0103
  120. sd t0, OCTEON_CP2_3DES_RESULT(a0)
  121. dmfc2 t0, 0x0104
  122. sd t1, OCTEON_CP2_AES_INP0(a0) /* only necessary for pass 1 */
  123. dmfc2 t1, 0x0105
  124. sd t2, OCTEON_CP2_AES_IV(a0)
  125. dmfc2 t2, 0x0106
  126. sd t3, OCTEON_CP2_AES_IV+8(a0)
  127. dmfc2 t3, 0x0107
  128. sd t0, OCTEON_CP2_AES_KEY(a0)
  129. dmfc2 t0, 0x0110
  130. sd t1, OCTEON_CP2_AES_KEY+8(a0)
  131. dmfc2 t1, 0x0100
  132. sd t2, OCTEON_CP2_AES_KEY+16(a0)
  133. dmfc2 t2, 0x0101
  134. sd t3, OCTEON_CP2_AES_KEY+24(a0)
  135. mfc0 v0, $15,0 /* Get the processor ID register */
  136. sd t0, OCTEON_CP2_AES_KEYLEN(a0)
  137. li v1, 0x000d0000 /* This is the processor ID of Octeon Pass1 */
  138. sd t1, OCTEON_CP2_AES_RESULT(a0)
  139. /* Skip to the Pass1 version of the remainder of the COP2 state */
  140. beq v0, v1, 2f
  141. sd t2, OCTEON_CP2_AES_RESULT+8(a0)
  142. /* the non-pass1 state when !CvmCtl[NOCRYPTO] */
  143. dmfc2 t1, 0x0240
  144. dmfc2 t2, 0x0241
  145. ori v1, v1, 0x9500 /* lowest OCTEON III PrId*/
  146. dmfc2 t3, 0x0242
  147. subu v1, v0, v1 /* prid - lowest OCTEON III PrId */
  148. dmfc2 t0, 0x0243
  149. sd t1, OCTEON_CP2_HSH_DATW(a0)
  150. dmfc2 t1, 0x0244
  151. sd t2, OCTEON_CP2_HSH_DATW+8(a0)
  152. dmfc2 t2, 0x0245
  153. sd t3, OCTEON_CP2_HSH_DATW+16(a0)
  154. dmfc2 t3, 0x0246
  155. sd t0, OCTEON_CP2_HSH_DATW+24(a0)
  156. dmfc2 t0, 0x0247
  157. sd t1, OCTEON_CP2_HSH_DATW+32(a0)
  158. dmfc2 t1, 0x0248
  159. sd t2, OCTEON_CP2_HSH_DATW+40(a0)
  160. dmfc2 t2, 0x0249
  161. sd t3, OCTEON_CP2_HSH_DATW+48(a0)
  162. dmfc2 t3, 0x024A
  163. sd t0, OCTEON_CP2_HSH_DATW+56(a0)
  164. dmfc2 t0, 0x024B
  165. sd t1, OCTEON_CP2_HSH_DATW+64(a0)
  166. dmfc2 t1, 0x024C
  167. sd t2, OCTEON_CP2_HSH_DATW+72(a0)
  168. dmfc2 t2, 0x024D
  169. sd t3, OCTEON_CP2_HSH_DATW+80(a0)
  170. dmfc2 t3, 0x024E
  171. sd t0, OCTEON_CP2_HSH_DATW+88(a0)
  172. dmfc2 t0, 0x0250
  173. sd t1, OCTEON_CP2_HSH_DATW+96(a0)
  174. dmfc2 t1, 0x0251
  175. sd t2, OCTEON_CP2_HSH_DATW+104(a0)
  176. dmfc2 t2, 0x0252
  177. sd t3, OCTEON_CP2_HSH_DATW+112(a0)
  178. dmfc2 t3, 0x0253
  179. sd t0, OCTEON_CP2_HSH_IVW(a0)
  180. dmfc2 t0, 0x0254
  181. sd t1, OCTEON_CP2_HSH_IVW+8(a0)
  182. dmfc2 t1, 0x0255
  183. sd t2, OCTEON_CP2_HSH_IVW+16(a0)
  184. dmfc2 t2, 0x0256
  185. sd t3, OCTEON_CP2_HSH_IVW+24(a0)
  186. dmfc2 t3, 0x0257
  187. sd t0, OCTEON_CP2_HSH_IVW+32(a0)
  188. dmfc2 t0, 0x0258
  189. sd t1, OCTEON_CP2_HSH_IVW+40(a0)
  190. dmfc2 t1, 0x0259
  191. sd t2, OCTEON_CP2_HSH_IVW+48(a0)
  192. dmfc2 t2, 0x025E
  193. sd t3, OCTEON_CP2_HSH_IVW+56(a0)
  194. dmfc2 t3, 0x025A
  195. sd t0, OCTEON_CP2_GFM_MULT(a0)
  196. dmfc2 t0, 0x025B
  197. sd t1, OCTEON_CP2_GFM_MULT+8(a0)
  198. sd t2, OCTEON_CP2_GFM_POLY(a0)
  199. sd t3, OCTEON_CP2_GFM_RESULT(a0)
  200. bltz v1, 4f
  201. sd t0, OCTEON_CP2_GFM_RESULT+8(a0)
  202. /* OCTEON III things*/
  203. dmfc2 t0, 0x024F
  204. dmfc2 t1, 0x0050
  205. sd t0, OCTEON_CP2_SHA3(a0)
  206. sd t1, OCTEON_CP2_SHA3+8(a0)
  207. 4:
  208. jr ra
  209. nop
  210. 2: /* pass 1 special stuff when !CvmCtl[NOCRYPTO] */
  211. dmfc2 t3, 0x0040
  212. dmfc2 t0, 0x0041
  213. dmfc2 t1, 0x0042
  214. dmfc2 t2, 0x0043
  215. sd t3, OCTEON_CP2_HSH_DATW(a0)
  216. dmfc2 t3, 0x0044
  217. sd t0, OCTEON_CP2_HSH_DATW+8(a0)
  218. dmfc2 t0, 0x0045
  219. sd t1, OCTEON_CP2_HSH_DATW+16(a0)
  220. dmfc2 t1, 0x0046
  221. sd t2, OCTEON_CP2_HSH_DATW+24(a0)
  222. dmfc2 t2, 0x0048
  223. sd t3, OCTEON_CP2_HSH_DATW+32(a0)
  224. dmfc2 t3, 0x0049
  225. sd t0, OCTEON_CP2_HSH_DATW+40(a0)
  226. dmfc2 t0, 0x004A
  227. sd t1, OCTEON_CP2_HSH_DATW+48(a0)
  228. sd t2, OCTEON_CP2_HSH_IVW(a0)
  229. sd t3, OCTEON_CP2_HSH_IVW+8(a0)
  230. sd t0, OCTEON_CP2_HSH_IVW+16(a0)
  231. 3: /* pass 1 or CvmCtl[NOCRYPTO] set */
  232. jr ra
  233. nop
  234. END(octeon_cop2_save)
  235. .set pop
  236. /*
  237. * void octeon_cop2_restore(struct octeon_cop2_state *a0)
  238. */
  239. .align 7
  240. .set push
  241. .set noreorder
  242. LEAF(octeon_cop2_restore)
  243. /* First cache line was prefetched before the call */
  244. pref 4, 128(a0)
  245. dmfc0 t9, $9,7 /* CvmCtl register. */
  246. pref 4, 256(a0)
  247. ld t0, OCTEON_CP2_CRC_IV(a0)
  248. pref 4, 384(a0)
  249. ld t1, OCTEON_CP2_CRC_LENGTH(a0)
  250. ld t2, OCTEON_CP2_CRC_POLY(a0)
  251. /* Restore the COP2 CRC state */
  252. dmtc2 t0, 0x0201
  253. dmtc2 t1, 0x1202
  254. bbit1 t9, 28, 2f /* Skip LLM if CvmCtl[NODFA_CP2] is set */
  255. dmtc2 t2, 0x4200
  256. /* Restore the LLM state */
  257. ld t0, OCTEON_CP2_LLM_DAT(a0)
  258. ld t1, OCTEON_CP2_LLM_DAT+8(a0)
  259. dmtc2 t0, 0x0402
  260. dmtc2 t1, 0x040A
  261. 2:
  262. bbit1 t9, 26, done_restore /* done if CvmCtl[NOCRYPTO] set */
  263. nop
  264. /* Restore the COP2 crypto state common to pass 1 and pass 2 */
  265. ld t0, OCTEON_CP2_3DES_IV(a0)
  266. ld t1, OCTEON_CP2_3DES_KEY(a0)
  267. ld t2, OCTEON_CP2_3DES_KEY+8(a0)
  268. dmtc2 t0, 0x0084
  269. ld t0, OCTEON_CP2_3DES_KEY+16(a0)
  270. dmtc2 t1, 0x0080
  271. ld t1, OCTEON_CP2_3DES_RESULT(a0)
  272. dmtc2 t2, 0x0081
  273. ld t2, OCTEON_CP2_AES_INP0(a0) /* only really needed for pass 1 */
  274. dmtc2 t0, 0x0082
  275. ld t0, OCTEON_CP2_AES_IV(a0)
  276. dmtc2 t1, 0x0098
  277. ld t1, OCTEON_CP2_AES_IV+8(a0)
  278. dmtc2 t2, 0x010A /* only really needed for pass 1 */
  279. ld t2, OCTEON_CP2_AES_KEY(a0)
  280. dmtc2 t0, 0x0102
  281. ld t0, OCTEON_CP2_AES_KEY+8(a0)
  282. dmtc2 t1, 0x0103
  283. ld t1, OCTEON_CP2_AES_KEY+16(a0)
  284. dmtc2 t2, 0x0104
  285. ld t2, OCTEON_CP2_AES_KEY+24(a0)
  286. dmtc2 t0, 0x0105
  287. ld t0, OCTEON_CP2_AES_KEYLEN(a0)
  288. dmtc2 t1, 0x0106
  289. ld t1, OCTEON_CP2_AES_RESULT(a0)
  290. dmtc2 t2, 0x0107
  291. ld t2, OCTEON_CP2_AES_RESULT+8(a0)
  292. mfc0 t3, $15,0 /* Get the processor ID register */
  293. dmtc2 t0, 0x0110
  294. li v0, 0x000d0000 /* This is the processor ID of Octeon Pass1 */
  295. dmtc2 t1, 0x0100
  296. bne v0, t3, 3f /* Skip the next stuff for non-pass1 */
  297. dmtc2 t2, 0x0101
  298. /* this code is specific for pass 1 */
  299. ld t0, OCTEON_CP2_HSH_DATW(a0)
  300. ld t1, OCTEON_CP2_HSH_DATW+8(a0)
  301. ld t2, OCTEON_CP2_HSH_DATW+16(a0)
  302. dmtc2 t0, 0x0040
  303. ld t0, OCTEON_CP2_HSH_DATW+24(a0)
  304. dmtc2 t1, 0x0041
  305. ld t1, OCTEON_CP2_HSH_DATW+32(a0)
  306. dmtc2 t2, 0x0042
  307. ld t2, OCTEON_CP2_HSH_DATW+40(a0)
  308. dmtc2 t0, 0x0043
  309. ld t0, OCTEON_CP2_HSH_DATW+48(a0)
  310. dmtc2 t1, 0x0044
  311. ld t1, OCTEON_CP2_HSH_IVW(a0)
  312. dmtc2 t2, 0x0045
  313. ld t2, OCTEON_CP2_HSH_IVW+8(a0)
  314. dmtc2 t0, 0x0046
  315. ld t0, OCTEON_CP2_HSH_IVW+16(a0)
  316. dmtc2 t1, 0x0048
  317. dmtc2 t2, 0x0049
  318. b done_restore /* unconditional branch */
  319. dmtc2 t0, 0x004A
  320. 3: /* this is post-pass1 code */
  321. ld t2, OCTEON_CP2_HSH_DATW(a0)
  322. ori v0, v0, 0x9500 /* lowest OCTEON III PrId*/
  323. ld t0, OCTEON_CP2_HSH_DATW+8(a0)
  324. ld t1, OCTEON_CP2_HSH_DATW+16(a0)
  325. dmtc2 t2, 0x0240
  326. ld t2, OCTEON_CP2_HSH_DATW+24(a0)
  327. dmtc2 t0, 0x0241
  328. ld t0, OCTEON_CP2_HSH_DATW+32(a0)
  329. dmtc2 t1, 0x0242
  330. ld t1, OCTEON_CP2_HSH_DATW+40(a0)
  331. dmtc2 t2, 0x0243
  332. ld t2, OCTEON_CP2_HSH_DATW+48(a0)
  333. dmtc2 t0, 0x0244
  334. ld t0, OCTEON_CP2_HSH_DATW+56(a0)
  335. dmtc2 t1, 0x0245
  336. ld t1, OCTEON_CP2_HSH_DATW+64(a0)
  337. dmtc2 t2, 0x0246
  338. ld t2, OCTEON_CP2_HSH_DATW+72(a0)
  339. dmtc2 t0, 0x0247
  340. ld t0, OCTEON_CP2_HSH_DATW+80(a0)
  341. dmtc2 t1, 0x0248
  342. ld t1, OCTEON_CP2_HSH_DATW+88(a0)
  343. dmtc2 t2, 0x0249
  344. ld t2, OCTEON_CP2_HSH_DATW+96(a0)
  345. dmtc2 t0, 0x024A
  346. ld t0, OCTEON_CP2_HSH_DATW+104(a0)
  347. dmtc2 t1, 0x024B
  348. ld t1, OCTEON_CP2_HSH_DATW+112(a0)
  349. dmtc2 t2, 0x024C
  350. ld t2, OCTEON_CP2_HSH_IVW(a0)
  351. dmtc2 t0, 0x024D
  352. ld t0, OCTEON_CP2_HSH_IVW+8(a0)
  353. dmtc2 t1, 0x024E
  354. ld t1, OCTEON_CP2_HSH_IVW+16(a0)
  355. dmtc2 t2, 0x0250
  356. ld t2, OCTEON_CP2_HSH_IVW+24(a0)
  357. dmtc2 t0, 0x0251
  358. ld t0, OCTEON_CP2_HSH_IVW+32(a0)
  359. dmtc2 t1, 0x0252
  360. ld t1, OCTEON_CP2_HSH_IVW+40(a0)
  361. dmtc2 t2, 0x0253
  362. ld t2, OCTEON_CP2_HSH_IVW+48(a0)
  363. dmtc2 t0, 0x0254
  364. ld t0, OCTEON_CP2_HSH_IVW+56(a0)
  365. dmtc2 t1, 0x0255
  366. ld t1, OCTEON_CP2_GFM_MULT(a0)
  367. dmtc2 t2, 0x0256
  368. ld t2, OCTEON_CP2_GFM_MULT+8(a0)
  369. dmtc2 t0, 0x0257
  370. ld t0, OCTEON_CP2_GFM_POLY(a0)
  371. dmtc2 t1, 0x0258
  372. ld t1, OCTEON_CP2_GFM_RESULT(a0)
  373. dmtc2 t2, 0x0259
  374. ld t2, OCTEON_CP2_GFM_RESULT+8(a0)
  375. dmtc2 t0, 0x025E
  376. subu v0, t3, v0 /* prid - lowest OCTEON III PrId */
  377. dmtc2 t1, 0x025A
  378. bltz v0, done_restore
  379. dmtc2 t2, 0x025B
  380. /* OCTEON III things*/
  381. ld t0, OCTEON_CP2_SHA3(a0)
  382. ld t1, OCTEON_CP2_SHA3+8(a0)
  383. dmtc2 t0, 0x0051
  384. dmtc2 t1, 0x0050
  385. done_restore:
  386. jr ra
  387. nop
  388. END(octeon_cop2_restore)
  389. .set pop
  390. /*
  391. * void octeon_mult_save()
  392. * sp is assumed to point to a struct pt_regs
  393. *
  394. * NOTE: This is called in SAVE_TEMP in stackframe.h. It can
  395. * safely modify v1,k0, k1,$10-$15, and $24. It will
  396. * be overwritten with a processor specific version of the code.
  397. */
  398. .p2align 7
  399. .set push
  400. .set noreorder
  401. LEAF(octeon_mult_save)
  402. jr ra
  403. nop
  404. .space 30 * 4, 0
  405. octeon_mult_save_end:
  406. EXPORT(octeon_mult_save_end)
  407. END(octeon_mult_save)
  408. LEAF(octeon_mult_save2)
  409. /* Save the multiplier state OCTEON II and earlier*/
  410. v3mulu k0, $0, $0
  411. v3mulu k1, $0, $0
  412. sd k0, PT_MTP(sp) /* PT_MTP has P0 */
  413. v3mulu k0, $0, $0
  414. sd k1, PT_MTP+8(sp) /* PT_MTP+8 has P1 */
  415. ori k1, $0, 1
  416. v3mulu k1, k1, $0
  417. sd k0, PT_MTP+16(sp) /* PT_MTP+16 has P2 */
  418. v3mulu k0, $0, $0
  419. sd k1, PT_MPL(sp) /* PT_MPL has MPL0 */
  420. v3mulu k1, $0, $0
  421. sd k0, PT_MPL+8(sp) /* PT_MPL+8 has MPL1 */
  422. jr ra
  423. sd k1, PT_MPL+16(sp) /* PT_MPL+16 has MPL2 */
  424. octeon_mult_save2_end:
  425. EXPORT(octeon_mult_save2_end)
  426. END(octeon_mult_save2)
  427. LEAF(octeon_mult_save3)
  428. /* Save the multiplier state OCTEON III */
  429. v3mulu $10, $0, $0 /* read P0 */
  430. v3mulu $11, $0, $0 /* read P1 */
  431. v3mulu $12, $0, $0 /* read P2 */
  432. sd $10, PT_MTP+(0*8)(sp) /* store P0 */
  433. v3mulu $10, $0, $0 /* read P3 */
  434. sd $11, PT_MTP+(1*8)(sp) /* store P1 */
  435. v3mulu $11, $0, $0 /* read P4 */
  436. sd $12, PT_MTP+(2*8)(sp) /* store P2 */
  437. ori $13, $0, 1
  438. v3mulu $12, $0, $0 /* read P5 */
  439. sd $10, PT_MTP+(3*8)(sp) /* store P3 */
  440. v3mulu $13, $13, $0 /* P4-P0 = MPL5-MPL1, $13 = MPL0 */
  441. sd $11, PT_MTP+(4*8)(sp) /* store P4 */
  442. v3mulu $10, $0, $0 /* read MPL1 */
  443. sd $12, PT_MTP+(5*8)(sp) /* store P5 */
  444. v3mulu $11, $0, $0 /* read MPL2 */
  445. sd $13, PT_MPL+(0*8)(sp) /* store MPL0 */
  446. v3mulu $12, $0, $0 /* read MPL3 */
  447. sd $10, PT_MPL+(1*8)(sp) /* store MPL1 */
  448. v3mulu $10, $0, $0 /* read MPL4 */
  449. sd $11, PT_MPL+(2*8)(sp) /* store MPL2 */
  450. v3mulu $11, $0, $0 /* read MPL5 */
  451. sd $12, PT_MPL+(3*8)(sp) /* store MPL3 */
  452. sd $10, PT_MPL+(4*8)(sp) /* store MPL4 */
  453. jr ra
  454. sd $11, PT_MPL+(5*8)(sp) /* store MPL5 */
  455. octeon_mult_save3_end:
  456. EXPORT(octeon_mult_save3_end)
  457. END(octeon_mult_save3)
  458. .set pop
  459. /*
  460. * void octeon_mult_restore()
  461. * sp is assumed to point to a struct pt_regs
  462. *
  463. * NOTE: This is called in RESTORE_TEMP in stackframe.h.
  464. */
  465. .p2align 7
  466. .set push
  467. .set noreorder
  468. LEAF(octeon_mult_restore)
  469. jr ra
  470. nop
  471. .space 30 * 4, 0
  472. octeon_mult_restore_end:
  473. EXPORT(octeon_mult_restore_end)
  474. END(octeon_mult_restore)
  475. LEAF(octeon_mult_restore2)
  476. ld v0, PT_MPL(sp) /* MPL0 */
  477. ld v1, PT_MPL+8(sp) /* MPL1 */
  478. ld k0, PT_MPL+16(sp) /* MPL2 */
  479. /* Restore the multiplier state */
  480. ld k1, PT_MTP+16(sp) /* P2 */
  481. mtm0 v0 /* MPL0 */
  482. ld v0, PT_MTP+8(sp) /* P1 */
  483. mtm1 v1 /* MPL1 */
  484. ld v1, PT_MTP(sp) /* P0 */
  485. mtm2 k0 /* MPL2 */
  486. mtp2 k1 /* P2 */
  487. mtp1 v0 /* P1 */
  488. jr ra
  489. mtp0 v1 /* P0 */
  490. octeon_mult_restore2_end:
  491. EXPORT(octeon_mult_restore2_end)
  492. END(octeon_mult_restore2)
  493. LEAF(octeon_mult_restore3)
  494. ld $12, PT_MPL+(0*8)(sp) /* read MPL0 */
  495. ld $13, PT_MPL+(3*8)(sp) /* read MPL3 */
  496. ld $10, PT_MPL+(1*8)(sp) /* read MPL1 */
  497. ld $11, PT_MPL+(4*8)(sp) /* read MPL4 */
  498. .word 0x718d0008
  499. /* mtm0 $12, $13 restore MPL0 and MPL3 */
  500. ld $12, PT_MPL+(2*8)(sp) /* read MPL2 */
  501. .word 0x714b000c
  502. /* mtm1 $10, $11 restore MPL1 and MPL4 */
  503. ld $13, PT_MPL+(5*8)(sp) /* read MPL5 */
  504. ld $10, PT_MTP+(0*8)(sp) /* read P0 */
  505. ld $11, PT_MTP+(3*8)(sp) /* read P3 */
  506. .word 0x718d000d
  507. /* mtm2 $12, $13 restore MPL2 and MPL5 */
  508. ld $12, PT_MTP+(1*8)(sp) /* read P1 */
  509. .word 0x714b0009
  510. /* mtp0 $10, $11 restore P0 and P3 */
  511. ld $13, PT_MTP+(4*8)(sp) /* read P4 */
  512. ld $10, PT_MTP+(2*8)(sp) /* read P2 */
  513. ld $11, PT_MTP+(5*8)(sp) /* read P5 */
  514. .word 0x718d000a
  515. /* mtp1 $12, $13 restore P1 and P4 */
  516. jr ra
  517. .word 0x714b000b
  518. /* mtp2 $10, $11 restore P2 and P5 */
  519. octeon_mult_restore3_end:
  520. EXPORT(octeon_mult_restore3_end)
  521. END(octeon_mult_restore3)
  522. .set pop