Kyle Swenson | 8d8f654 | 2021-03-15 11:02:55 -0600 | [diff] [blame^] | 1 | /* |
| 2 | * This file is subject to the terms and conditions of the GNU General Public |
| 3 | * License. See the file "COPYING" in the main directory of this archive |
| 4 | * for more details. |
| 5 | * |
| 6 | * Copyright (C) 1994, 1995, 1996, 1998, 1999, 2002, 2003 Ralf Baechle |
| 7 | * Copyright (C) 1996 David S. Miller (davem@davemloft.net) |
| 8 | * Copyright (C) 1994, 1995, 1996, by Andreas Busse |
| 9 | * Copyright (C) 1999 Silicon Graphics, Inc. |
| 10 | * Copyright (C) 2000 MIPS Technologies, Inc. |
| 11 | * written by Carsten Langgaard, carstenl@mips.com |
| 12 | */ |
| 13 | |
| 14 | #define USE_ALTERNATE_RESUME_IMPL 1 |
| 15 | .set push |
| 16 | .set arch=mips64r2 |
| 17 | #include "r4k_switch.S" |
| 18 | .set pop |
| 19 | /* |
| 20 | * task_struct *resume(task_struct *prev, task_struct *next, |
| 21 | * struct thread_info *next_ti) |
| 22 | */ |
| 23 | .align 7 |
| 24 | LEAF(resume) |
| 25 | .set arch=octeon |
| 26 | mfc0 t1, CP0_STATUS |
| 27 | LONG_S t1, THREAD_STATUS(a0) |
| 28 | cpu_save_nonscratch a0 |
| 29 | LONG_S ra, THREAD_REG31(a0) |
| 30 | |
| 31 | #if CONFIG_CAVIUM_OCTEON_CVMSEG_SIZE > 0 |
| 32 | /* Check if we need to store CVMSEG state */ |
| 33 | dmfc0 t0, $11,7 /* CvmMemCtl */ |
| 34 | bbit0 t0, 6, 3f /* Is user access enabled? */ |
| 35 | |
| 36 | /* Store the CVMSEG state */ |
| 37 | /* Extract the size of CVMSEG */ |
| 38 | andi t0, 0x3f |
| 39 | /* Multiply * (cache line size/sizeof(long)/2) */ |
| 40 | sll t0, 7-LONGLOG-1 |
| 41 | li t1, -32768 /* Base address of CVMSEG */ |
| 42 | LONG_ADDI t2, a0, THREAD_CVMSEG /* Where to store CVMSEG to */ |
| 43 | synciobdma |
| 44 | 2: |
| 45 | .set noreorder |
| 46 | LONG_L t8, 0(t1) /* Load from CVMSEG */ |
| 47 | subu t0, 1 /* Decrement loop var */ |
| 48 | LONG_L t9, LONGSIZE(t1)/* Load from CVMSEG */ |
| 49 | LONG_ADDU t1, LONGSIZE*2 /* Increment loc in CVMSEG */ |
| 50 | LONG_S t8, 0(t2) /* Store CVMSEG to thread storage */ |
| 51 | LONG_ADDU t2, LONGSIZE*2 /* Increment loc in thread storage */ |
| 52 | bnez t0, 2b /* Loop until we've copied it all */ |
| 53 | LONG_S t9, -LONGSIZE(t2)/* Store CVMSEG to thread storage */ |
| 54 | .set reorder |
| 55 | |
| 56 | /* Disable access to CVMSEG */ |
| 57 | dmfc0 t0, $11,7 /* CvmMemCtl */ |
| 58 | xori t0, t0, 0x40 /* Bit 6 is CVMSEG user enable */ |
| 59 | dmtc0 t0, $11,7 /* CvmMemCtl */ |
| 60 | #endif |
| 61 | 3: |
| 62 | |
| 63 | #if defined(CONFIG_CC_STACKPROTECTOR) && !defined(CONFIG_SMP) |
| 64 | PTR_LA t8, __stack_chk_guard |
| 65 | LONG_L t9, TASK_STACK_CANARY(a1) |
| 66 | LONG_S t9, 0(t8) |
| 67 | #endif |
| 68 | |
| 69 | /* |
| 70 | * The order of restoring the registers takes care of the race |
| 71 | * updating $28, $29 and kernelsp without disabling ints. |
| 72 | */ |
| 73 | move $28, a2 |
| 74 | cpu_restore_nonscratch a1 |
| 75 | |
| 76 | PTR_ADDU t0, $28, _THREAD_SIZE - 32 |
| 77 | set_saved_sp t0, t1, t2 |
| 78 | |
| 79 | mfc0 t1, CP0_STATUS /* Do we really need this? */ |
| 80 | li a3, 0xff01 |
| 81 | and t1, a3 |
| 82 | LONG_L a2, THREAD_STATUS(a1) |
| 83 | nor a3, $0, a3 |
| 84 | and a2, a3 |
| 85 | or a2, t1 |
| 86 | mtc0 a2, CP0_STATUS |
| 87 | move v0, a0 |
| 88 | jr ra |
| 89 | END(resume) |
| 90 | |
| 91 | /* |
| 92 | * void octeon_cop2_save(struct octeon_cop2_state *a0) |
| 93 | */ |
| 94 | .align 7 |
| 95 | .set push |
| 96 | .set noreorder |
| 97 | LEAF(octeon_cop2_save) |
| 98 | |
| 99 | dmfc0 t9, $9,7 /* CvmCtl register. */ |
| 100 | |
| 101 | /* Save the COP2 CRC state */ |
| 102 | dmfc2 t0, 0x0201 |
| 103 | dmfc2 t1, 0x0202 |
| 104 | dmfc2 t2, 0x0200 |
| 105 | sd t0, OCTEON_CP2_CRC_IV(a0) |
| 106 | sd t1, OCTEON_CP2_CRC_LENGTH(a0) |
| 107 | /* Skip next instructions if CvmCtl[NODFA_CP2] set */ |
| 108 | bbit1 t9, 28, 1f |
| 109 | sd t2, OCTEON_CP2_CRC_POLY(a0) |
| 110 | |
| 111 | /* Save the LLM state */ |
| 112 | dmfc2 t0, 0x0402 |
| 113 | dmfc2 t1, 0x040A |
| 114 | sd t0, OCTEON_CP2_LLM_DAT(a0) |
| 115 | |
| 116 | 1: bbit1 t9, 26, 3f /* done if CvmCtl[NOCRYPTO] set */ |
| 117 | sd t1, OCTEON_CP2_LLM_DAT+8(a0) |
| 118 | |
| 119 | /* Save the COP2 crypto state */ |
| 120 | /* this part is mostly common to both pass 1 and later revisions */ |
| 121 | dmfc2 t0, 0x0084 |
| 122 | dmfc2 t1, 0x0080 |
| 123 | dmfc2 t2, 0x0081 |
| 124 | dmfc2 t3, 0x0082 |
| 125 | sd t0, OCTEON_CP2_3DES_IV(a0) |
| 126 | dmfc2 t0, 0x0088 |
| 127 | sd t1, OCTEON_CP2_3DES_KEY(a0) |
| 128 | dmfc2 t1, 0x0111 /* only necessary for pass 1 */ |
| 129 | sd t2, OCTEON_CP2_3DES_KEY+8(a0) |
| 130 | dmfc2 t2, 0x0102 |
| 131 | sd t3, OCTEON_CP2_3DES_KEY+16(a0) |
| 132 | dmfc2 t3, 0x0103 |
| 133 | sd t0, OCTEON_CP2_3DES_RESULT(a0) |
| 134 | dmfc2 t0, 0x0104 |
| 135 | sd t1, OCTEON_CP2_AES_INP0(a0) /* only necessary for pass 1 */ |
| 136 | dmfc2 t1, 0x0105 |
| 137 | sd t2, OCTEON_CP2_AES_IV(a0) |
| 138 | dmfc2 t2, 0x0106 |
| 139 | sd t3, OCTEON_CP2_AES_IV+8(a0) |
| 140 | dmfc2 t3, 0x0107 |
| 141 | sd t0, OCTEON_CP2_AES_KEY(a0) |
| 142 | dmfc2 t0, 0x0110 |
| 143 | sd t1, OCTEON_CP2_AES_KEY+8(a0) |
| 144 | dmfc2 t1, 0x0100 |
| 145 | sd t2, OCTEON_CP2_AES_KEY+16(a0) |
| 146 | dmfc2 t2, 0x0101 |
| 147 | sd t3, OCTEON_CP2_AES_KEY+24(a0) |
| 148 | mfc0 v0, $15,0 /* Get the processor ID register */ |
| 149 | sd t0, OCTEON_CP2_AES_KEYLEN(a0) |
| 150 | li v1, 0x000d0000 /* This is the processor ID of Octeon Pass1 */ |
| 151 | sd t1, OCTEON_CP2_AES_RESULT(a0) |
| 152 | /* Skip to the Pass1 version of the remainder of the COP2 state */ |
| 153 | beq v0, v1, 2f |
| 154 | sd t2, OCTEON_CP2_AES_RESULT+8(a0) |
| 155 | |
| 156 | /* the non-pass1 state when !CvmCtl[NOCRYPTO] */ |
| 157 | dmfc2 t1, 0x0240 |
| 158 | dmfc2 t2, 0x0241 |
| 159 | ori v1, v1, 0x9500 /* lowest OCTEON III PrId*/ |
| 160 | dmfc2 t3, 0x0242 |
| 161 | subu v1, v0, v1 /* prid - lowest OCTEON III PrId */ |
| 162 | dmfc2 t0, 0x0243 |
| 163 | sd t1, OCTEON_CP2_HSH_DATW(a0) |
| 164 | dmfc2 t1, 0x0244 |
| 165 | sd t2, OCTEON_CP2_HSH_DATW+8(a0) |
| 166 | dmfc2 t2, 0x0245 |
| 167 | sd t3, OCTEON_CP2_HSH_DATW+16(a0) |
| 168 | dmfc2 t3, 0x0246 |
| 169 | sd t0, OCTEON_CP2_HSH_DATW+24(a0) |
| 170 | dmfc2 t0, 0x0247 |
| 171 | sd t1, OCTEON_CP2_HSH_DATW+32(a0) |
| 172 | dmfc2 t1, 0x0248 |
| 173 | sd t2, OCTEON_CP2_HSH_DATW+40(a0) |
| 174 | dmfc2 t2, 0x0249 |
| 175 | sd t3, OCTEON_CP2_HSH_DATW+48(a0) |
| 176 | dmfc2 t3, 0x024A |
| 177 | sd t0, OCTEON_CP2_HSH_DATW+56(a0) |
| 178 | dmfc2 t0, 0x024B |
| 179 | sd t1, OCTEON_CP2_HSH_DATW+64(a0) |
| 180 | dmfc2 t1, 0x024C |
| 181 | sd t2, OCTEON_CP2_HSH_DATW+72(a0) |
| 182 | dmfc2 t2, 0x024D |
| 183 | sd t3, OCTEON_CP2_HSH_DATW+80(a0) |
| 184 | dmfc2 t3, 0x024E |
| 185 | sd t0, OCTEON_CP2_HSH_DATW+88(a0) |
| 186 | dmfc2 t0, 0x0250 |
| 187 | sd t1, OCTEON_CP2_HSH_DATW+96(a0) |
| 188 | dmfc2 t1, 0x0251 |
| 189 | sd t2, OCTEON_CP2_HSH_DATW+104(a0) |
| 190 | dmfc2 t2, 0x0252 |
| 191 | sd t3, OCTEON_CP2_HSH_DATW+112(a0) |
| 192 | dmfc2 t3, 0x0253 |
| 193 | sd t0, OCTEON_CP2_HSH_IVW(a0) |
| 194 | dmfc2 t0, 0x0254 |
| 195 | sd t1, OCTEON_CP2_HSH_IVW+8(a0) |
| 196 | dmfc2 t1, 0x0255 |
| 197 | sd t2, OCTEON_CP2_HSH_IVW+16(a0) |
| 198 | dmfc2 t2, 0x0256 |
| 199 | sd t3, OCTEON_CP2_HSH_IVW+24(a0) |
| 200 | dmfc2 t3, 0x0257 |
| 201 | sd t0, OCTEON_CP2_HSH_IVW+32(a0) |
| 202 | dmfc2 t0, 0x0258 |
| 203 | sd t1, OCTEON_CP2_HSH_IVW+40(a0) |
| 204 | dmfc2 t1, 0x0259 |
| 205 | sd t2, OCTEON_CP2_HSH_IVW+48(a0) |
| 206 | dmfc2 t2, 0x025E |
| 207 | sd t3, OCTEON_CP2_HSH_IVW+56(a0) |
| 208 | dmfc2 t3, 0x025A |
| 209 | sd t0, OCTEON_CP2_GFM_MULT(a0) |
| 210 | dmfc2 t0, 0x025B |
| 211 | sd t1, OCTEON_CP2_GFM_MULT+8(a0) |
| 212 | sd t2, OCTEON_CP2_GFM_POLY(a0) |
| 213 | sd t3, OCTEON_CP2_GFM_RESULT(a0) |
| 214 | bltz v1, 4f |
| 215 | sd t0, OCTEON_CP2_GFM_RESULT+8(a0) |
| 216 | /* OCTEON III things*/ |
| 217 | dmfc2 t0, 0x024F |
| 218 | dmfc2 t1, 0x0050 |
| 219 | sd t0, OCTEON_CP2_SHA3(a0) |
| 220 | sd t1, OCTEON_CP2_SHA3+8(a0) |
| 221 | 4: |
| 222 | jr ra |
| 223 | nop |
| 224 | |
| 225 | 2: /* pass 1 special stuff when !CvmCtl[NOCRYPTO] */ |
| 226 | dmfc2 t3, 0x0040 |
| 227 | dmfc2 t0, 0x0041 |
| 228 | dmfc2 t1, 0x0042 |
| 229 | dmfc2 t2, 0x0043 |
| 230 | sd t3, OCTEON_CP2_HSH_DATW(a0) |
| 231 | dmfc2 t3, 0x0044 |
| 232 | sd t0, OCTEON_CP2_HSH_DATW+8(a0) |
| 233 | dmfc2 t0, 0x0045 |
| 234 | sd t1, OCTEON_CP2_HSH_DATW+16(a0) |
| 235 | dmfc2 t1, 0x0046 |
| 236 | sd t2, OCTEON_CP2_HSH_DATW+24(a0) |
| 237 | dmfc2 t2, 0x0048 |
| 238 | sd t3, OCTEON_CP2_HSH_DATW+32(a0) |
| 239 | dmfc2 t3, 0x0049 |
| 240 | sd t0, OCTEON_CP2_HSH_DATW+40(a0) |
| 241 | dmfc2 t0, 0x004A |
| 242 | sd t1, OCTEON_CP2_HSH_DATW+48(a0) |
| 243 | sd t2, OCTEON_CP2_HSH_IVW(a0) |
| 244 | sd t3, OCTEON_CP2_HSH_IVW+8(a0) |
| 245 | sd t0, OCTEON_CP2_HSH_IVW+16(a0) |
| 246 | |
| 247 | 3: /* pass 1 or CvmCtl[NOCRYPTO] set */ |
| 248 | jr ra |
| 249 | nop |
| 250 | END(octeon_cop2_save) |
| 251 | .set pop |
| 252 | |
| 253 | /* |
| 254 | * void octeon_cop2_restore(struct octeon_cop2_state *a0) |
| 255 | */ |
| 256 | .align 7 |
| 257 | .set push |
| 258 | .set noreorder |
| 259 | LEAF(octeon_cop2_restore) |
| 260 | /* First cache line was prefetched before the call */ |
| 261 | pref 4, 128(a0) |
| 262 | dmfc0 t9, $9,7 /* CvmCtl register. */ |
| 263 | |
| 264 | pref 4, 256(a0) |
| 265 | ld t0, OCTEON_CP2_CRC_IV(a0) |
| 266 | pref 4, 384(a0) |
| 267 | ld t1, OCTEON_CP2_CRC_LENGTH(a0) |
| 268 | ld t2, OCTEON_CP2_CRC_POLY(a0) |
| 269 | |
| 270 | /* Restore the COP2 CRC state */ |
| 271 | dmtc2 t0, 0x0201 |
| 272 | dmtc2 t1, 0x1202 |
| 273 | bbit1 t9, 28, 2f /* Skip LLM if CvmCtl[NODFA_CP2] is set */ |
| 274 | dmtc2 t2, 0x4200 |
| 275 | |
| 276 | /* Restore the LLM state */ |
| 277 | ld t0, OCTEON_CP2_LLM_DAT(a0) |
| 278 | ld t1, OCTEON_CP2_LLM_DAT+8(a0) |
| 279 | dmtc2 t0, 0x0402 |
| 280 | dmtc2 t1, 0x040A |
| 281 | |
| 282 | 2: |
| 283 | bbit1 t9, 26, done_restore /* done if CvmCtl[NOCRYPTO] set */ |
| 284 | nop |
| 285 | |
| 286 | /* Restore the COP2 crypto state common to pass 1 and pass 2 */ |
| 287 | ld t0, OCTEON_CP2_3DES_IV(a0) |
| 288 | ld t1, OCTEON_CP2_3DES_KEY(a0) |
| 289 | ld t2, OCTEON_CP2_3DES_KEY+8(a0) |
| 290 | dmtc2 t0, 0x0084 |
| 291 | ld t0, OCTEON_CP2_3DES_KEY+16(a0) |
| 292 | dmtc2 t1, 0x0080 |
| 293 | ld t1, OCTEON_CP2_3DES_RESULT(a0) |
| 294 | dmtc2 t2, 0x0081 |
| 295 | ld t2, OCTEON_CP2_AES_INP0(a0) /* only really needed for pass 1 */ |
| 296 | dmtc2 t0, 0x0082 |
| 297 | ld t0, OCTEON_CP2_AES_IV(a0) |
| 298 | dmtc2 t1, 0x0098 |
| 299 | ld t1, OCTEON_CP2_AES_IV+8(a0) |
| 300 | dmtc2 t2, 0x010A /* only really needed for pass 1 */ |
| 301 | ld t2, OCTEON_CP2_AES_KEY(a0) |
| 302 | dmtc2 t0, 0x0102 |
| 303 | ld t0, OCTEON_CP2_AES_KEY+8(a0) |
| 304 | dmtc2 t1, 0x0103 |
| 305 | ld t1, OCTEON_CP2_AES_KEY+16(a0) |
| 306 | dmtc2 t2, 0x0104 |
| 307 | ld t2, OCTEON_CP2_AES_KEY+24(a0) |
| 308 | dmtc2 t0, 0x0105 |
| 309 | ld t0, OCTEON_CP2_AES_KEYLEN(a0) |
| 310 | dmtc2 t1, 0x0106 |
| 311 | ld t1, OCTEON_CP2_AES_RESULT(a0) |
| 312 | dmtc2 t2, 0x0107 |
| 313 | ld t2, OCTEON_CP2_AES_RESULT+8(a0) |
| 314 | mfc0 t3, $15,0 /* Get the processor ID register */ |
| 315 | dmtc2 t0, 0x0110 |
| 316 | li v0, 0x000d0000 /* This is the processor ID of Octeon Pass1 */ |
| 317 | dmtc2 t1, 0x0100 |
| 318 | bne v0, t3, 3f /* Skip the next stuff for non-pass1 */ |
| 319 | dmtc2 t2, 0x0101 |
| 320 | |
| 321 | /* this code is specific for pass 1 */ |
| 322 | ld t0, OCTEON_CP2_HSH_DATW(a0) |
| 323 | ld t1, OCTEON_CP2_HSH_DATW+8(a0) |
| 324 | ld t2, OCTEON_CP2_HSH_DATW+16(a0) |
| 325 | dmtc2 t0, 0x0040 |
| 326 | ld t0, OCTEON_CP2_HSH_DATW+24(a0) |
| 327 | dmtc2 t1, 0x0041 |
| 328 | ld t1, OCTEON_CP2_HSH_DATW+32(a0) |
| 329 | dmtc2 t2, 0x0042 |
| 330 | ld t2, OCTEON_CP2_HSH_DATW+40(a0) |
| 331 | dmtc2 t0, 0x0043 |
| 332 | ld t0, OCTEON_CP2_HSH_DATW+48(a0) |
| 333 | dmtc2 t1, 0x0044 |
| 334 | ld t1, OCTEON_CP2_HSH_IVW(a0) |
| 335 | dmtc2 t2, 0x0045 |
| 336 | ld t2, OCTEON_CP2_HSH_IVW+8(a0) |
| 337 | dmtc2 t0, 0x0046 |
| 338 | ld t0, OCTEON_CP2_HSH_IVW+16(a0) |
| 339 | dmtc2 t1, 0x0048 |
| 340 | dmtc2 t2, 0x0049 |
| 341 | b done_restore /* unconditional branch */ |
| 342 | dmtc2 t0, 0x004A |
| 343 | |
| 344 | 3: /* this is post-pass1 code */ |
| 345 | ld t2, OCTEON_CP2_HSH_DATW(a0) |
| 346 | ori v0, v0, 0x9500 /* lowest OCTEON III PrId*/ |
| 347 | ld t0, OCTEON_CP2_HSH_DATW+8(a0) |
| 348 | ld t1, OCTEON_CP2_HSH_DATW+16(a0) |
| 349 | dmtc2 t2, 0x0240 |
| 350 | ld t2, OCTEON_CP2_HSH_DATW+24(a0) |
| 351 | dmtc2 t0, 0x0241 |
| 352 | ld t0, OCTEON_CP2_HSH_DATW+32(a0) |
| 353 | dmtc2 t1, 0x0242 |
| 354 | ld t1, OCTEON_CP2_HSH_DATW+40(a0) |
| 355 | dmtc2 t2, 0x0243 |
| 356 | ld t2, OCTEON_CP2_HSH_DATW+48(a0) |
| 357 | dmtc2 t0, 0x0244 |
| 358 | ld t0, OCTEON_CP2_HSH_DATW+56(a0) |
| 359 | dmtc2 t1, 0x0245 |
| 360 | ld t1, OCTEON_CP2_HSH_DATW+64(a0) |
| 361 | dmtc2 t2, 0x0246 |
| 362 | ld t2, OCTEON_CP2_HSH_DATW+72(a0) |
| 363 | dmtc2 t0, 0x0247 |
| 364 | ld t0, OCTEON_CP2_HSH_DATW+80(a0) |
| 365 | dmtc2 t1, 0x0248 |
| 366 | ld t1, OCTEON_CP2_HSH_DATW+88(a0) |
| 367 | dmtc2 t2, 0x0249 |
| 368 | ld t2, OCTEON_CP2_HSH_DATW+96(a0) |
| 369 | dmtc2 t0, 0x024A |
| 370 | ld t0, OCTEON_CP2_HSH_DATW+104(a0) |
| 371 | dmtc2 t1, 0x024B |
| 372 | ld t1, OCTEON_CP2_HSH_DATW+112(a0) |
| 373 | dmtc2 t2, 0x024C |
| 374 | ld t2, OCTEON_CP2_HSH_IVW(a0) |
| 375 | dmtc2 t0, 0x024D |
| 376 | ld t0, OCTEON_CP2_HSH_IVW+8(a0) |
| 377 | dmtc2 t1, 0x024E |
| 378 | ld t1, OCTEON_CP2_HSH_IVW+16(a0) |
| 379 | dmtc2 t2, 0x0250 |
| 380 | ld t2, OCTEON_CP2_HSH_IVW+24(a0) |
| 381 | dmtc2 t0, 0x0251 |
| 382 | ld t0, OCTEON_CP2_HSH_IVW+32(a0) |
| 383 | dmtc2 t1, 0x0252 |
| 384 | ld t1, OCTEON_CP2_HSH_IVW+40(a0) |
| 385 | dmtc2 t2, 0x0253 |
| 386 | ld t2, OCTEON_CP2_HSH_IVW+48(a0) |
| 387 | dmtc2 t0, 0x0254 |
| 388 | ld t0, OCTEON_CP2_HSH_IVW+56(a0) |
| 389 | dmtc2 t1, 0x0255 |
| 390 | ld t1, OCTEON_CP2_GFM_MULT(a0) |
| 391 | dmtc2 t2, 0x0256 |
| 392 | ld t2, OCTEON_CP2_GFM_MULT+8(a0) |
| 393 | dmtc2 t0, 0x0257 |
| 394 | ld t0, OCTEON_CP2_GFM_POLY(a0) |
| 395 | dmtc2 t1, 0x0258 |
| 396 | ld t1, OCTEON_CP2_GFM_RESULT(a0) |
| 397 | dmtc2 t2, 0x0259 |
| 398 | ld t2, OCTEON_CP2_GFM_RESULT+8(a0) |
| 399 | dmtc2 t0, 0x025E |
| 400 | subu v0, t3, v0 /* prid - lowest OCTEON III PrId */ |
| 401 | dmtc2 t1, 0x025A |
| 402 | bltz v0, done_restore |
| 403 | dmtc2 t2, 0x025B |
| 404 | /* OCTEON III things*/ |
| 405 | ld t0, OCTEON_CP2_SHA3(a0) |
| 406 | ld t1, OCTEON_CP2_SHA3+8(a0) |
| 407 | dmtc2 t0, 0x0051 |
| 408 | dmtc2 t1, 0x0050 |
| 409 | done_restore: |
| 410 | jr ra |
| 411 | nop |
| 412 | END(octeon_cop2_restore) |
| 413 | .set pop |
| 414 | |
| 415 | /* |
| 416 | * void octeon_mult_save() |
| 417 | * sp is assumed to point to a struct pt_regs |
| 418 | * |
| 419 | * NOTE: This is called in SAVE_TEMP in stackframe.h. It can |
| 420 | * safely modify v1,k0, k1,$10-$15, and $24. It will |
| 421 | * be overwritten with a processor specific version of the code. |
| 422 | */ |
| 423 | .p2align 7 |
| 424 | .set push |
| 425 | .set noreorder |
| 426 | LEAF(octeon_mult_save) |
| 427 | jr ra |
| 428 | nop |
| 429 | .space 30 * 4, 0 |
| 430 | octeon_mult_save_end: |
| 431 | EXPORT(octeon_mult_save_end) |
| 432 | END(octeon_mult_save) |
| 433 | |
| 434 | LEAF(octeon_mult_save2) |
| 435 | /* Save the multiplier state OCTEON II and earlier*/ |
| 436 | v3mulu k0, $0, $0 |
| 437 | v3mulu k1, $0, $0 |
| 438 | sd k0, PT_MTP(sp) /* PT_MTP has P0 */ |
| 439 | v3mulu k0, $0, $0 |
| 440 | sd k1, PT_MTP+8(sp) /* PT_MTP+8 has P1 */ |
| 441 | ori k1, $0, 1 |
| 442 | v3mulu k1, k1, $0 |
| 443 | sd k0, PT_MTP+16(sp) /* PT_MTP+16 has P2 */ |
| 444 | v3mulu k0, $0, $0 |
| 445 | sd k1, PT_MPL(sp) /* PT_MPL has MPL0 */ |
| 446 | v3mulu k1, $0, $0 |
| 447 | sd k0, PT_MPL+8(sp) /* PT_MPL+8 has MPL1 */ |
| 448 | jr ra |
| 449 | sd k1, PT_MPL+16(sp) /* PT_MPL+16 has MPL2 */ |
| 450 | octeon_mult_save2_end: |
| 451 | EXPORT(octeon_mult_save2_end) |
| 452 | END(octeon_mult_save2) |
| 453 | |
| 454 | LEAF(octeon_mult_save3) |
| 455 | /* Save the multiplier state OCTEON III */ |
| 456 | v3mulu $10, $0, $0 /* read P0 */ |
| 457 | v3mulu $11, $0, $0 /* read P1 */ |
| 458 | v3mulu $12, $0, $0 /* read P2 */ |
| 459 | sd $10, PT_MTP+(0*8)(sp) /* store P0 */ |
| 460 | v3mulu $10, $0, $0 /* read P3 */ |
| 461 | sd $11, PT_MTP+(1*8)(sp) /* store P1 */ |
| 462 | v3mulu $11, $0, $0 /* read P4 */ |
| 463 | sd $12, PT_MTP+(2*8)(sp) /* store P2 */ |
| 464 | ori $13, $0, 1 |
| 465 | v3mulu $12, $0, $0 /* read P5 */ |
| 466 | sd $10, PT_MTP+(3*8)(sp) /* store P3 */ |
| 467 | v3mulu $13, $13, $0 /* P4-P0 = MPL5-MPL1, $13 = MPL0 */ |
| 468 | sd $11, PT_MTP+(4*8)(sp) /* store P4 */ |
| 469 | v3mulu $10, $0, $0 /* read MPL1 */ |
| 470 | sd $12, PT_MTP+(5*8)(sp) /* store P5 */ |
| 471 | v3mulu $11, $0, $0 /* read MPL2 */ |
| 472 | sd $13, PT_MPL+(0*8)(sp) /* store MPL0 */ |
| 473 | v3mulu $12, $0, $0 /* read MPL3 */ |
| 474 | sd $10, PT_MPL+(1*8)(sp) /* store MPL1 */ |
| 475 | v3mulu $10, $0, $0 /* read MPL4 */ |
| 476 | sd $11, PT_MPL+(2*8)(sp) /* store MPL2 */ |
| 477 | v3mulu $11, $0, $0 /* read MPL5 */ |
| 478 | sd $12, PT_MPL+(3*8)(sp) /* store MPL3 */ |
| 479 | sd $10, PT_MPL+(4*8)(sp) /* store MPL4 */ |
| 480 | jr ra |
| 481 | sd $11, PT_MPL+(5*8)(sp) /* store MPL5 */ |
| 482 | octeon_mult_save3_end: |
| 483 | EXPORT(octeon_mult_save3_end) |
| 484 | END(octeon_mult_save3) |
| 485 | .set pop |
| 486 | |
| 487 | /* |
| 488 | * void octeon_mult_restore() |
| 489 | * sp is assumed to point to a struct pt_regs |
| 490 | * |
| 491 | * NOTE: This is called in RESTORE_TEMP in stackframe.h. |
| 492 | */ |
| 493 | .p2align 7 |
| 494 | .set push |
| 495 | .set noreorder |
| 496 | LEAF(octeon_mult_restore) |
| 497 | jr ra |
| 498 | nop |
| 499 | .space 30 * 4, 0 |
| 500 | octeon_mult_restore_end: |
| 501 | EXPORT(octeon_mult_restore_end) |
| 502 | END(octeon_mult_restore) |
| 503 | |
| 504 | LEAF(octeon_mult_restore2) |
| 505 | ld v0, PT_MPL(sp) /* MPL0 */ |
| 506 | ld v1, PT_MPL+8(sp) /* MPL1 */ |
| 507 | ld k0, PT_MPL+16(sp) /* MPL2 */ |
| 508 | /* Restore the multiplier state */ |
| 509 | ld k1, PT_MTP+16(sp) /* P2 */ |
| 510 | mtm0 v0 /* MPL0 */ |
| 511 | ld v0, PT_MTP+8(sp) /* P1 */ |
| 512 | mtm1 v1 /* MPL1 */ |
| 513 | ld v1, PT_MTP(sp) /* P0 */ |
| 514 | mtm2 k0 /* MPL2 */ |
| 515 | mtp2 k1 /* P2 */ |
| 516 | mtp1 v0 /* P1 */ |
| 517 | jr ra |
| 518 | mtp0 v1 /* P0 */ |
| 519 | octeon_mult_restore2_end: |
| 520 | EXPORT(octeon_mult_restore2_end) |
| 521 | END(octeon_mult_restore2) |
| 522 | |
| 523 | LEAF(octeon_mult_restore3) |
| 524 | ld $12, PT_MPL+(0*8)(sp) /* read MPL0 */ |
| 525 | ld $13, PT_MPL+(3*8)(sp) /* read MPL3 */ |
| 526 | ld $10, PT_MPL+(1*8)(sp) /* read MPL1 */ |
| 527 | ld $11, PT_MPL+(4*8)(sp) /* read MPL4 */ |
| 528 | .word 0x718d0008 |
| 529 | /* mtm0 $12, $13 restore MPL0 and MPL3 */ |
| 530 | ld $12, PT_MPL+(2*8)(sp) /* read MPL2 */ |
| 531 | .word 0x714b000c |
| 532 | /* mtm1 $10, $11 restore MPL1 and MPL4 */ |
| 533 | ld $13, PT_MPL+(5*8)(sp) /* read MPL5 */ |
| 534 | ld $10, PT_MTP+(0*8)(sp) /* read P0 */ |
| 535 | ld $11, PT_MTP+(3*8)(sp) /* read P3 */ |
| 536 | .word 0x718d000d |
| 537 | /* mtm2 $12, $13 restore MPL2 and MPL5 */ |
| 538 | ld $12, PT_MTP+(1*8)(sp) /* read P1 */ |
| 539 | .word 0x714b0009 |
| 540 | /* mtp0 $10, $11 restore P0 and P3 */ |
| 541 | ld $13, PT_MTP+(4*8)(sp) /* read P4 */ |
| 542 | ld $10, PT_MTP+(2*8)(sp) /* read P2 */ |
| 543 | ld $11, PT_MTP+(5*8)(sp) /* read P5 */ |
| 544 | .word 0x718d000a |
| 545 | /* mtp1 $12, $13 restore P1 and P4 */ |
| 546 | jr ra |
| 547 | .word 0x714b000b |
| 548 | /* mtp2 $10, $11 restore P2 and P5 */ |
| 549 | |
| 550 | octeon_mult_restore3_end: |
| 551 | EXPORT(octeon_mult_restore3_end) |
| 552 | END(octeon_mult_restore3) |
| 553 | .set pop |