123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503 |
- /*
- * This file is subject to the terms and conditions of the GNU General Public
- * License. See the file "COPYING" in the main directory of this archive
- * for more details.
- *
- * Copyright (C) 1994, 1995, 1996, 1998, 1999, 2002, 2003 Ralf Baechle
- * Copyright (C) 1996 David S. Miller (davem@davemloft.net)
- * Copyright (C) 1994, 1995, 1996, by Andreas Busse
- * Copyright (C) 1999 Silicon Graphics, Inc.
- * Copyright (C) 2000 MIPS Technologies, Inc.
- * written by Carsten Langgaard, carstenl@mips.com
- */
- #include <asm/asm.h>
- #include <asm/cachectl.h>
- #include <asm/fpregdef.h>
- #include <asm/mipsregs.h>
- #include <asm/asm-offsets.h>
- #include <asm/page.h>
- #include <asm/pgtable-bits.h>
- #include <asm/regdef.h>
- #include <asm/stackframe.h>
- #include <asm/thread_info.h>
- #include <asm/asmmacro.h>
- /*
- * Offset to the current process status flags, the first 32 bytes of the
- * stack are not used.
- */
- #define ST_OFF (_THREAD_SIZE - 32 - PT_SIZE + PT_STATUS)
- /*
- * task_struct *resume(task_struct *prev, task_struct *next,
- * struct thread_info *next_ti)
- */
- .align 7
- LEAF(resume)
- .set arch=octeon
- mfc0 t1, CP0_STATUS
- LONG_S t1, THREAD_STATUS(a0)
- cpu_save_nonscratch a0
- LONG_S ra, THREAD_REG31(a0)
- /* check if we need to save COP2 registers */
- PTR_L t2, TASK_THREAD_INFO(a0)
- LONG_L t0, ST_OFF(t2)
- bbit0 t0, 30, 1f
- /* Disable COP2 in the stored process state */
- li t1, ST0_CU2
- xor t0, t1
- LONG_S t0, ST_OFF(t2)
- /* Enable COP2 so we can save it */
- mfc0 t0, CP0_STATUS
- or t0, t1
- mtc0 t0, CP0_STATUS
- /* Save COP2 */
- daddu a0, THREAD_CP2
- jal octeon_cop2_save
- dsubu a0, THREAD_CP2
- /* Disable COP2 now that we are done */
- mfc0 t0, CP0_STATUS
- li t1, ST0_CU2
- xor t0, t1
- mtc0 t0, CP0_STATUS
- 1:
- #if CONFIG_CAVIUM_OCTEON_CVMSEG_SIZE > 0
- /* Check if we need to store CVMSEG state */
- mfc0 t0, $11,7 /* CvmMemCtl */
- bbit0 t0, 6, 3f /* Is user access enabled? */
- /* Store the CVMSEG state */
- /* Extract the size of CVMSEG */
- andi t0, 0x3f
- /* Multiply * (cache line size/sizeof(long)/2) */
- sll t0, 7-LONGLOG-1
- li t1, -32768 /* Base address of CVMSEG */
- LONG_ADDI t2, a0, THREAD_CVMSEG /* Where to store CVMSEG to */
- synciobdma
- 2:
- .set noreorder
- LONG_L t8, 0(t1) /* Load from CVMSEG */
- subu t0, 1 /* Decrement loop var */
- LONG_L t9, LONGSIZE(t1)/* Load from CVMSEG */
- LONG_ADDU t1, LONGSIZE*2 /* Increment loc in CVMSEG */
- LONG_S t8, 0(t2) /* Store CVMSEG to thread storage */
- LONG_ADDU t2, LONGSIZE*2 /* Increment loc in thread storage */
- bnez t0, 2b /* Loop until we've copied it all */
- LONG_S t9, -LONGSIZE(t2)/* Store CVMSEG to thread storage */
- .set reorder
- /* Disable access to CVMSEG */
- mfc0 t0, $11,7 /* CvmMemCtl */
- xori t0, t0, 0x40 /* Bit 6 is CVMSEG user enable */
- mtc0 t0, $11,7 /* CvmMemCtl */
- #endif
- 3:
- /*
- * The order of restoring the registers takes care of the race
- * updating $28, $29 and kernelsp without disabling ints.
- */
- move $28, a2
- cpu_restore_nonscratch a1
- #if (_THREAD_SIZE - 32) < 0x8000
- PTR_ADDIU t0, $28, _THREAD_SIZE - 32
- #else
- PTR_LI t0, _THREAD_SIZE - 32
- PTR_ADDU t0, $28
- #endif
- set_saved_sp t0, t1, t2
- mfc0 t1, CP0_STATUS /* Do we really need this? */
- li a3, 0xff01
- and t1, a3
- LONG_L a2, THREAD_STATUS(a1)
- nor a3, $0, a3
- and a2, a3
- or a2, t1
- mtc0 a2, CP0_STATUS
- move v0, a0
- jr ra
- END(resume)
- /*
- * void octeon_cop2_save(struct octeon_cop2_state *a0)
- */
- .align 7
- LEAF(octeon_cop2_save)
- dmfc0 t9, $9,7 /* CvmCtl register. */
- /* Save the COP2 CRC state */
- dmfc2 t0, 0x0201
- dmfc2 t1, 0x0202
- dmfc2 t2, 0x0200
- sd t0, OCTEON_CP2_CRC_IV(a0)
- sd t1, OCTEON_CP2_CRC_LENGTH(a0)
- sd t2, OCTEON_CP2_CRC_POLY(a0)
- /* Skip next instructions if CvmCtl[NODFA_CP2] set */
- bbit1 t9, 28, 1f
- /* Save the LLM state */
- dmfc2 t0, 0x0402
- dmfc2 t1, 0x040A
- sd t0, OCTEON_CP2_LLM_DAT(a0)
- sd t1, OCTEON_CP2_LLM_DAT+8(a0)
- 1: bbit1 t9, 26, 3f /* done if CvmCtl[NOCRYPTO] set */
- /* Save the COP2 crypto state */
- /* this part is mostly common to both pass 1 and later revisions */
- dmfc2 t0, 0x0084
- dmfc2 t1, 0x0080
- dmfc2 t2, 0x0081
- dmfc2 t3, 0x0082
- sd t0, OCTEON_CP2_3DES_IV(a0)
- dmfc2 t0, 0x0088
- sd t1, OCTEON_CP2_3DES_KEY(a0)
- dmfc2 t1, 0x0111 /* only necessary for pass 1 */
- sd t2, OCTEON_CP2_3DES_KEY+8(a0)
- dmfc2 t2, 0x0102
- sd t3, OCTEON_CP2_3DES_KEY+16(a0)
- dmfc2 t3, 0x0103
- sd t0, OCTEON_CP2_3DES_RESULT(a0)
- dmfc2 t0, 0x0104
- sd t1, OCTEON_CP2_AES_INP0(a0) /* only necessary for pass 1 */
- dmfc2 t1, 0x0105
- sd t2, OCTEON_CP2_AES_IV(a0)
- dmfc2 t2, 0x0106
- sd t3, OCTEON_CP2_AES_IV+8(a0)
- dmfc2 t3, 0x0107
- sd t0, OCTEON_CP2_AES_KEY(a0)
- dmfc2 t0, 0x0110
- sd t1, OCTEON_CP2_AES_KEY+8(a0)
- dmfc2 t1, 0x0100
- sd t2, OCTEON_CP2_AES_KEY+16(a0)
- dmfc2 t2, 0x0101
- sd t3, OCTEON_CP2_AES_KEY+24(a0)
- mfc0 t3, $15,0 /* Get the processor ID register */
- sd t0, OCTEON_CP2_AES_KEYLEN(a0)
- li t0, 0x000d0000 /* This is the processor ID of Octeon Pass1 */
- sd t1, OCTEON_CP2_AES_RESULT(a0)
- sd t2, OCTEON_CP2_AES_RESULT+8(a0)
- /* Skip to the Pass1 version of the remainder of the COP2 state */
- beq t3, t0, 2f
- /* the non-pass1 state when !CvmCtl[NOCRYPTO] */
- dmfc2 t1, 0x0240
- dmfc2 t2, 0x0241
- dmfc2 t3, 0x0242
- dmfc2 t0, 0x0243
- sd t1, OCTEON_CP2_HSH_DATW(a0)
- dmfc2 t1, 0x0244
- sd t2, OCTEON_CP2_HSH_DATW+8(a0)
- dmfc2 t2, 0x0245
- sd t3, OCTEON_CP2_HSH_DATW+16(a0)
- dmfc2 t3, 0x0246
- sd t0, OCTEON_CP2_HSH_DATW+24(a0)
- dmfc2 t0, 0x0247
- sd t1, OCTEON_CP2_HSH_DATW+32(a0)
- dmfc2 t1, 0x0248
- sd t2, OCTEON_CP2_HSH_DATW+40(a0)
- dmfc2 t2, 0x0249
- sd t3, OCTEON_CP2_HSH_DATW+48(a0)
- dmfc2 t3, 0x024A
- sd t0, OCTEON_CP2_HSH_DATW+56(a0)
- dmfc2 t0, 0x024B
- sd t1, OCTEON_CP2_HSH_DATW+64(a0)
- dmfc2 t1, 0x024C
- sd t2, OCTEON_CP2_HSH_DATW+72(a0)
- dmfc2 t2, 0x024D
- sd t3, OCTEON_CP2_HSH_DATW+80(a0)
- dmfc2 t3, 0x024E
- sd t0, OCTEON_CP2_HSH_DATW+88(a0)
- dmfc2 t0, 0x0250
- sd t1, OCTEON_CP2_HSH_DATW+96(a0)
- dmfc2 t1, 0x0251
- sd t2, OCTEON_CP2_HSH_DATW+104(a0)
- dmfc2 t2, 0x0252
- sd t3, OCTEON_CP2_HSH_DATW+112(a0)
- dmfc2 t3, 0x0253
- sd t0, OCTEON_CP2_HSH_IVW(a0)
- dmfc2 t0, 0x0254
- sd t1, OCTEON_CP2_HSH_IVW+8(a0)
- dmfc2 t1, 0x0255
- sd t2, OCTEON_CP2_HSH_IVW+16(a0)
- dmfc2 t2, 0x0256
- sd t3, OCTEON_CP2_HSH_IVW+24(a0)
- dmfc2 t3, 0x0257
- sd t0, OCTEON_CP2_HSH_IVW+32(a0)
- dmfc2 t0, 0x0258
- sd t1, OCTEON_CP2_HSH_IVW+40(a0)
- dmfc2 t1, 0x0259
- sd t2, OCTEON_CP2_HSH_IVW+48(a0)
- dmfc2 t2, 0x025E
- sd t3, OCTEON_CP2_HSH_IVW+56(a0)
- dmfc2 t3, 0x025A
- sd t0, OCTEON_CP2_GFM_MULT(a0)
- dmfc2 t0, 0x025B
- sd t1, OCTEON_CP2_GFM_MULT+8(a0)
- sd t2, OCTEON_CP2_GFM_POLY(a0)
- sd t3, OCTEON_CP2_GFM_RESULT(a0)
- sd t0, OCTEON_CP2_GFM_RESULT+8(a0)
- jr ra
- 2: /* pass 1 special stuff when !CvmCtl[NOCRYPTO] */
- dmfc2 t3, 0x0040
- dmfc2 t0, 0x0041
- dmfc2 t1, 0x0042
- dmfc2 t2, 0x0043
- sd t3, OCTEON_CP2_HSH_DATW(a0)
- dmfc2 t3, 0x0044
- sd t0, OCTEON_CP2_HSH_DATW+8(a0)
- dmfc2 t0, 0x0045
- sd t1, OCTEON_CP2_HSH_DATW+16(a0)
- dmfc2 t1, 0x0046
- sd t2, OCTEON_CP2_HSH_DATW+24(a0)
- dmfc2 t2, 0x0048
- sd t3, OCTEON_CP2_HSH_DATW+32(a0)
- dmfc2 t3, 0x0049
- sd t0, OCTEON_CP2_HSH_DATW+40(a0)
- dmfc2 t0, 0x004A
- sd t1, OCTEON_CP2_HSH_DATW+48(a0)
- sd t2, OCTEON_CP2_HSH_IVW(a0)
- sd t3, OCTEON_CP2_HSH_IVW+8(a0)
- sd t0, OCTEON_CP2_HSH_IVW+16(a0)
- 3: /* pass 1 or CvmCtl[NOCRYPTO] set */
- jr ra
- END(octeon_cop2_save)
- /*
- * void octeon_cop2_restore(struct octeon_cop2_state *a0)
- */
- .align 7
- .set push
- .set noreorder
- LEAF(octeon_cop2_restore)
- /* First cache line was prefetched before the call */
- pref 4, 128(a0)
- dmfc0 t9, $9,7 /* CvmCtl register. */
- pref 4, 256(a0)
- ld t0, OCTEON_CP2_CRC_IV(a0)
- pref 4, 384(a0)
- ld t1, OCTEON_CP2_CRC_LENGTH(a0)
- ld t2, OCTEON_CP2_CRC_POLY(a0)
- /* Restore the COP2 CRC state */
- dmtc2 t0, 0x0201
- dmtc2 t1, 0x1202
- bbit1 t9, 28, 2f /* Skip LLM if CvmCtl[NODFA_CP2] is set */
- dmtc2 t2, 0x4200
- /* Restore the LLM state */
- ld t0, OCTEON_CP2_LLM_DAT(a0)
- ld t1, OCTEON_CP2_LLM_DAT+8(a0)
- dmtc2 t0, 0x0402
- dmtc2 t1, 0x040A
- 2:
- bbit1 t9, 26, done_restore /* done if CvmCtl[NOCRYPTO] set */
- nop
- /* Restore the COP2 crypto state common to pass 1 and pass 2 */
- ld t0, OCTEON_CP2_3DES_IV(a0)
- ld t1, OCTEON_CP2_3DES_KEY(a0)
- ld t2, OCTEON_CP2_3DES_KEY+8(a0)
- dmtc2 t0, 0x0084
- ld t0, OCTEON_CP2_3DES_KEY+16(a0)
- dmtc2 t1, 0x0080
- ld t1, OCTEON_CP2_3DES_RESULT(a0)
- dmtc2 t2, 0x0081
- ld t2, OCTEON_CP2_AES_INP0(a0) /* only really needed for pass 1 */
- dmtc2 t0, 0x0082
- ld t0, OCTEON_CP2_AES_IV(a0)
- dmtc2 t1, 0x0098
- ld t1, OCTEON_CP2_AES_IV+8(a0)
- dmtc2 t2, 0x010A /* only really needed for pass 1 */
- ld t2, OCTEON_CP2_AES_KEY(a0)
- dmtc2 t0, 0x0102
- ld t0, OCTEON_CP2_AES_KEY+8(a0)
- dmtc2 t1, 0x0103
- ld t1, OCTEON_CP2_AES_KEY+16(a0)
- dmtc2 t2, 0x0104
- ld t2, OCTEON_CP2_AES_KEY+24(a0)
- dmtc2 t0, 0x0105
- ld t0, OCTEON_CP2_AES_KEYLEN(a0)
- dmtc2 t1, 0x0106
- ld t1, OCTEON_CP2_AES_RESULT(a0)
- dmtc2 t2, 0x0107
- ld t2, OCTEON_CP2_AES_RESULT+8(a0)
- mfc0 t3, $15,0 /* Get the processor ID register */
- dmtc2 t0, 0x0110
- li t0, 0x000d0000 /* This is the processor ID of Octeon Pass1 */
- dmtc2 t1, 0x0100
- bne t0, t3, 3f /* Skip the next stuff for non-pass1 */
- dmtc2 t2, 0x0101
- /* this code is specific for pass 1 */
- ld t0, OCTEON_CP2_HSH_DATW(a0)
- ld t1, OCTEON_CP2_HSH_DATW+8(a0)
- ld t2, OCTEON_CP2_HSH_DATW+16(a0)
- dmtc2 t0, 0x0040
- ld t0, OCTEON_CP2_HSH_DATW+24(a0)
- dmtc2 t1, 0x0041
- ld t1, OCTEON_CP2_HSH_DATW+32(a0)
- dmtc2 t2, 0x0042
- ld t2, OCTEON_CP2_HSH_DATW+40(a0)
- dmtc2 t0, 0x0043
- ld t0, OCTEON_CP2_HSH_DATW+48(a0)
- dmtc2 t1, 0x0044
- ld t1, OCTEON_CP2_HSH_IVW(a0)
- dmtc2 t2, 0x0045
- ld t2, OCTEON_CP2_HSH_IVW+8(a0)
- dmtc2 t0, 0x0046
- ld t0, OCTEON_CP2_HSH_IVW+16(a0)
- dmtc2 t1, 0x0048
- dmtc2 t2, 0x0049
- b done_restore /* unconditional branch */
- dmtc2 t0, 0x004A
- 3: /* this is post-pass1 code */
- ld t2, OCTEON_CP2_HSH_DATW(a0)
- ld t0, OCTEON_CP2_HSH_DATW+8(a0)
- ld t1, OCTEON_CP2_HSH_DATW+16(a0)
- dmtc2 t2, 0x0240
- ld t2, OCTEON_CP2_HSH_DATW+24(a0)
- dmtc2 t0, 0x0241
- ld t0, OCTEON_CP2_HSH_DATW+32(a0)
- dmtc2 t1, 0x0242
- ld t1, OCTEON_CP2_HSH_DATW+40(a0)
- dmtc2 t2, 0x0243
- ld t2, OCTEON_CP2_HSH_DATW+48(a0)
- dmtc2 t0, 0x0244
- ld t0, OCTEON_CP2_HSH_DATW+56(a0)
- dmtc2 t1, 0x0245
- ld t1, OCTEON_CP2_HSH_DATW+64(a0)
- dmtc2 t2, 0x0246
- ld t2, OCTEON_CP2_HSH_DATW+72(a0)
- dmtc2 t0, 0x0247
- ld t0, OCTEON_CP2_HSH_DATW+80(a0)
- dmtc2 t1, 0x0248
- ld t1, OCTEON_CP2_HSH_DATW+88(a0)
- dmtc2 t2, 0x0249
- ld t2, OCTEON_CP2_HSH_DATW+96(a0)
- dmtc2 t0, 0x024A
- ld t0, OCTEON_CP2_HSH_DATW+104(a0)
- dmtc2 t1, 0x024B
- ld t1, OCTEON_CP2_HSH_DATW+112(a0)
- dmtc2 t2, 0x024C
- ld t2, OCTEON_CP2_HSH_IVW(a0)
- dmtc2 t0, 0x024D
- ld t0, OCTEON_CP2_HSH_IVW+8(a0)
- dmtc2 t1, 0x024E
- ld t1, OCTEON_CP2_HSH_IVW+16(a0)
- dmtc2 t2, 0x0250
- ld t2, OCTEON_CP2_HSH_IVW+24(a0)
- dmtc2 t0, 0x0251
- ld t0, OCTEON_CP2_HSH_IVW+32(a0)
- dmtc2 t1, 0x0252
- ld t1, OCTEON_CP2_HSH_IVW+40(a0)
- dmtc2 t2, 0x0253
- ld t2, OCTEON_CP2_HSH_IVW+48(a0)
- dmtc2 t0, 0x0254
- ld t0, OCTEON_CP2_HSH_IVW+56(a0)
- dmtc2 t1, 0x0255
- ld t1, OCTEON_CP2_GFM_MULT(a0)
- dmtc2 t2, 0x0256
- ld t2, OCTEON_CP2_GFM_MULT+8(a0)
- dmtc2 t0, 0x0257
- ld t0, OCTEON_CP2_GFM_POLY(a0)
- dmtc2 t1, 0x0258
- ld t1, OCTEON_CP2_GFM_RESULT(a0)
- dmtc2 t2, 0x0259
- ld t2, OCTEON_CP2_GFM_RESULT+8(a0)
- dmtc2 t0, 0x025E
- dmtc2 t1, 0x025A
- dmtc2 t2, 0x025B
- done_restore:
- jr ra
- nop
- END(octeon_cop2_restore)
- .set pop
- /*
- * void octeon_mult_save()
- * sp is assumed to point to a struct pt_regs
- *
- * NOTE: This is called in SAVE_SOME in stackframe.h. It can only
- * safely modify k0 and k1.
- */
- .align 7
- .set push
- .set noreorder
- LEAF(octeon_mult_save)
- dmfc0 k0, $9,7 /* CvmCtl register. */
- bbit1 k0, 27, 1f /* Skip CvmCtl[NOMUL] */
- nop
- /* Save the multiplier state */
- v3mulu k0, $0, $0
- v3mulu k1, $0, $0
- sd k0, PT_MTP(sp) /* PT_MTP has P0 */
- v3mulu k0, $0, $0
- sd k1, PT_MTP+8(sp) /* PT_MTP+8 has P1 */
- ori k1, $0, 1
- v3mulu k1, k1, $0
- sd k0, PT_MTP+16(sp) /* PT_MTP+16 has P2 */
- v3mulu k0, $0, $0
- sd k1, PT_MPL(sp) /* PT_MPL has MPL0 */
- v3mulu k1, $0, $0
- sd k0, PT_MPL+8(sp) /* PT_MPL+8 has MPL1 */
- jr ra
- sd k1, PT_MPL+16(sp) /* PT_MPL+16 has MPL2 */
- 1: /* Resume here if CvmCtl[NOMUL] */
- jr ra
- END(octeon_mult_save)
- .set pop
- /*
- * void octeon_mult_restore()
- * sp is assumed to point to a struct pt_regs
- *
- * NOTE: This is called in RESTORE_SOME in stackframe.h.
- */
- .align 7
- .set push
- .set noreorder
- LEAF(octeon_mult_restore)
- dmfc0 k1, $9,7 /* CvmCtl register. */
- ld v0, PT_MPL(sp) /* MPL0 */
- ld v1, PT_MPL+8(sp) /* MPL1 */
- ld k0, PT_MPL+16(sp) /* MPL2 */
- bbit1 k1, 27, 1f /* Skip CvmCtl[NOMUL] */
- /* Normally falls through, so no time wasted here */
- nop
- /* Restore the multiplier state */
- ld k1, PT_MTP+16(sp) /* P2 */
- MTM0 v0 /* MPL0 */
- ld v0, PT_MTP+8(sp) /* P1 */
- MTM1 v1 /* MPL1 */
- ld v1, PT_MTP(sp) /* P0 */
- MTM2 k0 /* MPL2 */
- MTP2 k1 /* P2 */
- MTP1 v0 /* P1 */
- jr ra
- MTP0 v1 /* P0 */
- 1: /* Resume here if CvmCtl[NOMUL] */
- jr ra
- nop
- END(octeon_mult_restore)
- .set pop
|