123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337 |
- /*
- * spu_restore.c
- *
- * (C) Copyright IBM Corp. 2005
- *
- * SPU-side context restore sequence outlined in
- * Synergistic Processor Element Book IV
- *
- * Author: Mark Nutter <mnutter@us.ibm.com>
- *
- * This program is free software; you can redistribute it and/or modify
- * it under the terms of the GNU General Public License as published by
- * the Free Software Foundation; either version 2, or (at your option)
- * any later version.
- *
- * This program is distributed in the hope that it will be useful,
- * but WITHOUT ANY WARRANTY; without even the implied warranty of
- * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
- * GNU General Public License for more details.
- *
- * You should have received a copy of the GNU General Public License
- * along with this program; if not, write to the Free Software
- * Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
- *
- */
- #ifndef LS_SIZE
- #define LS_SIZE 0x40000 /* 256K (in bytes) */
- #endif
- typedef unsigned int u32;
- typedef unsigned long long u64;
- #include <spu_intrinsics.h>
- #include <asm/spu_csa.h>
- #include "spu_utils.h"
- #define BR_INSTR 0x327fff80 /* br -4 */
- #define NOP_INSTR 0x40200000 /* nop */
- #define HEQ_INSTR 0x7b000000 /* heq $0, $0 */
- #define STOP_INSTR 0x00000000 /* stop 0x0 */
- #define ILLEGAL_INSTR 0x00800000 /* illegal instr */
- #define RESTORE_COMPLETE 0x00003ffc /* stop 0x3ffc */
- static inline void fetch_regs_from_mem(addr64 lscsa_ea)
- {
- unsigned int ls = (unsigned int)®s_spill[0];
- unsigned int size = sizeof(regs_spill);
- unsigned int tag_id = 0;
- unsigned int cmd = 0x40; /* GET */
- spu_writech(MFC_LSA, ls);
- spu_writech(MFC_EAH, lscsa_ea.ui[0]);
- spu_writech(MFC_EAL, lscsa_ea.ui[1]);
- spu_writech(MFC_Size, size);
- spu_writech(MFC_TagID, tag_id);
- spu_writech(MFC_Cmd, cmd);
- }
- static inline void restore_upper_240kb(addr64 lscsa_ea)
- {
- unsigned int ls = 16384;
- unsigned int list = (unsigned int)&dma_list[0];
- unsigned int size = sizeof(dma_list);
- unsigned int tag_id = 0;
- unsigned int cmd = 0x44; /* GETL */
- /* Restore, Step 4:
- * Enqueue the GETL command (tag 0) to the MFC SPU command
- * queue to transfer the upper 240 kb of LS from CSA.
- */
- spu_writech(MFC_LSA, ls);
- spu_writech(MFC_EAH, lscsa_ea.ui[0]);
- spu_writech(MFC_EAL, list);
- spu_writech(MFC_Size, size);
- spu_writech(MFC_TagID, tag_id);
- spu_writech(MFC_Cmd, cmd);
- }
- static inline void restore_decr(void)
- {
- unsigned int offset;
- unsigned int decr_running;
- unsigned int decr;
- /* Restore, Step 6(moved):
- * If the LSCSA "decrementer running" flag is set
- * then write the SPU_WrDec channel with the
- * decrementer value from LSCSA.
- */
- offset = LSCSA_QW_OFFSET(decr_status);
- decr_running = regs_spill[offset].slot[0] & SPU_DECR_STATUS_RUNNING;
- if (decr_running) {
- offset = LSCSA_QW_OFFSET(decr);
- decr = regs_spill[offset].slot[0];
- spu_writech(SPU_WrDec, decr);
- }
- }
- static inline void write_ppu_mb(void)
- {
- unsigned int offset;
- unsigned int data;
- /* Restore, Step 11:
- * Write the MFC_WrOut_MB channel with the PPU_MB
- * data from LSCSA.
- */
- offset = LSCSA_QW_OFFSET(ppu_mb);
- data = regs_spill[offset].slot[0];
- spu_writech(SPU_WrOutMbox, data);
- }
- static inline void write_ppuint_mb(void)
- {
- unsigned int offset;
- unsigned int data;
- /* Restore, Step 12:
- * Write the MFC_WrInt_MB channel with the PPUINT_MB
- * data from LSCSA.
- */
- offset = LSCSA_QW_OFFSET(ppuint_mb);
- data = regs_spill[offset].slot[0];
- spu_writech(SPU_WrOutIntrMbox, data);
- }
- static inline void restore_fpcr(void)
- {
- unsigned int offset;
- vector unsigned int fpcr;
- /* Restore, Step 13:
- * Restore the floating-point status and control
- * register from the LSCSA.
- */
- offset = LSCSA_QW_OFFSET(fpcr);
- fpcr = regs_spill[offset].v;
- spu_mtfpscr(fpcr);
- }
- static inline void restore_srr0(void)
- {
- unsigned int offset;
- unsigned int srr0;
- /* Restore, Step 14:
- * Restore the SPU SRR0 data from the LSCSA.
- */
- offset = LSCSA_QW_OFFSET(srr0);
- srr0 = regs_spill[offset].slot[0];
- spu_writech(SPU_WrSRR0, srr0);
- }
- static inline void restore_event_mask(void)
- {
- unsigned int offset;
- unsigned int event_mask;
- /* Restore, Step 15:
- * Restore the SPU_RdEventMsk data from the LSCSA.
- */
- offset = LSCSA_QW_OFFSET(event_mask);
- event_mask = regs_spill[offset].slot[0];
- spu_writech(SPU_WrEventMask, event_mask);
- }
- static inline void restore_tag_mask(void)
- {
- unsigned int offset;
- unsigned int tag_mask;
- /* Restore, Step 16:
- * Restore the SPU_RdTagMsk data from the LSCSA.
- */
- offset = LSCSA_QW_OFFSET(tag_mask);
- tag_mask = regs_spill[offset].slot[0];
- spu_writech(MFC_WrTagMask, tag_mask);
- }
- static inline void restore_complete(void)
- {
- extern void exit_fini(void);
- unsigned int *exit_instrs = (unsigned int *)exit_fini;
- unsigned int offset;
- unsigned int stopped_status;
- unsigned int stopped_code;
- /* Restore, Step 18:
- * Issue a stop-and-signal instruction with
- * "good context restore" signal value.
- *
- * Restore, Step 19:
- * There may be additional instructions placed
- * here by the PPE Sequence for SPU Context
- * Restore in order to restore the correct
- * "stopped state".
- *
- * This step is handled here by analyzing the
- * LSCSA.stopped_status and then modifying the
- * exit() function to behave appropriately.
- */
- offset = LSCSA_QW_OFFSET(stopped_status);
- stopped_status = regs_spill[offset].slot[0];
- stopped_code = regs_spill[offset].slot[1];
- switch (stopped_status) {
- case SPU_STOPPED_STATUS_P_I:
- /* SPU_Status[P,I]=1. Add illegal instruction
- * followed by stop-and-signal instruction after
- * end of restore code.
- */
- exit_instrs[0] = RESTORE_COMPLETE;
- exit_instrs[1] = ILLEGAL_INSTR;
- exit_instrs[2] = STOP_INSTR | stopped_code;
- break;
- case SPU_STOPPED_STATUS_P_H:
- /* SPU_Status[P,H]=1. Add 'heq $0, $0' followed
- * by stop-and-signal instruction after end of
- * restore code.
- */
- exit_instrs[0] = RESTORE_COMPLETE;
- exit_instrs[1] = HEQ_INSTR;
- exit_instrs[2] = STOP_INSTR | stopped_code;
- break;
- case SPU_STOPPED_STATUS_S_P:
- /* SPU_Status[S,P]=1. Add nop instruction
- * followed by 'br -4' after end of restore
- * code.
- */
- exit_instrs[0] = RESTORE_COMPLETE;
- exit_instrs[1] = STOP_INSTR | stopped_code;
- exit_instrs[2] = NOP_INSTR;
- exit_instrs[3] = BR_INSTR;
- break;
- case SPU_STOPPED_STATUS_S_I:
- /* SPU_Status[S,I]=1. Add illegal instruction
- * followed by 'br -4' after end of restore code.
- */
- exit_instrs[0] = RESTORE_COMPLETE;
- exit_instrs[1] = ILLEGAL_INSTR;
- exit_instrs[2] = NOP_INSTR;
- exit_instrs[3] = BR_INSTR;
- break;
- case SPU_STOPPED_STATUS_I:
- /* SPU_Status[I]=1. Add illegal instruction followed
- * by infinite loop after end of restore sequence.
- */
- exit_instrs[0] = RESTORE_COMPLETE;
- exit_instrs[1] = ILLEGAL_INSTR;
- exit_instrs[2] = NOP_INSTR;
- exit_instrs[3] = BR_INSTR;
- break;
- case SPU_STOPPED_STATUS_S:
- /* SPU_Status[S]=1. Add two 'nop' instructions. */
- exit_instrs[0] = RESTORE_COMPLETE;
- exit_instrs[1] = NOP_INSTR;
- exit_instrs[2] = NOP_INSTR;
- exit_instrs[3] = BR_INSTR;
- break;
- case SPU_STOPPED_STATUS_H:
- /* SPU_Status[H]=1. Add 'heq $0, $0' instruction
- * after end of restore code.
- */
- exit_instrs[0] = RESTORE_COMPLETE;
- exit_instrs[1] = HEQ_INSTR;
- exit_instrs[2] = NOP_INSTR;
- exit_instrs[3] = BR_INSTR;
- break;
- case SPU_STOPPED_STATUS_P:
- /* SPU_Status[P]=1. Add stop-and-signal instruction
- * after end of restore code.
- */
- exit_instrs[0] = RESTORE_COMPLETE;
- exit_instrs[1] = STOP_INSTR | stopped_code;
- break;
- case SPU_STOPPED_STATUS_R:
- /* SPU_Status[I,S,H,P,R]=0. Add infinite loop. */
- exit_instrs[0] = RESTORE_COMPLETE;
- exit_instrs[1] = NOP_INSTR;
- exit_instrs[2] = NOP_INSTR;
- exit_instrs[3] = BR_INSTR;
- break;
- default:
- /* SPU_Status[R]=1. No additional instructions. */
- break;
- }
- spu_sync();
- }
- /**
- * main - entry point for SPU-side context restore.
- *
- * This code deviates from the documented sequence in the
- * following aspects:
- *
- * 1. The EA for LSCSA is passed from PPE in the
- * signal notification channels.
- * 2. The register spill area is pulled by SPU
- * into LS, rather than pushed by PPE.
- * 3. All 128 registers are restored by exit().
- * 4. The exit() function is modified at run
- * time in order to properly restore the
- * SPU_Status register.
- */
- int main()
- {
- addr64 lscsa_ea;
- lscsa_ea.ui[0] = spu_readch(SPU_RdSigNotify1);
- lscsa_ea.ui[1] = spu_readch(SPU_RdSigNotify2);
- fetch_regs_from_mem(lscsa_ea);
- set_event_mask(); /* Step 1. */
- set_tag_mask(); /* Step 2. */
- build_dma_list(lscsa_ea); /* Step 3. */
- restore_upper_240kb(lscsa_ea); /* Step 4. */
- /* Step 5: done by 'exit'. */
- enqueue_putllc(lscsa_ea); /* Step 7. */
- set_tag_update(); /* Step 8. */
- read_tag_status(); /* Step 9. */
- restore_decr(); /* moved Step 6. */
- read_llar_status(); /* Step 10. */
- write_ppu_mb(); /* Step 11. */
- write_ppuint_mb(); /* Step 12. */
- restore_fpcr(); /* Step 13. */
- restore_srr0(); /* Step 14. */
- restore_event_mask(); /* Step 15. */
- restore_tag_mask(); /* Step 16. */
- /* Step 17. done by 'exit'. */
- restore_complete(); /* Step 18. */
- return 0;
- }
|