1*4882a593Smuzhiyun /* SPDX-License-Identifier: GPL-2.0 */ 2*4882a593Smuzhiyun #ifndef __SPARC_SWITCH_TO_H 3*4882a593Smuzhiyun #define __SPARC_SWITCH_TO_H 4*4882a593Smuzhiyun 5*4882a593Smuzhiyun #include <asm/smp.h> 6*4882a593Smuzhiyun 7*4882a593Smuzhiyun extern struct thread_info *current_set[NR_CPUS]; 8*4882a593Smuzhiyun 9*4882a593Smuzhiyun /* 10*4882a593Smuzhiyun * Flush windows so that the VM switch which follows 11*4882a593Smuzhiyun * would not pull the stack from under us. 12*4882a593Smuzhiyun * 13*4882a593Smuzhiyun * SWITCH_ENTER and SWITCH_DO_LAZY_FPU do not work yet (e.g. SMP does not work) 14*4882a593Smuzhiyun * XXX WTF is the above comment? Found in late teen 2.4.x. 15*4882a593Smuzhiyun */ 16*4882a593Smuzhiyun #ifdef CONFIG_SMP 17*4882a593Smuzhiyun #define SWITCH_ENTER(prv) \ 18*4882a593Smuzhiyun do { \ 19*4882a593Smuzhiyun if (test_tsk_thread_flag(prv, TIF_USEDFPU)) { \ 20*4882a593Smuzhiyun put_psr(get_psr() | PSR_EF); \ 21*4882a593Smuzhiyun fpsave(&(prv)->thread.float_regs[0], &(prv)->thread.fsr, \ 22*4882a593Smuzhiyun &(prv)->thread.fpqueue[0], &(prv)->thread.fpqdepth); \ 23*4882a593Smuzhiyun clear_tsk_thread_flag(prv, TIF_USEDFPU); \ 24*4882a593Smuzhiyun (prv)->thread.kregs->psr &= ~PSR_EF; \ 25*4882a593Smuzhiyun } \ 26*4882a593Smuzhiyun } while(0) 27*4882a593Smuzhiyun 28*4882a593Smuzhiyun #define SWITCH_DO_LAZY_FPU(next) /* */ 29*4882a593Smuzhiyun #else 30*4882a593Smuzhiyun #define SWITCH_ENTER(prv) /* */ 31*4882a593Smuzhiyun #define SWITCH_DO_LAZY_FPU(nxt) \ 32*4882a593Smuzhiyun do { \ 33*4882a593Smuzhiyun if (last_task_used_math != (nxt)) \ 34*4882a593Smuzhiyun (nxt)->thread.kregs->psr&=~PSR_EF; \ 35*4882a593Smuzhiyun } while(0) 36*4882a593Smuzhiyun #endif 37*4882a593Smuzhiyun 38*4882a593Smuzhiyun #define prepare_arch_switch(next) do { \ 39*4882a593Smuzhiyun __asm__ __volatile__( \ 40*4882a593Smuzhiyun ".globl\tflush_patch_switch\nflush_patch_switch:\n\t" \ 41*4882a593Smuzhiyun "save %sp, -0x40, %sp; save %sp, -0x40, %sp; save %sp, -0x40, %sp\n\t" \ 42*4882a593Smuzhiyun "save %sp, -0x40, %sp; save %sp, -0x40, %sp; save %sp, -0x40, %sp\n\t" \ 43*4882a593Smuzhiyun "save %sp, -0x40, %sp\n\t" \ 44*4882a593Smuzhiyun "restore; restore; restore; restore; restore; restore; restore"); \ 45*4882a593Smuzhiyun } while(0) 46*4882a593Smuzhiyun 47*4882a593Smuzhiyun /* Much care has gone into this code, do not touch it. 48*4882a593Smuzhiyun * 49*4882a593Smuzhiyun * We need to loadup regs l0/l1 for the newly forked child 50*4882a593Smuzhiyun * case because the trap return path relies on those registers 51*4882a593Smuzhiyun * holding certain values, gcc is told that they are clobbered. 52*4882a593Smuzhiyun * Gcc needs registers for 3 values in and 1 value out, so we 53*4882a593Smuzhiyun * clobber every non-fixed-usage register besides l2/l3/o4/o5. -DaveM 54*4882a593Smuzhiyun * 55*4882a593Smuzhiyun * Hey Dave, that do not touch sign is too much of an incentive 56*4882a593Smuzhiyun * - Anton & Pete 57*4882a593Smuzhiyun */ 58*4882a593Smuzhiyun #define switch_to(prev, next, last) do { \ 59*4882a593Smuzhiyun SWITCH_ENTER(prev); \ 60*4882a593Smuzhiyun SWITCH_DO_LAZY_FPU(next); \ 61*4882a593Smuzhiyun cpumask_set_cpu(smp_processor_id(), mm_cpumask(next->active_mm)); \ 62*4882a593Smuzhiyun __asm__ __volatile__( \ 63*4882a593Smuzhiyun "sethi %%hi(here - 0x8), %%o7\n\t" \ 64*4882a593Smuzhiyun "mov %%g6, %%g3\n\t" \ 65*4882a593Smuzhiyun "or %%o7, %%lo(here - 0x8), %%o7\n\t" \ 66*4882a593Smuzhiyun "rd %%psr, %%g4\n\t" \ 67*4882a593Smuzhiyun "std %%sp, [%%g6 + %4]\n\t" \ 68*4882a593Smuzhiyun "rd %%wim, %%g5\n\t" \ 69*4882a593Smuzhiyun "wr %%g4, 0x20, %%psr\n\t" \ 70*4882a593Smuzhiyun "nop\n\t" \ 71*4882a593Smuzhiyun "std %%g4, [%%g6 + %3]\n\t" \ 72*4882a593Smuzhiyun "ldd [%2 + %3], %%g4\n\t" \ 73*4882a593Smuzhiyun "mov %2, %%g6\n\t" \ 74*4882a593Smuzhiyun ".globl patchme_store_new_current\n" \ 75*4882a593Smuzhiyun "patchme_store_new_current:\n\t" \ 76*4882a593Smuzhiyun "st %2, [%1]\n\t" \ 77*4882a593Smuzhiyun "wr %%g4, 0x20, %%psr\n\t" \ 78*4882a593Smuzhiyun "nop\n\t" \ 79*4882a593Smuzhiyun "nop\n\t" \ 80*4882a593Smuzhiyun "nop\n\t" /* LEON needs all 3 nops: load to %sp depends on CWP. */ \ 81*4882a593Smuzhiyun "ldd [%%g6 + %4], %%sp\n\t" \ 82*4882a593Smuzhiyun "wr %%g5, 0x0, %%wim\n\t" \ 83*4882a593Smuzhiyun "ldd [%%sp + 0x00], %%l0\n\t" \ 84*4882a593Smuzhiyun "ldd [%%sp + 0x38], %%i6\n\t" \ 85*4882a593Smuzhiyun "wr %%g4, 0x0, %%psr\n\t" \ 86*4882a593Smuzhiyun "nop\n\t" \ 87*4882a593Smuzhiyun "nop\n\t" \ 88*4882a593Smuzhiyun "jmpl %%o7 + 0x8, %%g0\n\t" \ 89*4882a593Smuzhiyun " ld [%%g3 + %5], %0\n\t" \ 90*4882a593Smuzhiyun "here:\n" \ 91*4882a593Smuzhiyun : "=&r" (last) \ 92*4882a593Smuzhiyun : "r" (&(current_set[hard_smp_processor_id()])), \ 93*4882a593Smuzhiyun "r" (task_thread_info(next)), \ 94*4882a593Smuzhiyun "i" (TI_KPSR), \ 95*4882a593Smuzhiyun "i" (TI_KSP), \ 96*4882a593Smuzhiyun "i" (TI_TASK) \ 97*4882a593Smuzhiyun : "g1", "g2", "g3", "g4", "g5", "g7", \ 98*4882a593Smuzhiyun "l0", "l1", "l3", "l4", "l5", "l6", "l7", \ 99*4882a593Smuzhiyun "i0", "i1", "i2", "i3", "i4", "i5", \ 100*4882a593Smuzhiyun "o0", "o1", "o2", "o3", "o7"); \ 101*4882a593Smuzhiyun } while(0) 102*4882a593Smuzhiyun 103*4882a593Smuzhiyun void fpsave(unsigned long *fpregs, unsigned long *fsr, 104*4882a593Smuzhiyun void *fpqueue, unsigned long *fpqdepth); 105*4882a593Smuzhiyun void synchronize_user_stack(void); 106*4882a593Smuzhiyun 107*4882a593Smuzhiyun #endif /* __SPARC_SWITCH_TO_H */ 108