xref: /OK3568_Linux_fs/kernel/arch/sparc/include/asm/switch_to_32.h (revision 4882a59341e53eb6f0b4789bf948001014eff981)
1*4882a593Smuzhiyun /* SPDX-License-Identifier: GPL-2.0 */
2*4882a593Smuzhiyun #ifndef __SPARC_SWITCH_TO_H
3*4882a593Smuzhiyun #define __SPARC_SWITCH_TO_H
4*4882a593Smuzhiyun 
5*4882a593Smuzhiyun #include <asm/smp.h>
6*4882a593Smuzhiyun 
7*4882a593Smuzhiyun extern struct thread_info *current_set[NR_CPUS];
8*4882a593Smuzhiyun 
9*4882a593Smuzhiyun /*
10*4882a593Smuzhiyun  * Flush windows so that the VM switch which follows
11*4882a593Smuzhiyun  * would not pull the stack from under us.
12*4882a593Smuzhiyun  *
13*4882a593Smuzhiyun  * SWITCH_ENTER and SWITCH_DO_LAZY_FPU do not work yet (e.g. SMP does not work)
14*4882a593Smuzhiyun  * XXX WTF is the above comment? Found in late teen 2.4.x.
15*4882a593Smuzhiyun  */
16*4882a593Smuzhiyun #ifdef CONFIG_SMP
17*4882a593Smuzhiyun #define SWITCH_ENTER(prv) \
18*4882a593Smuzhiyun 	do {			\
19*4882a593Smuzhiyun 	if (test_tsk_thread_flag(prv, TIF_USEDFPU)) { \
20*4882a593Smuzhiyun 		put_psr(get_psr() | PSR_EF); \
21*4882a593Smuzhiyun 		fpsave(&(prv)->thread.float_regs[0], &(prv)->thread.fsr, \
22*4882a593Smuzhiyun 		       &(prv)->thread.fpqueue[0], &(prv)->thread.fpqdepth); \
23*4882a593Smuzhiyun 		clear_tsk_thread_flag(prv, TIF_USEDFPU); \
24*4882a593Smuzhiyun 		(prv)->thread.kregs->psr &= ~PSR_EF; \
25*4882a593Smuzhiyun 	} \
26*4882a593Smuzhiyun 	} while(0)
27*4882a593Smuzhiyun 
28*4882a593Smuzhiyun #define SWITCH_DO_LAZY_FPU(next)	/* */
29*4882a593Smuzhiyun #else
30*4882a593Smuzhiyun #define SWITCH_ENTER(prv)		/* */
31*4882a593Smuzhiyun #define SWITCH_DO_LAZY_FPU(nxt)	\
32*4882a593Smuzhiyun 	do {			\
33*4882a593Smuzhiyun 	if (last_task_used_math != (nxt))		\
34*4882a593Smuzhiyun 		(nxt)->thread.kregs->psr&=~PSR_EF;	\
35*4882a593Smuzhiyun 	} while(0)
36*4882a593Smuzhiyun #endif
37*4882a593Smuzhiyun 
38*4882a593Smuzhiyun #define prepare_arch_switch(next) do { \
39*4882a593Smuzhiyun 	__asm__ __volatile__( \
40*4882a593Smuzhiyun 	".globl\tflush_patch_switch\nflush_patch_switch:\n\t" \
41*4882a593Smuzhiyun 	"save %sp, -0x40, %sp; save %sp, -0x40, %sp; save %sp, -0x40, %sp\n\t" \
42*4882a593Smuzhiyun 	"save %sp, -0x40, %sp; save %sp, -0x40, %sp; save %sp, -0x40, %sp\n\t" \
43*4882a593Smuzhiyun 	"save %sp, -0x40, %sp\n\t" \
44*4882a593Smuzhiyun 	"restore; restore; restore; restore; restore; restore; restore"); \
45*4882a593Smuzhiyun } while(0)
46*4882a593Smuzhiyun 
47*4882a593Smuzhiyun 	/* Much care has gone into this code, do not touch it.
48*4882a593Smuzhiyun 	 *
49*4882a593Smuzhiyun 	 * We need to loadup regs l0/l1 for the newly forked child
50*4882a593Smuzhiyun 	 * case because the trap return path relies on those registers
51*4882a593Smuzhiyun 	 * holding certain values, gcc is told that they are clobbered.
52*4882a593Smuzhiyun 	 * Gcc needs registers for 3 values in and 1 value out, so we
53*4882a593Smuzhiyun 	 * clobber every non-fixed-usage register besides l2/l3/o4/o5.  -DaveM
54*4882a593Smuzhiyun 	 *
55*4882a593Smuzhiyun 	 * Hey Dave, that do not touch sign is too much of an incentive
56*4882a593Smuzhiyun 	 * - Anton & Pete
57*4882a593Smuzhiyun 	 */
58*4882a593Smuzhiyun #define switch_to(prev, next, last) do {						\
59*4882a593Smuzhiyun 	SWITCH_ENTER(prev);								\
60*4882a593Smuzhiyun 	SWITCH_DO_LAZY_FPU(next);							\
61*4882a593Smuzhiyun 	cpumask_set_cpu(smp_processor_id(), mm_cpumask(next->active_mm));		\
62*4882a593Smuzhiyun 	__asm__ __volatile__(								\
63*4882a593Smuzhiyun 	"sethi	%%hi(here - 0x8), %%o7\n\t"						\
64*4882a593Smuzhiyun 	"mov	%%g6, %%g3\n\t"								\
65*4882a593Smuzhiyun 	"or	%%o7, %%lo(here - 0x8), %%o7\n\t"					\
66*4882a593Smuzhiyun 	"rd	%%psr, %%g4\n\t"							\
67*4882a593Smuzhiyun 	"std	%%sp, [%%g6 + %4]\n\t"							\
68*4882a593Smuzhiyun 	"rd	%%wim, %%g5\n\t"							\
69*4882a593Smuzhiyun 	"wr	%%g4, 0x20, %%psr\n\t"							\
70*4882a593Smuzhiyun 	"nop\n\t"									\
71*4882a593Smuzhiyun 	"std	%%g4, [%%g6 + %3]\n\t"							\
72*4882a593Smuzhiyun 	"ldd	[%2 + %3], %%g4\n\t"							\
73*4882a593Smuzhiyun 	"mov	%2, %%g6\n\t"								\
74*4882a593Smuzhiyun 	".globl	patchme_store_new_current\n"						\
75*4882a593Smuzhiyun "patchme_store_new_current:\n\t"							\
76*4882a593Smuzhiyun 	"st	%2, [%1]\n\t"								\
77*4882a593Smuzhiyun 	"wr	%%g4, 0x20, %%psr\n\t"							\
78*4882a593Smuzhiyun 	"nop\n\t"									\
79*4882a593Smuzhiyun 	"nop\n\t"									\
80*4882a593Smuzhiyun 	"nop\n\t"	/* LEON needs all 3 nops: load to %sp depends on CWP. */		\
81*4882a593Smuzhiyun 	"ldd	[%%g6 + %4], %%sp\n\t"							\
82*4882a593Smuzhiyun 	"wr	%%g5, 0x0, %%wim\n\t"							\
83*4882a593Smuzhiyun 	"ldd	[%%sp + 0x00], %%l0\n\t"						\
84*4882a593Smuzhiyun 	"ldd	[%%sp + 0x38], %%i6\n\t"						\
85*4882a593Smuzhiyun 	"wr	%%g4, 0x0, %%psr\n\t"							\
86*4882a593Smuzhiyun 	"nop\n\t"									\
87*4882a593Smuzhiyun 	"nop\n\t"									\
88*4882a593Smuzhiyun 	"jmpl	%%o7 + 0x8, %%g0\n\t"							\
89*4882a593Smuzhiyun 	" ld	[%%g3 + %5], %0\n\t"							\
90*4882a593Smuzhiyun 	"here:\n"									\
91*4882a593Smuzhiyun         : "=&r" (last)									\
92*4882a593Smuzhiyun         : "r" (&(current_set[hard_smp_processor_id()])),	\
93*4882a593Smuzhiyun 	  "r" (task_thread_info(next)),				\
94*4882a593Smuzhiyun 	  "i" (TI_KPSR),					\
95*4882a593Smuzhiyun 	  "i" (TI_KSP),						\
96*4882a593Smuzhiyun 	  "i" (TI_TASK)						\
97*4882a593Smuzhiyun 	:       "g1", "g2", "g3", "g4", "g5",       "g7",	\
98*4882a593Smuzhiyun 	  "l0", "l1",       "l3", "l4", "l5", "l6", "l7",	\
99*4882a593Smuzhiyun 	  "i0", "i1", "i2", "i3", "i4", "i5",			\
100*4882a593Smuzhiyun 	  "o0", "o1", "o2", "o3",                   "o7");	\
101*4882a593Smuzhiyun 	} while(0)
102*4882a593Smuzhiyun 
103*4882a593Smuzhiyun void fpsave(unsigned long *fpregs, unsigned long *fsr,
104*4882a593Smuzhiyun 	    void *fpqueue, unsigned long *fpqdepth);
105*4882a593Smuzhiyun void synchronize_user_stack(void);
106*4882a593Smuzhiyun 
107*4882a593Smuzhiyun #endif /* __SPARC_SWITCH_TO_H */
108