xref: /OK3568_Linux_fs/kernel/arch/sparc/include/asm/mmu_context_64.h (revision 4882a59341e53eb6f0b4789bf948001014eff981)
1*4882a593Smuzhiyun /* SPDX-License-Identifier: GPL-2.0 */
2*4882a593Smuzhiyun #ifndef __SPARC64_MMU_CONTEXT_H
3*4882a593Smuzhiyun #define __SPARC64_MMU_CONTEXT_H
4*4882a593Smuzhiyun 
5*4882a593Smuzhiyun /* Derived heavily from Linus's Alpha/AXP ASN code... */
6*4882a593Smuzhiyun 
7*4882a593Smuzhiyun #ifndef __ASSEMBLY__
8*4882a593Smuzhiyun 
9*4882a593Smuzhiyun #include <linux/spinlock.h>
10*4882a593Smuzhiyun #include <linux/mm_types.h>
11*4882a593Smuzhiyun #include <linux/smp.h>
12*4882a593Smuzhiyun #include <linux/sched.h>
13*4882a593Smuzhiyun 
14*4882a593Smuzhiyun #include <asm/spitfire.h>
15*4882a593Smuzhiyun #include <asm/adi_64.h>
16*4882a593Smuzhiyun #include <asm-generic/mm_hooks.h>
17*4882a593Smuzhiyun #include <asm/percpu.h>
18*4882a593Smuzhiyun 
enter_lazy_tlb(struct mm_struct * mm,struct task_struct * tsk)19*4882a593Smuzhiyun static inline void enter_lazy_tlb(struct mm_struct *mm, struct task_struct *tsk)
20*4882a593Smuzhiyun {
21*4882a593Smuzhiyun }
22*4882a593Smuzhiyun 
23*4882a593Smuzhiyun extern spinlock_t ctx_alloc_lock;
24*4882a593Smuzhiyun extern unsigned long tlb_context_cache;
25*4882a593Smuzhiyun extern unsigned long mmu_context_bmap[];
26*4882a593Smuzhiyun 
27*4882a593Smuzhiyun DECLARE_PER_CPU(struct mm_struct *, per_cpu_secondary_mm);
28*4882a593Smuzhiyun void get_new_mmu_context(struct mm_struct *mm);
29*4882a593Smuzhiyun int init_new_context(struct task_struct *tsk, struct mm_struct *mm);
30*4882a593Smuzhiyun void destroy_context(struct mm_struct *mm);
31*4882a593Smuzhiyun 
32*4882a593Smuzhiyun void __tsb_context_switch(unsigned long pgd_pa,
33*4882a593Smuzhiyun 			  struct tsb_config *tsb_base,
34*4882a593Smuzhiyun 			  struct tsb_config *tsb_huge,
35*4882a593Smuzhiyun 			  unsigned long tsb_descr_pa,
36*4882a593Smuzhiyun 			  unsigned long secondary_ctx);
37*4882a593Smuzhiyun 
tsb_context_switch_ctx(struct mm_struct * mm,unsigned long ctx)38*4882a593Smuzhiyun static inline void tsb_context_switch_ctx(struct mm_struct *mm,
39*4882a593Smuzhiyun 					  unsigned long ctx)
40*4882a593Smuzhiyun {
41*4882a593Smuzhiyun 	__tsb_context_switch(__pa(mm->pgd),
42*4882a593Smuzhiyun 			     &mm->context.tsb_block[MM_TSB_BASE],
43*4882a593Smuzhiyun #if defined(CONFIG_HUGETLB_PAGE) || defined(CONFIG_TRANSPARENT_HUGEPAGE)
44*4882a593Smuzhiyun 			     (mm->context.tsb_block[MM_TSB_HUGE].tsb ?
45*4882a593Smuzhiyun 			      &mm->context.tsb_block[MM_TSB_HUGE] :
46*4882a593Smuzhiyun 			      NULL)
47*4882a593Smuzhiyun #else
48*4882a593Smuzhiyun 			     NULL
49*4882a593Smuzhiyun #endif
50*4882a593Smuzhiyun 			     , __pa(&mm->context.tsb_descr[MM_TSB_BASE]),
51*4882a593Smuzhiyun 			     ctx);
52*4882a593Smuzhiyun }
53*4882a593Smuzhiyun 
54*4882a593Smuzhiyun #define tsb_context_switch(X) tsb_context_switch_ctx(X, 0)
55*4882a593Smuzhiyun 
56*4882a593Smuzhiyun void tsb_grow(struct mm_struct *mm,
57*4882a593Smuzhiyun 	      unsigned long tsb_index,
58*4882a593Smuzhiyun 	      unsigned long mm_rss);
59*4882a593Smuzhiyun #ifdef CONFIG_SMP
60*4882a593Smuzhiyun void smp_tsb_sync(struct mm_struct *mm);
61*4882a593Smuzhiyun #else
62*4882a593Smuzhiyun #define smp_tsb_sync(__mm) do { } while (0)
63*4882a593Smuzhiyun #endif
64*4882a593Smuzhiyun 
65*4882a593Smuzhiyun /* Set MMU context in the actual hardware. */
66*4882a593Smuzhiyun #define load_secondary_context(__mm) \
67*4882a593Smuzhiyun 	__asm__ __volatile__( \
68*4882a593Smuzhiyun 	"\n661:	stxa		%0, [%1] %2\n" \
69*4882a593Smuzhiyun 	"	.section	.sun4v_1insn_patch, \"ax\"\n" \
70*4882a593Smuzhiyun 	"	.word		661b\n" \
71*4882a593Smuzhiyun 	"	stxa		%0, [%1] %3\n" \
72*4882a593Smuzhiyun 	"	.previous\n" \
73*4882a593Smuzhiyun 	"	flush		%%g6\n" \
74*4882a593Smuzhiyun 	: /* No outputs */ \
75*4882a593Smuzhiyun 	: "r" (CTX_HWBITS((__mm)->context)), \
76*4882a593Smuzhiyun 	  "r" (SECONDARY_CONTEXT), "i" (ASI_DMMU), "i" (ASI_MMU))
77*4882a593Smuzhiyun 
78*4882a593Smuzhiyun void __flush_tlb_mm(unsigned long, unsigned long);
79*4882a593Smuzhiyun 
80*4882a593Smuzhiyun /* Switch the current MM context. */
switch_mm(struct mm_struct * old_mm,struct mm_struct * mm,struct task_struct * tsk)81*4882a593Smuzhiyun static inline void switch_mm(struct mm_struct *old_mm, struct mm_struct *mm, struct task_struct *tsk)
82*4882a593Smuzhiyun {
83*4882a593Smuzhiyun 	unsigned long ctx_valid, flags;
84*4882a593Smuzhiyun 	int cpu = smp_processor_id();
85*4882a593Smuzhiyun 
86*4882a593Smuzhiyun 	per_cpu(per_cpu_secondary_mm, cpu) = mm;
87*4882a593Smuzhiyun 	if (unlikely(mm == &init_mm))
88*4882a593Smuzhiyun 		return;
89*4882a593Smuzhiyun 
90*4882a593Smuzhiyun 	spin_lock_irqsave(&mm->context.lock, flags);
91*4882a593Smuzhiyun 	ctx_valid = CTX_VALID(mm->context);
92*4882a593Smuzhiyun 	if (!ctx_valid)
93*4882a593Smuzhiyun 		get_new_mmu_context(mm);
94*4882a593Smuzhiyun 
95*4882a593Smuzhiyun 	/* We have to be extremely careful here or else we will miss
96*4882a593Smuzhiyun 	 * a TSB grow if we switch back and forth between a kernel
97*4882a593Smuzhiyun 	 * thread and an address space which has it's TSB size increased
98*4882a593Smuzhiyun 	 * on another processor.
99*4882a593Smuzhiyun 	 *
100*4882a593Smuzhiyun 	 * It is possible to play some games in order to optimize the
101*4882a593Smuzhiyun 	 * switch, but the safest thing to do is to unconditionally
102*4882a593Smuzhiyun 	 * perform the secondary context load and the TSB context switch.
103*4882a593Smuzhiyun 	 *
104*4882a593Smuzhiyun 	 * For reference the bad case is, for address space "A":
105*4882a593Smuzhiyun 	 *
106*4882a593Smuzhiyun 	 *		CPU 0			CPU 1
107*4882a593Smuzhiyun 	 *	run address space A
108*4882a593Smuzhiyun 	 *	set cpu0's bits in cpu_vm_mask
109*4882a593Smuzhiyun 	 *	switch to kernel thread, borrow
110*4882a593Smuzhiyun 	 *	address space A via entry_lazy_tlb
111*4882a593Smuzhiyun 	 *					run address space A
112*4882a593Smuzhiyun 	 *					set cpu1's bit in cpu_vm_mask
113*4882a593Smuzhiyun 	 *					flush_tlb_pending()
114*4882a593Smuzhiyun 	 *					reset cpu_vm_mask to just cpu1
115*4882a593Smuzhiyun 	 *					TSB grow
116*4882a593Smuzhiyun 	 *	run address space A
117*4882a593Smuzhiyun 	 *	context was valid, so skip
118*4882a593Smuzhiyun 	 *	TSB context switch
119*4882a593Smuzhiyun 	 *
120*4882a593Smuzhiyun 	 * At that point cpu0 continues to use a stale TSB, the one from
121*4882a593Smuzhiyun 	 * before the TSB grow performed on cpu1.  cpu1 did not cross-call
122*4882a593Smuzhiyun 	 * cpu0 to update it's TSB because at that point the cpu_vm_mask
123*4882a593Smuzhiyun 	 * only had cpu1 set in it.
124*4882a593Smuzhiyun 	 */
125*4882a593Smuzhiyun 	tsb_context_switch_ctx(mm, CTX_HWBITS(mm->context));
126*4882a593Smuzhiyun 
127*4882a593Smuzhiyun 	/* Any time a processor runs a context on an address space
128*4882a593Smuzhiyun 	 * for the first time, we must flush that context out of the
129*4882a593Smuzhiyun 	 * local TLB.
130*4882a593Smuzhiyun 	 */
131*4882a593Smuzhiyun 	if (!ctx_valid || !cpumask_test_cpu(cpu, mm_cpumask(mm))) {
132*4882a593Smuzhiyun 		cpumask_set_cpu(cpu, mm_cpumask(mm));
133*4882a593Smuzhiyun 		__flush_tlb_mm(CTX_HWBITS(mm->context),
134*4882a593Smuzhiyun 			       SECONDARY_CONTEXT);
135*4882a593Smuzhiyun 	}
136*4882a593Smuzhiyun 	spin_unlock_irqrestore(&mm->context.lock, flags);
137*4882a593Smuzhiyun }
138*4882a593Smuzhiyun 
139*4882a593Smuzhiyun #define deactivate_mm(tsk,mm)	do { } while (0)
140*4882a593Smuzhiyun #define activate_mm(active_mm, mm) switch_mm(active_mm, mm, NULL)
141*4882a593Smuzhiyun 
142*4882a593Smuzhiyun #define  __HAVE_ARCH_START_CONTEXT_SWITCH
arch_start_context_switch(struct task_struct * prev)143*4882a593Smuzhiyun static inline void arch_start_context_switch(struct task_struct *prev)
144*4882a593Smuzhiyun {
145*4882a593Smuzhiyun 	/* Save the current state of MCDPER register for the process
146*4882a593Smuzhiyun 	 * we are switching from
147*4882a593Smuzhiyun 	 */
148*4882a593Smuzhiyun 	if (adi_capable()) {
149*4882a593Smuzhiyun 		register unsigned long tmp_mcdper;
150*4882a593Smuzhiyun 
151*4882a593Smuzhiyun 		__asm__ __volatile__(
152*4882a593Smuzhiyun 			".word 0x83438000\n\t"	/* rd  %mcdper, %g1 */
153*4882a593Smuzhiyun 			"mov %%g1, %0\n\t"
154*4882a593Smuzhiyun 			: "=r" (tmp_mcdper)
155*4882a593Smuzhiyun 			:
156*4882a593Smuzhiyun 			: "g1");
157*4882a593Smuzhiyun 		if (tmp_mcdper)
158*4882a593Smuzhiyun 			set_tsk_thread_flag(prev, TIF_MCDPER);
159*4882a593Smuzhiyun 		else
160*4882a593Smuzhiyun 			clear_tsk_thread_flag(prev, TIF_MCDPER);
161*4882a593Smuzhiyun 	}
162*4882a593Smuzhiyun }
163*4882a593Smuzhiyun 
164*4882a593Smuzhiyun #define finish_arch_post_lock_switch	finish_arch_post_lock_switch
finish_arch_post_lock_switch(void)165*4882a593Smuzhiyun static inline void finish_arch_post_lock_switch(void)
166*4882a593Smuzhiyun {
167*4882a593Smuzhiyun 	/* Restore the state of MCDPER register for the new process
168*4882a593Smuzhiyun 	 * just switched to.
169*4882a593Smuzhiyun 	 */
170*4882a593Smuzhiyun 	if (adi_capable()) {
171*4882a593Smuzhiyun 		register unsigned long tmp_mcdper;
172*4882a593Smuzhiyun 
173*4882a593Smuzhiyun 		tmp_mcdper = test_thread_flag(TIF_MCDPER);
174*4882a593Smuzhiyun 		__asm__ __volatile__(
175*4882a593Smuzhiyun 			"mov %0, %%g1\n\t"
176*4882a593Smuzhiyun 			".word 0x9d800001\n\t"	/* wr %g0, %g1, %mcdper" */
177*4882a593Smuzhiyun 			".word 0xaf902001\n\t"	/* wrpr %g0, 1, %pmcdper */
178*4882a593Smuzhiyun 			:
179*4882a593Smuzhiyun 			: "ir" (tmp_mcdper)
180*4882a593Smuzhiyun 			: "g1");
181*4882a593Smuzhiyun 		if (current && current->mm && current->mm->context.adi) {
182*4882a593Smuzhiyun 			struct pt_regs *regs;
183*4882a593Smuzhiyun 
184*4882a593Smuzhiyun 			regs = task_pt_regs(current);
185*4882a593Smuzhiyun 			regs->tstate |= TSTATE_MCDE;
186*4882a593Smuzhiyun 		}
187*4882a593Smuzhiyun 	}
188*4882a593Smuzhiyun }
189*4882a593Smuzhiyun 
190*4882a593Smuzhiyun #endif /* !(__ASSEMBLY__) */
191*4882a593Smuzhiyun 
192*4882a593Smuzhiyun #endif /* !(__SPARC64_MMU_CONTEXT_H) */
193