1*4882a593Smuzhiyun /* SPDX-License-Identifier: GPL-2.0 */
2*4882a593Smuzhiyun #ifndef __SPARC64_MMU_CONTEXT_H
3*4882a593Smuzhiyun #define __SPARC64_MMU_CONTEXT_H
4*4882a593Smuzhiyun
5*4882a593Smuzhiyun /* Derived heavily from Linus's Alpha/AXP ASN code... */
6*4882a593Smuzhiyun
7*4882a593Smuzhiyun #ifndef __ASSEMBLY__
8*4882a593Smuzhiyun
9*4882a593Smuzhiyun #include <linux/spinlock.h>
10*4882a593Smuzhiyun #include <linux/mm_types.h>
11*4882a593Smuzhiyun #include <linux/smp.h>
12*4882a593Smuzhiyun #include <linux/sched.h>
13*4882a593Smuzhiyun
14*4882a593Smuzhiyun #include <asm/spitfire.h>
15*4882a593Smuzhiyun #include <asm/adi_64.h>
16*4882a593Smuzhiyun #include <asm-generic/mm_hooks.h>
17*4882a593Smuzhiyun #include <asm/percpu.h>
18*4882a593Smuzhiyun
enter_lazy_tlb(struct mm_struct * mm,struct task_struct * tsk)19*4882a593Smuzhiyun static inline void enter_lazy_tlb(struct mm_struct *mm, struct task_struct *tsk)
20*4882a593Smuzhiyun {
21*4882a593Smuzhiyun }
22*4882a593Smuzhiyun
23*4882a593Smuzhiyun extern spinlock_t ctx_alloc_lock;
24*4882a593Smuzhiyun extern unsigned long tlb_context_cache;
25*4882a593Smuzhiyun extern unsigned long mmu_context_bmap[];
26*4882a593Smuzhiyun
27*4882a593Smuzhiyun DECLARE_PER_CPU(struct mm_struct *, per_cpu_secondary_mm);
28*4882a593Smuzhiyun void get_new_mmu_context(struct mm_struct *mm);
29*4882a593Smuzhiyun int init_new_context(struct task_struct *tsk, struct mm_struct *mm);
30*4882a593Smuzhiyun void destroy_context(struct mm_struct *mm);
31*4882a593Smuzhiyun
32*4882a593Smuzhiyun void __tsb_context_switch(unsigned long pgd_pa,
33*4882a593Smuzhiyun struct tsb_config *tsb_base,
34*4882a593Smuzhiyun struct tsb_config *tsb_huge,
35*4882a593Smuzhiyun unsigned long tsb_descr_pa,
36*4882a593Smuzhiyun unsigned long secondary_ctx);
37*4882a593Smuzhiyun
tsb_context_switch_ctx(struct mm_struct * mm,unsigned long ctx)38*4882a593Smuzhiyun static inline void tsb_context_switch_ctx(struct mm_struct *mm,
39*4882a593Smuzhiyun unsigned long ctx)
40*4882a593Smuzhiyun {
41*4882a593Smuzhiyun __tsb_context_switch(__pa(mm->pgd),
42*4882a593Smuzhiyun &mm->context.tsb_block[MM_TSB_BASE],
43*4882a593Smuzhiyun #if defined(CONFIG_HUGETLB_PAGE) || defined(CONFIG_TRANSPARENT_HUGEPAGE)
44*4882a593Smuzhiyun (mm->context.tsb_block[MM_TSB_HUGE].tsb ?
45*4882a593Smuzhiyun &mm->context.tsb_block[MM_TSB_HUGE] :
46*4882a593Smuzhiyun NULL)
47*4882a593Smuzhiyun #else
48*4882a593Smuzhiyun NULL
49*4882a593Smuzhiyun #endif
50*4882a593Smuzhiyun , __pa(&mm->context.tsb_descr[MM_TSB_BASE]),
51*4882a593Smuzhiyun ctx);
52*4882a593Smuzhiyun }
53*4882a593Smuzhiyun
54*4882a593Smuzhiyun #define tsb_context_switch(X) tsb_context_switch_ctx(X, 0)
55*4882a593Smuzhiyun
56*4882a593Smuzhiyun void tsb_grow(struct mm_struct *mm,
57*4882a593Smuzhiyun unsigned long tsb_index,
58*4882a593Smuzhiyun unsigned long mm_rss);
59*4882a593Smuzhiyun #ifdef CONFIG_SMP
60*4882a593Smuzhiyun void smp_tsb_sync(struct mm_struct *mm);
61*4882a593Smuzhiyun #else
62*4882a593Smuzhiyun #define smp_tsb_sync(__mm) do { } while (0)
63*4882a593Smuzhiyun #endif
64*4882a593Smuzhiyun
65*4882a593Smuzhiyun /* Set MMU context in the actual hardware. */
66*4882a593Smuzhiyun #define load_secondary_context(__mm) \
67*4882a593Smuzhiyun __asm__ __volatile__( \
68*4882a593Smuzhiyun "\n661: stxa %0, [%1] %2\n" \
69*4882a593Smuzhiyun " .section .sun4v_1insn_patch, \"ax\"\n" \
70*4882a593Smuzhiyun " .word 661b\n" \
71*4882a593Smuzhiyun " stxa %0, [%1] %3\n" \
72*4882a593Smuzhiyun " .previous\n" \
73*4882a593Smuzhiyun " flush %%g6\n" \
74*4882a593Smuzhiyun : /* No outputs */ \
75*4882a593Smuzhiyun : "r" (CTX_HWBITS((__mm)->context)), \
76*4882a593Smuzhiyun "r" (SECONDARY_CONTEXT), "i" (ASI_DMMU), "i" (ASI_MMU))
77*4882a593Smuzhiyun
78*4882a593Smuzhiyun void __flush_tlb_mm(unsigned long, unsigned long);
79*4882a593Smuzhiyun
80*4882a593Smuzhiyun /* Switch the current MM context. */
switch_mm(struct mm_struct * old_mm,struct mm_struct * mm,struct task_struct * tsk)81*4882a593Smuzhiyun static inline void switch_mm(struct mm_struct *old_mm, struct mm_struct *mm, struct task_struct *tsk)
82*4882a593Smuzhiyun {
83*4882a593Smuzhiyun unsigned long ctx_valid, flags;
84*4882a593Smuzhiyun int cpu = smp_processor_id();
85*4882a593Smuzhiyun
86*4882a593Smuzhiyun per_cpu(per_cpu_secondary_mm, cpu) = mm;
87*4882a593Smuzhiyun if (unlikely(mm == &init_mm))
88*4882a593Smuzhiyun return;
89*4882a593Smuzhiyun
90*4882a593Smuzhiyun spin_lock_irqsave(&mm->context.lock, flags);
91*4882a593Smuzhiyun ctx_valid = CTX_VALID(mm->context);
92*4882a593Smuzhiyun if (!ctx_valid)
93*4882a593Smuzhiyun get_new_mmu_context(mm);
94*4882a593Smuzhiyun
95*4882a593Smuzhiyun /* We have to be extremely careful here or else we will miss
96*4882a593Smuzhiyun * a TSB grow if we switch back and forth between a kernel
97*4882a593Smuzhiyun * thread and an address space which has it's TSB size increased
98*4882a593Smuzhiyun * on another processor.
99*4882a593Smuzhiyun *
100*4882a593Smuzhiyun * It is possible to play some games in order to optimize the
101*4882a593Smuzhiyun * switch, but the safest thing to do is to unconditionally
102*4882a593Smuzhiyun * perform the secondary context load and the TSB context switch.
103*4882a593Smuzhiyun *
104*4882a593Smuzhiyun * For reference the bad case is, for address space "A":
105*4882a593Smuzhiyun *
106*4882a593Smuzhiyun * CPU 0 CPU 1
107*4882a593Smuzhiyun * run address space A
108*4882a593Smuzhiyun * set cpu0's bits in cpu_vm_mask
109*4882a593Smuzhiyun * switch to kernel thread, borrow
110*4882a593Smuzhiyun * address space A via entry_lazy_tlb
111*4882a593Smuzhiyun * run address space A
112*4882a593Smuzhiyun * set cpu1's bit in cpu_vm_mask
113*4882a593Smuzhiyun * flush_tlb_pending()
114*4882a593Smuzhiyun * reset cpu_vm_mask to just cpu1
115*4882a593Smuzhiyun * TSB grow
116*4882a593Smuzhiyun * run address space A
117*4882a593Smuzhiyun * context was valid, so skip
118*4882a593Smuzhiyun * TSB context switch
119*4882a593Smuzhiyun *
120*4882a593Smuzhiyun * At that point cpu0 continues to use a stale TSB, the one from
121*4882a593Smuzhiyun * before the TSB grow performed on cpu1. cpu1 did not cross-call
122*4882a593Smuzhiyun * cpu0 to update it's TSB because at that point the cpu_vm_mask
123*4882a593Smuzhiyun * only had cpu1 set in it.
124*4882a593Smuzhiyun */
125*4882a593Smuzhiyun tsb_context_switch_ctx(mm, CTX_HWBITS(mm->context));
126*4882a593Smuzhiyun
127*4882a593Smuzhiyun /* Any time a processor runs a context on an address space
128*4882a593Smuzhiyun * for the first time, we must flush that context out of the
129*4882a593Smuzhiyun * local TLB.
130*4882a593Smuzhiyun */
131*4882a593Smuzhiyun if (!ctx_valid || !cpumask_test_cpu(cpu, mm_cpumask(mm))) {
132*4882a593Smuzhiyun cpumask_set_cpu(cpu, mm_cpumask(mm));
133*4882a593Smuzhiyun __flush_tlb_mm(CTX_HWBITS(mm->context),
134*4882a593Smuzhiyun SECONDARY_CONTEXT);
135*4882a593Smuzhiyun }
136*4882a593Smuzhiyun spin_unlock_irqrestore(&mm->context.lock, flags);
137*4882a593Smuzhiyun }
138*4882a593Smuzhiyun
139*4882a593Smuzhiyun #define deactivate_mm(tsk,mm) do { } while (0)
140*4882a593Smuzhiyun #define activate_mm(active_mm, mm) switch_mm(active_mm, mm, NULL)
141*4882a593Smuzhiyun
142*4882a593Smuzhiyun #define __HAVE_ARCH_START_CONTEXT_SWITCH
arch_start_context_switch(struct task_struct * prev)143*4882a593Smuzhiyun static inline void arch_start_context_switch(struct task_struct *prev)
144*4882a593Smuzhiyun {
145*4882a593Smuzhiyun /* Save the current state of MCDPER register for the process
146*4882a593Smuzhiyun * we are switching from
147*4882a593Smuzhiyun */
148*4882a593Smuzhiyun if (adi_capable()) {
149*4882a593Smuzhiyun register unsigned long tmp_mcdper;
150*4882a593Smuzhiyun
151*4882a593Smuzhiyun __asm__ __volatile__(
152*4882a593Smuzhiyun ".word 0x83438000\n\t" /* rd %mcdper, %g1 */
153*4882a593Smuzhiyun "mov %%g1, %0\n\t"
154*4882a593Smuzhiyun : "=r" (tmp_mcdper)
155*4882a593Smuzhiyun :
156*4882a593Smuzhiyun : "g1");
157*4882a593Smuzhiyun if (tmp_mcdper)
158*4882a593Smuzhiyun set_tsk_thread_flag(prev, TIF_MCDPER);
159*4882a593Smuzhiyun else
160*4882a593Smuzhiyun clear_tsk_thread_flag(prev, TIF_MCDPER);
161*4882a593Smuzhiyun }
162*4882a593Smuzhiyun }
163*4882a593Smuzhiyun
164*4882a593Smuzhiyun #define finish_arch_post_lock_switch finish_arch_post_lock_switch
finish_arch_post_lock_switch(void)165*4882a593Smuzhiyun static inline void finish_arch_post_lock_switch(void)
166*4882a593Smuzhiyun {
167*4882a593Smuzhiyun /* Restore the state of MCDPER register for the new process
168*4882a593Smuzhiyun * just switched to.
169*4882a593Smuzhiyun */
170*4882a593Smuzhiyun if (adi_capable()) {
171*4882a593Smuzhiyun register unsigned long tmp_mcdper;
172*4882a593Smuzhiyun
173*4882a593Smuzhiyun tmp_mcdper = test_thread_flag(TIF_MCDPER);
174*4882a593Smuzhiyun __asm__ __volatile__(
175*4882a593Smuzhiyun "mov %0, %%g1\n\t"
176*4882a593Smuzhiyun ".word 0x9d800001\n\t" /* wr %g0, %g1, %mcdper" */
177*4882a593Smuzhiyun ".word 0xaf902001\n\t" /* wrpr %g0, 1, %pmcdper */
178*4882a593Smuzhiyun :
179*4882a593Smuzhiyun : "ir" (tmp_mcdper)
180*4882a593Smuzhiyun : "g1");
181*4882a593Smuzhiyun if (current && current->mm && current->mm->context.adi) {
182*4882a593Smuzhiyun struct pt_regs *regs;
183*4882a593Smuzhiyun
184*4882a593Smuzhiyun regs = task_pt_regs(current);
185*4882a593Smuzhiyun regs->tstate |= TSTATE_MCDE;
186*4882a593Smuzhiyun }
187*4882a593Smuzhiyun }
188*4882a593Smuzhiyun }
189*4882a593Smuzhiyun
190*4882a593Smuzhiyun #endif /* !(__ASSEMBLY__) */
191*4882a593Smuzhiyun
192*4882a593Smuzhiyun #endif /* !(__SPARC64_MMU_CONTEXT_H) */
193