1*4882a593Smuzhiyun // SPDX-License-Identifier: GPL-2.0-or-later
2*4882a593Smuzhiyun /*
3*4882a593Smuzhiyun * TLB flush routines for radix kernels.
4*4882a593Smuzhiyun *
5*4882a593Smuzhiyun * Copyright 2015-2016, Aneesh Kumar K.V, IBM Corporation.
6*4882a593Smuzhiyun */
7*4882a593Smuzhiyun
8*4882a593Smuzhiyun #include <linux/mm.h>
9*4882a593Smuzhiyun #include <linux/hugetlb.h>
10*4882a593Smuzhiyun #include <linux/memblock.h>
11*4882a593Smuzhiyun #include <linux/mmu_context.h>
12*4882a593Smuzhiyun #include <linux/sched/mm.h>
13*4882a593Smuzhiyun
14*4882a593Smuzhiyun #include <asm/ppc-opcode.h>
15*4882a593Smuzhiyun #include <asm/tlb.h>
16*4882a593Smuzhiyun #include <asm/tlbflush.h>
17*4882a593Smuzhiyun #include <asm/trace.h>
18*4882a593Smuzhiyun #include <asm/cputhreads.h>
19*4882a593Smuzhiyun #include <asm/plpar_wrappers.h>
20*4882a593Smuzhiyun
21*4882a593Smuzhiyun #define RIC_FLUSH_TLB 0
22*4882a593Smuzhiyun #define RIC_FLUSH_PWC 1
23*4882a593Smuzhiyun #define RIC_FLUSH_ALL 2
24*4882a593Smuzhiyun
25*4882a593Smuzhiyun /*
26*4882a593Smuzhiyun * tlbiel instruction for radix, set invalidation
27*4882a593Smuzhiyun * i.e., r=1 and is=01 or is=10 or is=11
28*4882a593Smuzhiyun */
tlbiel_radix_set_isa300(unsigned int set,unsigned int is,unsigned int pid,unsigned int ric,unsigned int prs)29*4882a593Smuzhiyun static __always_inline void tlbiel_radix_set_isa300(unsigned int set, unsigned int is,
30*4882a593Smuzhiyun unsigned int pid,
31*4882a593Smuzhiyun unsigned int ric, unsigned int prs)
32*4882a593Smuzhiyun {
33*4882a593Smuzhiyun unsigned long rb;
34*4882a593Smuzhiyun unsigned long rs;
35*4882a593Smuzhiyun
36*4882a593Smuzhiyun rb = (set << PPC_BITLSHIFT(51)) | (is << PPC_BITLSHIFT(53));
37*4882a593Smuzhiyun rs = ((unsigned long)pid << PPC_BITLSHIFT(31));
38*4882a593Smuzhiyun
39*4882a593Smuzhiyun asm volatile(PPC_TLBIEL(%0, %1, %2, %3, 1)
40*4882a593Smuzhiyun : : "r"(rb), "r"(rs), "i"(ric), "i"(prs)
41*4882a593Smuzhiyun : "memory");
42*4882a593Smuzhiyun }
43*4882a593Smuzhiyun
tlbiel_all_isa300(unsigned int num_sets,unsigned int is)44*4882a593Smuzhiyun static void tlbiel_all_isa300(unsigned int num_sets, unsigned int is)
45*4882a593Smuzhiyun {
46*4882a593Smuzhiyun unsigned int set;
47*4882a593Smuzhiyun
48*4882a593Smuzhiyun asm volatile("ptesync": : :"memory");
49*4882a593Smuzhiyun
50*4882a593Smuzhiyun /*
51*4882a593Smuzhiyun * Flush the first set of the TLB, and the entire Page Walk Cache
52*4882a593Smuzhiyun * and partition table entries. Then flush the remaining sets of the
53*4882a593Smuzhiyun * TLB.
54*4882a593Smuzhiyun */
55*4882a593Smuzhiyun
56*4882a593Smuzhiyun if (early_cpu_has_feature(CPU_FTR_HVMODE)) {
57*4882a593Smuzhiyun /* MSR[HV] should flush partition scope translations first. */
58*4882a593Smuzhiyun tlbiel_radix_set_isa300(0, is, 0, RIC_FLUSH_ALL, 0);
59*4882a593Smuzhiyun for (set = 1; set < num_sets; set++)
60*4882a593Smuzhiyun tlbiel_radix_set_isa300(set, is, 0, RIC_FLUSH_TLB, 0);
61*4882a593Smuzhiyun }
62*4882a593Smuzhiyun
63*4882a593Smuzhiyun /* Flush process scoped entries. */
64*4882a593Smuzhiyun tlbiel_radix_set_isa300(0, is, 0, RIC_FLUSH_ALL, 1);
65*4882a593Smuzhiyun for (set = 1; set < num_sets; set++)
66*4882a593Smuzhiyun tlbiel_radix_set_isa300(set, is, 0, RIC_FLUSH_TLB, 1);
67*4882a593Smuzhiyun
68*4882a593Smuzhiyun ppc_after_tlbiel_barrier();
69*4882a593Smuzhiyun }
70*4882a593Smuzhiyun
radix__tlbiel_all(unsigned int action)71*4882a593Smuzhiyun void radix__tlbiel_all(unsigned int action)
72*4882a593Smuzhiyun {
73*4882a593Smuzhiyun unsigned int is;
74*4882a593Smuzhiyun
75*4882a593Smuzhiyun switch (action) {
76*4882a593Smuzhiyun case TLB_INVAL_SCOPE_GLOBAL:
77*4882a593Smuzhiyun is = 3;
78*4882a593Smuzhiyun break;
79*4882a593Smuzhiyun case TLB_INVAL_SCOPE_LPID:
80*4882a593Smuzhiyun is = 2;
81*4882a593Smuzhiyun break;
82*4882a593Smuzhiyun default:
83*4882a593Smuzhiyun BUG();
84*4882a593Smuzhiyun }
85*4882a593Smuzhiyun
86*4882a593Smuzhiyun if (early_cpu_has_feature(CPU_FTR_ARCH_300))
87*4882a593Smuzhiyun tlbiel_all_isa300(POWER9_TLB_SETS_RADIX, is);
88*4882a593Smuzhiyun else
89*4882a593Smuzhiyun WARN(1, "%s called on pre-POWER9 CPU\n", __func__);
90*4882a593Smuzhiyun
91*4882a593Smuzhiyun asm volatile(PPC_ISA_3_0_INVALIDATE_ERAT "; isync" : : :"memory");
92*4882a593Smuzhiyun }
93*4882a593Smuzhiyun
__tlbiel_pid(unsigned long pid,int set,unsigned long ric)94*4882a593Smuzhiyun static __always_inline void __tlbiel_pid(unsigned long pid, int set,
95*4882a593Smuzhiyun unsigned long ric)
96*4882a593Smuzhiyun {
97*4882a593Smuzhiyun unsigned long rb,rs,prs,r;
98*4882a593Smuzhiyun
99*4882a593Smuzhiyun rb = PPC_BIT(53); /* IS = 1 */
100*4882a593Smuzhiyun rb |= set << PPC_BITLSHIFT(51);
101*4882a593Smuzhiyun rs = ((unsigned long)pid) << PPC_BITLSHIFT(31);
102*4882a593Smuzhiyun prs = 1; /* process scoped */
103*4882a593Smuzhiyun r = 1; /* radix format */
104*4882a593Smuzhiyun
105*4882a593Smuzhiyun asm volatile(PPC_TLBIEL(%0, %4, %3, %2, %1)
106*4882a593Smuzhiyun : : "r"(rb), "i"(r), "i"(prs), "i"(ric), "r"(rs) : "memory");
107*4882a593Smuzhiyun trace_tlbie(0, 1, rb, rs, ric, prs, r);
108*4882a593Smuzhiyun }
109*4882a593Smuzhiyun
__tlbie_pid(unsigned long pid,unsigned long ric)110*4882a593Smuzhiyun static __always_inline void __tlbie_pid(unsigned long pid, unsigned long ric)
111*4882a593Smuzhiyun {
112*4882a593Smuzhiyun unsigned long rb,rs,prs,r;
113*4882a593Smuzhiyun
114*4882a593Smuzhiyun rb = PPC_BIT(53); /* IS = 1 */
115*4882a593Smuzhiyun rs = pid << PPC_BITLSHIFT(31);
116*4882a593Smuzhiyun prs = 1; /* process scoped */
117*4882a593Smuzhiyun r = 1; /* radix format */
118*4882a593Smuzhiyun
119*4882a593Smuzhiyun asm volatile(PPC_TLBIE_5(%0, %4, %3, %2, %1)
120*4882a593Smuzhiyun : : "r"(rb), "i"(r), "i"(prs), "i"(ric), "r"(rs) : "memory");
121*4882a593Smuzhiyun trace_tlbie(0, 0, rb, rs, ric, prs, r);
122*4882a593Smuzhiyun }
123*4882a593Smuzhiyun
__tlbie_lpid(unsigned long lpid,unsigned long ric)124*4882a593Smuzhiyun static __always_inline void __tlbie_lpid(unsigned long lpid, unsigned long ric)
125*4882a593Smuzhiyun {
126*4882a593Smuzhiyun unsigned long rb,rs,prs,r;
127*4882a593Smuzhiyun
128*4882a593Smuzhiyun rb = PPC_BIT(52); /* IS = 2 */
129*4882a593Smuzhiyun rs = lpid;
130*4882a593Smuzhiyun prs = 0; /* partition scoped */
131*4882a593Smuzhiyun r = 1; /* radix format */
132*4882a593Smuzhiyun
133*4882a593Smuzhiyun asm volatile(PPC_TLBIE_5(%0, %4, %3, %2, %1)
134*4882a593Smuzhiyun : : "r"(rb), "i"(r), "i"(prs), "i"(ric), "r"(rs) : "memory");
135*4882a593Smuzhiyun trace_tlbie(lpid, 0, rb, rs, ric, prs, r);
136*4882a593Smuzhiyun }
137*4882a593Smuzhiyun
__tlbie_lpid_guest(unsigned long lpid,unsigned long ric)138*4882a593Smuzhiyun static __always_inline void __tlbie_lpid_guest(unsigned long lpid, unsigned long ric)
139*4882a593Smuzhiyun {
140*4882a593Smuzhiyun unsigned long rb,rs,prs,r;
141*4882a593Smuzhiyun
142*4882a593Smuzhiyun rb = PPC_BIT(52); /* IS = 2 */
143*4882a593Smuzhiyun rs = lpid;
144*4882a593Smuzhiyun prs = 1; /* process scoped */
145*4882a593Smuzhiyun r = 1; /* radix format */
146*4882a593Smuzhiyun
147*4882a593Smuzhiyun asm volatile(PPC_TLBIE_5(%0, %4, %3, %2, %1)
148*4882a593Smuzhiyun : : "r"(rb), "i"(r), "i"(prs), "i"(ric), "r"(rs) : "memory");
149*4882a593Smuzhiyun trace_tlbie(lpid, 0, rb, rs, ric, prs, r);
150*4882a593Smuzhiyun }
151*4882a593Smuzhiyun
__tlbiel_va(unsigned long va,unsigned long pid,unsigned long ap,unsigned long ric)152*4882a593Smuzhiyun static __always_inline void __tlbiel_va(unsigned long va, unsigned long pid,
153*4882a593Smuzhiyun unsigned long ap, unsigned long ric)
154*4882a593Smuzhiyun {
155*4882a593Smuzhiyun unsigned long rb,rs,prs,r;
156*4882a593Smuzhiyun
157*4882a593Smuzhiyun rb = va & ~(PPC_BITMASK(52, 63));
158*4882a593Smuzhiyun rb |= ap << PPC_BITLSHIFT(58);
159*4882a593Smuzhiyun rs = pid << PPC_BITLSHIFT(31);
160*4882a593Smuzhiyun prs = 1; /* process scoped */
161*4882a593Smuzhiyun r = 1; /* radix format */
162*4882a593Smuzhiyun
163*4882a593Smuzhiyun asm volatile(PPC_TLBIEL(%0, %4, %3, %2, %1)
164*4882a593Smuzhiyun : : "r"(rb), "i"(r), "i"(prs), "i"(ric), "r"(rs) : "memory");
165*4882a593Smuzhiyun trace_tlbie(0, 1, rb, rs, ric, prs, r);
166*4882a593Smuzhiyun }
167*4882a593Smuzhiyun
__tlbie_va(unsigned long va,unsigned long pid,unsigned long ap,unsigned long ric)168*4882a593Smuzhiyun static __always_inline void __tlbie_va(unsigned long va, unsigned long pid,
169*4882a593Smuzhiyun unsigned long ap, unsigned long ric)
170*4882a593Smuzhiyun {
171*4882a593Smuzhiyun unsigned long rb,rs,prs,r;
172*4882a593Smuzhiyun
173*4882a593Smuzhiyun rb = va & ~(PPC_BITMASK(52, 63));
174*4882a593Smuzhiyun rb |= ap << PPC_BITLSHIFT(58);
175*4882a593Smuzhiyun rs = pid << PPC_BITLSHIFT(31);
176*4882a593Smuzhiyun prs = 1; /* process scoped */
177*4882a593Smuzhiyun r = 1; /* radix format */
178*4882a593Smuzhiyun
179*4882a593Smuzhiyun asm volatile(PPC_TLBIE_5(%0, %4, %3, %2, %1)
180*4882a593Smuzhiyun : : "r"(rb), "i"(r), "i"(prs), "i"(ric), "r"(rs) : "memory");
181*4882a593Smuzhiyun trace_tlbie(0, 0, rb, rs, ric, prs, r);
182*4882a593Smuzhiyun }
183*4882a593Smuzhiyun
__tlbie_lpid_va(unsigned long va,unsigned long lpid,unsigned long ap,unsigned long ric)184*4882a593Smuzhiyun static __always_inline void __tlbie_lpid_va(unsigned long va, unsigned long lpid,
185*4882a593Smuzhiyun unsigned long ap, unsigned long ric)
186*4882a593Smuzhiyun {
187*4882a593Smuzhiyun unsigned long rb,rs,prs,r;
188*4882a593Smuzhiyun
189*4882a593Smuzhiyun rb = va & ~(PPC_BITMASK(52, 63));
190*4882a593Smuzhiyun rb |= ap << PPC_BITLSHIFT(58);
191*4882a593Smuzhiyun rs = lpid;
192*4882a593Smuzhiyun prs = 0; /* partition scoped */
193*4882a593Smuzhiyun r = 1; /* radix format */
194*4882a593Smuzhiyun
195*4882a593Smuzhiyun asm volatile(PPC_TLBIE_5(%0, %4, %3, %2, %1)
196*4882a593Smuzhiyun : : "r"(rb), "i"(r), "i"(prs), "i"(ric), "r"(rs) : "memory");
197*4882a593Smuzhiyun trace_tlbie(lpid, 0, rb, rs, ric, prs, r);
198*4882a593Smuzhiyun }
199*4882a593Smuzhiyun
200*4882a593Smuzhiyun
fixup_tlbie_va(unsigned long va,unsigned long pid,unsigned long ap)201*4882a593Smuzhiyun static inline void fixup_tlbie_va(unsigned long va, unsigned long pid,
202*4882a593Smuzhiyun unsigned long ap)
203*4882a593Smuzhiyun {
204*4882a593Smuzhiyun if (cpu_has_feature(CPU_FTR_P9_TLBIE_ERAT_BUG)) {
205*4882a593Smuzhiyun asm volatile("ptesync": : :"memory");
206*4882a593Smuzhiyun __tlbie_va(va, 0, ap, RIC_FLUSH_TLB);
207*4882a593Smuzhiyun }
208*4882a593Smuzhiyun
209*4882a593Smuzhiyun if (cpu_has_feature(CPU_FTR_P9_TLBIE_STQ_BUG)) {
210*4882a593Smuzhiyun asm volatile("ptesync": : :"memory");
211*4882a593Smuzhiyun __tlbie_va(va, pid, ap, RIC_FLUSH_TLB);
212*4882a593Smuzhiyun }
213*4882a593Smuzhiyun }
214*4882a593Smuzhiyun
fixup_tlbie_va_range(unsigned long va,unsigned long pid,unsigned long ap)215*4882a593Smuzhiyun static inline void fixup_tlbie_va_range(unsigned long va, unsigned long pid,
216*4882a593Smuzhiyun unsigned long ap)
217*4882a593Smuzhiyun {
218*4882a593Smuzhiyun if (cpu_has_feature(CPU_FTR_P9_TLBIE_ERAT_BUG)) {
219*4882a593Smuzhiyun asm volatile("ptesync": : :"memory");
220*4882a593Smuzhiyun __tlbie_pid(0, RIC_FLUSH_TLB);
221*4882a593Smuzhiyun }
222*4882a593Smuzhiyun
223*4882a593Smuzhiyun if (cpu_has_feature(CPU_FTR_P9_TLBIE_STQ_BUG)) {
224*4882a593Smuzhiyun asm volatile("ptesync": : :"memory");
225*4882a593Smuzhiyun __tlbie_va(va, pid, ap, RIC_FLUSH_TLB);
226*4882a593Smuzhiyun }
227*4882a593Smuzhiyun }
228*4882a593Smuzhiyun
fixup_tlbie_pid(unsigned long pid)229*4882a593Smuzhiyun static inline void fixup_tlbie_pid(unsigned long pid)
230*4882a593Smuzhiyun {
231*4882a593Smuzhiyun /*
232*4882a593Smuzhiyun * We can use any address for the invalidation, pick one which is
233*4882a593Smuzhiyun * probably unused as an optimisation.
234*4882a593Smuzhiyun */
235*4882a593Smuzhiyun unsigned long va = ((1UL << 52) - 1);
236*4882a593Smuzhiyun
237*4882a593Smuzhiyun if (cpu_has_feature(CPU_FTR_P9_TLBIE_ERAT_BUG)) {
238*4882a593Smuzhiyun asm volatile("ptesync": : :"memory");
239*4882a593Smuzhiyun __tlbie_pid(0, RIC_FLUSH_TLB);
240*4882a593Smuzhiyun }
241*4882a593Smuzhiyun
242*4882a593Smuzhiyun if (cpu_has_feature(CPU_FTR_P9_TLBIE_STQ_BUG)) {
243*4882a593Smuzhiyun asm volatile("ptesync": : :"memory");
244*4882a593Smuzhiyun __tlbie_va(va, pid, mmu_get_ap(MMU_PAGE_64K), RIC_FLUSH_TLB);
245*4882a593Smuzhiyun }
246*4882a593Smuzhiyun }
247*4882a593Smuzhiyun
248*4882a593Smuzhiyun
fixup_tlbie_lpid_va(unsigned long va,unsigned long lpid,unsigned long ap)249*4882a593Smuzhiyun static inline void fixup_tlbie_lpid_va(unsigned long va, unsigned long lpid,
250*4882a593Smuzhiyun unsigned long ap)
251*4882a593Smuzhiyun {
252*4882a593Smuzhiyun if (cpu_has_feature(CPU_FTR_P9_TLBIE_ERAT_BUG)) {
253*4882a593Smuzhiyun asm volatile("ptesync": : :"memory");
254*4882a593Smuzhiyun __tlbie_lpid_va(va, 0, ap, RIC_FLUSH_TLB);
255*4882a593Smuzhiyun }
256*4882a593Smuzhiyun
257*4882a593Smuzhiyun if (cpu_has_feature(CPU_FTR_P9_TLBIE_STQ_BUG)) {
258*4882a593Smuzhiyun asm volatile("ptesync": : :"memory");
259*4882a593Smuzhiyun __tlbie_lpid_va(va, lpid, ap, RIC_FLUSH_TLB);
260*4882a593Smuzhiyun }
261*4882a593Smuzhiyun }
262*4882a593Smuzhiyun
fixup_tlbie_lpid(unsigned long lpid)263*4882a593Smuzhiyun static inline void fixup_tlbie_lpid(unsigned long lpid)
264*4882a593Smuzhiyun {
265*4882a593Smuzhiyun /*
266*4882a593Smuzhiyun * We can use any address for the invalidation, pick one which is
267*4882a593Smuzhiyun * probably unused as an optimisation.
268*4882a593Smuzhiyun */
269*4882a593Smuzhiyun unsigned long va = ((1UL << 52) - 1);
270*4882a593Smuzhiyun
271*4882a593Smuzhiyun if (cpu_has_feature(CPU_FTR_P9_TLBIE_ERAT_BUG)) {
272*4882a593Smuzhiyun asm volatile("ptesync": : :"memory");
273*4882a593Smuzhiyun __tlbie_lpid(0, RIC_FLUSH_TLB);
274*4882a593Smuzhiyun }
275*4882a593Smuzhiyun
276*4882a593Smuzhiyun if (cpu_has_feature(CPU_FTR_P9_TLBIE_STQ_BUG)) {
277*4882a593Smuzhiyun asm volatile("ptesync": : :"memory");
278*4882a593Smuzhiyun __tlbie_lpid_va(va, lpid, mmu_get_ap(MMU_PAGE_64K), RIC_FLUSH_TLB);
279*4882a593Smuzhiyun }
280*4882a593Smuzhiyun }
281*4882a593Smuzhiyun
282*4882a593Smuzhiyun /*
283*4882a593Smuzhiyun * We use 128 set in radix mode and 256 set in hpt mode.
284*4882a593Smuzhiyun */
_tlbiel_pid(unsigned long pid,unsigned long ric)285*4882a593Smuzhiyun static inline void _tlbiel_pid(unsigned long pid, unsigned long ric)
286*4882a593Smuzhiyun {
287*4882a593Smuzhiyun int set;
288*4882a593Smuzhiyun
289*4882a593Smuzhiyun asm volatile("ptesync": : :"memory");
290*4882a593Smuzhiyun
291*4882a593Smuzhiyun switch (ric) {
292*4882a593Smuzhiyun case RIC_FLUSH_PWC:
293*4882a593Smuzhiyun
294*4882a593Smuzhiyun /* For PWC, only one flush is needed */
295*4882a593Smuzhiyun __tlbiel_pid(pid, 0, RIC_FLUSH_PWC);
296*4882a593Smuzhiyun ppc_after_tlbiel_barrier();
297*4882a593Smuzhiyun return;
298*4882a593Smuzhiyun case RIC_FLUSH_TLB:
299*4882a593Smuzhiyun __tlbiel_pid(pid, 0, RIC_FLUSH_TLB);
300*4882a593Smuzhiyun break;
301*4882a593Smuzhiyun case RIC_FLUSH_ALL:
302*4882a593Smuzhiyun default:
303*4882a593Smuzhiyun /*
304*4882a593Smuzhiyun * Flush the first set of the TLB, and if
305*4882a593Smuzhiyun * we're doing a RIC_FLUSH_ALL, also flush
306*4882a593Smuzhiyun * the entire Page Walk Cache.
307*4882a593Smuzhiyun */
308*4882a593Smuzhiyun __tlbiel_pid(pid, 0, RIC_FLUSH_ALL);
309*4882a593Smuzhiyun }
310*4882a593Smuzhiyun
311*4882a593Smuzhiyun /* For the remaining sets, just flush the TLB */
312*4882a593Smuzhiyun for (set = 1; set < POWER9_TLB_SETS_RADIX ; set++)
313*4882a593Smuzhiyun __tlbiel_pid(pid, set, RIC_FLUSH_TLB);
314*4882a593Smuzhiyun
315*4882a593Smuzhiyun ppc_after_tlbiel_barrier();
316*4882a593Smuzhiyun asm volatile(PPC_RADIX_INVALIDATE_ERAT_USER "; isync" : : :"memory");
317*4882a593Smuzhiyun }
318*4882a593Smuzhiyun
_tlbie_pid(unsigned long pid,unsigned long ric)319*4882a593Smuzhiyun static inline void _tlbie_pid(unsigned long pid, unsigned long ric)
320*4882a593Smuzhiyun {
321*4882a593Smuzhiyun asm volatile("ptesync": : :"memory");
322*4882a593Smuzhiyun
323*4882a593Smuzhiyun /*
324*4882a593Smuzhiyun * Workaround the fact that the "ric" argument to __tlbie_pid
325*4882a593Smuzhiyun * must be a compile-time contraint to match the "i" constraint
326*4882a593Smuzhiyun * in the asm statement.
327*4882a593Smuzhiyun */
328*4882a593Smuzhiyun switch (ric) {
329*4882a593Smuzhiyun case RIC_FLUSH_TLB:
330*4882a593Smuzhiyun __tlbie_pid(pid, RIC_FLUSH_TLB);
331*4882a593Smuzhiyun fixup_tlbie_pid(pid);
332*4882a593Smuzhiyun break;
333*4882a593Smuzhiyun case RIC_FLUSH_PWC:
334*4882a593Smuzhiyun __tlbie_pid(pid, RIC_FLUSH_PWC);
335*4882a593Smuzhiyun break;
336*4882a593Smuzhiyun case RIC_FLUSH_ALL:
337*4882a593Smuzhiyun default:
338*4882a593Smuzhiyun __tlbie_pid(pid, RIC_FLUSH_ALL);
339*4882a593Smuzhiyun fixup_tlbie_pid(pid);
340*4882a593Smuzhiyun }
341*4882a593Smuzhiyun asm volatile("eieio; tlbsync; ptesync": : :"memory");
342*4882a593Smuzhiyun }
343*4882a593Smuzhiyun
344*4882a593Smuzhiyun struct tlbiel_pid {
345*4882a593Smuzhiyun unsigned long pid;
346*4882a593Smuzhiyun unsigned long ric;
347*4882a593Smuzhiyun };
348*4882a593Smuzhiyun
do_tlbiel_pid(void * info)349*4882a593Smuzhiyun static void do_tlbiel_pid(void *info)
350*4882a593Smuzhiyun {
351*4882a593Smuzhiyun struct tlbiel_pid *t = info;
352*4882a593Smuzhiyun
353*4882a593Smuzhiyun if (t->ric == RIC_FLUSH_TLB)
354*4882a593Smuzhiyun _tlbiel_pid(t->pid, RIC_FLUSH_TLB);
355*4882a593Smuzhiyun else if (t->ric == RIC_FLUSH_PWC)
356*4882a593Smuzhiyun _tlbiel_pid(t->pid, RIC_FLUSH_PWC);
357*4882a593Smuzhiyun else
358*4882a593Smuzhiyun _tlbiel_pid(t->pid, RIC_FLUSH_ALL);
359*4882a593Smuzhiyun }
360*4882a593Smuzhiyun
_tlbiel_pid_multicast(struct mm_struct * mm,unsigned long pid,unsigned long ric)361*4882a593Smuzhiyun static inline void _tlbiel_pid_multicast(struct mm_struct *mm,
362*4882a593Smuzhiyun unsigned long pid, unsigned long ric)
363*4882a593Smuzhiyun {
364*4882a593Smuzhiyun struct cpumask *cpus = mm_cpumask(mm);
365*4882a593Smuzhiyun struct tlbiel_pid t = { .pid = pid, .ric = ric };
366*4882a593Smuzhiyun
367*4882a593Smuzhiyun on_each_cpu_mask(cpus, do_tlbiel_pid, &t, 1);
368*4882a593Smuzhiyun /*
369*4882a593Smuzhiyun * Always want the CPU translations to be invalidated with tlbiel in
370*4882a593Smuzhiyun * these paths, so while coprocessors must use tlbie, we can not
371*4882a593Smuzhiyun * optimise away the tlbiel component.
372*4882a593Smuzhiyun */
373*4882a593Smuzhiyun if (atomic_read(&mm->context.copros) > 0)
374*4882a593Smuzhiyun _tlbie_pid(pid, RIC_FLUSH_ALL);
375*4882a593Smuzhiyun }
376*4882a593Smuzhiyun
_tlbie_lpid(unsigned long lpid,unsigned long ric)377*4882a593Smuzhiyun static inline void _tlbie_lpid(unsigned long lpid, unsigned long ric)
378*4882a593Smuzhiyun {
379*4882a593Smuzhiyun asm volatile("ptesync": : :"memory");
380*4882a593Smuzhiyun
381*4882a593Smuzhiyun /*
382*4882a593Smuzhiyun * Workaround the fact that the "ric" argument to __tlbie_pid
383*4882a593Smuzhiyun * must be a compile-time contraint to match the "i" constraint
384*4882a593Smuzhiyun * in the asm statement.
385*4882a593Smuzhiyun */
386*4882a593Smuzhiyun switch (ric) {
387*4882a593Smuzhiyun case RIC_FLUSH_TLB:
388*4882a593Smuzhiyun __tlbie_lpid(lpid, RIC_FLUSH_TLB);
389*4882a593Smuzhiyun fixup_tlbie_lpid(lpid);
390*4882a593Smuzhiyun break;
391*4882a593Smuzhiyun case RIC_FLUSH_PWC:
392*4882a593Smuzhiyun __tlbie_lpid(lpid, RIC_FLUSH_PWC);
393*4882a593Smuzhiyun break;
394*4882a593Smuzhiyun case RIC_FLUSH_ALL:
395*4882a593Smuzhiyun default:
396*4882a593Smuzhiyun __tlbie_lpid(lpid, RIC_FLUSH_ALL);
397*4882a593Smuzhiyun fixup_tlbie_lpid(lpid);
398*4882a593Smuzhiyun }
399*4882a593Smuzhiyun asm volatile("eieio; tlbsync; ptesync": : :"memory");
400*4882a593Smuzhiyun }
401*4882a593Smuzhiyun
_tlbie_lpid_guest(unsigned long lpid,unsigned long ric)402*4882a593Smuzhiyun static __always_inline void _tlbie_lpid_guest(unsigned long lpid, unsigned long ric)
403*4882a593Smuzhiyun {
404*4882a593Smuzhiyun /*
405*4882a593Smuzhiyun * Workaround the fact that the "ric" argument to __tlbie_pid
406*4882a593Smuzhiyun * must be a compile-time contraint to match the "i" constraint
407*4882a593Smuzhiyun * in the asm statement.
408*4882a593Smuzhiyun */
409*4882a593Smuzhiyun switch (ric) {
410*4882a593Smuzhiyun case RIC_FLUSH_TLB:
411*4882a593Smuzhiyun __tlbie_lpid_guest(lpid, RIC_FLUSH_TLB);
412*4882a593Smuzhiyun break;
413*4882a593Smuzhiyun case RIC_FLUSH_PWC:
414*4882a593Smuzhiyun __tlbie_lpid_guest(lpid, RIC_FLUSH_PWC);
415*4882a593Smuzhiyun break;
416*4882a593Smuzhiyun case RIC_FLUSH_ALL:
417*4882a593Smuzhiyun default:
418*4882a593Smuzhiyun __tlbie_lpid_guest(lpid, RIC_FLUSH_ALL);
419*4882a593Smuzhiyun }
420*4882a593Smuzhiyun fixup_tlbie_lpid(lpid);
421*4882a593Smuzhiyun asm volatile("eieio; tlbsync; ptesync": : :"memory");
422*4882a593Smuzhiyun }
423*4882a593Smuzhiyun
__tlbiel_va_range(unsigned long start,unsigned long end,unsigned long pid,unsigned long page_size,unsigned long psize)424*4882a593Smuzhiyun static inline void __tlbiel_va_range(unsigned long start, unsigned long end,
425*4882a593Smuzhiyun unsigned long pid, unsigned long page_size,
426*4882a593Smuzhiyun unsigned long psize)
427*4882a593Smuzhiyun {
428*4882a593Smuzhiyun unsigned long addr;
429*4882a593Smuzhiyun unsigned long ap = mmu_get_ap(psize);
430*4882a593Smuzhiyun
431*4882a593Smuzhiyun for (addr = start; addr < end; addr += page_size)
432*4882a593Smuzhiyun __tlbiel_va(addr, pid, ap, RIC_FLUSH_TLB);
433*4882a593Smuzhiyun }
434*4882a593Smuzhiyun
_tlbiel_va(unsigned long va,unsigned long pid,unsigned long psize,unsigned long ric)435*4882a593Smuzhiyun static __always_inline void _tlbiel_va(unsigned long va, unsigned long pid,
436*4882a593Smuzhiyun unsigned long psize, unsigned long ric)
437*4882a593Smuzhiyun {
438*4882a593Smuzhiyun unsigned long ap = mmu_get_ap(psize);
439*4882a593Smuzhiyun
440*4882a593Smuzhiyun asm volatile("ptesync": : :"memory");
441*4882a593Smuzhiyun __tlbiel_va(va, pid, ap, ric);
442*4882a593Smuzhiyun ppc_after_tlbiel_barrier();
443*4882a593Smuzhiyun }
444*4882a593Smuzhiyun
_tlbiel_va_range(unsigned long start,unsigned long end,unsigned long pid,unsigned long page_size,unsigned long psize,bool also_pwc)445*4882a593Smuzhiyun static inline void _tlbiel_va_range(unsigned long start, unsigned long end,
446*4882a593Smuzhiyun unsigned long pid, unsigned long page_size,
447*4882a593Smuzhiyun unsigned long psize, bool also_pwc)
448*4882a593Smuzhiyun {
449*4882a593Smuzhiyun asm volatile("ptesync": : :"memory");
450*4882a593Smuzhiyun if (also_pwc)
451*4882a593Smuzhiyun __tlbiel_pid(pid, 0, RIC_FLUSH_PWC);
452*4882a593Smuzhiyun __tlbiel_va_range(start, end, pid, page_size, psize);
453*4882a593Smuzhiyun ppc_after_tlbiel_barrier();
454*4882a593Smuzhiyun }
455*4882a593Smuzhiyun
__tlbie_va_range(unsigned long start,unsigned long end,unsigned long pid,unsigned long page_size,unsigned long psize)456*4882a593Smuzhiyun static inline void __tlbie_va_range(unsigned long start, unsigned long end,
457*4882a593Smuzhiyun unsigned long pid, unsigned long page_size,
458*4882a593Smuzhiyun unsigned long psize)
459*4882a593Smuzhiyun {
460*4882a593Smuzhiyun unsigned long addr;
461*4882a593Smuzhiyun unsigned long ap = mmu_get_ap(psize);
462*4882a593Smuzhiyun
463*4882a593Smuzhiyun for (addr = start; addr < end; addr += page_size)
464*4882a593Smuzhiyun __tlbie_va(addr, pid, ap, RIC_FLUSH_TLB);
465*4882a593Smuzhiyun
466*4882a593Smuzhiyun fixup_tlbie_va_range(addr - page_size, pid, ap);
467*4882a593Smuzhiyun }
468*4882a593Smuzhiyun
_tlbie_va(unsigned long va,unsigned long pid,unsigned long psize,unsigned long ric)469*4882a593Smuzhiyun static __always_inline void _tlbie_va(unsigned long va, unsigned long pid,
470*4882a593Smuzhiyun unsigned long psize, unsigned long ric)
471*4882a593Smuzhiyun {
472*4882a593Smuzhiyun unsigned long ap = mmu_get_ap(psize);
473*4882a593Smuzhiyun
474*4882a593Smuzhiyun asm volatile("ptesync": : :"memory");
475*4882a593Smuzhiyun __tlbie_va(va, pid, ap, ric);
476*4882a593Smuzhiyun fixup_tlbie_va(va, pid, ap);
477*4882a593Smuzhiyun asm volatile("eieio; tlbsync; ptesync": : :"memory");
478*4882a593Smuzhiyun }
479*4882a593Smuzhiyun
480*4882a593Smuzhiyun struct tlbiel_va {
481*4882a593Smuzhiyun unsigned long pid;
482*4882a593Smuzhiyun unsigned long va;
483*4882a593Smuzhiyun unsigned long psize;
484*4882a593Smuzhiyun unsigned long ric;
485*4882a593Smuzhiyun };
486*4882a593Smuzhiyun
do_tlbiel_va(void * info)487*4882a593Smuzhiyun static void do_tlbiel_va(void *info)
488*4882a593Smuzhiyun {
489*4882a593Smuzhiyun struct tlbiel_va *t = info;
490*4882a593Smuzhiyun
491*4882a593Smuzhiyun if (t->ric == RIC_FLUSH_TLB)
492*4882a593Smuzhiyun _tlbiel_va(t->va, t->pid, t->psize, RIC_FLUSH_TLB);
493*4882a593Smuzhiyun else if (t->ric == RIC_FLUSH_PWC)
494*4882a593Smuzhiyun _tlbiel_va(t->va, t->pid, t->psize, RIC_FLUSH_PWC);
495*4882a593Smuzhiyun else
496*4882a593Smuzhiyun _tlbiel_va(t->va, t->pid, t->psize, RIC_FLUSH_ALL);
497*4882a593Smuzhiyun }
498*4882a593Smuzhiyun
_tlbiel_va_multicast(struct mm_struct * mm,unsigned long va,unsigned long pid,unsigned long psize,unsigned long ric)499*4882a593Smuzhiyun static inline void _tlbiel_va_multicast(struct mm_struct *mm,
500*4882a593Smuzhiyun unsigned long va, unsigned long pid,
501*4882a593Smuzhiyun unsigned long psize, unsigned long ric)
502*4882a593Smuzhiyun {
503*4882a593Smuzhiyun struct cpumask *cpus = mm_cpumask(mm);
504*4882a593Smuzhiyun struct tlbiel_va t = { .va = va, .pid = pid, .psize = psize, .ric = ric };
505*4882a593Smuzhiyun on_each_cpu_mask(cpus, do_tlbiel_va, &t, 1);
506*4882a593Smuzhiyun if (atomic_read(&mm->context.copros) > 0)
507*4882a593Smuzhiyun _tlbie_va(va, pid, psize, RIC_FLUSH_TLB);
508*4882a593Smuzhiyun }
509*4882a593Smuzhiyun
510*4882a593Smuzhiyun struct tlbiel_va_range {
511*4882a593Smuzhiyun unsigned long pid;
512*4882a593Smuzhiyun unsigned long start;
513*4882a593Smuzhiyun unsigned long end;
514*4882a593Smuzhiyun unsigned long page_size;
515*4882a593Smuzhiyun unsigned long psize;
516*4882a593Smuzhiyun bool also_pwc;
517*4882a593Smuzhiyun };
518*4882a593Smuzhiyun
do_tlbiel_va_range(void * info)519*4882a593Smuzhiyun static void do_tlbiel_va_range(void *info)
520*4882a593Smuzhiyun {
521*4882a593Smuzhiyun struct tlbiel_va_range *t = info;
522*4882a593Smuzhiyun
523*4882a593Smuzhiyun _tlbiel_va_range(t->start, t->end, t->pid, t->page_size,
524*4882a593Smuzhiyun t->psize, t->also_pwc);
525*4882a593Smuzhiyun }
526*4882a593Smuzhiyun
_tlbie_lpid_va(unsigned long va,unsigned long lpid,unsigned long psize,unsigned long ric)527*4882a593Smuzhiyun static __always_inline void _tlbie_lpid_va(unsigned long va, unsigned long lpid,
528*4882a593Smuzhiyun unsigned long psize, unsigned long ric)
529*4882a593Smuzhiyun {
530*4882a593Smuzhiyun unsigned long ap = mmu_get_ap(psize);
531*4882a593Smuzhiyun
532*4882a593Smuzhiyun asm volatile("ptesync": : :"memory");
533*4882a593Smuzhiyun __tlbie_lpid_va(va, lpid, ap, ric);
534*4882a593Smuzhiyun fixup_tlbie_lpid_va(va, lpid, ap);
535*4882a593Smuzhiyun asm volatile("eieio; tlbsync; ptesync": : :"memory");
536*4882a593Smuzhiyun }
537*4882a593Smuzhiyun
_tlbie_va_range(unsigned long start,unsigned long end,unsigned long pid,unsigned long page_size,unsigned long psize,bool also_pwc)538*4882a593Smuzhiyun static inline void _tlbie_va_range(unsigned long start, unsigned long end,
539*4882a593Smuzhiyun unsigned long pid, unsigned long page_size,
540*4882a593Smuzhiyun unsigned long psize, bool also_pwc)
541*4882a593Smuzhiyun {
542*4882a593Smuzhiyun asm volatile("ptesync": : :"memory");
543*4882a593Smuzhiyun if (also_pwc)
544*4882a593Smuzhiyun __tlbie_pid(pid, RIC_FLUSH_PWC);
545*4882a593Smuzhiyun __tlbie_va_range(start, end, pid, page_size, psize);
546*4882a593Smuzhiyun asm volatile("eieio; tlbsync; ptesync": : :"memory");
547*4882a593Smuzhiyun }
548*4882a593Smuzhiyun
_tlbiel_va_range_multicast(struct mm_struct * mm,unsigned long start,unsigned long end,unsigned long pid,unsigned long page_size,unsigned long psize,bool also_pwc)549*4882a593Smuzhiyun static inline void _tlbiel_va_range_multicast(struct mm_struct *mm,
550*4882a593Smuzhiyun unsigned long start, unsigned long end,
551*4882a593Smuzhiyun unsigned long pid, unsigned long page_size,
552*4882a593Smuzhiyun unsigned long psize, bool also_pwc)
553*4882a593Smuzhiyun {
554*4882a593Smuzhiyun struct cpumask *cpus = mm_cpumask(mm);
555*4882a593Smuzhiyun struct tlbiel_va_range t = { .start = start, .end = end,
556*4882a593Smuzhiyun .pid = pid, .page_size = page_size,
557*4882a593Smuzhiyun .psize = psize, .also_pwc = also_pwc };
558*4882a593Smuzhiyun
559*4882a593Smuzhiyun on_each_cpu_mask(cpus, do_tlbiel_va_range, &t, 1);
560*4882a593Smuzhiyun if (atomic_read(&mm->context.copros) > 0)
561*4882a593Smuzhiyun _tlbie_va_range(start, end, pid, page_size, psize, also_pwc);
562*4882a593Smuzhiyun }
563*4882a593Smuzhiyun
564*4882a593Smuzhiyun /*
565*4882a593Smuzhiyun * Base TLB flushing operations:
566*4882a593Smuzhiyun *
567*4882a593Smuzhiyun * - flush_tlb_mm(mm) flushes the specified mm context TLB's
568*4882a593Smuzhiyun * - flush_tlb_page(vma, vmaddr) flushes one page
569*4882a593Smuzhiyun * - flush_tlb_range(vma, start, end) flushes a range of pages
570*4882a593Smuzhiyun * - flush_tlb_kernel_range(start, end) flushes kernel pages
571*4882a593Smuzhiyun *
572*4882a593Smuzhiyun * - local_* variants of page and mm only apply to the current
573*4882a593Smuzhiyun * processor
574*4882a593Smuzhiyun */
radix__local_flush_tlb_mm(struct mm_struct * mm)575*4882a593Smuzhiyun void radix__local_flush_tlb_mm(struct mm_struct *mm)
576*4882a593Smuzhiyun {
577*4882a593Smuzhiyun unsigned long pid;
578*4882a593Smuzhiyun
579*4882a593Smuzhiyun preempt_disable();
580*4882a593Smuzhiyun pid = mm->context.id;
581*4882a593Smuzhiyun if (pid != MMU_NO_CONTEXT)
582*4882a593Smuzhiyun _tlbiel_pid(pid, RIC_FLUSH_TLB);
583*4882a593Smuzhiyun preempt_enable();
584*4882a593Smuzhiyun }
585*4882a593Smuzhiyun EXPORT_SYMBOL(radix__local_flush_tlb_mm);
586*4882a593Smuzhiyun
587*4882a593Smuzhiyun #ifndef CONFIG_SMP
radix__local_flush_all_mm(struct mm_struct * mm)588*4882a593Smuzhiyun void radix__local_flush_all_mm(struct mm_struct *mm)
589*4882a593Smuzhiyun {
590*4882a593Smuzhiyun unsigned long pid;
591*4882a593Smuzhiyun
592*4882a593Smuzhiyun preempt_disable();
593*4882a593Smuzhiyun pid = mm->context.id;
594*4882a593Smuzhiyun if (pid != MMU_NO_CONTEXT)
595*4882a593Smuzhiyun _tlbiel_pid(pid, RIC_FLUSH_ALL);
596*4882a593Smuzhiyun preempt_enable();
597*4882a593Smuzhiyun }
598*4882a593Smuzhiyun EXPORT_SYMBOL(radix__local_flush_all_mm);
599*4882a593Smuzhiyun
__flush_all_mm(struct mm_struct * mm,bool fullmm)600*4882a593Smuzhiyun static void __flush_all_mm(struct mm_struct *mm, bool fullmm)
601*4882a593Smuzhiyun {
602*4882a593Smuzhiyun radix__local_flush_all_mm(mm);
603*4882a593Smuzhiyun }
604*4882a593Smuzhiyun #endif /* CONFIG_SMP */
605*4882a593Smuzhiyun
radix__local_flush_tlb_page_psize(struct mm_struct * mm,unsigned long vmaddr,int psize)606*4882a593Smuzhiyun void radix__local_flush_tlb_page_psize(struct mm_struct *mm, unsigned long vmaddr,
607*4882a593Smuzhiyun int psize)
608*4882a593Smuzhiyun {
609*4882a593Smuzhiyun unsigned long pid;
610*4882a593Smuzhiyun
611*4882a593Smuzhiyun preempt_disable();
612*4882a593Smuzhiyun pid = mm->context.id;
613*4882a593Smuzhiyun if (pid != MMU_NO_CONTEXT)
614*4882a593Smuzhiyun _tlbiel_va(vmaddr, pid, psize, RIC_FLUSH_TLB);
615*4882a593Smuzhiyun preempt_enable();
616*4882a593Smuzhiyun }
617*4882a593Smuzhiyun
radix__local_flush_tlb_page(struct vm_area_struct * vma,unsigned long vmaddr)618*4882a593Smuzhiyun void radix__local_flush_tlb_page(struct vm_area_struct *vma, unsigned long vmaddr)
619*4882a593Smuzhiyun {
620*4882a593Smuzhiyun #ifdef CONFIG_HUGETLB_PAGE
621*4882a593Smuzhiyun /* need the return fix for nohash.c */
622*4882a593Smuzhiyun if (is_vm_hugetlb_page(vma))
623*4882a593Smuzhiyun return radix__local_flush_hugetlb_page(vma, vmaddr);
624*4882a593Smuzhiyun #endif
625*4882a593Smuzhiyun radix__local_flush_tlb_page_psize(vma->vm_mm, vmaddr, mmu_virtual_psize);
626*4882a593Smuzhiyun }
627*4882a593Smuzhiyun EXPORT_SYMBOL(radix__local_flush_tlb_page);
628*4882a593Smuzhiyun
mm_is_singlethreaded(struct mm_struct * mm)629*4882a593Smuzhiyun static bool mm_is_singlethreaded(struct mm_struct *mm)
630*4882a593Smuzhiyun {
631*4882a593Smuzhiyun if (atomic_read(&mm->context.copros) > 0)
632*4882a593Smuzhiyun return false;
633*4882a593Smuzhiyun if (atomic_read(&mm->mm_users) <= 1 && current->mm == mm)
634*4882a593Smuzhiyun return true;
635*4882a593Smuzhiyun return false;
636*4882a593Smuzhiyun }
637*4882a593Smuzhiyun
mm_needs_flush_escalation(struct mm_struct * mm)638*4882a593Smuzhiyun static bool mm_needs_flush_escalation(struct mm_struct *mm)
639*4882a593Smuzhiyun {
640*4882a593Smuzhiyun /*
641*4882a593Smuzhiyun * P9 nest MMU has issues with the page walk cache
642*4882a593Smuzhiyun * caching PTEs and not flushing them properly when
643*4882a593Smuzhiyun * RIC = 0 for a PID/LPID invalidate
644*4882a593Smuzhiyun */
645*4882a593Smuzhiyun if (atomic_read(&mm->context.copros) > 0)
646*4882a593Smuzhiyun return true;
647*4882a593Smuzhiyun return false;
648*4882a593Smuzhiyun }
649*4882a593Smuzhiyun
650*4882a593Smuzhiyun #ifdef CONFIG_SMP
do_exit_flush_lazy_tlb(void * arg)651*4882a593Smuzhiyun static void do_exit_flush_lazy_tlb(void *arg)
652*4882a593Smuzhiyun {
653*4882a593Smuzhiyun struct mm_struct *mm = arg;
654*4882a593Smuzhiyun unsigned long pid = mm->context.id;
655*4882a593Smuzhiyun
656*4882a593Smuzhiyun /*
657*4882a593Smuzhiyun * A kthread could have done a mmget_not_zero() after the flushing CPU
658*4882a593Smuzhiyun * checked mm_is_singlethreaded, and be in the process of
659*4882a593Smuzhiyun * kthread_use_mm when interrupted here. In that case, current->mm will
660*4882a593Smuzhiyun * be set to mm, because kthread_use_mm() setting ->mm and switching to
661*4882a593Smuzhiyun * the mm is done with interrupts off.
662*4882a593Smuzhiyun */
663*4882a593Smuzhiyun if (current->mm == mm)
664*4882a593Smuzhiyun goto out_flush;
665*4882a593Smuzhiyun
666*4882a593Smuzhiyun if (current->active_mm == mm) {
667*4882a593Smuzhiyun WARN_ON_ONCE(current->mm != NULL);
668*4882a593Smuzhiyun /* Is a kernel thread and is using mm as the lazy tlb */
669*4882a593Smuzhiyun mmgrab(&init_mm);
670*4882a593Smuzhiyun current->active_mm = &init_mm;
671*4882a593Smuzhiyun switch_mm_irqs_off(mm, &init_mm, current);
672*4882a593Smuzhiyun mmdrop(mm);
673*4882a593Smuzhiyun }
674*4882a593Smuzhiyun
675*4882a593Smuzhiyun atomic_dec(&mm->context.active_cpus);
676*4882a593Smuzhiyun cpumask_clear_cpu(smp_processor_id(), mm_cpumask(mm));
677*4882a593Smuzhiyun
678*4882a593Smuzhiyun out_flush:
679*4882a593Smuzhiyun _tlbiel_pid(pid, RIC_FLUSH_ALL);
680*4882a593Smuzhiyun }
681*4882a593Smuzhiyun
exit_flush_lazy_tlbs(struct mm_struct * mm)682*4882a593Smuzhiyun static void exit_flush_lazy_tlbs(struct mm_struct *mm)
683*4882a593Smuzhiyun {
684*4882a593Smuzhiyun /*
685*4882a593Smuzhiyun * Would be nice if this was async so it could be run in
686*4882a593Smuzhiyun * parallel with our local flush, but generic code does not
687*4882a593Smuzhiyun * give a good API for it. Could extend the generic code or
688*4882a593Smuzhiyun * make a special powerpc IPI for flushing TLBs.
689*4882a593Smuzhiyun * For now it's not too performance critical.
690*4882a593Smuzhiyun */
691*4882a593Smuzhiyun smp_call_function_many(mm_cpumask(mm), do_exit_flush_lazy_tlb,
692*4882a593Smuzhiyun (void *)mm, 1);
693*4882a593Smuzhiyun }
694*4882a593Smuzhiyun
radix__flush_tlb_mm(struct mm_struct * mm)695*4882a593Smuzhiyun void radix__flush_tlb_mm(struct mm_struct *mm)
696*4882a593Smuzhiyun {
697*4882a593Smuzhiyun unsigned long pid;
698*4882a593Smuzhiyun
699*4882a593Smuzhiyun pid = mm->context.id;
700*4882a593Smuzhiyun if (unlikely(pid == MMU_NO_CONTEXT))
701*4882a593Smuzhiyun return;
702*4882a593Smuzhiyun
703*4882a593Smuzhiyun preempt_disable();
704*4882a593Smuzhiyun /*
705*4882a593Smuzhiyun * Order loads of mm_cpumask vs previous stores to clear ptes before
706*4882a593Smuzhiyun * the invalidate. See barrier in switch_mm_irqs_off
707*4882a593Smuzhiyun */
708*4882a593Smuzhiyun smp_mb();
709*4882a593Smuzhiyun if (!mm_is_thread_local(mm)) {
710*4882a593Smuzhiyun if (unlikely(mm_is_singlethreaded(mm))) {
711*4882a593Smuzhiyun exit_flush_lazy_tlbs(mm);
712*4882a593Smuzhiyun goto local;
713*4882a593Smuzhiyun }
714*4882a593Smuzhiyun
715*4882a593Smuzhiyun if (!mmu_has_feature(MMU_FTR_GTSE)) {
716*4882a593Smuzhiyun unsigned long tgt = H_RPTI_TARGET_CMMU;
717*4882a593Smuzhiyun
718*4882a593Smuzhiyun if (atomic_read(&mm->context.copros) > 0)
719*4882a593Smuzhiyun tgt |= H_RPTI_TARGET_NMMU;
720*4882a593Smuzhiyun pseries_rpt_invalidate(pid, tgt, H_RPTI_TYPE_TLB,
721*4882a593Smuzhiyun H_RPTI_PAGE_ALL, 0, -1UL);
722*4882a593Smuzhiyun } else if (cputlb_use_tlbie()) {
723*4882a593Smuzhiyun if (mm_needs_flush_escalation(mm))
724*4882a593Smuzhiyun _tlbie_pid(pid, RIC_FLUSH_ALL);
725*4882a593Smuzhiyun else
726*4882a593Smuzhiyun _tlbie_pid(pid, RIC_FLUSH_TLB);
727*4882a593Smuzhiyun } else {
728*4882a593Smuzhiyun _tlbiel_pid_multicast(mm, pid, RIC_FLUSH_TLB);
729*4882a593Smuzhiyun }
730*4882a593Smuzhiyun } else {
731*4882a593Smuzhiyun local:
732*4882a593Smuzhiyun _tlbiel_pid(pid, RIC_FLUSH_TLB);
733*4882a593Smuzhiyun }
734*4882a593Smuzhiyun preempt_enable();
735*4882a593Smuzhiyun }
736*4882a593Smuzhiyun EXPORT_SYMBOL(radix__flush_tlb_mm);
737*4882a593Smuzhiyun
__flush_all_mm(struct mm_struct * mm,bool fullmm)738*4882a593Smuzhiyun static void __flush_all_mm(struct mm_struct *mm, bool fullmm)
739*4882a593Smuzhiyun {
740*4882a593Smuzhiyun unsigned long pid;
741*4882a593Smuzhiyun
742*4882a593Smuzhiyun pid = mm->context.id;
743*4882a593Smuzhiyun if (unlikely(pid == MMU_NO_CONTEXT))
744*4882a593Smuzhiyun return;
745*4882a593Smuzhiyun
746*4882a593Smuzhiyun preempt_disable();
747*4882a593Smuzhiyun smp_mb(); /* see radix__flush_tlb_mm */
748*4882a593Smuzhiyun if (!mm_is_thread_local(mm)) {
749*4882a593Smuzhiyun if (unlikely(mm_is_singlethreaded(mm))) {
750*4882a593Smuzhiyun if (!fullmm) {
751*4882a593Smuzhiyun exit_flush_lazy_tlbs(mm);
752*4882a593Smuzhiyun goto local;
753*4882a593Smuzhiyun }
754*4882a593Smuzhiyun }
755*4882a593Smuzhiyun if (!mmu_has_feature(MMU_FTR_GTSE)) {
756*4882a593Smuzhiyun unsigned long tgt = H_RPTI_TARGET_CMMU;
757*4882a593Smuzhiyun unsigned long type = H_RPTI_TYPE_TLB | H_RPTI_TYPE_PWC |
758*4882a593Smuzhiyun H_RPTI_TYPE_PRT;
759*4882a593Smuzhiyun
760*4882a593Smuzhiyun if (atomic_read(&mm->context.copros) > 0)
761*4882a593Smuzhiyun tgt |= H_RPTI_TARGET_NMMU;
762*4882a593Smuzhiyun pseries_rpt_invalidate(pid, tgt, type,
763*4882a593Smuzhiyun H_RPTI_PAGE_ALL, 0, -1UL);
764*4882a593Smuzhiyun } else if (cputlb_use_tlbie())
765*4882a593Smuzhiyun _tlbie_pid(pid, RIC_FLUSH_ALL);
766*4882a593Smuzhiyun else
767*4882a593Smuzhiyun _tlbiel_pid_multicast(mm, pid, RIC_FLUSH_ALL);
768*4882a593Smuzhiyun } else {
769*4882a593Smuzhiyun local:
770*4882a593Smuzhiyun _tlbiel_pid(pid, RIC_FLUSH_ALL);
771*4882a593Smuzhiyun }
772*4882a593Smuzhiyun preempt_enable();
773*4882a593Smuzhiyun }
774*4882a593Smuzhiyun
radix__flush_all_mm(struct mm_struct * mm)775*4882a593Smuzhiyun void radix__flush_all_mm(struct mm_struct *mm)
776*4882a593Smuzhiyun {
777*4882a593Smuzhiyun __flush_all_mm(mm, false);
778*4882a593Smuzhiyun }
779*4882a593Smuzhiyun EXPORT_SYMBOL(radix__flush_all_mm);
780*4882a593Smuzhiyun
radix__flush_tlb_page_psize(struct mm_struct * mm,unsigned long vmaddr,int psize)781*4882a593Smuzhiyun void radix__flush_tlb_page_psize(struct mm_struct *mm, unsigned long vmaddr,
782*4882a593Smuzhiyun int psize)
783*4882a593Smuzhiyun {
784*4882a593Smuzhiyun unsigned long pid;
785*4882a593Smuzhiyun
786*4882a593Smuzhiyun pid = mm->context.id;
787*4882a593Smuzhiyun if (unlikely(pid == MMU_NO_CONTEXT))
788*4882a593Smuzhiyun return;
789*4882a593Smuzhiyun
790*4882a593Smuzhiyun preempt_disable();
791*4882a593Smuzhiyun smp_mb(); /* see radix__flush_tlb_mm */
792*4882a593Smuzhiyun if (!mm_is_thread_local(mm)) {
793*4882a593Smuzhiyun if (unlikely(mm_is_singlethreaded(mm))) {
794*4882a593Smuzhiyun exit_flush_lazy_tlbs(mm);
795*4882a593Smuzhiyun goto local;
796*4882a593Smuzhiyun }
797*4882a593Smuzhiyun if (!mmu_has_feature(MMU_FTR_GTSE)) {
798*4882a593Smuzhiyun unsigned long tgt, pg_sizes, size;
799*4882a593Smuzhiyun
800*4882a593Smuzhiyun tgt = H_RPTI_TARGET_CMMU;
801*4882a593Smuzhiyun pg_sizes = psize_to_rpti_pgsize(psize);
802*4882a593Smuzhiyun size = 1UL << mmu_psize_to_shift(psize);
803*4882a593Smuzhiyun
804*4882a593Smuzhiyun if (atomic_read(&mm->context.copros) > 0)
805*4882a593Smuzhiyun tgt |= H_RPTI_TARGET_NMMU;
806*4882a593Smuzhiyun pseries_rpt_invalidate(pid, tgt, H_RPTI_TYPE_TLB,
807*4882a593Smuzhiyun pg_sizes, vmaddr,
808*4882a593Smuzhiyun vmaddr + size);
809*4882a593Smuzhiyun } else if (cputlb_use_tlbie())
810*4882a593Smuzhiyun _tlbie_va(vmaddr, pid, psize, RIC_FLUSH_TLB);
811*4882a593Smuzhiyun else
812*4882a593Smuzhiyun _tlbiel_va_multicast(mm, vmaddr, pid, psize, RIC_FLUSH_TLB);
813*4882a593Smuzhiyun } else {
814*4882a593Smuzhiyun local:
815*4882a593Smuzhiyun _tlbiel_va(vmaddr, pid, psize, RIC_FLUSH_TLB);
816*4882a593Smuzhiyun }
817*4882a593Smuzhiyun preempt_enable();
818*4882a593Smuzhiyun }
819*4882a593Smuzhiyun
radix__flush_tlb_page(struct vm_area_struct * vma,unsigned long vmaddr)820*4882a593Smuzhiyun void radix__flush_tlb_page(struct vm_area_struct *vma, unsigned long vmaddr)
821*4882a593Smuzhiyun {
822*4882a593Smuzhiyun #ifdef CONFIG_HUGETLB_PAGE
823*4882a593Smuzhiyun if (is_vm_hugetlb_page(vma))
824*4882a593Smuzhiyun return radix__flush_hugetlb_page(vma, vmaddr);
825*4882a593Smuzhiyun #endif
826*4882a593Smuzhiyun radix__flush_tlb_page_psize(vma->vm_mm, vmaddr, mmu_virtual_psize);
827*4882a593Smuzhiyun }
828*4882a593Smuzhiyun EXPORT_SYMBOL(radix__flush_tlb_page);
829*4882a593Smuzhiyun
830*4882a593Smuzhiyun #else /* CONFIG_SMP */
exit_flush_lazy_tlbs(struct mm_struct * mm)831*4882a593Smuzhiyun static inline void exit_flush_lazy_tlbs(struct mm_struct *mm) { }
832*4882a593Smuzhiyun #endif /* CONFIG_SMP */
833*4882a593Smuzhiyun
do_tlbiel_kernel(void * info)834*4882a593Smuzhiyun static void do_tlbiel_kernel(void *info)
835*4882a593Smuzhiyun {
836*4882a593Smuzhiyun _tlbiel_pid(0, RIC_FLUSH_ALL);
837*4882a593Smuzhiyun }
838*4882a593Smuzhiyun
_tlbiel_kernel_broadcast(void)839*4882a593Smuzhiyun static inline void _tlbiel_kernel_broadcast(void)
840*4882a593Smuzhiyun {
841*4882a593Smuzhiyun on_each_cpu(do_tlbiel_kernel, NULL, 1);
842*4882a593Smuzhiyun if (tlbie_capable) {
843*4882a593Smuzhiyun /*
844*4882a593Smuzhiyun * Coherent accelerators don't refcount kernel memory mappings,
845*4882a593Smuzhiyun * so have to always issue a tlbie for them. This is quite a
846*4882a593Smuzhiyun * slow path anyway.
847*4882a593Smuzhiyun */
848*4882a593Smuzhiyun _tlbie_pid(0, RIC_FLUSH_ALL);
849*4882a593Smuzhiyun }
850*4882a593Smuzhiyun }
851*4882a593Smuzhiyun
852*4882a593Smuzhiyun /*
853*4882a593Smuzhiyun * If kernel TLBIs ever become local rather than global, then
854*4882a593Smuzhiyun * drivers/misc/ocxl/link.c:ocxl_link_add_pe will need some work, as it
855*4882a593Smuzhiyun * assumes kernel TLBIs are global.
856*4882a593Smuzhiyun */
radix__flush_tlb_kernel_range(unsigned long start,unsigned long end)857*4882a593Smuzhiyun void radix__flush_tlb_kernel_range(unsigned long start, unsigned long end)
858*4882a593Smuzhiyun {
859*4882a593Smuzhiyun if (!mmu_has_feature(MMU_FTR_GTSE)) {
860*4882a593Smuzhiyun unsigned long tgt = H_RPTI_TARGET_CMMU | H_RPTI_TARGET_NMMU;
861*4882a593Smuzhiyun unsigned long type = H_RPTI_TYPE_TLB | H_RPTI_TYPE_PWC |
862*4882a593Smuzhiyun H_RPTI_TYPE_PRT;
863*4882a593Smuzhiyun
864*4882a593Smuzhiyun pseries_rpt_invalidate(0, tgt, type, H_RPTI_PAGE_ALL,
865*4882a593Smuzhiyun start, end);
866*4882a593Smuzhiyun } else if (cputlb_use_tlbie())
867*4882a593Smuzhiyun _tlbie_pid(0, RIC_FLUSH_ALL);
868*4882a593Smuzhiyun else
869*4882a593Smuzhiyun _tlbiel_kernel_broadcast();
870*4882a593Smuzhiyun }
871*4882a593Smuzhiyun EXPORT_SYMBOL(radix__flush_tlb_kernel_range);
872*4882a593Smuzhiyun
873*4882a593Smuzhiyun #define TLB_FLUSH_ALL -1UL
874*4882a593Smuzhiyun
875*4882a593Smuzhiyun /*
876*4882a593Smuzhiyun * Number of pages above which we invalidate the entire PID rather than
877*4882a593Smuzhiyun * flush individual pages, for local and global flushes respectively.
878*4882a593Smuzhiyun *
879*4882a593Smuzhiyun * tlbie goes out to the interconnect and individual ops are more costly.
880*4882a593Smuzhiyun * It also does not iterate over sets like the local tlbiel variant when
881*4882a593Smuzhiyun * invalidating a full PID, so it has a far lower threshold to change from
882*4882a593Smuzhiyun * individual page flushes to full-pid flushes.
883*4882a593Smuzhiyun */
884*4882a593Smuzhiyun static unsigned long tlb_single_page_flush_ceiling __read_mostly = 33;
885*4882a593Smuzhiyun static unsigned long tlb_local_single_page_flush_ceiling __read_mostly = POWER9_TLB_SETS_RADIX * 2;
886*4882a593Smuzhiyun
__radix__flush_tlb_range(struct mm_struct * mm,unsigned long start,unsigned long end)887*4882a593Smuzhiyun static inline void __radix__flush_tlb_range(struct mm_struct *mm,
888*4882a593Smuzhiyun unsigned long start, unsigned long end)
889*4882a593Smuzhiyun
890*4882a593Smuzhiyun {
891*4882a593Smuzhiyun unsigned long pid;
892*4882a593Smuzhiyun unsigned int page_shift = mmu_psize_defs[mmu_virtual_psize].shift;
893*4882a593Smuzhiyun unsigned long page_size = 1UL << page_shift;
894*4882a593Smuzhiyun unsigned long nr_pages = (end - start) >> page_shift;
895*4882a593Smuzhiyun bool local, full;
896*4882a593Smuzhiyun
897*4882a593Smuzhiyun pid = mm->context.id;
898*4882a593Smuzhiyun if (unlikely(pid == MMU_NO_CONTEXT))
899*4882a593Smuzhiyun return;
900*4882a593Smuzhiyun
901*4882a593Smuzhiyun preempt_disable();
902*4882a593Smuzhiyun smp_mb(); /* see radix__flush_tlb_mm */
903*4882a593Smuzhiyun if (!mm_is_thread_local(mm)) {
904*4882a593Smuzhiyun if (unlikely(mm_is_singlethreaded(mm))) {
905*4882a593Smuzhiyun if (end != TLB_FLUSH_ALL) {
906*4882a593Smuzhiyun exit_flush_lazy_tlbs(mm);
907*4882a593Smuzhiyun goto is_local;
908*4882a593Smuzhiyun }
909*4882a593Smuzhiyun }
910*4882a593Smuzhiyun local = false;
911*4882a593Smuzhiyun full = (end == TLB_FLUSH_ALL ||
912*4882a593Smuzhiyun nr_pages > tlb_single_page_flush_ceiling);
913*4882a593Smuzhiyun } else {
914*4882a593Smuzhiyun is_local:
915*4882a593Smuzhiyun local = true;
916*4882a593Smuzhiyun full = (end == TLB_FLUSH_ALL ||
917*4882a593Smuzhiyun nr_pages > tlb_local_single_page_flush_ceiling);
918*4882a593Smuzhiyun }
919*4882a593Smuzhiyun
920*4882a593Smuzhiyun if (!mmu_has_feature(MMU_FTR_GTSE) && !local) {
921*4882a593Smuzhiyun unsigned long tgt = H_RPTI_TARGET_CMMU;
922*4882a593Smuzhiyun unsigned long pg_sizes = psize_to_rpti_pgsize(mmu_virtual_psize);
923*4882a593Smuzhiyun
924*4882a593Smuzhiyun if (IS_ENABLED(CONFIG_TRANSPARENT_HUGEPAGE))
925*4882a593Smuzhiyun pg_sizes |= psize_to_rpti_pgsize(MMU_PAGE_2M);
926*4882a593Smuzhiyun if (atomic_read(&mm->context.copros) > 0)
927*4882a593Smuzhiyun tgt |= H_RPTI_TARGET_NMMU;
928*4882a593Smuzhiyun pseries_rpt_invalidate(pid, tgt, H_RPTI_TYPE_TLB, pg_sizes,
929*4882a593Smuzhiyun start, end);
930*4882a593Smuzhiyun } else if (full) {
931*4882a593Smuzhiyun if (local) {
932*4882a593Smuzhiyun _tlbiel_pid(pid, RIC_FLUSH_TLB);
933*4882a593Smuzhiyun } else {
934*4882a593Smuzhiyun if (cputlb_use_tlbie()) {
935*4882a593Smuzhiyun if (mm_needs_flush_escalation(mm))
936*4882a593Smuzhiyun _tlbie_pid(pid, RIC_FLUSH_ALL);
937*4882a593Smuzhiyun else
938*4882a593Smuzhiyun _tlbie_pid(pid, RIC_FLUSH_TLB);
939*4882a593Smuzhiyun } else {
940*4882a593Smuzhiyun _tlbiel_pid_multicast(mm, pid, RIC_FLUSH_TLB);
941*4882a593Smuzhiyun }
942*4882a593Smuzhiyun }
943*4882a593Smuzhiyun } else {
944*4882a593Smuzhiyun bool hflush = false;
945*4882a593Smuzhiyun unsigned long hstart, hend;
946*4882a593Smuzhiyun
947*4882a593Smuzhiyun if (IS_ENABLED(CONFIG_TRANSPARENT_HUGEPAGE)) {
948*4882a593Smuzhiyun hstart = (start + PMD_SIZE - 1) & PMD_MASK;
949*4882a593Smuzhiyun hend = end & PMD_MASK;
950*4882a593Smuzhiyun if (hstart < hend)
951*4882a593Smuzhiyun hflush = true;
952*4882a593Smuzhiyun }
953*4882a593Smuzhiyun
954*4882a593Smuzhiyun if (local) {
955*4882a593Smuzhiyun asm volatile("ptesync": : :"memory");
956*4882a593Smuzhiyun __tlbiel_va_range(start, end, pid, page_size, mmu_virtual_psize);
957*4882a593Smuzhiyun if (hflush)
958*4882a593Smuzhiyun __tlbiel_va_range(hstart, hend, pid,
959*4882a593Smuzhiyun PMD_SIZE, MMU_PAGE_2M);
960*4882a593Smuzhiyun ppc_after_tlbiel_barrier();
961*4882a593Smuzhiyun } else if (cputlb_use_tlbie()) {
962*4882a593Smuzhiyun asm volatile("ptesync": : :"memory");
963*4882a593Smuzhiyun __tlbie_va_range(start, end, pid, page_size, mmu_virtual_psize);
964*4882a593Smuzhiyun if (hflush)
965*4882a593Smuzhiyun __tlbie_va_range(hstart, hend, pid,
966*4882a593Smuzhiyun PMD_SIZE, MMU_PAGE_2M);
967*4882a593Smuzhiyun asm volatile("eieio; tlbsync; ptesync": : :"memory");
968*4882a593Smuzhiyun } else {
969*4882a593Smuzhiyun _tlbiel_va_range_multicast(mm,
970*4882a593Smuzhiyun start, end, pid, page_size, mmu_virtual_psize, false);
971*4882a593Smuzhiyun if (hflush)
972*4882a593Smuzhiyun _tlbiel_va_range_multicast(mm,
973*4882a593Smuzhiyun hstart, hend, pid, PMD_SIZE, MMU_PAGE_2M, false);
974*4882a593Smuzhiyun }
975*4882a593Smuzhiyun }
976*4882a593Smuzhiyun preempt_enable();
977*4882a593Smuzhiyun }
978*4882a593Smuzhiyun
radix__flush_tlb_range(struct vm_area_struct * vma,unsigned long start,unsigned long end)979*4882a593Smuzhiyun void radix__flush_tlb_range(struct vm_area_struct *vma, unsigned long start,
980*4882a593Smuzhiyun unsigned long end)
981*4882a593Smuzhiyun
982*4882a593Smuzhiyun {
983*4882a593Smuzhiyun #ifdef CONFIG_HUGETLB_PAGE
984*4882a593Smuzhiyun if (is_vm_hugetlb_page(vma))
985*4882a593Smuzhiyun return radix__flush_hugetlb_tlb_range(vma, start, end);
986*4882a593Smuzhiyun #endif
987*4882a593Smuzhiyun
988*4882a593Smuzhiyun __radix__flush_tlb_range(vma->vm_mm, start, end);
989*4882a593Smuzhiyun }
990*4882a593Smuzhiyun EXPORT_SYMBOL(radix__flush_tlb_range);
991*4882a593Smuzhiyun
radix_get_mmu_psize(int page_size)992*4882a593Smuzhiyun static int radix_get_mmu_psize(int page_size)
993*4882a593Smuzhiyun {
994*4882a593Smuzhiyun int psize;
995*4882a593Smuzhiyun
996*4882a593Smuzhiyun if (page_size == (1UL << mmu_psize_defs[mmu_virtual_psize].shift))
997*4882a593Smuzhiyun psize = mmu_virtual_psize;
998*4882a593Smuzhiyun else if (page_size == (1UL << mmu_psize_defs[MMU_PAGE_2M].shift))
999*4882a593Smuzhiyun psize = MMU_PAGE_2M;
1000*4882a593Smuzhiyun else if (page_size == (1UL << mmu_psize_defs[MMU_PAGE_1G].shift))
1001*4882a593Smuzhiyun psize = MMU_PAGE_1G;
1002*4882a593Smuzhiyun else
1003*4882a593Smuzhiyun return -1;
1004*4882a593Smuzhiyun return psize;
1005*4882a593Smuzhiyun }
1006*4882a593Smuzhiyun
1007*4882a593Smuzhiyun /*
1008*4882a593Smuzhiyun * Flush partition scoped LPID address translation for all CPUs.
1009*4882a593Smuzhiyun */
radix__flush_tlb_lpid_page(unsigned int lpid,unsigned long addr,unsigned long page_size)1010*4882a593Smuzhiyun void radix__flush_tlb_lpid_page(unsigned int lpid,
1011*4882a593Smuzhiyun unsigned long addr,
1012*4882a593Smuzhiyun unsigned long page_size)
1013*4882a593Smuzhiyun {
1014*4882a593Smuzhiyun int psize = radix_get_mmu_psize(page_size);
1015*4882a593Smuzhiyun
1016*4882a593Smuzhiyun _tlbie_lpid_va(addr, lpid, psize, RIC_FLUSH_TLB);
1017*4882a593Smuzhiyun }
1018*4882a593Smuzhiyun EXPORT_SYMBOL_GPL(radix__flush_tlb_lpid_page);
1019*4882a593Smuzhiyun
1020*4882a593Smuzhiyun /*
1021*4882a593Smuzhiyun * Flush partition scoped PWC from LPID for all CPUs.
1022*4882a593Smuzhiyun */
radix__flush_pwc_lpid(unsigned int lpid)1023*4882a593Smuzhiyun void radix__flush_pwc_lpid(unsigned int lpid)
1024*4882a593Smuzhiyun {
1025*4882a593Smuzhiyun _tlbie_lpid(lpid, RIC_FLUSH_PWC);
1026*4882a593Smuzhiyun }
1027*4882a593Smuzhiyun EXPORT_SYMBOL_GPL(radix__flush_pwc_lpid);
1028*4882a593Smuzhiyun
1029*4882a593Smuzhiyun /*
1030*4882a593Smuzhiyun * Flush partition scoped translations from LPID (=LPIDR)
1031*4882a593Smuzhiyun */
radix__flush_all_lpid(unsigned int lpid)1032*4882a593Smuzhiyun void radix__flush_all_lpid(unsigned int lpid)
1033*4882a593Smuzhiyun {
1034*4882a593Smuzhiyun _tlbie_lpid(lpid, RIC_FLUSH_ALL);
1035*4882a593Smuzhiyun }
1036*4882a593Smuzhiyun EXPORT_SYMBOL_GPL(radix__flush_all_lpid);
1037*4882a593Smuzhiyun
1038*4882a593Smuzhiyun /*
1039*4882a593Smuzhiyun * Flush process scoped translations from LPID (=LPIDR)
1040*4882a593Smuzhiyun */
radix__flush_all_lpid_guest(unsigned int lpid)1041*4882a593Smuzhiyun void radix__flush_all_lpid_guest(unsigned int lpid)
1042*4882a593Smuzhiyun {
1043*4882a593Smuzhiyun _tlbie_lpid_guest(lpid, RIC_FLUSH_ALL);
1044*4882a593Smuzhiyun }
1045*4882a593Smuzhiyun
1046*4882a593Smuzhiyun static void radix__flush_tlb_pwc_range_psize(struct mm_struct *mm, unsigned long start,
1047*4882a593Smuzhiyun unsigned long end, int psize);
1048*4882a593Smuzhiyun
radix__tlb_flush(struct mmu_gather * tlb)1049*4882a593Smuzhiyun void radix__tlb_flush(struct mmu_gather *tlb)
1050*4882a593Smuzhiyun {
1051*4882a593Smuzhiyun int psize = 0;
1052*4882a593Smuzhiyun struct mm_struct *mm = tlb->mm;
1053*4882a593Smuzhiyun int page_size = tlb->page_size;
1054*4882a593Smuzhiyun unsigned long start = tlb->start;
1055*4882a593Smuzhiyun unsigned long end = tlb->end;
1056*4882a593Smuzhiyun
1057*4882a593Smuzhiyun /*
1058*4882a593Smuzhiyun * if page size is not something we understand, do a full mm flush
1059*4882a593Smuzhiyun *
1060*4882a593Smuzhiyun * A "fullmm" flush must always do a flush_all_mm (RIC=2) flush
1061*4882a593Smuzhiyun * that flushes the process table entry cache upon process teardown.
1062*4882a593Smuzhiyun * See the comment for radix in arch_exit_mmap().
1063*4882a593Smuzhiyun */
1064*4882a593Smuzhiyun if (tlb->fullmm || tlb->need_flush_all) {
1065*4882a593Smuzhiyun __flush_all_mm(mm, true);
1066*4882a593Smuzhiyun } else if ( (psize = radix_get_mmu_psize(page_size)) == -1) {
1067*4882a593Smuzhiyun if (!tlb->freed_tables)
1068*4882a593Smuzhiyun radix__flush_tlb_mm(mm);
1069*4882a593Smuzhiyun else
1070*4882a593Smuzhiyun radix__flush_all_mm(mm);
1071*4882a593Smuzhiyun } else {
1072*4882a593Smuzhiyun if (!tlb->freed_tables)
1073*4882a593Smuzhiyun radix__flush_tlb_range_psize(mm, start, end, psize);
1074*4882a593Smuzhiyun else
1075*4882a593Smuzhiyun radix__flush_tlb_pwc_range_psize(mm, start, end, psize);
1076*4882a593Smuzhiyun }
1077*4882a593Smuzhiyun }
1078*4882a593Smuzhiyun
__radix__flush_tlb_range_psize(struct mm_struct * mm,unsigned long start,unsigned long end,int psize,bool also_pwc)1079*4882a593Smuzhiyun static void __radix__flush_tlb_range_psize(struct mm_struct *mm,
1080*4882a593Smuzhiyun unsigned long start, unsigned long end,
1081*4882a593Smuzhiyun int psize, bool also_pwc)
1082*4882a593Smuzhiyun {
1083*4882a593Smuzhiyun unsigned long pid;
1084*4882a593Smuzhiyun unsigned int page_shift = mmu_psize_defs[psize].shift;
1085*4882a593Smuzhiyun unsigned long page_size = 1UL << page_shift;
1086*4882a593Smuzhiyun unsigned long nr_pages = (end - start) >> page_shift;
1087*4882a593Smuzhiyun bool local, full;
1088*4882a593Smuzhiyun
1089*4882a593Smuzhiyun pid = mm->context.id;
1090*4882a593Smuzhiyun if (unlikely(pid == MMU_NO_CONTEXT))
1091*4882a593Smuzhiyun return;
1092*4882a593Smuzhiyun
1093*4882a593Smuzhiyun preempt_disable();
1094*4882a593Smuzhiyun smp_mb(); /* see radix__flush_tlb_mm */
1095*4882a593Smuzhiyun if (!mm_is_thread_local(mm)) {
1096*4882a593Smuzhiyun if (unlikely(mm_is_singlethreaded(mm))) {
1097*4882a593Smuzhiyun if (end != TLB_FLUSH_ALL) {
1098*4882a593Smuzhiyun exit_flush_lazy_tlbs(mm);
1099*4882a593Smuzhiyun goto is_local;
1100*4882a593Smuzhiyun }
1101*4882a593Smuzhiyun }
1102*4882a593Smuzhiyun local = false;
1103*4882a593Smuzhiyun full = (end == TLB_FLUSH_ALL ||
1104*4882a593Smuzhiyun nr_pages > tlb_single_page_flush_ceiling);
1105*4882a593Smuzhiyun } else {
1106*4882a593Smuzhiyun is_local:
1107*4882a593Smuzhiyun local = true;
1108*4882a593Smuzhiyun full = (end == TLB_FLUSH_ALL ||
1109*4882a593Smuzhiyun nr_pages > tlb_local_single_page_flush_ceiling);
1110*4882a593Smuzhiyun }
1111*4882a593Smuzhiyun
1112*4882a593Smuzhiyun if (!mmu_has_feature(MMU_FTR_GTSE) && !local) {
1113*4882a593Smuzhiyun unsigned long tgt = H_RPTI_TARGET_CMMU;
1114*4882a593Smuzhiyun unsigned long type = H_RPTI_TYPE_TLB;
1115*4882a593Smuzhiyun unsigned long pg_sizes = psize_to_rpti_pgsize(psize);
1116*4882a593Smuzhiyun
1117*4882a593Smuzhiyun if (also_pwc)
1118*4882a593Smuzhiyun type |= H_RPTI_TYPE_PWC;
1119*4882a593Smuzhiyun if (atomic_read(&mm->context.copros) > 0)
1120*4882a593Smuzhiyun tgt |= H_RPTI_TARGET_NMMU;
1121*4882a593Smuzhiyun pseries_rpt_invalidate(pid, tgt, type, pg_sizes, start, end);
1122*4882a593Smuzhiyun } else if (full) {
1123*4882a593Smuzhiyun if (local) {
1124*4882a593Smuzhiyun _tlbiel_pid(pid, also_pwc ? RIC_FLUSH_ALL : RIC_FLUSH_TLB);
1125*4882a593Smuzhiyun } else {
1126*4882a593Smuzhiyun if (cputlb_use_tlbie()) {
1127*4882a593Smuzhiyun if (mm_needs_flush_escalation(mm))
1128*4882a593Smuzhiyun also_pwc = true;
1129*4882a593Smuzhiyun
1130*4882a593Smuzhiyun _tlbie_pid(pid,
1131*4882a593Smuzhiyun also_pwc ? RIC_FLUSH_ALL : RIC_FLUSH_TLB);
1132*4882a593Smuzhiyun } else {
1133*4882a593Smuzhiyun _tlbiel_pid_multicast(mm, pid,
1134*4882a593Smuzhiyun also_pwc ? RIC_FLUSH_ALL : RIC_FLUSH_TLB);
1135*4882a593Smuzhiyun }
1136*4882a593Smuzhiyun
1137*4882a593Smuzhiyun }
1138*4882a593Smuzhiyun } else {
1139*4882a593Smuzhiyun if (local)
1140*4882a593Smuzhiyun _tlbiel_va_range(start, end, pid, page_size, psize, also_pwc);
1141*4882a593Smuzhiyun else if (cputlb_use_tlbie())
1142*4882a593Smuzhiyun _tlbie_va_range(start, end, pid, page_size, psize, also_pwc);
1143*4882a593Smuzhiyun else
1144*4882a593Smuzhiyun _tlbiel_va_range_multicast(mm,
1145*4882a593Smuzhiyun start, end, pid, page_size, psize, also_pwc);
1146*4882a593Smuzhiyun }
1147*4882a593Smuzhiyun preempt_enable();
1148*4882a593Smuzhiyun }
1149*4882a593Smuzhiyun
radix__flush_tlb_range_psize(struct mm_struct * mm,unsigned long start,unsigned long end,int psize)1150*4882a593Smuzhiyun void radix__flush_tlb_range_psize(struct mm_struct *mm, unsigned long start,
1151*4882a593Smuzhiyun unsigned long end, int psize)
1152*4882a593Smuzhiyun {
1153*4882a593Smuzhiyun return __radix__flush_tlb_range_psize(mm, start, end, psize, false);
1154*4882a593Smuzhiyun }
1155*4882a593Smuzhiyun
radix__flush_tlb_pwc_range_psize(struct mm_struct * mm,unsigned long start,unsigned long end,int psize)1156*4882a593Smuzhiyun static void radix__flush_tlb_pwc_range_psize(struct mm_struct *mm, unsigned long start,
1157*4882a593Smuzhiyun unsigned long end, int psize)
1158*4882a593Smuzhiyun {
1159*4882a593Smuzhiyun __radix__flush_tlb_range_psize(mm, start, end, psize, true);
1160*4882a593Smuzhiyun }
1161*4882a593Smuzhiyun
1162*4882a593Smuzhiyun #ifdef CONFIG_TRANSPARENT_HUGEPAGE
radix__flush_tlb_collapsed_pmd(struct mm_struct * mm,unsigned long addr)1163*4882a593Smuzhiyun void radix__flush_tlb_collapsed_pmd(struct mm_struct *mm, unsigned long addr)
1164*4882a593Smuzhiyun {
1165*4882a593Smuzhiyun unsigned long pid, end;
1166*4882a593Smuzhiyun
1167*4882a593Smuzhiyun pid = mm->context.id;
1168*4882a593Smuzhiyun if (unlikely(pid == MMU_NO_CONTEXT))
1169*4882a593Smuzhiyun return;
1170*4882a593Smuzhiyun
1171*4882a593Smuzhiyun /* 4k page size, just blow the world */
1172*4882a593Smuzhiyun if (PAGE_SIZE == 0x1000) {
1173*4882a593Smuzhiyun radix__flush_all_mm(mm);
1174*4882a593Smuzhiyun return;
1175*4882a593Smuzhiyun }
1176*4882a593Smuzhiyun
1177*4882a593Smuzhiyun end = addr + HPAGE_PMD_SIZE;
1178*4882a593Smuzhiyun
1179*4882a593Smuzhiyun /* Otherwise first do the PWC, then iterate the pages. */
1180*4882a593Smuzhiyun preempt_disable();
1181*4882a593Smuzhiyun smp_mb(); /* see radix__flush_tlb_mm */
1182*4882a593Smuzhiyun if (!mm_is_thread_local(mm)) {
1183*4882a593Smuzhiyun if (unlikely(mm_is_singlethreaded(mm))) {
1184*4882a593Smuzhiyun exit_flush_lazy_tlbs(mm);
1185*4882a593Smuzhiyun goto local;
1186*4882a593Smuzhiyun }
1187*4882a593Smuzhiyun if (!mmu_has_feature(MMU_FTR_GTSE)) {
1188*4882a593Smuzhiyun unsigned long tgt, type, pg_sizes;
1189*4882a593Smuzhiyun
1190*4882a593Smuzhiyun tgt = H_RPTI_TARGET_CMMU;
1191*4882a593Smuzhiyun type = H_RPTI_TYPE_TLB | H_RPTI_TYPE_PWC |
1192*4882a593Smuzhiyun H_RPTI_TYPE_PRT;
1193*4882a593Smuzhiyun pg_sizes = psize_to_rpti_pgsize(mmu_virtual_psize);
1194*4882a593Smuzhiyun
1195*4882a593Smuzhiyun if (atomic_read(&mm->context.copros) > 0)
1196*4882a593Smuzhiyun tgt |= H_RPTI_TARGET_NMMU;
1197*4882a593Smuzhiyun pseries_rpt_invalidate(pid, tgt, type, pg_sizes,
1198*4882a593Smuzhiyun addr, end);
1199*4882a593Smuzhiyun } else if (cputlb_use_tlbie())
1200*4882a593Smuzhiyun _tlbie_va_range(addr, end, pid, PAGE_SIZE, mmu_virtual_psize, true);
1201*4882a593Smuzhiyun else
1202*4882a593Smuzhiyun _tlbiel_va_range_multicast(mm,
1203*4882a593Smuzhiyun addr, end, pid, PAGE_SIZE, mmu_virtual_psize, true);
1204*4882a593Smuzhiyun } else {
1205*4882a593Smuzhiyun local:
1206*4882a593Smuzhiyun _tlbiel_va_range(addr, end, pid, PAGE_SIZE, mmu_virtual_psize, true);
1207*4882a593Smuzhiyun }
1208*4882a593Smuzhiyun
1209*4882a593Smuzhiyun preempt_enable();
1210*4882a593Smuzhiyun }
1211*4882a593Smuzhiyun #endif /* CONFIG_TRANSPARENT_HUGEPAGE */
1212*4882a593Smuzhiyun
radix__flush_pmd_tlb_range(struct vm_area_struct * vma,unsigned long start,unsigned long end)1213*4882a593Smuzhiyun void radix__flush_pmd_tlb_range(struct vm_area_struct *vma,
1214*4882a593Smuzhiyun unsigned long start, unsigned long end)
1215*4882a593Smuzhiyun {
1216*4882a593Smuzhiyun radix__flush_tlb_range_psize(vma->vm_mm, start, end, MMU_PAGE_2M);
1217*4882a593Smuzhiyun }
1218*4882a593Smuzhiyun EXPORT_SYMBOL(radix__flush_pmd_tlb_range);
1219*4882a593Smuzhiyun
radix__flush_tlb_all(void)1220*4882a593Smuzhiyun void radix__flush_tlb_all(void)
1221*4882a593Smuzhiyun {
1222*4882a593Smuzhiyun unsigned long rb,prs,r,rs;
1223*4882a593Smuzhiyun unsigned long ric = RIC_FLUSH_ALL;
1224*4882a593Smuzhiyun
1225*4882a593Smuzhiyun rb = 0x3 << PPC_BITLSHIFT(53); /* IS = 3 */
1226*4882a593Smuzhiyun prs = 0; /* partition scoped */
1227*4882a593Smuzhiyun r = 1; /* radix format */
1228*4882a593Smuzhiyun rs = 1 & ((1UL << 32) - 1); /* any LPID value to flush guest mappings */
1229*4882a593Smuzhiyun
1230*4882a593Smuzhiyun asm volatile("ptesync": : :"memory");
1231*4882a593Smuzhiyun /*
1232*4882a593Smuzhiyun * now flush guest entries by passing PRS = 1 and LPID != 0
1233*4882a593Smuzhiyun */
1234*4882a593Smuzhiyun asm volatile(PPC_TLBIE_5(%0, %4, %3, %2, %1)
1235*4882a593Smuzhiyun : : "r"(rb), "i"(r), "i"(1), "i"(ric), "r"(rs) : "memory");
1236*4882a593Smuzhiyun /*
1237*4882a593Smuzhiyun * now flush host entires by passing PRS = 0 and LPID == 0
1238*4882a593Smuzhiyun */
1239*4882a593Smuzhiyun asm volatile(PPC_TLBIE_5(%0, %4, %3, %2, %1)
1240*4882a593Smuzhiyun : : "r"(rb), "i"(r), "i"(prs), "i"(ric), "r"(0) : "memory");
1241*4882a593Smuzhiyun asm volatile("eieio; tlbsync; ptesync": : :"memory");
1242*4882a593Smuzhiyun }
1243*4882a593Smuzhiyun
1244*4882a593Smuzhiyun #ifdef CONFIG_KVM_BOOK3S_HV_POSSIBLE
radix_kvm_prefetch_workaround(struct mm_struct * mm)1245*4882a593Smuzhiyun extern void radix_kvm_prefetch_workaround(struct mm_struct *mm)
1246*4882a593Smuzhiyun {
1247*4882a593Smuzhiyun unsigned long pid = mm->context.id;
1248*4882a593Smuzhiyun
1249*4882a593Smuzhiyun if (unlikely(pid == MMU_NO_CONTEXT))
1250*4882a593Smuzhiyun return;
1251*4882a593Smuzhiyun
1252*4882a593Smuzhiyun if (!cpu_has_feature(CPU_FTR_P9_RADIX_PREFETCH_BUG))
1253*4882a593Smuzhiyun return;
1254*4882a593Smuzhiyun
1255*4882a593Smuzhiyun /*
1256*4882a593Smuzhiyun * If this context hasn't run on that CPU before and KVM is
1257*4882a593Smuzhiyun * around, there's a slim chance that the guest on another
1258*4882a593Smuzhiyun * CPU just brought in obsolete translation into the TLB of
1259*4882a593Smuzhiyun * this CPU due to a bad prefetch using the guest PID on
1260*4882a593Smuzhiyun * the way into the hypervisor.
1261*4882a593Smuzhiyun *
1262*4882a593Smuzhiyun * We work around this here. If KVM is possible, we check if
1263*4882a593Smuzhiyun * any sibling thread is in KVM. If it is, the window may exist
1264*4882a593Smuzhiyun * and thus we flush that PID from the core.
1265*4882a593Smuzhiyun *
1266*4882a593Smuzhiyun * A potential future improvement would be to mark which PIDs
1267*4882a593Smuzhiyun * have never been used on the system and avoid it if the PID
1268*4882a593Smuzhiyun * is new and the process has no other cpumask bit set.
1269*4882a593Smuzhiyun */
1270*4882a593Smuzhiyun if (cpu_has_feature(CPU_FTR_HVMODE) && radix_enabled()) {
1271*4882a593Smuzhiyun int cpu = smp_processor_id();
1272*4882a593Smuzhiyun int sib = cpu_first_thread_sibling(cpu);
1273*4882a593Smuzhiyun bool flush = false;
1274*4882a593Smuzhiyun
1275*4882a593Smuzhiyun for (; sib <= cpu_last_thread_sibling(cpu) && !flush; sib++) {
1276*4882a593Smuzhiyun if (sib == cpu)
1277*4882a593Smuzhiyun continue;
1278*4882a593Smuzhiyun if (!cpu_possible(sib))
1279*4882a593Smuzhiyun continue;
1280*4882a593Smuzhiyun if (paca_ptrs[sib]->kvm_hstate.kvm_vcpu)
1281*4882a593Smuzhiyun flush = true;
1282*4882a593Smuzhiyun }
1283*4882a593Smuzhiyun if (flush)
1284*4882a593Smuzhiyun _tlbiel_pid(pid, RIC_FLUSH_ALL);
1285*4882a593Smuzhiyun }
1286*4882a593Smuzhiyun }
1287*4882a593Smuzhiyun EXPORT_SYMBOL_GPL(radix_kvm_prefetch_workaround);
1288*4882a593Smuzhiyun #endif /* CONFIG_KVM_BOOK3S_HV_POSSIBLE */
1289