// SPDX-License-Identifier: GPL-2.0
/* arch/sparc64/mm/tsb.c
 *
 * Copyright (C) 2006, 2008 David S. Miller <davem@davemloft.net>
 */

#include <linux/kernel.h>
#include <linux/preempt.h>
#include <linux/slab.h>
#include <linux/mm_types.h>
#include <linux/pgtable.h>

#include <asm/page.h>
#include <asm/mmu_context.h>
#include <asm/setup.h>
#include <asm/tsb.h>
#include <asm/tlb.h>
#include <asm/oplib.h>

extern struct tsb swapper_tsb[KERNEL_TSB_NENTRIES];

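/* Hash a virtual address into a TSB index: shift out the page offset
 * and mask with the (power-of-two) entry count of the table.
 */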
static inline unsigned long tsb_hash(unsigned long vaddr, unsigned long hash_shift, unsigned long nentries)
{
	vaddr >>= hash_shift;
	return vaddr & (nentries - 1);
}

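/* A TSB entry tags the virtual address shifted down by 22 bits, so a
 * lookup hit is simply an equality test against that value.
 */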
static inline int tag_compare(unsigned long tag, unsigned long vaddr)
{
	return (tag == (vaddr >> 22));
}

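/* Invalidate every kernel TSB entry that maps a page in [start, end).
 * The virtual address an entry covers is rebuilt from its index (the
 * low bits; 8K kernel pages, hence the shift by 13) and its tag
 * (bits 63:22).
 */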
static void flush_tsb_kernel_range_scan(unsigned long start, unsigned long end)
{
	unsigned long idx;

	for (idx = 0; idx < KERNEL_TSB_NENTRIES; idx++) {
		struct tsb *ent = &swapper_tsb[idx];
		unsigned long match = idx << 13;

		match |= (ent->tag << 22);
		if (match >= start && match < end)
			ent->tag = (1UL << TSB_TAG_INVALID_BIT);
	}
}

/* TSB flushes need only occur on the processor initiating the address
 * space modification, not on each cpu the address space has run on.
 * Only the TLB flush needs that treatment.
 */

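/* For very large ranges a single pass over the whole TSB is cheaper
 * than hashing every page, so fall back to the full scan once the
 * range covers at least twice as many pages as the TSB has entries.
 */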
void flush_tsb_kernel_range(unsigned long start, unsigned long end)
{
	unsigned long v;

	if ((end - start) >> PAGE_SHIFT >= 2 * KERNEL_TSB_NENTRIES)
		return flush_tsb_kernel_range_scan(start, end);

	for (v = start; v < end; v += PAGE_SIZE) {
		unsigned long hash = tsb_hash(v, PAGE_SHIFT,
					      KERNEL_TSB_NENTRIES);
		struct tsb *ent = &swapper_tsb[hash];

		if (tag_compare(ent->tag, v))
			ent->tag = (1UL << TSB_TAG_INVALID_BIT);
	}
}

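/* Flush a single address from one TSB.  Bit 0 of a batched address
 * carries a flag from the TLB batching code rather than address
 * state, so it is masked off first; tsb_flush() then does the
 * tag-compare-and-invalidate on the computed entry.
 */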
static void __flush_tsb_one_entry(unsigned long tsb, unsigned long v,
				  unsigned long hash_shift,
				  unsigned long nentries)
{
	unsigned long tag, ent, hash;

	v &= ~0x1UL;
	hash = tsb_hash(v, hash_shift, nentries);
	ent = tsb + (hash * sizeof(struct tsb));
	tag = (v >> 22UL);

	tsb_flush(ent, tag);
}

static void __flush_tsb_one(struct tlb_batch *tb, unsigned long hash_shift,
			    unsigned long tsb, unsigned long nentries)
{
	unsigned long i;

	for (i = 0; i < tb->tlb_nr; i++)
		__flush_tsb_one_entry(tsb, tb->vaddrs[i], hash_shift, nentries);
}

#if defined(CONFIG_HUGETLB_PAGE) || defined(CONFIG_TRANSPARENT_HUGEPAGE)
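/* A huge page spans 2^(hugepage_shift - hash_shift) base-size pages,
 * each of which may have landed in its own TSB slot, so flush the
 * entry for every base page the huge mapping covers.
 */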
static void __flush_huge_tsb_one_entry(unsigned long tsb, unsigned long v,
				       unsigned long hash_shift,
				       unsigned long nentries,
				       unsigned int hugepage_shift)
{
	unsigned int hpage_entries;
	unsigned int i;

	hpage_entries = 1 << (hugepage_shift - hash_shift);
	for (i = 0; i < hpage_entries; i++)
		__flush_tsb_one_entry(tsb, v + (i << hash_shift), hash_shift,
				      nentries);
}

static void __flush_huge_tsb_one(struct tlb_batch *tb, unsigned long hash_shift,
				 unsigned long tsb, unsigned long nentries,
				 unsigned int hugepage_shift)
{
	unsigned long i;

	for (i = 0; i < tb->tlb_nr; i++)
		__flush_huge_tsb_one_entry(tsb, tb->vaddrs[i], hash_shift,
					   nentries, hugepage_shift);
}
#endif

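/* Flush all addresses batched in *tb from this address space's TSBs.
 * Mappings at or above REAL_HPAGE_SHIFT live in the separate huge-page
 * TSB; everything smaller lives in the base TSB.  cheetah_plus and
 * hypervisor chips address the TSB physically, hence the __pa().
 */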
void flush_tsb_user(struct tlb_batch *tb)
{
	struct mm_struct *mm = tb->mm;
	unsigned long nentries, base, flags;

	spin_lock_irqsave(&mm->context.lock, flags);

	if (tb->hugepage_shift < REAL_HPAGE_SHIFT) {
		base = (unsigned long) mm->context.tsb_block[MM_TSB_BASE].tsb;
		nentries = mm->context.tsb_block[MM_TSB_BASE].tsb_nentries;
		if (tlb_type == cheetah_plus || tlb_type == hypervisor)
			base = __pa(base);
		if (tb->hugepage_shift == PAGE_SHIFT)
			__flush_tsb_one(tb, PAGE_SHIFT, base, nentries);
#if defined(CONFIG_HUGETLB_PAGE)
		else
			__flush_huge_tsb_one(tb, PAGE_SHIFT, base, nentries,
					     tb->hugepage_shift);
#endif
	}
#if defined(CONFIG_HUGETLB_PAGE) || defined(CONFIG_TRANSPARENT_HUGEPAGE)
	else if (mm->context.tsb_block[MM_TSB_HUGE].tsb) {
		base = (unsigned long) mm->context.tsb_block[MM_TSB_HUGE].tsb;
		nentries = mm->context.tsb_block[MM_TSB_HUGE].tsb_nentries;
		if (tlb_type == cheetah_plus || tlb_type == hypervisor)
			base = __pa(base);
		__flush_huge_tsb_one(tb, REAL_HPAGE_SHIFT, base, nentries,
				     tb->hugepage_shift);
	}
#endif
	spin_unlock_irqrestore(&mm->context.lock, flags);
}

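/* Like flush_tsb_user(), but for a single address rather than a
 * whole batch.
 */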
void flush_tsb_user_page(struct mm_struct *mm, unsigned long vaddr,
			 unsigned int hugepage_shift)
{
	unsigned long nentries, base, flags;

	spin_lock_irqsave(&mm->context.lock, flags);

	if (hugepage_shift < REAL_HPAGE_SHIFT) {
		base = (unsigned long) mm->context.tsb_block[MM_TSB_BASE].tsb;
		nentries = mm->context.tsb_block[MM_TSB_BASE].tsb_nentries;
		if (tlb_type == cheetah_plus || tlb_type == hypervisor)
			base = __pa(base);
		if (hugepage_shift == PAGE_SHIFT)
			__flush_tsb_one_entry(base, vaddr, PAGE_SHIFT,
					      nentries);
#if defined(CONFIG_HUGETLB_PAGE)
		else
			__flush_huge_tsb_one_entry(base, vaddr, PAGE_SHIFT,
						   nentries, hugepage_shift);
#endif
	}
#if defined(CONFIG_HUGETLB_PAGE) || defined(CONFIG_TRANSPARENT_HUGEPAGE)
	else if (mm->context.tsb_block[MM_TSB_HUGE].tsb) {
		base = (unsigned long) mm->context.tsb_block[MM_TSB_HUGE].tsb;
		nentries = mm->context.tsb_block[MM_TSB_HUGE].tsb_nentries;
		if (tlb_type == cheetah_plus || tlb_type == hypervisor)
			base = __pa(base);
		__flush_huge_tsb_one_entry(base, vaddr, REAL_HPAGE_SHIFT,
					   nentries, hugepage_shift);
	}
#endif
	spin_unlock_irqrestore(&mm->context.lock, flags);
}

#define HV_PGSZ_IDX_BASE	HV_PGSZ_IDX_8K
#define HV_PGSZ_MASK_BASE	HV_PGSZ_MASK_8K

#if defined(CONFIG_HUGETLB_PAGE) || defined(CONFIG_TRANSPARENT_HUGEPAGE)
#define HV_PGSZ_IDX_HUGE	HV_PGSZ_IDX_4MB
#define HV_PGSZ_MASK_HUGE	HV_PGSZ_MASK_4MB
#endif

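/* Recompute the tsb_config for one TSB: the entry count, the TSB
 * register value (whose low 3 bits encode the table size), and, where
 * the TSB cannot be addressed physically, the virtual mapping and TTE
 * used to lock it into the TLB.  On sun4v a hypervisor TSB descriptor
 * is filled in as well.
 */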
static void setup_tsb_params(struct mm_struct *mm, unsigned long tsb_idx, unsigned long tsb_bytes)
{
	unsigned long tsb_reg, base, tsb_paddr;
	unsigned long page_sz, tte;

	mm->context.tsb_block[tsb_idx].tsb_nentries =
		tsb_bytes / sizeof(struct tsb);

	switch (tsb_idx) {
	case MM_TSB_BASE:
		base = TSBMAP_8K_BASE;
		break;
#if defined(CONFIG_HUGETLB_PAGE) || defined(CONFIG_TRANSPARENT_HUGEPAGE)
	case MM_TSB_HUGE:
		base = TSBMAP_4M_BASE;
		break;
#endif
	default:
		BUG();
	}

	tte = pgprot_val(PAGE_KERNEL_LOCKED);
	tsb_paddr = __pa(mm->context.tsb_block[tsb_idx].tsb);
	BUG_ON(tsb_paddr & (tsb_bytes - 1UL));

	/* Use the smallest page size that can map the whole TSB
	 * in one TLB entry.
	 */
	switch (tsb_bytes) {
	case 8192 << 0:
		tsb_reg = 0x0UL;
#ifdef DCACHE_ALIASING_POSSIBLE
		base += (tsb_paddr & 8192);
#endif
		page_sz = 8192;
		break;

	case 8192 << 1:
		tsb_reg = 0x1UL;
		page_sz = 64 * 1024;
		break;

	case 8192 << 2:
		tsb_reg = 0x2UL;
		page_sz = 64 * 1024;
		break;

	case 8192 << 3:
		tsb_reg = 0x3UL;
		page_sz = 64 * 1024;
		break;

	case 8192 << 4:
		tsb_reg = 0x4UL;
		page_sz = 512 * 1024;
		break;

	case 8192 << 5:
		tsb_reg = 0x5UL;
		page_sz = 512 * 1024;
		break;

	case 8192 << 6:
		tsb_reg = 0x6UL;
		page_sz = 512 * 1024;
		break;

	case 8192 << 7:
		tsb_reg = 0x7UL;
		page_sz = 4 * 1024 * 1024;
		break;

	default:
		printk(KERN_ERR "TSB[%s:%d]: Impossible TSB size %lu, killing process.\n",
		       current->comm, current->pid, tsb_bytes);
		do_exit(SIGSEGV);
	}
	tte |= pte_sz_bits(page_sz);

	if (tlb_type == cheetah_plus || tlb_type == hypervisor) {
		/* Physical mapping, no locked TLB entry for TSB. */
		tsb_reg |= tsb_paddr;

		mm->context.tsb_block[tsb_idx].tsb_reg_val = tsb_reg;
		mm->context.tsb_block[tsb_idx].tsb_map_vaddr = 0;
		mm->context.tsb_block[tsb_idx].tsb_map_pte = 0;
	} else {
		tsb_reg |= base;
		tsb_reg |= (tsb_paddr & (page_sz - 1UL));
		tte |= (tsb_paddr & ~(page_sz - 1UL));

		mm->context.tsb_block[tsb_idx].tsb_reg_val = tsb_reg;
		mm->context.tsb_block[tsb_idx].tsb_map_vaddr = base;
		mm->context.tsb_block[tsb_idx].tsb_map_pte = tte;
	}

	/* Setup the Hypervisor TSB descriptor. */
	if (tlb_type == hypervisor) {
		struct hv_tsb_descr *hp = &mm->context.tsb_descr[tsb_idx];

		switch (tsb_idx) {
		case MM_TSB_BASE:
			hp->pgsz_idx = HV_PGSZ_IDX_BASE;
			break;
#if defined(CONFIG_HUGETLB_PAGE) || defined(CONFIG_TRANSPARENT_HUGEPAGE)
		case MM_TSB_HUGE:
			hp->pgsz_idx = HV_PGSZ_IDX_HUGE;
			break;
#endif
		default:
			BUG();
		}
		hp->assoc = 1;
		hp->num_ttes = tsb_bytes / 16;
		hp->ctx_idx = 0;
		switch (tsb_idx) {
		case MM_TSB_BASE:
			hp->pgsz_mask = HV_PGSZ_MASK_BASE;
			break;
#if defined(CONFIG_HUGETLB_PAGE) || defined(CONFIG_TRANSPARENT_HUGEPAGE)
		case MM_TSB_HUGE:
			hp->pgsz_mask = HV_PGSZ_MASK_HUGE;
			break;
#endif
		default:
			BUG();
		}
		hp->tsb_base = tsb_paddr;
		hp->resv = 0;
	}
}

struct kmem_cache *pgtable_cache __read_mostly;

static struct kmem_cache *tsb_caches[8] __read_mostly;

static const char *tsb_cache_names[8] = {
	"tsb_8KB",
	"tsb_16KB",
	"tsb_32KB",
	"tsb_64KB",
	"tsb_128KB",
	"tsb_256KB",
	"tsb_512KB",
	"tsb_1MB",
};

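/* Create the kmem cache used for page tables (its constructor clears
 * each page) plus one cache per supported TSB size, 8KB through 1MB.
 * The size-equal alignment gives each TSB the natural alignment the
 * hardware requires.  Failure this early is fatal, so punt to the PROM.
 */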
void __init pgtable_cache_init(void)
{
	unsigned long i;

	pgtable_cache = kmem_cache_create("pgtable_cache",
					  PAGE_SIZE, PAGE_SIZE,
					  0,
					  _clear_page);
	if (!pgtable_cache) {
		prom_printf("pgtable_cache_init(): Could not create!\n");
		prom_halt();
	}

	for (i = 0; i < ARRAY_SIZE(tsb_cache_names); i++) {
		unsigned long size = 8192 << i;
		const char *name = tsb_cache_names[i];

		tsb_caches[i] = kmem_cache_create(name,
						  size, size,
						  0, NULL);
		if (!tsb_caches[i]) {
			prom_printf("Could not create %s cache\n", name);
			prom_halt();
		}
	}
}

int sysctl_tsb_ratio = -2;

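/* Convert a TSB size into the RSS value at which it should grow.
 * A negative sysctl_tsb_ratio shrinks the limit below the entry
 * count; a positive one lets RSS overshoot it.  With the default
 * of -2, a 512-entry TSB grows once RSS passes 512 - 512/4 = 384
 * pages, i.e. 3/4 of capacity.
 */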
static unsigned long tsb_size_to_rss_limit(unsigned long new_size)
{
	unsigned long num_ents = (new_size / sizeof(struct tsb));

	if (sysctl_tsb_ratio < 0)
		return num_ents - (num_ents >> -sysctl_tsb_ratio);
	else
		return num_ents + (num_ents >> sysctl_tsb_ratio);
}

/* When the RSS of an address space exceeds tsb_rss_limit for a TSB,
 * do_sparc64_fault() invokes this routine to try and grow it.
 *
 * When we reach the maximum TSB size supported, we stick ~0UL into
 * tsb_rss_limit for that TSB so the grow checks in do_sparc64_fault()
 * will not trigger any longer.
 *
 * The TSB can be anywhere from 8K to 1MB in size, in increasing powers
 * of two.  The TSB must be aligned to its size, so e.g. a 512K TSB
 * must be 512K aligned.  It also must be physically contiguous, so we
 * cannot use vmalloc().
 *
 * The idea here is to grow the TSB when the RSS of the process approaches
 * the number of entries that the current TSB can hold at once.  Currently,
 * we trigger when the RSS hits 3/4 of the TSB capacity.
 */
void tsb_grow(struct mm_struct *mm, unsigned long tsb_index, unsigned long rss)
{
	unsigned long max_tsb_size = 1 * 1024 * 1024;
	unsigned long new_size, old_size, flags;
	struct tsb *old_tsb, *new_tsb;
	unsigned long new_cache_index, old_cache_index;
	unsigned long new_rss_limit;
	gfp_t gfp_flags;

	if (max_tsb_size > (PAGE_SIZE << MAX_ORDER))
		max_tsb_size = (PAGE_SIZE << MAX_ORDER);

	new_cache_index = 0;
	for (new_size = 8192; new_size < max_tsb_size; new_size <<= 1UL) {
		new_rss_limit = tsb_size_to_rss_limit(new_size);
		if (new_rss_limit > rss)
			break;
		new_cache_index++;
	}

	if (new_size == max_tsb_size)
		new_rss_limit = ~0UL;

retry_tsb_alloc:
	gfp_flags = GFP_KERNEL;
	if (new_size > (PAGE_SIZE * 2))
		gfp_flags |= __GFP_NOWARN | __GFP_NORETRY;

	new_tsb = kmem_cache_alloc_node(tsb_caches[new_cache_index],
					gfp_flags, numa_node_id());
	if (unlikely(!new_tsb)) {
		/* Not being able to fork due to a high-order TSB
		 * allocation failure is very bad behavior.  Just back
		 * down to a 0-order allocation and force no TSB
		 * growing for this address space.
		 */
		if (mm->context.tsb_block[tsb_index].tsb == NULL &&
		    new_cache_index > 0) {
			new_cache_index = 0;
			new_size = 8192;
			new_rss_limit = ~0UL;
			goto retry_tsb_alloc;
		}

		/* If we failed on a TSB grow, we are under serious
		 * memory pressure so don't try to grow any more.
		 */
		if (mm->context.tsb_block[tsb_index].tsb != NULL)
			mm->context.tsb_block[tsb_index].tsb_rss_limit = ~0UL;
		return;
	}

	/* Mark all tags as invalid.  */
	tsb_init(new_tsb, new_size);

	/* Ok, we are about to commit the changes.  If we are
	 * growing an existing TSB the locking is very tricky,
	 * so WATCH OUT!
	 *
	 * We have to hold mm->context.lock while committing to the
	 * new TSB, this synchronizes us with processors in
	 * flush_tsb_user() and switch_mm() for this address space.
	 *
	 * But even with that lock held, processors run asynchronously
	 * accessing the old TSB via TLB miss handling.  This is OK
	 * because those actions are just propagating state from the
	 * Linux page tables into the TSB, page table mappings are not
	 * being changed.  If a real fault occurs, the processor will
	 * synchronize with us when it hits flush_tsb_user(), this is
	 * also true for the case where vmscan is modifying the page
	 * tables.  The only thing we need to be careful with is to
	 * skip any locked TSB entries during copy_tsb().
	 *
	 * When we finish committing to the new TSB, we have to drop
	 * the lock and ask all other cpus running this address space
	 * to run tsb_context_switch() to see the new TSB table.
	 */
	spin_lock_irqsave(&mm->context.lock, flags);

	old_tsb = mm->context.tsb_block[tsb_index].tsb;
	old_cache_index =
		(mm->context.tsb_block[tsb_index].tsb_reg_val & 0x7UL);
	old_size = (mm->context.tsb_block[tsb_index].tsb_nentries *
		    sizeof(struct tsb));

	/* Handle multiple threads trying to grow the TSB at the same time.
	 * One will get in here first, and bump the size and the RSS limit.
	 * The others will get in here next and hit this check.
	 */
	if (unlikely(old_tsb &&
		     (rss < mm->context.tsb_block[tsb_index].tsb_rss_limit))) {
		spin_unlock_irqrestore(&mm->context.lock, flags);

		kmem_cache_free(tsb_caches[new_cache_index], new_tsb);
		return;
	}

	mm->context.tsb_block[tsb_index].tsb_rss_limit = new_rss_limit;

	if (old_tsb) {
		extern void copy_tsb(unsigned long old_tsb_base,
				     unsigned long old_tsb_size,
				     unsigned long new_tsb_base,
				     unsigned long new_tsb_size,
				     unsigned long page_size_shift);
		unsigned long old_tsb_base = (unsigned long) old_tsb;
		unsigned long new_tsb_base = (unsigned long) new_tsb;

		if (tlb_type == cheetah_plus || tlb_type == hypervisor) {
			old_tsb_base = __pa(old_tsb_base);
			new_tsb_base = __pa(new_tsb_base);
		}
		copy_tsb(old_tsb_base, old_size, new_tsb_base, new_size,
			 tsb_index == MM_TSB_BASE ?
			 PAGE_SHIFT : REAL_HPAGE_SHIFT);
	}

	mm->context.tsb_block[tsb_index].tsb = new_tsb;
	setup_tsb_params(mm, tsb_index, new_size);

	spin_unlock_irqrestore(&mm->context.lock, flags);

	/* If old_tsb is NULL, we're being invoked for the first time
	 * from init_new_context().
	 */
	if (old_tsb) {
		/* Reload it on the local cpu.  */
		tsb_context_switch(mm);

		/* Now force other processors to do the same.  */
		preempt_disable();
		smp_tsb_sync(mm);
		preempt_enable();

		/* Now it is safe to free the old tsb.  */
		kmem_cache_free(tsb_caches[old_cache_index], old_tsb);
	}
}

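/* Set up the MMU context of a new address space: no context ID yet,
 * empty TSB pointers, and an initial TSB sized from the (adjusted)
 * RSS so that a fork inherits roughly the parent's TSB size.
 */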
int init_new_context(struct task_struct *tsk, struct mm_struct *mm)
{
	unsigned long mm_rss = get_mm_rss(mm);
#if defined(CONFIG_HUGETLB_PAGE) || defined(CONFIG_TRANSPARENT_HUGEPAGE)
	unsigned long saved_hugetlb_pte_count;
	unsigned long saved_thp_pte_count;
#endif
	unsigned int i;

	spin_lock_init(&mm->context.lock);

	mm->context.sparc64_ctx_val = 0UL;

	mm->context.tag_store = NULL;
	spin_lock_init(&mm->context.tag_lock);

#if defined(CONFIG_HUGETLB_PAGE) || defined(CONFIG_TRANSPARENT_HUGEPAGE)
	/* We reset them to zero because the fork() page copying
	 * will re-increment the counters as the parent PTEs are
	 * copied into the child address space.
	 */
	saved_hugetlb_pte_count = mm->context.hugetlb_pte_count;
	saved_thp_pte_count = mm->context.thp_pte_count;
	mm->context.hugetlb_pte_count = 0;
	mm->context.thp_pte_count = 0;

	mm_rss -= saved_thp_pte_count * (HPAGE_SIZE / PAGE_SIZE);
#endif

	/* copy_mm() copies over the parent's mm_struct before calling
	 * us, so we need to zero out the TSB pointer or else tsb_grow()
	 * will be confused and think there is an older TSB to free up.
	 */
	for (i = 0; i < MM_NUM_TSBS; i++)
		mm->context.tsb_block[i].tsb = NULL;

	/* If this is fork, inherit the parent's TSB size.  We would
	 * grow it to that size on the first page fault anyways.
	 */
	tsb_grow(mm, MM_TSB_BASE, mm_rss);

#if defined(CONFIG_HUGETLB_PAGE) || defined(CONFIG_TRANSPARENT_HUGEPAGE)
	if (unlikely(saved_hugetlb_pte_count + saved_thp_pte_count))
		tsb_grow(mm, MM_TSB_HUGE,
			 (saved_hugetlb_pte_count + saved_thp_pte_count) *
			 REAL_HPAGE_PER_HPAGE);
#endif

	if (unlikely(!mm->context.tsb_block[MM_TSB_BASE].tsb))
		return -ENOMEM;

	return 0;
}

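/* Free one TSB, recovering its cache index from the size field in
 * the low 3 bits of the saved TSB register value.
 */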
static void tsb_destroy_one(struct tsb_config *tp)
{
	unsigned long cache_index;

	if (!tp->tsb)
		return;
	cache_index = tp->tsb_reg_val & 0x7UL;
	kmem_cache_free(tsb_caches[cache_index], tp->tsb);
	tp->tsb = NULL;
	tp->tsb_reg_val = 0UL;
}

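/* Tear down an address space's MMU state: free its TSBs, release its
 * context ID bit in mmu_context_bmap, and free any ADI tag storage.
 */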
void destroy_context(struct mm_struct *mm)
{
	unsigned long flags, i;

	for (i = 0; i < MM_NUM_TSBS; i++)
		tsb_destroy_one(&mm->context.tsb_block[i]);

	spin_lock_irqsave(&ctx_alloc_lock, flags);

	if (CTX_VALID(mm->context)) {
		unsigned long nr = CTX_NRBITS(mm->context);
		mmu_context_bmap[nr>>6] &= ~(1UL << (nr & 63));
	}

	spin_unlock_irqrestore(&ctx_alloc_lock, flags);

	/* If ADI tag storage was allocated for this task, free it */
	if (mm->context.tag_store) {
		tag_storage_desc_t *tag_desc;
		unsigned long max_desc;
		unsigned char *tags;

		tag_desc = mm->context.tag_store;
		max_desc = PAGE_SIZE/sizeof(tag_storage_desc_t);
		for (i = 0; i < max_desc; i++) {
			tags = tag_desc->tags;
			tag_desc->tags = NULL;
			kfree(tags);
			tag_desc++;
		}
		kfree(mm->context.tag_store);
		mm->context.tag_store = NULL;
	}
}