xref: /OK3568_Linux_fs/kernel/arch/sparc/mm/tsb.c (revision 4882a59341e53eb6f0b4789bf948001014eff981)
// SPDX-License-Identifier: GPL-2.0
/* arch/sparc64/mm/tsb.c
 *
 * Copyright (C) 2006, 2008 David S. Miller <davem@davemloft.net>
 */
6*4882a593Smuzhiyun 
7*4882a593Smuzhiyun #include <linux/kernel.h>
8*4882a593Smuzhiyun #include <linux/preempt.h>
9*4882a593Smuzhiyun #include <linux/slab.h>
10*4882a593Smuzhiyun #include <linux/mm_types.h>
11*4882a593Smuzhiyun #include <linux/pgtable.h>
12*4882a593Smuzhiyun 
13*4882a593Smuzhiyun #include <asm/page.h>
14*4882a593Smuzhiyun #include <asm/mmu_context.h>
15*4882a593Smuzhiyun #include <asm/setup.h>
16*4882a593Smuzhiyun #include <asm/tsb.h>
17*4882a593Smuzhiyun #include <asm/tlb.h>
18*4882a593Smuzhiyun #include <asm/oplib.h>
19*4882a593Smuzhiyun 
20*4882a593Smuzhiyun extern struct tsb swapper_tsb[KERNEL_TSB_NENTRIES];
21*4882a593Smuzhiyun 
/* Compute the TSB slot index for a virtual address.
 *
 * @vaddr:      virtual address to hash
 * @hash_shift: number of low address bits discarded before indexing
 * @nentries:   number of slots in the TSB; the result is masked with
 *              @nentries - 1, so a power of two is expected
 *
 * Returns the slot index, in the range [0, @nentries).
 */
static inline unsigned long tsb_hash(unsigned long vaddr, unsigned long hash_shift,
				     unsigned long nentries)
{
	return (vaddr >> hash_shift) & (nentries - 1);
}
27*4882a593Smuzhiyun 
/* Return non-zero when @tag equals the tag derived from @vaddr, i.e.
 * @vaddr shifted right by 22 bits; return zero otherwise.
 */
static inline int tag_compare(unsigned long tag, unsigned long vaddr)
{
	return tag == (vaddr >> 22);
}
32*4882a593Smuzhiyun 
flush_tsb_kernel_range_scan(unsigned long start,unsigned long end)33*4882a593Smuzhiyun static void flush_tsb_kernel_range_scan(unsigned long start, unsigned long end)
34*4882a593Smuzhiyun {
35*4882a593Smuzhiyun 	unsigned long idx;
36*4882a593Smuzhiyun 
37*4882a593Smuzhiyun 	for (idx = 0; idx < KERNEL_TSB_NENTRIES; idx++) {
38*4882a593Smuzhiyun 		struct tsb *ent = &swapper_tsb[idx];
39*4882a593Smuzhiyun 		unsigned long match = idx << 13;
40*4882a593Smuzhiyun 
41*4882a593Smuzhiyun 		match |= (ent->tag << 22);
42*4882a593Smuzhiyun 		if (match >= start && match < end)
43*4882a593Smuzhiyun 			ent->tag = (1UL << TSB_TAG_INVALID_BIT);
44*4882a593Smuzhiyun 	}
45*4882a593Smuzhiyun }
46*4882a593Smuzhiyun 
/* TSB flushes need only occur on the processor initiating the address
 * space modification, not on each cpu the address space has run on.
 * Only the TLB flush needs that treatment.
 */
51*4882a593Smuzhiyun 
flush_tsb_kernel_range(unsigned long start,unsigned long end)52*4882a593Smuzhiyun void flush_tsb_kernel_range(unsigned long start, unsigned long end)
53*4882a593Smuzhiyun {
54*4882a593Smuzhiyun 	unsigned long v;
55*4882a593Smuzhiyun 
56*4882a593Smuzhiyun 	if ((end - start) >> PAGE_SHIFT >= 2 * KERNEL_TSB_NENTRIES)
57*4882a593Smuzhiyun 		return flush_tsb_kernel_range_scan(start, end);
58*4882a593Smuzhiyun 
59*4882a593Smuzhiyun 	for (v = start; v < end; v += PAGE_SIZE) {
60*4882a593Smuzhiyun 		unsigned long hash = tsb_hash(v, PAGE_SHIFT,
61*4882a593Smuzhiyun 					      KERNEL_TSB_NENTRIES);
62*4882a593Smuzhiyun 		struct tsb *ent = &swapper_tsb[hash];
63*4882a593Smuzhiyun 
64*4882a593Smuzhiyun 		if (tag_compare(ent->tag, v))
65*4882a593Smuzhiyun 			ent->tag = (1UL << TSB_TAG_INVALID_BIT);
66*4882a593Smuzhiyun 	}
67*4882a593Smuzhiyun }
68*4882a593Smuzhiyun 
__flush_tsb_one_entry(unsigned long tsb,unsigned long v,unsigned long hash_shift,unsigned long nentries)69*4882a593Smuzhiyun static void __flush_tsb_one_entry(unsigned long tsb, unsigned long v,
70*4882a593Smuzhiyun 				  unsigned long hash_shift,
71*4882a593Smuzhiyun 				  unsigned long nentries)
72*4882a593Smuzhiyun {
73*4882a593Smuzhiyun 	unsigned long tag, ent, hash;
74*4882a593Smuzhiyun 
75*4882a593Smuzhiyun 	v &= ~0x1UL;
76*4882a593Smuzhiyun 	hash = tsb_hash(v, hash_shift, nentries);
77*4882a593Smuzhiyun 	ent = tsb + (hash * sizeof(struct tsb));
78*4882a593Smuzhiyun 	tag = (v >> 22UL);
79*4882a593Smuzhiyun 
80*4882a593Smuzhiyun 	tsb_flush(ent, tag);
81*4882a593Smuzhiyun }
82*4882a593Smuzhiyun 
__flush_tsb_one(struct tlb_batch * tb,unsigned long hash_shift,unsigned long tsb,unsigned long nentries)83*4882a593Smuzhiyun static void __flush_tsb_one(struct tlb_batch *tb, unsigned long hash_shift,
84*4882a593Smuzhiyun 			    unsigned long tsb, unsigned long nentries)
85*4882a593Smuzhiyun {
86*4882a593Smuzhiyun 	unsigned long i;
87*4882a593Smuzhiyun 
88*4882a593Smuzhiyun 	for (i = 0; i < tb->tlb_nr; i++)
89*4882a593Smuzhiyun 		__flush_tsb_one_entry(tsb, tb->vaddrs[i], hash_shift, nentries);
90*4882a593Smuzhiyun }
91*4882a593Smuzhiyun 
#if defined(CONFIG_HUGETLB_PAGE) || defined(CONFIG_TRANSPARENT_HUGEPAGE)
/* Flush every TSB slot covered by one huge page.
 *
 * @tsb:            base address of the TSB
 * @v:              virtual address of the huge page
 * @hash_shift:     shift used to hash addresses into the TSB
 * @nentries:       number of slots in the TSB
 * @hugepage_shift: log2 of the huge page size; must be >= @hash_shift
 *
 * A huge page spans 2^(@hugepage_shift - @hash_shift) hash granules, and
 * each one is flushed in turn.  The counter and the offset are kept in
 * unsigned long: with an unsigned int counter the expression
 * i << hash_shift is evaluated in 32 bits and wraps once the page spans
 * 4GB or more.
 */
static void __flush_huge_tsb_one_entry(unsigned long tsb, unsigned long v,
				       unsigned long hash_shift,
				       unsigned long nentries,
				       unsigned int hugepage_shift)
{
	unsigned long hpage_entries;
	unsigned long i;

	hpage_entries = 1UL << (hugepage_shift - hash_shift);
	for (i = 0; i < hpage_entries; i++)
		__flush_tsb_one_entry(tsb, v + (i << hash_shift), hash_shift,
				      nentries);
}

/* Apply __flush_huge_tsb_one_entry() to every address queued in the
 * batch @tb.
 */
static void __flush_huge_tsb_one(struct tlb_batch *tb, unsigned long hash_shift,
				 unsigned long tsb, unsigned long nentries,
				 unsigned int hugepage_shift)
{
	unsigned long i;

	for (i = 0; i < tb->tlb_nr; i++)
		__flush_huge_tsb_one_entry(tsb, tb->vaddrs[i], hash_shift,
					   nentries, hugepage_shift);
}
#endif
118*4882a593Smuzhiyun 
flush_tsb_user(struct tlb_batch * tb)119*4882a593Smuzhiyun void flush_tsb_user(struct tlb_batch *tb)
120*4882a593Smuzhiyun {
121*4882a593Smuzhiyun 	struct mm_struct *mm = tb->mm;
122*4882a593Smuzhiyun 	unsigned long nentries, base, flags;
123*4882a593Smuzhiyun 
124*4882a593Smuzhiyun 	spin_lock_irqsave(&mm->context.lock, flags);
125*4882a593Smuzhiyun 
126*4882a593Smuzhiyun 	if (tb->hugepage_shift < REAL_HPAGE_SHIFT) {
127*4882a593Smuzhiyun 		base = (unsigned long) mm->context.tsb_block[MM_TSB_BASE].tsb;
128*4882a593Smuzhiyun 		nentries = mm->context.tsb_block[MM_TSB_BASE].tsb_nentries;
129*4882a593Smuzhiyun 		if (tlb_type == cheetah_plus || tlb_type == hypervisor)
130*4882a593Smuzhiyun 			base = __pa(base);
131*4882a593Smuzhiyun 		if (tb->hugepage_shift == PAGE_SHIFT)
132*4882a593Smuzhiyun 			__flush_tsb_one(tb, PAGE_SHIFT, base, nentries);
133*4882a593Smuzhiyun #if defined(CONFIG_HUGETLB_PAGE)
134*4882a593Smuzhiyun 		else
135*4882a593Smuzhiyun 			__flush_huge_tsb_one(tb, PAGE_SHIFT, base, nentries,
136*4882a593Smuzhiyun 					     tb->hugepage_shift);
137*4882a593Smuzhiyun #endif
138*4882a593Smuzhiyun 	}
139*4882a593Smuzhiyun #if defined(CONFIG_HUGETLB_PAGE) || defined(CONFIG_TRANSPARENT_HUGEPAGE)
140*4882a593Smuzhiyun 	else if (mm->context.tsb_block[MM_TSB_HUGE].tsb) {
141*4882a593Smuzhiyun 		base = (unsigned long) mm->context.tsb_block[MM_TSB_HUGE].tsb;
142*4882a593Smuzhiyun 		nentries = mm->context.tsb_block[MM_TSB_HUGE].tsb_nentries;
143*4882a593Smuzhiyun 		if (tlb_type == cheetah_plus || tlb_type == hypervisor)
144*4882a593Smuzhiyun 			base = __pa(base);
145*4882a593Smuzhiyun 		__flush_huge_tsb_one(tb, REAL_HPAGE_SHIFT, base, nentries,
146*4882a593Smuzhiyun 				     tb->hugepage_shift);
147*4882a593Smuzhiyun 	}
148*4882a593Smuzhiyun #endif
149*4882a593Smuzhiyun 	spin_unlock_irqrestore(&mm->context.lock, flags);
150*4882a593Smuzhiyun }
151*4882a593Smuzhiyun 
flush_tsb_user_page(struct mm_struct * mm,unsigned long vaddr,unsigned int hugepage_shift)152*4882a593Smuzhiyun void flush_tsb_user_page(struct mm_struct *mm, unsigned long vaddr,
153*4882a593Smuzhiyun 			 unsigned int hugepage_shift)
154*4882a593Smuzhiyun {
155*4882a593Smuzhiyun 	unsigned long nentries, base, flags;
156*4882a593Smuzhiyun 
157*4882a593Smuzhiyun 	spin_lock_irqsave(&mm->context.lock, flags);
158*4882a593Smuzhiyun 
159*4882a593Smuzhiyun 	if (hugepage_shift < REAL_HPAGE_SHIFT) {
160*4882a593Smuzhiyun 		base = (unsigned long) mm->context.tsb_block[MM_TSB_BASE].tsb;
161*4882a593Smuzhiyun 		nentries = mm->context.tsb_block[MM_TSB_BASE].tsb_nentries;
162*4882a593Smuzhiyun 		if (tlb_type == cheetah_plus || tlb_type == hypervisor)
163*4882a593Smuzhiyun 			base = __pa(base);
164*4882a593Smuzhiyun 		if (hugepage_shift == PAGE_SHIFT)
165*4882a593Smuzhiyun 			__flush_tsb_one_entry(base, vaddr, PAGE_SHIFT,
166*4882a593Smuzhiyun 					      nentries);
167*4882a593Smuzhiyun #if defined(CONFIG_HUGETLB_PAGE)
168*4882a593Smuzhiyun 		else
169*4882a593Smuzhiyun 			__flush_huge_tsb_one_entry(base, vaddr, PAGE_SHIFT,
170*4882a593Smuzhiyun 						   nentries, hugepage_shift);
171*4882a593Smuzhiyun #endif
172*4882a593Smuzhiyun 	}
173*4882a593Smuzhiyun #if defined(CONFIG_HUGETLB_PAGE) || defined(CONFIG_TRANSPARENT_HUGEPAGE)
174*4882a593Smuzhiyun 	else if (mm->context.tsb_block[MM_TSB_HUGE].tsb) {
175*4882a593Smuzhiyun 		base = (unsigned long) mm->context.tsb_block[MM_TSB_HUGE].tsb;
176*4882a593Smuzhiyun 		nentries = mm->context.tsb_block[MM_TSB_HUGE].tsb_nentries;
177*4882a593Smuzhiyun 		if (tlb_type == cheetah_plus || tlb_type == hypervisor)
178*4882a593Smuzhiyun 			base = __pa(base);
179*4882a593Smuzhiyun 		__flush_huge_tsb_one_entry(base, vaddr, REAL_HPAGE_SHIFT,
180*4882a593Smuzhiyun 					   nentries, hugepage_shift);
181*4882a593Smuzhiyun 	}
182*4882a593Smuzhiyun #endif
183*4882a593Smuzhiyun 	spin_unlock_irqrestore(&mm->context.lock, flags);
184*4882a593Smuzhiyun }
185*4882a593Smuzhiyun 
/* Hypervisor page-size index and mask used for the base (8K) TSB. */
#define HV_PGSZ_IDX_BASE	HV_PGSZ_IDX_8K
#define HV_PGSZ_MASK_BASE	HV_PGSZ_MASK_8K

#if defined(CONFIG_HUGETLB_PAGE) || defined(CONFIG_TRANSPARENT_HUGEPAGE)
/* Hypervisor page-size index and mask used for the huge (4MB) TSB. */
#define HV_PGSZ_IDX_HUGE	HV_PGSZ_IDX_4MB
#define HV_PGSZ_MASK_HUGE	HV_PGSZ_MASK_4MB
#endif
193*4882a593Smuzhiyun 
setup_tsb_params(struct mm_struct * mm,unsigned long tsb_idx,unsigned long tsb_bytes)194*4882a593Smuzhiyun static void setup_tsb_params(struct mm_struct *mm, unsigned long tsb_idx, unsigned long tsb_bytes)
195*4882a593Smuzhiyun {
196*4882a593Smuzhiyun 	unsigned long tsb_reg, base, tsb_paddr;
197*4882a593Smuzhiyun 	unsigned long page_sz, tte;
198*4882a593Smuzhiyun 
199*4882a593Smuzhiyun 	mm->context.tsb_block[tsb_idx].tsb_nentries =
200*4882a593Smuzhiyun 		tsb_bytes / sizeof(struct tsb);
201*4882a593Smuzhiyun 
202*4882a593Smuzhiyun 	switch (tsb_idx) {
203*4882a593Smuzhiyun 	case MM_TSB_BASE:
204*4882a593Smuzhiyun 		base = TSBMAP_8K_BASE;
205*4882a593Smuzhiyun 		break;
206*4882a593Smuzhiyun #if defined(CONFIG_HUGETLB_PAGE) || defined(CONFIG_TRANSPARENT_HUGEPAGE)
207*4882a593Smuzhiyun 	case MM_TSB_HUGE:
208*4882a593Smuzhiyun 		base = TSBMAP_4M_BASE;
209*4882a593Smuzhiyun 		break;
210*4882a593Smuzhiyun #endif
211*4882a593Smuzhiyun 	default:
212*4882a593Smuzhiyun 		BUG();
213*4882a593Smuzhiyun 	}
214*4882a593Smuzhiyun 
215*4882a593Smuzhiyun 	tte = pgprot_val(PAGE_KERNEL_LOCKED);
216*4882a593Smuzhiyun 	tsb_paddr = __pa(mm->context.tsb_block[tsb_idx].tsb);
217*4882a593Smuzhiyun 	BUG_ON(tsb_paddr & (tsb_bytes - 1UL));
218*4882a593Smuzhiyun 
219*4882a593Smuzhiyun 	/* Use the smallest page size that can map the whole TSB
220*4882a593Smuzhiyun 	 * in one TLB entry.
221*4882a593Smuzhiyun 	 */
222*4882a593Smuzhiyun 	switch (tsb_bytes) {
223*4882a593Smuzhiyun 	case 8192 << 0:
224*4882a593Smuzhiyun 		tsb_reg = 0x0UL;
225*4882a593Smuzhiyun #ifdef DCACHE_ALIASING_POSSIBLE
226*4882a593Smuzhiyun 		base += (tsb_paddr & 8192);
227*4882a593Smuzhiyun #endif
228*4882a593Smuzhiyun 		page_sz = 8192;
229*4882a593Smuzhiyun 		break;
230*4882a593Smuzhiyun 
231*4882a593Smuzhiyun 	case 8192 << 1:
232*4882a593Smuzhiyun 		tsb_reg = 0x1UL;
233*4882a593Smuzhiyun 		page_sz = 64 * 1024;
234*4882a593Smuzhiyun 		break;
235*4882a593Smuzhiyun 
236*4882a593Smuzhiyun 	case 8192 << 2:
237*4882a593Smuzhiyun 		tsb_reg = 0x2UL;
238*4882a593Smuzhiyun 		page_sz = 64 * 1024;
239*4882a593Smuzhiyun 		break;
240*4882a593Smuzhiyun 
241*4882a593Smuzhiyun 	case 8192 << 3:
242*4882a593Smuzhiyun 		tsb_reg = 0x3UL;
243*4882a593Smuzhiyun 		page_sz = 64 * 1024;
244*4882a593Smuzhiyun 		break;
245*4882a593Smuzhiyun 
246*4882a593Smuzhiyun 	case 8192 << 4:
247*4882a593Smuzhiyun 		tsb_reg = 0x4UL;
248*4882a593Smuzhiyun 		page_sz = 512 * 1024;
249*4882a593Smuzhiyun 		break;
250*4882a593Smuzhiyun 
251*4882a593Smuzhiyun 	case 8192 << 5:
252*4882a593Smuzhiyun 		tsb_reg = 0x5UL;
253*4882a593Smuzhiyun 		page_sz = 512 * 1024;
254*4882a593Smuzhiyun 		break;
255*4882a593Smuzhiyun 
256*4882a593Smuzhiyun 	case 8192 << 6:
257*4882a593Smuzhiyun 		tsb_reg = 0x6UL;
258*4882a593Smuzhiyun 		page_sz = 512 * 1024;
259*4882a593Smuzhiyun 		break;
260*4882a593Smuzhiyun 
261*4882a593Smuzhiyun 	case 8192 << 7:
262*4882a593Smuzhiyun 		tsb_reg = 0x7UL;
263*4882a593Smuzhiyun 		page_sz = 4 * 1024 * 1024;
264*4882a593Smuzhiyun 		break;
265*4882a593Smuzhiyun 
266*4882a593Smuzhiyun 	default:
267*4882a593Smuzhiyun 		printk(KERN_ERR "TSB[%s:%d]: Impossible TSB size %lu, killing process.\n",
268*4882a593Smuzhiyun 		       current->comm, current->pid, tsb_bytes);
269*4882a593Smuzhiyun 		do_exit(SIGSEGV);
270*4882a593Smuzhiyun 	}
271*4882a593Smuzhiyun 	tte |= pte_sz_bits(page_sz);
272*4882a593Smuzhiyun 
273*4882a593Smuzhiyun 	if (tlb_type == cheetah_plus || tlb_type == hypervisor) {
274*4882a593Smuzhiyun 		/* Physical mapping, no locked TLB entry for TSB.  */
275*4882a593Smuzhiyun 		tsb_reg |= tsb_paddr;
276*4882a593Smuzhiyun 
277*4882a593Smuzhiyun 		mm->context.tsb_block[tsb_idx].tsb_reg_val = tsb_reg;
278*4882a593Smuzhiyun 		mm->context.tsb_block[tsb_idx].tsb_map_vaddr = 0;
279*4882a593Smuzhiyun 		mm->context.tsb_block[tsb_idx].tsb_map_pte = 0;
280*4882a593Smuzhiyun 	} else {
281*4882a593Smuzhiyun 		tsb_reg |= base;
282*4882a593Smuzhiyun 		tsb_reg |= (tsb_paddr & (page_sz - 1UL));
283*4882a593Smuzhiyun 		tte |= (tsb_paddr & ~(page_sz - 1UL));
284*4882a593Smuzhiyun 
285*4882a593Smuzhiyun 		mm->context.tsb_block[tsb_idx].tsb_reg_val = tsb_reg;
286*4882a593Smuzhiyun 		mm->context.tsb_block[tsb_idx].tsb_map_vaddr = base;
287*4882a593Smuzhiyun 		mm->context.tsb_block[tsb_idx].tsb_map_pte = tte;
288*4882a593Smuzhiyun 	}
289*4882a593Smuzhiyun 
290*4882a593Smuzhiyun 	/* Setup the Hypervisor TSB descriptor.  */
291*4882a593Smuzhiyun 	if (tlb_type == hypervisor) {
292*4882a593Smuzhiyun 		struct hv_tsb_descr *hp = &mm->context.tsb_descr[tsb_idx];
293*4882a593Smuzhiyun 
294*4882a593Smuzhiyun 		switch (tsb_idx) {
295*4882a593Smuzhiyun 		case MM_TSB_BASE:
296*4882a593Smuzhiyun 			hp->pgsz_idx = HV_PGSZ_IDX_BASE;
297*4882a593Smuzhiyun 			break;
298*4882a593Smuzhiyun #if defined(CONFIG_HUGETLB_PAGE) || defined(CONFIG_TRANSPARENT_HUGEPAGE)
299*4882a593Smuzhiyun 		case MM_TSB_HUGE:
300*4882a593Smuzhiyun 			hp->pgsz_idx = HV_PGSZ_IDX_HUGE;
301*4882a593Smuzhiyun 			break;
302*4882a593Smuzhiyun #endif
303*4882a593Smuzhiyun 		default:
304*4882a593Smuzhiyun 			BUG();
305*4882a593Smuzhiyun 		}
306*4882a593Smuzhiyun 		hp->assoc = 1;
307*4882a593Smuzhiyun 		hp->num_ttes = tsb_bytes / 16;
308*4882a593Smuzhiyun 		hp->ctx_idx = 0;
309*4882a593Smuzhiyun 		switch (tsb_idx) {
310*4882a593Smuzhiyun 		case MM_TSB_BASE:
311*4882a593Smuzhiyun 			hp->pgsz_mask = HV_PGSZ_MASK_BASE;
312*4882a593Smuzhiyun 			break;
313*4882a593Smuzhiyun #if defined(CONFIG_HUGETLB_PAGE) || defined(CONFIG_TRANSPARENT_HUGEPAGE)
314*4882a593Smuzhiyun 		case MM_TSB_HUGE:
315*4882a593Smuzhiyun 			hp->pgsz_mask = HV_PGSZ_MASK_HUGE;
316*4882a593Smuzhiyun 			break;
317*4882a593Smuzhiyun #endif
318*4882a593Smuzhiyun 		default:
319*4882a593Smuzhiyun 			BUG();
320*4882a593Smuzhiyun 		}
321*4882a593Smuzhiyun 		hp->tsb_base = tsb_paddr;
322*4882a593Smuzhiyun 		hp->resv = 0;
323*4882a593Smuzhiyun 	}
324*4882a593Smuzhiyun }
325*4882a593Smuzhiyun 
326*4882a593Smuzhiyun struct kmem_cache *pgtable_cache __read_mostly;
327*4882a593Smuzhiyun 
328*4882a593Smuzhiyun static struct kmem_cache *tsb_caches[8] __read_mostly;
329*4882a593Smuzhiyun 
330*4882a593Smuzhiyun static const char *tsb_cache_names[8] = {
331*4882a593Smuzhiyun 	"tsb_8KB",
332*4882a593Smuzhiyun 	"tsb_16KB",
333*4882a593Smuzhiyun 	"tsb_32KB",
334*4882a593Smuzhiyun 	"tsb_64KB",
335*4882a593Smuzhiyun 	"tsb_128KB",
336*4882a593Smuzhiyun 	"tsb_256KB",
337*4882a593Smuzhiyun 	"tsb_512KB",
338*4882a593Smuzhiyun 	"tsb_1MB",
339*4882a593Smuzhiyun };
340*4882a593Smuzhiyun 
pgtable_cache_init(void)341*4882a593Smuzhiyun void __init pgtable_cache_init(void)
342*4882a593Smuzhiyun {
343*4882a593Smuzhiyun 	unsigned long i;
344*4882a593Smuzhiyun 
345*4882a593Smuzhiyun 	pgtable_cache = kmem_cache_create("pgtable_cache",
346*4882a593Smuzhiyun 					  PAGE_SIZE, PAGE_SIZE,
347*4882a593Smuzhiyun 					  0,
348*4882a593Smuzhiyun 					  _clear_page);
349*4882a593Smuzhiyun 	if (!pgtable_cache) {
350*4882a593Smuzhiyun 		prom_printf("pgtable_cache_init(): Could not create!\n");
351*4882a593Smuzhiyun 		prom_halt();
352*4882a593Smuzhiyun 	}
353*4882a593Smuzhiyun 
354*4882a593Smuzhiyun 	for (i = 0; i < ARRAY_SIZE(tsb_cache_names); i++) {
355*4882a593Smuzhiyun 		unsigned long size = 8192 << i;
356*4882a593Smuzhiyun 		const char *name = tsb_cache_names[i];
357*4882a593Smuzhiyun 
358*4882a593Smuzhiyun 		tsb_caches[i] = kmem_cache_create(name,
359*4882a593Smuzhiyun 						  size, size,
360*4882a593Smuzhiyun 						  0, NULL);
361*4882a593Smuzhiyun 		if (!tsb_caches[i]) {
362*4882a593Smuzhiyun 			prom_printf("Could not create %s cache\n", name);
363*4882a593Smuzhiyun 			prom_halt();
364*4882a593Smuzhiyun 		}
365*4882a593Smuzhiyun 	}
366*4882a593Smuzhiyun }
367*4882a593Smuzhiyun 
/* Tunable read by tsb_size_to_rss_limit().  A negative value -n puts the
 * RSS limit at capacity - (capacity >> n); a non-negative value n puts it
 * at capacity + (capacity >> n).  The default of -2 gives 3/4 of capacity.
 */
int sysctl_tsb_ratio = -2;
369*4882a593Smuzhiyun 
tsb_size_to_rss_limit(unsigned long new_size)370*4882a593Smuzhiyun static unsigned long tsb_size_to_rss_limit(unsigned long new_size)
371*4882a593Smuzhiyun {
372*4882a593Smuzhiyun 	unsigned long num_ents = (new_size / sizeof(struct tsb));
373*4882a593Smuzhiyun 
374*4882a593Smuzhiyun 	if (sysctl_tsb_ratio < 0)
375*4882a593Smuzhiyun 		return num_ents - (num_ents >> -sysctl_tsb_ratio);
376*4882a593Smuzhiyun 	else
377*4882a593Smuzhiyun 		return num_ents + (num_ents >> sysctl_tsb_ratio);
378*4882a593Smuzhiyun }
379*4882a593Smuzhiyun 
380*4882a593Smuzhiyun /* When the RSS of an address space exceeds tsb_rss_limit for a TSB,
381*4882a593Smuzhiyun  * do_sparc64_fault() invokes this routine to try and grow it.
382*4882a593Smuzhiyun  *
383*4882a593Smuzhiyun  * When we reach the maximum TSB size supported, we stick ~0UL into
384*4882a593Smuzhiyun  * tsb_rss_limit for that TSB so the grow checks in do_sparc64_fault()
385*4882a593Smuzhiyun  * will not trigger any longer.
386*4882a593Smuzhiyun  *
387*4882a593Smuzhiyun  * The TSB can be anywhere from 8K to 1MB in size, in increasing powers
388*4882a593Smuzhiyun  * of two.  The TSB must be aligned to it's size, so f.e. a 512K TSB
389*4882a593Smuzhiyun  * must be 512K aligned.  It also must be physically contiguous, so we
390*4882a593Smuzhiyun  * cannot use vmalloc().
391*4882a593Smuzhiyun  *
392*4882a593Smuzhiyun  * The idea here is to grow the TSB when the RSS of the process approaches
393*4882a593Smuzhiyun  * the number of entries that the current TSB can hold at once.  Currently,
394*4882a593Smuzhiyun  * we trigger when the RSS hits 3/4 of the TSB capacity.
395*4882a593Smuzhiyun  */
tsb_grow(struct mm_struct * mm,unsigned long tsb_index,unsigned long rss)396*4882a593Smuzhiyun void tsb_grow(struct mm_struct *mm, unsigned long tsb_index, unsigned long rss)
397*4882a593Smuzhiyun {
398*4882a593Smuzhiyun 	unsigned long max_tsb_size = 1 * 1024 * 1024;
399*4882a593Smuzhiyun 	unsigned long new_size, old_size, flags;
400*4882a593Smuzhiyun 	struct tsb *old_tsb, *new_tsb;
401*4882a593Smuzhiyun 	unsigned long new_cache_index, old_cache_index;
402*4882a593Smuzhiyun 	unsigned long new_rss_limit;
403*4882a593Smuzhiyun 	gfp_t gfp_flags;
404*4882a593Smuzhiyun 
405*4882a593Smuzhiyun 	if (max_tsb_size > (PAGE_SIZE << MAX_ORDER))
406*4882a593Smuzhiyun 		max_tsb_size = (PAGE_SIZE << MAX_ORDER);
407*4882a593Smuzhiyun 
408*4882a593Smuzhiyun 	new_cache_index = 0;
409*4882a593Smuzhiyun 	for (new_size = 8192; new_size < max_tsb_size; new_size <<= 1UL) {
410*4882a593Smuzhiyun 		new_rss_limit = tsb_size_to_rss_limit(new_size);
411*4882a593Smuzhiyun 		if (new_rss_limit > rss)
412*4882a593Smuzhiyun 			break;
413*4882a593Smuzhiyun 		new_cache_index++;
414*4882a593Smuzhiyun 	}
415*4882a593Smuzhiyun 
416*4882a593Smuzhiyun 	if (new_size == max_tsb_size)
417*4882a593Smuzhiyun 		new_rss_limit = ~0UL;
418*4882a593Smuzhiyun 
419*4882a593Smuzhiyun retry_tsb_alloc:
420*4882a593Smuzhiyun 	gfp_flags = GFP_KERNEL;
421*4882a593Smuzhiyun 	if (new_size > (PAGE_SIZE * 2))
422*4882a593Smuzhiyun 		gfp_flags |= __GFP_NOWARN | __GFP_NORETRY;
423*4882a593Smuzhiyun 
424*4882a593Smuzhiyun 	new_tsb = kmem_cache_alloc_node(tsb_caches[new_cache_index],
425*4882a593Smuzhiyun 					gfp_flags, numa_node_id());
426*4882a593Smuzhiyun 	if (unlikely(!new_tsb)) {
427*4882a593Smuzhiyun 		/* Not being able to fork due to a high-order TSB
428*4882a593Smuzhiyun 		 * allocation failure is very bad behavior.  Just back
429*4882a593Smuzhiyun 		 * down to a 0-order allocation and force no TSB
430*4882a593Smuzhiyun 		 * growing for this address space.
431*4882a593Smuzhiyun 		 */
432*4882a593Smuzhiyun 		if (mm->context.tsb_block[tsb_index].tsb == NULL &&
433*4882a593Smuzhiyun 		    new_cache_index > 0) {
434*4882a593Smuzhiyun 			new_cache_index = 0;
435*4882a593Smuzhiyun 			new_size = 8192;
436*4882a593Smuzhiyun 			new_rss_limit = ~0UL;
437*4882a593Smuzhiyun 			goto retry_tsb_alloc;
438*4882a593Smuzhiyun 		}
439*4882a593Smuzhiyun 
440*4882a593Smuzhiyun 		/* If we failed on a TSB grow, we are under serious
441*4882a593Smuzhiyun 		 * memory pressure so don't try to grow any more.
442*4882a593Smuzhiyun 		 */
443*4882a593Smuzhiyun 		if (mm->context.tsb_block[tsb_index].tsb != NULL)
444*4882a593Smuzhiyun 			mm->context.tsb_block[tsb_index].tsb_rss_limit = ~0UL;
445*4882a593Smuzhiyun 		return;
446*4882a593Smuzhiyun 	}
447*4882a593Smuzhiyun 
448*4882a593Smuzhiyun 	/* Mark all tags as invalid.  */
449*4882a593Smuzhiyun 	tsb_init(new_tsb, new_size);
450*4882a593Smuzhiyun 
451*4882a593Smuzhiyun 	/* Ok, we are about to commit the changes.  If we are
452*4882a593Smuzhiyun 	 * growing an existing TSB the locking is very tricky,
453*4882a593Smuzhiyun 	 * so WATCH OUT!
454*4882a593Smuzhiyun 	 *
455*4882a593Smuzhiyun 	 * We have to hold mm->context.lock while committing to the
456*4882a593Smuzhiyun 	 * new TSB, this synchronizes us with processors in
457*4882a593Smuzhiyun 	 * flush_tsb_user() and switch_mm() for this address space.
458*4882a593Smuzhiyun 	 *
459*4882a593Smuzhiyun 	 * But even with that lock held, processors run asynchronously
460*4882a593Smuzhiyun 	 * accessing the old TSB via TLB miss handling.  This is OK
461*4882a593Smuzhiyun 	 * because those actions are just propagating state from the
462*4882a593Smuzhiyun 	 * Linux page tables into the TSB, page table mappings are not
463*4882a593Smuzhiyun 	 * being changed.  If a real fault occurs, the processor will
464*4882a593Smuzhiyun 	 * synchronize with us when it hits flush_tsb_user(), this is
465*4882a593Smuzhiyun 	 * also true for the case where vmscan is modifying the page
466*4882a593Smuzhiyun 	 * tables.  The only thing we need to be careful with is to
467*4882a593Smuzhiyun 	 * skip any locked TSB entries during copy_tsb().
468*4882a593Smuzhiyun 	 *
469*4882a593Smuzhiyun 	 * When we finish committing to the new TSB, we have to drop
470*4882a593Smuzhiyun 	 * the lock and ask all other cpus running this address space
471*4882a593Smuzhiyun 	 * to run tsb_context_switch() to see the new TSB table.
472*4882a593Smuzhiyun 	 */
473*4882a593Smuzhiyun 	spin_lock_irqsave(&mm->context.lock, flags);
474*4882a593Smuzhiyun 
475*4882a593Smuzhiyun 	old_tsb = mm->context.tsb_block[tsb_index].tsb;
476*4882a593Smuzhiyun 	old_cache_index =
477*4882a593Smuzhiyun 		(mm->context.tsb_block[tsb_index].tsb_reg_val & 0x7UL);
478*4882a593Smuzhiyun 	old_size = (mm->context.tsb_block[tsb_index].tsb_nentries *
479*4882a593Smuzhiyun 		    sizeof(struct tsb));
480*4882a593Smuzhiyun 
481*4882a593Smuzhiyun 
482*4882a593Smuzhiyun 	/* Handle multiple threads trying to grow the TSB at the same time.
483*4882a593Smuzhiyun 	 * One will get in here first, and bump the size and the RSS limit.
484*4882a593Smuzhiyun 	 * The others will get in here next and hit this check.
485*4882a593Smuzhiyun 	 */
486*4882a593Smuzhiyun 	if (unlikely(old_tsb &&
487*4882a593Smuzhiyun 		     (rss < mm->context.tsb_block[tsb_index].tsb_rss_limit))) {
488*4882a593Smuzhiyun 		spin_unlock_irqrestore(&mm->context.lock, flags);
489*4882a593Smuzhiyun 
490*4882a593Smuzhiyun 		kmem_cache_free(tsb_caches[new_cache_index], new_tsb);
491*4882a593Smuzhiyun 		return;
492*4882a593Smuzhiyun 	}
493*4882a593Smuzhiyun 
494*4882a593Smuzhiyun 	mm->context.tsb_block[tsb_index].tsb_rss_limit = new_rss_limit;
495*4882a593Smuzhiyun 
496*4882a593Smuzhiyun 	if (old_tsb) {
497*4882a593Smuzhiyun 		extern void copy_tsb(unsigned long old_tsb_base,
498*4882a593Smuzhiyun 				     unsigned long old_tsb_size,
499*4882a593Smuzhiyun 				     unsigned long new_tsb_base,
500*4882a593Smuzhiyun 				     unsigned long new_tsb_size,
501*4882a593Smuzhiyun 				     unsigned long page_size_shift);
502*4882a593Smuzhiyun 		unsigned long old_tsb_base = (unsigned long) old_tsb;
503*4882a593Smuzhiyun 		unsigned long new_tsb_base = (unsigned long) new_tsb;
504*4882a593Smuzhiyun 
505*4882a593Smuzhiyun 		if (tlb_type == cheetah_plus || tlb_type == hypervisor) {
506*4882a593Smuzhiyun 			old_tsb_base = __pa(old_tsb_base);
507*4882a593Smuzhiyun 			new_tsb_base = __pa(new_tsb_base);
508*4882a593Smuzhiyun 		}
509*4882a593Smuzhiyun 		copy_tsb(old_tsb_base, old_size, new_tsb_base, new_size,
510*4882a593Smuzhiyun 			tsb_index == MM_TSB_BASE ?
511*4882a593Smuzhiyun 			PAGE_SHIFT : REAL_HPAGE_SHIFT);
512*4882a593Smuzhiyun 	}
513*4882a593Smuzhiyun 
514*4882a593Smuzhiyun 	mm->context.tsb_block[tsb_index].tsb = new_tsb;
515*4882a593Smuzhiyun 	setup_tsb_params(mm, tsb_index, new_size);
516*4882a593Smuzhiyun 
517*4882a593Smuzhiyun 	spin_unlock_irqrestore(&mm->context.lock, flags);
518*4882a593Smuzhiyun 
519*4882a593Smuzhiyun 	/* If old_tsb is NULL, we're being invoked for the first time
520*4882a593Smuzhiyun 	 * from init_new_context().
521*4882a593Smuzhiyun 	 */
522*4882a593Smuzhiyun 	if (old_tsb) {
523*4882a593Smuzhiyun 		/* Reload it on the local cpu.  */
524*4882a593Smuzhiyun 		tsb_context_switch(mm);
525*4882a593Smuzhiyun 
526*4882a593Smuzhiyun 		/* Now force other processors to do the same.  */
527*4882a593Smuzhiyun 		preempt_disable();
528*4882a593Smuzhiyun 		smp_tsb_sync(mm);
529*4882a593Smuzhiyun 		preempt_enable();
530*4882a593Smuzhiyun 
531*4882a593Smuzhiyun 		/* Now it is safe to free the old tsb.  */
532*4882a593Smuzhiyun 		kmem_cache_free(tsb_caches[old_cache_index], old_tsb);
533*4882a593Smuzhiyun 	}
534*4882a593Smuzhiyun }
535*4882a593Smuzhiyun 
init_new_context(struct task_struct * tsk,struct mm_struct * mm)536*4882a593Smuzhiyun int init_new_context(struct task_struct *tsk, struct mm_struct *mm)
537*4882a593Smuzhiyun {
538*4882a593Smuzhiyun 	unsigned long mm_rss = get_mm_rss(mm);
539*4882a593Smuzhiyun #if defined(CONFIG_HUGETLB_PAGE) || defined(CONFIG_TRANSPARENT_HUGEPAGE)
540*4882a593Smuzhiyun 	unsigned long saved_hugetlb_pte_count;
541*4882a593Smuzhiyun 	unsigned long saved_thp_pte_count;
542*4882a593Smuzhiyun #endif
543*4882a593Smuzhiyun 	unsigned int i;
544*4882a593Smuzhiyun 
545*4882a593Smuzhiyun 	spin_lock_init(&mm->context.lock);
546*4882a593Smuzhiyun 
547*4882a593Smuzhiyun 	mm->context.sparc64_ctx_val = 0UL;
548*4882a593Smuzhiyun 
549*4882a593Smuzhiyun 	mm->context.tag_store = NULL;
550*4882a593Smuzhiyun 	spin_lock_init(&mm->context.tag_lock);
551*4882a593Smuzhiyun 
552*4882a593Smuzhiyun #if defined(CONFIG_HUGETLB_PAGE) || defined(CONFIG_TRANSPARENT_HUGEPAGE)
553*4882a593Smuzhiyun 	/* We reset them to zero because the fork() page copying
554*4882a593Smuzhiyun 	 * will re-increment the counters as the parent PTEs are
555*4882a593Smuzhiyun 	 * copied into the child address space.
556*4882a593Smuzhiyun 	 */
557*4882a593Smuzhiyun 	saved_hugetlb_pte_count = mm->context.hugetlb_pte_count;
558*4882a593Smuzhiyun 	saved_thp_pte_count = mm->context.thp_pte_count;
559*4882a593Smuzhiyun 	mm->context.hugetlb_pte_count = 0;
560*4882a593Smuzhiyun 	mm->context.thp_pte_count = 0;
561*4882a593Smuzhiyun 
562*4882a593Smuzhiyun 	mm_rss -= saved_thp_pte_count * (HPAGE_SIZE / PAGE_SIZE);
563*4882a593Smuzhiyun #endif
564*4882a593Smuzhiyun 
565*4882a593Smuzhiyun 	/* copy_mm() copies over the parent's mm_struct before calling
566*4882a593Smuzhiyun 	 * us, so we need to zero out the TSB pointer or else tsb_grow()
567*4882a593Smuzhiyun 	 * will be confused and think there is an older TSB to free up.
568*4882a593Smuzhiyun 	 */
569*4882a593Smuzhiyun 	for (i = 0; i < MM_NUM_TSBS; i++)
570*4882a593Smuzhiyun 		mm->context.tsb_block[i].tsb = NULL;
571*4882a593Smuzhiyun 
572*4882a593Smuzhiyun 	/* If this is fork, inherit the parent's TSB size.  We would
573*4882a593Smuzhiyun 	 * grow it to that size on the first page fault anyways.
574*4882a593Smuzhiyun 	 */
575*4882a593Smuzhiyun 	tsb_grow(mm, MM_TSB_BASE, mm_rss);
576*4882a593Smuzhiyun 
577*4882a593Smuzhiyun #if defined(CONFIG_HUGETLB_PAGE) || defined(CONFIG_TRANSPARENT_HUGEPAGE)
578*4882a593Smuzhiyun 	if (unlikely(saved_hugetlb_pte_count + saved_thp_pte_count))
579*4882a593Smuzhiyun 		tsb_grow(mm, MM_TSB_HUGE,
580*4882a593Smuzhiyun 			 (saved_hugetlb_pte_count + saved_thp_pte_count) *
581*4882a593Smuzhiyun 			 REAL_HPAGE_PER_HPAGE);
582*4882a593Smuzhiyun #endif
583*4882a593Smuzhiyun 
584*4882a593Smuzhiyun 	if (unlikely(!mm->context.tsb_block[MM_TSB_BASE].tsb))
585*4882a593Smuzhiyun 		return -ENOMEM;
586*4882a593Smuzhiyun 
587*4882a593Smuzhiyun 	return 0;
588*4882a593Smuzhiyun }
589*4882a593Smuzhiyun 
tsb_destroy_one(struct tsb_config * tp)590*4882a593Smuzhiyun static void tsb_destroy_one(struct tsb_config *tp)
591*4882a593Smuzhiyun {
592*4882a593Smuzhiyun 	unsigned long cache_index;
593*4882a593Smuzhiyun 
594*4882a593Smuzhiyun 	if (!tp->tsb)
595*4882a593Smuzhiyun 		return;
596*4882a593Smuzhiyun 	cache_index = tp->tsb_reg_val & 0x7UL;
597*4882a593Smuzhiyun 	kmem_cache_free(tsb_caches[cache_index], tp->tsb);
598*4882a593Smuzhiyun 	tp->tsb = NULL;
599*4882a593Smuzhiyun 	tp->tsb_reg_val = 0UL;
600*4882a593Smuzhiyun }
601*4882a593Smuzhiyun 
destroy_context(struct mm_struct * mm)602*4882a593Smuzhiyun void destroy_context(struct mm_struct *mm)
603*4882a593Smuzhiyun {
604*4882a593Smuzhiyun 	unsigned long flags, i;
605*4882a593Smuzhiyun 
606*4882a593Smuzhiyun 	for (i = 0; i < MM_NUM_TSBS; i++)
607*4882a593Smuzhiyun 		tsb_destroy_one(&mm->context.tsb_block[i]);
608*4882a593Smuzhiyun 
609*4882a593Smuzhiyun 	spin_lock_irqsave(&ctx_alloc_lock, flags);
610*4882a593Smuzhiyun 
611*4882a593Smuzhiyun 	if (CTX_VALID(mm->context)) {
612*4882a593Smuzhiyun 		unsigned long nr = CTX_NRBITS(mm->context);
613*4882a593Smuzhiyun 		mmu_context_bmap[nr>>6] &= ~(1UL << (nr & 63));
614*4882a593Smuzhiyun 	}
615*4882a593Smuzhiyun 
616*4882a593Smuzhiyun 	spin_unlock_irqrestore(&ctx_alloc_lock, flags);
617*4882a593Smuzhiyun 
618*4882a593Smuzhiyun 	/* If ADI tag storage was allocated for this task, free it */
619*4882a593Smuzhiyun 	if (mm->context.tag_store) {
620*4882a593Smuzhiyun 		tag_storage_desc_t *tag_desc;
621*4882a593Smuzhiyun 		unsigned long max_desc;
622*4882a593Smuzhiyun 		unsigned char *tags;
623*4882a593Smuzhiyun 
624*4882a593Smuzhiyun 		tag_desc = mm->context.tag_store;
625*4882a593Smuzhiyun 		max_desc = PAGE_SIZE/sizeof(tag_storage_desc_t);
626*4882a593Smuzhiyun 		for (i = 0; i < max_desc; i++) {
627*4882a593Smuzhiyun 			tags = tag_desc->tags;
628*4882a593Smuzhiyun 			tag_desc->tags = NULL;
629*4882a593Smuzhiyun 			kfree(tags);
630*4882a593Smuzhiyun 			tag_desc++;
631*4882a593Smuzhiyun 		}
632*4882a593Smuzhiyun 		kfree(mm->context.tag_store);
633*4882a593Smuzhiyun 		mm->context.tag_store = NULL;
634*4882a593Smuzhiyun 	}
635*4882a593Smuzhiyun }
636