xref: /OK3568_Linux_fs/kernel/arch/sparc/mm/tlb.c (revision 4882a59341e53eb6f0b4789bf948001014eff981)
1*4882a593Smuzhiyun // SPDX-License-Identifier: GPL-2.0
2*4882a593Smuzhiyun /* arch/sparc64/mm/tlb.c
3*4882a593Smuzhiyun  *
4*4882a593Smuzhiyun  * Copyright (C) 2004 David S. Miller <davem@redhat.com>
5*4882a593Smuzhiyun  */
6*4882a593Smuzhiyun 
7*4882a593Smuzhiyun #include <linux/kernel.h>
8*4882a593Smuzhiyun #include <linux/percpu.h>
9*4882a593Smuzhiyun #include <linux/mm.h>
10*4882a593Smuzhiyun #include <linux/swap.h>
11*4882a593Smuzhiyun #include <linux/preempt.h>
12*4882a593Smuzhiyun 
13*4882a593Smuzhiyun #include <asm/tlbflush.h>
14*4882a593Smuzhiyun #include <asm/cacheflush.h>
15*4882a593Smuzhiyun #include <asm/mmu_context.h>
16*4882a593Smuzhiyun #include <asm/tlb.h>
17*4882a593Smuzhiyun 
18*4882a593Smuzhiyun /* Heavily inspired by the ppc64 code.  */
19*4882a593Smuzhiyun 
/*
 * Per-CPU batch of user addresses whose TLB flush has been deferred.
 * The code in this file uses its tlb_nr, vaddrs[], mm, active and
 * hugepage_shift fields, and reaches it through get_cpu_var() or
 * this_cpu_ptr().
 */
20*4882a593Smuzhiyun static DEFINE_PER_CPU(struct tlb_batch, tlb_batch);
21*4882a593Smuzhiyun 
flush_tlb_pending(void)22*4882a593Smuzhiyun void flush_tlb_pending(void)
23*4882a593Smuzhiyun {
24*4882a593Smuzhiyun 	struct tlb_batch *tb = &get_cpu_var(tlb_batch);
25*4882a593Smuzhiyun 	struct mm_struct *mm = tb->mm;
26*4882a593Smuzhiyun 
27*4882a593Smuzhiyun 	if (!tb->tlb_nr)
28*4882a593Smuzhiyun 		goto out;
29*4882a593Smuzhiyun 
30*4882a593Smuzhiyun 	flush_tsb_user(tb);
31*4882a593Smuzhiyun 
32*4882a593Smuzhiyun 	if (CTX_VALID(mm->context)) {
33*4882a593Smuzhiyun 		if (tb->tlb_nr == 1) {
34*4882a593Smuzhiyun 			global_flush_tlb_page(mm, tb->vaddrs[0]);
35*4882a593Smuzhiyun 		} else {
36*4882a593Smuzhiyun #ifdef CONFIG_SMP
37*4882a593Smuzhiyun 			smp_flush_tlb_pending(tb->mm, tb->tlb_nr,
38*4882a593Smuzhiyun 					      &tb->vaddrs[0]);
39*4882a593Smuzhiyun #else
40*4882a593Smuzhiyun 			__flush_tlb_pending(CTX_HWBITS(tb->mm->context),
41*4882a593Smuzhiyun 					    tb->tlb_nr, &tb->vaddrs[0]);
42*4882a593Smuzhiyun #endif
43*4882a593Smuzhiyun 		}
44*4882a593Smuzhiyun 	}
45*4882a593Smuzhiyun 
46*4882a593Smuzhiyun 	tb->tlb_nr = 0;
47*4882a593Smuzhiyun 
48*4882a593Smuzhiyun out:
49*4882a593Smuzhiyun 	put_cpu_var(tlb_batch);
50*4882a593Smuzhiyun }
51*4882a593Smuzhiyun 
arch_enter_lazy_mmu_mode(void)52*4882a593Smuzhiyun void arch_enter_lazy_mmu_mode(void)
53*4882a593Smuzhiyun {
54*4882a593Smuzhiyun 	struct tlb_batch *tb = this_cpu_ptr(&tlb_batch);
55*4882a593Smuzhiyun 
56*4882a593Smuzhiyun 	tb->active = 1;
57*4882a593Smuzhiyun }
58*4882a593Smuzhiyun 
arch_leave_lazy_mmu_mode(void)59*4882a593Smuzhiyun void arch_leave_lazy_mmu_mode(void)
60*4882a593Smuzhiyun {
61*4882a593Smuzhiyun 	struct tlb_batch *tb = this_cpu_ptr(&tlb_batch);
62*4882a593Smuzhiyun 
63*4882a593Smuzhiyun 	if (tb->tlb_nr)
64*4882a593Smuzhiyun 		flush_tlb_pending();
65*4882a593Smuzhiyun 	tb->active = 0;
66*4882a593Smuzhiyun }
67*4882a593Smuzhiyun 
/*
 * Queue one user address for a TLB flush, or flush it right away when
 * this CPU's batch is not active.
 *
 * @mm:             address space the mapping belongs to
 * @vaddr:          virtual address; it is masked with PAGE_MASK here
 * @exec:           when true, bit 0 of the stored address is set
 * @hugepage_shift: page-size shift of the mapping being flushed
 *
 * A batch only ever holds entries for a single mm and a single
 * hugepage_shift; a change in either flushes the pending entries
 * first.  The batch is also flushed once it reaches TLB_BATCH_NR
 * entries.
 */
static void tlb_batch_add_one(struct mm_struct *mm, unsigned long vaddr,
			      bool exec, unsigned int hugepage_shift)
{
	struct tlb_batch *batch = &get_cpu_var(tlb_batch);
	unsigned long pending;

	/* Drop the in-page offset and encode the exec flag in bit 0. */
	vaddr = (vaddr & PAGE_MASK) | (exec ? 0x1UL : 0UL);

	pending = batch->tlb_nr;

	/* Entries queued for a different mm must go out before we continue. */
	if (unlikely(pending != 0 && batch->mm != mm)) {
		flush_tlb_pending();
		pending = 0;
	}

	if (batch->active) {
		/* An empty batch adopts the mm and page size of its first entry. */
		if (pending == 0) {
			batch->mm = mm;
			batch->hugepage_shift = hugepage_shift;
		}

		/* Page size changed: flush what is queued and start over. */
		if (batch->hugepage_shift != hugepage_shift) {
			flush_tlb_pending();
			batch->hugepage_shift = hugepage_shift;
			pending = 0;
		}

		batch->vaddrs[pending++] = vaddr;
		batch->tlb_nr = pending;

		if (pending >= TLB_BATCH_NR)
			flush_tlb_pending();
	} else {
		/* Not batching: flush this one address immediately. */
		flush_tsb_user_page(mm, vaddr, hugepage_shift);
		global_flush_tlb_page(mm, vaddr);
	}

	put_cpu_var(tlb_batch);
}
110*4882a593Smuzhiyun 
/*
 * Handle the removal or change of a user PTE: optionally flush the
 * D-cache for the page it mapped, then queue a TLB flush for @vaddr.
 *
 * @mm:             address space the PTE belongs to
 * @vaddr:          user virtual address the PTE mapped
 * @ptep:           pointer to the PTE (not used in this function)
 * @orig:           previous value of the PTE
 * @fullmm:         when non-zero, no TLB flush is queued for @vaddr
 * @hugepage_shift: page-size shift passed on to tlb_batch_add_one()
 */
void tlb_batch_add(struct mm_struct *mm, unsigned long vaddr,
		   pte_t *ptep, pte_t orig, int fullmm,
		   unsigned int hugepage_shift)
{
	/* The cache flush is only considered for dirty PTEs on non-hypervisor TLB types. */
	if (tlb_type != hypervisor && pte_dirty(orig)) {
		unsigned long pfn = pte_pfn(orig);

		if (pfn_valid(pfn)) {
			struct page *page = pfn_to_page(pfn);

			/* Only real file pages qualify: not reserved, and with a file mapping. */
			if (!PageReserved(page) && page_mapping_file(page)) {
				unsigned long kaddr;

				kaddr = (unsigned long) page_address(page);

				/*
				 * Flush only when the kernel and user addresses
				 * differ in bit 13.
				 * NOTE(review): presumably the D-cache alias
				 * bit - confirm.
				 */
				if ((kaddr ^ vaddr) & (1 << 13))
					flush_dcache_page_all(mm, page);
			}
		}
	}

	if (!fullmm)
		tlb_batch_add_one(mm, vaddr, pte_exec(orig), hugepage_shift);
}
142*4882a593Smuzhiyun 
143*4882a593Smuzhiyun #ifdef CONFIG_TRANSPARENT_HUGEPAGE
/*
 * Walk the PTEs covering the HPAGE_SIZE range that starts at @vaddr
 * under @pmd, and queue a base-page TLB flush for every entry that has
 * _PAGE_VALID set.
 *
 * @mm:    address space being modified
 * @vaddr: start of the range (the caller masks it with HPAGE_MASK)
 * @pmd:   PMD value whose PTE table is scanned
 */
static void tlb_batch_pmd_scan(struct mm_struct *mm, unsigned long vaddr,
			       pmd_t pmd)
{
	unsigned long end = vaddr + HPAGE_SIZE;
	pte_t *start_pte, *pte;

	start_pte = pte_offset_map(&pmd, vaddr);

	for (pte = start_pte; vaddr < end; pte++, vaddr += PAGE_SIZE) {
		if (pte_val(*pte) & _PAGE_VALID)
			tlb_batch_add_one(mm, vaddr, pte_exec(*pte),
					  PAGE_SHIFT);
	}

	/*
	 * Unmap using the pointer that pte_offset_map() returned.  After
	 * the loop the cursor has advanced past every scanned entry, so it
	 * is not the right argument for pte_unmap().
	 */
	pte_unmap(start_pte);
}
163*4882a593Smuzhiyun 
164*4882a593Smuzhiyun 
/*
 * Bookkeeping for a PMD that changed from @orig to @pmd in @mm: update
 * the huge-page counters in mm->context and queue TLB flushes for
 * whatever @orig mapped.  Nothing is done for init_mm.
 *
 * @mm:   address space the PMD belongs to
 * @addr: virtual address covered by the PMD (masked with HPAGE_MASK here)
 * @orig: previous PMD value
 * @pmd:  new PMD value
 */
static void __set_pmd_acct(struct mm_struct *mm, unsigned long addr,
			   pmd_t orig, pmd_t pmd)
{
	bool exec;

	if (mm == &init_mm)
		return;

	/* Counters only move when the _PAGE_PMD_HUGE bit actually flipped. */
	if ((pmd_val(orig) ^ pmd_val(pmd)) & _PAGE_PMD_HUGE) {
		bool now_huge = !!(pmd_val(pmd) & _PAGE_PMD_HUGE);
		/* The huge entry is the new one when installing, the old one when removing. */
		pmd_t huge = now_huge ? pmd : orig;
		bool zero_page = is_huge_zero_page(pmd_page(huge));

		/*
		 * This routine only sets pmds for THP pages; hugetlb pages
		 * are handled elsewhere.  The huge zero page is special:
		 * like a hugetlb page it has no RSS but still needs TSB
		 * entries, so it is counted in hugetlb_pte_count rather
		 * than thp_pte_count.
		 */
		if (now_huge) {
			if (zero_page)
				mm->context.hugetlb_pte_count++;
			else
				mm->context.thp_pte_count++;
		} else {
			if (zero_page)
				mm->context.hugetlb_pte_count--;
			else
				mm->context.thp_pte_count--;
		}

		/*
		 * No attempt is made here to allocate the TSB hash table
		 * if it does not exist yet: various locks are held, so that
		 * would be a GFP_KERNEL allocation in atomic context.  The
		 * first TLB miss on a hugepage takes care of it instead.
		 */
	}

	/* Nothing was mapped before, so there is nothing to flush. */
	if (pmd_none(orig))
		return;

	addr &= HPAGE_MASK;

	if (!pmd_trans_huge(orig)) {
		/* Old PMD pointed at a PTE table: flush each valid base page. */
		tlb_batch_pmd_scan(mm, addr, orig);
		return;
	}

	/* Old PMD was a huge mapping: flush both REAL_HPAGE_SIZE halves. */
	exec = pte_exec(__pte(pmd_val(orig)));
	tlb_batch_add_one(mm, addr, exec, REAL_HPAGE_SHIFT);
	tlb_batch_add_one(mm, addr + REAL_HPAGE_SIZE, exec, REAL_HPAGE_SHIFT);
}
216*4882a593Smuzhiyun 
/*
 * Store @pmd into *@pmdp, then run the accounting and TLB-flush
 * bookkeeping for the transition from the previous value.
 *
 * @mm:   address space the PMD belongs to
 * @addr: virtual address covered by the PMD
 * @pmdp: PMD slot to write
 * @pmd:  new PMD value
 */
void set_pmd_at(struct mm_struct *mm, unsigned long addr,
		pmd_t *pmdp, pmd_t pmd)
{
	pmd_t previous = *pmdp;

	*pmdp = pmd;

	__set_pmd_acct(mm, addr, previous, pmd);
}
225*4882a593Smuzhiyun 
/*
 * Replace *@pmdp with @pmd using a cmpxchg64() retry loop, run the
 * accounting for the transition, and return the value that was
 * replaced.
 *
 * @vma:     VMA whose vm_mm owns the PMD
 * @address: virtual address covered by the PMD
 * @pmdp:    PMD slot to update
 * @pmd:     new PMD value
 */
static inline pmd_t pmdp_establish(struct vm_area_struct *vma,
		unsigned long address, pmd_t *pmdp, pmd_t pmd)
{
	pmd_t prev;

	/* Retry until the slot still holds the value we sampled. */
	for (;;) {
		prev = *pmdp;
		if (cmpxchg64(&pmdp->pmd, prev.pmd, pmd.pmd) == prev.pmd)
			break;
	}

	__set_pmd_acct(vma->vm_mm, address, prev, pmd);

	return prev;
}
238*4882a593Smuzhiyun 
239*4882a593Smuzhiyun /*
240*4882a593Smuzhiyun  * This routine is only called when splitting a THP
241*4882a593Smuzhiyun  */
pmdp_invalidate(struct vm_area_struct * vma,unsigned long address,pmd_t * pmdp)242*4882a593Smuzhiyun pmd_t pmdp_invalidate(struct vm_area_struct *vma, unsigned long address,
243*4882a593Smuzhiyun 		     pmd_t *pmdp)
244*4882a593Smuzhiyun {
245*4882a593Smuzhiyun 	pmd_t old, entry;
246*4882a593Smuzhiyun 
247*4882a593Smuzhiyun 	entry = __pmd(pmd_val(*pmdp) & ~_PAGE_VALID);
248*4882a593Smuzhiyun 	old = pmdp_establish(vma, address, pmdp, entry);
249*4882a593Smuzhiyun 	flush_tlb_range(vma, address, address + HPAGE_PMD_SIZE);
250*4882a593Smuzhiyun 
251*4882a593Smuzhiyun 	/*
252*4882a593Smuzhiyun 	 * set_pmd_at() will not be called in a way to decrement
253*4882a593Smuzhiyun 	 * thp_pte_count when splitting a THP, so do it now.
254*4882a593Smuzhiyun 	 * Sanity check pmd before doing the actual decrement.
255*4882a593Smuzhiyun 	 */
256*4882a593Smuzhiyun 	if ((pmd_val(entry) & _PAGE_PMD_HUGE) &&
257*4882a593Smuzhiyun 	    !is_huge_zero_page(pmd_page(entry)))
258*4882a593Smuzhiyun 		(vma->vm_mm)->context.thp_pte_count--;
259*4882a593Smuzhiyun 
260*4882a593Smuzhiyun 	return old;
261*4882a593Smuzhiyun }
262*4882a593Smuzhiyun 
/*
 * Stash @pgtable on the list of deposited page tables reachable through
 * pmd_huge_pte(mm, pmdp).  The start of @pgtable itself is used as the
 * struct list_head linkage.  @pgtable becomes the new list head.
 *
 * Must be called with mm->page_table_lock held.
 */
void pgtable_trans_huge_deposit(struct mm_struct *mm, pmd_t *pmdp,
				pgtable_t pgtable)
{
	struct list_head *node = (struct list_head *) pgtable;

	assert_spin_locked(&mm->page_table_lock);

	if (pmd_huge_pte(mm, pmdp)) {
		/* Link in next to the page table that is currently the head. */
		list_add(node, (struct list_head *) pmd_huge_pte(mm, pmdp));
	} else {
		/* First deposit: start a fresh single-element list. */
		INIT_LIST_HEAD(node);
	}

	pmd_huge_pte(mm, pmdp) = pgtable;
}
277*4882a593Smuzhiyun 
pgtable_trans_huge_withdraw(struct mm_struct * mm,pmd_t * pmdp)278*4882a593Smuzhiyun pgtable_t pgtable_trans_huge_withdraw(struct mm_struct *mm, pmd_t *pmdp)
279*4882a593Smuzhiyun {
280*4882a593Smuzhiyun 	struct list_head *lh;
281*4882a593Smuzhiyun 	pgtable_t pgtable;
282*4882a593Smuzhiyun 
283*4882a593Smuzhiyun 	assert_spin_locked(&mm->page_table_lock);
284*4882a593Smuzhiyun 
285*4882a593Smuzhiyun 	/* FIFO */
286*4882a593Smuzhiyun 	pgtable = pmd_huge_pte(mm, pmdp);
287*4882a593Smuzhiyun 	lh = (struct list_head *) pgtable;
288*4882a593Smuzhiyun 	if (list_empty(lh))
289*4882a593Smuzhiyun 		pmd_huge_pte(mm, pmdp) = NULL;
290*4882a593Smuzhiyun 	else {
291*4882a593Smuzhiyun 		pmd_huge_pte(mm, pmdp) = (pgtable_t) lh->next;
292*4882a593Smuzhiyun 		list_del(lh);
293*4882a593Smuzhiyun 	}
294*4882a593Smuzhiyun 	pte_val(pgtable[0]) = 0;
295*4882a593Smuzhiyun 	pte_val(pgtable[1]) = 0;
296*4882a593Smuzhiyun 
297*4882a593Smuzhiyun 	return pgtable;
298*4882a593Smuzhiyun }
299*4882a593Smuzhiyun #endif /* CONFIG_TRANSPARENT_HUGEPAGE */
300