// SPDX-License-Identifier: GPL-2.0
/* arch/sparc64/mm/tlb.c
 *
 * Copyright (C) 2004 David S. Miller <davem@redhat.com>
 */

#include <linux/kernel.h>
#include <linux/percpu.h>
#include <linux/mm.h>
#include <linux/swap.h>
#include <linux/preempt.h>

#include <asm/tlbflush.h>
#include <asm/cacheflush.h>
#include <asm/mmu_context.h>
#include <asm/tlb.h>

/* Heavily inspired by the ppc64 code.  */

static DEFINE_PER_CPU(struct tlb_batch, tlb_batch);

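/* Drain this CPU's pending flush batch.  The TSB entries are torn down
 * first so a racing TLB miss cannot reinstall a translation that is
 * about to be shot down, then the queued addresses are flushed from the
 * TLB; a single-entry batch takes the cheaper one-page path.  If the mm
 * has no valid hardware context there is nothing in the TLB for it, and
 * only the TSB teardown is needed.
 */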
void flush_tlb_pending(void)
{
	struct tlb_batch *tb = &get_cpu_var(tlb_batch);
	struct mm_struct *mm = tb->mm;

	if (!tb->tlb_nr)
		goto out;

	flush_tsb_user(tb);

	if (CTX_VALID(mm->context)) {
		if (tb->tlb_nr == 1) {
			global_flush_tlb_page(mm, tb->vaddrs[0]);
		} else {
#ifdef CONFIG_SMP
			smp_flush_tlb_pending(tb->mm, tb->tlb_nr,
					      &tb->vaddrs[0]);
#else
			__flush_tlb_pending(CTX_HWBITS(tb->mm->context),
					    tb->tlb_nr, &tb->vaddrs[0]);
#endif
		}
	}

	tb->tlb_nr = 0;

out:
	put_cpu_var(tlb_batch);
}

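/* Lazy MMU mode brackets a run of page table updates: while ->active is
 * set, tlb_batch_add_one() queues addresses instead of flushing each one
 * immediately, and the batch is drained when the mode is left (or
 * earlier, if it fills up or switches to a different mm).
 */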
void arch_enter_lazy_mmu_mode(void)
{
	struct tlb_batch *tb = this_cpu_ptr(&tlb_batch);

	tb->active = 1;
}

void arch_leave_lazy_mmu_mode(void)
{
	struct tlb_batch *tb = this_cpu_ptr(&tlb_batch);

	if (tb->tlb_nr)
		flush_tlb_pending();
	tb->active = 0;
}

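/* Queue one user virtual address for a deferred TLB flush.  The low bit
 * of the page-aligned address records whether the mapping was executable.
 * A batch only ever covers a single mm and a single page size, so a
 * change of either drains the batch first; outside lazy MMU mode the
 * flush is performed synchronously instead of being queued.
 */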
static void tlb_batch_add_one(struct mm_struct *mm, unsigned long vaddr,
			      bool exec, unsigned int hugepage_shift)
{
	struct tlb_batch *tb = &get_cpu_var(tlb_batch);
	unsigned long nr;

	vaddr &= PAGE_MASK;
	if (exec)
		vaddr |= 0x1UL;

	nr = tb->tlb_nr;

	if (unlikely(nr != 0 && mm != tb->mm)) {
		flush_tlb_pending();
		nr = 0;
	}

	if (!tb->active) {
		flush_tsb_user_page(mm, vaddr, hugepage_shift);
		global_flush_tlb_page(mm, vaddr);
		goto out;
	}

	if (nr == 0) {
		tb->mm = mm;
		tb->hugepage_shift = hugepage_shift;
	}

	if (tb->hugepage_shift != hugepage_shift) {
		flush_tlb_pending();
		tb->hugepage_shift = hugepage_shift;
		nr = 0;
	}

	tb->vaddrs[nr] = vaddr;
	tb->tlb_nr = ++nr;
	if (nr >= TLB_BATCH_NR)
		flush_tlb_pending();

out:
	put_cpu_var(tlb_batch);
}

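/* Called from the page table teardown paths with the just-cleared PTE
 * value in @orig.  On pre-hypervisor (pre-sun4v) chips the D-cache is
 * virtually indexed and can alias when the kernel and user mappings of a
 * page differ in address bit 13, so a dirty file-backed page is flushed
 * from the D-cache before its translation disappears.  With @fullmm set
 * the whole address space is being torn down and the per-page TLB flush
 * is skipped.
 */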
void tlb_batch_add(struct mm_struct *mm, unsigned long vaddr,
		   pte_t *ptep, pte_t orig, int fullmm,
		   unsigned int hugepage_shift)
{
	if (tlb_type != hypervisor &&
	    pte_dirty(orig)) {
		unsigned long paddr, pfn = pte_pfn(orig);
		struct address_space *mapping;
		struct page *page;

		if (!pfn_valid(pfn))
			goto no_cache_flush;

		page = pfn_to_page(pfn);
		if (PageReserved(page))
			goto no_cache_flush;

		/* A real file page? */
		mapping = page_mapping_file(page);
		if (!mapping)
			goto no_cache_flush;

		paddr = (unsigned long) page_address(page);
		if ((paddr ^ vaddr) & (1 << 13))
			flush_dcache_page_all(mm, page);
	}

no_cache_flush:
	if (!fullmm)
		tlb_batch_add_one(mm, vaddr, pte_exec(orig), hugepage_shift);
}

#ifdef CONFIG_TRANSPARENT_HUGEPAGE
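/* The old PMD pointed at a regular page table rather than a huge page
 * (the non-huge case in __set_pmd_acct() below): walk the 8K PTEs under
 * it and queue a flush for every valid entry in the HPAGE_SIZE region.
 */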
static void tlb_batch_pmd_scan(struct mm_struct *mm, unsigned long vaddr,
			       pmd_t pmd)
{
	unsigned long end;
	pte_t *pte;

	pte = pte_offset_map(&pmd, vaddr);
	end = vaddr + HPAGE_SIZE;
	while (vaddr < end) {
		if (pte_val(*pte) & _PAGE_VALID) {
			bool exec = pte_exec(*pte);

			tlb_batch_add_one(mm, vaddr, exec, PAGE_SHIFT);
		}
		pte++;
		vaddr += PAGE_SIZE;
	}
	pte_unmap(pte);
}

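/* Accounting and TLB upkeep shared by set_pmd_at() and pmdp_establish():
 * keep the per-mm THP and huge-zero-page counts in sync when a mapping
 * changes between huge and non-huge, and queue TLB flushes for whatever
 * the old PMD mapped.  An HPAGE_SIZE mapping is built from two
 * REAL_HPAGE_SIZE hardware mappings, so both halves are queued.
 */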
static void __set_pmd_acct(struct mm_struct *mm, unsigned long addr,
			   pmd_t orig, pmd_t pmd)
{
	if (mm == &init_mm)
		return;

	if ((pmd_val(pmd) ^ pmd_val(orig)) & _PAGE_PMD_HUGE) {
		/*
		 * Note that this routine only sets pmds for THP pages.
		 * Hugetlb pages are handled elsewhere.  We need to check
		 * for huge zero page.  Huge zero pages are like hugetlb
		 * pages in that there is no RSS, but there is the need
		 * for TSB entries.  So, huge zero page counts go into
		 * hugetlb_pte_count.
		 */
		if (pmd_val(pmd) & _PAGE_PMD_HUGE) {
			if (is_huge_zero_page(pmd_page(pmd)))
				mm->context.hugetlb_pte_count++;
			else
				mm->context.thp_pte_count++;
		} else {
			if (is_huge_zero_page(pmd_page(orig)))
				mm->context.hugetlb_pte_count--;
			else
				mm->context.thp_pte_count--;
		}

		/* Do not try to allocate the TSB hash table if we
		 * don't have one already.  We have various locks held
		 * and thus we'll end up doing a GFP_KERNEL allocation
		 * in an atomic context.
		 *
		 * Instead, we let the first TLB miss on a hugepage
		 * take care of this.
		 */
	}

	if (!pmd_none(orig)) {
		addr &= HPAGE_MASK;
		if (pmd_trans_huge(orig)) {
			pte_t orig_pte = __pte(pmd_val(orig));
			bool exec = pte_exec(orig_pte);

			tlb_batch_add_one(mm, addr, exec, REAL_HPAGE_SHIFT);
			tlb_batch_add_one(mm, addr + REAL_HPAGE_SIZE, exec,
					  REAL_HPAGE_SHIFT);
		} else {
			tlb_batch_pmd_scan(mm, addr, orig);
		}
	}
}

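/* Plain (non-atomic) PMD store; callers hold the page table lock. */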
void set_pmd_at(struct mm_struct *mm, unsigned long addr,
		pmd_t *pmdp, pmd_t pmd)
{
	pmd_t orig = *pmdp;

	*pmdp = pmd;
	__set_pmd_acct(mm, addr, orig, pmd);
}

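/* Atomically replace *pmdp with @pmd and return the old value.  The
 * cmpxchg loop guarantees that a concurrent update of the entry (for
 * example an access/dirty bit being set by a TLB miss) is not lost.
 */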
static inline pmd_t pmdp_establish(struct vm_area_struct *vma,
		unsigned long address, pmd_t *pmdp, pmd_t pmd)
{
	pmd_t old;

	do {
		old = *pmdp;
	} while (cmpxchg64(&pmdp->pmd, old.pmd, pmd.pmd) != old.pmd);
	__set_pmd_acct(vma->vm_mm, address, old, pmd);

	return old;
}

/*
 * This routine is only called when splitting a THP
 */
pmd_t pmdp_invalidate(struct vm_area_struct *vma, unsigned long address,
		      pmd_t *pmdp)
{
	pmd_t old, entry;

	entry = __pmd(pmd_val(*pmdp) & ~_PAGE_VALID);
	old = pmdp_establish(vma, address, pmdp, entry);
	flush_tlb_range(vma, address, address + HPAGE_PMD_SIZE);

	/*
	 * set_pmd_at() will not be called in a way to decrement
	 * thp_pte_count when splitting a THP, so do it now.
	 * Sanity check pmd before doing the actual decrement.
	 */
	if ((pmd_val(entry) & _PAGE_PMD_HUGE) &&
	    !is_huge_zero_page(pmd_page(entry)))
		(vma->vm_mm)->context.thp_pte_count--;

	return old;
}

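/* THP keeps a spare page table deposited for each huge PMD so that a
 * later split cannot fail for lack of memory.  The deposited tables are
 * chained through their first two (unused) entries, which double as a
 * struct list_head, hanging off pmd_huge_pte(); deposit and withdraw
 * below push and pop that chain.
 */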
void pgtable_trans_huge_deposit(struct mm_struct *mm, pmd_t *pmdp,
				pgtable_t pgtable)
{
	struct list_head *lh = (struct list_head *) pgtable;

	assert_spin_locked(&mm->page_table_lock);

	/* FIFO */
	if (!pmd_huge_pte(mm, pmdp))
		INIT_LIST_HEAD(lh);
	else
		list_add(lh, (struct list_head *) pmd_huge_pte(mm, pmdp));
	pmd_huge_pte(mm, pmdp) = pgtable;
}

pgtable_t pgtable_trans_huge_withdraw(struct mm_struct *mm, pmd_t *pmdp)
{
	struct list_head *lh;
	pgtable_t pgtable;

	assert_spin_locked(&mm->page_table_lock);

	/* FIFO */
	pgtable = pmd_huge_pte(mm, pmdp);
	lh = (struct list_head *) pgtable;
	if (list_empty(lh))
		pmd_huge_pte(mm, pmdp) = NULL;
	else {
		pmd_huge_pte(mm, pmdp) = (pgtable_t) lh->next;
		list_del(lh);
	}
	pte_val(pgtable[0]) = 0;
	pte_val(pgtable[1]) = 0;

	return pgtable;
}
#endif /* CONFIG_TRANSPARENT_HUGEPAGE */