// SPDX-License-Identifier: GPL-2.0-only
/*
 * Copyright (c) 2014, The Linux Foundation. All rights reserved.
 */
#include <linux/kernel.h>
#include <linux/mm.h>
#include <linux/module.h>
#include <linux/sched.h>
#include <linux/vmalloc.h>

#include <asm/cacheflush.h>
#include <asm/set_memory.h>
#include <asm/tlbflush.h>

struct page_change_data {
	pgprot_t set_mask;
	pgprot_t clear_mask;
};

bool rodata_full __ro_after_init = IS_ENABLED(CONFIG_RODATA_FULL_DEFAULT_ENABLED);

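/*
 * apply_to_page_range() callback: update one kernel PTE in place by
 * clearing cdata->clear_mask and then setting cdata->set_mask.
 */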
static int change_page_range(pte_t *ptep, unsigned long addr, void *data)
{
	struct page_change_data *cdata = data;
	pte_t pte = READ_ONCE(*ptep);

	pte = clear_pte_bit(pte, cdata->clear_mask);
	pte = set_pte_bit(pte, cdata->set_mask);

	set_pte(ptep, pte);
	return 0;
}

/*
 * This function assumes that the range is mapped with PAGE_SIZE pages.
 */
static int __change_memory_common(unsigned long start, unsigned long size,
				  pgprot_t set_mask, pgprot_t clear_mask)
{
	struct page_change_data data;
	int ret;

	data.set_mask = set_mask;
	data.clear_mask = clear_mask;

	ret = apply_to_page_range(&init_mm, start, size, change_page_range,
				  &data);

	flush_tlb_kernel_range(start, start + size);
	return ret;
}

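/*
 * Common helper for the set_memory_* functions below: sanity-check the
 * range, restrict it to a single vmalloc/vmap (VM_ALLOC) area, mirror
 * read-only changes into the linear map when rodata_full is set, and
 * finally apply the PTE bit changes with a TLB flush.
 */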
static int change_memory_common(unsigned long addr, int numpages,
				pgprot_t set_mask, pgprot_t clear_mask)
{
	unsigned long start = addr;
	unsigned long size = PAGE_SIZE * numpages;
	unsigned long end = start + size;
	struct vm_struct *area;
	int i;

	if (!PAGE_ALIGNED(addr)) {
		start &= PAGE_MASK;
		end = start + size;
		WARN_ON_ONCE(1);
	}

	/*
	 * Kernel VA mappings are always live, and splitting live section
	 * mappings into page mappings may cause TLB conflicts. This means
	 * we have to ensure that changing the permission bits of the range
	 * we are operating on does not result in such splitting.
	 *
	 * Let's restrict ourselves to mappings created by vmalloc (or vmap).
	 * Those are guaranteed to consist entirely of page mappings, and
	 * splitting is never needed.
	 *
	 * So check whether the [addr, addr + size) interval is entirely
	 * covered by precisely one VM area that has the VM_ALLOC flag set.
	 */
	area = find_vm_area((void *)addr);
	if (!area ||
	    end > (unsigned long)area->addr + area->size ||
	    !(area->flags & VM_ALLOC))
		return -EINVAL;

	if (!numpages)
		return 0;

	/*
	 * If we are manipulating read-only permissions, apply the same
	 * change to the linear mapping of the pages that back this VM area.
	 */
	if (rodata_full && (pgprot_val(set_mask) == PTE_RDONLY ||
			    pgprot_val(clear_mask) == PTE_RDONLY)) {
		for (i = 0; i < area->nr_pages; i++) {
			__change_memory_common((u64)page_address(area->pages[i]),
					       PAGE_SIZE, set_mask, clear_mask);
		}
	}

	/*
	 * Get rid of potentially aliasing lazily unmapped vm areas that may
	 * have permissions set that deviate from the ones we are setting here.
	 */
	vm_unmap_aliases();

	return __change_memory_common(start, size, set_mask, clear_mask);
}

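/*
 * Permission-changing entry points. These operate on page-aligned
 * vmalloc/vmap ranges only (enforced by change_memory_common()):
 * RO/RW toggle PTE_RDONLY and PTE_WRITE, while NX/X toggle PTE_PXN
 * (and PTE_MAYBE_GP, the BTI guarded-page bit, where configured).
 */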
int set_memory_ro(unsigned long addr, int numpages)
{
	return change_memory_common(addr, numpages,
					__pgprot(PTE_RDONLY),
					__pgprot(PTE_WRITE));
}

int set_memory_rw(unsigned long addr, int numpages)
{
	return change_memory_common(addr, numpages,
					__pgprot(PTE_WRITE),
					__pgprot(PTE_RDONLY));
}

int set_memory_nx(unsigned long addr, int numpages)
{
	return change_memory_common(addr, numpages,
					__pgprot(PTE_PXN),
					__pgprot(PTE_MAYBE_GP));
}

int set_memory_x(unsigned long addr, int numpages)
{
	return change_memory_common(addr, numpages,
					__pgprot(PTE_MAYBE_GP),
					__pgprot(PTE_PXN));
}

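/*
 * Illustrative usage only: callers hand these helpers a page-aligned
 * address inside a single vmalloc/vmap area plus a page count. The
 * buffer and sizes below are hypothetical, not part of this file.
 *
 *	void *buf = vmalloc(nr * PAGE_SIZE);
 *
 *	set_memory_ro((unsigned long)buf, nr);	// write-protect the range
 *	set_memory_x((unsigned long)buf, nr);	// allow execution
 *	...
 *	set_memory_nx((unsigned long)buf, nr);	// revoke execution
 *	set_memory_rw((unsigned long)buf, nr);	// make it writable again
 *	vfree(buf);
 */
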
int set_memory_valid(unsigned long addr, int numpages, int enable)
{
	if (enable)
		return __change_memory_common(addr, PAGE_SIZE * numpages,
					__pgprot(PTE_VALID),
					__pgprot(0));
	else
		return __change_memory_common(addr, PAGE_SIZE * numpages,
					__pgprot(0),
					__pgprot(PTE_VALID));
}

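/*
 * set_direct_map_{invalid,default}_noflush() adjust a single linear-map
 * (direct map) PTE without any TLB flushing; the caller is responsible
 * for that. They only act when rodata_full has forced the linear map
 * down to page granularity, and are no-ops returning 0 otherwise.
 */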
int set_direct_map_invalid_noflush(struct page *page)
{
	struct page_change_data data = {
		.set_mask = __pgprot(0),
		.clear_mask = __pgprot(PTE_VALID),
	};

	if (!rodata_full)
		return 0;

	return apply_to_page_range(&init_mm,
				   (unsigned long)page_address(page),
				   PAGE_SIZE, change_page_range, &data);
}

int set_direct_map_default_noflush(struct page *page)
{
	struct page_change_data data = {
		.set_mask = __pgprot(PTE_VALID | PTE_WRITE),
		.clear_mask = __pgprot(PTE_RDONLY),
	};

	if (!rodata_full)
		return 0;

	return apply_to_page_range(&init_mm,
				   (unsigned long)page_address(page),
				   PAGE_SIZE, change_page_range, &data);
}

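/*
 * Map (enable != 0) or unmap (enable == 0) @numpages linear-map pages
 * starting at @page. This is a no-op unless debug_pagealloc or
 * rodata_full guarantees the linear map is mapped at page granularity.
 */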
void __kernel_map_pages(struct page *page, int numpages, int enable)
{
	if (!debug_pagealloc_enabled() && !rodata_full)
		return;

	set_memory_valid((unsigned long)page_address(page), numpages, enable);
}

/*
 * This function is used to determine if a linear map page has been marked as
 * not-valid. Walk the page table and check the PTE_VALID bit. This is based
 * on kern_addr_valid(), which almost does what we need.
 *
 * Because this is only called on the kernel linear map, p?d_sect() implies
 * p?d_present(). When debug_pagealloc is enabled, section mappings are
 * disabled.
 */
bool kernel_page_present(struct page *page)
{
	pgd_t *pgdp;
	p4d_t *p4dp;
	pud_t *pudp, pud;
	pmd_t *pmdp, pmd;
	pte_t *ptep;
	unsigned long addr = (unsigned long)page_address(page);

	if (!debug_pagealloc_enabled() && !rodata_full)
		return true;

	pgdp = pgd_offset_k(addr);
	if (pgd_none(READ_ONCE(*pgdp)))
		return false;

	p4dp = p4d_offset(pgdp, addr);
	if (p4d_none(READ_ONCE(*p4dp)))
		return false;

	pudp = pud_offset(p4dp, addr);
	pud = READ_ONCE(*pudp);
	if (pud_none(pud))
		return false;
	if (pud_sect(pud))
		return true;

	pmdp = pmd_offset(pudp, addr);
	pmd = READ_ONCE(*pmdp);
	if (pmd_none(pmd))
		return false;
	if (pmd_sect(pmd))
		return true;

	ptep = pte_offset_kernel(pmdp, addr);
	return pte_valid(READ_ONCE(*ptep));
}