1*4882a593Smuzhiyun // SPDX-License-Identifier: GPL-2.0-only
2*4882a593Smuzhiyun /*
3*4882a593Smuzhiyun * Copyright (C) 2019 SiFive
4*4882a593Smuzhiyun */
5*4882a593Smuzhiyun
6*4882a593Smuzhiyun #include <linux/efi.h>
7*4882a593Smuzhiyun #include <linux/init.h>
8*4882a593Smuzhiyun #include <linux/debugfs.h>
9*4882a593Smuzhiyun #include <linux/seq_file.h>
10*4882a593Smuzhiyun #include <linux/ptdump.h>
11*4882a593Smuzhiyun
12*4882a593Smuzhiyun #include <asm/ptdump.h>
13*4882a593Smuzhiyun #include <linux/pgtable.h>
14*4882a593Smuzhiyun #include <asm/kasan.h>
15*4882a593Smuzhiyun
/*
 * Formatted output to a seq_file that silently does nothing when the
 * seq_file pointer is NULL (the W+X checker walks with no output sink).
 */
#define pt_dump_seq_printf(m, fmt, ...)				\
do {								\
	struct seq_file *__ptd_seq = (m);			\
								\
	if (__ptd_seq)						\
		seq_printf(__ptd_seq, fmt, ##__VA_ARGS__);	\
} while (0)
21*4882a593Smuzhiyun
/*
 * Emit a plain string to a seq_file, doing nothing when the seq_file
 * pointer is NULL.
 *
 * The string is written with seq_puts() rather than being handed to
 * seq_printf() as a format, so a '%' in the text can never be interpreted
 * as a conversion specifier.
 */
#define pt_dump_seq_puts(m, str)	\
({					\
	if (m)				\
		seq_puts(m, str);	\
})
27*4882a593Smuzhiyun
28*4882a593Smuzhiyun /*
29*4882a593Smuzhiyun * The page dumper groups page table entries of the same type into a single
30*4882a593Smuzhiyun * description. It uses pg_state to track the range information while
31*4882a593Smuzhiyun * iterating over the pte entries. When the continuity is broken it then
32*4882a593Smuzhiyun * dumps out a description of the range.
33*4882a593Smuzhiyun */
34*4882a593Smuzhiyun struct pg_state {
35*4882a593Smuzhiyun struct ptdump_state ptdump;
36*4882a593Smuzhiyun struct seq_file *seq;
37*4882a593Smuzhiyun const struct addr_marker *marker;
38*4882a593Smuzhiyun unsigned long start_address;
39*4882a593Smuzhiyun unsigned long start_pa;
40*4882a593Smuzhiyun unsigned long last_pa;
41*4882a593Smuzhiyun int level;
42*4882a593Smuzhiyun u64 current_prot;
43*4882a593Smuzhiyun bool check_wx;
44*4882a593Smuzhiyun unsigned long wx_pages;
45*4882a593Smuzhiyun };
46*4882a593Smuzhiyun
/**
 * struct addr_marker - labels the start of a virtual address region
 * @start_address: first virtual address of the region
 * @name:          text printed as the "---[ name ]---" region header
 */
struct addr_marker {
	unsigned long start_address;
	const char *name;
};
52*4882a593Smuzhiyun
/**
 * struct ptd_mm_info - per-debugfs-file description of what to dump
 * @mm:        address space whose page tables are walked
 * @markers:   region markers used to annotate the output
 * @base_addr: first virtual address of the walked range
 * @end:       end of the walked range
 *
 * A pointer to one of these is stored as the private data of each
 * debugfs file created by ptdump_init().
 */
struct ptd_mm_info {
	struct mm_struct *mm;
	const struct addr_marker *markers;
	unsigned long base_addr;
	unsigned long end;
};
60*4882a593Smuzhiyun
61*4882a593Smuzhiyun static struct addr_marker address_markers[] = {
62*4882a593Smuzhiyun #ifdef CONFIG_KASAN
63*4882a593Smuzhiyun {KASAN_SHADOW_START, "Kasan shadow start"},
64*4882a593Smuzhiyun {KASAN_SHADOW_END, "Kasan shadow end"},
65*4882a593Smuzhiyun #endif
66*4882a593Smuzhiyun {FIXADDR_START, "Fixmap start"},
67*4882a593Smuzhiyun {FIXADDR_TOP, "Fixmap end"},
68*4882a593Smuzhiyun {PCI_IO_START, "PCI I/O start"},
69*4882a593Smuzhiyun {PCI_IO_END, "PCI I/O end"},
70*4882a593Smuzhiyun #ifdef CONFIG_SPARSEMEM_VMEMMAP
71*4882a593Smuzhiyun {VMEMMAP_START, "vmemmap start"},
72*4882a593Smuzhiyun {VMEMMAP_END, "vmemmap end"},
73*4882a593Smuzhiyun #endif
74*4882a593Smuzhiyun {VMALLOC_START, "vmalloc() area"},
75*4882a593Smuzhiyun {VMALLOC_END, "vmalloc() end"},
76*4882a593Smuzhiyun {PAGE_OFFSET, "Linear mapping"},
77*4882a593Smuzhiyun {-1, NULL},
78*4882a593Smuzhiyun };
79*4882a593Smuzhiyun
80*4882a593Smuzhiyun static struct ptd_mm_info kernel_ptd_info = {
81*4882a593Smuzhiyun .mm = &init_mm,
82*4882a593Smuzhiyun .markers = address_markers,
83*4882a593Smuzhiyun .base_addr = KERN_VIRT_START,
84*4882a593Smuzhiyun .end = ULONG_MAX,
85*4882a593Smuzhiyun };
86*4882a593Smuzhiyun
#ifdef CONFIG_EFI
/* Region markers for the EFI address space, ending with a -1 sentinel. */
static struct addr_marker efi_addr_markers[] = {
	{ .start_address = 0,		.name = "UEFI runtime start" },
	{ .start_address = SZ_1G,	.name = "UEFI runtime end" },
	{ .start_address = -1,		.name = NULL },
};

/* Dump description behind the "efi_page_tables" debugfs file. */
static struct ptd_mm_info efi_ptd_info = {
	.mm		= &efi_mm,
	.base_addr	= 0,
	.end		= SZ_2G,
	.markers	= efi_addr_markers,
};
#endif
101*4882a593Smuzhiyun
102*4882a593Smuzhiyun /* Page Table Entry */
103*4882a593Smuzhiyun struct prot_bits {
104*4882a593Smuzhiyun u64 mask;
105*4882a593Smuzhiyun u64 val;
106*4882a593Smuzhiyun const char *set;
107*4882a593Smuzhiyun const char *clear;
108*4882a593Smuzhiyun };
109*4882a593Smuzhiyun
110*4882a593Smuzhiyun static const struct prot_bits pte_bits[] = {
111*4882a593Smuzhiyun {
112*4882a593Smuzhiyun .mask = _PAGE_SOFT,
113*4882a593Smuzhiyun .val = _PAGE_SOFT,
114*4882a593Smuzhiyun .set = "RSW",
115*4882a593Smuzhiyun .clear = " ",
116*4882a593Smuzhiyun }, {
117*4882a593Smuzhiyun .mask = _PAGE_DIRTY,
118*4882a593Smuzhiyun .val = _PAGE_DIRTY,
119*4882a593Smuzhiyun .set = "D",
120*4882a593Smuzhiyun .clear = ".",
121*4882a593Smuzhiyun }, {
122*4882a593Smuzhiyun .mask = _PAGE_ACCESSED,
123*4882a593Smuzhiyun .val = _PAGE_ACCESSED,
124*4882a593Smuzhiyun .set = "A",
125*4882a593Smuzhiyun .clear = ".",
126*4882a593Smuzhiyun }, {
127*4882a593Smuzhiyun .mask = _PAGE_GLOBAL,
128*4882a593Smuzhiyun .val = _PAGE_GLOBAL,
129*4882a593Smuzhiyun .set = "G",
130*4882a593Smuzhiyun .clear = ".",
131*4882a593Smuzhiyun }, {
132*4882a593Smuzhiyun .mask = _PAGE_USER,
133*4882a593Smuzhiyun .val = _PAGE_USER,
134*4882a593Smuzhiyun .set = "U",
135*4882a593Smuzhiyun .clear = ".",
136*4882a593Smuzhiyun }, {
137*4882a593Smuzhiyun .mask = _PAGE_EXEC,
138*4882a593Smuzhiyun .val = _PAGE_EXEC,
139*4882a593Smuzhiyun .set = "X",
140*4882a593Smuzhiyun .clear = ".",
141*4882a593Smuzhiyun }, {
142*4882a593Smuzhiyun .mask = _PAGE_WRITE,
143*4882a593Smuzhiyun .val = _PAGE_WRITE,
144*4882a593Smuzhiyun .set = "W",
145*4882a593Smuzhiyun .clear = ".",
146*4882a593Smuzhiyun }, {
147*4882a593Smuzhiyun .mask = _PAGE_READ,
148*4882a593Smuzhiyun .val = _PAGE_READ,
149*4882a593Smuzhiyun .set = "R",
150*4882a593Smuzhiyun .clear = ".",
151*4882a593Smuzhiyun }, {
152*4882a593Smuzhiyun .mask = _PAGE_PRESENT,
153*4882a593Smuzhiyun .val = _PAGE_PRESENT,
154*4882a593Smuzhiyun .set = "V",
155*4882a593Smuzhiyun .clear = ".",
156*4882a593Smuzhiyun }
157*4882a593Smuzhiyun };
158*4882a593Smuzhiyun
159*4882a593Smuzhiyun /* Page Level */
160*4882a593Smuzhiyun struct pg_level {
161*4882a593Smuzhiyun const char *name;
162*4882a593Smuzhiyun u64 mask;
163*4882a593Smuzhiyun };
164*4882a593Smuzhiyun
165*4882a593Smuzhiyun static struct pg_level pg_level[] = {
166*4882a593Smuzhiyun { /* pgd */
167*4882a593Smuzhiyun .name = "PGD",
168*4882a593Smuzhiyun }, { /* p4d */
169*4882a593Smuzhiyun .name = (CONFIG_PGTABLE_LEVELS > 4) ? "P4D" : "PGD",
170*4882a593Smuzhiyun }, { /* pud */
171*4882a593Smuzhiyun .name = (CONFIG_PGTABLE_LEVELS > 3) ? "PUD" : "PGD",
172*4882a593Smuzhiyun }, { /* pmd */
173*4882a593Smuzhiyun .name = (CONFIG_PGTABLE_LEVELS > 2) ? "PMD" : "PGD",
174*4882a593Smuzhiyun }, { /* pte */
175*4882a593Smuzhiyun .name = "PTE",
176*4882a593Smuzhiyun },
177*4882a593Smuzhiyun };
178*4882a593Smuzhiyun
dump_prot(struct pg_state * st)179*4882a593Smuzhiyun static void dump_prot(struct pg_state *st)
180*4882a593Smuzhiyun {
181*4882a593Smuzhiyun unsigned int i;
182*4882a593Smuzhiyun
183*4882a593Smuzhiyun for (i = 0; i < ARRAY_SIZE(pte_bits); i++) {
184*4882a593Smuzhiyun const char *s;
185*4882a593Smuzhiyun
186*4882a593Smuzhiyun if ((st->current_prot & pte_bits[i].mask) == pte_bits[i].val)
187*4882a593Smuzhiyun s = pte_bits[i].set;
188*4882a593Smuzhiyun else
189*4882a593Smuzhiyun s = pte_bits[i].clear;
190*4882a593Smuzhiyun
191*4882a593Smuzhiyun if (s)
192*4882a593Smuzhiyun pt_dump_seq_printf(st->seq, " %s", s);
193*4882a593Smuzhiyun }
194*4882a593Smuzhiyun }
195*4882a593Smuzhiyun
196*4882a593Smuzhiyun #ifdef CONFIG_64BIT
197*4882a593Smuzhiyun #define ADDR_FORMAT "0x%016lx"
198*4882a593Smuzhiyun #else
199*4882a593Smuzhiyun #define ADDR_FORMAT "0x%08lx"
200*4882a593Smuzhiyun #endif
dump_addr(struct pg_state * st,unsigned long addr)201*4882a593Smuzhiyun static void dump_addr(struct pg_state *st, unsigned long addr)
202*4882a593Smuzhiyun {
203*4882a593Smuzhiyun static const char units[] = "KMGTPE";
204*4882a593Smuzhiyun const char *unit = units;
205*4882a593Smuzhiyun unsigned long delta;
206*4882a593Smuzhiyun
207*4882a593Smuzhiyun pt_dump_seq_printf(st->seq, ADDR_FORMAT "-" ADDR_FORMAT " ",
208*4882a593Smuzhiyun st->start_address, addr);
209*4882a593Smuzhiyun
210*4882a593Smuzhiyun pt_dump_seq_printf(st->seq, " " ADDR_FORMAT " ", st->start_pa);
211*4882a593Smuzhiyun delta = (addr - st->start_address) >> 10;
212*4882a593Smuzhiyun
213*4882a593Smuzhiyun while (!(delta & 1023) && unit[1]) {
214*4882a593Smuzhiyun delta >>= 10;
215*4882a593Smuzhiyun unit++;
216*4882a593Smuzhiyun }
217*4882a593Smuzhiyun
218*4882a593Smuzhiyun pt_dump_seq_printf(st->seq, "%9lu%c %s", delta, *unit,
219*4882a593Smuzhiyun pg_level[st->level].name);
220*4882a593Smuzhiyun }
221*4882a593Smuzhiyun
note_prot_wx(struct pg_state * st,unsigned long addr)222*4882a593Smuzhiyun static void note_prot_wx(struct pg_state *st, unsigned long addr)
223*4882a593Smuzhiyun {
224*4882a593Smuzhiyun if (!st->check_wx)
225*4882a593Smuzhiyun return;
226*4882a593Smuzhiyun
227*4882a593Smuzhiyun if ((st->current_prot & (_PAGE_WRITE | _PAGE_EXEC)) !=
228*4882a593Smuzhiyun (_PAGE_WRITE | _PAGE_EXEC))
229*4882a593Smuzhiyun return;
230*4882a593Smuzhiyun
231*4882a593Smuzhiyun WARN_ONCE(1, "riscv/mm: Found insecure W+X mapping at address %p/%pS\n",
232*4882a593Smuzhiyun (void *)st->start_address, (void *)st->start_address);
233*4882a593Smuzhiyun
234*4882a593Smuzhiyun st->wx_pages += (addr - st->start_address) / PAGE_SIZE;
235*4882a593Smuzhiyun }
236*4882a593Smuzhiyun
/*
 * Walker callback, invoked for each entry the page table walk reports.
 *
 * @pt_st: generic walker state embedded in our struct pg_state
 * @addr:  virtual address of the entry
 * @level: page table level of the entry; negative means "no level", in
 *         which case the protection bits are treated as zero
 * @val:   raw entry value
 *
 * Extends the run in progress when the entry has the same protection bits
 * and level and is still inside the current marker region. Otherwise the
 * finished run is printed (and W+X-checked), any region headers that were
 * crossed are printed, and a new run is started at @addr.
 */
static void note_page(struct ptdump_state *pt_st, unsigned long addr,
		      int level, u64 val)
{
	struct pg_state *st = container_of(pt_st, struct pg_state, ptdump);
	u64 pa = PFN_PHYS(pte_pfn(__pte(val)));
	u64 prot = (level >= 0) ? (val & pg_level[level].mask) : 0;

	/* Nothing recorded yet: print the first header and open a run. */
	if (st->level == -1) {
		pt_dump_seq_printf(st->seq, "---[ %s ]---\n", st->marker->name);
		goto start_run;
	}

	/* Same attributes and same region: the run simply grows. */
	if (prot == st->current_prot && level == st->level &&
	    addr < st->marker[1].start_address) {
		st->last_pa = pa;
		return;
	}

	/* The run ended at addr; runs with no protection bits are not shown. */
	if (st->current_prot) {
		note_prot_wx(st, addr);
		dump_addr(st, addr);
		dump_prot(st);
		pt_dump_seq_puts(st->seq, "\n");
	}

	/* Print a header for every region boundary at or below addr. */
	while (addr >= st->marker[1].start_address) {
		st->marker++;
		pt_dump_seq_printf(st->seq, "---[ %s ]---\n",
				   st->marker->name);
	}

start_run:
	st->start_address = addr;
	st->start_pa = pa;
	st->last_pa = pa;
	st->current_prot = prot;
	st->level = level;
}
278*4882a593Smuzhiyun
ptdump_walk(struct seq_file * s,struct ptd_mm_info * pinfo)279*4882a593Smuzhiyun static void ptdump_walk(struct seq_file *s, struct ptd_mm_info *pinfo)
280*4882a593Smuzhiyun {
281*4882a593Smuzhiyun struct pg_state st = {
282*4882a593Smuzhiyun .seq = s,
283*4882a593Smuzhiyun .marker = pinfo->markers,
284*4882a593Smuzhiyun .level = -1,
285*4882a593Smuzhiyun .ptdump = {
286*4882a593Smuzhiyun .note_page = note_page,
287*4882a593Smuzhiyun .range = (struct ptdump_range[]) {
288*4882a593Smuzhiyun {pinfo->base_addr, pinfo->end},
289*4882a593Smuzhiyun {0, 0}
290*4882a593Smuzhiyun }
291*4882a593Smuzhiyun }
292*4882a593Smuzhiyun };
293*4882a593Smuzhiyun
294*4882a593Smuzhiyun ptdump_walk_pgd(&st.ptdump, pinfo->mm, NULL);
295*4882a593Smuzhiyun }
296*4882a593Smuzhiyun
ptdump_check_wx(void)297*4882a593Smuzhiyun void ptdump_check_wx(void)
298*4882a593Smuzhiyun {
299*4882a593Smuzhiyun struct pg_state st = {
300*4882a593Smuzhiyun .seq = NULL,
301*4882a593Smuzhiyun .marker = (struct addr_marker[]) {
302*4882a593Smuzhiyun {0, NULL},
303*4882a593Smuzhiyun {-1, NULL},
304*4882a593Smuzhiyun },
305*4882a593Smuzhiyun .level = -1,
306*4882a593Smuzhiyun .check_wx = true,
307*4882a593Smuzhiyun .ptdump = {
308*4882a593Smuzhiyun .note_page = note_page,
309*4882a593Smuzhiyun .range = (struct ptdump_range[]) {
310*4882a593Smuzhiyun {KERN_VIRT_START, ULONG_MAX},
311*4882a593Smuzhiyun {0, 0}
312*4882a593Smuzhiyun }
313*4882a593Smuzhiyun }
314*4882a593Smuzhiyun };
315*4882a593Smuzhiyun
316*4882a593Smuzhiyun ptdump_walk_pgd(&st.ptdump, &init_mm, NULL);
317*4882a593Smuzhiyun
318*4882a593Smuzhiyun if (st.wx_pages)
319*4882a593Smuzhiyun pr_warn("Checked W+X mappings: failed, %lu W+X pages found\n",
320*4882a593Smuzhiyun st.wx_pages);
321*4882a593Smuzhiyun else
322*4882a593Smuzhiyun pr_info("Checked W+X mappings: passed, no W+X pages found\n");
323*4882a593Smuzhiyun }
324*4882a593Smuzhiyun
ptdump_show(struct seq_file * m,void * v)325*4882a593Smuzhiyun static int ptdump_show(struct seq_file *m, void *v)
326*4882a593Smuzhiyun {
327*4882a593Smuzhiyun ptdump_walk(m, m->private);
328*4882a593Smuzhiyun
329*4882a593Smuzhiyun return 0;
330*4882a593Smuzhiyun }
331*4882a593Smuzhiyun
332*4882a593Smuzhiyun DEFINE_SHOW_ATTRIBUTE(ptdump);
333*4882a593Smuzhiyun
ptdump_init(void)334*4882a593Smuzhiyun static int ptdump_init(void)
335*4882a593Smuzhiyun {
336*4882a593Smuzhiyun unsigned int i, j;
337*4882a593Smuzhiyun
338*4882a593Smuzhiyun for (i = 0; i < ARRAY_SIZE(pg_level); i++)
339*4882a593Smuzhiyun for (j = 0; j < ARRAY_SIZE(pte_bits); j++)
340*4882a593Smuzhiyun pg_level[i].mask |= pte_bits[j].mask;
341*4882a593Smuzhiyun
342*4882a593Smuzhiyun debugfs_create_file("kernel_page_tables", 0400, NULL, &kernel_ptd_info,
343*4882a593Smuzhiyun &ptdump_fops);
344*4882a593Smuzhiyun #ifdef CONFIG_EFI
345*4882a593Smuzhiyun if (efi_enabled(EFI_RUNTIME_SERVICES))
346*4882a593Smuzhiyun debugfs_create_file("efi_page_tables", 0400, NULL, &efi_ptd_info,
347*4882a593Smuzhiyun &ptdump_fops);
348*4882a593Smuzhiyun #endif
349*4882a593Smuzhiyun
350*4882a593Smuzhiyun return 0;
351*4882a593Smuzhiyun }
352*4882a593Smuzhiyun
353*4882a593Smuzhiyun device_initcall(ptdump_init);
354