xref: /OK3568_Linux_fs/u-boot/arch/arm/cpu/armv8/cache_v8.c (revision 4882a59341e53eb6f0b4789bf948001014eff981)
1*4882a593Smuzhiyun /*
2*4882a593Smuzhiyun  * (C) Copyright 2013
3*4882a593Smuzhiyun  * David Feng <fenghua@phytium.com.cn>
4*4882a593Smuzhiyun  *
5*4882a593Smuzhiyun  * (C) Copyright 2016
6*4882a593Smuzhiyun  * Alexander Graf <agraf@suse.de>
7*4882a593Smuzhiyun  *
8*4882a593Smuzhiyun  * SPDX-License-Identifier:	GPL-2.0+
9*4882a593Smuzhiyun  */
10*4882a593Smuzhiyun 
11*4882a593Smuzhiyun #include <common.h>
12*4882a593Smuzhiyun #include <asm/system.h>
13*4882a593Smuzhiyun #include <asm/armv8/mmu.h>
14*4882a593Smuzhiyun 
15*4882a593Smuzhiyun DECLARE_GLOBAL_DATA_PTR;
16*4882a593Smuzhiyun 
17*4882a593Smuzhiyun #ifndef CONFIG_SYS_DCACHE_OFF
18*4882a593Smuzhiyun 
19*4882a593Smuzhiyun /*
20*4882a593Smuzhiyun  *  With 4k page granule, a virtual address is split into 4 lookup parts
21*4882a593Smuzhiyun  *  spanning 9 bits each:
22*4882a593Smuzhiyun  *
23*4882a593Smuzhiyun  *    _______________________________________________
24*4882a593Smuzhiyun  *   |       |       |       |       |       |       |
25*4882a593Smuzhiyun  *   |   0   |  Lv0  |  Lv1  |  Lv2  |  Lv3  |  off  |
26*4882a593Smuzhiyun  *   |_______|_______|_______|_______|_______|_______|
27*4882a593Smuzhiyun  *     63-48   47-39   38-30   29-21   20-12   11-00
28*4882a593Smuzhiyun  *
29*4882a593Smuzhiyun  *             mask        page size
30*4882a593Smuzhiyun  *
31*4882a593Smuzhiyun  *    Lv0: FF8000000000       --
32*4882a593Smuzhiyun  *    Lv1:   7FC0000000       1G
33*4882a593Smuzhiyun  *    Lv2:     3FE00000       2M
34*4882a593Smuzhiyun  *    Lv3:       1FF000       4K
35*4882a593Smuzhiyun  *    off:          FFF
36*4882a593Smuzhiyun  */
37*4882a593Smuzhiyun 
get_tcr(int el,u64 * pips,u64 * pva_bits)38*4882a593Smuzhiyun u64 get_tcr(int el, u64 *pips, u64 *pva_bits)
39*4882a593Smuzhiyun {
40*4882a593Smuzhiyun 	u64 max_addr = 0;
41*4882a593Smuzhiyun 	u64 ips, va_bits;
42*4882a593Smuzhiyun 	u64 tcr;
43*4882a593Smuzhiyun 	int i;
44*4882a593Smuzhiyun 
45*4882a593Smuzhiyun 	/* Find the largest address we need to support */
46*4882a593Smuzhiyun 	for (i = 0; mem_map[i].size || mem_map[i].attrs; i++)
47*4882a593Smuzhiyun 		max_addr = max(max_addr, mem_map[i].virt + mem_map[i].size);
48*4882a593Smuzhiyun 
49*4882a593Smuzhiyun 	/* Calculate the maximum physical (and thus virtual) address */
50*4882a593Smuzhiyun 	if (max_addr > (1ULL << 44)) {
51*4882a593Smuzhiyun 		ips = 5;
52*4882a593Smuzhiyun 		va_bits = 48;
53*4882a593Smuzhiyun 	} else  if (max_addr > (1ULL << 42)) {
54*4882a593Smuzhiyun 		ips = 4;
55*4882a593Smuzhiyun 		va_bits = 44;
56*4882a593Smuzhiyun 	} else  if (max_addr > (1ULL << 40)) {
57*4882a593Smuzhiyun 		ips = 3;
58*4882a593Smuzhiyun 		va_bits = 42;
59*4882a593Smuzhiyun 	} else  if (max_addr > (1ULL << 36)) {
60*4882a593Smuzhiyun 		ips = 2;
61*4882a593Smuzhiyun 		va_bits = 40;
62*4882a593Smuzhiyun 	} else  if (max_addr > (1ULL << 32)) {
63*4882a593Smuzhiyun 		ips = 1;
64*4882a593Smuzhiyun 		va_bits = 36;
65*4882a593Smuzhiyun 	} else {
66*4882a593Smuzhiyun 		ips = 0;
67*4882a593Smuzhiyun 		va_bits = 32;
68*4882a593Smuzhiyun 	}
69*4882a593Smuzhiyun 
70*4882a593Smuzhiyun 	if (el == 1) {
71*4882a593Smuzhiyun 		tcr = TCR_EL1_RSVD | (ips << 32) | TCR_EPD1_DISABLE;
72*4882a593Smuzhiyun 	} else if (el == 2) {
73*4882a593Smuzhiyun 		tcr = TCR_EL2_RSVD | (ips << 16);
74*4882a593Smuzhiyun 	} else {
75*4882a593Smuzhiyun 		tcr = TCR_EL3_RSVD | (ips << 16);
76*4882a593Smuzhiyun 	}
77*4882a593Smuzhiyun 
78*4882a593Smuzhiyun 	/* PTWs cacheable, inner/outer WBWA and inner shareable */
79*4882a593Smuzhiyun 	tcr |= TCR_TG0_4K | TCR_SHARED_INNER | TCR_ORGN_WBWA | TCR_IRGN_WBWA;
80*4882a593Smuzhiyun 	tcr |= TCR_T0SZ(va_bits);
81*4882a593Smuzhiyun 
82*4882a593Smuzhiyun 	if (pips)
83*4882a593Smuzhiyun 		*pips = ips;
84*4882a593Smuzhiyun 	if (pva_bits)
85*4882a593Smuzhiyun 		*pva_bits = va_bits;
86*4882a593Smuzhiyun 
87*4882a593Smuzhiyun 	return tcr;
88*4882a593Smuzhiyun }
89*4882a593Smuzhiyun 
90*4882a593Smuzhiyun #define MAX_PTE_ENTRIES 512
91*4882a593Smuzhiyun 
pte_type(u64 * pte)92*4882a593Smuzhiyun static int pte_type(u64 *pte)
93*4882a593Smuzhiyun {
94*4882a593Smuzhiyun 	return *pte & PTE_TYPE_MASK;
95*4882a593Smuzhiyun }
96*4882a593Smuzhiyun 
97*4882a593Smuzhiyun /* Returns the LSB number for a PTE on level <level> */
level2shift(int level)98*4882a593Smuzhiyun static int level2shift(int level)
99*4882a593Smuzhiyun {
100*4882a593Smuzhiyun 	/* Page is 12 bits wide, every level translates 9 bits */
101*4882a593Smuzhiyun 	return (12 + 9 * (3 - level));
102*4882a593Smuzhiyun }
103*4882a593Smuzhiyun 
find_pte(u64 addr,int level)104*4882a593Smuzhiyun static u64 *find_pte(u64 addr, int level)
105*4882a593Smuzhiyun {
106*4882a593Smuzhiyun 	int start_level = 0;
107*4882a593Smuzhiyun 	u64 *pte;
108*4882a593Smuzhiyun 	u64 idx;
109*4882a593Smuzhiyun 	u64 va_bits;
110*4882a593Smuzhiyun 	int i;
111*4882a593Smuzhiyun 
112*4882a593Smuzhiyun 	pr_debug("addr=%llx level=%d\n", addr, level);
113*4882a593Smuzhiyun 
114*4882a593Smuzhiyun 	get_tcr(0, NULL, &va_bits);
115*4882a593Smuzhiyun 	if (va_bits < 39)
116*4882a593Smuzhiyun 		start_level = 1;
117*4882a593Smuzhiyun 
118*4882a593Smuzhiyun 	if (level < start_level)
119*4882a593Smuzhiyun 		return NULL;
120*4882a593Smuzhiyun 
121*4882a593Smuzhiyun 	/* Walk through all page table levels to find our PTE */
122*4882a593Smuzhiyun 	pte = (u64*)gd->arch.tlb_addr;
123*4882a593Smuzhiyun 	for (i = start_level; i < 4; i++) {
124*4882a593Smuzhiyun 		idx = (addr >> level2shift(i)) & 0x1FF;
125*4882a593Smuzhiyun 		pte += idx;
126*4882a593Smuzhiyun 		pr_debug("idx=%llx PTE %p at level %d: %llx\n", idx, pte, i, *pte);
127*4882a593Smuzhiyun 
128*4882a593Smuzhiyun 		/* Found it */
129*4882a593Smuzhiyun 		if (i == level)
130*4882a593Smuzhiyun 			return pte;
131*4882a593Smuzhiyun 		/* PTE is no table (either invalid or block), can't traverse */
132*4882a593Smuzhiyun 		if (pte_type(pte) != PTE_TYPE_TABLE)
133*4882a593Smuzhiyun 			return NULL;
134*4882a593Smuzhiyun 		/* Off to the next level */
135*4882a593Smuzhiyun 		pte = (u64*)(*pte & 0x0000fffffffff000ULL);
136*4882a593Smuzhiyun 	}
137*4882a593Smuzhiyun 
138*4882a593Smuzhiyun 	/* Should never reach here */
139*4882a593Smuzhiyun 	return NULL;
140*4882a593Smuzhiyun }
141*4882a593Smuzhiyun 
142*4882a593Smuzhiyun /* Returns and creates a new full table (512 entries) */
create_table(void)143*4882a593Smuzhiyun static u64 *create_table(void)
144*4882a593Smuzhiyun {
145*4882a593Smuzhiyun 	u64 *new_table = (u64*)gd->arch.tlb_fillptr;
146*4882a593Smuzhiyun 	u64 pt_len = MAX_PTE_ENTRIES * sizeof(u64);
147*4882a593Smuzhiyun 
148*4882a593Smuzhiyun 	/* Allocate MAX_PTE_ENTRIES pte entries */
149*4882a593Smuzhiyun 	gd->arch.tlb_fillptr += pt_len;
150*4882a593Smuzhiyun 
151*4882a593Smuzhiyun 	if (gd->arch.tlb_fillptr - gd->arch.tlb_addr > gd->arch.tlb_size)
152*4882a593Smuzhiyun 		panic("Insufficient RAM for page table: 0x%lx > 0x%lx. "
153*4882a593Smuzhiyun 		      "Please increase the size in get_page_table_size()",
154*4882a593Smuzhiyun 			gd->arch.tlb_fillptr - gd->arch.tlb_addr,
155*4882a593Smuzhiyun 			gd->arch.tlb_size);
156*4882a593Smuzhiyun 
157*4882a593Smuzhiyun 	/* Mark all entries as invalid */
158*4882a593Smuzhiyun 	memset(new_table, 0, pt_len);
159*4882a593Smuzhiyun 
160*4882a593Smuzhiyun 	return new_table;
161*4882a593Smuzhiyun }
162*4882a593Smuzhiyun 
set_pte_table(u64 * pte,u64 * table)163*4882a593Smuzhiyun static void set_pte_table(u64 *pte, u64 *table)
164*4882a593Smuzhiyun {
165*4882a593Smuzhiyun 	/* Point *pte to the new table */
166*4882a593Smuzhiyun 	pr_debug("Setting %p to addr=%p\n", pte, table);
167*4882a593Smuzhiyun 	*pte = PTE_TYPE_TABLE | (ulong)table;
168*4882a593Smuzhiyun }
169*4882a593Smuzhiyun 
170*4882a593Smuzhiyun /* Splits a block PTE into table with subpages spanning the old block */
split_block(u64 * pte,int level)171*4882a593Smuzhiyun static void split_block(u64 *pte, int level)
172*4882a593Smuzhiyun {
173*4882a593Smuzhiyun 	u64 old_pte = *pte;
174*4882a593Smuzhiyun 	u64 *new_table;
175*4882a593Smuzhiyun 	u64 i = 0;
176*4882a593Smuzhiyun 	/* level describes the parent level, we need the child ones */
177*4882a593Smuzhiyun 	int levelshift = level2shift(level + 1);
178*4882a593Smuzhiyun 
179*4882a593Smuzhiyun 	if (pte_type(pte) != PTE_TYPE_BLOCK)
180*4882a593Smuzhiyun 		panic("PTE %p (%llx) is not a block. Some driver code wants to "
181*4882a593Smuzhiyun 		      "modify dcache settings for an range not covered in "
182*4882a593Smuzhiyun 		      "mem_map.", pte, old_pte);
183*4882a593Smuzhiyun 
184*4882a593Smuzhiyun 	new_table = create_table();
185*4882a593Smuzhiyun 	pr_debug("Splitting pte %p (%llx) into %p\n", pte, old_pte, new_table);
186*4882a593Smuzhiyun 
187*4882a593Smuzhiyun 	for (i = 0; i < MAX_PTE_ENTRIES; i++) {
188*4882a593Smuzhiyun 		new_table[i] = old_pte | (i << levelshift);
189*4882a593Smuzhiyun 
190*4882a593Smuzhiyun 		/* Level 3 block PTEs have the table type */
191*4882a593Smuzhiyun 		if ((level + 1) == 3)
192*4882a593Smuzhiyun 			new_table[i] |= PTE_TYPE_TABLE;
193*4882a593Smuzhiyun 
194*4882a593Smuzhiyun 		pr_debug("Setting new_table[%lld] = %llx\n", i, new_table[i]);
195*4882a593Smuzhiyun 	}
196*4882a593Smuzhiyun 
197*4882a593Smuzhiyun 	/* Set the new table into effect */
198*4882a593Smuzhiyun 	set_pte_table(pte, new_table);
199*4882a593Smuzhiyun }
200*4882a593Smuzhiyun 
201*4882a593Smuzhiyun /* Add one mm_region map entry to the page tables */
add_map(struct mm_region * map)202*4882a593Smuzhiyun static void add_map(struct mm_region *map)
203*4882a593Smuzhiyun {
204*4882a593Smuzhiyun 	u64 *pte;
205*4882a593Smuzhiyun 	u64 virt = map->virt;
206*4882a593Smuzhiyun 	u64 phys = map->phys;
207*4882a593Smuzhiyun 	u64 size = map->size;
208*4882a593Smuzhiyun 	u64 attrs = map->attrs | PTE_TYPE_BLOCK | PTE_BLOCK_AF;
209*4882a593Smuzhiyun 	u64 blocksize;
210*4882a593Smuzhiyun 	int level;
211*4882a593Smuzhiyun 	u64 *new_table;
212*4882a593Smuzhiyun 
213*4882a593Smuzhiyun 	while (size) {
214*4882a593Smuzhiyun 		pte = find_pte(virt, 0);
215*4882a593Smuzhiyun 		if (pte && (pte_type(pte) == PTE_TYPE_FAULT)) {
216*4882a593Smuzhiyun 			pr_debug("Creating table for virt 0x%llx\n", virt);
217*4882a593Smuzhiyun 			new_table = create_table();
218*4882a593Smuzhiyun 			set_pte_table(pte, new_table);
219*4882a593Smuzhiyun 		}
220*4882a593Smuzhiyun 
221*4882a593Smuzhiyun 		for (level = 1; level < 4; level++) {
222*4882a593Smuzhiyun 			pte = find_pte(virt, level);
223*4882a593Smuzhiyun 			if (!pte)
224*4882a593Smuzhiyun 				panic("pte not found\n");
225*4882a593Smuzhiyun 
226*4882a593Smuzhiyun 			blocksize = 1ULL << level2shift(level);
227*4882a593Smuzhiyun 			pr_debug("Checking if pte fits for virt=%llx size=%llx blocksize=%llx\n",
228*4882a593Smuzhiyun 			      virt, size, blocksize);
229*4882a593Smuzhiyun 			if (size >= blocksize && !(virt & (blocksize - 1))) {
230*4882a593Smuzhiyun 				/* Page fits, create block PTE */
231*4882a593Smuzhiyun 				pr_debug("Setting PTE %p to block virt=%llx\n",
232*4882a593Smuzhiyun 				      pte, virt);
233*4882a593Smuzhiyun 				if (level == 3)
234*4882a593Smuzhiyun 					*pte = phys | attrs | PTE_TYPE_PAGE;
235*4882a593Smuzhiyun 				else
236*4882a593Smuzhiyun 					*pte = phys | attrs;
237*4882a593Smuzhiyun 				virt += blocksize;
238*4882a593Smuzhiyun 				phys += blocksize;
239*4882a593Smuzhiyun 				size -= blocksize;
240*4882a593Smuzhiyun 				break;
241*4882a593Smuzhiyun 			} else if (pte_type(pte) == PTE_TYPE_FAULT) {
242*4882a593Smuzhiyun 				/* Page doesn't fit, create subpages */
243*4882a593Smuzhiyun 				pr_debug("Creating subtable for virt 0x%llx blksize=%llx\n",
244*4882a593Smuzhiyun 				      virt, blocksize);
245*4882a593Smuzhiyun 				new_table = create_table();
246*4882a593Smuzhiyun 				set_pte_table(pte, new_table);
247*4882a593Smuzhiyun 			} else if (pte_type(pte) == PTE_TYPE_BLOCK) {
248*4882a593Smuzhiyun 				pr_debug("Split block into subtable for virt 0x%llx blksize=0x%llx\n",
249*4882a593Smuzhiyun 				      virt, blocksize);
250*4882a593Smuzhiyun 				split_block(pte, level);
251*4882a593Smuzhiyun 			}
252*4882a593Smuzhiyun 		}
253*4882a593Smuzhiyun 	}
254*4882a593Smuzhiyun }
255*4882a593Smuzhiyun 
256*4882a593Smuzhiyun enum pte_type {
257*4882a593Smuzhiyun 	PTE_INVAL,
258*4882a593Smuzhiyun 	PTE_BLOCK,
259*4882a593Smuzhiyun 	PTE_LEVEL,
260*4882a593Smuzhiyun };
261*4882a593Smuzhiyun 
262*4882a593Smuzhiyun /*
263*4882a593Smuzhiyun  * This is a recursively called function to count the number of
264*4882a593Smuzhiyun  * page tables we need to cover a particular PTE range. If you
265*4882a593Smuzhiyun  * call this with level = -1 you basically get the full 48 bit
266*4882a593Smuzhiyun  * coverage.
267*4882a593Smuzhiyun  */
count_required_pts(u64 addr,int level,u64 maxaddr)268*4882a593Smuzhiyun static int count_required_pts(u64 addr, int level, u64 maxaddr)
269*4882a593Smuzhiyun {
270*4882a593Smuzhiyun 	int levelshift = level2shift(level);
271*4882a593Smuzhiyun 	u64 levelsize = 1ULL << levelshift;
272*4882a593Smuzhiyun 	u64 levelmask = levelsize - 1;
273*4882a593Smuzhiyun 	u64 levelend = addr + levelsize;
274*4882a593Smuzhiyun 	int r = 0;
275*4882a593Smuzhiyun 	int i;
276*4882a593Smuzhiyun 	enum pte_type pte_type = PTE_INVAL;
277*4882a593Smuzhiyun 
278*4882a593Smuzhiyun 	for (i = 0; mem_map[i].size || mem_map[i].attrs; i++) {
279*4882a593Smuzhiyun 		struct mm_region *map = &mem_map[i];
280*4882a593Smuzhiyun 		u64 start = map->virt;
281*4882a593Smuzhiyun 		u64 end = start + map->size;
282*4882a593Smuzhiyun 
283*4882a593Smuzhiyun 		/* Check if the PTE would overlap with the map */
284*4882a593Smuzhiyun 		if (max(addr, start) <= min(levelend, end)) {
285*4882a593Smuzhiyun 			start = max(addr, start);
286*4882a593Smuzhiyun 			end = min(levelend, end);
287*4882a593Smuzhiyun 
288*4882a593Smuzhiyun 			/* We need a sub-pt for this level */
289*4882a593Smuzhiyun 			if ((start & levelmask) || (end & levelmask)) {
290*4882a593Smuzhiyun 				pte_type = PTE_LEVEL;
291*4882a593Smuzhiyun 				break;
292*4882a593Smuzhiyun 			}
293*4882a593Smuzhiyun 
294*4882a593Smuzhiyun 			/* Lv0 can not do block PTEs, so do levels here too */
295*4882a593Smuzhiyun 			if (level <= 0) {
296*4882a593Smuzhiyun 				pte_type = PTE_LEVEL;
297*4882a593Smuzhiyun 				break;
298*4882a593Smuzhiyun 			}
299*4882a593Smuzhiyun 
300*4882a593Smuzhiyun 			/* PTE is active, but fits into a block */
301*4882a593Smuzhiyun 			pte_type = PTE_BLOCK;
302*4882a593Smuzhiyun 		}
303*4882a593Smuzhiyun 	}
304*4882a593Smuzhiyun 
305*4882a593Smuzhiyun 	/*
306*4882a593Smuzhiyun 	 * Block PTEs at this level are already covered by the parent page
307*4882a593Smuzhiyun 	 * table, so we only need to count sub page tables.
308*4882a593Smuzhiyun 	 */
309*4882a593Smuzhiyun 	if (pte_type == PTE_LEVEL) {
310*4882a593Smuzhiyun 		int sublevel = level + 1;
311*4882a593Smuzhiyun 		u64 sublevelsize = 1ULL << level2shift(sublevel);
312*4882a593Smuzhiyun 
313*4882a593Smuzhiyun 		/* Account for the new sub page table ... */
314*4882a593Smuzhiyun 		r = 1;
315*4882a593Smuzhiyun 
316*4882a593Smuzhiyun 		/* ... and for all child page tables that one might have */
317*4882a593Smuzhiyun 		for (i = 0; i < MAX_PTE_ENTRIES; i++) {
318*4882a593Smuzhiyun 			r += count_required_pts(addr, sublevel, maxaddr);
319*4882a593Smuzhiyun 			addr += sublevelsize;
320*4882a593Smuzhiyun 
321*4882a593Smuzhiyun 			if (addr >= maxaddr) {
322*4882a593Smuzhiyun 				/*
323*4882a593Smuzhiyun 				 * We reached the end of address space, no need
324*4882a593Smuzhiyun 				 * to look any further.
325*4882a593Smuzhiyun 				 */
326*4882a593Smuzhiyun 				break;
327*4882a593Smuzhiyun 			}
328*4882a593Smuzhiyun 		}
329*4882a593Smuzhiyun 	}
330*4882a593Smuzhiyun 
331*4882a593Smuzhiyun 	return r;
332*4882a593Smuzhiyun }
333*4882a593Smuzhiyun 
334*4882a593Smuzhiyun /* Returns the estimated required size of all page tables */
get_page_table_size(void)335*4882a593Smuzhiyun __weak u64 get_page_table_size(void)
336*4882a593Smuzhiyun {
337*4882a593Smuzhiyun 	u64 one_pt = MAX_PTE_ENTRIES * sizeof(u64);
338*4882a593Smuzhiyun 	u64 size = 0;
339*4882a593Smuzhiyun 	u64 va_bits;
340*4882a593Smuzhiyun 	int start_level = 0;
341*4882a593Smuzhiyun 
342*4882a593Smuzhiyun 	get_tcr(0, NULL, &va_bits);
343*4882a593Smuzhiyun 	if (va_bits < 39)
344*4882a593Smuzhiyun 		start_level = 1;
345*4882a593Smuzhiyun 
346*4882a593Smuzhiyun 	/* Account for all page tables we would need to cover our memory map */
347*4882a593Smuzhiyun 	size = one_pt * count_required_pts(0, start_level - 1, 1ULL << va_bits);
348*4882a593Smuzhiyun 
349*4882a593Smuzhiyun 	/*
350*4882a593Smuzhiyun 	 * We need to duplicate our page table once to have an emergency pt to
351*4882a593Smuzhiyun 	 * resort to when splitting page tables later on
352*4882a593Smuzhiyun 	 */
353*4882a593Smuzhiyun 	size *= 2;
354*4882a593Smuzhiyun 
355*4882a593Smuzhiyun 	/*
356*4882a593Smuzhiyun 	 * We may need to split page tables later on if dcache settings change,
357*4882a593Smuzhiyun 	 * so reserve up to 4 (random pick) page tables for that.
358*4882a593Smuzhiyun 	 */
359*4882a593Smuzhiyun 	size += one_pt * 4;
360*4882a593Smuzhiyun 
361*4882a593Smuzhiyun 	return size;
362*4882a593Smuzhiyun }
363*4882a593Smuzhiyun 
setup_pgtables(void)364*4882a593Smuzhiyun void setup_pgtables(void)
365*4882a593Smuzhiyun {
366*4882a593Smuzhiyun 	int i;
367*4882a593Smuzhiyun 
368*4882a593Smuzhiyun 	if (!gd->arch.tlb_fillptr || !gd->arch.tlb_addr)
369*4882a593Smuzhiyun 		panic("Page table pointer not setup.");
370*4882a593Smuzhiyun 
371*4882a593Smuzhiyun 	/*
372*4882a593Smuzhiyun 	 * Allocate the first level we're on with invalidate entries.
373*4882a593Smuzhiyun 	 * If the starting level is 0 (va_bits >= 39), then this is our
374*4882a593Smuzhiyun 	 * Lv0 page table, otherwise it's the entry Lv1 page table.
375*4882a593Smuzhiyun 	 */
376*4882a593Smuzhiyun 	create_table();
377*4882a593Smuzhiyun 
378*4882a593Smuzhiyun 	/* Now add all MMU table entries one after another to the table */
379*4882a593Smuzhiyun 	for (i = 0; mem_map[i].size || mem_map[i].attrs; i++)
380*4882a593Smuzhiyun 		add_map(&mem_map[i]);
381*4882a593Smuzhiyun }
382*4882a593Smuzhiyun 
setup_all_pgtables(void)383*4882a593Smuzhiyun static void setup_all_pgtables(void)
384*4882a593Smuzhiyun {
385*4882a593Smuzhiyun 	u64 tlb_addr = gd->arch.tlb_addr;
386*4882a593Smuzhiyun 	u64 tlb_size = gd->arch.tlb_size;
387*4882a593Smuzhiyun 
388*4882a593Smuzhiyun 	/* Reset the fill ptr */
389*4882a593Smuzhiyun 	gd->arch.tlb_fillptr = tlb_addr;
390*4882a593Smuzhiyun 
391*4882a593Smuzhiyun 	/* Create normal system page tables */
392*4882a593Smuzhiyun 	setup_pgtables();
393*4882a593Smuzhiyun 
394*4882a593Smuzhiyun 	/* Create emergency page tables */
395*4882a593Smuzhiyun 	gd->arch.tlb_size -= (uintptr_t)gd->arch.tlb_fillptr -
396*4882a593Smuzhiyun 			     (uintptr_t)gd->arch.tlb_addr;
397*4882a593Smuzhiyun 	gd->arch.tlb_addr = gd->arch.tlb_fillptr;
398*4882a593Smuzhiyun 	setup_pgtables();
399*4882a593Smuzhiyun 	gd->arch.tlb_emerg = gd->arch.tlb_addr;
400*4882a593Smuzhiyun 	gd->arch.tlb_addr = tlb_addr;
401*4882a593Smuzhiyun 	gd->arch.tlb_size = tlb_size;
402*4882a593Smuzhiyun }
403*4882a593Smuzhiyun 
404*4882a593Smuzhiyun /* to activate the MMU we need to set up virtual memory */
mmu_setup(void)405*4882a593Smuzhiyun __weak void mmu_setup(void)
406*4882a593Smuzhiyun {
407*4882a593Smuzhiyun 	int el;
408*4882a593Smuzhiyun 
409*4882a593Smuzhiyun 	/* Set up page tables only once */
410*4882a593Smuzhiyun 	if (!gd->arch.tlb_fillptr)
411*4882a593Smuzhiyun 		setup_all_pgtables();
412*4882a593Smuzhiyun 
413*4882a593Smuzhiyun 	el = current_el();
414*4882a593Smuzhiyun 	set_ttbr_tcr_mair(el, gd->arch.tlb_addr, get_tcr(el, NULL, NULL),
415*4882a593Smuzhiyun 			  MEMORY_ATTRIBUTES);
416*4882a593Smuzhiyun 
417*4882a593Smuzhiyun 	/* enable the mmu */
418*4882a593Smuzhiyun 	set_sctlr(get_sctlr() | CR_M);
419*4882a593Smuzhiyun }
420*4882a593Smuzhiyun 
421*4882a593Smuzhiyun /*
422*4882a593Smuzhiyun  * Performs a invalidation of the entire data cache at all levels
423*4882a593Smuzhiyun  */
invalidate_dcache_all(void)424*4882a593Smuzhiyun void invalidate_dcache_all(void)
425*4882a593Smuzhiyun {
426*4882a593Smuzhiyun 	__asm_invalidate_dcache_all();
427*4882a593Smuzhiyun 	__asm_invalidate_l3_dcache();
428*4882a593Smuzhiyun }
429*4882a593Smuzhiyun 
430*4882a593Smuzhiyun /*
431*4882a593Smuzhiyun  * Performs a clean & invalidation of the entire data cache at all levels.
432*4882a593Smuzhiyun  * This function needs to be inline to avoid using stack.
433*4882a593Smuzhiyun  * __asm_flush_l3_dcache return status of timeout
434*4882a593Smuzhiyun  */
flush_dcache_all(void)435*4882a593Smuzhiyun inline void flush_dcache_all(void)
436*4882a593Smuzhiyun {
437*4882a593Smuzhiyun 	int ret;
438*4882a593Smuzhiyun 
439*4882a593Smuzhiyun 	__asm_flush_dcache_all();
440*4882a593Smuzhiyun 	ret = __asm_flush_l3_dcache();
441*4882a593Smuzhiyun 	if (ret)
442*4882a593Smuzhiyun 		pr_debug("flushing dcache returns 0x%x\n", ret);
443*4882a593Smuzhiyun 	else
444*4882a593Smuzhiyun 		pr_debug("flushing dcache successfully.\n");
445*4882a593Smuzhiyun }
446*4882a593Smuzhiyun 
447*4882a593Smuzhiyun /*
448*4882a593Smuzhiyun  * Invalidates range in all levels of D-cache/unified cache
449*4882a593Smuzhiyun  */
invalidate_dcache_range(unsigned long start,unsigned long stop)450*4882a593Smuzhiyun void invalidate_dcache_range(unsigned long start, unsigned long stop)
451*4882a593Smuzhiyun {
452*4882a593Smuzhiyun 	__asm_invalidate_dcache_range(start, stop);
453*4882a593Smuzhiyun }
454*4882a593Smuzhiyun 
455*4882a593Smuzhiyun /*
456*4882a593Smuzhiyun  * Flush range(clean & invalidate) from all levels of D-cache/unified cache
457*4882a593Smuzhiyun  */
flush_dcache_range(unsigned long start,unsigned long stop)458*4882a593Smuzhiyun void flush_dcache_range(unsigned long start, unsigned long stop)
459*4882a593Smuzhiyun {
460*4882a593Smuzhiyun 	__asm_flush_dcache_range(start, stop);
461*4882a593Smuzhiyun }
462*4882a593Smuzhiyun 
dcache_enable(void)463*4882a593Smuzhiyun void dcache_enable(void)
464*4882a593Smuzhiyun {
465*4882a593Smuzhiyun 	/* The data cache is not active unless the mmu is enabled */
466*4882a593Smuzhiyun 	if (!(get_sctlr() & CR_M)) {
467*4882a593Smuzhiyun 		invalidate_dcache_all();
468*4882a593Smuzhiyun 		__asm_invalidate_tlb_all();
469*4882a593Smuzhiyun 		mmu_setup();
470*4882a593Smuzhiyun 	}
471*4882a593Smuzhiyun 
472*4882a593Smuzhiyun 	set_sctlr(get_sctlr() | CR_C);
473*4882a593Smuzhiyun }
474*4882a593Smuzhiyun 
dcache_disable(void)475*4882a593Smuzhiyun void dcache_disable(void)
476*4882a593Smuzhiyun {
477*4882a593Smuzhiyun 	uint32_t sctlr;
478*4882a593Smuzhiyun 
479*4882a593Smuzhiyun 	sctlr = get_sctlr();
480*4882a593Smuzhiyun 
481*4882a593Smuzhiyun 	/* if cache isn't enabled no need to disable */
482*4882a593Smuzhiyun 	if (!(sctlr & CR_C))
483*4882a593Smuzhiyun 		return;
484*4882a593Smuzhiyun 
485*4882a593Smuzhiyun 	set_sctlr(sctlr & ~(CR_C|CR_M));
486*4882a593Smuzhiyun 
487*4882a593Smuzhiyun 	flush_dcache_all();
488*4882a593Smuzhiyun 	__asm_invalidate_tlb_all();
489*4882a593Smuzhiyun }
490*4882a593Smuzhiyun 
dcache_status(void)491*4882a593Smuzhiyun int dcache_status(void)
492*4882a593Smuzhiyun {
493*4882a593Smuzhiyun 	return (get_sctlr() & CR_C) != 0;
494*4882a593Smuzhiyun }
495*4882a593Smuzhiyun 
arch_get_page_table(void)496*4882a593Smuzhiyun u64 *__weak arch_get_page_table(void) {
497*4882a593Smuzhiyun 	puts("No page table offset defined\n");
498*4882a593Smuzhiyun 
499*4882a593Smuzhiyun 	return NULL;
500*4882a593Smuzhiyun }
501*4882a593Smuzhiyun 
is_aligned(u64 addr,u64 size,u64 align)502*4882a593Smuzhiyun static bool is_aligned(u64 addr, u64 size, u64 align)
503*4882a593Smuzhiyun {
504*4882a593Smuzhiyun 	return !(addr & (align - 1)) && !(size & (align - 1));
505*4882a593Smuzhiyun }
506*4882a593Smuzhiyun 
507*4882a593Smuzhiyun /* Use flag to indicate if attrs has more than d-cache attributes */
set_one_region(u64 start,u64 size,u64 attrs,bool flag,int level)508*4882a593Smuzhiyun static u64 set_one_region(u64 start, u64 size, u64 attrs, bool flag, int level)
509*4882a593Smuzhiyun {
510*4882a593Smuzhiyun 	int levelshift = level2shift(level);
511*4882a593Smuzhiyun 	u64 levelsize = 1ULL << levelshift;
512*4882a593Smuzhiyun 	u64 *pte = find_pte(start, level);
513*4882a593Smuzhiyun 
514*4882a593Smuzhiyun 	/* Can we can just modify the current level block PTE? */
515*4882a593Smuzhiyun 	if (is_aligned(start, size, levelsize)) {
516*4882a593Smuzhiyun 		if (flag) {
517*4882a593Smuzhiyun 			*pte &= ~PMD_ATTRMASK;
518*4882a593Smuzhiyun 			*pte |= attrs & PMD_ATTRMASK;
519*4882a593Smuzhiyun 		} else {
520*4882a593Smuzhiyun 			*pte &= ~PMD_ATTRINDX_MASK;
521*4882a593Smuzhiyun 			*pte |= attrs & PMD_ATTRINDX_MASK;
522*4882a593Smuzhiyun 		}
523*4882a593Smuzhiyun 		pr_debug("Set attrs=%llx pte=%p level=%d\n", attrs, pte, level);
524*4882a593Smuzhiyun 
525*4882a593Smuzhiyun 		return levelsize;
526*4882a593Smuzhiyun 	}
527*4882a593Smuzhiyun 
528*4882a593Smuzhiyun 	/* Unaligned or doesn't fit, maybe split block into table */
529*4882a593Smuzhiyun 	pr_debug("addr=%llx level=%d pte=%p (%llx)\n", start, level, pte, *pte);
530*4882a593Smuzhiyun 
531*4882a593Smuzhiyun 	/* Maybe we need to split the block into a table */
532*4882a593Smuzhiyun 	if (pte_type(pte) == PTE_TYPE_BLOCK)
533*4882a593Smuzhiyun 		split_block(pte, level);
534*4882a593Smuzhiyun 
535*4882a593Smuzhiyun 	/* And then double-check it became a table or already is one */
536*4882a593Smuzhiyun 	if (pte_type(pte) != PTE_TYPE_TABLE)
537*4882a593Smuzhiyun 		panic("PTE %p (%llx) for addr=%llx should be a table",
538*4882a593Smuzhiyun 		      pte, *pte, start);
539*4882a593Smuzhiyun 
540*4882a593Smuzhiyun 	/* Roll on to the next page table level */
541*4882a593Smuzhiyun 	return 0;
542*4882a593Smuzhiyun }
543*4882a593Smuzhiyun 
mmu_set_region_dcache_behaviour(phys_addr_t start,size_t size,enum dcache_option option)544*4882a593Smuzhiyun void mmu_set_region_dcache_behaviour(phys_addr_t start, size_t size,
545*4882a593Smuzhiyun 				     enum dcache_option option)
546*4882a593Smuzhiyun {
547*4882a593Smuzhiyun 	u64 attrs = PMD_ATTRINDX(option);
548*4882a593Smuzhiyun 	u64 real_start = start;
549*4882a593Smuzhiyun 	u64 real_size = size;
550*4882a593Smuzhiyun 
551*4882a593Smuzhiyun 	pr_debug("start=%lx size=%lx\n", (ulong)start, (ulong)size);
552*4882a593Smuzhiyun 
553*4882a593Smuzhiyun 	if (!gd->arch.tlb_emerg)
554*4882a593Smuzhiyun 		panic("Emergency page table not setup.");
555*4882a593Smuzhiyun 
556*4882a593Smuzhiyun 	/*
557*4882a593Smuzhiyun 	 * We can not modify page tables that we're currently running on,
558*4882a593Smuzhiyun 	 * so we first need to switch to the "emergency" page tables where
559*4882a593Smuzhiyun 	 * we can safely modify our primary page tables and then switch back
560*4882a593Smuzhiyun 	 */
561*4882a593Smuzhiyun 	__asm_switch_ttbr(gd->arch.tlb_emerg);
562*4882a593Smuzhiyun 
563*4882a593Smuzhiyun 	/*
564*4882a593Smuzhiyun 	 * Loop through the address range until we find a page granule that fits
565*4882a593Smuzhiyun 	 * our alignment constraints, then set it to the new cache attributes
566*4882a593Smuzhiyun 	 */
567*4882a593Smuzhiyun 	while (size > 0) {
568*4882a593Smuzhiyun 		int level;
569*4882a593Smuzhiyun 		u64 r;
570*4882a593Smuzhiyun 
571*4882a593Smuzhiyun 		for (level = 1; level < 4; level++) {
572*4882a593Smuzhiyun 			/* Set d-cache attributes only */
573*4882a593Smuzhiyun 			r = set_one_region(start, size, attrs, false, level);
574*4882a593Smuzhiyun 			if (r) {
575*4882a593Smuzhiyun 				/* PTE successfully replaced */
576*4882a593Smuzhiyun 				size -= r;
577*4882a593Smuzhiyun 				start += r;
578*4882a593Smuzhiyun 				break;
579*4882a593Smuzhiyun 			}
580*4882a593Smuzhiyun 		}
581*4882a593Smuzhiyun 
582*4882a593Smuzhiyun 	}
583*4882a593Smuzhiyun 
584*4882a593Smuzhiyun 	/* We're done modifying page tables, switch back to our primary ones */
585*4882a593Smuzhiyun 	__asm_switch_ttbr(gd->arch.tlb_addr);
586*4882a593Smuzhiyun 
587*4882a593Smuzhiyun 	/*
588*4882a593Smuzhiyun 	 * Make sure there's nothing stale in dcache for a region that might
589*4882a593Smuzhiyun 	 * have caches off now
590*4882a593Smuzhiyun 	 */
591*4882a593Smuzhiyun 	flush_dcache_range(real_start, real_start + real_size);
592*4882a593Smuzhiyun }
593*4882a593Smuzhiyun 
594*4882a593Smuzhiyun /*
595*4882a593Smuzhiyun  * Modify MMU table for a region with updated PXN/UXN/Memory type/valid bits.
596*4882a593Smuzhiyun  * The procecess is break-before-make. The target region will be marked as
597*4882a593Smuzhiyun  * invalid during the process of changing.
598*4882a593Smuzhiyun  */
mmu_change_region_attr(phys_addr_t addr,size_t siz,u64 attrs)599*4882a593Smuzhiyun void mmu_change_region_attr(phys_addr_t addr, size_t siz, u64 attrs)
600*4882a593Smuzhiyun {
601*4882a593Smuzhiyun 	int level;
602*4882a593Smuzhiyun 	u64 r, size, start;
603*4882a593Smuzhiyun 
604*4882a593Smuzhiyun 	start = addr;
605*4882a593Smuzhiyun 	size = siz;
606*4882a593Smuzhiyun 	/*
607*4882a593Smuzhiyun 	 * Loop through the address range until we find a page granule that fits
608*4882a593Smuzhiyun 	 * our alignment constraints, then set it to "invalid".
609*4882a593Smuzhiyun 	 */
610*4882a593Smuzhiyun 	while (size > 0) {
611*4882a593Smuzhiyun 		for (level = 1; level < 4; level++) {
612*4882a593Smuzhiyun 			/* Set PTE to fault */
613*4882a593Smuzhiyun 			r = set_one_region(start, size, PTE_TYPE_FAULT, true,
614*4882a593Smuzhiyun 					   level);
615*4882a593Smuzhiyun 			if (r) {
616*4882a593Smuzhiyun 				/* PTE successfully invalidated */
617*4882a593Smuzhiyun 				size -= r;
618*4882a593Smuzhiyun 				start += r;
619*4882a593Smuzhiyun 				break;
620*4882a593Smuzhiyun 			}
621*4882a593Smuzhiyun 		}
622*4882a593Smuzhiyun 	}
623*4882a593Smuzhiyun 
624*4882a593Smuzhiyun 	flush_dcache_range(gd->arch.tlb_addr,
625*4882a593Smuzhiyun 			   gd->arch.tlb_addr + gd->arch.tlb_size);
626*4882a593Smuzhiyun 	__asm_invalidate_tlb_all();
627*4882a593Smuzhiyun 
628*4882a593Smuzhiyun 	/*
629*4882a593Smuzhiyun 	 * Loop through the address range until we find a page granule that fits
630*4882a593Smuzhiyun 	 * our alignment constraints, then set it to the new cache attributes
631*4882a593Smuzhiyun 	 */
632*4882a593Smuzhiyun 	start = addr;
633*4882a593Smuzhiyun 	size = siz;
634*4882a593Smuzhiyun 	while (size > 0) {
635*4882a593Smuzhiyun 		for (level = 1; level < 4; level++) {
636*4882a593Smuzhiyun 			/* Set PTE to new attributes */
637*4882a593Smuzhiyun 			r = set_one_region(start, size, attrs, true, level);
638*4882a593Smuzhiyun 			if (r) {
639*4882a593Smuzhiyun 				/* PTE successfully updated */
640*4882a593Smuzhiyun 				size -= r;
641*4882a593Smuzhiyun 				start += r;
642*4882a593Smuzhiyun 				break;
643*4882a593Smuzhiyun 			}
644*4882a593Smuzhiyun 		}
645*4882a593Smuzhiyun 	}
646*4882a593Smuzhiyun 	flush_dcache_range(gd->arch.tlb_addr,
647*4882a593Smuzhiyun 			   gd->arch.tlb_addr + gd->arch.tlb_size);
648*4882a593Smuzhiyun 	__asm_invalidate_tlb_all();
649*4882a593Smuzhiyun }
650*4882a593Smuzhiyun 
651*4882a593Smuzhiyun #else	/* CONFIG_SYS_DCACHE_OFF */
get_page_table_size(void)652*4882a593Smuzhiyun u64 get_page_table_size(void)
653*4882a593Smuzhiyun {
654*4882a593Smuzhiyun 	return SZ_64K;
655*4882a593Smuzhiyun }
656*4882a593Smuzhiyun /*
657*4882a593Smuzhiyun  * For SPL builds, we may want to not have dcache enabled. Any real U-Boot
658*4882a593Smuzhiyun  * running however really wants to have dcache and the MMU active. Check that
659*4882a593Smuzhiyun  * everything is sane and give the developer a hint if it isn't.
660*4882a593Smuzhiyun  */
invalidate_dcache_all(void)661*4882a593Smuzhiyun void invalidate_dcache_all(void)
662*4882a593Smuzhiyun {
663*4882a593Smuzhiyun }
664*4882a593Smuzhiyun 
flush_dcache_all(void)665*4882a593Smuzhiyun void flush_dcache_all(void)
666*4882a593Smuzhiyun {
667*4882a593Smuzhiyun }
668*4882a593Smuzhiyun 
dcache_enable(void)669*4882a593Smuzhiyun void dcache_enable(void)
670*4882a593Smuzhiyun {
671*4882a593Smuzhiyun }
672*4882a593Smuzhiyun 
dcache_disable(void)673*4882a593Smuzhiyun void dcache_disable(void)
674*4882a593Smuzhiyun {
675*4882a593Smuzhiyun }
676*4882a593Smuzhiyun 
dcache_status(void)677*4882a593Smuzhiyun int dcache_status(void)
678*4882a593Smuzhiyun {
679*4882a593Smuzhiyun 	return 0;
680*4882a593Smuzhiyun }
681*4882a593Smuzhiyun 
mmu_set_region_dcache_behaviour(phys_addr_t start,size_t size,enum dcache_option option)682*4882a593Smuzhiyun void mmu_set_region_dcache_behaviour(phys_addr_t start, size_t size,
683*4882a593Smuzhiyun 				     enum dcache_option option)
684*4882a593Smuzhiyun {
685*4882a593Smuzhiyun }
686*4882a593Smuzhiyun 
687*4882a593Smuzhiyun #endif	/* CONFIG_SYS_DCACHE_OFF */
688*4882a593Smuzhiyun 
689*4882a593Smuzhiyun #ifndef CONFIG_SYS_ICACHE_OFF
690*4882a593Smuzhiyun 
icache_enable(void)691*4882a593Smuzhiyun void icache_enable(void)
692*4882a593Smuzhiyun {
693*4882a593Smuzhiyun 	invalidate_icache_all();
694*4882a593Smuzhiyun 	set_sctlr(get_sctlr() | CR_I);
695*4882a593Smuzhiyun }
696*4882a593Smuzhiyun 
icache_disable(void)697*4882a593Smuzhiyun void icache_disable(void)
698*4882a593Smuzhiyun {
699*4882a593Smuzhiyun 	set_sctlr(get_sctlr() & ~CR_I);
700*4882a593Smuzhiyun }
701*4882a593Smuzhiyun 
icache_status(void)702*4882a593Smuzhiyun int icache_status(void)
703*4882a593Smuzhiyun {
704*4882a593Smuzhiyun 	return (get_sctlr() & CR_I) != 0;
705*4882a593Smuzhiyun }
706*4882a593Smuzhiyun 
invalidate_icache_all(void)707*4882a593Smuzhiyun void invalidate_icache_all(void)
708*4882a593Smuzhiyun {
709*4882a593Smuzhiyun 	__asm_invalidate_icache_all();
710*4882a593Smuzhiyun 	__asm_invalidate_l3_icache();
711*4882a593Smuzhiyun }
712*4882a593Smuzhiyun 
713*4882a593Smuzhiyun #else	/* CONFIG_SYS_ICACHE_OFF */
714*4882a593Smuzhiyun 
icache_enable(void)715*4882a593Smuzhiyun void icache_enable(void)
716*4882a593Smuzhiyun {
717*4882a593Smuzhiyun }
718*4882a593Smuzhiyun 
icache_disable(void)719*4882a593Smuzhiyun void icache_disable(void)
720*4882a593Smuzhiyun {
721*4882a593Smuzhiyun }
722*4882a593Smuzhiyun 
icache_status(void)723*4882a593Smuzhiyun int icache_status(void)
724*4882a593Smuzhiyun {
725*4882a593Smuzhiyun 	return 0;
726*4882a593Smuzhiyun }
727*4882a593Smuzhiyun 
invalidate_icache_all(void)728*4882a593Smuzhiyun void invalidate_icache_all(void)
729*4882a593Smuzhiyun {
730*4882a593Smuzhiyun }
731*4882a593Smuzhiyun 
732*4882a593Smuzhiyun #endif	/* CONFIG_SYS_ICACHE_OFF */
733*4882a593Smuzhiyun 
734*4882a593Smuzhiyun /*
735*4882a593Smuzhiyun  * Enable dCache & iCache, whether cache is actually enabled
736*4882a593Smuzhiyun  * depend on CONFIG_SYS_DCACHE_OFF and CONFIG_SYS_ICACHE_OFF
737*4882a593Smuzhiyun  */
enable_caches(void)738*4882a593Smuzhiyun void __weak enable_caches(void)
739*4882a593Smuzhiyun {
740*4882a593Smuzhiyun 	icache_enable();
741*4882a593Smuzhiyun 	dcache_enable();
742*4882a593Smuzhiyun }
743