xref: /OK3568_Linux_fs/kernel/arch/mips/loongson64/numa.c (revision 4882a59341e53eb6f0b4789bf948001014eff981)
1*4882a593Smuzhiyun // SPDX-License-Identifier: GPL-2.0-or-later
2*4882a593Smuzhiyun /*
3*4882a593Smuzhiyun  * Copyright (C) 2010 Loongson Inc. & Lemote Inc. &
4*4882a593Smuzhiyun  *                    Institute of Computing Technology
5*4882a593Smuzhiyun  * Author:  Xiang Gao, gaoxiang@ict.ac.cn
6*4882a593Smuzhiyun  *          Huacai Chen, chenhc@lemote.com
7*4882a593Smuzhiyun  *          Xiaofu Meng, Shuangshuang Zhang
8*4882a593Smuzhiyun  */
9*4882a593Smuzhiyun #include <linux/init.h>
10*4882a593Smuzhiyun #include <linux/kernel.h>
11*4882a593Smuzhiyun #include <linux/mm.h>
12*4882a593Smuzhiyun #include <linux/mmzone.h>
13*4882a593Smuzhiyun #include <linux/export.h>
14*4882a593Smuzhiyun #include <linux/nodemask.h>
15*4882a593Smuzhiyun #include <linux/swap.h>
16*4882a593Smuzhiyun #include <linux/memblock.h>
17*4882a593Smuzhiyun #include <linux/pfn.h>
18*4882a593Smuzhiyun #include <linux/highmem.h>
19*4882a593Smuzhiyun #include <asm/page.h>
20*4882a593Smuzhiyun #include <asm/pgalloc.h>
21*4882a593Smuzhiyun #include <asm/sections.h>
22*4882a593Smuzhiyun #include <linux/irq.h>
23*4882a593Smuzhiyun #include <asm/bootinfo.h>
24*4882a593Smuzhiyun #include <asm/mc146818-time.h>
25*4882a593Smuzhiyun #include <asm/time.h>
26*4882a593Smuzhiyun #include <asm/wbflush.h>
27*4882a593Smuzhiyun #include <boot_param.h>
28*4882a593Smuzhiyun 
/*
 * Static backing storage for the per-node pglist_data structures;
 * node_mem_init() points __node_data[node] at the matching element.
 */
29*4882a593Smuzhiyun static struct pglist_data prealloc__node_data[MAX_NUMNODES];
/*
 * Node-to-node distance table. init_topology_matrix() first stores -1 in
 * every cell and then fills in the cells for online node pairs.
 */
30*4882a593Smuzhiyun unsigned char __node_distances[MAX_NUMNODES][MAX_NUMNODES];
31*4882a593Smuzhiyun EXPORT_SYMBOL(__node_distances);
/* Per-node pglist_data pointers, set up by node_mem_init(). */
32*4882a593Smuzhiyun struct pglist_data *__node_data[MAX_NUMNODES];
33*4882a593Smuzhiyun EXPORT_SYMBOL(__node_data);
34*4882a593Smuzhiyun 
/* Per-node CPU masks, cleared and populated by prom_meminit(). */
35*4882a593Smuzhiyun cpumask_t __node_cpumask[MAX_NUMNODES];
36*4882a593Smuzhiyun EXPORT_SYMBOL(__node_cpumask);
37*4882a593Smuzhiyun 
enable_lpa(void)38*4882a593Smuzhiyun static void enable_lpa(void)
39*4882a593Smuzhiyun {
40*4882a593Smuzhiyun 	unsigned long value;
41*4882a593Smuzhiyun 
42*4882a593Smuzhiyun 	value = __read_32bit_c0_register($16, 3);
43*4882a593Smuzhiyun 	value |= 0x00000080;
44*4882a593Smuzhiyun 	__write_32bit_c0_register($16, 3, value);
45*4882a593Smuzhiyun 	value = __read_32bit_c0_register($16, 3);
46*4882a593Smuzhiyun 	pr_info("CP0_Config3: CP0 16.3 (0x%lx)\n", value);
47*4882a593Smuzhiyun 
48*4882a593Smuzhiyun 	value = __read_32bit_c0_register($5, 1);
49*4882a593Smuzhiyun 	value |= 0x20000000;
50*4882a593Smuzhiyun 	__write_32bit_c0_register($5, 1, value);
51*4882a593Smuzhiyun 	value = __read_32bit_c0_register($5, 1);
52*4882a593Smuzhiyun 	pr_info("CP0_PageGrain: CP0 5.1 (0x%lx)\n", value);
53*4882a593Smuzhiyun }
54*4882a593Smuzhiyun 
cpu_node_probe(void)55*4882a593Smuzhiyun static void cpu_node_probe(void)
56*4882a593Smuzhiyun {
57*4882a593Smuzhiyun 	int i;
58*4882a593Smuzhiyun 
59*4882a593Smuzhiyun 	nodes_clear(node_possible_map);
60*4882a593Smuzhiyun 	nodes_clear(node_online_map);
61*4882a593Smuzhiyun 	for (i = 0; i < loongson_sysconf.nr_nodes; i++) {
62*4882a593Smuzhiyun 		node_set_state(num_online_nodes(), N_POSSIBLE);
63*4882a593Smuzhiyun 		node_set_online(num_online_nodes());
64*4882a593Smuzhiyun 	}
65*4882a593Smuzhiyun 
66*4882a593Smuzhiyun 	pr_info("NUMA: Discovered %d cpus on %d nodes\n",
67*4882a593Smuzhiyun 		loongson_sysconf.nr_cpus, num_online_nodes());
68*4882a593Smuzhiyun }
69*4882a593Smuzhiyun 
compute_node_distance(int row,int col)70*4882a593Smuzhiyun static int __init compute_node_distance(int row, int col)
71*4882a593Smuzhiyun {
72*4882a593Smuzhiyun 	int package_row = row * loongson_sysconf.cores_per_node /
73*4882a593Smuzhiyun 				loongson_sysconf.cores_per_package;
74*4882a593Smuzhiyun 	int package_col = col * loongson_sysconf.cores_per_node /
75*4882a593Smuzhiyun 				loongson_sysconf.cores_per_package;
76*4882a593Smuzhiyun 
77*4882a593Smuzhiyun 	if (col == row)
78*4882a593Smuzhiyun 		return LOCAL_DISTANCE;
79*4882a593Smuzhiyun 	else if (package_row == package_col)
80*4882a593Smuzhiyun 		return 40;
81*4882a593Smuzhiyun 	else
82*4882a593Smuzhiyun 		return 100;
83*4882a593Smuzhiyun }
84*4882a593Smuzhiyun 
init_topology_matrix(void)85*4882a593Smuzhiyun static void __init init_topology_matrix(void)
86*4882a593Smuzhiyun {
87*4882a593Smuzhiyun 	int row, col;
88*4882a593Smuzhiyun 
89*4882a593Smuzhiyun 	for (row = 0; row < MAX_NUMNODES; row++)
90*4882a593Smuzhiyun 		for (col = 0; col < MAX_NUMNODES; col++)
91*4882a593Smuzhiyun 			__node_distances[row][col] = -1;
92*4882a593Smuzhiyun 
93*4882a593Smuzhiyun 	for_each_online_node(row) {
94*4882a593Smuzhiyun 		for_each_online_node(col) {
95*4882a593Smuzhiyun 			__node_distances[row][col] =
96*4882a593Smuzhiyun 				compute_node_distance(row, col);
97*4882a593Smuzhiyun 		}
98*4882a593Smuzhiyun 	}
99*4882a593Smuzhiyun }
100*4882a593Smuzhiyun 
szmem(unsigned int node)101*4882a593Smuzhiyun static void __init szmem(unsigned int node)
102*4882a593Smuzhiyun {
103*4882a593Smuzhiyun 	u32 i, mem_type;
104*4882a593Smuzhiyun 	static unsigned long num_physpages;
105*4882a593Smuzhiyun 	u64 node_id, node_psize, start_pfn, end_pfn, mem_start, mem_size;
106*4882a593Smuzhiyun 
107*4882a593Smuzhiyun 	/* Parse memory information and activate */
108*4882a593Smuzhiyun 	for (i = 0; i < loongson_memmap->nr_map; i++) {
109*4882a593Smuzhiyun 		node_id = loongson_memmap->map[i].node_id;
110*4882a593Smuzhiyun 		if (node_id != node)
111*4882a593Smuzhiyun 			continue;
112*4882a593Smuzhiyun 
113*4882a593Smuzhiyun 		mem_type = loongson_memmap->map[i].mem_type;
114*4882a593Smuzhiyun 		mem_size = loongson_memmap->map[i].mem_size;
115*4882a593Smuzhiyun 		mem_start = loongson_memmap->map[i].mem_start;
116*4882a593Smuzhiyun 
117*4882a593Smuzhiyun 		switch (mem_type) {
118*4882a593Smuzhiyun 		case SYSTEM_RAM_LOW:
119*4882a593Smuzhiyun 			start_pfn = ((node_id << 44) + mem_start) >> PAGE_SHIFT;
120*4882a593Smuzhiyun 			node_psize = (mem_size << 20) >> PAGE_SHIFT;
121*4882a593Smuzhiyun 			end_pfn  = start_pfn + node_psize;
122*4882a593Smuzhiyun 			num_physpages += node_psize;
123*4882a593Smuzhiyun 			pr_info("Node%d: mem_type:%d, mem_start:0x%llx, mem_size:0x%llx MB\n",
124*4882a593Smuzhiyun 				(u32)node_id, mem_type, mem_start, mem_size);
125*4882a593Smuzhiyun 			pr_info("       start_pfn:0x%llx, end_pfn:0x%llx, num_physpages:0x%lx\n",
126*4882a593Smuzhiyun 				start_pfn, end_pfn, num_physpages);
127*4882a593Smuzhiyun 			memblock_add_node(PFN_PHYS(start_pfn),
128*4882a593Smuzhiyun 				PFN_PHYS(node_psize), node);
129*4882a593Smuzhiyun 			break;
130*4882a593Smuzhiyun 		case SYSTEM_RAM_HIGH:
131*4882a593Smuzhiyun 			start_pfn = ((node_id << 44) + mem_start) >> PAGE_SHIFT;
132*4882a593Smuzhiyun 			node_psize = (mem_size << 20) >> PAGE_SHIFT;
133*4882a593Smuzhiyun 			end_pfn  = start_pfn + node_psize;
134*4882a593Smuzhiyun 			num_physpages += node_psize;
135*4882a593Smuzhiyun 			pr_info("Node%d: mem_type:%d, mem_start:0x%llx, mem_size:0x%llx MB\n",
136*4882a593Smuzhiyun 				(u32)node_id, mem_type, mem_start, mem_size);
137*4882a593Smuzhiyun 			pr_info("       start_pfn:0x%llx, end_pfn:0x%llx, num_physpages:0x%lx\n",
138*4882a593Smuzhiyun 				start_pfn, end_pfn, num_physpages);
139*4882a593Smuzhiyun 			memblock_add_node(PFN_PHYS(start_pfn),
140*4882a593Smuzhiyun 				PFN_PHYS(node_psize), node);
141*4882a593Smuzhiyun 			break;
142*4882a593Smuzhiyun 		case SYSTEM_RAM_RESERVED:
143*4882a593Smuzhiyun 			pr_info("Node%d: mem_type:%d, mem_start:0x%llx, mem_size:0x%llx MB\n",
144*4882a593Smuzhiyun 				(u32)node_id, mem_type, mem_start, mem_size);
145*4882a593Smuzhiyun 			memblock_reserve(((node_id << 44) + mem_start),
146*4882a593Smuzhiyun 				mem_size << 20);
147*4882a593Smuzhiyun 			break;
148*4882a593Smuzhiyun 		}
149*4882a593Smuzhiyun 	}
150*4882a593Smuzhiyun }
151*4882a593Smuzhiyun 
node_mem_init(unsigned int node)152*4882a593Smuzhiyun static void __init node_mem_init(unsigned int node)
153*4882a593Smuzhiyun {
154*4882a593Smuzhiyun 	unsigned long node_addrspace_offset;
155*4882a593Smuzhiyun 	unsigned long start_pfn, end_pfn;
156*4882a593Smuzhiyun 
157*4882a593Smuzhiyun 	node_addrspace_offset = nid_to_addrbase(node);
158*4882a593Smuzhiyun 	pr_info("Node%d's addrspace_offset is 0x%lx\n",
159*4882a593Smuzhiyun 			node, node_addrspace_offset);
160*4882a593Smuzhiyun 
161*4882a593Smuzhiyun 	get_pfn_range_for_nid(node, &start_pfn, &end_pfn);
162*4882a593Smuzhiyun 	pr_info("Node%d: start_pfn=0x%lx, end_pfn=0x%lx\n",
163*4882a593Smuzhiyun 		node, start_pfn, end_pfn);
164*4882a593Smuzhiyun 
165*4882a593Smuzhiyun 	__node_data[node] = prealloc__node_data + node;
166*4882a593Smuzhiyun 
167*4882a593Smuzhiyun 	NODE_DATA(node)->node_start_pfn = start_pfn;
168*4882a593Smuzhiyun 	NODE_DATA(node)->node_spanned_pages = end_pfn - start_pfn;
169*4882a593Smuzhiyun 
170*4882a593Smuzhiyun 	if (node == 0) {
171*4882a593Smuzhiyun 		/* kernel end address */
172*4882a593Smuzhiyun 		unsigned long kernel_end_pfn = PFN_UP(__pa_symbol(&_end));
173*4882a593Smuzhiyun 
174*4882a593Smuzhiyun 		/* used by finalize_initrd() */
175*4882a593Smuzhiyun 		max_low_pfn = end_pfn;
176*4882a593Smuzhiyun 
177*4882a593Smuzhiyun 		/* Reserve the kernel text/data/bss */
178*4882a593Smuzhiyun 		memblock_reserve(start_pfn << PAGE_SHIFT,
179*4882a593Smuzhiyun 				 ((kernel_end_pfn - start_pfn) << PAGE_SHIFT));
180*4882a593Smuzhiyun 
181*4882a593Smuzhiyun 		/* Reserve 0xfe000000~0xffffffff for RS780E integrated GPU */
182*4882a593Smuzhiyun 		if (node_end_pfn(0) >= (0xffffffff >> PAGE_SHIFT))
183*4882a593Smuzhiyun 			memblock_reserve((node_addrspace_offset | 0xfe000000),
184*4882a593Smuzhiyun 					 32 << 20);
185*4882a593Smuzhiyun 
186*4882a593Smuzhiyun 		/* Reserve pfn range 0~node[0]->node_start_pfn */
187*4882a593Smuzhiyun 		memblock_reserve(0, PAGE_SIZE * start_pfn);
188*4882a593Smuzhiyun 	}
189*4882a593Smuzhiyun }
190*4882a593Smuzhiyun 
prom_meminit(void)191*4882a593Smuzhiyun static __init void prom_meminit(void)
192*4882a593Smuzhiyun {
193*4882a593Smuzhiyun 	unsigned int node, cpu, active_cpu = 0;
194*4882a593Smuzhiyun 
195*4882a593Smuzhiyun 	cpu_node_probe();
196*4882a593Smuzhiyun 	init_topology_matrix();
197*4882a593Smuzhiyun 
198*4882a593Smuzhiyun 	for (node = 0; node < loongson_sysconf.nr_nodes; node++) {
199*4882a593Smuzhiyun 		if (node_online(node)) {
200*4882a593Smuzhiyun 			szmem(node);
201*4882a593Smuzhiyun 			node_mem_init(node);
202*4882a593Smuzhiyun 			cpumask_clear(&__node_cpumask[node]);
203*4882a593Smuzhiyun 		}
204*4882a593Smuzhiyun 	}
205*4882a593Smuzhiyun 	max_low_pfn = PHYS_PFN(memblock_end_of_DRAM());
206*4882a593Smuzhiyun 
207*4882a593Smuzhiyun 	for (cpu = 0; cpu < loongson_sysconf.nr_cpus; cpu++) {
208*4882a593Smuzhiyun 		node = cpu / loongson_sysconf.cores_per_node;
209*4882a593Smuzhiyun 		if (node >= num_online_nodes())
210*4882a593Smuzhiyun 			node = 0;
211*4882a593Smuzhiyun 
212*4882a593Smuzhiyun 		if (loongson_sysconf.reserved_cpus_mask & (1<<cpu))
213*4882a593Smuzhiyun 			continue;
214*4882a593Smuzhiyun 
215*4882a593Smuzhiyun 		cpumask_set_cpu(active_cpu, &__node_cpumask[node]);
216*4882a593Smuzhiyun 		pr_info("NUMA: set cpumask cpu %d on node %d\n", active_cpu, node);
217*4882a593Smuzhiyun 
218*4882a593Smuzhiyun 		active_cpu++;
219*4882a593Smuzhiyun 	}
220*4882a593Smuzhiyun }
221*4882a593Smuzhiyun 
paging_init(void)222*4882a593Smuzhiyun void __init paging_init(void)
223*4882a593Smuzhiyun {
224*4882a593Smuzhiyun 	unsigned long zones_size[MAX_NR_ZONES] = {0, };
225*4882a593Smuzhiyun 
226*4882a593Smuzhiyun 	pagetable_init();
227*4882a593Smuzhiyun 	zones_size[ZONE_DMA32] = MAX_DMA32_PFN;
228*4882a593Smuzhiyun 	zones_size[ZONE_NORMAL] = max_low_pfn;
229*4882a593Smuzhiyun 	free_area_init(zones_size);
230*4882a593Smuzhiyun }
231*4882a593Smuzhiyun 
mem_init(void)232*4882a593Smuzhiyun void __init mem_init(void)
233*4882a593Smuzhiyun {
234*4882a593Smuzhiyun 	high_memory = (void *) __va(get_num_physpages() << PAGE_SHIFT);
235*4882a593Smuzhiyun 	memblock_free_all();
236*4882a593Smuzhiyun 	setup_zero_pages();	/* This comes from node 0 */
237*4882a593Smuzhiyun 	mem_init_print_info(NULL);
238*4882a593Smuzhiyun }
239*4882a593Smuzhiyun 
/*
 * Report the NUMA node of a PCI bus.
 *
 * All PCI devices belong to logical node 0, so @bus is not examined and
 * the result is always 0.
 */
int pcibus_to_node(struct pci_bus *bus)
{
	return 0;
}
245*4882a593Smuzhiyun EXPORT_SYMBOL(pcibus_to_node);
246*4882a593Smuzhiyun 
prom_init_numa_memory(void)247*4882a593Smuzhiyun void __init prom_init_numa_memory(void)
248*4882a593Smuzhiyun {
249*4882a593Smuzhiyun 	enable_lpa();
250*4882a593Smuzhiyun 	prom_meminit();
251*4882a593Smuzhiyun }
252*4882a593Smuzhiyun EXPORT_SYMBOL(prom_init_numa_memory);
253