1*4882a593Smuzhiyun // SPDX-License-Identifier: GPL-2.0-or-later
2*4882a593Smuzhiyun /*
3*4882a593Smuzhiyun * Copyright (C) 2010 Loongson Inc. & Lemote Inc. &
4*4882a593Smuzhiyun * Institute of Computing Technology
5*4882a593Smuzhiyun * Author: Xiang Gao, gaoxiang@ict.ac.cn
6*4882a593Smuzhiyun * Huacai Chen, chenhc@lemote.com
7*4882a593Smuzhiyun * Xiaofu Meng, Shuangshuang Zhang
8*4882a593Smuzhiyun */
9*4882a593Smuzhiyun #include <linux/init.h>
10*4882a593Smuzhiyun #include <linux/kernel.h>
11*4882a593Smuzhiyun #include <linux/mm.h>
12*4882a593Smuzhiyun #include <linux/mmzone.h>
13*4882a593Smuzhiyun #include <linux/export.h>
14*4882a593Smuzhiyun #include <linux/nodemask.h>
15*4882a593Smuzhiyun #include <linux/swap.h>
16*4882a593Smuzhiyun #include <linux/memblock.h>
17*4882a593Smuzhiyun #include <linux/pfn.h>
18*4882a593Smuzhiyun #include <linux/highmem.h>
19*4882a593Smuzhiyun #include <asm/page.h>
20*4882a593Smuzhiyun #include <asm/pgalloc.h>
21*4882a593Smuzhiyun #include <asm/sections.h>
22*4882a593Smuzhiyun #include <linux/irq.h>
23*4882a593Smuzhiyun #include <asm/bootinfo.h>
24*4882a593Smuzhiyun #include <asm/mc146818-time.h>
25*4882a593Smuzhiyun #include <asm/time.h>
26*4882a593Smuzhiyun #include <asm/wbflush.h>
27*4882a593Smuzhiyun #include <boot_param.h>
28*4882a593Smuzhiyun
29*4882a593Smuzhiyun static struct pglist_data prealloc__node_data[MAX_NUMNODES];
30*4882a593Smuzhiyun unsigned char __node_distances[MAX_NUMNODES][MAX_NUMNODES];
31*4882a593Smuzhiyun EXPORT_SYMBOL(__node_distances);
32*4882a593Smuzhiyun struct pglist_data *__node_data[MAX_NUMNODES];
33*4882a593Smuzhiyun EXPORT_SYMBOL(__node_data);
34*4882a593Smuzhiyun
35*4882a593Smuzhiyun cpumask_t __node_cpumask[MAX_NUMNODES];
36*4882a593Smuzhiyun EXPORT_SYMBOL(__node_cpumask);
37*4882a593Smuzhiyun
enable_lpa(void)38*4882a593Smuzhiyun static void enable_lpa(void)
39*4882a593Smuzhiyun {
40*4882a593Smuzhiyun unsigned long value;
41*4882a593Smuzhiyun
42*4882a593Smuzhiyun value = __read_32bit_c0_register($16, 3);
43*4882a593Smuzhiyun value |= 0x00000080;
44*4882a593Smuzhiyun __write_32bit_c0_register($16, 3, value);
45*4882a593Smuzhiyun value = __read_32bit_c0_register($16, 3);
46*4882a593Smuzhiyun pr_info("CP0_Config3: CP0 16.3 (0x%lx)\n", value);
47*4882a593Smuzhiyun
48*4882a593Smuzhiyun value = __read_32bit_c0_register($5, 1);
49*4882a593Smuzhiyun value |= 0x20000000;
50*4882a593Smuzhiyun __write_32bit_c0_register($5, 1, value);
51*4882a593Smuzhiyun value = __read_32bit_c0_register($5, 1);
52*4882a593Smuzhiyun pr_info("CP0_PageGrain: CP0 5.1 (0x%lx)\n", value);
53*4882a593Smuzhiyun }
54*4882a593Smuzhiyun
cpu_node_probe(void)55*4882a593Smuzhiyun static void cpu_node_probe(void)
56*4882a593Smuzhiyun {
57*4882a593Smuzhiyun int i;
58*4882a593Smuzhiyun
59*4882a593Smuzhiyun nodes_clear(node_possible_map);
60*4882a593Smuzhiyun nodes_clear(node_online_map);
61*4882a593Smuzhiyun for (i = 0; i < loongson_sysconf.nr_nodes; i++) {
62*4882a593Smuzhiyun node_set_state(num_online_nodes(), N_POSSIBLE);
63*4882a593Smuzhiyun node_set_online(num_online_nodes());
64*4882a593Smuzhiyun }
65*4882a593Smuzhiyun
66*4882a593Smuzhiyun pr_info("NUMA: Discovered %d cpus on %d nodes\n",
67*4882a593Smuzhiyun loongson_sysconf.nr_cpus, num_online_nodes());
68*4882a593Smuzhiyun }
69*4882a593Smuzhiyun
compute_node_distance(int row,int col)70*4882a593Smuzhiyun static int __init compute_node_distance(int row, int col)
71*4882a593Smuzhiyun {
72*4882a593Smuzhiyun int package_row = row * loongson_sysconf.cores_per_node /
73*4882a593Smuzhiyun loongson_sysconf.cores_per_package;
74*4882a593Smuzhiyun int package_col = col * loongson_sysconf.cores_per_node /
75*4882a593Smuzhiyun loongson_sysconf.cores_per_package;
76*4882a593Smuzhiyun
77*4882a593Smuzhiyun if (col == row)
78*4882a593Smuzhiyun return LOCAL_DISTANCE;
79*4882a593Smuzhiyun else if (package_row == package_col)
80*4882a593Smuzhiyun return 40;
81*4882a593Smuzhiyun else
82*4882a593Smuzhiyun return 100;
83*4882a593Smuzhiyun }
84*4882a593Smuzhiyun
init_topology_matrix(void)85*4882a593Smuzhiyun static void __init init_topology_matrix(void)
86*4882a593Smuzhiyun {
87*4882a593Smuzhiyun int row, col;
88*4882a593Smuzhiyun
89*4882a593Smuzhiyun for (row = 0; row < MAX_NUMNODES; row++)
90*4882a593Smuzhiyun for (col = 0; col < MAX_NUMNODES; col++)
91*4882a593Smuzhiyun __node_distances[row][col] = -1;
92*4882a593Smuzhiyun
93*4882a593Smuzhiyun for_each_online_node(row) {
94*4882a593Smuzhiyun for_each_online_node(col) {
95*4882a593Smuzhiyun __node_distances[row][col] =
96*4882a593Smuzhiyun compute_node_distance(row, col);
97*4882a593Smuzhiyun }
98*4882a593Smuzhiyun }
99*4882a593Smuzhiyun }
100*4882a593Smuzhiyun
szmem(unsigned int node)101*4882a593Smuzhiyun static void __init szmem(unsigned int node)
102*4882a593Smuzhiyun {
103*4882a593Smuzhiyun u32 i, mem_type;
104*4882a593Smuzhiyun static unsigned long num_physpages;
105*4882a593Smuzhiyun u64 node_id, node_psize, start_pfn, end_pfn, mem_start, mem_size;
106*4882a593Smuzhiyun
107*4882a593Smuzhiyun /* Parse memory information and activate */
108*4882a593Smuzhiyun for (i = 0; i < loongson_memmap->nr_map; i++) {
109*4882a593Smuzhiyun node_id = loongson_memmap->map[i].node_id;
110*4882a593Smuzhiyun if (node_id != node)
111*4882a593Smuzhiyun continue;
112*4882a593Smuzhiyun
113*4882a593Smuzhiyun mem_type = loongson_memmap->map[i].mem_type;
114*4882a593Smuzhiyun mem_size = loongson_memmap->map[i].mem_size;
115*4882a593Smuzhiyun mem_start = loongson_memmap->map[i].mem_start;
116*4882a593Smuzhiyun
117*4882a593Smuzhiyun switch (mem_type) {
118*4882a593Smuzhiyun case SYSTEM_RAM_LOW:
119*4882a593Smuzhiyun start_pfn = ((node_id << 44) + mem_start) >> PAGE_SHIFT;
120*4882a593Smuzhiyun node_psize = (mem_size << 20) >> PAGE_SHIFT;
121*4882a593Smuzhiyun end_pfn = start_pfn + node_psize;
122*4882a593Smuzhiyun num_physpages += node_psize;
123*4882a593Smuzhiyun pr_info("Node%d: mem_type:%d, mem_start:0x%llx, mem_size:0x%llx MB\n",
124*4882a593Smuzhiyun (u32)node_id, mem_type, mem_start, mem_size);
125*4882a593Smuzhiyun pr_info(" start_pfn:0x%llx, end_pfn:0x%llx, num_physpages:0x%lx\n",
126*4882a593Smuzhiyun start_pfn, end_pfn, num_physpages);
127*4882a593Smuzhiyun memblock_add_node(PFN_PHYS(start_pfn),
128*4882a593Smuzhiyun PFN_PHYS(node_psize), node);
129*4882a593Smuzhiyun break;
130*4882a593Smuzhiyun case SYSTEM_RAM_HIGH:
131*4882a593Smuzhiyun start_pfn = ((node_id << 44) + mem_start) >> PAGE_SHIFT;
132*4882a593Smuzhiyun node_psize = (mem_size << 20) >> PAGE_SHIFT;
133*4882a593Smuzhiyun end_pfn = start_pfn + node_psize;
134*4882a593Smuzhiyun num_physpages += node_psize;
135*4882a593Smuzhiyun pr_info("Node%d: mem_type:%d, mem_start:0x%llx, mem_size:0x%llx MB\n",
136*4882a593Smuzhiyun (u32)node_id, mem_type, mem_start, mem_size);
137*4882a593Smuzhiyun pr_info(" start_pfn:0x%llx, end_pfn:0x%llx, num_physpages:0x%lx\n",
138*4882a593Smuzhiyun start_pfn, end_pfn, num_physpages);
139*4882a593Smuzhiyun memblock_add_node(PFN_PHYS(start_pfn),
140*4882a593Smuzhiyun PFN_PHYS(node_psize), node);
141*4882a593Smuzhiyun break;
142*4882a593Smuzhiyun case SYSTEM_RAM_RESERVED:
143*4882a593Smuzhiyun pr_info("Node%d: mem_type:%d, mem_start:0x%llx, mem_size:0x%llx MB\n",
144*4882a593Smuzhiyun (u32)node_id, mem_type, mem_start, mem_size);
145*4882a593Smuzhiyun memblock_reserve(((node_id << 44) + mem_start),
146*4882a593Smuzhiyun mem_size << 20);
147*4882a593Smuzhiyun break;
148*4882a593Smuzhiyun }
149*4882a593Smuzhiyun }
150*4882a593Smuzhiyun }
151*4882a593Smuzhiyun
node_mem_init(unsigned int node)152*4882a593Smuzhiyun static void __init node_mem_init(unsigned int node)
153*4882a593Smuzhiyun {
154*4882a593Smuzhiyun unsigned long node_addrspace_offset;
155*4882a593Smuzhiyun unsigned long start_pfn, end_pfn;
156*4882a593Smuzhiyun
157*4882a593Smuzhiyun node_addrspace_offset = nid_to_addrbase(node);
158*4882a593Smuzhiyun pr_info("Node%d's addrspace_offset is 0x%lx\n",
159*4882a593Smuzhiyun node, node_addrspace_offset);
160*4882a593Smuzhiyun
161*4882a593Smuzhiyun get_pfn_range_for_nid(node, &start_pfn, &end_pfn);
162*4882a593Smuzhiyun pr_info("Node%d: start_pfn=0x%lx, end_pfn=0x%lx\n",
163*4882a593Smuzhiyun node, start_pfn, end_pfn);
164*4882a593Smuzhiyun
165*4882a593Smuzhiyun __node_data[node] = prealloc__node_data + node;
166*4882a593Smuzhiyun
167*4882a593Smuzhiyun NODE_DATA(node)->node_start_pfn = start_pfn;
168*4882a593Smuzhiyun NODE_DATA(node)->node_spanned_pages = end_pfn - start_pfn;
169*4882a593Smuzhiyun
170*4882a593Smuzhiyun if (node == 0) {
171*4882a593Smuzhiyun /* kernel end address */
172*4882a593Smuzhiyun unsigned long kernel_end_pfn = PFN_UP(__pa_symbol(&_end));
173*4882a593Smuzhiyun
174*4882a593Smuzhiyun /* used by finalize_initrd() */
175*4882a593Smuzhiyun max_low_pfn = end_pfn;
176*4882a593Smuzhiyun
177*4882a593Smuzhiyun /* Reserve the kernel text/data/bss */
178*4882a593Smuzhiyun memblock_reserve(start_pfn << PAGE_SHIFT,
179*4882a593Smuzhiyun ((kernel_end_pfn - start_pfn) << PAGE_SHIFT));
180*4882a593Smuzhiyun
181*4882a593Smuzhiyun /* Reserve 0xfe000000~0xffffffff for RS780E integrated GPU */
182*4882a593Smuzhiyun if (node_end_pfn(0) >= (0xffffffff >> PAGE_SHIFT))
183*4882a593Smuzhiyun memblock_reserve((node_addrspace_offset | 0xfe000000),
184*4882a593Smuzhiyun 32 << 20);
185*4882a593Smuzhiyun
186*4882a593Smuzhiyun /* Reserve pfn range 0~node[0]->node_start_pfn */
187*4882a593Smuzhiyun memblock_reserve(0, PAGE_SIZE * start_pfn);
188*4882a593Smuzhiyun }
189*4882a593Smuzhiyun }
190*4882a593Smuzhiyun
prom_meminit(void)191*4882a593Smuzhiyun static __init void prom_meminit(void)
192*4882a593Smuzhiyun {
193*4882a593Smuzhiyun unsigned int node, cpu, active_cpu = 0;
194*4882a593Smuzhiyun
195*4882a593Smuzhiyun cpu_node_probe();
196*4882a593Smuzhiyun init_topology_matrix();
197*4882a593Smuzhiyun
198*4882a593Smuzhiyun for (node = 0; node < loongson_sysconf.nr_nodes; node++) {
199*4882a593Smuzhiyun if (node_online(node)) {
200*4882a593Smuzhiyun szmem(node);
201*4882a593Smuzhiyun node_mem_init(node);
202*4882a593Smuzhiyun cpumask_clear(&__node_cpumask[node]);
203*4882a593Smuzhiyun }
204*4882a593Smuzhiyun }
205*4882a593Smuzhiyun max_low_pfn = PHYS_PFN(memblock_end_of_DRAM());
206*4882a593Smuzhiyun
207*4882a593Smuzhiyun for (cpu = 0; cpu < loongson_sysconf.nr_cpus; cpu++) {
208*4882a593Smuzhiyun node = cpu / loongson_sysconf.cores_per_node;
209*4882a593Smuzhiyun if (node >= num_online_nodes())
210*4882a593Smuzhiyun node = 0;
211*4882a593Smuzhiyun
212*4882a593Smuzhiyun if (loongson_sysconf.reserved_cpus_mask & (1<<cpu))
213*4882a593Smuzhiyun continue;
214*4882a593Smuzhiyun
215*4882a593Smuzhiyun cpumask_set_cpu(active_cpu, &__node_cpumask[node]);
216*4882a593Smuzhiyun pr_info("NUMA: set cpumask cpu %d on node %d\n", active_cpu, node);
217*4882a593Smuzhiyun
218*4882a593Smuzhiyun active_cpu++;
219*4882a593Smuzhiyun }
220*4882a593Smuzhiyun }
221*4882a593Smuzhiyun
paging_init(void)222*4882a593Smuzhiyun void __init paging_init(void)
223*4882a593Smuzhiyun {
224*4882a593Smuzhiyun unsigned long zones_size[MAX_NR_ZONES] = {0, };
225*4882a593Smuzhiyun
226*4882a593Smuzhiyun pagetable_init();
227*4882a593Smuzhiyun zones_size[ZONE_DMA32] = MAX_DMA32_PFN;
228*4882a593Smuzhiyun zones_size[ZONE_NORMAL] = max_low_pfn;
229*4882a593Smuzhiyun free_area_init(zones_size);
230*4882a593Smuzhiyun }
231*4882a593Smuzhiyun
mem_init(void)232*4882a593Smuzhiyun void __init mem_init(void)
233*4882a593Smuzhiyun {
234*4882a593Smuzhiyun high_memory = (void *) __va(get_num_physpages() << PAGE_SHIFT);
235*4882a593Smuzhiyun memblock_free_all();
236*4882a593Smuzhiyun setup_zero_pages(); /* This comes from node 0 */
237*4882a593Smuzhiyun mem_init_print_info(NULL);
238*4882a593Smuzhiyun }
239*4882a593Smuzhiyun
/*
 * All PCI devices belong to logical Node-0, so the answer is 0 for every
 * bus; @bus itself is never examined.
 */
int pcibus_to_node(struct pci_bus *bus)
{
	return 0;
}
EXPORT_SYMBOL(pcibus_to_node);
246*4882a593Smuzhiyun
prom_init_numa_memory(void)247*4882a593Smuzhiyun void __init prom_init_numa_memory(void)
248*4882a593Smuzhiyun {
249*4882a593Smuzhiyun enable_lpa();
250*4882a593Smuzhiyun prom_meminit();
251*4882a593Smuzhiyun }
252*4882a593Smuzhiyun EXPORT_SYMBOL(prom_init_numa_memory);
253