1*4882a593Smuzhiyun /*
2*4882a593Smuzhiyun * This file is subject to the terms and conditions of the GNU General Public
3*4882a593Smuzhiyun * License. See the file "COPYING" in the main directory of this archive
4*4882a593Smuzhiyun * for more details.
5*4882a593Smuzhiyun *
6*4882a593Smuzhiyun * SGI UV architectural definitions
7*4882a593Smuzhiyun *
8*4882a593Smuzhiyun * Copyright (C) 2008 Silicon Graphics, Inc. All rights reserved.
9*4882a593Smuzhiyun */
10*4882a593Smuzhiyun
11*4882a593Smuzhiyun #ifndef __ASM_IA64_UV_HUB_H__
12*4882a593Smuzhiyun #define __ASM_IA64_UV_HUB_H__
13*4882a593Smuzhiyun
14*4882a593Smuzhiyun #include <linux/numa.h>
15*4882a593Smuzhiyun #include <linux/percpu.h>
16*4882a593Smuzhiyun #include <asm/types.h>
17*4882a593Smuzhiyun #include <asm/percpu.h>
18*4882a593Smuzhiyun
19*4882a593Smuzhiyun
20*4882a593Smuzhiyun /*
21*4882a593Smuzhiyun * Addressing Terminology
22*4882a593Smuzhiyun *
23*4882a593Smuzhiyun * M - The low M bits of a physical address represent the offset
24*4882a593Smuzhiyun * into the blade local memory. RAM memory on a blade is physically
25*4882a593Smuzhiyun * contiguous (although various IO spaces may punch holes in
26*4882a593Smuzhiyun * it)..
27*4882a593Smuzhiyun *
28*4882a593Smuzhiyun * N - Number of bits in the node portion of a socket physical
29*4882a593Smuzhiyun * address.
30*4882a593Smuzhiyun *
31*4882a593Smuzhiyun * NASID - network ID of a router, Mbrick or Cbrick. Nasid values of
32*4882a593Smuzhiyun * routers always have low bit of 1, C/MBricks have low bit
33*4882a593Smuzhiyun * equal to 0. Most addressing macros that target UV hub chips
34*4882a593Smuzhiyun * right shift the NASID by 1 to exclude the always-zero bit.
35*4882a593Smuzhiyun * NASIDs contain up to 15 bits.
36*4882a593Smuzhiyun *
37*4882a593Smuzhiyun * GNODE - NASID right shifted by 1 bit. Most mmrs contain gnodes instead
38*4882a593Smuzhiyun * of nasids.
39*4882a593Smuzhiyun *
40*4882a593Smuzhiyun * PNODE - the low N bits of the GNODE. The PNODE is the most useful variant
41*4882a593Smuzhiyun * of the nasid for socket usage.
42*4882a593Smuzhiyun *
43*4882a593Smuzhiyun *
44*4882a593Smuzhiyun * NumaLink Global Physical Address Format:
45*4882a593Smuzhiyun * +--------------------------------+---------------------+
46*4882a593Smuzhiyun * |00..000| GNODE | NodeOffset |
47*4882a593Smuzhiyun * +--------------------------------+---------------------+
48*4882a593Smuzhiyun * |<-------53 - M bits --->|<--------M bits ----->
49*4882a593Smuzhiyun *
50*4882a593Smuzhiyun * M - number of node offset bits (35 .. 40)
51*4882a593Smuzhiyun *
52*4882a593Smuzhiyun *
53*4882a593Smuzhiyun * Memory/UV-HUB Processor Socket Address Format:
54*4882a593Smuzhiyun * +----------------+---------------+---------------------+
55*4882a593Smuzhiyun * |00..000000000000| PNODE | NodeOffset |
56*4882a593Smuzhiyun * +----------------+---------------+---------------------+
57*4882a593Smuzhiyun * <--- N bits --->|<--------M bits ----->
58*4882a593Smuzhiyun *
59*4882a593Smuzhiyun * M - number of node offset bits (35 .. 40)
60*4882a593Smuzhiyun * N - number of PNODE bits (0 .. 10)
61*4882a593Smuzhiyun *
62*4882a593Smuzhiyun * Note: M + N cannot currently exceed 44 (x86_64) or 46 (IA64).
63*4882a593Smuzhiyun * The actual values are configuration dependent and are set at
64*4882a593Smuzhiyun * boot time. M & N values are set by the hardware/BIOS at boot.
65*4882a593Smuzhiyun */
66*4882a593Smuzhiyun
67*4882a593Smuzhiyun
68*4882a593Smuzhiyun /*
69*4882a593Smuzhiyun * Maximum number of bricks in all partitions and in all coherency domains.
70*4882a593Smuzhiyun * This is the total number of bricks accessible in the numalink fabric. It
71*4882a593Smuzhiyun * includes all C & M bricks. Routers are NOT included.
72*4882a593Smuzhiyun *
73*4882a593Smuzhiyun * This value is also the value of the maximum number of non-router NASIDs
74*4882a593Smuzhiyun * in the numalink fabric.
75*4882a593Smuzhiyun *
76*4882a593Smuzhiyun * NOTE: a brick may contain 1 or 2 OS nodes. Don't get these confused.
77*4882a593Smuzhiyun */
78*4882a593Smuzhiyun #define UV_MAX_NUMALINK_BLADES 16384
79*4882a593Smuzhiyun
80*4882a593Smuzhiyun /*
81*4882a593Smuzhiyun * Maximum number of C/Mbricks within a software SSI (hardware may support
82*4882a593Smuzhiyun * more).
83*4882a593Smuzhiyun */
84*4882a593Smuzhiyun #define UV_MAX_SSI_BLADES 1
85*4882a593Smuzhiyun
86*4882a593Smuzhiyun /*
87*4882a593Smuzhiyun * The largest possible NASID of a C or M brick (+ 2)
88*4882a593Smuzhiyun */
89*4882a593Smuzhiyun #define UV_MAX_NASID_VALUE (UV_MAX_NUMALINK_NODES * 2)
90*4882a593Smuzhiyun
91*4882a593Smuzhiyun /*
92*4882a593Smuzhiyun * The following defines attributes of the HUB chip. These attributes are
93*4882a593Smuzhiyun * frequently referenced and are kept in the per-cpu data areas of each cpu.
94*4882a593Smuzhiyun * They are kept together in a struct to minimize cache misses.
95*4882a593Smuzhiyun */
96*4882a593Smuzhiyun struct uv_hub_info_s {
97*4882a593Smuzhiyun unsigned long global_mmr_base;
98*4882a593Smuzhiyun unsigned long gpa_mask;
99*4882a593Smuzhiyun unsigned long gnode_upper;
100*4882a593Smuzhiyun unsigned long lowmem_remap_top;
101*4882a593Smuzhiyun unsigned long lowmem_remap_base;
102*4882a593Smuzhiyun unsigned short pnode;
103*4882a593Smuzhiyun unsigned short pnode_mask;
104*4882a593Smuzhiyun unsigned short coherency_domain_number;
105*4882a593Smuzhiyun unsigned short numa_blade_id;
106*4882a593Smuzhiyun unsigned char blade_processor_id;
107*4882a593Smuzhiyun unsigned char m_val;
108*4882a593Smuzhiyun unsigned char n_val;
109*4882a593Smuzhiyun };
110*4882a593Smuzhiyun DECLARE_PER_CPU(struct uv_hub_info_s, __uv_hub_info);
111*4882a593Smuzhiyun #define uv_hub_info this_cpu_ptr(&__uv_hub_info)
112*4882a593Smuzhiyun #define uv_cpu_hub_info(cpu) (&per_cpu(__uv_hub_info, cpu))
113*4882a593Smuzhiyun
114*4882a593Smuzhiyun /*
115*4882a593Smuzhiyun * Local & Global MMR space macros.
116*4882a593Smuzhiyun * Note: macros are intended to be used ONLY by inline functions
117*4882a593Smuzhiyun * in this file - not by other kernel code.
118*4882a593Smuzhiyun * n - NASID (full 15-bit global nasid)
119*4882a593Smuzhiyun * g - GNODE (full 15-bit global nasid, right shifted 1)
120*4882a593Smuzhiyun * p - PNODE (local part of nsids, right shifted 1)
121*4882a593Smuzhiyun */
122*4882a593Smuzhiyun #define UV_NASID_TO_PNODE(n) (((n) >> 1) & uv_hub_info->pnode_mask)
123*4882a593Smuzhiyun #define UV_PNODE_TO_NASID(p) (((p) << 1) | uv_hub_info->gnode_upper)
124*4882a593Smuzhiyun
125*4882a593Smuzhiyun #define UV_LOCAL_MMR_BASE 0xf4000000UL
126*4882a593Smuzhiyun #define UV_GLOBAL_MMR32_BASE 0xf8000000UL
127*4882a593Smuzhiyun #define UV_GLOBAL_MMR64_BASE (uv_hub_info->global_mmr_base)
128*4882a593Smuzhiyun
129*4882a593Smuzhiyun #define UV_GLOBAL_MMR32_PNODE_SHIFT 15
130*4882a593Smuzhiyun #define UV_GLOBAL_MMR64_PNODE_SHIFT 26
131*4882a593Smuzhiyun
132*4882a593Smuzhiyun #define UV_GLOBAL_MMR32_PNODE_BITS(p) ((p) << (UV_GLOBAL_MMR32_PNODE_SHIFT))
133*4882a593Smuzhiyun
134*4882a593Smuzhiyun #define UV_GLOBAL_MMR64_PNODE_BITS(p) \
135*4882a593Smuzhiyun ((unsigned long)(p) << UV_GLOBAL_MMR64_PNODE_SHIFT)
136*4882a593Smuzhiyun
137*4882a593Smuzhiyun /*
138*4882a593Smuzhiyun * Macros for converting between kernel virtual addresses, socket local physical
139*4882a593Smuzhiyun * addresses, and UV global physical addresses.
140*4882a593Smuzhiyun * Note: use the standard __pa() & __va() macros for converting
141*4882a593Smuzhiyun * between socket virtual and socket physical addresses.
142*4882a593Smuzhiyun */
143*4882a593Smuzhiyun
144*4882a593Smuzhiyun /* socket phys RAM --> UV global physical address */
uv_soc_phys_ram_to_gpa(unsigned long paddr)145*4882a593Smuzhiyun static inline unsigned long uv_soc_phys_ram_to_gpa(unsigned long paddr)
146*4882a593Smuzhiyun {
147*4882a593Smuzhiyun if (paddr < uv_hub_info->lowmem_remap_top)
148*4882a593Smuzhiyun paddr += uv_hub_info->lowmem_remap_base;
149*4882a593Smuzhiyun return paddr | uv_hub_info->gnode_upper;
150*4882a593Smuzhiyun }
151*4882a593Smuzhiyun
152*4882a593Smuzhiyun
153*4882a593Smuzhiyun /* socket virtual --> UV global physical address */
uv_gpa(void * v)154*4882a593Smuzhiyun static inline unsigned long uv_gpa(void *v)
155*4882a593Smuzhiyun {
156*4882a593Smuzhiyun return __pa(v) | uv_hub_info->gnode_upper;
157*4882a593Smuzhiyun }
158*4882a593Smuzhiyun
159*4882a593Smuzhiyun /* socket virtual --> UV global physical address */
uv_vgpa(void * v)160*4882a593Smuzhiyun static inline void *uv_vgpa(void *v)
161*4882a593Smuzhiyun {
162*4882a593Smuzhiyun return (void *)uv_gpa(v);
163*4882a593Smuzhiyun }
164*4882a593Smuzhiyun
165*4882a593Smuzhiyun /* UV global physical address --> socket virtual */
uv_va(unsigned long gpa)166*4882a593Smuzhiyun static inline void *uv_va(unsigned long gpa)
167*4882a593Smuzhiyun {
168*4882a593Smuzhiyun return __va(gpa & uv_hub_info->gpa_mask);
169*4882a593Smuzhiyun }
170*4882a593Smuzhiyun
171*4882a593Smuzhiyun /* pnode, offset --> socket virtual */
uv_pnode_offset_to_vaddr(int pnode,unsigned long offset)172*4882a593Smuzhiyun static inline void *uv_pnode_offset_to_vaddr(int pnode, unsigned long offset)
173*4882a593Smuzhiyun {
174*4882a593Smuzhiyun return __va(((unsigned long)pnode << uv_hub_info->m_val) | offset);
175*4882a593Smuzhiyun }
176*4882a593Smuzhiyun
177*4882a593Smuzhiyun
178*4882a593Smuzhiyun /*
179*4882a593Smuzhiyun * Access global MMRs using the low memory MMR32 space. This region supports
180*4882a593Smuzhiyun * faster MMR access but not all MMRs are accessible in this space.
181*4882a593Smuzhiyun */
uv_global_mmr32_address(int pnode,unsigned long offset)182*4882a593Smuzhiyun static inline unsigned long *uv_global_mmr32_address(int pnode,
183*4882a593Smuzhiyun unsigned long offset)
184*4882a593Smuzhiyun {
185*4882a593Smuzhiyun return __va(UV_GLOBAL_MMR32_BASE |
186*4882a593Smuzhiyun UV_GLOBAL_MMR32_PNODE_BITS(pnode) | offset);
187*4882a593Smuzhiyun }
188*4882a593Smuzhiyun
uv_write_global_mmr32(int pnode,unsigned long offset,unsigned long val)189*4882a593Smuzhiyun static inline void uv_write_global_mmr32(int pnode, unsigned long offset,
190*4882a593Smuzhiyun unsigned long val)
191*4882a593Smuzhiyun {
192*4882a593Smuzhiyun *uv_global_mmr32_address(pnode, offset) = val;
193*4882a593Smuzhiyun }
194*4882a593Smuzhiyun
uv_read_global_mmr32(int pnode,unsigned long offset)195*4882a593Smuzhiyun static inline unsigned long uv_read_global_mmr32(int pnode,
196*4882a593Smuzhiyun unsigned long offset)
197*4882a593Smuzhiyun {
198*4882a593Smuzhiyun return *uv_global_mmr32_address(pnode, offset);
199*4882a593Smuzhiyun }
200*4882a593Smuzhiyun
201*4882a593Smuzhiyun /*
202*4882a593Smuzhiyun * Access Global MMR space using the MMR space located at the top of physical
203*4882a593Smuzhiyun * memory.
204*4882a593Smuzhiyun */
uv_global_mmr64_address(int pnode,unsigned long offset)205*4882a593Smuzhiyun static inline unsigned long *uv_global_mmr64_address(int pnode,
206*4882a593Smuzhiyun unsigned long offset)
207*4882a593Smuzhiyun {
208*4882a593Smuzhiyun return __va(UV_GLOBAL_MMR64_BASE |
209*4882a593Smuzhiyun UV_GLOBAL_MMR64_PNODE_BITS(pnode) | offset);
210*4882a593Smuzhiyun }
211*4882a593Smuzhiyun
uv_write_global_mmr64(int pnode,unsigned long offset,unsigned long val)212*4882a593Smuzhiyun static inline void uv_write_global_mmr64(int pnode, unsigned long offset,
213*4882a593Smuzhiyun unsigned long val)
214*4882a593Smuzhiyun {
215*4882a593Smuzhiyun *uv_global_mmr64_address(pnode, offset) = val;
216*4882a593Smuzhiyun }
217*4882a593Smuzhiyun
uv_read_global_mmr64(int pnode,unsigned long offset)218*4882a593Smuzhiyun static inline unsigned long uv_read_global_mmr64(int pnode,
219*4882a593Smuzhiyun unsigned long offset)
220*4882a593Smuzhiyun {
221*4882a593Smuzhiyun return *uv_global_mmr64_address(pnode, offset);
222*4882a593Smuzhiyun }
223*4882a593Smuzhiyun
224*4882a593Smuzhiyun /*
225*4882a593Smuzhiyun * Access hub local MMRs. Faster than using global space but only local MMRs
226*4882a593Smuzhiyun * are accessible.
227*4882a593Smuzhiyun */
uv_local_mmr_address(unsigned long offset)228*4882a593Smuzhiyun static inline unsigned long *uv_local_mmr_address(unsigned long offset)
229*4882a593Smuzhiyun {
230*4882a593Smuzhiyun return __va(UV_LOCAL_MMR_BASE | offset);
231*4882a593Smuzhiyun }
232*4882a593Smuzhiyun
uv_read_local_mmr(unsigned long offset)233*4882a593Smuzhiyun static inline unsigned long uv_read_local_mmr(unsigned long offset)
234*4882a593Smuzhiyun {
235*4882a593Smuzhiyun return *uv_local_mmr_address(offset);
236*4882a593Smuzhiyun }
237*4882a593Smuzhiyun
uv_write_local_mmr(unsigned long offset,unsigned long val)238*4882a593Smuzhiyun static inline void uv_write_local_mmr(unsigned long offset, unsigned long val)
239*4882a593Smuzhiyun {
240*4882a593Smuzhiyun *uv_local_mmr_address(offset) = val;
241*4882a593Smuzhiyun }
242*4882a593Smuzhiyun
243*4882a593Smuzhiyun /*
244*4882a593Smuzhiyun * Structures and definitions for converting between cpu, node, pnode, and blade
245*4882a593Smuzhiyun * numbers.
246*4882a593Smuzhiyun */
247*4882a593Smuzhiyun
248*4882a593Smuzhiyun /* Blade-local cpu number of current cpu. Numbered 0 .. <# cpus on the blade> */
uv_blade_processor_id(void)249*4882a593Smuzhiyun static inline int uv_blade_processor_id(void)
250*4882a593Smuzhiyun {
251*4882a593Smuzhiyun return smp_processor_id();
252*4882a593Smuzhiyun }
253*4882a593Smuzhiyun
254*4882a593Smuzhiyun /* Blade number of current cpu. Numnbered 0 .. <#blades -1> */
uv_numa_blade_id(void)255*4882a593Smuzhiyun static inline int uv_numa_blade_id(void)
256*4882a593Smuzhiyun {
257*4882a593Smuzhiyun return 0;
258*4882a593Smuzhiyun }
259*4882a593Smuzhiyun
260*4882a593Smuzhiyun /* Convert a cpu number to the the UV blade number */
uv_cpu_to_blade_id(int cpu)261*4882a593Smuzhiyun static inline int uv_cpu_to_blade_id(int cpu)
262*4882a593Smuzhiyun {
263*4882a593Smuzhiyun return 0;
264*4882a593Smuzhiyun }
265*4882a593Smuzhiyun
266*4882a593Smuzhiyun /* Convert linux node number to the UV blade number */
uv_node_to_blade_id(int nid)267*4882a593Smuzhiyun static inline int uv_node_to_blade_id(int nid)
268*4882a593Smuzhiyun {
269*4882a593Smuzhiyun return 0;
270*4882a593Smuzhiyun }
271*4882a593Smuzhiyun
272*4882a593Smuzhiyun /* Convert a blade id to the PNODE of the blade */
uv_blade_to_pnode(int bid)273*4882a593Smuzhiyun static inline int uv_blade_to_pnode(int bid)
274*4882a593Smuzhiyun {
275*4882a593Smuzhiyun return 0;
276*4882a593Smuzhiyun }
277*4882a593Smuzhiyun
278*4882a593Smuzhiyun /* Determine the number of possible cpus on a blade */
uv_blade_nr_possible_cpus(int bid)279*4882a593Smuzhiyun static inline int uv_blade_nr_possible_cpus(int bid)
280*4882a593Smuzhiyun {
281*4882a593Smuzhiyun return num_possible_cpus();
282*4882a593Smuzhiyun }
283*4882a593Smuzhiyun
284*4882a593Smuzhiyun /* Determine the number of online cpus on a blade */
uv_blade_nr_online_cpus(int bid)285*4882a593Smuzhiyun static inline int uv_blade_nr_online_cpus(int bid)
286*4882a593Smuzhiyun {
287*4882a593Smuzhiyun return num_online_cpus();
288*4882a593Smuzhiyun }
289*4882a593Smuzhiyun
290*4882a593Smuzhiyun /* Convert a cpu id to the PNODE of the blade containing the cpu */
uv_cpu_to_pnode(int cpu)291*4882a593Smuzhiyun static inline int uv_cpu_to_pnode(int cpu)
292*4882a593Smuzhiyun {
293*4882a593Smuzhiyun return 0;
294*4882a593Smuzhiyun }
295*4882a593Smuzhiyun
296*4882a593Smuzhiyun /* Convert a linux node number to the PNODE of the blade */
uv_node_to_pnode(int nid)297*4882a593Smuzhiyun static inline int uv_node_to_pnode(int nid)
298*4882a593Smuzhiyun {
299*4882a593Smuzhiyun return 0;
300*4882a593Smuzhiyun }
301*4882a593Smuzhiyun
302*4882a593Smuzhiyun /* Maximum possible number of blades */
uv_num_possible_blades(void)303*4882a593Smuzhiyun static inline int uv_num_possible_blades(void)
304*4882a593Smuzhiyun {
305*4882a593Smuzhiyun return 1;
306*4882a593Smuzhiyun }
307*4882a593Smuzhiyun
uv_hub_send_ipi(int pnode,int apicid,int vector)308*4882a593Smuzhiyun static inline void uv_hub_send_ipi(int pnode, int apicid, int vector)
309*4882a593Smuzhiyun {
310*4882a593Smuzhiyun /* not currently needed on ia64 */
311*4882a593Smuzhiyun }
312*4882a593Smuzhiyun
313*4882a593Smuzhiyun
314*4882a593Smuzhiyun #endif /* __ASM_IA64_UV_HUB__ */
315*4882a593Smuzhiyun
316