1*4882a593Smuzhiyun /* SPDX-License-Identifier: GPL-2.0 */
2*4882a593Smuzhiyun #ifndef _ASM_IA64_PROCESSOR_H
3*4882a593Smuzhiyun #define _ASM_IA64_PROCESSOR_H
4*4882a593Smuzhiyun
5*4882a593Smuzhiyun /*
6*4882a593Smuzhiyun * Copyright (C) 1998-2004 Hewlett-Packard Co
7*4882a593Smuzhiyun * David Mosberger-Tang <davidm@hpl.hp.com>
8*4882a593Smuzhiyun * Stephane Eranian <eranian@hpl.hp.com>
9*4882a593Smuzhiyun * Copyright (C) 1999 Asit Mallick <asit.k.mallick@intel.com>
10*4882a593Smuzhiyun * Copyright (C) 1999 Don Dugger <don.dugger@intel.com>
11*4882a593Smuzhiyun *
12*4882a593Smuzhiyun * 11/24/98 S.Eranian added ia64_set_iva()
13*4882a593Smuzhiyun * 12/03/99 D. Mosberger implement thread_saved_pc() via kernel unwind API
14*4882a593Smuzhiyun * 06/16/00 A. Mallick added csd/ssd/tssd for ia32 support
15*4882a593Smuzhiyun */
16*4882a593Smuzhiyun
17*4882a593Smuzhiyun
18*4882a593Smuzhiyun #include <asm/intrinsics.h>
19*4882a593Smuzhiyun #include <asm/kregs.h>
20*4882a593Smuzhiyun #include <asm/ptrace.h>
21*4882a593Smuzhiyun #include <asm/ustack.h>
22*4882a593Smuzhiyun
23*4882a593Smuzhiyun #define IA64_NUM_PHYS_STACK_REG 96
24*4882a593Smuzhiyun #define IA64_NUM_DBG_REGS 8
25*4882a593Smuzhiyun
26*4882a593Smuzhiyun #define DEFAULT_MAP_BASE __IA64_UL_CONST(0x2000000000000000)
27*4882a593Smuzhiyun #define DEFAULT_TASK_SIZE __IA64_UL_CONST(0xa000000000000000)
28*4882a593Smuzhiyun
29*4882a593Smuzhiyun /*
30*4882a593Smuzhiyun * TASK_SIZE really is a mis-named. It really is the maximum user
31*4882a593Smuzhiyun * space address (plus one). On IA-64, there are five regions of 2TB
32*4882a593Smuzhiyun * each (assuming 8KB page size), for a total of 8TB of user virtual
33*4882a593Smuzhiyun * address space.
34*4882a593Smuzhiyun */
35*4882a593Smuzhiyun #define TASK_SIZE DEFAULT_TASK_SIZE
36*4882a593Smuzhiyun
37*4882a593Smuzhiyun /*
38*4882a593Smuzhiyun * This decides where the kernel will search for a free chunk of vm
39*4882a593Smuzhiyun * space during mmap's.
40*4882a593Smuzhiyun */
41*4882a593Smuzhiyun #define TASK_UNMAPPED_BASE (current->thread.map_base)
42*4882a593Smuzhiyun
43*4882a593Smuzhiyun #define IA64_THREAD_FPH_VALID (__IA64_UL(1) << 0) /* floating-point high state valid? */
44*4882a593Smuzhiyun #define IA64_THREAD_DBG_VALID (__IA64_UL(1) << 1) /* debug registers valid? */
45*4882a593Smuzhiyun #define IA64_THREAD_PM_VALID (__IA64_UL(1) << 2) /* performance registers valid? */
46*4882a593Smuzhiyun #define IA64_THREAD_UAC_NOPRINT (__IA64_UL(1) << 3) /* don't log unaligned accesses */
47*4882a593Smuzhiyun #define IA64_THREAD_UAC_SIGBUS (__IA64_UL(1) << 4) /* generate SIGBUS on unaligned acc. */
48*4882a593Smuzhiyun #define IA64_THREAD_MIGRATION (__IA64_UL(1) << 5) /* require migration
49*4882a593Smuzhiyun sync at ctx sw */
50*4882a593Smuzhiyun #define IA64_THREAD_FPEMU_NOPRINT (__IA64_UL(1) << 6) /* don't log any fpswa faults */
51*4882a593Smuzhiyun #define IA64_THREAD_FPEMU_SIGFPE (__IA64_UL(1) << 7) /* send a SIGFPE for fpswa faults */
52*4882a593Smuzhiyun
53*4882a593Smuzhiyun #define IA64_THREAD_UAC_SHIFT 3
54*4882a593Smuzhiyun #define IA64_THREAD_UAC_MASK (IA64_THREAD_UAC_NOPRINT | IA64_THREAD_UAC_SIGBUS)
55*4882a593Smuzhiyun #define IA64_THREAD_FPEMU_SHIFT 6
56*4882a593Smuzhiyun #define IA64_THREAD_FPEMU_MASK (IA64_THREAD_FPEMU_NOPRINT | IA64_THREAD_FPEMU_SIGFPE)
57*4882a593Smuzhiyun
58*4882a593Smuzhiyun
59*4882a593Smuzhiyun /*
60*4882a593Smuzhiyun * This shift should be large enough to be able to represent 1000000000/itc_freq with good
61*4882a593Smuzhiyun * accuracy while being small enough to fit 10*1000000000<<IA64_NSEC_PER_CYC_SHIFT in 64 bits
62*4882a593Smuzhiyun * (this will give enough slack to represent 10 seconds worth of time as a scaled number).
63*4882a593Smuzhiyun */
64*4882a593Smuzhiyun #define IA64_NSEC_PER_CYC_SHIFT 30
65*4882a593Smuzhiyun
66*4882a593Smuzhiyun #ifndef __ASSEMBLY__
67*4882a593Smuzhiyun
68*4882a593Smuzhiyun #include <linux/cache.h>
69*4882a593Smuzhiyun #include <linux/compiler.h>
70*4882a593Smuzhiyun #include <linux/threads.h>
71*4882a593Smuzhiyun #include <linux/types.h>
72*4882a593Smuzhiyun #include <linux/bitops.h>
73*4882a593Smuzhiyun
74*4882a593Smuzhiyun #include <asm/fpu.h>
75*4882a593Smuzhiyun #include <asm/page.h>
76*4882a593Smuzhiyun #include <asm/percpu.h>
77*4882a593Smuzhiyun #include <asm/rse.h>
78*4882a593Smuzhiyun #include <asm/unwind.h>
79*4882a593Smuzhiyun #include <linux/atomic.h>
80*4882a593Smuzhiyun #ifdef CONFIG_NUMA
81*4882a593Smuzhiyun #include <asm/nodedata.h>
82*4882a593Smuzhiyun #endif
83*4882a593Smuzhiyun
84*4882a593Smuzhiyun /* like above but expressed as bitfields for more efficient access: */
85*4882a593Smuzhiyun struct ia64_psr {
86*4882a593Smuzhiyun __u64 reserved0 : 1;
87*4882a593Smuzhiyun __u64 be : 1;
88*4882a593Smuzhiyun __u64 up : 1;
89*4882a593Smuzhiyun __u64 ac : 1;
90*4882a593Smuzhiyun __u64 mfl : 1;
91*4882a593Smuzhiyun __u64 mfh : 1;
92*4882a593Smuzhiyun __u64 reserved1 : 7;
93*4882a593Smuzhiyun __u64 ic : 1;
94*4882a593Smuzhiyun __u64 i : 1;
95*4882a593Smuzhiyun __u64 pk : 1;
96*4882a593Smuzhiyun __u64 reserved2 : 1;
97*4882a593Smuzhiyun __u64 dt : 1;
98*4882a593Smuzhiyun __u64 dfl : 1;
99*4882a593Smuzhiyun __u64 dfh : 1;
100*4882a593Smuzhiyun __u64 sp : 1;
101*4882a593Smuzhiyun __u64 pp : 1;
102*4882a593Smuzhiyun __u64 di : 1;
103*4882a593Smuzhiyun __u64 si : 1;
104*4882a593Smuzhiyun __u64 db : 1;
105*4882a593Smuzhiyun __u64 lp : 1;
106*4882a593Smuzhiyun __u64 tb : 1;
107*4882a593Smuzhiyun __u64 rt : 1;
108*4882a593Smuzhiyun __u64 reserved3 : 4;
109*4882a593Smuzhiyun __u64 cpl : 2;
110*4882a593Smuzhiyun __u64 is : 1;
111*4882a593Smuzhiyun __u64 mc : 1;
112*4882a593Smuzhiyun __u64 it : 1;
113*4882a593Smuzhiyun __u64 id : 1;
114*4882a593Smuzhiyun __u64 da : 1;
115*4882a593Smuzhiyun __u64 dd : 1;
116*4882a593Smuzhiyun __u64 ss : 1;
117*4882a593Smuzhiyun __u64 ri : 2;
118*4882a593Smuzhiyun __u64 ed : 1;
119*4882a593Smuzhiyun __u64 bn : 1;
120*4882a593Smuzhiyun __u64 reserved4 : 19;
121*4882a593Smuzhiyun };
122*4882a593Smuzhiyun
123*4882a593Smuzhiyun union ia64_isr {
124*4882a593Smuzhiyun __u64 val;
125*4882a593Smuzhiyun struct {
126*4882a593Smuzhiyun __u64 code : 16;
127*4882a593Smuzhiyun __u64 vector : 8;
128*4882a593Smuzhiyun __u64 reserved1 : 8;
129*4882a593Smuzhiyun __u64 x : 1;
130*4882a593Smuzhiyun __u64 w : 1;
131*4882a593Smuzhiyun __u64 r : 1;
132*4882a593Smuzhiyun __u64 na : 1;
133*4882a593Smuzhiyun __u64 sp : 1;
134*4882a593Smuzhiyun __u64 rs : 1;
135*4882a593Smuzhiyun __u64 ir : 1;
136*4882a593Smuzhiyun __u64 ni : 1;
137*4882a593Smuzhiyun __u64 so : 1;
138*4882a593Smuzhiyun __u64 ei : 2;
139*4882a593Smuzhiyun __u64 ed : 1;
140*4882a593Smuzhiyun __u64 reserved2 : 20;
141*4882a593Smuzhiyun };
142*4882a593Smuzhiyun };
143*4882a593Smuzhiyun
144*4882a593Smuzhiyun union ia64_lid {
145*4882a593Smuzhiyun __u64 val;
146*4882a593Smuzhiyun struct {
147*4882a593Smuzhiyun __u64 rv : 16;
148*4882a593Smuzhiyun __u64 eid : 8;
149*4882a593Smuzhiyun __u64 id : 8;
150*4882a593Smuzhiyun __u64 ig : 32;
151*4882a593Smuzhiyun };
152*4882a593Smuzhiyun };
153*4882a593Smuzhiyun
154*4882a593Smuzhiyun union ia64_tpr {
155*4882a593Smuzhiyun __u64 val;
156*4882a593Smuzhiyun struct {
157*4882a593Smuzhiyun __u64 ig0 : 4;
158*4882a593Smuzhiyun __u64 mic : 4;
159*4882a593Smuzhiyun __u64 rsv : 8;
160*4882a593Smuzhiyun __u64 mmi : 1;
161*4882a593Smuzhiyun __u64 ig1 : 47;
162*4882a593Smuzhiyun };
163*4882a593Smuzhiyun };
164*4882a593Smuzhiyun
165*4882a593Smuzhiyun union ia64_itir {
166*4882a593Smuzhiyun __u64 val;
167*4882a593Smuzhiyun struct {
168*4882a593Smuzhiyun __u64 rv3 : 2; /* 0-1 */
169*4882a593Smuzhiyun __u64 ps : 6; /* 2-7 */
170*4882a593Smuzhiyun __u64 key : 24; /* 8-31 */
171*4882a593Smuzhiyun __u64 rv4 : 32; /* 32-63 */
172*4882a593Smuzhiyun };
173*4882a593Smuzhiyun };
174*4882a593Smuzhiyun
175*4882a593Smuzhiyun union ia64_rr {
176*4882a593Smuzhiyun __u64 val;
177*4882a593Smuzhiyun struct {
178*4882a593Smuzhiyun __u64 ve : 1; /* enable hw walker */
179*4882a593Smuzhiyun __u64 reserved0: 1; /* reserved */
180*4882a593Smuzhiyun __u64 ps : 6; /* log page size */
181*4882a593Smuzhiyun __u64 rid : 24; /* region id */
182*4882a593Smuzhiyun __u64 reserved1: 32; /* reserved */
183*4882a593Smuzhiyun };
184*4882a593Smuzhiyun };
185*4882a593Smuzhiyun
186*4882a593Smuzhiyun /*
187*4882a593Smuzhiyun * CPU type, hardware bug flags, and per-CPU state. Frequently used
188*4882a593Smuzhiyun * state comes earlier:
189*4882a593Smuzhiyun */
190*4882a593Smuzhiyun struct cpuinfo_ia64 {
191*4882a593Smuzhiyun unsigned int softirq_pending;
192*4882a593Smuzhiyun unsigned long itm_delta; /* # of clock cycles between clock ticks */
193*4882a593Smuzhiyun unsigned long itm_next; /* interval timer mask value to use for next clock tick */
194*4882a593Smuzhiyun unsigned long nsec_per_cyc; /* (1000000000<<IA64_NSEC_PER_CYC_SHIFT)/itc_freq */
195*4882a593Smuzhiyun unsigned long unimpl_va_mask; /* mask of unimplemented virtual address bits (from PAL) */
196*4882a593Smuzhiyun unsigned long unimpl_pa_mask; /* mask of unimplemented physical address bits (from PAL) */
197*4882a593Smuzhiyun unsigned long itc_freq; /* frequency of ITC counter */
198*4882a593Smuzhiyun unsigned long proc_freq; /* frequency of processor */
199*4882a593Smuzhiyun unsigned long cyc_per_usec; /* itc_freq/1000000 */
200*4882a593Smuzhiyun unsigned long ptce_base;
201*4882a593Smuzhiyun unsigned int ptce_count[2];
202*4882a593Smuzhiyun unsigned int ptce_stride[2];
203*4882a593Smuzhiyun struct task_struct *ksoftirqd; /* kernel softirq daemon for this CPU */
204*4882a593Smuzhiyun
205*4882a593Smuzhiyun #ifdef CONFIG_SMP
206*4882a593Smuzhiyun unsigned long loops_per_jiffy;
207*4882a593Smuzhiyun int cpu;
208*4882a593Smuzhiyun unsigned int socket_id; /* physical processor socket id */
209*4882a593Smuzhiyun unsigned short core_id; /* core id */
210*4882a593Smuzhiyun unsigned short thread_id; /* thread id */
211*4882a593Smuzhiyun unsigned short num_log; /* Total number of logical processors on
212*4882a593Smuzhiyun * this socket that were successfully booted */
213*4882a593Smuzhiyun unsigned char cores_per_socket; /* Cores per processor socket */
214*4882a593Smuzhiyun unsigned char threads_per_core; /* Threads per core */
215*4882a593Smuzhiyun #endif
216*4882a593Smuzhiyun
217*4882a593Smuzhiyun /* CPUID-derived information: */
218*4882a593Smuzhiyun unsigned long ppn;
219*4882a593Smuzhiyun unsigned long features;
220*4882a593Smuzhiyun unsigned char number;
221*4882a593Smuzhiyun unsigned char revision;
222*4882a593Smuzhiyun unsigned char model;
223*4882a593Smuzhiyun unsigned char family;
224*4882a593Smuzhiyun unsigned char archrev;
225*4882a593Smuzhiyun char vendor[16];
226*4882a593Smuzhiyun char *model_name;
227*4882a593Smuzhiyun
228*4882a593Smuzhiyun #ifdef CONFIG_NUMA
229*4882a593Smuzhiyun struct ia64_node_data *node_data;
230*4882a593Smuzhiyun #endif
231*4882a593Smuzhiyun };
232*4882a593Smuzhiyun
233*4882a593Smuzhiyun DECLARE_PER_CPU(struct cpuinfo_ia64, ia64_cpu_info);
234*4882a593Smuzhiyun
235*4882a593Smuzhiyun /*
236*4882a593Smuzhiyun * The "local" data variable. It refers to the per-CPU data of the currently executing
237*4882a593Smuzhiyun * CPU, much like "current" points to the per-task data of the currently executing task.
238*4882a593Smuzhiyun * Do not use the address of local_cpu_data, since it will be different from
239*4882a593Smuzhiyun * cpu_data(smp_processor_id())!
240*4882a593Smuzhiyun */
241*4882a593Smuzhiyun #define local_cpu_data (&__ia64_per_cpu_var(ia64_cpu_info))
242*4882a593Smuzhiyun #define cpu_data(cpu) (&per_cpu(ia64_cpu_info, cpu))
243*4882a593Smuzhiyun
244*4882a593Smuzhiyun extern void print_cpu_info (struct cpuinfo_ia64 *);
245*4882a593Smuzhiyun
246*4882a593Smuzhiyun typedef struct {
247*4882a593Smuzhiyun unsigned long seg;
248*4882a593Smuzhiyun } mm_segment_t;
249*4882a593Smuzhiyun
250*4882a593Smuzhiyun #define SET_UNALIGN_CTL(task,value) \
251*4882a593Smuzhiyun ({ \
252*4882a593Smuzhiyun (task)->thread.flags = (((task)->thread.flags & ~IA64_THREAD_UAC_MASK) \
253*4882a593Smuzhiyun | (((value) << IA64_THREAD_UAC_SHIFT) & IA64_THREAD_UAC_MASK)); \
254*4882a593Smuzhiyun 0; \
255*4882a593Smuzhiyun })
256*4882a593Smuzhiyun #define GET_UNALIGN_CTL(task,addr) \
257*4882a593Smuzhiyun ({ \
258*4882a593Smuzhiyun put_user(((task)->thread.flags & IA64_THREAD_UAC_MASK) >> IA64_THREAD_UAC_SHIFT, \
259*4882a593Smuzhiyun (int __user *) (addr)); \
260*4882a593Smuzhiyun })
261*4882a593Smuzhiyun
262*4882a593Smuzhiyun #define SET_FPEMU_CTL(task,value) \
263*4882a593Smuzhiyun ({ \
264*4882a593Smuzhiyun (task)->thread.flags = (((task)->thread.flags & ~IA64_THREAD_FPEMU_MASK) \
265*4882a593Smuzhiyun | (((value) << IA64_THREAD_FPEMU_SHIFT) & IA64_THREAD_FPEMU_MASK)); \
266*4882a593Smuzhiyun 0; \
267*4882a593Smuzhiyun })
268*4882a593Smuzhiyun #define GET_FPEMU_CTL(task,addr) \
269*4882a593Smuzhiyun ({ \
270*4882a593Smuzhiyun put_user(((task)->thread.flags & IA64_THREAD_FPEMU_MASK) >> IA64_THREAD_FPEMU_SHIFT, \
271*4882a593Smuzhiyun (int __user *) (addr)); \
272*4882a593Smuzhiyun })
273*4882a593Smuzhiyun
274*4882a593Smuzhiyun struct thread_struct {
275*4882a593Smuzhiyun __u32 flags; /* various thread flags (see IA64_THREAD_*) */
276*4882a593Smuzhiyun /* writing on_ustack is performance-critical, so it's worth spending 8 bits on it... */
277*4882a593Smuzhiyun __u8 on_ustack; /* executing on user-stacks? */
278*4882a593Smuzhiyun __u8 pad[3];
279*4882a593Smuzhiyun __u64 ksp; /* kernel stack pointer */
280*4882a593Smuzhiyun __u64 map_base; /* base address for get_unmapped_area() */
281*4882a593Smuzhiyun __u64 rbs_bot; /* the base address for the RBS */
282*4882a593Smuzhiyun int last_fph_cpu; /* CPU that may hold the contents of f32-f127 */
283*4882a593Smuzhiyun unsigned long dbr[IA64_NUM_DBG_REGS];
284*4882a593Smuzhiyun unsigned long ibr[IA64_NUM_DBG_REGS];
285*4882a593Smuzhiyun struct ia64_fpreg fph[96]; /* saved/loaded on demand */
286*4882a593Smuzhiyun };
287*4882a593Smuzhiyun
288*4882a593Smuzhiyun #define INIT_THREAD { \
289*4882a593Smuzhiyun .flags = 0, \
290*4882a593Smuzhiyun .on_ustack = 0, \
291*4882a593Smuzhiyun .ksp = 0, \
292*4882a593Smuzhiyun .map_base = DEFAULT_MAP_BASE, \
293*4882a593Smuzhiyun .rbs_bot = STACK_TOP - DEFAULT_USER_STACK_SIZE, \
294*4882a593Smuzhiyun .last_fph_cpu = -1, \
295*4882a593Smuzhiyun .dbr = {0, }, \
296*4882a593Smuzhiyun .ibr = {0, }, \
297*4882a593Smuzhiyun .fph = {{{{0}}}, } \
298*4882a593Smuzhiyun }
299*4882a593Smuzhiyun
300*4882a593Smuzhiyun #define start_thread(regs,new_ip,new_sp) do { \
301*4882a593Smuzhiyun regs->cr_ipsr = ((regs->cr_ipsr | (IA64_PSR_BITS_TO_SET | IA64_PSR_CPL)) \
302*4882a593Smuzhiyun & ~(IA64_PSR_BITS_TO_CLEAR | IA64_PSR_RI | IA64_PSR_IS)); \
303*4882a593Smuzhiyun regs->cr_iip = new_ip; \
304*4882a593Smuzhiyun regs->ar_rsc = 0xf; /* eager mode, privilege level 3 */ \
305*4882a593Smuzhiyun regs->ar_rnat = 0; \
306*4882a593Smuzhiyun regs->ar_bspstore = current->thread.rbs_bot; \
307*4882a593Smuzhiyun regs->ar_fpsr = FPSR_DEFAULT; \
308*4882a593Smuzhiyun regs->loadrs = 0; \
309*4882a593Smuzhiyun regs->r8 = get_dumpable(current->mm); /* set "don't zap registers" flag */ \
310*4882a593Smuzhiyun regs->r12 = new_sp - 16; /* allocate 16 byte scratch area */ \
311*4882a593Smuzhiyun if (unlikely(get_dumpable(current->mm) != SUID_DUMP_USER)) { \
312*4882a593Smuzhiyun /* \
313*4882a593Smuzhiyun * Zap scratch regs to avoid leaking bits between processes with different \
314*4882a593Smuzhiyun * uid/privileges. \
315*4882a593Smuzhiyun */ \
316*4882a593Smuzhiyun regs->ar_pfs = 0; regs->b0 = 0; regs->pr = 0; \
317*4882a593Smuzhiyun regs->r1 = 0; regs->r9 = 0; regs->r11 = 0; regs->r13 = 0; regs->r15 = 0; \
318*4882a593Smuzhiyun } \
319*4882a593Smuzhiyun } while (0)
320*4882a593Smuzhiyun
321*4882a593Smuzhiyun /* Forward declarations, a strange C thing... */
322*4882a593Smuzhiyun struct mm_struct;
323*4882a593Smuzhiyun struct task_struct;
324*4882a593Smuzhiyun
325*4882a593Smuzhiyun /*
326*4882a593Smuzhiyun * Free all resources held by a thread. This is called after the
327*4882a593Smuzhiyun * parent of DEAD_TASK has collected the exit status of the task via
328*4882a593Smuzhiyun * wait().
329*4882a593Smuzhiyun */
330*4882a593Smuzhiyun #define release_thread(dead_task)
331*4882a593Smuzhiyun
332*4882a593Smuzhiyun /* Get wait channel for task P. */
333*4882a593Smuzhiyun extern unsigned long get_wchan (struct task_struct *p);
334*4882a593Smuzhiyun
335*4882a593Smuzhiyun /* Return instruction pointer of blocked task TSK. */
336*4882a593Smuzhiyun #define KSTK_EIP(tsk) \
337*4882a593Smuzhiyun ({ \
338*4882a593Smuzhiyun struct pt_regs *_regs = task_pt_regs(tsk); \
339*4882a593Smuzhiyun _regs->cr_iip + ia64_psr(_regs)->ri; \
340*4882a593Smuzhiyun })
341*4882a593Smuzhiyun
342*4882a593Smuzhiyun /* Return stack pointer of blocked task TSK. */
343*4882a593Smuzhiyun #define KSTK_ESP(tsk) ((tsk)->thread.ksp)
344*4882a593Smuzhiyun
345*4882a593Smuzhiyun extern void ia64_getreg_unknown_kr (void);
346*4882a593Smuzhiyun extern void ia64_setreg_unknown_kr (void);
347*4882a593Smuzhiyun
348*4882a593Smuzhiyun #define ia64_get_kr(regnum) \
349*4882a593Smuzhiyun ({ \
350*4882a593Smuzhiyun unsigned long r = 0; \
351*4882a593Smuzhiyun \
352*4882a593Smuzhiyun switch (regnum) { \
353*4882a593Smuzhiyun case 0: r = ia64_getreg(_IA64_REG_AR_KR0); break; \
354*4882a593Smuzhiyun case 1: r = ia64_getreg(_IA64_REG_AR_KR1); break; \
355*4882a593Smuzhiyun case 2: r = ia64_getreg(_IA64_REG_AR_KR2); break; \
356*4882a593Smuzhiyun case 3: r = ia64_getreg(_IA64_REG_AR_KR3); break; \
357*4882a593Smuzhiyun case 4: r = ia64_getreg(_IA64_REG_AR_KR4); break; \
358*4882a593Smuzhiyun case 5: r = ia64_getreg(_IA64_REG_AR_KR5); break; \
359*4882a593Smuzhiyun case 6: r = ia64_getreg(_IA64_REG_AR_KR6); break; \
360*4882a593Smuzhiyun case 7: r = ia64_getreg(_IA64_REG_AR_KR7); break; \
361*4882a593Smuzhiyun default: ia64_getreg_unknown_kr(); break; \
362*4882a593Smuzhiyun } \
363*4882a593Smuzhiyun r; \
364*4882a593Smuzhiyun })
365*4882a593Smuzhiyun
366*4882a593Smuzhiyun #define ia64_set_kr(regnum, r) \
367*4882a593Smuzhiyun ({ \
368*4882a593Smuzhiyun switch (regnum) { \
369*4882a593Smuzhiyun case 0: ia64_setreg(_IA64_REG_AR_KR0, r); break; \
370*4882a593Smuzhiyun case 1: ia64_setreg(_IA64_REG_AR_KR1, r); break; \
371*4882a593Smuzhiyun case 2: ia64_setreg(_IA64_REG_AR_KR2, r); break; \
372*4882a593Smuzhiyun case 3: ia64_setreg(_IA64_REG_AR_KR3, r); break; \
373*4882a593Smuzhiyun case 4: ia64_setreg(_IA64_REG_AR_KR4, r); break; \
374*4882a593Smuzhiyun case 5: ia64_setreg(_IA64_REG_AR_KR5, r); break; \
375*4882a593Smuzhiyun case 6: ia64_setreg(_IA64_REG_AR_KR6, r); break; \
376*4882a593Smuzhiyun case 7: ia64_setreg(_IA64_REG_AR_KR7, r); break; \
377*4882a593Smuzhiyun default: ia64_setreg_unknown_kr(); break; \
378*4882a593Smuzhiyun } \
379*4882a593Smuzhiyun })
380*4882a593Smuzhiyun
381*4882a593Smuzhiyun /*
382*4882a593Smuzhiyun * The following three macros can't be inline functions because we don't have struct
383*4882a593Smuzhiyun * task_struct at this point.
384*4882a593Smuzhiyun */
385*4882a593Smuzhiyun
386*4882a593Smuzhiyun /*
387*4882a593Smuzhiyun * Return TRUE if task T owns the fph partition of the CPU we're running on.
388*4882a593Smuzhiyun * Must be called from code that has preemption disabled.
389*4882a593Smuzhiyun */
390*4882a593Smuzhiyun #define ia64_is_local_fpu_owner(t) \
391*4882a593Smuzhiyun ({ \
392*4882a593Smuzhiyun struct task_struct *__ia64_islfo_task = (t); \
393*4882a593Smuzhiyun (__ia64_islfo_task->thread.last_fph_cpu == smp_processor_id() \
394*4882a593Smuzhiyun && __ia64_islfo_task == (struct task_struct *) ia64_get_kr(IA64_KR_FPU_OWNER)); \
395*4882a593Smuzhiyun })
396*4882a593Smuzhiyun
397*4882a593Smuzhiyun /*
398*4882a593Smuzhiyun * Mark task T as owning the fph partition of the CPU we're running on.
399*4882a593Smuzhiyun * Must be called from code that has preemption disabled.
400*4882a593Smuzhiyun */
401*4882a593Smuzhiyun #define ia64_set_local_fpu_owner(t) do { \
402*4882a593Smuzhiyun struct task_struct *__ia64_slfo_task = (t); \
403*4882a593Smuzhiyun __ia64_slfo_task->thread.last_fph_cpu = smp_processor_id(); \
404*4882a593Smuzhiyun ia64_set_kr(IA64_KR_FPU_OWNER, (unsigned long) __ia64_slfo_task); \
405*4882a593Smuzhiyun } while (0)
406*4882a593Smuzhiyun
407*4882a593Smuzhiyun /* Mark the fph partition of task T as being invalid on all CPUs. */
408*4882a593Smuzhiyun #define ia64_drop_fpu(t) ((t)->thread.last_fph_cpu = -1)
409*4882a593Smuzhiyun
410*4882a593Smuzhiyun extern void __ia64_init_fpu (void);
411*4882a593Smuzhiyun extern void __ia64_save_fpu (struct ia64_fpreg *fph);
412*4882a593Smuzhiyun extern void __ia64_load_fpu (struct ia64_fpreg *fph);
413*4882a593Smuzhiyun extern void ia64_save_debug_regs (unsigned long *save_area);
414*4882a593Smuzhiyun extern void ia64_load_debug_regs (unsigned long *save_area);
415*4882a593Smuzhiyun
416*4882a593Smuzhiyun #define ia64_fph_enable() do { ia64_rsm(IA64_PSR_DFH); ia64_srlz_d(); } while (0)
417*4882a593Smuzhiyun #define ia64_fph_disable() do { ia64_ssm(IA64_PSR_DFH); ia64_srlz_d(); } while (0)
418*4882a593Smuzhiyun
419*4882a593Smuzhiyun /* load fp 0.0 into fph */
420*4882a593Smuzhiyun static inline void
ia64_init_fpu(void)421*4882a593Smuzhiyun ia64_init_fpu (void) {
422*4882a593Smuzhiyun ia64_fph_enable();
423*4882a593Smuzhiyun __ia64_init_fpu();
424*4882a593Smuzhiyun ia64_fph_disable();
425*4882a593Smuzhiyun }
426*4882a593Smuzhiyun
427*4882a593Smuzhiyun /* save f32-f127 at FPH */
428*4882a593Smuzhiyun static inline void
ia64_save_fpu(struct ia64_fpreg * fph)429*4882a593Smuzhiyun ia64_save_fpu (struct ia64_fpreg *fph) {
430*4882a593Smuzhiyun ia64_fph_enable();
431*4882a593Smuzhiyun __ia64_save_fpu(fph);
432*4882a593Smuzhiyun ia64_fph_disable();
433*4882a593Smuzhiyun }
434*4882a593Smuzhiyun
435*4882a593Smuzhiyun /* load f32-f127 from FPH */
436*4882a593Smuzhiyun static inline void
ia64_load_fpu(struct ia64_fpreg * fph)437*4882a593Smuzhiyun ia64_load_fpu (struct ia64_fpreg *fph) {
438*4882a593Smuzhiyun ia64_fph_enable();
439*4882a593Smuzhiyun __ia64_load_fpu(fph);
440*4882a593Smuzhiyun ia64_fph_disable();
441*4882a593Smuzhiyun }
442*4882a593Smuzhiyun
443*4882a593Smuzhiyun static inline __u64
ia64_clear_ic(void)444*4882a593Smuzhiyun ia64_clear_ic (void)
445*4882a593Smuzhiyun {
446*4882a593Smuzhiyun __u64 psr;
447*4882a593Smuzhiyun psr = ia64_getreg(_IA64_REG_PSR);
448*4882a593Smuzhiyun ia64_stop();
449*4882a593Smuzhiyun ia64_rsm(IA64_PSR_I | IA64_PSR_IC);
450*4882a593Smuzhiyun ia64_srlz_i();
451*4882a593Smuzhiyun return psr;
452*4882a593Smuzhiyun }
453*4882a593Smuzhiyun
454*4882a593Smuzhiyun /*
455*4882a593Smuzhiyun * Restore the psr.
456*4882a593Smuzhiyun */
457*4882a593Smuzhiyun static inline void
ia64_set_psr(__u64 psr)458*4882a593Smuzhiyun ia64_set_psr (__u64 psr)
459*4882a593Smuzhiyun {
460*4882a593Smuzhiyun ia64_stop();
461*4882a593Smuzhiyun ia64_setreg(_IA64_REG_PSR_L, psr);
462*4882a593Smuzhiyun ia64_srlz_i();
463*4882a593Smuzhiyun }
464*4882a593Smuzhiyun
465*4882a593Smuzhiyun /*
466*4882a593Smuzhiyun * Insert a translation into an instruction and/or data translation
467*4882a593Smuzhiyun * register.
468*4882a593Smuzhiyun */
469*4882a593Smuzhiyun static inline void
ia64_itr(__u64 target_mask,__u64 tr_num,__u64 vmaddr,__u64 pte,__u64 log_page_size)470*4882a593Smuzhiyun ia64_itr (__u64 target_mask, __u64 tr_num,
471*4882a593Smuzhiyun __u64 vmaddr, __u64 pte,
472*4882a593Smuzhiyun __u64 log_page_size)
473*4882a593Smuzhiyun {
474*4882a593Smuzhiyun ia64_setreg(_IA64_REG_CR_ITIR, (log_page_size << 2));
475*4882a593Smuzhiyun ia64_setreg(_IA64_REG_CR_IFA, vmaddr);
476*4882a593Smuzhiyun ia64_stop();
477*4882a593Smuzhiyun if (target_mask & 0x1)
478*4882a593Smuzhiyun ia64_itri(tr_num, pte);
479*4882a593Smuzhiyun if (target_mask & 0x2)
480*4882a593Smuzhiyun ia64_itrd(tr_num, pte);
481*4882a593Smuzhiyun }
482*4882a593Smuzhiyun
483*4882a593Smuzhiyun /*
484*4882a593Smuzhiyun * Insert a translation into the instruction and/or data translation
485*4882a593Smuzhiyun * cache.
486*4882a593Smuzhiyun */
487*4882a593Smuzhiyun static inline void
ia64_itc(__u64 target_mask,__u64 vmaddr,__u64 pte,__u64 log_page_size)488*4882a593Smuzhiyun ia64_itc (__u64 target_mask, __u64 vmaddr, __u64 pte,
489*4882a593Smuzhiyun __u64 log_page_size)
490*4882a593Smuzhiyun {
491*4882a593Smuzhiyun ia64_setreg(_IA64_REG_CR_ITIR, (log_page_size << 2));
492*4882a593Smuzhiyun ia64_setreg(_IA64_REG_CR_IFA, vmaddr);
493*4882a593Smuzhiyun ia64_stop();
494*4882a593Smuzhiyun /* as per EAS2.6, itc must be the last instruction in an instruction group */
495*4882a593Smuzhiyun if (target_mask & 0x1)
496*4882a593Smuzhiyun ia64_itci(pte);
497*4882a593Smuzhiyun if (target_mask & 0x2)
498*4882a593Smuzhiyun ia64_itcd(pte);
499*4882a593Smuzhiyun }
500*4882a593Smuzhiyun
501*4882a593Smuzhiyun /*
502*4882a593Smuzhiyun * Purge a range of addresses from instruction and/or data translation
503*4882a593Smuzhiyun * register(s).
504*4882a593Smuzhiyun */
505*4882a593Smuzhiyun static inline void
ia64_ptr(__u64 target_mask,__u64 vmaddr,__u64 log_size)506*4882a593Smuzhiyun ia64_ptr (__u64 target_mask, __u64 vmaddr, __u64 log_size)
507*4882a593Smuzhiyun {
508*4882a593Smuzhiyun if (target_mask & 0x1)
509*4882a593Smuzhiyun ia64_ptri(vmaddr, (log_size << 2));
510*4882a593Smuzhiyun if (target_mask & 0x2)
511*4882a593Smuzhiyun ia64_ptrd(vmaddr, (log_size << 2));
512*4882a593Smuzhiyun }
513*4882a593Smuzhiyun
514*4882a593Smuzhiyun /* Set the interrupt vector address. The address must be suitably aligned (32KB). */
515*4882a593Smuzhiyun static inline void
ia64_set_iva(void * ivt_addr)516*4882a593Smuzhiyun ia64_set_iva (void *ivt_addr)
517*4882a593Smuzhiyun {
518*4882a593Smuzhiyun ia64_setreg(_IA64_REG_CR_IVA, (__u64) ivt_addr);
519*4882a593Smuzhiyun ia64_srlz_i();
520*4882a593Smuzhiyun }
521*4882a593Smuzhiyun
522*4882a593Smuzhiyun /* Set the page table address and control bits. */
523*4882a593Smuzhiyun static inline void
ia64_set_pta(__u64 pta)524*4882a593Smuzhiyun ia64_set_pta (__u64 pta)
525*4882a593Smuzhiyun {
526*4882a593Smuzhiyun /* Note: srlz.i implies srlz.d */
527*4882a593Smuzhiyun ia64_setreg(_IA64_REG_CR_PTA, pta);
528*4882a593Smuzhiyun ia64_srlz_i();
529*4882a593Smuzhiyun }
530*4882a593Smuzhiyun
531*4882a593Smuzhiyun static inline void
ia64_eoi(void)532*4882a593Smuzhiyun ia64_eoi (void)
533*4882a593Smuzhiyun {
534*4882a593Smuzhiyun ia64_setreg(_IA64_REG_CR_EOI, 0);
535*4882a593Smuzhiyun ia64_srlz_d();
536*4882a593Smuzhiyun }
537*4882a593Smuzhiyun
538*4882a593Smuzhiyun #define cpu_relax() ia64_hint(ia64_hint_pause)
539*4882a593Smuzhiyun
540*4882a593Smuzhiyun static inline int
ia64_get_irr(unsigned int vector)541*4882a593Smuzhiyun ia64_get_irr(unsigned int vector)
542*4882a593Smuzhiyun {
543*4882a593Smuzhiyun unsigned int reg = vector / 64;
544*4882a593Smuzhiyun unsigned int bit = vector % 64;
545*4882a593Smuzhiyun unsigned long irr;
546*4882a593Smuzhiyun
547*4882a593Smuzhiyun switch (reg) {
548*4882a593Smuzhiyun case 0: irr = ia64_getreg(_IA64_REG_CR_IRR0); break;
549*4882a593Smuzhiyun case 1: irr = ia64_getreg(_IA64_REG_CR_IRR1); break;
550*4882a593Smuzhiyun case 2: irr = ia64_getreg(_IA64_REG_CR_IRR2); break;
551*4882a593Smuzhiyun case 3: irr = ia64_getreg(_IA64_REG_CR_IRR3); break;
552*4882a593Smuzhiyun }
553*4882a593Smuzhiyun
554*4882a593Smuzhiyun return test_bit(bit, &irr);
555*4882a593Smuzhiyun }
556*4882a593Smuzhiyun
557*4882a593Smuzhiyun static inline void
ia64_set_lrr0(unsigned long val)558*4882a593Smuzhiyun ia64_set_lrr0 (unsigned long val)
559*4882a593Smuzhiyun {
560*4882a593Smuzhiyun ia64_setreg(_IA64_REG_CR_LRR0, val);
561*4882a593Smuzhiyun ia64_srlz_d();
562*4882a593Smuzhiyun }
563*4882a593Smuzhiyun
564*4882a593Smuzhiyun static inline void
ia64_set_lrr1(unsigned long val)565*4882a593Smuzhiyun ia64_set_lrr1 (unsigned long val)
566*4882a593Smuzhiyun {
567*4882a593Smuzhiyun ia64_setreg(_IA64_REG_CR_LRR1, val);
568*4882a593Smuzhiyun ia64_srlz_d();
569*4882a593Smuzhiyun }
570*4882a593Smuzhiyun
571*4882a593Smuzhiyun
572*4882a593Smuzhiyun /*
573*4882a593Smuzhiyun * Given the address to which a spill occurred, return the unat bit
574*4882a593Smuzhiyun * number that corresponds to this address.
575*4882a593Smuzhiyun */
576*4882a593Smuzhiyun static inline __u64
ia64_unat_pos(void * spill_addr)577*4882a593Smuzhiyun ia64_unat_pos (void *spill_addr)
578*4882a593Smuzhiyun {
579*4882a593Smuzhiyun return ((__u64) spill_addr >> 3) & 0x3f;
580*4882a593Smuzhiyun }
581*4882a593Smuzhiyun
582*4882a593Smuzhiyun /*
583*4882a593Smuzhiyun * Set the NaT bit of an integer register which was spilled at address
584*4882a593Smuzhiyun * SPILL_ADDR. UNAT is the mask to be updated.
585*4882a593Smuzhiyun */
586*4882a593Smuzhiyun static inline void
ia64_set_unat(__u64 * unat,void * spill_addr,unsigned long nat)587*4882a593Smuzhiyun ia64_set_unat (__u64 *unat, void *spill_addr, unsigned long nat)
588*4882a593Smuzhiyun {
589*4882a593Smuzhiyun __u64 bit = ia64_unat_pos(spill_addr);
590*4882a593Smuzhiyun __u64 mask = 1UL << bit;
591*4882a593Smuzhiyun
592*4882a593Smuzhiyun *unat = (*unat & ~mask) | (nat << bit);
593*4882a593Smuzhiyun }
594*4882a593Smuzhiyun
595*4882a593Smuzhiyun static inline __u64
ia64_get_ivr(void)596*4882a593Smuzhiyun ia64_get_ivr (void)
597*4882a593Smuzhiyun {
598*4882a593Smuzhiyun __u64 r;
599*4882a593Smuzhiyun ia64_srlz_d();
600*4882a593Smuzhiyun r = ia64_getreg(_IA64_REG_CR_IVR);
601*4882a593Smuzhiyun ia64_srlz_d();
602*4882a593Smuzhiyun return r;
603*4882a593Smuzhiyun }
604*4882a593Smuzhiyun
605*4882a593Smuzhiyun static inline void
ia64_set_dbr(__u64 regnum,__u64 value)606*4882a593Smuzhiyun ia64_set_dbr (__u64 regnum, __u64 value)
607*4882a593Smuzhiyun {
608*4882a593Smuzhiyun __ia64_set_dbr(regnum, value);
609*4882a593Smuzhiyun #ifdef CONFIG_ITANIUM
610*4882a593Smuzhiyun ia64_srlz_d();
611*4882a593Smuzhiyun #endif
612*4882a593Smuzhiyun }
613*4882a593Smuzhiyun
614*4882a593Smuzhiyun static inline __u64
ia64_get_dbr(__u64 regnum)615*4882a593Smuzhiyun ia64_get_dbr (__u64 regnum)
616*4882a593Smuzhiyun {
617*4882a593Smuzhiyun __u64 retval;
618*4882a593Smuzhiyun
619*4882a593Smuzhiyun retval = __ia64_get_dbr(regnum);
620*4882a593Smuzhiyun #ifdef CONFIG_ITANIUM
621*4882a593Smuzhiyun ia64_srlz_d();
622*4882a593Smuzhiyun #endif
623*4882a593Smuzhiyun return retval;
624*4882a593Smuzhiyun }
625*4882a593Smuzhiyun
626*4882a593Smuzhiyun static inline __u64
ia64_rotr(__u64 w,__u64 n)627*4882a593Smuzhiyun ia64_rotr (__u64 w, __u64 n)
628*4882a593Smuzhiyun {
629*4882a593Smuzhiyun return (w >> n) | (w << (64 - n));
630*4882a593Smuzhiyun }
631*4882a593Smuzhiyun
632*4882a593Smuzhiyun #define ia64_rotl(w,n) ia64_rotr((w), (64) - (n))
633*4882a593Smuzhiyun
634*4882a593Smuzhiyun /*
635*4882a593Smuzhiyun * Take a mapped kernel address and return the equivalent address
636*4882a593Smuzhiyun * in the region 7 identity mapped virtual area.
637*4882a593Smuzhiyun */
638*4882a593Smuzhiyun static inline void *
ia64_imva(void * addr)639*4882a593Smuzhiyun ia64_imva (void *addr)
640*4882a593Smuzhiyun {
641*4882a593Smuzhiyun void *result;
642*4882a593Smuzhiyun result = (void *) ia64_tpa(addr);
643*4882a593Smuzhiyun return __va(result);
644*4882a593Smuzhiyun }
645*4882a593Smuzhiyun
646*4882a593Smuzhiyun #define ARCH_HAS_PREFETCH
647*4882a593Smuzhiyun #define ARCH_HAS_PREFETCHW
648*4882a593Smuzhiyun #define ARCH_HAS_SPINLOCK_PREFETCH
649*4882a593Smuzhiyun #define PREFETCH_STRIDE L1_CACHE_BYTES
650*4882a593Smuzhiyun
651*4882a593Smuzhiyun static inline void
prefetch(const void * x)652*4882a593Smuzhiyun prefetch (const void *x)
653*4882a593Smuzhiyun {
654*4882a593Smuzhiyun ia64_lfetch(ia64_lfhint_none, x);
655*4882a593Smuzhiyun }
656*4882a593Smuzhiyun
657*4882a593Smuzhiyun static inline void
prefetchw(const void * x)658*4882a593Smuzhiyun prefetchw (const void *x)
659*4882a593Smuzhiyun {
660*4882a593Smuzhiyun ia64_lfetch_excl(ia64_lfhint_none, x);
661*4882a593Smuzhiyun }
662*4882a593Smuzhiyun
663*4882a593Smuzhiyun #define spin_lock_prefetch(x) prefetchw(x)
664*4882a593Smuzhiyun
665*4882a593Smuzhiyun extern unsigned long boot_option_idle_override;
666*4882a593Smuzhiyun
667*4882a593Smuzhiyun enum idle_boot_override {IDLE_NO_OVERRIDE=0, IDLE_HALT, IDLE_FORCE_MWAIT,
668*4882a593Smuzhiyun IDLE_NOMWAIT, IDLE_POLL};
669*4882a593Smuzhiyun
670*4882a593Smuzhiyun void default_idle(void);
671*4882a593Smuzhiyun
672*4882a593Smuzhiyun #endif /* !__ASSEMBLY__ */
673*4882a593Smuzhiyun
674*4882a593Smuzhiyun #endif /* _ASM_IA64_PROCESSOR_H */
675