1*4882a593Smuzhiyun // SPDX-License-Identifier: GPL-2.0-or-later
2*4882a593Smuzhiyun /*
3*4882a593Smuzhiyun * GRU KERNEL MCS INSTRUCTIONS
4*4882a593Smuzhiyun *
5*4882a593Smuzhiyun * Copyright (c) 2008 Silicon Graphics, Inc. All Rights Reserved.
6*4882a593Smuzhiyun */
7*4882a593Smuzhiyun
8*4882a593Smuzhiyun #include <linux/kernel.h>
9*4882a593Smuzhiyun #include "gru.h"
10*4882a593Smuzhiyun #include "grulib.h"
11*4882a593Smuzhiyun #include "grutables.h"
12*4882a593Smuzhiyun
13*4882a593Smuzhiyun /* 10 sec */
14*4882a593Smuzhiyun #ifdef CONFIG_IA64
15*4882a593Smuzhiyun #include <asm/processor.h>
16*4882a593Smuzhiyun #define GRU_OPERATION_TIMEOUT (((cycles_t) local_cpu_data->itc_freq)*10)
17*4882a593Smuzhiyun #define CLKS2NSEC(c) ((c) *1000000000 / local_cpu_data->itc_freq)
18*4882a593Smuzhiyun #else
19*4882a593Smuzhiyun #include <linux/sync_core.h>
20*4882a593Smuzhiyun #include <asm/tsc.h>
21*4882a593Smuzhiyun #define GRU_OPERATION_TIMEOUT ((cycles_t) tsc_khz*10*1000)
22*4882a593Smuzhiyun #define CLKS2NSEC(c) ((c) * 1000000 / tsc_khz)
23*4882a593Smuzhiyun #endif
24*4882a593Smuzhiyun
/*
 * Extract the status field from a kernel handle.
 *
 * The handle is read as an unsigned long; the status is the 2-bit value
 * held in bits 16-17 of that first word.
 */
#define GET_MSEG_HANDLE_STATUS(h)	(((*(unsigned long *)(h)) >> 16) & 3)
27*4882a593Smuzhiyun
28*4882a593Smuzhiyun struct mcs_op_statistic mcs_op_statistics[mcsop_last];
29*4882a593Smuzhiyun
update_mcs_stats(enum mcs_op op,unsigned long clks)30*4882a593Smuzhiyun static void update_mcs_stats(enum mcs_op op, unsigned long clks)
31*4882a593Smuzhiyun {
32*4882a593Smuzhiyun unsigned long nsec;
33*4882a593Smuzhiyun
34*4882a593Smuzhiyun nsec = CLKS2NSEC(clks);
35*4882a593Smuzhiyun atomic_long_inc(&mcs_op_statistics[op].count);
36*4882a593Smuzhiyun atomic_long_add(nsec, &mcs_op_statistics[op].total);
37*4882a593Smuzhiyun if (mcs_op_statistics[op].max < nsec)
38*4882a593Smuzhiyun mcs_op_statistics[op].max = nsec;
39*4882a593Smuzhiyun }
40*4882a593Smuzhiyun
/*
 * Start the instruction that has been set up in handle @h.
 *
 * ORs 0x20001 (the CMD/STATUS bits) into the first word of the handle and
 * then flushes the handle from the cache.
 */
static void start_instruction(void *h)
{
	unsigned long *word0 = h;

	/*
	 * Setting CMD/STATUS bits must be last: order every earlier store
	 * to the handle ahead of the write below.
	 */
	wmb();
	*word0 |= 0x20001;
	gru_flush_cache(h);
}
49*4882a593Smuzhiyun
report_instruction_timeout(void * h)50*4882a593Smuzhiyun static void report_instruction_timeout(void *h)
51*4882a593Smuzhiyun {
52*4882a593Smuzhiyun unsigned long goff = GSEGPOFF((unsigned long)h);
53*4882a593Smuzhiyun char *id = "???";
54*4882a593Smuzhiyun
55*4882a593Smuzhiyun if (TYPE_IS(CCH, goff))
56*4882a593Smuzhiyun id = "CCH";
57*4882a593Smuzhiyun else if (TYPE_IS(TGH, goff))
58*4882a593Smuzhiyun id = "TGH";
59*4882a593Smuzhiyun else if (TYPE_IS(TFH, goff))
60*4882a593Smuzhiyun id = "TFH";
61*4882a593Smuzhiyun
62*4882a593Smuzhiyun panic(KERN_ALERT "GRU %p (%s) is malfunctioning\n", h, id);
63*4882a593Smuzhiyun }
64*4882a593Smuzhiyun
wait_instruction_complete(void * h,enum mcs_op opc)65*4882a593Smuzhiyun static int wait_instruction_complete(void *h, enum mcs_op opc)
66*4882a593Smuzhiyun {
67*4882a593Smuzhiyun int status;
68*4882a593Smuzhiyun unsigned long start_time = get_cycles();
69*4882a593Smuzhiyun
70*4882a593Smuzhiyun while (1) {
71*4882a593Smuzhiyun cpu_relax();
72*4882a593Smuzhiyun status = GET_MSEG_HANDLE_STATUS(h);
73*4882a593Smuzhiyun if (status != CCHSTATUS_ACTIVE)
74*4882a593Smuzhiyun break;
75*4882a593Smuzhiyun if (GRU_OPERATION_TIMEOUT < (get_cycles() - start_time)) {
76*4882a593Smuzhiyun report_instruction_timeout(h);
77*4882a593Smuzhiyun start_time = get_cycles();
78*4882a593Smuzhiyun }
79*4882a593Smuzhiyun }
80*4882a593Smuzhiyun if (gru_options & OPT_STATS)
81*4882a593Smuzhiyun update_mcs_stats(opc, get_cycles() - start_time);
82*4882a593Smuzhiyun return status;
83*4882a593Smuzhiyun }
84*4882a593Smuzhiyun
cch_allocate(struct gru_context_configuration_handle * cch)85*4882a593Smuzhiyun int cch_allocate(struct gru_context_configuration_handle *cch)
86*4882a593Smuzhiyun {
87*4882a593Smuzhiyun int ret;
88*4882a593Smuzhiyun
89*4882a593Smuzhiyun cch->opc = CCHOP_ALLOCATE;
90*4882a593Smuzhiyun start_instruction(cch);
91*4882a593Smuzhiyun ret = wait_instruction_complete(cch, cchop_allocate);
92*4882a593Smuzhiyun
93*4882a593Smuzhiyun /*
94*4882a593Smuzhiyun * Stop speculation into the GSEG being mapped by the previous ALLOCATE.
95*4882a593Smuzhiyun * The GSEG memory does not exist until the ALLOCATE completes.
96*4882a593Smuzhiyun */
97*4882a593Smuzhiyun sync_core();
98*4882a593Smuzhiyun return ret;
99*4882a593Smuzhiyun }
100*4882a593Smuzhiyun
cch_start(struct gru_context_configuration_handle * cch)101*4882a593Smuzhiyun int cch_start(struct gru_context_configuration_handle *cch)
102*4882a593Smuzhiyun {
103*4882a593Smuzhiyun cch->opc = CCHOP_START;
104*4882a593Smuzhiyun start_instruction(cch);
105*4882a593Smuzhiyun return wait_instruction_complete(cch, cchop_start);
106*4882a593Smuzhiyun }
107*4882a593Smuzhiyun
cch_interrupt(struct gru_context_configuration_handle * cch)108*4882a593Smuzhiyun int cch_interrupt(struct gru_context_configuration_handle *cch)
109*4882a593Smuzhiyun {
110*4882a593Smuzhiyun cch->opc = CCHOP_INTERRUPT;
111*4882a593Smuzhiyun start_instruction(cch);
112*4882a593Smuzhiyun return wait_instruction_complete(cch, cchop_interrupt);
113*4882a593Smuzhiyun }
114*4882a593Smuzhiyun
cch_deallocate(struct gru_context_configuration_handle * cch)115*4882a593Smuzhiyun int cch_deallocate(struct gru_context_configuration_handle *cch)
116*4882a593Smuzhiyun {
117*4882a593Smuzhiyun int ret;
118*4882a593Smuzhiyun
119*4882a593Smuzhiyun cch->opc = CCHOP_DEALLOCATE;
120*4882a593Smuzhiyun start_instruction(cch);
121*4882a593Smuzhiyun ret = wait_instruction_complete(cch, cchop_deallocate);
122*4882a593Smuzhiyun
123*4882a593Smuzhiyun /*
124*4882a593Smuzhiyun * Stop speculation into the GSEG being unmapped by the previous
125*4882a593Smuzhiyun * DEALLOCATE.
126*4882a593Smuzhiyun */
127*4882a593Smuzhiyun sync_core();
128*4882a593Smuzhiyun return ret;
129*4882a593Smuzhiyun }
130*4882a593Smuzhiyun
cch_interrupt_sync(struct gru_context_configuration_handle * cch)131*4882a593Smuzhiyun int cch_interrupt_sync(struct gru_context_configuration_handle
132*4882a593Smuzhiyun *cch)
133*4882a593Smuzhiyun {
134*4882a593Smuzhiyun cch->opc = CCHOP_INTERRUPT_SYNC;
135*4882a593Smuzhiyun start_instruction(cch);
136*4882a593Smuzhiyun return wait_instruction_complete(cch, cchop_interrupt_sync);
137*4882a593Smuzhiyun }
138*4882a593Smuzhiyun
tgh_invalidate(struct gru_tlb_global_handle * tgh,unsigned long vaddr,unsigned long vaddrmask,int asid,int pagesize,int global,int n,unsigned short ctxbitmap)139*4882a593Smuzhiyun int tgh_invalidate(struct gru_tlb_global_handle *tgh,
140*4882a593Smuzhiyun unsigned long vaddr, unsigned long vaddrmask,
141*4882a593Smuzhiyun int asid, int pagesize, int global, int n,
142*4882a593Smuzhiyun unsigned short ctxbitmap)
143*4882a593Smuzhiyun {
144*4882a593Smuzhiyun tgh->vaddr = vaddr;
145*4882a593Smuzhiyun tgh->asid = asid;
146*4882a593Smuzhiyun tgh->pagesize = pagesize;
147*4882a593Smuzhiyun tgh->n = n;
148*4882a593Smuzhiyun tgh->global = global;
149*4882a593Smuzhiyun tgh->vaddrmask = vaddrmask;
150*4882a593Smuzhiyun tgh->ctxbitmap = ctxbitmap;
151*4882a593Smuzhiyun tgh->opc = TGHOP_TLBINV;
152*4882a593Smuzhiyun start_instruction(tgh);
153*4882a593Smuzhiyun return wait_instruction_complete(tgh, tghop_invalidate);
154*4882a593Smuzhiyun }
155*4882a593Smuzhiyun
tfh_write_only(struct gru_tlb_fault_handle * tfh,unsigned long paddr,int gaa,unsigned long vaddr,int asid,int dirty,int pagesize)156*4882a593Smuzhiyun int tfh_write_only(struct gru_tlb_fault_handle *tfh,
157*4882a593Smuzhiyun unsigned long paddr, int gaa,
158*4882a593Smuzhiyun unsigned long vaddr, int asid, int dirty,
159*4882a593Smuzhiyun int pagesize)
160*4882a593Smuzhiyun {
161*4882a593Smuzhiyun tfh->fillasid = asid;
162*4882a593Smuzhiyun tfh->fillvaddr = vaddr;
163*4882a593Smuzhiyun tfh->pfn = paddr >> GRU_PADDR_SHIFT;
164*4882a593Smuzhiyun tfh->gaa = gaa;
165*4882a593Smuzhiyun tfh->dirty = dirty;
166*4882a593Smuzhiyun tfh->pagesize = pagesize;
167*4882a593Smuzhiyun tfh->opc = TFHOP_WRITE_ONLY;
168*4882a593Smuzhiyun start_instruction(tfh);
169*4882a593Smuzhiyun return wait_instruction_complete(tfh, tfhop_write_only);
170*4882a593Smuzhiyun }
171*4882a593Smuzhiyun
tfh_write_restart(struct gru_tlb_fault_handle * tfh,unsigned long paddr,int gaa,unsigned long vaddr,int asid,int dirty,int pagesize)172*4882a593Smuzhiyun void tfh_write_restart(struct gru_tlb_fault_handle *tfh,
173*4882a593Smuzhiyun unsigned long paddr, int gaa,
174*4882a593Smuzhiyun unsigned long vaddr, int asid, int dirty,
175*4882a593Smuzhiyun int pagesize)
176*4882a593Smuzhiyun {
177*4882a593Smuzhiyun tfh->fillasid = asid;
178*4882a593Smuzhiyun tfh->fillvaddr = vaddr;
179*4882a593Smuzhiyun tfh->pfn = paddr >> GRU_PADDR_SHIFT;
180*4882a593Smuzhiyun tfh->gaa = gaa;
181*4882a593Smuzhiyun tfh->dirty = dirty;
182*4882a593Smuzhiyun tfh->pagesize = pagesize;
183*4882a593Smuzhiyun tfh->opc = TFHOP_WRITE_RESTART;
184*4882a593Smuzhiyun start_instruction(tfh);
185*4882a593Smuzhiyun }
186*4882a593Smuzhiyun
tfh_user_polling_mode(struct gru_tlb_fault_handle * tfh)187*4882a593Smuzhiyun void tfh_user_polling_mode(struct gru_tlb_fault_handle *tfh)
188*4882a593Smuzhiyun {
189*4882a593Smuzhiyun tfh->opc = TFHOP_USER_POLLING_MODE;
190*4882a593Smuzhiyun start_instruction(tfh);
191*4882a593Smuzhiyun }
192*4882a593Smuzhiyun
tfh_exception(struct gru_tlb_fault_handle * tfh)193*4882a593Smuzhiyun void tfh_exception(struct gru_tlb_fault_handle *tfh)
194*4882a593Smuzhiyun {
195*4882a593Smuzhiyun tfh->opc = TFHOP_EXCEPTION;
196*4882a593Smuzhiyun start_instruction(tfh);
197*4882a593Smuzhiyun }
198*4882a593Smuzhiyun
199