1*4882a593Smuzhiyun // SPDX-License-Identifier: GPL-2.0-or-later
2*4882a593Smuzhiyun /*
3*4882a593Smuzhiyun * Freescale Embedded oprofile support, based on ppc64 oprofile support
4*4882a593Smuzhiyun * Copyright (C) 2004 Anton Blanchard <anton@au.ibm.com>, IBM
5*4882a593Smuzhiyun *
6*4882a593Smuzhiyun * Copyright (c) 2004, 2010 Freescale Semiconductor, Inc
7*4882a593Smuzhiyun *
8*4882a593Smuzhiyun * Author: Andy Fleming
9*4882a593Smuzhiyun * Maintainer: Kumar Gala <galak@kernel.crashing.org>
10*4882a593Smuzhiyun */
11*4882a593Smuzhiyun
12*4882a593Smuzhiyun #include <linux/oprofile.h>
13*4882a593Smuzhiyun #include <linux/smp.h>
14*4882a593Smuzhiyun #include <asm/ptrace.h>
15*4882a593Smuzhiyun #include <asm/processor.h>
16*4882a593Smuzhiyun #include <asm/cputable.h>
17*4882a593Smuzhiyun #include <asm/reg_fsl_emb.h>
18*4882a593Smuzhiyun #include <asm/page.h>
19*4882a593Smuzhiyun #include <asm/pmc.h>
20*4882a593Smuzhiyun #include <asm/oprofile_impl.h>
21*4882a593Smuzhiyun
22*4882a593Smuzhiyun static unsigned long reset_value[OP_MAX_COUNTER];
23*4882a593Smuzhiyun
24*4882a593Smuzhiyun static int num_counters;
25*4882a593Smuzhiyun static int oprofile_running;
26*4882a593Smuzhiyun
get_pmlca(int ctr)27*4882a593Smuzhiyun static inline u32 get_pmlca(int ctr)
28*4882a593Smuzhiyun {
29*4882a593Smuzhiyun u32 pmlca;
30*4882a593Smuzhiyun
31*4882a593Smuzhiyun switch (ctr) {
32*4882a593Smuzhiyun case 0:
33*4882a593Smuzhiyun pmlca = mfpmr(PMRN_PMLCA0);
34*4882a593Smuzhiyun break;
35*4882a593Smuzhiyun case 1:
36*4882a593Smuzhiyun pmlca = mfpmr(PMRN_PMLCA1);
37*4882a593Smuzhiyun break;
38*4882a593Smuzhiyun case 2:
39*4882a593Smuzhiyun pmlca = mfpmr(PMRN_PMLCA2);
40*4882a593Smuzhiyun break;
41*4882a593Smuzhiyun case 3:
42*4882a593Smuzhiyun pmlca = mfpmr(PMRN_PMLCA3);
43*4882a593Smuzhiyun break;
44*4882a593Smuzhiyun case 4:
45*4882a593Smuzhiyun pmlca = mfpmr(PMRN_PMLCA4);
46*4882a593Smuzhiyun break;
47*4882a593Smuzhiyun case 5:
48*4882a593Smuzhiyun pmlca = mfpmr(PMRN_PMLCA5);
49*4882a593Smuzhiyun break;
50*4882a593Smuzhiyun default:
51*4882a593Smuzhiyun panic("Bad ctr number\n");
52*4882a593Smuzhiyun }
53*4882a593Smuzhiyun
54*4882a593Smuzhiyun return pmlca;
55*4882a593Smuzhiyun }
56*4882a593Smuzhiyun
set_pmlca(int ctr,u32 pmlca)57*4882a593Smuzhiyun static inline void set_pmlca(int ctr, u32 pmlca)
58*4882a593Smuzhiyun {
59*4882a593Smuzhiyun switch (ctr) {
60*4882a593Smuzhiyun case 0:
61*4882a593Smuzhiyun mtpmr(PMRN_PMLCA0, pmlca);
62*4882a593Smuzhiyun break;
63*4882a593Smuzhiyun case 1:
64*4882a593Smuzhiyun mtpmr(PMRN_PMLCA1, pmlca);
65*4882a593Smuzhiyun break;
66*4882a593Smuzhiyun case 2:
67*4882a593Smuzhiyun mtpmr(PMRN_PMLCA2, pmlca);
68*4882a593Smuzhiyun break;
69*4882a593Smuzhiyun case 3:
70*4882a593Smuzhiyun mtpmr(PMRN_PMLCA3, pmlca);
71*4882a593Smuzhiyun break;
72*4882a593Smuzhiyun case 4:
73*4882a593Smuzhiyun mtpmr(PMRN_PMLCA4, pmlca);
74*4882a593Smuzhiyun break;
75*4882a593Smuzhiyun case 5:
76*4882a593Smuzhiyun mtpmr(PMRN_PMLCA5, pmlca);
77*4882a593Smuzhiyun break;
78*4882a593Smuzhiyun default:
79*4882a593Smuzhiyun panic("Bad ctr number\n");
80*4882a593Smuzhiyun }
81*4882a593Smuzhiyun }
82*4882a593Smuzhiyun
ctr_read(unsigned int i)83*4882a593Smuzhiyun static inline unsigned int ctr_read(unsigned int i)
84*4882a593Smuzhiyun {
85*4882a593Smuzhiyun switch(i) {
86*4882a593Smuzhiyun case 0:
87*4882a593Smuzhiyun return mfpmr(PMRN_PMC0);
88*4882a593Smuzhiyun case 1:
89*4882a593Smuzhiyun return mfpmr(PMRN_PMC1);
90*4882a593Smuzhiyun case 2:
91*4882a593Smuzhiyun return mfpmr(PMRN_PMC2);
92*4882a593Smuzhiyun case 3:
93*4882a593Smuzhiyun return mfpmr(PMRN_PMC3);
94*4882a593Smuzhiyun case 4:
95*4882a593Smuzhiyun return mfpmr(PMRN_PMC4);
96*4882a593Smuzhiyun case 5:
97*4882a593Smuzhiyun return mfpmr(PMRN_PMC5);
98*4882a593Smuzhiyun default:
99*4882a593Smuzhiyun return 0;
100*4882a593Smuzhiyun }
101*4882a593Smuzhiyun }
102*4882a593Smuzhiyun
ctr_write(unsigned int i,unsigned int val)103*4882a593Smuzhiyun static inline void ctr_write(unsigned int i, unsigned int val)
104*4882a593Smuzhiyun {
105*4882a593Smuzhiyun switch(i) {
106*4882a593Smuzhiyun case 0:
107*4882a593Smuzhiyun mtpmr(PMRN_PMC0, val);
108*4882a593Smuzhiyun break;
109*4882a593Smuzhiyun case 1:
110*4882a593Smuzhiyun mtpmr(PMRN_PMC1, val);
111*4882a593Smuzhiyun break;
112*4882a593Smuzhiyun case 2:
113*4882a593Smuzhiyun mtpmr(PMRN_PMC2, val);
114*4882a593Smuzhiyun break;
115*4882a593Smuzhiyun case 3:
116*4882a593Smuzhiyun mtpmr(PMRN_PMC3, val);
117*4882a593Smuzhiyun break;
118*4882a593Smuzhiyun case 4:
119*4882a593Smuzhiyun mtpmr(PMRN_PMC4, val);
120*4882a593Smuzhiyun break;
121*4882a593Smuzhiyun case 5:
122*4882a593Smuzhiyun mtpmr(PMRN_PMC5, val);
123*4882a593Smuzhiyun break;
124*4882a593Smuzhiyun default:
125*4882a593Smuzhiyun break;
126*4882a593Smuzhiyun }
127*4882a593Smuzhiyun }
128*4882a593Smuzhiyun
129*4882a593Smuzhiyun
init_pmc_stop(int ctr)130*4882a593Smuzhiyun static void init_pmc_stop(int ctr)
131*4882a593Smuzhiyun {
132*4882a593Smuzhiyun u32 pmlca = (PMLCA_FC | PMLCA_FCS | PMLCA_FCU |
133*4882a593Smuzhiyun PMLCA_FCM1 | PMLCA_FCM0);
134*4882a593Smuzhiyun u32 pmlcb = 0;
135*4882a593Smuzhiyun
136*4882a593Smuzhiyun switch (ctr) {
137*4882a593Smuzhiyun case 0:
138*4882a593Smuzhiyun mtpmr(PMRN_PMLCA0, pmlca);
139*4882a593Smuzhiyun mtpmr(PMRN_PMLCB0, pmlcb);
140*4882a593Smuzhiyun break;
141*4882a593Smuzhiyun case 1:
142*4882a593Smuzhiyun mtpmr(PMRN_PMLCA1, pmlca);
143*4882a593Smuzhiyun mtpmr(PMRN_PMLCB1, pmlcb);
144*4882a593Smuzhiyun break;
145*4882a593Smuzhiyun case 2:
146*4882a593Smuzhiyun mtpmr(PMRN_PMLCA2, pmlca);
147*4882a593Smuzhiyun mtpmr(PMRN_PMLCB2, pmlcb);
148*4882a593Smuzhiyun break;
149*4882a593Smuzhiyun case 3:
150*4882a593Smuzhiyun mtpmr(PMRN_PMLCA3, pmlca);
151*4882a593Smuzhiyun mtpmr(PMRN_PMLCB3, pmlcb);
152*4882a593Smuzhiyun break;
153*4882a593Smuzhiyun case 4:
154*4882a593Smuzhiyun mtpmr(PMRN_PMLCA4, pmlca);
155*4882a593Smuzhiyun mtpmr(PMRN_PMLCB4, pmlcb);
156*4882a593Smuzhiyun break;
157*4882a593Smuzhiyun case 5:
158*4882a593Smuzhiyun mtpmr(PMRN_PMLCA5, pmlca);
159*4882a593Smuzhiyun mtpmr(PMRN_PMLCB5, pmlcb);
160*4882a593Smuzhiyun break;
161*4882a593Smuzhiyun default:
162*4882a593Smuzhiyun panic("Bad ctr number!\n");
163*4882a593Smuzhiyun }
164*4882a593Smuzhiyun }
165*4882a593Smuzhiyun
set_pmc_event(int ctr,int event)166*4882a593Smuzhiyun static void set_pmc_event(int ctr, int event)
167*4882a593Smuzhiyun {
168*4882a593Smuzhiyun u32 pmlca;
169*4882a593Smuzhiyun
170*4882a593Smuzhiyun pmlca = get_pmlca(ctr);
171*4882a593Smuzhiyun
172*4882a593Smuzhiyun pmlca = (pmlca & ~PMLCA_EVENT_MASK) |
173*4882a593Smuzhiyun ((event << PMLCA_EVENT_SHIFT) &
174*4882a593Smuzhiyun PMLCA_EVENT_MASK);
175*4882a593Smuzhiyun
176*4882a593Smuzhiyun set_pmlca(ctr, pmlca);
177*4882a593Smuzhiyun }
178*4882a593Smuzhiyun
set_pmc_user_kernel(int ctr,int user,int kernel)179*4882a593Smuzhiyun static void set_pmc_user_kernel(int ctr, int user, int kernel)
180*4882a593Smuzhiyun {
181*4882a593Smuzhiyun u32 pmlca;
182*4882a593Smuzhiyun
183*4882a593Smuzhiyun pmlca = get_pmlca(ctr);
184*4882a593Smuzhiyun
185*4882a593Smuzhiyun if(user)
186*4882a593Smuzhiyun pmlca &= ~PMLCA_FCU;
187*4882a593Smuzhiyun else
188*4882a593Smuzhiyun pmlca |= PMLCA_FCU;
189*4882a593Smuzhiyun
190*4882a593Smuzhiyun if(kernel)
191*4882a593Smuzhiyun pmlca &= ~PMLCA_FCS;
192*4882a593Smuzhiyun else
193*4882a593Smuzhiyun pmlca |= PMLCA_FCS;
194*4882a593Smuzhiyun
195*4882a593Smuzhiyun set_pmlca(ctr, pmlca);
196*4882a593Smuzhiyun }
197*4882a593Smuzhiyun
set_pmc_marked(int ctr,int mark0,int mark1)198*4882a593Smuzhiyun static void set_pmc_marked(int ctr, int mark0, int mark1)
199*4882a593Smuzhiyun {
200*4882a593Smuzhiyun u32 pmlca = get_pmlca(ctr);
201*4882a593Smuzhiyun
202*4882a593Smuzhiyun if(mark0)
203*4882a593Smuzhiyun pmlca &= ~PMLCA_FCM0;
204*4882a593Smuzhiyun else
205*4882a593Smuzhiyun pmlca |= PMLCA_FCM0;
206*4882a593Smuzhiyun
207*4882a593Smuzhiyun if(mark1)
208*4882a593Smuzhiyun pmlca &= ~PMLCA_FCM1;
209*4882a593Smuzhiyun else
210*4882a593Smuzhiyun pmlca |= PMLCA_FCM1;
211*4882a593Smuzhiyun
212*4882a593Smuzhiyun set_pmlca(ctr, pmlca);
213*4882a593Smuzhiyun }
214*4882a593Smuzhiyun
pmc_start_ctr(int ctr,int enable)215*4882a593Smuzhiyun static void pmc_start_ctr(int ctr, int enable)
216*4882a593Smuzhiyun {
217*4882a593Smuzhiyun u32 pmlca = get_pmlca(ctr);
218*4882a593Smuzhiyun
219*4882a593Smuzhiyun pmlca &= ~PMLCA_FC;
220*4882a593Smuzhiyun
221*4882a593Smuzhiyun if (enable)
222*4882a593Smuzhiyun pmlca |= PMLCA_CE;
223*4882a593Smuzhiyun else
224*4882a593Smuzhiyun pmlca &= ~PMLCA_CE;
225*4882a593Smuzhiyun
226*4882a593Smuzhiyun set_pmlca(ctr, pmlca);
227*4882a593Smuzhiyun }
228*4882a593Smuzhiyun
pmc_start_ctrs(int enable)229*4882a593Smuzhiyun static void pmc_start_ctrs(int enable)
230*4882a593Smuzhiyun {
231*4882a593Smuzhiyun u32 pmgc0 = mfpmr(PMRN_PMGC0);
232*4882a593Smuzhiyun
233*4882a593Smuzhiyun pmgc0 &= ~PMGC0_FAC;
234*4882a593Smuzhiyun pmgc0 |= PMGC0_FCECE;
235*4882a593Smuzhiyun
236*4882a593Smuzhiyun if (enable)
237*4882a593Smuzhiyun pmgc0 |= PMGC0_PMIE;
238*4882a593Smuzhiyun else
239*4882a593Smuzhiyun pmgc0 &= ~PMGC0_PMIE;
240*4882a593Smuzhiyun
241*4882a593Smuzhiyun mtpmr(PMRN_PMGC0, pmgc0);
242*4882a593Smuzhiyun }
243*4882a593Smuzhiyun
pmc_stop_ctrs(void)244*4882a593Smuzhiyun static void pmc_stop_ctrs(void)
245*4882a593Smuzhiyun {
246*4882a593Smuzhiyun u32 pmgc0 = mfpmr(PMRN_PMGC0);
247*4882a593Smuzhiyun
248*4882a593Smuzhiyun pmgc0 |= PMGC0_FAC;
249*4882a593Smuzhiyun
250*4882a593Smuzhiyun pmgc0 &= ~(PMGC0_PMIE | PMGC0_FCECE);
251*4882a593Smuzhiyun
252*4882a593Smuzhiyun mtpmr(PMRN_PMGC0, pmgc0);
253*4882a593Smuzhiyun }
254*4882a593Smuzhiyun
fsl_emb_cpu_setup(struct op_counter_config * ctr)255*4882a593Smuzhiyun static int fsl_emb_cpu_setup(struct op_counter_config *ctr)
256*4882a593Smuzhiyun {
257*4882a593Smuzhiyun int i;
258*4882a593Smuzhiyun
259*4882a593Smuzhiyun /* freeze all counters */
260*4882a593Smuzhiyun pmc_stop_ctrs();
261*4882a593Smuzhiyun
262*4882a593Smuzhiyun for (i = 0;i < num_counters;i++) {
263*4882a593Smuzhiyun init_pmc_stop(i);
264*4882a593Smuzhiyun
265*4882a593Smuzhiyun set_pmc_event(i, ctr[i].event);
266*4882a593Smuzhiyun
267*4882a593Smuzhiyun set_pmc_user_kernel(i, ctr[i].user, ctr[i].kernel);
268*4882a593Smuzhiyun }
269*4882a593Smuzhiyun
270*4882a593Smuzhiyun return 0;
271*4882a593Smuzhiyun }
272*4882a593Smuzhiyun
fsl_emb_reg_setup(struct op_counter_config * ctr,struct op_system_config * sys,int num_ctrs)273*4882a593Smuzhiyun static int fsl_emb_reg_setup(struct op_counter_config *ctr,
274*4882a593Smuzhiyun struct op_system_config *sys,
275*4882a593Smuzhiyun int num_ctrs)
276*4882a593Smuzhiyun {
277*4882a593Smuzhiyun int i;
278*4882a593Smuzhiyun
279*4882a593Smuzhiyun num_counters = num_ctrs;
280*4882a593Smuzhiyun
281*4882a593Smuzhiyun /* Our counters count up, and "count" refers to
282*4882a593Smuzhiyun * how much before the next interrupt, and we interrupt
283*4882a593Smuzhiyun * on overflow. So we calculate the starting value
284*4882a593Smuzhiyun * which will give us "count" until overflow.
285*4882a593Smuzhiyun * Then we set the events on the enabled counters */
286*4882a593Smuzhiyun for (i = 0; i < num_counters; ++i)
287*4882a593Smuzhiyun reset_value[i] = 0x80000000UL - ctr[i].count;
288*4882a593Smuzhiyun
289*4882a593Smuzhiyun return 0;
290*4882a593Smuzhiyun }
291*4882a593Smuzhiyun
fsl_emb_start(struct op_counter_config * ctr)292*4882a593Smuzhiyun static int fsl_emb_start(struct op_counter_config *ctr)
293*4882a593Smuzhiyun {
294*4882a593Smuzhiyun int i;
295*4882a593Smuzhiyun
296*4882a593Smuzhiyun mtmsr(mfmsr() | MSR_PMM);
297*4882a593Smuzhiyun
298*4882a593Smuzhiyun for (i = 0; i < num_counters; ++i) {
299*4882a593Smuzhiyun if (ctr[i].enabled) {
300*4882a593Smuzhiyun ctr_write(i, reset_value[i]);
301*4882a593Smuzhiyun /* Set each enabled counter to only
302*4882a593Smuzhiyun * count when the Mark bit is *not* set */
303*4882a593Smuzhiyun set_pmc_marked(i, 1, 0);
304*4882a593Smuzhiyun pmc_start_ctr(i, 1);
305*4882a593Smuzhiyun } else {
306*4882a593Smuzhiyun ctr_write(i, 0);
307*4882a593Smuzhiyun
308*4882a593Smuzhiyun /* Set the ctr to be stopped */
309*4882a593Smuzhiyun pmc_start_ctr(i, 0);
310*4882a593Smuzhiyun }
311*4882a593Smuzhiyun }
312*4882a593Smuzhiyun
313*4882a593Smuzhiyun /* Clear the freeze bit, and enable the interrupt.
314*4882a593Smuzhiyun * The counters won't actually start until the rfi clears
315*4882a593Smuzhiyun * the PMM bit */
316*4882a593Smuzhiyun pmc_start_ctrs(1);
317*4882a593Smuzhiyun
318*4882a593Smuzhiyun oprofile_running = 1;
319*4882a593Smuzhiyun
320*4882a593Smuzhiyun pr_debug("start on cpu %d, pmgc0 %x\n", smp_processor_id(),
321*4882a593Smuzhiyun mfpmr(PMRN_PMGC0));
322*4882a593Smuzhiyun
323*4882a593Smuzhiyun return 0;
324*4882a593Smuzhiyun }
325*4882a593Smuzhiyun
fsl_emb_stop(void)326*4882a593Smuzhiyun static void fsl_emb_stop(void)
327*4882a593Smuzhiyun {
328*4882a593Smuzhiyun /* freeze counters */
329*4882a593Smuzhiyun pmc_stop_ctrs();
330*4882a593Smuzhiyun
331*4882a593Smuzhiyun oprofile_running = 0;
332*4882a593Smuzhiyun
333*4882a593Smuzhiyun pr_debug("stop on cpu %d, pmgc0 %x\n", smp_processor_id(),
334*4882a593Smuzhiyun mfpmr(PMRN_PMGC0));
335*4882a593Smuzhiyun
336*4882a593Smuzhiyun mb();
337*4882a593Smuzhiyun }
338*4882a593Smuzhiyun
339*4882a593Smuzhiyun
fsl_emb_handle_interrupt(struct pt_regs * regs,struct op_counter_config * ctr)340*4882a593Smuzhiyun static void fsl_emb_handle_interrupt(struct pt_regs *regs,
341*4882a593Smuzhiyun struct op_counter_config *ctr)
342*4882a593Smuzhiyun {
343*4882a593Smuzhiyun unsigned long pc;
344*4882a593Smuzhiyun int is_kernel;
345*4882a593Smuzhiyun int val;
346*4882a593Smuzhiyun int i;
347*4882a593Smuzhiyun
348*4882a593Smuzhiyun pc = regs->nip;
349*4882a593Smuzhiyun is_kernel = is_kernel_addr(pc);
350*4882a593Smuzhiyun
351*4882a593Smuzhiyun for (i = 0; i < num_counters; ++i) {
352*4882a593Smuzhiyun val = ctr_read(i);
353*4882a593Smuzhiyun if (val < 0) {
354*4882a593Smuzhiyun if (oprofile_running && ctr[i].enabled) {
355*4882a593Smuzhiyun oprofile_add_ext_sample(pc, regs, i, is_kernel);
356*4882a593Smuzhiyun ctr_write(i, reset_value[i]);
357*4882a593Smuzhiyun } else {
358*4882a593Smuzhiyun ctr_write(i, 0);
359*4882a593Smuzhiyun }
360*4882a593Smuzhiyun }
361*4882a593Smuzhiyun }
362*4882a593Smuzhiyun
363*4882a593Smuzhiyun /* The freeze bit was set by the interrupt. */
364*4882a593Smuzhiyun /* Clear the freeze bit, and reenable the interrupt. The
365*4882a593Smuzhiyun * counters won't actually start until the rfi clears the PMM
366*4882a593Smuzhiyun * bit. The PMM bit should not be set until after the interrupt
367*4882a593Smuzhiyun * is cleared to avoid it getting lost in some hypervisor
368*4882a593Smuzhiyun * environments.
369*4882a593Smuzhiyun */
370*4882a593Smuzhiyun mtmsr(mfmsr() | MSR_PMM);
371*4882a593Smuzhiyun pmc_start_ctrs(1);
372*4882a593Smuzhiyun }
373*4882a593Smuzhiyun
374*4882a593Smuzhiyun struct op_powerpc_model op_model_fsl_emb = {
375*4882a593Smuzhiyun .reg_setup = fsl_emb_reg_setup,
376*4882a593Smuzhiyun .cpu_setup = fsl_emb_cpu_setup,
377*4882a593Smuzhiyun .start = fsl_emb_start,
378*4882a593Smuzhiyun .stop = fsl_emb_stop,
379*4882a593Smuzhiyun .handle_interrupt = fsl_emb_handle_interrupt,
380*4882a593Smuzhiyun };
381