xref: /OK3568_Linux_fs/kernel/arch/mips/oprofile/op_model_loongson3.c (revision 4882a59341e53eb6f0b4789bf948001014eff981)
1*4882a593Smuzhiyun /*
2*4882a593Smuzhiyun  * This file is subject to the terms and conditions of the GNU General Public
3*4882a593Smuzhiyun  * License.  See the file "COPYING" in the main directory of this archive
4*4882a593Smuzhiyun  * for more details.
5*4882a593Smuzhiyun  *
6*4882a593Smuzhiyun  */
7*4882a593Smuzhiyun #include <linux/init.h>
8*4882a593Smuzhiyun #include <linux/cpu.h>
9*4882a593Smuzhiyun #include <linux/smp.h>
10*4882a593Smuzhiyun #include <linux/proc_fs.h>
11*4882a593Smuzhiyun #include <linux/oprofile.h>
12*4882a593Smuzhiyun #include <linux/spinlock.h>
13*4882a593Smuzhiyun #include <linux/interrupt.h>
14*4882a593Smuzhiyun #include <linux/uaccess.h>
15*4882a593Smuzhiyun #include <irq.h>
16*4882a593Smuzhiyun #include <loongson.h>
17*4882a593Smuzhiyun #include "op_impl.h"
18*4882a593Smuzhiyun 
19*4882a593Smuzhiyun #define LOONGSON3_PERFCNT_OVERFLOW	(1ULL << 63)
20*4882a593Smuzhiyun 
21*4882a593Smuzhiyun #define LOONGSON3_PERFCTRL_EXL		(1UL << 0)
22*4882a593Smuzhiyun #define LOONGSON3_PERFCTRL_KERNEL	(1UL << 1)
23*4882a593Smuzhiyun #define LOONGSON3_PERFCTRL_SUPERVISOR	(1UL << 2)
24*4882a593Smuzhiyun #define LOONGSON3_PERFCTRL_USER		(1UL << 3)
25*4882a593Smuzhiyun #define LOONGSON3_PERFCTRL_ENABLE	(1UL << 4)
26*4882a593Smuzhiyun #define LOONGSON3_PERFCTRL_W		(1UL << 30)
27*4882a593Smuzhiyun #define LOONGSON3_PERFCTRL_M		(1UL << 31)
28*4882a593Smuzhiyun #define LOONGSON3_PERFCTRL_EVENT(idx, event) \
29*4882a593Smuzhiyun 	(((event) & (idx ? 0x0f : 0x3f)) << 5)
30*4882a593Smuzhiyun 
31*4882a593Smuzhiyun /* Loongson-3 PerfCount performance counter1 register */
32*4882a593Smuzhiyun #define read_c0_perflo1() __read_64bit_c0_register($25, 0)
33*4882a593Smuzhiyun #define write_c0_perflo1(val) __write_64bit_c0_register($25, 0, val)
34*4882a593Smuzhiyun #define read_c0_perfhi1() __read_64bit_c0_register($25, 1)
35*4882a593Smuzhiyun #define write_c0_perfhi1(val) __write_64bit_c0_register($25, 1, val)
36*4882a593Smuzhiyun 
37*4882a593Smuzhiyun /* Loongson-3 PerfCount performance counter2 register */
38*4882a593Smuzhiyun #define read_c0_perflo2() __read_64bit_c0_register($25, 2)
39*4882a593Smuzhiyun #define write_c0_perflo2(val) __write_64bit_c0_register($25, 2, val)
40*4882a593Smuzhiyun #define read_c0_perfhi2() __read_64bit_c0_register($25, 3)
41*4882a593Smuzhiyun #define write_c0_perfhi2(val) __write_64bit_c0_register($25, 3, val)
42*4882a593Smuzhiyun 
43*4882a593Smuzhiyun static int (*save_perf_irq)(void);
44*4882a593Smuzhiyun 
45*4882a593Smuzhiyun static struct loongson3_register_config {
46*4882a593Smuzhiyun 	unsigned int control1;
47*4882a593Smuzhiyun 	unsigned int control2;
48*4882a593Smuzhiyun 	unsigned long long reset_counter1;
49*4882a593Smuzhiyun 	unsigned long long reset_counter2;
50*4882a593Smuzhiyun 	int ctr1_enable, ctr2_enable;
51*4882a593Smuzhiyun } reg;
52*4882a593Smuzhiyun 
reset_counters(void * arg)53*4882a593Smuzhiyun static void reset_counters(void *arg)
54*4882a593Smuzhiyun {
55*4882a593Smuzhiyun 	write_c0_perfhi1(0);
56*4882a593Smuzhiyun 	write_c0_perfhi2(0);
57*4882a593Smuzhiyun 	write_c0_perflo1(0xc0000000);
58*4882a593Smuzhiyun 	write_c0_perflo2(0x40000000);
59*4882a593Smuzhiyun }
60*4882a593Smuzhiyun 
61*4882a593Smuzhiyun /* Compute all of the registers in preparation for enabling profiling. */
loongson3_reg_setup(struct op_counter_config * ctr)62*4882a593Smuzhiyun static void loongson3_reg_setup(struct op_counter_config *ctr)
63*4882a593Smuzhiyun {
64*4882a593Smuzhiyun 	unsigned int control1 = 0;
65*4882a593Smuzhiyun 	unsigned int control2 = 0;
66*4882a593Smuzhiyun 
67*4882a593Smuzhiyun 	reg.reset_counter1 = 0;
68*4882a593Smuzhiyun 	reg.reset_counter2 = 0;
69*4882a593Smuzhiyun 	/* Compute the performance counter control word. */
70*4882a593Smuzhiyun 	/* For now count kernel and user mode */
71*4882a593Smuzhiyun 	if (ctr[0].enabled) {
72*4882a593Smuzhiyun 		control1 |= LOONGSON3_PERFCTRL_EVENT(0, ctr[0].event) |
73*4882a593Smuzhiyun 					LOONGSON3_PERFCTRL_ENABLE;
74*4882a593Smuzhiyun 		if (ctr[0].kernel)
75*4882a593Smuzhiyun 			control1 |= LOONGSON3_PERFCTRL_KERNEL;
76*4882a593Smuzhiyun 		if (ctr[0].user)
77*4882a593Smuzhiyun 			control1 |= LOONGSON3_PERFCTRL_USER;
78*4882a593Smuzhiyun 		reg.reset_counter1 = 0x8000000000000000ULL - ctr[0].count;
79*4882a593Smuzhiyun 	}
80*4882a593Smuzhiyun 
81*4882a593Smuzhiyun 	if (ctr[1].enabled) {
82*4882a593Smuzhiyun 		control2 |= LOONGSON3_PERFCTRL_EVENT(1, ctr[1].event) |
83*4882a593Smuzhiyun 					LOONGSON3_PERFCTRL_ENABLE;
84*4882a593Smuzhiyun 		if (ctr[1].kernel)
85*4882a593Smuzhiyun 			control2 |= LOONGSON3_PERFCTRL_KERNEL;
86*4882a593Smuzhiyun 		if (ctr[1].user)
87*4882a593Smuzhiyun 			control2 |= LOONGSON3_PERFCTRL_USER;
88*4882a593Smuzhiyun 		reg.reset_counter2 = 0x8000000000000000ULL - ctr[1].count;
89*4882a593Smuzhiyun 	}
90*4882a593Smuzhiyun 
91*4882a593Smuzhiyun 	if (ctr[0].enabled)
92*4882a593Smuzhiyun 		control1 |= LOONGSON3_PERFCTRL_EXL;
93*4882a593Smuzhiyun 	if (ctr[1].enabled)
94*4882a593Smuzhiyun 		control2 |= LOONGSON3_PERFCTRL_EXL;
95*4882a593Smuzhiyun 
96*4882a593Smuzhiyun 	reg.control1 = control1;
97*4882a593Smuzhiyun 	reg.control2 = control2;
98*4882a593Smuzhiyun 	reg.ctr1_enable = ctr[0].enabled;
99*4882a593Smuzhiyun 	reg.ctr2_enable = ctr[1].enabled;
100*4882a593Smuzhiyun }
101*4882a593Smuzhiyun 
102*4882a593Smuzhiyun /* Program all of the registers in preparation for enabling profiling. */
loongson3_cpu_setup(void * args)103*4882a593Smuzhiyun static void loongson3_cpu_setup(void *args)
104*4882a593Smuzhiyun {
105*4882a593Smuzhiyun 	uint64_t perfcount1, perfcount2;
106*4882a593Smuzhiyun 
107*4882a593Smuzhiyun 	perfcount1 = reg.reset_counter1;
108*4882a593Smuzhiyun 	perfcount2 = reg.reset_counter2;
109*4882a593Smuzhiyun 	write_c0_perfhi1(perfcount1);
110*4882a593Smuzhiyun 	write_c0_perfhi2(perfcount2);
111*4882a593Smuzhiyun }
112*4882a593Smuzhiyun 
loongson3_cpu_start(void * args)113*4882a593Smuzhiyun static void loongson3_cpu_start(void *args)
114*4882a593Smuzhiyun {
115*4882a593Smuzhiyun 	/* Start all counters on current CPU */
116*4882a593Smuzhiyun 	reg.control1 |= (LOONGSON3_PERFCTRL_W|LOONGSON3_PERFCTRL_M);
117*4882a593Smuzhiyun 	reg.control2 |= (LOONGSON3_PERFCTRL_W|LOONGSON3_PERFCTRL_M);
118*4882a593Smuzhiyun 
119*4882a593Smuzhiyun 	if (reg.ctr1_enable)
120*4882a593Smuzhiyun 		write_c0_perflo1(reg.control1);
121*4882a593Smuzhiyun 	if (reg.ctr2_enable)
122*4882a593Smuzhiyun 		write_c0_perflo2(reg.control2);
123*4882a593Smuzhiyun }
124*4882a593Smuzhiyun 
loongson3_cpu_stop(void * args)125*4882a593Smuzhiyun static void loongson3_cpu_stop(void *args)
126*4882a593Smuzhiyun {
127*4882a593Smuzhiyun 	/* Stop all counters on current CPU */
128*4882a593Smuzhiyun 	write_c0_perflo1(0xc0000000);
129*4882a593Smuzhiyun 	write_c0_perflo2(0x40000000);
130*4882a593Smuzhiyun 	memset(&reg, 0, sizeof(reg));
131*4882a593Smuzhiyun }
132*4882a593Smuzhiyun 
loongson3_perfcount_handler(void)133*4882a593Smuzhiyun static int loongson3_perfcount_handler(void)
134*4882a593Smuzhiyun {
135*4882a593Smuzhiyun 	unsigned long flags;
136*4882a593Smuzhiyun 	uint64_t counter1, counter2;
137*4882a593Smuzhiyun 	uint32_t cause, handled = IRQ_NONE;
138*4882a593Smuzhiyun 	struct pt_regs *regs = get_irq_regs();
139*4882a593Smuzhiyun 
140*4882a593Smuzhiyun 	cause = read_c0_cause();
141*4882a593Smuzhiyun 	if (!(cause & CAUSEF_PCI))
142*4882a593Smuzhiyun 		return handled;
143*4882a593Smuzhiyun 
144*4882a593Smuzhiyun 	counter1 = read_c0_perfhi1();
145*4882a593Smuzhiyun 	counter2 = read_c0_perfhi2();
146*4882a593Smuzhiyun 
147*4882a593Smuzhiyun 	local_irq_save(flags);
148*4882a593Smuzhiyun 
149*4882a593Smuzhiyun 	if (counter1 & LOONGSON3_PERFCNT_OVERFLOW) {
150*4882a593Smuzhiyun 		if (reg.ctr1_enable)
151*4882a593Smuzhiyun 			oprofile_add_sample(regs, 0);
152*4882a593Smuzhiyun 		counter1 = reg.reset_counter1;
153*4882a593Smuzhiyun 	}
154*4882a593Smuzhiyun 	if (counter2 & LOONGSON3_PERFCNT_OVERFLOW) {
155*4882a593Smuzhiyun 		if (reg.ctr2_enable)
156*4882a593Smuzhiyun 			oprofile_add_sample(regs, 1);
157*4882a593Smuzhiyun 		counter2 = reg.reset_counter2;
158*4882a593Smuzhiyun 	}
159*4882a593Smuzhiyun 
160*4882a593Smuzhiyun 	local_irq_restore(flags);
161*4882a593Smuzhiyun 
162*4882a593Smuzhiyun 	write_c0_perfhi1(counter1);
163*4882a593Smuzhiyun 	write_c0_perfhi2(counter2);
164*4882a593Smuzhiyun 
165*4882a593Smuzhiyun 	if (!(cause & CAUSEF_TI))
166*4882a593Smuzhiyun 		handled = IRQ_HANDLED;
167*4882a593Smuzhiyun 
168*4882a593Smuzhiyun 	return handled;
169*4882a593Smuzhiyun }
170*4882a593Smuzhiyun 
loongson3_starting_cpu(unsigned int cpu)171*4882a593Smuzhiyun static int loongson3_starting_cpu(unsigned int cpu)
172*4882a593Smuzhiyun {
173*4882a593Smuzhiyun 	write_c0_perflo1(reg.control1);
174*4882a593Smuzhiyun 	write_c0_perflo2(reg.control2);
175*4882a593Smuzhiyun 	return 0;
176*4882a593Smuzhiyun }
177*4882a593Smuzhiyun 
loongson3_dying_cpu(unsigned int cpu)178*4882a593Smuzhiyun static int loongson3_dying_cpu(unsigned int cpu)
179*4882a593Smuzhiyun {
180*4882a593Smuzhiyun 	write_c0_perflo1(0xc0000000);
181*4882a593Smuzhiyun 	write_c0_perflo2(0x40000000);
182*4882a593Smuzhiyun 	return 0;
183*4882a593Smuzhiyun }
184*4882a593Smuzhiyun 
loongson3_init(void)185*4882a593Smuzhiyun static int __init loongson3_init(void)
186*4882a593Smuzhiyun {
187*4882a593Smuzhiyun 	on_each_cpu(reset_counters, NULL, 1);
188*4882a593Smuzhiyun 	cpuhp_setup_state_nocalls(CPUHP_AP_MIPS_OP_LOONGSON3_STARTING,
189*4882a593Smuzhiyun 				  "mips/oprofile/loongson3:starting",
190*4882a593Smuzhiyun 				  loongson3_starting_cpu, loongson3_dying_cpu);
191*4882a593Smuzhiyun 	save_perf_irq = perf_irq;
192*4882a593Smuzhiyun 	perf_irq = loongson3_perfcount_handler;
193*4882a593Smuzhiyun 
194*4882a593Smuzhiyun 	return 0;
195*4882a593Smuzhiyun }
196*4882a593Smuzhiyun 
loongson3_exit(void)197*4882a593Smuzhiyun static void loongson3_exit(void)
198*4882a593Smuzhiyun {
199*4882a593Smuzhiyun 	on_each_cpu(reset_counters, NULL, 1);
200*4882a593Smuzhiyun 	cpuhp_remove_state_nocalls(CPUHP_AP_MIPS_OP_LOONGSON3_STARTING);
201*4882a593Smuzhiyun 	perf_irq = save_perf_irq;
202*4882a593Smuzhiyun }
203*4882a593Smuzhiyun 
204*4882a593Smuzhiyun struct op_mips_model op_model_loongson3_ops = {
205*4882a593Smuzhiyun 	.reg_setup	= loongson3_reg_setup,
206*4882a593Smuzhiyun 	.cpu_setup	= loongson3_cpu_setup,
207*4882a593Smuzhiyun 	.init		= loongson3_init,
208*4882a593Smuzhiyun 	.exit		= loongson3_exit,
209*4882a593Smuzhiyun 	.cpu_start	= loongson3_cpu_start,
210*4882a593Smuzhiyun 	.cpu_stop	= loongson3_cpu_stop,
211*4882a593Smuzhiyun 	.cpu_type	= "mips/loongson3",
212*4882a593Smuzhiyun 	.num_counters	= 2
213*4882a593Smuzhiyun };
214