xref: /OK3568_Linux_fs/kernel/arch/x86/events/intel/p6.c (revision 4882a59341e53eb6f0b4789bf948001014eff981)
1*4882a593Smuzhiyun // SPDX-License-Identifier: GPL-2.0
2*4882a593Smuzhiyun #include <linux/perf_event.h>
3*4882a593Smuzhiyun #include <linux/types.h>
4*4882a593Smuzhiyun 
5*4882a593Smuzhiyun #include "../perf_event.h"
6*4882a593Smuzhiyun 
7*4882a593Smuzhiyun /*
8*4882a593Smuzhiyun  * Not sure about some of these
9*4882a593Smuzhiyun  */
10*4882a593Smuzhiyun static const u64 p6_perfmon_event_map[] =
11*4882a593Smuzhiyun {
12*4882a593Smuzhiyun   [PERF_COUNT_HW_CPU_CYCLES]		= 0x0079,	/* CPU_CLK_UNHALTED */
13*4882a593Smuzhiyun   [PERF_COUNT_HW_INSTRUCTIONS]		= 0x00c0,	/* INST_RETIRED     */
14*4882a593Smuzhiyun   [PERF_COUNT_HW_CACHE_REFERENCES]	= 0x0f2e,	/* L2_RQSTS:M:E:S:I */
15*4882a593Smuzhiyun   [PERF_COUNT_HW_CACHE_MISSES]		= 0x012e,	/* L2_RQSTS:I       */
16*4882a593Smuzhiyun   [PERF_COUNT_HW_BRANCH_INSTRUCTIONS]	= 0x00c4,	/* BR_INST_RETIRED  */
17*4882a593Smuzhiyun   [PERF_COUNT_HW_BRANCH_MISSES]		= 0x00c5,	/* BR_MISS_PRED_RETIRED */
18*4882a593Smuzhiyun   [PERF_COUNT_HW_BUS_CYCLES]		= 0x0062,	/* BUS_DRDY_CLOCKS  */
19*4882a593Smuzhiyun   [PERF_COUNT_HW_STALLED_CYCLES_FRONTEND] = 0x00a2,	/* RESOURCE_STALLS  */
20*4882a593Smuzhiyun 
21*4882a593Smuzhiyun };
22*4882a593Smuzhiyun 
23*4882a593Smuzhiyun static const u64 __initconst p6_hw_cache_event_ids
24*4882a593Smuzhiyun 				[PERF_COUNT_HW_CACHE_MAX]
25*4882a593Smuzhiyun 				[PERF_COUNT_HW_CACHE_OP_MAX]
26*4882a593Smuzhiyun 				[PERF_COUNT_HW_CACHE_RESULT_MAX] =
27*4882a593Smuzhiyun {
28*4882a593Smuzhiyun  [ C(L1D) ] = {
29*4882a593Smuzhiyun 	[ C(OP_READ) ] = {
30*4882a593Smuzhiyun 		[ C(RESULT_ACCESS) ] = 0x0043,	/* DATA_MEM_REFS       */
31*4882a593Smuzhiyun                 [ C(RESULT_MISS)   ] = 0x0045,	/* DCU_LINES_IN        */
32*4882a593Smuzhiyun 	},
33*4882a593Smuzhiyun 	[ C(OP_WRITE) ] = {
34*4882a593Smuzhiyun 		[ C(RESULT_ACCESS) ] = 0,
35*4882a593Smuzhiyun 		[ C(RESULT_MISS)   ] = 0x0f29,	/* L2_LD:M:E:S:I       */
36*4882a593Smuzhiyun 	},
37*4882a593Smuzhiyun         [ C(OP_PREFETCH) ] = {
38*4882a593Smuzhiyun 		[ C(RESULT_ACCESS) ] = 0,
39*4882a593Smuzhiyun 		[ C(RESULT_MISS)   ] = 0,
40*4882a593Smuzhiyun         },
41*4882a593Smuzhiyun  },
42*4882a593Smuzhiyun  [ C(L1I ) ] = {
43*4882a593Smuzhiyun 	[ C(OP_READ) ] = {
44*4882a593Smuzhiyun 		[ C(RESULT_ACCESS) ] = 0x0080,	/* IFU_IFETCH         */
45*4882a593Smuzhiyun 		[ C(RESULT_MISS)   ] = 0x0f28,	/* L2_IFETCH:M:E:S:I  */
46*4882a593Smuzhiyun 	},
47*4882a593Smuzhiyun 	[ C(OP_WRITE) ] = {
48*4882a593Smuzhiyun 		[ C(RESULT_ACCESS) ] = -1,
49*4882a593Smuzhiyun 		[ C(RESULT_MISS)   ] = -1,
50*4882a593Smuzhiyun 	},
51*4882a593Smuzhiyun 	[ C(OP_PREFETCH) ] = {
52*4882a593Smuzhiyun 		[ C(RESULT_ACCESS) ] = 0,
53*4882a593Smuzhiyun 		[ C(RESULT_MISS)   ] = 0,
54*4882a593Smuzhiyun 	},
55*4882a593Smuzhiyun  },
56*4882a593Smuzhiyun  [ C(LL  ) ] = {
57*4882a593Smuzhiyun 	[ C(OP_READ) ] = {
58*4882a593Smuzhiyun 		[ C(RESULT_ACCESS) ] = 0,
59*4882a593Smuzhiyun 		[ C(RESULT_MISS)   ] = 0,
60*4882a593Smuzhiyun 	},
61*4882a593Smuzhiyun 	[ C(OP_WRITE) ] = {
62*4882a593Smuzhiyun 		[ C(RESULT_ACCESS) ] = 0,
63*4882a593Smuzhiyun 		[ C(RESULT_MISS)   ] = 0x0025,	/* L2_M_LINES_INM     */
64*4882a593Smuzhiyun 	},
65*4882a593Smuzhiyun 	[ C(OP_PREFETCH) ] = {
66*4882a593Smuzhiyun 		[ C(RESULT_ACCESS) ] = 0,
67*4882a593Smuzhiyun 		[ C(RESULT_MISS)   ] = 0,
68*4882a593Smuzhiyun 	},
69*4882a593Smuzhiyun  },
70*4882a593Smuzhiyun  [ C(DTLB) ] = {
71*4882a593Smuzhiyun 	[ C(OP_READ) ] = {
72*4882a593Smuzhiyun 		[ C(RESULT_ACCESS) ] = 0x0043,	/* DATA_MEM_REFS      */
73*4882a593Smuzhiyun 		[ C(RESULT_MISS)   ] = 0,
74*4882a593Smuzhiyun 	},
75*4882a593Smuzhiyun 	[ C(OP_WRITE) ] = {
76*4882a593Smuzhiyun 		[ C(RESULT_ACCESS) ] = 0,
77*4882a593Smuzhiyun 		[ C(RESULT_MISS)   ] = 0,
78*4882a593Smuzhiyun 	},
79*4882a593Smuzhiyun 	[ C(OP_PREFETCH) ] = {
80*4882a593Smuzhiyun 		[ C(RESULT_ACCESS) ] = 0,
81*4882a593Smuzhiyun 		[ C(RESULT_MISS)   ] = 0,
82*4882a593Smuzhiyun 	},
83*4882a593Smuzhiyun  },
84*4882a593Smuzhiyun  [ C(ITLB) ] = {
85*4882a593Smuzhiyun 	[ C(OP_READ) ] = {
86*4882a593Smuzhiyun 		[ C(RESULT_ACCESS) ] = 0x0080,	/* IFU_IFETCH         */
87*4882a593Smuzhiyun 		[ C(RESULT_MISS)   ] = 0x0085,	/* ITLB_MISS          */
88*4882a593Smuzhiyun 	},
89*4882a593Smuzhiyun 	[ C(OP_WRITE) ] = {
90*4882a593Smuzhiyun 		[ C(RESULT_ACCESS) ] = -1,
91*4882a593Smuzhiyun 		[ C(RESULT_MISS)   ] = -1,
92*4882a593Smuzhiyun 	},
93*4882a593Smuzhiyun 	[ C(OP_PREFETCH) ] = {
94*4882a593Smuzhiyun 		[ C(RESULT_ACCESS) ] = -1,
95*4882a593Smuzhiyun 		[ C(RESULT_MISS)   ] = -1,
96*4882a593Smuzhiyun 	},
97*4882a593Smuzhiyun  },
98*4882a593Smuzhiyun  [ C(BPU ) ] = {
99*4882a593Smuzhiyun 	[ C(OP_READ) ] = {
100*4882a593Smuzhiyun 		[ C(RESULT_ACCESS) ] = 0x00c4,	/* BR_INST_RETIRED      */
101*4882a593Smuzhiyun 		[ C(RESULT_MISS)   ] = 0x00c5,	/* BR_MISS_PRED_RETIRED */
102*4882a593Smuzhiyun         },
103*4882a593Smuzhiyun 	[ C(OP_WRITE) ] = {
104*4882a593Smuzhiyun 		[ C(RESULT_ACCESS) ] = -1,
105*4882a593Smuzhiyun 		[ C(RESULT_MISS)   ] = -1,
106*4882a593Smuzhiyun 	},
107*4882a593Smuzhiyun 	[ C(OP_PREFETCH) ] = {
108*4882a593Smuzhiyun 		[ C(RESULT_ACCESS) ] = -1,
109*4882a593Smuzhiyun 		[ C(RESULT_MISS)   ] = -1,
110*4882a593Smuzhiyun 	},
111*4882a593Smuzhiyun  },
112*4882a593Smuzhiyun };
113*4882a593Smuzhiyun 
p6_pmu_event_map(int hw_event)114*4882a593Smuzhiyun static u64 p6_pmu_event_map(int hw_event)
115*4882a593Smuzhiyun {
116*4882a593Smuzhiyun 	return p6_perfmon_event_map[hw_event];
117*4882a593Smuzhiyun }
118*4882a593Smuzhiyun 
119*4882a593Smuzhiyun /*
120*4882a593Smuzhiyun  * Event setting that is specified not to count anything.
121*4882a593Smuzhiyun  * We use this to effectively disable a counter.
122*4882a593Smuzhiyun  *
123*4882a593Smuzhiyun  * L2_RQSTS with 0 MESI unit mask.
124*4882a593Smuzhiyun  */
125*4882a593Smuzhiyun #define P6_NOP_EVENT			0x0000002EULL
126*4882a593Smuzhiyun 
127*4882a593Smuzhiyun static struct event_constraint p6_event_constraints[] =
128*4882a593Smuzhiyun {
129*4882a593Smuzhiyun 	INTEL_EVENT_CONSTRAINT(0xc1, 0x1),	/* FLOPS */
130*4882a593Smuzhiyun 	INTEL_EVENT_CONSTRAINT(0x10, 0x1),	/* FP_COMP_OPS_EXE */
131*4882a593Smuzhiyun 	INTEL_EVENT_CONSTRAINT(0x11, 0x2),	/* FP_ASSIST */
132*4882a593Smuzhiyun 	INTEL_EVENT_CONSTRAINT(0x12, 0x2),	/* MUL */
133*4882a593Smuzhiyun 	INTEL_EVENT_CONSTRAINT(0x13, 0x2),	/* DIV */
134*4882a593Smuzhiyun 	INTEL_EVENT_CONSTRAINT(0x14, 0x1),	/* CYCLES_DIV_BUSY */
135*4882a593Smuzhiyun 	EVENT_CONSTRAINT_END
136*4882a593Smuzhiyun };
137*4882a593Smuzhiyun 
p6_pmu_disable_all(void)138*4882a593Smuzhiyun static void p6_pmu_disable_all(void)
139*4882a593Smuzhiyun {
140*4882a593Smuzhiyun 	u64 val;
141*4882a593Smuzhiyun 
142*4882a593Smuzhiyun 	/* p6 only has one enable register */
143*4882a593Smuzhiyun 	rdmsrl(MSR_P6_EVNTSEL0, val);
144*4882a593Smuzhiyun 	val &= ~ARCH_PERFMON_EVENTSEL_ENABLE;
145*4882a593Smuzhiyun 	wrmsrl(MSR_P6_EVNTSEL0, val);
146*4882a593Smuzhiyun }
147*4882a593Smuzhiyun 
p6_pmu_enable_all(int added)148*4882a593Smuzhiyun static void p6_pmu_enable_all(int added)
149*4882a593Smuzhiyun {
150*4882a593Smuzhiyun 	unsigned long val;
151*4882a593Smuzhiyun 
152*4882a593Smuzhiyun 	/* p6 only has one enable register */
153*4882a593Smuzhiyun 	rdmsrl(MSR_P6_EVNTSEL0, val);
154*4882a593Smuzhiyun 	val |= ARCH_PERFMON_EVENTSEL_ENABLE;
155*4882a593Smuzhiyun 	wrmsrl(MSR_P6_EVNTSEL0, val);
156*4882a593Smuzhiyun }
157*4882a593Smuzhiyun 
158*4882a593Smuzhiyun static inline void
p6_pmu_disable_event(struct perf_event * event)159*4882a593Smuzhiyun p6_pmu_disable_event(struct perf_event *event)
160*4882a593Smuzhiyun {
161*4882a593Smuzhiyun 	struct hw_perf_event *hwc = &event->hw;
162*4882a593Smuzhiyun 	u64 val = P6_NOP_EVENT;
163*4882a593Smuzhiyun 
164*4882a593Smuzhiyun 	(void)wrmsrl_safe(hwc->config_base, val);
165*4882a593Smuzhiyun }
166*4882a593Smuzhiyun 
p6_pmu_enable_event(struct perf_event * event)167*4882a593Smuzhiyun static void p6_pmu_enable_event(struct perf_event *event)
168*4882a593Smuzhiyun {
169*4882a593Smuzhiyun 	struct hw_perf_event *hwc = &event->hw;
170*4882a593Smuzhiyun 	u64 val;
171*4882a593Smuzhiyun 
172*4882a593Smuzhiyun 	val = hwc->config;
173*4882a593Smuzhiyun 
174*4882a593Smuzhiyun 	/*
175*4882a593Smuzhiyun 	 * p6 only has a global event enable, set on PerfEvtSel0
176*4882a593Smuzhiyun 	 * We "disable" events by programming P6_NOP_EVENT
177*4882a593Smuzhiyun 	 * and we rely on p6_pmu_enable_all() being called
178*4882a593Smuzhiyun 	 * to actually enable the events.
179*4882a593Smuzhiyun 	 */
180*4882a593Smuzhiyun 
181*4882a593Smuzhiyun 	(void)wrmsrl_safe(hwc->config_base, val);
182*4882a593Smuzhiyun }
183*4882a593Smuzhiyun 
184*4882a593Smuzhiyun PMU_FORMAT_ATTR(event,	"config:0-7"	);
185*4882a593Smuzhiyun PMU_FORMAT_ATTR(umask,	"config:8-15"	);
186*4882a593Smuzhiyun PMU_FORMAT_ATTR(edge,	"config:18"	);
187*4882a593Smuzhiyun PMU_FORMAT_ATTR(pc,	"config:19"	);
188*4882a593Smuzhiyun PMU_FORMAT_ATTR(inv,	"config:23"	);
189*4882a593Smuzhiyun PMU_FORMAT_ATTR(cmask,	"config:24-31"	);
190*4882a593Smuzhiyun 
191*4882a593Smuzhiyun static struct attribute *intel_p6_formats_attr[] = {
192*4882a593Smuzhiyun 	&format_attr_event.attr,
193*4882a593Smuzhiyun 	&format_attr_umask.attr,
194*4882a593Smuzhiyun 	&format_attr_edge.attr,
195*4882a593Smuzhiyun 	&format_attr_pc.attr,
196*4882a593Smuzhiyun 	&format_attr_inv.attr,
197*4882a593Smuzhiyun 	&format_attr_cmask.attr,
198*4882a593Smuzhiyun 	NULL,
199*4882a593Smuzhiyun };
200*4882a593Smuzhiyun 
201*4882a593Smuzhiyun static __initconst const struct x86_pmu p6_pmu = {
202*4882a593Smuzhiyun 	.name			= "p6",
203*4882a593Smuzhiyun 	.handle_irq		= x86_pmu_handle_irq,
204*4882a593Smuzhiyun 	.disable_all		= p6_pmu_disable_all,
205*4882a593Smuzhiyun 	.enable_all		= p6_pmu_enable_all,
206*4882a593Smuzhiyun 	.enable			= p6_pmu_enable_event,
207*4882a593Smuzhiyun 	.disable		= p6_pmu_disable_event,
208*4882a593Smuzhiyun 	.hw_config		= x86_pmu_hw_config,
209*4882a593Smuzhiyun 	.schedule_events	= x86_schedule_events,
210*4882a593Smuzhiyun 	.eventsel		= MSR_P6_EVNTSEL0,
211*4882a593Smuzhiyun 	.perfctr		= MSR_P6_PERFCTR0,
212*4882a593Smuzhiyun 	.event_map		= p6_pmu_event_map,
213*4882a593Smuzhiyun 	.max_events		= ARRAY_SIZE(p6_perfmon_event_map),
214*4882a593Smuzhiyun 	.apic			= 1,
215*4882a593Smuzhiyun 	.max_period		= (1ULL << 31) - 1,
216*4882a593Smuzhiyun 	.version		= 0,
217*4882a593Smuzhiyun 	.num_counters		= 2,
218*4882a593Smuzhiyun 	/*
219*4882a593Smuzhiyun 	 * Events have 40 bits implemented. However they are designed such
220*4882a593Smuzhiyun 	 * that bits [32-39] are sign extensions of bit 31. As such the
221*4882a593Smuzhiyun 	 * effective width of a event for P6-like PMU is 32 bits only.
222*4882a593Smuzhiyun 	 *
223*4882a593Smuzhiyun 	 * See IA-32 Intel Architecture Software developer manual Vol 3B
224*4882a593Smuzhiyun 	 */
225*4882a593Smuzhiyun 	.cntval_bits		= 32,
226*4882a593Smuzhiyun 	.cntval_mask		= (1ULL << 32) - 1,
227*4882a593Smuzhiyun 	.get_event_constraints	= x86_get_event_constraints,
228*4882a593Smuzhiyun 	.event_constraints	= p6_event_constraints,
229*4882a593Smuzhiyun 
230*4882a593Smuzhiyun 	.format_attrs		= intel_p6_formats_attr,
231*4882a593Smuzhiyun 	.events_sysfs_show	= intel_event_sysfs_show,
232*4882a593Smuzhiyun 
233*4882a593Smuzhiyun };
234*4882a593Smuzhiyun 
p6_pmu_rdpmc_quirk(void)235*4882a593Smuzhiyun static __init void p6_pmu_rdpmc_quirk(void)
236*4882a593Smuzhiyun {
237*4882a593Smuzhiyun 	if (boot_cpu_data.x86_stepping < 9) {
238*4882a593Smuzhiyun 		/*
239*4882a593Smuzhiyun 		 * PPro erratum 26; fixed in stepping 9 and above.
240*4882a593Smuzhiyun 		 */
241*4882a593Smuzhiyun 		pr_warn("Userspace RDPMC support disabled due to a CPU erratum\n");
242*4882a593Smuzhiyun 		x86_pmu.attr_rdpmc_broken = 1;
243*4882a593Smuzhiyun 		x86_pmu.attr_rdpmc = 0;
244*4882a593Smuzhiyun 	}
245*4882a593Smuzhiyun }
246*4882a593Smuzhiyun 
p6_pmu_init(void)247*4882a593Smuzhiyun __init int p6_pmu_init(void)
248*4882a593Smuzhiyun {
249*4882a593Smuzhiyun 	x86_pmu = p6_pmu;
250*4882a593Smuzhiyun 
251*4882a593Smuzhiyun 	switch (boot_cpu_data.x86_model) {
252*4882a593Smuzhiyun 	case  1: /* Pentium Pro */
253*4882a593Smuzhiyun 		x86_add_quirk(p6_pmu_rdpmc_quirk);
254*4882a593Smuzhiyun 		break;
255*4882a593Smuzhiyun 
256*4882a593Smuzhiyun 	case  3: /* Pentium II - Klamath */
257*4882a593Smuzhiyun 	case  5: /* Pentium II - Deschutes */
258*4882a593Smuzhiyun 	case  6: /* Pentium II - Mendocino */
259*4882a593Smuzhiyun 		break;
260*4882a593Smuzhiyun 
261*4882a593Smuzhiyun 	case  7: /* Pentium III - Katmai */
262*4882a593Smuzhiyun 	case  8: /* Pentium III - Coppermine */
263*4882a593Smuzhiyun 	case 10: /* Pentium III Xeon */
264*4882a593Smuzhiyun 	case 11: /* Pentium III - Tualatin */
265*4882a593Smuzhiyun 		break;
266*4882a593Smuzhiyun 
267*4882a593Smuzhiyun 	case  9: /* Pentium M - Banias */
268*4882a593Smuzhiyun 	case 13: /* Pentium M - Dothan */
269*4882a593Smuzhiyun 		break;
270*4882a593Smuzhiyun 
271*4882a593Smuzhiyun 	default:
272*4882a593Smuzhiyun 		pr_cont("unsupported p6 CPU model %d ", boot_cpu_data.x86_model);
273*4882a593Smuzhiyun 		return -ENODEV;
274*4882a593Smuzhiyun 	}
275*4882a593Smuzhiyun 
276*4882a593Smuzhiyun 	memcpy(hw_cache_event_ids, p6_hw_cache_event_ids,
277*4882a593Smuzhiyun 		sizeof(hw_cache_event_ids));
278*4882a593Smuzhiyun 
279*4882a593Smuzhiyun 	return 0;
280*4882a593Smuzhiyun }
281