xref: /OK3568_Linux_fs/kernel/tools/perf/arch/powerpc/util/perf_regs.c (revision 4882a59341e53eb6f0b4789bf948001014eff981)
1*4882a593Smuzhiyun // SPDX-License-Identifier: GPL-2.0
2*4882a593Smuzhiyun #include <errno.h>
3*4882a593Smuzhiyun #include <string.h>
4*4882a593Smuzhiyun #include <regex.h>
5*4882a593Smuzhiyun #include <linux/zalloc.h>
6*4882a593Smuzhiyun 
7*4882a593Smuzhiyun #include "../../../util/perf_regs.h"
8*4882a593Smuzhiyun #include "../../../util/debug.h"
9*4882a593Smuzhiyun #include "../../../util/event.h"
10*4882a593Smuzhiyun #include "../../../util/header.h"
11*4882a593Smuzhiyun #include "../../../perf-sys.h"
12*4882a593Smuzhiyun #include "utils_header.h"
13*4882a593Smuzhiyun 
14*4882a593Smuzhiyun #include <linux/kernel.h>
15*4882a593Smuzhiyun 
/*
 * Processor version numbers.  arch__intr_reg_mask() compares these against
 * bits 16-31 of the value read from SPRN_PVR.
 */
#define PVR_POWER9		0x004E
#define PVR_POWER10		0x0080
18*4882a593Smuzhiyun 
19*4882a593Smuzhiyun const struct sample_reg sample_reg_masks[] = {
20*4882a593Smuzhiyun 	SMPL_REG(r0, PERF_REG_POWERPC_R0),
21*4882a593Smuzhiyun 	SMPL_REG(r1, PERF_REG_POWERPC_R1),
22*4882a593Smuzhiyun 	SMPL_REG(r2, PERF_REG_POWERPC_R2),
23*4882a593Smuzhiyun 	SMPL_REG(r3, PERF_REG_POWERPC_R3),
24*4882a593Smuzhiyun 	SMPL_REG(r4, PERF_REG_POWERPC_R4),
25*4882a593Smuzhiyun 	SMPL_REG(r5, PERF_REG_POWERPC_R5),
26*4882a593Smuzhiyun 	SMPL_REG(r6, PERF_REG_POWERPC_R6),
27*4882a593Smuzhiyun 	SMPL_REG(r7, PERF_REG_POWERPC_R7),
28*4882a593Smuzhiyun 	SMPL_REG(r8, PERF_REG_POWERPC_R8),
29*4882a593Smuzhiyun 	SMPL_REG(r9, PERF_REG_POWERPC_R9),
30*4882a593Smuzhiyun 	SMPL_REG(r10, PERF_REG_POWERPC_R10),
31*4882a593Smuzhiyun 	SMPL_REG(r11, PERF_REG_POWERPC_R11),
32*4882a593Smuzhiyun 	SMPL_REG(r12, PERF_REG_POWERPC_R12),
33*4882a593Smuzhiyun 	SMPL_REG(r13, PERF_REG_POWERPC_R13),
34*4882a593Smuzhiyun 	SMPL_REG(r14, PERF_REG_POWERPC_R14),
35*4882a593Smuzhiyun 	SMPL_REG(r15, PERF_REG_POWERPC_R15),
36*4882a593Smuzhiyun 	SMPL_REG(r16, PERF_REG_POWERPC_R16),
37*4882a593Smuzhiyun 	SMPL_REG(r17, PERF_REG_POWERPC_R17),
38*4882a593Smuzhiyun 	SMPL_REG(r18, PERF_REG_POWERPC_R18),
39*4882a593Smuzhiyun 	SMPL_REG(r19, PERF_REG_POWERPC_R19),
40*4882a593Smuzhiyun 	SMPL_REG(r20, PERF_REG_POWERPC_R20),
41*4882a593Smuzhiyun 	SMPL_REG(r21, PERF_REG_POWERPC_R21),
42*4882a593Smuzhiyun 	SMPL_REG(r22, PERF_REG_POWERPC_R22),
43*4882a593Smuzhiyun 	SMPL_REG(r23, PERF_REG_POWERPC_R23),
44*4882a593Smuzhiyun 	SMPL_REG(r24, PERF_REG_POWERPC_R24),
45*4882a593Smuzhiyun 	SMPL_REG(r25, PERF_REG_POWERPC_R25),
46*4882a593Smuzhiyun 	SMPL_REG(r26, PERF_REG_POWERPC_R26),
47*4882a593Smuzhiyun 	SMPL_REG(r27, PERF_REG_POWERPC_R27),
48*4882a593Smuzhiyun 	SMPL_REG(r28, PERF_REG_POWERPC_R28),
49*4882a593Smuzhiyun 	SMPL_REG(r29, PERF_REG_POWERPC_R29),
50*4882a593Smuzhiyun 	SMPL_REG(r30, PERF_REG_POWERPC_R30),
51*4882a593Smuzhiyun 	SMPL_REG(r31, PERF_REG_POWERPC_R31),
52*4882a593Smuzhiyun 	SMPL_REG(nip, PERF_REG_POWERPC_NIP),
53*4882a593Smuzhiyun 	SMPL_REG(msr, PERF_REG_POWERPC_MSR),
54*4882a593Smuzhiyun 	SMPL_REG(orig_r3, PERF_REG_POWERPC_ORIG_R3),
55*4882a593Smuzhiyun 	SMPL_REG(ctr, PERF_REG_POWERPC_CTR),
56*4882a593Smuzhiyun 	SMPL_REG(link, PERF_REG_POWERPC_LINK),
57*4882a593Smuzhiyun 	SMPL_REG(xer, PERF_REG_POWERPC_XER),
58*4882a593Smuzhiyun 	SMPL_REG(ccr, PERF_REG_POWERPC_CCR),
59*4882a593Smuzhiyun 	SMPL_REG(softe, PERF_REG_POWERPC_SOFTE),
60*4882a593Smuzhiyun 	SMPL_REG(trap, PERF_REG_POWERPC_TRAP),
61*4882a593Smuzhiyun 	SMPL_REG(dar, PERF_REG_POWERPC_DAR),
62*4882a593Smuzhiyun 	SMPL_REG(dsisr, PERF_REG_POWERPC_DSISR),
63*4882a593Smuzhiyun 	SMPL_REG(sier, PERF_REG_POWERPC_SIER),
64*4882a593Smuzhiyun 	SMPL_REG(mmcra, PERF_REG_POWERPC_MMCRA),
65*4882a593Smuzhiyun 	SMPL_REG(mmcr0, PERF_REG_POWERPC_MMCR0),
66*4882a593Smuzhiyun 	SMPL_REG(mmcr1, PERF_REG_POWERPC_MMCR1),
67*4882a593Smuzhiyun 	SMPL_REG(mmcr2, PERF_REG_POWERPC_MMCR2),
68*4882a593Smuzhiyun 	SMPL_REG(mmcr3, PERF_REG_POWERPC_MMCR3),
69*4882a593Smuzhiyun 	SMPL_REG(sier2, PERF_REG_POWERPC_SIER2),
70*4882a593Smuzhiyun 	SMPL_REG(sier3, PERF_REG_POWERPC_SIER3),
71*4882a593Smuzhiyun 	SMPL_REG_END
72*4882a593Smuzhiyun };
73*4882a593Smuzhiyun 
/*
 * Bare register operand: REG or %rREG, with REG in the range 0-31.
 * Capture group 2 holds the register number.
 */
#define SDT_OP_REGEX1  "^(%r)?([1-2]?[0-9]|3[0-1])$"

/*
 * Displacement + register operand:
 *	-NUM(REG), NUM(REG), -NUM(%rREG) or NUM(%rREG)
 * Group 1 is the optional minus sign, group 2 is NUM and group 4 is the
 * register number.
 */
#define SDT_OP_REGEX2  "^(\\-)?([0-9]+)\\((%r)?([1-2]?[0-9]|3[0-1])\\)$"

/* Compiled forms of the two patterns above, filled in by sdt_init_op_regex(). */
static regex_t sdt_op_regex1;
static regex_t sdt_op_regex2;
81*4882a593Smuzhiyun 
sdt_init_op_regex(void)82*4882a593Smuzhiyun static int sdt_init_op_regex(void)
83*4882a593Smuzhiyun {
84*4882a593Smuzhiyun 	static int initialized;
85*4882a593Smuzhiyun 	int ret = 0;
86*4882a593Smuzhiyun 
87*4882a593Smuzhiyun 	if (initialized)
88*4882a593Smuzhiyun 		return 0;
89*4882a593Smuzhiyun 
90*4882a593Smuzhiyun 	ret = regcomp(&sdt_op_regex1, SDT_OP_REGEX1, REG_EXTENDED);
91*4882a593Smuzhiyun 	if (ret)
92*4882a593Smuzhiyun 		goto error;
93*4882a593Smuzhiyun 
94*4882a593Smuzhiyun 	ret = regcomp(&sdt_op_regex2, SDT_OP_REGEX2, REG_EXTENDED);
95*4882a593Smuzhiyun 	if (ret)
96*4882a593Smuzhiyun 		goto free_regex1;
97*4882a593Smuzhiyun 
98*4882a593Smuzhiyun 	initialized = 1;
99*4882a593Smuzhiyun 	return 0;
100*4882a593Smuzhiyun 
101*4882a593Smuzhiyun free_regex1:
102*4882a593Smuzhiyun 	regfree(&sdt_op_regex1);
103*4882a593Smuzhiyun error:
104*4882a593Smuzhiyun 	pr_debug4("Regex compilation error.\n");
105*4882a593Smuzhiyun 	return ret;
106*4882a593Smuzhiyun }
107*4882a593Smuzhiyun 
108*4882a593Smuzhiyun /*
109*4882a593Smuzhiyun  * Parse OP and convert it into uprobe format, which is, +/-NUM(%gprREG).
110*4882a593Smuzhiyun  * Possible variants of OP are:
111*4882a593Smuzhiyun  *	Format		Example
112*4882a593Smuzhiyun  *	-------------------------
113*4882a593Smuzhiyun  *	NUM(REG)	48(18)
114*4882a593Smuzhiyun  *	-NUM(REG)	-48(18)
115*4882a593Smuzhiyun  *	NUM(%rREG)	48(%r18)
116*4882a593Smuzhiyun  *	-NUM(%rREG)	-48(%r18)
117*4882a593Smuzhiyun  *	REG		18
118*4882a593Smuzhiyun  *	%rREG		%r18
119*4882a593Smuzhiyun  *	iNUM		i0
120*4882a593Smuzhiyun  *	i-NUM		i-1
121*4882a593Smuzhiyun  *
122*4882a593Smuzhiyun  * SDT marker arguments on Powerpc uses %rREG form with -mregnames flag
123*4882a593Smuzhiyun  * and REG form with -mno-regnames. Here REG is general purpose register,
124*4882a593Smuzhiyun  * which is in 0 to 31 range.
125*4882a593Smuzhiyun  */
arch_sdt_arg_parse_op(char * old_op,char ** new_op)126*4882a593Smuzhiyun int arch_sdt_arg_parse_op(char *old_op, char **new_op)
127*4882a593Smuzhiyun {
128*4882a593Smuzhiyun 	int ret, new_len;
129*4882a593Smuzhiyun 	regmatch_t rm[5];
130*4882a593Smuzhiyun 	char prefix;
131*4882a593Smuzhiyun 
132*4882a593Smuzhiyun 	/* Constant argument. Uprobe does not support it */
133*4882a593Smuzhiyun 	if (old_op[0] == 'i') {
134*4882a593Smuzhiyun 		pr_debug4("Skipping unsupported SDT argument: %s\n", old_op);
135*4882a593Smuzhiyun 		return SDT_ARG_SKIP;
136*4882a593Smuzhiyun 	}
137*4882a593Smuzhiyun 
138*4882a593Smuzhiyun 	ret = sdt_init_op_regex();
139*4882a593Smuzhiyun 	if (ret < 0)
140*4882a593Smuzhiyun 		return ret;
141*4882a593Smuzhiyun 
142*4882a593Smuzhiyun 	if (!regexec(&sdt_op_regex1, old_op, 3, rm, 0)) {
143*4882a593Smuzhiyun 		/* REG or %rREG --> %gprREG */
144*4882a593Smuzhiyun 
145*4882a593Smuzhiyun 		new_len = 5;	/* % g p r NULL */
146*4882a593Smuzhiyun 		new_len += (int)(rm[2].rm_eo - rm[2].rm_so);
147*4882a593Smuzhiyun 
148*4882a593Smuzhiyun 		*new_op = zalloc(new_len);
149*4882a593Smuzhiyun 		if (!*new_op)
150*4882a593Smuzhiyun 			return -ENOMEM;
151*4882a593Smuzhiyun 
152*4882a593Smuzhiyun 		scnprintf(*new_op, new_len, "%%gpr%.*s",
153*4882a593Smuzhiyun 			(int)(rm[2].rm_eo - rm[2].rm_so), old_op + rm[2].rm_so);
154*4882a593Smuzhiyun 	} else if (!regexec(&sdt_op_regex2, old_op, 5, rm, 0)) {
155*4882a593Smuzhiyun 		/*
156*4882a593Smuzhiyun 		 * -NUM(REG) or NUM(REG) or -NUM(%rREG) or NUM(%rREG) -->
157*4882a593Smuzhiyun 		 *	+/-NUM(%gprREG)
158*4882a593Smuzhiyun 		 */
159*4882a593Smuzhiyun 		prefix = (rm[1].rm_so == -1) ? '+' : '-';
160*4882a593Smuzhiyun 
161*4882a593Smuzhiyun 		new_len = 8;	/* +/- ( % g p r ) NULL */
162*4882a593Smuzhiyun 		new_len += (int)(rm[2].rm_eo - rm[2].rm_so);
163*4882a593Smuzhiyun 		new_len += (int)(rm[4].rm_eo - rm[4].rm_so);
164*4882a593Smuzhiyun 
165*4882a593Smuzhiyun 		*new_op = zalloc(new_len);
166*4882a593Smuzhiyun 		if (!*new_op)
167*4882a593Smuzhiyun 			return -ENOMEM;
168*4882a593Smuzhiyun 
169*4882a593Smuzhiyun 		scnprintf(*new_op, new_len, "%c%.*s(%%gpr%.*s)", prefix,
170*4882a593Smuzhiyun 			(int)(rm[2].rm_eo - rm[2].rm_so), old_op + rm[2].rm_so,
171*4882a593Smuzhiyun 			(int)(rm[4].rm_eo - rm[4].rm_so), old_op + rm[4].rm_so);
172*4882a593Smuzhiyun 	} else {
173*4882a593Smuzhiyun 		pr_debug4("Skipping unsupported SDT argument: %s\n", old_op);
174*4882a593Smuzhiyun 		return SDT_ARG_SKIP;
175*4882a593Smuzhiyun 	}
176*4882a593Smuzhiyun 
177*4882a593Smuzhiyun 	return SDT_ARG_VALID;
178*4882a593Smuzhiyun }
179*4882a593Smuzhiyun 
arch__intr_reg_mask(void)180*4882a593Smuzhiyun uint64_t arch__intr_reg_mask(void)
181*4882a593Smuzhiyun {
182*4882a593Smuzhiyun 	struct perf_event_attr attr = {
183*4882a593Smuzhiyun 		.type                   = PERF_TYPE_HARDWARE,
184*4882a593Smuzhiyun 		.config                 = PERF_COUNT_HW_CPU_CYCLES,
185*4882a593Smuzhiyun 		.sample_type            = PERF_SAMPLE_REGS_INTR,
186*4882a593Smuzhiyun 		.precise_ip             = 1,
187*4882a593Smuzhiyun 		.disabled               = 1,
188*4882a593Smuzhiyun 		.exclude_kernel         = 1,
189*4882a593Smuzhiyun 	};
190*4882a593Smuzhiyun 	int fd;
191*4882a593Smuzhiyun 	u32 version;
192*4882a593Smuzhiyun 	u64 extended_mask = 0, mask = PERF_REGS_MASK;
193*4882a593Smuzhiyun 
194*4882a593Smuzhiyun 	/*
195*4882a593Smuzhiyun 	 * Get the PVR value to set the extended
196*4882a593Smuzhiyun 	 * mask specific to platform.
197*4882a593Smuzhiyun 	 */
198*4882a593Smuzhiyun 	version = (((mfspr(SPRN_PVR)) >>  16) & 0xFFFF);
199*4882a593Smuzhiyun 	if (version == PVR_POWER9)
200*4882a593Smuzhiyun 		extended_mask = PERF_REG_PMU_MASK_300;
201*4882a593Smuzhiyun 	else if (version == PVR_POWER10)
202*4882a593Smuzhiyun 		extended_mask = PERF_REG_PMU_MASK_31;
203*4882a593Smuzhiyun 	else
204*4882a593Smuzhiyun 		return mask;
205*4882a593Smuzhiyun 
206*4882a593Smuzhiyun 	attr.sample_regs_intr = extended_mask;
207*4882a593Smuzhiyun 	attr.sample_period = 1;
208*4882a593Smuzhiyun 	event_attr_init(&attr);
209*4882a593Smuzhiyun 
210*4882a593Smuzhiyun 	/*
211*4882a593Smuzhiyun 	 * check if the pmu supports perf extended regs, before
212*4882a593Smuzhiyun 	 * returning the register mask to sample.
213*4882a593Smuzhiyun 	 */
214*4882a593Smuzhiyun 	fd = sys_perf_event_open(&attr, 0, -1, -1, 0);
215*4882a593Smuzhiyun 	if (fd != -1) {
216*4882a593Smuzhiyun 		close(fd);
217*4882a593Smuzhiyun 		mask |= extended_mask;
218*4882a593Smuzhiyun 	}
219*4882a593Smuzhiyun 	return mask;
220*4882a593Smuzhiyun }
221