1*4882a593Smuzhiyun // SPDX-License-Identifier: GPL-2.0-or-later
/*
 * perf events self profiling example test case for hw breakpoints.
 *
 * This tests perf PERF_TYPE_BREAKPOINT parameters:
 * 1) tests all variants of the break on read/write flags
 * 2) tests exclude_user == 0 and 1
 * 3) tests array matches (if DAWR is supported)
 * 4) tests different numbers of breakpoint matches
 *
 * Configure this breakpoint, then read and write the data a number of
 * times. Then check the output count from perf is as expected.
 *
 * Based on:
 *   http://ozlabs.org/~anton/junkcode/perf_events_example1.c
 *
 * Copyright (C) 2018 Michael Neuling, IBM Corporation.
 */
19*4882a593Smuzhiyun
20*4882a593Smuzhiyun #include <unistd.h>
21*4882a593Smuzhiyun #include <assert.h>
22*4882a593Smuzhiyun #include <stdio.h>
23*4882a593Smuzhiyun #include <stdlib.h>
24*4882a593Smuzhiyun #include <string.h>
25*4882a593Smuzhiyun #include <sys/ioctl.h>
26*4882a593Smuzhiyun #include <elf.h>
27*4882a593Smuzhiyun #include <pthread.h>
28*4882a593Smuzhiyun #include <sys/syscall.h>
29*4882a593Smuzhiyun #include <linux/perf_event.h>
30*4882a593Smuzhiyun #include <linux/hw_breakpoint.h>
31*4882a593Smuzhiyun #include "utils.h"
32*4882a593Smuzhiyun
33*4882a593Smuzhiyun #define MAX_LOOPS 10000
34*4882a593Smuzhiyun
35*4882a593Smuzhiyun #define DAWR_LENGTH_MAX ((0x3f + 1) * 8)
36*4882a593Smuzhiyun
/*
 * Thin wrapper around the perf_event_open system call.
 *
 * @attr:     event description; its size field is overwritten with
 *            sizeof(*attr) before the call is made
 * @pid:      passed through to the syscall unchanged
 * @cpu:      passed through to the syscall unchanged
 * @group_fd: passed through to the syscall unchanged
 * @flags:    passed through to the syscall unchanged
 *
 * Returns the syscall() result narrowed to int.
 */
static inline int sys_perf_event_open(struct perf_event_attr *attr, pid_t pid,
				      int cpu, int group_fd,
				      unsigned long flags)
{
	int event_fd;

	attr->size = sizeof(*attr);
	event_fd = syscall(__NR_perf_event_open, attr, pid, cpu, group_fd,
			   flags);

	return event_fd;
}
44*4882a593Smuzhiyun
/*
 * Probe whether a read breakpoint covering @len bytes can be opened.
 *
 * A disabled PERF_TYPE_BREAKPOINT event is opened on the calling task and
 * closed again straight away; nothing is ever counted.
 *
 * Returns true if the event could be opened, false otherwise.
 */
static inline bool breakpoint_test(int len)
{
	struct perf_event_attr probe;
	int probe_fd;

	/* describe the probe event */
	memset(&probe, 0, sizeof(probe));
	probe.type = PERF_TYPE_BREAKPOINT;
	probe.disabled = 1;
	probe.bp_type = HW_BREAKPOINT_R;
	probe.bp_len = len;
	/* bp_addr can point anywhere but needs to be aligned */
	probe.bp_addr = (__u64)(&probe) & 0xfffffffffffff800;

	probe_fd = sys_perf_event_open(&probe, 0, -1, -1, 0);
	if (probe_fd >= 0) {
		close(probe_fd);
		return true;
	}

	return false;
}
64*4882a593Smuzhiyun
/* Report whether a 4-byte perf breakpoint event can be opened at all. */
static inline bool perf_breakpoint_supported(void)
{
	const int word_len = 4;

	return breakpoint_test(word_len);
}
69*4882a593Smuzhiyun
dawr_supported(void)70*4882a593Smuzhiyun static inline bool dawr_supported(void)
71*4882a593Smuzhiyun {
72*4882a593Smuzhiyun return breakpoint_test(DAWR_LENGTH_MAX);
73*4882a593Smuzhiyun }
74*4882a593Smuzhiyun
runtestsingle(int readwriteflag,int exclude_user,int arraytest)75*4882a593Smuzhiyun static int runtestsingle(int readwriteflag, int exclude_user, int arraytest)
76*4882a593Smuzhiyun {
77*4882a593Smuzhiyun int i,j;
78*4882a593Smuzhiyun struct perf_event_attr attr;
79*4882a593Smuzhiyun size_t res;
80*4882a593Smuzhiyun unsigned long long breaks, needed;
81*4882a593Smuzhiyun int readint;
82*4882a593Smuzhiyun int readintarraybig[2*DAWR_LENGTH_MAX/sizeof(int)];
83*4882a593Smuzhiyun int *readintalign;
84*4882a593Smuzhiyun volatile int *ptr;
85*4882a593Smuzhiyun int break_fd;
86*4882a593Smuzhiyun int loop_num = MAX_LOOPS - (rand() % 100); /* provide some variability */
87*4882a593Smuzhiyun volatile int *k;
88*4882a593Smuzhiyun
89*4882a593Smuzhiyun /* align to 0x400 boundary as required by DAWR */
90*4882a593Smuzhiyun readintalign = (int *)(((unsigned long)readintarraybig + 0x7ff) &
91*4882a593Smuzhiyun 0xfffffffffffff800);
92*4882a593Smuzhiyun
93*4882a593Smuzhiyun ptr = &readint;
94*4882a593Smuzhiyun if (arraytest)
95*4882a593Smuzhiyun ptr = &readintalign[0];
96*4882a593Smuzhiyun
97*4882a593Smuzhiyun /* setup counters */
98*4882a593Smuzhiyun memset(&attr, 0, sizeof(attr));
99*4882a593Smuzhiyun attr.disabled = 1;
100*4882a593Smuzhiyun attr.type = PERF_TYPE_BREAKPOINT;
101*4882a593Smuzhiyun attr.bp_type = readwriteflag;
102*4882a593Smuzhiyun attr.bp_addr = (__u64)ptr;
103*4882a593Smuzhiyun attr.bp_len = sizeof(int);
104*4882a593Smuzhiyun if (arraytest)
105*4882a593Smuzhiyun attr.bp_len = DAWR_LENGTH_MAX;
106*4882a593Smuzhiyun attr.exclude_user = exclude_user;
107*4882a593Smuzhiyun break_fd = sys_perf_event_open(&attr, 0, -1, -1, 0);
108*4882a593Smuzhiyun if (break_fd < 0) {
109*4882a593Smuzhiyun perror("sys_perf_event_open");
110*4882a593Smuzhiyun exit(1);
111*4882a593Smuzhiyun }
112*4882a593Smuzhiyun
113*4882a593Smuzhiyun /* start counters */
114*4882a593Smuzhiyun ioctl(break_fd, PERF_EVENT_IOC_ENABLE);
115*4882a593Smuzhiyun
116*4882a593Smuzhiyun /* Test a bunch of reads and writes */
117*4882a593Smuzhiyun k = &readint;
118*4882a593Smuzhiyun for (i = 0; i < loop_num; i++) {
119*4882a593Smuzhiyun if (arraytest)
120*4882a593Smuzhiyun k = &(readintalign[i % (DAWR_LENGTH_MAX/sizeof(int))]);
121*4882a593Smuzhiyun
122*4882a593Smuzhiyun j = *k;
123*4882a593Smuzhiyun *k = j;
124*4882a593Smuzhiyun }
125*4882a593Smuzhiyun
126*4882a593Smuzhiyun /* stop counters */
127*4882a593Smuzhiyun ioctl(break_fd, PERF_EVENT_IOC_DISABLE);
128*4882a593Smuzhiyun
129*4882a593Smuzhiyun /* read and check counters */
130*4882a593Smuzhiyun res = read(break_fd, &breaks, sizeof(unsigned long long));
131*4882a593Smuzhiyun assert(res == sizeof(unsigned long long));
132*4882a593Smuzhiyun /* we read and write each loop, so subtract the ones we are counting */
133*4882a593Smuzhiyun needed = 0;
134*4882a593Smuzhiyun if (readwriteflag & HW_BREAKPOINT_R)
135*4882a593Smuzhiyun needed += loop_num;
136*4882a593Smuzhiyun if (readwriteflag & HW_BREAKPOINT_W)
137*4882a593Smuzhiyun needed += loop_num;
138*4882a593Smuzhiyun needed = needed * (1 - exclude_user);
139*4882a593Smuzhiyun printf("TESTED: addr:0x%lx brks:% 8lld loops:% 8i rw:%i !user:%i array:%i\n",
140*4882a593Smuzhiyun (unsigned long int)ptr, breaks, loop_num, readwriteflag, exclude_user, arraytest);
141*4882a593Smuzhiyun if (breaks != needed) {
142*4882a593Smuzhiyun printf("FAILED: 0x%lx brks:%lld needed:%lli %i %i %i\n\n",
143*4882a593Smuzhiyun (unsigned long int)ptr, breaks, needed, loop_num, readwriteflag, exclude_user);
144*4882a593Smuzhiyun return 1;
145*4882a593Smuzhiyun }
146*4882a593Smuzhiyun close(break_fd);
147*4882a593Smuzhiyun
148*4882a593Smuzhiyun return 0;
149*4882a593Smuzhiyun }
150*4882a593Smuzhiyun
/*
 * Perform one read followed by one write of @width bytes at @addr while the
 * breakpoint event behind @break_fd is enabled, then check the hit count.
 *
 * @break_fd: perf breakpoint event, already opened by the caller
 * @addr:     address to access; may be unaligned on purpose
 * @width:    sizeof(__u64) for a 64-bit access, anything else selects a
 *            16-bit access
 * @expected: number of hits the access pair should produce
 * @label:    test name used in the TESTED/FAILED output line
 *
 * Returns 0 if the count equals @expected, 1 otherwise.
 */
static int dar_outside_check(int break_fd, char *addr, size_t width,
			     unsigned long long expected, const char *label)
{
	volatile __u16 temp16;
	volatile __u64 temp64;
	unsigned long long breaks;
	size_t res;

	/* start from zero so only the access pair below is counted */
	ioctl(break_fd, PERF_EVENT_IOC_RESET);
	ioctl(break_fd, PERF_EVENT_IOC_ENABLE);
	if (width == sizeof(__u64)) {
		temp64 = *((__u64 *)addr);
		*((__u64 *)addr) = temp64;
	} else {
		temp16 = *((__u16 *)addr);
		*((__u16 *)addr) = temp16;
	}
	ioctl(break_fd, PERF_EVENT_IOC_DISABLE);

	res = read(break_fd, &breaks, sizeof(unsigned long long));
	assert(res == sizeof(unsigned long long));

	if (breaks == expected) {
		printf("TESTED: %s\n", label);
		return 0;
	}

	printf("FAILED: %s: %lld != %llu\n", label, breaks, expected);
	return 1;
}

/*
 * Check that accesses next to, partially inside and fully covering a watched
 * range are counted correctly.
 *
 * An 8-byte heap buffer is allocated and a 4-byte read/write breakpoint is
 * placed on its middle half (bytes 2..5).  Accesses that stay outside that
 * range must produce 0 hits; accesses that touch it must produce 2 hits
 * (one for the read, one for the write).
 *
 * Returns 0 if every case passes, 1 if any case fails.  Exits the process
 * if the allocation or the event open fails.
 */
static int runtest_dar_outside(void)
{
	static const struct {
		size_t offset;			/* byte offset into target */
		size_t width;			/* access size in bytes */
		unsigned long long expected;	/* hits for read + write */
		const char *label;
	} cases[] = {
		{ 0, sizeof(__u16), 0, "No overlap" },		/* bytes 0-1 */
		{ 1, sizeof(__u16), 2, "Partial overlap" },	/* bytes 1-2 */
		{ 5, sizeof(__u16), 2, "Partial overlap" },	/* bytes 5-6 */
		{ 6, sizeof(__u16), 0, "No overlap" },		/* bytes 6-7 */
		{ 0, sizeof(__u64), 2, "Full overlap" },	/* bytes 0-7 */
	};
	char *target;
	struct perf_event_attr attr;
	int break_fd;
	int fail = 0;
	size_t c;

	target = malloc(8);
	if (!target) {
		perror("malloc failed");
		exit(EXIT_FAILURE);
	}

	/* setup counters */
	memset(&attr, 0, sizeof(attr));
	attr.disabled = 1;
	attr.type = PERF_TYPE_BREAKPOINT;
	attr.exclude_kernel = 1;
	attr.exclude_hv = 1;
	attr.exclude_guest = 1;
	attr.bp_type = HW_BREAKPOINT_RW;
	/* watch middle half of target array */
	attr.bp_addr = (__u64)(target + 2);
	attr.bp_len = 4;
	break_fd = sys_perf_event_open(&attr, 0, -1, -1, 0);
	if (break_fd < 0) {
		/* report first: free() is allowed to overwrite errno */
		perror("sys_perf_event_open");
		free(target);
		exit(EXIT_FAILURE);
	}

	/* run every case even after a failure so all results get printed */
	for (c = 0; c < sizeof(cases) / sizeof(cases[0]); c++)
		fail |= dar_outside_check(break_fd, target + cases[c].offset,
					  cases[c].width, cases[c].expected,
					  cases[c].label);

	free(target);
	close(break_fd);
	return fail;
}
265*4882a593Smuzhiyun
/*
 * Run the whole test matrix: every read/write flag combination with
 * exclude_user both clear and set, each followed by the array variant when
 * a DAWR_LENGTH_MAX breakpoint is available, and finally the overlap tests.
 *
 * Returns 0 if everything passes, otherwise the first non-zero result.
 */
static int runtest(void)
{
	/* probe once; the answer cannot change between iterations */
	const bool have_dawr = dawr_supported();
	int rwflag;
	int exclude_user;
	int ret;

	/*
	 * perf defines rwflag as two bits read and write and at least
	 * one must be set. So range 1-3.
	 */
	for (rwflag = 1; rwflag < 4; rwflag++) {
		for (exclude_user = 0; exclude_user < 2; exclude_user++) {
			ret = runtestsingle(rwflag, exclude_user, 0);
			if (ret)
				return ret;

			/* if we have the dawr, we can do an array test */
			if (!have_dawr)
				continue;
			ret = runtestsingle(rwflag, exclude_user, 1);
			if (ret)
				return ret;
		}
	}

	return runtest_dar_outside();
}
294*4882a593Smuzhiyun
295*4882a593Smuzhiyun
/*
 * Test body handed to the harness: seed rand(), skip when perf breakpoints
 * cannot be opened, otherwise run the test matrix and return its result.
 */
static int perf_hwbreak(void)
{
	/* runtestsingle() draws its loop count from rand() */
	srand((unsigned int)time(NULL));

	SKIP_IF(!perf_breakpoint_supported());

	return runtest();
}
304*4882a593Smuzhiyun
main(int argc,char * argv[],char ** envp)305*4882a593Smuzhiyun int main(int argc, char *argv[], char **envp)
306*4882a593Smuzhiyun {
307*4882a593Smuzhiyun return test_harness(perf_hwbreak, "perf_hwbreak");
308*4882a593Smuzhiyun }
309