1*4882a593Smuzhiyun // SPDX-License-Identifier: GPL-2.0-only
2*4882a593Smuzhiyun /* Copyright (c) 2016 Facebook
3*4882a593Smuzhiyun */
4*4882a593Smuzhiyun #include <stdio.h>
5*4882a593Smuzhiyun #include <unistd.h>
6*4882a593Smuzhiyun #include <stdlib.h>
7*4882a593Smuzhiyun #include <stdbool.h>
8*4882a593Smuzhiyun #include <string.h>
9*4882a593Smuzhiyun #include <linux/perf_event.h>
10*4882a593Smuzhiyun #include <linux/bpf.h>
11*4882a593Smuzhiyun #include <signal.h>
12*4882a593Smuzhiyun #include <errno.h>
13*4882a593Smuzhiyun #include <sys/resource.h>
14*4882a593Smuzhiyun #include <bpf/bpf.h>
15*4882a593Smuzhiyun #include <bpf/libbpf.h>
16*4882a593Smuzhiyun #include "perf-sys.h"
17*4882a593Smuzhiyun #include "trace_helpers.h"
18*4882a593Smuzhiyun
19*4882a593Smuzhiyun #define SAMPLE_FREQ 50
20*4882a593Smuzhiyun
21*4882a593Smuzhiyun static int pid;
22*4882a593Smuzhiyun /* counts, stackmap */
23*4882a593Smuzhiyun static int map_fd[2];
24*4882a593Smuzhiyun struct bpf_program *prog;
25*4882a593Smuzhiyun static bool sys_read_seen, sys_write_seen;
26*4882a593Smuzhiyun
print_ksym(__u64 addr)27*4882a593Smuzhiyun static void print_ksym(__u64 addr)
28*4882a593Smuzhiyun {
29*4882a593Smuzhiyun struct ksym *sym;
30*4882a593Smuzhiyun
31*4882a593Smuzhiyun if (!addr)
32*4882a593Smuzhiyun return;
33*4882a593Smuzhiyun sym = ksym_search(addr);
34*4882a593Smuzhiyun if (!sym) {
35*4882a593Smuzhiyun printf("ksym not found. Is kallsyms loaded?\n");
36*4882a593Smuzhiyun return;
37*4882a593Smuzhiyun }
38*4882a593Smuzhiyun
39*4882a593Smuzhiyun printf("%s;", sym->name);
40*4882a593Smuzhiyun if (!strstr(sym->name, "sys_read"))
41*4882a593Smuzhiyun sys_read_seen = true;
42*4882a593Smuzhiyun else if (!strstr(sym->name, "sys_write"))
43*4882a593Smuzhiyun sys_write_seen = true;
44*4882a593Smuzhiyun }
45*4882a593Smuzhiyun
print_addr(__u64 addr)46*4882a593Smuzhiyun static void print_addr(__u64 addr)
47*4882a593Smuzhiyun {
48*4882a593Smuzhiyun if (!addr)
49*4882a593Smuzhiyun return;
50*4882a593Smuzhiyun printf("%llx;", addr);
51*4882a593Smuzhiyun }
52*4882a593Smuzhiyun
53*4882a593Smuzhiyun #define TASK_COMM_LEN 16
54*4882a593Smuzhiyun
55*4882a593Smuzhiyun struct key_t {
56*4882a593Smuzhiyun char comm[TASK_COMM_LEN];
57*4882a593Smuzhiyun __u32 kernstack;
58*4882a593Smuzhiyun __u32 userstack;
59*4882a593Smuzhiyun };
60*4882a593Smuzhiyun
print_stack(struct key_t * key,__u64 count)61*4882a593Smuzhiyun static void print_stack(struct key_t *key, __u64 count)
62*4882a593Smuzhiyun {
63*4882a593Smuzhiyun __u64 ip[PERF_MAX_STACK_DEPTH] = {};
64*4882a593Smuzhiyun static bool warned;
65*4882a593Smuzhiyun int i;
66*4882a593Smuzhiyun
67*4882a593Smuzhiyun printf("%3lld %s;", count, key->comm);
68*4882a593Smuzhiyun if (bpf_map_lookup_elem(map_fd[1], &key->kernstack, ip) != 0) {
69*4882a593Smuzhiyun printf("---;");
70*4882a593Smuzhiyun } else {
71*4882a593Smuzhiyun for (i = PERF_MAX_STACK_DEPTH - 1; i >= 0; i--)
72*4882a593Smuzhiyun print_ksym(ip[i]);
73*4882a593Smuzhiyun }
74*4882a593Smuzhiyun printf("-;");
75*4882a593Smuzhiyun if (bpf_map_lookup_elem(map_fd[1], &key->userstack, ip) != 0) {
76*4882a593Smuzhiyun printf("---;");
77*4882a593Smuzhiyun } else {
78*4882a593Smuzhiyun for (i = PERF_MAX_STACK_DEPTH - 1; i >= 0; i--)
79*4882a593Smuzhiyun print_addr(ip[i]);
80*4882a593Smuzhiyun }
81*4882a593Smuzhiyun if (count < 6)
82*4882a593Smuzhiyun printf("\r");
83*4882a593Smuzhiyun else
84*4882a593Smuzhiyun printf("\n");
85*4882a593Smuzhiyun
86*4882a593Smuzhiyun if (key->kernstack == -EEXIST && !warned) {
87*4882a593Smuzhiyun printf("stackmap collisions seen. Consider increasing size\n");
88*4882a593Smuzhiyun warned = true;
89*4882a593Smuzhiyun } else if ((int)key->kernstack < 0 && (int)key->userstack < 0) {
90*4882a593Smuzhiyun printf("err stackid %d %d\n", key->kernstack, key->userstack);
91*4882a593Smuzhiyun }
92*4882a593Smuzhiyun }
93*4882a593Smuzhiyun
err_exit(int err)94*4882a593Smuzhiyun static void err_exit(int err)
95*4882a593Smuzhiyun {
96*4882a593Smuzhiyun kill(pid, SIGKILL);
97*4882a593Smuzhiyun exit(err);
98*4882a593Smuzhiyun }
99*4882a593Smuzhiyun
print_stacks(void)100*4882a593Smuzhiyun static void print_stacks(void)
101*4882a593Smuzhiyun {
102*4882a593Smuzhiyun struct key_t key = {}, next_key;
103*4882a593Smuzhiyun __u64 value;
104*4882a593Smuzhiyun __u32 stackid = 0, next_id;
105*4882a593Smuzhiyun int error = 1, fd = map_fd[0], stack_map = map_fd[1];
106*4882a593Smuzhiyun
107*4882a593Smuzhiyun sys_read_seen = sys_write_seen = false;
108*4882a593Smuzhiyun while (bpf_map_get_next_key(fd, &key, &next_key) == 0) {
109*4882a593Smuzhiyun bpf_map_lookup_elem(fd, &next_key, &value);
110*4882a593Smuzhiyun print_stack(&next_key, value);
111*4882a593Smuzhiyun bpf_map_delete_elem(fd, &next_key);
112*4882a593Smuzhiyun key = next_key;
113*4882a593Smuzhiyun }
114*4882a593Smuzhiyun printf("\n");
115*4882a593Smuzhiyun if (!sys_read_seen || !sys_write_seen) {
116*4882a593Smuzhiyun printf("BUG kernel stack doesn't contain sys_read() and sys_write()\n");
117*4882a593Smuzhiyun err_exit(error);
118*4882a593Smuzhiyun }
119*4882a593Smuzhiyun
120*4882a593Smuzhiyun /* clear stack map */
121*4882a593Smuzhiyun while (bpf_map_get_next_key(stack_map, &stackid, &next_id) == 0) {
122*4882a593Smuzhiyun bpf_map_delete_elem(stack_map, &next_id);
123*4882a593Smuzhiyun stackid = next_id;
124*4882a593Smuzhiyun }
125*4882a593Smuzhiyun }
126*4882a593Smuzhiyun
generate_load(void)127*4882a593Smuzhiyun static inline int generate_load(void)
128*4882a593Smuzhiyun {
129*4882a593Smuzhiyun if (system("dd if=/dev/zero of=/dev/null count=5000k status=none") < 0) {
130*4882a593Smuzhiyun printf("failed to generate some load with dd: %s\n", strerror(errno));
131*4882a593Smuzhiyun return -1;
132*4882a593Smuzhiyun }
133*4882a593Smuzhiyun
134*4882a593Smuzhiyun return 0;
135*4882a593Smuzhiyun }
136*4882a593Smuzhiyun
test_perf_event_all_cpu(struct perf_event_attr * attr)137*4882a593Smuzhiyun static void test_perf_event_all_cpu(struct perf_event_attr *attr)
138*4882a593Smuzhiyun {
139*4882a593Smuzhiyun int nr_cpus = sysconf(_SC_NPROCESSORS_ONLN);
140*4882a593Smuzhiyun struct bpf_link **links = calloc(nr_cpus, sizeof(struct bpf_link *));
141*4882a593Smuzhiyun int i, pmu_fd, error = 1;
142*4882a593Smuzhiyun
143*4882a593Smuzhiyun if (!links) {
144*4882a593Smuzhiyun printf("malloc of links failed\n");
145*4882a593Smuzhiyun goto err;
146*4882a593Smuzhiyun }
147*4882a593Smuzhiyun
148*4882a593Smuzhiyun /* system wide perf event, no need to inherit */
149*4882a593Smuzhiyun attr->inherit = 0;
150*4882a593Smuzhiyun
151*4882a593Smuzhiyun /* open perf_event on all cpus */
152*4882a593Smuzhiyun for (i = 0; i < nr_cpus; i++) {
153*4882a593Smuzhiyun pmu_fd = sys_perf_event_open(attr, -1, i, -1, 0);
154*4882a593Smuzhiyun if (pmu_fd < 0) {
155*4882a593Smuzhiyun printf("sys_perf_event_open failed\n");
156*4882a593Smuzhiyun goto all_cpu_err;
157*4882a593Smuzhiyun }
158*4882a593Smuzhiyun links[i] = bpf_program__attach_perf_event(prog, pmu_fd);
159*4882a593Smuzhiyun if (libbpf_get_error(links[i])) {
160*4882a593Smuzhiyun printf("bpf_program__attach_perf_event failed\n");
161*4882a593Smuzhiyun links[i] = NULL;
162*4882a593Smuzhiyun close(pmu_fd);
163*4882a593Smuzhiyun goto all_cpu_err;
164*4882a593Smuzhiyun }
165*4882a593Smuzhiyun }
166*4882a593Smuzhiyun
167*4882a593Smuzhiyun if (generate_load() < 0)
168*4882a593Smuzhiyun goto all_cpu_err;
169*4882a593Smuzhiyun
170*4882a593Smuzhiyun print_stacks();
171*4882a593Smuzhiyun error = 0;
172*4882a593Smuzhiyun all_cpu_err:
173*4882a593Smuzhiyun for (i--; i >= 0; i--)
174*4882a593Smuzhiyun bpf_link__destroy(links[i]);
175*4882a593Smuzhiyun err:
176*4882a593Smuzhiyun free(links);
177*4882a593Smuzhiyun if (error)
178*4882a593Smuzhiyun err_exit(error);
179*4882a593Smuzhiyun }
180*4882a593Smuzhiyun
test_perf_event_task(struct perf_event_attr * attr)181*4882a593Smuzhiyun static void test_perf_event_task(struct perf_event_attr *attr)
182*4882a593Smuzhiyun {
183*4882a593Smuzhiyun struct bpf_link *link = NULL;
184*4882a593Smuzhiyun int pmu_fd, error = 1;
185*4882a593Smuzhiyun
186*4882a593Smuzhiyun /* per task perf event, enable inherit so the "dd ..." command can be traced properly.
187*4882a593Smuzhiyun * Enabling inherit will cause bpf_perf_prog_read_time helper failure.
188*4882a593Smuzhiyun */
189*4882a593Smuzhiyun attr->inherit = 1;
190*4882a593Smuzhiyun
191*4882a593Smuzhiyun /* open task bound event */
192*4882a593Smuzhiyun pmu_fd = sys_perf_event_open(attr, 0, -1, -1, 0);
193*4882a593Smuzhiyun if (pmu_fd < 0) {
194*4882a593Smuzhiyun printf("sys_perf_event_open failed\n");
195*4882a593Smuzhiyun goto err;
196*4882a593Smuzhiyun }
197*4882a593Smuzhiyun link = bpf_program__attach_perf_event(prog, pmu_fd);
198*4882a593Smuzhiyun if (libbpf_get_error(link)) {
199*4882a593Smuzhiyun printf("bpf_program__attach_perf_event failed\n");
200*4882a593Smuzhiyun link = NULL;
201*4882a593Smuzhiyun close(pmu_fd);
202*4882a593Smuzhiyun goto err;
203*4882a593Smuzhiyun }
204*4882a593Smuzhiyun
205*4882a593Smuzhiyun if (generate_load() < 0)
206*4882a593Smuzhiyun goto err;
207*4882a593Smuzhiyun
208*4882a593Smuzhiyun print_stacks();
209*4882a593Smuzhiyun error = 0;
210*4882a593Smuzhiyun err:
211*4882a593Smuzhiyun bpf_link__destroy(link);
212*4882a593Smuzhiyun if (error)
213*4882a593Smuzhiyun err_exit(error);
214*4882a593Smuzhiyun }
215*4882a593Smuzhiyun
test_bpf_perf_event(void)216*4882a593Smuzhiyun static void test_bpf_perf_event(void)
217*4882a593Smuzhiyun {
218*4882a593Smuzhiyun struct perf_event_attr attr_type_hw = {
219*4882a593Smuzhiyun .sample_freq = SAMPLE_FREQ,
220*4882a593Smuzhiyun .freq = 1,
221*4882a593Smuzhiyun .type = PERF_TYPE_HARDWARE,
222*4882a593Smuzhiyun .config = PERF_COUNT_HW_CPU_CYCLES,
223*4882a593Smuzhiyun };
224*4882a593Smuzhiyun struct perf_event_attr attr_type_sw = {
225*4882a593Smuzhiyun .sample_freq = SAMPLE_FREQ,
226*4882a593Smuzhiyun .freq = 1,
227*4882a593Smuzhiyun .type = PERF_TYPE_SOFTWARE,
228*4882a593Smuzhiyun .config = PERF_COUNT_SW_CPU_CLOCK,
229*4882a593Smuzhiyun };
230*4882a593Smuzhiyun struct perf_event_attr attr_hw_cache_l1d = {
231*4882a593Smuzhiyun .sample_freq = SAMPLE_FREQ,
232*4882a593Smuzhiyun .freq = 1,
233*4882a593Smuzhiyun .type = PERF_TYPE_HW_CACHE,
234*4882a593Smuzhiyun .config =
235*4882a593Smuzhiyun PERF_COUNT_HW_CACHE_L1D |
236*4882a593Smuzhiyun (PERF_COUNT_HW_CACHE_OP_READ << 8) |
237*4882a593Smuzhiyun (PERF_COUNT_HW_CACHE_RESULT_ACCESS << 16),
238*4882a593Smuzhiyun };
239*4882a593Smuzhiyun struct perf_event_attr attr_hw_cache_branch_miss = {
240*4882a593Smuzhiyun .sample_freq = SAMPLE_FREQ,
241*4882a593Smuzhiyun .freq = 1,
242*4882a593Smuzhiyun .type = PERF_TYPE_HW_CACHE,
243*4882a593Smuzhiyun .config =
244*4882a593Smuzhiyun PERF_COUNT_HW_CACHE_BPU |
245*4882a593Smuzhiyun (PERF_COUNT_HW_CACHE_OP_READ << 8) |
246*4882a593Smuzhiyun (PERF_COUNT_HW_CACHE_RESULT_MISS << 16),
247*4882a593Smuzhiyun };
248*4882a593Smuzhiyun struct perf_event_attr attr_type_raw = {
249*4882a593Smuzhiyun .sample_freq = SAMPLE_FREQ,
250*4882a593Smuzhiyun .freq = 1,
251*4882a593Smuzhiyun .type = PERF_TYPE_RAW,
252*4882a593Smuzhiyun /* Intel Instruction Retired */
253*4882a593Smuzhiyun .config = 0xc0,
254*4882a593Smuzhiyun };
255*4882a593Smuzhiyun struct perf_event_attr attr_type_raw_lock_load = {
256*4882a593Smuzhiyun .sample_freq = SAMPLE_FREQ,
257*4882a593Smuzhiyun .freq = 1,
258*4882a593Smuzhiyun .type = PERF_TYPE_RAW,
259*4882a593Smuzhiyun /* Intel MEM_UOPS_RETIRED.LOCK_LOADS */
260*4882a593Smuzhiyun .config = 0x21d0,
261*4882a593Smuzhiyun /* Request to record lock address from PEBS */
262*4882a593Smuzhiyun .sample_type = PERF_SAMPLE_ADDR,
263*4882a593Smuzhiyun /* Record address value requires precise event */
264*4882a593Smuzhiyun .precise_ip = 2,
265*4882a593Smuzhiyun };
266*4882a593Smuzhiyun
267*4882a593Smuzhiyun printf("Test HW_CPU_CYCLES\n");
268*4882a593Smuzhiyun test_perf_event_all_cpu(&attr_type_hw);
269*4882a593Smuzhiyun test_perf_event_task(&attr_type_hw);
270*4882a593Smuzhiyun
271*4882a593Smuzhiyun printf("Test SW_CPU_CLOCK\n");
272*4882a593Smuzhiyun test_perf_event_all_cpu(&attr_type_sw);
273*4882a593Smuzhiyun test_perf_event_task(&attr_type_sw);
274*4882a593Smuzhiyun
275*4882a593Smuzhiyun printf("Test HW_CACHE_L1D\n");
276*4882a593Smuzhiyun test_perf_event_all_cpu(&attr_hw_cache_l1d);
277*4882a593Smuzhiyun test_perf_event_task(&attr_hw_cache_l1d);
278*4882a593Smuzhiyun
279*4882a593Smuzhiyun printf("Test HW_CACHE_BPU\n");
280*4882a593Smuzhiyun test_perf_event_all_cpu(&attr_hw_cache_branch_miss);
281*4882a593Smuzhiyun test_perf_event_task(&attr_hw_cache_branch_miss);
282*4882a593Smuzhiyun
283*4882a593Smuzhiyun printf("Test Instruction Retired\n");
284*4882a593Smuzhiyun test_perf_event_all_cpu(&attr_type_raw);
285*4882a593Smuzhiyun test_perf_event_task(&attr_type_raw);
286*4882a593Smuzhiyun
287*4882a593Smuzhiyun printf("Test Lock Load\n");
288*4882a593Smuzhiyun test_perf_event_all_cpu(&attr_type_raw_lock_load);
289*4882a593Smuzhiyun test_perf_event_task(&attr_type_raw_lock_load);
290*4882a593Smuzhiyun
291*4882a593Smuzhiyun printf("*** PASS ***\n");
292*4882a593Smuzhiyun }
293*4882a593Smuzhiyun
294*4882a593Smuzhiyun
main(int argc,char ** argv)295*4882a593Smuzhiyun int main(int argc, char **argv)
296*4882a593Smuzhiyun {
297*4882a593Smuzhiyun struct rlimit r = {RLIM_INFINITY, RLIM_INFINITY};
298*4882a593Smuzhiyun struct bpf_object *obj = NULL;
299*4882a593Smuzhiyun char filename[256];
300*4882a593Smuzhiyun int error = 1;
301*4882a593Smuzhiyun
302*4882a593Smuzhiyun snprintf(filename, sizeof(filename), "%s_kern.o", argv[0]);
303*4882a593Smuzhiyun setrlimit(RLIMIT_MEMLOCK, &r);
304*4882a593Smuzhiyun
305*4882a593Smuzhiyun signal(SIGINT, err_exit);
306*4882a593Smuzhiyun signal(SIGTERM, err_exit);
307*4882a593Smuzhiyun
308*4882a593Smuzhiyun if (load_kallsyms()) {
309*4882a593Smuzhiyun printf("failed to process /proc/kallsyms\n");
310*4882a593Smuzhiyun goto cleanup;
311*4882a593Smuzhiyun }
312*4882a593Smuzhiyun
313*4882a593Smuzhiyun obj = bpf_object__open_file(filename, NULL);
314*4882a593Smuzhiyun if (libbpf_get_error(obj)) {
315*4882a593Smuzhiyun printf("opening BPF object file failed\n");
316*4882a593Smuzhiyun obj = NULL;
317*4882a593Smuzhiyun goto cleanup;
318*4882a593Smuzhiyun }
319*4882a593Smuzhiyun
320*4882a593Smuzhiyun prog = bpf_object__find_program_by_name(obj, "bpf_prog1");
321*4882a593Smuzhiyun if (!prog) {
322*4882a593Smuzhiyun printf("finding a prog in obj file failed\n");
323*4882a593Smuzhiyun goto cleanup;
324*4882a593Smuzhiyun }
325*4882a593Smuzhiyun
326*4882a593Smuzhiyun /* load BPF program */
327*4882a593Smuzhiyun if (bpf_object__load(obj)) {
328*4882a593Smuzhiyun printf("loading BPF object file failed\n");
329*4882a593Smuzhiyun goto cleanup;
330*4882a593Smuzhiyun }
331*4882a593Smuzhiyun
332*4882a593Smuzhiyun map_fd[0] = bpf_object__find_map_fd_by_name(obj, "counts");
333*4882a593Smuzhiyun map_fd[1] = bpf_object__find_map_fd_by_name(obj, "stackmap");
334*4882a593Smuzhiyun if (map_fd[0] < 0 || map_fd[1] < 0) {
335*4882a593Smuzhiyun printf("finding a counts/stackmap map in obj file failed\n");
336*4882a593Smuzhiyun goto cleanup;
337*4882a593Smuzhiyun }
338*4882a593Smuzhiyun
339*4882a593Smuzhiyun pid = fork();
340*4882a593Smuzhiyun if (pid == 0) {
341*4882a593Smuzhiyun read_trace_pipe();
342*4882a593Smuzhiyun return 0;
343*4882a593Smuzhiyun } else if (pid == -1) {
344*4882a593Smuzhiyun printf("couldn't spawn process\n");
345*4882a593Smuzhiyun goto cleanup;
346*4882a593Smuzhiyun }
347*4882a593Smuzhiyun
348*4882a593Smuzhiyun test_bpf_perf_event();
349*4882a593Smuzhiyun error = 0;
350*4882a593Smuzhiyun
351*4882a593Smuzhiyun cleanup:
352*4882a593Smuzhiyun bpf_object__close(obj);
353*4882a593Smuzhiyun err_exit(error);
354*4882a593Smuzhiyun }
355