/*
 * Strictly speaking, this is not a test. But it can report during test
 * runs so relative performance can be measured.
 */
5*4882a593Smuzhiyun #define _GNU_SOURCE
6*4882a593Smuzhiyun #include <assert.h>
7*4882a593Smuzhiyun #include <limits.h>
8*4882a593Smuzhiyun #include <stdbool.h>
9*4882a593Smuzhiyun #include <stddef.h>
10*4882a593Smuzhiyun #include <stdio.h>
11*4882a593Smuzhiyun #include <stdlib.h>
12*4882a593Smuzhiyun #include <time.h>
13*4882a593Smuzhiyun #include <unistd.h>
14*4882a593Smuzhiyun #include <linux/filter.h>
15*4882a593Smuzhiyun #include <linux/seccomp.h>
16*4882a593Smuzhiyun #include <sys/param.h>
17*4882a593Smuzhiyun #include <sys/prctl.h>
18*4882a593Smuzhiyun #include <sys/syscall.h>
19*4882a593Smuzhiyun #include <sys/types.h>
20*4882a593Smuzhiyun
/* Element count of array `a`; only meaningful for real arrays, not pointers. */
#define ARRAY_SIZE(a) (sizeof(a) / sizeof((a)[0]))
22*4882a593Smuzhiyun
/*
 * Time `samples` back-to-back getpid syscalls against the clock `clk_id`.
 *
 * Prints the finish and start timestamps, the elapsed nanoseconds and the
 * same figure in seconds, then returns the elapsed nanoseconds for the
 * whole run (not per call).
 *
 * Aborts if the clock cannot be read, or (in builds with assertions
 * enabled) if the raw syscall returns anything other than this process's
 * pid.
 */
unsigned long long timing(clockid_t clk_id, unsigned long long samples)
{
	struct timespec start, finish;
	unsigned long long i;
	pid_t pid, ret;

	pid = getpid();

	/* The call stays outside assert() so it is not compiled out by NDEBUG. */
	if (clock_gettime(clk_id, &start) != 0) {
		perror("clock_gettime");
		abort();
	}

	for (i = 0; i < samples; i++) {
		/* Invoke the raw syscall rather than the libc wrapper. */
		ret = syscall(__NR_getpid);
		assert(pid == ret);
	}

	if (clock_gettime(clk_id, &finish) != 0) {
		perror("clock_gettime");
		abort();
	}

	/*
	 * Elapsed nanoseconds. A negative tv_nsec difference wraps when
	 * converted to unsigned, and the modular sum is still correct.
	 */
	i = finish.tv_sec - start.tv_sec;
	i *= 1000000000ULL;
	i += finish.tv_nsec - start.tv_nsec;

	/* Cast explicitly: time_t and tv_nsec widths vary between ABIs. */
	printf("%lld.%09ld - %lld.%09ld = %llu (%.1fs)\n",
	       (long long)finish.tv_sec, (long)finish.tv_nsec,
	       (long long)start.tv_sec, (long)start.tv_nsec,
	       i, (double)i / 1000000000.0);

	return i;
}
48*4882a593Smuzhiyun
/*
 * Pick a sample count worth roughly `seconds` (15) seconds of getpid
 * syscalls.
 *
 * Runs batches of `step` raw getpid syscalls until at least one second of
 * CLOCK_MONOTONIC time has elapsed, then returns the number of syscalls
 * issued in that time multiplied by `seconds`.
 *
 * Aborts if the clock cannot be read, or (in builds with assertions
 * enabled) if the raw syscall returns anything other than this process's
 * pid.
 */
unsigned long long calibrate(void)
{
	struct timespec start, finish;
	unsigned long long i, samples, step = 9973;
	pid_t pid, ret;
	int seconds = 15;

	printf("Calibrating sample size for %d seconds worth of syscalls ...\n", seconds);

	samples = 0;
	pid = getpid();

	/* The call stays outside assert() so it is not compiled out by NDEBUG. */
	if (clock_gettime(CLOCK_MONOTONIC, &start) != 0) {
		perror("clock_gettime");
		abort();
	}

	do {
		for (i = 0; i < step; i++) {
			ret = syscall(__NR_getpid);
			assert(pid == ret);
		}

		/* `finish` must really be refreshed each pass or the loop never ends. */
		if (clock_gettime(CLOCK_MONOTONIC, &finish) != 0) {
			perror("clock_gettime");
			abort();
		}

		samples += step;

		/* Reuse `i` for the nanoseconds elapsed since `start`. */
		i = finish.tv_sec - start.tv_sec;
		i *= 1000000000ULL;
		i += finish.tv_nsec - start.tv_nsec;
	} while (i < 1000000000ULL);

	return samples * seconds;
}
76*4882a593Smuzhiyun
/*
 * Report whether two measurements are close enough to count as equal.
 *
 * The values match when they are identical, or when the larger one exceeds
 * the smaller one by no more than 1% of the smaller value, with a minimum
 * allowance of 2.
 */
bool approx(int i_one, int i_two)
{
	const double first = i_one;
	const double second = i_two;
	double smaller, larger, slack;

	if (first == second)
		return true;

	if (first < second) {
		smaller = first;
		larger = second;
	} else {
		smaller = second;
		larger = first;
	}

	/* Allowance is 1% of the smaller value, but never less than 2. */
	slack = smaller * 0.01;
	if (slack < 2.0)
		slack = 2.0;

	return larger <= smaller + slack;
}
92*4882a593Smuzhiyun
/* Ordering predicate: true when i_one does not exceed i_two. */
bool le(int i_one, int i_two)
{
	return i_one <= i_two;
}
99*4882a593Smuzhiyun
/*
 * Print and evaluate one expectation of the form "<one> <eval> <two>".
 *
 * name_one, name_eval and name_two label the operands and the relation in
 * the printed line. `eval` is the predicate applied to the two values.
 *
 * Returns 0 when the predicate holds and 1 otherwise. An operand above
 * INT_MAX is reported as a miscalculation and also yields 1, without
 * calling `eval`.
 */
long compare(const char *name_one, const char *name_eval, const char *name_two,
	     unsigned long long one, bool (*eval)(int, int), unsigned long long two)
{
	const unsigned long long operands[2] = { one, two };
	const char *mark;
	int k;

	printf("\t%s %s %s (%lld %s %lld): ", name_one, name_eval, name_two,
	       (long long)one, name_eval, (long long)two);

	/* The predicate takes int, so refuse anything that would not fit. */
	for (k = 0; k < 2; k++) {
		if (operands[k] > INT_MAX) {
			printf("Miscalculation! Measurement went negative: %lld\n",
			       (long long)operands[k]);
			return 1;
		}
	}

	if (eval(one, two))
		mark = "✔️";
	else
		mark = "❌";
	printf("%s\n", mark);

	return mark[0] == "❌"[0] ? 1 : 0;
}
121*4882a593Smuzhiyun
main(int argc,char * argv[])122*4882a593Smuzhiyun int main(int argc, char *argv[])
123*4882a593Smuzhiyun {
124*4882a593Smuzhiyun struct sock_filter bitmap_filter[] = {
125*4882a593Smuzhiyun BPF_STMT(BPF_LD|BPF_W|BPF_ABS, offsetof(struct seccomp_data, nr)),
126*4882a593Smuzhiyun BPF_STMT(BPF_RET|BPF_K, SECCOMP_RET_ALLOW),
127*4882a593Smuzhiyun };
128*4882a593Smuzhiyun struct sock_fprog bitmap_prog = {
129*4882a593Smuzhiyun .len = (unsigned short)ARRAY_SIZE(bitmap_filter),
130*4882a593Smuzhiyun .filter = bitmap_filter,
131*4882a593Smuzhiyun };
132*4882a593Smuzhiyun struct sock_filter filter[] = {
133*4882a593Smuzhiyun BPF_STMT(BPF_LD|BPF_W|BPF_ABS, offsetof(struct seccomp_data, args[0])),
134*4882a593Smuzhiyun BPF_STMT(BPF_RET|BPF_K, SECCOMP_RET_ALLOW),
135*4882a593Smuzhiyun };
136*4882a593Smuzhiyun struct sock_fprog prog = {
137*4882a593Smuzhiyun .len = (unsigned short)ARRAY_SIZE(filter),
138*4882a593Smuzhiyun .filter = filter,
139*4882a593Smuzhiyun };
140*4882a593Smuzhiyun
141*4882a593Smuzhiyun long ret, bits;
142*4882a593Smuzhiyun unsigned long long samples, calc;
143*4882a593Smuzhiyun unsigned long long native, filter1, filter2, bitmap1, bitmap2;
144*4882a593Smuzhiyun unsigned long long entry, per_filter1, per_filter2;
145*4882a593Smuzhiyun
146*4882a593Smuzhiyun printf("Current BPF sysctl settings:\n");
147*4882a593Smuzhiyun system("sysctl net.core.bpf_jit_enable");
148*4882a593Smuzhiyun system("sysctl net.core.bpf_jit_harden");
149*4882a593Smuzhiyun
150*4882a593Smuzhiyun if (argc > 1)
151*4882a593Smuzhiyun samples = strtoull(argv[1], NULL, 0);
152*4882a593Smuzhiyun else
153*4882a593Smuzhiyun samples = calibrate();
154*4882a593Smuzhiyun
155*4882a593Smuzhiyun printf("Benchmarking %llu syscalls...\n", samples);
156*4882a593Smuzhiyun
157*4882a593Smuzhiyun /* Native call */
158*4882a593Smuzhiyun native = timing(CLOCK_PROCESS_CPUTIME_ID, samples) / samples;
159*4882a593Smuzhiyun printf("getpid native: %llu ns\n", native);
160*4882a593Smuzhiyun
161*4882a593Smuzhiyun ret = prctl(PR_SET_NO_NEW_PRIVS, 1, 0, 0, 0);
162*4882a593Smuzhiyun assert(ret == 0);
163*4882a593Smuzhiyun
164*4882a593Smuzhiyun /* One filter resulting in a bitmap */
165*4882a593Smuzhiyun ret = prctl(PR_SET_SECCOMP, SECCOMP_MODE_FILTER, &bitmap_prog);
166*4882a593Smuzhiyun assert(ret == 0);
167*4882a593Smuzhiyun
168*4882a593Smuzhiyun bitmap1 = timing(CLOCK_PROCESS_CPUTIME_ID, samples) / samples;
169*4882a593Smuzhiyun printf("getpid RET_ALLOW 1 filter (bitmap): %llu ns\n", bitmap1);
170*4882a593Smuzhiyun
171*4882a593Smuzhiyun /* Second filter resulting in a bitmap */
172*4882a593Smuzhiyun ret = prctl(PR_SET_SECCOMP, SECCOMP_MODE_FILTER, &bitmap_prog);
173*4882a593Smuzhiyun assert(ret == 0);
174*4882a593Smuzhiyun
175*4882a593Smuzhiyun bitmap2 = timing(CLOCK_PROCESS_CPUTIME_ID, samples) / samples;
176*4882a593Smuzhiyun printf("getpid RET_ALLOW 2 filters (bitmap): %llu ns\n", bitmap2);
177*4882a593Smuzhiyun
178*4882a593Smuzhiyun /* Third filter, can no longer be converted to bitmap */
179*4882a593Smuzhiyun ret = prctl(PR_SET_SECCOMP, SECCOMP_MODE_FILTER, &prog);
180*4882a593Smuzhiyun assert(ret == 0);
181*4882a593Smuzhiyun
182*4882a593Smuzhiyun filter1 = timing(CLOCK_PROCESS_CPUTIME_ID, samples) / samples;
183*4882a593Smuzhiyun printf("getpid RET_ALLOW 3 filters (full): %llu ns\n", filter1);
184*4882a593Smuzhiyun
185*4882a593Smuzhiyun /* Fourth filter, can not be converted to bitmap because of filter 3 */
186*4882a593Smuzhiyun ret = prctl(PR_SET_SECCOMP, SECCOMP_MODE_FILTER, &bitmap_prog);
187*4882a593Smuzhiyun assert(ret == 0);
188*4882a593Smuzhiyun
189*4882a593Smuzhiyun filter2 = timing(CLOCK_PROCESS_CPUTIME_ID, samples) / samples;
190*4882a593Smuzhiyun printf("getpid RET_ALLOW 4 filters (full): %llu ns\n", filter2);
191*4882a593Smuzhiyun
192*4882a593Smuzhiyun /* Estimations */
193*4882a593Smuzhiyun #define ESTIMATE(fmt, var, what) do { \
194*4882a593Smuzhiyun var = (what); \
195*4882a593Smuzhiyun printf("Estimated " fmt ": %llu ns\n", var); \
196*4882a593Smuzhiyun if (var > INT_MAX) \
197*4882a593Smuzhiyun goto more_samples; \
198*4882a593Smuzhiyun } while (0)
199*4882a593Smuzhiyun
200*4882a593Smuzhiyun ESTIMATE("total seccomp overhead for 1 bitmapped filter", calc,
201*4882a593Smuzhiyun bitmap1 - native);
202*4882a593Smuzhiyun ESTIMATE("total seccomp overhead for 2 bitmapped filters", calc,
203*4882a593Smuzhiyun bitmap2 - native);
204*4882a593Smuzhiyun ESTIMATE("total seccomp overhead for 3 full filters", calc,
205*4882a593Smuzhiyun filter1 - native);
206*4882a593Smuzhiyun ESTIMATE("total seccomp overhead for 4 full filters", calc,
207*4882a593Smuzhiyun filter2 - native);
208*4882a593Smuzhiyun ESTIMATE("seccomp entry overhead", entry,
209*4882a593Smuzhiyun bitmap1 - native - (bitmap2 - bitmap1));
210*4882a593Smuzhiyun ESTIMATE("seccomp per-filter overhead (last 2 diff)", per_filter1,
211*4882a593Smuzhiyun filter2 - filter1);
212*4882a593Smuzhiyun ESTIMATE("seccomp per-filter overhead (filters / 4)", per_filter2,
213*4882a593Smuzhiyun (filter2 - native - entry) / 4);
214*4882a593Smuzhiyun
215*4882a593Smuzhiyun printf("Expectations:\n");
216*4882a593Smuzhiyun ret |= compare("native", "≤", "1 bitmap", native, le, bitmap1);
217*4882a593Smuzhiyun bits = compare("native", "≤", "1 filter", native, le, filter1);
218*4882a593Smuzhiyun if (bits)
219*4882a593Smuzhiyun goto more_samples;
220*4882a593Smuzhiyun
221*4882a593Smuzhiyun ret |= compare("per-filter (last 2 diff)", "≈", "per-filter (filters / 4)",
222*4882a593Smuzhiyun per_filter1, approx, per_filter2);
223*4882a593Smuzhiyun
224*4882a593Smuzhiyun bits = compare("1 bitmapped", "≈", "2 bitmapped",
225*4882a593Smuzhiyun bitmap1 - native, approx, bitmap2 - native);
226*4882a593Smuzhiyun if (bits) {
227*4882a593Smuzhiyun printf("Skipping constant action bitmap expectations: they appear unsupported.\n");
228*4882a593Smuzhiyun goto out;
229*4882a593Smuzhiyun }
230*4882a593Smuzhiyun
231*4882a593Smuzhiyun ret |= compare("entry", "≈", "1 bitmapped", entry, approx, bitmap1 - native);
232*4882a593Smuzhiyun ret |= compare("entry", "≈", "2 bitmapped", entry, approx, bitmap2 - native);
233*4882a593Smuzhiyun ret |= compare("native + entry + (per filter * 4)", "≈", "4 filters total",
234*4882a593Smuzhiyun entry + (per_filter1 * 4) + native, approx, filter2);
235*4882a593Smuzhiyun if (ret == 0)
236*4882a593Smuzhiyun goto out;
237*4882a593Smuzhiyun
238*4882a593Smuzhiyun more_samples:
239*4882a593Smuzhiyun printf("Saw unexpected benchmark result. Try running again with more samples?\n");
240*4882a593Smuzhiyun out:
241*4882a593Smuzhiyun return 0;
242*4882a593Smuzhiyun }
243