1*4882a593Smuzhiyun // SPDX-License-Identifier: GPL-2.0
2*4882a593Smuzhiyun
3*4882a593Smuzhiyun #define _GNU_SOURCE
4*4882a593Smuzhiyun #include <assert.h>
5*4882a593Smuzhiyun #include <errno.h>
6*4882a593Smuzhiyun #include <fcntl.h>
7*4882a593Smuzhiyun #include <linux/types.h>
8*4882a593Smuzhiyun #include <sched.h>
9*4882a593Smuzhiyun #include <signal.h>
10*4882a593Smuzhiyun #include <stdio.h>
11*4882a593Smuzhiyun #include <stdlib.h>
12*4882a593Smuzhiyun #include <string.h>
13*4882a593Smuzhiyun #include <syscall.h>
14*4882a593Smuzhiyun #include <sys/wait.h>
15*4882a593Smuzhiyun #include <sys/mman.h>
16*4882a593Smuzhiyun
17*4882a593Smuzhiyun #include "pidfd.h"
18*4882a593Smuzhiyun #include "../kselftest.h"
19*4882a593Smuzhiyun
/*
 * Result of a test: one of the PIDFD_* codes plus a formatted,
 * human-readable explanation.  Filled in by error_set().
 */
struct error {
	int code;	/* PIDFD_* result code */
	char msg[512];	/* NUL-terminated message describing the result */
};
24*4882a593Smuzhiyun
error_set(struct error * err,int code,const char * fmt,...)25*4882a593Smuzhiyun static int error_set(struct error *err, int code, const char *fmt, ...)
26*4882a593Smuzhiyun {
27*4882a593Smuzhiyun va_list args;
28*4882a593Smuzhiyun int r;
29*4882a593Smuzhiyun
30*4882a593Smuzhiyun if (code == PIDFD_PASS || !err || err->code != PIDFD_PASS)
31*4882a593Smuzhiyun return code;
32*4882a593Smuzhiyun
33*4882a593Smuzhiyun err->code = code;
34*4882a593Smuzhiyun va_start(args, fmt);
35*4882a593Smuzhiyun r = vsnprintf(err->msg, sizeof(err->msg), fmt, args);
36*4882a593Smuzhiyun assert((size_t)r < sizeof(err->msg));
37*4882a593Smuzhiyun va_end(args);
38*4882a593Smuzhiyun
39*4882a593Smuzhiyun return code;
40*4882a593Smuzhiyun }
41*4882a593Smuzhiyun
error_report(struct error * err,const char * test_name)42*4882a593Smuzhiyun static void error_report(struct error *err, const char *test_name)
43*4882a593Smuzhiyun {
44*4882a593Smuzhiyun switch (err->code) {
45*4882a593Smuzhiyun case PIDFD_ERROR:
46*4882a593Smuzhiyun ksft_exit_fail_msg("%s test: Fatal: %s\n", test_name, err->msg);
47*4882a593Smuzhiyun break;
48*4882a593Smuzhiyun
49*4882a593Smuzhiyun case PIDFD_FAIL:
50*4882a593Smuzhiyun /* will be: not ok %d # error %s test: %s */
51*4882a593Smuzhiyun ksft_test_result_error("%s test: %s\n", test_name, err->msg);
52*4882a593Smuzhiyun break;
53*4882a593Smuzhiyun
54*4882a593Smuzhiyun case PIDFD_SKIP:
55*4882a593Smuzhiyun /* will be: not ok %d # SKIP %s test: %s */
56*4882a593Smuzhiyun ksft_test_result_skip("%s test: %s\n", test_name, err->msg);
57*4882a593Smuzhiyun break;
58*4882a593Smuzhiyun
59*4882a593Smuzhiyun case PIDFD_XFAIL:
60*4882a593Smuzhiyun ksft_test_result_pass("%s test: Expected failure: %s\n",
61*4882a593Smuzhiyun test_name, err->msg);
62*4882a593Smuzhiyun break;
63*4882a593Smuzhiyun
64*4882a593Smuzhiyun case PIDFD_PASS:
65*4882a593Smuzhiyun ksft_test_result_pass("%s test: Passed\n");
66*4882a593Smuzhiyun break;
67*4882a593Smuzhiyun
68*4882a593Smuzhiyun default:
69*4882a593Smuzhiyun ksft_exit_fail_msg("%s test: Unknown code: %d %s\n",
70*4882a593Smuzhiyun test_name, err->code, err->msg);
71*4882a593Smuzhiyun break;
72*4882a593Smuzhiyun }
73*4882a593Smuzhiyun }
74*4882a593Smuzhiyun
error_check(struct error * err,const char * test_name)75*4882a593Smuzhiyun static inline int error_check(struct error *err, const char *test_name)
76*4882a593Smuzhiyun {
77*4882a593Smuzhiyun /* In case of error we bail out and terminate the test program */
78*4882a593Smuzhiyun if (err->code == PIDFD_ERROR)
79*4882a593Smuzhiyun error_report(err, test_name);
80*4882a593Smuzhiyun
81*4882a593Smuzhiyun return err->code;
82*4882a593Smuzhiyun }
83*4882a593Smuzhiyun
/* Size in bytes of the stack mapping created for each cloned child. */
#define CHILD_STACK_SIZE 8192
85*4882a593Smuzhiyun
/* Bookkeeping for a process started by clone_newns(). */
struct child {
	char *stack;	/* base of the mmap()ed stack, CHILD_STACK_SIZE bytes */
	pid_t pid;	/* value returned by clone() */
	int fd;		/* pidfd filled in by clone() (CLONE_PIDFD) */
};
91*4882a593Smuzhiyun
clone_newns(int (* fn)(void *),void * args,struct error * err)92*4882a593Smuzhiyun static struct child clone_newns(int (*fn)(void *), void *args,
93*4882a593Smuzhiyun struct error *err)
94*4882a593Smuzhiyun {
95*4882a593Smuzhiyun static int flags = CLONE_PIDFD | CLONE_NEWPID | CLONE_NEWNS | SIGCHLD;
96*4882a593Smuzhiyun struct child ret;
97*4882a593Smuzhiyun
98*4882a593Smuzhiyun if (!(flags & CLONE_NEWUSER) && geteuid() != 0)
99*4882a593Smuzhiyun flags |= CLONE_NEWUSER;
100*4882a593Smuzhiyun
101*4882a593Smuzhiyun ret.stack = mmap(NULL, CHILD_STACK_SIZE, PROT_READ | PROT_WRITE,
102*4882a593Smuzhiyun MAP_PRIVATE | MAP_ANONYMOUS | MAP_STACK, -1, 0);
103*4882a593Smuzhiyun if (ret.stack == MAP_FAILED) {
104*4882a593Smuzhiyun error_set(err, -1, "mmap of stack failed (errno %d)", errno);
105*4882a593Smuzhiyun return ret;
106*4882a593Smuzhiyun }
107*4882a593Smuzhiyun
108*4882a593Smuzhiyun #ifdef __ia64__
109*4882a593Smuzhiyun ret.pid = __clone2(fn, ret.stack, CHILD_STACK_SIZE, flags, args, &ret.fd);
110*4882a593Smuzhiyun #else
111*4882a593Smuzhiyun ret.pid = clone(fn, ret.stack + CHILD_STACK_SIZE, flags, args, &ret.fd);
112*4882a593Smuzhiyun #endif
113*4882a593Smuzhiyun
114*4882a593Smuzhiyun if (ret.pid < 0) {
115*4882a593Smuzhiyun error_set(err, PIDFD_ERROR, "clone failed (ret %d, errno %d)",
116*4882a593Smuzhiyun ret.fd, errno);
117*4882a593Smuzhiyun return ret;
118*4882a593Smuzhiyun }
119*4882a593Smuzhiyun
120*4882a593Smuzhiyun ksft_print_msg("New child: %d, fd: %d\n", ret.pid, ret.fd);
121*4882a593Smuzhiyun
122*4882a593Smuzhiyun return ret;
123*4882a593Smuzhiyun }
124*4882a593Smuzhiyun
child_close(struct child * child)125*4882a593Smuzhiyun static inline void child_close(struct child *child)
126*4882a593Smuzhiyun {
127*4882a593Smuzhiyun close(child->fd);
128*4882a593Smuzhiyun }
129*4882a593Smuzhiyun
child_join(struct child * child,struct error * err)130*4882a593Smuzhiyun static inline int child_join(struct child *child, struct error *err)
131*4882a593Smuzhiyun {
132*4882a593Smuzhiyun int r;
133*4882a593Smuzhiyun
134*4882a593Smuzhiyun r = wait_for_pid(child->pid);
135*4882a593Smuzhiyun if (r < 0)
136*4882a593Smuzhiyun error_set(err, PIDFD_ERROR, "waitpid failed (ret %d, errno %d)",
137*4882a593Smuzhiyun r, errno);
138*4882a593Smuzhiyun else if (r > 0)
139*4882a593Smuzhiyun error_set(err, r, "child %d reported: %d", child->pid, r);
140*4882a593Smuzhiyun
141*4882a593Smuzhiyun if (munmap(child->stack, CHILD_STACK_SIZE)) {
142*4882a593Smuzhiyun error_set(err, -1, "munmap of child stack failed (errno %d)", errno);
143*4882a593Smuzhiyun r = -1;
144*4882a593Smuzhiyun }
145*4882a593Smuzhiyun
146*4882a593Smuzhiyun return r;
147*4882a593Smuzhiyun }
148*4882a593Smuzhiyun
/*
 * Close the pidfd of @child first, then wait for the child and free its
 * stack.  Returns whatever child_join() returns.
 */
static inline int child_join_close(struct child *child, struct error *err)
{
	int status;

	child_close(child);
	status = child_join(child, err);

	return status;
}
154*4882a593Smuzhiyun
/*
 * Cut @str at its last '\n', if it contains one.  Everything from that
 * newline onwards is dropped; a string without a newline is unchanged.
 */
static inline void trim_newline(char *str)
{
	size_t i = strlen(str);

	/* Walk backwards so the first hit is the last newline. */
	while (i > 0) {
		i--;
		if (str[i] == '\n') {
			str[i] = '\0';
			return;
		}
	}
}
162*4882a593Smuzhiyun
verify_fdinfo(int pidfd,struct error * err,const char * prefix,size_t prefix_len,const char * expect,...)163*4882a593Smuzhiyun static int verify_fdinfo(int pidfd, struct error *err, const char *prefix,
164*4882a593Smuzhiyun size_t prefix_len, const char *expect, ...)
165*4882a593Smuzhiyun {
166*4882a593Smuzhiyun char buffer[512] = {0, };
167*4882a593Smuzhiyun char path[512] = {0, };
168*4882a593Smuzhiyun va_list args;
169*4882a593Smuzhiyun FILE *f;
170*4882a593Smuzhiyun char *line = NULL;
171*4882a593Smuzhiyun size_t n = 0;
172*4882a593Smuzhiyun int found = 0;
173*4882a593Smuzhiyun int r;
174*4882a593Smuzhiyun
175*4882a593Smuzhiyun va_start(args, expect);
176*4882a593Smuzhiyun r = vsnprintf(buffer, sizeof(buffer), expect, args);
177*4882a593Smuzhiyun assert((size_t)r < sizeof(buffer));
178*4882a593Smuzhiyun va_end(args);
179*4882a593Smuzhiyun
180*4882a593Smuzhiyun snprintf(path, sizeof(path), "/proc/self/fdinfo/%d", pidfd);
181*4882a593Smuzhiyun f = fopen(path, "re");
182*4882a593Smuzhiyun if (!f)
183*4882a593Smuzhiyun return error_set(err, PIDFD_ERROR, "fdinfo open failed for %d",
184*4882a593Smuzhiyun pidfd);
185*4882a593Smuzhiyun
186*4882a593Smuzhiyun while (getline(&line, &n, f) != -1) {
187*4882a593Smuzhiyun char *val;
188*4882a593Smuzhiyun
189*4882a593Smuzhiyun if (strncmp(line, prefix, prefix_len))
190*4882a593Smuzhiyun continue;
191*4882a593Smuzhiyun
192*4882a593Smuzhiyun found = 1;
193*4882a593Smuzhiyun
194*4882a593Smuzhiyun val = line + prefix_len;
195*4882a593Smuzhiyun r = strcmp(val, buffer);
196*4882a593Smuzhiyun if (r != 0) {
197*4882a593Smuzhiyun trim_newline(line);
198*4882a593Smuzhiyun trim_newline(buffer);
199*4882a593Smuzhiyun error_set(err, PIDFD_FAIL, "%s '%s' != '%s'",
200*4882a593Smuzhiyun prefix, val, buffer);
201*4882a593Smuzhiyun }
202*4882a593Smuzhiyun break;
203*4882a593Smuzhiyun }
204*4882a593Smuzhiyun
205*4882a593Smuzhiyun free(line);
206*4882a593Smuzhiyun fclose(f);
207*4882a593Smuzhiyun
208*4882a593Smuzhiyun if (found == 0)
209*4882a593Smuzhiyun return error_set(err, PIDFD_FAIL, "%s not found for fd %d",
210*4882a593Smuzhiyun prefix, pidfd);
211*4882a593Smuzhiyun
212*4882a593Smuzhiyun return PIDFD_PASS;
213*4882a593Smuzhiyun }
214*4882a593Smuzhiyun
child_fdinfo_nspid_test(void * args)215*4882a593Smuzhiyun static int child_fdinfo_nspid_test(void *args)
216*4882a593Smuzhiyun {
217*4882a593Smuzhiyun struct error err;
218*4882a593Smuzhiyun int pidfd;
219*4882a593Smuzhiyun int r;
220*4882a593Smuzhiyun
221*4882a593Smuzhiyun /* if we got no fd for the sibling, we are done */
222*4882a593Smuzhiyun if (!args)
223*4882a593Smuzhiyun return PIDFD_PASS;
224*4882a593Smuzhiyun
225*4882a593Smuzhiyun /* verify that we can not resolve the pidfd for a process
226*4882a593Smuzhiyun * in a sibling pid namespace, i.e. a pid namespace it is
227*4882a593Smuzhiyun * not in our or a descended namespace
228*4882a593Smuzhiyun */
229*4882a593Smuzhiyun r = mount(NULL, "/", NULL, MS_REC | MS_PRIVATE, 0);
230*4882a593Smuzhiyun if (r < 0) {
231*4882a593Smuzhiyun ksft_print_msg("Failed to remount / private\n");
232*4882a593Smuzhiyun return PIDFD_ERROR;
233*4882a593Smuzhiyun }
234*4882a593Smuzhiyun
235*4882a593Smuzhiyun (void)umount2("/proc", MNT_DETACH);
236*4882a593Smuzhiyun r = mount("proc", "/proc", "proc", 0, NULL);
237*4882a593Smuzhiyun if (r < 0) {
238*4882a593Smuzhiyun ksft_print_msg("Failed to remount /proc\n");
239*4882a593Smuzhiyun return PIDFD_ERROR;
240*4882a593Smuzhiyun }
241*4882a593Smuzhiyun
242*4882a593Smuzhiyun pidfd = *(int *)args;
243*4882a593Smuzhiyun r = verify_fdinfo(pidfd, &err, "NSpid:", 6, "\t0\n");
244*4882a593Smuzhiyun
245*4882a593Smuzhiyun if (r != PIDFD_PASS)
246*4882a593Smuzhiyun ksft_print_msg("NSpid fdinfo check failed: %s\n", err.msg);
247*4882a593Smuzhiyun
248*4882a593Smuzhiyun return r;
249*4882a593Smuzhiyun }
250*4882a593Smuzhiyun
test_pidfd_fdinfo_nspid(void)251*4882a593Smuzhiyun static void test_pidfd_fdinfo_nspid(void)
252*4882a593Smuzhiyun {
253*4882a593Smuzhiyun struct child a, b;
254*4882a593Smuzhiyun struct error err = {0, };
255*4882a593Smuzhiyun const char *test_name = "pidfd check for NSpid in fdinfo";
256*4882a593Smuzhiyun
257*4882a593Smuzhiyun /* Create a new child in a new pid and mount namespace */
258*4882a593Smuzhiyun a = clone_newns(child_fdinfo_nspid_test, NULL, &err);
259*4882a593Smuzhiyun error_check(&err, test_name);
260*4882a593Smuzhiyun
261*4882a593Smuzhiyun /* Pass the pidfd representing the first child to the
262*4882a593Smuzhiyun * second child, which will be in a sibling pid namespace,
263*4882a593Smuzhiyun * which means that the fdinfo NSpid entry for the pidfd
264*4882a593Smuzhiyun * should only contain '0'.
265*4882a593Smuzhiyun */
266*4882a593Smuzhiyun b = clone_newns(child_fdinfo_nspid_test, &a.fd, &err);
267*4882a593Smuzhiyun error_check(&err, test_name);
268*4882a593Smuzhiyun
269*4882a593Smuzhiyun /* The children will have pid 1 in the new pid namespace,
270*4882a593Smuzhiyun * so the line must be 'NSPid:\t<pid>\t1'.
271*4882a593Smuzhiyun */
272*4882a593Smuzhiyun verify_fdinfo(a.fd, &err, "NSpid:", 6, "\t%d\t%d\n", a.pid, 1);
273*4882a593Smuzhiyun verify_fdinfo(b.fd, &err, "NSpid:", 6, "\t%d\t%d\n", b.pid, 1);
274*4882a593Smuzhiyun
275*4882a593Smuzhiyun /* wait for the process, check the exit status and set
276*4882a593Smuzhiyun * 'err' accordingly, if it is not already set.
277*4882a593Smuzhiyun */
278*4882a593Smuzhiyun child_join_close(&a, &err);
279*4882a593Smuzhiyun child_join_close(&b, &err);
280*4882a593Smuzhiyun
281*4882a593Smuzhiyun error_report(&err, test_name);
282*4882a593Smuzhiyun }
283*4882a593Smuzhiyun
test_pidfd_dead_fdinfo(void)284*4882a593Smuzhiyun static void test_pidfd_dead_fdinfo(void)
285*4882a593Smuzhiyun {
286*4882a593Smuzhiyun struct child a;
287*4882a593Smuzhiyun struct error err = {0, };
288*4882a593Smuzhiyun const char *test_name = "pidfd check fdinfo for dead process";
289*4882a593Smuzhiyun
290*4882a593Smuzhiyun /* Create a new child in a new pid and mount namespace */
291*4882a593Smuzhiyun a = clone_newns(child_fdinfo_nspid_test, NULL, &err);
292*4882a593Smuzhiyun error_check(&err, test_name);
293*4882a593Smuzhiyun child_join(&a, &err);
294*4882a593Smuzhiyun
295*4882a593Smuzhiyun verify_fdinfo(a.fd, &err, "Pid:", 4, "\t-1\n");
296*4882a593Smuzhiyun verify_fdinfo(a.fd, &err, "NSpid:", 6, "\t-1\n");
297*4882a593Smuzhiyun child_close(&a);
298*4882a593Smuzhiyun error_report(&err, test_name);
299*4882a593Smuzhiyun }
300*4882a593Smuzhiyun
main(int argc,char ** argv)301*4882a593Smuzhiyun int main(int argc, char **argv)
302*4882a593Smuzhiyun {
303*4882a593Smuzhiyun ksft_print_header();
304*4882a593Smuzhiyun ksft_set_plan(2);
305*4882a593Smuzhiyun
306*4882a593Smuzhiyun test_pidfd_fdinfo_nspid();
307*4882a593Smuzhiyun test_pidfd_dead_fdinfo();
308*4882a593Smuzhiyun
309*4882a593Smuzhiyun return ksft_exit_pass();
310*4882a593Smuzhiyun }
311