1 // SPDX-License-Identifier: GPL-2.0
2 /* Copyright (c) 2021 Facebook */
3 #define _GNU_SOURCE
4 #include <sched.h>
5 #include <test_progs.h>
6 #include <time.h>
7 #include <sys/mman.h>
8 #include <sys/syscall.h>
9 #include "fexit_sleep.lskel.h"
10
do_sleep(void * skel)11 static int do_sleep(void *skel)
12 {
13 struct fexit_sleep_lskel *fexit_skel = skel;
14 struct timespec ts1 = { .tv_nsec = 1 };
15 struct timespec ts2 = { .tv_sec = 10 };
16
17 fexit_skel->bss->pid = getpid();
18 (void)syscall(__NR_nanosleep, &ts1, NULL);
19 (void)syscall(__NR_nanosleep, &ts2, NULL);
20 return 0;
21 }
22
23 #define STACK_SIZE (1024 * 1024)
24
test_fexit_sleep(void)25 void test_fexit_sleep(void)
26 {
27 struct fexit_sleep_lskel *fexit_skel = NULL;
28 int wstatus, duration = 0;
29 pid_t cpid;
30 char *child_stack = NULL;
31 int err, fexit_cnt;
32
33 fexit_skel = fexit_sleep_lskel__open_and_load();
34 if (CHECK(!fexit_skel, "fexit_skel_load", "fexit skeleton failed\n"))
35 goto cleanup;
36
37 err = fexit_sleep_lskel__attach(fexit_skel);
38 if (CHECK(err, "fexit_attach", "fexit attach failed: %d\n", err))
39 goto cleanup;
40
41 child_stack = mmap(NULL, STACK_SIZE, PROT_READ | PROT_WRITE, MAP_PRIVATE |
42 MAP_ANONYMOUS | MAP_STACK, -1, 0);
43 if (!ASSERT_NEQ(child_stack, MAP_FAILED, "mmap"))
44 goto cleanup;
45
46 cpid = clone(do_sleep, child_stack + STACK_SIZE, CLONE_FILES | SIGCHLD, fexit_skel);
47 if (CHECK(cpid == -1, "clone", "%s\n", strerror(errno)))
48 goto cleanup;
49
50 /* wait until first sys_nanosleep ends and second sys_nanosleep starts */
51 while (READ_ONCE(fexit_skel->bss->fentry_cnt) != 2);
52 fexit_cnt = READ_ONCE(fexit_skel->bss->fexit_cnt);
53 if (CHECK(fexit_cnt != 1, "fexit_cnt", "%d", fexit_cnt))
54 goto cleanup;
55
56 /* close progs and detach them. That will trigger two nop5->jmp5 rewrites
57 * in the trampolines to skip nanosleep_fexit prog.
58 * The nanosleep_fentry prog will get detached first.
59 * The nanosleep_fexit prog will get detached second.
60 * Detaching will trigger freeing of both progs JITed images.
61 * There will be two dying bpf_tramp_image-s, but only the initial
62 * bpf_tramp_image (with both _fentry and _fexit progs will be stuck
63 * waiting for percpu_ref_kill to confirm). The other one
64 * will be freed quickly.
65 */
66 close(fexit_skel->progs.nanosleep_fentry.prog_fd);
67 close(fexit_skel->progs.nanosleep_fexit.prog_fd);
68 fexit_sleep_lskel__detach(fexit_skel);
69
70 /* kill the thread to unwind sys_nanosleep stack through the trampoline */
71 kill(cpid, 9);
72
73 if (CHECK(waitpid(cpid, &wstatus, 0) == -1, "waitpid", "%s\n", strerror(errno)))
74 goto cleanup;
75 if (CHECK(WEXITSTATUS(wstatus) != 0, "exitstatus", "failed"))
76 goto cleanup;
77
78 /* The bypassed nanosleep_fexit prog shouldn't have executed.
79 * Unlike progs the maps were not freed and directly accessible.
80 */
81 fexit_cnt = READ_ONCE(fexit_skel->bss->fexit_cnt);
82 if (CHECK(fexit_cnt != 1, "fexit_cnt", "%d", fexit_cnt))
83 goto cleanup;
84
85 cleanup:
86 munmap(child_stack, STACK_SIZE);
87 fexit_sleep_lskel__destroy(fexit_skel);
88 }
89