1686a8bb7SPeter Xu // SPDX-License-Identifier: GPL-2.0-only
2686a8bb7SPeter Xu /*
3686a8bb7SPeter Xu  * Userfaultfd unit tests.
4686a8bb7SPeter Xu  *
5686a8bb7SPeter Xu  *  Copyright (C) 2015-2023  Red Hat, Inc.
6686a8bb7SPeter Xu  */
7686a8bb7SPeter Xu 
8686a8bb7SPeter Xu #include "uffd-common.h"
9686a8bb7SPeter Xu 
10760aee0bSPeter Xu #include "../../../../mm/gup_test.h"
11760aee0bSPeter Xu 
12686a8bb7SPeter Xu #ifdef __NR_userfaultfd
13686a8bb7SPeter Xu 
/*
 * Size of the memory used by each unit test.  Neither a large nor a
 * random size is needed here, so it is fixed at 32MB for now.
 */
#define UFFD_TEST_MEM_SIZE	(32UL << 20)

/* One bit per memory type; used as mem_type.mem_flag values */
#define MEM_ANON		BIT_ULL(0)
#define MEM_SHMEM		BIT_ULL(1)
#define MEM_SHMEM_PRIVATE	BIT_ULL(2)
#define MEM_HUGETLB		BIT_ULL(3)
#define MEM_HUGETLB_PRIVATE	BIT_ULL(4)

/* Union of every memory type bit defined above */
#define MEM_ALL							\
	(MEM_ANON | MEM_SHMEM | MEM_SHMEM_PRIVATE |		\
	 MEM_HUGETLB | MEM_HUGETLB_PRIVATE)
2573c1ea93SPeter Xu 
2616a45b57SPeter Xu struct mem_type {
2716a45b57SPeter Xu 	const char *name;
2816a45b57SPeter Xu 	unsigned int mem_flag;
2916a45b57SPeter Xu 	uffd_test_ops_t *mem_ops;
3016a45b57SPeter Xu 	bool shared;
3116a45b57SPeter Xu };
3216a45b57SPeter Xu typedef struct mem_type mem_type_t;
3316a45b57SPeter Xu 
3416a45b57SPeter Xu mem_type_t mem_types[] = {
3516a45b57SPeter Xu 	{
3616a45b57SPeter Xu 		.name = "anon",
3716a45b57SPeter Xu 		.mem_flag = MEM_ANON,
3816a45b57SPeter Xu 		.mem_ops = &anon_uffd_test_ops,
3916a45b57SPeter Xu 		.shared = false,
4016a45b57SPeter Xu 	},
4116a45b57SPeter Xu 	{
4216a45b57SPeter Xu 		.name = "shmem",
4316a45b57SPeter Xu 		.mem_flag = MEM_SHMEM,
4416a45b57SPeter Xu 		.mem_ops = &shmem_uffd_test_ops,
4516a45b57SPeter Xu 		.shared = true,
4616a45b57SPeter Xu 	},
4716a45b57SPeter Xu 	{
4816a45b57SPeter Xu 		.name = "shmem-private",
4916a45b57SPeter Xu 		.mem_flag = MEM_SHMEM_PRIVATE,
5016a45b57SPeter Xu 		.mem_ops = &shmem_uffd_test_ops,
5116a45b57SPeter Xu 		.shared = false,
5216a45b57SPeter Xu 	},
5316a45b57SPeter Xu 	{
5416a45b57SPeter Xu 		.name = "hugetlb",
5516a45b57SPeter Xu 		.mem_flag = MEM_HUGETLB,
5616a45b57SPeter Xu 		.mem_ops = &hugetlb_uffd_test_ops,
5716a45b57SPeter Xu 		.shared = true,
5816a45b57SPeter Xu 	},
5916a45b57SPeter Xu 	{
6016a45b57SPeter Xu 		.name = "hugetlb-private",
6116a45b57SPeter Xu 		.mem_flag = MEM_HUGETLB_PRIVATE,
6216a45b57SPeter Xu 		.mem_ops = &hugetlb_uffd_test_ops,
6316a45b57SPeter Xu 		.shared = false,
6416a45b57SPeter Xu 	},
6516a45b57SPeter Xu };
6616a45b57SPeter Xu 
6743759d44SPeter Xu /* Arguments to be passed over to each uffd unit test */
6843759d44SPeter Xu struct uffd_test_args {
6943759d44SPeter Xu 	mem_type_t *mem_type;
7043759d44SPeter Xu };
7143759d44SPeter Xu typedef struct uffd_test_args uffd_test_args_t;
7243759d44SPeter Xu 
7316a45b57SPeter Xu /* Returns: UFFD_TEST_* */
7443759d44SPeter Xu typedef void (*uffd_test_fn)(uffd_test_args_t *);
7516a45b57SPeter Xu 
7616a45b57SPeter Xu typedef struct {
7716a45b57SPeter Xu 	const char *name;
7816a45b57SPeter Xu 	uffd_test_fn uffd_fn;
7916a45b57SPeter Xu 	unsigned int mem_targets;
8016a45b57SPeter Xu 	uint64_t uffd_feature_required;
8116a45b57SPeter Xu } uffd_test_case_t;
8216a45b57SPeter Xu 
/* Print a one-line summary of the kselftest pass/skip/fail/total counters */
static void uffd_test_report(void)
{
	printf("Userfaults unit tests: pass=%u, skip=%u, fail=%u (total=%u)\n",
	       ksft_get_pass_cnt(), ksft_get_xskip_cnt(),
	       ksft_get_fail_cnt(), ksft_test_num());
}
91d5433ce8SPeter Xu 
/* Finish the current "Testing ..." line with "done" and count one pass */
static void uffd_test_pass(void)
{
	puts("done");
	ksft_inc_pass_cnt();
}
97d5433ce8SPeter Xu 
/*
 * Announce a test: prints "Testing <printf-style description>... " with no
 * trailing newline and flushes stdout, so that the result can be appended
 * to the same line later.
 */
#define uffd_test_start(...)			\
	do {					\
		fputs("Testing ", stdout);	\
		printf(__VA_ARGS__);		\
		fputs("... ", stdout);		\
		fflush(stdout);			\
	} while (0)
104d5433ce8SPeter Xu 
/*
 * Report a failed test: prints "failed [reason: <printf-style message>]"
 * followed by a newline and counts one failure.
 */
#define uffd_test_fail(...)				\
	do {						\
		fputs("failed [reason: ", stdout);	\
		printf(__VA_ARGS__);			\
		puts("]");				\
		ksft_inc_fail_cnt();			\
	} while (0)
111d5433ce8SPeter Xu 
/*
 * Report a skipped test: prints "skipped [reason: <message>]" and counts
 * one skip.
 */
static void uffd_test_skip(const char *message)
{
	printf("skipped [reason: %s]\n",
	       message);
	ksft_inc_xskip_cnt();
}
117d5433ce8SPeter Xu 
118d5433ce8SPeter Xu /*
119d5433ce8SPeter Xu  * Returns 1 if specific userfaultfd supported, 0 otherwise.  Note, we'll
120d5433ce8SPeter Xu  * return 1 even if some test failed as long as uffd supported, because in
121d5433ce8SPeter Xu  * that case we still want to proceed with the rest uffd unit tests.
122d5433ce8SPeter Xu  */
test_uffd_api(bool use_dev)123d5433ce8SPeter Xu static int test_uffd_api(bool use_dev)
124d5433ce8SPeter Xu {
125d5433ce8SPeter Xu 	struct uffdio_api uffdio_api;
126d5433ce8SPeter Xu 	int uffd;
127d5433ce8SPeter Xu 
128d5433ce8SPeter Xu 	uffd_test_start("UFFDIO_API (with %s)",
129d5433ce8SPeter Xu 			use_dev ? "/dev/userfaultfd" : "syscall");
130d5433ce8SPeter Xu 
131d5433ce8SPeter Xu 	if (use_dev)
132d5433ce8SPeter Xu 		uffd = uffd_open_dev(UFFD_FLAGS);
133d5433ce8SPeter Xu 	else
134d5433ce8SPeter Xu 		uffd = uffd_open_sys(UFFD_FLAGS);
135d5433ce8SPeter Xu 	if (uffd < 0) {
136d5433ce8SPeter Xu 		uffd_test_skip("cannot open userfaultfd handle");
137d5433ce8SPeter Xu 		return 0;
138d5433ce8SPeter Xu 	}
139d5433ce8SPeter Xu 
140d5433ce8SPeter Xu 	/* Test wrong UFFD_API */
141d5433ce8SPeter Xu 	uffdio_api.api = 0xab;
142d5433ce8SPeter Xu 	uffdio_api.features = 0;
143d5433ce8SPeter Xu 	if (ioctl(uffd, UFFDIO_API, &uffdio_api) == 0) {
144d5433ce8SPeter Xu 		uffd_test_fail("UFFDIO_API should fail with wrong api but didn't");
145d5433ce8SPeter Xu 		goto out;
146d5433ce8SPeter Xu 	}
147d5433ce8SPeter Xu 
148d5433ce8SPeter Xu 	/* Test wrong feature bit */
149d5433ce8SPeter Xu 	uffdio_api.api = UFFD_API;
150d5433ce8SPeter Xu 	uffdio_api.features = BIT_ULL(63);
151d5433ce8SPeter Xu 	if (ioctl(uffd, UFFDIO_API, &uffdio_api) == 0) {
152d5433ce8SPeter Xu 		uffd_test_fail("UFFDIO_API should fail with wrong feature but didn't");
153d5433ce8SPeter Xu 		goto out;
154d5433ce8SPeter Xu 	}
155d5433ce8SPeter Xu 
156d5433ce8SPeter Xu 	/* Test normal UFFDIO_API */
157d5433ce8SPeter Xu 	uffdio_api.api = UFFD_API;
158d5433ce8SPeter Xu 	uffdio_api.features = 0;
159d5433ce8SPeter Xu 	if (ioctl(uffd, UFFDIO_API, &uffdio_api)) {
160d5433ce8SPeter Xu 		uffd_test_fail("UFFDIO_API should succeed but failed");
161d5433ce8SPeter Xu 		goto out;
162d5433ce8SPeter Xu 	}
163d5433ce8SPeter Xu 
164d5433ce8SPeter Xu 	/* Test double requests of UFFDIO_API with a random feature set */
165d5433ce8SPeter Xu 	uffdio_api.features = BIT_ULL(0);
166d5433ce8SPeter Xu 	if (ioctl(uffd, UFFDIO_API, &uffdio_api) == 0) {
167d5433ce8SPeter Xu 		uffd_test_fail("UFFDIO_API should reject initialized uffd");
168d5433ce8SPeter Xu 		goto out;
169d5433ce8SPeter Xu 	}
170d5433ce8SPeter Xu 
171d5433ce8SPeter Xu 	uffd_test_pass();
172d5433ce8SPeter Xu out:
173d5433ce8SPeter Xu 	close(uffd);
174d5433ce8SPeter Xu 	/* We have a valid uffd handle */
175d5433ce8SPeter Xu 	return 1;
176d5433ce8SPeter Xu }
177d5433ce8SPeter Xu 
17816a45b57SPeter Xu /*
17916a45b57SPeter Xu  * This function initializes the global variables.  TODO: remove global
18016a45b57SPeter Xu  * vars and then remove this.
18116a45b57SPeter Xu  */
18243759d44SPeter Xu static int
uffd_setup_environment(uffd_test_args_t * args,uffd_test_case_t * test,mem_type_t * mem_type,const char ** errmsg)18343759d44SPeter Xu uffd_setup_environment(uffd_test_args_t *args, uffd_test_case_t *test,
18443759d44SPeter Xu 		       mem_type_t *mem_type, const char **errmsg)
18516a45b57SPeter Xu {
18616a45b57SPeter Xu 	map_shared = mem_type->shared;
18716a45b57SPeter Xu 	uffd_test_ops = mem_type->mem_ops;
18816a45b57SPeter Xu 
18916a45b57SPeter Xu 	if (mem_type->mem_flag & (MEM_HUGETLB_PRIVATE | MEM_HUGETLB))
19016a45b57SPeter Xu 		page_size = default_huge_page_size();
19116a45b57SPeter Xu 	else
19216a45b57SPeter Xu 		page_size = psize();
19316a45b57SPeter Xu 
19416a45b57SPeter Xu 	nr_pages = UFFD_TEST_MEM_SIZE / page_size;
19516a45b57SPeter Xu 	/* TODO: remove this global var.. it's so ugly */
19616a45b57SPeter Xu 	nr_cpus = 1;
19716a45b57SPeter Xu 
19843759d44SPeter Xu 	/* Initialize test arguments */
19943759d44SPeter Xu 	args->mem_type = mem_type;
20043759d44SPeter Xu 
201f9da2426SPeter Xu 	return uffd_test_ctx_init(test->uffd_feature_required, errmsg);
20216a45b57SPeter Xu }
20316a45b57SPeter Xu 
/*
 * Returns true only when uffd_get_features() succeeds and every feature
 * bit required by the test is present in the reported feature set.
 */
static bool uffd_feature_supported(uffd_test_case_t *test)
{
	uint64_t available;
	uint64_t required;

	if (uffd_get_features(&available))
		return false;

	required = test->uffd_feature_required;

	/* Supported iff no required bit is absent from the available set */
	return !(required & ~available);
}
21416a45b57SPeter Xu 
/*
 * Open /proc/self/pagemap read-only and return the file descriptor.  A
 * failure to open is reported through err().
 */
static int pagemap_open(void)
{
	int pagemap_fd;

	pagemap_fd = open("/proc/self/pagemap", O_RDONLY);
	if (pagemap_fd < 0)
		err("open pagemap");

	return pagemap_fd;
}
2248bda424fSPeter Xu 
/*
 * Check that the PM_UFFD_WP bit of the pagemap entry @value matches the
 * expected state @wp, calling err() when it does not.
 *
 * This is a macro rather than a function so that __LINE__ works in err().
 * Both arguments are parenthesized so that arbitrary expressions can be
 * passed in; note that @value is evaluated a second time on the error
 * path, so it should be free of side effects.
 */
#define  pagemap_check_wp(value, wp) do {				\
		if (!!((value) & PM_UFFD_WP) != (wp))			\
			err("pagemap uffd-wp bit error: 0x%"PRIx64,	\
			    (value));					\
	} while (0)
2308bda424fSPeter Xu 
/* Data shared between pagemap_test_fork() and fork_event_consumer() */
typedef struct {
	/* uffd the consumer thread reads the fork event from */
	int parent_uffd;
	/* uffd carried by the fork event, filled in by the consumer thread */
	int child_uffd;
} fork_event_args;
234cff29458SPeter Xu 
fork_event_consumer(void * data)235cff29458SPeter Xu static void *fork_event_consumer(void *data)
2368bda424fSPeter Xu {
237cff29458SPeter Xu 	fork_event_args *args = data;
238cff29458SPeter Xu 	struct uffd_msg msg = { 0 };
239cff29458SPeter Xu 
240cff29458SPeter Xu 	/* Read until a full msg received */
241cff29458SPeter Xu 	while (uffd_read_msg(args->parent_uffd, &msg));
242cff29458SPeter Xu 
243cff29458SPeter Xu 	if (msg.event != UFFD_EVENT_FORK)
244cff29458SPeter Xu 		err("wrong message: %u\n", msg.event);
245cff29458SPeter Xu 
246cff29458SPeter Xu 	/* Just to be properly freed later */
247cff29458SPeter Xu 	args->child_uffd = msg.arg.fork.ufd;
248cff29458SPeter Xu 	return NULL;
249cff29458SPeter Xu }
250cff29458SPeter Xu 
/* State kept between a pin_pages() call and the matching unpin_pages() */
typedef struct {
	/* File descriptor of the opened gup_test debugfs file */
	int gup_fd;
	/* True while a pin taken by pin_pages() is outstanding */
	bool pinned;
} pin_args;
255760aee0bSPeter Xu 
256760aee0bSPeter Xu /*
257760aee0bSPeter Xu  * Returns 0 if succeed, <0 for errors.  pin_pages() needs to be paired
258760aee0bSPeter Xu  * with unpin_pages().  Currently it needs to be RO longterm pin to satisfy
259760aee0bSPeter Xu  * all needs of the test cases (e.g., trigger unshare, trigger fork() early
260760aee0bSPeter Xu  * CoW, etc.).
261760aee0bSPeter Xu  */
pin_pages(pin_args * args,void * buffer,size_t size)262760aee0bSPeter Xu static int pin_pages(pin_args *args, void *buffer, size_t size)
263760aee0bSPeter Xu {
264760aee0bSPeter Xu 	struct pin_longterm_test test = {
265760aee0bSPeter Xu 		.addr = (uintptr_t)buffer,
266760aee0bSPeter Xu 		.size = size,
267760aee0bSPeter Xu 		/* Read-only pins */
268760aee0bSPeter Xu 		.flags = 0,
269760aee0bSPeter Xu 	};
270760aee0bSPeter Xu 
271760aee0bSPeter Xu 	if (args->pinned)
272760aee0bSPeter Xu 		err("already pinned");
273760aee0bSPeter Xu 
274760aee0bSPeter Xu 	args->gup_fd = open("/sys/kernel/debug/gup_test", O_RDWR);
275760aee0bSPeter Xu 	if (args->gup_fd < 0)
276760aee0bSPeter Xu 		return -errno;
277760aee0bSPeter Xu 
278760aee0bSPeter Xu 	if (ioctl(args->gup_fd, PIN_LONGTERM_TEST_START, &test)) {
279760aee0bSPeter Xu 		/* Even if gup_test existed, can be an old gup_test / kernel */
280760aee0bSPeter Xu 		close(args->gup_fd);
281760aee0bSPeter Xu 		return -errno;
282760aee0bSPeter Xu 	}
283760aee0bSPeter Xu 	args->pinned = true;
284760aee0bSPeter Xu 	return 0;
285760aee0bSPeter Xu }
286760aee0bSPeter Xu 
/*
 * Undo a previous pin_pages(): stop the longterm pin test, close the
 * gup_test file descriptor and mark @args as no longer pinned.  Calling
 * it without an outstanding pin, or a failing stop ioctl, is reported
 * through err().
 */
static void unpin_pages(pin_args *args)
{
	int gup_fd = args->gup_fd;

	if (!args->pinned)
		err("unpin without pin first");

	if (ioctl(gup_fd, PIN_LONGTERM_TEST_STOP) != 0)
		err("PIN_LONGTERM_TEST_STOP");

	close(gup_fd);
	args->pinned = false;
}
296760aee0bSPeter Xu 
pagemap_test_fork(int uffd,bool with_event,bool test_pin)297760aee0bSPeter Xu static int pagemap_test_fork(int uffd, bool with_event, bool test_pin)
298cff29458SPeter Xu {
299cff29458SPeter Xu 	fork_event_args args = { .parent_uffd = uffd, .child_uffd = -1 };
300cff29458SPeter Xu 	pthread_t thread;
301cff29458SPeter Xu 	pid_t child;
3028bda424fSPeter Xu 	uint64_t value;
3038bda424fSPeter Xu 	int fd, result;
3048bda424fSPeter Xu 
305cff29458SPeter Xu 	/* Prepare a thread to resolve EVENT_FORK */
306cff29458SPeter Xu 	if (with_event) {
307cff29458SPeter Xu 		if (pthread_create(&thread, NULL, fork_event_consumer, &args))
308cff29458SPeter Xu 			err("pthread_create()");
309cff29458SPeter Xu 	}
310cff29458SPeter Xu 
311cff29458SPeter Xu 	child = fork();
3128bda424fSPeter Xu 	if (!child) {
3138bda424fSPeter Xu 		/* Open the pagemap fd of the child itself */
314760aee0bSPeter Xu 		pin_args args = {};
315760aee0bSPeter Xu 
3168bda424fSPeter Xu 		fd = pagemap_open();
317760aee0bSPeter Xu 
318760aee0bSPeter Xu 		if (test_pin && pin_pages(&args, area_dst, page_size))
319760aee0bSPeter Xu 			/*
320760aee0bSPeter Xu 			 * Normally when reach here we have pinned in
321760aee0bSPeter Xu 			 * previous tests, so shouldn't fail anymore
322760aee0bSPeter Xu 			 */
323760aee0bSPeter Xu 			err("pin page failed in child");
324760aee0bSPeter Xu 
3258bda424fSPeter Xu 		value = pagemap_get_entry(fd, area_dst);
3268bda424fSPeter Xu 		/*
327cff29458SPeter Xu 		 * After fork(), we should handle uffd-wp bit differently:
328cff29458SPeter Xu 		 *
329cff29458SPeter Xu 		 * (1) when with EVENT_FORK, it should persist
330cff29458SPeter Xu 		 * (2) when without EVENT_FORK, it should be dropped
3318bda424fSPeter Xu 		 */
332cff29458SPeter Xu 		pagemap_check_wp(value, with_event);
333760aee0bSPeter Xu 		if (test_pin)
334760aee0bSPeter Xu 			unpin_pages(&args);
3358bda424fSPeter Xu 		/* Succeed */
3368bda424fSPeter Xu 		exit(0);
3378bda424fSPeter Xu 	}
3388bda424fSPeter Xu 	waitpid(child, &result, 0);
339cff29458SPeter Xu 
340cff29458SPeter Xu 	if (with_event) {
341cff29458SPeter Xu 		if (pthread_join(thread, NULL))
342cff29458SPeter Xu 			err("pthread_join()");
343cff29458SPeter Xu 		if (args.child_uffd < 0)
344cff29458SPeter Xu 			err("Didn't receive child uffd");
345cff29458SPeter Xu 		close(args.child_uffd);
346cff29458SPeter Xu 	}
347cff29458SPeter Xu 
3488bda424fSPeter Xu 	return result;
3498bda424fSPeter Xu }
3508bda424fSPeter Xu 
/*
 * Exercise uffd-wp on the first, not yet populated, page of area_dst and
 * verify the uffd-wp bit reported by pagemap after each step: protect,
 * unprotect, zap with MADV_DONTNEED, fault in by writing, and finally a
 * read fault on a protected page.  @args is not used.
 */
static void uffd_wp_unpopulated_test(uffd_test_args_t *args)
{
	uint64_t value;
	int pagemap_fd;

	if (uffd_register(uffd, area_dst, nr_pages * page_size,
			  false, true, false))
		err("register failed");

	pagemap_fd = pagemap_open();

	/* Test applying pte marker to anon unpopulated */
	wp_range(uffd, (uint64_t)area_dst, page_size, true);
	value = pagemap_get_entry(pagemap_fd, area_dst);
	pagemap_check_wp(value, true);

	/* Test unprotect on anon pte marker */
	wp_range(uffd, (uint64_t)area_dst, page_size, false);
	value = pagemap_get_entry(pagemap_fd, area_dst);
	pagemap_check_wp(value, false);

	/* Test zap on anon marker */
	wp_range(uffd, (uint64_t)area_dst, page_size, true);
	if (madvise(area_dst, page_size, MADV_DONTNEED))
		err("madvise(MADV_DONTNEED) failed");
	value = pagemap_get_entry(pagemap_fd, area_dst);
	pagemap_check_wp(value, false);

	/* Test fault in after marker removed */
	*area_dst = 1;
	value = pagemap_get_entry(pagemap_fd, area_dst);
	pagemap_check_wp(value, false);
	/* Drop it to make pte none again */
	if (madvise(area_dst, page_size, MADV_DONTNEED))
		err("madvise(MADV_DONTNEED) failed");

	/* Test read-zero-page upon pte marker */
	wp_range(uffd, (uint64_t)area_dst, page_size, true);
	*(volatile char *)area_dst;
	/* Drop it to make pte none again */
	if (madvise(area_dst, page_size, MADV_DONTNEED))
		err("madvise(MADV_DONTNEED) failed");

	/* Don't leak one pagemap fd per run of this test */
	close(pagemap_fd);

	uffd_test_pass();
}
3968bda424fSPeter Xu 
/*
 * Check how the uffd-wp bit of the first page of area_dst is carried over
 * fork(), first with the pte present and then after the pte was zapped,
 * and finally check unprotecting and faulting the page back in.
 *
 * @args:       supplies the memory type, which selects how the pte is zapped
 * @with_event: passed through to pagemap_test_fork()
 */
static void uffd_wp_fork_test_common(uffd_test_args_t *args,
				     bool with_event)
{
	/* Only used by the failure messages below */
	const char *bad_bit = with_event ? "missing" : "stall";
	uint64_t entry;
	int pm_fd;

	if (uffd_register(uffd, area_dst, nr_pages * page_size,
			  false, true, false))
		err("register failed");

	pm_fd = pagemap_open();

	/* Populate the page, then write-protect it */
	*area_dst = 1;
	wp_range(uffd, (uint64_t)area_dst, page_size, true);
	entry = pagemap_get_entry(pm_fd, area_dst);
	pagemap_check_wp(entry, true);

	if (pagemap_test_fork(uffd, with_event, false)) {
		uffd_test_fail("Detected %s uffd-wp bit in child in present pte",
			       bad_bit);
		goto out;
	}

	/*
	 * Try to zap the pgtable so that the markers get tested.
	 *
	 * Shared mappings: PAGEOUT may not work, so DONTNEED is used; it
	 * zaps (rather than frees) the page, which equally exposes the pte
	 * markers.
	 *
	 * Private mappings: PAGEOUT only works on exclusive ptes
	 * (PM_MMAP_EXCLUSIVE), which should be the case here.  The return
	 * value is ignored on purpose because private-hugetlb doesn't yet
	 * support swapping, so the call could fail.
	 */
	if (!args->mem_type->shared) {
		madvise(area_dst, page_size, MADV_PAGEOUT);
	} else if (madvise(area_dst, page_size, MADV_DONTNEED)) {
		err("MADV_DONTNEED");
	}

	/* The uffd-wp bit has to survive the page being swapped out */
	entry = pagemap_get_entry(pm_fd, area_dst);
	pagemap_check_wp(entry, true);

	if (pagemap_test_fork(uffd, with_event, false)) {
		uffd_test_fail("Detected %s uffd-wp bit in child in zapped pte",
			       bad_bit);
		goto out;
	}

	/* Unprotecting here exercises the swap pte modification path */
	wp_range(uffd, (uint64_t)area_dst, page_size, false);
	entry = pagemap_get_entry(pm_fd, area_dst);
	pagemap_check_wp(entry, false);

	/* Bring the page back in from disk */
	*area_dst = 2;
	entry = pagemap_get_entry(pm_fd, area_dst);
	pagemap_check_wp(entry, false);

	uffd_test_pass();
out:
	if (uffd_unregister(uffd, area_dst, nr_pages * page_size))
		err("unregister failed");
	close(pm_fd);
}
466cff29458SPeter Xu 
/* The uffd-wp fork test, run without fork event handling */
static void uffd_wp_fork_test(uffd_test_args_t *args)
{
	const bool with_event = false;

	uffd_wp_fork_test_common(args, with_event);
}
471cff29458SPeter Xu 
/* The uffd-wp fork test, run with fork event handling */
static void uffd_wp_fork_with_event_test(uffd_test_args_t *args)
{
	const bool with_event = true;

	uffd_wp_fork_test_common(args, with_event);
}
4768bda424fSPeter Xu 
/*
 * Check the uffd-wp bit seen by a forked child when longterm pins are
 * involved, in two scenarios: the parent pins the page before fork(), and
 * the child pins the page after fork().
 *
 * The test is reported as skipped when the page cannot be pinned.  @args
 * is not used; @with_event is passed through to pagemap_test_fork().
 */
static void uffd_wp_fork_pin_test_common(uffd_test_args_t *args,
					 bool with_event)
{
	int pagemap_fd, fork_ret;
	/* Not named "pin_args", which would shadow the type of that name */
	pin_args pin = { 0 };

	if (uffd_register(uffd, area_dst, page_size, false, true, false))
		err("register failed");

	pagemap_fd = pagemap_open();

	/* Touch the page */
	*area_dst = 1;
	wp_range(uffd, (uint64_t)area_dst, page_size, true);

	/*
	 * 1. First pin, then fork().  This tests fork() special path when
	 * doing early CoW if the page is private.
	 */
	if (pin_pages(&pin, area_dst, page_size)) {
		uffd_test_skip("Possibly CONFIG_GUP_TEST missing "
			       "or unprivileged");
		close(pagemap_fd);
		/* Best effort only, the test is being skipped anyway */
		uffd_unregister(uffd, area_dst, page_size);
		return;
	}

	/* The pin is dropped whatever the outcome of the fork test was */
	fork_ret = pagemap_test_fork(uffd, with_event, false);
	unpin_pages(&pin);
	if (fork_ret) {
		uffd_test_fail("Detected %s uffd-wp bit in early CoW of fork()",
			       with_event ? "missing" : "stall");
		goto out;
	}

	/*
	 * 2. First fork(), then pin (in the child, where test_pin==true).
	 * This tests COR, aka, page unsharing on private memories.
	 */
	if (pagemap_test_fork(uffd, with_event, true)) {
		uffd_test_fail("Detected %s uffd-wp bit when RO pin",
			       with_event ? "missing" : "stall");
		goto out;
	}
	uffd_test_pass();
out:
	if (uffd_unregister(uffd, area_dst, page_size))
		err("unregister failed");
	close(pagemap_fd);
}
528760aee0bSPeter Xu 
/* The uffd-wp fork + pin test, run without fork event handling */
static void uffd_wp_fork_pin_test(uffd_test_args_t *args)
{
	const bool with_event = false;

	uffd_wp_fork_pin_test_common(args, with_event);
}
533760aee0bSPeter Xu 
/* The uffd-wp fork + pin test, run with fork event handling */
static void uffd_wp_fork_pin_with_event_test(uffd_test_args_t *args)
{
	const bool with_event = true;

	uffd_wp_fork_pin_test_common(args, with_event);
}
538760aee0bSPeter Xu 
check_memory_contents(char * p)53962515b5fSPeter Xu static void check_memory_contents(char *p)
54062515b5fSPeter Xu {
54162515b5fSPeter Xu 	unsigned long i, j;
54262515b5fSPeter Xu 	uint8_t expected_byte;
54362515b5fSPeter Xu 
54462515b5fSPeter Xu 	for (i = 0; i < nr_pages; ++i) {
54562515b5fSPeter Xu 		expected_byte = ~((uint8_t)(i % ((uint8_t)-1)));
54662515b5fSPeter Xu 		for (j = 0; j < page_size; j++) {
54762515b5fSPeter Xu 			uint8_t v = *(uint8_t *)(p + (i * page_size) + j);
54862515b5fSPeter Xu 			if (v != expected_byte)
54962515b5fSPeter Xu 				err("unexpected page contents");
55062515b5fSPeter Xu 		}
55162515b5fSPeter Xu 	}
55262515b5fSPeter Xu }
55362515b5fSPeter Xu 
uffd_minor_test_common(bool test_collapse,bool test_wp)55462515b5fSPeter Xu static void uffd_minor_test_common(bool test_collapse, bool test_wp)
55562515b5fSPeter Xu {
55662515b5fSPeter Xu 	unsigned long p;
55762515b5fSPeter Xu 	pthread_t uffd_mon;
55862515b5fSPeter Xu 	char c;
55962515b5fSPeter Xu 	struct uffd_args args = { 0 };
56062515b5fSPeter Xu 
56162515b5fSPeter Xu 	/*
56262515b5fSPeter Xu 	 * NOTE: MADV_COLLAPSE is not yet compatible with WP, so testing
56362515b5fSPeter Xu 	 * both do not make much sense.
56462515b5fSPeter Xu 	 */
56562515b5fSPeter Xu 	assert(!(test_collapse && test_wp));
56662515b5fSPeter Xu 
56762515b5fSPeter Xu 	if (uffd_register(uffd, area_dst_alias, nr_pages * page_size,
56862515b5fSPeter Xu 			  /* NOTE! MADV_COLLAPSE may not work with uffd-wp */
56962515b5fSPeter Xu 			  false, test_wp, true))
57062515b5fSPeter Xu 		err("register failure");
57162515b5fSPeter Xu 
57262515b5fSPeter Xu 	/*
57362515b5fSPeter Xu 	 * After registering with UFFD, populate the non-UFFD-registered side of
57462515b5fSPeter Xu 	 * the shared mapping. This should *not* trigger any UFFD minor faults.
57562515b5fSPeter Xu 	 */
57662515b5fSPeter Xu 	for (p = 0; p < nr_pages; ++p)
57762515b5fSPeter Xu 		memset(area_dst + (p * page_size), p % ((uint8_t)-1),
57862515b5fSPeter Xu 		       page_size);
57962515b5fSPeter Xu 
58062515b5fSPeter Xu 	args.apply_wp = test_wp;
58162515b5fSPeter Xu 	if (pthread_create(&uffd_mon, NULL, uffd_poll_thread, &args))
58262515b5fSPeter Xu 		err("uffd_poll_thread create");
58362515b5fSPeter Xu 
58462515b5fSPeter Xu 	/*
58562515b5fSPeter Xu 	 * Read each of the pages back using the UFFD-registered mapping. We
58662515b5fSPeter Xu 	 * expect that the first time we touch a page, it will result in a minor
58762515b5fSPeter Xu 	 * fault. uffd_poll_thread will resolve the fault by bit-flipping the
58862515b5fSPeter Xu 	 * page's contents, and then issuing a CONTINUE ioctl.
58962515b5fSPeter Xu 	 */
59062515b5fSPeter Xu 	check_memory_contents(area_dst_alias);
59162515b5fSPeter Xu 
59262515b5fSPeter Xu 	if (write(pipefd[1], &c, sizeof(c)) != sizeof(c))
59362515b5fSPeter Xu 		err("pipe write");
59462515b5fSPeter Xu 	if (pthread_join(uffd_mon, NULL))
59562515b5fSPeter Xu 		err("join() failed");
59662515b5fSPeter Xu 
59762515b5fSPeter Xu 	if (test_collapse) {
59862515b5fSPeter Xu 		if (madvise(area_dst_alias, nr_pages * page_size,
59962515b5fSPeter Xu 			    MADV_COLLAPSE)) {
60062515b5fSPeter Xu 			/* It's fine to fail for this one... */
60162515b5fSPeter Xu 			uffd_test_skip("MADV_COLLAPSE failed");
60262515b5fSPeter Xu 			return;
60362515b5fSPeter Xu 		}
60462515b5fSPeter Xu 
60562515b5fSPeter Xu 		uffd_test_ops->check_pmd_mapping(area_dst,
60662515b5fSPeter Xu 						 nr_pages * page_size /
60762515b5fSPeter Xu 						 read_pmd_pagesize());
60862515b5fSPeter Xu 		/*
60962515b5fSPeter Xu 		 * This won't cause uffd-fault - it purely just makes sure there
61062515b5fSPeter Xu 		 * was no corruption.
61162515b5fSPeter Xu 		 */
61262515b5fSPeter Xu 		check_memory_contents(area_dst_alias);
61362515b5fSPeter Xu 	}
61462515b5fSPeter Xu 
61562515b5fSPeter Xu 	if (args.missing_faults != 0 || args.minor_faults != nr_pages)
61662515b5fSPeter Xu 		uffd_test_fail("stats check error");
61762515b5fSPeter Xu 	else
61862515b5fSPeter Xu 		uffd_test_pass();
61962515b5fSPeter Xu }
62062515b5fSPeter Xu 
/* Minor fault test: no collapse, no write-protect.  @args is not used. */
void uffd_minor_test(uffd_test_args_t *args)
{
	const bool test_collapse = false, test_wp = false;

	uffd_minor_test_common(test_collapse, test_wp);
}
62562515b5fSPeter Xu 
/* Minor fault test combined with write-protect.  @args is not used. */
void uffd_minor_wp_test(uffd_test_args_t *args)
{
	const bool test_collapse = false, test_wp = true;

	uffd_minor_test_common(test_collapse, test_wp);
}
63062515b5fSPeter Xu 
/* Minor fault test followed by MADV_COLLAPSE.  @args is not used. */
void uffd_minor_collapse_test(uffd_test_args_t *args)
{
	const bool test_collapse = true, test_wp = false;

	uffd_minor_test_common(test_collapse, test_wp);
}
63562515b5fSPeter Xu 
/* Jump buffer storage, and the pointer the signal handler jumps through */
static sigjmp_buf jbuf, *sigbuf;

/*
 * Signal handler.  On SIGBUS it jumps back to the sigsetjmp() point stored
 * in *sigbuf with value 1, or aborts when no jump buffer has been set up.
 * Any other signal is ignored.  @siginfo and @ptr are not used.
 */
static void sighndl(int sig, siginfo_t *siginfo, void *ptr)
{
	if (sig != SIGBUS)
		return;

	if (sigbuf)
		siglongjmp(*sigbuf, 1);

	abort();
}
64673c1ea93SPeter Xu 
64773c1ea93SPeter Xu /*
64873c1ea93SPeter Xu  * For non-cooperative userfaultfd test we fork() a process that will
64973c1ea93SPeter Xu  * generate pagefaults, will mremap the area monitored by the
65073c1ea93SPeter Xu  * userfaultfd and at last this process will release the monitored
65173c1ea93SPeter Xu  * area.
65273c1ea93SPeter Xu  * For the anonymous and shared memory the area is divided into two
65373c1ea93SPeter Xu  * parts, the first part is accessed before mremap, and the second
65473c1ea93SPeter Xu  * part is accessed after mremap. Since hugetlbfs does not support
65573c1ea93SPeter Xu  * mremap, the entire monitored area is accessed in a single pass for
65673c1ea93SPeter Xu  * HUGETLB_TEST.
65773c1ea93SPeter Xu  * The release of the pages currently generates event for shmem and
65873c1ea93SPeter Xu  * anonymous memory (UFFD_EVENT_REMOVE), hence it is not checked
65973c1ea93SPeter Xu  * for hugetlb.
66073c1ea93SPeter Xu  * For signal test(UFFD_FEATURE_SIGBUS), signal_test = 1, we register
66173c1ea93SPeter Xu  * monitored area, generate pagefaults and test that signal is delivered.
66273c1ea93SPeter Xu  * Use UFFDIO_COPY to allocate missing page and retry. For signal_test = 2
66373c1ea93SPeter Xu  * test robustness use case - we release monitored area, fork a process
66473c1ea93SPeter Xu  * that will generate pagefaults and verify signal is generated.
66573c1ea93SPeter Xu  * This also tests UFFD_FEATURE_EVENT_FORK event along with the signal
66673c1ea93SPeter Xu  * feature. Using monitor thread, verify no userfault events are generated.
66773c1ea93SPeter Xu  */
faulting_process(int signal_test,bool wp)66873c1ea93SPeter Xu static int faulting_process(int signal_test, bool wp)
66973c1ea93SPeter Xu {
67073c1ea93SPeter Xu 	unsigned long nr, i;
67173c1ea93SPeter Xu 	unsigned long long count;
67273c1ea93SPeter Xu 	unsigned long split_nr_pages;
67373c1ea93SPeter Xu 	unsigned long lastnr;
67473c1ea93SPeter Xu 	struct sigaction act;
67573c1ea93SPeter Xu 	volatile unsigned long signalled = 0;
67673c1ea93SPeter Xu 
67773c1ea93SPeter Xu 	split_nr_pages = (nr_pages + 1) / 2;
67873c1ea93SPeter Xu 
67973c1ea93SPeter Xu 	if (signal_test) {
68073c1ea93SPeter Xu 		sigbuf = &jbuf;
68173c1ea93SPeter Xu 		memset(&act, 0, sizeof(act));
68273c1ea93SPeter Xu 		act.sa_sigaction = sighndl;
68373c1ea93SPeter Xu 		act.sa_flags = SA_SIGINFO;
68473c1ea93SPeter Xu 		if (sigaction(SIGBUS, &act, 0))
68573c1ea93SPeter Xu 			err("sigaction");
68673c1ea93SPeter Xu 		lastnr = (unsigned long)-1;
68773c1ea93SPeter Xu 	}
68873c1ea93SPeter Xu 
68973c1ea93SPeter Xu 	for (nr = 0; nr < split_nr_pages; nr++) {
69073c1ea93SPeter Xu 		volatile int steps = 1;
69173c1ea93SPeter Xu 		unsigned long offset = nr * page_size;
69273c1ea93SPeter Xu 
69373c1ea93SPeter Xu 		if (signal_test) {
69473c1ea93SPeter Xu 			if (sigsetjmp(*sigbuf, 1) != 0) {
69573c1ea93SPeter Xu 				if (steps == 1 && nr == lastnr)
69673c1ea93SPeter Xu 					err("Signal repeated");
69773c1ea93SPeter Xu 
69873c1ea93SPeter Xu 				lastnr = nr;
69973c1ea93SPeter Xu 				if (signal_test == 1) {
70073c1ea93SPeter Xu 					if (steps == 1) {
70173c1ea93SPeter Xu 						/* This is a MISSING request */
70273c1ea93SPeter Xu 						steps++;
70373c1ea93SPeter Xu 						if (copy_page(uffd, offset, wp))
70473c1ea93SPeter Xu 							signalled++;
70573c1ea93SPeter Xu 					} else {
70673c1ea93SPeter Xu 						/* This is a WP request */
70773c1ea93SPeter Xu 						assert(steps == 2);
70873c1ea93SPeter Xu 						wp_range(uffd,
70973c1ea93SPeter Xu 							 (__u64)area_dst +
71073c1ea93SPeter Xu 							 offset,
71173c1ea93SPeter Xu 							 page_size, false);
71273c1ea93SPeter Xu 					}
71373c1ea93SPeter Xu 				} else {
71473c1ea93SPeter Xu 					signalled++;
71573c1ea93SPeter Xu 					continue;
71673c1ea93SPeter Xu 				}
71773c1ea93SPeter Xu 			}
71873c1ea93SPeter Xu 		}
71973c1ea93SPeter Xu 
72073c1ea93SPeter Xu 		count = *area_count(area_dst, nr);
72173c1ea93SPeter Xu 		if (count != count_verify[nr])
72273c1ea93SPeter Xu 			err("nr %lu memory corruption %llu %llu\n",
72373c1ea93SPeter Xu 			    nr, count, count_verify[nr]);
72473c1ea93SPeter Xu 		/*
72573c1ea93SPeter Xu 		 * Trigger write protection if there is by writing
72673c1ea93SPeter Xu 		 * the same value back.
72773c1ea93SPeter Xu 		 */
72873c1ea93SPeter Xu 		*area_count(area_dst, nr) = count;
72973c1ea93SPeter Xu 	}
73073c1ea93SPeter Xu 
73173c1ea93SPeter Xu 	if (signal_test)
73273c1ea93SPeter Xu 		return signalled != split_nr_pages;
73373c1ea93SPeter Xu 
73473c1ea93SPeter Xu 	area_dst = mremap(area_dst, nr_pages * page_size,  nr_pages * page_size,
73573c1ea93SPeter Xu 			  MREMAP_MAYMOVE | MREMAP_FIXED, area_src);
73673c1ea93SPeter Xu 	if (area_dst == MAP_FAILED)
73773c1ea93SPeter Xu 		err("mremap");
73873c1ea93SPeter Xu 	/* Reset area_src since we just clobbered it */
73973c1ea93SPeter Xu 	area_src = NULL;
74073c1ea93SPeter Xu 
74173c1ea93SPeter Xu 	for (; nr < nr_pages; nr++) {
74273c1ea93SPeter Xu 		count = *area_count(area_dst, nr);
74373c1ea93SPeter Xu 		if (count != count_verify[nr]) {
74473c1ea93SPeter Xu 			err("nr %lu memory corruption %llu %llu\n",
74573c1ea93SPeter Xu 			    nr, count, count_verify[nr]);
74673c1ea93SPeter Xu 		}
74773c1ea93SPeter Xu 		/*
74873c1ea93SPeter Xu 		 * Trigger write protection if there is by writing
74973c1ea93SPeter Xu 		 * the same value back.
75073c1ea93SPeter Xu 		 */
75173c1ea93SPeter Xu 		*area_count(area_dst, nr) = count;
75273c1ea93SPeter Xu 	}
75373c1ea93SPeter Xu 
75473c1ea93SPeter Xu 	uffd_test_ops->release_pages(area_dst);
75573c1ea93SPeter Xu 
75673c1ea93SPeter Xu 	for (nr = 0; nr < nr_pages; nr++)
75773c1ea93SPeter Xu 		for (i = 0; i < page_size; i++)
75873c1ea93SPeter Xu 			if (*(area_dst + nr * page_size + i) != 0)
75973c1ea93SPeter Xu 				err("page %lu offset %lu is not zero", nr, i);
76073c1ea93SPeter Xu 
76173c1ea93SPeter Xu 	return 0;
76273c1ea93SPeter Xu }
76373c1ea93SPeter Xu 
uffd_sigbus_test_common(bool wp)76473c1ea93SPeter Xu static void uffd_sigbus_test_common(bool wp)
76573c1ea93SPeter Xu {
76673c1ea93SPeter Xu 	unsigned long userfaults;
76773c1ea93SPeter Xu 	pthread_t uffd_mon;
76873c1ea93SPeter Xu 	pid_t pid;
76973c1ea93SPeter Xu 	int err;
77073c1ea93SPeter Xu 	char c;
77173c1ea93SPeter Xu 	struct uffd_args args = { 0 };
77273c1ea93SPeter Xu 
77307cf57ebSEdward Liaw 	ready_for_fork = false;
77407cf57ebSEdward Liaw 
77573c1ea93SPeter Xu 	fcntl(uffd, F_SETFL, uffd_flags | O_NONBLOCK);
77673c1ea93SPeter Xu 
77773c1ea93SPeter Xu 	if (uffd_register(uffd, area_dst, nr_pages * page_size,
77873c1ea93SPeter Xu 			  true, wp, false))
77973c1ea93SPeter Xu 		err("register failure");
78073c1ea93SPeter Xu 
78173c1ea93SPeter Xu 	if (faulting_process(1, wp))
78273c1ea93SPeter Xu 		err("faulting process failed");
78373c1ea93SPeter Xu 
78473c1ea93SPeter Xu 	uffd_test_ops->release_pages(area_dst);
78573c1ea93SPeter Xu 
78673c1ea93SPeter Xu 	args.apply_wp = wp;
78773c1ea93SPeter Xu 	if (pthread_create(&uffd_mon, NULL, uffd_poll_thread, &args))
78873c1ea93SPeter Xu 		err("uffd_poll_thread create");
78973c1ea93SPeter Xu 
79007cf57ebSEdward Liaw 	while (!ready_for_fork)
79107cf57ebSEdward Liaw 		; /* Wait for the poll_thread to start executing before forking */
79207cf57ebSEdward Liaw 
79373c1ea93SPeter Xu 	pid = fork();
79473c1ea93SPeter Xu 	if (pid < 0)
79573c1ea93SPeter Xu 		err("fork");
79673c1ea93SPeter Xu 
79773c1ea93SPeter Xu 	if (!pid)
79873c1ea93SPeter Xu 		exit(faulting_process(2, wp));
79973c1ea93SPeter Xu 
80073c1ea93SPeter Xu 	waitpid(pid, &err, 0);
80173c1ea93SPeter Xu 	if (err)
80273c1ea93SPeter Xu 		err("faulting process failed");
80373c1ea93SPeter Xu 	if (write(pipefd[1], &c, sizeof(c)) != sizeof(c))
80473c1ea93SPeter Xu 		err("pipe write");
80573c1ea93SPeter Xu 	if (pthread_join(uffd_mon, (void **)&userfaults))
80673c1ea93SPeter Xu 		err("pthread_join()");
80773c1ea93SPeter Xu 
80873c1ea93SPeter Xu 	if (userfaults)
80973c1ea93SPeter Xu 		uffd_test_fail("Signal test failed, userfaults: %ld", userfaults);
81073c1ea93SPeter Xu 	else
81173c1ea93SPeter Xu 		uffd_test_pass();
81273c1ea93SPeter Xu }
81373c1ea93SPeter Xu 
/* "sigbus" test: the SIGBUS test without write-protection.  @args is unused. */
static void uffd_sigbus_test(uffd_test_args_t *args)
{
	(void)args;

	uffd_sigbus_test_common(false);
}
81873c1ea93SPeter Xu 
/* "sigbus-wp" test: the SIGBUS test with write-protection.  @args is unused. */
static void uffd_sigbus_wp_test(uffd_test_args_t *args)
{
	(void)args;

	uffd_sigbus_test_common(true);
}
82373c1ea93SPeter Xu 
uffd_events_test_common(bool wp)82473c1ea93SPeter Xu static void uffd_events_test_common(bool wp)
82573c1ea93SPeter Xu {
82673c1ea93SPeter Xu 	pthread_t uffd_mon;
82773c1ea93SPeter Xu 	pid_t pid;
82873c1ea93SPeter Xu 	int err;
82973c1ea93SPeter Xu 	char c;
83073c1ea93SPeter Xu 	struct uffd_args args = { 0 };
83173c1ea93SPeter Xu 
83207cf57ebSEdward Liaw 	ready_for_fork = false;
83307cf57ebSEdward Liaw 
83473c1ea93SPeter Xu 	fcntl(uffd, F_SETFL, uffd_flags | O_NONBLOCK);
83573c1ea93SPeter Xu 	if (uffd_register(uffd, area_dst, nr_pages * page_size,
83673c1ea93SPeter Xu 			  true, wp, false))
83773c1ea93SPeter Xu 		err("register failure");
83873c1ea93SPeter Xu 
83973c1ea93SPeter Xu 	args.apply_wp = wp;
84073c1ea93SPeter Xu 	if (pthread_create(&uffd_mon, NULL, uffd_poll_thread, &args))
84173c1ea93SPeter Xu 		err("uffd_poll_thread create");
84273c1ea93SPeter Xu 
84307cf57ebSEdward Liaw 	while (!ready_for_fork)
84407cf57ebSEdward Liaw 		; /* Wait for the poll_thread to start executing before forking */
84507cf57ebSEdward Liaw 
84673c1ea93SPeter Xu 	pid = fork();
84773c1ea93SPeter Xu 	if (pid < 0)
84873c1ea93SPeter Xu 		err("fork");
84973c1ea93SPeter Xu 
85073c1ea93SPeter Xu 	if (!pid)
85173c1ea93SPeter Xu 		exit(faulting_process(0, wp));
85273c1ea93SPeter Xu 
85373c1ea93SPeter Xu 	waitpid(pid, &err, 0);
85473c1ea93SPeter Xu 	if (err)
85573c1ea93SPeter Xu 		err("faulting process failed");
85673c1ea93SPeter Xu 	if (write(pipefd[1], &c, sizeof(c)) != sizeof(c))
85773c1ea93SPeter Xu 		err("pipe write");
85873c1ea93SPeter Xu 	if (pthread_join(uffd_mon, NULL))
85973c1ea93SPeter Xu 		err("pthread_join()");
86073c1ea93SPeter Xu 
86173c1ea93SPeter Xu 	if (args.missing_faults != nr_pages)
86273c1ea93SPeter Xu 		uffd_test_fail("Fault counts wrong");
86373c1ea93SPeter Xu 	else
86473c1ea93SPeter Xu 		uffd_test_pass();
86573c1ea93SPeter Xu }
86673c1ea93SPeter Xu 
/* "events" test: the events test without write-protection.  @args is unused. */
static void uffd_events_test(uffd_test_args_t *args)
{
	(void)args;

	uffd_events_test_common(false);
}
87173c1ea93SPeter Xu 
/* "events-wp" test: the events test with write-protection.  @args is unused. */
static void uffd_events_wp_test(uffd_test_args_t *args)
{
	(void)args;

	uffd_events_test_common(true);
}
87673c1ea93SPeter Xu 
retry_uffdio_zeropage(int ufd,struct uffdio_zeropage * uffdio_zeropage)877c3315502SPeter Xu static void retry_uffdio_zeropage(int ufd,
878c3315502SPeter Xu 				  struct uffdio_zeropage *uffdio_zeropage)
879c3315502SPeter Xu {
880c3315502SPeter Xu 	uffd_test_ops->alias_mapping(&uffdio_zeropage->range.start,
881c3315502SPeter Xu 				     uffdio_zeropage->range.len,
882c3315502SPeter Xu 				     0);
883c3315502SPeter Xu 	if (ioctl(ufd, UFFDIO_ZEROPAGE, uffdio_zeropage)) {
884c3315502SPeter Xu 		if (uffdio_zeropage->zeropage != -EEXIST)
885c3315502SPeter Xu 			err("UFFDIO_ZEROPAGE error: %"PRId64,
886c3315502SPeter Xu 			    (int64_t)uffdio_zeropage->zeropage);
887c3315502SPeter Xu 	} else {
888c3315502SPeter Xu 		err("UFFDIO_ZEROPAGE error: %"PRId64,
889c3315502SPeter Xu 		    (int64_t)uffdio_zeropage->zeropage);
890c3315502SPeter Xu 	}
891c3315502SPeter Xu }
892c3315502SPeter Xu 
do_uffdio_zeropage(int ufd,bool has_zeropage)893c3315502SPeter Xu static bool do_uffdio_zeropage(int ufd, bool has_zeropage)
894c3315502SPeter Xu {
895c3315502SPeter Xu 	struct uffdio_zeropage uffdio_zeropage = { 0 };
896c3315502SPeter Xu 	int ret;
897c3315502SPeter Xu 	__s64 res;
898c3315502SPeter Xu 
899c3315502SPeter Xu 	uffdio_zeropage.range.start = (unsigned long) area_dst;
900c3315502SPeter Xu 	uffdio_zeropage.range.len = page_size;
901c3315502SPeter Xu 	uffdio_zeropage.mode = 0;
902c3315502SPeter Xu 	ret = ioctl(ufd, UFFDIO_ZEROPAGE, &uffdio_zeropage);
903c3315502SPeter Xu 	res = uffdio_zeropage.zeropage;
904c3315502SPeter Xu 	if (ret) {
905c3315502SPeter Xu 		/* real retval in ufdio_zeropage.zeropage */
906c3315502SPeter Xu 		if (has_zeropage)
907c3315502SPeter Xu 			err("UFFDIO_ZEROPAGE error: %"PRId64, (int64_t)res);
908c3315502SPeter Xu 		else if (res != -EINVAL)
909c3315502SPeter Xu 			err("UFFDIO_ZEROPAGE not -EINVAL");
910c3315502SPeter Xu 	} else if (has_zeropage) {
911c3315502SPeter Xu 		if (res != page_size)
912c3315502SPeter Xu 			err("UFFDIO_ZEROPAGE unexpected size");
913c3315502SPeter Xu 		else
914c3315502SPeter Xu 			retry_uffdio_zeropage(ufd, &uffdio_zeropage);
915c3315502SPeter Xu 		return true;
916c3315502SPeter Xu 	} else
917c3315502SPeter Xu 		err("UFFDIO_ZEROPAGE succeeded");
918c3315502SPeter Xu 
919c3315502SPeter Xu 	return false;
920c3315502SPeter Xu }
921c3315502SPeter Xu 
922c3315502SPeter Xu /*
923c3315502SPeter Xu  * Registers a range with MISSING mode only for zeropage test.  Return true
924c3315502SPeter Xu  * if UFFDIO_ZEROPAGE supported, false otherwise. Can't use uffd_register()
925c3315502SPeter Xu  * because we want to detect .ioctls along the way.
926c3315502SPeter Xu  */
927c3315502SPeter Xu static bool
uffd_register_detect_zeropage(int uffd,void * addr,uint64_t len)928c3315502SPeter Xu uffd_register_detect_zeropage(int uffd, void *addr, uint64_t len)
929c3315502SPeter Xu {
930c3315502SPeter Xu 	uint64_t ioctls = 0;
931c3315502SPeter Xu 
932c3315502SPeter Xu 	if (uffd_register_with_ioctls(uffd, addr, len, true,
933c3315502SPeter Xu 				      false, false, &ioctls))
934c3315502SPeter Xu 		err("zeropage register fail");
935c3315502SPeter Xu 
936c3315502SPeter Xu 	return ioctls & (1 << _UFFDIO_ZEROPAGE);
937c3315502SPeter Xu }
938c3315502SPeter Xu 
939c3315502SPeter Xu /* exercise UFFDIO_ZEROPAGE */
uffd_zeropage_test(uffd_test_args_t * args)94043759d44SPeter Xu static void uffd_zeropage_test(uffd_test_args_t *args)
941c3315502SPeter Xu {
942c3315502SPeter Xu 	bool has_zeropage;
943c3315502SPeter Xu 	int i;
944c3315502SPeter Xu 
945c3315502SPeter Xu 	has_zeropage = uffd_register_detect_zeropage(uffd, area_dst, page_size);
946c3315502SPeter Xu 	if (area_dst_alias)
947c3315502SPeter Xu 		/* Ignore the retval; we already have it */
948c3315502SPeter Xu 		uffd_register_detect_zeropage(uffd, area_dst_alias, page_size);
949c3315502SPeter Xu 
950c3315502SPeter Xu 	if (do_uffdio_zeropage(uffd, has_zeropage))
951c3315502SPeter Xu 		for (i = 0; i < page_size; i++)
952c3315502SPeter Xu 			if (area_dst[i] != 0)
953c3315502SPeter Xu 				err("data non-zero at offset %d\n", i);
954c3315502SPeter Xu 
955c3315502SPeter Xu 	if (uffd_unregister(uffd, area_dst, page_size))
956c3315502SPeter Xu 		err("unregister");
957c3315502SPeter Xu 
958c3315502SPeter Xu 	if (area_dst_alias && uffd_unregister(uffd, area_dst_alias, page_size))
959c3315502SPeter Xu 		err("unregister");
960c3315502SPeter Xu 
961c3315502SPeter Xu 	uffd_test_pass();
962c3315502SPeter Xu }
963c3315502SPeter Xu 
uffd_register_poison(int uffd,void * addr,uint64_t len)96499aa7721SAxel Rasmussen static void uffd_register_poison(int uffd, void *addr, uint64_t len)
96599aa7721SAxel Rasmussen {
96699aa7721SAxel Rasmussen 	uint64_t ioctls = 0;
96799aa7721SAxel Rasmussen 	uint64_t expected = (1 << _UFFDIO_COPY) | (1 << _UFFDIO_POISON);
96899aa7721SAxel Rasmussen 
96999aa7721SAxel Rasmussen 	if (uffd_register_with_ioctls(uffd, addr, len, true,
97099aa7721SAxel Rasmussen 				      false, false, &ioctls))
97199aa7721SAxel Rasmussen 		err("poison register fail");
97299aa7721SAxel Rasmussen 
97399aa7721SAxel Rasmussen 	if ((ioctls & expected) != expected)
97499aa7721SAxel Rasmussen 		err("registered area doesn't support COPY and POISON ioctls");
97599aa7721SAxel Rasmussen }
97699aa7721SAxel Rasmussen 
do_uffdio_poison(int uffd,unsigned long offset)97799aa7721SAxel Rasmussen static void do_uffdio_poison(int uffd, unsigned long offset)
97899aa7721SAxel Rasmussen {
97999aa7721SAxel Rasmussen 	struct uffdio_poison uffdio_poison = { 0 };
98099aa7721SAxel Rasmussen 	int ret;
98199aa7721SAxel Rasmussen 	__s64 res;
98299aa7721SAxel Rasmussen 
98399aa7721SAxel Rasmussen 	uffdio_poison.range.start = (unsigned long) area_dst + offset;
98499aa7721SAxel Rasmussen 	uffdio_poison.range.len = page_size;
98599aa7721SAxel Rasmussen 	uffdio_poison.mode = 0;
98699aa7721SAxel Rasmussen 	ret = ioctl(uffd, UFFDIO_POISON, &uffdio_poison);
98799aa7721SAxel Rasmussen 	res = uffdio_poison.updated;
98899aa7721SAxel Rasmussen 
98999aa7721SAxel Rasmussen 	if (ret)
99099aa7721SAxel Rasmussen 		err("UFFDIO_POISON error: %"PRId64, (int64_t)res);
99199aa7721SAxel Rasmussen 	else if (res != page_size)
99299aa7721SAxel Rasmussen 		err("UFFDIO_POISON unexpected size: %"PRId64, (int64_t)res);
99399aa7721SAxel Rasmussen }
99499aa7721SAxel Rasmussen 
uffd_poison_handle_fault(struct uffd_msg * msg,struct uffd_args * args)99599aa7721SAxel Rasmussen static void uffd_poison_handle_fault(
99699aa7721SAxel Rasmussen 	struct uffd_msg *msg, struct uffd_args *args)
99799aa7721SAxel Rasmussen {
99899aa7721SAxel Rasmussen 	unsigned long offset;
99999aa7721SAxel Rasmussen 
100099aa7721SAxel Rasmussen 	if (msg->event != UFFD_EVENT_PAGEFAULT)
100199aa7721SAxel Rasmussen 		err("unexpected msg event %u", msg->event);
100299aa7721SAxel Rasmussen 
100399aa7721SAxel Rasmussen 	if (msg->arg.pagefault.flags &
100499aa7721SAxel Rasmussen 	    (UFFD_PAGEFAULT_FLAG_WP | UFFD_PAGEFAULT_FLAG_MINOR))
100599aa7721SAxel Rasmussen 		err("unexpected fault type %llu", msg->arg.pagefault.flags);
100699aa7721SAxel Rasmussen 
100799aa7721SAxel Rasmussen 	offset = (char *)(unsigned long)msg->arg.pagefault.address - area_dst;
100899aa7721SAxel Rasmussen 	offset &= ~(page_size-1);
100999aa7721SAxel Rasmussen 
101099aa7721SAxel Rasmussen 	/* Odd pages -> copy zeroed page; even pages -> poison. */
101199aa7721SAxel Rasmussen 	if (offset & page_size)
101299aa7721SAxel Rasmussen 		copy_page(uffd, offset, false);
101399aa7721SAxel Rasmussen 	else
101499aa7721SAxel Rasmussen 		do_uffdio_poison(uffd, offset);
101599aa7721SAxel Rasmussen }
101699aa7721SAxel Rasmussen 
/*
 * "poison" test.
 *
 * area_dst is registered for COPY and POISON, area_src is zero-filled, and
 * a uffd_poll_thread monitor is started with uffd_poison_handle_fault() as
 * its fault handler.  Every page of area_dst is then read byte by byte:
 * a page either reads back as all zeros, or the read raises a SIGBUS that
 * sighndl() turns into a jump back to the sigsetjmp() below.
 *
 * The handler poisons the even pages (0, 2, 4, ...), so the number of
 * SIGBUS received has to be the number of even pages.
 *
 * @targs is not used.
 */
static void uffd_poison_test(uffd_test_args_t *targs)
{
	pthread_t uffd_mon;
	/* Only the arrival of the byte matters, but don't send garbage */
	char c = 0;
	struct uffd_args args = { 0 };
	struct sigaction act = { 0 };
	unsigned long nr_sigbus = 0;
	unsigned long nr_poisoned;
	unsigned long nr;

	fcntl(uffd, F_SETFL, uffd_flags | O_NONBLOCK);

	uffd_register_poison(uffd, area_dst, nr_pages * page_size);
	memset(area_src, 0, nr_pages * page_size);

	args.handle_fault = uffd_poison_handle_fault;
	if (pthread_create(&uffd_mon, NULL, uffd_poll_thread, &args))
		err("uffd_poll_thread create");

	sigbuf = &jbuf;
	act.sa_sigaction = sighndl;
	act.sa_flags = SA_SIGINFO;
	if (sigaction(SIGBUS, &act, 0))
		err("sigaction");

	for (nr = 0; nr < nr_pages; ++nr) {
		unsigned long offset = nr * page_size;
		const char *bytes = (const char *) area_dst + offset;
		const char *i;

		if (sigsetjmp(*sigbuf, 1)) {
			/*
			 * Access below triggered a SIGBUS, which was caught by
			 * sighndl, which then jumped here. Count this SIGBUS,
			 * and move on to next page.
			 */
			++nr_sigbus;
			continue;
		}

		for (i = bytes; i < bytes + page_size; ++i) {
			/* Print the byte as 0..255 whatever char's signedness */
			if (*i)
				err("nonzero byte in area_dst (%p) at %p: %u",
				    area_dst, i, (unsigned int)(unsigned char)*i);
		}
	}

	if (write(pipefd[1], &c, sizeof(c)) != sizeof(c))
		err("pipe write");
	if (pthread_join(uffd_mon, NULL))
		err("pthread_join()");

	/*
	 * Pages 0, 2, 4, ... are the poisoned ones, so round up: with an odd
	 * nr_pages the last page is an even one as well.
	 */
	nr_poisoned = (nr_pages + 1) / 2;
	if (nr_sigbus != nr_poisoned)
		err("expected to receive %lu SIGBUS, actually received %lu",
		    nr_poisoned, nr_sigbus);

	uffd_test_pass();
}
107499aa7721SAxel Rasmussen 
107543759d44SPeter Xu /*
107643759d44SPeter Xu  * Test the returned uffdio_register.ioctls with different register modes.
107743759d44SPeter Xu  * Note that _UFFDIO_ZEROPAGE is tested separately in the zeropage test.
107843759d44SPeter Xu  */
107943759d44SPeter Xu static void
do_register_ioctls_test(uffd_test_args_t * args,bool miss,bool wp,bool minor)108043759d44SPeter Xu do_register_ioctls_test(uffd_test_args_t *args, bool miss, bool wp, bool minor)
108143759d44SPeter Xu {
108243759d44SPeter Xu 	uint64_t ioctls = 0, expected = BIT_ULL(_UFFDIO_WAKE);
108343759d44SPeter Xu 	mem_type_t *mem_type = args->mem_type;
108443759d44SPeter Xu 	int ret;
108543759d44SPeter Xu 
108643759d44SPeter Xu 	ret = uffd_register_with_ioctls(uffd, area_dst, page_size,
108743759d44SPeter Xu 					miss, wp, minor, &ioctls);
108843759d44SPeter Xu 
108943759d44SPeter Xu 	/*
109043759d44SPeter Xu 	 * Handle special cases of UFFDIO_REGISTER here where it should
109143759d44SPeter Xu 	 * just fail with -EINVAL first..
109243759d44SPeter Xu 	 *
109343759d44SPeter Xu 	 * Case 1: register MINOR on anon
109443759d44SPeter Xu 	 * Case 2: register with no mode selected
109543759d44SPeter Xu 	 */
109643759d44SPeter Xu 	if ((minor && (mem_type->mem_flag == MEM_ANON)) ||
109743759d44SPeter Xu 	    (!miss && !wp && !minor)) {
109843759d44SPeter Xu 		if (ret != -EINVAL)
109943759d44SPeter Xu 			err("register (miss=%d, wp=%d, minor=%d) failed "
110043759d44SPeter Xu 			    "with wrong errno=%d", miss, wp, minor, ret);
110143759d44SPeter Xu 		return;
110243759d44SPeter Xu 	}
110343759d44SPeter Xu 
110443759d44SPeter Xu 	/* UFFDIO_REGISTER should succeed, then check ioctls returned */
110543759d44SPeter Xu 	if (miss)
110643759d44SPeter Xu 		expected |= BIT_ULL(_UFFDIO_COPY);
110743759d44SPeter Xu 	if (wp)
110843759d44SPeter Xu 		expected |= BIT_ULL(_UFFDIO_WRITEPROTECT);
110943759d44SPeter Xu 	if (minor)
111043759d44SPeter Xu 		expected |= BIT_ULL(_UFFDIO_CONTINUE);
111143759d44SPeter Xu 
111243759d44SPeter Xu 	if ((ioctls & expected) != expected)
111343759d44SPeter Xu 		err("unexpected uffdio_register.ioctls "
111443759d44SPeter Xu 		    "(miss=%d, wp=%d, minor=%d): expected=0x%"PRIx64", "
111543759d44SPeter Xu 		    "returned=0x%"PRIx64, miss, wp, minor, expected, ioctls);
111643759d44SPeter Xu 
111743759d44SPeter Xu 	if (uffd_unregister(uffd, area_dst, page_size))
111843759d44SPeter Xu 		err("unregister");
111943759d44SPeter Xu }
112043759d44SPeter Xu 
/*
 * "register-ioctls" test: run do_register_ioctls_test() for all eight
 * combinations of the MISSING, WP and MINOR register modes, then mark the
 * test as passed.
 */
static void uffd_register_ioctls_test(uffd_test_args_t *args)
{
	unsigned int modes;

	/*
	 * Bit 2 is miss, bit 1 is wp, bit 0 is minor: counting upwards
	 * makes minor change fastest and miss slowest.
	 */
	for (modes = 0; modes < 8; modes++) {
		int miss = (modes >> 2) & 1;
		int wp = (modes >> 1) & 1;
		int minor = modes & 1;

		do_register_ioctls_test(args, miss, wp, minor);
	}

	uffd_test_pass();
}
113243759d44SPeter Xu 
113316a45b57SPeter Xu uffd_test_case_t uffd_tests[] = {
11348bda424fSPeter Xu 	{
113543759d44SPeter Xu 		/* Test returned uffdio_register.ioctls. */
113643759d44SPeter Xu 		.name = "register-ioctls",
113743759d44SPeter Xu 		.uffd_fn = uffd_register_ioctls_test,
113843759d44SPeter Xu 		.mem_targets = MEM_ALL,
113943759d44SPeter Xu 		.uffd_feature_required = UFFD_FEATURE_MISSING_HUGETLBFS |
114043759d44SPeter Xu 		UFFD_FEATURE_MISSING_SHMEM |
114143759d44SPeter Xu 		UFFD_FEATURE_PAGEFAULT_FLAG_WP |
114243759d44SPeter Xu 		UFFD_FEATURE_WP_HUGETLBFS_SHMEM |
114343759d44SPeter Xu 		UFFD_FEATURE_MINOR_HUGETLBFS |
114443759d44SPeter Xu 		UFFD_FEATURE_MINOR_SHMEM,
114543759d44SPeter Xu 	},
114643759d44SPeter Xu 	{
1147c3315502SPeter Xu 		.name = "zeropage",
1148c3315502SPeter Xu 		.uffd_fn = uffd_zeropage_test,
1149c3315502SPeter Xu 		.mem_targets = MEM_ALL,
1150c3315502SPeter Xu 		.uffd_feature_required = 0,
1151c3315502SPeter Xu 	},
1152c3315502SPeter Xu 	{
1153cff29458SPeter Xu 		.name = "wp-fork",
1154cff29458SPeter Xu 		.uffd_fn = uffd_wp_fork_test,
1155cff29458SPeter Xu 		.mem_targets = MEM_ALL,
1156cff29458SPeter Xu 		.uffd_feature_required = UFFD_FEATURE_PAGEFAULT_FLAG_WP |
1157cff29458SPeter Xu 		UFFD_FEATURE_WP_HUGETLBFS_SHMEM,
1158cff29458SPeter Xu 	},
1159cff29458SPeter Xu 	{
1160cff29458SPeter Xu 		.name = "wp-fork-with-event",
1161cff29458SPeter Xu 		.uffd_fn = uffd_wp_fork_with_event_test,
1162cff29458SPeter Xu 		.mem_targets = MEM_ALL,
1163cff29458SPeter Xu 		.uffd_feature_required = UFFD_FEATURE_PAGEFAULT_FLAG_WP |
1164cff29458SPeter Xu 		UFFD_FEATURE_WP_HUGETLBFS_SHMEM |
1165cff29458SPeter Xu 		/* when set, child process should inherit uffd-wp bits */
1166cff29458SPeter Xu 		UFFD_FEATURE_EVENT_FORK,
11678bda424fSPeter Xu 	},
11688bda424fSPeter Xu 	{
1169760aee0bSPeter Xu 		.name = "wp-fork-pin",
1170760aee0bSPeter Xu 		.uffd_fn = uffd_wp_fork_pin_test,
1171760aee0bSPeter Xu 		.mem_targets = MEM_ALL,
1172760aee0bSPeter Xu 		.uffd_feature_required = UFFD_FEATURE_PAGEFAULT_FLAG_WP |
1173760aee0bSPeter Xu 		UFFD_FEATURE_WP_HUGETLBFS_SHMEM,
1174760aee0bSPeter Xu 	},
1175760aee0bSPeter Xu 	{
1176760aee0bSPeter Xu 		.name = "wp-fork-pin-with-event",
1177760aee0bSPeter Xu 		.uffd_fn = uffd_wp_fork_pin_with_event_test,
1178760aee0bSPeter Xu 		.mem_targets = MEM_ALL,
1179760aee0bSPeter Xu 		.uffd_feature_required = UFFD_FEATURE_PAGEFAULT_FLAG_WP |
1180760aee0bSPeter Xu 		UFFD_FEATURE_WP_HUGETLBFS_SHMEM |
1181760aee0bSPeter Xu 		/* when set, child process should inherit uffd-wp bits */
1182760aee0bSPeter Xu 		UFFD_FEATURE_EVENT_FORK,
1183760aee0bSPeter Xu 	},
1184760aee0bSPeter Xu 	{
11858bda424fSPeter Xu 		.name = "wp-unpopulated",
11868bda424fSPeter Xu 		.uffd_fn = uffd_wp_unpopulated_test,
11878bda424fSPeter Xu 		.mem_targets = MEM_ANON,
11888bda424fSPeter Xu 		.uffd_feature_required =
11898bda424fSPeter Xu 		UFFD_FEATURE_PAGEFAULT_FLAG_WP | UFFD_FEATURE_WP_UNPOPULATED,
11908bda424fSPeter Xu 	},
119162515b5fSPeter Xu 	{
119262515b5fSPeter Xu 		.name = "minor",
119362515b5fSPeter Xu 		.uffd_fn = uffd_minor_test,
119462515b5fSPeter Xu 		.mem_targets = MEM_SHMEM | MEM_HUGETLB,
119562515b5fSPeter Xu 		.uffd_feature_required =
119662515b5fSPeter Xu 		UFFD_FEATURE_MINOR_HUGETLBFS | UFFD_FEATURE_MINOR_SHMEM,
119762515b5fSPeter Xu 	},
119862515b5fSPeter Xu 	{
119962515b5fSPeter Xu 		.name = "minor-wp",
120062515b5fSPeter Xu 		.uffd_fn = uffd_minor_wp_test,
120162515b5fSPeter Xu 		.mem_targets = MEM_SHMEM | MEM_HUGETLB,
120262515b5fSPeter Xu 		.uffd_feature_required =
120362515b5fSPeter Xu 		UFFD_FEATURE_MINOR_HUGETLBFS | UFFD_FEATURE_MINOR_SHMEM |
12044df9cefaSPeter Xu 		UFFD_FEATURE_PAGEFAULT_FLAG_WP |
12054df9cefaSPeter Xu 		/*
12064df9cefaSPeter Xu 		 * HACK: here we leveraged WP_UNPOPULATED to detect whether
12074df9cefaSPeter Xu 		 * minor mode supports wr-protect.  There's no feature flag
12084df9cefaSPeter Xu 		 * for it so this is the best we can test against.
12094df9cefaSPeter Xu 		 */
12104df9cefaSPeter Xu 		UFFD_FEATURE_WP_UNPOPULATED,
121162515b5fSPeter Xu 	},
121262515b5fSPeter Xu 	{
121362515b5fSPeter Xu 		.name = "minor-collapse",
121462515b5fSPeter Xu 		.uffd_fn = uffd_minor_collapse_test,
121562515b5fSPeter Xu 		/* MADV_COLLAPSE only works with shmem */
121662515b5fSPeter Xu 		.mem_targets = MEM_SHMEM,
121762515b5fSPeter Xu 		/* We can't test MADV_COLLAPSE, so try our luck */
121862515b5fSPeter Xu 		.uffd_feature_required = UFFD_FEATURE_MINOR_SHMEM,
121962515b5fSPeter Xu 	},
122073c1ea93SPeter Xu 	{
122173c1ea93SPeter Xu 		.name = "sigbus",
122273c1ea93SPeter Xu 		.uffd_fn = uffd_sigbus_test,
122373c1ea93SPeter Xu 		.mem_targets = MEM_ALL,
122473c1ea93SPeter Xu 		.uffd_feature_required = UFFD_FEATURE_SIGBUS |
122573c1ea93SPeter Xu 		UFFD_FEATURE_EVENT_FORK,
122673c1ea93SPeter Xu 	},
122773c1ea93SPeter Xu 	{
122873c1ea93SPeter Xu 		.name = "sigbus-wp",
122973c1ea93SPeter Xu 		.uffd_fn = uffd_sigbus_wp_test,
123073c1ea93SPeter Xu 		.mem_targets = MEM_ALL,
123173c1ea93SPeter Xu 		.uffd_feature_required = UFFD_FEATURE_SIGBUS |
1232fe295de2SEdward Liaw 		UFFD_FEATURE_EVENT_FORK | UFFD_FEATURE_PAGEFAULT_FLAG_WP |
1233fe295de2SEdward Liaw 		UFFD_FEATURE_WP_HUGETLBFS_SHMEM,
123473c1ea93SPeter Xu 	},
123573c1ea93SPeter Xu 	{
123673c1ea93SPeter Xu 		.name = "events",
123773c1ea93SPeter Xu 		.uffd_fn = uffd_events_test,
123873c1ea93SPeter Xu 		.mem_targets = MEM_ALL,
123973c1ea93SPeter Xu 		.uffd_feature_required = UFFD_FEATURE_EVENT_FORK |
124073c1ea93SPeter Xu 		UFFD_FEATURE_EVENT_REMAP | UFFD_FEATURE_EVENT_REMOVE,
124173c1ea93SPeter Xu 	},
124273c1ea93SPeter Xu 	{
124373c1ea93SPeter Xu 		.name = "events-wp",
124473c1ea93SPeter Xu 		.uffd_fn = uffd_events_wp_test,
124573c1ea93SPeter Xu 		.mem_targets = MEM_ALL,
124673c1ea93SPeter Xu 		.uffd_feature_required = UFFD_FEATURE_EVENT_FORK |
124773c1ea93SPeter Xu 		UFFD_FEATURE_EVENT_REMAP | UFFD_FEATURE_EVENT_REMOVE |
124873c1ea93SPeter Xu 		UFFD_FEATURE_PAGEFAULT_FLAG_WP |
124973c1ea93SPeter Xu 		UFFD_FEATURE_WP_HUGETLBFS_SHMEM,
125073c1ea93SPeter Xu 	},
125199aa7721SAxel Rasmussen 	{
125299aa7721SAxel Rasmussen 		.name = "poison",
125399aa7721SAxel Rasmussen 		.uffd_fn = uffd_poison_test,
125499aa7721SAxel Rasmussen 		.mem_targets = MEM_ALL,
125599aa7721SAxel Rasmussen 		.uffd_feature_required = UFFD_FEATURE_POISON,
125699aa7721SAxel Rasmussen 	},
125716a45b57SPeter Xu };
125816a45b57SPeter Xu 
usage(const char * prog)125921337f2aSPeter Xu static void usage(const char *prog)
126021337f2aSPeter Xu {
126121337f2aSPeter Xu 	printf("usage: %s [-f TESTNAME]\n", prog);
126221337f2aSPeter Xu 	puts("");
126321337f2aSPeter Xu 	puts(" -f: test name to filter (e.g., event)");
126421337f2aSPeter Xu 	puts(" -h: show the help msg");
126521337f2aSPeter Xu 	puts(" -l: list tests only");
126621337f2aSPeter Xu 	puts("");
126721337f2aSPeter Xu 	exit(KSFT_FAIL);
126821337f2aSPeter Xu }
126921337f2aSPeter Xu 
main(int argc,char * argv[])1270686a8bb7SPeter Xu int main(int argc, char *argv[])
1271686a8bb7SPeter Xu {
127216a45b57SPeter Xu 	int n_tests = sizeof(uffd_tests) / sizeof(uffd_test_case_t);
127316a45b57SPeter Xu 	int n_mems = sizeof(mem_types) / sizeof(mem_type_t);
127421337f2aSPeter Xu 	const char *test_filter = NULL;
127521337f2aSPeter Xu 	bool list_only = false;
127616a45b57SPeter Xu 	uffd_test_case_t *test;
127716a45b57SPeter Xu 	mem_type_t *mem_type;
127843759d44SPeter Xu 	uffd_test_args_t args;
1279f9da2426SPeter Xu 	const char *errmsg;
128021337f2aSPeter Xu 	int has_uffd, opt;
128116a45b57SPeter Xu 	int i, j;
1282d5433ce8SPeter Xu 
128321337f2aSPeter Xu 	while ((opt = getopt(argc, argv, "f:hl")) != -1) {
128421337f2aSPeter Xu 		switch (opt) {
128521337f2aSPeter Xu 		case 'f':
128621337f2aSPeter Xu 			test_filter = optarg;
128721337f2aSPeter Xu 			break;
128821337f2aSPeter Xu 		case 'l':
128921337f2aSPeter Xu 			list_only = true;
129021337f2aSPeter Xu 			break;
129121337f2aSPeter Xu 		case 'h':
129221337f2aSPeter Xu 		default:
129321337f2aSPeter Xu 			/* Unknown */
129421337f2aSPeter Xu 			usage(argv[0]);
129521337f2aSPeter Xu 			break;
129621337f2aSPeter Xu 		}
129721337f2aSPeter Xu 	}
129821337f2aSPeter Xu 
129921337f2aSPeter Xu 	if (!test_filter && !list_only) {
1300d5433ce8SPeter Xu 		has_uffd = test_uffd_api(false);
1301d5433ce8SPeter Xu 		has_uffd |= test_uffd_api(true);
1302d5433ce8SPeter Xu 
1303d5433ce8SPeter Xu 		if (!has_uffd) {
1304d5433ce8SPeter Xu 			printf("Userfaultfd not supported or unprivileged, skip all tests\n");
1305d5433ce8SPeter Xu 			exit(KSFT_SKIP);
1306d5433ce8SPeter Xu 		}
130721337f2aSPeter Xu 	}
130816a45b57SPeter Xu 
130916a45b57SPeter Xu 	for (i = 0; i < n_tests; i++) {
131016a45b57SPeter Xu 		test = &uffd_tests[i];
131121337f2aSPeter Xu 		if (test_filter && !strstr(test->name, test_filter))
131221337f2aSPeter Xu 			continue;
131321337f2aSPeter Xu 		if (list_only) {
131421337f2aSPeter Xu 			printf("%s\n", test->name);
131521337f2aSPeter Xu 			continue;
131621337f2aSPeter Xu 		}
131716a45b57SPeter Xu 		for (j = 0; j < n_mems; j++) {
131816a45b57SPeter Xu 			mem_type = &mem_types[j];
131916a45b57SPeter Xu 			if (!(test->mem_targets & mem_type->mem_flag))
132016a45b57SPeter Xu 				continue;
132116a45b57SPeter Xu 
13220e14e7e9SJohn Hubbard 			uffd_test_start("%s on %s", test->name, mem_type->name);
13230b34dca1STerry Tritton 			if ((mem_type->mem_flag == MEM_HUGETLB ||
13240b34dca1STerry Tritton 			    mem_type->mem_flag == MEM_HUGETLB_PRIVATE) &&
13250b34dca1STerry Tritton 			    (default_huge_page_size() == 0)) {
13260b34dca1STerry Tritton 				uffd_test_skip("huge page size is 0, feature missing?");
13270b34dca1STerry Tritton 				continue;
13280b34dca1STerry Tritton 			}
132916a45b57SPeter Xu 			if (!uffd_feature_supported(test)) {
133016a45b57SPeter Xu 				uffd_test_skip("feature missing");
133116a45b57SPeter Xu 				continue;
133216a45b57SPeter Xu 			}
133343759d44SPeter Xu 			if (uffd_setup_environment(&args, test, mem_type,
133443759d44SPeter Xu 						   &errmsg)) {
1335f9da2426SPeter Xu 				uffd_test_skip(errmsg);
133616a45b57SPeter Xu 				continue;
133716a45b57SPeter Xu 			}
133843759d44SPeter Xu 			test->uffd_fn(&args);
133916a45b57SPeter Xu 		}
134016a45b57SPeter Xu 	}
134116a45b57SPeter Xu 
134221337f2aSPeter Xu 	if (!list_only)
1343d5433ce8SPeter Xu 		uffd_test_report();
1344d5433ce8SPeter Xu 
1345d5433ce8SPeter Xu 	return ksft_get_fail_cnt() ? KSFT_FAIL : KSFT_PASS;
1346686a8bb7SPeter Xu }
1347686a8bb7SPeter Xu 
1348686a8bb7SPeter Xu #else /* __NR_userfaultfd */
1349686a8bb7SPeter Xu 
1350686a8bb7SPeter Xu #warning "missing __NR_userfaultfd definition"
1351686a8bb7SPeter Xu 
main(void)1352686a8bb7SPeter Xu int main(void)
1353686a8bb7SPeter Xu {
1354686a8bb7SPeter Xu 	printf("Skipping %s (missing __NR_userfaultfd)\n", __file__);
1355686a8bb7SPeter Xu 	return KSFT_SKIP;
1356686a8bb7SPeter Xu }
1357686a8bb7SPeter Xu 
1358686a8bb7SPeter Xu #endif /* __NR_userfaultfd */
1359