xref: /openbmc/linux/tools/testing/selftests/bpf/benchs/bench_htab_mem.c (revision c900529f3d9161bfde5cca0754f83b4d3c3e0220)
1*fd283ab1SHou Tao // SPDX-License-Identifier: GPL-2.0
2*fd283ab1SHou Tao /* Copyright (C) 2023. Huawei Technologies Co., Ltd */
3*fd283ab1SHou Tao #include <argp.h>
4*fd283ab1SHou Tao #include <stdbool.h>
5*fd283ab1SHou Tao #include <pthread.h>
6*fd283ab1SHou Tao #include <sys/types.h>
7*fd283ab1SHou Tao #include <sys/stat.h>
8*fd283ab1SHou Tao #include <sys/param.h>
9*fd283ab1SHou Tao #include <fcntl.h>
10*fd283ab1SHou Tao 
11*fd283ab1SHou Tao #include "bench.h"
12*fd283ab1SHou Tao #include "bpf_util.h"
13*fd283ab1SHou Tao #include "cgroup_helpers.h"
14*fd283ab1SHou Tao #include "htab_mem_bench.skel.h"
15*fd283ab1SHou Tao 
16*fd283ab1SHou Tao struct htab_mem_use_case {
17*fd283ab1SHou Tao 	const char *name;
18*fd283ab1SHou Tao 	const char **progs;
19*fd283ab1SHou Tao 	/* Do synchronization between addition thread and deletion thread */
20*fd283ab1SHou Tao 	bool need_sync;
21*fd283ab1SHou Tao };
22*fd283ab1SHou Tao 
23*fd283ab1SHou Tao static struct htab_mem_ctx {
24*fd283ab1SHou Tao 	const struct htab_mem_use_case *uc;
25*fd283ab1SHou Tao 	struct htab_mem_bench *skel;
26*fd283ab1SHou Tao 	pthread_barrier_t *notify;
27*fd283ab1SHou Tao 	int fd;
28*fd283ab1SHou Tao } ctx;
29*fd283ab1SHou Tao 
30*fd283ab1SHou Tao const char *ow_progs[] = {"overwrite", NULL};
31*fd283ab1SHou Tao const char *batch_progs[] = {"batch_add_batch_del", NULL};
32*fd283ab1SHou Tao const char *add_del_progs[] = {"add_only", "del_only", NULL};
33*fd283ab1SHou Tao const static struct htab_mem_use_case use_cases[] = {
34*fd283ab1SHou Tao 	{ .name = "overwrite", .progs = ow_progs },
35*fd283ab1SHou Tao 	{ .name = "batch_add_batch_del", .progs = batch_progs },
36*fd283ab1SHou Tao 	{ .name = "add_del_on_diff_cpu", .progs = add_del_progs, .need_sync = true },
37*fd283ab1SHou Tao };
38*fd283ab1SHou Tao 
39*fd283ab1SHou Tao static struct htab_mem_args {
40*fd283ab1SHou Tao 	u32 value_size;
41*fd283ab1SHou Tao 	const char *use_case;
42*fd283ab1SHou Tao 	bool preallocated;
43*fd283ab1SHou Tao } args = {
44*fd283ab1SHou Tao 	.value_size = 8,
45*fd283ab1SHou Tao 	.use_case = "overwrite",
46*fd283ab1SHou Tao 	.preallocated = false,
47*fd283ab1SHou Tao };
48*fd283ab1SHou Tao 
49*fd283ab1SHou Tao enum {
50*fd283ab1SHou Tao 	ARG_VALUE_SIZE = 10000,
51*fd283ab1SHou Tao 	ARG_USE_CASE = 10001,
52*fd283ab1SHou Tao 	ARG_PREALLOCATED = 10002,
53*fd283ab1SHou Tao };
54*fd283ab1SHou Tao 
55*fd283ab1SHou Tao static const struct argp_option opts[] = {
56*fd283ab1SHou Tao 	{ "value-size", ARG_VALUE_SIZE, "VALUE_SIZE", 0,
57*fd283ab1SHou Tao 	  "Set the value size of hash map (default 8)" },
58*fd283ab1SHou Tao 	{ "use-case", ARG_USE_CASE, "USE_CASE", 0,
59*fd283ab1SHou Tao 	  "Set the use case of hash map: overwrite|batch_add_batch_del|add_del_on_diff_cpu" },
60*fd283ab1SHou Tao 	{ "preallocated", ARG_PREALLOCATED, NULL, 0, "use preallocated hash map" },
61*fd283ab1SHou Tao 	{},
62*fd283ab1SHou Tao };
63*fd283ab1SHou Tao 
htab_mem_parse_arg(int key,char * arg,struct argp_state * state)64*fd283ab1SHou Tao static error_t htab_mem_parse_arg(int key, char *arg, struct argp_state *state)
65*fd283ab1SHou Tao {
66*fd283ab1SHou Tao 	switch (key) {
67*fd283ab1SHou Tao 	case ARG_VALUE_SIZE:
68*fd283ab1SHou Tao 		args.value_size = strtoul(arg, NULL, 10);
69*fd283ab1SHou Tao 		if (args.value_size > 4096) {
70*fd283ab1SHou Tao 			fprintf(stderr, "too big value size %u\n", args.value_size);
71*fd283ab1SHou Tao 			argp_usage(state);
72*fd283ab1SHou Tao 		}
73*fd283ab1SHou Tao 		break;
74*fd283ab1SHou Tao 	case ARG_USE_CASE:
75*fd283ab1SHou Tao 		args.use_case = strdup(arg);
76*fd283ab1SHou Tao 		if (!args.use_case) {
77*fd283ab1SHou Tao 			fprintf(stderr, "no mem for use-case\n");
78*fd283ab1SHou Tao 			argp_usage(state);
79*fd283ab1SHou Tao 		}
80*fd283ab1SHou Tao 		break;
81*fd283ab1SHou Tao 	case ARG_PREALLOCATED:
82*fd283ab1SHou Tao 		args.preallocated = true;
83*fd283ab1SHou Tao 		break;
84*fd283ab1SHou Tao 	default:
85*fd283ab1SHou Tao 		return ARGP_ERR_UNKNOWN;
86*fd283ab1SHou Tao 	}
87*fd283ab1SHou Tao 
88*fd283ab1SHou Tao 	return 0;
89*fd283ab1SHou Tao }
90*fd283ab1SHou Tao 
91*fd283ab1SHou Tao const struct argp bench_htab_mem_argp = {
92*fd283ab1SHou Tao 	.options = opts,
93*fd283ab1SHou Tao 	.parser = htab_mem_parse_arg,
94*fd283ab1SHou Tao };
95*fd283ab1SHou Tao 
htab_mem_validate(void)96*fd283ab1SHou Tao static void htab_mem_validate(void)
97*fd283ab1SHou Tao {
98*fd283ab1SHou Tao 	if (!strcmp(use_cases[2].name, args.use_case) && env.producer_cnt % 2) {
99*fd283ab1SHou Tao 		fprintf(stderr, "%s needs an even number of producers\n", args.use_case);
100*fd283ab1SHou Tao 		exit(1);
101*fd283ab1SHou Tao 	}
102*fd283ab1SHou Tao }
103*fd283ab1SHou Tao 
htab_mem_bench_init_barriers(void)104*fd283ab1SHou Tao static int htab_mem_bench_init_barriers(void)
105*fd283ab1SHou Tao {
106*fd283ab1SHou Tao 	pthread_barrier_t *barriers;
107*fd283ab1SHou Tao 	unsigned int i, nr;
108*fd283ab1SHou Tao 
109*fd283ab1SHou Tao 	if (!ctx.uc->need_sync)
110*fd283ab1SHou Tao 		return 0;
111*fd283ab1SHou Tao 
112*fd283ab1SHou Tao 	nr = (env.producer_cnt + 1) / 2;
113*fd283ab1SHou Tao 	barriers = calloc(nr, sizeof(*barriers));
114*fd283ab1SHou Tao 	if (!barriers)
115*fd283ab1SHou Tao 		return -1;
116*fd283ab1SHou Tao 
117*fd283ab1SHou Tao 	/* Used for synchronization between two threads */
118*fd283ab1SHou Tao 	for (i = 0; i < nr; i++)
119*fd283ab1SHou Tao 		pthread_barrier_init(&barriers[i], NULL, 2);
120*fd283ab1SHou Tao 
121*fd283ab1SHou Tao 	ctx.notify = barriers;
122*fd283ab1SHou Tao 	return 0;
123*fd283ab1SHou Tao }
124*fd283ab1SHou Tao 
htab_mem_bench_exit_barriers(void)125*fd283ab1SHou Tao static void htab_mem_bench_exit_barriers(void)
126*fd283ab1SHou Tao {
127*fd283ab1SHou Tao 	unsigned int i, nr;
128*fd283ab1SHou Tao 
129*fd283ab1SHou Tao 	if (!ctx.notify)
130*fd283ab1SHou Tao 		return;
131*fd283ab1SHou Tao 
132*fd283ab1SHou Tao 	nr = (env.producer_cnt + 1) / 2;
133*fd283ab1SHou Tao 	for (i = 0; i < nr; i++)
134*fd283ab1SHou Tao 		pthread_barrier_destroy(&ctx.notify[i]);
135*fd283ab1SHou Tao 	free(ctx.notify);
136*fd283ab1SHou Tao }
137*fd283ab1SHou Tao 
htab_mem_find_use_case_or_exit(const char * name)138*fd283ab1SHou Tao static const struct htab_mem_use_case *htab_mem_find_use_case_or_exit(const char *name)
139*fd283ab1SHou Tao {
140*fd283ab1SHou Tao 	unsigned int i;
141*fd283ab1SHou Tao 
142*fd283ab1SHou Tao 	for (i = 0; i < ARRAY_SIZE(use_cases); i++) {
143*fd283ab1SHou Tao 		if (!strcmp(name, use_cases[i].name))
144*fd283ab1SHou Tao 			return &use_cases[i];
145*fd283ab1SHou Tao 	}
146*fd283ab1SHou Tao 
147*fd283ab1SHou Tao 	fprintf(stderr, "no such use-case: %s\n", name);
148*fd283ab1SHou Tao 	fprintf(stderr, "available use case:");
149*fd283ab1SHou Tao 	for (i = 0; i < ARRAY_SIZE(use_cases); i++)
150*fd283ab1SHou Tao 		fprintf(stderr, " %s", use_cases[i].name);
151*fd283ab1SHou Tao 	fprintf(stderr, "\n");
152*fd283ab1SHou Tao 	exit(1);
153*fd283ab1SHou Tao }
154*fd283ab1SHou Tao 
htab_mem_setup(void)155*fd283ab1SHou Tao static void htab_mem_setup(void)
156*fd283ab1SHou Tao {
157*fd283ab1SHou Tao 	struct bpf_map *map;
158*fd283ab1SHou Tao 	const char **names;
159*fd283ab1SHou Tao 	int err;
160*fd283ab1SHou Tao 
161*fd283ab1SHou Tao 	setup_libbpf();
162*fd283ab1SHou Tao 
163*fd283ab1SHou Tao 	ctx.uc = htab_mem_find_use_case_or_exit(args.use_case);
164*fd283ab1SHou Tao 	err = htab_mem_bench_init_barriers();
165*fd283ab1SHou Tao 	if (err) {
166*fd283ab1SHou Tao 		fprintf(stderr, "failed to init barrier\n");
167*fd283ab1SHou Tao 		exit(1);
168*fd283ab1SHou Tao 	}
169*fd283ab1SHou Tao 
170*fd283ab1SHou Tao 	ctx.fd = cgroup_setup_and_join("/htab_mem");
171*fd283ab1SHou Tao 	if (ctx.fd < 0)
172*fd283ab1SHou Tao 		goto cleanup;
173*fd283ab1SHou Tao 
174*fd283ab1SHou Tao 	ctx.skel = htab_mem_bench__open();
175*fd283ab1SHou Tao 	if (!ctx.skel) {
176*fd283ab1SHou Tao 		fprintf(stderr, "failed to open skeleton\n");
177*fd283ab1SHou Tao 		goto cleanup;
178*fd283ab1SHou Tao 	}
179*fd283ab1SHou Tao 
180*fd283ab1SHou Tao 	map = ctx.skel->maps.htab;
181*fd283ab1SHou Tao 	bpf_map__set_value_size(map, args.value_size);
182*fd283ab1SHou Tao 	/* Ensure that different CPUs can operate on different subset */
183*fd283ab1SHou Tao 	bpf_map__set_max_entries(map, MAX(8192, 64 * env.nr_cpus));
184*fd283ab1SHou Tao 	if (args.preallocated)
185*fd283ab1SHou Tao 		bpf_map__set_map_flags(map, bpf_map__map_flags(map) & ~BPF_F_NO_PREALLOC);
186*fd283ab1SHou Tao 
187*fd283ab1SHou Tao 	names = ctx.uc->progs;
188*fd283ab1SHou Tao 	while (*names) {
189*fd283ab1SHou Tao 		struct bpf_program *prog;
190*fd283ab1SHou Tao 
191*fd283ab1SHou Tao 		prog = bpf_object__find_program_by_name(ctx.skel->obj, *names);
192*fd283ab1SHou Tao 		if (!prog) {
193*fd283ab1SHou Tao 			fprintf(stderr, "no such program %s\n", *names);
194*fd283ab1SHou Tao 			goto cleanup;
195*fd283ab1SHou Tao 		}
196*fd283ab1SHou Tao 		bpf_program__set_autoload(prog, true);
197*fd283ab1SHou Tao 		names++;
198*fd283ab1SHou Tao 	}
199*fd283ab1SHou Tao 	ctx.skel->bss->nr_thread = env.producer_cnt;
200*fd283ab1SHou Tao 
201*fd283ab1SHou Tao 	err = htab_mem_bench__load(ctx.skel);
202*fd283ab1SHou Tao 	if (err) {
203*fd283ab1SHou Tao 		fprintf(stderr, "failed to load skeleton\n");
204*fd283ab1SHou Tao 		goto cleanup;
205*fd283ab1SHou Tao 	}
206*fd283ab1SHou Tao 	err = htab_mem_bench__attach(ctx.skel);
207*fd283ab1SHou Tao 	if (err) {
208*fd283ab1SHou Tao 		fprintf(stderr, "failed to attach skeleton\n");
209*fd283ab1SHou Tao 		goto cleanup;
210*fd283ab1SHou Tao 	}
211*fd283ab1SHou Tao 	return;
212*fd283ab1SHou Tao 
213*fd283ab1SHou Tao cleanup:
214*fd283ab1SHou Tao 	htab_mem_bench__destroy(ctx.skel);
215*fd283ab1SHou Tao 	htab_mem_bench_exit_barriers();
216*fd283ab1SHou Tao 	if (ctx.fd >= 0) {
217*fd283ab1SHou Tao 		close(ctx.fd);
218*fd283ab1SHou Tao 		cleanup_cgroup_environment();
219*fd283ab1SHou Tao 	}
220*fd283ab1SHou Tao 	exit(1);
221*fd283ab1SHou Tao }
222*fd283ab1SHou Tao 
htab_mem_add_fn(pthread_barrier_t * notify)223*fd283ab1SHou Tao static void htab_mem_add_fn(pthread_barrier_t *notify)
224*fd283ab1SHou Tao {
225*fd283ab1SHou Tao 	while (true) {
226*fd283ab1SHou Tao 		/* Do addition */
227*fd283ab1SHou Tao 		(void)syscall(__NR_getpgid, 0);
228*fd283ab1SHou Tao 		/* Notify deletion thread to do deletion */
229*fd283ab1SHou Tao 		pthread_barrier_wait(notify);
230*fd283ab1SHou Tao 		/* Wait for deletion to complete */
231*fd283ab1SHou Tao 		pthread_barrier_wait(notify);
232*fd283ab1SHou Tao 	}
233*fd283ab1SHou Tao }
234*fd283ab1SHou Tao 
htab_mem_delete_fn(pthread_barrier_t * notify)235*fd283ab1SHou Tao static void htab_mem_delete_fn(pthread_barrier_t *notify)
236*fd283ab1SHou Tao {
237*fd283ab1SHou Tao 	while (true) {
238*fd283ab1SHou Tao 		/* Wait for addition to complete */
239*fd283ab1SHou Tao 		pthread_barrier_wait(notify);
240*fd283ab1SHou Tao 		/* Do deletion */
241*fd283ab1SHou Tao 		(void)syscall(__NR_getppid);
242*fd283ab1SHou Tao 		/* Notify addition thread to do addition */
243*fd283ab1SHou Tao 		pthread_barrier_wait(notify);
244*fd283ab1SHou Tao 	}
245*fd283ab1SHou Tao }
246*fd283ab1SHou Tao 
htab_mem_producer(void * arg)247*fd283ab1SHou Tao static void *htab_mem_producer(void *arg)
248*fd283ab1SHou Tao {
249*fd283ab1SHou Tao 	pthread_barrier_t *notify;
250*fd283ab1SHou Tao 	int seq;
251*fd283ab1SHou Tao 
252*fd283ab1SHou Tao 	if (!ctx.uc->need_sync) {
253*fd283ab1SHou Tao 		while (true)
254*fd283ab1SHou Tao 			(void)syscall(__NR_getpgid, 0);
255*fd283ab1SHou Tao 		return NULL;
256*fd283ab1SHou Tao 	}
257*fd283ab1SHou Tao 
258*fd283ab1SHou Tao 	seq = (long)arg;
259*fd283ab1SHou Tao 	notify = &ctx.notify[seq / 2];
260*fd283ab1SHou Tao 	if (seq & 1)
261*fd283ab1SHou Tao 		htab_mem_delete_fn(notify);
262*fd283ab1SHou Tao 	else
263*fd283ab1SHou Tao 		htab_mem_add_fn(notify);
264*fd283ab1SHou Tao 	return NULL;
265*fd283ab1SHou Tao }
266*fd283ab1SHou Tao 
htab_mem_read_mem_cgrp_file(const char * name,unsigned long * value)267*fd283ab1SHou Tao static void htab_mem_read_mem_cgrp_file(const char *name, unsigned long *value)
268*fd283ab1SHou Tao {
269*fd283ab1SHou Tao 	char buf[32];
270*fd283ab1SHou Tao 	ssize_t got;
271*fd283ab1SHou Tao 	int fd;
272*fd283ab1SHou Tao 
273*fd283ab1SHou Tao 	fd = openat(ctx.fd, name, O_RDONLY);
274*fd283ab1SHou Tao 	if (fd < 0) {
275*fd283ab1SHou Tao 		/* cgroup v1 ? */
276*fd283ab1SHou Tao 		fprintf(stderr, "no %s\n", name);
277*fd283ab1SHou Tao 		*value = 0;
278*fd283ab1SHou Tao 		return;
279*fd283ab1SHou Tao 	}
280*fd283ab1SHou Tao 
281*fd283ab1SHou Tao 	got = read(fd, buf, sizeof(buf) - 1);
282*fd283ab1SHou Tao 	if (got <= 0) {
283*fd283ab1SHou Tao 		*value = 0;
284*fd283ab1SHou Tao 		return;
285*fd283ab1SHou Tao 	}
286*fd283ab1SHou Tao 	buf[got] = 0;
287*fd283ab1SHou Tao 
288*fd283ab1SHou Tao 	*value = strtoull(buf, NULL, 0);
289*fd283ab1SHou Tao 
290*fd283ab1SHou Tao 	close(fd);
291*fd283ab1SHou Tao }
292*fd283ab1SHou Tao 
htab_mem_measure(struct bench_res * res)293*fd283ab1SHou Tao static void htab_mem_measure(struct bench_res *res)
294*fd283ab1SHou Tao {
295*fd283ab1SHou Tao 	res->hits = atomic_swap(&ctx.skel->bss->op_cnt, 0) / env.producer_cnt;
296*fd283ab1SHou Tao 	htab_mem_read_mem_cgrp_file("memory.current", &res->gp_ct);
297*fd283ab1SHou Tao }
298*fd283ab1SHou Tao 
htab_mem_report_progress(int iter,struct bench_res * res,long delta_ns)299*fd283ab1SHou Tao static void htab_mem_report_progress(int iter, struct bench_res *res, long delta_ns)
300*fd283ab1SHou Tao {
301*fd283ab1SHou Tao 	double loop, mem;
302*fd283ab1SHou Tao 
303*fd283ab1SHou Tao 	loop = res->hits / 1000.0 / (delta_ns / 1000000000.0);
304*fd283ab1SHou Tao 	mem = res->gp_ct / 1048576.0;
305*fd283ab1SHou Tao 	printf("Iter %3d (%7.3lfus): ", iter, (delta_ns - 1000000000) / 1000.0);
306*fd283ab1SHou Tao 	printf("per-prod-op %7.2lfk/s, memory usage %7.2lfMiB\n", loop, mem);
307*fd283ab1SHou Tao }
308*fd283ab1SHou Tao 
htab_mem_report_final(struct bench_res res[],int res_cnt)309*fd283ab1SHou Tao static void htab_mem_report_final(struct bench_res res[], int res_cnt)
310*fd283ab1SHou Tao {
311*fd283ab1SHou Tao 	double mem_mean = 0.0, mem_stddev = 0.0;
312*fd283ab1SHou Tao 	double loop_mean = 0.0, loop_stddev = 0.0;
313*fd283ab1SHou Tao 	unsigned long peak_mem;
314*fd283ab1SHou Tao 	int i;
315*fd283ab1SHou Tao 
316*fd283ab1SHou Tao 	for (i = 0; i < res_cnt; i++) {
317*fd283ab1SHou Tao 		loop_mean += res[i].hits / 1000.0 / (0.0 + res_cnt);
318*fd283ab1SHou Tao 		mem_mean += res[i].gp_ct / 1048576.0 / (0.0 + res_cnt);
319*fd283ab1SHou Tao 	}
320*fd283ab1SHou Tao 	if (res_cnt > 1)  {
321*fd283ab1SHou Tao 		for (i = 0; i < res_cnt; i++) {
322*fd283ab1SHou Tao 			loop_stddev += (loop_mean - res[i].hits / 1000.0) *
323*fd283ab1SHou Tao 				       (loop_mean - res[i].hits / 1000.0) /
324*fd283ab1SHou Tao 				       (res_cnt - 1.0);
325*fd283ab1SHou Tao 			mem_stddev += (mem_mean - res[i].gp_ct / 1048576.0) *
326*fd283ab1SHou Tao 				      (mem_mean - res[i].gp_ct / 1048576.0) /
327*fd283ab1SHou Tao 				      (res_cnt - 1.0);
328*fd283ab1SHou Tao 		}
329*fd283ab1SHou Tao 		loop_stddev = sqrt(loop_stddev);
330*fd283ab1SHou Tao 		mem_stddev = sqrt(mem_stddev);
331*fd283ab1SHou Tao 	}
332*fd283ab1SHou Tao 
333*fd283ab1SHou Tao 	htab_mem_read_mem_cgrp_file("memory.peak", &peak_mem);
334*fd283ab1SHou Tao 	printf("Summary: per-prod-op %7.2lf \u00B1 %7.2lfk/s, memory usage %7.2lf \u00B1 %7.2lfMiB,"
335*fd283ab1SHou Tao 	       " peak memory usage %7.2lfMiB\n",
336*fd283ab1SHou Tao 	       loop_mean, loop_stddev, mem_mean, mem_stddev, peak_mem / 1048576.0);
337*fd283ab1SHou Tao 
338*fd283ab1SHou Tao 	cleanup_cgroup_environment();
339*fd283ab1SHou Tao }
340*fd283ab1SHou Tao 
341*fd283ab1SHou Tao const struct bench bench_htab_mem = {
342*fd283ab1SHou Tao 	.name = "htab-mem",
343*fd283ab1SHou Tao 	.argp = &bench_htab_mem_argp,
344*fd283ab1SHou Tao 	.validate = htab_mem_validate,
345*fd283ab1SHou Tao 	.setup = htab_mem_setup,
346*fd283ab1SHou Tao 	.producer_thread = htab_mem_producer,
347*fd283ab1SHou Tao 	.measure = htab_mem_measure,
348*fd283ab1SHou Tao 	.report_progress = htab_mem_report_progress,
349*fd283ab1SHou Tao 	.report_final = htab_mem_report_final,
350*fd283ab1SHou Tao };
351