xref: /openbmc/linux/tools/testing/selftests/bpf/veristat.c (revision 34d6f206a88c2651d216bd3487ac956a40b2ba8e)
1  // SPDX-License-Identifier: (GPL-2.0-only OR BSD-2-Clause)
2  /* Copyright (c) 2022 Meta Platforms, Inc. and affiliates. */
3  #define _GNU_SOURCE
4  #include <argp.h>
5  #include <string.h>
6  #include <stdlib.h>
7  #include <sched.h>
8  #include <pthread.h>
9  #include <dirent.h>
10  #include <signal.h>
11  #include <fcntl.h>
12  #include <unistd.h>
13  #include <sys/time.h>
14  #include <sys/sysinfo.h>
15  #include <sys/stat.h>
16  #include <bpf/libbpf.h>
17  #include <bpf/btf.h>
18  #include <libelf.h>
19  #include <gelf.h>
20  #include <float.h>
21  
22  #ifndef ARRAY_SIZE
23  #define ARRAY_SIZE(arr) (sizeof(arr) / sizeof((arr)[0]))
24  #endif
25  
26  enum stat_id {
27  	VERDICT,
28  	DURATION,
29  	TOTAL_INSNS,
30  	TOTAL_STATES,
31  	PEAK_STATES,
32  	MAX_STATES_PER_INSN,
33  	MARK_READ_MAX_LEN,
34  
35  	FILE_NAME,
36  	PROG_NAME,
37  
38  	ALL_STATS_CNT,
39  	NUM_STATS_CNT = FILE_NAME - VERDICT,
40  };
41  
42  /* In comparison mode each stat can specify up to four different values:
43   *   - A side value;
44   *   - B side value;
45   *   - absolute diff value;
46   *   - relative (percentage) diff value.
47   *
48   * When specifying stat specs in comparison mode, user can use one of the
49   * following variant suffixes to specify which exact variant should be used for
50   * ordering or filtering:
51   *   - `_a` for A side value;
52   *   - `_b` for B side value;
53   *   - `_diff` for absolute diff value;
54   *   - `_pct` for relative (percentage) diff value.
55   *
56   * If no variant suffix is provided, then `_b` (control data) is assumed.
57   *
58   * As an example, let's say instructions stat has the following output:
59   *
60   * Insns (A)  Insns (B)  Insns   (DIFF)
61   * ---------  ---------  --------------
62   * 21547      20920       -627 (-2.91%)
63   *
64   * Then:
65   *   - 21547 is A side value (insns_a);
66   *   - 20920 is B side value (insns_b);
67   *   - -627 is absolute diff value (insns_diff);
68   *   - -2.91% is relative diff value (insns_pct).
69   *
70   * For verdict there is no verdict_pct variant.
71   * For file and program name, _a and _b variants are equivalent and there are
72   * no _diff or _pct variants.
73   */
74  enum stat_variant {
75  	VARIANT_A,
76  	VARIANT_B,
77  	VARIANT_DIFF,
78  	VARIANT_PCT,
79  };
80  
81  struct verif_stats {
82  	char *file_name;
83  	char *prog_name;
84  
85  	long stats[NUM_STATS_CNT];
86  };
87  
88  /* joined comparison mode stats */
89  struct verif_stats_join {
90  	char *file_name;
91  	char *prog_name;
92  
93  	const struct verif_stats *stats_a;
94  	const struct verif_stats *stats_b;
95  };
96  
97  struct stat_specs {
98  	int spec_cnt;
99  	enum stat_id ids[ALL_STATS_CNT];
100  	enum stat_variant variants[ALL_STATS_CNT];
101  	bool asc[ALL_STATS_CNT];
102  	int lens[ALL_STATS_CNT * 3]; /* 3x for comparison mode */
103  };
104  
105  enum resfmt {
106  	RESFMT_TABLE,
107  	RESFMT_TABLE_CALCLEN, /* fake format to pre-calculate table's column widths */
108  	RESFMT_CSV,
109  };
110  
111  enum filter_kind {
112  	FILTER_NAME,
113  	FILTER_STAT,
114  };
115  
116  enum operator_kind {
117  	OP_EQ,		/* == or = */
118  	OP_NEQ,		/* != or <> */
119  	OP_LT,		/* < */
120  	OP_LE,		/* <= */
121  	OP_GT,		/* > */
122  	OP_GE,		/* >= */
123  };
124  
125  struct filter {
126  	enum filter_kind kind;
127  	/* FILTER_NAME */
128  	char *any_glob;
129  	char *file_glob;
130  	char *prog_glob;
131  	/* FILTER_STAT */
132  	enum operator_kind op;
133  	int stat_id;
134  	enum stat_variant stat_var;
135  	long value;
136  };
137  
138  static struct env {
139  	char **filenames;
140  	int filename_cnt;
141  	bool verbose;
142  	bool debug;
143  	bool quiet;
144  	bool force_checkpoints;
145  	enum resfmt out_fmt;
146  	bool show_version;
147  	bool comparison_mode;
148  	bool replay_mode;
149  
150  	int log_level;
151  	int log_size;
152  	bool log_fixed;
153  
154  	struct verif_stats *prog_stats;
155  	int prog_stat_cnt;
156  
157  	/* baseline_stats is allocated and used only in comparison mode */
158  	struct verif_stats *baseline_stats;
159  	int baseline_stat_cnt;
160  
161  	struct verif_stats_join *join_stats;
162  	int join_stat_cnt;
163  
164  	struct stat_specs output_spec;
165  	struct stat_specs sort_spec;
166  
167  	struct filter *allow_filters;
168  	struct filter *deny_filters;
169  	int allow_filter_cnt;
170  	int deny_filter_cnt;
171  
172  	int files_processed;
173  	int files_skipped;
174  	int progs_processed;
175  	int progs_skipped;
176  } env;
177  
libbpf_print_fn(enum libbpf_print_level level,const char * format,va_list args)178  static int libbpf_print_fn(enum libbpf_print_level level, const char *format, va_list args)
179  {
180  	if (!env.verbose)
181  		return 0;
182  	if (level == LIBBPF_DEBUG  && !env.debug)
183  		return 0;
184  	return vfprintf(stderr, format, args);
185  }
186  
187  #ifndef VERISTAT_VERSION
188  #define VERISTAT_VERSION "<kernel>"
189  #endif
190  
191  const char *argp_program_version = "veristat v" VERISTAT_VERSION;
192  const char *argp_program_bug_address = "<bpf@vger.kernel.org>";
193  const char argp_program_doc[] =
194  "veristat    BPF verifier stats collection and comparison tool.\n"
195  "\n"
196  "USAGE: veristat <obj-file> [<obj-file>...]\n"
197  "   OR: veristat -C <baseline.csv> <comparison.csv>\n"
198  "   OR: veristat -R <results.csv>\n";
199  
200  enum {
201  	OPT_LOG_FIXED = 1000,
202  	OPT_LOG_SIZE = 1001,
203  };
204  
205  static const struct argp_option opts[] = {
206  	{ NULL, 'h', NULL, OPTION_HIDDEN, "Show the full help" },
207  	{ "version", 'V', NULL, 0, "Print version" },
208  	{ "verbose", 'v', NULL, 0, "Verbose mode" },
209  	{ "debug", 'd', NULL, 0, "Debug mode (turns on libbpf debug logging)" },
210  	{ "log-level", 'l', "LEVEL", 0, "Verifier log level (default 0 for normal mode, 1 for verbose mode)" },
211  	{ "log-fixed", OPT_LOG_FIXED, NULL, 0, "Disable verifier log rotation" },
212  	{ "log-size", OPT_LOG_SIZE, "BYTES", 0, "Customize verifier log size (default to 16MB)" },
213  	{ "test-states", 't', NULL, 0,
214  	  "Force frequent BPF verifier state checkpointing (set BPF_F_TEST_STATE_FREQ program flag)" },
215  	{ "quiet", 'q', NULL, 0, "Quiet mode" },
216  	{ "emit", 'e', "SPEC", 0, "Specify stats to be emitted" },
217  	{ "sort", 's', "SPEC", 0, "Specify sort order" },
218  	{ "output-format", 'o', "FMT", 0, "Result output format (table, csv), default is table." },
219  	{ "compare", 'C', NULL, 0, "Comparison mode" },
220  	{ "replay", 'R', NULL, 0, "Replay mode" },
221  	{ "filter", 'f', "FILTER", 0, "Filter expressions (or @filename for file with expressions)." },
222  	{},
223  };
224  
225  static int parse_stats(const char *stats_str, struct stat_specs *specs);
226  static int append_filter(struct filter **filters, int *cnt, const char *str);
227  static int append_filter_file(const char *path);
228  
parse_arg(int key,char * arg,struct argp_state * state)229  static error_t parse_arg(int key, char *arg, struct argp_state *state)
230  {
231  	void *tmp;
232  	int err;
233  
234  	switch (key) {
235  	case 'h':
236  		argp_state_help(state, stderr, ARGP_HELP_STD_HELP);
237  		break;
238  	case 'V':
239  		env.show_version = true;
240  		break;
241  	case 'v':
242  		env.verbose = true;
243  		break;
244  	case 'd':
245  		env.debug = true;
246  		env.verbose = true;
247  		break;
248  	case 'q':
249  		env.quiet = true;
250  		break;
251  	case 'e':
252  		err = parse_stats(arg, &env.output_spec);
253  		if (err)
254  			return err;
255  		break;
256  	case 's':
257  		err = parse_stats(arg, &env.sort_spec);
258  		if (err)
259  			return err;
260  		break;
261  	case 'o':
262  		if (strcmp(arg, "table") == 0) {
263  			env.out_fmt = RESFMT_TABLE;
264  		} else if (strcmp(arg, "csv") == 0) {
265  			env.out_fmt = RESFMT_CSV;
266  		} else {
267  			fprintf(stderr, "Unrecognized output format '%s'\n", arg);
268  			return -EINVAL;
269  		}
270  		break;
271  	case 'l':
272  		errno = 0;
273  		env.log_level = strtol(arg, NULL, 10);
274  		if (errno) {
275  			fprintf(stderr, "invalid log level: %s\n", arg);
276  			argp_usage(state);
277  		}
278  		break;
279  	case OPT_LOG_FIXED:
280  		env.log_fixed = true;
281  		break;
282  	case OPT_LOG_SIZE:
283  		errno = 0;
284  		env.log_size = strtol(arg, NULL, 10);
285  		if (errno) {
286  			fprintf(stderr, "invalid log size: %s\n", arg);
287  			argp_usage(state);
288  		}
289  		break;
290  	case 't':
291  		env.force_checkpoints = true;
292  		break;
293  	case 'C':
294  		env.comparison_mode = true;
295  		break;
296  	case 'R':
297  		env.replay_mode = true;
298  		break;
299  	case 'f':
300  		if (arg[0] == '@')
301  			err = append_filter_file(arg + 1);
302  		else if (arg[0] == '!')
303  			err = append_filter(&env.deny_filters, &env.deny_filter_cnt, arg + 1);
304  		else
305  			err = append_filter(&env.allow_filters, &env.allow_filter_cnt, arg);
306  		if (err) {
307  			fprintf(stderr, "Failed to collect program filter expressions: %d\n", err);
308  			return err;
309  		}
310  		break;
311  	case ARGP_KEY_ARG:
312  		tmp = realloc(env.filenames, (env.filename_cnt + 1) * sizeof(*env.filenames));
313  		if (!tmp)
314  			return -ENOMEM;
315  		env.filenames = tmp;
316  		env.filenames[env.filename_cnt] = strdup(arg);
317  		if (!env.filenames[env.filename_cnt])
318  			return -ENOMEM;
319  		env.filename_cnt++;
320  		break;
321  	default:
322  		return ARGP_ERR_UNKNOWN;
323  	}
324  	return 0;
325  }
326  
327  static const struct argp argp = {
328  	.options = opts,
329  	.parser = parse_arg,
330  	.doc = argp_program_doc,
331  };
332  
333  
334  /* Adapted from perf/util/string.c */
glob_matches(const char * str,const char * pat)335  static bool glob_matches(const char *str, const char *pat)
336  {
337  	while (*str && *pat && *pat != '*') {
338  		if (*str != *pat)
339  			return false;
340  		str++;
341  		pat++;
342  	}
343  	/* Check wild card */
344  	if (*pat == '*') {
345  		while (*pat == '*')
346  			pat++;
347  		if (!*pat) /* Tail wild card matches all */
348  			return true;
349  		while (*str)
350  			if (glob_matches(str++, pat))
351  				return true;
352  	}
353  	return !*str && !*pat;
354  }
355  
is_bpf_obj_file(const char * path)356  static bool is_bpf_obj_file(const char *path) {
357  	Elf64_Ehdr *ehdr;
358  	int fd, err = -EINVAL;
359  	Elf *elf = NULL;
360  
361  	fd = open(path, O_RDONLY | O_CLOEXEC);
362  	if (fd < 0)
363  		return true; /* we'll fail later and propagate error */
364  
365  	/* ensure libelf is initialized */
366  	(void)elf_version(EV_CURRENT);
367  
368  	elf = elf_begin(fd, ELF_C_READ, NULL);
369  	if (!elf)
370  		goto cleanup;
371  
372  	if (elf_kind(elf) != ELF_K_ELF || gelf_getclass(elf) != ELFCLASS64)
373  		goto cleanup;
374  
375  	ehdr = elf64_getehdr(elf);
376  	/* Old LLVM set e_machine to EM_NONE */
377  	if (!ehdr || ehdr->e_type != ET_REL || (ehdr->e_machine && ehdr->e_machine != EM_BPF))
378  		goto cleanup;
379  
380  	err = 0;
381  cleanup:
382  	if (elf)
383  		elf_end(elf);
384  	close(fd);
385  	return err == 0;
386  }
387  
should_process_file_prog(const char * filename,const char * prog_name)388  static bool should_process_file_prog(const char *filename, const char *prog_name)
389  {
390  	struct filter *f;
391  	int i, allow_cnt = 0;
392  
393  	for (i = 0; i < env.deny_filter_cnt; i++) {
394  		f = &env.deny_filters[i];
395  		if (f->kind != FILTER_NAME)
396  			continue;
397  
398  		if (f->any_glob && glob_matches(filename, f->any_glob))
399  			return false;
400  		if (f->any_glob && prog_name && glob_matches(prog_name, f->any_glob))
401  			return false;
402  		if (f->file_glob && glob_matches(filename, f->file_glob))
403  			return false;
404  		if (f->prog_glob && prog_name && glob_matches(prog_name, f->prog_glob))
405  			return false;
406  	}
407  
408  	for (i = 0; i < env.allow_filter_cnt; i++) {
409  		f = &env.allow_filters[i];
410  		if (f->kind != FILTER_NAME)
411  			continue;
412  
413  		allow_cnt++;
414  		if (f->any_glob) {
415  			if (glob_matches(filename, f->any_glob))
416  				return true;
417  			/* If we don't know program name yet, any_glob filter
418  			 * has to assume that current BPF object file might be
419  			 * relevant; we'll check again later on after opening
420  			 * BPF object file, at which point program name will
421  			 * be known finally.
422  			 */
423  			if (!prog_name || glob_matches(prog_name, f->any_glob))
424  				return true;
425  		} else {
426  			if (f->file_glob && !glob_matches(filename, f->file_glob))
427  				continue;
428  			if (f->prog_glob && prog_name && !glob_matches(prog_name, f->prog_glob))
429  				continue;
430  			return true;
431  		}
432  	}
433  
434  	/* if there are no file/prog name allow filters, allow all progs,
435  	 * unless they are denied earlier explicitly
436  	 */
437  	return allow_cnt == 0;
438  }
439  
440  static struct {
441  	enum operator_kind op_kind;
442  	const char *op_str;
443  } operators[] = {
444  	/* Order of these definitions matter to avoid situations like '<'
445  	 * matching part of what is actually a '<>' operator. That is,
446  	 * substrings should go last.
447  	 */
448  	{ OP_EQ, "==" },
449  	{ OP_NEQ, "!=" },
450  	{ OP_NEQ, "<>" },
451  	{ OP_LE, "<=" },
452  	{ OP_LT, "<" },
453  	{ OP_GE, ">=" },
454  	{ OP_GT, ">" },
455  	{ OP_EQ, "=" },
456  };
457  
458  static bool parse_stat_id_var(const char *name, size_t len, int *id, enum stat_variant *var);
459  
append_filter(struct filter ** filters,int * cnt,const char * str)460  static int append_filter(struct filter **filters, int *cnt, const char *str)
461  {
462  	struct filter *f;
463  	void *tmp;
464  	const char *p;
465  	int i;
466  
467  	tmp = realloc(*filters, (*cnt + 1) * sizeof(**filters));
468  	if (!tmp)
469  		return -ENOMEM;
470  	*filters = tmp;
471  
472  	f = &(*filters)[*cnt];
473  	memset(f, 0, sizeof(*f));
474  
475  	/* First, let's check if it's a stats filter of the following form:
476  	 * <stat><op><value, where:
477  	 *   - <stat> is one of supported numerical stats (verdict is also
478  	 *     considered numerical, failure == 0, success == 1);
479  	 *   - <op> is comparison operator (see `operators` definitions);
480  	 *   - <value> is an integer (or failure/success, or false/true as
481  	 *     special aliases for 0 and 1, respectively).
482  	 * If the form doesn't match what user provided, we assume file/prog
483  	 * glob filter.
484  	 */
485  	for (i = 0; i < ARRAY_SIZE(operators); i++) {
486  		enum stat_variant var;
487  		int id;
488  		long val;
489  		const char *end = str;
490  		const char *op_str;
491  
492  		op_str = operators[i].op_str;
493  		p = strstr(str, op_str);
494  		if (!p)
495  			continue;
496  
497  		if (!parse_stat_id_var(str, p - str, &id, &var)) {
498  			fprintf(stderr, "Unrecognized stat name in '%s'!\n", str);
499  			return -EINVAL;
500  		}
501  		if (id >= FILE_NAME) {
502  			fprintf(stderr, "Non-integer stat is specified in '%s'!\n", str);
503  			return -EINVAL;
504  		}
505  
506  		p += strlen(op_str);
507  
508  		if (strcasecmp(p, "true") == 0 ||
509  		    strcasecmp(p, "t") == 0 ||
510  		    strcasecmp(p, "success") == 0 ||
511  		    strcasecmp(p, "succ") == 0 ||
512  		    strcasecmp(p, "s") == 0 ||
513  		    strcasecmp(p, "match") == 0 ||
514  		    strcasecmp(p, "m") == 0) {
515  			val = 1;
516  		} else if (strcasecmp(p, "false") == 0 ||
517  			   strcasecmp(p, "f") == 0 ||
518  			   strcasecmp(p, "failure") == 0 ||
519  			   strcasecmp(p, "fail") == 0 ||
520  			   strcasecmp(p, "mismatch") == 0 ||
521  			   strcasecmp(p, "mis") == 0) {
522  			val = 0;
523  		} else {
524  			errno = 0;
525  			val = strtol(p, (char **)&end, 10);
526  			if (errno || end == p || *end != '\0' ) {
527  				fprintf(stderr, "Invalid integer value in '%s'!\n", str);
528  				return -EINVAL;
529  			}
530  		}
531  
532  		f->kind = FILTER_STAT;
533  		f->stat_id = id;
534  		f->stat_var = var;
535  		f->op = operators[i].op_kind;
536  		f->value = val;
537  
538  		*cnt += 1;
539  		return 0;
540  	}
541  
542  	/* File/prog filter can be specified either as '<glob>' or
543  	 * '<file-glob>/<prog-glob>'. In the former case <glob> is applied to
544  	 * both file and program names. This seems to be way more useful in
545  	 * practice. If user needs full control, they can use '/<prog-glob>'
546  	 * form to glob just program name, or '<file-glob>/' to glob only file
547  	 * name. But usually common <glob> seems to be the most useful and
548  	 * ergonomic way.
549  	 */
550  	f->kind = FILTER_NAME;
551  	p = strchr(str, '/');
552  	if (!p) {
553  		f->any_glob = strdup(str);
554  		if (!f->any_glob)
555  			return -ENOMEM;
556  	} else {
557  		if (str != p) {
558  			/* non-empty file glob */
559  			f->file_glob = strndup(str, p - str);
560  			if (!f->file_glob)
561  				return -ENOMEM;
562  		}
563  		if (strlen(p + 1) > 0) {
564  			/* non-empty prog glob */
565  			f->prog_glob = strdup(p + 1);
566  			if (!f->prog_glob) {
567  				free(f->file_glob);
568  				f->file_glob = NULL;
569  				return -ENOMEM;
570  			}
571  		}
572  	}
573  
574  	*cnt += 1;
575  	return 0;
576  }
577  
append_filter_file(const char * path)578  static int append_filter_file(const char *path)
579  {
580  	char buf[1024];
581  	FILE *f;
582  	int err = 0;
583  
584  	f = fopen(path, "r");
585  	if (!f) {
586  		err = -errno;
587  		fprintf(stderr, "Failed to open filters in '%s': %d\n", path, err);
588  		return err;
589  	}
590  
591  	while (fscanf(f, " %1023[^\n]\n", buf) == 1) {
592  		/* lines starting with # are comments, skip them */
593  		if (buf[0] == '\0' || buf[0] == '#')
594  			continue;
595  		/* lines starting with ! are negative match filters */
596  		if (buf[0] == '!')
597  			err = append_filter(&env.deny_filters, &env.deny_filter_cnt, buf + 1);
598  		else
599  			err = append_filter(&env.allow_filters, &env.allow_filter_cnt, buf);
600  		if (err)
601  			goto cleanup;
602  	}
603  
604  cleanup:
605  	fclose(f);
606  	return err;
607  }
608  
609  static const struct stat_specs default_output_spec = {
610  	.spec_cnt = 7,
611  	.ids = {
612  		FILE_NAME, PROG_NAME, VERDICT, DURATION,
613  		TOTAL_INSNS, TOTAL_STATES, PEAK_STATES,
614  	},
615  };
616  
617  static const struct stat_specs default_csv_output_spec = {
618  	.spec_cnt = 9,
619  	.ids = {
620  		FILE_NAME, PROG_NAME, VERDICT, DURATION,
621  		TOTAL_INSNS, TOTAL_STATES, PEAK_STATES,
622  		MAX_STATES_PER_INSN, MARK_READ_MAX_LEN,
623  	},
624  };
625  
626  static const struct stat_specs default_sort_spec = {
627  	.spec_cnt = 2,
628  	.ids = {
629  		FILE_NAME, PROG_NAME,
630  	},
631  	.asc = { true, true, },
632  };
633  
634  /* sorting for comparison mode to join two data sets */
635  static const struct stat_specs join_sort_spec = {
636  	.spec_cnt = 2,
637  	.ids = {
638  		FILE_NAME, PROG_NAME,
639  	},
640  	.asc = { true, true, },
641  };
642  
643  static struct stat_def {
644  	const char *header;
645  	const char *names[4];
646  	bool asc_by_default;
647  	bool left_aligned;
648  } stat_defs[] = {
649  	[FILE_NAME] = { "File", {"file_name", "filename", "file"}, true /* asc */, true /* left */ },
650  	[PROG_NAME] = { "Program", {"prog_name", "progname", "prog"}, true /* asc */, true /* left */ },
651  	[VERDICT] = { "Verdict", {"verdict"}, true /* asc: failure, success */, true /* left */ },
652  	[DURATION] = { "Duration (us)", {"duration", "dur"}, },
653  	[TOTAL_INSNS] = { "Insns", {"total_insns", "insns"}, },
654  	[TOTAL_STATES] = { "States", {"total_states", "states"}, },
655  	[PEAK_STATES] = { "Peak states", {"peak_states"}, },
656  	[MAX_STATES_PER_INSN] = { "Max states per insn", {"max_states_per_insn"}, },
657  	[MARK_READ_MAX_LEN] = { "Max mark read length", {"max_mark_read_len", "mark_read"}, },
658  };
659  
parse_stat_id_var(const char * name,size_t len,int * id,enum stat_variant * var)660  static bool parse_stat_id_var(const char *name, size_t len, int *id, enum stat_variant *var)
661  {
662  	static const char *var_sfxs[] = {
663  		[VARIANT_A] = "_a",
664  		[VARIANT_B] = "_b",
665  		[VARIANT_DIFF] = "_diff",
666  		[VARIANT_PCT] = "_pct",
667  	};
668  	int i, j, k;
669  
670  	for (i = 0; i < ARRAY_SIZE(stat_defs); i++) {
671  		struct stat_def *def = &stat_defs[i];
672  		size_t alias_len, sfx_len;
673  		const char *alias;
674  
675  		for (j = 0; j < ARRAY_SIZE(stat_defs[i].names); j++) {
676  			alias = def->names[j];
677  			if (!alias)
678  				continue;
679  
680  			alias_len = strlen(alias);
681  			if (strncmp(name, alias, alias_len) != 0)
682  				continue;
683  
684  			if (alias_len == len) {
685  				/* If no variant suffix is specified, we
686  				 * assume control group (just in case we are
687  				 * in comparison mode. Variant is ignored in
688  				 * non-comparison mode.
689  				 */
690  				*var = VARIANT_B;
691  				*id = i;
692  				return true;
693  			}
694  
695  			for (k = 0; k < ARRAY_SIZE(var_sfxs); k++) {
696  				sfx_len = strlen(var_sfxs[k]);
697  				if (alias_len + sfx_len != len)
698  					continue;
699  
700  				if (strncmp(name + alias_len, var_sfxs[k], sfx_len) == 0) {
701  					*var = (enum stat_variant)k;
702  					*id = i;
703  					return true;
704  				}
705  			}
706  		}
707  	}
708  
709  	return false;
710  }
711  
is_asc_sym(char c)712  static bool is_asc_sym(char c)
713  {
714  	return c == '^';
715  }
716  
is_desc_sym(char c)717  static bool is_desc_sym(char c)
718  {
719  	return c == 'v' || c == 'V' || c == '.' || c == '!' || c == '_';
720  }
721  
parse_stat(const char * stat_name,struct stat_specs * specs)722  static int parse_stat(const char *stat_name, struct stat_specs *specs)
723  {
724  	int id;
725  	bool has_order = false, is_asc = false;
726  	size_t len = strlen(stat_name);
727  	enum stat_variant var;
728  
729  	if (specs->spec_cnt >= ARRAY_SIZE(specs->ids)) {
730  		fprintf(stderr, "Can't specify more than %zd stats\n", ARRAY_SIZE(specs->ids));
731  		return -E2BIG;
732  	}
733  
734  	if (len > 1 && (is_asc_sym(stat_name[len - 1]) || is_desc_sym(stat_name[len - 1]))) {
735  		has_order = true;
736  		is_asc = is_asc_sym(stat_name[len - 1]);
737  		len -= 1;
738  	}
739  
740  	if (!parse_stat_id_var(stat_name, len, &id, &var)) {
741  		fprintf(stderr, "Unrecognized stat name '%s'\n", stat_name);
742  		return -ESRCH;
743  	}
744  
745  	specs->ids[specs->spec_cnt] = id;
746  	specs->variants[specs->spec_cnt] = var;
747  	specs->asc[specs->spec_cnt] = has_order ? is_asc : stat_defs[id].asc_by_default;
748  	specs->spec_cnt++;
749  
750  	return 0;
751  }
752  
parse_stats(const char * stats_str,struct stat_specs * specs)753  static int parse_stats(const char *stats_str, struct stat_specs *specs)
754  {
755  	char *input, *state = NULL, *next;
756  	int err, cnt = 0;
757  
758  	input = strdup(stats_str);
759  	if (!input)
760  		return -ENOMEM;
761  
762  	while ((next = strtok_r(cnt++ ? NULL : input, ",", &state))) {
763  		err = parse_stat(next, specs);
764  		if (err)
765  			return err;
766  	}
767  
768  	return 0;
769  }
770  
free_verif_stats(struct verif_stats * stats,size_t stat_cnt)771  static void free_verif_stats(struct verif_stats *stats, size_t stat_cnt)
772  {
773  	int i;
774  
775  	if (!stats)
776  		return;
777  
778  	for (i = 0; i < stat_cnt; i++) {
779  		free(stats[i].file_name);
780  		free(stats[i].prog_name);
781  	}
782  	free(stats);
783  }
784  
785  static char verif_log_buf[64 * 1024];
786  
787  #define MAX_PARSED_LOG_LINES 100
788  
parse_verif_log(char * const buf,size_t buf_sz,struct verif_stats * s)789  static int parse_verif_log(char * const buf, size_t buf_sz, struct verif_stats *s)
790  {
791  	const char *cur;
792  	int pos, lines;
793  
794  	buf[buf_sz - 1] = '\0';
795  
796  	for (pos = strlen(buf) - 1, lines = 0; pos >= 0 && lines < MAX_PARSED_LOG_LINES; lines++) {
797  		/* find previous endline or otherwise take the start of log buf */
798  		for (cur = &buf[pos]; cur > buf && cur[0] != '\n'; cur--, pos--) {
799  		}
800  		/* next time start from end of previous line (or pos goes to <0) */
801  		pos--;
802  		/* if we found endline, point right after endline symbol;
803  		 * otherwise, stay at the beginning of log buf
804  		 */
805  		if (cur[0] == '\n')
806  			cur++;
807  
808  		if (1 == sscanf(cur, "verification time %ld usec\n", &s->stats[DURATION]))
809  			continue;
810  		if (6 == sscanf(cur, "processed %ld insns (limit %*d) max_states_per_insn %ld total_states %ld peak_states %ld mark_read %ld",
811  				&s->stats[TOTAL_INSNS],
812  				&s->stats[MAX_STATES_PER_INSN],
813  				&s->stats[TOTAL_STATES],
814  				&s->stats[PEAK_STATES],
815  				&s->stats[MARK_READ_MAX_LEN]))
816  			continue;
817  	}
818  
819  	return 0;
820  }
821  
guess_prog_type_by_ctx_name(const char * ctx_name,enum bpf_prog_type * prog_type,enum bpf_attach_type * attach_type)822  static int guess_prog_type_by_ctx_name(const char *ctx_name,
823  				       enum bpf_prog_type *prog_type,
824  				       enum bpf_attach_type *attach_type)
825  {
826  	/* We need to guess program type based on its declared context type.
827  	 * This guess can't be perfect as many different program types might
828  	 * share the same context type.  So we can only hope to reasonably
829  	 * well guess this and get lucky.
830  	 *
831  	 * Just in case, we support both UAPI-side type names and
832  	 * kernel-internal names.
833  	 */
834  	static struct {
835  		const char *uapi_name;
836  		const char *kern_name;
837  		enum bpf_prog_type prog_type;
838  		enum bpf_attach_type attach_type;
839  	} ctx_map[] = {
840  		/* __sk_buff is most ambiguous, we assume TC program */
841  		{ "__sk_buff", "sk_buff", BPF_PROG_TYPE_SCHED_CLS },
842  		{ "bpf_sock", "sock", BPF_PROG_TYPE_CGROUP_SOCK, BPF_CGROUP_INET4_POST_BIND },
843  		{ "bpf_sock_addr", "bpf_sock_addr_kern",  BPF_PROG_TYPE_CGROUP_SOCK_ADDR, BPF_CGROUP_INET4_BIND },
844  		{ "bpf_sock_ops", "bpf_sock_ops_kern", BPF_PROG_TYPE_SOCK_OPS, BPF_CGROUP_SOCK_OPS },
845  		{ "sk_msg_md", "sk_msg", BPF_PROG_TYPE_SK_MSG, BPF_SK_MSG_VERDICT },
846  		{ "bpf_cgroup_dev_ctx", "bpf_cgroup_dev_ctx", BPF_PROG_TYPE_CGROUP_DEVICE, BPF_CGROUP_DEVICE },
847  		{ "bpf_sysctl", "bpf_sysctl_kern", BPF_PROG_TYPE_CGROUP_SYSCTL, BPF_CGROUP_SYSCTL },
848  		{ "bpf_sockopt", "bpf_sockopt_kern", BPF_PROG_TYPE_CGROUP_SOCKOPT, BPF_CGROUP_SETSOCKOPT },
849  		{ "sk_reuseport_md", "sk_reuseport_kern", BPF_PROG_TYPE_SK_REUSEPORT, BPF_SK_REUSEPORT_SELECT_OR_MIGRATE },
850  		{ "bpf_sk_lookup", "bpf_sk_lookup_kern", BPF_PROG_TYPE_SK_LOOKUP, BPF_SK_LOOKUP },
851  		{ "xdp_md", "xdp_buff", BPF_PROG_TYPE_XDP, BPF_XDP },
852  		/* tracing types with no expected attach type */
853  		{ "bpf_user_pt_regs_t", "pt_regs", BPF_PROG_TYPE_KPROBE },
854  		{ "bpf_perf_event_data", "bpf_perf_event_data_kern", BPF_PROG_TYPE_PERF_EVENT },
855  		/* raw_tp programs use u64[] from kernel side, we don't want
856  		 * to match on that, probably; so NULL for kern-side type
857  		 */
858  		{ "bpf_raw_tracepoint_args", NULL, BPF_PROG_TYPE_RAW_TRACEPOINT },
859  	};
860  	int i;
861  
862  	if (!ctx_name)
863  		return -EINVAL;
864  
865  	for (i = 0; i < ARRAY_SIZE(ctx_map); i++) {
866  		if (strcmp(ctx_map[i].uapi_name, ctx_name) == 0 ||
867  		    (ctx_map[i].kern_name && strcmp(ctx_map[i].kern_name, ctx_name) == 0)) {
868  			*prog_type = ctx_map[i].prog_type;
869  			*attach_type = ctx_map[i].attach_type;
870  			return 0;
871  		}
872  	}
873  
874  	return -ESRCH;
875  }
876  
fixup_obj(struct bpf_object * obj,struct bpf_program * prog,const char * filename)877  static void fixup_obj(struct bpf_object *obj, struct bpf_program *prog, const char *filename)
878  {
879  	struct bpf_map *map;
880  
881  	bpf_object__for_each_map(map, obj) {
882  		/* disable pinning */
883  		bpf_map__set_pin_path(map, NULL);
884  
885  		/* fix up map size, if necessary */
886  		switch (bpf_map__type(map)) {
887  		case BPF_MAP_TYPE_SK_STORAGE:
888  		case BPF_MAP_TYPE_TASK_STORAGE:
889  		case BPF_MAP_TYPE_INODE_STORAGE:
890  		case BPF_MAP_TYPE_CGROUP_STORAGE:
891  			break;
892  		default:
893  			if (bpf_map__max_entries(map) == 0)
894  				bpf_map__set_max_entries(map, 1);
895  		}
896  	}
897  
898  	/* SEC(freplace) programs can't be loaded with veristat as is,
899  	 * but we can try guessing their target program's expected type by
900  	 * looking at the type of program's first argument and substituting
901  	 * corresponding program type
902  	 */
903  	if (bpf_program__type(prog) == BPF_PROG_TYPE_EXT) {
904  		const struct btf *btf = bpf_object__btf(obj);
905  		const char *prog_name = bpf_program__name(prog);
906  		enum bpf_prog_type prog_type;
907  		enum bpf_attach_type attach_type;
908  		const struct btf_type *t;
909  		const char *ctx_name;
910  		int id;
911  
912  		if (!btf)
913  			goto skip_freplace_fixup;
914  
915  		id = btf__find_by_name_kind(btf, prog_name, BTF_KIND_FUNC);
916  		t = btf__type_by_id(btf, id);
917  		t = btf__type_by_id(btf, t->type);
918  		if (!btf_is_func_proto(t) || btf_vlen(t) != 1)
919  			goto skip_freplace_fixup;
920  
921  		/* context argument is a pointer to a struct/typedef */
922  		t = btf__type_by_id(btf, btf_params(t)[0].type);
923  		while (t && btf_is_mod(t))
924  			t = btf__type_by_id(btf, t->type);
925  		if (!t || !btf_is_ptr(t))
926  			goto skip_freplace_fixup;
927  		t = btf__type_by_id(btf, t->type);
928  		while (t && btf_is_mod(t))
929  			t = btf__type_by_id(btf, t->type);
930  		if (!t)
931  			goto skip_freplace_fixup;
932  
933  		ctx_name = btf__name_by_offset(btf, t->name_off);
934  
935  		if (guess_prog_type_by_ctx_name(ctx_name, &prog_type, &attach_type) == 0) {
936  			bpf_program__set_type(prog, prog_type);
937  			bpf_program__set_expected_attach_type(prog, attach_type);
938  
939  			if (!env.quiet) {
940  				printf("Using guessed program type '%s' for %s/%s...\n",
941  					libbpf_bpf_prog_type_str(prog_type),
942  					filename, prog_name);
943  			}
944  		} else {
945  			if (!env.quiet) {
946  				printf("Failed to guess program type for freplace program with context type name '%s' for %s/%s. Consider using canonical type names to help veristat...\n",
947  					ctx_name, filename, prog_name);
948  			}
949  		}
950  	}
951  skip_freplace_fixup:
952  	return;
953  }
954  
process_prog(const char * filename,struct bpf_object * obj,struct bpf_program * prog)955  static int process_prog(const char *filename, struct bpf_object *obj, struct bpf_program *prog)
956  {
957  	const char *prog_name = bpf_program__name(prog);
958  	const char *base_filename = basename(filename);
959  	char *buf;
960  	int buf_sz, log_level;
961  	struct verif_stats *stats;
962  	int err = 0;
963  	void *tmp;
964  
965  	if (!should_process_file_prog(base_filename, bpf_program__name(prog))) {
966  		env.progs_skipped++;
967  		return 0;
968  	}
969  
970  	tmp = realloc(env.prog_stats, (env.prog_stat_cnt + 1) * sizeof(*env.prog_stats));
971  	if (!tmp)
972  		return -ENOMEM;
973  	env.prog_stats = tmp;
974  	stats = &env.prog_stats[env.prog_stat_cnt++];
975  	memset(stats, 0, sizeof(*stats));
976  
977  	if (env.verbose) {
978  		buf_sz = env.log_size ? env.log_size : 16 * 1024 * 1024;
979  		buf = malloc(buf_sz);
980  		if (!buf)
981  			return -ENOMEM;
982  		/* ensure we always request stats */
983  		log_level = env.log_level | 4 | (env.log_fixed ? 8 : 0);
984  	} else {
985  		buf = verif_log_buf;
986  		buf_sz = sizeof(verif_log_buf);
987  		/* request only verifier stats */
988  		log_level = 4 | (env.log_fixed ? 8 : 0);
989  	}
990  	verif_log_buf[0] = '\0';
991  
992  	bpf_program__set_log_buf(prog, buf, buf_sz);
993  	bpf_program__set_log_level(prog, log_level);
994  
995  	/* increase chances of successful BPF object loading */
996  	fixup_obj(obj, prog, base_filename);
997  
998  	if (env.force_checkpoints)
999  		bpf_program__set_flags(prog, bpf_program__flags(prog) | BPF_F_TEST_STATE_FREQ);
1000  
1001  	err = bpf_object__load(obj);
1002  	env.progs_processed++;
1003  
1004  	stats->file_name = strdup(base_filename);
1005  	stats->prog_name = strdup(bpf_program__name(prog));
1006  	stats->stats[VERDICT] = err == 0; /* 1 - success, 0 - failure */
1007  	parse_verif_log(buf, buf_sz, stats);
1008  
1009  	if (env.verbose) {
1010  		printf("PROCESSING %s/%s, DURATION US: %ld, VERDICT: %s, VERIFIER LOG:\n%s\n",
1011  		       filename, prog_name, stats->stats[DURATION],
1012  		       err ? "failure" : "success", buf);
1013  	}
1014  
1015  	if (verif_log_buf != buf)
1016  		free(buf);
1017  
1018  	return 0;
1019  };
1020  
process_obj(const char * filename)1021  static int process_obj(const char *filename)
1022  {
1023  	struct bpf_object *obj = NULL, *tobj;
1024  	struct bpf_program *prog, *tprog, *lprog;
1025  	libbpf_print_fn_t old_libbpf_print_fn;
1026  	LIBBPF_OPTS(bpf_object_open_opts, opts);
1027  	int err = 0, prog_cnt = 0;
1028  
1029  	if (!should_process_file_prog(basename(filename), NULL)) {
1030  		if (env.verbose)
1031  			printf("Skipping '%s' due to filters...\n", filename);
1032  		env.files_skipped++;
1033  		return 0;
1034  	}
1035  	if (!is_bpf_obj_file(filename)) {
1036  		if (env.verbose)
1037  			printf("Skipping '%s' as it's not a BPF object file...\n", filename);
1038  		env.files_skipped++;
1039  		return 0;
1040  	}
1041  
1042  	if (!env.quiet && env.out_fmt == RESFMT_TABLE)
1043  		printf("Processing '%s'...\n", basename(filename));
1044  
1045  	old_libbpf_print_fn = libbpf_set_print(libbpf_print_fn);
1046  	obj = bpf_object__open_file(filename, &opts);
1047  	if (!obj) {
1048  		/* if libbpf can't open BPF object file, it could be because
1049  		 * that BPF object file is incomplete and has to be statically
1050  		 * linked into a final BPF object file; instead of bailing
1051  		 * out, report it into stderr, mark it as skipped, and
1052  		 * proceed
1053  		 */
1054  		fprintf(stderr, "Failed to open '%s': %d\n", filename, -errno);
1055  		env.files_skipped++;
1056  		err = 0;
1057  		goto cleanup;
1058  	}
1059  
1060  	env.files_processed++;
1061  
1062  	bpf_object__for_each_program(prog, obj) {
1063  		prog_cnt++;
1064  	}
1065  
1066  	if (prog_cnt == 1) {
1067  		prog = bpf_object__next_program(obj, NULL);
1068  		bpf_program__set_autoload(prog, true);
1069  		process_prog(filename, obj, prog);
1070  		goto cleanup;
1071  	}
1072  
1073  	bpf_object__for_each_program(prog, obj) {
1074  		const char *prog_name = bpf_program__name(prog);
1075  
1076  		tobj = bpf_object__open_file(filename, &opts);
1077  		if (!tobj) {
1078  			err = -errno;
1079  			fprintf(stderr, "Failed to open '%s': %d\n", filename, err);
1080  			goto cleanup;
1081  		}
1082  
1083  		lprog = NULL;
1084  		bpf_object__for_each_program(tprog, tobj) {
1085  			const char *tprog_name = bpf_program__name(tprog);
1086  
1087  			if (strcmp(prog_name, tprog_name) == 0) {
1088  				bpf_program__set_autoload(tprog, true);
1089  				lprog = tprog;
1090  			} else {
1091  				bpf_program__set_autoload(tprog, false);
1092  			}
1093  		}
1094  
1095  		process_prog(filename, tobj, lprog);
1096  		bpf_object__close(tobj);
1097  	}
1098  
1099  cleanup:
1100  	bpf_object__close(obj);
1101  	libbpf_set_print(old_libbpf_print_fn);
1102  	return err;
1103  }
1104  
cmp_stat(const struct verif_stats * s1,const struct verif_stats * s2,enum stat_id id,bool asc)1105  static int cmp_stat(const struct verif_stats *s1, const struct verif_stats *s2,
1106  		    enum stat_id id, bool asc)
1107  {
1108  	int cmp = 0;
1109  
1110  	switch (id) {
1111  	case FILE_NAME:
1112  		cmp = strcmp(s1->file_name, s2->file_name);
1113  		break;
1114  	case PROG_NAME:
1115  		cmp = strcmp(s1->prog_name, s2->prog_name);
1116  		break;
1117  	case VERDICT:
1118  	case DURATION:
1119  	case TOTAL_INSNS:
1120  	case TOTAL_STATES:
1121  	case PEAK_STATES:
1122  	case MAX_STATES_PER_INSN:
1123  	case MARK_READ_MAX_LEN: {
1124  		long v1 = s1->stats[id];
1125  		long v2 = s2->stats[id];
1126  
1127  		if (v1 != v2)
1128  			cmp = v1 < v2 ? -1 : 1;
1129  		break;
1130  	}
1131  	default:
1132  		fprintf(stderr, "Unrecognized stat #%d\n", id);
1133  		exit(1);
1134  	}
1135  
1136  	return asc ? cmp : -cmp;
1137  }
1138  
cmp_prog_stats(const void * v1,const void * v2)1139  static int cmp_prog_stats(const void *v1, const void *v2)
1140  {
1141  	const struct verif_stats *s1 = v1, *s2 = v2;
1142  	int i, cmp;
1143  
1144  	for (i = 0; i < env.sort_spec.spec_cnt; i++) {
1145  		cmp = cmp_stat(s1, s2, env.sort_spec.ids[i], env.sort_spec.asc[i]);
1146  		if (cmp != 0)
1147  			return cmp;
1148  	}
1149  
1150  	/* always disambiguate with file+prog, which are unique */
1151  	cmp = strcmp(s1->file_name, s2->file_name);
1152  	if (cmp != 0)
1153  		return cmp;
1154  	return strcmp(s1->prog_name, s2->prog_name);
1155  }
1156  
fetch_join_stat_value(const struct verif_stats_join * s,enum stat_id id,enum stat_variant var,const char ** str_val,double * num_val)1157  static void fetch_join_stat_value(const struct verif_stats_join *s,
1158  				  enum stat_id id, enum stat_variant var,
1159  				  const char **str_val,
1160  				  double *num_val)
1161  {
1162  	long v1, v2;
1163  
1164  	if (id == FILE_NAME) {
1165  		*str_val = s->file_name;
1166  		return;
1167  	}
1168  	if (id == PROG_NAME) {
1169  		*str_val = s->prog_name;
1170  		return;
1171  	}
1172  
1173  	v1 = s->stats_a ? s->stats_a->stats[id] : 0;
1174  	v2 = s->stats_b ? s->stats_b->stats[id] : 0;
1175  
1176  	switch (var) {
1177  	case VARIANT_A:
1178  		if (!s->stats_a)
1179  			*num_val = -DBL_MAX;
1180  		else
1181  			*num_val = s->stats_a->stats[id];
1182  		return;
1183  	case VARIANT_B:
1184  		if (!s->stats_b)
1185  			*num_val = -DBL_MAX;
1186  		else
1187  			*num_val = s->stats_b->stats[id];
1188  		return;
1189  	case VARIANT_DIFF:
1190  		if (!s->stats_a || !s->stats_b)
1191  			*num_val = -DBL_MAX;
1192  		else if (id == VERDICT)
1193  			*num_val = v1 == v2 ? 1.0 /* MATCH */ : 0.0 /* MISMATCH */;
1194  		else
1195  			*num_val = (double)(v2 - v1);
1196  		return;
1197  	case VARIANT_PCT:
1198  		if (!s->stats_a || !s->stats_b) {
1199  			*num_val = -DBL_MAX;
1200  		} else if (v1 == 0) {
1201  			if (v1 == v2)
1202  				*num_val = 0.0;
1203  			else
1204  				*num_val = v2 < v1 ? -100.0 : 100.0;
1205  		} else {
1206  			 *num_val = (v2 - v1) * 100.0 / v1;
1207  		}
1208  		return;
1209  	}
1210  }
1211  
cmp_join_stat(const struct verif_stats_join * s1,const struct verif_stats_join * s2,enum stat_id id,enum stat_variant var,bool asc)1212  static int cmp_join_stat(const struct verif_stats_join *s1,
1213  			 const struct verif_stats_join *s2,
1214  			 enum stat_id id, enum stat_variant var, bool asc)
1215  {
1216  	const char *str1 = NULL, *str2 = NULL;
1217  	double v1 = 0.0, v2 = 0.0;
1218  	int cmp = 0;
1219  
1220  	fetch_join_stat_value(s1, id, var, &str1, &v1);
1221  	fetch_join_stat_value(s2, id, var, &str2, &v2);
1222  
1223  	if (str1)
1224  		cmp = strcmp(str1, str2);
1225  	else if (v1 != v2)
1226  		cmp = v1 < v2 ? -1 : 1;
1227  
1228  	return asc ? cmp : -cmp;
1229  }
1230  
cmp_join_stats(const void * v1,const void * v2)1231  static int cmp_join_stats(const void *v1, const void *v2)
1232  {
1233  	const struct verif_stats_join *s1 = v1, *s2 = v2;
1234  	int i, cmp;
1235  
1236  	for (i = 0; i < env.sort_spec.spec_cnt; i++) {
1237  		cmp = cmp_join_stat(s1, s2,
1238  				    env.sort_spec.ids[i],
1239  				    env.sort_spec.variants[i],
1240  				    env.sort_spec.asc[i]);
1241  		if (cmp != 0)
1242  			return cmp;
1243  	}
1244  
1245  	/* always disambiguate with file+prog, which are unique */
1246  	cmp = strcmp(s1->file_name, s2->file_name);
1247  	if (cmp != 0)
1248  		return cmp;
1249  	return strcmp(s1->prog_name, s2->prog_name);
1250  }
1251  
1252  #define HEADER_CHAR '-'
1253  #define COLUMN_SEP "  "
1254  
output_header_underlines(void)1255  static void output_header_underlines(void)
1256  {
1257  	int i, j, len;
1258  
1259  	for (i = 0; i < env.output_spec.spec_cnt; i++) {
1260  		len = env.output_spec.lens[i];
1261  
1262  		printf("%s", i == 0 ? "" : COLUMN_SEP);
1263  		for (j = 0; j < len; j++)
1264  			printf("%c", HEADER_CHAR);
1265  	}
1266  	printf("\n");
1267  }
1268  
output_headers(enum resfmt fmt)1269  static void output_headers(enum resfmt fmt)
1270  {
1271  	const char *fmt_str;
1272  	int i, len;
1273  
1274  	for (i = 0; i < env.output_spec.spec_cnt; i++) {
1275  		int id = env.output_spec.ids[i];
1276  		int *max_len = &env.output_spec.lens[i];
1277  
1278  		switch (fmt) {
1279  		case RESFMT_TABLE_CALCLEN:
1280  			len = snprintf(NULL, 0, "%s", stat_defs[id].header);
1281  			if (len > *max_len)
1282  				*max_len = len;
1283  			break;
1284  		case RESFMT_TABLE:
1285  			fmt_str = stat_defs[id].left_aligned ? "%s%-*s" : "%s%*s";
1286  			printf(fmt_str, i == 0 ? "" : COLUMN_SEP,  *max_len, stat_defs[id].header);
1287  			if (i == env.output_spec.spec_cnt - 1)
1288  				printf("\n");
1289  			break;
1290  		case RESFMT_CSV:
1291  			printf("%s%s", i == 0 ? "" : ",", stat_defs[id].names[0]);
1292  			if (i == env.output_spec.spec_cnt - 1)
1293  				printf("\n");
1294  			break;
1295  		}
1296  	}
1297  
1298  	if (fmt == RESFMT_TABLE)
1299  		output_header_underlines();
1300  }
1301  
prepare_value(const struct verif_stats * s,enum stat_id id,const char ** str,long * val)1302  static void prepare_value(const struct verif_stats *s, enum stat_id id,
1303  			  const char **str, long *val)
1304  {
1305  	switch (id) {
1306  	case FILE_NAME:
1307  		*str = s ? s->file_name : "N/A";
1308  		break;
1309  	case PROG_NAME:
1310  		*str = s ? s->prog_name : "N/A";
1311  		break;
1312  	case VERDICT:
1313  		if (!s)
1314  			*str = "N/A";
1315  		else
1316  			*str = s->stats[VERDICT] ? "success" : "failure";
1317  		break;
1318  	case DURATION:
1319  	case TOTAL_INSNS:
1320  	case TOTAL_STATES:
1321  	case PEAK_STATES:
1322  	case MAX_STATES_PER_INSN:
1323  	case MARK_READ_MAX_LEN:
1324  		*val = s ? s->stats[id] : 0;
1325  		break;
1326  	default:
1327  		fprintf(stderr, "Unrecognized stat #%d\n", id);
1328  		exit(1);
1329  	}
1330  }
1331  
output_stats(const struct verif_stats * s,enum resfmt fmt,bool last)1332  static void output_stats(const struct verif_stats *s, enum resfmt fmt, bool last)
1333  {
1334  	int i;
1335  
1336  	for (i = 0; i < env.output_spec.spec_cnt; i++) {
1337  		int id = env.output_spec.ids[i];
1338  		int *max_len = &env.output_spec.lens[i], len;
1339  		const char *str = NULL;
1340  		long val = 0;
1341  
1342  		prepare_value(s, id, &str, &val);
1343  
1344  		switch (fmt) {
1345  		case RESFMT_TABLE_CALCLEN:
1346  			if (str)
1347  				len = snprintf(NULL, 0, "%s", str);
1348  			else
1349  				len = snprintf(NULL, 0, "%ld", val);
1350  			if (len > *max_len)
1351  				*max_len = len;
1352  			break;
1353  		case RESFMT_TABLE:
1354  			if (str)
1355  				printf("%s%-*s", i == 0 ? "" : COLUMN_SEP, *max_len, str);
1356  			else
1357  				printf("%s%*ld", i == 0 ? "" : COLUMN_SEP,  *max_len, val);
1358  			if (i == env.output_spec.spec_cnt - 1)
1359  				printf("\n");
1360  			break;
1361  		case RESFMT_CSV:
1362  			if (str)
1363  				printf("%s%s", i == 0 ? "" : ",", str);
1364  			else
1365  				printf("%s%ld", i == 0 ? "" : ",", val);
1366  			if (i == env.output_spec.spec_cnt - 1)
1367  				printf("\n");
1368  			break;
1369  		}
1370  	}
1371  
1372  	if (last && fmt == RESFMT_TABLE) {
1373  		output_header_underlines();
1374  		printf("Done. Processed %d files, %d programs. Skipped %d files, %d programs.\n",
1375  		       env.files_processed, env.files_skipped, env.progs_processed, env.progs_skipped);
1376  	}
1377  }
1378  
parse_stat_value(const char * str,enum stat_id id,struct verif_stats * st)1379  static int parse_stat_value(const char *str, enum stat_id id, struct verif_stats *st)
1380  {
1381  	switch (id) {
1382  	case FILE_NAME:
1383  		st->file_name = strdup(str);
1384  		if (!st->file_name)
1385  			return -ENOMEM;
1386  		break;
1387  	case PROG_NAME:
1388  		st->prog_name = strdup(str);
1389  		if (!st->prog_name)
1390  			return -ENOMEM;
1391  		break;
1392  	case VERDICT:
1393  		if (strcmp(str, "success") == 0) {
1394  			st->stats[VERDICT] = true;
1395  		} else if (strcmp(str, "failure") == 0) {
1396  			st->stats[VERDICT] = false;
1397  		} else {
1398  			fprintf(stderr, "Unrecognized verification verdict '%s'\n", str);
1399  			return -EINVAL;
1400  		}
1401  		break;
1402  	case DURATION:
1403  	case TOTAL_INSNS:
1404  	case TOTAL_STATES:
1405  	case PEAK_STATES:
1406  	case MAX_STATES_PER_INSN:
1407  	case MARK_READ_MAX_LEN: {
1408  		long val;
1409  		int err, n;
1410  
1411  		if (sscanf(str, "%ld %n", &val, &n) != 1 || n != strlen(str)) {
1412  			err = -errno;
1413  			fprintf(stderr, "Failed to parse '%s' as integer\n", str);
1414  			return err;
1415  		}
1416  
1417  		st->stats[id] = val;
1418  		break;
1419  	}
1420  	default:
1421  		fprintf(stderr, "Unrecognized stat #%d\n", id);
1422  		return -EINVAL;
1423  	}
1424  	return 0;
1425  }
1426  
parse_stats_csv(const char * filename,struct stat_specs * specs,struct verif_stats ** statsp,int * stat_cntp)1427  static int parse_stats_csv(const char *filename, struct stat_specs *specs,
1428  			   struct verif_stats **statsp, int *stat_cntp)
1429  {
1430  	char line[4096];
1431  	FILE *f;
1432  	int err = 0;
1433  	bool header = true;
1434  
1435  	f = fopen(filename, "r");
1436  	if (!f) {
1437  		err = -errno;
1438  		fprintf(stderr, "Failed to open '%s': %d\n", filename, err);
1439  		return err;
1440  	}
1441  
1442  	*stat_cntp = 0;
1443  
1444  	while (fgets(line, sizeof(line), f)) {
1445  		char *input = line, *state = NULL, *next;
1446  		struct verif_stats *st = NULL;
1447  		int col = 0, cnt = 0;
1448  
1449  		if (!header) {
1450  			void *tmp;
1451  
1452  			tmp = realloc(*statsp, (*stat_cntp + 1) * sizeof(**statsp));
1453  			if (!tmp) {
1454  				err = -ENOMEM;
1455  				goto cleanup;
1456  			}
1457  			*statsp = tmp;
1458  
1459  			st = &(*statsp)[*stat_cntp];
1460  			memset(st, 0, sizeof(*st));
1461  
1462  			*stat_cntp += 1;
1463  		}
1464  
1465  		while ((next = strtok_r(cnt++ ? NULL : input, ",\n", &state))) {
1466  			if (header) {
1467  				/* for the first line, set up spec stats */
1468  				err = parse_stat(next, specs);
1469  				if (err)
1470  					goto cleanup;
1471  				continue;
1472  			}
1473  
1474  			/* for all other lines, parse values based on spec */
1475  			if (col >= specs->spec_cnt) {
1476  				fprintf(stderr, "Found extraneous column #%d in row #%d of '%s'\n",
1477  					col, *stat_cntp, filename);
1478  				err = -EINVAL;
1479  				goto cleanup;
1480  			}
1481  			err = parse_stat_value(next, specs->ids[col], st);
1482  			if (err)
1483  				goto cleanup;
1484  			col++;
1485  		}
1486  
1487  		if (header) {
1488  			header = false;
1489  			continue;
1490  		}
1491  
1492  		if (col < specs->spec_cnt) {
1493  			fprintf(stderr, "Not enough columns in row #%d in '%s'\n",
1494  				*stat_cntp, filename);
1495  			err = -EINVAL;
1496  			goto cleanup;
1497  		}
1498  
1499  		if (!st->file_name || !st->prog_name) {
1500  			fprintf(stderr, "Row #%d in '%s' is missing file and/or program name\n",
1501  				*stat_cntp, filename);
1502  			err = -EINVAL;
1503  			goto cleanup;
1504  		}
1505  
1506  		/* in comparison mode we can only check filters after we
1507  		 * parsed entire line; if row should be ignored we pretend we
1508  		 * never parsed it
1509  		 */
1510  		if (!should_process_file_prog(st->file_name, st->prog_name)) {
1511  			free(st->file_name);
1512  			free(st->prog_name);
1513  			*stat_cntp -= 1;
1514  		}
1515  	}
1516  
1517  	if (!feof(f)) {
1518  		err = -errno;
1519  		fprintf(stderr, "Failed I/O for '%s': %d\n", filename, err);
1520  	}
1521  
1522  cleanup:
1523  	fclose(f);
1524  	return err;
1525  }
1526  
1527  /* empty/zero stats for mismatched rows */
1528  static const struct verif_stats fallback_stats = { .file_name = "", .prog_name = "" };
1529  
is_key_stat(enum stat_id id)1530  static bool is_key_stat(enum stat_id id)
1531  {
1532  	return id == FILE_NAME || id == PROG_NAME;
1533  }
1534  
output_comp_header_underlines(void)1535  static void output_comp_header_underlines(void)
1536  {
1537  	int i, j, k;
1538  
1539  	for (i = 0; i < env.output_spec.spec_cnt; i++) {
1540  		int id = env.output_spec.ids[i];
1541  		int max_j = is_key_stat(id) ? 1 : 3;
1542  
1543  		for (j = 0; j < max_j; j++) {
1544  			int len = env.output_spec.lens[3 * i + j];
1545  
1546  			printf("%s", i + j == 0 ? "" : COLUMN_SEP);
1547  
1548  			for (k = 0; k < len; k++)
1549  				printf("%c", HEADER_CHAR);
1550  		}
1551  	}
1552  	printf("\n");
1553  }
1554  
output_comp_headers(enum resfmt fmt)1555  static void output_comp_headers(enum resfmt fmt)
1556  {
1557  	static const char *table_sfxs[3] = {" (A)", " (B)", " (DIFF)"};
1558  	static const char *name_sfxs[3] = {"_base", "_comp", "_diff"};
1559  	int i, j, len;
1560  
1561  	for (i = 0; i < env.output_spec.spec_cnt; i++) {
1562  		int id = env.output_spec.ids[i];
1563  		/* key stats don't have A/B/DIFF columns, they are common for both data sets */
1564  		int max_j = is_key_stat(id) ? 1 : 3;
1565  
1566  		for (j = 0; j < max_j; j++) {
1567  			int *max_len = &env.output_spec.lens[3 * i + j];
1568  			bool last = (i == env.output_spec.spec_cnt - 1) && (j == max_j - 1);
1569  			const char *sfx;
1570  
1571  			switch (fmt) {
1572  			case RESFMT_TABLE_CALCLEN:
1573  				sfx = is_key_stat(id) ? "" : table_sfxs[j];
1574  				len = snprintf(NULL, 0, "%s%s", stat_defs[id].header, sfx);
1575  				if (len > *max_len)
1576  					*max_len = len;
1577  				break;
1578  			case RESFMT_TABLE:
1579  				sfx = is_key_stat(id) ? "" : table_sfxs[j];
1580  				printf("%s%-*s%s", i + j == 0 ? "" : COLUMN_SEP,
1581  				       *max_len - (int)strlen(sfx), stat_defs[id].header, sfx);
1582  				if (last)
1583  					printf("\n");
1584  				break;
1585  			case RESFMT_CSV:
1586  				sfx = is_key_stat(id) ? "" : name_sfxs[j];
1587  				printf("%s%s%s", i + j == 0 ? "" : ",", stat_defs[id].names[0], sfx);
1588  				if (last)
1589  					printf("\n");
1590  				break;
1591  			}
1592  		}
1593  	}
1594  
1595  	if (fmt == RESFMT_TABLE)
1596  		output_comp_header_underlines();
1597  }
1598  
output_comp_stats(const struct verif_stats_join * join_stats,enum resfmt fmt,bool last)1599  static void output_comp_stats(const struct verif_stats_join *join_stats,
1600  			      enum resfmt fmt, bool last)
1601  {
1602  	const struct verif_stats *base = join_stats->stats_a;
1603  	const struct verif_stats *comp = join_stats->stats_b;
1604  	char base_buf[1024] = {}, comp_buf[1024] = {}, diff_buf[1024] = {};
1605  	int i;
1606  
1607  	for (i = 0; i < env.output_spec.spec_cnt; i++) {
1608  		int id = env.output_spec.ids[i], len;
1609  		int *max_len_base = &env.output_spec.lens[3 * i + 0];
1610  		int *max_len_comp = &env.output_spec.lens[3 * i + 1];
1611  		int *max_len_diff = &env.output_spec.lens[3 * i + 2];
1612  		const char *base_str = NULL, *comp_str = NULL;
1613  		long base_val = 0, comp_val = 0, diff_val = 0;
1614  
1615  		prepare_value(base, id, &base_str, &base_val);
1616  		prepare_value(comp, id, &comp_str, &comp_val);
1617  
1618  		/* normalize all the outputs to be in string buffers for simplicity */
1619  		if (is_key_stat(id)) {
1620  			/* key stats (file and program name) are always strings */
1621  			if (base)
1622  				snprintf(base_buf, sizeof(base_buf), "%s", base_str);
1623  			else
1624  				snprintf(base_buf, sizeof(base_buf), "%s", comp_str);
1625  		} else if (base_str) {
1626  			snprintf(base_buf, sizeof(base_buf), "%s", base_str);
1627  			snprintf(comp_buf, sizeof(comp_buf), "%s", comp_str);
1628  			if (!base || !comp)
1629  				snprintf(diff_buf, sizeof(diff_buf), "%s", "N/A");
1630  			else if (strcmp(base_str, comp_str) == 0)
1631  				snprintf(diff_buf, sizeof(diff_buf), "%s", "MATCH");
1632  			else
1633  				snprintf(diff_buf, sizeof(diff_buf), "%s", "MISMATCH");
1634  		} else {
1635  			double p = 0.0;
1636  
1637  			if (base)
1638  				snprintf(base_buf, sizeof(base_buf), "%ld", base_val);
1639  			else
1640  				snprintf(base_buf, sizeof(base_buf), "%s", "N/A");
1641  			if (comp)
1642  				snprintf(comp_buf, sizeof(comp_buf), "%ld", comp_val);
1643  			else
1644  				snprintf(comp_buf, sizeof(comp_buf), "%s", "N/A");
1645  
1646  			diff_val = comp_val - base_val;
1647  			if (!base || !comp) {
1648  				snprintf(diff_buf, sizeof(diff_buf), "%s", "N/A");
1649  			} else {
1650  				if (base_val == 0) {
1651  					if (comp_val == base_val)
1652  						p = 0.0; /* avoid +0 (+100%) case */
1653  					else
1654  						p = comp_val < base_val ? -100.0 : 100.0;
1655  				} else {
1656  					 p = diff_val * 100.0 / base_val;
1657  				}
1658  				snprintf(diff_buf, sizeof(diff_buf), "%+ld (%+.2lf%%)", diff_val, p);
1659  			}
1660  		}
1661  
1662  		switch (fmt) {
1663  		case RESFMT_TABLE_CALCLEN:
1664  			len = strlen(base_buf);
1665  			if (len > *max_len_base)
1666  				*max_len_base = len;
1667  			if (!is_key_stat(id)) {
1668  				len = strlen(comp_buf);
1669  				if (len > *max_len_comp)
1670  					*max_len_comp = len;
1671  				len = strlen(diff_buf);
1672  				if (len > *max_len_diff)
1673  					*max_len_diff = len;
1674  			}
1675  			break;
1676  		case RESFMT_TABLE: {
1677  			/* string outputs are left-aligned, number outputs are right-aligned */
1678  			const char *fmt = base_str ? "%s%-*s" : "%s%*s";
1679  
1680  			printf(fmt, i == 0 ? "" : COLUMN_SEP, *max_len_base, base_buf);
1681  			if (!is_key_stat(id)) {
1682  				printf(fmt, COLUMN_SEP, *max_len_comp, comp_buf);
1683  				printf(fmt, COLUMN_SEP, *max_len_diff, diff_buf);
1684  			}
1685  			if (i == env.output_spec.spec_cnt - 1)
1686  				printf("\n");
1687  			break;
1688  		}
1689  		case RESFMT_CSV:
1690  			printf("%s%s", i == 0 ? "" : ",", base_buf);
1691  			if (!is_key_stat(id)) {
1692  				printf("%s%s", i == 0 ? "" : ",", comp_buf);
1693  				printf("%s%s", i == 0 ? "" : ",", diff_buf);
1694  			}
1695  			if (i == env.output_spec.spec_cnt - 1)
1696  				printf("\n");
1697  			break;
1698  		}
1699  	}
1700  
1701  	if (last && fmt == RESFMT_TABLE)
1702  		output_comp_header_underlines();
1703  }
1704  
cmp_stats_key(const struct verif_stats * base,const struct verif_stats * comp)1705  static int cmp_stats_key(const struct verif_stats *base, const struct verif_stats *comp)
1706  {
1707  	int r;
1708  
1709  	r = strcmp(base->file_name, comp->file_name);
1710  	if (r != 0)
1711  		return r;
1712  	return strcmp(base->prog_name, comp->prog_name);
1713  }
1714  
is_join_stat_filter_matched(struct filter * f,const struct verif_stats_join * stats)1715  static bool is_join_stat_filter_matched(struct filter *f, const struct verif_stats_join *stats)
1716  {
1717  	static const double eps = 1e-9;
1718  	const char *str = NULL;
1719  	double value = 0.0;
1720  
1721  	fetch_join_stat_value(stats, f->stat_id, f->stat_var, &str, &value);
1722  
1723  	switch (f->op) {
1724  	case OP_EQ: return value > f->value - eps && value < f->value + eps;
1725  	case OP_NEQ: return value < f->value - eps || value > f->value + eps;
1726  	case OP_LT: return value < f->value - eps;
1727  	case OP_LE: return value <= f->value + eps;
1728  	case OP_GT: return value > f->value + eps;
1729  	case OP_GE: return value >= f->value - eps;
1730  	}
1731  
1732  	fprintf(stderr, "BUG: unknown filter op %d!\n", f->op);
1733  	return false;
1734  }
1735  
should_output_join_stats(const struct verif_stats_join * stats)1736  static bool should_output_join_stats(const struct verif_stats_join *stats)
1737  {
1738  	struct filter *f;
1739  	int i, allow_cnt = 0;
1740  
1741  	for (i = 0; i < env.deny_filter_cnt; i++) {
1742  		f = &env.deny_filters[i];
1743  		if (f->kind != FILTER_STAT)
1744  			continue;
1745  
1746  		if (is_join_stat_filter_matched(f, stats))
1747  			return false;
1748  	}
1749  
1750  	for (i = 0; i < env.allow_filter_cnt; i++) {
1751  		f = &env.allow_filters[i];
1752  		if (f->kind != FILTER_STAT)
1753  			continue;
1754  		allow_cnt++;
1755  
1756  		if (is_join_stat_filter_matched(f, stats))
1757  			return true;
1758  	}
1759  
1760  	/* if there are no stat allowed filters, pass everything through */
1761  	return allow_cnt == 0;
1762  }
1763  
handle_comparison_mode(void)1764  static int handle_comparison_mode(void)
1765  {
1766  	struct stat_specs base_specs = {}, comp_specs = {};
1767  	struct stat_specs tmp_sort_spec;
1768  	enum resfmt cur_fmt;
1769  	int err, i, j, last_idx;
1770  
1771  	if (env.filename_cnt != 2) {
1772  		fprintf(stderr, "Comparison mode expects exactly two input CSV files!\n\n");
1773  		argp_help(&argp, stderr, ARGP_HELP_USAGE, "veristat");
1774  		return -EINVAL;
1775  	}
1776  
1777  	err = parse_stats_csv(env.filenames[0], &base_specs,
1778  			      &env.baseline_stats, &env.baseline_stat_cnt);
1779  	if (err) {
1780  		fprintf(stderr, "Failed to parse stats from '%s': %d\n", env.filenames[0], err);
1781  		return err;
1782  	}
1783  	err = parse_stats_csv(env.filenames[1], &comp_specs,
1784  			      &env.prog_stats, &env.prog_stat_cnt);
1785  	if (err) {
1786  		fprintf(stderr, "Failed to parse stats from '%s': %d\n", env.filenames[1], err);
1787  		return err;
1788  	}
1789  
1790  	/* To keep it simple we validate that the set and order of stats in
1791  	 * both CSVs are exactly the same. This can be lifted with a bit more
1792  	 * pre-processing later.
1793  	 */
1794  	if (base_specs.spec_cnt != comp_specs.spec_cnt) {
1795  		fprintf(stderr, "Number of stats in '%s' and '%s' differs (%d != %d)!\n",
1796  			env.filenames[0], env.filenames[1],
1797  			base_specs.spec_cnt, comp_specs.spec_cnt);
1798  		return -EINVAL;
1799  	}
1800  	for (i = 0; i < base_specs.spec_cnt; i++) {
1801  		if (base_specs.ids[i] != comp_specs.ids[i]) {
1802  			fprintf(stderr, "Stats composition differs between '%s' and '%s' (%s != %s)!\n",
1803  				env.filenames[0], env.filenames[1],
1804  				stat_defs[base_specs.ids[i]].names[0],
1805  				stat_defs[comp_specs.ids[i]].names[0]);
1806  			return -EINVAL;
1807  		}
1808  	}
1809  
1810  	/* Replace user-specified sorting spec with file+prog sorting rule to
1811  	 * be able to join two datasets correctly. Once we are done, we will
1812  	 * restore the original sort spec.
1813  	 */
1814  	tmp_sort_spec = env.sort_spec;
1815  	env.sort_spec = join_sort_spec;
1816  	qsort(env.prog_stats, env.prog_stat_cnt, sizeof(*env.prog_stats), cmp_prog_stats);
1817  	qsort(env.baseline_stats, env.baseline_stat_cnt, sizeof(*env.baseline_stats), cmp_prog_stats);
1818  	env.sort_spec = tmp_sort_spec;
1819  
1820  	/* Join two datasets together. If baseline and comparison datasets
1821  	 * have different subset of rows (we match by 'object + prog' as
1822  	 * a unique key) then assume empty/missing/zero value for rows that
1823  	 * are missing in the opposite data set.
1824  	 */
1825  	i = j = 0;
1826  	while (i < env.baseline_stat_cnt || j < env.prog_stat_cnt) {
1827  		const struct verif_stats *base, *comp;
1828  		struct verif_stats_join *join;
1829  		void *tmp;
1830  		int r;
1831  
1832  		base = i < env.baseline_stat_cnt ? &env.baseline_stats[i] : &fallback_stats;
1833  		comp = j < env.prog_stat_cnt ? &env.prog_stats[j] : &fallback_stats;
1834  
1835  		if (!base->file_name || !base->prog_name) {
1836  			fprintf(stderr, "Entry #%d in '%s' doesn't have file and/or program name specified!\n",
1837  				i, env.filenames[0]);
1838  			return -EINVAL;
1839  		}
1840  		if (!comp->file_name || !comp->prog_name) {
1841  			fprintf(stderr, "Entry #%d in '%s' doesn't have file and/or program name specified!\n",
1842  				j, env.filenames[1]);
1843  			return -EINVAL;
1844  		}
1845  
1846  		tmp = realloc(env.join_stats, (env.join_stat_cnt + 1) * sizeof(*env.join_stats));
1847  		if (!tmp)
1848  			return -ENOMEM;
1849  		env.join_stats = tmp;
1850  
1851  		join = &env.join_stats[env.join_stat_cnt];
1852  		memset(join, 0, sizeof(*join));
1853  
1854  		r = cmp_stats_key(base, comp);
1855  		if (r == 0) {
1856  			join->file_name = base->file_name;
1857  			join->prog_name = base->prog_name;
1858  			join->stats_a = base;
1859  			join->stats_b = comp;
1860  			i++;
1861  			j++;
1862  		} else if (base != &fallback_stats && (comp == &fallback_stats || r < 0)) {
1863  			join->file_name = base->file_name;
1864  			join->prog_name = base->prog_name;
1865  			join->stats_a = base;
1866  			join->stats_b = NULL;
1867  			i++;
1868  		} else if (comp != &fallback_stats && (base == &fallback_stats || r > 0)) {
1869  			join->file_name = comp->file_name;
1870  			join->prog_name = comp->prog_name;
1871  			join->stats_a = NULL;
1872  			join->stats_b = comp;
1873  			j++;
1874  		} else {
1875  			fprintf(stderr, "%s:%d: should never reach here i=%i, j=%i",
1876  				__FILE__, __LINE__, i, j);
1877  			return -EINVAL;
1878  		}
1879  		env.join_stat_cnt += 1;
1880  	}
1881  
1882  	/* now sort joined results accorsing to sort spec */
1883  	qsort(env.join_stats, env.join_stat_cnt, sizeof(*env.join_stats), cmp_join_stats);
1884  
1885  	/* for human-readable table output we need to do extra pass to
1886  	 * calculate column widths, so we substitute current output format
1887  	 * with RESFMT_TABLE_CALCLEN and later revert it back to RESFMT_TABLE
1888  	 * and do everything again.
1889  	 */
1890  	if (env.out_fmt == RESFMT_TABLE)
1891  		cur_fmt = RESFMT_TABLE_CALCLEN;
1892  	else
1893  		cur_fmt = env.out_fmt;
1894  
1895  one_more_time:
1896  	output_comp_headers(cur_fmt);
1897  
1898  	last_idx = -1;
1899  	for (i = 0; i < env.join_stat_cnt; i++) {
1900  		const struct verif_stats_join *join = &env.join_stats[i];
1901  
1902  		if (!should_output_join_stats(join))
1903  			continue;
1904  
1905  		if (cur_fmt == RESFMT_TABLE_CALCLEN)
1906  			last_idx = i;
1907  
1908  		output_comp_stats(join, cur_fmt, i == last_idx);
1909  	}
1910  
1911  	if (cur_fmt == RESFMT_TABLE_CALCLEN) {
1912  		cur_fmt = RESFMT_TABLE;
1913  		goto one_more_time; /* ... this time with feeling */
1914  	}
1915  
1916  	return 0;
1917  }
1918  
is_stat_filter_matched(struct filter * f,const struct verif_stats * stats)1919  static bool is_stat_filter_matched(struct filter *f, const struct verif_stats *stats)
1920  {
1921  	long value = stats->stats[f->stat_id];
1922  
1923  	switch (f->op) {
1924  	case OP_EQ: return value == f->value;
1925  	case OP_NEQ: return value != f->value;
1926  	case OP_LT: return value < f->value;
1927  	case OP_LE: return value <= f->value;
1928  	case OP_GT: return value > f->value;
1929  	case OP_GE: return value >= f->value;
1930  	}
1931  
1932  	fprintf(stderr, "BUG: unknown filter op %d!\n", f->op);
1933  	return false;
1934  }
1935  
should_output_stats(const struct verif_stats * stats)1936  static bool should_output_stats(const struct verif_stats *stats)
1937  {
1938  	struct filter *f;
1939  	int i, allow_cnt = 0;
1940  
1941  	for (i = 0; i < env.deny_filter_cnt; i++) {
1942  		f = &env.deny_filters[i];
1943  		if (f->kind != FILTER_STAT)
1944  			continue;
1945  
1946  		if (is_stat_filter_matched(f, stats))
1947  			return false;
1948  	}
1949  
1950  	for (i = 0; i < env.allow_filter_cnt; i++) {
1951  		f = &env.allow_filters[i];
1952  		if (f->kind != FILTER_STAT)
1953  			continue;
1954  		allow_cnt++;
1955  
1956  		if (is_stat_filter_matched(f, stats))
1957  			return true;
1958  	}
1959  
1960  	/* if there are no stat allowed filters, pass everything through */
1961  	return allow_cnt == 0;
1962  }
1963  
output_prog_stats(void)1964  static void output_prog_stats(void)
1965  {
1966  	const struct verif_stats *stats;
1967  	int i, last_stat_idx = 0;
1968  
1969  	if (env.out_fmt == RESFMT_TABLE) {
1970  		/* calculate column widths */
1971  		output_headers(RESFMT_TABLE_CALCLEN);
1972  		for (i = 0; i < env.prog_stat_cnt; i++) {
1973  			stats = &env.prog_stats[i];
1974  			if (!should_output_stats(stats))
1975  				continue;
1976  			output_stats(stats, RESFMT_TABLE_CALCLEN, false);
1977  			last_stat_idx = i;
1978  		}
1979  	}
1980  
1981  	/* actually output the table */
1982  	output_headers(env.out_fmt);
1983  	for (i = 0; i < env.prog_stat_cnt; i++) {
1984  		stats = &env.prog_stats[i];
1985  		if (!should_output_stats(stats))
1986  			continue;
1987  		output_stats(stats, env.out_fmt, i == last_stat_idx);
1988  	}
1989  }
1990  
handle_verif_mode(void)1991  static int handle_verif_mode(void)
1992  {
1993  	int i, err;
1994  
1995  	if (env.filename_cnt == 0) {
1996  		fprintf(stderr, "Please provide path to BPF object file!\n\n");
1997  		argp_help(&argp, stderr, ARGP_HELP_USAGE, "veristat");
1998  		return -EINVAL;
1999  	}
2000  
2001  	for (i = 0; i < env.filename_cnt; i++) {
2002  		err = process_obj(env.filenames[i]);
2003  		if (err) {
2004  			fprintf(stderr, "Failed to process '%s': %d\n", env.filenames[i], err);
2005  			return err;
2006  		}
2007  	}
2008  
2009  	qsort(env.prog_stats, env.prog_stat_cnt, sizeof(*env.prog_stats), cmp_prog_stats);
2010  
2011  	output_prog_stats();
2012  
2013  	return 0;
2014  }
2015  
handle_replay_mode(void)2016  static int handle_replay_mode(void)
2017  {
2018  	struct stat_specs specs = {};
2019  	int err;
2020  
2021  	if (env.filename_cnt != 1) {
2022  		fprintf(stderr, "Replay mode expects exactly one input CSV file!\n\n");
2023  		argp_help(&argp, stderr, ARGP_HELP_USAGE, "veristat");
2024  		return -EINVAL;
2025  	}
2026  
2027  	err = parse_stats_csv(env.filenames[0], &specs,
2028  			      &env.prog_stats, &env.prog_stat_cnt);
2029  	if (err) {
2030  		fprintf(stderr, "Failed to parse stats from '%s': %d\n", env.filenames[0], err);
2031  		return err;
2032  	}
2033  
2034  	qsort(env.prog_stats, env.prog_stat_cnt, sizeof(*env.prog_stats), cmp_prog_stats);
2035  
2036  	output_prog_stats();
2037  
2038  	return 0;
2039  }
2040  
main(int argc,char ** argv)2041  int main(int argc, char **argv)
2042  {
2043  	int err = 0, i;
2044  
2045  	if (argp_parse(&argp, argc, argv, 0, NULL, NULL))
2046  		return 1;
2047  
2048  	if (env.show_version) {
2049  		printf("%s\n", argp_program_version);
2050  		return 0;
2051  	}
2052  
2053  	if (env.verbose && env.quiet) {
2054  		fprintf(stderr, "Verbose and quiet modes are incompatible, please specify just one or neither!\n\n");
2055  		argp_help(&argp, stderr, ARGP_HELP_USAGE, "veristat");
2056  		return 1;
2057  	}
2058  	if (env.verbose && env.log_level == 0)
2059  		env.log_level = 1;
2060  
2061  	if (env.output_spec.spec_cnt == 0) {
2062  		if (env.out_fmt == RESFMT_CSV)
2063  			env.output_spec = default_csv_output_spec;
2064  		else
2065  			env.output_spec = default_output_spec;
2066  	}
2067  	if (env.sort_spec.spec_cnt == 0)
2068  		env.sort_spec = default_sort_spec;
2069  
2070  	if (env.comparison_mode && env.replay_mode) {
2071  		fprintf(stderr, "Can't specify replay and comparison mode at the same time!\n\n");
2072  		argp_help(&argp, stderr, ARGP_HELP_USAGE, "veristat");
2073  		return 1;
2074  	}
2075  
2076  	if (env.comparison_mode)
2077  		err = handle_comparison_mode();
2078  	else if (env.replay_mode)
2079  		err = handle_replay_mode();
2080  	else
2081  		err = handle_verif_mode();
2082  
2083  	free_verif_stats(env.prog_stats, env.prog_stat_cnt);
2084  	free_verif_stats(env.baseline_stats, env.baseline_stat_cnt);
2085  	free(env.join_stats);
2086  	for (i = 0; i < env.filename_cnt; i++)
2087  		free(env.filenames[i]);
2088  	free(env.filenames);
2089  	for (i = 0; i < env.allow_filter_cnt; i++) {
2090  		free(env.allow_filters[i].any_glob);
2091  		free(env.allow_filters[i].file_glob);
2092  		free(env.allow_filters[i].prog_glob);
2093  	}
2094  	free(env.allow_filters);
2095  	for (i = 0; i < env.deny_filter_cnt; i++) {
2096  		free(env.deny_filters[i].any_glob);
2097  		free(env.deny_filters[i].file_glob);
2098  		free(env.deny_filters[i].prog_glob);
2099  	}
2100  	free(env.deny_filters);
2101  	return -err;
2102  }
2103