xref: /openbmc/linux/tools/lib/bpf/btf.c (revision 9df839a711aee437390b16ee39cf0b5c1620be6a)
1 // SPDX-License-Identifier: (LGPL-2.1 OR BSD-2-Clause)
2 /* Copyright (c) 2018 Facebook */
3 
4 #include <byteswap.h>
5 #include <endian.h>
6 #include <stdio.h>
7 #include <stdlib.h>
8 #include <string.h>
9 #include <fcntl.h>
10 #include <unistd.h>
11 #include <errno.h>
12 #include <sys/utsname.h>
13 #include <sys/param.h>
14 #include <sys/stat.h>
15 #include <linux/kernel.h>
16 #include <linux/err.h>
17 #include <linux/btf.h>
18 #include <gelf.h>
19 #include "btf.h"
20 #include "bpf.h"
21 #include "libbpf.h"
22 #include "libbpf_internal.h"
23 #include "hashmap.h"
24 #include "strset.h"
25 
26 #define BTF_MAX_NR_TYPES 0x7fffffffU
27 #define BTF_MAX_STR_OFFSET 0x7fffffffU
28 
29 static struct btf_type btf_void;
30 
31 struct btf {
32 	/* raw BTF data in native endianness */
33 	void *raw_data;
34 	/* raw BTF data in non-native endianness */
35 	void *raw_data_swapped;
36 	__u32 raw_size;
37 	/* whether target endianness differs from the native one */
38 	bool swapped_endian;
39 
40 	/*
41 	 * When BTF is loaded from an ELF or raw memory it is stored
42 	 * in a contiguous memory block. The hdr, type_data, and, strs_data
43 	 * point inside that memory region to their respective parts of BTF
44 	 * representation:
45 	 *
46 	 * +--------------------------------+
47 	 * |  Header  |  Types  |  Strings  |
48 	 * +--------------------------------+
49 	 * ^          ^         ^
50 	 * |          |         |
51 	 * hdr        |         |
52 	 * types_data-+         |
53 	 * strs_data------------+
54 	 *
55 	 * If BTF data is later modified, e.g., due to types added or
56 	 * removed, BTF deduplication performed, etc, this contiguous
57 	 * representation is broken up into three independently allocated
58 	 * memory regions to be able to modify them independently.
59 	 * raw_data is nulled out at that point, but can be later allocated
60 	 * and cached again if user calls btf__raw_data(), at which point
61 	 * raw_data will contain a contiguous copy of header, types, and
62 	 * strings:
63 	 *
64 	 * +----------+  +---------+  +-----------+
65 	 * |  Header  |  |  Types  |  |  Strings  |
66 	 * +----------+  +---------+  +-----------+
67 	 * ^             ^            ^
68 	 * |             |            |
69 	 * hdr           |            |
70 	 * types_data----+            |
71 	 * strset__data(strs_set)-----+
72 	 *
73 	 *               +----------+---------+-----------+
74 	 *               |  Header  |  Types  |  Strings  |
75 	 * raw_data----->+----------+---------+-----------+
76 	 */
77 	struct btf_header *hdr;
78 
79 	void *types_data;
80 	size_t types_data_cap; /* used size stored in hdr->type_len */
81 
82 	/* type ID to `struct btf_type *` lookup index
83 	 * type_offs[0] corresponds to the first non-VOID type:
84 	 *   - for base BTF it's type [1];
85 	 *   - for split BTF it's the first non-base BTF type.
86 	 */
87 	__u32 *type_offs;
88 	size_t type_offs_cap;
89 	/* number of types in this BTF instance:
90 	 *   - doesn't include special [0] void type;
91 	 *   - for split BTF counts number of types added on top of base BTF.
92 	 */
93 	__u32 nr_types;
94 	/* if not NULL, points to the base BTF on top of which the current
95 	 * split BTF is based
96 	 */
97 	struct btf *base_btf;
98 	/* BTF type ID of the first type in this BTF instance:
99 	 *   - for base BTF it's equal to 1;
100 	 *   - for split BTF it's equal to biggest type ID of base BTF plus 1.
101 	 */
102 	int start_id;
103 	/* logical string offset of this BTF instance:
104 	 *   - for base BTF it's equal to 0;
105 	 *   - for split BTF it's equal to total size of base BTF's string section size.
106 	 */
107 	int start_str_off;
108 
109 	/* only one of strs_data or strs_set can be non-NULL, depending on
110 	 * whether BTF is in a modifiable state (strs_set is used) or not
111 	 * (strs_data points inside raw_data)
112 	 */
113 	void *strs_data;
114 	/* a set of unique strings */
115 	struct strset *strs_set;
116 	/* whether strings are already deduplicated */
117 	bool strs_deduped;
118 
119 	/* BTF object FD, if loaded into kernel */
120 	int fd;
121 
122 	/* Pointer size (in bytes) for a target architecture of this BTF */
123 	int ptr_sz;
124 };
125 
126 static inline __u64 ptr_to_u64(const void *ptr)
127 {
128 	return (__u64) (unsigned long) ptr;
129 }
130 
/* Reserve room for *add_cnt* more elements of *elem_sz* bytes each in the
 * dynamically allocated array *data*, which currently has capacity for
 * *cap_cnt* elements, *cur_cnt* of which are in use. The array is never
 * grown beyond *max_cnt* elements.
 * When the current capacity is insufficient, the array is reallocated (the
 * existing contents are preserved and the newly added tail is zeroed), the
 * new pointer is stored in *data and the new capacity, in number of
 * elements, is stored in *cap_cnt.
 * Returns a pointer to the first unused element on success, NULL if the
 * limit would be exceeded or reallocation failed.
 */
void *libbpf_add_mem(void **data, size_t *cap_cnt, size_t elem_sz,
		     size_t cur_cnt, size_t max_cnt, size_t add_cnt)
{
	size_t need_cnt = cur_cnt + add_cnt;
	size_t old_cap = *cap_cnt;
	size_t grown_cap;
	void *mem;

	/* fast path: what we have is already big enough */
	if (need_cnt <= old_cap)
		return *data + cur_cnt * elem_sz;

	/* asking for more than the limit allows */
	if (need_cnt > max_cnt)
		return NULL;

	/* grow by 25%, start with at least 16 elements, stay within the
	 * limit, and never end up below what was actually requested
	 */
	grown_cap = old_cap + old_cap / 4;
	if (grown_cap < 16)
		grown_cap = 16;
	if (grown_cap > max_cnt)
		grown_cap = max_cnt;
	if (grown_cap < need_cnt)
		grown_cap = need_cnt;

	mem = libbpf_reallocarray(*data, grown_cap, elem_sz);
	if (!mem)
		return NULL;

	/* clear the part of the array that did not exist before */
	memset(mem + old_cap * elem_sz, 0, (grown_cap - old_cap) * elem_sz);

	*data = mem;
	*cap_cnt = grown_cap;
	return mem + cur_cnt * elem_sz;
}
174 
/* Make sure the dynamically allocated array *data* can hold at least
 * *need_cnt* elements of *elem_sz* bytes each, growing it if required.
 * Returns 0 on success, -ENOMEM if growing the array failed.
 */
int libbpf_ensure_mem(void **data, size_t *cap_cnt, size_t elem_sz, size_t need_cnt)
{
	size_t have_cnt = *cap_cnt;

	if (have_cnt >= need_cnt)
		return 0;

	/* treat the whole current capacity as used and ask for the rest */
	if (!libbpf_add_mem(data, cap_cnt, elem_sz, have_cnt, SIZE_MAX, need_cnt - have_cnt))
		return -ENOMEM;

	return 0;
}
191 
192 static void *btf_add_type_offs_mem(struct btf *btf, size_t add_cnt)
193 {
194 	return libbpf_add_mem((void **)&btf->type_offs, &btf->type_offs_cap, sizeof(__u32),
195 			      btf->nr_types, BTF_MAX_NR_TYPES, add_cnt);
196 }
197 
198 static int btf_add_type_idx_entry(struct btf *btf, __u32 type_off)
199 {
200 	__u32 *p;
201 
202 	p = btf_add_type_offs_mem(btf, 1);
203 	if (!p)
204 		return -ENOMEM;
205 
206 	*p = type_off;
207 	return 0;
208 }
209 
210 static void btf_bswap_hdr(struct btf_header *h)
211 {
212 	h->magic = bswap_16(h->magic);
213 	h->hdr_len = bswap_32(h->hdr_len);
214 	h->type_off = bswap_32(h->type_off);
215 	h->type_len = bswap_32(h->type_len);
216 	h->str_off = bswap_32(h->str_off);
217 	h->str_len = bswap_32(h->str_len);
218 }
219 
220 static int btf_parse_hdr(struct btf *btf)
221 {
222 	struct btf_header *hdr = btf->hdr;
223 	__u32 meta_left;
224 
225 	if (btf->raw_size < sizeof(struct btf_header)) {
226 		pr_debug("BTF header not found\n");
227 		return -EINVAL;
228 	}
229 
230 	if (hdr->magic == bswap_16(BTF_MAGIC)) {
231 		btf->swapped_endian = true;
232 		if (bswap_32(hdr->hdr_len) != sizeof(struct btf_header)) {
233 			pr_warn("Can't load BTF with non-native endianness due to unsupported header length %u\n",
234 				bswap_32(hdr->hdr_len));
235 			return -ENOTSUP;
236 		}
237 		btf_bswap_hdr(hdr);
238 	} else if (hdr->magic != BTF_MAGIC) {
239 		pr_debug("Invalid BTF magic: %x\n", hdr->magic);
240 		return -EINVAL;
241 	}
242 
243 	if (btf->raw_size < hdr->hdr_len) {
244 		pr_debug("BTF header len %u larger than data size %u\n",
245 			 hdr->hdr_len, btf->raw_size);
246 		return -EINVAL;
247 	}
248 
249 	meta_left = btf->raw_size - hdr->hdr_len;
250 	if (meta_left < (long long)hdr->str_off + hdr->str_len) {
251 		pr_debug("Invalid BTF total size: %u\n", btf->raw_size);
252 		return -EINVAL;
253 	}
254 
255 	if ((long long)hdr->type_off + hdr->type_len > hdr->str_off) {
256 		pr_debug("Invalid BTF data sections layout: type data at %u + %u, strings data at %u + %u\n",
257 			 hdr->type_off, hdr->type_len, hdr->str_off, hdr->str_len);
258 		return -EINVAL;
259 	}
260 
261 	if (hdr->type_off % 4) {
262 		pr_debug("BTF type section is not aligned to 4 bytes\n");
263 		return -EINVAL;
264 	}
265 
266 	return 0;
267 }
268 
269 static int btf_parse_str_sec(struct btf *btf)
270 {
271 	const struct btf_header *hdr = btf->hdr;
272 	const char *start = btf->strs_data;
273 	const char *end = start + btf->hdr->str_len;
274 
275 	if (btf->base_btf && hdr->str_len == 0)
276 		return 0;
277 	if (!hdr->str_len || hdr->str_len - 1 > BTF_MAX_STR_OFFSET || end[-1]) {
278 		pr_debug("Invalid BTF string section\n");
279 		return -EINVAL;
280 	}
281 	if (!btf->base_btf && start[0]) {
282 		pr_debug("Invalid BTF string section\n");
283 		return -EINVAL;
284 	}
285 	return 0;
286 }
287 
288 static int btf_type_size(const struct btf_type *t)
289 {
290 	const int base_size = sizeof(struct btf_type);
291 	__u16 vlen = btf_vlen(t);
292 
293 	switch (btf_kind(t)) {
294 	case BTF_KIND_FWD:
295 	case BTF_KIND_CONST:
296 	case BTF_KIND_VOLATILE:
297 	case BTF_KIND_RESTRICT:
298 	case BTF_KIND_PTR:
299 	case BTF_KIND_TYPEDEF:
300 	case BTF_KIND_FUNC:
301 	case BTF_KIND_FLOAT:
302 	case BTF_KIND_TYPE_TAG:
303 		return base_size;
304 	case BTF_KIND_INT:
305 		return base_size + sizeof(__u32);
306 	case BTF_KIND_ENUM:
307 		return base_size + vlen * sizeof(struct btf_enum);
308 	case BTF_KIND_ENUM64:
309 		return base_size + vlen * sizeof(struct btf_enum64);
310 	case BTF_KIND_ARRAY:
311 		return base_size + sizeof(struct btf_array);
312 	case BTF_KIND_STRUCT:
313 	case BTF_KIND_UNION:
314 		return base_size + vlen * sizeof(struct btf_member);
315 	case BTF_KIND_FUNC_PROTO:
316 		return base_size + vlen * sizeof(struct btf_param);
317 	case BTF_KIND_VAR:
318 		return base_size + sizeof(struct btf_var);
319 	case BTF_KIND_DATASEC:
320 		return base_size + vlen * sizeof(struct btf_var_secinfo);
321 	case BTF_KIND_DECL_TAG:
322 		return base_size + sizeof(struct btf_decl_tag);
323 	default:
324 		pr_debug("Unsupported BTF_KIND:%u\n", btf_kind(t));
325 		return -EINVAL;
326 	}
327 }
328 
329 static void btf_bswap_type_base(struct btf_type *t)
330 {
331 	t->name_off = bswap_32(t->name_off);
332 	t->info = bswap_32(t->info);
333 	t->type = bswap_32(t->type);
334 }
335 
336 static int btf_bswap_type_rest(struct btf_type *t)
337 {
338 	struct btf_var_secinfo *v;
339 	struct btf_enum64 *e64;
340 	struct btf_member *m;
341 	struct btf_array *a;
342 	struct btf_param *p;
343 	struct btf_enum *e;
344 	__u16 vlen = btf_vlen(t);
345 	int i;
346 
347 	switch (btf_kind(t)) {
348 	case BTF_KIND_FWD:
349 	case BTF_KIND_CONST:
350 	case BTF_KIND_VOLATILE:
351 	case BTF_KIND_RESTRICT:
352 	case BTF_KIND_PTR:
353 	case BTF_KIND_TYPEDEF:
354 	case BTF_KIND_FUNC:
355 	case BTF_KIND_FLOAT:
356 	case BTF_KIND_TYPE_TAG:
357 		return 0;
358 	case BTF_KIND_INT:
359 		*(__u32 *)(t + 1) = bswap_32(*(__u32 *)(t + 1));
360 		return 0;
361 	case BTF_KIND_ENUM:
362 		for (i = 0, e = btf_enum(t); i < vlen; i++, e++) {
363 			e->name_off = bswap_32(e->name_off);
364 			e->val = bswap_32(e->val);
365 		}
366 		return 0;
367 	case BTF_KIND_ENUM64:
368 		for (i = 0, e64 = btf_enum64(t); i < vlen; i++, e64++) {
369 			e64->name_off = bswap_32(e64->name_off);
370 			e64->val_lo32 = bswap_32(e64->val_lo32);
371 			e64->val_hi32 = bswap_32(e64->val_hi32);
372 		}
373 		return 0;
374 	case BTF_KIND_ARRAY:
375 		a = btf_array(t);
376 		a->type = bswap_32(a->type);
377 		a->index_type = bswap_32(a->index_type);
378 		a->nelems = bswap_32(a->nelems);
379 		return 0;
380 	case BTF_KIND_STRUCT:
381 	case BTF_KIND_UNION:
382 		for (i = 0, m = btf_members(t); i < vlen; i++, m++) {
383 			m->name_off = bswap_32(m->name_off);
384 			m->type = bswap_32(m->type);
385 			m->offset = bswap_32(m->offset);
386 		}
387 		return 0;
388 	case BTF_KIND_FUNC_PROTO:
389 		for (i = 0, p = btf_params(t); i < vlen; i++, p++) {
390 			p->name_off = bswap_32(p->name_off);
391 			p->type = bswap_32(p->type);
392 		}
393 		return 0;
394 	case BTF_KIND_VAR:
395 		btf_var(t)->linkage = bswap_32(btf_var(t)->linkage);
396 		return 0;
397 	case BTF_KIND_DATASEC:
398 		for (i = 0, v = btf_var_secinfos(t); i < vlen; i++, v++) {
399 			v->type = bswap_32(v->type);
400 			v->offset = bswap_32(v->offset);
401 			v->size = bswap_32(v->size);
402 		}
403 		return 0;
404 	case BTF_KIND_DECL_TAG:
405 		btf_decl_tag(t)->component_idx = bswap_32(btf_decl_tag(t)->component_idx);
406 		return 0;
407 	default:
408 		pr_debug("Unsupported BTF_KIND:%u\n", btf_kind(t));
409 		return -EINVAL;
410 	}
411 }
412 
413 static int btf_parse_type_sec(struct btf *btf)
414 {
415 	struct btf_header *hdr = btf->hdr;
416 	void *next_type = btf->types_data;
417 	void *end_type = next_type + hdr->type_len;
418 	int err, type_size;
419 
420 	while (next_type + sizeof(struct btf_type) <= end_type) {
421 		if (btf->swapped_endian)
422 			btf_bswap_type_base(next_type);
423 
424 		type_size = btf_type_size(next_type);
425 		if (type_size < 0)
426 			return type_size;
427 		if (next_type + type_size > end_type) {
428 			pr_warn("BTF type [%d] is malformed\n", btf->start_id + btf->nr_types);
429 			return -EINVAL;
430 		}
431 
432 		if (btf->swapped_endian && btf_bswap_type_rest(next_type))
433 			return -EINVAL;
434 
435 		err = btf_add_type_idx_entry(btf, next_type - btf->types_data);
436 		if (err)
437 			return err;
438 
439 		next_type += type_size;
440 		btf->nr_types++;
441 	}
442 
443 	if (next_type != end_type) {
444 		pr_warn("BTF types data is malformed\n");
445 		return -EINVAL;
446 	}
447 
448 	return 0;
449 }
450 
451 __u32 btf__type_cnt(const struct btf *btf)
452 {
453 	return btf->start_id + btf->nr_types;
454 }
455 
456 const struct btf *btf__base_btf(const struct btf *btf)
457 {
458 	return btf->base_btf;
459 }
460 
461 /* internal helper returning non-const pointer to a type */
462 struct btf_type *btf_type_by_id(const struct btf *btf, __u32 type_id)
463 {
464 	if (type_id == 0)
465 		return &btf_void;
466 	if (type_id < btf->start_id)
467 		return btf_type_by_id(btf->base_btf, type_id);
468 	return btf->types_data + btf->type_offs[type_id - btf->start_id];
469 }
470 
471 const struct btf_type *btf__type_by_id(const struct btf *btf, __u32 type_id)
472 {
473 	if (type_id >= btf->start_id + btf->nr_types)
474 		return errno = EINVAL, NULL;
475 	return btf_type_by_id((struct btf *)btf, type_id);
476 }
477 
478 static int determine_ptr_size(const struct btf *btf)
479 {
480 	static const char * const long_aliases[] = {
481 		"long",
482 		"long int",
483 		"int long",
484 		"unsigned long",
485 		"long unsigned",
486 		"unsigned long int",
487 		"unsigned int long",
488 		"long unsigned int",
489 		"long int unsigned",
490 		"int unsigned long",
491 		"int long unsigned",
492 	};
493 	const struct btf_type *t;
494 	const char *name;
495 	int i, j, n;
496 
497 	if (btf->base_btf && btf->base_btf->ptr_sz > 0)
498 		return btf->base_btf->ptr_sz;
499 
500 	n = btf__type_cnt(btf);
501 	for (i = 1; i < n; i++) {
502 		t = btf__type_by_id(btf, i);
503 		if (!btf_is_int(t))
504 			continue;
505 
506 		if (t->size != 4 && t->size != 8)
507 			continue;
508 
509 		name = btf__name_by_offset(btf, t->name_off);
510 		if (!name)
511 			continue;
512 
513 		for (j = 0; j < ARRAY_SIZE(long_aliases); j++) {
514 			if (strcmp(name, long_aliases[j]) == 0)
515 				return t->size;
516 		}
517 	}
518 
519 	return -1;
520 }
521 
522 static size_t btf_ptr_sz(const struct btf *btf)
523 {
524 	if (!btf->ptr_sz)
525 		((struct btf *)btf)->ptr_sz = determine_ptr_size(btf);
526 	return btf->ptr_sz < 0 ? sizeof(void *) : btf->ptr_sz;
527 }
528 
529 /* Return pointer size this BTF instance assumes. The size is heuristically
530  * determined by looking for 'long' or 'unsigned long' integer type and
531  * recording its size in bytes. If BTF type information doesn't have any such
532  * type, this function returns 0. In the latter case, native architecture's
533  * pointer size is assumed, so will be either 4 or 8, depending on
534  * architecture that libbpf was compiled for. It's possible to override
535  * guessed value by using btf__set_pointer_size() API.
536  */
537 size_t btf__pointer_size(const struct btf *btf)
538 {
539 	if (!btf->ptr_sz)
540 		((struct btf *)btf)->ptr_sz = determine_ptr_size(btf);
541 
542 	if (btf->ptr_sz < 0)
543 		/* not enough BTF type info to guess */
544 		return 0;
545 
546 	return btf->ptr_sz;
547 }
548 
549 /* Override or set pointer size in bytes. Only values of 4 and 8 are
550  * supported.
551  */
552 int btf__set_pointer_size(struct btf *btf, size_t ptr_sz)
553 {
554 	if (ptr_sz != 4 && ptr_sz != 8)
555 		return libbpf_err(-EINVAL);
556 	btf->ptr_sz = ptr_sz;
557 	return 0;
558 }
559 
/* Tell, at compile time, whether the host is big-endian; the build fails
 * on a byte order that is neither little- nor big-endian.
 */
static bool is_host_big_endian(void)
{
#if __BYTE_ORDER__ == __ORDER_BIG_ENDIAN__
	return true;
#elif __BYTE_ORDER__ == __ORDER_LITTLE_ENDIAN__
	return false;
#else
# error "Unrecognized __BYTE_ORDER__"
#endif
}
570 
571 enum btf_endianness btf__endianness(const struct btf *btf)
572 {
573 	if (is_host_big_endian())
574 		return btf->swapped_endian ? BTF_LITTLE_ENDIAN : BTF_BIG_ENDIAN;
575 	else
576 		return btf->swapped_endian ? BTF_BIG_ENDIAN : BTF_LITTLE_ENDIAN;
577 }
578 
579 int btf__set_endianness(struct btf *btf, enum btf_endianness endian)
580 {
581 	if (endian != BTF_LITTLE_ENDIAN && endian != BTF_BIG_ENDIAN)
582 		return libbpf_err(-EINVAL);
583 
584 	btf->swapped_endian = is_host_big_endian() != (endian == BTF_BIG_ENDIAN);
585 	if (!btf->swapped_endian) {
586 		free(btf->raw_data_swapped);
587 		btf->raw_data_swapped = NULL;
588 	}
589 	return 0;
590 }
591 
592 static bool btf_type_is_void(const struct btf_type *t)
593 {
594 	return t == &btf_void || btf_is_fwd(t);
595 }
596 
/* Same as btf_type_is_void(), but a NULL pointer is accepted as well */
static bool btf_type_is_void_or_null(const struct btf_type *t)
{
	return t ? btf_type_is_void(t) : true;
}
601 
602 #define MAX_RESOLVE_DEPTH 32
603 
604 __s64 btf__resolve_size(const struct btf *btf, __u32 type_id)
605 {
606 	const struct btf_array *array;
607 	const struct btf_type *t;
608 	__u32 nelems = 1;
609 	__s64 size = -1;
610 	int i;
611 
612 	t = btf__type_by_id(btf, type_id);
613 	for (i = 0; i < MAX_RESOLVE_DEPTH && !btf_type_is_void_or_null(t); i++) {
614 		switch (btf_kind(t)) {
615 		case BTF_KIND_INT:
616 		case BTF_KIND_STRUCT:
617 		case BTF_KIND_UNION:
618 		case BTF_KIND_ENUM:
619 		case BTF_KIND_ENUM64:
620 		case BTF_KIND_DATASEC:
621 		case BTF_KIND_FLOAT:
622 			size = t->size;
623 			goto done;
624 		case BTF_KIND_PTR:
625 			size = btf_ptr_sz(btf);
626 			goto done;
627 		case BTF_KIND_TYPEDEF:
628 		case BTF_KIND_VOLATILE:
629 		case BTF_KIND_CONST:
630 		case BTF_KIND_RESTRICT:
631 		case BTF_KIND_VAR:
632 		case BTF_KIND_DECL_TAG:
633 		case BTF_KIND_TYPE_TAG:
634 			type_id = t->type;
635 			break;
636 		case BTF_KIND_ARRAY:
637 			array = btf_array(t);
638 			if (nelems && array->nelems > UINT32_MAX / nelems)
639 				return libbpf_err(-E2BIG);
640 			nelems *= array->nelems;
641 			type_id = array->type;
642 			break;
643 		default:
644 			return libbpf_err(-EINVAL);
645 		}
646 
647 		t = btf__type_by_id(btf, type_id);
648 	}
649 
650 done:
651 	if (size < 0)
652 		return libbpf_err(-EINVAL);
653 	if (nelems && size > UINT32_MAX / nelems)
654 		return libbpf_err(-E2BIG);
655 
656 	return nelems * size;
657 }
658 
659 int btf__align_of(const struct btf *btf, __u32 id)
660 {
661 	const struct btf_type *t = btf__type_by_id(btf, id);
662 	__u16 kind = btf_kind(t);
663 
664 	switch (kind) {
665 	case BTF_KIND_INT:
666 	case BTF_KIND_ENUM:
667 	case BTF_KIND_ENUM64:
668 	case BTF_KIND_FLOAT:
669 		return min(btf_ptr_sz(btf), (size_t)t->size);
670 	case BTF_KIND_PTR:
671 		return btf_ptr_sz(btf);
672 	case BTF_KIND_TYPEDEF:
673 	case BTF_KIND_VOLATILE:
674 	case BTF_KIND_CONST:
675 	case BTF_KIND_RESTRICT:
676 	case BTF_KIND_TYPE_TAG:
677 		return btf__align_of(btf, t->type);
678 	case BTF_KIND_ARRAY:
679 		return btf__align_of(btf, btf_array(t)->type);
680 	case BTF_KIND_STRUCT:
681 	case BTF_KIND_UNION: {
682 		const struct btf_member *m = btf_members(t);
683 		__u16 vlen = btf_vlen(t);
684 		int i, max_align = 1, align;
685 
686 		for (i = 0; i < vlen; i++, m++) {
687 			align = btf__align_of(btf, m->type);
688 			if (align <= 0)
689 				return libbpf_err(align);
690 			max_align = max(max_align, align);
691 
692 			/* if field offset isn't aligned according to field
693 			 * type's alignment, then struct must be packed
694 			 */
695 			if (btf_member_bitfield_size(t, i) == 0 &&
696 			    (m->offset % (8 * align)) != 0)
697 				return 1;
698 		}
699 
700 		/* if struct/union size isn't a multiple of its alignment,
701 		 * then struct must be packed
702 		 */
703 		if ((t->size % max_align) != 0)
704 			return 1;
705 
706 		return max_align;
707 	}
708 	default:
709 		pr_warn("unsupported BTF_KIND:%u\n", btf_kind(t));
710 		return errno = EINVAL, 0;
711 	}
712 }
713 
714 int btf__resolve_type(const struct btf *btf, __u32 type_id)
715 {
716 	const struct btf_type *t;
717 	int depth = 0;
718 
719 	t = btf__type_by_id(btf, type_id);
720 	while (depth < MAX_RESOLVE_DEPTH &&
721 	       !btf_type_is_void_or_null(t) &&
722 	       (btf_is_mod(t) || btf_is_typedef(t) || btf_is_var(t))) {
723 		type_id = t->type;
724 		t = btf__type_by_id(btf, type_id);
725 		depth++;
726 	}
727 
728 	if (depth == MAX_RESOLVE_DEPTH || btf_type_is_void_or_null(t))
729 		return libbpf_err(-EINVAL);
730 
731 	return type_id;
732 }
733 
734 __s32 btf__find_by_name(const struct btf *btf, const char *type_name)
735 {
736 	__u32 i, nr_types = btf__type_cnt(btf);
737 
738 	if (!strcmp(type_name, "void"))
739 		return 0;
740 
741 	for (i = 1; i < nr_types; i++) {
742 		const struct btf_type *t = btf__type_by_id(btf, i);
743 		const char *name = btf__name_by_offset(btf, t->name_off);
744 
745 		if (name && !strcmp(type_name, name))
746 			return i;
747 	}
748 
749 	return libbpf_err(-ENOENT);
750 }
751 
752 static __s32 btf_find_by_name_kind(const struct btf *btf, int start_id,
753 				   const char *type_name, __u32 kind)
754 {
755 	__u32 i, nr_types = btf__type_cnt(btf);
756 
757 	if (kind == BTF_KIND_UNKN || !strcmp(type_name, "void"))
758 		return 0;
759 
760 	for (i = start_id; i < nr_types; i++) {
761 		const struct btf_type *t = btf__type_by_id(btf, i);
762 		const char *name;
763 
764 		if (btf_kind(t) != kind)
765 			continue;
766 		name = btf__name_by_offset(btf, t->name_off);
767 		if (name && !strcmp(type_name, name))
768 			return i;
769 	}
770 
771 	return libbpf_err(-ENOENT);
772 }
773 
774 __s32 btf__find_by_name_kind_own(const struct btf *btf, const char *type_name,
775 				 __u32 kind)
776 {
777 	return btf_find_by_name_kind(btf, btf->start_id, type_name, kind);
778 }
779 
780 __s32 btf__find_by_name_kind(const struct btf *btf, const char *type_name,
781 			     __u32 kind)
782 {
783 	return btf_find_by_name_kind(btf, 1, type_name, kind);
784 }
785 
786 static bool btf_is_modifiable(const struct btf *btf)
787 {
788 	return (void *)btf->hdr != btf->raw_data;
789 }
790 
791 void btf__free(struct btf *btf)
792 {
793 	if (IS_ERR_OR_NULL(btf))
794 		return;
795 
796 	if (btf->fd >= 0)
797 		close(btf->fd);
798 
799 	if (btf_is_modifiable(btf)) {
800 		/* if BTF was modified after loading, it will have a split
801 		 * in-memory representation for header, types, and strings
802 		 * sections, so we need to free all of them individually. It
803 		 * might still have a cached contiguous raw data present,
804 		 * which will be unconditionally freed below.
805 		 */
806 		free(btf->hdr);
807 		free(btf->types_data);
808 		strset__free(btf->strs_set);
809 	}
810 	free(btf->raw_data);
811 	free(btf->raw_data_swapped);
812 	free(btf->type_offs);
813 	free(btf);
814 }
815 
816 static struct btf *btf_new_empty(struct btf *base_btf)
817 {
818 	struct btf *btf;
819 
820 	btf = calloc(1, sizeof(*btf));
821 	if (!btf)
822 		return ERR_PTR(-ENOMEM);
823 
824 	btf->nr_types = 0;
825 	btf->start_id = 1;
826 	btf->start_str_off = 0;
827 	btf->fd = -1;
828 	btf->ptr_sz = sizeof(void *);
829 	btf->swapped_endian = false;
830 
831 	if (base_btf) {
832 		btf->base_btf = base_btf;
833 		btf->start_id = btf__type_cnt(base_btf);
834 		btf->start_str_off = base_btf->hdr->str_len;
835 	}
836 
837 	/* +1 for empty string at offset 0 */
838 	btf->raw_size = sizeof(struct btf_header) + (base_btf ? 0 : 1);
839 	btf->raw_data = calloc(1, btf->raw_size);
840 	if (!btf->raw_data) {
841 		free(btf);
842 		return ERR_PTR(-ENOMEM);
843 	}
844 
845 	btf->hdr = btf->raw_data;
846 	btf->hdr->hdr_len = sizeof(struct btf_header);
847 	btf->hdr->magic = BTF_MAGIC;
848 	btf->hdr->version = BTF_VERSION;
849 
850 	btf->types_data = btf->raw_data + btf->hdr->hdr_len;
851 	btf->strs_data = btf->raw_data + btf->hdr->hdr_len;
852 	btf->hdr->str_len = base_btf ? 0 : 1; /* empty string at offset 0 */
853 
854 	return btf;
855 }
856 
/* Public entry point creating an empty base BTF; the result of
 * btf_new_empty() is passed through libbpf_ptr().
 */
struct btf *btf__new_empty(void)
{
	struct btf *btf = btf_new_empty(NULL);

	return libbpf_ptr(btf);
}
861 
/* Public entry point creating an empty BTF split from *base_btf*; the
 * result of btf_new_empty() is passed through libbpf_ptr().
 */
struct btf *btf__new_empty_split(struct btf *base_btf)
{
	struct btf *btf = btf_new_empty(base_btf);

	return libbpf_ptr(btf);
}
866 
867 static struct btf *btf_new(const void *data, __u32 size, struct btf *base_btf)
868 {
869 	struct btf *btf;
870 	int err;
871 
872 	btf = calloc(1, sizeof(struct btf));
873 	if (!btf)
874 		return ERR_PTR(-ENOMEM);
875 
876 	btf->nr_types = 0;
877 	btf->start_id = 1;
878 	btf->start_str_off = 0;
879 	btf->fd = -1;
880 
881 	if (base_btf) {
882 		btf->base_btf = base_btf;
883 		btf->start_id = btf__type_cnt(base_btf);
884 		btf->start_str_off = base_btf->hdr->str_len;
885 	}
886 
887 	btf->raw_data = malloc(size);
888 	if (!btf->raw_data) {
889 		err = -ENOMEM;
890 		goto done;
891 	}
892 	memcpy(btf->raw_data, data, size);
893 	btf->raw_size = size;
894 
895 	btf->hdr = btf->raw_data;
896 	err = btf_parse_hdr(btf);
897 	if (err)
898 		goto done;
899 
900 	btf->strs_data = btf->raw_data + btf->hdr->hdr_len + btf->hdr->str_off;
901 	btf->types_data = btf->raw_data + btf->hdr->hdr_len + btf->hdr->type_off;
902 
903 	err = btf_parse_str_sec(btf);
904 	err = err ?: btf_parse_type_sec(btf);
905 	if (err)
906 		goto done;
907 
908 done:
909 	if (err) {
910 		btf__free(btf);
911 		return ERR_PTR(err);
912 	}
913 
914 	return btf;
915 }
916 
917 struct btf *btf__new(const void *data, __u32 size)
918 {
919 	return libbpf_ptr(btf_new(data, size, NULL));
920 }
921 
922 static struct btf *btf_parse_elf(const char *path, struct btf *base_btf,
923 				 struct btf_ext **btf_ext)
924 {
925 	Elf_Data *btf_data = NULL, *btf_ext_data = NULL;
926 	int err = 0, fd = -1, idx = 0;
927 	struct btf *btf = NULL;
928 	Elf_Scn *scn = NULL;
929 	Elf *elf = NULL;
930 	GElf_Ehdr ehdr;
931 	size_t shstrndx;
932 
933 	if (elf_version(EV_CURRENT) == EV_NONE) {
934 		pr_warn("failed to init libelf for %s\n", path);
935 		return ERR_PTR(-LIBBPF_ERRNO__LIBELF);
936 	}
937 
938 	fd = open(path, O_RDONLY | O_CLOEXEC);
939 	if (fd < 0) {
940 		err = -errno;
941 		pr_warn("failed to open %s: %s\n", path, strerror(errno));
942 		return ERR_PTR(err);
943 	}
944 
945 	err = -LIBBPF_ERRNO__FORMAT;
946 
947 	elf = elf_begin(fd, ELF_C_READ, NULL);
948 	if (!elf) {
949 		pr_warn("failed to open %s as ELF file\n", path);
950 		goto done;
951 	}
952 	if (!gelf_getehdr(elf, &ehdr)) {
953 		pr_warn("failed to get EHDR from %s\n", path);
954 		goto done;
955 	}
956 
957 	if (elf_getshdrstrndx(elf, &shstrndx)) {
958 		pr_warn("failed to get section names section index for %s\n",
959 			path);
960 		goto done;
961 	}
962 
963 	if (!elf_rawdata(elf_getscn(elf, shstrndx), NULL)) {
964 		pr_warn("failed to get e_shstrndx from %s\n", path);
965 		goto done;
966 	}
967 
968 	while ((scn = elf_nextscn(elf, scn)) != NULL) {
969 		GElf_Shdr sh;
970 		char *name;
971 
972 		idx++;
973 		if (gelf_getshdr(scn, &sh) != &sh) {
974 			pr_warn("failed to get section(%d) header from %s\n",
975 				idx, path);
976 			goto done;
977 		}
978 		name = elf_strptr(elf, shstrndx, sh.sh_name);
979 		if (!name) {
980 			pr_warn("failed to get section(%d) name from %s\n",
981 				idx, path);
982 			goto done;
983 		}
984 		if (strcmp(name, BTF_ELF_SEC) == 0) {
985 			btf_data = elf_getdata(scn, 0);
986 			if (!btf_data) {
987 				pr_warn("failed to get section(%d, %s) data from %s\n",
988 					idx, name, path);
989 				goto done;
990 			}
991 			continue;
992 		} else if (btf_ext && strcmp(name, BTF_EXT_ELF_SEC) == 0) {
993 			btf_ext_data = elf_getdata(scn, 0);
994 			if (!btf_ext_data) {
995 				pr_warn("failed to get section(%d, %s) data from %s\n",
996 					idx, name, path);
997 				goto done;
998 			}
999 			continue;
1000 		}
1001 	}
1002 
1003 	if (!btf_data) {
1004 		pr_warn("failed to find '%s' ELF section in %s\n", BTF_ELF_SEC, path);
1005 		err = -ENODATA;
1006 		goto done;
1007 	}
1008 	btf = btf_new(btf_data->d_buf, btf_data->d_size, base_btf);
1009 	err = libbpf_get_error(btf);
1010 	if (err)
1011 		goto done;
1012 
1013 	switch (gelf_getclass(elf)) {
1014 	case ELFCLASS32:
1015 		btf__set_pointer_size(btf, 4);
1016 		break;
1017 	case ELFCLASS64:
1018 		btf__set_pointer_size(btf, 8);
1019 		break;
1020 	default:
1021 		pr_warn("failed to get ELF class (bitness) for %s\n", path);
1022 		break;
1023 	}
1024 
1025 	if (btf_ext && btf_ext_data) {
1026 		*btf_ext = btf_ext__new(btf_ext_data->d_buf, btf_ext_data->d_size);
1027 		err = libbpf_get_error(*btf_ext);
1028 		if (err)
1029 			goto done;
1030 	} else if (btf_ext) {
1031 		*btf_ext = NULL;
1032 	}
1033 done:
1034 	if (elf)
1035 		elf_end(elf);
1036 	close(fd);
1037 
1038 	if (!err)
1039 		return btf;
1040 
1041 	if (btf_ext)
1042 		btf_ext__free(*btf_ext);
1043 	btf__free(btf);
1044 
1045 	return ERR_PTR(err);
1046 }
1047 
/* Public entry point parsing base BTF (and optionally .BTF.ext) from an
 * ELF file; the result of btf_parse_elf() is passed through libbpf_ptr().
 */
struct btf *btf__parse_elf(const char *path, struct btf_ext **btf_ext)
{
	struct btf *btf = btf_parse_elf(path, NULL, btf_ext);

	return libbpf_ptr(btf);
}
1052 
/* Public entry point parsing split BTF on top of *base_btf* from an ELF
 * file; the result of btf_parse_elf() is passed through libbpf_ptr().
 */
struct btf *btf__parse_elf_split(const char *path, struct btf *base_btf)
{
	struct btf *btf = btf_parse_elf(path, base_btf, NULL);

	return libbpf_ptr(btf);
}
1057 
1058 static struct btf *btf_parse_raw(const char *path, struct btf *base_btf)
1059 {
1060 	struct btf *btf = NULL;
1061 	void *data = NULL;
1062 	FILE *f = NULL;
1063 	__u16 magic;
1064 	int err = 0;
1065 	long sz;
1066 
1067 	f = fopen(path, "rb");
1068 	if (!f) {
1069 		err = -errno;
1070 		goto err_out;
1071 	}
1072 
1073 	/* check BTF magic */
1074 	if (fread(&magic, 1, sizeof(magic), f) < sizeof(magic)) {
1075 		err = -EIO;
1076 		goto err_out;
1077 	}
1078 	if (magic != BTF_MAGIC && magic != bswap_16(BTF_MAGIC)) {
1079 		/* definitely not a raw BTF */
1080 		err = -EPROTO;
1081 		goto err_out;
1082 	}
1083 
1084 	/* get file size */
1085 	if (fseek(f, 0, SEEK_END)) {
1086 		err = -errno;
1087 		goto err_out;
1088 	}
1089 	sz = ftell(f);
1090 	if (sz < 0) {
1091 		err = -errno;
1092 		goto err_out;
1093 	}
1094 	/* rewind to the start */
1095 	if (fseek(f, 0, SEEK_SET)) {
1096 		err = -errno;
1097 		goto err_out;
1098 	}
1099 
1100 	/* pre-alloc memory and read all of BTF data */
1101 	data = malloc(sz);
1102 	if (!data) {
1103 		err = -ENOMEM;
1104 		goto err_out;
1105 	}
1106 	if (fread(data, 1, sz, f) < sz) {
1107 		err = -EIO;
1108 		goto err_out;
1109 	}
1110 
1111 	/* finally parse BTF data */
1112 	btf = btf_new(data, sz, base_btf);
1113 
1114 err_out:
1115 	free(data);
1116 	if (f)
1117 		fclose(f);
1118 	return err ? ERR_PTR(err) : btf;
1119 }
1120 
/* Parse the raw BTF file at *path* with no base BTF; the result of
 * btf_parse_raw() is passed through libbpf_ptr().
 */
struct btf *btf__parse_raw(const char *path)
{
	struct btf *parsed;

	parsed = btf_parse_raw(path, NULL);
	return libbpf_ptr(parsed);
}
1125 
/* Parse the raw BTF file at *path* as split BTF on top of *base_btf*; the
 * result of btf_parse_raw() is passed through libbpf_ptr().
 */
struct btf *btf__parse_raw_split(const char *path, struct btf *base_btf)
{
	struct btf *parsed;

	parsed = btf_parse_raw(path, base_btf);
	return libbpf_ptr(parsed);
}
1130 
/* Parse BTF from *path*, trying the raw BTF format first and falling back
 * to ELF only when the raw parser reports -EPROTO.
 *
 * If *btf_ext* is non-NULL, it is reset to NULL up front; only the ELF
 * path gets a chance to fill it in.
 *
 * Returns the parsed BTF, or ERR_PTR() with the raw parser's error for
 * any failure other than -EPROTO, or whatever btf_parse_elf() returns.
 */
static struct btf *btf_parse(const char *path, struct btf *base_btf, struct btf_ext **btf_ext)
{
	struct btf *raw;
	int err;

	if (btf_ext)
		*btf_ext = NULL;

	raw = btf_parse_raw(path, base_btf);
	err = libbpf_get_error(raw);

	/* -EPROTO is the raw parser's "this is not raw BTF" signal */
	if (err == -EPROTO)
		return btf_parse_elf(path, base_btf, btf_ext);

	return err ? ERR_PTR(err) : raw;
}
1147 
/* Parse BTF from *path* (raw or ELF, see btf_parse()) with no base BTF;
 * *btf_ext* is forwarded unchanged. The result is passed through
 * libbpf_ptr().
 */
struct btf *btf__parse(const char *path, struct btf_ext **btf_ext)
{
	struct btf *parsed;

	parsed = btf_parse(path, NULL, btf_ext);
	return libbpf_ptr(parsed);
}
1152 
/* Parse split BTF from *path* (raw or ELF, see btf_parse()) on top of
 * *base_btf*; no btf_ext output is requested. The result is passed
 * through libbpf_ptr().
 */
struct btf *btf__parse_split(const char *path, struct btf *base_btf)
{
	struct btf *parsed;

	parsed = btf_parse(path, base_btf, NULL);
	return libbpf_ptr(parsed);
}
1157 
1158 static void *btf_get_raw_data(const struct btf *btf, __u32 *size, bool swap_endian);
1159 
1160 int btf_load_into_kernel(struct btf *btf, char *log_buf, size_t log_sz, __u32 log_level)
1161 {
1162 	LIBBPF_OPTS(bpf_btf_load_opts, opts);
1163 	__u32 buf_sz = 0, raw_size;
1164 	char *buf = NULL, *tmp;
1165 	void *raw_data;
1166 	int err = 0;
1167 
1168 	if (btf->fd >= 0)
1169 		return libbpf_err(-EEXIST);
1170 	if (log_sz && !log_buf)
1171 		return libbpf_err(-EINVAL);
1172 
1173 	/* cache native raw data representation */
1174 	raw_data = btf_get_raw_data(btf, &raw_size, false);
1175 	if (!raw_data) {
1176 		err = -ENOMEM;
1177 		goto done;
1178 	}
1179 	btf->raw_size = raw_size;
1180 	btf->raw_data = raw_data;
1181 
1182 retry_load:
1183 	/* if log_level is 0, we won't provide log_buf/log_size to the kernel,
1184 	 * initially. Only if BTF loading fails, we bump log_level to 1 and
1185 	 * retry, using either auto-allocated or custom log_buf. This way
1186 	 * non-NULL custom log_buf provides a buffer just in case, but hopes
1187 	 * for successful load and no need for log_buf.
1188 	 */
1189 	if (log_level) {
1190 		/* if caller didn't provide custom log_buf, we'll keep
1191 		 * allocating our own progressively bigger buffers for BTF
1192 		 * verification log
1193 		 */
1194 		if (!log_buf) {
1195 			buf_sz = max((__u32)BPF_LOG_BUF_SIZE, buf_sz * 2);
1196 			tmp = realloc(buf, buf_sz);
1197 			if (!tmp) {
1198 				err = -ENOMEM;
1199 				goto done;
1200 			}
1201 			buf = tmp;
1202 			buf[0] = '\0';
1203 		}
1204 
1205 		opts.log_buf = log_buf ? log_buf : buf;
1206 		opts.log_size = log_buf ? log_sz : buf_sz;
1207 		opts.log_level = log_level;
1208 	}
1209 
1210 	btf->fd = bpf_btf_load(raw_data, raw_size, &opts);
1211 	if (btf->fd < 0) {
1212 		/* time to turn on verbose mode and try again */
1213 		if (log_level == 0) {
1214 			log_level = 1;
1215 			goto retry_load;
1216 		}
1217 		/* only retry if caller didn't provide custom log_buf, but
1218 		 * make sure we can never overflow buf_sz
1219 		 */
1220 		if (!log_buf && errno == ENOSPC && buf_sz <= UINT_MAX / 2)
1221 			goto retry_load;
1222 
1223 		err = -errno;
1224 		pr_warn("BTF loading error: %d\n", err);
1225 		/* don't print out contents of custom log_buf */
1226 		if (!log_buf && buf[0])
1227 			pr_warn("-- BEGIN BTF LOAD LOG ---\n%s\n-- END BTF LOAD LOG --\n", buf);
1228 	}
1229 
1230 done:
1231 	free(buf);
1232 	return libbpf_err(err);
1233 }
1234 
/* Load *btf* into the kernel with no caller-provided log buffer and an
 * initial log level of 0; see btf_load_into_kernel() for return values.
 */
int btf__load_into_kernel(struct btf *btf)
{
	char *no_log_buf = NULL;

	return btf_load_into_kernel(btf, no_log_buf, 0, 0);
}
1239 
1240 int btf__fd(const struct btf *btf)
1241 {
1242 	return btf->fd;
1243 }
1244 
1245 void btf__set_fd(struct btf *btf, int fd)
1246 {
1247 	btf->fd = fd;
1248 }
1249 
1250 static const void *btf_strs_data(const struct btf *btf)
1251 {
1252 	return btf->strs_data ? btf->strs_data : strset__data(btf->strs_set);
1253 }
1254 
1255 static void *btf_get_raw_data(const struct btf *btf, __u32 *size, bool swap_endian)
1256 {
1257 	struct btf_header *hdr = btf->hdr;
1258 	struct btf_type *t;
1259 	void *data, *p;
1260 	__u32 data_sz;
1261 	int i;
1262 
1263 	data = swap_endian ? btf->raw_data_swapped : btf->raw_data;
1264 	if (data) {
1265 		*size = btf->raw_size;
1266 		return data;
1267 	}
1268 
1269 	data_sz = hdr->hdr_len + hdr->type_len + hdr->str_len;
1270 	data = calloc(1, data_sz);
1271 	if (!data)
1272 		return NULL;
1273 	p = data;
1274 
1275 	memcpy(p, hdr, hdr->hdr_len);
1276 	if (swap_endian)
1277 		btf_bswap_hdr(p);
1278 	p += hdr->hdr_len;
1279 
1280 	memcpy(p, btf->types_data, hdr->type_len);
1281 	if (swap_endian) {
1282 		for (i = 0; i < btf->nr_types; i++) {
1283 			t = p + btf->type_offs[i];
1284 			/* btf_bswap_type_rest() relies on native t->info, so
1285 			 * we swap base type info after we swapped all the
1286 			 * additional information
1287 			 */
1288 			if (btf_bswap_type_rest(t))
1289 				goto err_out;
1290 			btf_bswap_type_base(t);
1291 		}
1292 	}
1293 	p += hdr->type_len;
1294 
1295 	memcpy(p, btf_strs_data(btf), hdr->str_len);
1296 	p += hdr->str_len;
1297 
1298 	*size = data_sz;
1299 	return data;
1300 err_out:
1301 	free(data);
1302 	return NULL;
1303 }
1304 
1305 const void *btf__raw_data(const struct btf *btf_ro, __u32 *size)
1306 {
1307 	struct btf *btf = (struct btf *)btf_ro;
1308 	__u32 data_sz;
1309 	void *data;
1310 
1311 	data = btf_get_raw_data(btf, &data_sz, btf->swapped_endian);
1312 	if (!data)
1313 		return errno = ENOMEM, NULL;
1314 
1315 	btf->raw_size = data_sz;
1316 	if (btf->swapped_endian)
1317 		btf->raw_data_swapped = data;
1318 	else
1319 		btf->raw_data = data;
1320 	*size = data_sz;
1321 	return data;
1322 }
1323 
1324 __attribute__((alias("btf__raw_data")))
1325 const void *btf__get_raw_data(const struct btf *btf, __u32 *size);
1326 
1327 const char *btf__str_by_offset(const struct btf *btf, __u32 offset)
1328 {
1329 	if (offset < btf->start_str_off)
1330 		return btf__str_by_offset(btf->base_btf, offset);
1331 	else if (offset - btf->start_str_off < btf->hdr->str_len)
1332 		return btf_strs_data(btf) + (offset - btf->start_str_off);
1333 	else
1334 		return errno = EINVAL, NULL;
1335 }
1336 
1337 const char *btf__name_by_offset(const struct btf *btf, __u32 offset)
1338 {
1339 	return btf__str_by_offset(btf, offset);
1340 }
1341 
1342 struct btf *btf_get_from_fd(int btf_fd, struct btf *base_btf)
1343 {
1344 	struct bpf_btf_info btf_info;
1345 	__u32 len = sizeof(btf_info);
1346 	__u32 last_size;
1347 	struct btf *btf;
1348 	void *ptr;
1349 	int err;
1350 
1351 	/* we won't know btf_size until we call bpf_btf_get_info_by_fd(). so
1352 	 * let's start with a sane default - 4KiB here - and resize it only if
1353 	 * bpf_btf_get_info_by_fd() needs a bigger buffer.
1354 	 */
1355 	last_size = 4096;
1356 	ptr = malloc(last_size);
1357 	if (!ptr)
1358 		return ERR_PTR(-ENOMEM);
1359 
1360 	memset(&btf_info, 0, sizeof(btf_info));
1361 	btf_info.btf = ptr_to_u64(ptr);
1362 	btf_info.btf_size = last_size;
1363 	err = bpf_btf_get_info_by_fd(btf_fd, &btf_info, &len);
1364 
1365 	if (!err && btf_info.btf_size > last_size) {
1366 		void *temp_ptr;
1367 
1368 		last_size = btf_info.btf_size;
1369 		temp_ptr = realloc(ptr, last_size);
1370 		if (!temp_ptr) {
1371 			btf = ERR_PTR(-ENOMEM);
1372 			goto exit_free;
1373 		}
1374 		ptr = temp_ptr;
1375 
1376 		len = sizeof(btf_info);
1377 		memset(&btf_info, 0, sizeof(btf_info));
1378 		btf_info.btf = ptr_to_u64(ptr);
1379 		btf_info.btf_size = last_size;
1380 
1381 		err = bpf_btf_get_info_by_fd(btf_fd, &btf_info, &len);
1382 	}
1383 
1384 	if (err || btf_info.btf_size > last_size) {
1385 		btf = err ? ERR_PTR(-errno) : ERR_PTR(-E2BIG);
1386 		goto exit_free;
1387 	}
1388 
1389 	btf = btf_new(ptr, btf_info.btf_size, base_btf);
1390 
1391 exit_free:
1392 	free(ptr);
1393 	return btf;
1394 }
1395 
1396 struct btf *btf__load_from_kernel_by_id_split(__u32 id, struct btf *base_btf)
1397 {
1398 	struct btf *btf;
1399 	int btf_fd;
1400 
1401 	btf_fd = bpf_btf_get_fd_by_id(id);
1402 	if (btf_fd < 0)
1403 		return libbpf_err_ptr(-errno);
1404 
1405 	btf = btf_get_from_fd(btf_fd, base_btf);
1406 	close(btf_fd);
1407 
1408 	return libbpf_ptr(btf);
1409 }
1410 
1411 struct btf *btf__load_from_kernel_by_id(__u32 id)
1412 {
1413 	return btf__load_from_kernel_by_id_split(id, NULL);
1414 }
1415 
1416 static void btf_invalidate_raw_data(struct btf *btf)
1417 {
1418 	if (btf->raw_data) {
1419 		free(btf->raw_data);
1420 		btf->raw_data = NULL;
1421 	}
1422 	if (btf->raw_data_swapped) {
1423 		free(btf->raw_data_swapped);
1424 		btf->raw_data_swapped = NULL;
1425 	}
1426 }
1427 
1428 /* Ensure BTF is ready to be modified (by splitting into a three memory
1429  * regions for header, types, and strings). Also invalidate cached
1430  * raw_data, if any.
1431  */
1432 static int btf_ensure_modifiable(struct btf *btf)
1433 {
1434 	void *hdr, *types;
1435 	struct strset *set = NULL;
1436 	int err = -ENOMEM;
1437 
1438 	if (btf_is_modifiable(btf)) {
1439 		/* any BTF modification invalidates raw_data */
1440 		btf_invalidate_raw_data(btf);
1441 		return 0;
1442 	}
1443 
1444 	/* split raw data into three memory regions */
1445 	hdr = malloc(btf->hdr->hdr_len);
1446 	types = malloc(btf->hdr->type_len);
1447 	if (!hdr || !types)
1448 		goto err_out;
1449 
1450 	memcpy(hdr, btf->hdr, btf->hdr->hdr_len);
1451 	memcpy(types, btf->types_data, btf->hdr->type_len);
1452 
1453 	/* build lookup index for all strings */
1454 	set = strset__new(BTF_MAX_STR_OFFSET, btf->strs_data, btf->hdr->str_len);
1455 	if (IS_ERR(set)) {
1456 		err = PTR_ERR(set);
1457 		goto err_out;
1458 	}
1459 
1460 	/* only when everything was successful, update internal state */
1461 	btf->hdr = hdr;
1462 	btf->types_data = types;
1463 	btf->types_data_cap = btf->hdr->type_len;
1464 	btf->strs_data = NULL;
1465 	btf->strs_set = set;
1466 	/* if BTF was created from scratch, all strings are guaranteed to be
1467 	 * unique and deduplicated
1468 	 */
1469 	if (btf->hdr->str_len == 0)
1470 		btf->strs_deduped = true;
1471 	if (!btf->base_btf && btf->hdr->str_len == 1)
1472 		btf->strs_deduped = true;
1473 
1474 	/* invalidate raw_data representation */
1475 	btf_invalidate_raw_data(btf);
1476 
1477 	return 0;
1478 
1479 err_out:
1480 	strset__free(set);
1481 	free(hdr);
1482 	free(types);
1483 	return err;
1484 }
1485 
1486 /* Find an offset in BTF string section that corresponds to a given string *s*.
1487  * Returns:
1488  *   - >0 offset into string section, if string is found;
1489  *   - -ENOENT, if string is not in the string section;
1490  *   - <0, on any other error.
1491  */
1492 int btf__find_str(struct btf *btf, const char *s)
1493 {
1494 	int off;
1495 
1496 	if (btf->base_btf) {
1497 		off = btf__find_str(btf->base_btf, s);
1498 		if (off != -ENOENT)
1499 			return off;
1500 	}
1501 
1502 	/* BTF needs to be in a modifiable state to build string lookup index */
1503 	if (btf_ensure_modifiable(btf))
1504 		return libbpf_err(-ENOMEM);
1505 
1506 	off = strset__find_str(btf->strs_set, s);
1507 	if (off < 0)
1508 		return libbpf_err(off);
1509 
1510 	return btf->start_str_off + off;
1511 }
1512 
1513 /* Add a string s to the BTF string section.
1514  * Returns:
1515  *   - > 0 offset into string section, on success;
1516  *   - < 0, on error.
1517  */
1518 int btf__add_str(struct btf *btf, const char *s)
1519 {
1520 	int off;
1521 
1522 	if (btf->base_btf) {
1523 		off = btf__find_str(btf->base_btf, s);
1524 		if (off != -ENOENT)
1525 			return off;
1526 	}
1527 
1528 	if (btf_ensure_modifiable(btf))
1529 		return libbpf_err(-ENOMEM);
1530 
1531 	off = strset__add_str(btf->strs_set, s);
1532 	if (off < 0)
1533 		return libbpf_err(off);
1534 
1535 	btf->hdr->str_len = strset__data_size(btf->strs_set);
1536 
1537 	return btf->start_str_off + off;
1538 }
1539 
1540 static void *btf_add_type_mem(struct btf *btf, size_t add_sz)
1541 {
1542 	return libbpf_add_mem(&btf->types_data, &btf->types_data_cap, 1,
1543 			      btf->hdr->type_len, UINT_MAX, add_sz);
1544 }
1545 
1546 static void btf_type_inc_vlen(struct btf_type *t)
1547 {
1548 	t->info = btf_type_info(btf_kind(t), btf_vlen(t) + 1, btf_kflag(t));
1549 }
1550 
1551 static int btf_commit_type(struct btf *btf, int data_sz)
1552 {
1553 	int err;
1554 
1555 	err = btf_add_type_idx_entry(btf, btf->hdr->type_len);
1556 	if (err)
1557 		return libbpf_err(err);
1558 
1559 	btf->hdr->type_len += data_sz;
1560 	btf->hdr->str_off += data_sz;
1561 	btf->nr_types++;
1562 	return btf->start_id + btf->nr_types - 1;
1563 }
1564 
/* Context for copying types from one BTF object into another */
struct btf_pipe {
	/* BTF whose strings are being read */
	const struct btf *src;
	/* BTF that strings are added to */
	struct btf *dst;
	/* optional src -> dst string offset cache; may be NULL */
	struct hashmap *str_off_map;
};
1570 
1571 static int btf_rewrite_str(__u32 *str_off, void *ctx)
1572 {
1573 	struct btf_pipe *p = ctx;
1574 	long mapped_off;
1575 	int off, err;
1576 
1577 	if (!*str_off) /* nothing to do for empty strings */
1578 		return 0;
1579 
1580 	if (p->str_off_map &&
1581 	    hashmap__find(p->str_off_map, *str_off, &mapped_off)) {
1582 		*str_off = mapped_off;
1583 		return 0;
1584 	}
1585 
1586 	off = btf__add_str(p->dst, btf__str_by_offset(p->src, *str_off));
1587 	if (off < 0)
1588 		return off;
1589 
1590 	/* Remember string mapping from src to dst.  It avoids
1591 	 * performing expensive string comparisons.
1592 	 */
1593 	if (p->str_off_map) {
1594 		err = hashmap__append(p->str_off_map, *str_off, off);
1595 		if (err)
1596 			return err;
1597 	}
1598 
1599 	*str_off = off;
1600 	return 0;
1601 }
1602 
1603 int btf__add_type(struct btf *btf, const struct btf *src_btf, const struct btf_type *src_type)
1604 {
1605 	struct btf_pipe p = { .src = src_btf, .dst = btf };
1606 	struct btf_type *t;
1607 	int sz, err;
1608 
1609 	sz = btf_type_size(src_type);
1610 	if (sz < 0)
1611 		return libbpf_err(sz);
1612 
1613 	/* deconstruct BTF, if necessary, and invalidate raw_data */
1614 	if (btf_ensure_modifiable(btf))
1615 		return libbpf_err(-ENOMEM);
1616 
1617 	t = btf_add_type_mem(btf, sz);
1618 	if (!t)
1619 		return libbpf_err(-ENOMEM);
1620 
1621 	memcpy(t, src_type, sz);
1622 
1623 	err = btf_type_visit_str_offs(t, btf_rewrite_str, &p);
1624 	if (err)
1625 		return libbpf_err(err);
1626 
1627 	return btf_commit_type(btf, sz);
1628 }
1629 
1630 static int btf_rewrite_type_ids(__u32 *type_id, void *ctx)
1631 {
1632 	struct btf *btf = ctx;
1633 
1634 	if (!*type_id) /* nothing to do for VOID references */
1635 		return 0;
1636 
1637 	/* we haven't updated btf's type count yet, so
1638 	 * btf->start_id + btf->nr_types - 1 is the type ID offset we should
1639 	 * add to all newly added BTF types
1640 	 */
1641 	*type_id += btf->start_id + btf->nr_types - 1;
1642 	return 0;
1643 }
1644 
1645 static size_t btf_dedup_identity_hash_fn(long key, void *ctx);
1646 static bool btf_dedup_equal_fn(long k1, long k2, void *ctx);
1647 
1648 int btf__add_btf(struct btf *btf, const struct btf *src_btf)
1649 {
1650 	struct btf_pipe p = { .src = src_btf, .dst = btf };
1651 	int data_sz, sz, cnt, i, err, old_strs_len;
1652 	__u32 *off;
1653 	void *t;
1654 
1655 	/* appending split BTF isn't supported yet */
1656 	if (src_btf->base_btf)
1657 		return libbpf_err(-ENOTSUP);
1658 
1659 	/* deconstruct BTF, if necessary, and invalidate raw_data */
1660 	if (btf_ensure_modifiable(btf))
1661 		return libbpf_err(-ENOMEM);
1662 
1663 	/* remember original strings section size if we have to roll back
1664 	 * partial strings section changes
1665 	 */
1666 	old_strs_len = btf->hdr->str_len;
1667 
1668 	data_sz = src_btf->hdr->type_len;
1669 	cnt = btf__type_cnt(src_btf) - 1;
1670 
1671 	/* pre-allocate enough memory for new types */
1672 	t = btf_add_type_mem(btf, data_sz);
1673 	if (!t)
1674 		return libbpf_err(-ENOMEM);
1675 
1676 	/* pre-allocate enough memory for type offset index for new types */
1677 	off = btf_add_type_offs_mem(btf, cnt);
1678 	if (!off)
1679 		return libbpf_err(-ENOMEM);
1680 
1681 	/* Map the string offsets from src_btf to the offsets from btf to improve performance */
1682 	p.str_off_map = hashmap__new(btf_dedup_identity_hash_fn, btf_dedup_equal_fn, NULL);
1683 	if (IS_ERR(p.str_off_map))
1684 		return libbpf_err(-ENOMEM);
1685 
1686 	/* bulk copy types data for all types from src_btf */
1687 	memcpy(t, src_btf->types_data, data_sz);
1688 
1689 	for (i = 0; i < cnt; i++) {
1690 		sz = btf_type_size(t);
1691 		if (sz < 0) {
1692 			/* unlikely, has to be corrupted src_btf */
1693 			err = sz;
1694 			goto err_out;
1695 		}
1696 
1697 		/* fill out type ID to type offset mapping for lookups by type ID */
1698 		*off = t - btf->types_data;
1699 
1700 		/* add, dedup, and remap strings referenced by this BTF type */
1701 		err = btf_type_visit_str_offs(t, btf_rewrite_str, &p);
1702 		if (err)
1703 			goto err_out;
1704 
1705 		/* remap all type IDs referenced from this BTF type */
1706 		err = btf_type_visit_type_ids(t, btf_rewrite_type_ids, btf);
1707 		if (err)
1708 			goto err_out;
1709 
1710 		/* go to next type data and type offset index entry */
1711 		t += sz;
1712 		off++;
1713 	}
1714 
1715 	/* Up until now any of the copied type data was effectively invisible,
1716 	 * so if we exited early before this point due to error, BTF would be
1717 	 * effectively unmodified. There would be extra internal memory
1718 	 * pre-allocated, but it would not be available for querying.  But now
1719 	 * that we've copied and rewritten all the data successfully, we can
1720 	 * update type count and various internal offsets and sizes to
1721 	 * "commit" the changes and made them visible to the outside world.
1722 	 */
1723 	btf->hdr->type_len += data_sz;
1724 	btf->hdr->str_off += data_sz;
1725 	btf->nr_types += cnt;
1726 
1727 	hashmap__free(p.str_off_map);
1728 
1729 	/* return type ID of the first added BTF type */
1730 	return btf->start_id + btf->nr_types - cnt;
1731 err_out:
1732 	/* zero out preallocated memory as if it was just allocated with
1733 	 * libbpf_add_mem()
1734 	 */
1735 	memset(btf->types_data + btf->hdr->type_len, 0, data_sz);
1736 	memset(btf->strs_data + old_strs_len, 0, btf->hdr->str_len - old_strs_len);
1737 
1738 	/* and now restore original strings section size; types data size
1739 	 * wasn't modified, so doesn't need restoring, see big comment above
1740 	 */
1741 	btf->hdr->str_len = old_strs_len;
1742 
1743 	hashmap__free(p.str_off_map);
1744 
1745 	return libbpf_err(err);
1746 }
1747 
1748 /*
1749  * Append new BTF_KIND_INT type with:
1750  *   - *name* - non-empty, non-NULL type name;
1751  *   - *sz* - power-of-2 (1, 2, 4, ..) size of the type, in bytes;
1752  *   - encoding is a combination of BTF_INT_SIGNED, BTF_INT_CHAR, BTF_INT_BOOL.
1753  * Returns:
1754  *   - >0, type ID of newly added BTF type;
1755  *   - <0, on error.
1756  */
1757 int btf__add_int(struct btf *btf, const char *name, size_t byte_sz, int encoding)
1758 {
1759 	struct btf_type *t;
1760 	int sz, name_off;
1761 
1762 	/* non-empty name */
1763 	if (!name || !name[0])
1764 		return libbpf_err(-EINVAL);
1765 	/* byte_sz must be power of 2 */
1766 	if (!byte_sz || (byte_sz & (byte_sz - 1)) || byte_sz > 16)
1767 		return libbpf_err(-EINVAL);
1768 	if (encoding & ~(BTF_INT_SIGNED | BTF_INT_CHAR | BTF_INT_BOOL))
1769 		return libbpf_err(-EINVAL);
1770 
1771 	/* deconstruct BTF, if necessary, and invalidate raw_data */
1772 	if (btf_ensure_modifiable(btf))
1773 		return libbpf_err(-ENOMEM);
1774 
1775 	sz = sizeof(struct btf_type) + sizeof(int);
1776 	t = btf_add_type_mem(btf, sz);
1777 	if (!t)
1778 		return libbpf_err(-ENOMEM);
1779 
1780 	/* if something goes wrong later, we might end up with an extra string,
1781 	 * but that shouldn't be a problem, because BTF can't be constructed
1782 	 * completely anyway and will most probably be just discarded
1783 	 */
1784 	name_off = btf__add_str(btf, name);
1785 	if (name_off < 0)
1786 		return name_off;
1787 
1788 	t->name_off = name_off;
1789 	t->info = btf_type_info(BTF_KIND_INT, 0, 0);
1790 	t->size = byte_sz;
1791 	/* set INT info, we don't allow setting legacy bit offset/size */
1792 	*(__u32 *)(t + 1) = (encoding << 24) | (byte_sz * 8);
1793 
1794 	return btf_commit_type(btf, sz);
1795 }
1796 
1797 /*
1798  * Append new BTF_KIND_FLOAT type with:
1799  *   - *name* - non-empty, non-NULL type name;
1800  *   - *sz* - size of the type, in bytes;
1801  * Returns:
1802  *   - >0, type ID of newly added BTF type;
1803  *   - <0, on error.
1804  */
1805 int btf__add_float(struct btf *btf, const char *name, size_t byte_sz)
1806 {
1807 	struct btf_type *t;
1808 	int sz, name_off;
1809 
1810 	/* non-empty name */
1811 	if (!name || !name[0])
1812 		return libbpf_err(-EINVAL);
1813 
1814 	/* byte_sz must be one of the explicitly allowed values */
1815 	if (byte_sz != 2 && byte_sz != 4 && byte_sz != 8 && byte_sz != 12 &&
1816 	    byte_sz != 16)
1817 		return libbpf_err(-EINVAL);
1818 
1819 	if (btf_ensure_modifiable(btf))
1820 		return libbpf_err(-ENOMEM);
1821 
1822 	sz = sizeof(struct btf_type);
1823 	t = btf_add_type_mem(btf, sz);
1824 	if (!t)
1825 		return libbpf_err(-ENOMEM);
1826 
1827 	name_off = btf__add_str(btf, name);
1828 	if (name_off < 0)
1829 		return name_off;
1830 
1831 	t->name_off = name_off;
1832 	t->info = btf_type_info(BTF_KIND_FLOAT, 0, 0);
1833 	t->size = byte_sz;
1834 
1835 	return btf_commit_type(btf, sz);
1836 }
1837 
1838 /* it's completely legal to append BTF types with type IDs pointing forward to
1839  * types that haven't been appended yet, so we only make sure that id looks
1840  * sane, we can't guarantee that ID will always be valid
1841  */
1842 static int validate_type_id(int id)
1843 {
1844 	if (id < 0 || id > BTF_MAX_NR_TYPES)
1845 		return -EINVAL;
1846 	return 0;
1847 }
1848 
1849 /* generic append function for PTR, TYPEDEF, CONST/VOLATILE/RESTRICT */
1850 static int btf_add_ref_kind(struct btf *btf, int kind, const char *name, int ref_type_id)
1851 {
1852 	struct btf_type *t;
1853 	int sz, name_off = 0;
1854 
1855 	if (validate_type_id(ref_type_id))
1856 		return libbpf_err(-EINVAL);
1857 
1858 	if (btf_ensure_modifiable(btf))
1859 		return libbpf_err(-ENOMEM);
1860 
1861 	sz = sizeof(struct btf_type);
1862 	t = btf_add_type_mem(btf, sz);
1863 	if (!t)
1864 		return libbpf_err(-ENOMEM);
1865 
1866 	if (name && name[0]) {
1867 		name_off = btf__add_str(btf, name);
1868 		if (name_off < 0)
1869 			return name_off;
1870 	}
1871 
1872 	t->name_off = name_off;
1873 	t->info = btf_type_info(kind, 0, 0);
1874 	t->type = ref_type_id;
1875 
1876 	return btf_commit_type(btf, sz);
1877 }
1878 
1879 /*
1880  * Append new BTF_KIND_PTR type with:
1881  *   - *ref_type_id* - referenced type ID, it might not exist yet;
1882  * Returns:
1883  *   - >0, type ID of newly added BTF type;
1884  *   - <0, on error.
1885  */
1886 int btf__add_ptr(struct btf *btf, int ref_type_id)
1887 {
1888 	return btf_add_ref_kind(btf, BTF_KIND_PTR, NULL, ref_type_id);
1889 }
1890 
1891 /*
1892  * Append new BTF_KIND_ARRAY type with:
1893  *   - *index_type_id* - type ID of the type describing array index;
1894  *   - *elem_type_id* - type ID of the type describing array element;
1895  *   - *nr_elems* - the size of the array;
1896  * Returns:
1897  *   - >0, type ID of newly added BTF type;
1898  *   - <0, on error.
1899  */
1900 int btf__add_array(struct btf *btf, int index_type_id, int elem_type_id, __u32 nr_elems)
1901 {
1902 	struct btf_type *t;
1903 	struct btf_array *a;
1904 	int sz;
1905 
1906 	if (validate_type_id(index_type_id) || validate_type_id(elem_type_id))
1907 		return libbpf_err(-EINVAL);
1908 
1909 	if (btf_ensure_modifiable(btf))
1910 		return libbpf_err(-ENOMEM);
1911 
1912 	sz = sizeof(struct btf_type) + sizeof(struct btf_array);
1913 	t = btf_add_type_mem(btf, sz);
1914 	if (!t)
1915 		return libbpf_err(-ENOMEM);
1916 
1917 	t->name_off = 0;
1918 	t->info = btf_type_info(BTF_KIND_ARRAY, 0, 0);
1919 	t->size = 0;
1920 
1921 	a = btf_array(t);
1922 	a->type = elem_type_id;
1923 	a->index_type = index_type_id;
1924 	a->nelems = nr_elems;
1925 
1926 	return btf_commit_type(btf, sz);
1927 }
1928 
1929 /* generic STRUCT/UNION append function */
1930 static int btf_add_composite(struct btf *btf, int kind, const char *name, __u32 bytes_sz)
1931 {
1932 	struct btf_type *t;
1933 	int sz, name_off = 0;
1934 
1935 	if (btf_ensure_modifiable(btf))
1936 		return libbpf_err(-ENOMEM);
1937 
1938 	sz = sizeof(struct btf_type);
1939 	t = btf_add_type_mem(btf, sz);
1940 	if (!t)
1941 		return libbpf_err(-ENOMEM);
1942 
1943 	if (name && name[0]) {
1944 		name_off = btf__add_str(btf, name);
1945 		if (name_off < 0)
1946 			return name_off;
1947 	}
1948 
1949 	/* start out with vlen=0 and no kflag; this will be adjusted when
1950 	 * adding each member
1951 	 */
1952 	t->name_off = name_off;
1953 	t->info = btf_type_info(kind, 0, 0);
1954 	t->size = bytes_sz;
1955 
1956 	return btf_commit_type(btf, sz);
1957 }
1958 
1959 /*
1960  * Append new BTF_KIND_STRUCT type with:
1961  *   - *name* - name of the struct, can be NULL or empty for anonymous structs;
1962  *   - *byte_sz* - size of the struct, in bytes;
1963  *
1964  * Struct initially has no fields in it. Fields can be added by
1965  * btf__add_field() right after btf__add_struct() succeeds.
1966  *
1967  * Returns:
1968  *   - >0, type ID of newly added BTF type;
1969  *   - <0, on error.
1970  */
1971 int btf__add_struct(struct btf *btf, const char *name, __u32 byte_sz)
1972 {
1973 	return btf_add_composite(btf, BTF_KIND_STRUCT, name, byte_sz);
1974 }
1975 
1976 /*
1977  * Append new BTF_KIND_UNION type with:
1978  *   - *name* - name of the union, can be NULL or empty for anonymous union;
1979  *   - *byte_sz* - size of the union, in bytes;
1980  *
1981  * Union initially has no fields in it. Fields can be added by
1982  * btf__add_field() right after btf__add_union() succeeds. All fields
1983  * should have *bit_offset* of 0.
1984  *
1985  * Returns:
1986  *   - >0, type ID of newly added BTF type;
1987  *   - <0, on error.
1988  */
1989 int btf__add_union(struct btf *btf, const char *name, __u32 byte_sz)
1990 {
1991 	return btf_add_composite(btf, BTF_KIND_UNION, name, byte_sz);
1992 }
1993 
1994 static struct btf_type *btf_last_type(struct btf *btf)
1995 {
1996 	return btf_type_by_id(btf, btf__type_cnt(btf) - 1);
1997 }
1998 
1999 /*
2000  * Append new field for the current STRUCT/UNION type with:
2001  *   - *name* - name of the field, can be NULL or empty for anonymous field;
2002  *   - *type_id* - type ID for the type describing field type;
2003  *   - *bit_offset* - bit offset of the start of the field within struct/union;
2004  *   - *bit_size* - bit size of a bitfield, 0 for non-bitfield fields;
2005  * Returns:
2006  *   -  0, on success;
2007  *   - <0, on error.
2008  */
2009 int btf__add_field(struct btf *btf, const char *name, int type_id,
2010 		   __u32 bit_offset, __u32 bit_size)
2011 {
2012 	struct btf_type *t;
2013 	struct btf_member *m;
2014 	bool is_bitfield;
2015 	int sz, name_off = 0;
2016 
2017 	/* last type should be union/struct */
2018 	if (btf->nr_types == 0)
2019 		return libbpf_err(-EINVAL);
2020 	t = btf_last_type(btf);
2021 	if (!btf_is_composite(t))
2022 		return libbpf_err(-EINVAL);
2023 
2024 	if (validate_type_id(type_id))
2025 		return libbpf_err(-EINVAL);
2026 	/* best-effort bit field offset/size enforcement */
2027 	is_bitfield = bit_size || (bit_offset % 8 != 0);
2028 	if (is_bitfield && (bit_size == 0 || bit_size > 255 || bit_offset > 0xffffff))
2029 		return libbpf_err(-EINVAL);
2030 
2031 	/* only offset 0 is allowed for unions */
2032 	if (btf_is_union(t) && bit_offset)
2033 		return libbpf_err(-EINVAL);
2034 
2035 	/* decompose and invalidate raw data */
2036 	if (btf_ensure_modifiable(btf))
2037 		return libbpf_err(-ENOMEM);
2038 
2039 	sz = sizeof(struct btf_member);
2040 	m = btf_add_type_mem(btf, sz);
2041 	if (!m)
2042 		return libbpf_err(-ENOMEM);
2043 
2044 	if (name && name[0]) {
2045 		name_off = btf__add_str(btf, name);
2046 		if (name_off < 0)
2047 			return name_off;
2048 	}
2049 
2050 	m->name_off = name_off;
2051 	m->type = type_id;
2052 	m->offset = bit_offset | (bit_size << 24);
2053 
2054 	/* btf_add_type_mem can invalidate t pointer */
2055 	t = btf_last_type(btf);
2056 	/* update parent type's vlen and kflag */
2057 	t->info = btf_type_info(btf_kind(t), btf_vlen(t) + 1, is_bitfield || btf_kflag(t));
2058 
2059 	btf->hdr->type_len += sz;
2060 	btf->hdr->str_off += sz;
2061 	return 0;
2062 }
2063 
2064 static int btf_add_enum_common(struct btf *btf, const char *name, __u32 byte_sz,
2065 			       bool is_signed, __u8 kind)
2066 {
2067 	struct btf_type *t;
2068 	int sz, name_off = 0;
2069 
2070 	/* byte_sz must be power of 2 */
2071 	if (!byte_sz || (byte_sz & (byte_sz - 1)) || byte_sz > 8)
2072 		return libbpf_err(-EINVAL);
2073 
2074 	if (btf_ensure_modifiable(btf))
2075 		return libbpf_err(-ENOMEM);
2076 
2077 	sz = sizeof(struct btf_type);
2078 	t = btf_add_type_mem(btf, sz);
2079 	if (!t)
2080 		return libbpf_err(-ENOMEM);
2081 
2082 	if (name && name[0]) {
2083 		name_off = btf__add_str(btf, name);
2084 		if (name_off < 0)
2085 			return name_off;
2086 	}
2087 
2088 	/* start out with vlen=0; it will be adjusted when adding enum values */
2089 	t->name_off = name_off;
2090 	t->info = btf_type_info(kind, 0, is_signed);
2091 	t->size = byte_sz;
2092 
2093 	return btf_commit_type(btf, sz);
2094 }
2095 
2096 /*
2097  * Append new BTF_KIND_ENUM type with:
2098  *   - *name* - name of the enum, can be NULL or empty for anonymous enums;
2099  *   - *byte_sz* - size of the enum, in bytes.
2100  *
2101  * Enum initially has no enum values in it (and corresponds to enum forward
2102  * declaration). Enumerator values can be added by btf__add_enum_value()
2103  * immediately after btf__add_enum() succeeds.
2104  *
2105  * Returns:
2106  *   - >0, type ID of newly added BTF type;
2107  *   - <0, on error.
2108  */
2109 int btf__add_enum(struct btf *btf, const char *name, __u32 byte_sz)
2110 {
2111 	/*
2112 	 * set the signedness to be unsigned, it will change to signed
2113 	 * if any later enumerator is negative.
2114 	 */
2115 	return btf_add_enum_common(btf, name, byte_sz, false, BTF_KIND_ENUM);
2116 }
2117 
2118 /*
2119  * Append new enum value for the current ENUM type with:
2120  *   - *name* - name of the enumerator value, can't be NULL or empty;
2121  *   - *value* - integer value corresponding to enum value *name*;
2122  * Returns:
2123  *   -  0, on success;
2124  *   - <0, on error.
2125  */
2126 int btf__add_enum_value(struct btf *btf, const char *name, __s64 value)
2127 {
2128 	struct btf_type *t;
2129 	struct btf_enum *v;
2130 	int sz, name_off;
2131 
2132 	/* last type should be BTF_KIND_ENUM */
2133 	if (btf->nr_types == 0)
2134 		return libbpf_err(-EINVAL);
2135 	t = btf_last_type(btf);
2136 	if (!btf_is_enum(t))
2137 		return libbpf_err(-EINVAL);
2138 
2139 	/* non-empty name */
2140 	if (!name || !name[0])
2141 		return libbpf_err(-EINVAL);
2142 	if (value < INT_MIN || value > UINT_MAX)
2143 		return libbpf_err(-E2BIG);
2144 
2145 	/* decompose and invalidate raw data */
2146 	if (btf_ensure_modifiable(btf))
2147 		return libbpf_err(-ENOMEM);
2148 
2149 	sz = sizeof(struct btf_enum);
2150 	v = btf_add_type_mem(btf, sz);
2151 	if (!v)
2152 		return libbpf_err(-ENOMEM);
2153 
2154 	name_off = btf__add_str(btf, name);
2155 	if (name_off < 0)
2156 		return name_off;
2157 
2158 	v->name_off = name_off;
2159 	v->val = value;
2160 
2161 	/* update parent type's vlen */
2162 	t = btf_last_type(btf);
2163 	btf_type_inc_vlen(t);
2164 
2165 	/* if negative value, set signedness to signed */
2166 	if (value < 0)
2167 		t->info = btf_type_info(btf_kind(t), btf_vlen(t), true);
2168 
2169 	btf->hdr->type_len += sz;
2170 	btf->hdr->str_off += sz;
2171 	return 0;
2172 }
2173 
2174 /*
2175  * Append new BTF_KIND_ENUM64 type with:
2176  *   - *name* - name of the enum, can be NULL or empty for anonymous enums;
2177  *   - *byte_sz* - size of the enum, in bytes.
2178  *   - *is_signed* - whether the enum values are signed or not;
2179  *
2180  * Enum initially has no enum values in it (and corresponds to enum forward
2181  * declaration). Enumerator values can be added by btf__add_enum64_value()
2182  * immediately after btf__add_enum64() succeeds.
2183  *
2184  * Returns:
2185  *   - >0, type ID of newly added BTF type;
2186  *   - <0, on error.
2187  */
2188 int btf__add_enum64(struct btf *btf, const char *name, __u32 byte_sz,
2189 		    bool is_signed)
2190 {
2191 	return btf_add_enum_common(btf, name, byte_sz, is_signed,
2192 				   BTF_KIND_ENUM64);
2193 }
2194 
2195 /*
2196  * Append new enum value for the current ENUM64 type with:
2197  *   - *name* - name of the enumerator value, can't be NULL or empty;
2198  *   - *value* - integer value corresponding to enum value *name*;
2199  * Returns:
2200  *   -  0, on success;
2201  *   - <0, on error.
2202  */
2203 int btf__add_enum64_value(struct btf *btf, const char *name, __u64 value)
2204 {
2205 	struct btf_enum64 *v;
2206 	struct btf_type *t;
2207 	int sz, name_off;
2208 
2209 	/* last type should be BTF_KIND_ENUM64 */
2210 	if (btf->nr_types == 0)
2211 		return libbpf_err(-EINVAL);
2212 	t = btf_last_type(btf);
2213 	if (!btf_is_enum64(t))
2214 		return libbpf_err(-EINVAL);
2215 
2216 	/* non-empty name */
2217 	if (!name || !name[0])
2218 		return libbpf_err(-EINVAL);
2219 
2220 	/* decompose and invalidate raw data */
2221 	if (btf_ensure_modifiable(btf))
2222 		return libbpf_err(-ENOMEM);
2223 
2224 	sz = sizeof(struct btf_enum64);
2225 	v = btf_add_type_mem(btf, sz);
2226 	if (!v)
2227 		return libbpf_err(-ENOMEM);
2228 
2229 	name_off = btf__add_str(btf, name);
2230 	if (name_off < 0)
2231 		return name_off;
2232 
2233 	v->name_off = name_off;
2234 	v->val_lo32 = (__u32)value;
2235 	v->val_hi32 = value >> 32;
2236 
2237 	/* update parent type's vlen */
2238 	t = btf_last_type(btf);
2239 	btf_type_inc_vlen(t);
2240 
2241 	btf->hdr->type_len += sz;
2242 	btf->hdr->str_off += sz;
2243 	return 0;
2244 }
2245 
2246 /*
2247  * Append new BTF_KIND_FWD type with:
2248  *   - *name*, non-empty/non-NULL name;
2249  *   - *fwd_kind*, kind of forward declaration, one of BTF_FWD_STRUCT,
2250  *     BTF_FWD_UNION, or BTF_FWD_ENUM;
2251  * Returns:
2252  *   - >0, type ID of newly added BTF type;
2253  *   - <0, on error.
2254  */
2255 int btf__add_fwd(struct btf *btf, const char *name, enum btf_fwd_kind fwd_kind)
2256 {
2257 	if (!name || !name[0])
2258 		return libbpf_err(-EINVAL);
2259 
2260 	switch (fwd_kind) {
2261 	case BTF_FWD_STRUCT:
2262 	case BTF_FWD_UNION: {
2263 		struct btf_type *t;
2264 		int id;
2265 
2266 		id = btf_add_ref_kind(btf, BTF_KIND_FWD, name, 0);
2267 		if (id <= 0)
2268 			return id;
2269 		t = btf_type_by_id(btf, id);
2270 		t->info = btf_type_info(BTF_KIND_FWD, 0, fwd_kind == BTF_FWD_UNION);
2271 		return id;
2272 	}
2273 	case BTF_FWD_ENUM:
2274 		/* enum forward in BTF currently is just an enum with no enum
2275 		 * values; we also assume a standard 4-byte size for it
2276 		 */
2277 		return btf__add_enum(btf, name, sizeof(int));
2278 	default:
2279 		return libbpf_err(-EINVAL);
2280 	}
2281 }
2282 
2283 /*
2284  * Append new BTF_KING_TYPEDEF type with:
2285  *   - *name*, non-empty/non-NULL name;
2286  *   - *ref_type_id* - referenced type ID, it might not exist yet;
2287  * Returns:
2288  *   - >0, type ID of newly added BTF type;
2289  *   - <0, on error.
2290  */
2291 int btf__add_typedef(struct btf *btf, const char *name, int ref_type_id)
2292 {
2293 	if (!name || !name[0])
2294 		return libbpf_err(-EINVAL);
2295 
2296 	return btf_add_ref_kind(btf, BTF_KIND_TYPEDEF, name, ref_type_id);
2297 }
2298 
2299 /*
2300  * Append new BTF_KIND_VOLATILE type with:
2301  *   - *ref_type_id* - referenced type ID, it might not exist yet;
2302  * Returns:
2303  *   - >0, type ID of newly added BTF type;
2304  *   - <0, on error.
2305  */
2306 int btf__add_volatile(struct btf *btf, int ref_type_id)
2307 {
2308 	return btf_add_ref_kind(btf, BTF_KIND_VOLATILE, NULL, ref_type_id);
2309 }
2310 
2311 /*
2312  * Append new BTF_KIND_CONST type with:
2313  *   - *ref_type_id* - referenced type ID, it might not exist yet;
2314  * Returns:
2315  *   - >0, type ID of newly added BTF type;
2316  *   - <0, on error.
2317  */
2318 int btf__add_const(struct btf *btf, int ref_type_id)
2319 {
2320 	return btf_add_ref_kind(btf, BTF_KIND_CONST, NULL, ref_type_id);
2321 }
2322 
2323 /*
2324  * Append new BTF_KIND_RESTRICT type with:
2325  *   - *ref_type_id* - referenced type ID, it might not exist yet;
2326  * Returns:
2327  *   - >0, type ID of newly added BTF type;
2328  *   - <0, on error.
2329  */
2330 int btf__add_restrict(struct btf *btf, int ref_type_id)
2331 {
2332 	return btf_add_ref_kind(btf, BTF_KIND_RESTRICT, NULL, ref_type_id);
2333 }
2334 
2335 /*
2336  * Append new BTF_KIND_TYPE_TAG type with:
2337  *   - *value*, non-empty/non-NULL tag value;
2338  *   - *ref_type_id* - referenced type ID, it might not exist yet;
2339  * Returns:
2340  *   - >0, type ID of newly added BTF type;
2341  *   - <0, on error.
2342  */
2343 int btf__add_type_tag(struct btf *btf, const char *value, int ref_type_id)
2344 {
2345 	if (!value || !value[0])
2346 		return libbpf_err(-EINVAL);
2347 
2348 	return btf_add_ref_kind(btf, BTF_KIND_TYPE_TAG, value, ref_type_id);
2349 }
2350 
2351 /*
2352  * Append new BTF_KIND_FUNC type with:
2353  *   - *name*, non-empty/non-NULL name;
2354  *   - *proto_type_id* - FUNC_PROTO's type ID, it might not exist yet;
2355  * Returns:
2356  *   - >0, type ID of newly added BTF type;
2357  *   - <0, on error.
2358  */
2359 int btf__add_func(struct btf *btf, const char *name,
2360 		  enum btf_func_linkage linkage, int proto_type_id)
2361 {
2362 	int id;
2363 
2364 	if (!name || !name[0])
2365 		return libbpf_err(-EINVAL);
2366 	if (linkage != BTF_FUNC_STATIC && linkage != BTF_FUNC_GLOBAL &&
2367 	    linkage != BTF_FUNC_EXTERN)
2368 		return libbpf_err(-EINVAL);
2369 
2370 	id = btf_add_ref_kind(btf, BTF_KIND_FUNC, name, proto_type_id);
2371 	if (id > 0) {
2372 		struct btf_type *t = btf_type_by_id(btf, id);
2373 
2374 		t->info = btf_type_info(BTF_KIND_FUNC, linkage, 0);
2375 	}
2376 	return libbpf_err(id);
2377 }
2378 
2379 /*
2380  * Append new BTF_KIND_FUNC_PROTO with:
2381  *   - *ret_type_id* - type ID for return result of a function.
2382  *
2383  * Function prototype initially has no arguments, but they can be added by
2384  * btf__add_func_param() one by one, immediately after
2385  * btf__add_func_proto() succeeded.
2386  *
2387  * Returns:
2388  *   - >0, type ID of newly added BTF type;
2389  *   - <0, on error.
2390  */
2391 int btf__add_func_proto(struct btf *btf, int ret_type_id)
2392 {
2393 	struct btf_type *t;
2394 	int sz;
2395 
2396 	if (validate_type_id(ret_type_id))
2397 		return libbpf_err(-EINVAL);
2398 
2399 	if (btf_ensure_modifiable(btf))
2400 		return libbpf_err(-ENOMEM);
2401 
2402 	sz = sizeof(struct btf_type);
2403 	t = btf_add_type_mem(btf, sz);
2404 	if (!t)
2405 		return libbpf_err(-ENOMEM);
2406 
2407 	/* start out with vlen=0; this will be adjusted when adding enum
2408 	 * values, if necessary
2409 	 */
2410 	t->name_off = 0;
2411 	t->info = btf_type_info(BTF_KIND_FUNC_PROTO, 0, 0);
2412 	t->type = ret_type_id;
2413 
2414 	return btf_commit_type(btf, sz);
2415 }
2416 
2417 /*
2418  * Append new function parameter for current FUNC_PROTO type with:
2419  *   - *name* - parameter name, can be NULL or empty;
2420  *   - *type_id* - type ID describing the type of the parameter.
2421  * Returns:
2422  *   -  0, on success;
2423  *   - <0, on error.
2424  */
2425 int btf__add_func_param(struct btf *btf, const char *name, int type_id)
2426 {
2427 	struct btf_type *t;
2428 	struct btf_param *p;
2429 	int sz, name_off = 0;
2430 
2431 	if (validate_type_id(type_id))
2432 		return libbpf_err(-EINVAL);
2433 
2434 	/* last type should be BTF_KIND_FUNC_PROTO */
2435 	if (btf->nr_types == 0)
2436 		return libbpf_err(-EINVAL);
2437 	t = btf_last_type(btf);
2438 	if (!btf_is_func_proto(t))
2439 		return libbpf_err(-EINVAL);
2440 
2441 	/* decompose and invalidate raw data */
2442 	if (btf_ensure_modifiable(btf))
2443 		return libbpf_err(-ENOMEM);
2444 
2445 	sz = sizeof(struct btf_param);
2446 	p = btf_add_type_mem(btf, sz);
2447 	if (!p)
2448 		return libbpf_err(-ENOMEM);
2449 
2450 	if (name && name[0]) {
2451 		name_off = btf__add_str(btf, name);
2452 		if (name_off < 0)
2453 			return name_off;
2454 	}
2455 
2456 	p->name_off = name_off;
2457 	p->type = type_id;
2458 
2459 	/* update parent type's vlen */
2460 	t = btf_last_type(btf);
2461 	btf_type_inc_vlen(t);
2462 
2463 	btf->hdr->type_len += sz;
2464 	btf->hdr->str_off += sz;
2465 	return 0;
2466 }
2467 
2468 /*
2469  * Append new BTF_KIND_VAR type with:
2470  *   - *name* - non-empty/non-NULL name;
2471  *   - *linkage* - variable linkage, one of BTF_VAR_STATIC,
2472  *     BTF_VAR_GLOBAL_ALLOCATED, or BTF_VAR_GLOBAL_EXTERN;
2473  *   - *type_id* - type ID of the type describing the type of the variable.
2474  * Returns:
2475  *   - >0, type ID of newly added BTF type;
2476  *   - <0, on error.
2477  */
2478 int btf__add_var(struct btf *btf, const char *name, int linkage, int type_id)
2479 {
2480 	struct btf_type *t;
2481 	struct btf_var *v;
2482 	int sz, name_off;
2483 
2484 	/* non-empty name */
2485 	if (!name || !name[0])
2486 		return libbpf_err(-EINVAL);
2487 	if (linkage != BTF_VAR_STATIC && linkage != BTF_VAR_GLOBAL_ALLOCATED &&
2488 	    linkage != BTF_VAR_GLOBAL_EXTERN)
2489 		return libbpf_err(-EINVAL);
2490 	if (validate_type_id(type_id))
2491 		return libbpf_err(-EINVAL);
2492 
2493 	/* deconstruct BTF, if necessary, and invalidate raw_data */
2494 	if (btf_ensure_modifiable(btf))
2495 		return libbpf_err(-ENOMEM);
2496 
2497 	sz = sizeof(struct btf_type) + sizeof(struct btf_var);
2498 	t = btf_add_type_mem(btf, sz);
2499 	if (!t)
2500 		return libbpf_err(-ENOMEM);
2501 
2502 	name_off = btf__add_str(btf, name);
2503 	if (name_off < 0)
2504 		return name_off;
2505 
2506 	t->name_off = name_off;
2507 	t->info = btf_type_info(BTF_KIND_VAR, 0, 0);
2508 	t->type = type_id;
2509 
2510 	v = btf_var(t);
2511 	v->linkage = linkage;
2512 
2513 	return btf_commit_type(btf, sz);
2514 }
2515 
2516 /*
2517  * Append new BTF_KIND_DATASEC type with:
2518  *   - *name* - non-empty/non-NULL name;
2519  *   - *byte_sz* - data section size, in bytes.
2520  *
2521  * Data section is initially empty. Variables info can be added with
2522  * btf__add_datasec_var_info() calls, after btf__add_datasec() succeeds.
2523  *
2524  * Returns:
2525  *   - >0, type ID of newly added BTF type;
2526  *   - <0, on error.
2527  */
2528 int btf__add_datasec(struct btf *btf, const char *name, __u32 byte_sz)
2529 {
2530 	struct btf_type *t;
2531 	int sz, name_off;
2532 
2533 	/* non-empty name */
2534 	if (!name || !name[0])
2535 		return libbpf_err(-EINVAL);
2536 
2537 	if (btf_ensure_modifiable(btf))
2538 		return libbpf_err(-ENOMEM);
2539 
2540 	sz = sizeof(struct btf_type);
2541 	t = btf_add_type_mem(btf, sz);
2542 	if (!t)
2543 		return libbpf_err(-ENOMEM);
2544 
2545 	name_off = btf__add_str(btf, name);
2546 	if (name_off < 0)
2547 		return name_off;
2548 
2549 	/* start with vlen=0, which will be update as var_secinfos are added */
2550 	t->name_off = name_off;
2551 	t->info = btf_type_info(BTF_KIND_DATASEC, 0, 0);
2552 	t->size = byte_sz;
2553 
2554 	return btf_commit_type(btf, sz);
2555 }
2556 
2557 /*
2558  * Append new data section variable information entry for current DATASEC type:
2559  *   - *var_type_id* - type ID, describing type of the variable;
2560  *   - *offset* - variable offset within data section, in bytes;
2561  *   - *byte_sz* - variable size, in bytes.
2562  *
2563  * Returns:
2564  *   -  0, on success;
2565  *   - <0, on error.
2566  */
2567 int btf__add_datasec_var_info(struct btf *btf, int var_type_id, __u32 offset, __u32 byte_sz)
2568 {
2569 	struct btf_type *t;
2570 	struct btf_var_secinfo *v;
2571 	int sz;
2572 
2573 	/* last type should be BTF_KIND_DATASEC */
2574 	if (btf->nr_types == 0)
2575 		return libbpf_err(-EINVAL);
2576 	t = btf_last_type(btf);
2577 	if (!btf_is_datasec(t))
2578 		return libbpf_err(-EINVAL);
2579 
2580 	if (validate_type_id(var_type_id))
2581 		return libbpf_err(-EINVAL);
2582 
2583 	/* decompose and invalidate raw data */
2584 	if (btf_ensure_modifiable(btf))
2585 		return libbpf_err(-ENOMEM);
2586 
2587 	sz = sizeof(struct btf_var_secinfo);
2588 	v = btf_add_type_mem(btf, sz);
2589 	if (!v)
2590 		return libbpf_err(-ENOMEM);
2591 
2592 	v->type = var_type_id;
2593 	v->offset = offset;
2594 	v->size = byte_sz;
2595 
2596 	/* update parent type's vlen */
2597 	t = btf_last_type(btf);
2598 	btf_type_inc_vlen(t);
2599 
2600 	btf->hdr->type_len += sz;
2601 	btf->hdr->str_off += sz;
2602 	return 0;
2603 }
2604 
2605 /*
2606  * Append new BTF_KIND_DECL_TAG type with:
2607  *   - *value* - non-empty/non-NULL string;
2608  *   - *ref_type_id* - referenced type ID, it might not exist yet;
2609  *   - *component_idx* - -1 for tagging reference type, otherwise struct/union
2610  *     member or function argument index;
2611  * Returns:
2612  *   - >0, type ID of newly added BTF type;
2613  *   - <0, on error.
2614  */
2615 int btf__add_decl_tag(struct btf *btf, const char *value, int ref_type_id,
2616 		 int component_idx)
2617 {
2618 	struct btf_type *t;
2619 	int sz, value_off;
2620 
2621 	if (!value || !value[0] || component_idx < -1)
2622 		return libbpf_err(-EINVAL);
2623 
2624 	if (validate_type_id(ref_type_id))
2625 		return libbpf_err(-EINVAL);
2626 
2627 	if (btf_ensure_modifiable(btf))
2628 		return libbpf_err(-ENOMEM);
2629 
2630 	sz = sizeof(struct btf_type) + sizeof(struct btf_decl_tag);
2631 	t = btf_add_type_mem(btf, sz);
2632 	if (!t)
2633 		return libbpf_err(-ENOMEM);
2634 
2635 	value_off = btf__add_str(btf, value);
2636 	if (value_off < 0)
2637 		return value_off;
2638 
2639 	t->name_off = value_off;
2640 	t->info = btf_type_info(BTF_KIND_DECL_TAG, 0, false);
2641 	t->type = ref_type_id;
2642 	btf_decl_tag(t)->component_idx = component_idx;
2643 
2644 	return btf_commit_type(btf, sz);
2645 }
2646 
/* Describes one .BTF.ext info section to be validated by btf_ext_setup_info() */
struct btf_ext_sec_setup_param {
	/* section offset, in bytes, counted from the end of the .BTF.ext header */
	__u32 off;
	/* section length, in bytes; btf_ext_setup_info() skips zero-length sections */
	__u32 len;
	/* smallest per-record size that is accepted for this section */
	__u32 min_rec_size;
	/* filled in by btf_ext_setup_info() once the section passed validation */
	struct btf_ext_info *ext_info;
	/* section name, used in debug messages only */
	const char *desc;
};
2654 
2655 static int btf_ext_setup_info(struct btf_ext *btf_ext,
2656 			      struct btf_ext_sec_setup_param *ext_sec)
2657 {
2658 	const struct btf_ext_info_sec *sinfo;
2659 	struct btf_ext_info *ext_info;
2660 	__u32 info_left, record_size;
2661 	size_t sec_cnt = 0;
2662 	/* The start of the info sec (including the __u32 record_size). */
2663 	void *info;
2664 
2665 	if (ext_sec->len == 0)
2666 		return 0;
2667 
2668 	if (ext_sec->off & 0x03) {
2669 		pr_debug(".BTF.ext %s section is not aligned to 4 bytes\n",
2670 		     ext_sec->desc);
2671 		return -EINVAL;
2672 	}
2673 
2674 	info = btf_ext->data + btf_ext->hdr->hdr_len + ext_sec->off;
2675 	info_left = ext_sec->len;
2676 
2677 	if (btf_ext->data + btf_ext->data_size < info + ext_sec->len) {
2678 		pr_debug("%s section (off:%u len:%u) is beyond the end of the ELF section .BTF.ext\n",
2679 			 ext_sec->desc, ext_sec->off, ext_sec->len);
2680 		return -EINVAL;
2681 	}
2682 
2683 	/* At least a record size */
2684 	if (info_left < sizeof(__u32)) {
2685 		pr_debug(".BTF.ext %s record size not found\n", ext_sec->desc);
2686 		return -EINVAL;
2687 	}
2688 
2689 	/* The record size needs to meet the minimum standard */
2690 	record_size = *(__u32 *)info;
2691 	if (record_size < ext_sec->min_rec_size ||
2692 	    record_size & 0x03) {
2693 		pr_debug("%s section in .BTF.ext has invalid record size %u\n",
2694 			 ext_sec->desc, record_size);
2695 		return -EINVAL;
2696 	}
2697 
2698 	sinfo = info + sizeof(__u32);
2699 	info_left -= sizeof(__u32);
2700 
2701 	/* If no records, return failure now so .BTF.ext won't be used. */
2702 	if (!info_left) {
2703 		pr_debug("%s section in .BTF.ext has no records", ext_sec->desc);
2704 		return -EINVAL;
2705 	}
2706 
2707 	while (info_left) {
2708 		unsigned int sec_hdrlen = sizeof(struct btf_ext_info_sec);
2709 		__u64 total_record_size;
2710 		__u32 num_records;
2711 
2712 		if (info_left < sec_hdrlen) {
2713 			pr_debug("%s section header is not found in .BTF.ext\n",
2714 			     ext_sec->desc);
2715 			return -EINVAL;
2716 		}
2717 
2718 		num_records = sinfo->num_info;
2719 		if (num_records == 0) {
2720 			pr_debug("%s section has incorrect num_records in .BTF.ext\n",
2721 			     ext_sec->desc);
2722 			return -EINVAL;
2723 		}
2724 
2725 		total_record_size = sec_hdrlen + (__u64)num_records * record_size;
2726 		if (info_left < total_record_size) {
2727 			pr_debug("%s section has incorrect num_records in .BTF.ext\n",
2728 			     ext_sec->desc);
2729 			return -EINVAL;
2730 		}
2731 
2732 		info_left -= total_record_size;
2733 		sinfo = (void *)sinfo + total_record_size;
2734 		sec_cnt++;
2735 	}
2736 
2737 	ext_info = ext_sec->ext_info;
2738 	ext_info->len = ext_sec->len - sizeof(__u32);
2739 	ext_info->rec_size = record_size;
2740 	ext_info->info = info + sizeof(__u32);
2741 	ext_info->sec_cnt = sec_cnt;
2742 
2743 	return 0;
2744 }
2745 
2746 static int btf_ext_setup_func_info(struct btf_ext *btf_ext)
2747 {
2748 	struct btf_ext_sec_setup_param param = {
2749 		.off = btf_ext->hdr->func_info_off,
2750 		.len = btf_ext->hdr->func_info_len,
2751 		.min_rec_size = sizeof(struct bpf_func_info_min),
2752 		.ext_info = &btf_ext->func_info,
2753 		.desc = "func_info"
2754 	};
2755 
2756 	return btf_ext_setup_info(btf_ext, &param);
2757 }
2758 
2759 static int btf_ext_setup_line_info(struct btf_ext *btf_ext)
2760 {
2761 	struct btf_ext_sec_setup_param param = {
2762 		.off = btf_ext->hdr->line_info_off,
2763 		.len = btf_ext->hdr->line_info_len,
2764 		.min_rec_size = sizeof(struct bpf_line_info_min),
2765 		.ext_info = &btf_ext->line_info,
2766 		.desc = "line_info",
2767 	};
2768 
2769 	return btf_ext_setup_info(btf_ext, &param);
2770 }
2771 
2772 static int btf_ext_setup_core_relos(struct btf_ext *btf_ext)
2773 {
2774 	struct btf_ext_sec_setup_param param = {
2775 		.off = btf_ext->hdr->core_relo_off,
2776 		.len = btf_ext->hdr->core_relo_len,
2777 		.min_rec_size = sizeof(struct bpf_core_relo),
2778 		.ext_info = &btf_ext->core_relo_info,
2779 		.desc = "core_relo",
2780 	};
2781 
2782 	return btf_ext_setup_info(btf_ext, &param);
2783 }
2784 
2785 static int btf_ext_parse_hdr(__u8 *data, __u32 data_size)
2786 {
2787 	const struct btf_ext_header *hdr = (struct btf_ext_header *)data;
2788 
2789 	if (data_size < offsetofend(struct btf_ext_header, hdr_len) ||
2790 	    data_size < hdr->hdr_len) {
2791 		pr_debug("BTF.ext header not found");
2792 		return -EINVAL;
2793 	}
2794 
2795 	if (hdr->magic == bswap_16(BTF_MAGIC)) {
2796 		pr_warn("BTF.ext in non-native endianness is not supported\n");
2797 		return -ENOTSUP;
2798 	} else if (hdr->magic != BTF_MAGIC) {
2799 		pr_debug("Invalid BTF.ext magic:%x\n", hdr->magic);
2800 		return -EINVAL;
2801 	}
2802 
2803 	if (hdr->version != BTF_VERSION) {
2804 		pr_debug("Unsupported BTF.ext version:%u\n", hdr->version);
2805 		return -ENOTSUP;
2806 	}
2807 
2808 	if (hdr->flags) {
2809 		pr_debug("Unsupported BTF.ext flags:%x\n", hdr->flags);
2810 		return -ENOTSUP;
2811 	}
2812 
2813 	if (data_size == hdr->hdr_len) {
2814 		pr_debug("BTF.ext has no data\n");
2815 		return -EINVAL;
2816 	}
2817 
2818 	return 0;
2819 }
2820 
2821 void btf_ext__free(struct btf_ext *btf_ext)
2822 {
2823 	if (IS_ERR_OR_NULL(btf_ext))
2824 		return;
2825 	free(btf_ext->func_info.sec_idxs);
2826 	free(btf_ext->line_info.sec_idxs);
2827 	free(btf_ext->core_relo_info.sec_idxs);
2828 	free(btf_ext->data);
2829 	free(btf_ext);
2830 }
2831 
2832 struct btf_ext *btf_ext__new(const __u8 *data, __u32 size)
2833 {
2834 	struct btf_ext *btf_ext;
2835 	int err;
2836 
2837 	btf_ext = calloc(1, sizeof(struct btf_ext));
2838 	if (!btf_ext)
2839 		return libbpf_err_ptr(-ENOMEM);
2840 
2841 	btf_ext->data_size = size;
2842 	btf_ext->data = malloc(size);
2843 	if (!btf_ext->data) {
2844 		err = -ENOMEM;
2845 		goto done;
2846 	}
2847 	memcpy(btf_ext->data, data, size);
2848 
2849 	err = btf_ext_parse_hdr(btf_ext->data, size);
2850 	if (err)
2851 		goto done;
2852 
2853 	if (btf_ext->hdr->hdr_len < offsetofend(struct btf_ext_header, line_info_len)) {
2854 		err = -EINVAL;
2855 		goto done;
2856 	}
2857 
2858 	err = btf_ext_setup_func_info(btf_ext);
2859 	if (err)
2860 		goto done;
2861 
2862 	err = btf_ext_setup_line_info(btf_ext);
2863 	if (err)
2864 		goto done;
2865 
2866 	if (btf_ext->hdr->hdr_len < offsetofend(struct btf_ext_header, core_relo_len))
2867 		goto done; /* skip core relos parsing */
2868 
2869 	err = btf_ext_setup_core_relos(btf_ext);
2870 	if (err)
2871 		goto done;
2872 
2873 done:
2874 	if (err) {
2875 		btf_ext__free(btf_ext);
2876 		return libbpf_err_ptr(err);
2877 	}
2878 
2879 	return btf_ext;
2880 }
2881 
2882 const void *btf_ext__get_raw_data(const struct btf_ext *btf_ext, __u32 *size)
2883 {
2884 	*size = btf_ext->data_size;
2885 	return btf_ext->data;
2886 }
2887 
/*
 * Forward declarations of the dedup state and of the helpers btf__dedup()
 * relies on: state construction/destruction plus the individual passes.
 */
struct btf_dedup;

static struct btf_dedup *btf_dedup_new(struct btf *btf, const struct btf_dedup_opts *opts);
static void btf_dedup_free(struct btf_dedup *d);
static int btf_dedup_prep(struct btf_dedup *d);
static int btf_dedup_strings(struct btf_dedup *d);
static int btf_dedup_prim_types(struct btf_dedup *d);
static int btf_dedup_struct_types(struct btf_dedup *d);
static int btf_dedup_ref_types(struct btf_dedup *d);
static int btf_dedup_resolve_fwds(struct btf_dedup *d);
static int btf_dedup_compact_types(struct btf_dedup *d);
static int btf_dedup_remap_types(struct btf_dedup *d);
2900 
2901 /*
2902  * Deduplicate BTF types and strings.
2903  *
2904  * BTF dedup algorithm takes as an input `struct btf` representing `.BTF` ELF
2905  * section with all BTF type descriptors and string data. It overwrites that
2906  * memory in-place with deduplicated types and strings without any loss of
2907  * information. If optional `struct btf_ext` representing '.BTF.ext' ELF section
2908  * is provided, all the strings referenced from .BTF.ext section are honored
2909  * and updated to point to the right offsets after deduplication.
2910  *
2911  * If function returns with error, type/string data might be garbled and should
2912  * be discarded.
2913  *
2914  * More verbose and detailed description of both problem btf_dedup is solving,
2915  * as well as solution could be found at:
2916  * https://facebookmicrosites.github.io/bpf/blog/2018/11/14/btf-enhancement.html
2917  *
2918  * Problem description and justification
2919  * =====================================
2920  *
2921  * BTF type information is typically emitted either as a result of conversion
2922  * from DWARF to BTF or directly by compiler. In both cases, each compilation
2923  * unit contains information about a subset of all the types that are used
2924  * in an application. These subsets are frequently overlapping and contain a lot
2925  * of duplicated information when later concatenated together into a single
2926  * binary. This algorithm ensures that each unique type is represented by single
2927  * BTF type descriptor, greatly reducing resulting size of BTF data.
2928  *
2929  * Compilation unit isolation and subsequent duplication of data is not the only
2930  * problem. The same type hierarchy (e.g., struct and all the type that struct
2931  * references) in different compilation units can be represented in BTF to
2932  * various degrees of completeness (or, rather, incompleteness) due to
2933  * struct/union forward declarations.
2934  *
2935  * Let's take a look at an example, that we'll use to better understand the
2936  * problem (and solution). Suppose we have two compilation units, each using
2937  * same `struct S`, but each of them having incomplete type information about
2938  * struct's fields:
2939  *
2940  * // CU #1:
2941  * struct S;
2942  * struct A {
2943  *	int a;
2944  *	struct A* self;
2945  *	struct S* parent;
2946  * };
2947  * struct B;
2948  * struct S {
2949  *	struct A* a_ptr;
2950  *	struct B* b_ptr;
2951  * };
2952  *
2953  * // CU #2:
2954  * struct S;
2955  * struct A;
2956  * struct B {
2957  *	int b;
2958  *	struct B* self;
2959  *	struct S* parent;
2960  * };
2961  * struct S {
2962  *	struct A* a_ptr;
2963  *	struct B* b_ptr;
2964  * };
2965  *
 * In case of CU #1, BTF data will know only that `struct B` exists (but no
 * more), but will know the complete type information about `struct A`. While
 * for CU #2, it will know full type information about `struct B`, but will
 * only know about forward declaration of `struct A` (in BTF terms, it will
 * have `BTF_KIND_FWD` type descriptor with name `A`).
2971  *
2972  * This compilation unit isolation means that it's possible that there is no
2973  * single CU with complete type information describing structs `S`, `A`, and
2974  * `B`. Also, we might get tons of duplicated and redundant type information.
2975  *
2976  * Additional complication we need to keep in mind comes from the fact that
2977  * types, in general, can form graphs containing cycles, not just DAGs.
2978  *
2979  * While algorithm does deduplication, it also merges and resolves type
 * information (unless disabled through `struct btf_dedup_opts`), whenever possible.
2981  * E.g., in the example above with two compilation units having partial type
2982  * information for structs `A` and `B`, the output of algorithm will emit
2983  * a single copy of each BTF type that describes structs `A`, `B`, and `S`
2984  * (as well as type information for `int` and pointers), as if they were defined
2985  * in a single compilation unit as:
2986  *
2987  * struct A {
2988  *	int a;
2989  *	struct A* self;
2990  *	struct S* parent;
2991  * };
2992  * struct B {
2993  *	int b;
2994  *	struct B* self;
2995  *	struct S* parent;
2996  * };
2997  * struct S {
2998  *	struct A* a_ptr;
2999  *	struct B* b_ptr;
3000  * };
3001  *
3002  * Algorithm summary
3003  * =================
3004  *
3005  * Algorithm completes its work in 7 separate passes:
3006  *
3007  * 1. Strings deduplication.
3008  * 2. Primitive types deduplication (int, enum, fwd).
3009  * 3. Struct/union types deduplication.
3010  * 4. Resolve unambiguous forward declarations.
3011  * 5. Reference types deduplication (pointers, typedefs, arrays, funcs, func
3012  *    protos, and const/volatile/restrict modifiers).
3013  * 6. Types compaction.
3014  * 7. Types remapping.
3015  *
3016  * Algorithm determines canonical type descriptor, which is a single
3017  * representative type for each truly unique type. This canonical type is the
3018  * one that will go into final deduplicated BTF type information. For
3019  * struct/unions, it is also the type that algorithm will merge additional type
3020  * information into (while resolving FWDs), as it discovers it from data in
3021  * other CUs. Each input BTF type eventually gets either mapped to itself, if
3022  * that type is canonical, or to some other type, if that type is equivalent
3023  * and was chosen as canonical representative. This mapping is stored in
3024  * `btf_dedup->map` array. This map is also used to record STRUCT/UNION that
3025  * FWD type got resolved to.
3026  *
3027  * To facilitate fast discovery of canonical types, we also maintain canonical
3028  * index (`btf_dedup->dedup_table`), which maps type descriptor's signature hash
3029  * (i.e., hashed kind, name, size, fields, etc) into a list of canonical types
3030  * that match that signature. With sufficiently good choice of type signature
3031  * hashing function, we can limit number of canonical types for each unique type
3032  * signature to a very small number, allowing to find canonical type for any
3033  * duplicated type very quickly.
3034  *
3035  * Struct/union deduplication is the most critical part and algorithm for
3036  * deduplicating structs/unions is described in greater details in comments for
3037  * `btf_dedup_is_equiv` function.
3038  */
3039 int btf__dedup(struct btf *btf, const struct btf_dedup_opts *opts)
3040 {
3041 	struct btf_dedup *d;
3042 	int err;
3043 
3044 	if (!OPTS_VALID(opts, btf_dedup_opts))
3045 		return libbpf_err(-EINVAL);
3046 
3047 	d = btf_dedup_new(btf, opts);
3048 	if (IS_ERR(d)) {
3049 		pr_debug("btf_dedup_new failed: %ld", PTR_ERR(d));
3050 		return libbpf_err(-EINVAL);
3051 	}
3052 
3053 	if (btf_ensure_modifiable(btf)) {
3054 		err = -ENOMEM;
3055 		goto done;
3056 	}
3057 
3058 	err = btf_dedup_prep(d);
3059 	if (err) {
3060 		pr_debug("btf_dedup_prep failed:%d\n", err);
3061 		goto done;
3062 	}
3063 	err = btf_dedup_strings(d);
3064 	if (err < 0) {
3065 		pr_debug("btf_dedup_strings failed:%d\n", err);
3066 		goto done;
3067 	}
3068 	err = btf_dedup_prim_types(d);
3069 	if (err < 0) {
3070 		pr_debug("btf_dedup_prim_types failed:%d\n", err);
3071 		goto done;
3072 	}
3073 	err = btf_dedup_struct_types(d);
3074 	if (err < 0) {
3075 		pr_debug("btf_dedup_struct_types failed:%d\n", err);
3076 		goto done;
3077 	}
3078 	err = btf_dedup_resolve_fwds(d);
3079 	if (err < 0) {
3080 		pr_debug("btf_dedup_resolve_fwds failed:%d\n", err);
3081 		goto done;
3082 	}
3083 	err = btf_dedup_ref_types(d);
3084 	if (err < 0) {
3085 		pr_debug("btf_dedup_ref_types failed:%d\n", err);
3086 		goto done;
3087 	}
3088 	err = btf_dedup_compact_types(d);
3089 	if (err < 0) {
3090 		pr_debug("btf_dedup_compact_types failed:%d\n", err);
3091 		goto done;
3092 	}
3093 	err = btf_dedup_remap_types(d);
3094 	if (err < 0) {
3095 		pr_debug("btf_dedup_remap_types failed:%d\n", err);
3096 		goto done;
3097 	}
3098 
3099 done:
3100 	btf_dedup_free(d);
3101 	return libbpf_err(err);
3102 }
3103 
/* value that btf_dedup_clear_hypot_map() resets hypot_map entries to */
#define BTF_UNPROCESSED_ID ((__u32)-1)
/* NOTE(review): presumably marks a type whose processing has started but not
 * finished yet; its users are outside of the code visible here - confirm
 */
#define BTF_IN_PROGRESS_ID ((__u32)-2)
3106 
/* State shared by all passes of a single btf__dedup() run */
struct btf_dedup {
	/* .BTF section to be deduped in-place */
	struct btf *btf;
	/*
	 * Optional .BTF.ext section. When provided, any strings referenced
	 * from it will be taken into account when deduping strings
	 */
	struct btf_ext *btf_ext;
	/*
	 * This is a map from any type's signature hash to a list of possible
	 * canonical representative type candidates. Hash collisions are
	 * ignored, so even types of various kinds can share same list of
	 * candidates, which is fine because we rely on subsequent
	 * btf_xxx_equal() checks to authoritatively verify type equality.
	 */
	struct hashmap *dedup_table;
	/* Canonical types map */
	__u32 *map;
	/* Hypothetical mapping, used during type graph equivalence checks */
	__u32 *hypot_map;
	/*
	 * IDs that currently have an entry in hypot_map, remembered so that
	 * btf_dedup_clear_hypot_map() can reset just those entries
	 */
	__u32 *hypot_list;
	/* number of IDs stored in hypot_list */
	size_t hypot_cnt;
	/* number of IDs hypot_list has room for */
	size_t hypot_cap;
	/* Whether hypothetical mapping, if successful, would need to adjust
	 * already canonicalized types (due to a new forward declaration to
	 * concrete type resolution). In such case, during split BTF dedup
	 * candidate type would still be considered as different, because base
	 * BTF is considered to be immutable.
	 */
	bool hypot_adjust_canon;
	/* Various option modifying behavior of algorithm */
	struct btf_dedup_opts opts;
	/* temporary strings deduplication state */
	struct strset *strs_set;
};
3142 
/*
 * Mix *value* into running hash *h* and return the new hash, computed as
 * h * 31 + value.
 *
 * The arithmetic is carried out on unsigned long, for which wrap-around is
 * well-defined, because overflow of the signed multiplication would be
 * undefined behavior.
 */
static long hash_combine(long h, long value)
{
	return (long)((unsigned long)h * 31UL + (unsigned long)value);
}
3147 
/*
 * Shorthand for hashmap__for_each_key_entry() over the dedup table of *d*,
 * using *node* as the cursor and *hash* as the key. *d* is parenthesized so
 * that any pointer expression can be passed in safely.
 */
#define for_each_dedup_cand(d, node, hash) \
	hashmap__for_each_key_entry((d)->dedup_table, node, hash)
3150 
3151 static int btf_dedup_table_add(struct btf_dedup *d, long hash, __u32 type_id)
3152 {
3153 	return hashmap__append(d->dedup_table, hash, type_id);
3154 }
3155 
3156 static int btf_dedup_hypot_map_add(struct btf_dedup *d,
3157 				   __u32 from_id, __u32 to_id)
3158 {
3159 	if (d->hypot_cnt == d->hypot_cap) {
3160 		__u32 *new_list;
3161 
3162 		d->hypot_cap += max((size_t)16, d->hypot_cap / 2);
3163 		new_list = libbpf_reallocarray(d->hypot_list, d->hypot_cap, sizeof(__u32));
3164 		if (!new_list)
3165 			return -ENOMEM;
3166 		d->hypot_list = new_list;
3167 	}
3168 	d->hypot_list[d->hypot_cnt++] = from_id;
3169 	d->hypot_map[from_id] = to_id;
3170 	return 0;
3171 }
3172 
3173 static void btf_dedup_clear_hypot_map(struct btf_dedup *d)
3174 {
3175 	int i;
3176 
3177 	for (i = 0; i < d->hypot_cnt; i++)
3178 		d->hypot_map[d->hypot_list[i]] = BTF_UNPROCESSED_ID;
3179 	d->hypot_cnt = 0;
3180 	d->hypot_adjust_canon = false;
3181 }
3182 
3183 static void btf_dedup_free(struct btf_dedup *d)
3184 {
3185 	hashmap__free(d->dedup_table);
3186 	d->dedup_table = NULL;
3187 
3188 	free(d->map);
3189 	d->map = NULL;
3190 
3191 	free(d->hypot_map);
3192 	d->hypot_map = NULL;
3193 
3194 	free(d->hypot_list);
3195 	d->hypot_list = NULL;
3196 
3197 	free(d);
3198 }
3199 
/* Hash callback: the key (a type signature hash) is used as the hash as-is. */
static size_t btf_dedup_identity_hash_fn(long key, void *ctx)
{
	size_t hash = key;

	(void)ctx;
	return hash;
}
3204 
/*
 * Hash callback that maps every key to 0, i.e. makes all keys collide.
 * Selected by btf_dedup_new() when the force_collisions option is set.
 */
static size_t btf_dedup_collision_hash_fn(long key, void *ctx)
{
	(void)key;
	(void)ctx;
	return (size_t)0;
}
3209 
/* Key equality callback: two keys match only when they are the same value. */
static bool btf_dedup_equal_fn(long k1, long k2, void *ctx)
{
	(void)ctx;
	if (k1 != k2)
		return false;
	return true;
}
3214 
3215 static struct btf_dedup *btf_dedup_new(struct btf *btf, const struct btf_dedup_opts *opts)
3216 {
3217 	struct btf_dedup *d = calloc(1, sizeof(struct btf_dedup));
3218 	hashmap_hash_fn hash_fn = btf_dedup_identity_hash_fn;
3219 	int i, err = 0, type_cnt;
3220 
3221 	if (!d)
3222 		return ERR_PTR(-ENOMEM);
3223 
3224 	if (OPTS_GET(opts, force_collisions, false))
3225 		hash_fn = btf_dedup_collision_hash_fn;
3226 
3227 	d->btf = btf;
3228 	d->btf_ext = OPTS_GET(opts, btf_ext, NULL);
3229 
3230 	d->dedup_table = hashmap__new(hash_fn, btf_dedup_equal_fn, NULL);
3231 	if (IS_ERR(d->dedup_table)) {
3232 		err = PTR_ERR(d->dedup_table);
3233 		d->dedup_table = NULL;
3234 		goto done;
3235 	}
3236 
3237 	type_cnt = btf__type_cnt(btf);
3238 	d->map = malloc(sizeof(__u32) * type_cnt);
3239 	if (!d->map) {
3240 		err = -ENOMEM;
3241 		goto done;
3242 	}
3243 	/* special BTF "void" type is made canonical immediately */
3244 	d->map[0] = 0;
3245 	for (i = 1; i < type_cnt; i++) {
3246 		struct btf_type *t = btf_type_by_id(d->btf, i);
3247 
3248 		/* VAR and DATASEC are never deduped and are self-canonical */
3249 		if (btf_is_var(t) || btf_is_datasec(t))
3250 			d->map[i] = i;
3251 		else
3252 			d->map[i] = BTF_UNPROCESSED_ID;
3253 	}
3254 
3255 	d->hypot_map = malloc(sizeof(__u32) * type_cnt);
3256 	if (!d->hypot_map) {
3257 		err = -ENOMEM;
3258 		goto done;
3259 	}
3260 	for (i = 0; i < type_cnt; i++)
3261 		d->hypot_map[i] = BTF_UNPROCESSED_ID;
3262 
3263 done:
3264 	if (err) {
3265 		btf_dedup_free(d);
3266 		return ERR_PTR(err);
3267 	}
3268 
3269 	return d;
3270 }
3271 
3272 /*
3273  * Iterate over all possible places in .BTF and .BTF.ext that can reference
3274  * string and pass pointer to it to a provided callback `fn`.
3275  */
3276 static int btf_for_each_str_off(struct btf_dedup *d, str_off_visit_fn fn, void *ctx)
3277 {
3278 	int i, r;
3279 
3280 	for (i = 0; i < d->btf->nr_types; i++) {
3281 		struct btf_type *t = btf_type_by_id(d->btf, d->btf->start_id + i);
3282 
3283 		r = btf_type_visit_str_offs(t, fn, ctx);
3284 		if (r)
3285 			return r;
3286 	}
3287 
3288 	if (!d->btf_ext)
3289 		return 0;
3290 
3291 	r = btf_ext_visit_str_offs(d->btf_ext, fn, ctx);
3292 	if (r)
3293 		return r;
3294 
3295 	return 0;
3296 }
3297 
3298 static int strs_dedup_remap_str_off(__u32 *str_off_ptr, void *ctx)
3299 {
3300 	struct btf_dedup *d = ctx;
3301 	__u32 str_off = *str_off_ptr;
3302 	const char *s;
3303 	int off, err;
3304 
3305 	/* don't touch empty string or string in main BTF */
3306 	if (str_off == 0 || str_off < d->btf->start_str_off)
3307 		return 0;
3308 
3309 	s = btf__str_by_offset(d->btf, str_off);
3310 	if (d->btf->base_btf) {
3311 		err = btf__find_str(d->btf->base_btf, s);
3312 		if (err >= 0) {
3313 			*str_off_ptr = err;
3314 			return 0;
3315 		}
3316 		if (err != -ENOENT)
3317 			return err;
3318 	}
3319 
3320 	off = strset__add_str(d->strs_set, s);
3321 	if (off < 0)
3322 		return off;
3323 
3324 	*str_off_ptr = d->btf->start_str_off + off;
3325 	return 0;
3326 }
3327 
3328 /*
3329  * Dedup string and filter out those that are not referenced from either .BTF
3330  * or .BTF.ext (if provided) sections.
3331  *
3332  * This is done by building index of all strings in BTF's string section,
3333  * then iterating over all entities that can reference strings (e.g., type
3334  * names, struct field names, .BTF.ext line info, etc) and marking corresponding
3335  * strings as used. After that all used strings are deduped and compacted into
3336  * sequential blob of memory and new offsets are calculated. Then all the string
3337  * references are iterated again and rewritten using new offsets.
3338  */
3339 static int btf_dedup_strings(struct btf_dedup *d)
3340 {
3341 	int err;
3342 
3343 	if (d->btf->strs_deduped)
3344 		return 0;
3345 
3346 	d->strs_set = strset__new(BTF_MAX_STR_OFFSET, NULL, 0);
3347 	if (IS_ERR(d->strs_set)) {
3348 		err = PTR_ERR(d->strs_set);
3349 		goto err_out;
3350 	}
3351 
3352 	if (!d->btf->base_btf) {
3353 		/* insert empty string; we won't be looking it up during strings
3354 		 * dedup, but it's good to have it for generic BTF string lookups
3355 		 */
3356 		err = strset__add_str(d->strs_set, "");
3357 		if (err < 0)
3358 			goto err_out;
3359 	}
3360 
3361 	/* remap string offsets */
3362 	err = btf_for_each_str_off(d, strs_dedup_remap_str_off, d);
3363 	if (err)
3364 		goto err_out;
3365 
3366 	/* replace BTF string data and hash with deduped ones */
3367 	strset__free(d->btf->strs_set);
3368 	d->btf->hdr->str_len = strset__data_size(d->strs_set);
3369 	d->btf->strs_set = d->strs_set;
3370 	d->strs_set = NULL;
3371 	d->btf->strs_deduped = true;
3372 	return 0;
3373 
3374 err_out:
3375 	strset__free(d->strs_set);
3376 	d->strs_set = NULL;
3377 
3378 	return err;
3379 }
3380 
3381 static long btf_hash_common(struct btf_type *t)
3382 {
3383 	long h;
3384 
3385 	h = hash_combine(0, t->name_off);
3386 	h = hash_combine(h, t->info);
3387 	h = hash_combine(h, t->size);
3388 	return h;
3389 }
3390 
3391 static bool btf_equal_common(struct btf_type *t1, struct btf_type *t2)
3392 {
3393 	return t1->name_off == t2->name_off &&
3394 	       t1->info == t2->info &&
3395 	       t1->size == t2->size;
3396 }
3397 
3398 /* Calculate type signature hash of INT or TAG. */
3399 static long btf_hash_int_decl_tag(struct btf_type *t)
3400 {
3401 	__u32 info = *(__u32 *)(t + 1);
3402 	long h;
3403 
3404 	h = btf_hash_common(t);
3405 	h = hash_combine(h, info);
3406 	return h;
3407 }
3408 
3409 /* Check structural equality of two INTs or TAGs. */
3410 static bool btf_equal_int_tag(struct btf_type *t1, struct btf_type *t2)
3411 {
3412 	__u32 info1, info2;
3413 
3414 	if (!btf_equal_common(t1, t2))
3415 		return false;
3416 	info1 = *(__u32 *)(t1 + 1);
3417 	info2 = *(__u32 *)(t2 + 1);
3418 	return info1 == info2;
3419 }
3420 
3421 /* Calculate type signature hash of ENUM/ENUM64. */
3422 static long btf_hash_enum(struct btf_type *t)
3423 {
3424 	long h;
3425 
3426 	/* don't hash vlen, enum members and size to support enum fwd resolving */
3427 	h = hash_combine(0, t->name_off);
3428 	return h;
3429 }
3430 
3431 static bool btf_equal_enum_members(struct btf_type *t1, struct btf_type *t2)
3432 {
3433 	const struct btf_enum *m1, *m2;
3434 	__u16 vlen;
3435 	int i;
3436 
3437 	vlen = btf_vlen(t1);
3438 	m1 = btf_enum(t1);
3439 	m2 = btf_enum(t2);
3440 	for (i = 0; i < vlen; i++) {
3441 		if (m1->name_off != m2->name_off || m1->val != m2->val)
3442 			return false;
3443 		m1++;
3444 		m2++;
3445 	}
3446 	return true;
3447 }
3448 
3449 static bool btf_equal_enum64_members(struct btf_type *t1, struct btf_type *t2)
3450 {
3451 	const struct btf_enum64 *m1, *m2;
3452 	__u16 vlen;
3453 	int i;
3454 
3455 	vlen = btf_vlen(t1);
3456 	m1 = btf_enum64(t1);
3457 	m2 = btf_enum64(t2);
3458 	for (i = 0; i < vlen; i++) {
3459 		if (m1->name_off != m2->name_off || m1->val_lo32 != m2->val_lo32 ||
3460 		    m1->val_hi32 != m2->val_hi32)
3461 			return false;
3462 		m1++;
3463 		m2++;
3464 	}
3465 	return true;
3466 }
3467 
3468 /* Check structural equality of two ENUMs or ENUM64s. */
3469 static bool btf_equal_enum(struct btf_type *t1, struct btf_type *t2)
3470 {
3471 	if (!btf_equal_common(t1, t2))
3472 		return false;
3473 
3474 	/* t1 & t2 kinds are identical because of btf_equal_common */
3475 	if (btf_kind(t1) == BTF_KIND_ENUM)
3476 		return btf_equal_enum_members(t1, t2);
3477 	else
3478 		return btf_equal_enum64_members(t1, t2);
3479 }
3480 
/* An enum forward declaration is an ENUM/ENUM64 without any members. */
static inline bool btf_is_enum_fwd(struct btf_type *t)
{
	if (!btf_is_any_enum(t))
		return false;
	return btf_vlen(t) == 0;
}
3485 
3486 static bool btf_compat_enum(struct btf_type *t1, struct btf_type *t2)
3487 {
3488 	if (!btf_is_enum_fwd(t1) && !btf_is_enum_fwd(t2))
3489 		return btf_equal_enum(t1, t2);
3490 	/* At this point either t1 or t2 or both are forward declarations, thus:
3491 	 * - skip comparing vlen because it is zero for forward declarations;
3492 	 * - skip comparing size to allow enum forward declarations
3493 	 *   to be compatible with enum64 full declarations;
3494 	 * - skip comparing kind for the same reason.
3495 	 */
3496 	return t1->name_off == t2->name_off &&
3497 	       btf_is_any_enum(t1) && btf_is_any_enum(t2);
3498 }
3499 
3500 /*
3501  * Calculate type signature hash of STRUCT/UNION, ignoring referenced type IDs,
3502  * as referenced type IDs equivalence is established separately during type
3503  * graph equivalence check algorithm.
3504  */
3505 static long btf_hash_struct(struct btf_type *t)
3506 {
3507 	const struct btf_member *member = btf_members(t);
3508 	__u32 vlen = btf_vlen(t);
3509 	long h = btf_hash_common(t);
3510 	int i;
3511 
3512 	for (i = 0; i < vlen; i++) {
3513 		h = hash_combine(h, member->name_off);
3514 		h = hash_combine(h, member->offset);
3515 		/* no hashing of referenced type ID, it can be unresolved yet */
3516 		member++;
3517 	}
3518 	return h;
3519 }
3520 
3521 /*
3522  * Check structural compatibility of two STRUCTs/UNIONs, ignoring referenced
3523  * type IDs. This check is performed during type graph equivalence check and
3524  * referenced types equivalence is checked separately.
3525  */
3526 static bool btf_shallow_equal_struct(struct btf_type *t1, struct btf_type *t2)
3527 {
3528 	const struct btf_member *m1, *m2;
3529 	__u16 vlen;
3530 	int i;
3531 
3532 	if (!btf_equal_common(t1, t2))
3533 		return false;
3534 
3535 	vlen = btf_vlen(t1);
3536 	m1 = btf_members(t1);
3537 	m2 = btf_members(t2);
3538 	for (i = 0; i < vlen; i++) {
3539 		if (m1->name_off != m2->name_off || m1->offset != m2->offset)
3540 			return false;
3541 		m1++;
3542 		m2++;
3543 	}
3544 	return true;
3545 }
3546 
3547 /*
3548  * Calculate type signature hash of ARRAY, including referenced type IDs,
3549  * under assumption that they were already resolved to canonical type IDs and
3550  * are not going to change.
3551  */
3552 static long btf_hash_array(struct btf_type *t)
3553 {
3554 	const struct btf_array *info = btf_array(t);
3555 	long h = btf_hash_common(t);
3556 
3557 	h = hash_combine(h, info->type);
3558 	h = hash_combine(h, info->index_type);
3559 	h = hash_combine(h, info->nelems);
3560 	return h;
3561 }
3562 
3563 /*
3564  * Check exact equality of two ARRAYs, taking into account referenced
3565  * type IDs, under assumption that they were already resolved to canonical
3566  * type IDs and are not going to change.
3567  * This function is called during reference types deduplication to compare
3568  * ARRAY to potential canonical representative.
3569  */
3570 static bool btf_equal_array(struct btf_type *t1, struct btf_type *t2)
3571 {
3572 	const struct btf_array *info1, *info2;
3573 
3574 	if (!btf_equal_common(t1, t2))
3575 		return false;
3576 
3577 	info1 = btf_array(t1);
3578 	info2 = btf_array(t2);
3579 	return info1->type == info2->type &&
3580 	       info1->index_type == info2->index_type &&
3581 	       info1->nelems == info2->nelems;
3582 }
3583 
3584 /*
3585  * Check structural compatibility of two ARRAYs, ignoring referenced type
3586  * IDs. This check is performed during type graph equivalence check and
3587  * referenced types equivalence is checked separately.
3588  */
3589 static bool btf_compat_array(struct btf_type *t1, struct btf_type *t2)
3590 {
3591 	if (!btf_equal_common(t1, t2))
3592 		return false;
3593 
3594 	return btf_array(t1)->nelems == btf_array(t2)->nelems;
3595 }
3596 
3597 /*
3598  * Calculate type signature hash of FUNC_PROTO, including referenced type IDs,
3599  * under assumption that they were already resolved to canonical type IDs and
3600  * are not going to change.
3601  */
3602 static long btf_hash_fnproto(struct btf_type *t)
3603 {
3604 	const struct btf_param *member = btf_params(t);
3605 	__u16 vlen = btf_vlen(t);
3606 	long h = btf_hash_common(t);
3607 	int i;
3608 
3609 	for (i = 0; i < vlen; i++) {
3610 		h = hash_combine(h, member->name_off);
3611 		h = hash_combine(h, member->type);
3612 		member++;
3613 	}
3614 	return h;
3615 }
3616 
3617 /*
3618  * Check exact equality of two FUNC_PROTOs, taking into account referenced
3619  * type IDs, under assumption that they were already resolved to canonical
3620  * type IDs and are not going to change.
3621  * This function is called during reference types deduplication to compare
3622  * FUNC_PROTO to potential canonical representative.
3623  */
3624 static bool btf_equal_fnproto(struct btf_type *t1, struct btf_type *t2)
3625 {
3626 	const struct btf_param *m1, *m2;
3627 	__u16 vlen;
3628 	int i;
3629 
3630 	if (!btf_equal_common(t1, t2))
3631 		return false;
3632 
3633 	vlen = btf_vlen(t1);
3634 	m1 = btf_params(t1);
3635 	m2 = btf_params(t2);
3636 	for (i = 0; i < vlen; i++) {
3637 		if (m1->name_off != m2->name_off || m1->type != m2->type)
3638 			return false;
3639 		m1++;
3640 		m2++;
3641 	}
3642 	return true;
3643 }
3644 
3645 /*
3646  * Check structural compatibility of two FUNC_PROTOs, ignoring referenced type
3647  * IDs. This check is performed during type graph equivalence check and
3648  * referenced types equivalence is checked separately.
3649  */
3650 static bool btf_compat_fnproto(struct btf_type *t1, struct btf_type *t2)
3651 {
3652 	const struct btf_param *m1, *m2;
3653 	__u16 vlen;
3654 	int i;
3655 
3656 	/* skip return type ID */
3657 	if (t1->name_off != t2->name_off || t1->info != t2->info)
3658 		return false;
3659 
3660 	vlen = btf_vlen(t1);
3661 	m1 = btf_params(t1);
3662 	m2 = btf_params(t2);
3663 	for (i = 0; i < vlen; i++) {
3664 		if (m1->name_off != m2->name_off)
3665 			return false;
3666 		m1++;
3667 		m2++;
3668 	}
3669 	return true;
3670 }
3671 
3672 /* Prepare split BTF for deduplication by calculating hashes of base BTF's
3673  * types and initializing the rest of the state (canonical type mapping) for
3674  * the fixed base BTF part.
3675  */
3676 static int btf_dedup_prep(struct btf_dedup *d)
3677 {
3678 	struct btf_type *t;
3679 	int type_id;
3680 	long h;
3681 
3682 	if (!d->btf->base_btf)
3683 		return 0;
3684 
3685 	for (type_id = 1; type_id < d->btf->start_id; type_id++) {
3686 		t = btf_type_by_id(d->btf, type_id);
3687 
3688 		/* all base BTF types are self-canonical by definition */
3689 		d->map[type_id] = type_id;
3690 
3691 		switch (btf_kind(t)) {
3692 		case BTF_KIND_VAR:
3693 		case BTF_KIND_DATASEC:
3694 			/* VAR and DATASEC are never hash/deduplicated */
3695 			continue;
3696 		case BTF_KIND_CONST:
3697 		case BTF_KIND_VOLATILE:
3698 		case BTF_KIND_RESTRICT:
3699 		case BTF_KIND_PTR:
3700 		case BTF_KIND_FWD:
3701 		case BTF_KIND_TYPEDEF:
3702 		case BTF_KIND_FUNC:
3703 		case BTF_KIND_FLOAT:
3704 		case BTF_KIND_TYPE_TAG:
3705 			h = btf_hash_common(t);
3706 			break;
3707 		case BTF_KIND_INT:
3708 		case BTF_KIND_DECL_TAG:
3709 			h = btf_hash_int_decl_tag(t);
3710 			break;
3711 		case BTF_KIND_ENUM:
3712 		case BTF_KIND_ENUM64:
3713 			h = btf_hash_enum(t);
3714 			break;
3715 		case BTF_KIND_STRUCT:
3716 		case BTF_KIND_UNION:
3717 			h = btf_hash_struct(t);
3718 			break;
3719 		case BTF_KIND_ARRAY:
3720 			h = btf_hash_array(t);
3721 			break;
3722 		case BTF_KIND_FUNC_PROTO:
3723 			h = btf_hash_fnproto(t);
3724 			break;
3725 		default:
3726 			pr_debug("unknown kind %d for type [%d]\n", btf_kind(t), type_id);
3727 			return -EINVAL;
3728 		}
3729 		if (btf_dedup_table_add(d, h, type_id))
3730 			return -ENOMEM;
3731 	}
3732 
3733 	return 0;
3734 }
3735 
3736 /*
3737  * Deduplicate primitive types, that can't reference other types, by calculating
3738  * their type signature hash and comparing them with any possible canonical
3739  * candidate. If no canonical candidate matches, type itself is marked as
3740  * canonical and is added into `btf_dedup->dedup_table` as another candidate.
3741  */
3742 static int btf_dedup_prim_type(struct btf_dedup *d, __u32 type_id)
3743 {
3744 	struct btf_type *t = btf_type_by_id(d->btf, type_id);
3745 	struct hashmap_entry *hash_entry;
3746 	struct btf_type *cand;
3747 	/* if we don't find equivalent type, then we are canonical */
3748 	__u32 new_id = type_id;
3749 	__u32 cand_id;
3750 	long h;
3751 
3752 	switch (btf_kind(t)) {
3753 	case BTF_KIND_CONST:
3754 	case BTF_KIND_VOLATILE:
3755 	case BTF_KIND_RESTRICT:
3756 	case BTF_KIND_PTR:
3757 	case BTF_KIND_TYPEDEF:
3758 	case BTF_KIND_ARRAY:
3759 	case BTF_KIND_STRUCT:
3760 	case BTF_KIND_UNION:
3761 	case BTF_KIND_FUNC:
3762 	case BTF_KIND_FUNC_PROTO:
3763 	case BTF_KIND_VAR:
3764 	case BTF_KIND_DATASEC:
3765 	case BTF_KIND_DECL_TAG:
3766 	case BTF_KIND_TYPE_TAG:
3767 		return 0;
3768 
3769 	case BTF_KIND_INT:
3770 		h = btf_hash_int_decl_tag(t);
3771 		for_each_dedup_cand(d, hash_entry, h) {
3772 			cand_id = hash_entry->value;
3773 			cand = btf_type_by_id(d->btf, cand_id);
3774 			if (btf_equal_int_tag(t, cand)) {
3775 				new_id = cand_id;
3776 				break;
3777 			}
3778 		}
3779 		break;
3780 
3781 	case BTF_KIND_ENUM:
3782 	case BTF_KIND_ENUM64:
3783 		h = btf_hash_enum(t);
3784 		for_each_dedup_cand(d, hash_entry, h) {
3785 			cand_id = hash_entry->value;
3786 			cand = btf_type_by_id(d->btf, cand_id);
3787 			if (btf_equal_enum(t, cand)) {
3788 				new_id = cand_id;
3789 				break;
3790 			}
3791 			if (btf_compat_enum(t, cand)) {
3792 				if (btf_is_enum_fwd(t)) {
3793 					/* resolve fwd to full enum */
3794 					new_id = cand_id;
3795 					break;
3796 				}
3797 				/* resolve canonical enum fwd to full enum */
3798 				d->map[cand_id] = type_id;
3799 			}
3800 		}
3801 		break;
3802 
3803 	case BTF_KIND_FWD:
3804 	case BTF_KIND_FLOAT:
3805 		h = btf_hash_common(t);
3806 		for_each_dedup_cand(d, hash_entry, h) {
3807 			cand_id = hash_entry->value;
3808 			cand = btf_type_by_id(d->btf, cand_id);
3809 			if (btf_equal_common(t, cand)) {
3810 				new_id = cand_id;
3811 				break;
3812 			}
3813 		}
3814 		break;
3815 
3816 	default:
3817 		return -EINVAL;
3818 	}
3819 
3820 	d->map[type_id] = new_id;
3821 	if (type_id == new_id && btf_dedup_table_add(d, h, type_id))
3822 		return -ENOMEM;
3823 
3824 	return 0;
3825 }
3826 
3827 static int btf_dedup_prim_types(struct btf_dedup *d)
3828 {
3829 	int i, err;
3830 
3831 	for (i = 0; i < d->btf->nr_types; i++) {
3832 		err = btf_dedup_prim_type(d, d->btf->start_id + i);
3833 		if (err)
3834 			return err;
3835 	}
3836 	return 0;
3837 }
3838 
3839 /*
3840  * Check whether type is already mapped into canonical one (could be to itself).
3841  */
3842 static inline bool is_type_mapped(struct btf_dedup *d, uint32_t type_id)
3843 {
3844 	return d->map[type_id] <= BTF_MAX_NR_TYPES;
3845 }
3846 
3847 /*
3848  * Resolve type ID into its canonical type ID, if any; otherwise return original
3849  * type ID. If type is FWD and is resolved into STRUCT/UNION already, follow
3850  * STRUCT/UNION link and resolve it into canonical type ID as well.
3851  */
3852 static inline __u32 resolve_type_id(struct btf_dedup *d, __u32 type_id)
3853 {
3854 	while (is_type_mapped(d, type_id) && d->map[type_id] != type_id)
3855 		type_id = d->map[type_id];
3856 	return type_id;
3857 }
3858 
3859 /*
3860  * Resolve FWD to underlying STRUCT/UNION, if any; otherwise return original
3861  * type ID.
3862  */
3863 static uint32_t resolve_fwd_id(struct btf_dedup *d, uint32_t type_id)
3864 {
3865 	__u32 orig_type_id = type_id;
3866 
3867 	if (!btf_is_fwd(btf__type_by_id(d->btf, type_id)))
3868 		return type_id;
3869 
3870 	while (is_type_mapped(d, type_id) && d->map[type_id] != type_id)
3871 		type_id = d->map[type_id];
3872 
3873 	if (!btf_is_fwd(btf__type_by_id(d->btf, type_id)))
3874 		return type_id;
3875 
3876 	return orig_type_id;
3877 }
3878 
3879 
3880 static inline __u16 btf_fwd_kind(struct btf_type *t)
3881 {
3882 	return btf_kflag(t) ? BTF_KIND_UNION : BTF_KIND_STRUCT;
3883 }
3884 
3885 /* Check if given two types are identical ARRAY definitions */
3886 static bool btf_dedup_identical_arrays(struct btf_dedup *d, __u32 id1, __u32 id2)
3887 {
3888 	struct btf_type *t1, *t2;
3889 
3890 	t1 = btf_type_by_id(d->btf, id1);
3891 	t2 = btf_type_by_id(d->btf, id2);
3892 	if (!btf_is_array(t1) || !btf_is_array(t2))
3893 		return false;
3894 
3895 	return btf_equal_array(t1, t2);
3896 }
3897 
3898 /* Check if given two types are identical STRUCT/UNION definitions */
3899 static bool btf_dedup_identical_structs(struct btf_dedup *d, __u32 id1, __u32 id2)
3900 {
3901 	const struct btf_member *m1, *m2;
3902 	struct btf_type *t1, *t2;
3903 	int n, i;
3904 
3905 	t1 = btf_type_by_id(d->btf, id1);
3906 	t2 = btf_type_by_id(d->btf, id2);
3907 
3908 	if (!btf_is_composite(t1) || btf_kind(t1) != btf_kind(t2))
3909 		return false;
3910 
3911 	if (!btf_shallow_equal_struct(t1, t2))
3912 		return false;
3913 
3914 	m1 = btf_members(t1);
3915 	m2 = btf_members(t2);
3916 	for (i = 0, n = btf_vlen(t1); i < n; i++, m1++, m2++) {
3917 		if (m1->type != m2->type &&
3918 		    !btf_dedup_identical_arrays(d, m1->type, m2->type) &&
3919 		    !btf_dedup_identical_structs(d, m1->type, m2->type))
3920 			return false;
3921 	}
3922 	return true;
3923 }
3924 
3925 /*
3926  * Check equivalence of BTF type graph formed by candidate struct/union (we'll
3927  * call it "candidate graph" in this description for brevity) to a type graph
3928  * formed by (potential) canonical struct/union ("canonical graph" for brevity
3929  * here, though keep in mind that not all types in canonical graph are
3930  * necessarily canonical representatives themselves, some of them might be
3931  * duplicates or its uniqueness might not have been established yet).
3932  * Returns:
3933  *  - >0, if type graphs are equivalent;
3934  *  -  0, if not equivalent;
3935  *  - <0, on error.
3936  *
3937  * Algorithm performs side-by-side DFS traversal of both type graphs and checks
3938  * equivalence of BTF types at each step. If at any point BTF types in candidate
3939  * and canonical graphs are not compatible structurally, whole graphs are
3940  * incompatible. If types are structurally equivalent (i.e., all information
3941  * except referenced type IDs is exactly the same), a mapping from `canon_id` to
 * a `cand_id` is recorded in hypothetical mapping (`btf_dedup->hypot_map`).
3943  * If a type references other types, then those referenced types are checked
3944  * for equivalence recursively.
3945  *
3946  * During DFS traversal, if we find that for current `canon_id` type we
3947  * already have some mapping in hypothetical map, we check for two possible
3948  * situations:
3949  *   - `canon_id` is mapped to exactly the same type as `cand_id`. This will
3950  *     happen when type graphs have cycles. In this case we assume those two
3951  *     types are equivalent.
3952  *   - `canon_id` is mapped to different type. This is contradiction in our
 *     hypothetical mapping, because same type in canonical graph corresponds
3954  *     to two different types in candidate graph, which for equivalent type
3955  *     graphs shouldn't happen. This condition terminates equivalence check
3956  *     with negative result.
3957  *
3958  * If type graphs traversal exhausts types to check and find no contradiction,
3959  * then type graphs are equivalent.
3960  *
3961  * When checking types for equivalence, there is one special case: FWD types.
3962  * If FWD type resolution is allowed and one of the types (either from canonical
3963  * or candidate graph) is FWD and other is STRUCT/UNION (depending on FWD's kind
3964  * flag) and their names match, hypothetical mapping is updated to point from
3965  * FWD to STRUCT/UNION. If graphs will be determined as equivalent successfully,
3966  * this mapping will be used to record FWD -> STRUCT/UNION mapping permanently.
3967  *
3968  * Technically, this could lead to incorrect FWD to STRUCT/UNION resolution,
3969  * if there are two exactly named (or anonymous) structs/unions that are
3970  * compatible structurally, one of which has FWD field, while other is concrete
3971  * STRUCT/UNION, but according to C sources they are different structs/unions
3972  * that are referencing different types with the same name. This is extremely
3973  * unlikely to happen, but btf_dedup API allows to disable FWD resolution if
3974  * this logic is causing problems.
3975  *
3976  * Doing FWD resolution means that both candidate and/or canonical graphs can
 * consist of portions of the graph that come from multiple compilation units.
3978  * This is due to the fact that types within single compilation unit are always
3979  * deduplicated and FWDs are already resolved, if referenced struct/union
 * definition is available. So, if we had unresolved FWD and found corresponding
3981  * STRUCT/UNION, they will be from different compilation units. This
3982  * consequently means that when we "link" FWD to corresponding STRUCT/UNION,
3983  * type graph will likely have at least two different BTF types that describe
3984  * same type (e.g., most probably there will be two different BTF types for the
3985  * same 'int' primitive type) and could even have "overlapping" parts of type
3986  * graph that describe same subset of types.
3987  *
3988  * This in turn means that our assumption that each type in canonical graph
3989  * must correspond to exactly one type in candidate graph might not hold
3990  * anymore and will make it harder to detect contradictions using hypothetical
3991  * map. To handle this problem, we allow to follow FWD -> STRUCT/UNION
3992  * resolution only in canonical graph. FWDs in candidate graphs are never
3993  * resolved. To see why it's OK, let's check all possible situations w.r.t. FWDs
3994  * that can occur:
3995  *   - Both types in canonical and candidate graphs are FWDs. If they are
3996  *     structurally equivalent, then they can either be both resolved to the
3997  *     same STRUCT/UNION or not resolved at all. In both cases they are
3998  *     equivalent and there is no need to resolve FWD on candidate side.
3999  *   - Both types in canonical and candidate graphs are concrete STRUCT/UNION,
4000  *     so nothing to resolve as well, algorithm will check equivalence anyway.
4001  *   - Type in canonical graph is FWD, while type in candidate is concrete
4002  *     STRUCT/UNION. In this case candidate graph comes from single compilation
4003  *     unit, so there is exactly one BTF type for each unique C type. After
4004  *     resolving FWD into STRUCT/UNION, there might be more than one BTF type
4005  *     in canonical graph mapping to single BTF type in candidate graph, but
4006  *     because hypothetical mapping maps from canonical to candidate types, it's
4007  *     alright, and we still maintain the property of having single `canon_id`
4008  *     mapping to single `cand_id` (there could be two different `canon_id`
4009  *     mapped to the same `cand_id`, but it's not contradictory).
4010  *   - Type in canonical graph is concrete STRUCT/UNION, while type in candidate
4011  *     graph is FWD. In this case we are just going to check compatibility of
4012  *     STRUCT/UNION and corresponding FWD, and if they are compatible, we'll
4013  *     assume that whatever STRUCT/UNION FWD resolves to must be equivalent to
4014  *     a concrete STRUCT/UNION from canonical graph. If the rest of type graphs
4015  *     turn out equivalent, we'll re-resolve FWD to concrete STRUCT/UNION from
4016  *     canonical graph.
4017  */
static int btf_dedup_is_equiv(struct btf_dedup *d, __u32 cand_id,
			      __u32 canon_id)
{
	struct btf_type *cand_type;
	struct btf_type *canon_type;
	__u32 hypot_type_id;
	__u16 cand_kind;
	__u16 canon_kind;
	int i, eq;

	/* if both resolve to the same canonical, they must be equivalent */
	if (resolve_type_id(d, cand_id) == resolve_type_id(d, canon_id))
		return 1;

	/* FWDs are followed to their resolution on the canonical side only */
	canon_id = resolve_fwd_id(d, canon_id);

	/* a value within BTF_MAX_NR_TYPES means canon_id was already visited
	 * during this equivalence check and has a hypothetical mapping
	 */
	hypot_type_id = d->hypot_map[canon_id];
	if (hypot_type_id <= BTF_MAX_NR_TYPES) {
		if (hypot_type_id == cand_id)
			return 1;
		/* In some cases compiler will generate different DWARF types
		 * for *identical* array type definitions and use them for
		 * different fields within the *same* struct. This breaks type
		 * equivalence check, which makes an assumption that candidate
		 * types sub-graph has a consistent and deduped-by-compiler
		 * types within a single CU. So work around that by explicitly
		 * allowing identical array types here.
		 */
		if (btf_dedup_identical_arrays(d, hypot_type_id, cand_id))
			return 1;
		/* It turns out that similar situation can happen with
		 * struct/union sometimes, sigh... Handle the case where
		 * structs/unions are exactly the same, down to the referenced
		 * type IDs. Anything more complicated (e.g., if referenced
		 * types are different, but equivalent) is *way more*
		 * complicated and requires a many-to-many equivalence mapping.
		 */
		if (btf_dedup_identical_structs(d, hypot_type_id, cand_id))
			return 1;
		return 0;
	}

	/* record the mapping before looking at the types themselves, so that
	 * a recursive visit of canon_id (cycle in the type graph) hits the
	 * hypot_map lookup above
	 */
	if (btf_dedup_hypot_map_add(d, canon_id, cand_id))
		return -ENOMEM;

	cand_type = btf_type_by_id(d->btf, cand_id);
	canon_type = btf_type_by_id(d->btf, canon_id);
	cand_kind = btf_kind(cand_type);
	canon_kind = btf_kind(canon_type);

	/* names have to match for every kind, FWD vs STRUCT/UNION included */
	if (cand_type->name_off != canon_type->name_off)
		return 0;

	/* FWD <--> STRUCT/UNION equivalence check, if enabled */
	if ((cand_kind == BTF_KIND_FWD || canon_kind == BTF_KIND_FWD)
	    && cand_kind != canon_kind) {
		__u16 real_kind;
		__u16 fwd_kind;

		if (cand_kind == BTF_KIND_FWD) {
			real_kind = canon_kind;
			fwd_kind = btf_fwd_kind(cand_type);
		} else {
			real_kind = cand_kind;
			fwd_kind = btf_fwd_kind(canon_type);
			/* we'd need to resolve base FWD to STRUCT/UNION */
			if (fwd_kind == real_kind && canon_id < d->btf->start_id)
				d->hypot_adjust_canon = true;
		}
		/* equivalent only if FWD declares the kind of the other type */
		return fwd_kind == real_kind;
	}

	if (cand_kind != canon_kind)
		return 0;

	switch (cand_kind) {
	case BTF_KIND_INT:
		return btf_equal_int_tag(cand_type, canon_type);

	case BTF_KIND_ENUM:
	case BTF_KIND_ENUM64:
		return btf_compat_enum(cand_type, canon_type);

	case BTF_KIND_FWD:
	case BTF_KIND_FLOAT:
		return btf_equal_common(cand_type, canon_type);

	case BTF_KIND_CONST:
	case BTF_KIND_VOLATILE:
	case BTF_KIND_RESTRICT:
	case BTF_KIND_PTR:
	case BTF_KIND_TYPEDEF:
	case BTF_KIND_FUNC:
	case BTF_KIND_TYPE_TAG:
		/* single referenced type: compare info, then recurse into it */
		if (cand_type->info != canon_type->info)
			return 0;
		return btf_dedup_is_equiv(d, cand_type->type, canon_type->type);

	case BTF_KIND_ARRAY: {
		const struct btf_array *cand_arr, *canon_arr;

		if (!btf_compat_array(cand_type, canon_type))
			return 0;
		cand_arr = btf_array(cand_type);
		canon_arr = btf_array(canon_type);
		/* both index type and element type have to be equivalent */
		eq = btf_dedup_is_equiv(d, cand_arr->index_type, canon_arr->index_type);
		if (eq <= 0)
			return eq;
		return btf_dedup_is_equiv(d, cand_arr->type, canon_arr->type);
	}

	case BTF_KIND_STRUCT:
	case BTF_KIND_UNION: {
		const struct btf_member *cand_m, *canon_m;
		__u16 vlen;

		if (!btf_shallow_equal_struct(cand_type, canon_type))
			return 0;
		vlen = btf_vlen(cand_type);
		cand_m = btf_members(cand_type);
		canon_m = btf_members(canon_type);
		/* member types are checked pairwise; the first mismatch or
		 * error ends the check
		 */
		for (i = 0; i < vlen; i++) {
			eq = btf_dedup_is_equiv(d, cand_m->type, canon_m->type);
			if (eq <= 0)
				return eq;
			cand_m++;
			canon_m++;
		}

		return 1;
	}

	case BTF_KIND_FUNC_PROTO: {
		const struct btf_param *cand_p, *canon_p;
		__u16 vlen;

		if (!btf_compat_fnproto(cand_type, canon_type))
			return 0;
		/* return type first, then every parameter type */
		eq = btf_dedup_is_equiv(d, cand_type->type, canon_type->type);
		if (eq <= 0)
			return eq;
		vlen = btf_vlen(cand_type);
		cand_p = btf_params(cand_type);
		canon_p = btf_params(canon_type);
		for (i = 0; i < vlen; i++) {
			eq = btf_dedup_is_equiv(d, cand_p->type, canon_p->type);
			if (eq <= 0)
				return eq;
			cand_p++;
			canon_p++;
		}
		return 1;
	}

	default:
		return -EINVAL;
	}
	/* not reached: every switch branch above returns */
	return 0;
}
4177 
4178 /*
4179  * Use hypothetical mapping, produced by successful type graph equivalence
4180  * check, to augment existing struct/union canonical mapping, where possible.
4181  *
4182  * If BTF_KIND_FWD resolution is allowed, this mapping is also used to record
4183  * FWD -> STRUCT/UNION correspondence as well. FWD resolution is bidirectional:
4184  * it doesn't matter if FWD type was part of canonical graph or candidate one,
4185  * we are recording the mapping anyway. As opposed to carefulness required
4186  * for struct/union correspondence mapping (described below), for FWD resolution
4187  * it's not important, as by the time that FWD type (reference type) will be
4188  * deduplicated all structs/unions will be deduped already anyway.
4189  *
4190  * Recording STRUCT/UNION mapping is purely a performance optimization and is
4191  * not required for correctness. It needs to be done carefully to ensure that
4192  * struct/union from candidate's type graph is not mapped into corresponding
4193  * struct/union from canonical type graph that itself hasn't been resolved into
4194  * canonical representative. The only guarantee we have is that canonical
4195  * struct/union was determined as canonical and that won't change. But any
4196  * types referenced through that struct/union fields could have been not yet
4197  * resolved, so in case like that it's too early to establish any kind of
4198  * correspondence between structs/unions.
4199  *
4200  * No canonical correspondence is derived for primitive types (they are already
4201  * deduplicated completely already anyway) or reference types (they rely on
4202  * stability of struct/union canonical relationship for equivalence checks).
4203  */
4204 static void btf_dedup_merge_hypot_map(struct btf_dedup *d)
4205 {
4206 	__u32 canon_type_id, targ_type_id;
4207 	__u16 t_kind, c_kind;
4208 	__u32 t_id, c_id;
4209 	int i;
4210 
4211 	for (i = 0; i < d->hypot_cnt; i++) {
4212 		canon_type_id = d->hypot_list[i];
4213 		targ_type_id = d->hypot_map[canon_type_id];
4214 		t_id = resolve_type_id(d, targ_type_id);
4215 		c_id = resolve_type_id(d, canon_type_id);
4216 		t_kind = btf_kind(btf__type_by_id(d->btf, t_id));
4217 		c_kind = btf_kind(btf__type_by_id(d->btf, c_id));
4218 		/*
4219 		 * Resolve FWD into STRUCT/UNION.
4220 		 * It's ok to resolve FWD into STRUCT/UNION that's not yet
4221 		 * mapped to canonical representative (as opposed to
4222 		 * STRUCT/UNION <--> STRUCT/UNION mapping logic below), because
4223 		 * eventually that struct is going to be mapped and all resolved
4224 		 * FWDs will automatically resolve to correct canonical
4225 		 * representative. This will happen before ref type deduping,
4226 		 * which critically depends on stability of these mapping. This
4227 		 * stability is not a requirement for STRUCT/UNION equivalence
4228 		 * checks, though.
4229 		 */
4230 
4231 		/* if it's the split BTF case, we still need to point base FWD
4232 		 * to STRUCT/UNION in a split BTF, because FWDs from split BTF
4233 		 * will be resolved against base FWD. If we don't point base
4234 		 * canonical FWD to the resolved STRUCT/UNION, then all the
4235 		 * FWDs in split BTF won't be correctly resolved to a proper
4236 		 * STRUCT/UNION.
4237 		 */
4238 		if (t_kind != BTF_KIND_FWD && c_kind == BTF_KIND_FWD)
4239 			d->map[c_id] = t_id;
4240 
4241 		/* if graph equivalence determined that we'd need to adjust
4242 		 * base canonical types, then we need to only point base FWDs
4243 		 * to STRUCTs/UNIONs and do no more modifications. For all
4244 		 * other purposes the type graphs were not equivalent.
4245 		 */
4246 		if (d->hypot_adjust_canon)
4247 			continue;
4248 
4249 		if (t_kind == BTF_KIND_FWD && c_kind != BTF_KIND_FWD)
4250 			d->map[t_id] = c_id;
4251 
4252 		if ((t_kind == BTF_KIND_STRUCT || t_kind == BTF_KIND_UNION) &&
4253 		    c_kind != BTF_KIND_FWD &&
4254 		    is_type_mapped(d, c_id) &&
4255 		    !is_type_mapped(d, t_id)) {
4256 			/*
4257 			 * as a perf optimization, we can map struct/union
4258 			 * that's part of type graph we just verified for
4259 			 * equivalence. We can do that for struct/union that has
4260 			 * canonical representative only, though.
4261 			 */
4262 			d->map[t_id] = c_id;
4263 		}
4264 	}
4265 }
4266 
4267 /*
4268  * Deduplicate struct/union types.
4269  *
4270  * For each struct/union type its type signature hash is calculated, taking
4271  * into account type's name, size, number, order and names of fields, but
4272  * ignoring type ID's referenced from fields, because they might not be deduped
4273  * completely until after reference types deduplication phase. This type hash
4274  * is used to iterate over all potential canonical types, sharing same hash.
4275  * For each canonical candidate we check whether type graphs that they form
4276  * (through referenced types in fields and so on) are equivalent using algorithm
4277  * implemented in `btf_dedup_is_equiv`. If such equivalence is found and
4278  * BTF_KIND_FWD resolution is allowed, then hypothetical mapping
4279  * (btf_dedup->hypot_map) produced by aforementioned type graph equivalence
4280  * algorithm is used to record FWD -> STRUCT/UNION mapping. It's also used to
4281  * potentially map other structs/unions to their canonical representatives,
4282  * if such relationship hasn't yet been established. This speeds up algorithm
4283  * by eliminating some of the duplicate work.
4284  *
4285  * If no matching canonical representative was found, struct/union is marked
4286  * as canonical for itself and is added into btf_dedup->dedup_table hash map
4287  * for further look ups.
4288  */
4289 static int btf_dedup_struct_type(struct btf_dedup *d, __u32 type_id)
4290 {
4291 	struct btf_type *cand_type, *t;
4292 	struct hashmap_entry *hash_entry;
4293 	/* if we don't find equivalent type, then we are canonical */
4294 	__u32 new_id = type_id;
4295 	__u16 kind;
4296 	long h;
4297 
4298 	/* already deduped or is in process of deduping (loop detected) */
4299 	if (d->map[type_id] <= BTF_MAX_NR_TYPES)
4300 		return 0;
4301 
4302 	t = btf_type_by_id(d->btf, type_id);
4303 	kind = btf_kind(t);
4304 
4305 	if (kind != BTF_KIND_STRUCT && kind != BTF_KIND_UNION)
4306 		return 0;
4307 
4308 	h = btf_hash_struct(t);
4309 	for_each_dedup_cand(d, hash_entry, h) {
4310 		__u32 cand_id = hash_entry->value;
4311 		int eq;
4312 
4313 		/*
4314 		 * Even though btf_dedup_is_equiv() checks for
4315 		 * btf_shallow_equal_struct() internally when checking two
4316 		 * structs (unions) for equivalence, we need to guard here
4317 		 * from picking matching FWD type as a dedup candidate.
4318 		 * This can happen due to hash collision. In such case just
4319 		 * relying on btf_dedup_is_equiv() would lead to potentially
4320 		 * creating a loop (FWD -> STRUCT and STRUCT -> FWD), because
4321 		 * FWD and compatible STRUCT/UNION are considered equivalent.
4322 		 */
4323 		cand_type = btf_type_by_id(d->btf, cand_id);
4324 		if (!btf_shallow_equal_struct(t, cand_type))
4325 			continue;
4326 
4327 		btf_dedup_clear_hypot_map(d);
4328 		eq = btf_dedup_is_equiv(d, type_id, cand_id);
4329 		if (eq < 0)
4330 			return eq;
4331 		if (!eq)
4332 			continue;
4333 		btf_dedup_merge_hypot_map(d);
4334 		if (d->hypot_adjust_canon) /* not really equivalent */
4335 			continue;
4336 		new_id = cand_id;
4337 		break;
4338 	}
4339 
4340 	d->map[type_id] = new_id;
4341 	if (type_id == new_id && btf_dedup_table_add(d, h, type_id))
4342 		return -ENOMEM;
4343 
4344 	return 0;
4345 }
4346 
4347 static int btf_dedup_struct_types(struct btf_dedup *d)
4348 {
4349 	int i, err;
4350 
4351 	for (i = 0; i < d->btf->nr_types; i++) {
4352 		err = btf_dedup_struct_type(d, d->btf->start_id + i);
4353 		if (err)
4354 			return err;
4355 	}
4356 	return 0;
4357 }
4358 
4359 /*
4360  * Deduplicate reference type.
4361  *
4362  * Once all primitive and struct/union types got deduplicated, we can easily
4363  * deduplicate all other (reference) BTF types. This is done in two steps:
4364  *
4365  * 1. Resolve all referenced type IDs into their canonical type IDs. This
4366  * resolution can be done either immediately for primitive or struct/union types
4367  * (because they were deduped in previous two phases) or recursively for
4368  * reference types. Recursion will always terminate at either primitive or
4369  * struct/union type, at which point we can "unwind" chain of reference types
4370  * one by one. There is no danger of encountering cycles because in C type
4371  * system the only way to form type cycle is through struct/union, so any chain
4372  * of reference types, even those taking part in a type cycle, will inevitably
4373  * reach struct/union at some point.
4374  *
4375  * 2. Once all referenced type IDs are resolved into canonical ones, BTF type
4376  * becomes "stable", in the sense that no further deduplication will cause
4377  * any changes to it. With that, it's now possible to calculate type's signature
4378  * hash (this time taking into account referenced type IDs) and loop over all
4379  * potential canonical representatives. If no match was found, current type
4380  * will become canonical representative of itself and will be added into
4381  * btf_dedup->dedup_table as another possible canonical representative.
4382  */
4383 static int btf_dedup_ref_type(struct btf_dedup *d, __u32 type_id)
4384 {
4385 	struct hashmap_entry *hash_entry;
4386 	__u32 new_id = type_id, cand_id;
4387 	struct btf_type *t, *cand;
4388 	/* if we don't find equivalent type, then we are representative type */
4389 	int ref_type_id;
4390 	long h;
4391 
4392 	if (d->map[type_id] == BTF_IN_PROGRESS_ID)
4393 		return -ELOOP;
4394 	if (d->map[type_id] <= BTF_MAX_NR_TYPES)
4395 		return resolve_type_id(d, type_id);
4396 
4397 	t = btf_type_by_id(d->btf, type_id);
4398 	d->map[type_id] = BTF_IN_PROGRESS_ID;
4399 
4400 	switch (btf_kind(t)) {
4401 	case BTF_KIND_CONST:
4402 	case BTF_KIND_VOLATILE:
4403 	case BTF_KIND_RESTRICT:
4404 	case BTF_KIND_PTR:
4405 	case BTF_KIND_TYPEDEF:
4406 	case BTF_KIND_FUNC:
4407 	case BTF_KIND_TYPE_TAG:
4408 		ref_type_id = btf_dedup_ref_type(d, t->type);
4409 		if (ref_type_id < 0)
4410 			return ref_type_id;
4411 		t->type = ref_type_id;
4412 
4413 		h = btf_hash_common(t);
4414 		for_each_dedup_cand(d, hash_entry, h) {
4415 			cand_id = hash_entry->value;
4416 			cand = btf_type_by_id(d->btf, cand_id);
4417 			if (btf_equal_common(t, cand)) {
4418 				new_id = cand_id;
4419 				break;
4420 			}
4421 		}
4422 		break;
4423 
4424 	case BTF_KIND_DECL_TAG:
4425 		ref_type_id = btf_dedup_ref_type(d, t->type);
4426 		if (ref_type_id < 0)
4427 			return ref_type_id;
4428 		t->type = ref_type_id;
4429 
4430 		h = btf_hash_int_decl_tag(t);
4431 		for_each_dedup_cand(d, hash_entry, h) {
4432 			cand_id = hash_entry->value;
4433 			cand = btf_type_by_id(d->btf, cand_id);
4434 			if (btf_equal_int_tag(t, cand)) {
4435 				new_id = cand_id;
4436 				break;
4437 			}
4438 		}
4439 		break;
4440 
4441 	case BTF_KIND_ARRAY: {
4442 		struct btf_array *info = btf_array(t);
4443 
4444 		ref_type_id = btf_dedup_ref_type(d, info->type);
4445 		if (ref_type_id < 0)
4446 			return ref_type_id;
4447 		info->type = ref_type_id;
4448 
4449 		ref_type_id = btf_dedup_ref_type(d, info->index_type);
4450 		if (ref_type_id < 0)
4451 			return ref_type_id;
4452 		info->index_type = ref_type_id;
4453 
4454 		h = btf_hash_array(t);
4455 		for_each_dedup_cand(d, hash_entry, h) {
4456 			cand_id = hash_entry->value;
4457 			cand = btf_type_by_id(d->btf, cand_id);
4458 			if (btf_equal_array(t, cand)) {
4459 				new_id = cand_id;
4460 				break;
4461 			}
4462 		}
4463 		break;
4464 	}
4465 
4466 	case BTF_KIND_FUNC_PROTO: {
4467 		struct btf_param *param;
4468 		__u16 vlen;
4469 		int i;
4470 
4471 		ref_type_id = btf_dedup_ref_type(d, t->type);
4472 		if (ref_type_id < 0)
4473 			return ref_type_id;
4474 		t->type = ref_type_id;
4475 
4476 		vlen = btf_vlen(t);
4477 		param = btf_params(t);
4478 		for (i = 0; i < vlen; i++) {
4479 			ref_type_id = btf_dedup_ref_type(d, param->type);
4480 			if (ref_type_id < 0)
4481 				return ref_type_id;
4482 			param->type = ref_type_id;
4483 			param++;
4484 		}
4485 
4486 		h = btf_hash_fnproto(t);
4487 		for_each_dedup_cand(d, hash_entry, h) {
4488 			cand_id = hash_entry->value;
4489 			cand = btf_type_by_id(d->btf, cand_id);
4490 			if (btf_equal_fnproto(t, cand)) {
4491 				new_id = cand_id;
4492 				break;
4493 			}
4494 		}
4495 		break;
4496 	}
4497 
4498 	default:
4499 		return -EINVAL;
4500 	}
4501 
4502 	d->map[type_id] = new_id;
4503 	if (type_id == new_id && btf_dedup_table_add(d, h, type_id))
4504 		return -ENOMEM;
4505 
4506 	return new_id;
4507 }
4508 
4509 static int btf_dedup_ref_types(struct btf_dedup *d)
4510 {
4511 	int i, err;
4512 
4513 	for (i = 0; i < d->btf->nr_types; i++) {
4514 		err = btf_dedup_ref_type(d, d->btf->start_id + i);
4515 		if (err < 0)
4516 			return err;
4517 	}
4518 	/* we won't need d->dedup_table anymore */
4519 	hashmap__free(d->dedup_table);
4520 	d->dedup_table = NULL;
4521 	return 0;
4522 }
4523 
4524 /*
4525  * Collect a map from type names to type ids for all canonical structs
4526  * and unions. If the same name is shared by several canonical types
4527  * use a special value 0 to indicate this fact.
4528  */
4529 static int btf_dedup_fill_unique_names_map(struct btf_dedup *d, struct hashmap *names_map)
4530 {
4531 	__u32 nr_types = btf__type_cnt(d->btf);
4532 	struct btf_type *t;
4533 	__u32 type_id;
4534 	__u16 kind;
4535 	int err;
4536 
4537 	/*
4538 	 * Iterate over base and split module ids in order to get all
4539 	 * available structs in the map.
4540 	 */
4541 	for (type_id = 1; type_id < nr_types; ++type_id) {
4542 		t = btf_type_by_id(d->btf, type_id);
4543 		kind = btf_kind(t);
4544 
4545 		if (kind != BTF_KIND_STRUCT && kind != BTF_KIND_UNION)
4546 			continue;
4547 
4548 		/* Skip non-canonical types */
4549 		if (type_id != d->map[type_id])
4550 			continue;
4551 
4552 		err = hashmap__add(names_map, t->name_off, type_id);
4553 		if (err == -EEXIST)
4554 			err = hashmap__set(names_map, t->name_off, 0, NULL, NULL);
4555 
4556 		if (err)
4557 			return err;
4558 	}
4559 
4560 	return 0;
4561 }
4562 
4563 static int btf_dedup_resolve_fwd(struct btf_dedup *d, struct hashmap *names_map, __u32 type_id)
4564 {
4565 	struct btf_type *t = btf_type_by_id(d->btf, type_id);
4566 	enum btf_fwd_kind fwd_kind = btf_kflag(t);
4567 	__u16 cand_kind, kind = btf_kind(t);
4568 	struct btf_type *cand_t;
4569 	uintptr_t cand_id;
4570 
4571 	if (kind != BTF_KIND_FWD)
4572 		return 0;
4573 
4574 	/* Skip if this FWD already has a mapping */
4575 	if (type_id != d->map[type_id])
4576 		return 0;
4577 
4578 	if (!hashmap__find(names_map, t->name_off, &cand_id))
4579 		return 0;
4580 
4581 	/* Zero is a special value indicating that name is not unique */
4582 	if (!cand_id)
4583 		return 0;
4584 
4585 	cand_t = btf_type_by_id(d->btf, cand_id);
4586 	cand_kind = btf_kind(cand_t);
4587 	if ((cand_kind == BTF_KIND_STRUCT && fwd_kind != BTF_FWD_STRUCT) ||
4588 	    (cand_kind == BTF_KIND_UNION && fwd_kind != BTF_FWD_UNION))
4589 		return 0;
4590 
4591 	d->map[type_id] = cand_id;
4592 
4593 	return 0;
4594 }
4595 
4596 /*
4597  * Resolve unambiguous forward declarations.
4598  *
4599  * The lion's share of all FWD declarations is resolved during
4600  * `btf_dedup_struct_types` phase when different type graphs are
4601  * compared against each other. However, if in some compilation unit a
4602  * FWD declaration is not a part of a type graph compared against
4603  * another type graph that declaration's canonical type would not be
4604  * changed. Example:
4605  *
4606  * CU #1:
4607  *
4608  * struct foo;
4609  * struct foo *some_global;
4610  *
4611  * CU #2:
4612  *
4613  * struct foo { int u; };
4614  * struct foo *another_global;
4615  *
4616  * After `btf_dedup_struct_types` the BTF looks as follows:
4617  *
4618  * [1] STRUCT 'foo' size=4 vlen=1 ...
4619  * [2] INT 'int' size=4 ...
4620  * [3] PTR '(anon)' type_id=1
4621  * [4] FWD 'foo' fwd_kind=struct
4622  * [5] PTR '(anon)' type_id=4
4623  *
 * This pass assumes that such FWD declarations should be mapped to
 * structs or unions with an identical name, provided that the name is
 * not ambiguous.
4627  */
4628 static int btf_dedup_resolve_fwds(struct btf_dedup *d)
4629 {
4630 	int i, err;
4631 	struct hashmap *names_map;
4632 
4633 	names_map = hashmap__new(btf_dedup_identity_hash_fn, btf_dedup_equal_fn, NULL);
4634 	if (IS_ERR(names_map))
4635 		return PTR_ERR(names_map);
4636 
4637 	err = btf_dedup_fill_unique_names_map(d, names_map);
4638 	if (err < 0)
4639 		goto exit;
4640 
4641 	for (i = 0; i < d->btf->nr_types; i++) {
4642 		err = btf_dedup_resolve_fwd(d, names_map, d->btf->start_id + i);
4643 		if (err < 0)
4644 			break;
4645 	}
4646 
4647 exit:
4648 	hashmap__free(names_map);
4649 	return err;
4650 }
4651 
4652 /*
4653  * Compact types.
4654  *
4655  * After we established for each type its corresponding canonical representative
4656  * type, we now can eliminate types that are not canonical and leave only
 * canonical ones laid out sequentially in memory by copying them over
4658  * duplicates. During compaction btf_dedup->hypot_map array is reused to store
4659  * a map from original type ID to a new compacted type ID, which will be used
4660  * during next phase to "fix up" type IDs, referenced from struct/union and
4661  * reference types.
4662  */
4663 static int btf_dedup_compact_types(struct btf_dedup *d)
4664 {
4665 	__u32 *new_offs;
4666 	__u32 next_type_id = d->btf->start_id;
4667 	const struct btf_type *t;
4668 	void *p;
4669 	int i, id, len;
4670 
4671 	/* we are going to reuse hypot_map to store compaction remapping */
4672 	d->hypot_map[0] = 0;
4673 	/* base BTF types are not renumbered */
4674 	for (id = 1; id < d->btf->start_id; id++)
4675 		d->hypot_map[id] = id;
4676 	for (i = 0, id = d->btf->start_id; i < d->btf->nr_types; i++, id++)
4677 		d->hypot_map[id] = BTF_UNPROCESSED_ID;
4678 
4679 	p = d->btf->types_data;
4680 
4681 	for (i = 0, id = d->btf->start_id; i < d->btf->nr_types; i++, id++) {
4682 		if (d->map[id] != id)
4683 			continue;
4684 
4685 		t = btf__type_by_id(d->btf, id);
4686 		len = btf_type_size(t);
4687 		if (len < 0)
4688 			return len;
4689 
4690 		memmove(p, t, len);
4691 		d->hypot_map[id] = next_type_id;
4692 		d->btf->type_offs[next_type_id - d->btf->start_id] = p - d->btf->types_data;
4693 		p += len;
4694 		next_type_id++;
4695 	}
4696 
4697 	/* shrink struct btf's internal types index and update btf_header */
4698 	d->btf->nr_types = next_type_id - d->btf->start_id;
4699 	d->btf->type_offs_cap = d->btf->nr_types;
4700 	d->btf->hdr->type_len = p - d->btf->types_data;
4701 	new_offs = libbpf_reallocarray(d->btf->type_offs, d->btf->type_offs_cap,
4702 				       sizeof(*new_offs));
4703 	if (d->btf->type_offs_cap && !new_offs)
4704 		return -ENOMEM;
4705 	d->btf->type_offs = new_offs;
4706 	d->btf->hdr->str_off = d->btf->hdr->type_len;
4707 	d->btf->raw_size = d->btf->hdr->hdr_len + d->btf->hdr->type_len + d->btf->hdr->str_len;
4708 	return 0;
4709 }
4710 
4711 /*
4712  * Figure out final (deduplicated and compacted) type ID for provided original
4713  * `type_id` by first resolving it into corresponding canonical type ID and
4714  * then mapping it to a deduplicated type ID, stored in btf_dedup->hypot_map,
4715  * which is populated during compaction phase.
4716  */
4717 static int btf_dedup_remap_type_id(__u32 *type_id, void *ctx)
4718 {
4719 	struct btf_dedup *d = ctx;
4720 	__u32 resolved_type_id, new_type_id;
4721 
4722 	resolved_type_id = resolve_type_id(d, *type_id);
4723 	new_type_id = d->hypot_map[resolved_type_id];
4724 	if (new_type_id > BTF_MAX_NR_TYPES)
4725 		return -EINVAL;
4726 
4727 	*type_id = new_type_id;
4728 	return 0;
4729 }
4730 
4731 /*
4732  * Remap referenced type IDs into deduped type IDs.
4733  *
4734  * After BTF types are deduplicated and compacted, their final type IDs may
4735  * differ from original ones. The map from original to a corresponding
4736  * deduped type ID is stored in btf_dedup->hypot_map and is populated during
4737  * compaction phase. During remapping phase we are rewriting all type IDs
4738  * referenced from any BTF type (e.g., struct fields, func proto args, etc) to
4739  * their final deduped type IDs.
4740  */
4741 static int btf_dedup_remap_types(struct btf_dedup *d)
4742 {
4743 	int i, r;
4744 
4745 	for (i = 0; i < d->btf->nr_types; i++) {
4746 		struct btf_type *t = btf_type_by_id(d->btf, d->btf->start_id + i);
4747 
4748 		r = btf_type_visit_type_ids(t, btf_dedup_remap_type_id, d);
4749 		if (r)
4750 			return r;
4751 	}
4752 
4753 	if (!d->btf_ext)
4754 		return 0;
4755 
4756 	r = btf_ext_visit_type_ids(d->btf_ext, btf_dedup_remap_type_id, d);
4757 	if (r)
4758 		return r;
4759 
4760 	return 0;
4761 }
4762 
4763 /*
 * Probe a few well-known locations for vmlinux kernel image and try to load BTF
4765  * data out of it to use for target BTF.
4766  */
4767 struct btf *btf__load_vmlinux_btf(void)
4768 {
4769 	const char *locations[] = {
4770 		/* try canonical vmlinux BTF through sysfs first */
4771 		"/sys/kernel/btf/vmlinux",
4772 		/* fall back to trying to find vmlinux on disk otherwise */
4773 		"/boot/vmlinux-%1$s",
4774 		"/lib/modules/%1$s/vmlinux-%1$s",
4775 		"/lib/modules/%1$s/build/vmlinux",
4776 		"/usr/lib/modules/%1$s/kernel/vmlinux",
4777 		"/usr/lib/debug/boot/vmlinux-%1$s",
4778 		"/usr/lib/debug/boot/vmlinux-%1$s.debug",
4779 		"/usr/lib/debug/lib/modules/%1$s/vmlinux",
4780 	};
4781 	char path[PATH_MAX + 1];
4782 	struct utsname buf;
4783 	struct btf *btf;
4784 	int i, err;
4785 
4786 	uname(&buf);
4787 
4788 	for (i = 0; i < ARRAY_SIZE(locations); i++) {
4789 		snprintf(path, PATH_MAX, locations[i], buf.release);
4790 
4791 		if (faccessat(AT_FDCWD, path, R_OK, AT_EACCESS))
4792 			continue;
4793 
4794 		btf = btf__parse(path, NULL);
4795 		err = libbpf_get_error(btf);
4796 		pr_debug("loading kernel BTF '%s': %d\n", path, err);
4797 		if (err)
4798 			continue;
4799 
4800 		return btf;
4801 	}
4802 
4803 	pr_warn("failed to find valid kernel BTF\n");
4804 	return libbpf_err_ptr(-ESRCH);
4805 }
4806 
4807 struct btf *libbpf_find_kernel_btf(void) __attribute__((alias("btf__load_vmlinux_btf")));
4808 
/*
 * Parse BTF of kernel module `module_name` from /sys/kernel/btf/<module_name>
 * as split BTF on top of `vmlinux_btf`.
 *
 * Returns whatever btf__parse_split() returns for that path. If the path
 * can't be formatted or doesn't fit into the local buffer, nothing is parsed
 * and the error (-EINVAL or -ENAMETOOLONG, respectively) is reported through
 * libbpf_err_ptr(), the same way btf__load_vmlinux_btf() reports -ESRCH.
 */
struct btf *btf__load_module_btf(const char *module_name, struct btf *vmlinux_btf)
{
	char path[80];
	int len;

	len = snprintf(path, sizeof(path), "/sys/kernel/btf/%s", module_name);
	if (len < 0)
		return libbpf_err_ptr(-EINVAL);
	/*
	 * snprintf() returns the length the full string would have had, so
	 * anything >= sizeof(path) means the path got truncated. Don't go
	 * on and parse some other, shorter path in that case.
	 */
	if ((size_t)len >= sizeof(path))
		return libbpf_err_ptr(-ENAMETOOLONG);

	return btf__parse_split(path, vmlinux_btf);
}
4816 
4817 int btf_type_visit_type_ids(struct btf_type *t, type_id_visit_fn visit, void *ctx)
4818 {
4819 	int i, n, err;
4820 
4821 	switch (btf_kind(t)) {
4822 	case BTF_KIND_INT:
4823 	case BTF_KIND_FLOAT:
4824 	case BTF_KIND_ENUM:
4825 	case BTF_KIND_ENUM64:
4826 		return 0;
4827 
4828 	case BTF_KIND_FWD:
4829 	case BTF_KIND_CONST:
4830 	case BTF_KIND_VOLATILE:
4831 	case BTF_KIND_RESTRICT:
4832 	case BTF_KIND_PTR:
4833 	case BTF_KIND_TYPEDEF:
4834 	case BTF_KIND_FUNC:
4835 	case BTF_KIND_VAR:
4836 	case BTF_KIND_DECL_TAG:
4837 	case BTF_KIND_TYPE_TAG:
4838 		return visit(&t->type, ctx);
4839 
4840 	case BTF_KIND_ARRAY: {
4841 		struct btf_array *a = btf_array(t);
4842 
4843 		err = visit(&a->type, ctx);
4844 		err = err ?: visit(&a->index_type, ctx);
4845 		return err;
4846 	}
4847 
4848 	case BTF_KIND_STRUCT:
4849 	case BTF_KIND_UNION: {
4850 		struct btf_member *m = btf_members(t);
4851 
4852 		for (i = 0, n = btf_vlen(t); i < n; i++, m++) {
4853 			err = visit(&m->type, ctx);
4854 			if (err)
4855 				return err;
4856 		}
4857 		return 0;
4858 	}
4859 
4860 	case BTF_KIND_FUNC_PROTO: {
4861 		struct btf_param *m = btf_params(t);
4862 
4863 		err = visit(&t->type, ctx);
4864 		if (err)
4865 			return err;
4866 		for (i = 0, n = btf_vlen(t); i < n; i++, m++) {
4867 			err = visit(&m->type, ctx);
4868 			if (err)
4869 				return err;
4870 		}
4871 		return 0;
4872 	}
4873 
4874 	case BTF_KIND_DATASEC: {
4875 		struct btf_var_secinfo *m = btf_var_secinfos(t);
4876 
4877 		for (i = 0, n = btf_vlen(t); i < n; i++, m++) {
4878 			err = visit(&m->type, ctx);
4879 			if (err)
4880 				return err;
4881 		}
4882 		return 0;
4883 	}
4884 
4885 	default:
4886 		return -EINVAL;
4887 	}
4888 }
4889 
4890 int btf_type_visit_str_offs(struct btf_type *t, str_off_visit_fn visit, void *ctx)
4891 {
4892 	int i, n, err;
4893 
4894 	err = visit(&t->name_off, ctx);
4895 	if (err)
4896 		return err;
4897 
4898 	switch (btf_kind(t)) {
4899 	case BTF_KIND_STRUCT:
4900 	case BTF_KIND_UNION: {
4901 		struct btf_member *m = btf_members(t);
4902 
4903 		for (i = 0, n = btf_vlen(t); i < n; i++, m++) {
4904 			err = visit(&m->name_off, ctx);
4905 			if (err)
4906 				return err;
4907 		}
4908 		break;
4909 	}
4910 	case BTF_KIND_ENUM: {
4911 		struct btf_enum *m = btf_enum(t);
4912 
4913 		for (i = 0, n = btf_vlen(t); i < n; i++, m++) {
4914 			err = visit(&m->name_off, ctx);
4915 			if (err)
4916 				return err;
4917 		}
4918 		break;
4919 	}
4920 	case BTF_KIND_ENUM64: {
4921 		struct btf_enum64 *m = btf_enum64(t);
4922 
4923 		for (i = 0, n = btf_vlen(t); i < n; i++, m++) {
4924 			err = visit(&m->name_off, ctx);
4925 			if (err)
4926 				return err;
4927 		}
4928 		break;
4929 	}
4930 	case BTF_KIND_FUNC_PROTO: {
4931 		struct btf_param *m = btf_params(t);
4932 
4933 		for (i = 0, n = btf_vlen(t); i < n; i++, m++) {
4934 			err = visit(&m->name_off, ctx);
4935 			if (err)
4936 				return err;
4937 		}
4938 		break;
4939 	}
4940 	default:
4941 		break;
4942 	}
4943 
4944 	return 0;
4945 }
4946 
4947 int btf_ext_visit_type_ids(struct btf_ext *btf_ext, type_id_visit_fn visit, void *ctx)
4948 {
4949 	const struct btf_ext_info *seg;
4950 	struct btf_ext_info_sec *sec;
4951 	int i, err;
4952 
4953 	seg = &btf_ext->func_info;
4954 	for_each_btf_ext_sec(seg, sec) {
4955 		struct bpf_func_info_min *rec;
4956 
4957 		for_each_btf_ext_rec(seg, sec, i, rec) {
4958 			err = visit(&rec->type_id, ctx);
4959 			if (err < 0)
4960 				return err;
4961 		}
4962 	}
4963 
4964 	seg = &btf_ext->core_relo_info;
4965 	for_each_btf_ext_sec(seg, sec) {
4966 		struct bpf_core_relo *rec;
4967 
4968 		for_each_btf_ext_rec(seg, sec, i, rec) {
4969 			err = visit(&rec->type_id, ctx);
4970 			if (err < 0)
4971 				return err;
4972 		}
4973 	}
4974 
4975 	return 0;
4976 }
4977 
4978 int btf_ext_visit_str_offs(struct btf_ext *btf_ext, str_off_visit_fn visit, void *ctx)
4979 {
4980 	const struct btf_ext_info *seg;
4981 	struct btf_ext_info_sec *sec;
4982 	int i, err;
4983 
4984 	seg = &btf_ext->func_info;
4985 	for_each_btf_ext_sec(seg, sec) {
4986 		err = visit(&sec->sec_name_off, ctx);
4987 		if (err)
4988 			return err;
4989 	}
4990 
4991 	seg = &btf_ext->line_info;
4992 	for_each_btf_ext_sec(seg, sec) {
4993 		struct bpf_line_info_min *rec;
4994 
4995 		err = visit(&sec->sec_name_off, ctx);
4996 		if (err)
4997 			return err;
4998 
4999 		for_each_btf_ext_rec(seg, sec, i, rec) {
5000 			err = visit(&rec->file_name_off, ctx);
5001 			if (err)
5002 				return err;
5003 			err = visit(&rec->line_off, ctx);
5004 			if (err)
5005 				return err;
5006 		}
5007 	}
5008 
5009 	seg = &btf_ext->core_relo_info;
5010 	for_each_btf_ext_sec(seg, sec) {
5011 		struct bpf_core_relo *rec;
5012 
5013 		err = visit(&sec->sec_name_off, ctx);
5014 		if (err)
5015 			return err;
5016 
5017 		for_each_btf_ext_rec(seg, sec, i, rec) {
5018 			err = visit(&rec->access_str_off, ctx);
5019 			if (err)
5020 				return err;
5021 		}
5022 	}
5023 
5024 	return 0;
5025 }
5026