/* xref: /openbmc/linux/kernel/bpf/map_in_map.c (revision 6c71a0574249f5e5a45fe055ab5f837023d5eeca) */
// SPDX-License-Identifier: GPL-2.0-only
/* Copyright (c) 2017 Facebook
 */
#include <linux/slab.h>
#include <linux/bpf.h>
#include <linux/btf.h>

#include "map_in_map.h"

bpf_map_meta_alloc(int inner_map_ufd)1056f668dfSMartin KaFai Lau struct bpf_map *bpf_map_meta_alloc(int inner_map_ufd)
1156f668dfSMartin KaFai Lau {
1256f668dfSMartin KaFai Lau 	struct bpf_map *inner_map, *inner_map_meta;
139d5564ddSDaniel Borkmann 	u32 inner_map_meta_size;
1456f668dfSMartin KaFai Lau 	struct fd f;
15f73e601aSKumar Kartikeya Dwivedi 	int ret;
1656f668dfSMartin KaFai Lau 
1756f668dfSMartin KaFai Lau 	f = fdget(inner_map_ufd);
1856f668dfSMartin KaFai Lau 	inner_map = __bpf_map_get(f);
1956f668dfSMartin KaFai Lau 	if (IS_ERR(inner_map))
2056f668dfSMartin KaFai Lau 		return inner_map;
2156f668dfSMartin KaFai Lau 
2256f668dfSMartin KaFai Lau 	/* Does not support >1 level map-in-map */
2356f668dfSMartin KaFai Lau 	if (inner_map->inner_map_meta) {
24f73e601aSKumar Kartikeya Dwivedi 		ret = -EINVAL;
25f73e601aSKumar Kartikeya Dwivedi 		goto put;
2656f668dfSMartin KaFai Lau 	}
2756f668dfSMartin KaFai Lau 
28f4d05259SMartin KaFai Lau 	if (!inner_map->ops->map_meta_equal) {
29f73e601aSKumar Kartikeya Dwivedi 		ret = -ENOTSUPP;
30f73e601aSKumar Kartikeya Dwivedi 		goto put;
31f4d05259SMartin KaFai Lau 	}
32f4d05259SMartin KaFai Lau 
339d5564ddSDaniel Borkmann 	inner_map_meta_size = sizeof(*inner_map_meta);
349d5564ddSDaniel Borkmann 	/* In some cases verifier needs to access beyond just base map. */
359d5564ddSDaniel Borkmann 	if (inner_map->ops == &array_map_ops)
369d5564ddSDaniel Borkmann 		inner_map_meta_size = sizeof(struct bpf_array);
379d5564ddSDaniel Borkmann 
389d5564ddSDaniel Borkmann 	inner_map_meta = kzalloc(inner_map_meta_size, GFP_USER);
3956f668dfSMartin KaFai Lau 	if (!inner_map_meta) {
40f73e601aSKumar Kartikeya Dwivedi 		ret = -ENOMEM;
41f73e601aSKumar Kartikeya Dwivedi 		goto put;
4256f668dfSMartin KaFai Lau 	}
4356f668dfSMartin KaFai Lau 
4456f668dfSMartin KaFai Lau 	inner_map_meta->map_type = inner_map->map_type;
4556f668dfSMartin KaFai Lau 	inner_map_meta->key_size = inner_map->key_size;
4656f668dfSMartin KaFai Lau 	inner_map_meta->value_size = inner_map->value_size;
4756f668dfSMartin KaFai Lau 	inner_map_meta->map_flags = inner_map->map_flags;
4856f668dfSMartin KaFai Lau 	inner_map_meta->max_entries = inner_map->max_entries;
49f73e601aSKumar Kartikeya Dwivedi 
50aa3496acSKumar Kartikeya Dwivedi 	inner_map_meta->record = btf_record_dup(inner_map->record);
51aa3496acSKumar Kartikeya Dwivedi 	if (IS_ERR(inner_map_meta->record)) {
52aa3496acSKumar Kartikeya Dwivedi 		/* btf_record_dup returns NULL or valid pointer in case of
53aa3496acSKumar Kartikeya Dwivedi 		 * invalid/empty/valid, but ERR_PTR in case of errors. During
54aa3496acSKumar Kartikeya Dwivedi 		 * equality NULL or IS_ERR is equivalent.
55aa3496acSKumar Kartikeya Dwivedi 		 */
56f73e601aSKumar Kartikeya Dwivedi 		ret = PTR_ERR(inner_map_meta->record);
57f73e601aSKumar Kartikeya Dwivedi 		goto free;
58f73e601aSKumar Kartikeya Dwivedi 	}
59c22dfdd2SKumar Kartikeya Dwivedi 	/* Note: We must use the same BTF, as we also used btf_record_dup above
60c22dfdd2SKumar Kartikeya Dwivedi 	 * which relies on BTF being same for both maps, as some members like
61c22dfdd2SKumar Kartikeya Dwivedi 	 * record->fields.list_head have pointers like value_rec pointing into
62c22dfdd2SKumar Kartikeya Dwivedi 	 * inner_map->btf.
63c22dfdd2SKumar Kartikeya Dwivedi 	 */
6440ec00abSAlexei Starovoitov 	if (inner_map->btf) {
6540ec00abSAlexei Starovoitov 		btf_get(inner_map->btf);
6640ec00abSAlexei Starovoitov 		inner_map_meta->btf = inner_map->btf;
6740ec00abSAlexei Starovoitov 	}
6856f668dfSMartin KaFai Lau 
699d5564ddSDaniel Borkmann 	/* Misc members not needed in bpf_map_meta_equal() check. */
709d5564ddSDaniel Borkmann 	inner_map_meta->ops = inner_map->ops;
719d5564ddSDaniel Borkmann 	if (inner_map->ops == &array_map_ops) {
72cba41bb7SRhys Rustad-Elliott 		struct bpf_array *inner_array_meta =
73cba41bb7SRhys Rustad-Elliott 			container_of(inner_map_meta, struct bpf_array, map);
74cba41bb7SRhys Rustad-Elliott 		struct bpf_array *inner_array = container_of(inner_map, struct bpf_array, map);
75cba41bb7SRhys Rustad-Elliott 
76cba41bb7SRhys Rustad-Elliott 		inner_array_meta->index_mask = inner_array->index_mask;
77cba41bb7SRhys Rustad-Elliott 		inner_array_meta->elem_size = inner_array->elem_size;
782c78ee89SAlexei Starovoitov 		inner_map_meta->bypass_spec_v1 = inner_map->bypass_spec_v1;
799d5564ddSDaniel Borkmann 	}
809d5564ddSDaniel Borkmann 
8156f668dfSMartin KaFai Lau 	fdput(f);
8256f668dfSMartin KaFai Lau 	return inner_map_meta;
83f73e601aSKumar Kartikeya Dwivedi free:
84f73e601aSKumar Kartikeya Dwivedi 	kfree(inner_map_meta);
85f73e601aSKumar Kartikeya Dwivedi put:
86f73e601aSKumar Kartikeya Dwivedi 	fdput(f);
87f73e601aSKumar Kartikeya Dwivedi 	return ERR_PTR(ret);
8856f668dfSMartin KaFai Lau }
8956f668dfSMartin KaFai Lau 
bpf_map_meta_free(struct bpf_map * map_meta)9056f668dfSMartin KaFai Lau void bpf_map_meta_free(struct bpf_map *map_meta)
9156f668dfSMartin KaFai Lau {
92aa3496acSKumar Kartikeya Dwivedi 	bpf_map_free_record(map_meta);
9340ec00abSAlexei Starovoitov 	btf_put(map_meta->btf);
9456f668dfSMartin KaFai Lau 	kfree(map_meta);
9556f668dfSMartin KaFai Lau }
9656f668dfSMartin KaFai Lau 
bpf_map_meta_equal(const struct bpf_map * meta0,const struct bpf_map * meta1)9756f668dfSMartin KaFai Lau bool bpf_map_meta_equal(const struct bpf_map *meta0,
9856f668dfSMartin KaFai Lau 			const struct bpf_map *meta1)
9956f668dfSMartin KaFai Lau {
10056f668dfSMartin KaFai Lau 	/* No need to compare ops because it is covered by map_type */
10156f668dfSMartin KaFai Lau 	return meta0->map_type == meta1->map_type &&
10256f668dfSMartin KaFai Lau 		meta0->key_size == meta1->key_size &&
10356f668dfSMartin KaFai Lau 		meta0->value_size == meta1->value_size &&
10461df10c7SKumar Kartikeya Dwivedi 		meta0->map_flags == meta1->map_flags &&
105aa3496acSKumar Kartikeya Dwivedi 		btf_record_equal(meta0->record, meta1->record);
10656f668dfSMartin KaFai Lau }
10756f668dfSMartin KaFai Lau 
bpf_map_fd_get_ptr(struct bpf_map * map,struct file * map_file,int ufd)10856f668dfSMartin KaFai Lau void *bpf_map_fd_get_ptr(struct bpf_map *map,
10956f668dfSMartin KaFai Lau 			 struct file *map_file /* not used */,
11056f668dfSMartin KaFai Lau 			 int ufd)
11156f668dfSMartin KaFai Lau {
112f4d05259SMartin KaFai Lau 	struct bpf_map *inner_map, *inner_map_meta;
11356f668dfSMartin KaFai Lau 	struct fd f;
11456f668dfSMartin KaFai Lau 
11556f668dfSMartin KaFai Lau 	f = fdget(ufd);
11656f668dfSMartin KaFai Lau 	inner_map = __bpf_map_get(f);
11756f668dfSMartin KaFai Lau 	if (IS_ERR(inner_map))
11856f668dfSMartin KaFai Lau 		return inner_map;
11956f668dfSMartin KaFai Lau 
120f4d05259SMartin KaFai Lau 	inner_map_meta = map->inner_map_meta;
121f4d05259SMartin KaFai Lau 	if (inner_map_meta->ops->map_meta_equal(inner_map_meta, inner_map))
1221e0bd5a0SAndrii Nakryiko 		bpf_map_inc(inner_map);
12356f668dfSMartin KaFai Lau 	else
12456f668dfSMartin KaFai Lau 		inner_map = ERR_PTR(-EINVAL);
12556f668dfSMartin KaFai Lau 
12656f668dfSMartin KaFai Lau 	fdput(f);
12756f668dfSMartin KaFai Lau 	return inner_map;
12856f668dfSMartin KaFai Lau }
12956f668dfSMartin KaFai Lau 
/* Drop the reference on the inner map @ptr that was held by outer map @map.
 *
 * When @need_defer is true, one of two flags is set on the inner map before
 * the reference is dropped: free_after_mult_rcu_gp if the outer map's
 * sleepable_refcnt is non-zero, free_after_rcu_gp otherwise. When
 * @need_defer is false neither flag is touched.
 */
void bpf_map_fd_put_ptr(struct bpf_map *map, void *ptr, bool need_defer)
{
	struct bpf_map *inner_map = ptr;

	/* Defer the freeing of inner map according to the sleepable attribute
	 * of bpf program which owns the outer map, so unnecessary waiting for
	 * RCU tasks trace grace period can be avoided.
	 */
	if (need_defer) {
		if (atomic64_read(&map->sleepable_refcnt))
			WRITE_ONCE(inner_map->free_after_mult_rcu_gp, true);
		else
			WRITE_ONCE(inner_map->free_after_rcu_gp, true);
	}
	bpf_map_put(inner_map);
}

bpf_map_fd_sys_lookup_elem(void * ptr)14714dc6f04SMartin KaFai Lau u32 bpf_map_fd_sys_lookup_elem(void *ptr)
14814dc6f04SMartin KaFai Lau {
14914dc6f04SMartin KaFai Lau 	return ((struct bpf_map *)ptr)->id;
15014dc6f04SMartin KaFai Lau }
151