xref: /openbmc/linux/kernel/bpf/offload.c (revision 6dc18fa6f4cad69c892d6fb9499f7e41c6a88a8e)
/*
 * Copyright (C) 2017-2018 Netronome Systems, Inc.
 *
 * This software is licensed under the GNU General Public License Version 2,
 * June 1991 as shown in the file COPYING in the top-level directory of this
 * source tree.
 *
 * THE COPYRIGHT HOLDERS AND/OR OTHER PARTIES PROVIDE THE PROGRAM "AS IS"
 * WITHOUT WARRANTY OF ANY KIND, EITHER EXPRESSED OR IMPLIED, INCLUDING,
 * BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS
 * FOR A PARTICULAR PURPOSE. THE ENTIRE RISK AS TO THE QUALITY AND PERFORMANCE
 * OF THE PROGRAM IS WITH YOU. SHOULD THE PROGRAM PROVE DEFECTIVE, YOU ASSUME
 * THE COST OF ALL NECESSARY SERVICING, REPAIR OR CORRECTION.
 */
15a39e17b2SJakub Kicinski 
16ab3f0063SJakub Kicinski #include <linux/bpf.h>
17ab3f0063SJakub Kicinski #include <linux/bpf_verifier.h>
18ab3f0063SJakub Kicinski #include <linux/bug.h>
19675fc275SJakub Kicinski #include <linux/kdev_t.h>
20ab3f0063SJakub Kicinski #include <linux/list.h>
219fd7c555SJakub Kicinski #include <linux/lockdep.h>
22ab3f0063SJakub Kicinski #include <linux/netdevice.h>
23ab3f0063SJakub Kicinski #include <linux/printk.h>
24675fc275SJakub Kicinski #include <linux/proc_ns.h>
259fd7c555SJakub Kicinski #include <linux/rhashtable.h>
26ab3f0063SJakub Kicinski #include <linux/rtnetlink.h>
27e0d3974aSJakub Kicinski #include <linux/rwsem.h>
28ab3f0063SJakub Kicinski 
/* Guards the offdevs table, every field of struct bpf_offload_netdev and
 * the offload state attached to each program.
 *
 * Lock ordering: RTNL must never be acquired while this semaphore is held.
 */
static DECLARE_RWSEM(bpf_devs_lock);
349fd7c555SJakub Kicinski 
35602144c2SJakub Kicinski struct bpf_offload_dev {
361385d755SQuentin Monnet 	const struct bpf_prog_offload_ops *ops;
37602144c2SJakub Kicinski 	struct list_head netdevs;
38602144c2SJakub Kicinski };
39602144c2SJakub Kicinski 
409fd7c555SJakub Kicinski struct bpf_offload_netdev {
419fd7c555SJakub Kicinski 	struct rhash_head l;
429fd7c555SJakub Kicinski 	struct net_device *netdev;
43602144c2SJakub Kicinski 	struct bpf_offload_dev *offdev;
449fd7c555SJakub Kicinski 	struct list_head progs;
459fd7c555SJakub Kicinski 	struct list_head maps;
46602144c2SJakub Kicinski 	struct list_head offdev_netdevs;
479fd7c555SJakub Kicinski };
489fd7c555SJakub Kicinski 
499fd7c555SJakub Kicinski static const struct rhashtable_params offdevs_params = {
509fd7c555SJakub Kicinski 	.nelem_hint		= 4,
519fd7c555SJakub Kicinski 	.key_len		= sizeof(struct net_device *),
529fd7c555SJakub Kicinski 	.key_offset		= offsetof(struct bpf_offload_netdev, netdev),
539fd7c555SJakub Kicinski 	.head_offset		= offsetof(struct bpf_offload_netdev, l),
549fd7c555SJakub Kicinski 	.automatic_shrinking	= true,
559fd7c555SJakub Kicinski };
569fd7c555SJakub Kicinski 
579fd7c555SJakub Kicinski static struct rhashtable offdevs;
589fd7c555SJakub Kicinski static bool offdevs_inited;
59ab3f0063SJakub Kicinski 
605bc2d55cSJakub Kicinski static int bpf_dev_offload_check(struct net_device *netdev)
615bc2d55cSJakub Kicinski {
625bc2d55cSJakub Kicinski 	if (!netdev)
635bc2d55cSJakub Kicinski 		return -EINVAL;
645bc2d55cSJakub Kicinski 	if (!netdev->netdev_ops->ndo_bpf)
655bc2d55cSJakub Kicinski 		return -EOPNOTSUPP;
665bc2d55cSJakub Kicinski 	return 0;
675bc2d55cSJakub Kicinski }
685bc2d55cSJakub Kicinski 
699fd7c555SJakub Kicinski static struct bpf_offload_netdev *
709fd7c555SJakub Kicinski bpf_offload_find_netdev(struct net_device *netdev)
719fd7c555SJakub Kicinski {
729fd7c555SJakub Kicinski 	lockdep_assert_held(&bpf_devs_lock);
739fd7c555SJakub Kicinski 
749fd7c555SJakub Kicinski 	if (!offdevs_inited)
759fd7c555SJakub Kicinski 		return NULL;
769fd7c555SJakub Kicinski 	return rhashtable_lookup_fast(&offdevs, &netdev, offdevs_params);
779fd7c555SJakub Kicinski }
789fd7c555SJakub Kicinski 
79ab3f0063SJakub Kicinski int bpf_prog_offload_init(struct bpf_prog *prog, union bpf_attr *attr)
80ab3f0063SJakub Kicinski {
819fd7c555SJakub Kicinski 	struct bpf_offload_netdev *ondev;
820a9c1991SJakub Kicinski 	struct bpf_prog_offload *offload;
835bc2d55cSJakub Kicinski 	int err;
84ab3f0063SJakub Kicinski 
85649f11dcSJakub Kicinski 	if (attr->prog_type != BPF_PROG_TYPE_SCHED_CLS &&
86649f11dcSJakub Kicinski 	    attr->prog_type != BPF_PROG_TYPE_XDP)
87649f11dcSJakub Kicinski 		return -EINVAL;
88ab3f0063SJakub Kicinski 
89ab3f0063SJakub Kicinski 	if (attr->prog_flags)
90ab3f0063SJakub Kicinski 		return -EINVAL;
91ab3f0063SJakub Kicinski 
92ab3f0063SJakub Kicinski 	offload = kzalloc(sizeof(*offload), GFP_USER);
93ab3f0063SJakub Kicinski 	if (!offload)
94ab3f0063SJakub Kicinski 		return -ENOMEM;
95ab3f0063SJakub Kicinski 
96ab3f0063SJakub Kicinski 	offload->prog = prog;
97ab3f0063SJakub Kicinski 
98e0d3974aSJakub Kicinski 	offload->netdev = dev_get_by_index(current->nsproxy->net_ns,
99e0d3974aSJakub Kicinski 					   attr->prog_ifindex);
1005bc2d55cSJakub Kicinski 	err = bpf_dev_offload_check(offload->netdev);
1015bc2d55cSJakub Kicinski 	if (err)
1025bc2d55cSJakub Kicinski 		goto err_maybe_put;
103ab3f0063SJakub Kicinski 
104e0d3974aSJakub Kicinski 	down_write(&bpf_devs_lock);
1059fd7c555SJakub Kicinski 	ondev = bpf_offload_find_netdev(offload->netdev);
1069fd7c555SJakub Kicinski 	if (!ondev) {
1075bc2d55cSJakub Kicinski 		err = -EINVAL;
108e0d3974aSJakub Kicinski 		goto err_unlock;
1095bc2d55cSJakub Kicinski 	}
110341b3e7bSQuentin Monnet 	offload->offdev = ondev->offdev;
111ab3f0063SJakub Kicinski 	prog->aux->offload = offload;
1129fd7c555SJakub Kicinski 	list_add_tail(&offload->offloads, &ondev->progs);
113e0d3974aSJakub Kicinski 	dev_put(offload->netdev);
114e0d3974aSJakub Kicinski 	up_write(&bpf_devs_lock);
115ab3f0063SJakub Kicinski 
116ab3f0063SJakub Kicinski 	return 0;
117e0d3974aSJakub Kicinski err_unlock:
118e0d3974aSJakub Kicinski 	up_write(&bpf_devs_lock);
1195bc2d55cSJakub Kicinski err_maybe_put:
1205bc2d55cSJakub Kicinski 	if (offload->netdev)
121e0d3974aSJakub Kicinski 		dev_put(offload->netdev);
122e0d3974aSJakub Kicinski 	kfree(offload);
1235bc2d55cSJakub Kicinski 	return err;
124ab3f0063SJakub Kicinski }
125ab3f0063SJakub Kicinski 
126ab3f0063SJakub Kicinski static int __bpf_offload_ndo(struct bpf_prog *prog, enum bpf_netdev_command cmd,
127ab3f0063SJakub Kicinski 			     struct netdev_bpf *data)
128ab3f0063SJakub Kicinski {
1290a9c1991SJakub Kicinski 	struct bpf_prog_offload *offload = prog->aux->offload;
130ce3b9db4SJakub Kicinski 	struct net_device *netdev;
131ab3f0063SJakub Kicinski 
132ab3f0063SJakub Kicinski 	ASSERT_RTNL();
133ab3f0063SJakub Kicinski 
134ce3b9db4SJakub Kicinski 	if (!offload)
135ab3f0063SJakub Kicinski 		return -ENODEV;
136ce3b9db4SJakub Kicinski 	netdev = offload->netdev;
137ab3f0063SJakub Kicinski 
138ab3f0063SJakub Kicinski 	data->command = cmd;
139ab3f0063SJakub Kicinski 
140ab3f0063SJakub Kicinski 	return netdev->netdev_ops->ndo_bpf(netdev, data);
141ab3f0063SJakub Kicinski }
142ab3f0063SJakub Kicinski 
143ab3f0063SJakub Kicinski int bpf_prog_offload_verifier_prep(struct bpf_verifier_env *env)
144ab3f0063SJakub Kicinski {
145ab3f0063SJakub Kicinski 	struct netdev_bpf data = {};
146ab3f0063SJakub Kicinski 	int err;
147ab3f0063SJakub Kicinski 
148ab3f0063SJakub Kicinski 	data.verifier.prog = env->prog;
149ab3f0063SJakub Kicinski 
150ab3f0063SJakub Kicinski 	rtnl_lock();
151ab3f0063SJakub Kicinski 	err = __bpf_offload_ndo(env->prog, BPF_OFFLOAD_VERIFIER_PREP, &data);
152ab3f0063SJakub Kicinski 	if (err)
153ab3f0063SJakub Kicinski 		goto exit_unlock;
154ab3f0063SJakub Kicinski 
155cae1927cSJakub Kicinski 	env->prog->aux->offload->dev_ops = data.verifier.ops;
156ab3f0063SJakub Kicinski 	env->prog->aux->offload->dev_state = true;
157ab3f0063SJakub Kicinski exit_unlock:
158ab3f0063SJakub Kicinski 	rtnl_unlock();
159ab3f0063SJakub Kicinski 	return err;
160ab3f0063SJakub Kicinski }
161ab3f0063SJakub Kicinski 
162cae1927cSJakub Kicinski int bpf_prog_offload_verify_insn(struct bpf_verifier_env *env,
163cae1927cSJakub Kicinski 				 int insn_idx, int prev_insn_idx)
164cae1927cSJakub Kicinski {
1650a9c1991SJakub Kicinski 	struct bpf_prog_offload *offload;
166cae1927cSJakub Kicinski 	int ret = -ENODEV;
167cae1927cSJakub Kicinski 
168cae1927cSJakub Kicinski 	down_read(&bpf_devs_lock);
169cae1927cSJakub Kicinski 	offload = env->prog->aux->offload;
170ce3b9db4SJakub Kicinski 	if (offload)
171341b3e7bSQuentin Monnet 		ret = offload->offdev->ops->insn_hook(env, insn_idx,
172341b3e7bSQuentin Monnet 						      prev_insn_idx);
173cae1927cSJakub Kicinski 	up_read(&bpf_devs_lock);
174cae1927cSJakub Kicinski 
175cae1927cSJakub Kicinski 	return ret;
176cae1927cSJakub Kicinski }
177cae1927cSJakub Kicinski 
178c941ce9cSQuentin Monnet int bpf_prog_offload_finalize(struct bpf_verifier_env *env)
179c941ce9cSQuentin Monnet {
180c941ce9cSQuentin Monnet 	struct bpf_prog_offload *offload;
181c941ce9cSQuentin Monnet 	int ret = -ENODEV;
182c941ce9cSQuentin Monnet 
183c941ce9cSQuentin Monnet 	down_read(&bpf_devs_lock);
184c941ce9cSQuentin Monnet 	offload = env->prog->aux->offload;
185c941ce9cSQuentin Monnet 	if (offload) {
186*6dc18fa6SQuentin Monnet 		if (offload->offdev->ops->finalize)
187*6dc18fa6SQuentin Monnet 			ret = offload->offdev->ops->finalize(env);
188c941ce9cSQuentin Monnet 		else
189c941ce9cSQuentin Monnet 			ret = 0;
190c941ce9cSQuentin Monnet 	}
191c941ce9cSQuentin Monnet 	up_read(&bpf_devs_lock);
192c941ce9cSQuentin Monnet 
193c941ce9cSQuentin Monnet 	return ret;
194c941ce9cSQuentin Monnet }
195c941ce9cSQuentin Monnet 
196ab3f0063SJakub Kicinski static void __bpf_prog_offload_destroy(struct bpf_prog *prog)
197ab3f0063SJakub Kicinski {
1980a9c1991SJakub Kicinski 	struct bpf_prog_offload *offload = prog->aux->offload;
199ab3f0063SJakub Kicinski 	struct netdev_bpf data = {};
200ab3f0063SJakub Kicinski 
201ab3f0063SJakub Kicinski 	data.offload.prog = prog;
202ab3f0063SJakub Kicinski 
203ab3f0063SJakub Kicinski 	if (offload->dev_state)
204ab3f0063SJakub Kicinski 		WARN_ON(__bpf_offload_ndo(prog, BPF_OFFLOAD_DESTROY, &data));
205ab3f0063SJakub Kicinski 
206ad8ad79fSJakub Kicinski 	/* Make sure BPF_PROG_GET_NEXT_ID can't find this dead program */
207ad8ad79fSJakub Kicinski 	bpf_prog_free_id(prog, true);
208ad8ad79fSJakub Kicinski 
209ab3f0063SJakub Kicinski 	list_del_init(&offload->offloads);
210ce3b9db4SJakub Kicinski 	kfree(offload);
211ce3b9db4SJakub Kicinski 	prog->aux->offload = NULL;
212ab3f0063SJakub Kicinski }
213ab3f0063SJakub Kicinski 
214ab3f0063SJakub Kicinski void bpf_prog_offload_destroy(struct bpf_prog *prog)
215ab3f0063SJakub Kicinski {
216ab3f0063SJakub Kicinski 	rtnl_lock();
217e0d3974aSJakub Kicinski 	down_write(&bpf_devs_lock);
218ce3b9db4SJakub Kicinski 	if (prog->aux->offload)
219ab3f0063SJakub Kicinski 		__bpf_prog_offload_destroy(prog);
220e0d3974aSJakub Kicinski 	up_write(&bpf_devs_lock);
221ab3f0063SJakub Kicinski 	rtnl_unlock();
222ab3f0063SJakub Kicinski }
223ab3f0063SJakub Kicinski 
224ab3f0063SJakub Kicinski static int bpf_prog_offload_translate(struct bpf_prog *prog)
225ab3f0063SJakub Kicinski {
226ab3f0063SJakub Kicinski 	struct netdev_bpf data = {};
227ab3f0063SJakub Kicinski 	int ret;
228ab3f0063SJakub Kicinski 
229ab3f0063SJakub Kicinski 	data.offload.prog = prog;
230ab3f0063SJakub Kicinski 
231ab3f0063SJakub Kicinski 	rtnl_lock();
232ab3f0063SJakub Kicinski 	ret = __bpf_offload_ndo(prog, BPF_OFFLOAD_TRANSLATE, &data);
233ab3f0063SJakub Kicinski 	rtnl_unlock();
234ab3f0063SJakub Kicinski 
235ab3f0063SJakub Kicinski 	return ret;
236ab3f0063SJakub Kicinski }
237ab3f0063SJakub Kicinski 
/* Placeholder bpf_func for offloaded programs: always warns and returns 0.
 * Both arguments are ignored.
 */
static unsigned int bpf_prog_warn_on_exec(const void *ctx,
					  const struct bpf_insn *insn)
{
	WARN(1, "attempt to execute device eBPF program on the host!");

	return 0;
}
244ab3f0063SJakub Kicinski 
245ab3f0063SJakub Kicinski int bpf_prog_offload_compile(struct bpf_prog *prog)
246ab3f0063SJakub Kicinski {
247ab3f0063SJakub Kicinski 	prog->bpf_func = bpf_prog_warn_on_exec;
248ab3f0063SJakub Kicinski 
249ab3f0063SJakub Kicinski 	return bpf_prog_offload_translate(prog);
250ab3f0063SJakub Kicinski }
251ab3f0063SJakub Kicinski 
/* Argument bundle passed to bpf_prog_offload_info_fill_ns(). */
struct ns_get_path_bpf_prog_args {
	/* Program whose offload netdev is inspected. */
	struct bpf_prog *prog;
	/* Info structure whose ifindex field gets filled in. */
	struct bpf_prog_info *info;
};
256675fc275SJakub Kicinski 
257675fc275SJakub Kicinski static struct ns_common *bpf_prog_offload_info_fill_ns(void *private_data)
258675fc275SJakub Kicinski {
259675fc275SJakub Kicinski 	struct ns_get_path_bpf_prog_args *args = private_data;
260675fc275SJakub Kicinski 	struct bpf_prog_aux *aux = args->prog->aux;
261675fc275SJakub Kicinski 	struct ns_common *ns;
262675fc275SJakub Kicinski 	struct net *net;
263675fc275SJakub Kicinski 
264675fc275SJakub Kicinski 	rtnl_lock();
265675fc275SJakub Kicinski 	down_read(&bpf_devs_lock);
266675fc275SJakub Kicinski 
267675fc275SJakub Kicinski 	if (aux->offload) {
268675fc275SJakub Kicinski 		args->info->ifindex = aux->offload->netdev->ifindex;
269675fc275SJakub Kicinski 		net = dev_net(aux->offload->netdev);
270675fc275SJakub Kicinski 		get_net(net);
271675fc275SJakub Kicinski 		ns = &net->ns;
272675fc275SJakub Kicinski 	} else {
273675fc275SJakub Kicinski 		args->info->ifindex = 0;
274675fc275SJakub Kicinski 		ns = NULL;
275675fc275SJakub Kicinski 	}
276675fc275SJakub Kicinski 
277675fc275SJakub Kicinski 	up_read(&bpf_devs_lock);
278675fc275SJakub Kicinski 	rtnl_unlock();
279675fc275SJakub Kicinski 
280675fc275SJakub Kicinski 	return ns;
281675fc275SJakub Kicinski }
282675fc275SJakub Kicinski 
283675fc275SJakub Kicinski int bpf_prog_offload_info_fill(struct bpf_prog_info *info,
284675fc275SJakub Kicinski 			       struct bpf_prog *prog)
285675fc275SJakub Kicinski {
286675fc275SJakub Kicinski 	struct ns_get_path_bpf_prog_args args = {
287675fc275SJakub Kicinski 		.prog	= prog,
288675fc275SJakub Kicinski 		.info	= info,
289675fc275SJakub Kicinski 	};
290fcfb126dSJiong Wang 	struct bpf_prog_aux *aux = prog->aux;
291675fc275SJakub Kicinski 	struct inode *ns_inode;
292675fc275SJakub Kicinski 	struct path ns_path;
293fcfb126dSJiong Wang 	char __user *uinsns;
294675fc275SJakub Kicinski 	void *res;
295fcfb126dSJiong Wang 	u32 ulen;
296675fc275SJakub Kicinski 
297675fc275SJakub Kicinski 	res = ns_get_path_cb(&ns_path, bpf_prog_offload_info_fill_ns, &args);
298675fc275SJakub Kicinski 	if (IS_ERR(res)) {
299675fc275SJakub Kicinski 		if (!info->ifindex)
300675fc275SJakub Kicinski 			return -ENODEV;
301675fc275SJakub Kicinski 		return PTR_ERR(res);
302675fc275SJakub Kicinski 	}
303675fc275SJakub Kicinski 
304fcfb126dSJiong Wang 	down_read(&bpf_devs_lock);
305fcfb126dSJiong Wang 
306fcfb126dSJiong Wang 	if (!aux->offload) {
307fcfb126dSJiong Wang 		up_read(&bpf_devs_lock);
308fcfb126dSJiong Wang 		return -ENODEV;
309fcfb126dSJiong Wang 	}
310fcfb126dSJiong Wang 
311fcfb126dSJiong Wang 	ulen = info->jited_prog_len;
312fcfb126dSJiong Wang 	info->jited_prog_len = aux->offload->jited_len;
313fcfb126dSJiong Wang 	if (info->jited_prog_len & ulen) {
314fcfb126dSJiong Wang 		uinsns = u64_to_user_ptr(info->jited_prog_insns);
315fcfb126dSJiong Wang 		ulen = min_t(u32, info->jited_prog_len, ulen);
316fcfb126dSJiong Wang 		if (copy_to_user(uinsns, aux->offload->jited_image, ulen)) {
317fcfb126dSJiong Wang 			up_read(&bpf_devs_lock);
318fcfb126dSJiong Wang 			return -EFAULT;
319fcfb126dSJiong Wang 		}
320fcfb126dSJiong Wang 	}
321fcfb126dSJiong Wang 
322fcfb126dSJiong Wang 	up_read(&bpf_devs_lock);
323fcfb126dSJiong Wang 
324675fc275SJakub Kicinski 	ns_inode = ns_path.dentry->d_inode;
325675fc275SJakub Kicinski 	info->netns_dev = new_encode_dev(ns_inode->i_sb->s_dev);
326675fc275SJakub Kicinski 	info->netns_ino = ns_inode->i_ino;
327675fc275SJakub Kicinski 	path_put(&ns_path);
328675fc275SJakub Kicinski 
329675fc275SJakub Kicinski 	return 0;
330675fc275SJakub Kicinski }
331675fc275SJakub Kicinski 
332ab3f0063SJakub Kicinski const struct bpf_prog_ops bpf_offload_prog_ops = {
333ab3f0063SJakub Kicinski };
334ab3f0063SJakub Kicinski 
335a3884572SJakub Kicinski static int bpf_map_offload_ndo(struct bpf_offloaded_map *offmap,
336a3884572SJakub Kicinski 			       enum bpf_netdev_command cmd)
337a3884572SJakub Kicinski {
338a3884572SJakub Kicinski 	struct netdev_bpf data = {};
339a3884572SJakub Kicinski 	struct net_device *netdev;
340a3884572SJakub Kicinski 
341a3884572SJakub Kicinski 	ASSERT_RTNL();
342a3884572SJakub Kicinski 
343a3884572SJakub Kicinski 	data.command = cmd;
344a3884572SJakub Kicinski 	data.offmap = offmap;
345a3884572SJakub Kicinski 	/* Caller must make sure netdev is valid */
346a3884572SJakub Kicinski 	netdev = offmap->netdev;
347a3884572SJakub Kicinski 
348a3884572SJakub Kicinski 	return netdev->netdev_ops->ndo_bpf(netdev, &data);
349a3884572SJakub Kicinski }
350a3884572SJakub Kicinski 
351a3884572SJakub Kicinski struct bpf_map *bpf_map_offload_map_alloc(union bpf_attr *attr)
352a3884572SJakub Kicinski {
353a3884572SJakub Kicinski 	struct net *net = current->nsproxy->net_ns;
3549fd7c555SJakub Kicinski 	struct bpf_offload_netdev *ondev;
355a3884572SJakub Kicinski 	struct bpf_offloaded_map *offmap;
356a3884572SJakub Kicinski 	int err;
357a3884572SJakub Kicinski 
358a3884572SJakub Kicinski 	if (!capable(CAP_SYS_ADMIN))
359a3884572SJakub Kicinski 		return ERR_PTR(-EPERM);
3607a0ef693SJakub Kicinski 	if (attr->map_type != BPF_MAP_TYPE_ARRAY &&
3617a0ef693SJakub Kicinski 	    attr->map_type != BPF_MAP_TYPE_HASH)
362a3884572SJakub Kicinski 		return ERR_PTR(-EINVAL);
363a3884572SJakub Kicinski 
364a3884572SJakub Kicinski 	offmap = kzalloc(sizeof(*offmap), GFP_USER);
365a3884572SJakub Kicinski 	if (!offmap)
366a3884572SJakub Kicinski 		return ERR_PTR(-ENOMEM);
367a3884572SJakub Kicinski 
368a3884572SJakub Kicinski 	bpf_map_init_from_attr(&offmap->map, attr);
369a3884572SJakub Kicinski 
370a3884572SJakub Kicinski 	rtnl_lock();
371a3884572SJakub Kicinski 	down_write(&bpf_devs_lock);
372a3884572SJakub Kicinski 	offmap->netdev = __dev_get_by_index(net, attr->map_ifindex);
373a3884572SJakub Kicinski 	err = bpf_dev_offload_check(offmap->netdev);
374a3884572SJakub Kicinski 	if (err)
375a3884572SJakub Kicinski 		goto err_unlock;
376a3884572SJakub Kicinski 
3779fd7c555SJakub Kicinski 	ondev = bpf_offload_find_netdev(offmap->netdev);
3789fd7c555SJakub Kicinski 	if (!ondev) {
3799fd7c555SJakub Kicinski 		err = -EINVAL;
3809fd7c555SJakub Kicinski 		goto err_unlock;
3819fd7c555SJakub Kicinski 	}
3829fd7c555SJakub Kicinski 
383a3884572SJakub Kicinski 	err = bpf_map_offload_ndo(offmap, BPF_OFFLOAD_MAP_ALLOC);
384a3884572SJakub Kicinski 	if (err)
385a3884572SJakub Kicinski 		goto err_unlock;
386a3884572SJakub Kicinski 
3879fd7c555SJakub Kicinski 	list_add_tail(&offmap->offloads, &ondev->maps);
388a3884572SJakub Kicinski 	up_write(&bpf_devs_lock);
389a3884572SJakub Kicinski 	rtnl_unlock();
390a3884572SJakub Kicinski 
391a3884572SJakub Kicinski 	return &offmap->map;
392a3884572SJakub Kicinski 
393a3884572SJakub Kicinski err_unlock:
394a3884572SJakub Kicinski 	up_write(&bpf_devs_lock);
395a3884572SJakub Kicinski 	rtnl_unlock();
396a3884572SJakub Kicinski 	kfree(offmap);
397a3884572SJakub Kicinski 	return ERR_PTR(err);
398a3884572SJakub Kicinski }
399a3884572SJakub Kicinski 
400a3884572SJakub Kicinski static void __bpf_map_offload_destroy(struct bpf_offloaded_map *offmap)
401a3884572SJakub Kicinski {
402a3884572SJakub Kicinski 	WARN_ON(bpf_map_offload_ndo(offmap, BPF_OFFLOAD_MAP_FREE));
403a3884572SJakub Kicinski 	/* Make sure BPF_MAP_GET_NEXT_ID can't find this dead map */
404a3884572SJakub Kicinski 	bpf_map_free_id(&offmap->map, true);
405a3884572SJakub Kicinski 	list_del_init(&offmap->offloads);
406a3884572SJakub Kicinski 	offmap->netdev = NULL;
407a3884572SJakub Kicinski }
408a3884572SJakub Kicinski 
409a3884572SJakub Kicinski void bpf_map_offload_map_free(struct bpf_map *map)
410a3884572SJakub Kicinski {
411a3884572SJakub Kicinski 	struct bpf_offloaded_map *offmap = map_to_offmap(map);
412a3884572SJakub Kicinski 
413a3884572SJakub Kicinski 	rtnl_lock();
414a3884572SJakub Kicinski 	down_write(&bpf_devs_lock);
415a3884572SJakub Kicinski 	if (offmap->netdev)
416a3884572SJakub Kicinski 		__bpf_map_offload_destroy(offmap);
417a3884572SJakub Kicinski 	up_write(&bpf_devs_lock);
418a3884572SJakub Kicinski 	rtnl_unlock();
419a3884572SJakub Kicinski 
420a3884572SJakub Kicinski 	kfree(offmap);
421a3884572SJakub Kicinski }
422a3884572SJakub Kicinski 
423a3884572SJakub Kicinski int bpf_map_offload_lookup_elem(struct bpf_map *map, void *key, void *value)
424a3884572SJakub Kicinski {
425a3884572SJakub Kicinski 	struct bpf_offloaded_map *offmap = map_to_offmap(map);
426a3884572SJakub Kicinski 	int ret = -ENODEV;
427a3884572SJakub Kicinski 
428a3884572SJakub Kicinski 	down_read(&bpf_devs_lock);
429a3884572SJakub Kicinski 	if (offmap->netdev)
430a3884572SJakub Kicinski 		ret = offmap->dev_ops->map_lookup_elem(offmap, key, value);
431a3884572SJakub Kicinski 	up_read(&bpf_devs_lock);
432a3884572SJakub Kicinski 
433a3884572SJakub Kicinski 	return ret;
434a3884572SJakub Kicinski }
435a3884572SJakub Kicinski 
436a3884572SJakub Kicinski int bpf_map_offload_update_elem(struct bpf_map *map,
437a3884572SJakub Kicinski 				void *key, void *value, u64 flags)
438a3884572SJakub Kicinski {
439a3884572SJakub Kicinski 	struct bpf_offloaded_map *offmap = map_to_offmap(map);
440a3884572SJakub Kicinski 	int ret = -ENODEV;
441a3884572SJakub Kicinski 
442a3884572SJakub Kicinski 	if (unlikely(flags > BPF_EXIST))
443a3884572SJakub Kicinski 		return -EINVAL;
444a3884572SJakub Kicinski 
445a3884572SJakub Kicinski 	down_read(&bpf_devs_lock);
446a3884572SJakub Kicinski 	if (offmap->netdev)
447a3884572SJakub Kicinski 		ret = offmap->dev_ops->map_update_elem(offmap, key, value,
448a3884572SJakub Kicinski 						       flags);
449a3884572SJakub Kicinski 	up_read(&bpf_devs_lock);
450a3884572SJakub Kicinski 
451a3884572SJakub Kicinski 	return ret;
452a3884572SJakub Kicinski }
453a3884572SJakub Kicinski 
454a3884572SJakub Kicinski int bpf_map_offload_delete_elem(struct bpf_map *map, void *key)
455a3884572SJakub Kicinski {
456a3884572SJakub Kicinski 	struct bpf_offloaded_map *offmap = map_to_offmap(map);
457a3884572SJakub Kicinski 	int ret = -ENODEV;
458a3884572SJakub Kicinski 
459a3884572SJakub Kicinski 	down_read(&bpf_devs_lock);
460a3884572SJakub Kicinski 	if (offmap->netdev)
461a3884572SJakub Kicinski 		ret = offmap->dev_ops->map_delete_elem(offmap, key);
462a3884572SJakub Kicinski 	up_read(&bpf_devs_lock);
463a3884572SJakub Kicinski 
464a3884572SJakub Kicinski 	return ret;
465a3884572SJakub Kicinski }
466a3884572SJakub Kicinski 
467a3884572SJakub Kicinski int bpf_map_offload_get_next_key(struct bpf_map *map, void *key, void *next_key)
468a3884572SJakub Kicinski {
469a3884572SJakub Kicinski 	struct bpf_offloaded_map *offmap = map_to_offmap(map);
470a3884572SJakub Kicinski 	int ret = -ENODEV;
471a3884572SJakub Kicinski 
472a3884572SJakub Kicinski 	down_read(&bpf_devs_lock);
473a3884572SJakub Kicinski 	if (offmap->netdev)
474a3884572SJakub Kicinski 		ret = offmap->dev_ops->map_get_next_key(offmap, key, next_key);
475a3884572SJakub Kicinski 	up_read(&bpf_devs_lock);
476a3884572SJakub Kicinski 
477a3884572SJakub Kicinski 	return ret;
478a3884572SJakub Kicinski }
479a3884572SJakub Kicinski 
/* Argument bundle passed to bpf_map_offload_info_fill_ns(). */
struct ns_get_path_bpf_map_args {
	/* Offloaded map whose netdev is inspected. */
	struct bpf_offloaded_map *offmap;
	/* Info structure whose ifindex field gets filled in. */
	struct bpf_map_info *info;
};
48452775b33SJakub Kicinski 
48552775b33SJakub Kicinski static struct ns_common *bpf_map_offload_info_fill_ns(void *private_data)
48652775b33SJakub Kicinski {
48752775b33SJakub Kicinski 	struct ns_get_path_bpf_map_args *args = private_data;
48852775b33SJakub Kicinski 	struct ns_common *ns;
48952775b33SJakub Kicinski 	struct net *net;
49052775b33SJakub Kicinski 
49152775b33SJakub Kicinski 	rtnl_lock();
49252775b33SJakub Kicinski 	down_read(&bpf_devs_lock);
49352775b33SJakub Kicinski 
49452775b33SJakub Kicinski 	if (args->offmap->netdev) {
49552775b33SJakub Kicinski 		args->info->ifindex = args->offmap->netdev->ifindex;
49652775b33SJakub Kicinski 		net = dev_net(args->offmap->netdev);
49752775b33SJakub Kicinski 		get_net(net);
49852775b33SJakub Kicinski 		ns = &net->ns;
49952775b33SJakub Kicinski 	} else {
50052775b33SJakub Kicinski 		args->info->ifindex = 0;
50152775b33SJakub Kicinski 		ns = NULL;
50252775b33SJakub Kicinski 	}
50352775b33SJakub Kicinski 
50452775b33SJakub Kicinski 	up_read(&bpf_devs_lock);
50552775b33SJakub Kicinski 	rtnl_unlock();
50652775b33SJakub Kicinski 
50752775b33SJakub Kicinski 	return ns;
50852775b33SJakub Kicinski }
50952775b33SJakub Kicinski 
51052775b33SJakub Kicinski int bpf_map_offload_info_fill(struct bpf_map_info *info, struct bpf_map *map)
51152775b33SJakub Kicinski {
51252775b33SJakub Kicinski 	struct ns_get_path_bpf_map_args args = {
51352775b33SJakub Kicinski 		.offmap	= map_to_offmap(map),
51452775b33SJakub Kicinski 		.info	= info,
51552775b33SJakub Kicinski 	};
51652775b33SJakub Kicinski 	struct inode *ns_inode;
51752775b33SJakub Kicinski 	struct path ns_path;
51852775b33SJakub Kicinski 	void *res;
51952775b33SJakub Kicinski 
52052775b33SJakub Kicinski 	res = ns_get_path_cb(&ns_path, bpf_map_offload_info_fill_ns, &args);
52152775b33SJakub Kicinski 	if (IS_ERR(res)) {
52252775b33SJakub Kicinski 		if (!info->ifindex)
52352775b33SJakub Kicinski 			return -ENODEV;
52452775b33SJakub Kicinski 		return PTR_ERR(res);
52552775b33SJakub Kicinski 	}
52652775b33SJakub Kicinski 
52752775b33SJakub Kicinski 	ns_inode = ns_path.dentry->d_inode;
52852775b33SJakub Kicinski 	info->netns_dev = new_encode_dev(ns_inode->i_sb->s_dev);
52952775b33SJakub Kicinski 	info->netns_ino = ns_inode->i_ino;
53052775b33SJakub Kicinski 	path_put(&ns_path);
53152775b33SJakub Kicinski 
53252775b33SJakub Kicinski 	return 0;
53352775b33SJakub Kicinski }
53452775b33SJakub Kicinski 
535fd4f227dSJakub Kicinski static bool __bpf_offload_dev_match(struct bpf_prog *prog,
536fd4f227dSJakub Kicinski 				    struct net_device *netdev)
537a3884572SJakub Kicinski {
538fd4f227dSJakub Kicinski 	struct bpf_offload_netdev *ondev1, *ondev2;
539a3884572SJakub Kicinski 	struct bpf_prog_offload *offload;
540a3884572SJakub Kicinski 
5410cd3cbedSJakub Kicinski 	if (!bpf_prog_is_dev_bound(prog->aux))
542a3884572SJakub Kicinski 		return false;
543fd4f227dSJakub Kicinski 
544fd4f227dSJakub Kicinski 	offload = prog->aux->offload;
545fd4f227dSJakub Kicinski 	if (!offload)
546fd4f227dSJakub Kicinski 		return false;
547fd4f227dSJakub Kicinski 	if (offload->netdev == netdev)
548fd4f227dSJakub Kicinski 		return true;
549fd4f227dSJakub Kicinski 
550fd4f227dSJakub Kicinski 	ondev1 = bpf_offload_find_netdev(offload->netdev);
551fd4f227dSJakub Kicinski 	ondev2 = bpf_offload_find_netdev(netdev);
552fd4f227dSJakub Kicinski 
553fd4f227dSJakub Kicinski 	return ondev1 && ondev2 && ondev1->offdev == ondev2->offdev;
554fd4f227dSJakub Kicinski }
555fd4f227dSJakub Kicinski 
556fd4f227dSJakub Kicinski bool bpf_offload_dev_match(struct bpf_prog *prog, struct net_device *netdev)
557fd4f227dSJakub Kicinski {
558fd4f227dSJakub Kicinski 	bool ret;
559a3884572SJakub Kicinski 
560a3884572SJakub Kicinski 	down_read(&bpf_devs_lock);
561fd4f227dSJakub Kicinski 	ret = __bpf_offload_dev_match(prog, netdev);
562fd4f227dSJakub Kicinski 	up_read(&bpf_devs_lock);
563fd4f227dSJakub Kicinski 
564fd4f227dSJakub Kicinski 	return ret;
565fd4f227dSJakub Kicinski }
566fd4f227dSJakub Kicinski EXPORT_SYMBOL_GPL(bpf_offload_dev_match);
567fd4f227dSJakub Kicinski 
568fd4f227dSJakub Kicinski bool bpf_offload_prog_map_match(struct bpf_prog *prog, struct bpf_map *map)
569fd4f227dSJakub Kicinski {
570fd4f227dSJakub Kicinski 	struct bpf_offloaded_map *offmap;
571fd4f227dSJakub Kicinski 	bool ret;
572fd4f227dSJakub Kicinski 
573fd4f227dSJakub Kicinski 	if (!bpf_map_is_dev_bound(map))
574fd4f227dSJakub Kicinski 		return bpf_map_offload_neutral(map);
575a3884572SJakub Kicinski 	offmap = map_to_offmap(map);
576a3884572SJakub Kicinski 
577fd4f227dSJakub Kicinski 	down_read(&bpf_devs_lock);
578fd4f227dSJakub Kicinski 	ret = __bpf_offload_dev_match(prog, offmap->netdev);
579a3884572SJakub Kicinski 	up_read(&bpf_devs_lock);
580a3884572SJakub Kicinski 
581a3884572SJakub Kicinski 	return ret;
582a3884572SJakub Kicinski }
583a3884572SJakub Kicinski 
584602144c2SJakub Kicinski int bpf_offload_dev_netdev_register(struct bpf_offload_dev *offdev,
585602144c2SJakub Kicinski 				    struct net_device *netdev)
586a3884572SJakub Kicinski {
5879fd7c555SJakub Kicinski 	struct bpf_offload_netdev *ondev;
5889fd7c555SJakub Kicinski 	int err;
589a3884572SJakub Kicinski 
5909fd7c555SJakub Kicinski 	ondev = kzalloc(sizeof(*ondev), GFP_KERNEL);
5919fd7c555SJakub Kicinski 	if (!ondev)
5929fd7c555SJakub Kicinski 		return -ENOMEM;
5939fd7c555SJakub Kicinski 
5949fd7c555SJakub Kicinski 	ondev->netdev = netdev;
595602144c2SJakub Kicinski 	ondev->offdev = offdev;
5969fd7c555SJakub Kicinski 	INIT_LIST_HEAD(&ondev->progs);
5979fd7c555SJakub Kicinski 	INIT_LIST_HEAD(&ondev->maps);
5989fd7c555SJakub Kicinski 
5999fd7c555SJakub Kicinski 	down_write(&bpf_devs_lock);
6009fd7c555SJakub Kicinski 	err = rhashtable_insert_fast(&offdevs, &ondev->l, offdevs_params);
6019fd7c555SJakub Kicinski 	if (err) {
6029fd7c555SJakub Kicinski 		netdev_warn(netdev, "failed to register for BPF offload\n");
6039fd7c555SJakub Kicinski 		goto err_unlock_free;
604a3884572SJakub Kicinski 	}
605a3884572SJakub Kicinski 
606602144c2SJakub Kicinski 	list_add(&ondev->offdev_netdevs, &offdev->netdevs);
6079fd7c555SJakub Kicinski 	up_write(&bpf_devs_lock);
6089fd7c555SJakub Kicinski 	return 0;
609a3884572SJakub Kicinski 
6109fd7c555SJakub Kicinski err_unlock_free:
6119fd7c555SJakub Kicinski 	up_write(&bpf_devs_lock);
6129fd7c555SJakub Kicinski 	kfree(ondev);
6139fd7c555SJakub Kicinski 	return err;
614a3884572SJakub Kicinski }
6159fd7c555SJakub Kicinski EXPORT_SYMBOL_GPL(bpf_offload_dev_netdev_register);
616a3884572SJakub Kicinski 
617602144c2SJakub Kicinski void bpf_offload_dev_netdev_unregister(struct bpf_offload_dev *offdev,
618602144c2SJakub Kicinski 				       struct net_device *netdev)
619ab3f0063SJakub Kicinski {
620602144c2SJakub Kicinski 	struct bpf_offload_netdev *ondev, *altdev;
6219fd7c555SJakub Kicinski 	struct bpf_offloaded_map *offmap, *mtmp;
6229fd7c555SJakub Kicinski 	struct bpf_prog_offload *offload, *ptmp;
623ab3f0063SJakub Kicinski 
624ab3f0063SJakub Kicinski 	ASSERT_RTNL();
625ab3f0063SJakub Kicinski 
626e0d3974aSJakub Kicinski 	down_write(&bpf_devs_lock);
6279fd7c555SJakub Kicinski 	ondev = rhashtable_lookup_fast(&offdevs, &netdev, offdevs_params);
6289fd7c555SJakub Kicinski 	if (WARN_ON(!ondev))
6299fd7c555SJakub Kicinski 		goto unlock;
6309fd7c555SJakub Kicinski 
6319fd7c555SJakub Kicinski 	WARN_ON(rhashtable_remove_fast(&offdevs, &ondev->l, offdevs_params));
632602144c2SJakub Kicinski 	list_del(&ondev->offdev_netdevs);
6339fd7c555SJakub Kicinski 
634602144c2SJakub Kicinski 	/* Try to move the objects to another netdev of the device */
635602144c2SJakub Kicinski 	altdev = list_first_entry_or_null(&offdev->netdevs,
636602144c2SJakub Kicinski 					  struct bpf_offload_netdev,
637602144c2SJakub Kicinski 					  offdev_netdevs);
638602144c2SJakub Kicinski 	if (altdev) {
639602144c2SJakub Kicinski 		list_for_each_entry(offload, &ondev->progs, offloads)
640602144c2SJakub Kicinski 			offload->netdev = altdev->netdev;
641602144c2SJakub Kicinski 		list_splice_init(&ondev->progs, &altdev->progs);
642602144c2SJakub Kicinski 
643602144c2SJakub Kicinski 		list_for_each_entry(offmap, &ondev->maps, offloads)
644602144c2SJakub Kicinski 			offmap->netdev = altdev->netdev;
645602144c2SJakub Kicinski 		list_splice_init(&ondev->maps, &altdev->maps);
646602144c2SJakub Kicinski 	} else {
6479fd7c555SJakub Kicinski 		list_for_each_entry_safe(offload, ptmp, &ondev->progs, offloads)
6489fd7c555SJakub Kicinski 			__bpf_prog_offload_destroy(offload->prog);
6499fd7c555SJakub Kicinski 		list_for_each_entry_safe(offmap, mtmp, &ondev->maps, offloads)
6509fd7c555SJakub Kicinski 			__bpf_map_offload_destroy(offmap);
651602144c2SJakub Kicinski 	}
6529fd7c555SJakub Kicinski 
6539fd7c555SJakub Kicinski 	WARN_ON(!list_empty(&ondev->progs));
6549fd7c555SJakub Kicinski 	WARN_ON(!list_empty(&ondev->maps));
6559fd7c555SJakub Kicinski 	kfree(ondev);
6569fd7c555SJakub Kicinski unlock:
657e0d3974aSJakub Kicinski 	up_write(&bpf_devs_lock);
658ab3f0063SJakub Kicinski }
6599fd7c555SJakub Kicinski EXPORT_SYMBOL_GPL(bpf_offload_dev_netdev_unregister);
660602144c2SJakub Kicinski 
6611385d755SQuentin Monnet struct bpf_offload_dev *
6621385d755SQuentin Monnet bpf_offload_dev_create(const struct bpf_prog_offload_ops *ops)
663602144c2SJakub Kicinski {
664602144c2SJakub Kicinski 	struct bpf_offload_dev *offdev;
665602144c2SJakub Kicinski 	int err;
666602144c2SJakub Kicinski 
667602144c2SJakub Kicinski 	down_write(&bpf_devs_lock);
668602144c2SJakub Kicinski 	if (!offdevs_inited) {
669602144c2SJakub Kicinski 		err = rhashtable_init(&offdevs, &offdevs_params);
670602144c2SJakub Kicinski 		if (err)
671602144c2SJakub Kicinski 			return ERR_PTR(err);
672602144c2SJakub Kicinski 		offdevs_inited = true;
673602144c2SJakub Kicinski 	}
674602144c2SJakub Kicinski 	up_write(&bpf_devs_lock);
675602144c2SJakub Kicinski 
676602144c2SJakub Kicinski 	offdev = kzalloc(sizeof(*offdev), GFP_KERNEL);
677602144c2SJakub Kicinski 	if (!offdev)
678602144c2SJakub Kicinski 		return ERR_PTR(-ENOMEM);
679602144c2SJakub Kicinski 
6801385d755SQuentin Monnet 	offdev->ops = ops;
681602144c2SJakub Kicinski 	INIT_LIST_HEAD(&offdev->netdevs);
682602144c2SJakub Kicinski 
683602144c2SJakub Kicinski 	return offdev;
684602144c2SJakub Kicinski }
685602144c2SJakub Kicinski EXPORT_SYMBOL_GPL(bpf_offload_dev_create);
686602144c2SJakub Kicinski 
687602144c2SJakub Kicinski void bpf_offload_dev_destroy(struct bpf_offload_dev *offdev)
688602144c2SJakub Kicinski {
689602144c2SJakub Kicinski 	WARN_ON(!list_empty(&offdev->netdevs));
690602144c2SJakub Kicinski 	kfree(offdev);
691602144c2SJakub Kicinski }
692602144c2SJakub Kicinski EXPORT_SYMBOL_GPL(bpf_offload_dev_destroy);
693