xref: /openbmc/linux/drivers/net/ipvlan/ipvtap.c (revision 10a03c36)
// SPDX-License-Identifier: GPL-2.0-only
2235a9d89SSainath Grandhi #include <linux/etherdevice.h>
3235a9d89SSainath Grandhi #include "ipvlan.h"
4235a9d89SSainath Grandhi #include <linux/if_vlan.h>
5235a9d89SSainath Grandhi #include <linux/if_tap.h>
6235a9d89SSainath Grandhi #include <linux/interrupt.h>
7235a9d89SSainath Grandhi #include <linux/nsproxy.h>
8235a9d89SSainath Grandhi #include <linux/compat.h>
9235a9d89SSainath Grandhi #include <linux/if_tun.h>
10235a9d89SSainath Grandhi #include <linux/module.h>
11235a9d89SSainath Grandhi #include <linux/skbuff.h>
12235a9d89SSainath Grandhi #include <linux/cache.h>
13235a9d89SSainath Grandhi #include <linux/sched.h>
14235a9d89SSainath Grandhi #include <linux/types.h>
15235a9d89SSainath Grandhi #include <linux/slab.h>
16235a9d89SSainath Grandhi #include <linux/wait.h>
17235a9d89SSainath Grandhi #include <linux/cdev.h>
18235a9d89SSainath Grandhi #include <linux/idr.h>
19235a9d89SSainath Grandhi #include <linux/fs.h>
20235a9d89SSainath Grandhi #include <linux/uio.h>
21235a9d89SSainath Grandhi 
22235a9d89SSainath Grandhi #include <net/net_namespace.h>
23235a9d89SSainath Grandhi #include <net/rtnetlink.h>
24235a9d89SSainath Grandhi #include <net/sock.h>
25235a9d89SSainath Grandhi #include <linux/virtio_net.h>
26235a9d89SSainath Grandhi 
/* Offload feature bits assigned to tap_features in ipvtap_newlink(). */
#define TUN_OFFLOADS \
	(NETIF_F_HW_CSUM | NETIF_F_TSO_ECN | NETIF_F_TSO | NETIF_F_TSO6)
29235a9d89SSainath Grandhi 
30235a9d89SSainath Grandhi static dev_t ipvtap_major;
31235a9d89SSainath Grandhi static struct cdev ipvtap_cdev;
32235a9d89SSainath Grandhi 
ipvtap_net_namespace(const struct device * d)33*fa627348SGreg Kroah-Hartman static const void *ipvtap_net_namespace(const struct device *d)
34235a9d89SSainath Grandhi {
35*fa627348SGreg Kroah-Hartman 	const struct net_device *dev = to_net_dev(d->parent);
36235a9d89SSainath Grandhi 	return dev_net(dev);
37235a9d89SSainath Grandhi }
38235a9d89SSainath Grandhi 
39235a9d89SSainath Grandhi static struct class ipvtap_class = {
40235a9d89SSainath Grandhi 	 .name = "ipvtap",
41235a9d89SSainath Grandhi 	 .ns_type = &net_ns_type_operations,
42235a9d89SSainath Grandhi 	 .namespace = ipvtap_net_namespace,
43235a9d89SSainath Grandhi };
44235a9d89SSainath Grandhi 
45235a9d89SSainath Grandhi struct ipvtap_dev {
46235a9d89SSainath Grandhi 	struct ipvl_dev vlan;
47235a9d89SSainath Grandhi 	struct tap_dev	  tap;
48235a9d89SSainath Grandhi };
49235a9d89SSainath Grandhi 
ipvtap_count_tx_dropped(struct tap_dev * tap)50235a9d89SSainath Grandhi static void ipvtap_count_tx_dropped(struct tap_dev *tap)
51235a9d89SSainath Grandhi {
52235a9d89SSainath Grandhi 	struct ipvtap_dev *vlantap = container_of(tap, struct ipvtap_dev, tap);
53235a9d89SSainath Grandhi 	struct ipvl_dev *vlan = &vlantap->vlan;
54235a9d89SSainath Grandhi 
55235a9d89SSainath Grandhi 	this_cpu_inc(vlan->pcpu_stats->tx_drps);
56235a9d89SSainath Grandhi }
57235a9d89SSainath Grandhi 
ipvtap_count_rx_dropped(struct tap_dev * tap)58235a9d89SSainath Grandhi static void ipvtap_count_rx_dropped(struct tap_dev *tap)
59235a9d89SSainath Grandhi {
60235a9d89SSainath Grandhi 	struct ipvtap_dev *vlantap = container_of(tap, struct ipvtap_dev, tap);
61235a9d89SSainath Grandhi 	struct ipvl_dev *vlan = &vlantap->vlan;
62235a9d89SSainath Grandhi 
63235a9d89SSainath Grandhi 	ipvlan_count_rx(vlan, 0, 0, 0);
64235a9d89SSainath Grandhi }
65235a9d89SSainath Grandhi 
/* tap ->update_features callback: record @features as the ipvlan device's
 * sfeatures and ask the networking core to re-evaluate the device features.
 */
static void ipvtap_update_features(struct tap_dev *tap,
				   netdev_features_t features)
{
	struct ipvtap_dev *ipvtap = container_of(tap, struct ipvtap_dev, tap);

	ipvtap->vlan.sfeatures = features;
	netdev_update_features(ipvtap->vlan.dev);
}
75235a9d89SSainath Grandhi 
ipvtap_newlink(struct net * src_net,struct net_device * dev,struct nlattr * tb[],struct nlattr * data[],struct netlink_ext_ack * extack)767a3f4a18SMatthias Schiffer static int ipvtap_newlink(struct net *src_net, struct net_device *dev,
777a3f4a18SMatthias Schiffer 			  struct nlattr *tb[], struct nlattr *data[],
787a3f4a18SMatthias Schiffer 			  struct netlink_ext_ack *extack)
79235a9d89SSainath Grandhi {
80235a9d89SSainath Grandhi 	struct ipvtap_dev *vlantap = netdev_priv(dev);
81235a9d89SSainath Grandhi 	int err;
82235a9d89SSainath Grandhi 
83235a9d89SSainath Grandhi 	INIT_LIST_HEAD(&vlantap->tap.queue_list);
84235a9d89SSainath Grandhi 
85235a9d89SSainath Grandhi 	/* Since macvlan supports all offloads by default, make
86235a9d89SSainath Grandhi 	 * tap support all offloads also.
87235a9d89SSainath Grandhi 	 */
88235a9d89SSainath Grandhi 	vlantap->tap.tap_features = TUN_OFFLOADS;
89235a9d89SSainath Grandhi 	vlantap->tap.count_tx_dropped = ipvtap_count_tx_dropped;
90235a9d89SSainath Grandhi 	vlantap->tap.update_features =	ipvtap_update_features;
91235a9d89SSainath Grandhi 	vlantap->tap.count_rx_dropped = ipvtap_count_rx_dropped;
92235a9d89SSainath Grandhi 
93235a9d89SSainath Grandhi 	err = netdev_rx_handler_register(dev, tap_handle_frame, &vlantap->tap);
94235a9d89SSainath Grandhi 	if (err)
95235a9d89SSainath Grandhi 		return err;
96235a9d89SSainath Grandhi 
97235a9d89SSainath Grandhi 	/* Don't put anything that may fail after macvlan_common_newlink
98235a9d89SSainath Grandhi 	 * because we can't undo what it does.
99235a9d89SSainath Grandhi 	 */
1007a3f4a18SMatthias Schiffer 	err =  ipvlan_link_new(src_net, dev, tb, data, extack);
101235a9d89SSainath Grandhi 	if (err) {
102235a9d89SSainath Grandhi 		netdev_rx_handler_unregister(dev);
103235a9d89SSainath Grandhi 		return err;
104235a9d89SSainath Grandhi 	}
105235a9d89SSainath Grandhi 
106235a9d89SSainath Grandhi 	vlantap->tap.dev = vlantap->vlan.dev;
107235a9d89SSainath Grandhi 
108235a9d89SSainath Grandhi 	return err;
109235a9d89SSainath Grandhi }
110235a9d89SSainath Grandhi 
ipvtap_dellink(struct net_device * dev,struct list_head * head)111235a9d89SSainath Grandhi static void ipvtap_dellink(struct net_device *dev,
112235a9d89SSainath Grandhi 			   struct list_head *head)
113235a9d89SSainath Grandhi {
114235a9d89SSainath Grandhi 	struct ipvtap_dev *vlan = netdev_priv(dev);
115235a9d89SSainath Grandhi 
116235a9d89SSainath Grandhi 	netdev_rx_handler_unregister(dev);
117235a9d89SSainath Grandhi 	tap_del_queues(&vlan->tap);
118235a9d89SSainath Grandhi 	ipvlan_link_delete(dev, head);
119235a9d89SSainath Grandhi }
120235a9d89SSainath Grandhi 
ipvtap_setup(struct net_device * dev)121235a9d89SSainath Grandhi static void ipvtap_setup(struct net_device *dev)
122235a9d89SSainath Grandhi {
123235a9d89SSainath Grandhi 	ipvlan_link_setup(dev);
124235a9d89SSainath Grandhi 	dev->tx_queue_len = TUN_READQ_SIZE;
125235a9d89SSainath Grandhi 	dev->priv_flags &= ~IFF_NO_QUEUE;
126235a9d89SSainath Grandhi }
127235a9d89SSainath Grandhi 
128235a9d89SSainath Grandhi static struct rtnl_link_ops ipvtap_link_ops __read_mostly = {
129235a9d89SSainath Grandhi 	.kind		= "ipvtap",
130235a9d89SSainath Grandhi 	.setup		= ipvtap_setup,
131235a9d89SSainath Grandhi 	.newlink	= ipvtap_newlink,
132235a9d89SSainath Grandhi 	.dellink	= ipvtap_dellink,
133235a9d89SSainath Grandhi 	.priv_size	= sizeof(struct ipvtap_dev),
134235a9d89SSainath Grandhi };
135235a9d89SSainath Grandhi 
ipvtap_device_event(struct notifier_block * unused,unsigned long event,void * ptr)136235a9d89SSainath Grandhi static int ipvtap_device_event(struct notifier_block *unused,
137235a9d89SSainath Grandhi 			       unsigned long event, void *ptr)
138235a9d89SSainath Grandhi {
139235a9d89SSainath Grandhi 	struct net_device *dev = netdev_notifier_info_to_dev(ptr);
140235a9d89SSainath Grandhi 	struct ipvtap_dev *vlantap;
141235a9d89SSainath Grandhi 	struct device *classdev;
142235a9d89SSainath Grandhi 	dev_t devt;
143235a9d89SSainath Grandhi 	int err;
144235a9d89SSainath Grandhi 	char tap_name[IFNAMSIZ];
145235a9d89SSainath Grandhi 
146235a9d89SSainath Grandhi 	if (dev->rtnl_link_ops != &ipvtap_link_ops)
147235a9d89SSainath Grandhi 		return NOTIFY_DONE;
148235a9d89SSainath Grandhi 
149235a9d89SSainath Grandhi 	snprintf(tap_name, IFNAMSIZ, "tap%d", dev->ifindex);
150235a9d89SSainath Grandhi 	vlantap = netdev_priv(dev);
151235a9d89SSainath Grandhi 
152235a9d89SSainath Grandhi 	switch (event) {
153235a9d89SSainath Grandhi 	case NETDEV_REGISTER:
154235a9d89SSainath Grandhi 		/* Create the device node here after the network device has
155235a9d89SSainath Grandhi 		 * been registered but before register_netdevice has
156235a9d89SSainath Grandhi 		 * finished running.
157235a9d89SSainath Grandhi 		 */
158235a9d89SSainath Grandhi 		err = tap_get_minor(ipvtap_major, &vlantap->tap);
159235a9d89SSainath Grandhi 		if (err)
160235a9d89SSainath Grandhi 			return notifier_from_errno(err);
161235a9d89SSainath Grandhi 
162235a9d89SSainath Grandhi 		devt = MKDEV(MAJOR(ipvtap_major), vlantap->tap.minor);
163235a9d89SSainath Grandhi 		classdev = device_create(&ipvtap_class, &dev->dev, devt,
164a07a296bSJean Sacren 					 dev, "%s", tap_name);
165235a9d89SSainath Grandhi 		if (IS_ERR(classdev)) {
166235a9d89SSainath Grandhi 			tap_free_minor(ipvtap_major, &vlantap->tap);
167235a9d89SSainath Grandhi 			return notifier_from_errno(PTR_ERR(classdev));
168235a9d89SSainath Grandhi 		}
169235a9d89SSainath Grandhi 		err = sysfs_create_link(&dev->dev.kobj, &classdev->kobj,
170235a9d89SSainath Grandhi 					tap_name);
171235a9d89SSainath Grandhi 		if (err)
172235a9d89SSainath Grandhi 			return notifier_from_errno(err);
173235a9d89SSainath Grandhi 		break;
174235a9d89SSainath Grandhi 	case NETDEV_UNREGISTER:
175235a9d89SSainath Grandhi 		/* vlan->minor == 0 if NETDEV_REGISTER above failed */
176235a9d89SSainath Grandhi 		if (vlantap->tap.minor == 0)
177235a9d89SSainath Grandhi 			break;
178235a9d89SSainath Grandhi 		sysfs_remove_link(&dev->dev.kobj, tap_name);
179235a9d89SSainath Grandhi 		devt = MKDEV(MAJOR(ipvtap_major), vlantap->tap.minor);
180235a9d89SSainath Grandhi 		device_destroy(&ipvtap_class, devt);
181235a9d89SSainath Grandhi 		tap_free_minor(ipvtap_major, &vlantap->tap);
182235a9d89SSainath Grandhi 		break;
183235a9d89SSainath Grandhi 	case NETDEV_CHANGE_TX_QUEUE_LEN:
184235a9d89SSainath Grandhi 		if (tap_queue_resize(&vlantap->tap))
185235a9d89SSainath Grandhi 			return NOTIFY_BAD;
186235a9d89SSainath Grandhi 		break;
187235a9d89SSainath Grandhi 	}
188235a9d89SSainath Grandhi 
189235a9d89SSainath Grandhi 	return NOTIFY_DONE;
190235a9d89SSainath Grandhi }
191235a9d89SSainath Grandhi 
192235a9d89SSainath Grandhi static struct notifier_block ipvtap_notifier_block __read_mostly = {
193235a9d89SSainath Grandhi 	.notifier_call	= ipvtap_device_event,
194235a9d89SSainath Grandhi };
195235a9d89SSainath Grandhi 
ipvtap_init(void)1964b2e3a17SMaciej Żenczykowski static int __init ipvtap_init(void)
197235a9d89SSainath Grandhi {
198235a9d89SSainath Grandhi 	int err;
199235a9d89SSainath Grandhi 
200dea6e19fSGirish Moodalbail 	err = tap_create_cdev(&ipvtap_cdev, &ipvtap_major, "ipvtap",
201dea6e19fSGirish Moodalbail 			      THIS_MODULE);
202235a9d89SSainath Grandhi 	if (err)
203235a9d89SSainath Grandhi 		goto out1;
204235a9d89SSainath Grandhi 
205235a9d89SSainath Grandhi 	err = class_register(&ipvtap_class);
206235a9d89SSainath Grandhi 	if (err)
207235a9d89SSainath Grandhi 		goto out2;
208235a9d89SSainath Grandhi 
209235a9d89SSainath Grandhi 	err = register_netdevice_notifier(&ipvtap_notifier_block);
210235a9d89SSainath Grandhi 	if (err)
211235a9d89SSainath Grandhi 		goto out3;
212235a9d89SSainath Grandhi 
213235a9d89SSainath Grandhi 	err = ipvlan_link_register(&ipvtap_link_ops);
214235a9d89SSainath Grandhi 	if (err)
215235a9d89SSainath Grandhi 		goto out4;
216235a9d89SSainath Grandhi 
217235a9d89SSainath Grandhi 	return 0;
218235a9d89SSainath Grandhi 
219235a9d89SSainath Grandhi out4:
220235a9d89SSainath Grandhi 	unregister_netdevice_notifier(&ipvtap_notifier_block);
221235a9d89SSainath Grandhi out3:
222235a9d89SSainath Grandhi 	class_unregister(&ipvtap_class);
223235a9d89SSainath Grandhi out2:
224235a9d89SSainath Grandhi 	tap_destroy_cdev(ipvtap_major, &ipvtap_cdev);
225235a9d89SSainath Grandhi out1:
226235a9d89SSainath Grandhi 	return err;
227235a9d89SSainath Grandhi }
228235a9d89SSainath Grandhi module_init(ipvtap_init);
229235a9d89SSainath Grandhi 
ipvtap_exit(void)2304b2e3a17SMaciej Żenczykowski static void __exit ipvtap_exit(void)
231235a9d89SSainath Grandhi {
232235a9d89SSainath Grandhi 	rtnl_link_unregister(&ipvtap_link_ops);
233235a9d89SSainath Grandhi 	unregister_netdevice_notifier(&ipvtap_notifier_block);
234235a9d89SSainath Grandhi 	class_unregister(&ipvtap_class);
235235a9d89SSainath Grandhi 	tap_destroy_cdev(ipvtap_major, &ipvtap_cdev);
236235a9d89SSainath Grandhi }
237235a9d89SSainath Grandhi module_exit(ipvtap_exit);
238235a9d89SSainath Grandhi MODULE_ALIAS_RTNL_LINK("ipvtap");
239235a9d89SSainath Grandhi MODULE_AUTHOR("Sainath Grandhi <sainath.grandhi@intel.com>");
240235a9d89SSainath Grandhi MODULE_LICENSE("GPL");
241