xref: /openbmc/linux/net/batman-adv/bat_v_elp.c (revision dc6a81c3)
1 // SPDX-License-Identifier: GPL-2.0
2 /* Copyright (C) 2011-2020  B.A.T.M.A.N. contributors:
3  *
4  * Linus Lüssing, Marek Lindner
5  */
6 
7 #include "bat_v_elp.h"
8 #include "main.h"
9 
10 #include <linux/atomic.h>
11 #include <linux/bitops.h>
12 #include <linux/byteorder/generic.h>
13 #include <linux/errno.h>
14 #include <linux/etherdevice.h>
15 #include <linux/ethtool.h>
16 #include <linux/gfp.h>
17 #include <linux/if_ether.h>
18 #include <linux/jiffies.h>
19 #include <linux/kernel.h>
20 #include <linux/kref.h>
21 #include <linux/netdevice.h>
22 #include <linux/nl80211.h>
23 #include <linux/random.h>
24 #include <linux/rculist.h>
25 #include <linux/rcupdate.h>
26 #include <linux/rtnetlink.h>
27 #include <linux/skbuff.h>
28 #include <linux/stddef.h>
29 #include <linux/string.h>
30 #include <linux/types.h>
31 #include <linux/workqueue.h>
32 #include <net/cfg80211.h>
33 #include <uapi/linux/batadv_packet.h>
34 
35 #include "bat_algo.h"
36 #include "bat_v_ogm.h"
37 #include "hard-interface.h"
38 #include "log.h"
39 #include "originator.h"
40 #include "routing.h"
41 #include "send.h"
42 
43 /**
44  * batadv_v_elp_start_timer() - restart timer for ELP periodic work
45  * @hard_iface: the interface for which the timer has to be reset
46  */
47 static void batadv_v_elp_start_timer(struct batadv_hard_iface *hard_iface)
48 {
49 	unsigned int msecs;
50 
51 	msecs = atomic_read(&hard_iface->bat_v.elp_interval) - BATADV_JITTER;
52 	msecs += prandom_u32() % (2 * BATADV_JITTER);
53 
54 	queue_delayed_work(batadv_event_workqueue, &hard_iface->bat_v.elp_wq,
55 			   msecs_to_jiffies(msecs));
56 }
57 
58 /**
59  * batadv_v_elp_get_throughput() - get the throughput towards a neighbour
60  * @neigh: the neighbour for which the throughput has to be obtained
61  *
62  * Return: The throughput towards the given neighbour in multiples of 100kpbs
63  *         (a value of '1' equals to 0.1Mbps, '10' equals 1Mbps, etc).
64  */
65 static u32 batadv_v_elp_get_throughput(struct batadv_hardif_neigh_node *neigh)
66 {
67 	struct batadv_hard_iface *hard_iface = neigh->if_incoming;
68 	struct ethtool_link_ksettings link_settings;
69 	struct net_device *real_netdev;
70 	struct station_info sinfo;
71 	u32 throughput;
72 	int ret;
73 
74 	/* if the user specified a customised value for this interface, then
75 	 * return it directly
76 	 */
77 	throughput =  atomic_read(&hard_iface->bat_v.throughput_override);
78 	if (throughput != 0)
79 		return throughput;
80 
81 	/* if this is a wireless device, then ask its throughput through
82 	 * cfg80211 API
83 	 */
84 	if (batadv_is_wifi_hardif(hard_iface)) {
85 		if (!batadv_is_cfg80211_hardif(hard_iface))
86 			/* unsupported WiFi driver version */
87 			goto default_throughput;
88 
89 		real_netdev = batadv_get_real_netdev(hard_iface->net_dev);
90 		if (!real_netdev)
91 			goto default_throughput;
92 
93 		ret = cfg80211_get_station(real_netdev, neigh->addr, &sinfo);
94 
95 		if (!ret) {
96 			/* free the TID stats immediately */
97 			cfg80211_sinfo_release_content(&sinfo);
98 		}
99 
100 		dev_put(real_netdev);
101 		if (ret == -ENOENT) {
102 			/* Node is not associated anymore! It would be
103 			 * possible to delete this neighbor. For now set
104 			 * the throughput metric to 0.
105 			 */
106 			return 0;
107 		}
108 		if (ret)
109 			goto default_throughput;
110 
111 		if (sinfo.filled & BIT(NL80211_STA_INFO_EXPECTED_THROUGHPUT))
112 			return sinfo.expected_throughput / 100;
113 
114 		/* try to estimate the expected throughput based on reported tx
115 		 * rates
116 		 */
117 		if (sinfo.filled & BIT(NL80211_STA_INFO_TX_BITRATE))
118 			return cfg80211_calculate_bitrate(&sinfo.txrate) / 3;
119 
120 		goto default_throughput;
121 	}
122 
123 	/* if not a wifi interface, check if this device provides data via
124 	 * ethtool (e.g. an Ethernet adapter)
125 	 */
126 	memset(&link_settings, 0, sizeof(link_settings));
127 	rtnl_lock();
128 	ret = __ethtool_get_link_ksettings(hard_iface->net_dev, &link_settings);
129 	rtnl_unlock();
130 
131 	/* Virtual interface drivers such as tun / tap interfaces, VLAN, etc
132 	 * tend to initialize the interface throughput with some value for the
133 	 * sake of having a throughput number to export via ethtool. This
134 	 * exported throughput leaves batman-adv to conclude the interface
135 	 * throughput is genuine (reflecting reality), thus no measurements
136 	 * are necessary.
137 	 *
138 	 * Based on the observation that those interface types also tend to set
139 	 * the link auto-negotiation to 'off', batman-adv shall check this
140 	 * setting to differentiate between genuine link throughput information
141 	 * and placeholders installed by virtual interfaces.
142 	 */
143 	if (ret == 0 && link_settings.base.autoneg == AUTONEG_ENABLE) {
144 		/* link characteristics might change over time */
145 		if (link_settings.base.duplex == DUPLEX_FULL)
146 			hard_iface->bat_v.flags |= BATADV_FULL_DUPLEX;
147 		else
148 			hard_iface->bat_v.flags &= ~BATADV_FULL_DUPLEX;
149 
150 		throughput = link_settings.base.speed;
151 		if (throughput && throughput != SPEED_UNKNOWN)
152 			return throughput * 10;
153 	}
154 
155 default_throughput:
156 	if (!(hard_iface->bat_v.flags & BATADV_WARNING_DEFAULT)) {
157 		batadv_info(hard_iface->soft_iface,
158 			    "WiFi driver or ethtool info does not provide information about link speeds on interface %s, therefore defaulting to hardcoded throughput values of %u.%1u Mbps. Consider overriding the throughput manually or checking your driver.\n",
159 			    hard_iface->net_dev->name,
160 			    BATADV_THROUGHPUT_DEFAULT_VALUE / 10,
161 			    BATADV_THROUGHPUT_DEFAULT_VALUE % 10);
162 		hard_iface->bat_v.flags |= BATADV_WARNING_DEFAULT;
163 	}
164 
165 	/* if none of the above cases apply, return the base_throughput */
166 	return BATADV_THROUGHPUT_DEFAULT_VALUE;
167 }
168 
169 /**
170  * batadv_v_elp_throughput_metric_update() - worker updating the throughput
171  *  metric of a single hop neighbour
172  * @work: the work queue item
173  */
174 void batadv_v_elp_throughput_metric_update(struct work_struct *work)
175 {
176 	struct batadv_hardif_neigh_node_bat_v *neigh_bat_v;
177 	struct batadv_hardif_neigh_node *neigh;
178 
179 	neigh_bat_v = container_of(work, struct batadv_hardif_neigh_node_bat_v,
180 				   metric_work);
181 	neigh = container_of(neigh_bat_v, struct batadv_hardif_neigh_node,
182 			     bat_v);
183 
184 	ewma_throughput_add(&neigh->bat_v.throughput,
185 			    batadv_v_elp_get_throughput(neigh));
186 
187 	/* decrement refcounter to balance increment performed before scheduling
188 	 * this task
189 	 */
190 	batadv_hardif_neigh_put(neigh);
191 }
192 
193 /**
194  * batadv_v_elp_wifi_neigh_probe() - send link probing packets to a neighbour
195  * @neigh: the neighbour to probe
196  *
197  * Sends a predefined number of unicast wifi packets to a given neighbour in
198  * order to trigger the throughput estimation on this link by the RC algorithm.
199  * Packets are sent only if there there is not enough payload unicast traffic
200  * towards this neighbour..
201  *
202  * Return: True on success and false in case of error during skb preparation.
203  */
204 static bool
205 batadv_v_elp_wifi_neigh_probe(struct batadv_hardif_neigh_node *neigh)
206 {
207 	struct batadv_hard_iface *hard_iface = neigh->if_incoming;
208 	struct batadv_priv *bat_priv = netdev_priv(hard_iface->soft_iface);
209 	unsigned long last_tx_diff;
210 	struct sk_buff *skb;
211 	int probe_len, i;
212 	int elp_skb_len;
213 
214 	/* this probing routine is for Wifi neighbours only */
215 	if (!batadv_is_wifi_hardif(hard_iface))
216 		return true;
217 
218 	/* probe the neighbor only if no unicast packets have been sent
219 	 * to it in the last 100 milliseconds: this is the rate control
220 	 * algorithm sampling interval (minstrel). In this way, if not
221 	 * enough traffic has been sent to the neighbor, batman-adv can
222 	 * generate 2 probe packets and push the RC algorithm to perform
223 	 * the sampling
224 	 */
225 	last_tx_diff = jiffies_to_msecs(jiffies - neigh->bat_v.last_unicast_tx);
226 	if (last_tx_diff <= BATADV_ELP_PROBE_MAX_TX_DIFF)
227 		return true;
228 
229 	probe_len = max_t(int, sizeof(struct batadv_elp_packet),
230 			  BATADV_ELP_MIN_PROBE_SIZE);
231 
232 	for (i = 0; i < BATADV_ELP_PROBES_PER_NODE; i++) {
233 		elp_skb_len = hard_iface->bat_v.elp_skb->len;
234 		skb = skb_copy_expand(hard_iface->bat_v.elp_skb, 0,
235 				      probe_len - elp_skb_len,
236 				      GFP_ATOMIC);
237 		if (!skb)
238 			return false;
239 
240 		/* Tell the skb to get as big as the allocated space (we want
241 		 * the packet to be exactly of that size to make the link
242 		 * throughput estimation effective.
243 		 */
244 		skb_put_zero(skb, probe_len - hard_iface->bat_v.elp_skb->len);
245 
246 		batadv_dbg(BATADV_DBG_BATMAN, bat_priv,
247 			   "Sending unicast (probe) ELP packet on interface %s to %pM\n",
248 			   hard_iface->net_dev->name, neigh->addr);
249 
250 		batadv_send_skb_packet(skb, hard_iface, neigh->addr);
251 	}
252 
253 	return true;
254 }
255 
256 /**
257  * batadv_v_elp_periodic_work() - ELP periodic task per interface
258  * @work: work queue item
259  *
260  * Emits broadcast ELP message in regular intervals.
261  */
262 static void batadv_v_elp_periodic_work(struct work_struct *work)
263 {
264 	struct batadv_hardif_neigh_node *hardif_neigh;
265 	struct batadv_hard_iface *hard_iface;
266 	struct batadv_hard_iface_bat_v *bat_v;
267 	struct batadv_elp_packet *elp_packet;
268 	struct batadv_priv *bat_priv;
269 	struct sk_buff *skb;
270 	u32 elp_interval;
271 	bool ret;
272 
273 	bat_v = container_of(work, struct batadv_hard_iface_bat_v, elp_wq.work);
274 	hard_iface = container_of(bat_v, struct batadv_hard_iface, bat_v);
275 	bat_priv = netdev_priv(hard_iface->soft_iface);
276 
277 	if (atomic_read(&bat_priv->mesh_state) == BATADV_MESH_DEACTIVATING)
278 		goto out;
279 
280 	/* we are in the process of shutting this interface down */
281 	if (hard_iface->if_status == BATADV_IF_NOT_IN_USE ||
282 	    hard_iface->if_status == BATADV_IF_TO_BE_REMOVED)
283 		goto out;
284 
285 	/* the interface was enabled but may not be ready yet */
286 	if (hard_iface->if_status != BATADV_IF_ACTIVE)
287 		goto restart_timer;
288 
289 	skb = skb_copy(hard_iface->bat_v.elp_skb, GFP_ATOMIC);
290 	if (!skb)
291 		goto restart_timer;
292 
293 	elp_packet = (struct batadv_elp_packet *)skb->data;
294 	elp_packet->seqno = htonl(atomic_read(&hard_iface->bat_v.elp_seqno));
295 	elp_interval = atomic_read(&hard_iface->bat_v.elp_interval);
296 	elp_packet->elp_interval = htonl(elp_interval);
297 
298 	batadv_dbg(BATADV_DBG_BATMAN, bat_priv,
299 		   "Sending broadcast ELP packet on interface %s, seqno %u\n",
300 		   hard_iface->net_dev->name,
301 		   atomic_read(&hard_iface->bat_v.elp_seqno));
302 
303 	batadv_send_broadcast_skb(skb, hard_iface);
304 
305 	atomic_inc(&hard_iface->bat_v.elp_seqno);
306 
307 	/* The throughput metric is updated on each sent packet. This way, if a
308 	 * node is dead and no longer sends packets, batman-adv is still able to
309 	 * react timely to its death.
310 	 *
311 	 * The throughput metric is updated by following these steps:
312 	 * 1) if the hard_iface is wifi => send a number of unicast ELPs for
313 	 *    probing/sampling to each neighbor
314 	 * 2) update the throughput metric value of each neighbor (note that the
315 	 *    value retrieved in this step might be 100ms old because the
316 	 *    probing packets at point 1) could still be in the HW queue)
317 	 */
318 	rcu_read_lock();
319 	hlist_for_each_entry_rcu(hardif_neigh, &hard_iface->neigh_list, list) {
320 		if (!batadv_v_elp_wifi_neigh_probe(hardif_neigh))
321 			/* if something goes wrong while probing, better to stop
322 			 * sending packets immediately and reschedule the task
323 			 */
324 			break;
325 
326 		if (!kref_get_unless_zero(&hardif_neigh->refcount))
327 			continue;
328 
329 		/* Reading the estimated throughput from cfg80211 is a task that
330 		 * may sleep and that is not allowed in an rcu protected
331 		 * context. Therefore schedule a task for that.
332 		 */
333 		ret = queue_work(batadv_event_workqueue,
334 				 &hardif_neigh->bat_v.metric_work);
335 
336 		if (!ret)
337 			batadv_hardif_neigh_put(hardif_neigh);
338 	}
339 	rcu_read_unlock();
340 
341 restart_timer:
342 	batadv_v_elp_start_timer(hard_iface);
343 out:
344 	return;
345 }
346 
347 /**
348  * batadv_v_elp_iface_enable() - setup the ELP interface private resources
349  * @hard_iface: interface for which the data has to be prepared
350  *
351  * Return: 0 on success or a -ENOMEM in case of failure.
352  */
353 int batadv_v_elp_iface_enable(struct batadv_hard_iface *hard_iface)
354 {
355 	static const size_t tvlv_padding = sizeof(__be32);
356 	struct batadv_elp_packet *elp_packet;
357 	unsigned char *elp_buff;
358 	u32 random_seqno;
359 	size_t size;
360 	int res = -ENOMEM;
361 
362 	size = ETH_HLEN + NET_IP_ALIGN + BATADV_ELP_HLEN + tvlv_padding;
363 	hard_iface->bat_v.elp_skb = dev_alloc_skb(size);
364 	if (!hard_iface->bat_v.elp_skb)
365 		goto out;
366 
367 	skb_reserve(hard_iface->bat_v.elp_skb, ETH_HLEN + NET_IP_ALIGN);
368 	elp_buff = skb_put_zero(hard_iface->bat_v.elp_skb,
369 				BATADV_ELP_HLEN + tvlv_padding);
370 	elp_packet = (struct batadv_elp_packet *)elp_buff;
371 
372 	elp_packet->packet_type = BATADV_ELP;
373 	elp_packet->version = BATADV_COMPAT_VERSION;
374 
375 	/* randomize initial seqno to avoid collision */
376 	get_random_bytes(&random_seqno, sizeof(random_seqno));
377 	atomic_set(&hard_iface->bat_v.elp_seqno, random_seqno);
378 
379 	/* assume full-duplex by default */
380 	hard_iface->bat_v.flags |= BATADV_FULL_DUPLEX;
381 
382 	/* warn the user (again) if there is no throughput data is available */
383 	hard_iface->bat_v.flags &= ~BATADV_WARNING_DEFAULT;
384 
385 	if (batadv_is_wifi_hardif(hard_iface))
386 		hard_iface->bat_v.flags &= ~BATADV_FULL_DUPLEX;
387 
388 	INIT_DELAYED_WORK(&hard_iface->bat_v.elp_wq,
389 			  batadv_v_elp_periodic_work);
390 	batadv_v_elp_start_timer(hard_iface);
391 	res = 0;
392 
393 out:
394 	return res;
395 }
396 
397 /**
398  * batadv_v_elp_iface_disable() - release ELP interface private resources
399  * @hard_iface: interface for which the resources have to be released
400  */
401 void batadv_v_elp_iface_disable(struct batadv_hard_iface *hard_iface)
402 {
403 	cancel_delayed_work_sync(&hard_iface->bat_v.elp_wq);
404 
405 	dev_kfree_skb(hard_iface->bat_v.elp_skb);
406 	hard_iface->bat_v.elp_skb = NULL;
407 }
408 
409 /**
410  * batadv_v_elp_iface_activate() - update the ELP buffer belonging to the given
411  *  hard-interface
412  * @primary_iface: the new primary interface
413  * @hard_iface: interface holding the to-be-updated buffer
414  */
415 void batadv_v_elp_iface_activate(struct batadv_hard_iface *primary_iface,
416 				 struct batadv_hard_iface *hard_iface)
417 {
418 	struct batadv_elp_packet *elp_packet;
419 	struct sk_buff *skb;
420 
421 	if (!hard_iface->bat_v.elp_skb)
422 		return;
423 
424 	skb = hard_iface->bat_v.elp_skb;
425 	elp_packet = (struct batadv_elp_packet *)skb->data;
426 	ether_addr_copy(elp_packet->orig,
427 			primary_iface->net_dev->dev_addr);
428 }
429 
430 /**
431  * batadv_v_elp_primary_iface_set() - change internal data to reflect the new
432  *  primary interface
433  * @primary_iface: the new primary interface
434  */
435 void batadv_v_elp_primary_iface_set(struct batadv_hard_iface *primary_iface)
436 {
437 	struct batadv_hard_iface *hard_iface;
438 
439 	/* update orig field of every elp iface belonging to this mesh */
440 	rcu_read_lock();
441 	list_for_each_entry_rcu(hard_iface, &batadv_hardif_list, list) {
442 		if (primary_iface->soft_iface != hard_iface->soft_iface)
443 			continue;
444 
445 		batadv_v_elp_iface_activate(primary_iface, hard_iface);
446 	}
447 	rcu_read_unlock();
448 }
449 
450 /**
451  * batadv_v_elp_neigh_update() - update an ELP neighbour node
452  * @bat_priv: the bat priv with all the soft interface information
453  * @neigh_addr: the neighbour interface address
454  * @if_incoming: the interface the packet was received through
455  * @elp_packet: the received ELP packet
456  *
457  * Updates the ELP neighbour node state with the data received within the new
458  * ELP packet.
459  */
460 static void batadv_v_elp_neigh_update(struct batadv_priv *bat_priv,
461 				      u8 *neigh_addr,
462 				      struct batadv_hard_iface *if_incoming,
463 				      struct batadv_elp_packet *elp_packet)
464 
465 {
466 	struct batadv_neigh_node *neigh;
467 	struct batadv_orig_node *orig_neigh;
468 	struct batadv_hardif_neigh_node *hardif_neigh;
469 	s32 seqno_diff;
470 	s32 elp_latest_seqno;
471 
472 	orig_neigh = batadv_v_ogm_orig_get(bat_priv, elp_packet->orig);
473 	if (!orig_neigh)
474 		return;
475 
476 	neigh = batadv_neigh_node_get_or_create(orig_neigh,
477 						if_incoming, neigh_addr);
478 	if (!neigh)
479 		goto orig_free;
480 
481 	hardif_neigh = batadv_hardif_neigh_get(if_incoming, neigh_addr);
482 	if (!hardif_neigh)
483 		goto neigh_free;
484 
485 	elp_latest_seqno = hardif_neigh->bat_v.elp_latest_seqno;
486 	seqno_diff = ntohl(elp_packet->seqno) - elp_latest_seqno;
487 
488 	/* known or older sequence numbers are ignored. However always adopt
489 	 * if the router seems to have been restarted.
490 	 */
491 	if (seqno_diff < 1 && seqno_diff > -BATADV_ELP_MAX_AGE)
492 		goto hardif_free;
493 
494 	neigh->last_seen = jiffies;
495 	hardif_neigh->last_seen = jiffies;
496 	hardif_neigh->bat_v.elp_latest_seqno = ntohl(elp_packet->seqno);
497 	hardif_neigh->bat_v.elp_interval = ntohl(elp_packet->elp_interval);
498 
499 hardif_free:
500 	if (hardif_neigh)
501 		batadv_hardif_neigh_put(hardif_neigh);
502 neigh_free:
503 	if (neigh)
504 		batadv_neigh_node_put(neigh);
505 orig_free:
506 	if (orig_neigh)
507 		batadv_orig_node_put(orig_neigh);
508 }
509 
510 /**
511  * batadv_v_elp_packet_recv() - main ELP packet handler
512  * @skb: the received packet
513  * @if_incoming: the interface this packet was received through
514  *
515  * Return: NET_RX_SUCCESS and consumes the skb if the packet was peoperly
516  * processed or NET_RX_DROP in case of failure.
517  */
518 int batadv_v_elp_packet_recv(struct sk_buff *skb,
519 			     struct batadv_hard_iface *if_incoming)
520 {
521 	struct batadv_priv *bat_priv = netdev_priv(if_incoming->soft_iface);
522 	struct batadv_elp_packet *elp_packet;
523 	struct batadv_hard_iface *primary_if;
524 	struct ethhdr *ethhdr = (struct ethhdr *)skb_mac_header(skb);
525 	bool res;
526 	int ret = NET_RX_DROP;
527 
528 	res = batadv_check_management_packet(skb, if_incoming, BATADV_ELP_HLEN);
529 	if (!res)
530 		goto free_skb;
531 
532 	if (batadv_is_my_mac(bat_priv, ethhdr->h_source))
533 		goto free_skb;
534 
535 	/* did we receive a B.A.T.M.A.N. V ELP packet on an interface
536 	 * that does not have B.A.T.M.A.N. V ELP enabled ?
537 	 */
538 	if (strcmp(bat_priv->algo_ops->name, "BATMAN_V") != 0)
539 		goto free_skb;
540 
541 	elp_packet = (struct batadv_elp_packet *)skb->data;
542 
543 	batadv_dbg(BATADV_DBG_BATMAN, bat_priv,
544 		   "Received ELP packet from %pM seqno %u ORIG: %pM\n",
545 		   ethhdr->h_source, ntohl(elp_packet->seqno),
546 		   elp_packet->orig);
547 
548 	primary_if = batadv_primary_if_get_selected(bat_priv);
549 	if (!primary_if)
550 		goto free_skb;
551 
552 	batadv_v_elp_neigh_update(bat_priv, ethhdr->h_source, if_incoming,
553 				  elp_packet);
554 
555 	ret = NET_RX_SUCCESS;
556 	batadv_hardif_put(primary_if);
557 
558 free_skb:
559 	if (ret == NET_RX_SUCCESS)
560 		consume_skb(skb);
561 	else
562 		kfree_skb(skb);
563 
564 	return ret;
565 }
566