xref: /openbmc/linux/include/net/dst.h (revision 290b895e0ba4552dfcfc4bd35759c192345b934a)
11da177e4SLinus Torvalds /*
21da177e4SLinus Torvalds  * net/dst.h	Protocol independent destination cache definitions.
31da177e4SLinus Torvalds  *
41da177e4SLinus Torvalds  * Authors:	Alexey Kuznetsov, <kuznet@ms2.inr.ac.ru>
51da177e4SLinus Torvalds  *
61da177e4SLinus Torvalds  */
71da177e4SLinus Torvalds 
81da177e4SLinus Torvalds #ifndef _NET_DST_H
91da177e4SLinus Torvalds #define _NET_DST_H
101da177e4SLinus Torvalds 
1186393e52SAlexey Dobriyan #include <net/dst_ops.h>
1214c85021SArnaldo Carvalho de Melo #include <linux/netdevice.h>
131da177e4SLinus Torvalds #include <linux/rtnetlink.h>
141da177e4SLinus Torvalds #include <linux/rcupdate.h>
151da177e4SLinus Torvalds #include <linux/jiffies.h>
161da177e4SLinus Torvalds #include <net/neighbour.h>
171da177e4SLinus Torvalds #include <asm/processor.h>
181da177e4SLinus Torvalds 
/*
 * RT_CACHE_DEBUG levels:
 * 0 - no debugging messages (the value selected below)
 * 1 - rare events and bugs
 * 2 - trace mode.
 */
#define RT_CACHE_DEBUG		0

/* dst garbage collector timing constants, expressed as multiples of HZ. */
#define DST_GC_MIN	(HZ/10)
#define DST_GC_INC	(HZ/2)
#define DST_GC_MAX	(120*HZ)
291da177e4SLinus Torvalds 
/* Each dst_entry has a reference count and sits in some parent list(s).
 * When it is removed from its parent list, it is "freed" (dst_free).
 * After this it enters the dead state (dst->obsolete > 0) and, if its refcnt
 * is zero, it can be destroyed immediately; otherwise it is added
 * to the gc list and the garbage collector periodically checks the refcnt.
 */
361da177e4SLinus Torvalds 
371da177e4SLinus Torvalds struct sk_buff;
381da177e4SLinus Torvalds 
39fd2c3ef7SEric Dumazet struct dst_entry {
401e19e02cSEric Dumazet 	struct rcu_head		rcu_head;
411da177e4SLinus Torvalds 	struct dst_entry	*child;
421da177e4SLinus Torvalds 	struct net_device       *dev;
43c4d54110SHerbert Xu 	short			error;
44c4d54110SHerbert Xu 	short			obsolete;
451da177e4SLinus Torvalds 	int			flags;
461da177e4SLinus Torvalds #define DST_HOST		1
471da177e4SLinus Torvalds #define DST_NOXFRM		2
481da177e4SLinus Torvalds #define DST_NOPOLICY		4
491da177e4SLinus Torvalds #define DST_NOHASH		8
501da177e4SLinus Torvalds 	unsigned long		expires;
511da177e4SLinus Torvalds 
521da177e4SLinus Torvalds 	unsigned short		header_len;	/* more space at head required */
531da177e4SLinus Torvalds 	unsigned short		trailer_len;	/* space to reserve at tail */
541da177e4SLinus Torvalds 
5569a73829SEric Dumazet 	unsigned int		rate_tokens;
56f1dd9c37SZhang Yanmin 	unsigned long		rate_last;	/* rate limiting for ICMP */
5769a73829SEric Dumazet 
58f1dd9c37SZhang Yanmin 	struct dst_entry	*path;
591da177e4SLinus Torvalds 
601da177e4SLinus Torvalds 	struct neighbour	*neighbour;
611da177e4SLinus Torvalds 	struct hh_cache		*hh;
62def8b4faSAlexey Dobriyan #ifdef CONFIG_XFRM
631da177e4SLinus Torvalds 	struct xfrm_state	*xfrm;
645635c10dSEric Dumazet #else
655635c10dSEric Dumazet 	void			*__pad1;
66def8b4faSAlexey Dobriyan #endif
671da177e4SLinus Torvalds 	int			(*input)(struct sk_buff*);
681da177e4SLinus Torvalds 	int			(*output)(struct sk_buff*);
691da177e4SLinus Torvalds 
701da177e4SLinus Torvalds 	struct  dst_ops	        *ops;
711da177e4SLinus Torvalds 
72f1dd9c37SZhang Yanmin 	u32			metrics[RTAX_MAX];
73f1dd9c37SZhang Yanmin 
74f1dd9c37SZhang Yanmin #ifdef CONFIG_NET_CLS_ROUTE
75f1dd9c37SZhang Yanmin 	__u32			tclassid;
765635c10dSEric Dumazet #else
775635c10dSEric Dumazet 	__u32			__pad2;
78f1dd9c37SZhang Yanmin #endif
79f1dd9c37SZhang Yanmin 
805635c10dSEric Dumazet 
815635c10dSEric Dumazet 	/*
825635c10dSEric Dumazet 	 * Align __refcnt to a 64 bytes alignment
835635c10dSEric Dumazet 	 * (L1_CACHE_SIZE would be too much)
845635c10dSEric Dumazet 	 */
855635c10dSEric Dumazet #ifdef CONFIG_64BIT
865635c10dSEric Dumazet 	long			__pad_to_align_refcnt[1];
875635c10dSEric Dumazet #endif
88f1dd9c37SZhang Yanmin 	/*
89f1dd9c37SZhang Yanmin 	 * __refcnt wants to be on a different cache line from
90f1dd9c37SZhang Yanmin 	 * input/output/ops or performance tanks badly
91f1dd9c37SZhang Yanmin 	 */
921e19e02cSEric Dumazet 	atomic_t		__refcnt;	/* client references	*/
931e19e02cSEric Dumazet 	int			__use;
94f1dd9c37SZhang Yanmin 	unsigned long		lastuse;
951e19e02cSEric Dumazet 	union {
961e19e02cSEric Dumazet 		struct dst_entry *next;
971e19e02cSEric Dumazet 		struct rtable    *rt_next;
981e19e02cSEric Dumazet 		struct rt6_info   *rt6_next;
991e19e02cSEric Dumazet 		struct dn_route  *dn_next;
1001e19e02cSEric Dumazet 	};
1011da177e4SLinus Torvalds };
1021da177e4SLinus Torvalds 
1031da177e4SLinus Torvalds #ifdef __KERNEL__
1041da177e4SLinus Torvalds 
1051da177e4SLinus Torvalds static inline u32
1061da177e4SLinus Torvalds dst_metric(const struct dst_entry *dst, int metric)
1071da177e4SLinus Torvalds {
1081da177e4SLinus Torvalds 	return dst->metrics[metric-1];
1091da177e4SLinus Torvalds }
1101da177e4SLinus Torvalds 
1110c3adfb8SGilad Ben-Yossef static inline u32
1120c3adfb8SGilad Ben-Yossef dst_feature(const struct dst_entry *dst, u32 feature)
1130c3adfb8SGilad Ben-Yossef {
114bb5b7c11SDavid S. Miller 	return dst_metric(dst, RTAX_FEATURES) & feature;
1150c3adfb8SGilad Ben-Yossef }
1160c3adfb8SGilad Ben-Yossef 
1171da177e4SLinus Torvalds static inline u32 dst_mtu(const struct dst_entry *dst)
1181da177e4SLinus Torvalds {
1191da177e4SLinus Torvalds 	u32 mtu = dst_metric(dst, RTAX_MTU);
1201da177e4SLinus Torvalds 	/*
1211da177e4SLinus Torvalds 	 * Alexey put it here, so ask him about it :)
1221da177e4SLinus Torvalds 	 */
1231da177e4SLinus Torvalds 	barrier();
1241da177e4SLinus Torvalds 	return mtu;
1251da177e4SLinus Torvalds }
1261da177e4SLinus Torvalds 
127c1e20f7cSStephen Hemminger /* RTT metrics are stored in milliseconds for user ABI, but used as jiffies */
128c1e20f7cSStephen Hemminger static inline unsigned long dst_metric_rtt(const struct dst_entry *dst, int metric)
129c1e20f7cSStephen Hemminger {
130c1e20f7cSStephen Hemminger 	return msecs_to_jiffies(dst_metric(dst, metric));
131c1e20f7cSStephen Hemminger }
132c1e20f7cSStephen Hemminger 
133c1e20f7cSStephen Hemminger static inline void set_dst_metric_rtt(struct dst_entry *dst, int metric,
134c1e20f7cSStephen Hemminger 				      unsigned long rtt)
135c1e20f7cSStephen Hemminger {
136c1e20f7cSStephen Hemminger 	dst->metrics[metric-1] = jiffies_to_msecs(rtt);
137c1e20f7cSStephen Hemminger }
138c1e20f7cSStephen Hemminger 
1391da177e4SLinus Torvalds static inline u32
1401da177e4SLinus Torvalds dst_allfrag(const struct dst_entry *dst)
1411da177e4SLinus Torvalds {
1420c3adfb8SGilad Ben-Yossef 	int ret = dst_feature(dst,  RTAX_FEATURE_ALLFRAG);
1431da177e4SLinus Torvalds 	/* Yes, _exactly_. This is paranoia. */
1441da177e4SLinus Torvalds 	barrier();
1451da177e4SLinus Torvalds 	return ret;
1461da177e4SLinus Torvalds }
1471da177e4SLinus Torvalds 
1481da177e4SLinus Torvalds static inline int
1491da177e4SLinus Torvalds dst_metric_locked(struct dst_entry *dst, int metric)
1501da177e4SLinus Torvalds {
1511da177e4SLinus Torvalds 	return dst_metric(dst, RTAX_LOCK) & (1<<metric);
1521da177e4SLinus Torvalds }
1531da177e4SLinus Torvalds 
1541da177e4SLinus Torvalds static inline void dst_hold(struct dst_entry * dst)
1551da177e4SLinus Torvalds {
1565635c10dSEric Dumazet 	/*
1575635c10dSEric Dumazet 	 * If your kernel compilation stops here, please check
1585635c10dSEric Dumazet 	 * __pad_to_align_refcnt declaration in struct dst_entry
1595635c10dSEric Dumazet 	 */
1605635c10dSEric Dumazet 	BUILD_BUG_ON(offsetof(struct dst_entry, __refcnt) & 63);
1611da177e4SLinus Torvalds 	atomic_inc(&dst->__refcnt);
1621da177e4SLinus Torvalds }
1631da177e4SLinus Torvalds 
16403f49f34SPavel Emelyanov static inline void dst_use(struct dst_entry *dst, unsigned long time)
16503f49f34SPavel Emelyanov {
16603f49f34SPavel Emelyanov 	dst_hold(dst);
16703f49f34SPavel Emelyanov 	dst->__use++;
16803f49f34SPavel Emelyanov 	dst->lastuse = time;
16903f49f34SPavel Emelyanov }
17003f49f34SPavel Emelyanov 
1717fee226aSEric Dumazet static inline void dst_use_noref(struct dst_entry *dst, unsigned long time)
1727fee226aSEric Dumazet {
1737fee226aSEric Dumazet 	dst->__use++;
1747fee226aSEric Dumazet 	dst->lastuse = time;
1757fee226aSEric Dumazet }
1767fee226aSEric Dumazet 
1771da177e4SLinus Torvalds static inline
1781da177e4SLinus Torvalds struct dst_entry * dst_clone(struct dst_entry * dst)
1791da177e4SLinus Torvalds {
1801da177e4SLinus Torvalds 	if (dst)
1811da177e4SLinus Torvalds 		atomic_inc(&dst->__refcnt);
1821da177e4SLinus Torvalds 	return dst;
1831da177e4SLinus Torvalds }
1841da177e4SLinus Torvalds 
1858d330868SIlpo Järvinen extern void dst_release(struct dst_entry *dst);
1867fee226aSEric Dumazet 
1877fee226aSEric Dumazet static inline void refdst_drop(unsigned long refdst)
1887fee226aSEric Dumazet {
1897fee226aSEric Dumazet 	if (!(refdst & SKB_DST_NOREF))
1907fee226aSEric Dumazet 		dst_release((struct dst_entry *)(refdst & SKB_DST_PTRMASK));
1917fee226aSEric Dumazet }
1927fee226aSEric Dumazet 
1937fee226aSEric Dumazet /**
1947fee226aSEric Dumazet  * skb_dst_drop - drops skb dst
1957fee226aSEric Dumazet  * @skb: buffer
1967fee226aSEric Dumazet  *
1977fee226aSEric Dumazet  * Drops dst reference count if a reference was taken.
1987fee226aSEric Dumazet  */
199adf30907SEric Dumazet static inline void skb_dst_drop(struct sk_buff *skb)
200adf30907SEric Dumazet {
2017fee226aSEric Dumazet 	if (skb->_skb_refdst) {
2027fee226aSEric Dumazet 		refdst_drop(skb->_skb_refdst);
2037fee226aSEric Dumazet 		skb->_skb_refdst = 0UL;
2047fee226aSEric Dumazet 	}
2057fee226aSEric Dumazet }
2067fee226aSEric Dumazet 
2077fee226aSEric Dumazet static inline void skb_dst_copy(struct sk_buff *nskb, const struct sk_buff *oskb)
2087fee226aSEric Dumazet {
2097fee226aSEric Dumazet 	nskb->_skb_refdst = oskb->_skb_refdst;
2107fee226aSEric Dumazet 	if (!(nskb->_skb_refdst & SKB_DST_NOREF))
2117fee226aSEric Dumazet 		dst_clone(skb_dst(nskb));
2127fee226aSEric Dumazet }
2137fee226aSEric Dumazet 
2147fee226aSEric Dumazet /**
2157fee226aSEric Dumazet  * skb_dst_force - makes sure skb dst is refcounted
2167fee226aSEric Dumazet  * @skb: buffer
2177fee226aSEric Dumazet  *
2187fee226aSEric Dumazet  * If dst is not yet refcounted, let's do it
2197fee226aSEric Dumazet  */
2207fee226aSEric Dumazet static inline void skb_dst_force(struct sk_buff *skb)
2217fee226aSEric Dumazet {
2227fee226aSEric Dumazet 	if (skb_dst_is_noref(skb)) {
2237fee226aSEric Dumazet 		WARN_ON(!rcu_read_lock_held());
2247fee226aSEric Dumazet 		skb->_skb_refdst &= ~SKB_DST_NOREF;
2257fee226aSEric Dumazet 		dst_clone(skb_dst(skb));
2267fee226aSEric Dumazet 	}
227adf30907SEric Dumazet }
2281da177e4SLinus Torvalds 
229d19d56ddSEric Dumazet 
230d19d56ddSEric Dumazet /**
231*290b895eSEric Dumazet  *	__skb_tunnel_rx - prepare skb for rx reinsert
232*290b895eSEric Dumazet  *	@skb: buffer
233*290b895eSEric Dumazet  *	@dev: tunnel device
234*290b895eSEric Dumazet  *
235*290b895eSEric Dumazet  *	After decapsulation, packet is going to re-enter (netif_rx()) our stack,
236*290b895eSEric Dumazet  *	so make some cleanups. (no accounting done)
237*290b895eSEric Dumazet  */
238*290b895eSEric Dumazet static inline void __skb_tunnel_rx(struct sk_buff *skb, struct net_device *dev)
239*290b895eSEric Dumazet {
240*290b895eSEric Dumazet 	skb->dev = dev;
241*290b895eSEric Dumazet 	skb->rxhash = 0;
242*290b895eSEric Dumazet 	skb_set_queue_mapping(skb, 0);
243*290b895eSEric Dumazet 	skb_dst_drop(skb);
244*290b895eSEric Dumazet 	nf_reset(skb);
245*290b895eSEric Dumazet }
246*290b895eSEric Dumazet 
247*290b895eSEric Dumazet /**
248d19d56ddSEric Dumazet  *	skb_tunnel_rx - prepare skb for rx reinsert
249d19d56ddSEric Dumazet  *	@skb: buffer
250d19d56ddSEric Dumazet  *	@dev: tunnel device
251d19d56ddSEric Dumazet  *
252d19d56ddSEric Dumazet  *	After decapsulation, packet is going to re-enter (netif_rx()) our stack,
253d19d56ddSEric Dumazet  *	so make some cleanups, and perform accounting.
254*290b895eSEric Dumazet  *	Note: this accounting is not SMP safe.
255d19d56ddSEric Dumazet  */
256d19d56ddSEric Dumazet static inline void skb_tunnel_rx(struct sk_buff *skb, struct net_device *dev)
257d19d56ddSEric Dumazet {
258d19d56ddSEric Dumazet 	/* TODO : stats should be SMP safe */
259d19d56ddSEric Dumazet 	dev->stats.rx_packets++;
260d19d56ddSEric Dumazet 	dev->stats.rx_bytes += skb->len;
261*290b895eSEric Dumazet 	__skb_tunnel_rx(skb, dev);
262d19d56ddSEric Dumazet }
263d19d56ddSEric Dumazet 
2641da177e4SLinus Torvalds /* Children define the path of the packet through the
2651da177e4SLinus Torvalds  * Linux networking.  Thus, destinations are stackable.
2661da177e4SLinus Torvalds  */
2671da177e4SLinus Torvalds 
2688764ab2cSSteffen Klassert static inline struct dst_entry *skb_dst_pop(struct sk_buff *skb)
2691da177e4SLinus Torvalds {
2708764ab2cSSteffen Klassert 	struct dst_entry *child = skb_dst(skb)->child;
2711da177e4SLinus Torvalds 
2728764ab2cSSteffen Klassert 	skb_dst_drop(skb);
2731da177e4SLinus Torvalds 	return child;
2741da177e4SLinus Torvalds }
2751da177e4SLinus Torvalds 
/* Destination cache primitives implemented outside this header. */
int dst_discard(struct sk_buff *skb);
void *dst_alloc(struct dst_ops *ops);
void __dst_free(struct dst_entry *dst);
struct dst_entry *dst_destroy(struct dst_entry *dst);
2801da177e4SLinus Torvalds 
2811da177e4SLinus Torvalds static inline void dst_free(struct dst_entry * dst)
2821da177e4SLinus Torvalds {
2831da177e4SLinus Torvalds 	if (dst->obsolete > 1)
2841da177e4SLinus Torvalds 		return;
2851da177e4SLinus Torvalds 	if (!atomic_read(&dst->__refcnt)) {
2861da177e4SLinus Torvalds 		dst = dst_destroy(dst);
2871da177e4SLinus Torvalds 		if (!dst)
2881da177e4SLinus Torvalds 			return;
2891da177e4SLinus Torvalds 	}
2901da177e4SLinus Torvalds 	__dst_free(dst);
2911da177e4SLinus Torvalds }
2921da177e4SLinus Torvalds 
2931da177e4SLinus Torvalds static inline void dst_rcu_free(struct rcu_head *head)
2941da177e4SLinus Torvalds {
2951da177e4SLinus Torvalds 	struct dst_entry *dst = container_of(head, struct dst_entry, rcu_head);
2961da177e4SLinus Torvalds 	dst_free(dst);
2971da177e4SLinus Torvalds }
2981da177e4SLinus Torvalds 
2991da177e4SLinus Torvalds static inline void dst_confirm(struct dst_entry *dst)
3001da177e4SLinus Torvalds {
3011da177e4SLinus Torvalds 	if (dst)
3021da177e4SLinus Torvalds 		neigh_confirm(dst->neighbour);
3031da177e4SLinus Torvalds }
3041da177e4SLinus Torvalds 
3051da177e4SLinus Torvalds static inline void dst_link_failure(struct sk_buff *skb)
3061da177e4SLinus Torvalds {
307adf30907SEric Dumazet 	struct dst_entry *dst = skb_dst(skb);
3081da177e4SLinus Torvalds 	if (dst && dst->ops && dst->ops->link_failure)
3091da177e4SLinus Torvalds 		dst->ops->link_failure(skb);
3101da177e4SLinus Torvalds }
3111da177e4SLinus Torvalds 
3121da177e4SLinus Torvalds static inline void dst_set_expires(struct dst_entry *dst, int timeout)
3131da177e4SLinus Torvalds {
3141da177e4SLinus Torvalds 	unsigned long expires = jiffies + timeout;
3151da177e4SLinus Torvalds 
3161da177e4SLinus Torvalds 	if (expires == 0)
3171da177e4SLinus Torvalds 		expires = 1;
3181da177e4SLinus Torvalds 
3191da177e4SLinus Torvalds 	if (dst->expires == 0 || time_before(expires, dst->expires))
3201da177e4SLinus Torvalds 		dst->expires = expires;
3211da177e4SLinus Torvalds }
3221da177e4SLinus Torvalds 
3231da177e4SLinus Torvalds /* Output packet to network from transport.  */
3241da177e4SLinus Torvalds static inline int dst_output(struct sk_buff *skb)
3251da177e4SLinus Torvalds {
326adf30907SEric Dumazet 	return skb_dst(skb)->output(skb);
3271da177e4SLinus Torvalds }
3281da177e4SLinus Torvalds 
3291da177e4SLinus Torvalds /* Input packet from network to transport.  */
3301da177e4SLinus Torvalds static inline int dst_input(struct sk_buff *skb)
3311da177e4SLinus Torvalds {
332adf30907SEric Dumazet 	return skb_dst(skb)->input(skb);
3331da177e4SLinus Torvalds }
3341da177e4SLinus Torvalds 
3351da177e4SLinus Torvalds static inline struct dst_entry *dst_check(struct dst_entry *dst, u32 cookie)
3361da177e4SLinus Torvalds {
3371da177e4SLinus Torvalds 	if (dst->obsolete)
3381da177e4SLinus Torvalds 		dst = dst->ops->check(dst, cookie);
3391da177e4SLinus Torvalds 	return dst;
3401da177e4SLinus Torvalds }
3411da177e4SLinus Torvalds 
/* Initialisation entry point of the dst code; implemented outside this header. */
void dst_init(void);
3431da177e4SLinus Torvalds 
/* Bit flags accepted by the flags argument of xfrm_lookup(). */
enum {
	XFRM_LOOKUP_WAIT = 0x1,
	XFRM_LOOKUP_ICMP = 0x2,
};
349815f4e57SHerbert Xu 
struct flowi;

#ifdef CONFIG_XFRM
/* With XFRM enabled the lookups are implemented outside this header. */
int xfrm_lookup(struct net *net, struct dst_entry **dst_p,
		struct flowi *fl, struct sock *sk, int flags);
int __xfrm_lookup(struct net *net, struct dst_entry **dst_p,
		  struct flowi *fl, struct sock *sk, int flags);
#else
/*
 * Without XFRM both lookups are no-ops: they return 0 and leave *dst_p
 * untouched.
 */
static inline int xfrm_lookup(struct net *net, struct dst_entry **dst_p,
			      struct flowi *fl, struct sock *sk, int flags)
{
	return 0;
}

static inline int __xfrm_lookup(struct net *net, struct dst_entry **dst_p,
				struct flowi *fl, struct sock *sk, int flags)
{
	return 0;
}
#endif
3681da177e4SLinus Torvalds #endif
3691da177e4SLinus Torvalds 
3701da177e4SLinus Torvalds #endif /* _NET_DST_H */
371