xref: /openbmc/linux/include/net/ip_vs.h (revision b0e010c527de742cb18e8d50a06dfd1a995b5382)
107dcc686SSimon Horman /* IP Virtual Server
21da177e4SLinus Torvalds  * data structure and functionality definitions
31da177e4SLinus Torvalds  */
41da177e4SLinus Torvalds 
5bc4768ebSJulius Volz #ifndef _NET_IP_VS_H
6bc4768ebSJulius Volz #define _NET_IP_VS_H
71da177e4SLinus Torvalds 
8bc4768ebSJulius Volz #include <linux/ip_vs.h>                /* definitions shared with userland */
91da177e4SLinus Torvalds 
10bc4768ebSJulius Volz #include <asm/types.h>                  /* for __uXX types */
11bc4768ebSJulius Volz 
121da177e4SLinus Torvalds #include <linux/list.h>                 /* for struct list_head */
131da177e4SLinus Torvalds #include <linux/spinlock.h>             /* for struct rwlock_t */
1460063497SArun Sharma #include <linux/atomic.h>               /* for struct atomic_t */
151da177e4SLinus Torvalds #include <linux/compiler.h>
1614c85021SArnaldo Carvalho de Melo #include <linux/timer.h>
17187f1882SPaul Gortmaker #include <linux/bug.h>
181da177e4SLinus Torvalds 
1914c85021SArnaldo Carvalho de Melo #include <net/checksum.h>
20e7ade46aSJulius Volz #include <linux/netfilter.h>		/* for union nf_inet_addr */
211668e010SKOVACS Krisztian #include <linux/ip.h>
22e7ade46aSJulius Volz #include <linux/ipv6.h>			/* for struct ipv6hdr */
234e3fd7a0SAlexey Dobriyan #include <net/ipv6.h>
2454d83efaSJesper Dangaard Brouer #if IS_ENABLED(CONFIG_IP_VS_IPV6)
2563dca2c0SJesper Dangaard Brouer #include <linux/netfilter_ipv6/ip6_tables.h>
2663dca2c0SJesper Dangaard Brouer #endif
27a638e514SJesper Dangaard Brouer #if IS_ENABLED(CONFIG_NF_CONNTRACK)
28f4bc17cdSJulian Anastasov #include <net/netfilter/nf_conntrack.h>
29f4bc17cdSJulian Anastasov #endif
3061b1ab45SHans Schillstrom #include <net/net_namespace.h>		/* Netw namespace */
3161b1ab45SHans Schillstrom 
3207dcc686SSimon Horman /* Generic access of ipvs struct */
3361b1ab45SHans Schillstrom static inline struct netns_ipvs *net_ipvs(struct net* net)
3461b1ab45SHans Schillstrom {
3561b1ab45SHans Schillstrom 	return net->ipvs;
3661b1ab45SHans Schillstrom }
3707dcc686SSimon Horman 
3807dcc686SSimon Horman /* Get net ptr from skb in traffic cases
39fc723250SHans Schillstrom  * use skb_sknet when call is from userland (ioctl or netlink)
40fc723250SHans Schillstrom  */
41a0840e2eSHans Schillstrom static inline struct net *skb_net(const struct sk_buff *skb)
42fc723250SHans Schillstrom {
43fc723250SHans Schillstrom #ifdef CONFIG_NET_NS
44fc723250SHans Schillstrom #ifdef CONFIG_IP_VS_DEBUG
45fc723250SHans Schillstrom 	/*
46fc723250SHans Schillstrom 	 * This is used for debug only.
47fc723250SHans Schillstrom 	 * Start with the most likely hit
48fc723250SHans Schillstrom 	 * End with BUG
49fc723250SHans Schillstrom 	 */
500c5c9fb5SEric W. Biederman 	if (likely(skb->dev && dev_net(skb->dev)))
51fc723250SHans Schillstrom 		return dev_net(skb->dev);
52a09d1977SHans Schillstrom 	if (skb_dst(skb) && skb_dst(skb)->dev)
53fc723250SHans Schillstrom 		return dev_net(skb_dst(skb)->dev);
54fc723250SHans Schillstrom 	WARN(skb->sk, "Maybe skb_sknet should be used in %s() at line:%d\n",
55fc723250SHans Schillstrom 		      __func__, __LINE__);
560c5c9fb5SEric W. Biederman 	if (likely(skb->sk && sock_net(skb->sk)))
57fc723250SHans Schillstrom 		return sock_net(skb->sk);
58fc723250SHans Schillstrom 	pr_err("There is no net ptr to find in the skb in %s() line:%d\n",
59fc723250SHans Schillstrom 		__func__, __LINE__);
60fc723250SHans Schillstrom 	BUG();
61fc723250SHans Schillstrom #else
62fc723250SHans Schillstrom 	return dev_net(skb->dev ? : skb_dst(skb)->dev);
63fc723250SHans Schillstrom #endif
64fc723250SHans Schillstrom #else
65fc723250SHans Schillstrom 	return &init_net;
66fc723250SHans Schillstrom #endif
67fc723250SHans Schillstrom }
68fc723250SHans Schillstrom 
69a0840e2eSHans Schillstrom static inline struct net *skb_sknet(const struct sk_buff *skb)
70fc723250SHans Schillstrom {
71fc723250SHans Schillstrom #ifdef CONFIG_NET_NS
72fc723250SHans Schillstrom #ifdef CONFIG_IP_VS_DEBUG
73fc723250SHans Schillstrom 	/* Start with the most likely hit */
740c5c9fb5SEric W. Biederman 	if (likely(skb->sk && sock_net(skb->sk)))
75fc723250SHans Schillstrom 		return sock_net(skb->sk);
76fc723250SHans Schillstrom 	WARN(skb->dev, "Maybe skb_net should be used instead in %s() line:%d\n",
77fc723250SHans Schillstrom 		       __func__, __LINE__);
780c5c9fb5SEric W. Biederman 	if (likely(skb->dev && dev_net(skb->dev)))
79fc723250SHans Schillstrom 		return dev_net(skb->dev);
80fc723250SHans Schillstrom 	pr_err("There is no net ptr to find in the skb in %s() line:%d\n",
81fc723250SHans Schillstrom 		__func__, __LINE__);
82fc723250SHans Schillstrom 	BUG();
83fc723250SHans Schillstrom #else
84fc723250SHans Schillstrom 	return sock_net(skb->sk);
85fc723250SHans Schillstrom #endif
86fc723250SHans Schillstrom #else
87fc723250SHans Schillstrom 	return &init_net;
88fc723250SHans Schillstrom #endif
89fc723250SHans Schillstrom }
9007dcc686SSimon Horman 
9107dcc686SSimon Horman /* This one needed for single_open_net since net is stored directly in
9225985edcSLucas De Marchi  * private not as a struct i.e. seq_file_net can't be used.
93b17fc996SHans Schillstrom  */
94b17fc996SHans Schillstrom static inline struct net *seq_file_single_net(struct seq_file *seq)
95b17fc996SHans Schillstrom {
96b17fc996SHans Schillstrom #ifdef CONFIG_NET_NS
97b17fc996SHans Schillstrom 	return (struct net *)seq->private;
98b17fc996SHans Schillstrom #else
99b17fc996SHans Schillstrom 	return &init_net;
100b17fc996SHans Schillstrom #endif
101b17fc996SHans Schillstrom }
1026f7edb48SCatalin(ux) M. BOIE 
/* Connection table size value; ip_vs_ctl.c needs to read it */
extern int ip_vs_conn_tab_size;
1056f7edb48SCatalin(ux) M. BOIE 
10664aae3cbSJulius Volz struct ip_vs_iphdr {
107*b0e010c5SAlex Gartrell 	__u32 off;	/* Where IP or IPv4 header starts */
10863dca2c0SJesper Dangaard Brouer 	__u32 len;	/* IPv4 simply where L4 starts
10907dcc686SSimon Horman 			 * IPv6 where L4 Transport Header starts */
11063dca2c0SJesper Dangaard Brouer 	__u16 fragoffs; /* IPv6 fragment offset, 0 if first frag (or not frag)*/
11163dca2c0SJesper Dangaard Brouer 	__s16 protocol;
11263dca2c0SJesper Dangaard Brouer 	__s32 flags;
11364aae3cbSJulius Volz 	union nf_inet_addr saddr;
11464aae3cbSJulius Volz 	union nf_inet_addr daddr;
11564aae3cbSJulius Volz };
11664aae3cbSJulius Volz 
/* Fetch @len bytes at @offset of @skb via skb_header_pointer(), using
 * @buffer as the copy target.  @ipvsh is accepted but not consulted.
 */
static inline void *frag_safe_skb_hp(const struct sk_buff *skb, int offset,
				      int len, void *buffer,
				      const struct ip_vs_iphdr *ipvsh)
{
	void *hdr = skb_header_pointer(skb, offset, len, buffer);

	return hdr;
}
1232f74713dSJesper Dangaard Brouer 
12463dca2c0SJesper Dangaard Brouer /* This function handles filling *ip_vs_iphdr, both for IPv4 and IPv6.
12563dca2c0SJesper Dangaard Brouer  * IPv6 requires some extra work, as finding proper header position,
12663dca2c0SJesper Dangaard Brouer  * depend on the IPv6 extension headers.
12763dca2c0SJesper Dangaard Brouer  */
128*b0e010c5SAlex Gartrell static inline int
129*b0e010c5SAlex Gartrell ip_vs_fill_iph_skb_off(int af, const struct sk_buff *skb, int offset,
130*b0e010c5SAlex Gartrell 		       struct ip_vs_iphdr *iphdr)
13164aae3cbSJulius Volz {
132*b0e010c5SAlex Gartrell 	iphdr->off = offset;
13364aae3cbSJulius Volz #ifdef CONFIG_IP_VS_IPV6
13464aae3cbSJulius Volz 	if (af == AF_INET6) {
135*b0e010c5SAlex Gartrell 		struct ipv6hdr _iph;
136*b0e010c5SAlex Gartrell 		const struct ipv6hdr *iph = skb_header_pointer(
137*b0e010c5SAlex Gartrell 			skb, offset, sizeof(_iph), &_iph);
138*b0e010c5SAlex Gartrell 		if (!iph)
139*b0e010c5SAlex Gartrell 			return 0;
140*b0e010c5SAlex Gartrell 
1414e3fd7a0SAlexey Dobriyan 		iphdr->saddr.in6 = iph->saddr;
1424e3fd7a0SAlexey Dobriyan 		iphdr->daddr.in6 = iph->daddr;
1436aafeef0SJiri Pirko 		/* ipv6_find_hdr() updates len, flags */
144*b0e010c5SAlex Gartrell 		iphdr->len	 = offset;
14563dca2c0SJesper Dangaard Brouer 		iphdr->flags	 = 0;
14663dca2c0SJesper Dangaard Brouer 		iphdr->protocol  = ipv6_find_hdr(skb, &iphdr->len, -1,
14763dca2c0SJesper Dangaard Brouer 						 &iphdr->fragoffs,
14863dca2c0SJesper Dangaard Brouer 						 &iphdr->flags);
149*b0e010c5SAlex Gartrell 		if (iphdr->protocol < 0)
150*b0e010c5SAlex Gartrell 			return 0;
15164aae3cbSJulius Volz 	} else
15264aae3cbSJulius Volz #endif
15364aae3cbSJulius Volz 	{
154*b0e010c5SAlex Gartrell 		struct iphdr _iph;
155*b0e010c5SAlex Gartrell 		const struct iphdr *iph = skb_header_pointer(
156*b0e010c5SAlex Gartrell 			skb, offset, sizeof(_iph), &_iph);
157*b0e010c5SAlex Gartrell 		if (!iph)
158*b0e010c5SAlex Gartrell 			return 0;
159*b0e010c5SAlex Gartrell 
160*b0e010c5SAlex Gartrell 		iphdr->len	= offset + iph->ihl * 4;
16163dca2c0SJesper Dangaard Brouer 		iphdr->fragoffs	= 0;
16264aae3cbSJulius Volz 		iphdr->protocol	= iph->protocol;
16364aae3cbSJulius Volz 		iphdr->saddr.ip	= iph->saddr;
16464aae3cbSJulius Volz 		iphdr->daddr.ip	= iph->daddr;
16564aae3cbSJulius Volz 	}
166*b0e010c5SAlex Gartrell 
167*b0e010c5SAlex Gartrell 	return 1;
168*b0e010c5SAlex Gartrell }
169*b0e010c5SAlex Gartrell 
/* Same as ip_vs_fill_iph_skb_off(), with the header taken to start at
 * the skb's network offset.
 */
static inline int
ip_vs_fill_iph_skb(int af, const struct sk_buff *skb, struct ip_vs_iphdr *iphdr)
{
	int offset = skb_network_offset(skb);

	return ip_vs_fill_iph_skb_off(af, skb, offset, iphdr);
}
17564aae3cbSJulius Volz 
17664aae3cbSJulius Volz static inline void ip_vs_addr_copy(int af, union nf_inet_addr *dst,
17764aae3cbSJulius Volz 				   const union nf_inet_addr *src)
17864aae3cbSJulius Volz {
17964aae3cbSJulius Volz #ifdef CONFIG_IP_VS_IPV6
18064aae3cbSJulius Volz 	if (af == AF_INET6)
1814e3fd7a0SAlexey Dobriyan 		dst->in6 = src->in6;
18264aae3cbSJulius Volz 	else
18364aae3cbSJulius Volz #endif
18464aae3cbSJulius Volz 	dst->ip = src->ip;
18564aae3cbSJulius Volz }
18664aae3cbSJulius Volz 
1879a05475cSJulian Anastasov static inline void ip_vs_addr_set(int af, union nf_inet_addr *dst,
1889a05475cSJulian Anastasov 				  const union nf_inet_addr *src)
1899a05475cSJulian Anastasov {
1909a05475cSJulian Anastasov #ifdef CONFIG_IP_VS_IPV6
1919a05475cSJulian Anastasov 	if (af == AF_INET6) {
1929a05475cSJulian Anastasov 		dst->in6 = src->in6;
1939a05475cSJulian Anastasov 		return;
1949a05475cSJulian Anastasov 	}
1959a05475cSJulian Anastasov #endif
1969a05475cSJulian Anastasov 	dst->ip = src->ip;
1979a05475cSJulian Anastasov 	dst->all[1] = 0;
1989a05475cSJulian Anastasov 	dst->all[2] = 0;
1999a05475cSJulian Anastasov 	dst->all[3] = 0;
2009a05475cSJulian Anastasov }
2019a05475cSJulian Anastasov 
20264aae3cbSJulius Volz static inline int ip_vs_addr_equal(int af, const union nf_inet_addr *a,
20364aae3cbSJulius Volz 				   const union nf_inet_addr *b)
20464aae3cbSJulius Volz {
20564aae3cbSJulius Volz #ifdef CONFIG_IP_VS_IPV6
20664aae3cbSJulius Volz 	if (af == AF_INET6)
20764aae3cbSJulius Volz 		return ipv6_addr_equal(&a->in6, &b->in6);
20864aae3cbSJulius Volz #endif
20964aae3cbSJulius Volz 	return a->ip == b->ip;
21064aae3cbSJulius Volz }
21164aae3cbSJulius Volz 
2121da177e4SLinus Torvalds #ifdef CONFIG_IP_VS_DEBUG
21314c85021SArnaldo Carvalho de Melo #include <linux/net.h>
21414c85021SArnaldo Carvalho de Melo 
2155c3a0fd7SJoe Perches int ip_vs_get_debug_level(void);
216c842a3adSJulius Volz 
217c842a3adSJulius Volz static inline const char *ip_vs_dbg_addr(int af, char *buf, size_t buf_len,
218c842a3adSJulius Volz 					 const union nf_inet_addr *addr,
219c842a3adSJulius Volz 					 int *idx)
220c842a3adSJulius Volz {
221c842a3adSJulius Volz 	int len;
222c842a3adSJulius Volz #ifdef CONFIG_IP_VS_IPV6
223c842a3adSJulius Volz 	if (af == AF_INET6)
224120b9c14SJesper Dangaard Brouer 		len = snprintf(&buf[*idx], buf_len - *idx, "[%pI6c]",
2250c6ce78aSHarvey Harrison 			       &addr->in6) + 1;
226c842a3adSJulius Volz 	else
227c842a3adSJulius Volz #endif
2283685f25dSHarvey Harrison 		len = snprintf(&buf[*idx], buf_len - *idx, "%pI4",
2293685f25dSHarvey Harrison 			       &addr->ip) + 1;
230c842a3adSJulius Volz 
231c842a3adSJulius Volz 	*idx += len;
232c842a3adSJulius Volz 	BUG_ON(*idx > buf_len + 1);
233c842a3adSJulius Volz 	return &buf[*idx - len];
234c842a3adSJulius Volz }
235c842a3adSJulius Volz 
/* Like IP_VS_DBG(), but additionally declares the scratch buffer and
 * index that IP_VS_DBG_ADDR() formats addresses into.
 */
#define IP_VS_DBG_BUF(level, msg, ...)					\
	do {								\
		char ip_vs_dbg_buf[160];				\
		int ip_vs_dbg_idx = 0;					\
		if ((level) <= ip_vs_get_debug_level())			\
			printk(KERN_DEBUG pr_fmt(msg), ##__VA_ARGS__);	\
	} while (0)
/* pr_err() with the IP_VS_DBG_ADDR() scratch buffer in scope */
#define IP_VS_ERR_BUF(msg...)						\
	do {								\
		char ip_vs_dbg_buf[160];				\
		int ip_vs_dbg_idx = 0;					\
		pr_err(msg);						\
	} while (0)

/* Only use from within IP_VS_DBG_BUF() or IP_VS_ERR_BUF macros */
#define IP_VS_DBG_ADDR(af, addr)					\
	ip_vs_dbg_addr(af, ip_vs_dbg_buf,				\
		       sizeof(ip_vs_dbg_buf), addr,			\
		       &ip_vs_dbg_idx)

/* Print at KERN_DEBUG when @level does not exceed the debug level.
 * @level is parenthesized so that any expression can be passed.
 */
#define IP_VS_DBG(level, msg, ...)					\
	do {								\
		if ((level) <= ip_vs_get_debug_level())			\
			printk(KERN_DEBUG pr_fmt(msg), ##__VA_ARGS__);	\
	} while (0)
/* Print at KERN_DEBUG, gated by net_ratelimit() only */
#define IP_VS_DBG_RL(msg, ...)						\
	do {								\
		if (net_ratelimit())					\
			printk(KERN_DEBUG pr_fmt(msg), ##__VA_ARGS__);	\
	} while (0)
/* Dump a packet through the protocol's ->debug_packet() hook */
#define IP_VS_DBG_PKT(level, af, pp, skb, ofs, msg)			\
	do {								\
		if ((level) <= ip_vs_get_debug_level())			\
			(pp)->debug_packet(af, pp, skb, ofs, msg);	\
	} while (0)
/* Rate-limited variant of IP_VS_DBG_PKT() */
#define IP_VS_DBG_RL_PKT(level, af, pp, skb, ofs, msg)			\
	do {								\
		if ((level) <= ip_vs_get_debug_level() &&		\
		    net_ratelimit())					\
			(pp)->debug_packet(af, pp, skb, ofs, msg);	\
	} while (0)
2771da177e4SLinus Torvalds #else	/* NO DEBUGGING at ALL */
/* Debugging compiled out: every debug macro expands to an empty
 * statement and evaluates none of its arguments.
 */
#define IP_VS_DBG_BUF(level, msg...)			do {} while (0)
#define IP_VS_ERR_BUF(msg...)				do {} while (0)
#define IP_VS_DBG(level, msg...)			do {} while (0)
#define IP_VS_DBG_RL(msg...)				do {} while (0)
#define IP_VS_DBG_PKT(level, af, pp, skb, ofs, msg)	do {} while (0)
#define IP_VS_DBG_RL_PKT(level, af, pp, skb, ofs, msg)	do {} while (0)
2841da177e4SLinus Torvalds #endif
2851da177e4SLinus Torvalds 
/* IPVS spelling of BUG() */
#define IP_VS_BUG() BUG()
/* pr_err() that only fires when net_ratelimit() permits it */
#define IP_VS_ERR_RL(msg, ...)						\
	do {								\
		if (net_ratelimit())					\
			pr_err(msg, ##__VA_ARGS__);			\
	} while (0)
2921da177e4SLinus Torvalds 
/* Function entry/exit tracing.  With CONFIG_IP_VS_DEBUG each macro
 * prints the function, file and line at KERN_DEBUG when @level does
 * not exceed ip_vs_get_debug_level(); otherwise both are no-ops.
 * @level is parenthesized so that any expression can be passed.
 */
#ifdef CONFIG_IP_VS_DEBUG
#define EnterFunction(level)						\
	do {								\
		if ((level) <= ip_vs_get_debug_level())			\
			printk(KERN_DEBUG				\
			       pr_fmt("Enter: %s, %s line %i\n"),	\
			       __func__, __FILE__, __LINE__);		\
	} while (0)
#define LeaveFunction(level)						\
	do {								\
		if ((level) <= ip_vs_get_debug_level())			\
			printk(KERN_DEBUG				\
			       pr_fmt("Leave: %s, %s line %i\n"),	\
			       __func__, __FILE__, __LINE__);		\
	} while (0)
#else
#define EnterFunction(level)   do {} while (0)
#define LeaveFunction(level)   do {} while (0)
#endif
3121da177e4SLinus Torvalds 
/* FTP port numbers (21 and 20), converted with cpu_to_be16() so they
 * are in network byte order.
 */
#define FTPPORT  cpu_to_be16(21)
#define FTPDATA  cpu_to_be16(20)
3161da177e4SLinus Torvalds 
/* TCP state values.  Numbering starts at 0 and IP_VS_TCP_S_LAST ends
 * up equal to the number of states listed before it.
 */
enum {
	IP_VS_TCP_S_NONE = 0,
	IP_VS_TCP_S_ESTABLISHED,
	IP_VS_TCP_S_SYN_SENT,
	IP_VS_TCP_S_SYN_RECV,
	IP_VS_TCP_S_FIN_WAIT,
	IP_VS_TCP_S_TIME_WAIT,
	IP_VS_TCP_S_CLOSE,
	IP_VS_TCP_S_CLOSE_WAIT,
	IP_VS_TCP_S_LAST_ACK,
	IP_VS_TCP_S_LISTEN,
	IP_VS_TCP_S_SYNACK,
	IP_VS_TCP_S_LAST	/* count of the states above */
};
3321da177e4SLinus Torvalds 
/* UDP state values: a single state followed by the count sentinel */
enum {
	IP_VS_UDP_S_NORMAL = 0,
	IP_VS_UDP_S_LAST,	/* count of the states above */
};
3381da177e4SLinus Torvalds 
/* ICMP state values: a single state followed by the count sentinel */
enum {
	IP_VS_ICMP_S_NORMAL = 0,
	IP_VS_ICMP_S_LAST,	/* count of the states above */
};
3441da177e4SLinus Torvalds 
/* SCTP state values.  Numbering starts at 0 and IP_VS_SCTP_S_LAST ends
 * up equal to the number of states listed before it.
 */
enum ip_vs_sctp_states {
	IP_VS_SCTP_S_NONE = 0,
	IP_VS_SCTP_S_INIT1,
	IP_VS_SCTP_S_INIT,
	IP_VS_SCTP_S_COOKIE_SENT,
	IP_VS_SCTP_S_COOKIE_REPLIED,
	IP_VS_SCTP_S_COOKIE_WAIT,
	IP_VS_SCTP_S_COOKIE,
	IP_VS_SCTP_S_COOKIE_ECHOED,
	IP_VS_SCTP_S_ESTABLISHED,
	IP_VS_SCTP_S_SHUTDOWN_SENT,
	IP_VS_SCTP_S_SHUTDOWN_RECEIVED,
	IP_VS_SCTP_S_SHUTDOWN_ACK_SENT,
	IP_VS_SCTP_S_REJECTED,
	IP_VS_SCTP_S_CLOSED,
	IP_VS_SCTP_S_LAST	/* count of the states above */
};
3632906f66aSVenkata Mohan Reddy 
36407dcc686SSimon Horman /* Delta sequence info structure
3651da177e4SLinus Torvalds  * Each ip_vs_conn has 2 (output AND input seq. changes).
3661da177e4SLinus Torvalds  * Only used in the VS/NAT.
3671da177e4SLinus Torvalds  */
3681da177e4SLinus Torvalds struct ip_vs_seq {
3691da177e4SLinus Torvalds 	__u32			init_seq;	/* Add delta from this seq */
3701da177e4SLinus Torvalds 	__u32			delta;		/* Delta in sequence numbers */
3711da177e4SLinus Torvalds 	__u32			previous_delta;	/* Delta in sequence numbers
37207dcc686SSimon Horman 						 * before last resized pkt */
3731da177e4SLinus Torvalds };
3741da177e4SLinus Torvalds 
37507dcc686SSimon Horman /* counters per cpu */
376b17fc996SHans Schillstrom struct ip_vs_counters {
377cd67cd5eSJulian Anastasov 	__u64		conns;		/* connections scheduled */
378cd67cd5eSJulian Anastasov 	__u64		inpkts;		/* incoming packets */
379cd67cd5eSJulian Anastasov 	__u64		outpkts;	/* outgoing packets */
380b17fc996SHans Schillstrom 	__u64		inbytes;	/* incoming bytes */
381b17fc996SHans Schillstrom 	__u64		outbytes;	/* outgoing bytes */
382b17fc996SHans Schillstrom };
38307dcc686SSimon Horman /* Stats per cpu */
384b17fc996SHans Schillstrom struct ip_vs_cpu_stats {
385cd67cd5eSJulian Anastasov 	struct ip_vs_counters   cnt;
386b17fc996SHans Schillstrom 	struct u64_stats_sync   syncp;
387b17fc996SHans Schillstrom };
3881da177e4SLinus Torvalds 
38907dcc686SSimon Horman /* IPVS statistics objects */
3903a14a313SSven Wegener struct ip_vs_estimator {
3913a14a313SSven Wegener 	struct list_head	list;
3923a14a313SSven Wegener 
3933a14a313SSven Wegener 	u64			last_inbytes;
3943a14a313SSven Wegener 	u64			last_outbytes;
395cd67cd5eSJulian Anastasov 	u64			last_conns;
396cd67cd5eSJulian Anastasov 	u64			last_inpkts;
397cd67cd5eSJulian Anastasov 	u64			last_outpkts;
3983a14a313SSven Wegener 
399cd67cd5eSJulian Anastasov 	u64			cps;
400cd67cd5eSJulian Anastasov 	u64			inpps;
401cd67cd5eSJulian Anastasov 	u64			outpps;
402cd67cd5eSJulian Anastasov 	u64			inbps;
403cd67cd5eSJulian Anastasov 	u64			outbps;
404cd67cd5eSJulian Anastasov };
405cd67cd5eSJulian Anastasov 
406cd67cd5eSJulian Anastasov /*
407cd67cd5eSJulian Anastasov  * IPVS statistics object, 64-bit kernel version of struct ip_vs_stats_user
408cd67cd5eSJulian Anastasov  */
409cd67cd5eSJulian Anastasov struct ip_vs_kstats {
410cd67cd5eSJulian Anastasov 	u64			conns;		/* connections scheduled */
411cd67cd5eSJulian Anastasov 	u64			inpkts;		/* incoming packets */
412cd67cd5eSJulian Anastasov 	u64			outpkts;	/* outgoing packets */
413cd67cd5eSJulian Anastasov 	u64			inbytes;	/* incoming bytes */
414cd67cd5eSJulian Anastasov 	u64			outbytes;	/* outgoing bytes */
415cd67cd5eSJulian Anastasov 
416cd67cd5eSJulian Anastasov 	u64			cps;		/* current connection rate */
417cd67cd5eSJulian Anastasov 	u64			inpps;		/* current in packet rate */
418cd67cd5eSJulian Anastasov 	u64			outpps;		/* current out packet rate */
419cd67cd5eSJulian Anastasov 	u64			inbps;		/* current in byte rate */
420cd67cd5eSJulian Anastasov 	u64			outbps;		/* current out byte rate */
4213a14a313SSven Wegener };
4223a14a313SSven Wegener 
423fd2c3ef7SEric Dumazet struct ip_vs_stats {
424cd67cd5eSJulian Anastasov 	struct ip_vs_kstats	kstats;		/* kernel statistics */
425e9c0ce23SSven Wegener 	struct ip_vs_estimator	est;		/* estimator */
426b962abdcSJulian Anastasov 	struct ip_vs_cpu_stats __percpu	*cpustats;	/* per cpu counters */
4271da177e4SLinus Torvalds 	spinlock_t		lock;		/* spin lock */
428cd67cd5eSJulian Anastasov 	struct ip_vs_kstats	kstats0;	/* reset values */
4291da177e4SLinus Torvalds };
4301da177e4SLinus Torvalds 
/* Forward declarations for types referenced by pointer below */
struct dst_entry;
struct iphdr;
struct sk_buff;
struct ip_vs_app;
struct ip_vs_conn;
struct ip_vs_proto_data;
4371da177e4SLinus Torvalds 
4381da177e4SLinus Torvalds struct ip_vs_protocol {
4391da177e4SLinus Torvalds 	struct ip_vs_protocol	*next;
4401da177e4SLinus Torvalds 	char			*name;
4412ad17defSJulian Anastasov 	u16			protocol;
4422ad17defSJulian Anastasov 	u16			num_states;
4431da177e4SLinus Torvalds 	int			dont_defrag;
4441da177e4SLinus Torvalds 
4451da177e4SLinus Torvalds 	void (*init)(struct ip_vs_protocol *pp);
4461da177e4SLinus Torvalds 
4471da177e4SLinus Torvalds 	void (*exit)(struct ip_vs_protocol *pp);
4481da177e4SLinus Torvalds 
449582b8e3eSHans Schillstrom 	int (*init_netns)(struct net *net, struct ip_vs_proto_data *pd);
450252c6410SHans Schillstrom 
451252c6410SHans Schillstrom 	void (*exit_netns)(struct net *net, struct ip_vs_proto_data *pd);
452252c6410SHans Schillstrom 
45351ef348bSJulius Volz 	int (*conn_schedule)(int af, struct sk_buff *skb,
4549330419dSHans Schillstrom 			     struct ip_vs_proto_data *pd,
455d4383f04SJesper Dangaard Brouer 			     int *verdict, struct ip_vs_conn **cpp,
456d4383f04SJesper Dangaard Brouer 			     struct ip_vs_iphdr *iph);
4571da177e4SLinus Torvalds 
4581da177e4SLinus Torvalds 	struct ip_vs_conn *
45951ef348bSJulius Volz 	(*conn_in_get)(int af,
46051ef348bSJulius Volz 		       const struct sk_buff *skb,
46151ef348bSJulius Volz 		       const struct ip_vs_iphdr *iph,
4621da177e4SLinus Torvalds 		       int inverse);
4631da177e4SLinus Torvalds 
4641da177e4SLinus Torvalds 	struct ip_vs_conn *
46551ef348bSJulius Volz 	(*conn_out_get)(int af,
46651ef348bSJulius Volz 			const struct sk_buff *skb,
46751ef348bSJulius Volz 			const struct ip_vs_iphdr *iph,
4681da177e4SLinus Torvalds 			int inverse);
4691da177e4SLinus Torvalds 
470d4383f04SJesper Dangaard Brouer 	int (*snat_handler)(struct sk_buff *skb, struct ip_vs_protocol *pp,
471d4383f04SJesper Dangaard Brouer 			    struct ip_vs_conn *cp, struct ip_vs_iphdr *iph);
4721da177e4SLinus Torvalds 
473d4383f04SJesper Dangaard Brouer 	int (*dnat_handler)(struct sk_buff *skb, struct ip_vs_protocol *pp,
474d4383f04SJesper Dangaard Brouer 			    struct ip_vs_conn *cp, struct ip_vs_iphdr *iph);
4751da177e4SLinus Torvalds 
47651ef348bSJulius Volz 	int (*csum_check)(int af, struct sk_buff *skb,
47751ef348bSJulius Volz 			  struct ip_vs_protocol *pp);
4781da177e4SLinus Torvalds 
4791da177e4SLinus Torvalds 	const char *(*state_name)(int state);
4801da177e4SLinus Torvalds 
4814a516f11SSimon Horman 	void (*state_transition)(struct ip_vs_conn *cp, int direction,
4821da177e4SLinus Torvalds 				 const struct sk_buff *skb,
4839330419dSHans Schillstrom 				 struct ip_vs_proto_data *pd);
4841da177e4SLinus Torvalds 
485ab8a5e84SHans Schillstrom 	int (*register_app)(struct net *net, struct ip_vs_app *inc);
4861da177e4SLinus Torvalds 
487ab8a5e84SHans Schillstrom 	void (*unregister_app)(struct net *net, struct ip_vs_app *inc);
4881da177e4SLinus Torvalds 
4891da177e4SLinus Torvalds 	int (*app_conn_bind)(struct ip_vs_conn *cp);
4901da177e4SLinus Torvalds 
4910d79641aSJulian Anastasov 	void (*debug_packet)(int af, struct ip_vs_protocol *pp,
4921da177e4SLinus Torvalds 			     const struct sk_buff *skb,
4931da177e4SLinus Torvalds 			     int offset,
4941da177e4SLinus Torvalds 			     const char *msg);
4951da177e4SLinus Torvalds 
4969330419dSHans Schillstrom 	void (*timeout_change)(struct ip_vs_proto_data *pd, int flags);
4971da177e4SLinus Torvalds };
4981da177e4SLinus Torvalds 
49907dcc686SSimon Horman /* protocol data per netns */
500252c6410SHans Schillstrom struct ip_vs_proto_data {
501252c6410SHans Schillstrom 	struct ip_vs_proto_data	*next;
502252c6410SHans Schillstrom 	struct ip_vs_protocol	*pp;
503252c6410SHans Schillstrom 	int			*timeout_table;	/* protocol timeout table */
504252c6410SHans Schillstrom 	atomic_t		appcnt;		/* counter of proto app incs. */
505252c6410SHans Schillstrom 	struct tcp_states_t	*tcp_state_table;
506252c6410SHans Schillstrom };
507252c6410SHans Schillstrom 
/* Lookups by protocol number: the protocol descriptor, and the
 * per-netns protocol data for @net.
 */
struct ip_vs_protocol *ip_vs_proto_get(unsigned short proto);
struct ip_vs_proto_data *ip_vs_proto_data_get(struct net *net,
					      unsigned short proto);
5111da177e4SLinus Torvalds 
512f11017ecSSimon Horman struct ip_vs_conn_param {
5136e67e586SHans Schillstrom 	struct net			*net;
514f11017ecSSimon Horman 	const union nf_inet_addr	*caddr;
515f11017ecSSimon Horman 	const union nf_inet_addr	*vaddr;
516f11017ecSSimon Horman 	__be16				cport;
517f11017ecSSimon Horman 	__be16				vport;
518f11017ecSSimon Horman 	__u16				protocol;
519f11017ecSSimon Horman 	u16				af;
52085999283SSimon Horman 
52185999283SSimon Horman 	const struct ip_vs_pe		*pe;
52285999283SSimon Horman 	char				*pe_data;
52385999283SSimon Horman 	__u8				pe_data_len;
524f11017ecSSimon Horman };
525f11017ecSSimon Horman 
52607dcc686SSimon Horman /* IP_VS structure allocated for each dynamically scheduled connection */
5271da177e4SLinus Torvalds struct ip_vs_conn {
528731109e7SChangli Gao 	struct hlist_node	c_list;         /* hashed list heads */
5291da177e4SLinus Torvalds 	/* Protocol, addresses and port numbers */
5306e67e586SHans Schillstrom 	__be16                  cport;
5316e67e586SHans Schillstrom 	__be16                  dport;
5321845ed0bSJulian Anastasov 	__be16                  vport;
5331845ed0bSJulian Anastasov 	u16			af;		/* address family */
534e7ade46aSJulius Volz 	union nf_inet_addr      caddr;          /* client address */
535e7ade46aSJulius Volz 	union nf_inet_addr      vaddr;          /* virtual address */
536e7ade46aSJulius Volz 	union nf_inet_addr      daddr;          /* destination address */
5373575792eSJulian Anastasov 	volatile __u32          flags;          /* status flags */
5381da177e4SLinus Torvalds 	__u16                   protocol;       /* Which protocol (TCP/UDP) */
539ba38528aSAlex Gartrell 	__u16			daf;		/* Address family of the dest */
5401845ed0bSJulian Anastasov #ifdef CONFIG_NET_NS
5411845ed0bSJulian Anastasov 	struct net              *net;           /* Name space */
5421845ed0bSJulian Anastasov #endif
5431da177e4SLinus Torvalds 
5441da177e4SLinus Torvalds 	/* counter and timer */
5451da177e4SLinus Torvalds 	atomic_t		refcnt;		/* reference count */
5461da177e4SLinus Torvalds 	struct timer_list	timer;		/* Expiration timer */
5471da177e4SLinus Torvalds 	volatile unsigned long	timeout;	/* timeout */
5481da177e4SLinus Torvalds 
5491da177e4SLinus Torvalds 	/* Flags and state transition */
5501da177e4SLinus Torvalds 	spinlock_t              lock;           /* lock for state transition */
5511da177e4SLinus Torvalds 	volatile __u16          state;          /* state info */
552efac5276SRumen G. Bogdanovski 	volatile __u16          old_state;      /* old state, to be used for
553efac5276SRumen G. Bogdanovski 						 * state transition triggerd
554efac5276SRumen G. Bogdanovski 						 * synchronization
555efac5276SRumen G. Bogdanovski 						 */
5561845ed0bSJulian Anastasov 	__u32			fwmark;		/* Fire wall mark from skb */
557749c42b6SJulian Anastasov 	unsigned long		sync_endtime;	/* jiffies + sent_retries */
5581da177e4SLinus Torvalds 
5591da177e4SLinus Torvalds 	/* Control members */
5601da177e4SLinus Torvalds 	struct ip_vs_conn       *control;       /* Master control connection */
5611da177e4SLinus Torvalds 	atomic_t                n_control;      /* Number of controlled ones */
5621da177e4SLinus Torvalds 	struct ip_vs_dest       *dest;          /* real server */
5631da177e4SLinus Torvalds 	atomic_t                in_pkts;        /* incoming packet counter */
5641da177e4SLinus Torvalds 
56507dcc686SSimon Horman 	/* Packet transmitter for different forwarding methods.  If it
56607dcc686SSimon Horman 	 * mangles the packet, it must return NF_DROP or better NF_STOLEN,
56707dcc686SSimon Horman 	 * otherwise this must be changed to a sk_buff **.
56807dcc686SSimon Horman 	 * NF_ACCEPT can be returned when destination is local.
5691da177e4SLinus Torvalds 	 */
5701da177e4SLinus Torvalds 	int (*packet_xmit)(struct sk_buff *skb, struct ip_vs_conn *cp,
571d4383f04SJesper Dangaard Brouer 			   struct ip_vs_protocol *pp, struct ip_vs_iphdr *iph);
5721da177e4SLinus Torvalds 
5731da177e4SLinus Torvalds 	/* Note: we can group the following members into a structure,
57407dcc686SSimon Horman 	 * in order to save more space, and the following members are
57507dcc686SSimon Horman 	 * only used in VS/NAT anyway
57607dcc686SSimon Horman 	 */
5771da177e4SLinus Torvalds 	struct ip_vs_app        *app;           /* bound ip_vs_app object */
5781da177e4SLinus Torvalds 	void                    *app_data;      /* Application private data */
5791da177e4SLinus Torvalds 	struct ip_vs_seq        in_seq;         /* incoming seq. struct */
5801da177e4SLinus Torvalds 	struct ip_vs_seq        out_seq;        /* outgoing seq. struct */
58185999283SSimon Horman 
582e9e5eee8SSimon Horman 	const struct ip_vs_pe	*pe;
58385999283SSimon Horman 	char			*pe_data;
58485999283SSimon Horman 	__u8			pe_data_len;
585088339a5SJulian Anastasov 
586088339a5SJulian Anastasov 	struct rcu_head		rcu_head;
5871da177e4SLinus Torvalds };
5881da177e4SLinus Torvalds 
58907dcc686SSimon Horman /* To save some memory in conn table when name space is disabled.
 *
 * Return the network namespace of connection @cp: the stored cp->net when
 * CONFIG_NET_NS is defined, otherwise always &init_net.
 */
5906e67e586SHans Schillstrom static inline struct net *ip_vs_conn_net(const struct ip_vs_conn *cp)
5916e67e586SHans Schillstrom {
5926e67e586SHans Schillstrom #ifdef CONFIG_NET_NS
5936e67e586SHans Schillstrom 	return cp->net;
5946e67e586SHans Schillstrom #else
5956e67e586SHans Schillstrom 	return &init_net;
5966e67e586SHans Schillstrom #endif
5976e67e586SHans Schillstrom }
59807dcc686SSimon Horman 
/* Store @net as the namespace of connection @cp.  Without CONFIG_NET_NS the
 * body is empty, so nothing is stored.
 */
5996e67e586SHans Schillstrom static inline void ip_vs_conn_net_set(struct ip_vs_conn *cp, struct net *net)
6006e67e586SHans Schillstrom {
6016e67e586SHans Schillstrom #ifdef CONFIG_NET_NS
6026e67e586SHans Schillstrom 	cp->net = net;
6036e67e586SHans Schillstrom #endif
6046e67e586SHans Schillstrom }
6056e67e586SHans Schillstrom 
/* Tell whether connection @cp belongs to namespace @net.
 *
 * Returns non-zero when cp->net == net.  Without CONFIG_NET_NS the
 * comparison is skipped and 1 is always returned.
 */
6066e67e586SHans Schillstrom static inline int ip_vs_conn_net_eq(const struct ip_vs_conn *cp,
6076e67e586SHans Schillstrom 				    struct net *net)
6086e67e586SHans Schillstrom {
6096e67e586SHans Schillstrom #ifdef CONFIG_NET_NS
6106e67e586SHans Schillstrom 	return cp->net == net;
6116e67e586SHans Schillstrom #else
6126e67e586SHans Schillstrom 	return 1;
6136e67e586SHans Schillstrom #endif
6146e67e586SHans Schillstrom }
6151da177e4SLinus Torvalds 
61607dcc686SSimon Horman /* Extended internal versions of struct ip_vs_service_user and ip_vs_dest_user
61707dcc686SSimon Horman  * for IPv6 support.
618c860c6b1SJulius Volz  *
619c860c6b1SJulius Volz  * We need these to conveniently pass around service and destination
620c860c6b1SJulius Volz  * options, but unfortunately, we also need to keep the old definitions to
621c860c6b1SJulius Volz  * maintain userspace backwards compatibility for the setsockopt interface.
622c860c6b1SJulius Volz  */
623c860c6b1SJulius Volz struct ip_vs_service_user_kern {
624c860c6b1SJulius Volz 	/* virtual service addresses */
625c860c6b1SJulius Volz 	u16			af;		/* address family */
626c860c6b1SJulius Volz 	u16			protocol;	/* service protocol */
627c860c6b1SJulius Volz 	union nf_inet_addr	addr;		/* virtual ip address */
6280a925864SJulian Anastasov 	__be16			port;		/* virtual port (__be16) */
629c860c6b1SJulius Volz 	u32			fwmark;		/* firewall mark of service */
630c860c6b1SJulius Volz 
631c860c6b1SJulius Volz 	/* virtual service options */
632c860c6b1SJulius Volz 	char			*sched_name;	/* scheduler name */
6330d1e71b0SSimon Horman 	char			*pe_name;	/* persistence engine name */
63495c96174SEric Dumazet 	unsigned int		flags;		/* virtual service flags */
63595c96174SEric Dumazet 	unsigned int		timeout;	/* persistent timeout in sec */
6360a925864SJulian Anastasov 	__be32			netmask;	/* persistent netmask or plen */
637c860c6b1SJulius Volz };
638c860c6b1SJulius Volz 
639c860c6b1SJulius Volz 
/* Kernel-internal description of one destination (real server): its
 * address, per-server options and connection thresholds.
 */
640c860c6b1SJulius Volz struct ip_vs_dest_user_kern {
641c860c6b1SJulius Volz 	/* destination server address */
642c860c6b1SJulius Volz 	union nf_inet_addr	addr;
6430a925864SJulian Anastasov 	__be16			port;		/* server port (__be16) */
644c860c6b1SJulius Volz 
645c860c6b1SJulius Volz 	/* real server options */
64695c96174SEric Dumazet 	unsigned int		conn_flags;	/* connection flags */
647c860c6b1SJulius Volz 	int			weight;		/* destination weight */
648c860c6b1SJulius Volz 
649c860c6b1SJulius Volz 	/* thresholds for active connections */
650c860c6b1SJulius Volz 	u32			u_threshold;	/* upper threshold */
651c860c6b1SJulius Volz 	u32			l_threshold;	/* lower threshold */
6526cff339bSAlex Gartrell 
6536cff339bSAlex Gartrell 	/* Address family of addr */
6546cff339bSAlex Gartrell 	u16			af;
655c860c6b1SJulius Volz };
656c860c6b1SJulius Volz 
657c860c6b1SJulius Volz 
658c860c6b1SJulius Volz /*
65907dcc686SSimon Horman  * The information about the virtual service offered to the net and the
66007dcc686SSimon Horman  * forwarding entries.
 *
 * A service is linked into two hash tables (s_list and f_list), owns the
 * list of its real servers (destinations) and carries pointers to its bound
 * scheduler and optional persistence engine.
6611da177e4SLinus Torvalds  */
6621da177e4SLinus Torvalds struct ip_vs_service {
663ceec4c38SJulian Anastasov 	struct hlist_node	s_list;   /* for normal service table */
664ceec4c38SJulian Anastasov 	struct hlist_node	f_list;   /* for fwmark-based service table */
6651da177e4SLinus Torvalds 	atomic_t		refcnt;   /* reference counter */
6661da177e4SLinus Torvalds 
667e7ade46aSJulius Volz 	u16			af;       /* address family */
6681da177e4SLinus Torvalds 	__u16			protocol; /* which protocol (TCP/UDP) */
669e7ade46aSJulius Volz 	union nf_inet_addr	addr;	  /* IP address for virtual service */
670014d730dSAl Viro 	__be16			port;	  /* port number for the service */
6711da177e4SLinus Torvalds 	__u32                   fwmark;   /* firewall mark of the service */
67295c96174SEric Dumazet 	unsigned int		flags;	  /* service status flags */
67395c96174SEric Dumazet 	unsigned int		timeout;  /* persistent timeout in ticks */
6740a925864SJulian Anastasov 	__be32			netmask;  /* grouping granularity, mask/plen */
675fc723250SHans Schillstrom 	struct net		*net;	  /* presumably owning netns - confirm */
6761da177e4SLinus Torvalds 
6771da177e4SLinus Torvalds 	struct list_head	destinations;  /* real server d-linked list */
6781da177e4SLinus Torvalds 	__u32			num_dests;     /* number of servers */
6791da177e4SLinus Torvalds 	struct ip_vs_stats      stats;         /* statistics for the service */
6801da177e4SLinus Torvalds 
6811da177e4SLinus Torvalds 	/* for scheduling */
682ceec4c38SJulian Anastasov 	struct ip_vs_scheduler __rcu *scheduler; /* bound scheduler object */
683ba3a3ce1SJulian Anastasov 	spinlock_t		sched_lock;    /* lock sched_data */
6841da177e4SLinus Torvalds 	void			*sched_data;   /* scheduler application data */
68585999283SSimon Horman 
68685999283SSimon Horman 	/* alternate persistence engine */
687ceec4c38SJulian Anastasov 	struct ip_vs_pe __rcu	*pe;
688ceec4c38SJulian Anastasov 
	/* NOTE(review): presumably used for RCU-deferred release - confirm */
689ceec4c38SJulian Anastasov 	struct rcu_head		rcu_head;
6901da177e4SLinus Torvalds };
6911da177e4SLinus Torvalds 
692026ace06SJulian Anastasov /* Information for cached dst */
693026ace06SJulian Anastasov struct ip_vs_dest_dst {
694026ace06SJulian Anastasov 	struct dst_entry	*dst_cache;	/* destination cache entry */
695026ace06SJulian Anastasov 	u32			dst_cookie;	/* presumably validates dst_cache - confirm */
696026ace06SJulian Anastasov 	union nf_inet_addr	dst_saddr;	/* presumably source addr for the route - confirm */
697026ace06SJulian Anastasov 	struct rcu_head		rcu_head;	/* presumably for RCU-deferred free - confirm */
698026ace06SJulian Anastasov };
6991da177e4SLinus Torvalds 
70007dcc686SSimon Horman /* The real server destination forwarding entry with ip address, port number,
70107dcc686SSimon Horman  * and so on.
 *
 * Besides its own address the entry keeps a copy of the virtual service
 * identity it serves (protocol, vaddr, vport, vfwmark) and a pointer back to
 * that service (svc).
7021da177e4SLinus Torvalds  */
7031da177e4SLinus Torvalds struct ip_vs_dest {
7041da177e4SLinus Torvalds 	struct list_head	n_list;   /* for the dests in the service */
705276472eaSJulian Anastasov 	struct hlist_node	d_list;   /* for table with all the dests */
7061da177e4SLinus Torvalds 
707e7ade46aSJulius Volz 	u16			af;		/* address family */
708014d730dSAl Viro 	__be16			port;		/* port number of the server */
709f2431e6eSHans Schillstrom 	union nf_inet_addr	addr;		/* IP address of the server */
71095c96174SEric Dumazet 	volatile unsigned int	flags;		/* dest status flags */
7111da177e4SLinus Torvalds 	atomic_t		conn_flags;	/* flags to copy to conn */
7121da177e4SLinus Torvalds 	atomic_t		weight;		/* server weight */
7131da177e4SLinus Torvalds 
7141da177e4SLinus Torvalds 	atomic_t		refcnt;		/* reference counter */
7151da177e4SLinus Torvalds 	struct ip_vs_stats      stats;          /* statistics */
716bcbde4c0SJulian Anastasov 	unsigned long		idle_start;	/* start time, jiffies */
7171da177e4SLinus Torvalds 
7181da177e4SLinus Torvalds 	/* connection counters and thresholds */
7191da177e4SLinus Torvalds 	atomic_t		activeconns;	/* active connections */
7201da177e4SLinus Torvalds 	atomic_t		inactconns;	/* inactive connections */
7211da177e4SLinus Torvalds 	atomic_t		persistconns;	/* persistent connections */
7221da177e4SLinus Torvalds 	__u32			u_threshold;	/* upper threshold */
7231da177e4SLinus Torvalds 	__u32			l_threshold;	/* lower threshold */
7241da177e4SLinus Torvalds 
7251da177e4SLinus Torvalds 	/* for destination cache */
7261da177e4SLinus Torvalds 	spinlock_t		dst_lock;	/* lock of dst_cache */
727026ace06SJulian Anastasov 	struct ip_vs_dest_dst __rcu *dest_dst;	/* cached dst info */
7281da177e4SLinus Torvalds 
7291da177e4SLinus Torvalds 	/* for virtual service */
730bcbde4c0SJulian Anastasov 	struct ip_vs_service __rcu *svc;	/* service it belongs to */
7311da177e4SLinus Torvalds 	__u16			protocol;	/* which protocol (TCP/UDP) */
732014d730dSAl Viro 	__be16			vport;		/* virtual port number */
733f2431e6eSHans Schillstrom 	union nf_inet_addr	vaddr;		/* virtual IP address */
7341da177e4SLinus Torvalds 	__u32			vfwmark;	/* firewall mark of service */
735276472eaSJulian Anastasov 
736578bc3efSJulian Anastasov 	struct list_head	t_list;		/* in dest_trash */
737276472eaSJulian Anastasov 	unsigned int		in_rs_table:1;	/* we are in rs_table */
7381da177e4SLinus Torvalds };
7391da177e4SLinus Torvalds 
74007dcc686SSimon Horman /* The scheduler object
 *
 * Identity fields (list linkage, name, refcount, owning module) followed by
 * the callbacks a scheduler provides: per-service setup/teardown,
 * notifications when a dest is linked, unlinked or updated, and the
 * schedule() hook that picks a struct ip_vs_dest for a packet.
 */
7411da177e4SLinus Torvalds struct ip_vs_scheduler {
7421da177e4SLinus Torvalds 	struct list_head	n_list;		/* d-linked list head */
7431da177e4SLinus Torvalds 	char			*name;		/* scheduler name */
7441da177e4SLinus Torvalds 	atomic_t		refcnt;		/* reference counter */
7451da177e4SLinus Torvalds 	struct module		*module;	/* THIS_MODULE/NULL */
7461da177e4SLinus Torvalds 
7471da177e4SLinus Torvalds 	/* scheduler initializing service */
7481da177e4SLinus Torvalds 	int (*init_service)(struct ip_vs_service *svc);
7491da177e4SLinus Torvalds 	/* scheduling service finish */
750ed3ffc4eSJulian Anastasov 	void (*done_service)(struct ip_vs_service *svc);
7516b6df466SJulian Anastasov 	/* dest is linked */
7526b6df466SJulian Anastasov 	int (*add_dest)(struct ip_vs_service *svc, struct ip_vs_dest *dest);
7536b6df466SJulian Anastasov 	/* dest is unlinked */
7546b6df466SJulian Anastasov 	int (*del_dest)(struct ip_vs_service *svc, struct ip_vs_dest *dest);
7556b6df466SJulian Anastasov 	/* dest is updated */
7566b6df466SJulian Anastasov 	int (*upd_dest)(struct ip_vs_service *svc, struct ip_vs_dest *dest);
7571da177e4SLinus Torvalds 
7581da177e4SLinus Torvalds 	/* selecting a server from the given service */
7591da177e4SLinus Torvalds 	struct ip_vs_dest* (*schedule)(struct ip_vs_service *svc,
760bba54de5SJulian Anastasov 				       const struct sk_buff *skb,
761bba54de5SJulian Anastasov 				       struct ip_vs_iphdr *iph);
7621da177e4SLinus Torvalds };
7631da177e4SLinus Torvalds 
76485999283SSimon Horman /* The persistence engine object */
76585999283SSimon Horman struct ip_vs_pe {
76685999283SSimon Horman 	struct list_head	n_list;		/* d-linked list head */
76785999283SSimon Horman 	char			*name;		/* persistence engine name */
76885999283SSimon Horman 	atomic_t		refcnt;		/* reference counter */
76985999283SSimon Horman 	struct module		*module;	/* THIS_MODULE/NULL */
77085999283SSimon Horman 
77185999283SSimon Horman 	/* get the connection template, if any */
77285999283SSimon Horman 	int (*fill_param)(struct ip_vs_conn_param *p, struct sk_buff *skb);
	/* compare lookup parameters @p with connection template @ct */
77385999283SSimon Horman 	bool (*ct_match)(const struct ip_vs_conn_param *p,
77485999283SSimon Horman 			 struct ip_vs_conn *ct);
	/* hash value for @p, seeded with @initval */
77585999283SSimon Horman 	u32 (*hashkey_raw)(const struct ip_vs_conn_param *p, u32 initval,
77685999283SSimon Horman 			   bool inverse);
	/* write the engine's data for @cp into @buf; NOTE(review): the int
	 * result is presumably the number of bytes written - confirm
	 */
777a3c918acSSimon Horman 	int (*show_pe_data)(const struct ip_vs_conn *cp, char *buf);
77885999283SSimon Horman };
7791da177e4SLinus Torvalds 
78007dcc686SSimon Horman /* The application module object (a.k.a. app incarnation)
 *
 * The same structure describes both an application (which keeps its
 * incarnations on incs_list) and an incarnation (which points back to its
 * application through ->app and carries a port).
 */
781fd2c3ef7SEric Dumazet struct ip_vs_app {
7821da177e4SLinus Torvalds 	struct list_head	a_list;		/* member in app list */
7831da177e4SLinus Torvalds 	int			type;		/* IP_VS_APP_TYPE_xxx */
7841da177e4SLinus Torvalds 	char			*name;		/* application module name */
7851da177e4SLinus Torvalds 	__u16			protocol;
7861da177e4SLinus Torvalds 	struct module		*module;	/* THIS_MODULE/NULL */
7871da177e4SLinus Torvalds 	struct list_head	incs_list;	/* list of incarnations */
7881da177e4SLinus Torvalds 
7891da177e4SLinus Torvalds 	/* members for application incarnations */
7901da177e4SLinus Torvalds 	struct list_head	p_list;		/* member in proto app list */
7911da177e4SLinus Torvalds 	struct ip_vs_app	*app;		/* its real application */
792014d730dSAl Viro 	__be16			port;		/* port number in net order */
7931da177e4SLinus Torvalds 	atomic_t		usecnt;		/* usage counter */
794363c97d7SJulian Anastasov 	struct rcu_head		rcu_head;
7951da177e4SLinus Torvalds 
79607dcc686SSimon Horman 	/* output hook: Process packet in inout direction, diff set for TCP.
7978b27b10fSJulian Anastasov 	 * Return: 0=Error, 1=Payload Not Mangled/Mangled but checksum is ok,
7988b27b10fSJulian Anastasov 	 *	   2=Mangled but checksum was not updated
7998b27b10fSJulian Anastasov 	 */
8001da177e4SLinus Torvalds 	int (*pkt_out)(struct ip_vs_app *, struct ip_vs_conn *,
8013db05feaSHerbert Xu 		       struct sk_buff *, int *diff);
8021da177e4SLinus Torvalds 
80307dcc686SSimon Horman 	/* input hook: Process packet in outin direction, diff set for TCP.
8048b27b10fSJulian Anastasov 	 * Return: 0=Error, 1=Payload Not Mangled/Mangled but checksum is ok,
8058b27b10fSJulian Anastasov 	 *	   2=Mangled but checksum was not updated
8068b27b10fSJulian Anastasov 	 */
8071da177e4SLinus Torvalds 	int (*pkt_in)(struct ip_vs_app *, struct ip_vs_conn *,
8083db05feaSHerbert Xu 		      struct sk_buff *, int *diff);
8091da177e4SLinus Torvalds 
8101da177e4SLinus Torvalds 	/* ip_vs_app initializer */
8111da177e4SLinus Torvalds 	int (*init_conn)(struct ip_vs_app *, struct ip_vs_conn *);
8121da177e4SLinus Torvalds 
8131da177e4SLinus Torvalds 	/* ip_vs_app finish */
8141da177e4SLinus Torvalds 	int (*done_conn)(struct ip_vs_app *, struct ip_vs_conn *);
8151da177e4SLinus Torvalds 
8161da177e4SLinus Torvalds 
8171da177e4SLinus Torvalds 	/* not used now */
8181da177e4SLinus Torvalds 	int (*bind_conn)(struct ip_vs_app *, struct ip_vs_conn *,
8191da177e4SLinus Torvalds 			 struct ip_vs_protocol *);
8201da177e4SLinus Torvalds 
8211da177e4SLinus Torvalds 	void (*unbind_conn)(struct ip_vs_app *, struct ip_vs_conn *);
8221da177e4SLinus Torvalds 
8231da177e4SLinus Torvalds 	int *			timeout_table;
8241da177e4SLinus Torvalds 	int *			timeouts;
8251da177e4SLinus Torvalds 	int			timeouts_size;
8261da177e4SLinus Torvalds 
8271da177e4SLinus Torvalds 	int (*conn_schedule)(struct sk_buff *skb, struct ip_vs_app *app,
8281da177e4SLinus Torvalds 			     int *verdict, struct ip_vs_conn **cpp);
8291da177e4SLinus Torvalds 
8301da177e4SLinus Torvalds 	struct ip_vs_conn *
8311da177e4SLinus Torvalds 	(*conn_in_get)(const struct sk_buff *skb, struct ip_vs_app *app,
832d4383f04SJesper Dangaard Brouer 		       const struct iphdr *iph, int inverse);
8331da177e4SLinus Torvalds 
8341da177e4SLinus Torvalds 	struct ip_vs_conn *
8351da177e4SLinus Torvalds 	(*conn_out_get)(const struct sk_buff *skb, struct ip_vs_app *app,
836d4383f04SJesper Dangaard Brouer 			const struct iphdr *iph, int inverse);
8371da177e4SLinus Torvalds 
8381da177e4SLinus Torvalds 	int (*state_transition)(struct ip_vs_conn *cp, int direction,
8391da177e4SLinus Torvalds 				const struct sk_buff *skb,
8401da177e4SLinus Torvalds 				struct ip_vs_app *app);
8411da177e4SLinus Torvalds 
8421da177e4SLinus Torvalds 	void (*timeout_change)(struct ip_vs_app *app, int flags);
8431da177e4SLinus Torvalds };
8441da177e4SLinus Torvalds 
/* State of one master sync instance: its queue of sync buffers, the buffer
 * currently referenced by sync_buff, the master thread, and a back pointer
 * to the owning struct netns_ipvs.
 */
845f73181c8SPablo Neira Ayuso struct ipvs_master_sync_state {
846f73181c8SPablo Neira Ayuso 	struct list_head	sync_queue;
847f73181c8SPablo Neira Ayuso 	struct ip_vs_sync_buff	*sync_buff;
84807995674SZhang Yanfei 	unsigned long		sync_queue_len;
849f73181c8SPablo Neira Ayuso 	unsigned int		sync_queue_delay;
850f73181c8SPablo Neira Ayuso 	struct task_struct	*master_thread;
851f73181c8SPablo Neira Ayuso 	struct delayed_work	master_wakeup_work;
852f73181c8SPablo Neira Ayuso 	struct netns_ipvs	*ipvs;
853f73181c8SPablo Neira Ayuso };
854f73181c8SPablo Neira Ayuso 
855578bc3efSJulian Anastasov /* How much time to keep dests in trash: 120 * HZ ticks */
856578bc3efSJulian Anastasov #define IP_VS_DEST_TRASH_PERIOD		(120 * HZ)
857578bc3efSJulian Anastasov 
/* Configuration of one sync daemon.  struct netns_ipvs keeps two of these:
 * mcfg (master) and bcfg (backup).
 */
858e4ff6751SJulian Anastasov struct ipvs_sync_daemon_cfg {
859d3328817SJulian Anastasov 	union nf_inet_addr	mcast_group;
860e4ff6751SJulian Anastasov 	int			syncid;
861e4ff6751SJulian Anastasov 	u16			sync_maxlen;
862d3328817SJulian Anastasov 	u16			mcast_port;
863d3328817SJulian Anastasov 	u8			mcast_af;
864d3328817SJulian Anastasov 	u8			mcast_ttl;
865e4ff6751SJulian Anastasov 	/* multicast interface name */
866e4ff6751SJulian Anastasov 	char			mcast_ifn[IP_VS_IFNAME_MAXLEN];
867e4ff6751SJulian Anastasov };
868e4ff6751SJulian Anastasov 
8692553d064SJulian Anastasov /* IPVS in network namespace
 *
 * Per-namespace IPVS state: real-server hash table, application tables per
 * protocol, counters and statistics, the destination trash, sysctl-backed
 * tunables, estimator state and sync daemon state.
 */
8702553d064SJulian Anastasov struct netns_ipvs {
8712553d064SJulian Anastasov 	int			gen;		/* Generation */
8727a4f0761SHans Schillstrom 	int			enable;		/* enable like nf_hooks do */
87307dcc686SSimon Horman 	/* Hash table: for real service lookups */
8742553d064SJulian Anastasov 	#define IP_VS_RTAB_BITS 4
8752553d064SJulian Anastasov 	#define IP_VS_RTAB_SIZE (1 << IP_VS_RTAB_BITS)
8762553d064SJulian Anastasov 	#define IP_VS_RTAB_MASK (IP_VS_RTAB_SIZE - 1)
8772553d064SJulian Anastasov 
878276472eaSJulian Anastasov 	struct hlist_head	rs_table[IP_VS_RTAB_SIZE];
8792553d064SJulian Anastasov 	/* ip_vs_app */
8802553d064SJulian Anastasov 	struct list_head	app_list;
8812553d064SJulian Anastasov 	/* ip_vs_proto */
8822553d064SJulian Anastasov 	#define IP_VS_PROTO_TAB_SIZE	32	/* must be power of 2 */
8832553d064SJulian Anastasov 	struct ip_vs_proto_data *proto_data_table[IP_VS_PROTO_TAB_SIZE];
8842553d064SJulian Anastasov 	/* ip_vs_proto_tcp */
8852553d064SJulian Anastasov #ifdef CONFIG_IP_VS_PROTO_TCP
8862553d064SJulian Anastasov 	#define	TCP_APP_TAB_BITS	4
8872553d064SJulian Anastasov 	#define	TCP_APP_TAB_SIZE	(1 << TCP_APP_TAB_BITS)
8882553d064SJulian Anastasov 	#define	TCP_APP_TAB_MASK	(TCP_APP_TAB_SIZE - 1)
8892553d064SJulian Anastasov 	struct list_head	tcp_apps[TCP_APP_TAB_SIZE];
8902553d064SJulian Anastasov #endif
8912553d064SJulian Anastasov 	/* ip_vs_proto_udp */
8922553d064SJulian Anastasov #ifdef CONFIG_IP_VS_PROTO_UDP
8932553d064SJulian Anastasov 	#define	UDP_APP_TAB_BITS	4
8942553d064SJulian Anastasov 	#define	UDP_APP_TAB_SIZE	(1 << UDP_APP_TAB_BITS)
8952553d064SJulian Anastasov 	#define	UDP_APP_TAB_MASK	(UDP_APP_TAB_SIZE - 1)
8962553d064SJulian Anastasov 	struct list_head	udp_apps[UDP_APP_TAB_SIZE];
8972553d064SJulian Anastasov #endif
8982553d064SJulian Anastasov 	/* ip_vs_proto_sctp */
8992553d064SJulian Anastasov #ifdef CONFIG_IP_VS_PROTO_SCTP
9002553d064SJulian Anastasov 	#define SCTP_APP_TAB_BITS	4
9012553d064SJulian Anastasov 	#define SCTP_APP_TAB_SIZE	(1 << SCTP_APP_TAB_BITS)
9022553d064SJulian Anastasov 	#define SCTP_APP_TAB_MASK	(SCTP_APP_TAB_SIZE - 1)
9032553d064SJulian Anastasov 	/* Hash table for SCTP application incarnations	 */
9042553d064SJulian Anastasov 	struct list_head	sctp_apps[SCTP_APP_TAB_SIZE];
9052553d064SJulian Anastasov #endif
9062553d064SJulian Anastasov 	/* ip_vs_conn */
9072553d064SJulian Anastasov 	atomic_t		conn_count;      /* connection counter */
9082553d064SJulian Anastasov 
9092553d064SJulian Anastasov 	/* ip_vs_ctl */
9102a0751afSJulian Anastasov 	struct ip_vs_stats		tot_stats;  /* Statistics & est. */
9112553d064SJulian Anastasov 
9122553d064SJulian Anastasov 	int			num_services;    /* no of virtual services */
913f2247fbdSSimon Horman 
9142553d064SJulian Anastasov 	/* Trash for destinations */
9152553d064SJulian Anastasov 	struct list_head	dest_trash;
916578bc3efSJulian Anastasov 	spinlock_t		dest_trash_lock;
917578bc3efSJulian Anastasov 	struct timer_list	dest_trash_timer; /* expiration timer */
9182553d064SJulian Anastasov 	/* Service counters */
9192553d064SJulian Anastasov 	atomic_t		ftpsvc_counter;
9202553d064SJulian Anastasov 	atomic_t		nullsvc_counter;
9212553d064SJulian Anastasov 
922f2247fbdSSimon Horman #ifdef CONFIG_SYSCTL
923f2247fbdSSimon Horman 	/* 1/rate drop and drop-entry variables */
924f2247fbdSSimon Horman 	struct delayed_work	defense_work;   /* Work handler */
925f2247fbdSSimon Horman 	int			drop_rate;
926f2247fbdSSimon Horman 	int			drop_counter;
927f2247fbdSSimon Horman 	atomic_t		dropentry;
928f2247fbdSSimon Horman 	/* locks in ctl.c */
929f2247fbdSSimon Horman 	spinlock_t		dropentry_lock;  /* drop entry handling */
930f2247fbdSSimon Horman 	spinlock_t		droppacket_lock; /* drop packet handling */
931f2247fbdSSimon Horman 	spinlock_t		securetcp_lock;  /* state and timeout tables */
932f2247fbdSSimon Horman 
9332553d064SJulian Anastasov 	/* sys-ctl struct */
9342553d064SJulian Anastasov 	struct ctl_table_header	*sysctl_hdr;
9352553d064SJulian Anastasov 	struct ctl_table	*sysctl_tbl;
936f2247fbdSSimon Horman #endif
937f2247fbdSSimon Horman 
9382553d064SJulian Anastasov 	/* sysctl variables */
9392553d064SJulian Anastasov 	int			sysctl_amemthresh;
9402553d064SJulian Anastasov 	int			sysctl_am_droprate;
9412553d064SJulian Anastasov 	int			sysctl_drop_entry;
9422553d064SJulian Anastasov 	int			sysctl_drop_packet;
9432553d064SJulian Anastasov 	int			sysctl_secure_tcp;
9442553d064SJulian Anastasov #ifdef CONFIG_IP_VS_NFCT
9452553d064SJulian Anastasov 	int			sysctl_conntrack;
9462553d064SJulian Anastasov #endif
9472553d064SJulian Anastasov 	int			sysctl_snat_reroute;
9482553d064SJulian Anastasov 	int			sysctl_sync_ver;
949f73181c8SPablo Neira Ayuso 	int			sysctl_sync_ports;
9504d0c875dSJulian Anastasov 	int			sysctl_sync_persist_mode;
95107995674SZhang Yanfei 	unsigned long		sysctl_sync_qlen_max;
9521c003b15SPablo Neira Ayuso 	int			sysctl_sync_sock_size;
9532553d064SJulian Anastasov 	int			sysctl_cache_bypass;
9542553d064SJulian Anastasov 	int			sysctl_expire_nodest_conn;
955c6c96c18SAlexander Frolkin 	int			sysctl_sloppy_tcp;
956c6c96c18SAlexander Frolkin 	int			sysctl_sloppy_sctp;
9572553d064SJulian Anastasov 	int			sysctl_expire_quiescent_template;
	/* [0] is the sync threshold, [1] the sync period */
9582553d064SJulian Anastasov 	int			sysctl_sync_threshold[2];
959749c42b6SJulian Anastasov 	unsigned int		sysctl_sync_refresh_period;
960749c42b6SJulian Anastasov 	int			sysctl_sync_retries;
9612553d064SJulian Anastasov 	int			sysctl_nat_icmp_send;
9623654e611SJulian Anastasov 	int			sysctl_pmtu_disc;
9630c12582fSJulian Anastasov 	int			sysctl_backup_only;
964d752c364SMarcelo Ricardo Leitner 	int			sysctl_conn_reuse_mode;
9652553d064SJulian Anastasov 
9662553d064SJulian Anastasov 	/* ip_vs_lblc */
9672553d064SJulian Anastasov 	int			sysctl_lblc_expiration;
9682553d064SJulian Anastasov 	struct ctl_table_header	*lblc_ctl_header;
9692553d064SJulian Anastasov 	struct ctl_table	*lblc_ctl_table;
9702553d064SJulian Anastasov 	/* ip_vs_lblcr */
9712553d064SJulian Anastasov 	int			sysctl_lblcr_expiration;
9722553d064SJulian Anastasov 	struct ctl_table_header	*lblcr_ctl_header;
9732553d064SJulian Anastasov 	struct ctl_table	*lblcr_ctl_table;
9742553d064SJulian Anastasov 	/* ip_vs_est */
9752553d064SJulian Anastasov 	struct list_head	est_list;	/* estimator list */
9762553d064SJulian Anastasov 	spinlock_t		est_lock;
9772553d064SJulian Anastasov 	struct timer_list	est_timer;	/* Estimation timer */
9782553d064SJulian Anastasov 	/* ip_vs_sync */
9792553d064SJulian Anastasov 	spinlock_t		sync_lock;
980f73181c8SPablo Neira Ayuso 	struct ipvs_master_sync_state *ms;
9812553d064SJulian Anastasov 	spinlock_t		sync_buff_lock;
982f73181c8SPablo Neira Ayuso 	struct task_struct	**backup_threads;
983f73181c8SPablo Neira Ayuso 	int			threads_mask;
	/* bit mask; sysctl_backup_only() tests IP_VS_STATE_BACKUP in it */
9842553d064SJulian Anastasov 	volatile int		sync_state;
985ae1d48b2SHans Schillstrom 	struct mutex		sync_mutex;
986e4ff6751SJulian Anastasov 	struct ipvs_sync_daemon_cfg	mcfg;	/* Master Configuration */
987e4ff6751SJulian Anastasov 	struct ipvs_sync_daemon_cfg	bcfg;	/* Backup Configuration */
9882553d064SJulian Anastasov 	/* net name space ptr */
9892553d064SJulian Anastasov 	struct net		*net;            /* Needed by timer routines */
99007dcc686SSimon Horman 	/* Number of heterogeneous destinations, needed because heterogeneous
99107dcc686SSimon Horman 	 * destinations are not supported when synchronization is enabled.
99207dcc686SSimon Horman 	 */
993391f503dSAlex Gartrell 	unsigned int		mixed_address_family_dests;
9942553d064SJulian Anastasov };
9951da177e4SLinus Torvalds 
/* Defaults for the sync-related tunables, followed by sync daemon constants.
 * The DEFAULT_* values and IPVS_SYNC_QLEN_MAX are what the sysctl_*()
 * accessors return when CONFIG_SYSCTL is not set.
 */
99659e0350eSSimon Horman #define DEFAULT_SYNC_THRESHOLD	3
99759e0350eSSimon Horman #define DEFAULT_SYNC_PERIOD	50
9987532e8d4SSimon Horman #define DEFAULT_SYNC_VER	1
999c6c96c18SAlexander Frolkin #define DEFAULT_SLOPPY_TCP	0
1000c6c96c18SAlexander Frolkin #define DEFAULT_SLOPPY_SCTP	0
1001749c42b6SJulian Anastasov #define DEFAULT_SYNC_REFRESH_PERIOD	(0U * HZ)
1002749c42b6SJulian Anastasov #define DEFAULT_SYNC_RETRIES		0
10031c003b15SPablo Neira Ayuso #define IPVS_SYNC_WAKEUP_RATE	8
/* 4 times the wakeup rate, i.e. 32 */
10041c003b15SPablo Neira Ayuso #define IPVS_SYNC_QLEN_MAX	(IPVS_SYNC_WAKEUP_RATE * 4)
10051c003b15SPablo Neira Ayuso #define IPVS_SYNC_SEND_DELAY	(HZ / 50)
10061c003b15SPablo Neira Ayuso #define IPVS_SYNC_CHECK_PERIOD	HZ
1007749c42b6SJulian Anastasov #define IPVS_SYNC_FLUSH_TIME	(HZ * 2)
/* 1 << 6 = 64 */
1008f73181c8SPablo Neira Ayuso #define IPVS_SYNC_PORTS_MAX	(1 << 6)
100959e0350eSSimon Horman 
101059e0350eSSimon Horman #ifdef CONFIG_SYSCTL
101159e0350eSSimon Horman 
/* Sync threshold of @ipvs: element [0] of its sysctl_sync_threshold pair. */
101259e0350eSSimon Horman static inline int sysctl_sync_threshold(struct netns_ipvs *ipvs)
101359e0350eSSimon Horman {
101459e0350eSSimon Horman 	return ipvs->sysctl_sync_threshold[0];
101559e0350eSSimon Horman }
101659e0350eSSimon Horman 
/* Sync period of @ipvs: element [1] of its sysctl_sync_threshold pair,
 * read through ACCESS_ONCE().
 */
101759e0350eSSimon Horman static inline int sysctl_sync_period(struct netns_ipvs *ipvs)
101859e0350eSSimon Horman {
1019749c42b6SJulian Anastasov 	return ACCESS_ONCE(ipvs->sysctl_sync_threshold[1]);
1020749c42b6SJulian Anastasov }
1021749c42b6SJulian Anastasov 
/* Sync refresh period of @ipvs, read through ACCESS_ONCE(). */
1022749c42b6SJulian Anastasov static inline unsigned int sysctl_sync_refresh_period(struct netns_ipvs *ipvs)
1023749c42b6SJulian Anastasov {
1024749c42b6SJulian Anastasov 	return ACCESS_ONCE(ipvs->sysctl_sync_refresh_period);
1025749c42b6SJulian Anastasov }
1026749c42b6SJulian Anastasov 
/* Sync retries setting of @ipvs, returned as stored (no masking here). */
1027749c42b6SJulian Anastasov static inline int sysctl_sync_retries(struct netns_ipvs *ipvs)
1028749c42b6SJulian Anastasov {
1029749c42b6SJulian Anastasov 	return ipvs->sysctl_sync_retries;
103059e0350eSSimon Horman }
103159e0350eSSimon Horman 
/* Sync version setting of @ipvs (field sysctl_sync_ver). */
10327532e8d4SSimon Horman static inline int sysctl_sync_ver(struct netns_ipvs *ipvs)
10337532e8d4SSimon Horman {
10347532e8d4SSimon Horman 	return ipvs->sysctl_sync_ver;
10357532e8d4SSimon Horman }
10367532e8d4SSimon Horman 
/* Sloppy-TCP setting of @ipvs (field sysctl_sloppy_tcp). */
1037c6c96c18SAlexander Frolkin static inline int sysctl_sloppy_tcp(struct netns_ipvs *ipvs)
1038c6c96c18SAlexander Frolkin {
1039c6c96c18SAlexander Frolkin 	return ipvs->sysctl_sloppy_tcp;
1040c6c96c18SAlexander Frolkin }
1041c6c96c18SAlexander Frolkin 
/* Sloppy-SCTP setting of @ipvs (field sysctl_sloppy_sctp). */
1042c6c96c18SAlexander Frolkin static inline int sysctl_sloppy_sctp(struct netns_ipvs *ipvs)
1043c6c96c18SAlexander Frolkin {
1044c6c96c18SAlexander Frolkin 	return ipvs->sysctl_sloppy_sctp;
1045c6c96c18SAlexander Frolkin }
1046c6c96c18SAlexander Frolkin 
/* Sync ports setting of @ipvs, read through ACCESS_ONCE(). */
1047f73181c8SPablo Neira Ayuso static inline int sysctl_sync_ports(struct netns_ipvs *ipvs)
1048f73181c8SPablo Neira Ayuso {
1049f73181c8SPablo Neira Ayuso 	return ACCESS_ONCE(ipvs->sysctl_sync_ports);
1050f73181c8SPablo Neira Ayuso }
1051f73181c8SPablo Neira Ayuso 
/* Sync persist mode setting of @ipvs (field sysctl_sync_persist_mode). */
10524d0c875dSJulian Anastasov static inline int sysctl_sync_persist_mode(struct netns_ipvs *ipvs)
10534d0c875dSJulian Anastasov {
10544d0c875dSJulian Anastasov 	return ipvs->sysctl_sync_persist_mode;
10554d0c875dSJulian Anastasov }
10564d0c875dSJulian Anastasov 
/* Maximum sync queue length configured for @ipvs (unsigned long). */
105707995674SZhang Yanfei static inline unsigned long sysctl_sync_qlen_max(struct netns_ipvs *ipvs)
10581c003b15SPablo Neira Ayuso {
10591c003b15SPablo Neira Ayuso 	return ipvs->sysctl_sync_qlen_max;
10601c003b15SPablo Neira Ayuso }
10611c003b15SPablo Neira Ayuso 
/* Sync socket size setting of @ipvs (field sysctl_sync_sock_size). */
10621c003b15SPablo Neira Ayuso static inline int sysctl_sync_sock_size(struct netns_ipvs *ipvs)
10631c003b15SPablo Neira Ayuso {
10641c003b15SPablo Neira Ayuso 	return ipvs->sysctl_sync_sock_size;
10651c003b15SPablo Neira Ayuso }
10661c003b15SPablo Neira Ayuso 
/* PMTU discovery setting of @ipvs (field sysctl_pmtu_disc). */
10673654e611SJulian Anastasov static inline int sysctl_pmtu_disc(struct netns_ipvs *ipvs)
10683654e611SJulian Anastasov {
10693654e611SJulian Anastasov 	return ipvs->sysctl_pmtu_disc;
10703654e611SJulian Anastasov }
10713654e611SJulian Anastasov 
/* Non-zero only when both conditions hold: the IP_VS_STATE_BACKUP bit is set
 * in ipvs->sync_state and the sysctl_backup_only tunable is non-zero.
 */
10720c12582fSJulian Anastasov static inline int sysctl_backup_only(struct netns_ipvs *ipvs)
10730c12582fSJulian Anastasov {
10740c12582fSJulian Anastasov 	return ipvs->sync_state & IP_VS_STATE_BACKUP &&
10750c12582fSJulian Anastasov 	       ipvs->sysctl_backup_only;
10760c12582fSJulian Anastasov }
10770c12582fSJulian Anastasov 
/* Connection reuse mode setting of @ipvs (field sysctl_conn_reuse_mode). */
1078d752c364SMarcelo Ricardo Leitner static inline int sysctl_conn_reuse_mode(struct netns_ipvs *ipvs)
1079d752c364SMarcelo Ricardo Leitner {
1080d752c364SMarcelo Ricardo Leitner 	return ipvs->sysctl_conn_reuse_mode;
1081d752c364SMarcelo Ricardo Leitner }
1082d752c364SMarcelo Ricardo Leitner 
108359e0350eSSimon Horman #else
108459e0350eSSimon Horman 
/* Variant without CONFIG_SYSCTL: always DEFAULT_SYNC_THRESHOLD; @ipvs is
 * not consulted.
 */
108559e0350eSSimon Horman static inline int sysctl_sync_threshold(struct netns_ipvs *ipvs)
108659e0350eSSimon Horman {
108759e0350eSSimon Horman 	return DEFAULT_SYNC_THRESHOLD;
108859e0350eSSimon Horman }
108959e0350eSSimon Horman 
/* Variant without CONFIG_SYSCTL: always DEFAULT_SYNC_PERIOD; @ipvs is not
 * consulted.
 */
109059e0350eSSimon Horman static inline int sysctl_sync_period(struct netns_ipvs *ipvs)
109159e0350eSSimon Horman {
109259e0350eSSimon Horman 	return DEFAULT_SYNC_PERIOD;
109359e0350eSSimon Horman }
109459e0350eSSimon Horman 
/* Variant without CONFIG_SYSCTL: always DEFAULT_SYNC_REFRESH_PERIOD; @ipvs
 * is not consulted.
 */
1095749c42b6SJulian Anastasov static inline unsigned int sysctl_sync_refresh_period(struct netns_ipvs *ipvs)
1096749c42b6SJulian Anastasov {
1097749c42b6SJulian Anastasov 	return DEFAULT_SYNC_REFRESH_PERIOD;
1098749c42b6SJulian Anastasov }
1099749c42b6SJulian Anastasov 
/* Variant without CONFIG_SYSCTL: DEFAULT_SYNC_RETRIES masked with 3; @ipvs
 * is not consulted.
 */
1100749c42b6SJulian Anastasov static inline int sysctl_sync_retries(struct netns_ipvs *ipvs)
1101749c42b6SJulian Anastasov {
1102749c42b6SJulian Anastasov 	return DEFAULT_SYNC_RETRIES & 3;
1103749c42b6SJulian Anastasov }
1104749c42b6SJulian Anastasov 
/* Variant without CONFIG_SYSCTL: always DEFAULT_SYNC_VER; @ipvs is not
 * consulted.
 */
11057532e8d4SSimon Horman static inline int sysctl_sync_ver(struct netns_ipvs *ipvs)
11067532e8d4SSimon Horman {
11077532e8d4SSimon Horman 	return DEFAULT_SYNC_VER;
11087532e8d4SSimon Horman }
11097532e8d4SSimon Horman 
/* Variant without CONFIG_SYSCTL: always DEFAULT_SLOPPY_TCP; @ipvs is not
 * consulted.
 */
1110c6c96c18SAlexander Frolkin static inline int sysctl_sloppy_tcp(struct netns_ipvs *ipvs)
1111c6c96c18SAlexander Frolkin {
1112c6c96c18SAlexander Frolkin 	return DEFAULT_SLOPPY_TCP;
1113c6c96c18SAlexander Frolkin }
1114c6c96c18SAlexander Frolkin 
/* Variant without CONFIG_SYSCTL: always DEFAULT_SLOPPY_SCTP; @ipvs is not
 * consulted.
 */
1115c6c96c18SAlexander Frolkin static inline int sysctl_sloppy_sctp(struct netns_ipvs *ipvs)
1116c6c96c18SAlexander Frolkin {
1117c6c96c18SAlexander Frolkin 	return DEFAULT_SLOPPY_SCTP;
1118c6c96c18SAlexander Frolkin }
1119c6c96c18SAlexander Frolkin 
/* Variant without CONFIG_SYSCTL: always 1; @ipvs is not consulted. */
1120f73181c8SPablo Neira Ayuso static inline int sysctl_sync_ports(struct netns_ipvs *ipvs)
1121f73181c8SPablo Neira Ayuso {
1122f73181c8SPablo Neira Ayuso 	return 1;
1123f73181c8SPablo Neira Ayuso }
1124f73181c8SPablo Neira Ayuso 
/* Variant without CONFIG_SYSCTL: always 0; @ipvs is not consulted. */
11254d0c875dSJulian Anastasov static inline int sysctl_sync_persist_mode(struct netns_ipvs *ipvs)
11264d0c875dSJulian Anastasov {
11274d0c875dSJulian Anastasov 	return 0;
11284d0c875dSJulian Anastasov }
11294d0c875dSJulian Anastasov 
/* Variant without CONFIG_SYSCTL: always IPVS_SYNC_QLEN_MAX; @ipvs is not
 * consulted.
 */
113007995674SZhang Yanfei static inline unsigned long sysctl_sync_qlen_max(struct netns_ipvs *ipvs)
11311c003b15SPablo Neira Ayuso {
11321c003b15SPablo Neira Ayuso 	return IPVS_SYNC_QLEN_MAX;
11331c003b15SPablo Neira Ayuso }
11341c003b15SPablo Neira Ayuso 
/* Variant without CONFIG_SYSCTL: always 0; @ipvs is not consulted. */
11351c003b15SPablo Neira Ayuso static inline int sysctl_sync_sock_size(struct netns_ipvs *ipvs)
11361c003b15SPablo Neira Ayuso {
11371c003b15SPablo Neira Ayuso 	return 0;
11381c003b15SPablo Neira Ayuso }
11391c003b15SPablo Neira Ayuso 
/* Variant without CONFIG_SYSCTL: always 1; @ipvs is not consulted. */
11403654e611SJulian Anastasov static inline int sysctl_pmtu_disc(struct netns_ipvs *ipvs)
11413654e611SJulian Anastasov {
11423654e611SJulian Anastasov 	return 1;
11433654e611SJulian Anastasov }
11443654e611SJulian Anastasov 
/* Variant without CONFIG_SYSCTL: always 0; neither sync_state nor any
 * tunable is examined.
 */
11450c12582fSJulian Anastasov static inline int sysctl_backup_only(struct netns_ipvs *ipvs)
11460c12582fSJulian Anastasov {
11470c12582fSJulian Anastasov 	return 0;
11480c12582fSJulian Anastasov }
11490c12582fSJulian Anastasov 
/* Constant variant of the conn_reuse_mode query: always 1, whatever @ipvs
 * is.
 */
static inline int sysctl_conn_reuse_mode(struct netns_ipvs *ipvs)
{
	return 1;
}
1154d752c364SMarcelo Ricardo Leitner 
115559e0350eSSimon Horman #endif
115659e0350eSSimon Horman 
115707dcc686SSimon Horman /* IPVS core functions
11581da177e4SLinus Torvalds  * (from ip_vs_core.c)
11591da177e4SLinus Torvalds  */
11605c3a0fd7SJoe Perches const char *ip_vs_proto_name(unsigned int proto);
11615c3a0fd7SJoe Perches void ip_vs_init_hash_table(struct list_head *table, int rows);
/* Calls ip_vs_init_hash_table() on @t with ARRAY_SIZE(t) as the row count,
 * so @t has to be the array object itself rather than a pointer to its
 * first element.
 */
#define IP_VS_INIT_HASH_TABLE(t)				\
	ip_vs_init_hash_table((t), ARRAY_SIZE(t))
11631da177e4SLinus Torvalds 
11641da177e4SLinus Torvalds #define IP_VS_APP_TYPE_FTP	1
11651da177e4SLinus Torvalds 
116607dcc686SSimon Horman /* ip_vs_conn handling functions
11671da177e4SLinus Torvalds  * (from ip_vs_conn.c)
11681da177e4SLinus Torvalds  */
/* Direction selectors, numbered consecutively from zero.  IP_VS_DIR_LAST
 * is not a direction of its own: it equals the number of selectors that
 * precede it.
 */
enum {
	IP_VS_DIR_INPUT = 0,	/* 0 */
	IP_VS_DIR_OUTPUT,	/* 1 */
	IP_VS_DIR_INPUT_ONLY,	/* 2 */
	IP_VS_DIR_LAST,		/* 3: count of the entries above */
};
11751da177e4SLinus Torvalds 
11766e67e586SHans Schillstrom static inline void ip_vs_conn_fill_param(struct net *net, int af, int protocol,
1177f11017ecSSimon Horman 					 const union nf_inet_addr *caddr,
1178f11017ecSSimon Horman 					 __be16 cport,
1179f11017ecSSimon Horman 					 const union nf_inet_addr *vaddr,
1180f11017ecSSimon Horman 					 __be16 vport,
1181f11017ecSSimon Horman 					 struct ip_vs_conn_param *p)
1182f11017ecSSimon Horman {
11836e67e586SHans Schillstrom 	p->net = net;
1184f11017ecSSimon Horman 	p->af = af;
1185f11017ecSSimon Horman 	p->protocol = protocol;
1186f11017ecSSimon Horman 	p->caddr = caddr;
1187f11017ecSSimon Horman 	p->cport = cport;
1188f11017ecSSimon Horman 	p->vaddr = vaddr;
1189f11017ecSSimon Horman 	p->vport = vport;
119085999283SSimon Horman 	p->pe = NULL;
119185999283SSimon Horman 	p->pe_data = NULL;
1192f11017ecSSimon Horman }
119328364a59SJulius Volz 
1194f11017ecSSimon Horman struct ip_vs_conn *ip_vs_conn_in_get(const struct ip_vs_conn_param *p);
1195f11017ecSSimon Horman struct ip_vs_conn *ip_vs_ct_in_get(const struct ip_vs_conn_param *p);
119628364a59SJulius Volz 
struct ip_vs_conn *ip_vs_conn_in_get_proto(int af, const struct sk_buff *skb,
					   const struct ip_vs_iphdr *iph,
					   int inverse);
12005c0d2374SSimon Horman 
1201f11017ecSSimon Horman struct ip_vs_conn *ip_vs_conn_out_get(const struct ip_vs_conn_param *p);
12021da177e4SLinus Torvalds 
struct ip_vs_conn *ip_vs_conn_out_get_proto(int af, const struct sk_buff *skb,
					    const struct ip_vs_iphdr *iph,
					    int inverse);
12065c0d2374SSimon Horman 
1207088339a5SJulian Anastasov /* Get reference to gain full access to conn.
1208088339a5SJulian Anastasov  * By default, RCU read-side critical sections have access only to
1209088339a5SJulian Anastasov  * conn fields and its PE data, see ip_vs_conn_rcu_free() for reference.
1210088339a5SJulian Anastasov  */
1211088339a5SJulian Anastasov static inline bool __ip_vs_conn_get(struct ip_vs_conn *cp)
1212088339a5SJulian Anastasov {
1213088339a5SJulian Anastasov 	return atomic_inc_not_zero(&cp->refcnt);
1214088339a5SJulian Anastasov }
1215088339a5SJulian Anastasov 
12161da177e4SLinus Torvalds /* put back the conn without restarting its timer */
12171da177e4SLinus Torvalds static inline void __ip_vs_conn_put(struct ip_vs_conn *cp)
12181da177e4SLinus Torvalds {
12194e857c58SPeter Zijlstra 	smp_mb__before_atomic();
12201da177e4SLinus Torvalds 	atomic_dec(&cp->refcnt);
12211da177e4SLinus Torvalds }
12225c3a0fd7SJoe Perches void ip_vs_conn_put(struct ip_vs_conn *cp);
12235c3a0fd7SJoe Perches void ip_vs_conn_fill_cport(struct ip_vs_conn *cp, __be16 cport);
12241da177e4SLinus Torvalds 
1225ba38528aSAlex Gartrell struct ip_vs_conn *ip_vs_conn_new(const struct ip_vs_conn_param *p, int dest_af,
1226f11017ecSSimon Horman 				  const union nf_inet_addr *daddr,
122795c96174SEric Dumazet 				  __be16 dport, unsigned int flags,
12280e051e68SHans Schillstrom 				  struct ip_vs_dest *dest, __u32 fwmark);
12295c3a0fd7SJoe Perches void ip_vs_conn_expire_now(struct ip_vs_conn *cp);
12301da177e4SLinus Torvalds 
12315c3a0fd7SJoe Perches const char *ip_vs_state_name(__u16 proto, int state);
12321da177e4SLinus Torvalds 
12335c3a0fd7SJoe Perches void ip_vs_tcp_conn_listen(struct net *net, struct ip_vs_conn *cp);
12345c3a0fd7SJoe Perches int ip_vs_check_template(struct ip_vs_conn *ct);
12355c3a0fd7SJoe Perches void ip_vs_random_dropentry(struct net *net);
12365c3a0fd7SJoe Perches int ip_vs_conn_init(void);
12375c3a0fd7SJoe Perches void ip_vs_conn_cleanup(void);
12381da177e4SLinus Torvalds 
12391da177e4SLinus Torvalds static inline void ip_vs_control_del(struct ip_vs_conn *cp)
12401da177e4SLinus Torvalds {
12411da177e4SLinus Torvalds 	struct ip_vs_conn *ctl_cp = cp->control;
12421da177e4SLinus Torvalds 	if (!ctl_cp) {
1243cfc78c5aSJulius Volz 		IP_VS_ERR_BUF("request control DEL for uncontrolled: "
1244cfc78c5aSJulius Volz 			      "%s:%d to %s:%d\n",
1245cfc78c5aSJulius Volz 			      IP_VS_DBG_ADDR(cp->af, &cp->caddr),
1246cfc78c5aSJulius Volz 			      ntohs(cp->cport),
1247cfc78c5aSJulius Volz 			      IP_VS_DBG_ADDR(cp->af, &cp->vaddr),
1248cfc78c5aSJulius Volz 			      ntohs(cp->vport));
1249cfc78c5aSJulius Volz 
12501da177e4SLinus Torvalds 		return;
12511da177e4SLinus Torvalds 	}
12521da177e4SLinus Torvalds 
1253cfc78c5aSJulius Volz 	IP_VS_DBG_BUF(7, "DELeting control for: "
1254cfc78c5aSJulius Volz 		      "cp.dst=%s:%d ctl_cp.dst=%s:%d\n",
1255cfc78c5aSJulius Volz 		      IP_VS_DBG_ADDR(cp->af, &cp->caddr),
1256cfc78c5aSJulius Volz 		      ntohs(cp->cport),
1257cfc78c5aSJulius Volz 		      IP_VS_DBG_ADDR(cp->af, &ctl_cp->caddr),
1258cfc78c5aSJulius Volz 		      ntohs(ctl_cp->cport));
12591da177e4SLinus Torvalds 
12601da177e4SLinus Torvalds 	cp->control = NULL;
12611da177e4SLinus Torvalds 	if (atomic_read(&ctl_cp->n_control) == 0) {
1262cfc78c5aSJulius Volz 		IP_VS_ERR_BUF("BUG control DEL with n=0 : "
1263cfc78c5aSJulius Volz 			      "%s:%d to %s:%d\n",
1264cfc78c5aSJulius Volz 			      IP_VS_DBG_ADDR(cp->af, &cp->caddr),
1265cfc78c5aSJulius Volz 			      ntohs(cp->cport),
1266cfc78c5aSJulius Volz 			      IP_VS_DBG_ADDR(cp->af, &cp->vaddr),
1267cfc78c5aSJulius Volz 			      ntohs(cp->vport));
1268cfc78c5aSJulius Volz 
12691da177e4SLinus Torvalds 		return;
12701da177e4SLinus Torvalds 	}
12711da177e4SLinus Torvalds 	atomic_dec(&ctl_cp->n_control);
12721da177e4SLinus Torvalds }
12731da177e4SLinus Torvalds 
12741da177e4SLinus Torvalds static inline void
12751da177e4SLinus Torvalds ip_vs_control_add(struct ip_vs_conn *cp, struct ip_vs_conn *ctl_cp)
12761da177e4SLinus Torvalds {
12771da177e4SLinus Torvalds 	if (cp->control) {
1278cfc78c5aSJulius Volz 		IP_VS_ERR_BUF("request control ADD for already controlled: "
1279cfc78c5aSJulius Volz 			      "%s:%d to %s:%d\n",
1280cfc78c5aSJulius Volz 			      IP_VS_DBG_ADDR(cp->af, &cp->caddr),
1281cfc78c5aSJulius Volz 			      ntohs(cp->cport),
1282cfc78c5aSJulius Volz 			      IP_VS_DBG_ADDR(cp->af, &cp->vaddr),
1283cfc78c5aSJulius Volz 			      ntohs(cp->vport));
1284cfc78c5aSJulius Volz 
12851da177e4SLinus Torvalds 		ip_vs_control_del(cp);
12861da177e4SLinus Torvalds 	}
12871da177e4SLinus Torvalds 
1288cfc78c5aSJulius Volz 	IP_VS_DBG_BUF(7, "ADDing control for: "
1289cfc78c5aSJulius Volz 		      "cp.dst=%s:%d ctl_cp.dst=%s:%d\n",
1290cfc78c5aSJulius Volz 		      IP_VS_DBG_ADDR(cp->af, &cp->caddr),
1291cfc78c5aSJulius Volz 		      ntohs(cp->cport),
1292cfc78c5aSJulius Volz 		      IP_VS_DBG_ADDR(cp->af, &ctl_cp->caddr),
1293cfc78c5aSJulius Volz 		      ntohs(ctl_cp->cport));
12941da177e4SLinus Torvalds 
12951da177e4SLinus Torvalds 	cp->control = ctl_cp;
12961da177e4SLinus Torvalds 	atomic_inc(&ctl_cp->n_control);
12971da177e4SLinus Torvalds }
12981da177e4SLinus Torvalds 
129907dcc686SSimon Horman /* IPVS netns init & cleanup functions */
13005c3a0fd7SJoe Perches int ip_vs_estimator_net_init(struct net *net);
13015c3a0fd7SJoe Perches int ip_vs_control_net_init(struct net *net);
13025c3a0fd7SJoe Perches int ip_vs_protocol_net_init(struct net *net);
13035c3a0fd7SJoe Perches int ip_vs_app_net_init(struct net *net);
13045c3a0fd7SJoe Perches int ip_vs_conn_net_init(struct net *net);
13055c3a0fd7SJoe Perches int ip_vs_sync_net_init(struct net *net);
13065c3a0fd7SJoe Perches void ip_vs_conn_net_cleanup(struct net *net);
13075c3a0fd7SJoe Perches void ip_vs_app_net_cleanup(struct net *net);
13085c3a0fd7SJoe Perches void ip_vs_protocol_net_cleanup(struct net *net);
13095c3a0fd7SJoe Perches void ip_vs_control_net_cleanup(struct net *net);
13105c3a0fd7SJoe Perches void ip_vs_estimator_net_cleanup(struct net *net);
13115c3a0fd7SJoe Perches void ip_vs_sync_net_cleanup(struct net *net);
13125c3a0fd7SJoe Perches void ip_vs_service_net_cleanup(struct net *net);
13131da177e4SLinus Torvalds 
131407dcc686SSimon Horman /* IPVS application functions
13151da177e4SLinus Torvalds  * (from ip_vs_app.c)
13161da177e4SLinus Torvalds  */
13171da177e4SLinus Torvalds #define IP_VS_APP_MAX_PORTS  8
13185c3a0fd7SJoe Perches struct ip_vs_app *register_ip_vs_app(struct net *net, struct ip_vs_app *app);
13195c3a0fd7SJoe Perches void unregister_ip_vs_app(struct net *net, struct ip_vs_app *app);
13205c3a0fd7SJoe Perches int ip_vs_bind_app(struct ip_vs_conn *cp, struct ip_vs_protocol *pp);
13215c3a0fd7SJoe Perches void ip_vs_unbind_app(struct ip_vs_conn *cp);
13225c3a0fd7SJoe Perches int register_ip_vs_app_inc(struct net *net, struct ip_vs_app *app, __u16 proto,
13235c3a0fd7SJoe Perches 			   __u16 port);
13245c3a0fd7SJoe Perches int ip_vs_app_inc_get(struct ip_vs_app *inc);
13255c3a0fd7SJoe Perches void ip_vs_app_inc_put(struct ip_vs_app *inc);
13261da177e4SLinus Torvalds 
int ip_vs_app_pkt_out(struct ip_vs_conn *cp, struct sk_buff *skb);
int ip_vs_app_pkt_in(struct ip_vs_conn *cp, struct sk_buff *skb);
13291da177e4SLinus Torvalds 
13308be67a66SSimon Horman int register_ip_vs_pe(struct ip_vs_pe *pe);
13318be67a66SSimon Horman int unregister_ip_vs_pe(struct ip_vs_pe *pe);
1332e9e5eee8SSimon Horman struct ip_vs_pe *ip_vs_pe_getbyname(const char *name);
1333fe5e7a1eSHans Schillstrom struct ip_vs_pe *__ip_vs_pe_getbyname(const char *pe_name);
1334e9e5eee8SSimon Horman 
/* Use a #define to avoid all of module.h just for these trivial ops.
 *
 * ip_vs_pe_get() calls __module_get() on pe->module when both @pe and
 * pe->module are non-NULL, and does nothing otherwise.
 *
 * The body is wrapped in do { } while (0) so that the macro expands to
 * exactly one statement and can be used safely in an unbraced if/else.
 * @pe is evaluated more than once, so it must be free of side effects.
 */
#define ip_vs_pe_get(pe)				\
	do {						\
		if ((pe) && (pe)->module)		\
			__module_get((pe)->module);	\
	} while (0)
1339e9e5eee8SSimon Horman 
/* ip_vs_pe_put() calls module_put() on pe->module when both @pe and
 * pe->module are non-NULL, and does nothing otherwise.
 *
 * Kept as a macro, but wrapped in do { } while (0) so that it expands to
 * exactly one statement and can be used safely in an unbraced if/else.
 * @pe is evaluated more than once, so it must be free of side effects.
 */
#define ip_vs_pe_put(pe)				\
	do {						\
		if ((pe) && (pe)->module)		\
			module_put((pe)->module);	\
	} while (0)
13431da177e4SLinus Torvalds 
134407dcc686SSimon Horman /* IPVS protocol functions (from ip_vs_proto.c) */
13455c3a0fd7SJoe Perches int ip_vs_protocol_init(void);
13465c3a0fd7SJoe Perches void ip_vs_protocol_cleanup(void);
13475c3a0fd7SJoe Perches void ip_vs_protocol_timeout_change(struct netns_ipvs *ipvs, int flags);
13485c3a0fd7SJoe Perches int *ip_vs_create_timeout_table(int *table, int size);
13495c3a0fd7SJoe Perches int ip_vs_set_state_timeout(int *table, int num, const char *const *names,
135036cbd3dcSJan Engelhardt 			    const char *name, int to);
13515c3a0fd7SJoe Perches void ip_vs_tcpudp_debug_packet(int af, struct ip_vs_protocol *pp,
13525c3a0fd7SJoe Perches 			       const struct sk_buff *skb, int offset,
13535c3a0fd7SJoe Perches 			       const char *msg);
13541da177e4SLinus Torvalds 
13551da177e4SLinus Torvalds extern struct ip_vs_protocol ip_vs_protocol_tcp;
13561da177e4SLinus Torvalds extern struct ip_vs_protocol ip_vs_protocol_udp;
13571da177e4SLinus Torvalds extern struct ip_vs_protocol ip_vs_protocol_icmp;
13581da177e4SLinus Torvalds extern struct ip_vs_protocol ip_vs_protocol_esp;
13591da177e4SLinus Torvalds extern struct ip_vs_protocol ip_vs_protocol_ah;
13602906f66aSVenkata Mohan Reddy extern struct ip_vs_protocol ip_vs_protocol_sctp;
13611da177e4SLinus Torvalds 
136207dcc686SSimon Horman /* Registering/unregistering scheduler functions
13631da177e4SLinus Torvalds  * (from ip_vs_sched.c)
13641da177e4SLinus Torvalds  */
13655c3a0fd7SJoe Perches int register_ip_vs_scheduler(struct ip_vs_scheduler *scheduler);
13665c3a0fd7SJoe Perches int unregister_ip_vs_scheduler(struct ip_vs_scheduler *scheduler);
13675c3a0fd7SJoe Perches int ip_vs_bind_scheduler(struct ip_vs_service *svc,
13681da177e4SLinus Torvalds 			 struct ip_vs_scheduler *scheduler);
13695c3a0fd7SJoe Perches void ip_vs_unbind_scheduler(struct ip_vs_service *svc,
1370ceec4c38SJulian Anastasov 			    struct ip_vs_scheduler *sched);
13715c3a0fd7SJoe Perches struct ip_vs_scheduler *ip_vs_scheduler_get(const char *sched_name);
13725c3a0fd7SJoe Perches void ip_vs_scheduler_put(struct ip_vs_scheduler *scheduler);
13735c3a0fd7SJoe Perches struct ip_vs_conn *
1374190ecd27SJulian Anastasov ip_vs_schedule(struct ip_vs_service *svc, struct sk_buff *skb,
1375d4383f04SJesper Dangaard Brouer 	       struct ip_vs_proto_data *pd, int *ignored,
1376d4383f04SJesper Dangaard Brouer 	       struct ip_vs_iphdr *iph);
13775c3a0fd7SJoe Perches int ip_vs_leave(struct ip_vs_service *svc, struct sk_buff *skb,
1378d4383f04SJesper Dangaard Brouer 		struct ip_vs_proto_data *pd, struct ip_vs_iphdr *iph);
13791da177e4SLinus Torvalds 
13805c3a0fd7SJoe Perches void ip_vs_scheduler_err(struct ip_vs_service *svc, const char *msg);
138141ac51eeSPatrick Schaaf 
138207dcc686SSimon Horman /* IPVS control data and functions (from ip_vs_ctl.c) */
13831da177e4SLinus Torvalds extern struct ip_vs_stats ip_vs_stats;
1384b880c1f0SHans Schillstrom extern int sysctl_ip_vs_sync_ver;
13851da177e4SLinus Torvalds 
13865c3a0fd7SJoe Perches struct ip_vs_service *
1387ceec4c38SJulian Anastasov ip_vs_service_find(struct net *net, int af, __u32 fwmark, __u16 protocol,
13883c2e0505SJulius Volz 		  const union nf_inet_addr *vaddr, __be16 vport);
13891da177e4SLinus Torvalds 
13905c3a0fd7SJoe Perches bool ip_vs_has_real_service(struct net *net, int af, __u16 protocol,
13917937df15SJulius Volz 			    const union nf_inet_addr *daddr, __be16 dport);
13927937df15SJulius Volz 
13935c3a0fd7SJoe Perches int ip_vs_use_count_inc(void);
13945c3a0fd7SJoe Perches void ip_vs_use_count_dec(void);
13955c3a0fd7SJoe Perches int ip_vs_register_nl_ioctl(void);
13965c3a0fd7SJoe Perches void ip_vs_unregister_nl_ioctl(void);
13975c3a0fd7SJoe Perches int ip_vs_control_init(void);
13985c3a0fd7SJoe Perches void ip_vs_control_cleanup(void);
13995c3a0fd7SJoe Perches struct ip_vs_dest *
1400655eef10SAlex Gartrell ip_vs_find_dest(struct net *net, int svc_af, int dest_af,
1401655eef10SAlex Gartrell 		const union nf_inet_addr *daddr, __be16 dport,
1402655eef10SAlex Gartrell 		const union nf_inet_addr *vaddr, __be16 vport,
140352793dbeSJulian Anastasov 		__u16 protocol, __u32 fwmark, __u32 flags);
14045c3a0fd7SJoe Perches void ip_vs_try_bind_dest(struct ip_vs_conn *cp);
14051da177e4SLinus Torvalds 
1406fca9c20aSJulian Anastasov static inline void ip_vs_dest_hold(struct ip_vs_dest *dest)
1407fca9c20aSJulian Anastasov {
1408fca9c20aSJulian Anastasov 	atomic_inc(&dest->refcnt);
1409fca9c20aSJulian Anastasov }
1410fca9c20aSJulian Anastasov 
1411fca9c20aSJulian Anastasov static inline void ip_vs_dest_put(struct ip_vs_dest *dest)
1412fca9c20aSJulian Anastasov {
14134e857c58SPeter Zijlstra 	smp_mb__before_atomic();
1414fca9c20aSJulian Anastasov 	atomic_dec(&dest->refcnt);
1415fca9c20aSJulian Anastasov }
14161da177e4SLinus Torvalds 
14179e4e948aSJulian Anastasov static inline void ip_vs_dest_put_and_free(struct ip_vs_dest *dest)
14189e4e948aSJulian Anastasov {
14199e4e948aSJulian Anastasov 	if (atomic_dec_return(&dest->refcnt) < 0)
14209e4e948aSJulian Anastasov 		kfree(dest);
14219e4e948aSJulian Anastasov }
14229e4e948aSJulian Anastasov 
142307dcc686SSimon Horman /* IPVS sync daemon data and function prototypes
14241da177e4SLinus Torvalds  * (from ip_vs_sync.c)
14251da177e4SLinus Torvalds  */
1426e4ff6751SJulian Anastasov int start_sync_thread(struct net *net, struct ipvs_sync_daemon_cfg *cfg,
1427e4ff6751SJulian Anastasov 		      int state);
14285c3a0fd7SJoe Perches int stop_sync_thread(struct net *net, int state);
14295c3a0fd7SJoe Perches void ip_vs_sync_conn(struct net *net, struct ip_vs_conn *cp, int pkts);
14301da177e4SLinus Torvalds 
143107dcc686SSimon Horman /* IPVS rate estimator prototypes (from ip_vs_est.c) */
14325c3a0fd7SJoe Perches void ip_vs_start_estimator(struct net *net, struct ip_vs_stats *stats);
14335c3a0fd7SJoe Perches void ip_vs_stop_estimator(struct net *net, struct ip_vs_stats *stats);
14345c3a0fd7SJoe Perches void ip_vs_zero_estimator(struct ip_vs_stats *stats);
1435cd67cd5eSJulian Anastasov void ip_vs_read_estimator(struct ip_vs_kstats *dst, struct ip_vs_stats *stats);
14361da177e4SLinus Torvalds 
143707dcc686SSimon Horman /* Various IPVS packet transmitters (from ip_vs_xmit.c) */
14385c3a0fd7SJoe Perches int ip_vs_null_xmit(struct sk_buff *skb, struct ip_vs_conn *cp,
1439d4383f04SJesper Dangaard Brouer 		    struct ip_vs_protocol *pp, struct ip_vs_iphdr *iph);
14405c3a0fd7SJoe Perches int ip_vs_bypass_xmit(struct sk_buff *skb, struct ip_vs_conn *cp,
1441d4383f04SJesper Dangaard Brouer 		      struct ip_vs_protocol *pp, struct ip_vs_iphdr *iph);
14425c3a0fd7SJoe Perches int ip_vs_nat_xmit(struct sk_buff *skb, struct ip_vs_conn *cp,
1443d4383f04SJesper Dangaard Brouer 		   struct ip_vs_protocol *pp, struct ip_vs_iphdr *iph);
14445c3a0fd7SJoe Perches int ip_vs_tunnel_xmit(struct sk_buff *skb, struct ip_vs_conn *cp,
14455c3a0fd7SJoe Perches 		      struct ip_vs_protocol *pp, struct ip_vs_iphdr *iph);
14465c3a0fd7SJoe Perches int ip_vs_dr_xmit(struct sk_buff *skb, struct ip_vs_conn *cp,
14475c3a0fd7SJoe Perches 		  struct ip_vs_protocol *pp, struct ip_vs_iphdr *iph);
14485c3a0fd7SJoe Perches int ip_vs_icmp_xmit(struct sk_buff *skb, struct ip_vs_conn *cp,
1449d4383f04SJesper Dangaard Brouer 		    struct ip_vs_protocol *pp, int offset,
1450d4383f04SJesper Dangaard Brouer 		    unsigned int hooknum, struct ip_vs_iphdr *iph);
14515c3a0fd7SJoe Perches void ip_vs_dest_dst_rcu_free(struct rcu_head *head);
14521da177e4SLinus Torvalds 
1453b3cdd2a7SJulius Volz #ifdef CONFIG_IP_VS_IPV6
14545c3a0fd7SJoe Perches int ip_vs_bypass_xmit_v6(struct sk_buff *skb, struct ip_vs_conn *cp,
1455d4383f04SJesper Dangaard Brouer 			 struct ip_vs_protocol *pp, struct ip_vs_iphdr *iph);
14565c3a0fd7SJoe Perches int ip_vs_nat_xmit_v6(struct sk_buff *skb, struct ip_vs_conn *cp,
14575c3a0fd7SJoe Perches 		      struct ip_vs_protocol *pp, struct ip_vs_iphdr *iph);
14585c3a0fd7SJoe Perches int ip_vs_tunnel_xmit_v6(struct sk_buff *skb, struct ip_vs_conn *cp,
14595c3a0fd7SJoe Perches 			 struct ip_vs_protocol *pp, struct ip_vs_iphdr *iph);
14605c3a0fd7SJoe Perches int ip_vs_dr_xmit_v6(struct sk_buff *skb, struct ip_vs_conn *cp,
14615c3a0fd7SJoe Perches 		     struct ip_vs_protocol *pp, struct ip_vs_iphdr *iph);
14625c3a0fd7SJoe Perches int ip_vs_icmp_xmit_v6(struct sk_buff *skb, struct ip_vs_conn *cp,
1463d4383f04SJesper Dangaard Brouer 		       struct ip_vs_protocol *pp, int offset,
1464d4383f04SJesper Dangaard Brouer 		       unsigned int hooknum, struct ip_vs_iphdr *iph);
1465b3cdd2a7SJulius Volz #endif
14661da177e4SLinus Torvalds 
#ifdef CONFIG_SYSCTL
/* Simple mechanism to ignore packets when we are loaded: set drop_rate to
 * 'n' and roughly one call in n asks for the packet to be dropped.
 *
 * With a zero drop_rate nothing is touched and 0 is returned.  Otherwise
 * drop_counter is decremented; once it is no longer positive it is
 * reloaded from drop_rate and 1 ("drop") is returned, else 0.
 */
static inline int ip_vs_todrop(struct netns_ipvs *ipvs)
{
	if (ipvs->drop_rate && --ipvs->drop_counter <= 0) {
		ipvs->drop_counter = ipvs->drop_rate;
		return 1;
	}

	return 0;
}
#else
/* Without CONFIG_SYSCTL this never asks for a drop. */
static inline int ip_vs_todrop(struct netns_ipvs *ipvs)
{
	return 0;
}
#endif
14841da177e4SLinus Torvalds 
/* IP_VS_FWD_METHOD yields the bits of cp->flags selected by
 * IP_VS_CONN_F_FWD_MASK; ip_vs_fwd_tag() below returns the forwarding tag
 * of the connection derived from them.
 *
 * @cp is parenthesised so that any pointer expression (e.g. "conns + 1")
 * can be passed, not just a plain identifier.
 */
#define IP_VS_FWD_METHOD(cp)  ((cp)->flags & IP_VS_CONN_F_FWD_MASK)
14871da177e4SLinus Torvalds 
1488732db659SAdrian Bunk static inline char ip_vs_fwd_tag(struct ip_vs_conn *cp)
14891da177e4SLinus Torvalds {
14901da177e4SLinus Torvalds 	char fwd;
14911da177e4SLinus Torvalds 
14921da177e4SLinus Torvalds 	switch (IP_VS_FWD_METHOD(cp)) {
14931da177e4SLinus Torvalds 	case IP_VS_CONN_F_MASQ:
14941da177e4SLinus Torvalds 		fwd = 'M'; break;
14951da177e4SLinus Torvalds 	case IP_VS_CONN_F_LOCALNODE:
14961da177e4SLinus Torvalds 		fwd = 'L'; break;
14971da177e4SLinus Torvalds 	case IP_VS_CONN_F_TUNNEL:
14981da177e4SLinus Torvalds 		fwd = 'T'; break;
14991da177e4SLinus Torvalds 	case IP_VS_CONN_F_DROUTE:
15001da177e4SLinus Torvalds 		fwd = 'R'; break;
15011da177e4SLinus Torvalds 	case IP_VS_CONN_F_BYPASS:
15021da177e4SLinus Torvalds 		fwd = 'B'; break;
15031da177e4SLinus Torvalds 	default:
15041da177e4SLinus Torvalds 		fwd = '?'; break;
15051da177e4SLinus Torvalds 	}
15061da177e4SLinus Torvalds 	return fwd;
15071da177e4SLinus Torvalds }
15081da177e4SLinus Torvalds 
15095c3a0fd7SJoe Perches void ip_vs_nat_icmp(struct sk_buff *skb, struct ip_vs_protocol *pp,
15101da177e4SLinus Torvalds 		    struct ip_vs_conn *cp, int dir);
15111da177e4SLinus Torvalds 
1512b3cdd2a7SJulius Volz #ifdef CONFIG_IP_VS_IPV6
15135c3a0fd7SJoe Perches void ip_vs_nat_icmp_v6(struct sk_buff *skb, struct ip_vs_protocol *pp,
1514b3cdd2a7SJulius Volz 		       struct ip_vs_conn *cp, int dir);
1515b3cdd2a7SJulius Volz #endif
1516b3cdd2a7SJulius Volz 
15175c3a0fd7SJoe Perches __sum16 ip_vs_checksum_complete(struct sk_buff *skb, int offset);
15181da177e4SLinus Torvalds 
1519f9214b26SAl Viro static inline __wsum ip_vs_check_diff4(__be32 old, __be32 new, __wsum oldsum)
15201da177e4SLinus Torvalds {
1521f9214b26SAl Viro 	__be32 diff[2] = { ~old, new };
15221da177e4SLinus Torvalds 
152307f0757aSJoe Perches 	return csum_partial(diff, sizeof(diff), oldsum);
1524f9214b26SAl Viro }
1525f9214b26SAl Viro 
#ifdef CONFIG_IP_VS_IPV6
/* Checksum adjustment for a replaced 16-byte value given as four 32-bit
 * words: feeds ~old[3..0] followed by new[3..0] to csum_partial() on top
 * of @oldsum and returns the result.
 */
static inline __wsum ip_vs_check_diff16(const __be32 *old, const __be32 *new,
					__wsum oldsum)
{
	__be32 diff[8];
	int i;

	/* both halves are laid out from word 3 down to word 0 */
	for (i = 0; i < 4; i++) {
		diff[i] = ~old[3 - i];
		diff[4 + i] = new[3 - i];
	}

	return csum_partial(diff, sizeof(diff), oldsum);
}
#endif
15360bbdd42bSJulius Volz 
1537f9214b26SAl Viro static inline __wsum ip_vs_check_diff2(__be16 old, __be16 new, __wsum oldsum)
1538f9214b26SAl Viro {
1539f9214b26SAl Viro 	__be16 diff[2] = { ~old, new };
1540f9214b26SAl Viro 
154107f0757aSJoe Perches 	return csum_partial(diff, sizeof(diff), oldsum);
15421da177e4SLinus Torvalds }
15431da177e4SLinus Torvalds 
/* Forget current conntrack (unconfirmed) and attach notrack entry.
 *
 * Nothing is changed when @skb already carries a conntrack for which
 * nf_ct_is_untracked() is true.  Otherwise the reference held through
 * skb->nfct is put, skb->nfct is pointed at the untracked conntrack with
 * ctinfo IP_CT_NEW, and a reference is taken on it.
 *
 * The function body is empty when conntrack is neither built in nor
 * built as a module.
 */
static inline void ip_vs_notrack(struct sk_buff *skb)
{
#if defined(CONFIG_NF_CONNTRACK) || defined(CONFIG_NF_CONNTRACK_MODULE)
	enum ip_conntrack_info ctinfo;
	struct nf_conn *ct;

	ct = nf_ct_get(skb, &ctinfo);
	if (ct && nf_ct_is_untracked(ct))
		return;		/* already the untracked entry */

	/* release the old attachment before installing the replacement */
	nf_conntrack_put(skb->nfct);
	skb->nfct = &nf_ct_untracked_get()->ct_general;
	skb->nfctinfo = IP_CT_NEW;
	nf_conntrack_get(skb->nfct);
#endif
}
1559cf356d69SJulian Anastasov 
1560f4bc17cdSJulian Anastasov #ifdef CONFIG_IP_VS_NFCT
156107dcc686SSimon Horman /* Netfilter connection tracking
1562f4bc17cdSJulian Anastasov  * (from ip_vs_nfct.c)
1563f4bc17cdSJulian Anastasov  */
/* Report the per-netns conntrack setting: ipvs->sysctl_conntrack when
 * CONFIG_SYSCTL is set, 0 (without looking at @ipvs) otherwise.
 */
static inline int ip_vs_conntrack_enabled(struct netns_ipvs *ipvs)
{
	int enabled = 0;

#ifdef CONFIG_SYSCTL
	enabled = ipvs->sysctl_conntrack;
#endif
	return enabled;
}
1572f4bc17cdSJulian Anastasov 
15735c3a0fd7SJoe Perches void ip_vs_update_conntrack(struct sk_buff *skb, struct ip_vs_conn *cp,
15746523ce15SJulian Anastasov 			    int outin);
15755c3a0fd7SJoe Perches int ip_vs_confirm_conntrack(struct sk_buff *skb);
15765c3a0fd7SJoe Perches void ip_vs_nfct_expect_related(struct sk_buff *skb, struct nf_conn *ct,
1577f4bc17cdSJulian Anastasov 			       struct ip_vs_conn *cp, u_int8_t proto,
1578f4bc17cdSJulian Anastasov 			       const __be16 port, int from_rs);
15795c3a0fd7SJoe Perches void ip_vs_conn_drop_conntrack(struct ip_vs_conn *cp);
1580f4bc17cdSJulian Anastasov 
1581f4bc17cdSJulian Anastasov #else
1582f4bc17cdSJulian Anastasov 
/* Variant for builds without CONFIG_IP_VS_NFCT: always 0, @ipvs is not
 * consulted.
 */
static inline int ip_vs_conntrack_enabled(struct netns_ipvs *ipvs)
{
	return 0;
}
1587f4bc17cdSJulian Anastasov 
/* Variant for builds without CONFIG_IP_VS_NFCT: intentionally does
 * nothing with @skb, @cp or @outin.
 */
static inline void ip_vs_update_conntrack(struct sk_buff *skb,
					  struct ip_vs_conn *cp, int outin)
{
}
1592f4bc17cdSJulian Anastasov 
1593e23ebf0fSKrzysztof Wilczynski static inline int ip_vs_confirm_conntrack(struct sk_buff *skb)
1594f4bc17cdSJulian Anastasov {
1595f4bc17cdSJulian Anastasov 	return NF_ACCEPT;
1596f4bc17cdSJulian Anastasov }
1597f4bc17cdSJulian Anastasov 
/* Variant for builds without CONFIG_IP_VS_NFCT: intentionally does
 * nothing with @cp.
 */
static inline void ip_vs_conn_drop_conntrack(struct ip_vs_conn *cp)
{
}
160107dcc686SSimon Horman #endif /* CONFIG_IP_VS_NFCT */
16026523ce15SJulian Anastasov 
1603c16526a7SSimon Kirby static inline int
1604b552f7e3SChangli Gao ip_vs_dest_conn_overhead(struct ip_vs_dest *dest)
1605b552f7e3SChangli Gao {
160607dcc686SSimon Horman 	/* We think the overhead of processing active connections is 256
1607b552f7e3SChangli Gao 	 * times higher than that of inactive connections in average. (This
1608b552f7e3SChangli Gao 	 * 256 times might not be accurate, we will change it later) We
1609b552f7e3SChangli Gao 	 * use the following formula to estimate the overhead now:
1610b552f7e3SChangli Gao 	 *		  dest->activeconns*256 + dest->inactconns
1611b552f7e3SChangli Gao 	 */
1612b552f7e3SChangli Gao 	return (atomic_read(&dest->activeconns) << 8) +
1613b552f7e3SChangli Gao 		atomic_read(&dest->inactconns);
1614b552f7e3SChangli Gao }
1615b552f7e3SChangli Gao 
1616bc4768ebSJulius Volz #endif	/* _NET_IP_VS_H */
1617