xref: /openbmc/linux/include/net/ip_vs.h (revision 391f503d69779867f05e9296ae523e9002c2d7ee)
11da177e4SLinus Torvalds /*
21da177e4SLinus Torvalds  *      IP Virtual Server
31da177e4SLinus Torvalds  *      data structure and functionality definitions
41da177e4SLinus Torvalds  */
51da177e4SLinus Torvalds 
6bc4768ebSJulius Volz #ifndef _NET_IP_VS_H
7bc4768ebSJulius Volz #define _NET_IP_VS_H
81da177e4SLinus Torvalds 
9bc4768ebSJulius Volz #include <linux/ip_vs.h>                /* definitions shared with userland */
101da177e4SLinus Torvalds 
11bc4768ebSJulius Volz #include <asm/types.h>                  /* for __uXX types */
12bc4768ebSJulius Volz 
131da177e4SLinus Torvalds #include <linux/list.h>                 /* for struct list_head */
141da177e4SLinus Torvalds #include <linux/spinlock.h>             /* for struct rwlock_t */
1560063497SArun Sharma #include <linux/atomic.h>                 /* for struct atomic_t */
161da177e4SLinus Torvalds #include <linux/compiler.h>
1714c85021SArnaldo Carvalho de Melo #include <linux/timer.h>
18187f1882SPaul Gortmaker #include <linux/bug.h>
191da177e4SLinus Torvalds 
2014c85021SArnaldo Carvalho de Melo #include <net/checksum.h>
21e7ade46aSJulius Volz #include <linux/netfilter.h>		/* for union nf_inet_addr */
221668e010SKOVACS Krisztian #include <linux/ip.h>
23e7ade46aSJulius Volz #include <linux/ipv6.h>			/* for struct ipv6hdr */
244e3fd7a0SAlexey Dobriyan #include <net/ipv6.h>
2554d83efaSJesper Dangaard Brouer #if IS_ENABLED(CONFIG_IP_VS_IPV6)
2663dca2c0SJesper Dangaard Brouer #include <linux/netfilter_ipv6/ip6_tables.h>
2763dca2c0SJesper Dangaard Brouer #endif
28a638e514SJesper Dangaard Brouer #if IS_ENABLED(CONFIG_NF_CONNTRACK)
29f4bc17cdSJulian Anastasov #include <net/netfilter/nf_conntrack.h>
30f4bc17cdSJulian Anastasov #endif
3161b1ab45SHans Schillstrom #include <net/net_namespace.h>		/* Netw namespace */
3261b1ab45SHans Schillstrom 
3361b1ab45SHans Schillstrom /*
3461b1ab45SHans Schillstrom  * Generic access of ipvs struct
3561b1ab45SHans Schillstrom  */
3661b1ab45SHans Schillstrom static inline struct netns_ipvs *net_ipvs(struct net* net)
3761b1ab45SHans Schillstrom {
3861b1ab45SHans Schillstrom 	return net->ipvs;
3961b1ab45SHans Schillstrom }
40fc723250SHans Schillstrom /*
41fc723250SHans Schillstrom  * Get net ptr from skb in traffic cases
42fc723250SHans Schillstrom  * use skb_sknet when call is from userland (ioctl or netlink)
43fc723250SHans Schillstrom  */
44a0840e2eSHans Schillstrom static inline struct net *skb_net(const struct sk_buff *skb)
45fc723250SHans Schillstrom {
46fc723250SHans Schillstrom #ifdef CONFIG_NET_NS
47fc723250SHans Schillstrom #ifdef CONFIG_IP_VS_DEBUG
48fc723250SHans Schillstrom 	/*
49fc723250SHans Schillstrom 	 * This is used for debug only.
50fc723250SHans Schillstrom 	 * Start with the most likely hit
51fc723250SHans Schillstrom 	 * End with BUG
52fc723250SHans Schillstrom 	 */
53fc723250SHans Schillstrom 	if (likely(skb->dev && skb->dev->nd_net))
54fc723250SHans Schillstrom 		return dev_net(skb->dev);
55a09d1977SHans Schillstrom 	if (skb_dst(skb) && skb_dst(skb)->dev)
56fc723250SHans Schillstrom 		return dev_net(skb_dst(skb)->dev);
57fc723250SHans Schillstrom 	WARN(skb->sk, "Maybe skb_sknet should be used in %s() at line:%d\n",
58fc723250SHans Schillstrom 		      __func__, __LINE__);
59fc723250SHans Schillstrom 	if (likely(skb->sk && skb->sk->sk_net))
60fc723250SHans Schillstrom 		return sock_net(skb->sk);
61fc723250SHans Schillstrom 	pr_err("There is no net ptr to find in the skb in %s() line:%d\n",
62fc723250SHans Schillstrom 		__func__, __LINE__);
63fc723250SHans Schillstrom 	BUG();
64fc723250SHans Schillstrom #else
65fc723250SHans Schillstrom 	return dev_net(skb->dev ? : skb_dst(skb)->dev);
66fc723250SHans Schillstrom #endif
67fc723250SHans Schillstrom #else
68fc723250SHans Schillstrom 	return &init_net;
69fc723250SHans Schillstrom #endif
70fc723250SHans Schillstrom }
71fc723250SHans Schillstrom 
72a0840e2eSHans Schillstrom static inline struct net *skb_sknet(const struct sk_buff *skb)
73fc723250SHans Schillstrom {
74fc723250SHans Schillstrom #ifdef CONFIG_NET_NS
75fc723250SHans Schillstrom #ifdef CONFIG_IP_VS_DEBUG
76fc723250SHans Schillstrom 	/* Start with the most likely hit */
77fc723250SHans Schillstrom 	if (likely(skb->sk && skb->sk->sk_net))
78fc723250SHans Schillstrom 		return sock_net(skb->sk);
79fc723250SHans Schillstrom 	WARN(skb->dev, "Maybe skb_net should be used instead in %s() line:%d\n",
80fc723250SHans Schillstrom 		       __func__, __LINE__);
81fc723250SHans Schillstrom 	if (likely(skb->dev && skb->dev->nd_net))
82fc723250SHans Schillstrom 		return dev_net(skb->dev);
83fc723250SHans Schillstrom 	pr_err("There is no net ptr to find in the skb in %s() line:%d\n",
84fc723250SHans Schillstrom 		__func__, __LINE__);
85fc723250SHans Schillstrom 	BUG();
86fc723250SHans Schillstrom #else
87fc723250SHans Schillstrom 	return sock_net(skb->sk);
88fc723250SHans Schillstrom #endif
89fc723250SHans Schillstrom #else
90fc723250SHans Schillstrom 	return &init_net;
91fc723250SHans Schillstrom #endif
92fc723250SHans Schillstrom }
93b17fc996SHans Schillstrom /*
94b17fc996SHans Schillstrom  * This one needed for single_open_net since net is stored directly in
9525985edcSLucas De Marchi  * private not as a struct i.e. seq_file_net can't be used.
96b17fc996SHans Schillstrom  */
97b17fc996SHans Schillstrom static inline struct net *seq_file_single_net(struct seq_file *seq)
98b17fc996SHans Schillstrom {
99b17fc996SHans Schillstrom #ifdef CONFIG_NET_NS
100b17fc996SHans Schillstrom 	return (struct net *)seq->private;
101b17fc996SHans Schillstrom #else
102b17fc996SHans Schillstrom 	return &init_net;
103b17fc996SHans Schillstrom #endif
104b17fc996SHans Schillstrom }
1056f7edb48SCatalin(ux) M. BOIE 
1066f7edb48SCatalin(ux) M. BOIE /* Connections' size value needed by ip_vs_ctl.c */
1076f7edb48SCatalin(ux) M. BOIE extern int ip_vs_conn_tab_size;
1086f7edb48SCatalin(ux) M. BOIE 
10964aae3cbSJulius Volz struct ip_vs_iphdr {
11063dca2c0SJesper Dangaard Brouer 	__u32 len;	/* IPv4 simply where L4 starts
11163dca2c0SJesper Dangaard Brouer 			   IPv6 where L4 Transport Header starts */
11263dca2c0SJesper Dangaard Brouer 	__u16 fragoffs; /* IPv6 fragment offset, 0 if first frag (or not frag)*/
11363dca2c0SJesper Dangaard Brouer 	__s16 protocol;
11463dca2c0SJesper Dangaard Brouer 	__s32 flags;
11564aae3cbSJulius Volz 	union nf_inet_addr saddr;
11664aae3cbSJulius Volz 	union nf_inet_addr daddr;
11764aae3cbSJulius Volz };
11864aae3cbSJulius Volz 
/*
 * frag_safe_skb_hp - thin wrapper around skb_header_pointer()
 * @skb:    packet to read from
 * @offset: offset handed to skb_header_pointer()
 * @len:    length handed to skb_header_pointer()
 * @buffer: caller-provided buffer handed to skb_header_pointer()
 * @ipvsh:  not used by this implementation
 *
 * Returns whatever skb_header_pointer() returns.
 */
static inline void *frag_safe_skb_hp(const struct sk_buff *skb, int offset,
				      int len, void *buffer,
				      const struct ip_vs_iphdr *ipvsh)
{
	void *hdr = skb_header_pointer(skb, offset, len, buffer);

	return hdr;
}
1252f74713dSJesper Dangaard Brouer 
12664aae3cbSJulius Volz static inline void
12763dca2c0SJesper Dangaard Brouer ip_vs_fill_ip4hdr(const void *nh, struct ip_vs_iphdr *iphdr)
12863dca2c0SJesper Dangaard Brouer {
12963dca2c0SJesper Dangaard Brouer 	const struct iphdr *iph = nh;
13063dca2c0SJesper Dangaard Brouer 
13163dca2c0SJesper Dangaard Brouer 	iphdr->len	= iph->ihl * 4;
13263dca2c0SJesper Dangaard Brouer 	iphdr->fragoffs	= 0;
13363dca2c0SJesper Dangaard Brouer 	iphdr->protocol	= iph->protocol;
13463dca2c0SJesper Dangaard Brouer 	iphdr->saddr.ip	= iph->saddr;
13563dca2c0SJesper Dangaard Brouer 	iphdr->daddr.ip	= iph->daddr;
13663dca2c0SJesper Dangaard Brouer }
13763dca2c0SJesper Dangaard Brouer 
13863dca2c0SJesper Dangaard Brouer /* This function handles filling *ip_vs_iphdr, both for IPv4 and IPv6.
13963dca2c0SJesper Dangaard Brouer  * IPv6 requires some extra work, as finding proper header position,
14063dca2c0SJesper Dangaard Brouer  * depend on the IPv6 extension headers.
14163dca2c0SJesper Dangaard Brouer  */
14263dca2c0SJesper Dangaard Brouer static inline void
14363dca2c0SJesper Dangaard Brouer ip_vs_fill_iph_skb(int af, const struct sk_buff *skb, struct ip_vs_iphdr *iphdr)
14464aae3cbSJulius Volz {
14564aae3cbSJulius Volz #ifdef CONFIG_IP_VS_IPV6
14664aae3cbSJulius Volz 	if (af == AF_INET6) {
14763dca2c0SJesper Dangaard Brouer 		const struct ipv6hdr *iph =
14863dca2c0SJesper Dangaard Brouer 			(struct ipv6hdr *)skb_network_header(skb);
1494e3fd7a0SAlexey Dobriyan 		iphdr->saddr.in6 = iph->saddr;
1504e3fd7a0SAlexey Dobriyan 		iphdr->daddr.in6 = iph->daddr;
1516aafeef0SJiri Pirko 		/* ipv6_find_hdr() updates len, flags */
15263dca2c0SJesper Dangaard Brouer 		iphdr->len	 = 0;
15363dca2c0SJesper Dangaard Brouer 		iphdr->flags	 = 0;
15463dca2c0SJesper Dangaard Brouer 		iphdr->protocol  = ipv6_find_hdr(skb, &iphdr->len, -1,
15563dca2c0SJesper Dangaard Brouer 						 &iphdr->fragoffs,
15663dca2c0SJesper Dangaard Brouer 						 &iphdr->flags);
15764aae3cbSJulius Volz 	} else
15864aae3cbSJulius Volz #endif
15964aae3cbSJulius Volz 	{
16063dca2c0SJesper Dangaard Brouer 		const struct iphdr *iph =
16163dca2c0SJesper Dangaard Brouer 			(struct iphdr *)skb_network_header(skb);
16264aae3cbSJulius Volz 		iphdr->len	= iph->ihl * 4;
16363dca2c0SJesper Dangaard Brouer 		iphdr->fragoffs	= 0;
16464aae3cbSJulius Volz 		iphdr->protocol	= iph->protocol;
16564aae3cbSJulius Volz 		iphdr->saddr.ip	= iph->saddr;
16664aae3cbSJulius Volz 		iphdr->daddr.ip	= iph->daddr;
16764aae3cbSJulius Volz 	}
16864aae3cbSJulius Volz }
16964aae3cbSJulius Volz 
17064aae3cbSJulius Volz static inline void ip_vs_addr_copy(int af, union nf_inet_addr *dst,
17164aae3cbSJulius Volz 				   const union nf_inet_addr *src)
17264aae3cbSJulius Volz {
17364aae3cbSJulius Volz #ifdef CONFIG_IP_VS_IPV6
17464aae3cbSJulius Volz 	if (af == AF_INET6)
1754e3fd7a0SAlexey Dobriyan 		dst->in6 = src->in6;
17664aae3cbSJulius Volz 	else
17764aae3cbSJulius Volz #endif
17864aae3cbSJulius Volz 	dst->ip = src->ip;
17964aae3cbSJulius Volz }
18064aae3cbSJulius Volz 
1819a05475cSJulian Anastasov static inline void ip_vs_addr_set(int af, union nf_inet_addr *dst,
1829a05475cSJulian Anastasov 				  const union nf_inet_addr *src)
1839a05475cSJulian Anastasov {
1849a05475cSJulian Anastasov #ifdef CONFIG_IP_VS_IPV6
1859a05475cSJulian Anastasov 	if (af == AF_INET6) {
1869a05475cSJulian Anastasov 		dst->in6 = src->in6;
1879a05475cSJulian Anastasov 		return;
1889a05475cSJulian Anastasov 	}
1899a05475cSJulian Anastasov #endif
1909a05475cSJulian Anastasov 	dst->ip = src->ip;
1919a05475cSJulian Anastasov 	dst->all[1] = 0;
1929a05475cSJulian Anastasov 	dst->all[2] = 0;
1939a05475cSJulian Anastasov 	dst->all[3] = 0;
1949a05475cSJulian Anastasov }
1959a05475cSJulian Anastasov 
19664aae3cbSJulius Volz static inline int ip_vs_addr_equal(int af, const union nf_inet_addr *a,
19764aae3cbSJulius Volz 				   const union nf_inet_addr *b)
19864aae3cbSJulius Volz {
19964aae3cbSJulius Volz #ifdef CONFIG_IP_VS_IPV6
20064aae3cbSJulius Volz 	if (af == AF_INET6)
20164aae3cbSJulius Volz 		return ipv6_addr_equal(&a->in6, &b->in6);
20264aae3cbSJulius Volz #endif
20364aae3cbSJulius Volz 	return a->ip == b->ip;
20464aae3cbSJulius Volz }
20564aae3cbSJulius Volz 
#ifdef CONFIG_IP_VS_DEBUG
#include <linux/net.h>

int ip_vs_get_debug_level(void);

/*
 * ip_vs_dbg_addr - format an address into a shared debug buffer
 * @af:      address family; AF_INET6 (with CONFIG_IP_VS_IPV6) prints
 *           "[%pI6c]", anything else prints "%pI4"
 * @buf:     buffer shared by all addresses of one message
 * @buf_len: size of @buf
 * @addr:    address to print
 * @idx:     in/out write position inside @buf
 *
 * The string is written at buf[*idx]; *idx is then advanced by the
 * snprintf() result plus one (for the terminating NUL) so the next address
 * goes behind it.  BUG()s when *idx ends up beyond buf_len + 1.
 *
 * Returns a pointer to the start of the string just written.
 */
static inline const char *ip_vs_dbg_addr(int af, char *buf, size_t buf_len,
					 const union nf_inet_addr *addr,
					 int *idx)
{
	int len;
#ifdef CONFIG_IP_VS_IPV6
	if (af == AF_INET6)
		len = snprintf(&buf[*idx], buf_len - *idx, "[%pI6c]",
			       &addr->in6) + 1;
	else
#endif
		len = snprintf(&buf[*idx], buf_len - *idx, "%pI4",
			       &addr->ip) + 1;

	*idx += len;
	BUG_ON(*idx > buf_len + 1);
	return &buf[*idx - len];
}

/*
 * Debug/error print that provides the scratch buffer and index which
 * IP_VS_DBG_ADDR() needs.  Macro parameters are parenthesised where they
 * are used as operands so that any expression can be passed safely.
 */
#define IP_VS_DBG_BUF(level, msg, ...)					\
	do {								\
		char ip_vs_dbg_buf[160];				\
		int ip_vs_dbg_idx = 0;					\
		if ((level) <= ip_vs_get_debug_level())			\
			printk(KERN_DEBUG pr_fmt(msg), ##__VA_ARGS__);	\
	} while (0)
#define IP_VS_ERR_BUF(msg...)						\
	do {								\
		char ip_vs_dbg_buf[160];				\
		int ip_vs_dbg_idx = 0;					\
		pr_err(msg);						\
	} while (0)

/* Only use from within IP_VS_DBG_BUF() or IP_VS_ERR_BUF macros */
#define IP_VS_DBG_ADDR(af, addr)					\
	ip_vs_dbg_addr(af, ip_vs_dbg_buf,				\
		       sizeof(ip_vs_dbg_buf), addr,			\
		       &ip_vs_dbg_idx)

/* Print at KERN_DEBUG when @level does not exceed the current debug level */
#define IP_VS_DBG(level, msg, ...)					\
	do {								\
		if ((level) <= ip_vs_get_debug_level())			\
			printk(KERN_DEBUG pr_fmt(msg), ##__VA_ARGS__);	\
	} while (0)
/* Print at KERN_DEBUG, gated by net_ratelimit() only */
#define IP_VS_DBG_RL(msg, ...)						\
	do {								\
		if (net_ratelimit())					\
			printk(KERN_DEBUG pr_fmt(msg), ##__VA_ARGS__);	\
	} while (0)
/* Hand the packet to the protocol's debug_packet() hook, level-gated */
#define IP_VS_DBG_PKT(level, af, pp, skb, ofs, msg)			\
	do {								\
		if ((level) <= ip_vs_get_debug_level())			\
			(pp)->debug_packet(af, pp, skb, ofs, msg);	\
	} while (0)
/* Same as IP_VS_DBG_PKT() but additionally gated by net_ratelimit() */
#define IP_VS_DBG_RL_PKT(level, af, pp, skb, ofs, msg)			\
	do {								\
		if ((level) <= ip_vs_get_debug_level() &&		\
		    net_ratelimit())					\
			(pp)->debug_packet(af, pp, skb, ofs, msg);	\
	} while (0)
#else	/* NO DEBUGGING at ALL */
#define IP_VS_DBG_BUF(level, msg...)  do {} while (0)
#define IP_VS_ERR_BUF(msg...)  do {} while (0)
#define IP_VS_DBG(level, msg...)  do {} while (0)
#define IP_VS_DBG_RL(msg...)  do {} while (0)
#define IP_VS_DBG_PKT(level, af, pp, skb, ofs, msg)	do {} while (0)
#define IP_VS_DBG_RL_PKT(level, af, pp, skb, ofs, msg)	do {} while (0)
#endif
2791da177e4SLinus Torvalds 
#define IP_VS_BUG() BUG()
/* pr_err() gated by net_ratelimit() */
#define IP_VS_ERR_RL(msg, ...)						\
	do {								\
		if (net_ratelimit())					\
			pr_err(msg, ##__VA_ARGS__);			\
	} while (0)

/*
 * Function entry/exit tracing.  With CONFIG_IP_VS_DEBUG a KERN_DEBUG line
 * naming the function, file and line is printed when @level does not
 * exceed the current debug level; otherwise both macros expand to nothing.
 * @level is parenthesised so that any expression can be passed safely.
 */
#ifdef CONFIG_IP_VS_DEBUG
#define EnterFunction(level)						\
	do {								\
		if ((level) <= ip_vs_get_debug_level())			\
			printk(KERN_DEBUG				\
			       pr_fmt("Enter: %s, %s line %i\n"),	\
			       __func__, __FILE__, __LINE__);		\
	} while (0)
#define LeaveFunction(level)						\
	do {								\
		if ((level) <= ip_vs_get_debug_level())			\
			printk(KERN_DEBUG				\
			       pr_fmt("Leave: %s, %s line %i\n"),	\
			       __func__, __FILE__, __LINE__);		\
	} while (0)
#else
#define EnterFunction(level)   do {} while (0)
#define LeaveFunction(level)   do {} while (0)
#endif
3061da177e4SLinus Torvalds 
3071da177e4SLinus Torvalds 
/*
 * FTP service port numbers, already converted to network byte order
 * (big endian) so they can be compared with __be16 port fields.
 */
#define FTPPORT		cpu_to_be16(21)
#define FTPDATA		cpu_to_be16(20)
3131da177e4SLinus Torvalds 
/*
 * TCP state values.
 *
 * Numbering starts at 0 and is contiguous, so IP_VS_TCP_S_LAST equals the
 * number of states listed before it.
 */
enum {
	IP_VS_TCP_S_NONE = 0,
	IP_VS_TCP_S_ESTABLISHED,
	IP_VS_TCP_S_SYN_SENT,
	IP_VS_TCP_S_SYN_RECV,
	IP_VS_TCP_S_FIN_WAIT,
	IP_VS_TCP_S_TIME_WAIT,
	IP_VS_TCP_S_CLOSE,
	IP_VS_TCP_S_CLOSE_WAIT,
	IP_VS_TCP_S_LAST_ACK,
	IP_VS_TCP_S_LISTEN,
	IP_VS_TCP_S_SYNACK,
	IP_VS_TCP_S_LAST,	/* sentinel, not a state */
};
3311da177e4SLinus Torvalds 
/*
 * UDP state values.
 *
 * IP_VS_UDP_S_LAST equals the number of states listed before it.
 */
enum {
	IP_VS_UDP_S_NORMAL = 0,
	IP_VS_UDP_S_LAST,	/* sentinel, not a state */
};
3391da177e4SLinus Torvalds 
/*
 * ICMP state values.
 *
 * IP_VS_ICMP_S_LAST equals the number of states listed before it.
 */
enum {
	IP_VS_ICMP_S_NORMAL = 0,
	IP_VS_ICMP_S_LAST,	/* sentinel, not a state */
};
3471da177e4SLinus Torvalds 
/*
 * SCTP state values.
 *
 * Numbering starts at 0 and is contiguous, so IP_VS_SCTP_S_LAST equals the
 * number of states listed before it.
 */
enum ip_vs_sctp_states {
	IP_VS_SCTP_S_NONE = 0,
	IP_VS_SCTP_S_INIT1,
	IP_VS_SCTP_S_INIT,
	IP_VS_SCTP_S_COOKIE_SENT,
	IP_VS_SCTP_S_COOKIE_REPLIED,
	IP_VS_SCTP_S_COOKIE_WAIT,
	IP_VS_SCTP_S_COOKIE,
	IP_VS_SCTP_S_COOKIE_ECHOED,
	IP_VS_SCTP_S_ESTABLISHED,
	IP_VS_SCTP_S_SHUTDOWN_SENT,
	IP_VS_SCTP_S_SHUTDOWN_RECEIVED,
	IP_VS_SCTP_S_SHUTDOWN_ACK_SENT,
	IP_VS_SCTP_S_REJECTED,
	IP_VS_SCTP_S_CLOSED,
	IP_VS_SCTP_S_LAST	/* sentinel, not a state */
};
3682906f66aSVenkata Mohan Reddy 
3692906f66aSVenkata Mohan Reddy /*
3701da177e4SLinus Torvalds  *	Delta sequence info structure
3711da177e4SLinus Torvalds  *	Each ip_vs_conn has 2 (output AND input seq. changes).
3721da177e4SLinus Torvalds  *      Only used in the VS/NAT.
3731da177e4SLinus Torvalds  */
3741da177e4SLinus Torvalds struct ip_vs_seq {
3751da177e4SLinus Torvalds 	__u32			init_seq;	/* Add delta from this seq */
3761da177e4SLinus Torvalds 	__u32			delta;		/* Delta in sequence numbers */
3771da177e4SLinus Torvalds 	__u32			previous_delta;	/* Delta in sequence numbers
3781da177e4SLinus Torvalds 						   before last resized pkt */
3791da177e4SLinus Torvalds };
3801da177e4SLinus Torvalds 
381b17fc996SHans Schillstrom /*
382b17fc996SHans Schillstrom  * counters per cpu
383b17fc996SHans Schillstrom  */
384b17fc996SHans Schillstrom struct ip_vs_counters {
385b17fc996SHans Schillstrom 	__u32		conns;		/* connections scheduled */
386b17fc996SHans Schillstrom 	__u32		inpkts;		/* incoming packets */
387b17fc996SHans Schillstrom 	__u32		outpkts;	/* outgoing packets */
388b17fc996SHans Schillstrom 	__u64		inbytes;	/* incoming bytes */
389b17fc996SHans Schillstrom 	__u64		outbytes;	/* outgoing bytes */
390b17fc996SHans Schillstrom };
391b17fc996SHans Schillstrom /*
392b17fc996SHans Schillstrom  * Stats per cpu
393b17fc996SHans Schillstrom  */
394b17fc996SHans Schillstrom struct ip_vs_cpu_stats {
395b17fc996SHans Schillstrom 	struct ip_vs_counters   ustats;
396b17fc996SHans Schillstrom 	struct u64_stats_sync   syncp;
397b17fc996SHans Schillstrom };
3981da177e4SLinus Torvalds 
3991da177e4SLinus Torvalds /*
4003a14a313SSven Wegener  *	IPVS statistics objects
4011da177e4SLinus Torvalds  */
4023a14a313SSven Wegener struct ip_vs_estimator {
4033a14a313SSven Wegener 	struct list_head	list;
4043a14a313SSven Wegener 
4053a14a313SSven Wegener 	u64			last_inbytes;
4063a14a313SSven Wegener 	u64			last_outbytes;
4073a14a313SSven Wegener 	u32			last_conns;
4083a14a313SSven Wegener 	u32			last_inpkts;
4093a14a313SSven Wegener 	u32			last_outpkts;
4103a14a313SSven Wegener 
4113a14a313SSven Wegener 	u32			cps;
4123a14a313SSven Wegener 	u32			inpps;
4133a14a313SSven Wegener 	u32			outpps;
4143a14a313SSven Wegener 	u32			inbps;
4153a14a313SSven Wegener 	u32			outbps;
4163a14a313SSven Wegener };
4173a14a313SSven Wegener 
418fd2c3ef7SEric Dumazet struct ip_vs_stats {
419e9c0ce23SSven Wegener 	struct ip_vs_stats_user	ustats;		/* statistics */
420e9c0ce23SSven Wegener 	struct ip_vs_estimator	est;		/* estimator */
421b962abdcSJulian Anastasov 	struct ip_vs_cpu_stats __percpu	*cpustats;	/* per cpu counters */
4221da177e4SLinus Torvalds 	spinlock_t		lock;		/* spin lock */
42355a3d4e1SJulian Anastasov 	struct ip_vs_stats_user	ustats0;	/* reset values */
4241da177e4SLinus Torvalds };
4251da177e4SLinus Torvalds 
42614c85021SArnaldo Carvalho de Melo struct dst_entry;
42714c85021SArnaldo Carvalho de Melo struct iphdr;
4281da177e4SLinus Torvalds struct ip_vs_conn;
4291da177e4SLinus Torvalds struct ip_vs_app;
43014c85021SArnaldo Carvalho de Melo struct sk_buff;
431252c6410SHans Schillstrom struct ip_vs_proto_data;
4321da177e4SLinus Torvalds 
4331da177e4SLinus Torvalds struct ip_vs_protocol {
4341da177e4SLinus Torvalds 	struct ip_vs_protocol	*next;
4351da177e4SLinus Torvalds 	char			*name;
4362ad17defSJulian Anastasov 	u16			protocol;
4372ad17defSJulian Anastasov 	u16			num_states;
4381da177e4SLinus Torvalds 	int			dont_defrag;
4391da177e4SLinus Torvalds 
4401da177e4SLinus Torvalds 	void (*init)(struct ip_vs_protocol *pp);
4411da177e4SLinus Torvalds 
4421da177e4SLinus Torvalds 	void (*exit)(struct ip_vs_protocol *pp);
4431da177e4SLinus Torvalds 
444582b8e3eSHans Schillstrom 	int (*init_netns)(struct net *net, struct ip_vs_proto_data *pd);
445252c6410SHans Schillstrom 
446252c6410SHans Schillstrom 	void (*exit_netns)(struct net *net, struct ip_vs_proto_data *pd);
447252c6410SHans Schillstrom 
44851ef348bSJulius Volz 	int (*conn_schedule)(int af, struct sk_buff *skb,
4499330419dSHans Schillstrom 			     struct ip_vs_proto_data *pd,
450d4383f04SJesper Dangaard Brouer 			     int *verdict, struct ip_vs_conn **cpp,
451d4383f04SJesper Dangaard Brouer 			     struct ip_vs_iphdr *iph);
4521da177e4SLinus Torvalds 
4531da177e4SLinus Torvalds 	struct ip_vs_conn *
45451ef348bSJulius Volz 	(*conn_in_get)(int af,
45551ef348bSJulius Volz 		       const struct sk_buff *skb,
45651ef348bSJulius Volz 		       const struct ip_vs_iphdr *iph,
4571da177e4SLinus Torvalds 		       int inverse);
4581da177e4SLinus Torvalds 
4591da177e4SLinus Torvalds 	struct ip_vs_conn *
46051ef348bSJulius Volz 	(*conn_out_get)(int af,
46151ef348bSJulius Volz 			const struct sk_buff *skb,
46251ef348bSJulius Volz 			const struct ip_vs_iphdr *iph,
4631da177e4SLinus Torvalds 			int inverse);
4641da177e4SLinus Torvalds 
465d4383f04SJesper Dangaard Brouer 	int (*snat_handler)(struct sk_buff *skb, struct ip_vs_protocol *pp,
466d4383f04SJesper Dangaard Brouer 			    struct ip_vs_conn *cp, struct ip_vs_iphdr *iph);
4671da177e4SLinus Torvalds 
468d4383f04SJesper Dangaard Brouer 	int (*dnat_handler)(struct sk_buff *skb, struct ip_vs_protocol *pp,
469d4383f04SJesper Dangaard Brouer 			    struct ip_vs_conn *cp, struct ip_vs_iphdr *iph);
4701da177e4SLinus Torvalds 
47151ef348bSJulius Volz 	int (*csum_check)(int af, struct sk_buff *skb,
47251ef348bSJulius Volz 			  struct ip_vs_protocol *pp);
4731da177e4SLinus Torvalds 
4741da177e4SLinus Torvalds 	const char *(*state_name)(int state);
4751da177e4SLinus Torvalds 
4764a516f11SSimon Horman 	void (*state_transition)(struct ip_vs_conn *cp, int direction,
4771da177e4SLinus Torvalds 				 const struct sk_buff *skb,
4789330419dSHans Schillstrom 				 struct ip_vs_proto_data *pd);
4791da177e4SLinus Torvalds 
480ab8a5e84SHans Schillstrom 	int (*register_app)(struct net *net, struct ip_vs_app *inc);
4811da177e4SLinus Torvalds 
482ab8a5e84SHans Schillstrom 	void (*unregister_app)(struct net *net, struct ip_vs_app *inc);
4831da177e4SLinus Torvalds 
4841da177e4SLinus Torvalds 	int (*app_conn_bind)(struct ip_vs_conn *cp);
4851da177e4SLinus Torvalds 
4860d79641aSJulian Anastasov 	void (*debug_packet)(int af, struct ip_vs_protocol *pp,
4871da177e4SLinus Torvalds 			     const struct sk_buff *skb,
4881da177e4SLinus Torvalds 			     int offset,
4891da177e4SLinus Torvalds 			     const char *msg);
4901da177e4SLinus Torvalds 
4919330419dSHans Schillstrom 	void (*timeout_change)(struct ip_vs_proto_data *pd, int flags);
4921da177e4SLinus Torvalds };
4931da177e4SLinus Torvalds 
494252c6410SHans Schillstrom /*
495252c6410SHans Schillstrom  * protocol data per netns
496252c6410SHans Schillstrom  */
497252c6410SHans Schillstrom struct ip_vs_proto_data {
498252c6410SHans Schillstrom 	struct ip_vs_proto_data	*next;
499252c6410SHans Schillstrom 	struct ip_vs_protocol	*pp;
500252c6410SHans Schillstrom 	int			*timeout_table;	/* protocol timeout table */
501252c6410SHans Schillstrom 	atomic_t		appcnt;		/* counter of proto app incs. */
502252c6410SHans Schillstrom 	struct tcp_states_t	*tcp_state_table;
503252c6410SHans Schillstrom };
504252c6410SHans Schillstrom 
5055c3a0fd7SJoe Perches struct ip_vs_protocol   *ip_vs_proto_get(unsigned short proto);
5065c3a0fd7SJoe Perches struct ip_vs_proto_data *ip_vs_proto_data_get(struct net *net,
507252c6410SHans Schillstrom 					      unsigned short proto);
5081da177e4SLinus Torvalds 
509f11017ecSSimon Horman struct ip_vs_conn_param {
5106e67e586SHans Schillstrom 	struct net			*net;
511f11017ecSSimon Horman 	const union nf_inet_addr	*caddr;
512f11017ecSSimon Horman 	const union nf_inet_addr	*vaddr;
513f11017ecSSimon Horman 	__be16				cport;
514f11017ecSSimon Horman 	__be16				vport;
515f11017ecSSimon Horman 	__u16				protocol;
516f11017ecSSimon Horman 	u16				af;
51785999283SSimon Horman 
51885999283SSimon Horman 	const struct ip_vs_pe		*pe;
51985999283SSimon Horman 	char				*pe_data;
52085999283SSimon Horman 	__u8				pe_data_len;
521f11017ecSSimon Horman };
522f11017ecSSimon Horman 
5231da177e4SLinus Torvalds /*
5241da177e4SLinus Torvalds  *	IP_VS structure allocated for each dynamically scheduled connection
5251da177e4SLinus Torvalds  */
5261da177e4SLinus Torvalds struct ip_vs_conn {
527731109e7SChangli Gao 	struct hlist_node	c_list;         /* hashed list heads */
5281da177e4SLinus Torvalds 	/* Protocol, addresses and port numbers */
5296e67e586SHans Schillstrom 	__be16                  cport;
5306e67e586SHans Schillstrom 	__be16                  dport;
5311845ed0bSJulian Anastasov 	__be16                  vport;
5321845ed0bSJulian Anastasov 	u16			af;		/* address family */
533e7ade46aSJulius Volz 	union nf_inet_addr      caddr;          /* client address */
534e7ade46aSJulius Volz 	union nf_inet_addr      vaddr;          /* virtual address */
535e7ade46aSJulius Volz 	union nf_inet_addr      daddr;          /* destination address */
5363575792eSJulian Anastasov 	volatile __u32          flags;          /* status flags */
5371da177e4SLinus Torvalds 	__u16                   protocol;       /* Which protocol (TCP/UDP) */
538ba38528aSAlex Gartrell 	__u16			daf;		/* Address family of the dest */
5391845ed0bSJulian Anastasov #ifdef CONFIG_NET_NS
5401845ed0bSJulian Anastasov 	struct net              *net;           /* Name space */
5411845ed0bSJulian Anastasov #endif
5421da177e4SLinus Torvalds 
5431da177e4SLinus Torvalds 	/* counter and timer */
5441da177e4SLinus Torvalds 	atomic_t		refcnt;		/* reference count */
5451da177e4SLinus Torvalds 	struct timer_list	timer;		/* Expiration timer */
5461da177e4SLinus Torvalds 	volatile unsigned long	timeout;	/* timeout */
5471da177e4SLinus Torvalds 
5481da177e4SLinus Torvalds 	/* Flags and state transition */
5491da177e4SLinus Torvalds 	spinlock_t              lock;           /* lock for state transition */
5501da177e4SLinus Torvalds 	volatile __u16          state;          /* state info */
551efac5276SRumen G. Bogdanovski 	volatile __u16          old_state;      /* old state, to be used for
552efac5276SRumen G. Bogdanovski 						 * state transition triggerd
553efac5276SRumen G. Bogdanovski 						 * synchronization
554efac5276SRumen G. Bogdanovski 						 */
5551845ed0bSJulian Anastasov 	__u32			fwmark;		/* Fire wall mark from skb */
556749c42b6SJulian Anastasov 	unsigned long		sync_endtime;	/* jiffies + sent_retries */
5571da177e4SLinus Torvalds 
5581da177e4SLinus Torvalds 	/* Control members */
5591da177e4SLinus Torvalds 	struct ip_vs_conn       *control;       /* Master control connection */
5601da177e4SLinus Torvalds 	atomic_t                n_control;      /* Number of controlled ones */
5611da177e4SLinus Torvalds 	struct ip_vs_dest       *dest;          /* real server */
5621da177e4SLinus Torvalds 	atomic_t                in_pkts;        /* incoming packet counter */
5631da177e4SLinus Torvalds 
5641da177e4SLinus Torvalds 	/* packet transmitter for different forwarding methods.  If it
5651da177e4SLinus Torvalds 	   mangles the packet, it must return NF_DROP or better NF_STOLEN,
5661da177e4SLinus Torvalds 	   otherwise this must be changed to a sk_buff **.
567fc604767SJulian Anastasov 	   NF_ACCEPT can be returned when destination is local.
5681da177e4SLinus Torvalds 	 */
5691da177e4SLinus Torvalds 	int (*packet_xmit)(struct sk_buff *skb, struct ip_vs_conn *cp,
570d4383f04SJesper Dangaard Brouer 			   struct ip_vs_protocol *pp, struct ip_vs_iphdr *iph);
5711da177e4SLinus Torvalds 
5721da177e4SLinus Torvalds 	/* Note: we can group the following members into a structure,
5731da177e4SLinus Torvalds 	   in order to save more space, and the following members are
5741da177e4SLinus Torvalds 	   only used in VS/NAT anyway */
5751da177e4SLinus Torvalds 	struct ip_vs_app        *app;           /* bound ip_vs_app object */
5761da177e4SLinus Torvalds 	void                    *app_data;      /* Application private data */
5771da177e4SLinus Torvalds 	struct ip_vs_seq        in_seq;         /* incoming seq. struct */
5781da177e4SLinus Torvalds 	struct ip_vs_seq        out_seq;        /* outgoing seq. struct */
57985999283SSimon Horman 
580e9e5eee8SSimon Horman 	const struct ip_vs_pe	*pe;
58185999283SSimon Horman 	char			*pe_data;
58285999283SSimon Horman 	__u8			pe_data_len;
583088339a5SJulian Anastasov 
584088339a5SJulian Anastasov 	struct rcu_head		rcu_head;
5851da177e4SLinus Torvalds };
5861da177e4SLinus Torvalds 
5876e67e586SHans Schillstrom /*
5886e67e586SHans Schillstrom  *  To save some memory in conn table when name space is disabled.
5896e67e586SHans Schillstrom  */
5906e67e586SHans Schillstrom static inline struct net *ip_vs_conn_net(const struct ip_vs_conn *cp)
5916e67e586SHans Schillstrom {
5926e67e586SHans Schillstrom #ifdef CONFIG_NET_NS
5936e67e586SHans Schillstrom 	return cp->net;
5946e67e586SHans Schillstrom #else
5956e67e586SHans Schillstrom 	return &init_net;
5966e67e586SHans Schillstrom #endif
5976e67e586SHans Schillstrom }
/* Store @net in @cp->net; the body is empty without CONFIG_NET_NS. */
static inline void ip_vs_conn_net_set(struct ip_vs_conn *cp, struct net *net)
{
#if defined(CONFIG_NET_NS)
	cp->net = net;
#endif
}
6046e67e586SHans Schillstrom 
/*
 * Non-zero when @cp->net equals @net.  Without CONFIG_NET_NS the result
 * is always 1 and neither argument is examined.
 */
static inline int ip_vs_conn_net_eq(const struct ip_vs_conn *cp,
				    struct net *net)
{
#ifndef CONFIG_NET_NS
	return 1;
#else
	return net == cp->net;
#endif
}
6141da177e4SLinus Torvalds 
6151da177e4SLinus Torvalds /*
616c860c6b1SJulius Volz  *	Extended internal versions of struct ip_vs_service_user and
617c860c6b1SJulius Volz  *	ip_vs_dest_user for IPv6 support.
618c860c6b1SJulius Volz  *
619c860c6b1SJulius Volz  *	We need these to conveniently pass around service and destination
620c860c6b1SJulius Volz  *	options, but unfortunately, we also need to keep the old definitions to
621c860c6b1SJulius Volz  *	maintain userspace backwards compatibility for the setsockopt interface.
622c860c6b1SJulius Volz  */
623c860c6b1SJulius Volz struct ip_vs_service_user_kern {
624c860c6b1SJulius Volz 	/* virtual service addresses */
625c860c6b1SJulius Volz 	u16			af;		/* address family */
626c860c6b1SJulius Volz 	u16			protocol;
627c860c6b1SJulius Volz 	union nf_inet_addr	addr;		/* virtual ip address */
6280a925864SJulian Anastasov 	__be16			port;		/* big-endian (__be16) port */
629c860c6b1SJulius Volz 	u32			fwmark;		/* firewall mark of service */
630c860c6b1SJulius Volz 
631c860c6b1SJulius Volz 	/* virtual service options */
632c860c6b1SJulius Volz 	char			*sched_name;	/* presumably the scheduler name; confirm */
6330d1e71b0SSimon Horman 	char			*pe_name;	/* presumably the persistence engine name; confirm */
63495c96174SEric Dumazet 	unsigned int		flags;		/* virtual service flags */
63595c96174SEric Dumazet 	unsigned int		timeout;	/* persistent timeout in sec */
6360a925864SJulian Anastasov 	__be32			netmask;	/* persistent netmask or plen */
637c860c6b1SJulius Volz };
638c860c6b1SJulius Volz 
639c860c6b1SJulius Volz 
/*
 *	Internal extended version of struct ip_vs_dest_user: destination
 *	(real server) address and options.
 */
640c860c6b1SJulius Volz struct ip_vs_dest_user_kern {
641c860c6b1SJulius Volz 	/* destination server address */
642c860c6b1SJulius Volz 	union nf_inet_addr	addr;
6430a925864SJulian Anastasov 	__be16			port;		/* big-endian (__be16) port */
644c860c6b1SJulius Volz 
645c860c6b1SJulius Volz 	/* real server options */
64695c96174SEric Dumazet 	unsigned int		conn_flags;	/* connection flags */
647c860c6b1SJulius Volz 	int			weight;		/* destination weight */
648c860c6b1SJulius Volz 
649c860c6b1SJulius Volz 	/* thresholds for active connections */
650c860c6b1SJulius Volz 	u32			u_threshold;	/* upper threshold */
651c860c6b1SJulius Volz 	u32			l_threshold;	/* lower threshold */
6526cff339bSAlex Gartrell 
6536cff339bSAlex Gartrell 	/* Address family of addr */
6546cff339bSAlex Gartrell 	u16			af;
655c860c6b1SJulius Volz };
656c860c6b1SJulius Volz 
657c860c6b1SJulius Volz 
658c860c6b1SJulius Volz /*
6591da177e4SLinus Torvalds  *	The information about the virtual service offered to the net
6601da177e4SLinus Torvalds  *	and the forwarding entries
6611da177e4SLinus Torvalds  *
 *	A service carries two hlist nodes (s_list for the normal table,
 *	f_list for the fwmark-based table), the list of its destinations,
 *	and __rcu pointers to its scheduler and persistence engine.
 */
6621da177e4SLinus Torvalds struct ip_vs_service {
663ceec4c38SJulian Anastasov 	struct hlist_node	s_list;   /* for normal service table */
664ceec4c38SJulian Anastasov 	struct hlist_node	f_list;   /* for fwmark-based service table */
6651da177e4SLinus Torvalds 	atomic_t		refcnt;   /* reference counter */
6661da177e4SLinus Torvalds 
667e7ade46aSJulius Volz 	u16			af;       /* address family */
6681da177e4SLinus Torvalds 	__u16			protocol; /* which protocol (TCP/UDP) */
669e7ade46aSJulius Volz 	union nf_inet_addr	addr;	  /* IP address for virtual service */
670014d730dSAl Viro 	__be16			port;	  /* port number for the service */
6711da177e4SLinus Torvalds 	__u32                   fwmark;   /* firewall mark of the service */
67295c96174SEric Dumazet 	unsigned int		flags;	  /* service status flags */
67395c96174SEric Dumazet 	unsigned int		timeout;  /* persistent timeout in ticks */
6740a925864SJulian Anastasov 	__be32			netmask;  /* grouping granularity, mask/plen */
675fc723250SHans Schillstrom 	struct net		*net;	  /* net name space ptr */
6761da177e4SLinus Torvalds 
6771da177e4SLinus Torvalds 	struct list_head	destinations;  /* real server d-linked list */
6781da177e4SLinus Torvalds 	__u32			num_dests;     /* number of servers */
6791da177e4SLinus Torvalds 	struct ip_vs_stats      stats;         /* statistics for the service */
6801da177e4SLinus Torvalds 
6811da177e4SLinus Torvalds 	/* for scheduling */
682ceec4c38SJulian Anastasov 	struct ip_vs_scheduler __rcu *scheduler; /* bound scheduler object */
683ba3a3ce1SJulian Anastasov 	spinlock_t		sched_lock;    /* lock sched_data */
6841da177e4SLinus Torvalds 	void			*sched_data;   /* scheduler application data */
68585999283SSimon Horman 
68685999283SSimon Horman 	/* alternate persistence engine */
687ceec4c38SJulian Anastasov 	struct ip_vs_pe __rcu	*pe;
688ceec4c38SJulian Anastasov 
	/* NOTE(review): presumably used to defer release via RCU -- confirm */
689ceec4c38SJulian Anastasov 	struct rcu_head		rcu_head;
6901da177e4SLinus Torvalds };
6911da177e4SLinus Torvalds 
692026ace06SJulian Anastasov /* Information for cached dst */
693026ace06SJulian Anastasov struct ip_vs_dest_dst {
694026ace06SJulian Anastasov 	struct dst_entry	*dst_cache;	/* destination cache entry */
695026ace06SJulian Anastasov 	u32			dst_cookie;
696026ace06SJulian Anastasov 	union nf_inet_addr	dst_saddr;
697026ace06SJulian Anastasov 	struct rcu_head		rcu_head;
698026ace06SJulian Anastasov };
6991da177e4SLinus Torvalds 
7001da177e4SLinus Torvalds /*
7011da177e4SLinus Torvalds  *	The real server destination forwarding entry
7021da177e4SLinus Torvalds  *	with ip address, port number, and so on.
7031da177e4SLinus Torvalds  *
 *	Besides its own address/port the entry keeps a copy of the
 *	virtual service identity (protocol, vaddr, vport, vfwmark) next
 *	to the __rcu pointer to the service itself.
 */
7041da177e4SLinus Torvalds struct ip_vs_dest {
7051da177e4SLinus Torvalds 	struct list_head	n_list;   /* for the dests in the service */
706276472eaSJulian Anastasov 	struct hlist_node	d_list;   /* for table with all the dests */
7071da177e4SLinus Torvalds 
708e7ade46aSJulius Volz 	u16			af;		/* address family */
709014d730dSAl Viro 	__be16			port;		/* port number of the server */
710f2431e6eSHans Schillstrom 	union nf_inet_addr	addr;		/* IP address of the server */
71195c96174SEric Dumazet 	volatile unsigned int	flags;		/* dest status flags */
7121da177e4SLinus Torvalds 	atomic_t		conn_flags;	/* flags to copy to conn */
7131da177e4SLinus Torvalds 	atomic_t		weight;		/* server weight */
7141da177e4SLinus Torvalds 
7151da177e4SLinus Torvalds 	atomic_t		refcnt;		/* reference counter */
7161da177e4SLinus Torvalds 	struct ip_vs_stats      stats;          /* statistics */
717bcbde4c0SJulian Anastasov 	unsigned long		idle_start;	/* start time, jiffies */
7181da177e4SLinus Torvalds 
7191da177e4SLinus Torvalds 	/* connection counters and thresholds */
7201da177e4SLinus Torvalds 	atomic_t		activeconns;	/* active connections */
7211da177e4SLinus Torvalds 	atomic_t		inactconns;	/* inactive connections */
7221da177e4SLinus Torvalds 	atomic_t		persistconns;	/* persistent connections */
7231da177e4SLinus Torvalds 	__u32			u_threshold;	/* upper threshold */
7241da177e4SLinus Torvalds 	__u32			l_threshold;	/* lower threshold */
7251da177e4SLinus Torvalds 
7261da177e4SLinus Torvalds 	/* for destination cache */
7271da177e4SLinus Torvalds 	spinlock_t		dst_lock;	/* lock of dst_cache */
728026ace06SJulian Anastasov 	struct ip_vs_dest_dst __rcu *dest_dst;	/* cached dst info */
7291da177e4SLinus Torvalds 
7301da177e4SLinus Torvalds 	/* for virtual service */
731bcbde4c0SJulian Anastasov 	struct ip_vs_service __rcu *svc;	/* service it belongs to */
7321da177e4SLinus Torvalds 	__u16			protocol;	/* which protocol (TCP/UDP) */
733014d730dSAl Viro 	__be16			vport;		/* virtual port number */
734f2431e6eSHans Schillstrom 	union nf_inet_addr	vaddr;		/* virtual IP address */
7351da177e4SLinus Torvalds 	__u32			vfwmark;	/* firewall mark of service */
736276472eaSJulian Anastasov 
737578bc3efSJulian Anastasov 	struct list_head	t_list;		/* in dest_trash */
738276472eaSJulian Anastasov 	unsigned int		in_rs_table:1;	/* we are in rs_table */
7391da177e4SLinus Torvalds };
7401da177e4SLinus Torvalds 
7411da177e4SLinus Torvalds 
7421da177e4SLinus Torvalds /*
7431da177e4SLinus Torvalds  *	The scheduler object
 *
 *	Identification (name, refcnt, module) followed by the callback
 *	table.  A service refers to its scheduler through the __rcu
 *	scheduler pointer in struct ip_vs_service.
7441da177e4SLinus Torvalds  */
7451da177e4SLinus Torvalds struct ip_vs_scheduler {
7461da177e4SLinus Torvalds 	struct list_head	n_list;		/* d-linked list head */
7471da177e4SLinus Torvalds 	char			*name;		/* scheduler name */
7481da177e4SLinus Torvalds 	atomic_t		refcnt;		/* reference counter */
7491da177e4SLinus Torvalds 	struct module		*module;	/* THIS_MODULE/NULL */
7501da177e4SLinus Torvalds 
7511da177e4SLinus Torvalds 	/* scheduler initializing service */
7521da177e4SLinus Torvalds 	int (*init_service)(struct ip_vs_service *svc);
7531da177e4SLinus Torvalds 	/* scheduling service finish */
754ed3ffc4eSJulian Anastasov 	void (*done_service)(struct ip_vs_service *svc);
7556b6df466SJulian Anastasov 	/* dest is linked */
7566b6df466SJulian Anastasov 	int (*add_dest)(struct ip_vs_service *svc, struct ip_vs_dest *dest);
7576b6df466SJulian Anastasov 	/* dest is unlinked */
7586b6df466SJulian Anastasov 	int (*del_dest)(struct ip_vs_service *svc, struct ip_vs_dest *dest);
7596b6df466SJulian Anastasov 	/* dest is updated */
7606b6df466SJulian Anastasov 	int (*upd_dest)(struct ip_vs_service *svc, struct ip_vs_dest *dest);
7611da177e4SLinus Torvalds 
7621da177e4SLinus Torvalds 	/* selecting a server from the given service */
7631da177e4SLinus Torvalds 	struct ip_vs_dest* (*schedule)(struct ip_vs_service *svc,
764bba54de5SJulian Anastasov 				       const struct sk_buff *skb,
765bba54de5SJulian Anastasov 				       struct ip_vs_iphdr *iph);
7661da177e4SLinus Torvalds };
7671da177e4SLinus Torvalds 
76885999283SSimon Horman /* The persistence engine object */
76985999283SSimon Horman struct ip_vs_pe {
77085999283SSimon Horman 	struct list_head	n_list;		/* d-linked list head */
77185999283SSimon Horman 	char			*name;		/* persistence engine name */
77285999283SSimon Horman 	atomic_t		refcnt;		/* reference counter */
77385999283SSimon Horman 	struct module		*module;	/* THIS_MODULE/NULL */
77485999283SSimon Horman 
77585999283SSimon Horman 	/* get the connection template, if any */
77685999283SSimon Horman 	int (*fill_param)(struct ip_vs_conn_param *p, struct sk_buff *skb);
	/* NOTE(review): presumably tests whether template ct matches p -- confirm */
77785999283SSimon Horman 	bool (*ct_match)(const struct ip_vs_conn_param *p,
77885999283SSimon Horman 			 struct ip_vs_conn *ct);
	/* NOTE(review): presumably hashes p seeded with initval -- confirm */
77985999283SSimon Horman 	u32 (*hashkey_raw)(const struct ip_vs_conn_param *p, u32 initval,
78085999283SSimon Horman 			   bool inverse);
	/* NOTE(review): presumably formats cp's pe data into buf -- confirm */
781a3c918acSSimon Horman 	int (*show_pe_data)(const struct ip_vs_conn *cp, char *buf);
78285999283SSimon Horman };
7831da177e4SLinus Torvalds 
7841da177e4SLinus Torvalds /*
7851da177e4SLinus Torvalds  *	The application module object (a.k.a. app incarnation)
 *
 *	The same structure describes an application and its incarnations:
 *	incs_list heads the list of incarnations, while the members under
 *	"members for application incarnations" belong to an incarnation
 *	and include the app pointer back to the real application.
7861da177e4SLinus Torvalds  */
787fd2c3ef7SEric Dumazet struct ip_vs_app {
7881da177e4SLinus Torvalds 	struct list_head	a_list;		/* member in app list */
7891da177e4SLinus Torvalds 	int			type;		/* IP_VS_APP_TYPE_xxx */
7901da177e4SLinus Torvalds 	char			*name;		/* application module name */
7911da177e4SLinus Torvalds 	__u16			protocol;
7921da177e4SLinus Torvalds 	struct module		*module;	/* THIS_MODULE/NULL */
7931da177e4SLinus Torvalds 	struct list_head	incs_list;	/* list of incarnations */
7941da177e4SLinus Torvalds 
7951da177e4SLinus Torvalds 	/* members for application incarnations */
7961da177e4SLinus Torvalds 	struct list_head	p_list;		/* member in proto app list */
7971da177e4SLinus Torvalds 	struct ip_vs_app	*app;		/* its real application */
798014d730dSAl Viro 	__be16			port;		/* port number in net order */
7991da177e4SLinus Torvalds 	atomic_t		usecnt;		/* usage counter */
800363c97d7SJulian Anastasov 	struct rcu_head		rcu_head;
8011da177e4SLinus Torvalds 
8028b27b10fSJulian Anastasov 	/*
8038b27b10fSJulian Anastasov 	 * output hook: Process packet in inout direction, diff set for TCP.
8048b27b10fSJulian Anastasov 	 * Return: 0=Error, 1=Payload Not Mangled/Mangled but checksum is ok,
8058b27b10fSJulian Anastasov 	 *	   2=Mangled but checksum was not updated
8068b27b10fSJulian Anastasov 	 */
8071da177e4SLinus Torvalds 	int (*pkt_out)(struct ip_vs_app *, struct ip_vs_conn *,
8083db05feaSHerbert Xu 		       struct sk_buff *, int *diff);
8091da177e4SLinus Torvalds 
8108b27b10fSJulian Anastasov 	/*
8118b27b10fSJulian Anastasov 	 * input hook: Process packet in outin direction, diff set for TCP.
8128b27b10fSJulian Anastasov 	 * Return: 0=Error, 1=Payload Not Mangled/Mangled but checksum is ok,
8138b27b10fSJulian Anastasov 	 *	   2=Mangled but checksum was not updated
8148b27b10fSJulian Anastasov 	 */
8151da177e4SLinus Torvalds 	int (*pkt_in)(struct ip_vs_app *, struct ip_vs_conn *,
8163db05feaSHerbert Xu 		      struct sk_buff *, int *diff);
8171da177e4SLinus Torvalds 
8181da177e4SLinus Torvalds 	/* ip_vs_app initializer */
8191da177e4SLinus Torvalds 	int (*init_conn)(struct ip_vs_app *, struct ip_vs_conn *);
8201da177e4SLinus Torvalds 
8211da177e4SLinus Torvalds 	/* ip_vs_app finish */
8221da177e4SLinus Torvalds 	int (*done_conn)(struct ip_vs_app *, struct ip_vs_conn *);
8231da177e4SLinus Torvalds 
8241da177e4SLinus Torvalds 
8251da177e4SLinus Torvalds 	/* not used now */
	/* NOTE(review): unclear how many of the members below the marker above covers -- confirm */
8261da177e4SLinus Torvalds 	int (*bind_conn)(struct ip_vs_app *, struct ip_vs_conn *,
8271da177e4SLinus Torvalds 			 struct ip_vs_protocol *);
8281da177e4SLinus Torvalds 
8291da177e4SLinus Torvalds 	void (*unbind_conn)(struct ip_vs_app *, struct ip_vs_conn *);
8301da177e4SLinus Torvalds 
8311da177e4SLinus Torvalds 	int *			timeout_table;
8321da177e4SLinus Torvalds 	int *			timeouts;
8331da177e4SLinus Torvalds 	int			timeouts_size;
8341da177e4SLinus Torvalds 
8351da177e4SLinus Torvalds 	int (*conn_schedule)(struct sk_buff *skb, struct ip_vs_app *app,
8361da177e4SLinus Torvalds 			     int *verdict, struct ip_vs_conn **cpp);
8371da177e4SLinus Torvalds 
8381da177e4SLinus Torvalds 	struct ip_vs_conn *
8391da177e4SLinus Torvalds 	(*conn_in_get)(const struct sk_buff *skb, struct ip_vs_app *app,
840d4383f04SJesper Dangaard Brouer 		       const struct iphdr *iph, int inverse);
8411da177e4SLinus Torvalds 
8421da177e4SLinus Torvalds 	struct ip_vs_conn *
8431da177e4SLinus Torvalds 	(*conn_out_get)(const struct sk_buff *skb, struct ip_vs_app *app,
844d4383f04SJesper Dangaard Brouer 			const struct iphdr *iph, int inverse);
8451da177e4SLinus Torvalds 
8461da177e4SLinus Torvalds 	int (*state_transition)(struct ip_vs_conn *cp, int direction,
8471da177e4SLinus Torvalds 				const struct sk_buff *skb,
8481da177e4SLinus Torvalds 				struct ip_vs_app *app);
8491da177e4SLinus Torvalds 
8501da177e4SLinus Torvalds 	void (*timeout_change)(struct ip_vs_app *app, int flags);
8511da177e4SLinus Torvalds };
8521da177e4SLinus Torvalds 
853f73181c8SPablo Neira Ayuso struct ipvs_master_sync_state {
854f73181c8SPablo Neira Ayuso 	struct list_head	sync_queue;
855f73181c8SPablo Neira Ayuso 	struct ip_vs_sync_buff	*sync_buff;
85607995674SZhang Yanfei 	unsigned long		sync_queue_len;
857f73181c8SPablo Neira Ayuso 	unsigned int		sync_queue_delay;
858f73181c8SPablo Neira Ayuso 	struct task_struct	*master_thread;
859f73181c8SPablo Neira Ayuso 	struct delayed_work	master_wakeup_work;
860f73181c8SPablo Neira Ayuso 	struct netns_ipvs	*ipvs;
861f73181c8SPablo Neira Ayuso };
862f73181c8SPablo Neira Ayuso 
863578bc3efSJulian Anastasov /* How much time to keep dests in trash */
864578bc3efSJulian Anastasov #define IP_VS_DEST_TRASH_PERIOD		(120 * HZ)
865578bc3efSJulian Anastasov 
8662553d064SJulian Anastasov /* IPVS in network namespace */
8672553d064SJulian Anastasov struct netns_ipvs {
8682553d064SJulian Anastasov 	int			gen;		/* Generation */
8697a4f0761SHans Schillstrom 	int			enable;		/* enable like nf_hooks do */
8702553d064SJulian Anastasov 	/*
8712553d064SJulian Anastasov 	 *	Hash table: for real service lookups
8722553d064SJulian Anastasov 	 */
8732553d064SJulian Anastasov 	#define IP_VS_RTAB_BITS 4
8742553d064SJulian Anastasov 	#define IP_VS_RTAB_SIZE (1 << IP_VS_RTAB_BITS)
8752553d064SJulian Anastasov 	#define IP_VS_RTAB_MASK (IP_VS_RTAB_SIZE - 1)
8762553d064SJulian Anastasov 
877276472eaSJulian Anastasov 	struct hlist_head	rs_table[IP_VS_RTAB_SIZE];
8782553d064SJulian Anastasov 	/* ip_vs_app */
8792553d064SJulian Anastasov 	struct list_head	app_list;
8802553d064SJulian Anastasov 	/* ip_vs_proto */
8812553d064SJulian Anastasov 	#define IP_VS_PROTO_TAB_SIZE	32	/* must be power of 2 */
8822553d064SJulian Anastasov 	struct ip_vs_proto_data *proto_data_table[IP_VS_PROTO_TAB_SIZE];
8832553d064SJulian Anastasov 	/* ip_vs_proto_tcp */
8842553d064SJulian Anastasov #ifdef CONFIG_IP_VS_PROTO_TCP
8852553d064SJulian Anastasov 	#define	TCP_APP_TAB_BITS	4
8862553d064SJulian Anastasov 	#define	TCP_APP_TAB_SIZE	(1 << TCP_APP_TAB_BITS)
8872553d064SJulian Anastasov 	#define	TCP_APP_TAB_MASK	(TCP_APP_TAB_SIZE - 1)
8882553d064SJulian Anastasov 	struct list_head	tcp_apps[TCP_APP_TAB_SIZE];
8892553d064SJulian Anastasov #endif
8902553d064SJulian Anastasov 	/* ip_vs_proto_udp */
8912553d064SJulian Anastasov #ifdef CONFIG_IP_VS_PROTO_UDP
8922553d064SJulian Anastasov 	#define	UDP_APP_TAB_BITS	4
8932553d064SJulian Anastasov 	#define	UDP_APP_TAB_SIZE	(1 << UDP_APP_TAB_BITS)
8942553d064SJulian Anastasov 	#define	UDP_APP_TAB_MASK	(UDP_APP_TAB_SIZE - 1)
8952553d064SJulian Anastasov 	struct list_head	udp_apps[UDP_APP_TAB_SIZE];
8962553d064SJulian Anastasov #endif
8972553d064SJulian Anastasov 	/* ip_vs_proto_sctp */
8982553d064SJulian Anastasov #ifdef CONFIG_IP_VS_PROTO_SCTP
8992553d064SJulian Anastasov 	#define SCTP_APP_TAB_BITS	4
9002553d064SJulian Anastasov 	#define SCTP_APP_TAB_SIZE	(1 << SCTP_APP_TAB_BITS)
9012553d064SJulian Anastasov 	#define SCTP_APP_TAB_MASK	(SCTP_APP_TAB_SIZE - 1)
9022553d064SJulian Anastasov 	/* Hash table for SCTP application incarnations	 */
9032553d064SJulian Anastasov 	struct list_head	sctp_apps[SCTP_APP_TAB_SIZE];
9042553d064SJulian Anastasov #endif
9052553d064SJulian Anastasov 	/* ip_vs_conn */
9062553d064SJulian Anastasov 	atomic_t		conn_count;      /*  connection counter */
9072553d064SJulian Anastasov 
9082553d064SJulian Anastasov 	/* ip_vs_ctl */
9092a0751afSJulian Anastasov 	struct ip_vs_stats		tot_stats;  /* Statistics & est. */
9102553d064SJulian Anastasov 
9112553d064SJulian Anastasov 	int			num_services;    /* no of virtual services */
912f2247fbdSSimon Horman 
9132553d064SJulian Anastasov 	/* Trash for destinations */
9142553d064SJulian Anastasov 	struct list_head	dest_trash;
915578bc3efSJulian Anastasov 	spinlock_t		dest_trash_lock;
916578bc3efSJulian Anastasov 	struct timer_list	dest_trash_timer; /* expiration timer */
9172553d064SJulian Anastasov 	/* Service counters */
9182553d064SJulian Anastasov 	atomic_t		ftpsvc_counter;
9192553d064SJulian Anastasov 	atomic_t		nullsvc_counter;
9202553d064SJulian Anastasov 
921f2247fbdSSimon Horman #ifdef CONFIG_SYSCTL
922f2247fbdSSimon Horman 	/* 1/rate drop and drop-entry variables */
923f2247fbdSSimon Horman 	struct delayed_work	defense_work;   /* Work handler */
924f2247fbdSSimon Horman 	int			drop_rate;
925f2247fbdSSimon Horman 	int			drop_counter;
926f2247fbdSSimon Horman 	atomic_t		dropentry;
927f2247fbdSSimon Horman 	/* locks in ctl.c */
928f2247fbdSSimon Horman 	spinlock_t		dropentry_lock;  /* drop entry handling */
929f2247fbdSSimon Horman 	spinlock_t		droppacket_lock; /* drop packet handling */
930f2247fbdSSimon Horman 	spinlock_t		securetcp_lock;  /* state and timeout tables */
931f2247fbdSSimon Horman 
9322553d064SJulian Anastasov 	/* sys-ctl struct */
9332553d064SJulian Anastasov 	struct ctl_table_header	*sysctl_hdr;
9342553d064SJulian Anastasov 	struct ctl_table	*sysctl_tbl;
935f2247fbdSSimon Horman #endif
936f2247fbdSSimon Horman 
9372553d064SJulian Anastasov 	/* sysctl variables */
9382553d064SJulian Anastasov 	int			sysctl_amemthresh;
9392553d064SJulian Anastasov 	int			sysctl_am_droprate;
9402553d064SJulian Anastasov 	int			sysctl_drop_entry;
9412553d064SJulian Anastasov 	int			sysctl_drop_packet;
9422553d064SJulian Anastasov 	int			sysctl_secure_tcp;
9432553d064SJulian Anastasov #ifdef CONFIG_IP_VS_NFCT
9442553d064SJulian Anastasov 	int			sysctl_conntrack;
9452553d064SJulian Anastasov #endif
9462553d064SJulian Anastasov 	int			sysctl_snat_reroute;
9472553d064SJulian Anastasov 	int			sysctl_sync_ver;
948f73181c8SPablo Neira Ayuso 	int			sysctl_sync_ports;
9494d0c875dSJulian Anastasov 	int			sysctl_sync_persist_mode;
95007995674SZhang Yanfei 	unsigned long		sysctl_sync_qlen_max;
9511c003b15SPablo Neira Ayuso 	int			sysctl_sync_sock_size;
9522553d064SJulian Anastasov 	int			sysctl_cache_bypass;
9532553d064SJulian Anastasov 	int			sysctl_expire_nodest_conn;
954c6c96c18SAlexander Frolkin 	int			sysctl_sloppy_tcp;
955c6c96c18SAlexander Frolkin 	int			sysctl_sloppy_sctp;
9562553d064SJulian Anastasov 	int			sysctl_expire_quiescent_template;
9572553d064SJulian Anastasov 	int			sysctl_sync_threshold[2];
958749c42b6SJulian Anastasov 	unsigned int		sysctl_sync_refresh_period;
959749c42b6SJulian Anastasov 	int			sysctl_sync_retries;
9602553d064SJulian Anastasov 	int			sysctl_nat_icmp_send;
9613654e611SJulian Anastasov 	int			sysctl_pmtu_disc;
9620c12582fSJulian Anastasov 	int			sysctl_backup_only;
9632553d064SJulian Anastasov 
9642553d064SJulian Anastasov 	/* ip_vs_lblc */
9652553d064SJulian Anastasov 	int			sysctl_lblc_expiration;
9662553d064SJulian Anastasov 	struct ctl_table_header	*lblc_ctl_header;
9672553d064SJulian Anastasov 	struct ctl_table	*lblc_ctl_table;
9682553d064SJulian Anastasov 	/* ip_vs_lblcr */
9692553d064SJulian Anastasov 	int			sysctl_lblcr_expiration;
9702553d064SJulian Anastasov 	struct ctl_table_header	*lblcr_ctl_header;
9712553d064SJulian Anastasov 	struct ctl_table	*lblcr_ctl_table;
9722553d064SJulian Anastasov 	/* ip_vs_est */
9732553d064SJulian Anastasov 	struct list_head	est_list;	/* estimator list */
9742553d064SJulian Anastasov 	spinlock_t		est_lock;
9752553d064SJulian Anastasov 	struct timer_list	est_timer;	/* Estimation timer */
9762553d064SJulian Anastasov 	/* ip_vs_sync */
9772553d064SJulian Anastasov 	spinlock_t		sync_lock;
978f73181c8SPablo Neira Ayuso 	struct ipvs_master_sync_state *ms;
9792553d064SJulian Anastasov 	spinlock_t		sync_buff_lock;
980f73181c8SPablo Neira Ayuso 	struct task_struct	**backup_threads;
981f73181c8SPablo Neira Ayuso 	int			threads_mask;
9822553d064SJulian Anastasov 	int			send_mesg_maxlen;
9832553d064SJulian Anastasov 	int			recv_mesg_maxlen;
9842553d064SJulian Anastasov 	volatile int		sync_state;
9852553d064SJulian Anastasov 	volatile int		master_syncid;
9862553d064SJulian Anastasov 	volatile int		backup_syncid;
987ae1d48b2SHans Schillstrom 	struct mutex		sync_mutex;
9882553d064SJulian Anastasov 	/* multicast interface name */
9892553d064SJulian Anastasov 	char			master_mcast_ifn[IP_VS_IFNAME_MAXLEN];
9902553d064SJulian Anastasov 	char			backup_mcast_ifn[IP_VS_IFNAME_MAXLEN];
9912553d064SJulian Anastasov 	/* net name space ptr */
9922553d064SJulian Anastasov 	struct net		*net;            /* Needed by timer routines */
993*391f503dSAlex Gartrell 	/* Number of heterogeneous destinations, needed because
994*391f503dSAlex Gartrell 	 * heterogeneous are not supported when synchronization is
995*391f503dSAlex Gartrell 	 * enabled */
996*391f503dSAlex Gartrell 	unsigned int		mixed_address_family_dests;
9972553d064SJulian Anastasov };
9981da177e4SLinus Torvalds 
/*
 * Compile-time defaults.  The DEFAULT_* values (and IPVS_SYNC_QLEN_MAX)
 * are what the sysctl_*() helpers return when CONFIG_SYSCTL is not set.
 */
99959e0350eSSimon Horman #define DEFAULT_SYNC_THRESHOLD	3
100059e0350eSSimon Horman #define DEFAULT_SYNC_PERIOD	50
10017532e8d4SSimon Horman #define DEFAULT_SYNC_VER	1
1002c6c96c18SAlexander Frolkin #define DEFAULT_SLOPPY_TCP	0
1003c6c96c18SAlexander Frolkin #define DEFAULT_SLOPPY_SCTP	0
1004749c42b6SJulian Anastasov #define DEFAULT_SYNC_REFRESH_PERIOD	(0U * HZ)
1005749c42b6SJulian Anastasov #define DEFAULT_SYNC_RETRIES		0
/*
 * Sync tuning constants.  The HZ-based ones are in jiffies: HZ / 50 is
 * 1/50 second, HZ is one second, HZ * 2 is two seconds.
 * IPVS_SYNC_QLEN_MAX works out to 32 and IPVS_SYNC_PORTS_MAX to 64.
 */
10061c003b15SPablo Neira Ayuso #define IPVS_SYNC_WAKEUP_RATE	8
10071c003b15SPablo Neira Ayuso #define IPVS_SYNC_QLEN_MAX	(IPVS_SYNC_WAKEUP_RATE * 4)
10081c003b15SPablo Neira Ayuso #define IPVS_SYNC_SEND_DELAY	(HZ / 50)
10091c003b15SPablo Neira Ayuso #define IPVS_SYNC_CHECK_PERIOD	HZ
1010749c42b6SJulian Anastasov #define IPVS_SYNC_FLUSH_TIME	(HZ * 2)
1011f73181c8SPablo Neira Ayuso #define IPVS_SYNC_PORTS_MAX	(1 << 6)
101259e0350eSSimon Horman 
101359e0350eSSimon Horman #ifdef CONFIG_SYSCTL
101459e0350eSSimon Horman 
/* CONFIG_SYSCTL: returns element 0 of ipvs->sysctl_sync_threshold. */
101559e0350eSSimon Horman static inline int sysctl_sync_threshold(struct netns_ipvs *ipvs)
101659e0350eSSimon Horman {
101759e0350eSSimon Horman 	return ipvs->sysctl_sync_threshold[0];
101859e0350eSSimon Horman }
101959e0350eSSimon Horman 
/*
 * CONFIG_SYSCTL: returns element 1 of ipvs->sysctl_sync_threshold,
 * read through ACCESS_ONCE().
 */
102059e0350eSSimon Horman static inline int sysctl_sync_period(struct netns_ipvs *ipvs)
102159e0350eSSimon Horman {
1022749c42b6SJulian Anastasov 	return ACCESS_ONCE(ipvs->sysctl_sync_threshold[1]);
1023749c42b6SJulian Anastasov }
1024749c42b6SJulian Anastasov 
/* CONFIG_SYSCTL: returns ipvs->sysctl_sync_refresh_period, read through ACCESS_ONCE(). */
1025749c42b6SJulian Anastasov static inline unsigned int sysctl_sync_refresh_period(struct netns_ipvs *ipvs)
1026749c42b6SJulian Anastasov {
1027749c42b6SJulian Anastasov 	return ACCESS_ONCE(ipvs->sysctl_sync_refresh_period);
1028749c42b6SJulian Anastasov }
1029749c42b6SJulian Anastasov 
/* CONFIG_SYSCTL: returns ipvs->sysctl_sync_retries. */
1030749c42b6SJulian Anastasov static inline int sysctl_sync_retries(struct netns_ipvs *ipvs)
1031749c42b6SJulian Anastasov {
1032749c42b6SJulian Anastasov 	return ipvs->sysctl_sync_retries;
103359e0350eSSimon Horman }
103459e0350eSSimon Horman 
/* CONFIG_SYSCTL: returns ipvs->sysctl_sync_ver. */
10357532e8d4SSimon Horman static inline int sysctl_sync_ver(struct netns_ipvs *ipvs)
10367532e8d4SSimon Horman {
10377532e8d4SSimon Horman 	return ipvs->sysctl_sync_ver;
10387532e8d4SSimon Horman }
10397532e8d4SSimon Horman 
/* CONFIG_SYSCTL: returns ipvs->sysctl_sloppy_tcp. */
1040c6c96c18SAlexander Frolkin static inline int sysctl_sloppy_tcp(struct netns_ipvs *ipvs)
1041c6c96c18SAlexander Frolkin {
1042c6c96c18SAlexander Frolkin 	return ipvs->sysctl_sloppy_tcp;
1043c6c96c18SAlexander Frolkin }
1044c6c96c18SAlexander Frolkin 
/* CONFIG_SYSCTL: returns ipvs->sysctl_sloppy_sctp. */
1045c6c96c18SAlexander Frolkin static inline int sysctl_sloppy_sctp(struct netns_ipvs *ipvs)
1046c6c96c18SAlexander Frolkin {
1047c6c96c18SAlexander Frolkin 	return ipvs->sysctl_sloppy_sctp;
1048c6c96c18SAlexander Frolkin }
1049c6c96c18SAlexander Frolkin 
/* CONFIG_SYSCTL: returns ipvs->sysctl_sync_ports, read through ACCESS_ONCE(). */
1050f73181c8SPablo Neira Ayuso static inline int sysctl_sync_ports(struct netns_ipvs *ipvs)
1051f73181c8SPablo Neira Ayuso {
1052f73181c8SPablo Neira Ayuso 	return ACCESS_ONCE(ipvs->sysctl_sync_ports);
1053f73181c8SPablo Neira Ayuso }
1054f73181c8SPablo Neira Ayuso 
/* CONFIG_SYSCTL: returns ipvs->sysctl_sync_persist_mode. */
10554d0c875dSJulian Anastasov static inline int sysctl_sync_persist_mode(struct netns_ipvs *ipvs)
10564d0c875dSJulian Anastasov {
10574d0c875dSJulian Anastasov 	return ipvs->sysctl_sync_persist_mode;
10584d0c875dSJulian Anastasov }
10594d0c875dSJulian Anastasov 
/* CONFIG_SYSCTL: returns ipvs->sysctl_sync_qlen_max (unsigned long). */
106007995674SZhang Yanfei static inline unsigned long sysctl_sync_qlen_max(struct netns_ipvs *ipvs)
10611c003b15SPablo Neira Ayuso {
10621c003b15SPablo Neira Ayuso 	return ipvs->sysctl_sync_qlen_max;
10631c003b15SPablo Neira Ayuso }
10641c003b15SPablo Neira Ayuso 
/* CONFIG_SYSCTL: returns ipvs->sysctl_sync_sock_size. */
10651c003b15SPablo Neira Ayuso static inline int sysctl_sync_sock_size(struct netns_ipvs *ipvs)
10661c003b15SPablo Neira Ayuso {
10671c003b15SPablo Neira Ayuso 	return ipvs->sysctl_sync_sock_size;
10681c003b15SPablo Neira Ayuso }
10691c003b15SPablo Neira Ayuso 
/* CONFIG_SYSCTL: returns ipvs->sysctl_pmtu_disc. */
10703654e611SJulian Anastasov static inline int sysctl_pmtu_disc(struct netns_ipvs *ipvs)
10713654e611SJulian Anastasov {
10723654e611SJulian Anastasov 	return ipvs->sysctl_pmtu_disc;
10733654e611SJulian Anastasov }
10743654e611SJulian Anastasov 
10750c12582fSJulian Anastasov static inline int sysctl_backup_only(struct netns_ipvs *ipvs)
10760c12582fSJulian Anastasov {
10770c12582fSJulian Anastasov 	return ipvs->sync_state & IP_VS_STATE_BACKUP &&
10780c12582fSJulian Anastasov 	       ipvs->sysctl_backup_only;
10790c12582fSJulian Anastasov }
10800c12582fSJulian Anastasov 
108159e0350eSSimon Horman #else
108259e0350eSSimon Horman 
/* !CONFIG_SYSCTL: always DEFAULT_SYNC_THRESHOLD; ipvs is not read. */
108359e0350eSSimon Horman static inline int sysctl_sync_threshold(struct netns_ipvs *ipvs)
108459e0350eSSimon Horman {
108559e0350eSSimon Horman 	return DEFAULT_SYNC_THRESHOLD;
108659e0350eSSimon Horman }
108759e0350eSSimon Horman 
/* !CONFIG_SYSCTL: always DEFAULT_SYNC_PERIOD; ipvs is not read. */
108859e0350eSSimon Horman static inline int sysctl_sync_period(struct netns_ipvs *ipvs)
108959e0350eSSimon Horman {
109059e0350eSSimon Horman 	return DEFAULT_SYNC_PERIOD;
109159e0350eSSimon Horman }
109259e0350eSSimon Horman 
/* !CONFIG_SYSCTL: always DEFAULT_SYNC_REFRESH_PERIOD; ipvs is not read. */
1093749c42b6SJulian Anastasov static inline unsigned int sysctl_sync_refresh_period(struct netns_ipvs *ipvs)
1094749c42b6SJulian Anastasov {
1095749c42b6SJulian Anastasov 	return DEFAULT_SYNC_REFRESH_PERIOD;
1096749c42b6SJulian Anastasov }
1097749c42b6SJulian Anastasov 
/*
 * !CONFIG_SYSCTL: DEFAULT_SYNC_RETRIES masked to its low two bits (& 3);
 * ipvs is not read.
 */
1098749c42b6SJulian Anastasov static inline int sysctl_sync_retries(struct netns_ipvs *ipvs)
1099749c42b6SJulian Anastasov {
1100749c42b6SJulian Anastasov 	return DEFAULT_SYNC_RETRIES & 3;
1101749c42b6SJulian Anastasov }
1102749c42b6SJulian Anastasov 
/* !CONFIG_SYSCTL: always DEFAULT_SYNC_VER; ipvs is not read. */
11037532e8d4SSimon Horman static inline int sysctl_sync_ver(struct netns_ipvs *ipvs)
11047532e8d4SSimon Horman {
11057532e8d4SSimon Horman 	return DEFAULT_SYNC_VER;
11067532e8d4SSimon Horman }
11077532e8d4SSimon Horman 
/* !CONFIG_SYSCTL: always DEFAULT_SLOPPY_TCP; ipvs is not read. */
1108c6c96c18SAlexander Frolkin static inline int sysctl_sloppy_tcp(struct netns_ipvs *ipvs)
1109c6c96c18SAlexander Frolkin {
1110c6c96c18SAlexander Frolkin 	return DEFAULT_SLOPPY_TCP;
1111c6c96c18SAlexander Frolkin }
1112c6c96c18SAlexander Frolkin 
/* !CONFIG_SYSCTL: always DEFAULT_SLOPPY_SCTP; ipvs is not read. */
1113c6c96c18SAlexander Frolkin static inline int sysctl_sloppy_sctp(struct netns_ipvs *ipvs)
1114c6c96c18SAlexander Frolkin {
1115c6c96c18SAlexander Frolkin 	return DEFAULT_SLOPPY_SCTP;
1116c6c96c18SAlexander Frolkin }
1117c6c96c18SAlexander Frolkin 
/* !CONFIG_SYSCTL: always 1; ipvs is not read. */
1118f73181c8SPablo Neira Ayuso static inline int sysctl_sync_ports(struct netns_ipvs *ipvs)
1119f73181c8SPablo Neira Ayuso {
1120f73181c8SPablo Neira Ayuso 	return 1;
1121f73181c8SPablo Neira Ayuso }
1122f73181c8SPablo Neira Ayuso 
/* !CONFIG_SYSCTL: always 0; ipvs is not read. */
11234d0c875dSJulian Anastasov static inline int sysctl_sync_persist_mode(struct netns_ipvs *ipvs)
11244d0c875dSJulian Anastasov {
11254d0c875dSJulian Anastasov 	return 0;
11264d0c875dSJulian Anastasov }
11274d0c875dSJulian Anastasov 
/* !CONFIG_SYSCTL: always IPVS_SYNC_QLEN_MAX; ipvs is not read. */
112807995674SZhang Yanfei static inline unsigned long sysctl_sync_qlen_max(struct netns_ipvs *ipvs)
11291c003b15SPablo Neira Ayuso {
11301c003b15SPablo Neira Ayuso 	return IPVS_SYNC_QLEN_MAX;
11311c003b15SPablo Neira Ayuso }
11321c003b15SPablo Neira Ayuso 
/* !CONFIG_SYSCTL: always 0; ipvs is not read. */
11331c003b15SPablo Neira Ayuso static inline int sysctl_sync_sock_size(struct netns_ipvs *ipvs)
11341c003b15SPablo Neira Ayuso {
11351c003b15SPablo Neira Ayuso 	return 0;
11361c003b15SPablo Neira Ayuso }
11371c003b15SPablo Neira Ayuso 
/* !CONFIG_SYSCTL: always 1; ipvs is not read. */
11383654e611SJulian Anastasov static inline int sysctl_pmtu_disc(struct netns_ipvs *ipvs)
11393654e611SJulian Anastasov {
11403654e611SJulian Anastasov 	return 1;
11413654e611SJulian Anastasov }
11423654e611SJulian Anastasov 
/* !CONFIG_SYSCTL: always 0; ipvs is not read. */
11430c12582fSJulian Anastasov static inline int sysctl_backup_only(struct netns_ipvs *ipvs)
11440c12582fSJulian Anastasov {
11450c12582fSJulian Anastasov 	return 0;
11460c12582fSJulian Anastasov }
11470c12582fSJulian Anastasov 
114859e0350eSSimon Horman #endif
114959e0350eSSimon Horman 
11501da177e4SLinus Torvalds /*
11511da177e4SLinus Torvalds  *      IPVS core functions
11521da177e4SLinus Torvalds  *      (from ip_vs_core.c)
11531da177e4SLinus Torvalds  */
11545c3a0fd7SJoe Perches const char *ip_vs_proto_name(unsigned int proto);
11555c3a0fd7SJoe Perches void ip_vs_init_hash_table(struct list_head *table, int rows);
/*
 * Calls ip_vs_init_hash_table() with ARRAY_SIZE(t) as the row count, so
 * t must be a real array, not a pointer to one.
 */
1156afdd6140SSven Wegener #define IP_VS_INIT_HASH_TABLE(t) ip_vs_init_hash_table((t), ARRAY_SIZE((t)))
11571da177e4SLinus Torvalds 
/* Value for the type member of struct ip_vs_app (IP_VS_APP_TYPE_xxx) */
11581da177e4SLinus Torvalds #define IP_VS_APP_TYPE_FTP	1
11591da177e4SLinus Torvalds 
11601da177e4SLinus Torvalds /*
11611da177e4SLinus Torvalds  *     ip_vs_conn handling functions
11621da177e4SLinus Torvalds  *     (from ip_vs_conn.c)
11631da177e4SLinus Torvalds  */
11641da177e4SLinus Torvalds 
/* Packet direction selectors; the values are consecutive starting at 0. */
enum {
	IP_VS_DIR_INPUT		= 0,
	IP_VS_DIR_OUTPUT	= 1,
	IP_VS_DIR_INPUT_ONLY	= 2,
	IP_VS_DIR_LAST		= 3,	/* one past the last direction value */
};
11711da177e4SLinus Torvalds 
11726e67e586SHans Schillstrom static inline void ip_vs_conn_fill_param(struct net *net, int af, int protocol,
1173f11017ecSSimon Horman 					 const union nf_inet_addr *caddr,
1174f11017ecSSimon Horman 					 __be16 cport,
1175f11017ecSSimon Horman 					 const union nf_inet_addr *vaddr,
1176f11017ecSSimon Horman 					 __be16 vport,
1177f11017ecSSimon Horman 					 struct ip_vs_conn_param *p)
1178f11017ecSSimon Horman {
11796e67e586SHans Schillstrom 	p->net = net;
1180f11017ecSSimon Horman 	p->af = af;
1181f11017ecSSimon Horman 	p->protocol = protocol;
1182f11017ecSSimon Horman 	p->caddr = caddr;
1183f11017ecSSimon Horman 	p->cport = cport;
1184f11017ecSSimon Horman 	p->vaddr = vaddr;
1185f11017ecSSimon Horman 	p->vport = vport;
118685999283SSimon Horman 	p->pe = NULL;
118785999283SSimon Horman 	p->pe_data = NULL;
1188f11017ecSSimon Horman }
118928364a59SJulius Volz 
1190f11017ecSSimon Horman struct ip_vs_conn *ip_vs_conn_in_get(const struct ip_vs_conn_param *p);
1191f11017ecSSimon Horman struct ip_vs_conn *ip_vs_ct_in_get(const struct ip_vs_conn_param *p);
119228364a59SJulius Volz 
11935c0d2374SSimon Horman struct ip_vs_conn * ip_vs_conn_in_get_proto(int af, const struct sk_buff *skb,
11945c0d2374SSimon Horman 					    const struct ip_vs_iphdr *iph,
11955c0d2374SSimon Horman 					    int inverse);
11965c0d2374SSimon Horman 
1197f11017ecSSimon Horman struct ip_vs_conn *ip_vs_conn_out_get(const struct ip_vs_conn_param *p);
11981da177e4SLinus Torvalds 
11995c0d2374SSimon Horman struct ip_vs_conn * ip_vs_conn_out_get_proto(int af, const struct sk_buff *skb,
12005c0d2374SSimon Horman 					     const struct ip_vs_iphdr *iph,
12015c0d2374SSimon Horman 					     int inverse);
12025c0d2374SSimon Horman 
1203088339a5SJulian Anastasov /* Get reference to gain full access to conn.
1204088339a5SJulian Anastasov  * By default, RCU read-side critical sections have access only to
1205088339a5SJulian Anastasov  * conn fields and its PE data, see ip_vs_conn_rcu_free() for reference.
1206088339a5SJulian Anastasov  */
1207088339a5SJulian Anastasov static inline bool __ip_vs_conn_get(struct ip_vs_conn *cp)
1208088339a5SJulian Anastasov {
1209088339a5SJulian Anastasov 	return atomic_inc_not_zero(&cp->refcnt);
1210088339a5SJulian Anastasov }
1211088339a5SJulian Anastasov 
12121da177e4SLinus Torvalds /* put back the conn without restarting its timer */
12131da177e4SLinus Torvalds static inline void __ip_vs_conn_put(struct ip_vs_conn *cp)
12141da177e4SLinus Torvalds {
12154e857c58SPeter Zijlstra 	smp_mb__before_atomic();
12161da177e4SLinus Torvalds 	atomic_dec(&cp->refcnt);
12171da177e4SLinus Torvalds }
12185c3a0fd7SJoe Perches void ip_vs_conn_put(struct ip_vs_conn *cp);
12195c3a0fd7SJoe Perches void ip_vs_conn_fill_cport(struct ip_vs_conn *cp, __be16 cport);
12201da177e4SLinus Torvalds 
1221ba38528aSAlex Gartrell struct ip_vs_conn *ip_vs_conn_new(const struct ip_vs_conn_param *p, int dest_af,
1222f11017ecSSimon Horman 				  const union nf_inet_addr *daddr,
122395c96174SEric Dumazet 				  __be16 dport, unsigned int flags,
12240e051e68SHans Schillstrom 				  struct ip_vs_dest *dest, __u32 fwmark);
12255c3a0fd7SJoe Perches void ip_vs_conn_expire_now(struct ip_vs_conn *cp);
12261da177e4SLinus Torvalds 
12275c3a0fd7SJoe Perches const char *ip_vs_state_name(__u16 proto, int state);
12281da177e4SLinus Torvalds 
12295c3a0fd7SJoe Perches void ip_vs_tcp_conn_listen(struct net *net, struct ip_vs_conn *cp);
12305c3a0fd7SJoe Perches int ip_vs_check_template(struct ip_vs_conn *ct);
12315c3a0fd7SJoe Perches void ip_vs_random_dropentry(struct net *net);
12325c3a0fd7SJoe Perches int ip_vs_conn_init(void);
12335c3a0fd7SJoe Perches void ip_vs_conn_cleanup(void);
12341da177e4SLinus Torvalds 
12351da177e4SLinus Torvalds static inline void ip_vs_control_del(struct ip_vs_conn *cp)
12361da177e4SLinus Torvalds {
12371da177e4SLinus Torvalds 	struct ip_vs_conn *ctl_cp = cp->control;
12381da177e4SLinus Torvalds 	if (!ctl_cp) {
1239cfc78c5aSJulius Volz 		IP_VS_ERR_BUF("request control DEL for uncontrolled: "
1240cfc78c5aSJulius Volz 			      "%s:%d to %s:%d\n",
1241cfc78c5aSJulius Volz 			      IP_VS_DBG_ADDR(cp->af, &cp->caddr),
1242cfc78c5aSJulius Volz 			      ntohs(cp->cport),
1243cfc78c5aSJulius Volz 			      IP_VS_DBG_ADDR(cp->af, &cp->vaddr),
1244cfc78c5aSJulius Volz 			      ntohs(cp->vport));
1245cfc78c5aSJulius Volz 
12461da177e4SLinus Torvalds 		return;
12471da177e4SLinus Torvalds 	}
12481da177e4SLinus Torvalds 
1249cfc78c5aSJulius Volz 	IP_VS_DBG_BUF(7, "DELeting control for: "
1250cfc78c5aSJulius Volz 		      "cp.dst=%s:%d ctl_cp.dst=%s:%d\n",
1251cfc78c5aSJulius Volz 		      IP_VS_DBG_ADDR(cp->af, &cp->caddr),
1252cfc78c5aSJulius Volz 		      ntohs(cp->cport),
1253cfc78c5aSJulius Volz 		      IP_VS_DBG_ADDR(cp->af, &ctl_cp->caddr),
1254cfc78c5aSJulius Volz 		      ntohs(ctl_cp->cport));
12551da177e4SLinus Torvalds 
12561da177e4SLinus Torvalds 	cp->control = NULL;
12571da177e4SLinus Torvalds 	if (atomic_read(&ctl_cp->n_control) == 0) {
1258cfc78c5aSJulius Volz 		IP_VS_ERR_BUF("BUG control DEL with n=0 : "
1259cfc78c5aSJulius Volz 			      "%s:%d to %s:%d\n",
1260cfc78c5aSJulius Volz 			      IP_VS_DBG_ADDR(cp->af, &cp->caddr),
1261cfc78c5aSJulius Volz 			      ntohs(cp->cport),
1262cfc78c5aSJulius Volz 			      IP_VS_DBG_ADDR(cp->af, &cp->vaddr),
1263cfc78c5aSJulius Volz 			      ntohs(cp->vport));
1264cfc78c5aSJulius Volz 
12651da177e4SLinus Torvalds 		return;
12661da177e4SLinus Torvalds 	}
12671da177e4SLinus Torvalds 	atomic_dec(&ctl_cp->n_control);
12681da177e4SLinus Torvalds }
12691da177e4SLinus Torvalds 
12701da177e4SLinus Torvalds static inline void
12711da177e4SLinus Torvalds ip_vs_control_add(struct ip_vs_conn *cp, struct ip_vs_conn *ctl_cp)
12721da177e4SLinus Torvalds {
12731da177e4SLinus Torvalds 	if (cp->control) {
1274cfc78c5aSJulius Volz 		IP_VS_ERR_BUF("request control ADD for already controlled: "
1275cfc78c5aSJulius Volz 			      "%s:%d to %s:%d\n",
1276cfc78c5aSJulius Volz 			      IP_VS_DBG_ADDR(cp->af, &cp->caddr),
1277cfc78c5aSJulius Volz 			      ntohs(cp->cport),
1278cfc78c5aSJulius Volz 			      IP_VS_DBG_ADDR(cp->af, &cp->vaddr),
1279cfc78c5aSJulius Volz 			      ntohs(cp->vport));
1280cfc78c5aSJulius Volz 
12811da177e4SLinus Torvalds 		ip_vs_control_del(cp);
12821da177e4SLinus Torvalds 	}
12831da177e4SLinus Torvalds 
1284cfc78c5aSJulius Volz 	IP_VS_DBG_BUF(7, "ADDing control for: "
1285cfc78c5aSJulius Volz 		      "cp.dst=%s:%d ctl_cp.dst=%s:%d\n",
1286cfc78c5aSJulius Volz 		      IP_VS_DBG_ADDR(cp->af, &cp->caddr),
1287cfc78c5aSJulius Volz 		      ntohs(cp->cport),
1288cfc78c5aSJulius Volz 		      IP_VS_DBG_ADDR(cp->af, &ctl_cp->caddr),
1289cfc78c5aSJulius Volz 		      ntohs(ctl_cp->cport));
12901da177e4SLinus Torvalds 
12911da177e4SLinus Torvalds 	cp->control = ctl_cp;
12921da177e4SLinus Torvalds 	atomic_inc(&ctl_cp->n_control);
12931da177e4SLinus Torvalds }
12941da177e4SLinus Torvalds 
12957a4f0761SHans Schillstrom /*
12967a4f0761SHans Schillstrom  * IPVS netns init & cleanup functions
12977a4f0761SHans Schillstrom  */
12985c3a0fd7SJoe Perches int ip_vs_estimator_net_init(struct net *net);
12995c3a0fd7SJoe Perches int ip_vs_control_net_init(struct net *net);
13005c3a0fd7SJoe Perches int ip_vs_protocol_net_init(struct net *net);
13015c3a0fd7SJoe Perches int ip_vs_app_net_init(struct net *net);
13025c3a0fd7SJoe Perches int ip_vs_conn_net_init(struct net *net);
13035c3a0fd7SJoe Perches int ip_vs_sync_net_init(struct net *net);
13045c3a0fd7SJoe Perches void ip_vs_conn_net_cleanup(struct net *net);
13055c3a0fd7SJoe Perches void ip_vs_app_net_cleanup(struct net *net);
13065c3a0fd7SJoe Perches void ip_vs_protocol_net_cleanup(struct net *net);
13075c3a0fd7SJoe Perches void ip_vs_control_net_cleanup(struct net *net);
13085c3a0fd7SJoe Perches void ip_vs_estimator_net_cleanup(struct net *net);
13095c3a0fd7SJoe Perches void ip_vs_sync_net_cleanup(struct net *net);
13105c3a0fd7SJoe Perches void ip_vs_service_net_cleanup(struct net *net);
13111da177e4SLinus Torvalds 
13121da177e4SLinus Torvalds /*
13131da177e4SLinus Torvalds  *      IPVS application functions
13141da177e4SLinus Torvalds  *      (from ip_vs_app.c)
13151da177e4SLinus Torvalds  */
13161da177e4SLinus Torvalds #define IP_VS_APP_MAX_PORTS  8
13175c3a0fd7SJoe Perches struct ip_vs_app *register_ip_vs_app(struct net *net, struct ip_vs_app *app);
13185c3a0fd7SJoe Perches void unregister_ip_vs_app(struct net *net, struct ip_vs_app *app);
13195c3a0fd7SJoe Perches int ip_vs_bind_app(struct ip_vs_conn *cp, struct ip_vs_protocol *pp);
13205c3a0fd7SJoe Perches void ip_vs_unbind_app(struct ip_vs_conn *cp);
13215c3a0fd7SJoe Perches int register_ip_vs_app_inc(struct net *net, struct ip_vs_app *app, __u16 proto,
13225c3a0fd7SJoe Perches 			   __u16 port);
13235c3a0fd7SJoe Perches int ip_vs_app_inc_get(struct ip_vs_app *inc);
13245c3a0fd7SJoe Perches void ip_vs_app_inc_put(struct ip_vs_app *inc);
13251da177e4SLinus Torvalds 
13265c3a0fd7SJoe Perches int ip_vs_app_pkt_out(struct ip_vs_conn *, struct sk_buff *skb);
13275c3a0fd7SJoe Perches int ip_vs_app_pkt_in(struct ip_vs_conn *, struct sk_buff *skb);
13281da177e4SLinus Torvalds 
13298be67a66SSimon Horman int register_ip_vs_pe(struct ip_vs_pe *pe);
13308be67a66SSimon Horman int unregister_ip_vs_pe(struct ip_vs_pe *pe);
1331e9e5eee8SSimon Horman struct ip_vs_pe *ip_vs_pe_getbyname(const char *name);
1332fe5e7a1eSHans Schillstrom struct ip_vs_pe *__ip_vs_pe_getbyname(const char *pe_name);
1333e9e5eee8SSimon Horman 
133469e7dae4SPaul Gortmaker /*
133569e7dae4SPaul Gortmaker  * Use a #define to avoid all of module.h just for these trivial ops
133669e7dae4SPaul Gortmaker  */
/*
 * Take a module reference for @pe when @pe is non-NULL and has a module.
 *
 * Wrapped in do { } while (0) so that the macro behaves as one statement
 * (safe in an unbraced if/else); terminate the invocation with ';'.
 * @pe is evaluated more than once, so it must be free of side effects.
 */
#define ip_vs_pe_get(pe)				\
	do {						\
		if ((pe) && (pe)->module)		\
			__module_get((pe)->module);	\
	} while (0)
1340e9e5eee8SSimon Horman 
/*
 * Drop a module reference for @pe when @pe is non-NULL and has a module.
 *
 * Wrapped in do { } while (0) so that the macro behaves as one statement
 * (safe in an unbraced if/else); terminate the invocation with ';'.
 * @pe is evaluated more than once, so it must be free of side effects.
 */
#define ip_vs_pe_put(pe)				\
	do {						\
		if ((pe) && (pe)->module)		\
			module_put((pe)->module);	\
	} while (0)
13441da177e4SLinus Torvalds 
13451da177e4SLinus Torvalds /*
13461da177e4SLinus Torvalds  *	IPVS protocol functions (from ip_vs_proto.c)
13471da177e4SLinus Torvalds  */
13485c3a0fd7SJoe Perches int ip_vs_protocol_init(void);
13495c3a0fd7SJoe Perches void ip_vs_protocol_cleanup(void);
13505c3a0fd7SJoe Perches void ip_vs_protocol_timeout_change(struct netns_ipvs *ipvs, int flags);
13515c3a0fd7SJoe Perches int *ip_vs_create_timeout_table(int *table, int size);
13525c3a0fd7SJoe Perches int ip_vs_set_state_timeout(int *table, int num, const char *const *names,
135336cbd3dcSJan Engelhardt 			    const char *name, int to);
13545c3a0fd7SJoe Perches void ip_vs_tcpudp_debug_packet(int af, struct ip_vs_protocol *pp,
13555c3a0fd7SJoe Perches 			       const struct sk_buff *skb, int offset,
13565c3a0fd7SJoe Perches 			       const char *msg);
13571da177e4SLinus Torvalds 
13581da177e4SLinus Torvalds extern struct ip_vs_protocol ip_vs_protocol_tcp;
13591da177e4SLinus Torvalds extern struct ip_vs_protocol ip_vs_protocol_udp;
13601da177e4SLinus Torvalds extern struct ip_vs_protocol ip_vs_protocol_icmp;
13611da177e4SLinus Torvalds extern struct ip_vs_protocol ip_vs_protocol_esp;
13621da177e4SLinus Torvalds extern struct ip_vs_protocol ip_vs_protocol_ah;
13632906f66aSVenkata Mohan Reddy extern struct ip_vs_protocol ip_vs_protocol_sctp;
13641da177e4SLinus Torvalds 
13651da177e4SLinus Torvalds /*
13661da177e4SLinus Torvalds  *      Registering/unregistering scheduler functions
13671da177e4SLinus Torvalds  *      (from ip_vs_sched.c)
13681da177e4SLinus Torvalds  */
13695c3a0fd7SJoe Perches int register_ip_vs_scheduler(struct ip_vs_scheduler *scheduler);
13705c3a0fd7SJoe Perches int unregister_ip_vs_scheduler(struct ip_vs_scheduler *scheduler);
13715c3a0fd7SJoe Perches int ip_vs_bind_scheduler(struct ip_vs_service *svc,
13721da177e4SLinus Torvalds 			 struct ip_vs_scheduler *scheduler);
13735c3a0fd7SJoe Perches void ip_vs_unbind_scheduler(struct ip_vs_service *svc,
1374ceec4c38SJulian Anastasov 			    struct ip_vs_scheduler *sched);
13755c3a0fd7SJoe Perches struct ip_vs_scheduler *ip_vs_scheduler_get(const char *sched_name);
13765c3a0fd7SJoe Perches void ip_vs_scheduler_put(struct ip_vs_scheduler *scheduler);
13775c3a0fd7SJoe Perches struct ip_vs_conn *
1378190ecd27SJulian Anastasov ip_vs_schedule(struct ip_vs_service *svc, struct sk_buff *skb,
1379d4383f04SJesper Dangaard Brouer 	       struct ip_vs_proto_data *pd, int *ignored,
1380d4383f04SJesper Dangaard Brouer 	       struct ip_vs_iphdr *iph);
13815c3a0fd7SJoe Perches int ip_vs_leave(struct ip_vs_service *svc, struct sk_buff *skb,
1382d4383f04SJesper Dangaard Brouer 		struct ip_vs_proto_data *pd, struct ip_vs_iphdr *iph);
13831da177e4SLinus Torvalds 
13845c3a0fd7SJoe Perches void ip_vs_scheduler_err(struct ip_vs_service *svc, const char *msg);
138541ac51eeSPatrick Schaaf 
13861da177e4SLinus Torvalds 
13871da177e4SLinus Torvalds /*
13881da177e4SLinus Torvalds  *      IPVS control data and functions (from ip_vs_ctl.c)
13891da177e4SLinus Torvalds  */
13901da177e4SLinus Torvalds extern struct ip_vs_stats ip_vs_stats;
1391b880c1f0SHans Schillstrom extern int sysctl_ip_vs_sync_ver;
13921da177e4SLinus Torvalds 
13935c3a0fd7SJoe Perches struct ip_vs_service *
1394ceec4c38SJulian Anastasov ip_vs_service_find(struct net *net, int af, __u32 fwmark, __u16 protocol,
13953c2e0505SJulius Volz 		  const union nf_inet_addr *vaddr, __be16 vport);
13961da177e4SLinus Torvalds 
13975c3a0fd7SJoe Perches bool ip_vs_has_real_service(struct net *net, int af, __u16 protocol,
13987937df15SJulius Volz 			    const union nf_inet_addr *daddr, __be16 dport);
13997937df15SJulius Volz 
14005c3a0fd7SJoe Perches int ip_vs_use_count_inc(void);
14015c3a0fd7SJoe Perches void ip_vs_use_count_dec(void);
14025c3a0fd7SJoe Perches int ip_vs_register_nl_ioctl(void);
14035c3a0fd7SJoe Perches void ip_vs_unregister_nl_ioctl(void);
14045c3a0fd7SJoe Perches int ip_vs_control_init(void);
14055c3a0fd7SJoe Perches void ip_vs_control_cleanup(void);
14065c3a0fd7SJoe Perches struct ip_vs_dest *
1407655eef10SAlex Gartrell ip_vs_find_dest(struct net *net, int svc_af, int dest_af,
1408655eef10SAlex Gartrell 		const union nf_inet_addr *daddr, __be16 dport,
1409655eef10SAlex Gartrell 		const union nf_inet_addr *vaddr, __be16 vport,
141052793dbeSJulian Anastasov 		__u16 protocol, __u32 fwmark, __u32 flags);
14115c3a0fd7SJoe Perches void ip_vs_try_bind_dest(struct ip_vs_conn *cp);
14121da177e4SLinus Torvalds 
1413fca9c20aSJulian Anastasov static inline void ip_vs_dest_hold(struct ip_vs_dest *dest)
1414fca9c20aSJulian Anastasov {
1415fca9c20aSJulian Anastasov 	atomic_inc(&dest->refcnt);
1416fca9c20aSJulian Anastasov }
1417fca9c20aSJulian Anastasov 
1418fca9c20aSJulian Anastasov static inline void ip_vs_dest_put(struct ip_vs_dest *dest)
1419fca9c20aSJulian Anastasov {
14204e857c58SPeter Zijlstra 	smp_mb__before_atomic();
1421fca9c20aSJulian Anastasov 	atomic_dec(&dest->refcnt);
1422fca9c20aSJulian Anastasov }
14231da177e4SLinus Torvalds 
14249e4e948aSJulian Anastasov static inline void ip_vs_dest_put_and_free(struct ip_vs_dest *dest)
14259e4e948aSJulian Anastasov {
14269e4e948aSJulian Anastasov 	if (atomic_dec_return(&dest->refcnt) < 0)
14279e4e948aSJulian Anastasov 		kfree(dest);
14289e4e948aSJulian Anastasov }
14299e4e948aSJulian Anastasov 
14301da177e4SLinus Torvalds /*
14311da177e4SLinus Torvalds  *      IPVS sync daemon data and function prototypes
14321da177e4SLinus Torvalds  *      (from ip_vs_sync.c)
14331da177e4SLinus Torvalds  */
14345c3a0fd7SJoe Perches int start_sync_thread(struct net *net, int state, char *mcast_ifn, __u8 syncid);
14355c3a0fd7SJoe Perches int stop_sync_thread(struct net *net, int state);
14365c3a0fd7SJoe Perches void ip_vs_sync_conn(struct net *net, struct ip_vs_conn *cp, int pkts);
14371da177e4SLinus Torvalds 
14381da177e4SLinus Torvalds /*
14391da177e4SLinus Torvalds  *      IPVS rate estimator prototypes (from ip_vs_est.c)
14401da177e4SLinus Torvalds  */
14415c3a0fd7SJoe Perches void ip_vs_start_estimator(struct net *net, struct ip_vs_stats *stats);
14425c3a0fd7SJoe Perches void ip_vs_stop_estimator(struct net *net, struct ip_vs_stats *stats);
14435c3a0fd7SJoe Perches void ip_vs_zero_estimator(struct ip_vs_stats *stats);
14445c3a0fd7SJoe Perches void ip_vs_read_estimator(struct ip_vs_stats_user *dst,
1445ea9f22ccSJulian Anastasov 			  struct ip_vs_stats *stats);
14461da177e4SLinus Torvalds 
14471da177e4SLinus Torvalds /*
14481da177e4SLinus Torvalds  *	Various IPVS packet transmitters (from ip_vs_xmit.c)
14491da177e4SLinus Torvalds  */
14505c3a0fd7SJoe Perches int ip_vs_null_xmit(struct sk_buff *skb, struct ip_vs_conn *cp,
1451d4383f04SJesper Dangaard Brouer 		    struct ip_vs_protocol *pp, struct ip_vs_iphdr *iph);
14525c3a0fd7SJoe Perches int ip_vs_bypass_xmit(struct sk_buff *skb, struct ip_vs_conn *cp,
1453d4383f04SJesper Dangaard Brouer 		      struct ip_vs_protocol *pp, struct ip_vs_iphdr *iph);
14545c3a0fd7SJoe Perches int ip_vs_nat_xmit(struct sk_buff *skb, struct ip_vs_conn *cp,
1455d4383f04SJesper Dangaard Brouer 		   struct ip_vs_protocol *pp, struct ip_vs_iphdr *iph);
14565c3a0fd7SJoe Perches int ip_vs_tunnel_xmit(struct sk_buff *skb, struct ip_vs_conn *cp,
14575c3a0fd7SJoe Perches 		      struct ip_vs_protocol *pp, struct ip_vs_iphdr *iph);
14585c3a0fd7SJoe Perches int ip_vs_dr_xmit(struct sk_buff *skb, struct ip_vs_conn *cp,
14595c3a0fd7SJoe Perches 		  struct ip_vs_protocol *pp, struct ip_vs_iphdr *iph);
14605c3a0fd7SJoe Perches int ip_vs_icmp_xmit(struct sk_buff *skb, struct ip_vs_conn *cp,
1461d4383f04SJesper Dangaard Brouer 		    struct ip_vs_protocol *pp, int offset,
1462d4383f04SJesper Dangaard Brouer 		    unsigned int hooknum, struct ip_vs_iphdr *iph);
14635c3a0fd7SJoe Perches void ip_vs_dest_dst_rcu_free(struct rcu_head *head);
14641da177e4SLinus Torvalds 
1465b3cdd2a7SJulius Volz #ifdef CONFIG_IP_VS_IPV6
14665c3a0fd7SJoe Perches int ip_vs_bypass_xmit_v6(struct sk_buff *skb, struct ip_vs_conn *cp,
1467d4383f04SJesper Dangaard Brouer 			 struct ip_vs_protocol *pp, struct ip_vs_iphdr *iph);
14685c3a0fd7SJoe Perches int ip_vs_nat_xmit_v6(struct sk_buff *skb, struct ip_vs_conn *cp,
14695c3a0fd7SJoe Perches 		      struct ip_vs_protocol *pp, struct ip_vs_iphdr *iph);
14705c3a0fd7SJoe Perches int ip_vs_tunnel_xmit_v6(struct sk_buff *skb, struct ip_vs_conn *cp,
14715c3a0fd7SJoe Perches 			 struct ip_vs_protocol *pp, struct ip_vs_iphdr *iph);
14725c3a0fd7SJoe Perches int ip_vs_dr_xmit_v6(struct sk_buff *skb, struct ip_vs_conn *cp,
14735c3a0fd7SJoe Perches 		     struct ip_vs_protocol *pp, struct ip_vs_iphdr *iph);
14745c3a0fd7SJoe Perches int ip_vs_icmp_xmit_v6(struct sk_buff *skb, struct ip_vs_conn *cp,
1475d4383f04SJesper Dangaard Brouer 		       struct ip_vs_protocol *pp, int offset,
1476d4383f04SJesper Dangaard Brouer 		       unsigned int hooknum, struct ip_vs_iphdr *iph);
1477b3cdd2a7SJulius Volz #endif
14781da177e4SLinus Torvalds 
14793a1bbf18SSimon Horman #ifdef CONFIG_SYSCTL
14801da177e4SLinus Torvalds /*
14811da177e4SLinus Torvalds  *	This is a simple mechanism to ignore packets when
14821da177e4SLinus Torvalds  *	we are loaded. Just set ip_vs_drop_rate to 'n' and
14831da177e4SLinus Torvalds  *	we start to drop 1/rate of the packets
14841da177e4SLinus Torvalds  */
14851da177e4SLinus Torvalds 
1486a0840e2eSHans Schillstrom static inline int ip_vs_todrop(struct netns_ipvs *ipvs)
14871da177e4SLinus Torvalds {
1488a0840e2eSHans Schillstrom 	if (!ipvs->drop_rate)
1489a0840e2eSHans Schillstrom 		return 0;
1490a0840e2eSHans Schillstrom 	if (--ipvs->drop_counter > 0)
1491a0840e2eSHans Schillstrom 		return 0;
1492a0840e2eSHans Schillstrom 	ipvs->drop_counter = ipvs->drop_rate;
14931da177e4SLinus Torvalds 	return 1;
14941da177e4SLinus Torvalds }
14953a1bbf18SSimon Horman #else
/* Variant that never drops: @ipvs is ignored and 0 is always returned. */
static inline int ip_vs_todrop(struct netns_ipvs *ipvs)
{
	return 0;
}
14973a1bbf18SSimon Horman #endif
14981da177e4SLinus Torvalds 
14991da177e4SLinus Torvalds /*
15001da177e4SLinus Torvalds  *      ip_vs_fwd_tag returns the forwarding tag of the connection
15011da177e4SLinus Torvalds  */
/*
 * Forwarding-method bits of connection @cp (cp->flags masked with
 * IP_VS_CONN_F_FWD_MASK).  The argument is parenthesized so that
 * expressions such as "&conn" or "p + 1" expand correctly.
 */
#define IP_VS_FWD_METHOD(cp)  ((cp)->flags & IP_VS_CONN_F_FWD_MASK)
15031da177e4SLinus Torvalds 
1504732db659SAdrian Bunk static inline char ip_vs_fwd_tag(struct ip_vs_conn *cp)
15051da177e4SLinus Torvalds {
15061da177e4SLinus Torvalds 	char fwd;
15071da177e4SLinus Torvalds 
15081da177e4SLinus Torvalds 	switch (IP_VS_FWD_METHOD(cp)) {
15091da177e4SLinus Torvalds 	case IP_VS_CONN_F_MASQ:
15101da177e4SLinus Torvalds 		fwd = 'M'; break;
15111da177e4SLinus Torvalds 	case IP_VS_CONN_F_LOCALNODE:
15121da177e4SLinus Torvalds 		fwd = 'L'; break;
15131da177e4SLinus Torvalds 	case IP_VS_CONN_F_TUNNEL:
15141da177e4SLinus Torvalds 		fwd = 'T'; break;
15151da177e4SLinus Torvalds 	case IP_VS_CONN_F_DROUTE:
15161da177e4SLinus Torvalds 		fwd = 'R'; break;
15171da177e4SLinus Torvalds 	case IP_VS_CONN_F_BYPASS:
15181da177e4SLinus Torvalds 		fwd = 'B'; break;
15191da177e4SLinus Torvalds 	default:
15201da177e4SLinus Torvalds 		fwd = '?'; break;
15211da177e4SLinus Torvalds 	}
15221da177e4SLinus Torvalds 	return fwd;
15231da177e4SLinus Torvalds }
15241da177e4SLinus Torvalds 
15255c3a0fd7SJoe Perches void ip_vs_nat_icmp(struct sk_buff *skb, struct ip_vs_protocol *pp,
15261da177e4SLinus Torvalds 		    struct ip_vs_conn *cp, int dir);
15271da177e4SLinus Torvalds 
1528b3cdd2a7SJulius Volz #ifdef CONFIG_IP_VS_IPV6
15295c3a0fd7SJoe Perches void ip_vs_nat_icmp_v6(struct sk_buff *skb, struct ip_vs_protocol *pp,
1530b3cdd2a7SJulius Volz 		       struct ip_vs_conn *cp, int dir);
1531b3cdd2a7SJulius Volz #endif
1532b3cdd2a7SJulius Volz 
15335c3a0fd7SJoe Perches __sum16 ip_vs_checksum_complete(struct sk_buff *skb, int offset);
15341da177e4SLinus Torvalds 
1535f9214b26SAl Viro static inline __wsum ip_vs_check_diff4(__be32 old, __be32 new, __wsum oldsum)
15361da177e4SLinus Torvalds {
1537f9214b26SAl Viro 	__be32 diff[2] = { ~old, new };
15381da177e4SLinus Torvalds 
153907f0757aSJoe Perches 	return csum_partial(diff, sizeof(diff), oldsum);
1540f9214b26SAl Viro }
1541f9214b26SAl Viro 
15420bbdd42bSJulius Volz #ifdef CONFIG_IP_VS_IPV6
15430bbdd42bSJulius Volz static inline __wsum ip_vs_check_diff16(const __be32 *old, const __be32 *new,
15440bbdd42bSJulius Volz 					__wsum oldsum)
15450bbdd42bSJulius Volz {
15460bbdd42bSJulius Volz 	__be32 diff[8] = { ~old[3], ~old[2], ~old[1], ~old[0],
15470bbdd42bSJulius Volz 			    new[3],  new[2],  new[1],  new[0] };
15480bbdd42bSJulius Volz 
154907f0757aSJoe Perches 	return csum_partial(diff, sizeof(diff), oldsum);
15500bbdd42bSJulius Volz }
15510bbdd42bSJulius Volz #endif
15520bbdd42bSJulius Volz 
1553f9214b26SAl Viro static inline __wsum ip_vs_check_diff2(__be16 old, __be16 new, __wsum oldsum)
1554f9214b26SAl Viro {
1555f9214b26SAl Viro 	__be16 diff[2] = { ~old, new };
1556f9214b26SAl Viro 
155707f0757aSJoe Perches 	return csum_partial(diff, sizeof(diff), oldsum);
15581da177e4SLinus Torvalds }
15591da177e4SLinus Torvalds 
/*
 * Forget the skb's current (unconfirmed) conntrack and attach the
 * untracked ("notrack") entry in its place.
 *
 * Nothing happens when the skb already carries the untracked entry.
 * Otherwise the reference held through skb->nfct is put, skb->nfct is
 * pointed at the untracked entry with state IP_CT_NEW, and a reference
 * on it is taken.  Without conntrack support the body is empty.
 */
static inline void ip_vs_notrack(struct sk_buff *skb)
{
#if defined(CONFIG_NF_CONNTRACK) || defined(CONFIG_NF_CONNTRACK_MODULE)
	enum ip_conntrack_info ctinfo;
	struct nf_conn *ct;

	ct = nf_ct_get(skb, &ctinfo);
	if (ct && nf_ct_is_untracked(ct))
		return;

	nf_conntrack_put(skb->nfct);
	skb->nfct = &nf_ct_untracked_get()->ct_general;
	skb->nfctinfo = IP_CT_NEW;
	nf_conntrack_get(skb->nfct);
#endif
}
1577cf356d69SJulian Anastasov 
1578f4bc17cdSJulian Anastasov #ifdef CONFIG_IP_VS_NFCT
1579f4bc17cdSJulian Anastasov /*
1580f4bc17cdSJulian Anastasov  *      Netfilter connection tracking
1581f4bc17cdSJulian Anastasov  *      (from ip_vs_nfct.c)
1582f4bc17cdSJulian Anastasov  */
/*
 * Report the conntrack setting: the value of ipvs->sysctl_conntrack
 * when CONFIG_SYSCTL is defined, otherwise always 0.
 */
static inline int ip_vs_conntrack_enabled(struct netns_ipvs *ipvs)
{
#ifndef CONFIG_SYSCTL
	return 0;
#else
	return ipvs->sysctl_conntrack;
#endif
}
1591f4bc17cdSJulian Anastasov 
15925c3a0fd7SJoe Perches void ip_vs_update_conntrack(struct sk_buff *skb, struct ip_vs_conn *cp,
15936523ce15SJulian Anastasov 			    int outin);
15945c3a0fd7SJoe Perches int ip_vs_confirm_conntrack(struct sk_buff *skb);
15955c3a0fd7SJoe Perches void ip_vs_nfct_expect_related(struct sk_buff *skb, struct nf_conn *ct,
1596f4bc17cdSJulian Anastasov 			       struct ip_vs_conn *cp, u_int8_t proto,
1597f4bc17cdSJulian Anastasov 			       const __be16 port, int from_rs);
15985c3a0fd7SJoe Perches void ip_vs_conn_drop_conntrack(struct ip_vs_conn *cp);
1599f4bc17cdSJulian Anastasov 
1600f4bc17cdSJulian Anastasov #else
1601f4bc17cdSJulian Anastasov 
/* Fallback variant: @ipvs is ignored and conntrack is reported as off. */
static inline int ip_vs_conntrack_enabled(struct netns_ipvs *ipvs)
{
	return 0;
}
1606f4bc17cdSJulian Anastasov 
/* Fallback variant: intentionally does nothing with its arguments. */
static inline void ip_vs_update_conntrack(struct sk_buff *skb,
					  struct ip_vs_conn *cp, int outin)
{
	/* no-op */
}
1611f4bc17cdSJulian Anastasov 
1612e23ebf0fSKrzysztof Wilczynski static inline int ip_vs_confirm_conntrack(struct sk_buff *skb)
1613f4bc17cdSJulian Anastasov {
1614f4bc17cdSJulian Anastasov 	return NF_ACCEPT;
1615f4bc17cdSJulian Anastasov }
1616f4bc17cdSJulian Anastasov 
/* Fallback variant: intentionally does nothing with @cp. */
static inline void ip_vs_conn_drop_conntrack(struct ip_vs_conn *cp)
{
	/* no-op */
}
1620f4bc17cdSJulian Anastasov /* CONFIG_IP_VS_NFCT */
1621f4bc17cdSJulian Anastasov #endif
16226523ce15SJulian Anastasov 
1623c16526a7SSimon Kirby static inline int
1624b552f7e3SChangli Gao ip_vs_dest_conn_overhead(struct ip_vs_dest *dest)
1625b552f7e3SChangli Gao {
1626b552f7e3SChangli Gao 	/*
1627b552f7e3SChangli Gao 	 * We think the overhead of processing active connections is 256
1628b552f7e3SChangli Gao 	 * times higher than that of inactive connections in average. (This
1629b552f7e3SChangli Gao 	 * 256 times might not be accurate, we will change it later) We
1630b552f7e3SChangli Gao 	 * use the following formula to estimate the overhead now:
1631b552f7e3SChangli Gao 	 *		  dest->activeconns*256 + dest->inactconns
1632b552f7e3SChangli Gao 	 */
1633b552f7e3SChangli Gao 	return (atomic_read(&dest->activeconns) << 8) +
1634b552f7e3SChangli Gao 		atomic_read(&dest->inactconns);
1635b552f7e3SChangli Gao }
1636b552f7e3SChangli Gao 
1637bc4768ebSJulius Volz #endif	/* _NET_IP_VS_H */
1638