xref: /openbmc/linux/include/net/ip_vs.h (revision ba38528aae6ee2d22226c6a78727ddc13512b068)
11da177e4SLinus Torvalds /*
21da177e4SLinus Torvalds  *      IP Virtual Server
31da177e4SLinus Torvalds  *      data structure and functionality definitions
41da177e4SLinus Torvalds  */
51da177e4SLinus Torvalds 
6bc4768ebSJulius Volz #ifndef _NET_IP_VS_H
7bc4768ebSJulius Volz #define _NET_IP_VS_H
81da177e4SLinus Torvalds 
9bc4768ebSJulius Volz #include <linux/ip_vs.h>                /* definitions shared with userland */
101da177e4SLinus Torvalds 
11bc4768ebSJulius Volz #include <asm/types.h>                  /* for __uXX types */
12bc4768ebSJulius Volz 
131da177e4SLinus Torvalds #include <linux/list.h>                 /* for struct list_head */
141da177e4SLinus Torvalds #include <linux/spinlock.h>             /* for struct rwlock_t */
1560063497SArun Sharma #include <linux/atomic.h>                 /* for struct atomic_t */
161da177e4SLinus Torvalds #include <linux/compiler.h>
1714c85021SArnaldo Carvalho de Melo #include <linux/timer.h>
18187f1882SPaul Gortmaker #include <linux/bug.h>
191da177e4SLinus Torvalds 
2014c85021SArnaldo Carvalho de Melo #include <net/checksum.h>
21e7ade46aSJulius Volz #include <linux/netfilter.h>		/* for union nf_inet_addr */
221668e010SKOVACS Krisztian #include <linux/ip.h>
23e7ade46aSJulius Volz #include <linux/ipv6.h>			/* for struct ipv6hdr */
244e3fd7a0SAlexey Dobriyan #include <net/ipv6.h>
2554d83efaSJesper Dangaard Brouer #if IS_ENABLED(CONFIG_IP_VS_IPV6)
2663dca2c0SJesper Dangaard Brouer #include <linux/netfilter_ipv6/ip6_tables.h>
2763dca2c0SJesper Dangaard Brouer #endif
28a638e514SJesper Dangaard Brouer #if IS_ENABLED(CONFIG_NF_CONNTRACK)
29f4bc17cdSJulian Anastasov #include <net/netfilter/nf_conntrack.h>
30f4bc17cdSJulian Anastasov #endif
3161b1ab45SHans Schillstrom #include <net/net_namespace.h>		/* Netw namespace */
3261b1ab45SHans Schillstrom 
3361b1ab45SHans Schillstrom /*
3461b1ab45SHans Schillstrom  * Generic access of ipvs struct
3561b1ab45SHans Schillstrom  */
3661b1ab45SHans Schillstrom static inline struct netns_ipvs *net_ipvs(struct net* net)
3761b1ab45SHans Schillstrom {
3861b1ab45SHans Schillstrom 	return net->ipvs;
3961b1ab45SHans Schillstrom }
40fc723250SHans Schillstrom /*
41fc723250SHans Schillstrom  * Get net ptr from skb in traffic cases
42fc723250SHans Schillstrom  * use skb_sknet when call is from userland (ioctl or netlink)
43fc723250SHans Schillstrom  */
44a0840e2eSHans Schillstrom static inline struct net *skb_net(const struct sk_buff *skb)
45fc723250SHans Schillstrom {
46fc723250SHans Schillstrom #ifdef CONFIG_NET_NS
47fc723250SHans Schillstrom #ifdef CONFIG_IP_VS_DEBUG
48fc723250SHans Schillstrom 	/*
49fc723250SHans Schillstrom 	 * This is used for debug only.
50fc723250SHans Schillstrom 	 * Start with the most likely hit
51fc723250SHans Schillstrom 	 * End with BUG
52fc723250SHans Schillstrom 	 */
53fc723250SHans Schillstrom 	if (likely(skb->dev && skb->dev->nd_net))
54fc723250SHans Schillstrom 		return dev_net(skb->dev);
55a09d1977SHans Schillstrom 	if (skb_dst(skb) && skb_dst(skb)->dev)
56fc723250SHans Schillstrom 		return dev_net(skb_dst(skb)->dev);
57fc723250SHans Schillstrom 	WARN(skb->sk, "Maybe skb_sknet should be used in %s() at line:%d\n",
58fc723250SHans Schillstrom 		      __func__, __LINE__);
59fc723250SHans Schillstrom 	if (likely(skb->sk && skb->sk->sk_net))
60fc723250SHans Schillstrom 		return sock_net(skb->sk);
61fc723250SHans Schillstrom 	pr_err("There is no net ptr to find in the skb in %s() line:%d\n",
62fc723250SHans Schillstrom 		__func__, __LINE__);
63fc723250SHans Schillstrom 	BUG();
64fc723250SHans Schillstrom #else
65fc723250SHans Schillstrom 	return dev_net(skb->dev ? : skb_dst(skb)->dev);
66fc723250SHans Schillstrom #endif
67fc723250SHans Schillstrom #else
68fc723250SHans Schillstrom 	return &init_net;
69fc723250SHans Schillstrom #endif
70fc723250SHans Schillstrom }
71fc723250SHans Schillstrom 
72a0840e2eSHans Schillstrom static inline struct net *skb_sknet(const struct sk_buff *skb)
73fc723250SHans Schillstrom {
74fc723250SHans Schillstrom #ifdef CONFIG_NET_NS
75fc723250SHans Schillstrom #ifdef CONFIG_IP_VS_DEBUG
76fc723250SHans Schillstrom 	/* Start with the most likely hit */
77fc723250SHans Schillstrom 	if (likely(skb->sk && skb->sk->sk_net))
78fc723250SHans Schillstrom 		return sock_net(skb->sk);
79fc723250SHans Schillstrom 	WARN(skb->dev, "Maybe skb_net should be used instead in %s() line:%d\n",
80fc723250SHans Schillstrom 		       __func__, __LINE__);
81fc723250SHans Schillstrom 	if (likely(skb->dev && skb->dev->nd_net))
82fc723250SHans Schillstrom 		return dev_net(skb->dev);
83fc723250SHans Schillstrom 	pr_err("There is no net ptr to find in the skb in %s() line:%d\n",
84fc723250SHans Schillstrom 		__func__, __LINE__);
85fc723250SHans Schillstrom 	BUG();
86fc723250SHans Schillstrom #else
87fc723250SHans Schillstrom 	return sock_net(skb->sk);
88fc723250SHans Schillstrom #endif
89fc723250SHans Schillstrom #else
90fc723250SHans Schillstrom 	return &init_net;
91fc723250SHans Schillstrom #endif
92fc723250SHans Schillstrom }
93b17fc996SHans Schillstrom /*
94b17fc996SHans Schillstrom  * This one needed for single_open_net since net is stored directly in
9525985edcSLucas De Marchi  * private not as a struct i.e. seq_file_net can't be used.
96b17fc996SHans Schillstrom  */
97b17fc996SHans Schillstrom static inline struct net *seq_file_single_net(struct seq_file *seq)
98b17fc996SHans Schillstrom {
99b17fc996SHans Schillstrom #ifdef CONFIG_NET_NS
100b17fc996SHans Schillstrom 	return (struct net *)seq->private;
101b17fc996SHans Schillstrom #else
102b17fc996SHans Schillstrom 	return &init_net;
103b17fc996SHans Schillstrom #endif
104b17fc996SHans Schillstrom }
1056f7edb48SCatalin(ux) M. BOIE 
1066f7edb48SCatalin(ux) M. BOIE /* Connections' size value needed by ip_vs_ctl.c */
1076f7edb48SCatalin(ux) M. BOIE extern int ip_vs_conn_tab_size;
1086f7edb48SCatalin(ux) M. BOIE 
10964aae3cbSJulius Volz struct ip_vs_iphdr {
11063dca2c0SJesper Dangaard Brouer 	__u32 len;	/* IPv4 simply where L4 starts
11163dca2c0SJesper Dangaard Brouer 			   IPv6 where L4 Transport Header starts */
11263dca2c0SJesper Dangaard Brouer 	__u16 fragoffs; /* IPv6 fragment offset, 0 if first frag (or not frag)*/
11363dca2c0SJesper Dangaard Brouer 	__s16 protocol;
11463dca2c0SJesper Dangaard Brouer 	__s32 flags;
11564aae3cbSJulius Volz 	union nf_inet_addr saddr;
11664aae3cbSJulius Volz 	union nf_inet_addr daddr;
11764aae3cbSJulius Volz };
11864aae3cbSJulius Volz 
/*
 * Thin wrapper around skb_header_pointer(): forwards @skb, @offset, @len
 * and @buffer unchanged and returns its result.  @ipvsh is accepted but
 * not used by this implementation.
 */
static inline void *frag_safe_skb_hp(const struct sk_buff *skb, int offset,
				      int len, void *buffer,
				      const struct ip_vs_iphdr *ipvsh)
{
	return skb_header_pointer(skb, offset, len, buffer);
}
1252f74713dSJesper Dangaard Brouer 
12664aae3cbSJulius Volz static inline void
12763dca2c0SJesper Dangaard Brouer ip_vs_fill_ip4hdr(const void *nh, struct ip_vs_iphdr *iphdr)
12863dca2c0SJesper Dangaard Brouer {
12963dca2c0SJesper Dangaard Brouer 	const struct iphdr *iph = nh;
13063dca2c0SJesper Dangaard Brouer 
13163dca2c0SJesper Dangaard Brouer 	iphdr->len	= iph->ihl * 4;
13263dca2c0SJesper Dangaard Brouer 	iphdr->fragoffs	= 0;
13363dca2c0SJesper Dangaard Brouer 	iphdr->protocol	= iph->protocol;
13463dca2c0SJesper Dangaard Brouer 	iphdr->saddr.ip	= iph->saddr;
13563dca2c0SJesper Dangaard Brouer 	iphdr->daddr.ip	= iph->daddr;
13663dca2c0SJesper Dangaard Brouer }
13763dca2c0SJesper Dangaard Brouer 
13863dca2c0SJesper Dangaard Brouer /* This function handles filling *ip_vs_iphdr, both for IPv4 and IPv6.
13963dca2c0SJesper Dangaard Brouer  * IPv6 requires some extra work, as finding proper header position,
14063dca2c0SJesper Dangaard Brouer  * depend on the IPv6 extension headers.
14163dca2c0SJesper Dangaard Brouer  */
14263dca2c0SJesper Dangaard Brouer static inline void
14363dca2c0SJesper Dangaard Brouer ip_vs_fill_iph_skb(int af, const struct sk_buff *skb, struct ip_vs_iphdr *iphdr)
14464aae3cbSJulius Volz {
14564aae3cbSJulius Volz #ifdef CONFIG_IP_VS_IPV6
14664aae3cbSJulius Volz 	if (af == AF_INET6) {
14763dca2c0SJesper Dangaard Brouer 		const struct ipv6hdr *iph =
14863dca2c0SJesper Dangaard Brouer 			(struct ipv6hdr *)skb_network_header(skb);
1494e3fd7a0SAlexey Dobriyan 		iphdr->saddr.in6 = iph->saddr;
1504e3fd7a0SAlexey Dobriyan 		iphdr->daddr.in6 = iph->daddr;
1516aafeef0SJiri Pirko 		/* ipv6_find_hdr() updates len, flags */
15263dca2c0SJesper Dangaard Brouer 		iphdr->len	 = 0;
15363dca2c0SJesper Dangaard Brouer 		iphdr->flags	 = 0;
15463dca2c0SJesper Dangaard Brouer 		iphdr->protocol  = ipv6_find_hdr(skb, &iphdr->len, -1,
15563dca2c0SJesper Dangaard Brouer 						 &iphdr->fragoffs,
15663dca2c0SJesper Dangaard Brouer 						 &iphdr->flags);
15764aae3cbSJulius Volz 	} else
15864aae3cbSJulius Volz #endif
15964aae3cbSJulius Volz 	{
16063dca2c0SJesper Dangaard Brouer 		const struct iphdr *iph =
16163dca2c0SJesper Dangaard Brouer 			(struct iphdr *)skb_network_header(skb);
16264aae3cbSJulius Volz 		iphdr->len	= iph->ihl * 4;
16363dca2c0SJesper Dangaard Brouer 		iphdr->fragoffs	= 0;
16464aae3cbSJulius Volz 		iphdr->protocol	= iph->protocol;
16564aae3cbSJulius Volz 		iphdr->saddr.ip	= iph->saddr;
16664aae3cbSJulius Volz 		iphdr->daddr.ip	= iph->daddr;
16764aae3cbSJulius Volz 	}
16864aae3cbSJulius Volz }
16964aae3cbSJulius Volz 
17064aae3cbSJulius Volz static inline void ip_vs_addr_copy(int af, union nf_inet_addr *dst,
17164aae3cbSJulius Volz 				   const union nf_inet_addr *src)
17264aae3cbSJulius Volz {
17364aae3cbSJulius Volz #ifdef CONFIG_IP_VS_IPV6
17464aae3cbSJulius Volz 	if (af == AF_INET6)
1754e3fd7a0SAlexey Dobriyan 		dst->in6 = src->in6;
17664aae3cbSJulius Volz 	else
17764aae3cbSJulius Volz #endif
17864aae3cbSJulius Volz 	dst->ip = src->ip;
17964aae3cbSJulius Volz }
18064aae3cbSJulius Volz 
1819a05475cSJulian Anastasov static inline void ip_vs_addr_set(int af, union nf_inet_addr *dst,
1829a05475cSJulian Anastasov 				  const union nf_inet_addr *src)
1839a05475cSJulian Anastasov {
1849a05475cSJulian Anastasov #ifdef CONFIG_IP_VS_IPV6
1859a05475cSJulian Anastasov 	if (af == AF_INET6) {
1869a05475cSJulian Anastasov 		dst->in6 = src->in6;
1879a05475cSJulian Anastasov 		return;
1889a05475cSJulian Anastasov 	}
1899a05475cSJulian Anastasov #endif
1909a05475cSJulian Anastasov 	dst->ip = src->ip;
1919a05475cSJulian Anastasov 	dst->all[1] = 0;
1929a05475cSJulian Anastasov 	dst->all[2] = 0;
1939a05475cSJulian Anastasov 	dst->all[3] = 0;
1949a05475cSJulian Anastasov }
1959a05475cSJulian Anastasov 
19664aae3cbSJulius Volz static inline int ip_vs_addr_equal(int af, const union nf_inet_addr *a,
19764aae3cbSJulius Volz 				   const union nf_inet_addr *b)
19864aae3cbSJulius Volz {
19964aae3cbSJulius Volz #ifdef CONFIG_IP_VS_IPV6
20064aae3cbSJulius Volz 	if (af == AF_INET6)
20164aae3cbSJulius Volz 		return ipv6_addr_equal(&a->in6, &b->in6);
20264aae3cbSJulius Volz #endif
20364aae3cbSJulius Volz 	return a->ip == b->ip;
20464aae3cbSJulius Volz }
20564aae3cbSJulius Volz 
2061da177e4SLinus Torvalds #ifdef CONFIG_IP_VS_DEBUG
20714c85021SArnaldo Carvalho de Melo #include <linux/net.h>
20814c85021SArnaldo Carvalho de Melo 
2095c3a0fd7SJoe Perches int ip_vs_get_debug_level(void);
210c842a3adSJulius Volz 
211c842a3adSJulius Volz static inline const char *ip_vs_dbg_addr(int af, char *buf, size_t buf_len,
212c842a3adSJulius Volz 					 const union nf_inet_addr *addr,
213c842a3adSJulius Volz 					 int *idx)
214c842a3adSJulius Volz {
215c842a3adSJulius Volz 	int len;
216c842a3adSJulius Volz #ifdef CONFIG_IP_VS_IPV6
217c842a3adSJulius Volz 	if (af == AF_INET6)
218120b9c14SJesper Dangaard Brouer 		len = snprintf(&buf[*idx], buf_len - *idx, "[%pI6c]",
2190c6ce78aSHarvey Harrison 			       &addr->in6) + 1;
220c842a3adSJulius Volz 	else
221c842a3adSJulius Volz #endif
2223685f25dSHarvey Harrison 		len = snprintf(&buf[*idx], buf_len - *idx, "%pI4",
2233685f25dSHarvey Harrison 			       &addr->ip) + 1;
224c842a3adSJulius Volz 
225c842a3adSJulius Volz 	*idx += len;
226c842a3adSJulius Volz 	BUG_ON(*idx > buf_len + 1);
227c842a3adSJulius Volz 	return &buf[*idx - len];
228c842a3adSJulius Volz }
229c842a3adSJulius Volz 
/*
 * Printing helpers that provide the scratch buffer (ip_vs_dbg_buf) and
 * running index (ip_vs_dbg_idx) that IP_VS_DBG_ADDR() expects.
 * IP_VS_DBG_BUF prints at KERN_DEBUG when @level is at or below the
 * current debug level; IP_VS_ERR_BUF always prints through pr_err().
 */
#define IP_VS_DBG_BUF(level, msg, ...)					\
	do {								\
		char ip_vs_dbg_buf[160];				\
		int ip_vs_dbg_idx = 0;					\
		if ((level) <= ip_vs_get_debug_level())			\
			printk(KERN_DEBUG pr_fmt(msg), ##__VA_ARGS__);	\
	} while (0)
#define IP_VS_ERR_BUF(msg...)						\
	do {								\
		char ip_vs_dbg_buf[160];				\
		int ip_vs_dbg_idx = 0;					\
		pr_err(msg);						\
	} while (0)

/* Only use from within IP_VS_DBG_BUF() or IP_VS_ERR_BUF macros */
#define IP_VS_DBG_ADDR(af, addr)					\
	ip_vs_dbg_addr(af, ip_vs_dbg_buf,				\
		       sizeof(ip_vs_dbg_buf), addr,			\
		       &ip_vs_dbg_idx)
249c842a3adSJulius Volz 
/*
 * Debug printing without a scratch buffer.
 *   IP_VS_DBG        - print when @level is at or below the debug level
 *   IP_VS_DBG_RL     - print when net_ratelimit() allows it
 *   IP_VS_DBG_PKT    - call pp->debug_packet() under the level check
 *   IP_VS_DBG_RL_PKT - same, additionally gated by net_ratelimit()
 * @level and @pp are parenthesised so that expression arguments expand
 * with the intended precedence.
 */
#define IP_VS_DBG(level, msg, ...)					\
	do {								\
		if ((level) <= ip_vs_get_debug_level())			\
			printk(KERN_DEBUG pr_fmt(msg), ##__VA_ARGS__);	\
	} while (0)
#define IP_VS_DBG_RL(msg, ...)						\
	do {								\
		if (net_ratelimit())					\
			printk(KERN_DEBUG pr_fmt(msg), ##__VA_ARGS__);	\
	} while (0)
#define IP_VS_DBG_PKT(level, af, pp, skb, ofs, msg)			\
	do {								\
		if ((level) <= ip_vs_get_debug_level())			\
			(pp)->debug_packet(af, pp, skb, ofs, msg);	\
	} while (0)
#define IP_VS_DBG_RL_PKT(level, af, pp, skb, ofs, msg)			\
	do {								\
		if ((level) <= ip_vs_get_debug_level() &&		\
		    net_ratelimit())					\
			(pp)->debug_packet(af, pp, skb, ofs, msg);	\
	} while (0)
2711da177e4SLinus Torvalds #else	/* NO DEBUGGING at ALL */
/*
 * No-op variants used when CONFIG_IP_VS_DEBUG is off: the arguments are
 * discarded and never evaluated.  Note that IP_VS_ERR_BUF is also a
 * no-op in this configuration.
 */
#define IP_VS_DBG_BUF(level, msg...)  do {} while (0)
#define IP_VS_ERR_BUF(msg...)  do {} while (0)
#define IP_VS_DBG(level, msg...)  do {} while (0)
#define IP_VS_DBG_RL(msg...)  do {} while (0)
#define IP_VS_DBG_PKT(level, af, pp, skb, ofs, msg)	do {} while (0)
#define IP_VS_DBG_RL_PKT(level, af, pp, skb, ofs, msg)	do {} while (0)
2781da177e4SLinus Torvalds #endif
2791da177e4SLinus Torvalds 
/* IP_VS_BUG() is a plain alias for BUG(). */
#define IP_VS_BUG() BUG()
/* Rate-limited error message: pr_err() only when net_ratelimit() allows. */
#define IP_VS_ERR_RL(msg, ...)						\
	do {								\
		if (net_ratelimit())					\
			pr_err(msg, ##__VA_ARGS__);			\
	} while (0)
2861da177e4SLinus Torvalds 
/*
 * Function entry/exit tracing.  With CONFIG_IP_VS_DEBUG each macro prints
 * the function, file and line at KERN_DEBUG when @level is at or below
 * the current debug level; otherwise both expand to nothing.
 */
#ifdef CONFIG_IP_VS_DEBUG
#define EnterFunction(level)						\
	do {								\
		if ((level) <= ip_vs_get_debug_level())			\
			printk(KERN_DEBUG				\
			       pr_fmt("Enter: %s, %s line %i\n"),	\
			       __func__, __FILE__, __LINE__);		\
	} while (0)
#define LeaveFunction(level)						\
	do {								\
		if ((level) <= ip_vs_get_debug_level())			\
			printk(KERN_DEBUG				\
			       pr_fmt("Leave: %s, %s line %i\n"),	\
			       __func__, __FILE__, __LINE__);		\
	} while (0)
#else
#define EnterFunction(level)   do {} while (0)
#define LeaveFunction(level)   do {} while (0)
#endif
3061da177e4SLinus Torvalds 
3071da177e4SLinus Torvalds 
/*
 *      The port numbers of the FTP service (in network order):
 *      21 for FTPPORT and 20 for FTPDATA.
 */
#define FTPPORT  cpu_to_be16(21)
#define FTPDATA  cpu_to_be16(20)
3131da177e4SLinus Torvalds 
/*
 *      TCP State Values
 *      Numbered consecutively from 0; IP_VS_TCP_S_LAST is the number of
 *      states, not a state itself.
 */
enum {
	IP_VS_TCP_S_NONE = 0,
	IP_VS_TCP_S_ESTABLISHED,
	IP_VS_TCP_S_SYN_SENT,
	IP_VS_TCP_S_SYN_RECV,
	IP_VS_TCP_S_FIN_WAIT,
	IP_VS_TCP_S_TIME_WAIT,
	IP_VS_TCP_S_CLOSE,
	IP_VS_TCP_S_CLOSE_WAIT,
	IP_VS_TCP_S_LAST_ACK,
	IP_VS_TCP_S_LISTEN,
	IP_VS_TCP_S_SYNACK,
	IP_VS_TCP_S_LAST
};
3311da177e4SLinus Torvalds 
/*
 *	UDP State Values
 *	A single state; IP_VS_UDP_S_LAST is the number of states.
 */
enum {
	IP_VS_UDP_S_NORMAL,
	IP_VS_UDP_S_LAST,
};
3391da177e4SLinus Torvalds 
/*
 *	ICMP State Values
 *	A single state; IP_VS_ICMP_S_LAST is the number of states.
 */
enum {
	IP_VS_ICMP_S_NORMAL,
	IP_VS_ICMP_S_LAST,
};
3471da177e4SLinus Torvalds 
/*
 *	SCTP State Values
 *	Numbered consecutively from 0; IP_VS_SCTP_S_LAST is the number of
 *	states, not a state itself.
 */
enum ip_vs_sctp_states {
	IP_VS_SCTP_S_NONE,
	IP_VS_SCTP_S_INIT1,
	IP_VS_SCTP_S_INIT,
	IP_VS_SCTP_S_COOKIE_SENT,
	IP_VS_SCTP_S_COOKIE_REPLIED,
	IP_VS_SCTP_S_COOKIE_WAIT,
	IP_VS_SCTP_S_COOKIE,
	IP_VS_SCTP_S_COOKIE_ECHOED,
	IP_VS_SCTP_S_ESTABLISHED,
	IP_VS_SCTP_S_SHUTDOWN_SENT,
	IP_VS_SCTP_S_SHUTDOWN_RECEIVED,
	IP_VS_SCTP_S_SHUTDOWN_ACK_SENT,
	IP_VS_SCTP_S_REJECTED,
	IP_VS_SCTP_S_CLOSED,
	IP_VS_SCTP_S_LAST
};
3682906f66aSVenkata Mohan Reddy 
3692906f66aSVenkata Mohan Reddy /*
3701da177e4SLinus Torvalds  *	Delta sequence info structure
3711da177e4SLinus Torvalds  *	Each ip_vs_conn has 2 (output AND input seq. changes).
3721da177e4SLinus Torvalds  *      Only used in the VS/NAT.
3731da177e4SLinus Torvalds  */
3741da177e4SLinus Torvalds struct ip_vs_seq {
3751da177e4SLinus Torvalds 	__u32			init_seq;	/* Add delta from this seq */
3761da177e4SLinus Torvalds 	__u32			delta;		/* Delta in sequence numbers */
3771da177e4SLinus Torvalds 	__u32			previous_delta;	/* Delta in sequence numbers
3781da177e4SLinus Torvalds 						   before last resized pkt */
3791da177e4SLinus Torvalds };
3801da177e4SLinus Torvalds 
381b17fc996SHans Schillstrom /*
382b17fc996SHans Schillstrom  * counters per cpu
383b17fc996SHans Schillstrom  */
384b17fc996SHans Schillstrom struct ip_vs_counters {
385b17fc996SHans Schillstrom 	__u32		conns;		/* connections scheduled */
386b17fc996SHans Schillstrom 	__u32		inpkts;		/* incoming packets */
387b17fc996SHans Schillstrom 	__u32		outpkts;	/* outgoing packets */
388b17fc996SHans Schillstrom 	__u64		inbytes;	/* incoming bytes */
389b17fc996SHans Schillstrom 	__u64		outbytes;	/* outgoing bytes */
390b17fc996SHans Schillstrom };
391b17fc996SHans Schillstrom /*
392b17fc996SHans Schillstrom  * Stats per cpu
393b17fc996SHans Schillstrom  */
394b17fc996SHans Schillstrom struct ip_vs_cpu_stats {
395b17fc996SHans Schillstrom 	struct ip_vs_counters   ustats;
396b17fc996SHans Schillstrom 	struct u64_stats_sync   syncp;
397b17fc996SHans Schillstrom };
3981da177e4SLinus Torvalds 
3991da177e4SLinus Torvalds /*
4003a14a313SSven Wegener  *	IPVS statistics objects
4011da177e4SLinus Torvalds  */
4023a14a313SSven Wegener struct ip_vs_estimator {
4033a14a313SSven Wegener 	struct list_head	list;
4043a14a313SSven Wegener 
4053a14a313SSven Wegener 	u64			last_inbytes;
4063a14a313SSven Wegener 	u64			last_outbytes;
4073a14a313SSven Wegener 	u32			last_conns;
4083a14a313SSven Wegener 	u32			last_inpkts;
4093a14a313SSven Wegener 	u32			last_outpkts;
4103a14a313SSven Wegener 
4113a14a313SSven Wegener 	u32			cps;
4123a14a313SSven Wegener 	u32			inpps;
4133a14a313SSven Wegener 	u32			outpps;
4143a14a313SSven Wegener 	u32			inbps;
4153a14a313SSven Wegener 	u32			outbps;
4163a14a313SSven Wegener };
4173a14a313SSven Wegener 
418fd2c3ef7SEric Dumazet struct ip_vs_stats {
419e9c0ce23SSven Wegener 	struct ip_vs_stats_user	ustats;		/* statistics */
420e9c0ce23SSven Wegener 	struct ip_vs_estimator	est;		/* estimator */
421b962abdcSJulian Anastasov 	struct ip_vs_cpu_stats __percpu	*cpustats;	/* per cpu counters */
4221da177e4SLinus Torvalds 	spinlock_t		lock;		/* spin lock */
42355a3d4e1SJulian Anastasov 	struct ip_vs_stats_user	ustats0;	/* reset values */
4241da177e4SLinus Torvalds };
4251da177e4SLinus Torvalds 
42614c85021SArnaldo Carvalho de Melo struct dst_entry;
42714c85021SArnaldo Carvalho de Melo struct iphdr;
4281da177e4SLinus Torvalds struct ip_vs_conn;
4291da177e4SLinus Torvalds struct ip_vs_app;
43014c85021SArnaldo Carvalho de Melo struct sk_buff;
431252c6410SHans Schillstrom struct ip_vs_proto_data;
4321da177e4SLinus Torvalds 
4331da177e4SLinus Torvalds struct ip_vs_protocol {
4341da177e4SLinus Torvalds 	struct ip_vs_protocol	*next;
4351da177e4SLinus Torvalds 	char			*name;
4362ad17defSJulian Anastasov 	u16			protocol;
4372ad17defSJulian Anastasov 	u16			num_states;
4381da177e4SLinus Torvalds 	int			dont_defrag;
4391da177e4SLinus Torvalds 
4401da177e4SLinus Torvalds 	void (*init)(struct ip_vs_protocol *pp);
4411da177e4SLinus Torvalds 
4421da177e4SLinus Torvalds 	void (*exit)(struct ip_vs_protocol *pp);
4431da177e4SLinus Torvalds 
444582b8e3eSHans Schillstrom 	int (*init_netns)(struct net *net, struct ip_vs_proto_data *pd);
445252c6410SHans Schillstrom 
446252c6410SHans Schillstrom 	void (*exit_netns)(struct net *net, struct ip_vs_proto_data *pd);
447252c6410SHans Schillstrom 
44851ef348bSJulius Volz 	int (*conn_schedule)(int af, struct sk_buff *skb,
4499330419dSHans Schillstrom 			     struct ip_vs_proto_data *pd,
450d4383f04SJesper Dangaard Brouer 			     int *verdict, struct ip_vs_conn **cpp,
451d4383f04SJesper Dangaard Brouer 			     struct ip_vs_iphdr *iph);
4521da177e4SLinus Torvalds 
4531da177e4SLinus Torvalds 	struct ip_vs_conn *
45451ef348bSJulius Volz 	(*conn_in_get)(int af,
45551ef348bSJulius Volz 		       const struct sk_buff *skb,
45651ef348bSJulius Volz 		       const struct ip_vs_iphdr *iph,
4571da177e4SLinus Torvalds 		       int inverse);
4581da177e4SLinus Torvalds 
4591da177e4SLinus Torvalds 	struct ip_vs_conn *
46051ef348bSJulius Volz 	(*conn_out_get)(int af,
46151ef348bSJulius Volz 			const struct sk_buff *skb,
46251ef348bSJulius Volz 			const struct ip_vs_iphdr *iph,
4631da177e4SLinus Torvalds 			int inverse);
4641da177e4SLinus Torvalds 
465d4383f04SJesper Dangaard Brouer 	int (*snat_handler)(struct sk_buff *skb, struct ip_vs_protocol *pp,
466d4383f04SJesper Dangaard Brouer 			    struct ip_vs_conn *cp, struct ip_vs_iphdr *iph);
4671da177e4SLinus Torvalds 
468d4383f04SJesper Dangaard Brouer 	int (*dnat_handler)(struct sk_buff *skb, struct ip_vs_protocol *pp,
469d4383f04SJesper Dangaard Brouer 			    struct ip_vs_conn *cp, struct ip_vs_iphdr *iph);
4701da177e4SLinus Torvalds 
47151ef348bSJulius Volz 	int (*csum_check)(int af, struct sk_buff *skb,
47251ef348bSJulius Volz 			  struct ip_vs_protocol *pp);
4731da177e4SLinus Torvalds 
4741da177e4SLinus Torvalds 	const char *(*state_name)(int state);
4751da177e4SLinus Torvalds 
4764a516f11SSimon Horman 	void (*state_transition)(struct ip_vs_conn *cp, int direction,
4771da177e4SLinus Torvalds 				 const struct sk_buff *skb,
4789330419dSHans Schillstrom 				 struct ip_vs_proto_data *pd);
4791da177e4SLinus Torvalds 
480ab8a5e84SHans Schillstrom 	int (*register_app)(struct net *net, struct ip_vs_app *inc);
4811da177e4SLinus Torvalds 
482ab8a5e84SHans Schillstrom 	void (*unregister_app)(struct net *net, struct ip_vs_app *inc);
4831da177e4SLinus Torvalds 
4841da177e4SLinus Torvalds 	int (*app_conn_bind)(struct ip_vs_conn *cp);
4851da177e4SLinus Torvalds 
4860d79641aSJulian Anastasov 	void (*debug_packet)(int af, struct ip_vs_protocol *pp,
4871da177e4SLinus Torvalds 			     const struct sk_buff *skb,
4881da177e4SLinus Torvalds 			     int offset,
4891da177e4SLinus Torvalds 			     const char *msg);
4901da177e4SLinus Torvalds 
4919330419dSHans Schillstrom 	void (*timeout_change)(struct ip_vs_proto_data *pd, int flags);
4921da177e4SLinus Torvalds };
4931da177e4SLinus Torvalds 
494252c6410SHans Schillstrom /*
495252c6410SHans Schillstrom  * protocol data per netns
496252c6410SHans Schillstrom  */
497252c6410SHans Schillstrom struct ip_vs_proto_data {
498252c6410SHans Schillstrom 	struct ip_vs_proto_data	*next;
499252c6410SHans Schillstrom 	struct ip_vs_protocol	*pp;
500252c6410SHans Schillstrom 	int			*timeout_table;	/* protocol timeout table */
501252c6410SHans Schillstrom 	atomic_t		appcnt;		/* counter of proto app incs. */
502252c6410SHans Schillstrom 	struct tcp_states_t	*tcp_state_table;
503252c6410SHans Schillstrom };
504252c6410SHans Schillstrom 
5055c3a0fd7SJoe Perches struct ip_vs_protocol   *ip_vs_proto_get(unsigned short proto);
5065c3a0fd7SJoe Perches struct ip_vs_proto_data *ip_vs_proto_data_get(struct net *net,
507252c6410SHans Schillstrom 					      unsigned short proto);
5081da177e4SLinus Torvalds 
509f11017ecSSimon Horman struct ip_vs_conn_param {
5106e67e586SHans Schillstrom 	struct net			*net;
511f11017ecSSimon Horman 	const union nf_inet_addr	*caddr;
512f11017ecSSimon Horman 	const union nf_inet_addr	*vaddr;
513f11017ecSSimon Horman 	__be16				cport;
514f11017ecSSimon Horman 	__be16				vport;
515f11017ecSSimon Horman 	__u16				protocol;
516f11017ecSSimon Horman 	u16				af;
51785999283SSimon Horman 
51885999283SSimon Horman 	const struct ip_vs_pe		*pe;
51985999283SSimon Horman 	char				*pe_data;
52085999283SSimon Horman 	__u8				pe_data_len;
521f11017ecSSimon Horman };
522f11017ecSSimon Horman 
5231da177e4SLinus Torvalds /*
5241da177e4SLinus Torvalds  *	IP_VS structure allocated for each dynamically scheduled connection
5251da177e4SLinus Torvalds  */
5261da177e4SLinus Torvalds struct ip_vs_conn {
527731109e7SChangli Gao 	struct hlist_node	c_list;         /* hashed list heads */
5281da177e4SLinus Torvalds 	/* Protocol, addresses and port numbers */
5296e67e586SHans Schillstrom 	__be16                  cport;
5306e67e586SHans Schillstrom 	__be16                  dport;
5311845ed0bSJulian Anastasov 	__be16                  vport;
5321845ed0bSJulian Anastasov 	u16			af;		/* address family */
533e7ade46aSJulius Volz 	union nf_inet_addr      caddr;          /* client address */
534e7ade46aSJulius Volz 	union nf_inet_addr      vaddr;          /* virtual address */
535e7ade46aSJulius Volz 	union nf_inet_addr      daddr;          /* destination address */
5363575792eSJulian Anastasov 	volatile __u32          flags;          /* status flags */
5371da177e4SLinus Torvalds 	__u16                   protocol;       /* Which protocol (TCP/UDP) */
538*ba38528aSAlex Gartrell 	__u16			daf;		/* Address family of the dest */
5391845ed0bSJulian Anastasov #ifdef CONFIG_NET_NS
5401845ed0bSJulian Anastasov 	struct net              *net;           /* Name space */
5411845ed0bSJulian Anastasov #endif
5421da177e4SLinus Torvalds 
5431da177e4SLinus Torvalds 	/* counter and timer */
5441da177e4SLinus Torvalds 	atomic_t		refcnt;		/* reference count */
5451da177e4SLinus Torvalds 	struct timer_list	timer;		/* Expiration timer */
5461da177e4SLinus Torvalds 	volatile unsigned long	timeout;	/* timeout */
5471da177e4SLinus Torvalds 
5481da177e4SLinus Torvalds 	/* Flags and state transition */
5491da177e4SLinus Torvalds 	spinlock_t              lock;           /* lock for state transition */
5501da177e4SLinus Torvalds 	volatile __u16          state;          /* state info */
551efac5276SRumen G. Bogdanovski 	volatile __u16          old_state;      /* old state, to be used for
552efac5276SRumen G. Bogdanovski 						 * state transition triggerd
553efac5276SRumen G. Bogdanovski 						 * synchronization
554efac5276SRumen G. Bogdanovski 						 */
5551845ed0bSJulian Anastasov 	__u32			fwmark;		/* Fire wall mark from skb */
556749c42b6SJulian Anastasov 	unsigned long		sync_endtime;	/* jiffies + sent_retries */
5571da177e4SLinus Torvalds 
5581da177e4SLinus Torvalds 	/* Control members */
5591da177e4SLinus Torvalds 	struct ip_vs_conn       *control;       /* Master control connection */
5601da177e4SLinus Torvalds 	atomic_t                n_control;      /* Number of controlled ones */
5611da177e4SLinus Torvalds 	struct ip_vs_dest       *dest;          /* real server */
5621da177e4SLinus Torvalds 	atomic_t                in_pkts;        /* incoming packet counter */
5631da177e4SLinus Torvalds 
5641da177e4SLinus Torvalds 	/* packet transmitter for different forwarding methods.  If it
5651da177e4SLinus Torvalds 	   mangles the packet, it must return NF_DROP or better NF_STOLEN,
5661da177e4SLinus Torvalds 	   otherwise this must be changed to a sk_buff **.
567fc604767SJulian Anastasov 	   NF_ACCEPT can be returned when destination is local.
5681da177e4SLinus Torvalds 	 */
5691da177e4SLinus Torvalds 	int (*packet_xmit)(struct sk_buff *skb, struct ip_vs_conn *cp,
570d4383f04SJesper Dangaard Brouer 			   struct ip_vs_protocol *pp, struct ip_vs_iphdr *iph);
5711da177e4SLinus Torvalds 
5721da177e4SLinus Torvalds 	/* Note: we can group the following members into a structure,
5731da177e4SLinus Torvalds 	   in order to save more space, and the following members are
5741da177e4SLinus Torvalds 	   only used in VS/NAT anyway */
5751da177e4SLinus Torvalds 	struct ip_vs_app        *app;           /* bound ip_vs_app object */
5761da177e4SLinus Torvalds 	void                    *app_data;      /* Application private data */
5771da177e4SLinus Torvalds 	struct ip_vs_seq        in_seq;         /* incoming seq. struct */
5781da177e4SLinus Torvalds 	struct ip_vs_seq        out_seq;        /* outgoing seq. struct */
57985999283SSimon Horman 
580e9e5eee8SSimon Horman 	const struct ip_vs_pe	*pe;
58185999283SSimon Horman 	char			*pe_data;
58285999283SSimon Horman 	__u8			pe_data_len;
583088339a5SJulian Anastasov 
584088339a5SJulian Anastasov 	struct rcu_head		rcu_head;
5851da177e4SLinus Torvalds };
5861da177e4SLinus Torvalds 
5876e67e586SHans Schillstrom /*
5886e67e586SHans Schillstrom  *  To save some memory in conn table when name space is disabled.
5896e67e586SHans Schillstrom  */
5906e67e586SHans Schillstrom static inline struct net *ip_vs_conn_net(const struct ip_vs_conn *cp)
5916e67e586SHans Schillstrom {
5926e67e586SHans Schillstrom #ifdef CONFIG_NET_NS
5936e67e586SHans Schillstrom 	return cp->net;
5946e67e586SHans Schillstrom #else
5956e67e586SHans Schillstrom 	return &init_net;
5966e67e586SHans Schillstrom #endif
5976e67e586SHans Schillstrom }
/*
 * Store @net in @cp.  Without CONFIG_NET_NS the body is empty and both
 * arguments are ignored.
 */
static inline void ip_vs_conn_net_set(struct ip_vs_conn *cp, struct net *net)
{
#ifdef CONFIG_NET_NS
	cp->net = net;
#endif
}
6046e67e586SHans Schillstrom 
/*
 * Test whether connection @cp belongs to namespace @net.
 *
 * Returns non-zero when cp->net equals @net.  Without CONFIG_NET_NS the
 * answer is always 1 and neither argument is looked at.
 */
static inline int ip_vs_conn_net_eq(const struct ip_vs_conn *cp,
				    struct net *net)
{
#ifdef CONFIG_NET_NS
	return cp->net == net;
#else
	return 1;
#endif
}
6141da177e4SLinus Torvalds 
6151da177e4SLinus Torvalds /*
616c860c6b1SJulius Volz  *	Extended internal versions of struct ip_vs_service_user and
617c860c6b1SJulius Volz  *	ip_vs_dest_user for IPv6 support.
618c860c6b1SJulius Volz  *
619c860c6b1SJulius Volz  *	We need these to conveniently pass around service and destination
620c860c6b1SJulius Volz  *	options, but unfortunately, we also need to keep the old definitions to
621c860c6b1SJulius Volz  *	maintain userspace backwards compatibility for the setsockopt interface.
622c860c6b1SJulius Volz  */
623c860c6b1SJulius Volz struct ip_vs_service_user_kern {
624c860c6b1SJulius Volz 	/* virtual service addresses */
625c860c6b1SJulius Volz 	u16			af;
626c860c6b1SJulius Volz 	u16			protocol;
627c860c6b1SJulius Volz 	union nf_inet_addr	addr;		/* virtual ip address */
6280a925864SJulian Anastasov 	__be16			port;
629c860c6b1SJulius Volz 	u32			fwmark;		/* firwall mark of service */
630c860c6b1SJulius Volz 
631c860c6b1SJulius Volz 	/* virtual service options */
632c860c6b1SJulius Volz 	char			*sched_name;
6330d1e71b0SSimon Horman 	char			*pe_name;
63495c96174SEric Dumazet 	unsigned int		flags;		/* virtual service flags */
63595c96174SEric Dumazet 	unsigned int		timeout;	/* persistent timeout in sec */
6360a925864SJulian Anastasov 	__be32			netmask;	/* persistent netmask or plen */
637c860c6b1SJulius Volz };
638c860c6b1SJulius Volz 
639c860c6b1SJulius Volz 
640c860c6b1SJulius Volz struct ip_vs_dest_user_kern {
641c860c6b1SJulius Volz 	/* destination server address */
642c860c6b1SJulius Volz 	union nf_inet_addr	addr;
6430a925864SJulian Anastasov 	__be16			port;
644c860c6b1SJulius Volz 
645c860c6b1SJulius Volz 	/* real server options */
64695c96174SEric Dumazet 	unsigned int		conn_flags;	/* connection flags */
647c860c6b1SJulius Volz 	int			weight;		/* destination weight */
648c860c6b1SJulius Volz 
649c860c6b1SJulius Volz 	/* thresholds for active connections */
650c860c6b1SJulius Volz 	u32			u_threshold;	/* upper threshold */
651c860c6b1SJulius Volz 	u32			l_threshold;	/* lower threshold */
6526cff339bSAlex Gartrell 
6536cff339bSAlex Gartrell 	/* Address family of addr */
6546cff339bSAlex Gartrell 	u16			af;
655c860c6b1SJulius Volz };
656c860c6b1SJulius Volz 
657c860c6b1SJulius Volz 
658c860c6b1SJulius Volz /*
6591da177e4SLinus Torvalds  *	The information about the virtual service offered to the net
6601da177e4SLinus Torvalds  *	and the forwarding entries
6611da177e4SLinus Torvalds  */
6621da177e4SLinus Torvalds struct ip_vs_service {
663ceec4c38SJulian Anastasov 	struct hlist_node	s_list;   /* for normal service table */
664ceec4c38SJulian Anastasov 	struct hlist_node	f_list;   /* for fwmark-based service table */
6651da177e4SLinus Torvalds 	atomic_t		refcnt;   /* reference counter */
6661da177e4SLinus Torvalds 
667e7ade46aSJulius Volz 	u16			af;       /* address family */
6681da177e4SLinus Torvalds 	__u16			protocol; /* which protocol (TCP/UDP) */
669e7ade46aSJulius Volz 	union nf_inet_addr	addr;	  /* IP address for virtual service */
670014d730dSAl Viro 	__be16			port;	  /* port number for the service */
6711da177e4SLinus Torvalds 	__u32                   fwmark;   /* firewall mark of the service */
67295c96174SEric Dumazet 	unsigned int		flags;	  /* service status flags */
67395c96174SEric Dumazet 	unsigned int		timeout;  /* persistent timeout in ticks */
6740a925864SJulian Anastasov 	__be32			netmask;  /* grouping granularity, mask/plen */
675fc723250SHans Schillstrom 	struct net		*net;
6761da177e4SLinus Torvalds 
6771da177e4SLinus Torvalds 	struct list_head	destinations;  /* real server d-linked list */
6781da177e4SLinus Torvalds 	__u32			num_dests;     /* number of servers */
6791da177e4SLinus Torvalds 	struct ip_vs_stats      stats;         /* statistics for the service */
6801da177e4SLinus Torvalds 
6811da177e4SLinus Torvalds 	/* for scheduling */
682ceec4c38SJulian Anastasov 	struct ip_vs_scheduler __rcu *scheduler; /* bound scheduler object */
683ba3a3ce1SJulian Anastasov 	spinlock_t		sched_lock;    /* lock sched_data */
6841da177e4SLinus Torvalds 	void			*sched_data;   /* scheduler application data */
68585999283SSimon Horman 
68685999283SSimon Horman 	/* alternate persistence engine */
687ceec4c38SJulian Anastasov 	struct ip_vs_pe __rcu	*pe;
688ceec4c38SJulian Anastasov 
689ceec4c38SJulian Anastasov 	struct rcu_head		rcu_head;
6901da177e4SLinus Torvalds };
6911da177e4SLinus Torvalds 
692026ace06SJulian Anastasov /* Information for cached dst */
693026ace06SJulian Anastasov struct ip_vs_dest_dst {
694026ace06SJulian Anastasov 	struct dst_entry	*dst_cache;	/* destination cache entry */
695026ace06SJulian Anastasov 	u32			dst_cookie;
696026ace06SJulian Anastasov 	union nf_inet_addr	dst_saddr;
697026ace06SJulian Anastasov 	struct rcu_head		rcu_head;
698026ace06SJulian Anastasov };
6991da177e4SLinus Torvalds 
7001da177e4SLinus Torvalds /*
7011da177e4SLinus Torvalds  *	The real server destination forwarding entry
7021da177e4SLinus Torvalds  *	with ip address, port number, and so on.
7031da177e4SLinus Torvalds  */
7041da177e4SLinus Torvalds struct ip_vs_dest {
7051da177e4SLinus Torvalds 	struct list_head	n_list;   /* for the dests in the service */
706276472eaSJulian Anastasov 	struct hlist_node	d_list;   /* for table with all the dests */
7071da177e4SLinus Torvalds 
708e7ade46aSJulius Volz 	u16			af;		/* address family */
709014d730dSAl Viro 	__be16			port;		/* port number of the server */
710f2431e6eSHans Schillstrom 	union nf_inet_addr	addr;		/* IP address of the server */
71195c96174SEric Dumazet 	volatile unsigned int	flags;		/* dest status flags */
7121da177e4SLinus Torvalds 	atomic_t		conn_flags;	/* flags to copy to conn */
7131da177e4SLinus Torvalds 	atomic_t		weight;		/* server weight */
7141da177e4SLinus Torvalds 
7151da177e4SLinus Torvalds 	atomic_t		refcnt;		/* reference counter */
7161da177e4SLinus Torvalds 	struct ip_vs_stats      stats;          /* statistics */
717bcbde4c0SJulian Anastasov 	unsigned long		idle_start;	/* start time, jiffies */
7181da177e4SLinus Torvalds 
7191da177e4SLinus Torvalds 	/* connection counters and thresholds */
7201da177e4SLinus Torvalds 	atomic_t		activeconns;	/* active connections */
7211da177e4SLinus Torvalds 	atomic_t		inactconns;	/* inactive connections */
7221da177e4SLinus Torvalds 	atomic_t		persistconns;	/* persistent connections */
7231da177e4SLinus Torvalds 	__u32			u_threshold;	/* upper threshold */
7241da177e4SLinus Torvalds 	__u32			l_threshold;	/* lower threshold */
7251da177e4SLinus Torvalds 
7261da177e4SLinus Torvalds 	/* for destination cache */
7271da177e4SLinus Torvalds 	spinlock_t		dst_lock;	/* lock of dst_cache */
728026ace06SJulian Anastasov 	struct ip_vs_dest_dst __rcu *dest_dst;	/* cached dst info */
7291da177e4SLinus Torvalds 
7301da177e4SLinus Torvalds 	/* for virtual service */
731bcbde4c0SJulian Anastasov 	struct ip_vs_service __rcu *svc;	/* service it belongs to */
7321da177e4SLinus Torvalds 	__u16			protocol;	/* which protocol (TCP/UDP) */
733014d730dSAl Viro 	__be16			vport;		/* virtual port number */
734f2431e6eSHans Schillstrom 	union nf_inet_addr	vaddr;		/* virtual IP address */
7351da177e4SLinus Torvalds 	__u32			vfwmark;	/* firewall mark of service */
736276472eaSJulian Anastasov 
737578bc3efSJulian Anastasov 	struct list_head	t_list;		/* in dest_trash */
738276472eaSJulian Anastasov 	unsigned int		in_rs_table:1;	/* we are in rs_table */
7391da177e4SLinus Torvalds };
7401da177e4SLinus Torvalds 
7411da177e4SLinus Torvalds 
7421da177e4SLinus Torvalds /*
7431da177e4SLinus Torvalds  *	The scheduler object
7441da177e4SLinus Torvalds  */
7451da177e4SLinus Torvalds struct ip_vs_scheduler {
7461da177e4SLinus Torvalds 	struct list_head	n_list;		/* d-linked list head */
7471da177e4SLinus Torvalds 	char			*name;		/* scheduler name */
7481da177e4SLinus Torvalds 	atomic_t		refcnt;		/* reference counter */
7491da177e4SLinus Torvalds 	struct module		*module;	/* THIS_MODULE/NULL */
7501da177e4SLinus Torvalds 
7511da177e4SLinus Torvalds 	/* scheduler initializing service */
7521da177e4SLinus Torvalds 	int (*init_service)(struct ip_vs_service *svc);
7531da177e4SLinus Torvalds 	/* scheduling service finish */
754ed3ffc4eSJulian Anastasov 	void (*done_service)(struct ip_vs_service *svc);
7556b6df466SJulian Anastasov 	/* dest is linked */
7566b6df466SJulian Anastasov 	int (*add_dest)(struct ip_vs_service *svc, struct ip_vs_dest *dest);
7576b6df466SJulian Anastasov 	/* dest is unlinked */
7586b6df466SJulian Anastasov 	int (*del_dest)(struct ip_vs_service *svc, struct ip_vs_dest *dest);
7596b6df466SJulian Anastasov 	/* dest is updated */
7606b6df466SJulian Anastasov 	int (*upd_dest)(struct ip_vs_service *svc, struct ip_vs_dest *dest);
7611da177e4SLinus Torvalds 
7621da177e4SLinus Torvalds 	/* selecting a server from the given service */
7631da177e4SLinus Torvalds 	struct ip_vs_dest* (*schedule)(struct ip_vs_service *svc,
764bba54de5SJulian Anastasov 				       const struct sk_buff *skb,
765bba54de5SJulian Anastasov 				       struct ip_vs_iphdr *iph);
7661da177e4SLinus Torvalds };
7671da177e4SLinus Torvalds 
76885999283SSimon Horman /* The persistence engine object */
76985999283SSimon Horman struct ip_vs_pe {
77085999283SSimon Horman 	struct list_head	n_list;		/* d-linked list head */
77185999283SSimon Horman 	char			*name;		/* scheduler name */
77285999283SSimon Horman 	atomic_t		refcnt;		/* reference counter */
77385999283SSimon Horman 	struct module		*module;	/* THIS_MODULE/NULL */
77485999283SSimon Horman 
77585999283SSimon Horman 	/* get the connection template, if any */
77685999283SSimon Horman 	int (*fill_param)(struct ip_vs_conn_param *p, struct sk_buff *skb);
77785999283SSimon Horman 	bool (*ct_match)(const struct ip_vs_conn_param *p,
77885999283SSimon Horman 			 struct ip_vs_conn *ct);
77985999283SSimon Horman 	u32 (*hashkey_raw)(const struct ip_vs_conn_param *p, u32 initval,
78085999283SSimon Horman 			   bool inverse);
781a3c918acSSimon Horman 	int (*show_pe_data)(const struct ip_vs_conn *cp, char *buf);
78285999283SSimon Horman };
7831da177e4SLinus Torvalds 
7841da177e4SLinus Torvalds /*
7851da177e4SLinus Torvalds  *	The application module object (a.k.a. app incarnation)
7861da177e4SLinus Torvalds  */
787fd2c3ef7SEric Dumazet struct ip_vs_app {
7881da177e4SLinus Torvalds 	struct list_head	a_list;		/* member in app list */
7891da177e4SLinus Torvalds 	int			type;		/* IP_VS_APP_TYPE_xxx */
7901da177e4SLinus Torvalds 	char			*name;		/* application module name */
7911da177e4SLinus Torvalds 	__u16			protocol;
7921da177e4SLinus Torvalds 	struct module		*module;	/* THIS_MODULE/NULL */
7931da177e4SLinus Torvalds 	struct list_head	incs_list;	/* list of incarnations */
7941da177e4SLinus Torvalds 
7951da177e4SLinus Torvalds 	/* members for application incarnations */
7961da177e4SLinus Torvalds 	struct list_head	p_list;		/* member in proto app list */
7971da177e4SLinus Torvalds 	struct ip_vs_app	*app;		/* its real application */
798014d730dSAl Viro 	__be16			port;		/* port number in net order */
7991da177e4SLinus Torvalds 	atomic_t		usecnt;		/* usage counter */
800363c97d7SJulian Anastasov 	struct rcu_head		rcu_head;
8011da177e4SLinus Torvalds 
8028b27b10fSJulian Anastasov 	/*
8038b27b10fSJulian Anastasov 	 * output hook: Process packet in inout direction, diff set for TCP.
8048b27b10fSJulian Anastasov 	 * Return: 0=Error, 1=Payload Not Mangled/Mangled but checksum is ok,
8058b27b10fSJulian Anastasov 	 *	   2=Mangled but checksum was not updated
8068b27b10fSJulian Anastasov 	 */
8071da177e4SLinus Torvalds 	int (*pkt_out)(struct ip_vs_app *, struct ip_vs_conn *,
8083db05feaSHerbert Xu 		       struct sk_buff *, int *diff);
8091da177e4SLinus Torvalds 
8108b27b10fSJulian Anastasov 	/*
8118b27b10fSJulian Anastasov 	 * input hook: Process packet in outin direction, diff set for TCP.
8128b27b10fSJulian Anastasov 	 * Return: 0=Error, 1=Payload Not Mangled/Mangled but checksum is ok,
8138b27b10fSJulian Anastasov 	 *	   2=Mangled but checksum was not updated
8148b27b10fSJulian Anastasov 	 */
8151da177e4SLinus Torvalds 	int (*pkt_in)(struct ip_vs_app *, struct ip_vs_conn *,
8163db05feaSHerbert Xu 		      struct sk_buff *, int *diff);
8171da177e4SLinus Torvalds 
8181da177e4SLinus Torvalds 	/* ip_vs_app initializer */
8191da177e4SLinus Torvalds 	int (*init_conn)(struct ip_vs_app *, struct ip_vs_conn *);
8201da177e4SLinus Torvalds 
8211da177e4SLinus Torvalds 	/* ip_vs_app finish */
8221da177e4SLinus Torvalds 	int (*done_conn)(struct ip_vs_app *, struct ip_vs_conn *);
8231da177e4SLinus Torvalds 
8241da177e4SLinus Torvalds 
8251da177e4SLinus Torvalds 	/* not used now */
8261da177e4SLinus Torvalds 	int (*bind_conn)(struct ip_vs_app *, struct ip_vs_conn *,
8271da177e4SLinus Torvalds 			 struct ip_vs_protocol *);
8281da177e4SLinus Torvalds 
8291da177e4SLinus Torvalds 	void (*unbind_conn)(struct ip_vs_app *, struct ip_vs_conn *);
8301da177e4SLinus Torvalds 
8311da177e4SLinus Torvalds 	int *			timeout_table;
8321da177e4SLinus Torvalds 	int *			timeouts;
8331da177e4SLinus Torvalds 	int			timeouts_size;
8341da177e4SLinus Torvalds 
8351da177e4SLinus Torvalds 	int (*conn_schedule)(struct sk_buff *skb, struct ip_vs_app *app,
8361da177e4SLinus Torvalds 			     int *verdict, struct ip_vs_conn **cpp);
8371da177e4SLinus Torvalds 
8381da177e4SLinus Torvalds 	struct ip_vs_conn *
8391da177e4SLinus Torvalds 	(*conn_in_get)(const struct sk_buff *skb, struct ip_vs_app *app,
840d4383f04SJesper Dangaard Brouer 		       const struct iphdr *iph, int inverse);
8411da177e4SLinus Torvalds 
8421da177e4SLinus Torvalds 	struct ip_vs_conn *
8431da177e4SLinus Torvalds 	(*conn_out_get)(const struct sk_buff *skb, struct ip_vs_app *app,
844d4383f04SJesper Dangaard Brouer 			const struct iphdr *iph, int inverse);
8451da177e4SLinus Torvalds 
8461da177e4SLinus Torvalds 	int (*state_transition)(struct ip_vs_conn *cp, int direction,
8471da177e4SLinus Torvalds 				const struct sk_buff *skb,
8481da177e4SLinus Torvalds 				struct ip_vs_app *app);
8491da177e4SLinus Torvalds 
8501da177e4SLinus Torvalds 	void (*timeout_change)(struct ip_vs_app *app, int flags);
8511da177e4SLinus Torvalds };
8521da177e4SLinus Torvalds 
853f73181c8SPablo Neira Ayuso struct ipvs_master_sync_state {
854f73181c8SPablo Neira Ayuso 	struct list_head	sync_queue;
855f73181c8SPablo Neira Ayuso 	struct ip_vs_sync_buff	*sync_buff;
85607995674SZhang Yanfei 	unsigned long		sync_queue_len;
857f73181c8SPablo Neira Ayuso 	unsigned int		sync_queue_delay;
858f73181c8SPablo Neira Ayuso 	struct task_struct	*master_thread;
859f73181c8SPablo Neira Ayuso 	struct delayed_work	master_wakeup_work;
860f73181c8SPablo Neira Ayuso 	struct netns_ipvs	*ipvs;
861f73181c8SPablo Neira Ayuso };
862f73181c8SPablo Neira Ayuso 
/* How much time to keep dests in trash (expressed in HZ units) */
#define IP_VS_DEST_TRASH_PERIOD		(120 * HZ)
865578bc3efSJulian Anastasov 
8662553d064SJulian Anastasov /* IPVS in network namespace */
8672553d064SJulian Anastasov struct netns_ipvs {
8682553d064SJulian Anastasov 	int			gen;		/* Generation */
8697a4f0761SHans Schillstrom 	int			enable;		/* enable like nf_hooks do */
8702553d064SJulian Anastasov 	/*
8712553d064SJulian Anastasov 	 *	Hash table: for real service lookups
8722553d064SJulian Anastasov 	 */
8732553d064SJulian Anastasov 	#define IP_VS_RTAB_BITS 4
8742553d064SJulian Anastasov 	#define IP_VS_RTAB_SIZE (1 << IP_VS_RTAB_BITS)
8752553d064SJulian Anastasov 	#define IP_VS_RTAB_MASK (IP_VS_RTAB_SIZE - 1)
8762553d064SJulian Anastasov 
877276472eaSJulian Anastasov 	struct hlist_head	rs_table[IP_VS_RTAB_SIZE];
8782553d064SJulian Anastasov 	/* ip_vs_app */
8792553d064SJulian Anastasov 	struct list_head	app_list;
8802553d064SJulian Anastasov 	/* ip_vs_proto */
8812553d064SJulian Anastasov 	#define IP_VS_PROTO_TAB_SIZE	32	/* must be power of 2 */
8822553d064SJulian Anastasov 	struct ip_vs_proto_data *proto_data_table[IP_VS_PROTO_TAB_SIZE];
8832553d064SJulian Anastasov 	/* ip_vs_proto_tcp */
8842553d064SJulian Anastasov #ifdef CONFIG_IP_VS_PROTO_TCP
8852553d064SJulian Anastasov 	#define	TCP_APP_TAB_BITS	4
8862553d064SJulian Anastasov 	#define	TCP_APP_TAB_SIZE	(1 << TCP_APP_TAB_BITS)
8872553d064SJulian Anastasov 	#define	TCP_APP_TAB_MASK	(TCP_APP_TAB_SIZE - 1)
8882553d064SJulian Anastasov 	struct list_head	tcp_apps[TCP_APP_TAB_SIZE];
8892553d064SJulian Anastasov #endif
8902553d064SJulian Anastasov 	/* ip_vs_proto_udp */
8912553d064SJulian Anastasov #ifdef CONFIG_IP_VS_PROTO_UDP
8922553d064SJulian Anastasov 	#define	UDP_APP_TAB_BITS	4
8932553d064SJulian Anastasov 	#define	UDP_APP_TAB_SIZE	(1 << UDP_APP_TAB_BITS)
8942553d064SJulian Anastasov 	#define	UDP_APP_TAB_MASK	(UDP_APP_TAB_SIZE - 1)
8952553d064SJulian Anastasov 	struct list_head	udp_apps[UDP_APP_TAB_SIZE];
8962553d064SJulian Anastasov #endif
8972553d064SJulian Anastasov 	/* ip_vs_proto_sctp */
8982553d064SJulian Anastasov #ifdef CONFIG_IP_VS_PROTO_SCTP
8992553d064SJulian Anastasov 	#define SCTP_APP_TAB_BITS	4
9002553d064SJulian Anastasov 	#define SCTP_APP_TAB_SIZE	(1 << SCTP_APP_TAB_BITS)
9012553d064SJulian Anastasov 	#define SCTP_APP_TAB_MASK	(SCTP_APP_TAB_SIZE - 1)
9022553d064SJulian Anastasov 	/* Hash table for SCTP application incarnations	 */
9032553d064SJulian Anastasov 	struct list_head	sctp_apps[SCTP_APP_TAB_SIZE];
9042553d064SJulian Anastasov #endif
9052553d064SJulian Anastasov 	/* ip_vs_conn */
9062553d064SJulian Anastasov 	atomic_t		conn_count;      /*  connection counter */
9072553d064SJulian Anastasov 
9082553d064SJulian Anastasov 	/* ip_vs_ctl */
9092a0751afSJulian Anastasov 	struct ip_vs_stats		tot_stats;  /* Statistics & est. */
9102553d064SJulian Anastasov 
9112553d064SJulian Anastasov 	int			num_services;    /* no of virtual services */
912f2247fbdSSimon Horman 
9132553d064SJulian Anastasov 	/* Trash for destinations */
9142553d064SJulian Anastasov 	struct list_head	dest_trash;
915578bc3efSJulian Anastasov 	spinlock_t		dest_trash_lock;
916578bc3efSJulian Anastasov 	struct timer_list	dest_trash_timer; /* expiration timer */
9172553d064SJulian Anastasov 	/* Service counters */
9182553d064SJulian Anastasov 	atomic_t		ftpsvc_counter;
9192553d064SJulian Anastasov 	atomic_t		nullsvc_counter;
9202553d064SJulian Anastasov 
921f2247fbdSSimon Horman #ifdef CONFIG_SYSCTL
922f2247fbdSSimon Horman 	/* 1/rate drop and drop-entry variables */
923f2247fbdSSimon Horman 	struct delayed_work	defense_work;   /* Work handler */
924f2247fbdSSimon Horman 	int			drop_rate;
925f2247fbdSSimon Horman 	int			drop_counter;
926f2247fbdSSimon Horman 	atomic_t		dropentry;
927f2247fbdSSimon Horman 	/* locks in ctl.c */
928f2247fbdSSimon Horman 	spinlock_t		dropentry_lock;  /* drop entry handling */
929f2247fbdSSimon Horman 	spinlock_t		droppacket_lock; /* drop packet handling */
930f2247fbdSSimon Horman 	spinlock_t		securetcp_lock;  /* state and timeout tables */
931f2247fbdSSimon Horman 
9322553d064SJulian Anastasov 	/* sys-ctl struct */
9332553d064SJulian Anastasov 	struct ctl_table_header	*sysctl_hdr;
9342553d064SJulian Anastasov 	struct ctl_table	*sysctl_tbl;
935f2247fbdSSimon Horman #endif
936f2247fbdSSimon Horman 
9372553d064SJulian Anastasov 	/* sysctl variables */
9382553d064SJulian Anastasov 	int			sysctl_amemthresh;
9392553d064SJulian Anastasov 	int			sysctl_am_droprate;
9402553d064SJulian Anastasov 	int			sysctl_drop_entry;
9412553d064SJulian Anastasov 	int			sysctl_drop_packet;
9422553d064SJulian Anastasov 	int			sysctl_secure_tcp;
9432553d064SJulian Anastasov #ifdef CONFIG_IP_VS_NFCT
9442553d064SJulian Anastasov 	int			sysctl_conntrack;
9452553d064SJulian Anastasov #endif
9462553d064SJulian Anastasov 	int			sysctl_snat_reroute;
9472553d064SJulian Anastasov 	int			sysctl_sync_ver;
948f73181c8SPablo Neira Ayuso 	int			sysctl_sync_ports;
9494d0c875dSJulian Anastasov 	int			sysctl_sync_persist_mode;
95007995674SZhang Yanfei 	unsigned long		sysctl_sync_qlen_max;
9511c003b15SPablo Neira Ayuso 	int			sysctl_sync_sock_size;
9522553d064SJulian Anastasov 	int			sysctl_cache_bypass;
9532553d064SJulian Anastasov 	int			sysctl_expire_nodest_conn;
954c6c96c18SAlexander Frolkin 	int			sysctl_sloppy_tcp;
955c6c96c18SAlexander Frolkin 	int			sysctl_sloppy_sctp;
9562553d064SJulian Anastasov 	int			sysctl_expire_quiescent_template;
9572553d064SJulian Anastasov 	int			sysctl_sync_threshold[2];
958749c42b6SJulian Anastasov 	unsigned int		sysctl_sync_refresh_period;
959749c42b6SJulian Anastasov 	int			sysctl_sync_retries;
9602553d064SJulian Anastasov 	int			sysctl_nat_icmp_send;
9613654e611SJulian Anastasov 	int			sysctl_pmtu_disc;
9620c12582fSJulian Anastasov 	int			sysctl_backup_only;
9632553d064SJulian Anastasov 
9642553d064SJulian Anastasov 	/* ip_vs_lblc */
9652553d064SJulian Anastasov 	int			sysctl_lblc_expiration;
9662553d064SJulian Anastasov 	struct ctl_table_header	*lblc_ctl_header;
9672553d064SJulian Anastasov 	struct ctl_table	*lblc_ctl_table;
9682553d064SJulian Anastasov 	/* ip_vs_lblcr */
9692553d064SJulian Anastasov 	int			sysctl_lblcr_expiration;
9702553d064SJulian Anastasov 	struct ctl_table_header	*lblcr_ctl_header;
9712553d064SJulian Anastasov 	struct ctl_table	*lblcr_ctl_table;
9722553d064SJulian Anastasov 	/* ip_vs_est */
9732553d064SJulian Anastasov 	struct list_head	est_list;	/* estimator list */
9742553d064SJulian Anastasov 	spinlock_t		est_lock;
9752553d064SJulian Anastasov 	struct timer_list	est_timer;	/* Estimation timer */
9762553d064SJulian Anastasov 	/* ip_vs_sync */
9772553d064SJulian Anastasov 	spinlock_t		sync_lock;
978f73181c8SPablo Neira Ayuso 	struct ipvs_master_sync_state *ms;
9792553d064SJulian Anastasov 	spinlock_t		sync_buff_lock;
980f73181c8SPablo Neira Ayuso 	struct task_struct	**backup_threads;
981f73181c8SPablo Neira Ayuso 	int			threads_mask;
9822553d064SJulian Anastasov 	int			send_mesg_maxlen;
9832553d064SJulian Anastasov 	int			recv_mesg_maxlen;
9842553d064SJulian Anastasov 	volatile int		sync_state;
9852553d064SJulian Anastasov 	volatile int		master_syncid;
9862553d064SJulian Anastasov 	volatile int		backup_syncid;
987ae1d48b2SHans Schillstrom 	struct mutex		sync_mutex;
9882553d064SJulian Anastasov 	/* multicast interface name */
9892553d064SJulian Anastasov 	char			master_mcast_ifn[IP_VS_IFNAME_MAXLEN];
9902553d064SJulian Anastasov 	char			backup_mcast_ifn[IP_VS_IFNAME_MAXLEN];
9912553d064SJulian Anastasov 	/* net name space ptr */
9922553d064SJulian Anastasov 	struct net		*net;            /* Needed by timer routines */
9932553d064SJulian Anastasov };
9941da177e4SLinus Torvalds 
/*
 * Defaults and tuning constants for connection synchronization.
 * The DEFAULT_* values are what the sysctl_*() accessors return when
 * CONFIG_SYSCTL is disabled.
 */
#define DEFAULT_SYNC_THRESHOLD	3
#define DEFAULT_SYNC_PERIOD	50
#define DEFAULT_SYNC_VER	1
#define DEFAULT_SLOPPY_TCP	0
#define DEFAULT_SLOPPY_SCTP	0
#define DEFAULT_SYNC_REFRESH_PERIOD	(0U * HZ)
#define DEFAULT_SYNC_RETRIES		0
#define IPVS_SYNC_WAKEUP_RATE	8
#define IPVS_SYNC_QLEN_MAX	(IPVS_SYNC_WAKEUP_RATE * 4)
#define IPVS_SYNC_SEND_DELAY	(HZ / 50)
#define IPVS_SYNC_CHECK_PERIOD	HZ
#define IPVS_SYNC_FLUSH_TIME	(HZ * 2)
#define IPVS_SYNC_PORTS_MAX	(1 << 6)
100859e0350eSSimon Horman 
100959e0350eSSimon Horman #ifdef CONFIG_SYSCTL
101059e0350eSSimon Horman 
101159e0350eSSimon Horman static inline int sysctl_sync_threshold(struct netns_ipvs *ipvs)
101259e0350eSSimon Horman {
101359e0350eSSimon Horman 	return ipvs->sysctl_sync_threshold[0];
101459e0350eSSimon Horman }
101559e0350eSSimon Horman 
101659e0350eSSimon Horman static inline int sysctl_sync_period(struct netns_ipvs *ipvs)
101759e0350eSSimon Horman {
1018749c42b6SJulian Anastasov 	return ACCESS_ONCE(ipvs->sysctl_sync_threshold[1]);
1019749c42b6SJulian Anastasov }
1020749c42b6SJulian Anastasov 
1021749c42b6SJulian Anastasov static inline unsigned int sysctl_sync_refresh_period(struct netns_ipvs *ipvs)
1022749c42b6SJulian Anastasov {
1023749c42b6SJulian Anastasov 	return ACCESS_ONCE(ipvs->sysctl_sync_refresh_period);
1024749c42b6SJulian Anastasov }
1025749c42b6SJulian Anastasov 
1026749c42b6SJulian Anastasov static inline int sysctl_sync_retries(struct netns_ipvs *ipvs)
1027749c42b6SJulian Anastasov {
1028749c42b6SJulian Anastasov 	return ipvs->sysctl_sync_retries;
102959e0350eSSimon Horman }
103059e0350eSSimon Horman 
10317532e8d4SSimon Horman static inline int sysctl_sync_ver(struct netns_ipvs *ipvs)
10327532e8d4SSimon Horman {
10337532e8d4SSimon Horman 	return ipvs->sysctl_sync_ver;
10347532e8d4SSimon Horman }
10357532e8d4SSimon Horman 
1036c6c96c18SAlexander Frolkin static inline int sysctl_sloppy_tcp(struct netns_ipvs *ipvs)
1037c6c96c18SAlexander Frolkin {
1038c6c96c18SAlexander Frolkin 	return ipvs->sysctl_sloppy_tcp;
1039c6c96c18SAlexander Frolkin }
1040c6c96c18SAlexander Frolkin 
1041c6c96c18SAlexander Frolkin static inline int sysctl_sloppy_sctp(struct netns_ipvs *ipvs)
1042c6c96c18SAlexander Frolkin {
1043c6c96c18SAlexander Frolkin 	return ipvs->sysctl_sloppy_sctp;
1044c6c96c18SAlexander Frolkin }
1045c6c96c18SAlexander Frolkin 
1046f73181c8SPablo Neira Ayuso static inline int sysctl_sync_ports(struct netns_ipvs *ipvs)
1047f73181c8SPablo Neira Ayuso {
1048f73181c8SPablo Neira Ayuso 	return ACCESS_ONCE(ipvs->sysctl_sync_ports);
1049f73181c8SPablo Neira Ayuso }
1050f73181c8SPablo Neira Ayuso 
10514d0c875dSJulian Anastasov static inline int sysctl_sync_persist_mode(struct netns_ipvs *ipvs)
10524d0c875dSJulian Anastasov {
10534d0c875dSJulian Anastasov 	return ipvs->sysctl_sync_persist_mode;
10544d0c875dSJulian Anastasov }
10554d0c875dSJulian Anastasov 
105607995674SZhang Yanfei static inline unsigned long sysctl_sync_qlen_max(struct netns_ipvs *ipvs)
10571c003b15SPablo Neira Ayuso {
10581c003b15SPablo Neira Ayuso 	return ipvs->sysctl_sync_qlen_max;
10591c003b15SPablo Neira Ayuso }
10601c003b15SPablo Neira Ayuso 
10611c003b15SPablo Neira Ayuso static inline int sysctl_sync_sock_size(struct netns_ipvs *ipvs)
10621c003b15SPablo Neira Ayuso {
10631c003b15SPablo Neira Ayuso 	return ipvs->sysctl_sync_sock_size;
10641c003b15SPablo Neira Ayuso }
10651c003b15SPablo Neira Ayuso 
10663654e611SJulian Anastasov static inline int sysctl_pmtu_disc(struct netns_ipvs *ipvs)
10673654e611SJulian Anastasov {
10683654e611SJulian Anastasov 	return ipvs->sysctl_pmtu_disc;
10693654e611SJulian Anastasov }
10703654e611SJulian Anastasov 
10710c12582fSJulian Anastasov static inline int sysctl_backup_only(struct netns_ipvs *ipvs)
10720c12582fSJulian Anastasov {
10730c12582fSJulian Anastasov 	return ipvs->sync_state & IP_VS_STATE_BACKUP &&
10740c12582fSJulian Anastasov 	       ipvs->sysctl_backup_only;
10750c12582fSJulian Anastasov }
10760c12582fSJulian Anastasov 
107759e0350eSSimon Horman #else
107859e0350eSSimon Horman 
107959e0350eSSimon Horman static inline int sysctl_sync_threshold(struct netns_ipvs *ipvs)
108059e0350eSSimon Horman {
108159e0350eSSimon Horman 	return DEFAULT_SYNC_THRESHOLD;
108259e0350eSSimon Horman }
108359e0350eSSimon Horman 
108459e0350eSSimon Horman static inline int sysctl_sync_period(struct netns_ipvs *ipvs)
108559e0350eSSimon Horman {
108659e0350eSSimon Horman 	return DEFAULT_SYNC_PERIOD;
108759e0350eSSimon Horman }
108859e0350eSSimon Horman 
1089749c42b6SJulian Anastasov static inline unsigned int sysctl_sync_refresh_period(struct netns_ipvs *ipvs)
1090749c42b6SJulian Anastasov {
1091749c42b6SJulian Anastasov 	return DEFAULT_SYNC_REFRESH_PERIOD;
1092749c42b6SJulian Anastasov }
1093749c42b6SJulian Anastasov 
1094749c42b6SJulian Anastasov static inline int sysctl_sync_retries(struct netns_ipvs *ipvs)
1095749c42b6SJulian Anastasov {
1096749c42b6SJulian Anastasov 	return DEFAULT_SYNC_RETRIES & 3;
1097749c42b6SJulian Anastasov }
1098749c42b6SJulian Anastasov 
10997532e8d4SSimon Horman static inline int sysctl_sync_ver(struct netns_ipvs *ipvs)
11007532e8d4SSimon Horman {
11017532e8d4SSimon Horman 	return DEFAULT_SYNC_VER;
11027532e8d4SSimon Horman }
11037532e8d4SSimon Horman 
1104c6c96c18SAlexander Frolkin static inline int sysctl_sloppy_tcp(struct netns_ipvs *ipvs)
1105c6c96c18SAlexander Frolkin {
1106c6c96c18SAlexander Frolkin 	return DEFAULT_SLOPPY_TCP;
1107c6c96c18SAlexander Frolkin }
1108c6c96c18SAlexander Frolkin 
1109c6c96c18SAlexander Frolkin static inline int sysctl_sloppy_sctp(struct netns_ipvs *ipvs)
1110c6c96c18SAlexander Frolkin {
1111c6c96c18SAlexander Frolkin 	return DEFAULT_SLOPPY_SCTP;
1112c6c96c18SAlexander Frolkin }
1113c6c96c18SAlexander Frolkin 
1114f73181c8SPablo Neira Ayuso static inline int sysctl_sync_ports(struct netns_ipvs *ipvs)
1115f73181c8SPablo Neira Ayuso {
1116f73181c8SPablo Neira Ayuso 	return 1;
1117f73181c8SPablo Neira Ayuso }
1118f73181c8SPablo Neira Ayuso 
11194d0c875dSJulian Anastasov static inline int sysctl_sync_persist_mode(struct netns_ipvs *ipvs)
11204d0c875dSJulian Anastasov {
11214d0c875dSJulian Anastasov 	return 0;
11224d0c875dSJulian Anastasov }
11234d0c875dSJulian Anastasov 
112407995674SZhang Yanfei static inline unsigned long sysctl_sync_qlen_max(struct netns_ipvs *ipvs)
11251c003b15SPablo Neira Ayuso {
11261c003b15SPablo Neira Ayuso 	return IPVS_SYNC_QLEN_MAX;
11271c003b15SPablo Neira Ayuso }
11281c003b15SPablo Neira Ayuso 
11291c003b15SPablo Neira Ayuso static inline int sysctl_sync_sock_size(struct netns_ipvs *ipvs)
11301c003b15SPablo Neira Ayuso {
11311c003b15SPablo Neira Ayuso 	return 0;
11321c003b15SPablo Neira Ayuso }
11331c003b15SPablo Neira Ayuso 
11343654e611SJulian Anastasov static inline int sysctl_pmtu_disc(struct netns_ipvs *ipvs)
11353654e611SJulian Anastasov {
11363654e611SJulian Anastasov 	return 1;
11373654e611SJulian Anastasov }
11383654e611SJulian Anastasov 
11390c12582fSJulian Anastasov static inline int sysctl_backup_only(struct netns_ipvs *ipvs)
11400c12582fSJulian Anastasov {
11410c12582fSJulian Anastasov 	return 0;
11420c12582fSJulian Anastasov }
11430c12582fSJulian Anastasov 
114459e0350eSSimon Horman #endif
114559e0350eSSimon Horman 
/*
 *      IPVS core functions
 *      (from ip_vs_core.c)
 */
const char *ip_vs_proto_name(unsigned int proto);
void ip_vs_init_hash_table(struct list_head *table, int rows);
/* Same, with the row count taken from the array itself; @t must be an array */
#define IP_VS_INIT_HASH_TABLE(t) ip_vs_init_hash_table((t), ARRAY_SIZE((t)))
11531da177e4SLinus Torvalds 
/* Application type identifier for FTP */
#define IP_VS_APP_TYPE_FTP	1
11551da177e4SLinus Torvalds 
/*
 *     ip_vs_conn handling functions
 *     (from ip_vs_conn.c)
 */

/* Packet direction identifiers; IP_VS_DIR_LAST is the number of entries */
enum {
	IP_VS_DIR_INPUT = 0,
	IP_VS_DIR_OUTPUT,
	IP_VS_DIR_INPUT_ONLY,
	IP_VS_DIR_LAST,
};
11671da177e4SLinus Torvalds 
11686e67e586SHans Schillstrom static inline void ip_vs_conn_fill_param(struct net *net, int af, int protocol,
1169f11017ecSSimon Horman 					 const union nf_inet_addr *caddr,
1170f11017ecSSimon Horman 					 __be16 cport,
1171f11017ecSSimon Horman 					 const union nf_inet_addr *vaddr,
1172f11017ecSSimon Horman 					 __be16 vport,
1173f11017ecSSimon Horman 					 struct ip_vs_conn_param *p)
1174f11017ecSSimon Horman {
11756e67e586SHans Schillstrom 	p->net = net;
1176f11017ecSSimon Horman 	p->af = af;
1177f11017ecSSimon Horman 	p->protocol = protocol;
1178f11017ecSSimon Horman 	p->caddr = caddr;
1179f11017ecSSimon Horman 	p->cport = cport;
1180f11017ecSSimon Horman 	p->vaddr = vaddr;
1181f11017ecSSimon Horman 	p->vport = vport;
118285999283SSimon Horman 	p->pe = NULL;
118385999283SSimon Horman 	p->pe_data = NULL;
1184f11017ecSSimon Horman }
118528364a59SJulius Volz 
/*
 * Connection lookups.  The *_get() forms take a pre-filled
 * struct ip_vs_conn_param (see ip_vs_conn_fill_param()); the *_get_proto()
 * forms take the packet and its parsed IP header instead.
 * NOTE(review): whether a returned connection carries a reference the
 * caller must drop is not visible from this header - check ip_vs_conn.c.
 */
struct ip_vs_conn *ip_vs_conn_in_get(const struct ip_vs_conn_param *p);
struct ip_vs_conn *ip_vs_ct_in_get(const struct ip_vs_conn_param *p);

struct ip_vs_conn * ip_vs_conn_in_get_proto(int af, const struct sk_buff *skb,
					    const struct ip_vs_iphdr *iph,
					    int inverse);

struct ip_vs_conn *ip_vs_conn_out_get(const struct ip_vs_conn_param *p);

struct ip_vs_conn * ip_vs_conn_out_get_proto(int af, const struct sk_buff *skb,
					     const struct ip_vs_iphdr *iph,
					     int inverse);
11985c0d2374SSimon Horman 
1199088339a5SJulian Anastasov /* Get reference to gain full access to conn.
1200088339a5SJulian Anastasov  * By default, RCU read-side critical sections have access only to
1201088339a5SJulian Anastasov  * conn fields and its PE data, see ip_vs_conn_rcu_free() for reference.
1202088339a5SJulian Anastasov  */
1203088339a5SJulian Anastasov static inline bool __ip_vs_conn_get(struct ip_vs_conn *cp)
1204088339a5SJulian Anastasov {
1205088339a5SJulian Anastasov 	return atomic_inc_not_zero(&cp->refcnt);
1206088339a5SJulian Anastasov }
1207088339a5SJulian Anastasov 
/* put back the conn without restarting its timer
 *
 * Only decrements cp->refcnt; nothing is freed or rescheduled here.
 */
static inline void __ip_vs_conn_put(struct ip_vs_conn *cp)
{
	/* atomic_dec() returns no value and so implies no ordering by
	 * itself; the barrier orders earlier accesses to the conn before
	 * the reference is dropped.
	 */
	smp_mb__before_atomic();
	atomic_dec(&cp->refcnt);
}
/*
 * Out-of-line counterpart of __ip_vs_conn_put().
 * NOTE(review): presumably this one does restart the conn timer - confirm
 * in ip_vs_conn.c.
 */
void ip_vs_conn_put(struct ip_vs_conn *cp);
void ip_vs_conn_fill_cport(struct ip_vs_conn *cp, __be16 cport);

/*
 * Create a connection from parameter block @p.  @dest_af is passed
 * separately from the family carried in @p and describes @daddr.
 */
struct ip_vs_conn *ip_vs_conn_new(const struct ip_vs_conn_param *p, int dest_af,
				  const union nf_inet_addr *daddr,
				  __be16 dport, unsigned int flags,
				  struct ip_vs_dest *dest, __u32 fwmark);
void ip_vs_conn_expire_now(struct ip_vs_conn *cp);

const char *ip_vs_state_name(__u16 proto, int state);

void ip_vs_tcp_conn_listen(struct net *net, struct ip_vs_conn *cp);
int ip_vs_check_template(struct ip_vs_conn *ct);
void ip_vs_random_dropentry(struct net *net);
/* Global (not per-netns) setup and teardown of the connection code. */
int ip_vs_conn_init(void);
void ip_vs_conn_cleanup(void);
12301da177e4SLinus Torvalds 
12311da177e4SLinus Torvalds static inline void ip_vs_control_del(struct ip_vs_conn *cp)
12321da177e4SLinus Torvalds {
12331da177e4SLinus Torvalds 	struct ip_vs_conn *ctl_cp = cp->control;
12341da177e4SLinus Torvalds 	if (!ctl_cp) {
1235cfc78c5aSJulius Volz 		IP_VS_ERR_BUF("request control DEL for uncontrolled: "
1236cfc78c5aSJulius Volz 			      "%s:%d to %s:%d\n",
1237cfc78c5aSJulius Volz 			      IP_VS_DBG_ADDR(cp->af, &cp->caddr),
1238cfc78c5aSJulius Volz 			      ntohs(cp->cport),
1239cfc78c5aSJulius Volz 			      IP_VS_DBG_ADDR(cp->af, &cp->vaddr),
1240cfc78c5aSJulius Volz 			      ntohs(cp->vport));
1241cfc78c5aSJulius Volz 
12421da177e4SLinus Torvalds 		return;
12431da177e4SLinus Torvalds 	}
12441da177e4SLinus Torvalds 
1245cfc78c5aSJulius Volz 	IP_VS_DBG_BUF(7, "DELeting control for: "
1246cfc78c5aSJulius Volz 		      "cp.dst=%s:%d ctl_cp.dst=%s:%d\n",
1247cfc78c5aSJulius Volz 		      IP_VS_DBG_ADDR(cp->af, &cp->caddr),
1248cfc78c5aSJulius Volz 		      ntohs(cp->cport),
1249cfc78c5aSJulius Volz 		      IP_VS_DBG_ADDR(cp->af, &ctl_cp->caddr),
1250cfc78c5aSJulius Volz 		      ntohs(ctl_cp->cport));
12511da177e4SLinus Torvalds 
12521da177e4SLinus Torvalds 	cp->control = NULL;
12531da177e4SLinus Torvalds 	if (atomic_read(&ctl_cp->n_control) == 0) {
1254cfc78c5aSJulius Volz 		IP_VS_ERR_BUF("BUG control DEL with n=0 : "
1255cfc78c5aSJulius Volz 			      "%s:%d to %s:%d\n",
1256cfc78c5aSJulius Volz 			      IP_VS_DBG_ADDR(cp->af, &cp->caddr),
1257cfc78c5aSJulius Volz 			      ntohs(cp->cport),
1258cfc78c5aSJulius Volz 			      IP_VS_DBG_ADDR(cp->af, &cp->vaddr),
1259cfc78c5aSJulius Volz 			      ntohs(cp->vport));
1260cfc78c5aSJulius Volz 
12611da177e4SLinus Torvalds 		return;
12621da177e4SLinus Torvalds 	}
12631da177e4SLinus Torvalds 	atomic_dec(&ctl_cp->n_control);
12641da177e4SLinus Torvalds }
12651da177e4SLinus Torvalds 
12661da177e4SLinus Torvalds static inline void
12671da177e4SLinus Torvalds ip_vs_control_add(struct ip_vs_conn *cp, struct ip_vs_conn *ctl_cp)
12681da177e4SLinus Torvalds {
12691da177e4SLinus Torvalds 	if (cp->control) {
1270cfc78c5aSJulius Volz 		IP_VS_ERR_BUF("request control ADD for already controlled: "
1271cfc78c5aSJulius Volz 			      "%s:%d to %s:%d\n",
1272cfc78c5aSJulius Volz 			      IP_VS_DBG_ADDR(cp->af, &cp->caddr),
1273cfc78c5aSJulius Volz 			      ntohs(cp->cport),
1274cfc78c5aSJulius Volz 			      IP_VS_DBG_ADDR(cp->af, &cp->vaddr),
1275cfc78c5aSJulius Volz 			      ntohs(cp->vport));
1276cfc78c5aSJulius Volz 
12771da177e4SLinus Torvalds 		ip_vs_control_del(cp);
12781da177e4SLinus Torvalds 	}
12791da177e4SLinus Torvalds 
1280cfc78c5aSJulius Volz 	IP_VS_DBG_BUF(7, "ADDing control for: "
1281cfc78c5aSJulius Volz 		      "cp.dst=%s:%d ctl_cp.dst=%s:%d\n",
1282cfc78c5aSJulius Volz 		      IP_VS_DBG_ADDR(cp->af, &cp->caddr),
1283cfc78c5aSJulius Volz 		      ntohs(cp->cport),
1284cfc78c5aSJulius Volz 		      IP_VS_DBG_ADDR(cp->af, &ctl_cp->caddr),
1285cfc78c5aSJulius Volz 		      ntohs(ctl_cp->cport));
12861da177e4SLinus Torvalds 
12871da177e4SLinus Torvalds 	cp->control = ctl_cp;
12881da177e4SLinus Torvalds 	atomic_inc(&ctl_cp->n_control);
12891da177e4SLinus Torvalds }
12901da177e4SLinus Torvalds 
/*
 * IPVS netns init & cleanup functions
 *
 * One pair per subsystem, each taking the namespace to set up or tear
 * down.  The *_net_init() functions return int; by kernel convention
 * that is presumably 0 or a negative errno - confirm per implementation.
 * ip_vs_service_net_cleanup() has no init counterpart declared here.
 */
int ip_vs_estimator_net_init(struct net *net);
int ip_vs_control_net_init(struct net *net);
int ip_vs_protocol_net_init(struct net *net);
int ip_vs_app_net_init(struct net *net);
int ip_vs_conn_net_init(struct net *net);
int ip_vs_sync_net_init(struct net *net);
void ip_vs_conn_net_cleanup(struct net *net);
void ip_vs_app_net_cleanup(struct net *net);
void ip_vs_protocol_net_cleanup(struct net *net);
void ip_vs_control_net_cleanup(struct net *net);
void ip_vs_estimator_net_cleanup(struct net *net);
void ip_vs_sync_net_cleanup(struct net *net);
void ip_vs_service_net_cleanup(struct net *net);
13071da177e4SLinus Torvalds 
/*
 *      IPVS application functions
 *      (from ip_vs_app.c)
 */
#define IP_VS_APP_MAX_PORTS  8
/* Application helpers are registered per network namespace. */
struct ip_vs_app *register_ip_vs_app(struct net *net, struct ip_vs_app *app);
void unregister_ip_vs_app(struct net *net, struct ip_vs_app *app);
int ip_vs_bind_app(struct ip_vs_conn *cp, struct ip_vs_protocol *pp);
void ip_vs_unbind_app(struct ip_vs_conn *cp);
int register_ip_vs_app_inc(struct net *net, struct ip_vs_app *app, __u16 proto,
			   __u16 port);
int ip_vs_app_inc_get(struct ip_vs_app *inc);
void ip_vs_app_inc_put(struct ip_vs_app *inc);

/* Per-packet hooks of the application bound to the connection. */
int ip_vs_app_pkt_out(struct ip_vs_conn *, struct sk_buff *skb);
int ip_vs_app_pkt_in(struct ip_vs_conn *, struct sk_buff *skb);

/* pe registration and lookup by name; unlike the app calls, no netns arg. */
int register_ip_vs_pe(struct ip_vs_pe *pe);
int unregister_ip_vs_pe(struct ip_vs_pe *pe);
struct ip_vs_pe *ip_vs_pe_getbyname(const char *name);
struct ip_vs_pe *__ip_vs_pe_getbyname(const char *pe_name);
1329e9e5eee8SSimon Horman 
/*
 * Take (ip_vs_pe_get) or drop (ip_vs_pe_put) a reference on the module
 * providing @pe.  Both do nothing when @pe is NULL or has no ->module.
 *
 * Use a #define to avoid all of module.h just for these trivial ops.
 *
 * Each macro expands to exactly one statement (do { } while (0)), so it
 * is safe as the body of an unbraced if/else and must be followed by a
 * semicolon.  @pe is evaluated more than once: pass an expression
 * without side effects.
 */
#define ip_vs_pe_get(pe)				\
	do {						\
		if ((pe) && (pe)->module)		\
			__module_get((pe)->module);	\
	} while (0)

#define ip_vs_pe_put(pe)				\
	do {						\
		if ((pe) && (pe)->module)		\
			module_put((pe)->module);	\
	} while (0)
13401da177e4SLinus Torvalds 
/*
 *	IPVS protocol functions (from ip_vs_proto.c)
 */
int ip_vs_protocol_init(void);
void ip_vs_protocol_cleanup(void);
void ip_vs_protocol_timeout_change(struct netns_ipvs *ipvs, int flags);
/*
 * Timeout table helpers operating on plain int arrays.
 * NOTE(review): ip_vs_create_timeout_table() returns an int pointer;
 * presumably a new copy of @table that the caller owns - confirm.
 */
int *ip_vs_create_timeout_table(int *table, int size);
int ip_vs_set_state_timeout(int *table, int num, const char *const *names,
			    const char *name, int to);
void ip_vs_tcpudp_debug_packet(int af, struct ip_vs_protocol *pp,
			       const struct sk_buff *skb, int offset,
			       const char *msg);

/* Protocol handler objects, defined in the per-protocol source files. */
extern struct ip_vs_protocol ip_vs_protocol_tcp;
extern struct ip_vs_protocol ip_vs_protocol_udp;
extern struct ip_vs_protocol ip_vs_protocol_icmp;
extern struct ip_vs_protocol ip_vs_protocol_esp;
extern struct ip_vs_protocol ip_vs_protocol_ah;
extern struct ip_vs_protocol ip_vs_protocol_sctp;
13601da177e4SLinus Torvalds 
/*
 *      Registering/unregistering scheduler functions
 *      (from ip_vs_sched.c)
 */
int register_ip_vs_scheduler(struct ip_vs_scheduler *scheduler);
int unregister_ip_vs_scheduler(struct ip_vs_scheduler *scheduler);
/* Attach a scheduler to, or detach it from, service @svc. */
int ip_vs_bind_scheduler(struct ip_vs_service *svc,
			 struct ip_vs_scheduler *scheduler);
void ip_vs_unbind_scheduler(struct ip_vs_service *svc,
			    struct ip_vs_scheduler *sched);
/* Look up a scheduler by name / release it again. */
struct ip_vs_scheduler *ip_vs_scheduler_get(const char *sched_name);
void ip_vs_scheduler_put(struct ip_vs_scheduler *scheduler);
/*
 * Schedule packet @skb for service @svc and return the resulting
 * connection.  @ignored is an output flag.
 * NOTE(review): the exact meaning of *ignored and of a NULL return is
 * defined by the implementation - see where this function is defined.
 */
struct ip_vs_conn *
ip_vs_schedule(struct ip_vs_service *svc, struct sk_buff *skb,
	       struct ip_vs_proto_data *pd, int *ignored,
	       struct ip_vs_iphdr *iph);
int ip_vs_leave(struct ip_vs_service *svc, struct sk_buff *skb,
		struct ip_vs_proto_data *pd, struct ip_vs_iphdr *iph);

void ip_vs_scheduler_err(struct ip_vs_service *svc, const char *msg);
138141ac51eeSPatrick Schaaf 
13821da177e4SLinus Torvalds 
/*
 *      IPVS control data and functions (from ip_vs_ctl.c)
 */
/*
 * NOTE(review): most state in this header is per-netns; verify that these
 * two globals still have a definition and are not stale declarations.
 */
extern struct ip_vs_stats ip_vs_stats;
extern int sysctl_ip_vs_sync_ver;

/* Find a virtual service by fwmark and/or protocol + vaddr:vport. */
struct ip_vs_service *
ip_vs_service_find(struct net *net, int af, __u32 fwmark, __u16 protocol,
		  const union nf_inet_addr *vaddr, __be16 vport);

bool ip_vs_has_real_service(struct net *net, int af, __u16 protocol,
			    const union nf_inet_addr *daddr, __be16 dport);

int ip_vs_use_count_inc(void);
void ip_vs_use_count_dec(void);
int ip_vs_register_nl_ioctl(void);
void ip_vs_unregister_nl_ioctl(void);
int ip_vs_control_init(void);
void ip_vs_control_cleanup(void);
/*
 * Find a destination.  The service family (@svc_af, for @vaddr) and the
 * destination family (@dest_af, for @daddr) are passed separately.
 */
struct ip_vs_dest *
ip_vs_find_dest(struct net *net, int svc_af, int dest_af,
		const union nf_inet_addr *daddr, __be16 dport,
		const union nf_inet_addr *vaddr, __be16 vport,
		__u16 protocol, __u32 fwmark, __u32 flags);
void ip_vs_try_bind_dest(struct ip_vs_conn *cp);
14081da177e4SLinus Torvalds 
/* Take one reference on @dest (unconditional increment of dest->refcnt). */
static inline void ip_vs_dest_hold(struct ip_vs_dest *dest)
{
	atomic_inc(&dest->refcnt);
}
1413fca9c20aSJulian Anastasov 
/*
 * Drop one reference on @dest.  Only decrements; @dest is never freed
 * here (see ip_vs_dest_put_and_free() for the freeing variant).
 */
static inline void ip_vs_dest_put(struct ip_vs_dest *dest)
{
	/* atomic_dec() alone implies no ordering; order earlier accesses
	 * to @dest before the reference is dropped.
	 */
	smp_mb__before_atomic();
	atomic_dec(&dest->refcnt);
}
14191da177e4SLinus Torvalds 
14209e4e948aSJulian Anastasov static inline void ip_vs_dest_put_and_free(struct ip_vs_dest *dest)
14219e4e948aSJulian Anastasov {
14229e4e948aSJulian Anastasov 	if (atomic_dec_return(&dest->refcnt) < 0)
14239e4e948aSJulian Anastasov 		kfree(dest);
14249e4e948aSJulian Anastasov }
14259e4e948aSJulian Anastasov 
/*
 *      IPVS sync daemon data and function prototypes
 *      (from ip_vs_sync.c)
 */
/* Start/stop the sync thread for @state in namespace @net. */
int start_sync_thread(struct net *net, int state, char *mcast_ifn, __u8 syncid);
int stop_sync_thread(struct net *net, int state);
void ip_vs_sync_conn(struct net *net, struct ip_vs_conn *cp, int pkts);
14331da177e4SLinus Torvalds 
/*
 *      IPVS rate estimator prototypes (from ip_vs_est.c)
 */
/* Start/stop estimation for @stats within namespace @net. */
void ip_vs_start_estimator(struct net *net, struct ip_vs_stats *stats);
void ip_vs_stop_estimator(struct net *net, struct ip_vs_stats *stats);
void ip_vs_zero_estimator(struct ip_vs_stats *stats);
/* Copy estimator values from @stats into the user-visible layout @dst. */
void ip_vs_read_estimator(struct ip_vs_stats_user *dst,
			  struct ip_vs_stats *stats);
14421da177e4SLinus Torvalds 
/*
 *	Various IPVS packet transmitters (from ip_vs_xmit.c)
 *
 *	All share one signature (skb, connection, protocol, parsed IP
 *	header); ip_vs_icmp_xmit() additionally takes the payload offset
 *	and the netfilter hook number.
 */
int ip_vs_null_xmit(struct sk_buff *skb, struct ip_vs_conn *cp,
		    struct ip_vs_protocol *pp, struct ip_vs_iphdr *iph);
int ip_vs_bypass_xmit(struct sk_buff *skb, struct ip_vs_conn *cp,
		      struct ip_vs_protocol *pp, struct ip_vs_iphdr *iph);
int ip_vs_nat_xmit(struct sk_buff *skb, struct ip_vs_conn *cp,
		   struct ip_vs_protocol *pp, struct ip_vs_iphdr *iph);
int ip_vs_tunnel_xmit(struct sk_buff *skb, struct ip_vs_conn *cp,
		      struct ip_vs_protocol *pp, struct ip_vs_iphdr *iph);
int ip_vs_dr_xmit(struct sk_buff *skb, struct ip_vs_conn *cp,
		  struct ip_vs_protocol *pp, struct ip_vs_iphdr *iph);
int ip_vs_icmp_xmit(struct sk_buff *skb, struct ip_vs_conn *cp,
		    struct ip_vs_protocol *pp, int offset,
		    unsigned int hooknum, struct ip_vs_iphdr *iph);
/* RCU callback (takes the embedded rcu_head). */
void ip_vs_dest_dst_rcu_free(struct rcu_head *head);
14601da177e4SLinus Torvalds 
#ifdef CONFIG_IP_VS_IPV6
/*
 * IPv6 transmitters, same signatures as the IPv4 ones.  There is no
 * ip_vs_null_xmit_v6() declared here.
 */
int ip_vs_bypass_xmit_v6(struct sk_buff *skb, struct ip_vs_conn *cp,
			 struct ip_vs_protocol *pp, struct ip_vs_iphdr *iph);
int ip_vs_nat_xmit_v6(struct sk_buff *skb, struct ip_vs_conn *cp,
		      struct ip_vs_protocol *pp, struct ip_vs_iphdr *iph);
int ip_vs_tunnel_xmit_v6(struct sk_buff *skb, struct ip_vs_conn *cp,
			 struct ip_vs_protocol *pp, struct ip_vs_iphdr *iph);
int ip_vs_dr_xmit_v6(struct sk_buff *skb, struct ip_vs_conn *cp,
		     struct ip_vs_protocol *pp, struct ip_vs_iphdr *iph);
int ip_vs_icmp_xmit_v6(struct sk_buff *skb, struct ip_vs_conn *cp,
		       struct ip_vs_protocol *pp, int offset,
		       unsigned int hooknum, struct ip_vs_iphdr *iph);
#endif
14741da177e4SLinus Torvalds 
#ifdef CONFIG_SYSCTL
/*
 *	Simple load-shedding helper: with ipvs->drop_rate set to 'n',
 *	roughly one call in every n returns 1 (drop this packet); every
 *	other call returns 0.  A drop_rate of 0 disables dropping.
 */
static inline int ip_vs_todrop(struct netns_ipvs *ipvs)
{
	/* short-circuit: the counter is not touched while dropping is off */
	if (!ipvs->drop_rate || --ipvs->drop_counter > 0)
		return 0;

	/* countdown expired: re-arm it and drop this one */
	ipvs->drop_counter = ipvs->drop_rate;
	return 1;
}
#else
/* No sysctl support means no drop_rate knob: never drop. */
static inline int ip_vs_todrop(struct netns_ipvs *ipvs)
{
	return 0;
}
#endif
14941da177e4SLinus Torvalds 
14951da177e4SLinus Torvalds /*
14961da177e4SLinus Torvalds  *      ip_vs_fwd_tag returns the forwarding tag of the connection
14971da177e4SLinus Torvalds  */
/*
 * Forwarding-method bits of a connection's flags.  @cp may be any
 * expression yielding a pointer with a ->flags member; it is
 * parenthesized so that arguments such as &conn expand correctly.
 */
#define IP_VS_FWD_METHOD(cp)  ((cp)->flags & IP_VS_CONN_F_FWD_MASK)
14991da177e4SLinus Torvalds 
1500732db659SAdrian Bunk static inline char ip_vs_fwd_tag(struct ip_vs_conn *cp)
15011da177e4SLinus Torvalds {
15021da177e4SLinus Torvalds 	char fwd;
15031da177e4SLinus Torvalds 
15041da177e4SLinus Torvalds 	switch (IP_VS_FWD_METHOD(cp)) {
15051da177e4SLinus Torvalds 	case IP_VS_CONN_F_MASQ:
15061da177e4SLinus Torvalds 		fwd = 'M'; break;
15071da177e4SLinus Torvalds 	case IP_VS_CONN_F_LOCALNODE:
15081da177e4SLinus Torvalds 		fwd = 'L'; break;
15091da177e4SLinus Torvalds 	case IP_VS_CONN_F_TUNNEL:
15101da177e4SLinus Torvalds 		fwd = 'T'; break;
15111da177e4SLinus Torvalds 	case IP_VS_CONN_F_DROUTE:
15121da177e4SLinus Torvalds 		fwd = 'R'; break;
15131da177e4SLinus Torvalds 	case IP_VS_CONN_F_BYPASS:
15141da177e4SLinus Torvalds 		fwd = 'B'; break;
15151da177e4SLinus Torvalds 	default:
15161da177e4SLinus Torvalds 		fwd = '?'; break;
15171da177e4SLinus Torvalds 	}
15181da177e4SLinus Torvalds 	return fwd;
15191da177e4SLinus Torvalds }
15201da177e4SLinus Torvalds 
/*
 * ICMP translation for connection @cp.
 * NOTE(review): @dir is presumably one of the IP_VS_DIR_* values - confirm.
 */
void ip_vs_nat_icmp(struct sk_buff *skb, struct ip_vs_protocol *pp,
		    struct ip_vs_conn *cp, int dir);

#ifdef CONFIG_IP_VS_IPV6
void ip_vs_nat_icmp_v6(struct sk_buff *skb, struct ip_vs_protocol *pp,
		       struct ip_vs_conn *cp, int dir);
#endif

/* Checksum over @skb starting at byte @offset. */
__sum16 ip_vs_checksum_complete(struct sk_buff *skb, int offset);
15301da177e4SLinus Torvalds 
1531f9214b26SAl Viro static inline __wsum ip_vs_check_diff4(__be32 old, __be32 new, __wsum oldsum)
15321da177e4SLinus Torvalds {
1533f9214b26SAl Viro 	__be32 diff[2] = { ~old, new };
15341da177e4SLinus Torvalds 
153507f0757aSJoe Perches 	return csum_partial(diff, sizeof(diff), oldsum);
1536f9214b26SAl Viro }
1537f9214b26SAl Viro 
#ifdef CONFIG_IP_VS_IPV6
/*
 * Checksum adjustment for replacing a 16-byte value given as four
 * 32-bit words.  The buffer holds the complemented @old words in
 * reverse order (3..0) followed by the @new words in reverse order,
 * and is summed by csum_partial() seeded with @oldsum.
 */
static inline __wsum ip_vs_check_diff16(const __be32 *old, const __be32 *new,
					__wsum oldsum)
{
	__be32 diff[8];
	int i;

	for (i = 0; i < 4; i++) {
		diff[i] = ~old[3 - i];
		diff[4 + i] = new[3 - i];
	}

	return csum_partial(diff, sizeof(diff), oldsum);
}
#endif
15480bbdd42bSJulius Volz 
1549f9214b26SAl Viro static inline __wsum ip_vs_check_diff2(__be16 old, __be16 new, __wsum oldsum)
1550f9214b26SAl Viro {
1551f9214b26SAl Viro 	__be16 diff[2] = { ~old, new };
1552f9214b26SAl Viro 
155307f0757aSJoe Perches 	return csum_partial(diff, sizeof(diff), oldsum);
15541da177e4SLinus Torvalds }
15551da177e4SLinus Torvalds 
1556cf356d69SJulian Anastasov /*
1557cf356d69SJulian Anastasov  * Forget current conntrack (unconfirmed) and attach notrack entry
1558cf356d69SJulian Anastasov  */
1559cf356d69SJulian Anastasov static inline void ip_vs_notrack(struct sk_buff *skb)
1560cf356d69SJulian Anastasov {
1561cf356d69SJulian Anastasov #if defined(CONFIG_NF_CONNTRACK) || defined(CONFIG_NF_CONNTRACK_MODULE)
1562cf356d69SJulian Anastasov 	enum ip_conntrack_info ctinfo;
156306b69390SJesper Juhl 	struct nf_conn *ct = nf_ct_get(skb, &ctinfo);
1564cf356d69SJulian Anastasov 
1565cf356d69SJulian Anastasov 	if (!ct || !nf_ct_is_untracked(ct)) {
15669e33ce45SLin Ming 		nf_conntrack_put(skb->nfct);
1567cf356d69SJulian Anastasov 		skb->nfct = &nf_ct_untracked_get()->ct_general;
1568cf356d69SJulian Anastasov 		skb->nfctinfo = IP_CT_NEW;
1569cf356d69SJulian Anastasov 		nf_conntrack_get(skb->nfct);
1570cf356d69SJulian Anastasov 	}
1571cf356d69SJulian Anastasov #endif
1572cf356d69SJulian Anastasov }
1573cf356d69SJulian Anastasov 
1574f4bc17cdSJulian Anastasov #ifdef CONFIG_IP_VS_NFCT
1575f4bc17cdSJulian Anastasov /*
1576f4bc17cdSJulian Anastasov  *      Netfilter connection tracking
1577f4bc17cdSJulian Anastasov  *      (from ip_vs_nfct.c)
1578f4bc17cdSJulian Anastasov  */
/*
 * Value of the per-netns sysctl_conntrack setting; always 0 when the
 * kernel is built without CONFIG_SYSCTL.
 */
static inline int ip_vs_conntrack_enabled(struct netns_ipvs *ipvs)
{
#ifndef CONFIG_SYSCTL
	return 0;
#else
	return ipvs->sysctl_conntrack;
#endif
}
1587f4bc17cdSJulian Anastasov 
/*
 * Out-of-line implementations used when CONFIG_IP_VS_NFCT is set; the
 * #else branch below provides inline stubs for three of them
 * (ip_vs_nfct_expect_related() has no stub).
 */
void ip_vs_update_conntrack(struct sk_buff *skb, struct ip_vs_conn *cp,
			    int outin);
int ip_vs_confirm_conntrack(struct sk_buff *skb);
void ip_vs_nfct_expect_related(struct sk_buff *skb, struct nf_conn *ct,
			       struct ip_vs_conn *cp, u_int8_t proto,
			       const __be16 port, int from_rs);
void ip_vs_conn_drop_conntrack(struct ip_vs_conn *cp);
1595f4bc17cdSJulian Anastasov 
1596f4bc17cdSJulian Anastasov #else
1597f4bc17cdSJulian Anastasov 
/* Without CONFIG_IP_VS_NFCT conntrack integration is never enabled. */
static inline int
ip_vs_conntrack_enabled(struct netns_ipvs *ipvs) { return 0; }
1602f4bc17cdSJulian Anastasov 
/* Stub used without CONFIG_IP_VS_NFCT: does nothing. */
static inline void
ip_vs_update_conntrack(struct sk_buff *skb, struct ip_vs_conn *cp, int outin)
{
	/* intentionally empty */
}
1607f4bc17cdSJulian Anastasov 
1608e23ebf0fSKrzysztof Wilczynski static inline int ip_vs_confirm_conntrack(struct sk_buff *skb)
1609f4bc17cdSJulian Anastasov {
1610f4bc17cdSJulian Anastasov 	return NF_ACCEPT;
1611f4bc17cdSJulian Anastasov }
1612f4bc17cdSJulian Anastasov 
/* Stub used without CONFIG_IP_VS_NFCT: does nothing. */
static inline void ip_vs_conn_drop_conntrack(struct ip_vs_conn *cp)
{
	/* intentionally empty */
}
#endif /* CONFIG_IP_VS_NFCT */
16186523ce15SJulian Anastasov 
1619c16526a7SSimon Kirby static inline int
1620b552f7e3SChangli Gao ip_vs_dest_conn_overhead(struct ip_vs_dest *dest)
1621b552f7e3SChangli Gao {
1622b552f7e3SChangli Gao 	/*
1623b552f7e3SChangli Gao 	 * We think the overhead of processing active connections is 256
1624b552f7e3SChangli Gao 	 * times higher than that of inactive connections in average. (This
1625b552f7e3SChangli Gao 	 * 256 times might not be accurate, we will change it later) We
1626b552f7e3SChangli Gao 	 * use the following formula to estimate the overhead now:
1627b552f7e3SChangli Gao 	 *		  dest->activeconns*256 + dest->inactconns
1628b552f7e3SChangli Gao 	 */
1629b552f7e3SChangli Gao 	return (atomic_read(&dest->activeconns) << 8) +
1630b552f7e3SChangli Gao 		atomic_read(&dest->inactconns);
1631b552f7e3SChangli Gao }
1632b552f7e3SChangli Gao 
1633bc4768ebSJulius Volz #endif	/* _NET_IP_VS_H */
1634