107dcc686SSimon Horman /* IP Virtual Server 21da177e4SLinus Torvalds * data structure and functionality definitions 31da177e4SLinus Torvalds */ 41da177e4SLinus Torvalds 5bc4768ebSJulius Volz #ifndef _NET_IP_VS_H 6bc4768ebSJulius Volz #define _NET_IP_VS_H 71da177e4SLinus Torvalds 8bc4768ebSJulius Volz #include <linux/ip_vs.h> /* definitions shared with userland */ 91da177e4SLinus Torvalds 10bc4768ebSJulius Volz #include <asm/types.h> /* for __uXX types */ 11bc4768ebSJulius Volz 121da177e4SLinus Torvalds #include <linux/list.h> /* for struct list_head */ 131da177e4SLinus Torvalds #include <linux/spinlock.h> /* for struct rwlock_t */ 1460063497SArun Sharma #include <linux/atomic.h> /* for struct atomic_t */ 151da177e4SLinus Torvalds #include <linux/compiler.h> 1614c85021SArnaldo Carvalho de Melo #include <linux/timer.h> 17187f1882SPaul Gortmaker #include <linux/bug.h> 181da177e4SLinus Torvalds 1914c85021SArnaldo Carvalho de Melo #include <net/checksum.h> 20e7ade46aSJulius Volz #include <linux/netfilter.h> /* for union nf_inet_addr */ 211668e010SKOVACS Krisztian #include <linux/ip.h> 22e7ade46aSJulius Volz #include <linux/ipv6.h> /* for struct ipv6hdr */ 234e3fd7a0SAlexey Dobriyan #include <net/ipv6.h> 2454d83efaSJesper Dangaard Brouer #if IS_ENABLED(CONFIG_IP_VS_IPV6) 2563dca2c0SJesper Dangaard Brouer #include <linux/netfilter_ipv6/ip6_tables.h> 2663dca2c0SJesper Dangaard Brouer #endif 27a638e514SJesper Dangaard Brouer #if IS_ENABLED(CONFIG_NF_CONNTRACK) 28f4bc17cdSJulian Anastasov #include <net/netfilter/nf_conntrack.h> 29f4bc17cdSJulian Anastasov #endif 3061b1ab45SHans Schillstrom #include <net/net_namespace.h> /* Netw namespace */ 3161b1ab45SHans Schillstrom 324fd9beefSAlex Gartrell #define IP_VS_HDR_INVERSE 1 334fd9beefSAlex Gartrell #define IP_VS_HDR_ICMP 2 344fd9beefSAlex Gartrell 3507dcc686SSimon Horman /* Generic access of ipvs struct */ 3661b1ab45SHans Schillstrom static inline struct netns_ipvs *net_ipvs(struct net* net) 3761b1ab45SHans Schillstrom { 
3861b1ab45SHans Schillstrom return net->ipvs; 3961b1ab45SHans Schillstrom } 4007dcc686SSimon Horman 4107dcc686SSimon Horman /* This one needed for single_open_net since net is stored directly in 4225985edcSLucas De Marchi * private not as a struct i.e. seq_file_net can't be used. 43b17fc996SHans Schillstrom */ 44b17fc996SHans Schillstrom static inline struct net *seq_file_single_net(struct seq_file *seq) 45b17fc996SHans Schillstrom { 46b17fc996SHans Schillstrom #ifdef CONFIG_NET_NS 47b17fc996SHans Schillstrom return (struct net *)seq->private; 48b17fc996SHans Schillstrom #else 49b17fc996SHans Schillstrom return &init_net; 50b17fc996SHans Schillstrom #endif 51b17fc996SHans Schillstrom } 526f7edb48SCatalin(ux) M. BOIE 536f7edb48SCatalin(ux) M. BOIE /* Connections' size value needed by ip_vs_ctl.c */ 546f7edb48SCatalin(ux) M. BOIE extern int ip_vs_conn_tab_size; 556f7edb48SCatalin(ux) M. BOIE 5664aae3cbSJulius Volz struct ip_vs_iphdr { 574fd9beefSAlex Gartrell int hdr_flags; /* ipvs flags */ 58b0e010c5SAlex Gartrell __u32 off; /* Where IP or IPv4 header starts */ 5963dca2c0SJesper Dangaard Brouer __u32 len; /* IPv4 simply where L4 starts 6007dcc686SSimon Horman * IPv6 where L4 Transport Header starts */ 6163dca2c0SJesper Dangaard Brouer __u16 fragoffs; /* IPv6 fragment offset, 0 if first frag (or not frag)*/ 6263dca2c0SJesper Dangaard Brouer __s16 protocol; 6363dca2c0SJesper Dangaard Brouer __s32 flags; 6464aae3cbSJulius Volz union nf_inet_addr saddr; 6564aae3cbSJulius Volz union nf_inet_addr daddr; 6664aae3cbSJulius Volz }; 6764aae3cbSJulius Volz 682f74713dSJesper Dangaard Brouer static inline void *frag_safe_skb_hp(const struct sk_buff *skb, int offset, 692f74713dSJesper Dangaard Brouer int len, void *buffer, 702f74713dSJesper Dangaard Brouer const struct ip_vs_iphdr *ipvsh) 712f74713dSJesper Dangaard Brouer { 722f74713dSJesper Dangaard Brouer return skb_header_pointer(skb, offset, len, buffer); 732f74713dSJesper Dangaard Brouer } 742f74713dSJesper Dangaard Brouer 
7563dca2c0SJesper Dangaard Brouer /* This function handles filling *ip_vs_iphdr, both for IPv4 and IPv6. 7663dca2c0SJesper Dangaard Brouer * IPv6 requires some extra work, as finding proper header position, 7763dca2c0SJesper Dangaard Brouer * depend on the IPv6 extension headers. 7863dca2c0SJesper Dangaard Brouer */ 79b0e010c5SAlex Gartrell static inline int 80b0e010c5SAlex Gartrell ip_vs_fill_iph_skb_off(int af, const struct sk_buff *skb, int offset, 814fd9beefSAlex Gartrell int hdr_flags, struct ip_vs_iphdr *iphdr) 8264aae3cbSJulius Volz { 834fd9beefSAlex Gartrell iphdr->hdr_flags = hdr_flags; 84b0e010c5SAlex Gartrell iphdr->off = offset; 854fd9beefSAlex Gartrell 8664aae3cbSJulius Volz #ifdef CONFIG_IP_VS_IPV6 8764aae3cbSJulius Volz if (af == AF_INET6) { 88b0e010c5SAlex Gartrell struct ipv6hdr _iph; 89b0e010c5SAlex Gartrell const struct ipv6hdr *iph = skb_header_pointer( 90b0e010c5SAlex Gartrell skb, offset, sizeof(_iph), &_iph); 91b0e010c5SAlex Gartrell if (!iph) 92b0e010c5SAlex Gartrell return 0; 93b0e010c5SAlex Gartrell 944e3fd7a0SAlexey Dobriyan iphdr->saddr.in6 = iph->saddr; 954e3fd7a0SAlexey Dobriyan iphdr->daddr.in6 = iph->daddr; 966aafeef0SJiri Pirko /* ipv6_find_hdr() updates len, flags */ 97b0e010c5SAlex Gartrell iphdr->len = offset; 9863dca2c0SJesper Dangaard Brouer iphdr->flags = 0; 9963dca2c0SJesper Dangaard Brouer iphdr->protocol = ipv6_find_hdr(skb, &iphdr->len, -1, 10063dca2c0SJesper Dangaard Brouer &iphdr->fragoffs, 10163dca2c0SJesper Dangaard Brouer &iphdr->flags); 102b0e010c5SAlex Gartrell if (iphdr->protocol < 0) 103b0e010c5SAlex Gartrell return 0; 10464aae3cbSJulius Volz } else 10564aae3cbSJulius Volz #endif 10664aae3cbSJulius Volz { 107b0e010c5SAlex Gartrell struct iphdr _iph; 108b0e010c5SAlex Gartrell const struct iphdr *iph = skb_header_pointer( 109b0e010c5SAlex Gartrell skb, offset, sizeof(_iph), &_iph); 110b0e010c5SAlex Gartrell if (!iph) 111b0e010c5SAlex Gartrell return 0; 112b0e010c5SAlex Gartrell 113b0e010c5SAlex Gartrell iphdr->len = 
offset + iph->ihl * 4; 11463dca2c0SJesper Dangaard Brouer iphdr->fragoffs = 0; 11564aae3cbSJulius Volz iphdr->protocol = iph->protocol; 11664aae3cbSJulius Volz iphdr->saddr.ip = iph->saddr; 11764aae3cbSJulius Volz iphdr->daddr.ip = iph->daddr; 11864aae3cbSJulius Volz } 119b0e010c5SAlex Gartrell 120b0e010c5SAlex Gartrell return 1; 121b0e010c5SAlex Gartrell } 122b0e010c5SAlex Gartrell 123b0e010c5SAlex Gartrell static inline int 1244fd9beefSAlex Gartrell ip_vs_fill_iph_skb_icmp(int af, const struct sk_buff *skb, int offset, 1254fd9beefSAlex Gartrell bool inverse, struct ip_vs_iphdr *iphdr) 126b0e010c5SAlex Gartrell { 1274fd9beefSAlex Gartrell int hdr_flags = IP_VS_HDR_ICMP; 1284fd9beefSAlex Gartrell 1294fd9beefSAlex Gartrell if (inverse) 1304fd9beefSAlex Gartrell hdr_flags |= IP_VS_HDR_INVERSE; 1314fd9beefSAlex Gartrell 1324fd9beefSAlex Gartrell return ip_vs_fill_iph_skb_off(af, skb, offset, hdr_flags, iphdr); 1334fd9beefSAlex Gartrell } 1344fd9beefSAlex Gartrell 1354fd9beefSAlex Gartrell static inline int 1364fd9beefSAlex Gartrell ip_vs_fill_iph_skb(int af, const struct sk_buff *skb, bool inverse, 1374fd9beefSAlex Gartrell struct ip_vs_iphdr *iphdr) 1384fd9beefSAlex Gartrell { 1394fd9beefSAlex Gartrell int hdr_flags = 0; 1404fd9beefSAlex Gartrell 1414fd9beefSAlex Gartrell if (inverse) 1424fd9beefSAlex Gartrell hdr_flags |= IP_VS_HDR_INVERSE; 1434fd9beefSAlex Gartrell 1444fd9beefSAlex Gartrell return ip_vs_fill_iph_skb_off(af, skb, skb_network_offset(skb), 1454fd9beefSAlex Gartrell hdr_flags, iphdr); 1464fd9beefSAlex Gartrell } 1474fd9beefSAlex Gartrell 1484fd9beefSAlex Gartrell static inline bool 1494fd9beefSAlex Gartrell ip_vs_iph_inverse(const struct ip_vs_iphdr *iph) 1504fd9beefSAlex Gartrell { 1514fd9beefSAlex Gartrell return !!(iph->hdr_flags & IP_VS_HDR_INVERSE); 1524fd9beefSAlex Gartrell } 1534fd9beefSAlex Gartrell 1544fd9beefSAlex Gartrell static inline bool 1554fd9beefSAlex Gartrell ip_vs_iph_icmp(const struct ip_vs_iphdr *iph) 1564fd9beefSAlex Gartrell { 
1574fd9beefSAlex Gartrell return !!(iph->hdr_flags & IP_VS_HDR_ICMP); 15864aae3cbSJulius Volz } 15964aae3cbSJulius Volz 16064aae3cbSJulius Volz static inline void ip_vs_addr_copy(int af, union nf_inet_addr *dst, 16164aae3cbSJulius Volz const union nf_inet_addr *src) 16264aae3cbSJulius Volz { 16364aae3cbSJulius Volz #ifdef CONFIG_IP_VS_IPV6 16464aae3cbSJulius Volz if (af == AF_INET6) 1654e3fd7a0SAlexey Dobriyan dst->in6 = src->in6; 16664aae3cbSJulius Volz else 16764aae3cbSJulius Volz #endif 16864aae3cbSJulius Volz dst->ip = src->ip; 16964aae3cbSJulius Volz } 17064aae3cbSJulius Volz 1719a05475cSJulian Anastasov static inline void ip_vs_addr_set(int af, union nf_inet_addr *dst, 1729a05475cSJulian Anastasov const union nf_inet_addr *src) 1739a05475cSJulian Anastasov { 1749a05475cSJulian Anastasov #ifdef CONFIG_IP_VS_IPV6 1759a05475cSJulian Anastasov if (af == AF_INET6) { 1769a05475cSJulian Anastasov dst->in6 = src->in6; 1779a05475cSJulian Anastasov return; 1789a05475cSJulian Anastasov } 1799a05475cSJulian Anastasov #endif 1809a05475cSJulian Anastasov dst->ip = src->ip; 1819a05475cSJulian Anastasov dst->all[1] = 0; 1829a05475cSJulian Anastasov dst->all[2] = 0; 1839a05475cSJulian Anastasov dst->all[3] = 0; 1849a05475cSJulian Anastasov } 1859a05475cSJulian Anastasov 18664aae3cbSJulius Volz static inline int ip_vs_addr_equal(int af, const union nf_inet_addr *a, 18764aae3cbSJulius Volz const union nf_inet_addr *b) 18864aae3cbSJulius Volz { 18964aae3cbSJulius Volz #ifdef CONFIG_IP_VS_IPV6 19064aae3cbSJulius Volz if (af == AF_INET6) 19164aae3cbSJulius Volz return ipv6_addr_equal(&a->in6, &b->in6); 19264aae3cbSJulius Volz #endif 19364aae3cbSJulius Volz return a->ip == b->ip; 19464aae3cbSJulius Volz } 19564aae3cbSJulius Volz 1961da177e4SLinus Torvalds #ifdef CONFIG_IP_VS_DEBUG 19714c85021SArnaldo Carvalho de Melo #include <linux/net.h> 19814c85021SArnaldo Carvalho de Melo 1995c3a0fd7SJoe Perches int ip_vs_get_debug_level(void); 200c842a3adSJulius Volz 201c842a3adSJulius Volz 
static inline const char *ip_vs_dbg_addr(int af, char *buf, size_t buf_len, 202c842a3adSJulius Volz const union nf_inet_addr *addr, 203c842a3adSJulius Volz int *idx) 204c842a3adSJulius Volz { 205c842a3adSJulius Volz int len; 206c842a3adSJulius Volz #ifdef CONFIG_IP_VS_IPV6 207c842a3adSJulius Volz if (af == AF_INET6) 208120b9c14SJesper Dangaard Brouer len = snprintf(&buf[*idx], buf_len - *idx, "[%pI6c]", 2090c6ce78aSHarvey Harrison &addr->in6) + 1; 210c842a3adSJulius Volz else 211c842a3adSJulius Volz #endif 2123685f25dSHarvey Harrison len = snprintf(&buf[*idx], buf_len - *idx, "%pI4", 2133685f25dSHarvey Harrison &addr->ip) + 1; 214c842a3adSJulius Volz 215c842a3adSJulius Volz *idx += len; 216c842a3adSJulius Volz BUG_ON(*idx > buf_len + 1); 217c842a3adSJulius Volz return &buf[*idx - len]; 218c842a3adSJulius Volz } 219c842a3adSJulius Volz 2209aada7acSHannes Eder #define IP_VS_DBG_BUF(level, msg, ...) \ 221c842a3adSJulius Volz do { \ 222c842a3adSJulius Volz char ip_vs_dbg_buf[160]; \ 223c842a3adSJulius Volz int ip_vs_dbg_idx = 0; \ 224c842a3adSJulius Volz if (level <= ip_vs_get_debug_level()) \ 2259aada7acSHannes Eder printk(KERN_DEBUG pr_fmt(msg), ##__VA_ARGS__); \ 226c842a3adSJulius Volz } while (0) 227c842a3adSJulius Volz #define IP_VS_ERR_BUF(msg...) \ 228c842a3adSJulius Volz do { \ 229c842a3adSJulius Volz char ip_vs_dbg_buf[160]; \ 230c842a3adSJulius Volz int ip_vs_dbg_idx = 0; \ 2319aada7acSHannes Eder pr_err(msg); \ 232c842a3adSJulius Volz } while (0) 233c842a3adSJulius Volz 234c842a3adSJulius Volz /* Only use from within IP_VS_DBG_BUF() or IP_VS_ERR_BUF macros */ 235c842a3adSJulius Volz #define IP_VS_DBG_ADDR(af, addr) \ 236c842a3adSJulius Volz ip_vs_dbg_addr(af, ip_vs_dbg_buf, \ 237c842a3adSJulius Volz sizeof(ip_vs_dbg_buf), addr, \ 238c842a3adSJulius Volz &ip_vs_dbg_idx) 239c842a3adSJulius Volz 2409aada7acSHannes Eder #define IP_VS_DBG(level, msg, ...) 
\ 2411da177e4SLinus Torvalds do { \ 2421da177e4SLinus Torvalds if (level <= ip_vs_get_debug_level()) \ 2439aada7acSHannes Eder printk(KERN_DEBUG pr_fmt(msg), ##__VA_ARGS__); \ 2441da177e4SLinus Torvalds } while (0) 2459aada7acSHannes Eder #define IP_VS_DBG_RL(msg, ...) \ 2461da177e4SLinus Torvalds do { \ 2471da177e4SLinus Torvalds if (net_ratelimit()) \ 2489aada7acSHannes Eder printk(KERN_DEBUG pr_fmt(msg), ##__VA_ARGS__); \ 2491da177e4SLinus Torvalds } while (0) 2500d79641aSJulian Anastasov #define IP_VS_DBG_PKT(level, af, pp, skb, ofs, msg) \ 2511da177e4SLinus Torvalds do { \ 2521da177e4SLinus Torvalds if (level <= ip_vs_get_debug_level()) \ 2530d79641aSJulian Anastasov pp->debug_packet(af, pp, skb, ofs, msg); \ 2541da177e4SLinus Torvalds } while (0) 2550d79641aSJulian Anastasov #define IP_VS_DBG_RL_PKT(level, af, pp, skb, ofs, msg) \ 2561da177e4SLinus Torvalds do { \ 2571da177e4SLinus Torvalds if (level <= ip_vs_get_debug_level() && \ 2581da177e4SLinus Torvalds net_ratelimit()) \ 2590d79641aSJulian Anastasov pp->debug_packet(af, pp, skb, ofs, msg); \ 2601da177e4SLinus Torvalds } while (0) 2611da177e4SLinus Torvalds #else /* NO DEBUGGING at ALL */ 262c842a3adSJulius Volz #define IP_VS_DBG_BUF(level, msg...) do {} while (0) 263c842a3adSJulius Volz #define IP_VS_ERR_BUF(msg...) do {} while (0) 2641da177e4SLinus Torvalds #define IP_VS_DBG(level, msg...) do {} while (0) 2651da177e4SLinus Torvalds #define IP_VS_DBG_RL(msg...) do {} while (0) 2660d79641aSJulian Anastasov #define IP_VS_DBG_PKT(level, af, pp, skb, ofs, msg) do {} while (0) 2670d79641aSJulian Anastasov #define IP_VS_DBG_RL_PKT(level, af, pp, skb, ofs, msg) do {} while (0) 2681da177e4SLinus Torvalds #endif 2691da177e4SLinus Torvalds 2701da177e4SLinus Torvalds #define IP_VS_BUG() BUG() 2711e3e238eSHannes Eder #define IP_VS_ERR_RL(msg, ...) 
\ 2721da177e4SLinus Torvalds do { \ 2731da177e4SLinus Torvalds if (net_ratelimit()) \ 2741e3e238eSHannes Eder pr_err(msg, ##__VA_ARGS__); \ 2751da177e4SLinus Torvalds } while (0) 2761da177e4SLinus Torvalds 2771da177e4SLinus Torvalds #ifdef CONFIG_IP_VS_DEBUG 2781da177e4SLinus Torvalds #define EnterFunction(level) \ 2791da177e4SLinus Torvalds do { \ 2801da177e4SLinus Torvalds if (level <= ip_vs_get_debug_level()) \ 2819aada7acSHannes Eder printk(KERN_DEBUG \ 2829aada7acSHannes Eder pr_fmt("Enter: %s, %s line %i\n"), \ 283d5c003b4SHarvey Harrison __func__, __FILE__, __LINE__); \ 2841da177e4SLinus Torvalds } while (0) 2851da177e4SLinus Torvalds #define LeaveFunction(level) \ 2861da177e4SLinus Torvalds do { \ 2871da177e4SLinus Torvalds if (level <= ip_vs_get_debug_level()) \ 2889aada7acSHannes Eder printk(KERN_DEBUG \ 2899aada7acSHannes Eder pr_fmt("Leave: %s, %s line %i\n"), \ 290d5c003b4SHarvey Harrison __func__, __FILE__, __LINE__); \ 2911da177e4SLinus Torvalds } while (0) 2921da177e4SLinus Torvalds #else 2931da177e4SLinus Torvalds #define EnterFunction(level) do {} while (0) 2941da177e4SLinus Torvalds #define LeaveFunction(level) do {} while (0) 2951da177e4SLinus Torvalds #endif 2961da177e4SLinus Torvalds 29707dcc686SSimon Horman /* The port number of FTP service (in network order). 
*/ 298f3a7c66bSHarvey Harrison #define FTPPORT cpu_to_be16(21) 299f3a7c66bSHarvey Harrison #define FTPDATA cpu_to_be16(20) 3001da177e4SLinus Torvalds 30107dcc686SSimon Horman /* TCP State Values */ 3021da177e4SLinus Torvalds enum { 3031da177e4SLinus Torvalds IP_VS_TCP_S_NONE = 0, 3041da177e4SLinus Torvalds IP_VS_TCP_S_ESTABLISHED, 3051da177e4SLinus Torvalds IP_VS_TCP_S_SYN_SENT, 3061da177e4SLinus Torvalds IP_VS_TCP_S_SYN_RECV, 3071da177e4SLinus Torvalds IP_VS_TCP_S_FIN_WAIT, 3081da177e4SLinus Torvalds IP_VS_TCP_S_TIME_WAIT, 3091da177e4SLinus Torvalds IP_VS_TCP_S_CLOSE, 3101da177e4SLinus Torvalds IP_VS_TCP_S_CLOSE_WAIT, 3111da177e4SLinus Torvalds IP_VS_TCP_S_LAST_ACK, 3121da177e4SLinus Torvalds IP_VS_TCP_S_LISTEN, 3131da177e4SLinus Torvalds IP_VS_TCP_S_SYNACK, 3141da177e4SLinus Torvalds IP_VS_TCP_S_LAST 3151da177e4SLinus Torvalds }; 3161da177e4SLinus Torvalds 31707dcc686SSimon Horman /* UDP State Values */ 3181da177e4SLinus Torvalds enum { 3191da177e4SLinus Torvalds IP_VS_UDP_S_NORMAL, 3201da177e4SLinus Torvalds IP_VS_UDP_S_LAST, 3211da177e4SLinus Torvalds }; 3221da177e4SLinus Torvalds 32307dcc686SSimon Horman /* ICMP State Values */ 3241da177e4SLinus Torvalds enum { 3251da177e4SLinus Torvalds IP_VS_ICMP_S_NORMAL, 3261da177e4SLinus Torvalds IP_VS_ICMP_S_LAST, 3271da177e4SLinus Torvalds }; 3281da177e4SLinus Torvalds 32907dcc686SSimon Horman /* SCTP State Values */ 3302906f66aSVenkata Mohan Reddy enum ip_vs_sctp_states { 3312906f66aSVenkata Mohan Reddy IP_VS_SCTP_S_NONE, 33261e7c420SJulian Anastasov IP_VS_SCTP_S_INIT1, 33361e7c420SJulian Anastasov IP_VS_SCTP_S_INIT, 33461e7c420SJulian Anastasov IP_VS_SCTP_S_COOKIE_SENT, 33561e7c420SJulian Anastasov IP_VS_SCTP_S_COOKIE_REPLIED, 33661e7c420SJulian Anastasov IP_VS_SCTP_S_COOKIE_WAIT, 33761e7c420SJulian Anastasov IP_VS_SCTP_S_COOKIE, 33861e7c420SJulian Anastasov IP_VS_SCTP_S_COOKIE_ECHOED, 3392906f66aSVenkata Mohan Reddy IP_VS_SCTP_S_ESTABLISHED, 34061e7c420SJulian Anastasov IP_VS_SCTP_S_SHUTDOWN_SENT, 34161e7c420SJulian 
Anastasov IP_VS_SCTP_S_SHUTDOWN_RECEIVED, 34261e7c420SJulian Anastasov IP_VS_SCTP_S_SHUTDOWN_ACK_SENT, 34361e7c420SJulian Anastasov IP_VS_SCTP_S_REJECTED, 3442906f66aSVenkata Mohan Reddy IP_VS_SCTP_S_CLOSED, 3452906f66aSVenkata Mohan Reddy IP_VS_SCTP_S_LAST 3462906f66aSVenkata Mohan Reddy }; 3472906f66aSVenkata Mohan Reddy 34807dcc686SSimon Horman /* Delta sequence info structure 3491da177e4SLinus Torvalds * Each ip_vs_conn has 2 (output AND input seq. changes). 3501da177e4SLinus Torvalds * Only used in the VS/NAT. 3511da177e4SLinus Torvalds */ 3521da177e4SLinus Torvalds struct ip_vs_seq { 3531da177e4SLinus Torvalds __u32 init_seq; /* Add delta from this seq */ 3541da177e4SLinus Torvalds __u32 delta; /* Delta in sequence numbers */ 3551da177e4SLinus Torvalds __u32 previous_delta; /* Delta in sequence numbers 35607dcc686SSimon Horman * before last resized pkt */ 3571da177e4SLinus Torvalds }; 3581da177e4SLinus Torvalds 35907dcc686SSimon Horman /* counters per cpu */ 360b17fc996SHans Schillstrom struct ip_vs_counters { 361cd67cd5eSJulian Anastasov __u64 conns; /* connections scheduled */ 362cd67cd5eSJulian Anastasov __u64 inpkts; /* incoming packets */ 363cd67cd5eSJulian Anastasov __u64 outpkts; /* outgoing packets */ 364b17fc996SHans Schillstrom __u64 inbytes; /* incoming bytes */ 365b17fc996SHans Schillstrom __u64 outbytes; /* outgoing bytes */ 366b17fc996SHans Schillstrom }; 36707dcc686SSimon Horman /* Stats per cpu */ 368b17fc996SHans Schillstrom struct ip_vs_cpu_stats { 369cd67cd5eSJulian Anastasov struct ip_vs_counters cnt; 370b17fc996SHans Schillstrom struct u64_stats_sync syncp; 371b17fc996SHans Schillstrom }; 3721da177e4SLinus Torvalds 37307dcc686SSimon Horman /* IPVS statistics objects */ 3743a14a313SSven Wegener struct ip_vs_estimator { 3753a14a313SSven Wegener struct list_head list; 3763a14a313SSven Wegener 3773a14a313SSven Wegener u64 last_inbytes; 3783a14a313SSven Wegener u64 last_outbytes; 379cd67cd5eSJulian Anastasov u64 last_conns; 380cd67cd5eSJulian 
Anastasov u64 last_inpkts; 381cd67cd5eSJulian Anastasov u64 last_outpkts; 3823a14a313SSven Wegener 383cd67cd5eSJulian Anastasov u64 cps; 384cd67cd5eSJulian Anastasov u64 inpps; 385cd67cd5eSJulian Anastasov u64 outpps; 386cd67cd5eSJulian Anastasov u64 inbps; 387cd67cd5eSJulian Anastasov u64 outbps; 388cd67cd5eSJulian Anastasov }; 389cd67cd5eSJulian Anastasov 390cd67cd5eSJulian Anastasov /* 391cd67cd5eSJulian Anastasov * IPVS statistics object, 64-bit kernel version of struct ip_vs_stats_user 392cd67cd5eSJulian Anastasov */ 393cd67cd5eSJulian Anastasov struct ip_vs_kstats { 394cd67cd5eSJulian Anastasov u64 conns; /* connections scheduled */ 395cd67cd5eSJulian Anastasov u64 inpkts; /* incoming packets */ 396cd67cd5eSJulian Anastasov u64 outpkts; /* outgoing packets */ 397cd67cd5eSJulian Anastasov u64 inbytes; /* incoming bytes */ 398cd67cd5eSJulian Anastasov u64 outbytes; /* outgoing bytes */ 399cd67cd5eSJulian Anastasov 400cd67cd5eSJulian Anastasov u64 cps; /* current connection rate */ 401cd67cd5eSJulian Anastasov u64 inpps; /* current in packet rate */ 402cd67cd5eSJulian Anastasov u64 outpps; /* current out packet rate */ 403cd67cd5eSJulian Anastasov u64 inbps; /* current in byte rate */ 404cd67cd5eSJulian Anastasov u64 outbps; /* current out byte rate */ 4053a14a313SSven Wegener }; 4063a14a313SSven Wegener 407fd2c3ef7SEric Dumazet struct ip_vs_stats { 408cd67cd5eSJulian Anastasov struct ip_vs_kstats kstats; /* kernel statistics */ 409e9c0ce23SSven Wegener struct ip_vs_estimator est; /* estimator */ 410b962abdcSJulian Anastasov struct ip_vs_cpu_stats __percpu *cpustats; /* per cpu counters */ 4111da177e4SLinus Torvalds spinlock_t lock; /* spin lock */ 412cd67cd5eSJulian Anastasov struct ip_vs_kstats kstats0; /* reset values */ 4131da177e4SLinus Torvalds }; 4141da177e4SLinus Torvalds 41514c85021SArnaldo Carvalho de Melo struct dst_entry; 41614c85021SArnaldo Carvalho de Melo struct iphdr; 4171da177e4SLinus Torvalds struct ip_vs_conn; 4181da177e4SLinus Torvalds struct 
ip_vs_app; 41914c85021SArnaldo Carvalho de Melo struct sk_buff; 420252c6410SHans Schillstrom struct ip_vs_proto_data; 4211da177e4SLinus Torvalds 4221da177e4SLinus Torvalds struct ip_vs_protocol { 4231da177e4SLinus Torvalds struct ip_vs_protocol *next; 4241da177e4SLinus Torvalds char *name; 4252ad17defSJulian Anastasov u16 protocol; 4262ad17defSJulian Anastasov u16 num_states; 4271da177e4SLinus Torvalds int dont_defrag; 4281da177e4SLinus Torvalds 4291da177e4SLinus Torvalds void (*init)(struct ip_vs_protocol *pp); 4301da177e4SLinus Torvalds 4311da177e4SLinus Torvalds void (*exit)(struct ip_vs_protocol *pp); 4321da177e4SLinus Torvalds 4331281a9c2SEric W. Biederman int (*init_netns)(struct netns_ipvs *ipvs, struct ip_vs_proto_data *pd); 434252c6410SHans Schillstrom 4351281a9c2SEric W. Biederman void (*exit_netns)(struct netns_ipvs *ipvs, struct ip_vs_proto_data *pd); 436252c6410SHans Schillstrom 437d8f44c33SEric W. Biederman int (*conn_schedule)(struct netns_ipvs *ipvs, 438d8f44c33SEric W. Biederman int af, struct sk_buff *skb, 4399330419dSHans Schillstrom struct ip_vs_proto_data *pd, 440d4383f04SJesper Dangaard Brouer int *verdict, struct ip_vs_conn **cpp, 441d4383f04SJesper Dangaard Brouer struct ip_vs_iphdr *iph); 4421da177e4SLinus Torvalds 4431da177e4SLinus Torvalds struct ip_vs_conn * 444ab161976SEric W. Biederman (*conn_in_get)(struct netns_ipvs *ipvs, 445ab161976SEric W. Biederman int af, 44651ef348bSJulius Volz const struct sk_buff *skb, 447802c41adSAlex Gartrell const struct ip_vs_iphdr *iph); 4481da177e4SLinus Torvalds 4491da177e4SLinus Torvalds struct ip_vs_conn * 4500cf705c8SEric W. Biederman (*conn_out_get)(struct netns_ipvs *ipvs, 4510cf705c8SEric W. 
Biederman int af, 45251ef348bSJulius Volz const struct sk_buff *skb, 453802c41adSAlex Gartrell const struct ip_vs_iphdr *iph); 4541da177e4SLinus Torvalds 455d4383f04SJesper Dangaard Brouer int (*snat_handler)(struct sk_buff *skb, struct ip_vs_protocol *pp, 456d4383f04SJesper Dangaard Brouer struct ip_vs_conn *cp, struct ip_vs_iphdr *iph); 4571da177e4SLinus Torvalds 458d4383f04SJesper Dangaard Brouer int (*dnat_handler)(struct sk_buff *skb, struct ip_vs_protocol *pp, 459d4383f04SJesper Dangaard Brouer struct ip_vs_conn *cp, struct ip_vs_iphdr *iph); 4601da177e4SLinus Torvalds 46151ef348bSJulius Volz int (*csum_check)(int af, struct sk_buff *skb, 46251ef348bSJulius Volz struct ip_vs_protocol *pp); 4631da177e4SLinus Torvalds 4641da177e4SLinus Torvalds const char *(*state_name)(int state); 4651da177e4SLinus Torvalds 4664a516f11SSimon Horman void (*state_transition)(struct ip_vs_conn *cp, int direction, 4671da177e4SLinus Torvalds const struct sk_buff *skb, 4689330419dSHans Schillstrom struct ip_vs_proto_data *pd); 4691da177e4SLinus Torvalds 47019648918SEric W. Biederman int (*register_app)(struct netns_ipvs *ipvs, struct ip_vs_app *inc); 4711da177e4SLinus Torvalds 47219648918SEric W. 
Biederman void (*unregister_app)(struct netns_ipvs *ipvs, struct ip_vs_app *inc); 4731da177e4SLinus Torvalds 4741da177e4SLinus Torvalds int (*app_conn_bind)(struct ip_vs_conn *cp); 4751da177e4SLinus Torvalds 4760d79641aSJulian Anastasov void (*debug_packet)(int af, struct ip_vs_protocol *pp, 4771da177e4SLinus Torvalds const struct sk_buff *skb, 4781da177e4SLinus Torvalds int offset, 4791da177e4SLinus Torvalds const char *msg); 4801da177e4SLinus Torvalds 4819330419dSHans Schillstrom void (*timeout_change)(struct ip_vs_proto_data *pd, int flags); 4821da177e4SLinus Torvalds }; 4831da177e4SLinus Torvalds 48407dcc686SSimon Horman /* protocol data per netns */ 485252c6410SHans Schillstrom struct ip_vs_proto_data { 486252c6410SHans Schillstrom struct ip_vs_proto_data *next; 487252c6410SHans Schillstrom struct ip_vs_protocol *pp; 488252c6410SHans Schillstrom int *timeout_table; /* protocol timeout table */ 489252c6410SHans Schillstrom atomic_t appcnt; /* counter of proto app incs. */ 490252c6410SHans Schillstrom struct tcp_states_t *tcp_state_table; 491252c6410SHans Schillstrom }; 492252c6410SHans Schillstrom 4935c3a0fd7SJoe Perches struct ip_vs_protocol *ip_vs_proto_get(unsigned short proto); 49418d6ade6SEric W. Biederman struct ip_vs_proto_data *ip_vs_proto_data_get(struct netns_ipvs *ipvs, 495252c6410SHans Schillstrom unsigned short proto); 4961da177e4SLinus Torvalds 497f11017ecSSimon Horman struct ip_vs_conn_param { 498e64e2b46SEric W. 
Biederman struct netns_ipvs *ipvs; 499f11017ecSSimon Horman const union nf_inet_addr *caddr; 500f11017ecSSimon Horman const union nf_inet_addr *vaddr; 501f11017ecSSimon Horman __be16 cport; 502f11017ecSSimon Horman __be16 vport; 503f11017ecSSimon Horman __u16 protocol; 504f11017ecSSimon Horman u16 af; 50585999283SSimon Horman 50685999283SSimon Horman const struct ip_vs_pe *pe; 50785999283SSimon Horman char *pe_data; 50885999283SSimon Horman __u8 pe_data_len; 509f11017ecSSimon Horman }; 510f11017ecSSimon Horman 51107dcc686SSimon Horman /* IP_VS structure allocated for each dynamically scheduled connection */ 5121da177e4SLinus Torvalds struct ip_vs_conn { 513731109e7SChangli Gao struct hlist_node c_list; /* hashed list heads */ 5141da177e4SLinus Torvalds /* Protocol, addresses and port numbers */ 5156e67e586SHans Schillstrom __be16 cport; 5166e67e586SHans Schillstrom __be16 dport; 5171845ed0bSJulian Anastasov __be16 vport; 5181845ed0bSJulian Anastasov u16 af; /* address family */ 519e7ade46aSJulius Volz union nf_inet_addr caddr; /* client address */ 520e7ade46aSJulius Volz union nf_inet_addr vaddr; /* virtual address */ 521e7ade46aSJulius Volz union nf_inet_addr daddr; /* destination address */ 5223575792eSJulian Anastasov volatile __u32 flags; /* status flags */ 5231da177e4SLinus Torvalds __u16 protocol; /* Which protocol (TCP/UDP) */ 524ba38528aSAlex Gartrell __u16 daf; /* Address family of the dest */ 52558dbc6f2SEric W. 
Biederman struct netns_ipvs *ipvs; 5261da177e4SLinus Torvalds 5271da177e4SLinus Torvalds /* counter and timer */ 5281da177e4SLinus Torvalds atomic_t refcnt; /* reference count */ 5291da177e4SLinus Torvalds struct timer_list timer; /* Expiration timer */ 5301da177e4SLinus Torvalds volatile unsigned long timeout; /* timeout */ 5311da177e4SLinus Torvalds 5321da177e4SLinus Torvalds /* Flags and state transition */ 5331da177e4SLinus Torvalds spinlock_t lock; /* lock for state transition */ 5341da177e4SLinus Torvalds volatile __u16 state; /* state info */ 535efac5276SRumen G. Bogdanovski volatile __u16 old_state; /* old state, to be used for 536efac5276SRumen G. Bogdanovski * state transition triggerd 537efac5276SRumen G. Bogdanovski * synchronization 538efac5276SRumen G. Bogdanovski */ 5391845ed0bSJulian Anastasov __u32 fwmark; /* Fire wall mark from skb */ 540749c42b6SJulian Anastasov unsigned long sync_endtime; /* jiffies + sent_retries */ 5411da177e4SLinus Torvalds 5421da177e4SLinus Torvalds /* Control members */ 5431da177e4SLinus Torvalds struct ip_vs_conn *control; /* Master control connection */ 5441da177e4SLinus Torvalds atomic_t n_control; /* Number of controlled ones */ 5451da177e4SLinus Torvalds struct ip_vs_dest *dest; /* real server */ 5461da177e4SLinus Torvalds atomic_t in_pkts; /* incoming packet counter */ 5471da177e4SLinus Torvalds 54807dcc686SSimon Horman /* Packet transmitter for different forwarding methods. If it 54907dcc686SSimon Horman * mangles the packet, it must return NF_DROP or better NF_STOLEN, 55007dcc686SSimon Horman * otherwise this must be changed to a sk_buff **. 55107dcc686SSimon Horman * NF_ACCEPT can be returned when destination is local. 
5521da177e4SLinus Torvalds */ 5531da177e4SLinus Torvalds int (*packet_xmit)(struct sk_buff *skb, struct ip_vs_conn *cp, 554d4383f04SJesper Dangaard Brouer struct ip_vs_protocol *pp, struct ip_vs_iphdr *iph); 5551da177e4SLinus Torvalds 5561da177e4SLinus Torvalds /* Note: we can group the following members into a structure, 55707dcc686SSimon Horman * in order to save more space, and the following members are 55807dcc686SSimon Horman * only used in VS/NAT anyway 55907dcc686SSimon Horman */ 5601da177e4SLinus Torvalds struct ip_vs_app *app; /* bound ip_vs_app object */ 5611da177e4SLinus Torvalds void *app_data; /* Application private data */ 5621da177e4SLinus Torvalds struct ip_vs_seq in_seq; /* incoming seq. struct */ 5631da177e4SLinus Torvalds struct ip_vs_seq out_seq; /* outgoing seq. struct */ 56485999283SSimon Horman 565e9e5eee8SSimon Horman const struct ip_vs_pe *pe; 56685999283SSimon Horman char *pe_data; 56785999283SSimon Horman __u8 pe_data_len; 568088339a5SJulian Anastasov 569088339a5SJulian Anastasov struct rcu_head rcu_head; 5701da177e4SLinus Torvalds }; 5711da177e4SLinus Torvalds 57207dcc686SSimon Horman /* Extended internal versions of struct ip_vs_service_user and ip_vs_dest_user 57307dcc686SSimon Horman * for IPv6 support. 574c860c6b1SJulius Volz * 575c860c6b1SJulius Volz * We need these to conveniently pass around service and destination 576c860c6b1SJulius Volz * options, but unfortunately, we also need to keep the old definitions to 577c860c6b1SJulius Volz * maintain userspace backwards compatibility for the setsockopt interface. 
578c860c6b1SJulius Volz */ 579c860c6b1SJulius Volz struct ip_vs_service_user_kern { 580c860c6b1SJulius Volz /* virtual service addresses */ 581c860c6b1SJulius Volz u16 af; 582c860c6b1SJulius Volz u16 protocol; 583c860c6b1SJulius Volz union nf_inet_addr addr; /* virtual ip address */ 5840a925864SJulian Anastasov __be16 port; 585c860c6b1SJulius Volz u32 fwmark; /* firwall mark of service */ 586c860c6b1SJulius Volz 587c860c6b1SJulius Volz /* virtual service options */ 588c860c6b1SJulius Volz char *sched_name; 5890d1e71b0SSimon Horman char *pe_name; 59095c96174SEric Dumazet unsigned int flags; /* virtual service flags */ 59195c96174SEric Dumazet unsigned int timeout; /* persistent timeout in sec */ 5920a925864SJulian Anastasov __be32 netmask; /* persistent netmask or plen */ 593c860c6b1SJulius Volz }; 594c860c6b1SJulius Volz 595c860c6b1SJulius Volz 596c860c6b1SJulius Volz struct ip_vs_dest_user_kern { 597c860c6b1SJulius Volz /* destination server address */ 598c860c6b1SJulius Volz union nf_inet_addr addr; 5990a925864SJulian Anastasov __be16 port; 600c860c6b1SJulius Volz 601c860c6b1SJulius Volz /* real server options */ 60295c96174SEric Dumazet unsigned int conn_flags; /* connection flags */ 603c860c6b1SJulius Volz int weight; /* destination weight */ 604c860c6b1SJulius Volz 605c860c6b1SJulius Volz /* thresholds for active connections */ 606c860c6b1SJulius Volz u32 u_threshold; /* upper threshold */ 607c860c6b1SJulius Volz u32 l_threshold; /* lower threshold */ 6086cff339bSAlex Gartrell 6096cff339bSAlex Gartrell /* Address family of addr */ 6106cff339bSAlex Gartrell u16 af; 611c860c6b1SJulius Volz }; 612c860c6b1SJulius Volz 613c860c6b1SJulius Volz 614c860c6b1SJulius Volz /* 61507dcc686SSimon Horman * The information about the virtual service offered to the net and the 61607dcc686SSimon Horman * forwarding entries. 
6171da177e4SLinus Torvalds */ 6181da177e4SLinus Torvalds struct ip_vs_service { 619ceec4c38SJulian Anastasov struct hlist_node s_list; /* for normal service table */ 620ceec4c38SJulian Anastasov struct hlist_node f_list; /* for fwmark-based service table */ 6211da177e4SLinus Torvalds atomic_t refcnt; /* reference counter */ 6221da177e4SLinus Torvalds 623e7ade46aSJulius Volz u16 af; /* address family */ 6241da177e4SLinus Torvalds __u16 protocol; /* which protocol (TCP/UDP) */ 625e7ade46aSJulius Volz union nf_inet_addr addr; /* IP address for virtual service */ 626014d730dSAl Viro __be16 port; /* port number for the service */ 6271da177e4SLinus Torvalds __u32 fwmark; /* firewall mark of the service */ 62895c96174SEric Dumazet unsigned int flags; /* service status flags */ 62995c96174SEric Dumazet unsigned int timeout; /* persistent timeout in ticks */ 6300a925864SJulian Anastasov __be32 netmask; /* grouping granularity, mask/plen */ 6313109d2f2SEric W. Biederman struct netns_ipvs *ipvs; 6321da177e4SLinus Torvalds 6331da177e4SLinus Torvalds struct list_head destinations; /* real server d-linked list */ 6341da177e4SLinus Torvalds __u32 num_dests; /* number of servers */ 6351da177e4SLinus Torvalds struct ip_vs_stats stats; /* statistics for the service */ 6361da177e4SLinus Torvalds 6371da177e4SLinus Torvalds /* for scheduling */ 638ceec4c38SJulian Anastasov struct ip_vs_scheduler __rcu *scheduler; /* bound scheduler object */ 639ba3a3ce1SJulian Anastasov spinlock_t sched_lock; /* lock sched_data */ 6401da177e4SLinus Torvalds void *sched_data; /* scheduler application data */ 64185999283SSimon Horman 64285999283SSimon Horman /* alternate persistence engine */ 643ceec4c38SJulian Anastasov struct ip_vs_pe __rcu *pe; 644ceec4c38SJulian Anastasov 645ceec4c38SJulian Anastasov struct rcu_head rcu_head; 6461da177e4SLinus Torvalds }; 6471da177e4SLinus Torvalds 648026ace06SJulian Anastasov /* Information for cached dst */ 649026ace06SJulian Anastasov struct ip_vs_dest_dst { 
650026ace06SJulian Anastasov struct dst_entry *dst_cache; /* destination cache entry */ 651026ace06SJulian Anastasov u32 dst_cookie; 652026ace06SJulian Anastasov union nf_inet_addr dst_saddr; 653026ace06SJulian Anastasov struct rcu_head rcu_head; 654026ace06SJulian Anastasov }; 6551da177e4SLinus Torvalds 65607dcc686SSimon Horman /* The real server destination forwarding entry with ip address, port number, 65707dcc686SSimon Horman * and so on. 6581da177e4SLinus Torvalds */ 6591da177e4SLinus Torvalds struct ip_vs_dest { 6601da177e4SLinus Torvalds struct list_head n_list; /* for the dests in the service */ 661276472eaSJulian Anastasov struct hlist_node d_list; /* for table with all the dests */ 6621da177e4SLinus Torvalds 663e7ade46aSJulius Volz u16 af; /* address family */ 664014d730dSAl Viro __be16 port; /* port number of the server */ 665f2431e6eSHans Schillstrom union nf_inet_addr addr; /* IP address of the server */ 66695c96174SEric Dumazet volatile unsigned int flags; /* dest status flags */ 6671da177e4SLinus Torvalds atomic_t conn_flags; /* flags to copy to conn */ 6681da177e4SLinus Torvalds atomic_t weight; /* server weight */ 6691da177e4SLinus Torvalds 6701da177e4SLinus Torvalds atomic_t refcnt; /* reference counter */ 6711da177e4SLinus Torvalds struct ip_vs_stats stats; /* statistics */ 672bcbde4c0SJulian Anastasov unsigned long idle_start; /* start time, jiffies */ 6731da177e4SLinus Torvalds 6741da177e4SLinus Torvalds /* connection counters and thresholds */ 6751da177e4SLinus Torvalds atomic_t activeconns; /* active connections */ 6761da177e4SLinus Torvalds atomic_t inactconns; /* inactive connections */ 6771da177e4SLinus Torvalds atomic_t persistconns; /* persistent connections */ 6781da177e4SLinus Torvalds __u32 u_threshold; /* upper threshold */ 6791da177e4SLinus Torvalds __u32 l_threshold; /* lower threshold */ 6801da177e4SLinus Torvalds 6811da177e4SLinus Torvalds /* for destination cache */ 6821da177e4SLinus Torvalds spinlock_t dst_lock; /* lock of 
dst_cache */ 683026ace06SJulian Anastasov struct ip_vs_dest_dst __rcu *dest_dst; /* cached dst info */ 6841da177e4SLinus Torvalds 6851da177e4SLinus Torvalds /* for virtual service */ 686bcbde4c0SJulian Anastasov struct ip_vs_service __rcu *svc; /* service it belongs to */ 6871da177e4SLinus Torvalds __u16 protocol; /* which protocol (TCP/UDP) */ 688014d730dSAl Viro __be16 vport; /* virtual port number */ 689f2431e6eSHans Schillstrom union nf_inet_addr vaddr; /* virtual IP address */ 6901da177e4SLinus Torvalds __u32 vfwmark; /* firewall mark of service */ 691276472eaSJulian Anastasov 692578bc3efSJulian Anastasov struct list_head t_list; /* in dest_trash */ 693276472eaSJulian Anastasov unsigned int in_rs_table:1; /* we are in rs_table */ 6941da177e4SLinus Torvalds }; 6951da177e4SLinus Torvalds 69607dcc686SSimon Horman /* The scheduler object */ 6971da177e4SLinus Torvalds struct ip_vs_scheduler { 6981da177e4SLinus Torvalds struct list_head n_list; /* d-linked list head */ 6991da177e4SLinus Torvalds char *name; /* scheduler name */ 7001da177e4SLinus Torvalds atomic_t refcnt; /* reference counter */ 7011da177e4SLinus Torvalds struct module *module; /* THIS_MODULE/NULL */ 7021da177e4SLinus Torvalds 7031da177e4SLinus Torvalds /* scheduler initializing service */ 7041da177e4SLinus Torvalds int (*init_service)(struct ip_vs_service *svc); 7051da177e4SLinus Torvalds /* scheduling service finish */ 706ed3ffc4eSJulian Anastasov void (*done_service)(struct ip_vs_service *svc); 7076b6df466SJulian Anastasov /* dest is linked */ 7086b6df466SJulian Anastasov int (*add_dest)(struct ip_vs_service *svc, struct ip_vs_dest *dest); 7096b6df466SJulian Anastasov /* dest is unlinked */ 7106b6df466SJulian Anastasov int (*del_dest)(struct ip_vs_service *svc, struct ip_vs_dest *dest); 7116b6df466SJulian Anastasov /* dest is updated */ 7126b6df466SJulian Anastasov int (*upd_dest)(struct ip_vs_service *svc, struct ip_vs_dest *dest); 7131da177e4SLinus Torvalds 7141da177e4SLinus Torvalds /* 
selecting a server from the given service */ 7151da177e4SLinus Torvalds struct ip_vs_dest* (*schedule)(struct ip_vs_service *svc, 716bba54de5SJulian Anastasov const struct sk_buff *skb, 717bba54de5SJulian Anastasov struct ip_vs_iphdr *iph); 7181da177e4SLinus Torvalds }; 7191da177e4SLinus Torvalds 72085999283SSimon Horman /* The persistence engine object */ 72185999283SSimon Horman struct ip_vs_pe { 72285999283SSimon Horman struct list_head n_list; /* d-linked list head */ 72385999283SSimon Horman char *name; /* scheduler name */ 72485999283SSimon Horman atomic_t refcnt; /* reference counter */ 72585999283SSimon Horman struct module *module; /* THIS_MODULE/NULL */ 72685999283SSimon Horman 72785999283SSimon Horman /* get the connection template, if any */ 72885999283SSimon Horman int (*fill_param)(struct ip_vs_conn_param *p, struct sk_buff *skb); 72985999283SSimon Horman bool (*ct_match)(const struct ip_vs_conn_param *p, 73085999283SSimon Horman struct ip_vs_conn *ct); 73185999283SSimon Horman u32 (*hashkey_raw)(const struct ip_vs_conn_param *p, u32 initval, 73285999283SSimon Horman bool inverse); 733a3c918acSSimon Horman int (*show_pe_data)(const struct ip_vs_conn *cp, char *buf); 73439b97223SMarco Angaroni /* create connections for real-server outgoing packets */ 73539b97223SMarco Angaroni struct ip_vs_conn* (*conn_out)(struct ip_vs_service *svc, 73639b97223SMarco Angaroni struct ip_vs_dest *dest, 73739b97223SMarco Angaroni struct sk_buff *skb, 73839b97223SMarco Angaroni const struct ip_vs_iphdr *iph, 73939b97223SMarco Angaroni __be16 dport, __be16 cport); 74085999283SSimon Horman }; 7411da177e4SLinus Torvalds 74207dcc686SSimon Horman /* The application module object (a.k.a. 
app incarnation) */ 743fd2c3ef7SEric Dumazet struct ip_vs_app { 7441da177e4SLinus Torvalds struct list_head a_list; /* member in app list */ 7451da177e4SLinus Torvalds int type; /* IP_VS_APP_TYPE_xxx */ 7461da177e4SLinus Torvalds char *name; /* application module name */ 7471da177e4SLinus Torvalds __u16 protocol; 7481da177e4SLinus Torvalds struct module *module; /* THIS_MODULE/NULL */ 7491da177e4SLinus Torvalds struct list_head incs_list; /* list of incarnations */ 7501da177e4SLinus Torvalds 7511da177e4SLinus Torvalds /* members for application incarnations */ 7521da177e4SLinus Torvalds struct list_head p_list; /* member in proto app list */ 7531da177e4SLinus Torvalds struct ip_vs_app *app; /* its real application */ 754014d730dSAl Viro __be16 port; /* port number in net order */ 7551da177e4SLinus Torvalds atomic_t usecnt; /* usage counter */ 756363c97d7SJulian Anastasov struct rcu_head rcu_head; 7571da177e4SLinus Torvalds 75807dcc686SSimon Horman /* output hook: Process packet in inout direction, diff set for TCP. 7598b27b10fSJulian Anastasov * Return: 0=Error, 1=Payload Not Mangled/Mangled but checksum is ok, 7608b27b10fSJulian Anastasov * 2=Mangled but checksum was not updated 7618b27b10fSJulian Anastasov */ 7621da177e4SLinus Torvalds int (*pkt_out)(struct ip_vs_app *, struct ip_vs_conn *, 7633db05feaSHerbert Xu struct sk_buff *, int *diff); 7641da177e4SLinus Torvalds 76507dcc686SSimon Horman /* input hook: Process packet in outin direction, diff set for TCP. 
7668b27b10fSJulian Anastasov * Return: 0=Error, 1=Payload Not Mangled/Mangled but checksum is ok, 7678b27b10fSJulian Anastasov * 2=Mangled but checksum was not updated 7688b27b10fSJulian Anastasov */ 7691da177e4SLinus Torvalds int (*pkt_in)(struct ip_vs_app *, struct ip_vs_conn *, 7703db05feaSHerbert Xu struct sk_buff *, int *diff); 7711da177e4SLinus Torvalds 7721da177e4SLinus Torvalds /* ip_vs_app initializer */ 7731da177e4SLinus Torvalds int (*init_conn)(struct ip_vs_app *, struct ip_vs_conn *); 7741da177e4SLinus Torvalds 7751da177e4SLinus Torvalds /* ip_vs_app finish */ 7761da177e4SLinus Torvalds int (*done_conn)(struct ip_vs_app *, struct ip_vs_conn *); 7771da177e4SLinus Torvalds 7781da177e4SLinus Torvalds 7791da177e4SLinus Torvalds /* not used now */ 7801da177e4SLinus Torvalds int (*bind_conn)(struct ip_vs_app *, struct ip_vs_conn *, 7811da177e4SLinus Torvalds struct ip_vs_protocol *); 7821da177e4SLinus Torvalds 7831da177e4SLinus Torvalds void (*unbind_conn)(struct ip_vs_app *, struct ip_vs_conn *); 7841da177e4SLinus Torvalds 7851da177e4SLinus Torvalds int * timeout_table; 7861da177e4SLinus Torvalds int * timeouts; 7871da177e4SLinus Torvalds int timeouts_size; 7881da177e4SLinus Torvalds 7891da177e4SLinus Torvalds int (*conn_schedule)(struct sk_buff *skb, struct ip_vs_app *app, 7901da177e4SLinus Torvalds int *verdict, struct ip_vs_conn **cpp); 7911da177e4SLinus Torvalds 7921da177e4SLinus Torvalds struct ip_vs_conn * 7931da177e4SLinus Torvalds (*conn_in_get)(const struct sk_buff *skb, struct ip_vs_app *app, 794d4383f04SJesper Dangaard Brouer const struct iphdr *iph, int inverse); 7951da177e4SLinus Torvalds 7961da177e4SLinus Torvalds struct ip_vs_conn * 7971da177e4SLinus Torvalds (*conn_out_get)(const struct sk_buff *skb, struct ip_vs_app *app, 798d4383f04SJesper Dangaard Brouer const struct iphdr *iph, int inverse); 7991da177e4SLinus Torvalds 8001da177e4SLinus Torvalds int (*state_transition)(struct ip_vs_conn *cp, int direction, 8011da177e4SLinus Torvalds const 
struct sk_buff *skb, 8021da177e4SLinus Torvalds struct ip_vs_app *app); 8031da177e4SLinus Torvalds 8041da177e4SLinus Torvalds void (*timeout_change)(struct ip_vs_app *app, int flags); 8051da177e4SLinus Torvalds }; 8061da177e4SLinus Torvalds 807f73181c8SPablo Neira Ayuso struct ipvs_master_sync_state { 808f73181c8SPablo Neira Ayuso struct list_head sync_queue; 809f73181c8SPablo Neira Ayuso struct ip_vs_sync_buff *sync_buff; 81007995674SZhang Yanfei unsigned long sync_queue_len; 811f73181c8SPablo Neira Ayuso unsigned int sync_queue_delay; 812f73181c8SPablo Neira Ayuso struct task_struct *master_thread; 813f73181c8SPablo Neira Ayuso struct delayed_work master_wakeup_work; 814f73181c8SPablo Neira Ayuso struct netns_ipvs *ipvs; 815f73181c8SPablo Neira Ayuso }; 816f73181c8SPablo Neira Ayuso 817578bc3efSJulian Anastasov /* How much time to keep dests in trash */ 818578bc3efSJulian Anastasov #define IP_VS_DEST_TRASH_PERIOD (120 * HZ) 819578bc3efSJulian Anastasov 820e4ff6751SJulian Anastasov struct ipvs_sync_daemon_cfg { 821d3328817SJulian Anastasov union nf_inet_addr mcast_group; 822e4ff6751SJulian Anastasov int syncid; 823e4ff6751SJulian Anastasov u16 sync_maxlen; 824d3328817SJulian Anastasov u16 mcast_port; 825d3328817SJulian Anastasov u8 mcast_af; 826d3328817SJulian Anastasov u8 mcast_ttl; 827e4ff6751SJulian Anastasov /* multicast interface name */ 828e4ff6751SJulian Anastasov char mcast_ifn[IP_VS_IFNAME_MAXLEN]; 829e4ff6751SJulian Anastasov }; 830e4ff6751SJulian Anastasov 8312553d064SJulian Anastasov /* IPVS in network namespace */ 8322553d064SJulian Anastasov struct netns_ipvs { 8332553d064SJulian Anastasov int gen; /* Generation */ 8347a4f0761SHans Schillstrom int enable; /* enable like nf_hooks do */ 83507dcc686SSimon Horman /* Hash table: for real service lookups */ 8362553d064SJulian Anastasov #define IP_VS_RTAB_BITS 4 8372553d064SJulian Anastasov #define IP_VS_RTAB_SIZE (1 << IP_VS_RTAB_BITS) 8382553d064SJulian Anastasov #define IP_VS_RTAB_MASK (IP_VS_RTAB_SIZE - 
1) 8392553d064SJulian Anastasov 840276472eaSJulian Anastasov struct hlist_head rs_table[IP_VS_RTAB_SIZE]; 8412553d064SJulian Anastasov /* ip_vs_app */ 8422553d064SJulian Anastasov struct list_head app_list; 8432553d064SJulian Anastasov /* ip_vs_proto */ 8442553d064SJulian Anastasov #define IP_VS_PROTO_TAB_SIZE 32 /* must be power of 2 */ 8452553d064SJulian Anastasov struct ip_vs_proto_data *proto_data_table[IP_VS_PROTO_TAB_SIZE]; 8462553d064SJulian Anastasov /* ip_vs_proto_tcp */ 8472553d064SJulian Anastasov #ifdef CONFIG_IP_VS_PROTO_TCP 8482553d064SJulian Anastasov #define TCP_APP_TAB_BITS 4 8492553d064SJulian Anastasov #define TCP_APP_TAB_SIZE (1 << TCP_APP_TAB_BITS) 8502553d064SJulian Anastasov #define TCP_APP_TAB_MASK (TCP_APP_TAB_SIZE - 1) 8512553d064SJulian Anastasov struct list_head tcp_apps[TCP_APP_TAB_SIZE]; 8522553d064SJulian Anastasov #endif 8532553d064SJulian Anastasov /* ip_vs_proto_udp */ 8542553d064SJulian Anastasov #ifdef CONFIG_IP_VS_PROTO_UDP 8552553d064SJulian Anastasov #define UDP_APP_TAB_BITS 4 8562553d064SJulian Anastasov #define UDP_APP_TAB_SIZE (1 << UDP_APP_TAB_BITS) 8572553d064SJulian Anastasov #define UDP_APP_TAB_MASK (UDP_APP_TAB_SIZE - 1) 8582553d064SJulian Anastasov struct list_head udp_apps[UDP_APP_TAB_SIZE]; 8592553d064SJulian Anastasov #endif 8602553d064SJulian Anastasov /* ip_vs_proto_sctp */ 8612553d064SJulian Anastasov #ifdef CONFIG_IP_VS_PROTO_SCTP 8622553d064SJulian Anastasov #define SCTP_APP_TAB_BITS 4 8632553d064SJulian Anastasov #define SCTP_APP_TAB_SIZE (1 << SCTP_APP_TAB_BITS) 8642553d064SJulian Anastasov #define SCTP_APP_TAB_MASK (SCTP_APP_TAB_SIZE - 1) 8652553d064SJulian Anastasov /* Hash table for SCTP application incarnations */ 8662553d064SJulian Anastasov struct list_head sctp_apps[SCTP_APP_TAB_SIZE]; 8672553d064SJulian Anastasov #endif 8682553d064SJulian Anastasov /* ip_vs_conn */ 8692553d064SJulian Anastasov atomic_t conn_count; /* connection counter */ 8702553d064SJulian Anastasov 8712553d064SJulian Anastasov /* 
ip_vs_ctl */ 8722a0751afSJulian Anastasov struct ip_vs_stats tot_stats; /* Statistics & est. */ 8732553d064SJulian Anastasov 8742553d064SJulian Anastasov int num_services; /* no of virtual services */ 875f2247fbdSSimon Horman 8762553d064SJulian Anastasov /* Trash for destinations */ 8772553d064SJulian Anastasov struct list_head dest_trash; 878578bc3efSJulian Anastasov spinlock_t dest_trash_lock; 879578bc3efSJulian Anastasov struct timer_list dest_trash_timer; /* expiration timer */ 8802553d064SJulian Anastasov /* Service counters */ 8812553d064SJulian Anastasov atomic_t ftpsvc_counter; 8822553d064SJulian Anastasov atomic_t nullsvc_counter; 88339b97223SMarco Angaroni atomic_t conn_out_counter; 8842553d064SJulian Anastasov 885f2247fbdSSimon Horman #ifdef CONFIG_SYSCTL 886f2247fbdSSimon Horman /* 1/rate drop and drop-entry variables */ 887f2247fbdSSimon Horman struct delayed_work defense_work; /* Work handler */ 888f2247fbdSSimon Horman int drop_rate; 889f2247fbdSSimon Horman int drop_counter; 890f2247fbdSSimon Horman atomic_t dropentry; 891f2247fbdSSimon Horman /* locks in ctl.c */ 892f2247fbdSSimon Horman spinlock_t dropentry_lock; /* drop entry handling */ 893f2247fbdSSimon Horman spinlock_t droppacket_lock; /* drop packet handling */ 894f2247fbdSSimon Horman spinlock_t securetcp_lock; /* state and timeout tables */ 895f2247fbdSSimon Horman 8962553d064SJulian Anastasov /* sys-ctl struct */ 8972553d064SJulian Anastasov struct ctl_table_header *sysctl_hdr; 8982553d064SJulian Anastasov struct ctl_table *sysctl_tbl; 899f2247fbdSSimon Horman #endif 900f2247fbdSSimon Horman 9012553d064SJulian Anastasov /* sysctl variables */ 9022553d064SJulian Anastasov int sysctl_amemthresh; 9032553d064SJulian Anastasov int sysctl_am_droprate; 9042553d064SJulian Anastasov int sysctl_drop_entry; 9052553d064SJulian Anastasov int sysctl_drop_packet; 9062553d064SJulian Anastasov int sysctl_secure_tcp; 9072553d064SJulian Anastasov #ifdef CONFIG_IP_VS_NFCT 9082553d064SJulian Anastasov int 
sysctl_conntrack; 9092553d064SJulian Anastasov #endif 9102553d064SJulian Anastasov int sysctl_snat_reroute; 9112553d064SJulian Anastasov int sysctl_sync_ver; 912f73181c8SPablo Neira Ayuso int sysctl_sync_ports; 9134d0c875dSJulian Anastasov int sysctl_sync_persist_mode; 91407995674SZhang Yanfei unsigned long sysctl_sync_qlen_max; 9151c003b15SPablo Neira Ayuso int sysctl_sync_sock_size; 9162553d064SJulian Anastasov int sysctl_cache_bypass; 9172553d064SJulian Anastasov int sysctl_expire_nodest_conn; 918c6c96c18SAlexander Frolkin int sysctl_sloppy_tcp; 919c6c96c18SAlexander Frolkin int sysctl_sloppy_sctp; 9202553d064SJulian Anastasov int sysctl_expire_quiescent_template; 9212553d064SJulian Anastasov int sysctl_sync_threshold[2]; 922749c42b6SJulian Anastasov unsigned int sysctl_sync_refresh_period; 923749c42b6SJulian Anastasov int sysctl_sync_retries; 9242553d064SJulian Anastasov int sysctl_nat_icmp_send; 9253654e611SJulian Anastasov int sysctl_pmtu_disc; 9260c12582fSJulian Anastasov int sysctl_backup_only; 927d752c364SMarcelo Ricardo Leitner int sysctl_conn_reuse_mode; 92894485fedSAlex Gartrell int sysctl_schedule_icmp; 9294e478098SAlex Gartrell int sysctl_ignore_tunneled; 9302553d064SJulian Anastasov 9312553d064SJulian Anastasov /* ip_vs_lblc */ 9322553d064SJulian Anastasov int sysctl_lblc_expiration; 9332553d064SJulian Anastasov struct ctl_table_header *lblc_ctl_header; 9342553d064SJulian Anastasov struct ctl_table *lblc_ctl_table; 9352553d064SJulian Anastasov /* ip_vs_lblcr */ 9362553d064SJulian Anastasov int sysctl_lblcr_expiration; 9372553d064SJulian Anastasov struct ctl_table_header *lblcr_ctl_header; 9382553d064SJulian Anastasov struct ctl_table *lblcr_ctl_table; 9392553d064SJulian Anastasov /* ip_vs_est */ 9402553d064SJulian Anastasov struct list_head est_list; /* estimator list */ 9412553d064SJulian Anastasov spinlock_t est_lock; 9422553d064SJulian Anastasov struct timer_list est_timer; /* Estimation timer */ 9432553d064SJulian Anastasov /* ip_vs_sync */ 
9442553d064SJulian Anastasov spinlock_t sync_lock; 945f73181c8SPablo Neira Ayuso struct ipvs_master_sync_state *ms; 9462553d064SJulian Anastasov spinlock_t sync_buff_lock; 947f73181c8SPablo Neira Ayuso struct task_struct **backup_threads; 948f73181c8SPablo Neira Ayuso int threads_mask; 9492553d064SJulian Anastasov volatile int sync_state; 950ae1d48b2SHans Schillstrom struct mutex sync_mutex; 951e4ff6751SJulian Anastasov struct ipvs_sync_daemon_cfg mcfg; /* Master Configuration */ 952e4ff6751SJulian Anastasov struct ipvs_sync_daemon_cfg bcfg; /* Backup Configuration */ 9532553d064SJulian Anastasov /* net name space ptr */ 9542553d064SJulian Anastasov struct net *net; /* Needed by timer routines */ 95507dcc686SSimon Horman /* Number of heterogeneous destinations, needed becaus heterogeneous 95607dcc686SSimon Horman * are not supported when synchronization is enabled. 95707dcc686SSimon Horman */ 958391f503dSAlex Gartrell unsigned int mixed_address_family_dests; 9592553d064SJulian Anastasov }; 9601da177e4SLinus Torvalds 96159e0350eSSimon Horman #define DEFAULT_SYNC_THRESHOLD 3 96259e0350eSSimon Horman #define DEFAULT_SYNC_PERIOD 50 9637532e8d4SSimon Horman #define DEFAULT_SYNC_VER 1 964c6c96c18SAlexander Frolkin #define DEFAULT_SLOPPY_TCP 0 965c6c96c18SAlexander Frolkin #define DEFAULT_SLOPPY_SCTP 0 966749c42b6SJulian Anastasov #define DEFAULT_SYNC_REFRESH_PERIOD (0U * HZ) 967749c42b6SJulian Anastasov #define DEFAULT_SYNC_RETRIES 0 9681c003b15SPablo Neira Ayuso #define IPVS_SYNC_WAKEUP_RATE 8 9691c003b15SPablo Neira Ayuso #define IPVS_SYNC_QLEN_MAX (IPVS_SYNC_WAKEUP_RATE * 4) 9701c003b15SPablo Neira Ayuso #define IPVS_SYNC_SEND_DELAY (HZ / 50) 9711c003b15SPablo Neira Ayuso #define IPVS_SYNC_CHECK_PERIOD HZ 972749c42b6SJulian Anastasov #define IPVS_SYNC_FLUSH_TIME (HZ * 2) 973f73181c8SPablo Neira Ayuso #define IPVS_SYNC_PORTS_MAX (1 << 6) 97459e0350eSSimon Horman 97559e0350eSSimon Horman #ifdef CONFIG_SYSCTL 97659e0350eSSimon Horman 97759e0350eSSimon Horman static 
inline int sysctl_sync_threshold(struct netns_ipvs *ipvs) 97859e0350eSSimon Horman { 97959e0350eSSimon Horman return ipvs->sysctl_sync_threshold[0]; 98059e0350eSSimon Horman } 98159e0350eSSimon Horman 98259e0350eSSimon Horman static inline int sysctl_sync_period(struct netns_ipvs *ipvs) 98359e0350eSSimon Horman { 984749c42b6SJulian Anastasov return ACCESS_ONCE(ipvs->sysctl_sync_threshold[1]); 985749c42b6SJulian Anastasov } 986749c42b6SJulian Anastasov 987749c42b6SJulian Anastasov static inline unsigned int sysctl_sync_refresh_period(struct netns_ipvs *ipvs) 988749c42b6SJulian Anastasov { 989749c42b6SJulian Anastasov return ACCESS_ONCE(ipvs->sysctl_sync_refresh_period); 990749c42b6SJulian Anastasov } 991749c42b6SJulian Anastasov 992749c42b6SJulian Anastasov static inline int sysctl_sync_retries(struct netns_ipvs *ipvs) 993749c42b6SJulian Anastasov { 994749c42b6SJulian Anastasov return ipvs->sysctl_sync_retries; 99559e0350eSSimon Horman } 99659e0350eSSimon Horman 9977532e8d4SSimon Horman static inline int sysctl_sync_ver(struct netns_ipvs *ipvs) 9987532e8d4SSimon Horman { 9997532e8d4SSimon Horman return ipvs->sysctl_sync_ver; 10007532e8d4SSimon Horman } 10017532e8d4SSimon Horman 1002c6c96c18SAlexander Frolkin static inline int sysctl_sloppy_tcp(struct netns_ipvs *ipvs) 1003c6c96c18SAlexander Frolkin { 1004c6c96c18SAlexander Frolkin return ipvs->sysctl_sloppy_tcp; 1005c6c96c18SAlexander Frolkin } 1006c6c96c18SAlexander Frolkin 1007c6c96c18SAlexander Frolkin static inline int sysctl_sloppy_sctp(struct netns_ipvs *ipvs) 1008c6c96c18SAlexander Frolkin { 1009c6c96c18SAlexander Frolkin return ipvs->sysctl_sloppy_sctp; 1010c6c96c18SAlexander Frolkin } 1011c6c96c18SAlexander Frolkin 1012f73181c8SPablo Neira Ayuso static inline int sysctl_sync_ports(struct netns_ipvs *ipvs) 1013f73181c8SPablo Neira Ayuso { 1014f73181c8SPablo Neira Ayuso return ACCESS_ONCE(ipvs->sysctl_sync_ports); 1015f73181c8SPablo Neira Ayuso } 1016f73181c8SPablo Neira Ayuso 10174d0c875dSJulian Anastasov 
static inline int sysctl_sync_persist_mode(struct netns_ipvs *ipvs) 10184d0c875dSJulian Anastasov { 10194d0c875dSJulian Anastasov return ipvs->sysctl_sync_persist_mode; 10204d0c875dSJulian Anastasov } 10214d0c875dSJulian Anastasov 102207995674SZhang Yanfei static inline unsigned long sysctl_sync_qlen_max(struct netns_ipvs *ipvs) 10231c003b15SPablo Neira Ayuso { 10241c003b15SPablo Neira Ayuso return ipvs->sysctl_sync_qlen_max; 10251c003b15SPablo Neira Ayuso } 10261c003b15SPablo Neira Ayuso 10271c003b15SPablo Neira Ayuso static inline int sysctl_sync_sock_size(struct netns_ipvs *ipvs) 10281c003b15SPablo Neira Ayuso { 10291c003b15SPablo Neira Ayuso return ipvs->sysctl_sync_sock_size; 10301c003b15SPablo Neira Ayuso } 10311c003b15SPablo Neira Ayuso 10323654e611SJulian Anastasov static inline int sysctl_pmtu_disc(struct netns_ipvs *ipvs) 10333654e611SJulian Anastasov { 10343654e611SJulian Anastasov return ipvs->sysctl_pmtu_disc; 10353654e611SJulian Anastasov } 10363654e611SJulian Anastasov 10370c12582fSJulian Anastasov static inline int sysctl_backup_only(struct netns_ipvs *ipvs) 10380c12582fSJulian Anastasov { 10390c12582fSJulian Anastasov return ipvs->sync_state & IP_VS_STATE_BACKUP && 10400c12582fSJulian Anastasov ipvs->sysctl_backup_only; 10410c12582fSJulian Anastasov } 10420c12582fSJulian Anastasov 1043d752c364SMarcelo Ricardo Leitner static inline int sysctl_conn_reuse_mode(struct netns_ipvs *ipvs) 1044d752c364SMarcelo Ricardo Leitner { 1045d752c364SMarcelo Ricardo Leitner return ipvs->sysctl_conn_reuse_mode; 1046d752c364SMarcelo Ricardo Leitner } 1047d752c364SMarcelo Ricardo Leitner 104894485fedSAlex Gartrell static inline int sysctl_schedule_icmp(struct netns_ipvs *ipvs) 104994485fedSAlex Gartrell { 105094485fedSAlex Gartrell return ipvs->sysctl_schedule_icmp; 105194485fedSAlex Gartrell } 105294485fedSAlex Gartrell 10534e478098SAlex Gartrell static inline int sysctl_ignore_tunneled(struct netns_ipvs *ipvs) 10544e478098SAlex Gartrell { 10554e478098SAlex Gartrell 
return ipvs->sysctl_ignore_tunneled; 10564e478098SAlex Gartrell } 10574e478098SAlex Gartrell 105857032948SEric W. Biederman static inline int sysctl_cache_bypass(struct netns_ipvs *ipvs) 105957032948SEric W. Biederman { 106057032948SEric W. Biederman return ipvs->sysctl_cache_bypass; 106157032948SEric W. Biederman } 106257032948SEric W. Biederman 106359e0350eSSimon Horman #else 106459e0350eSSimon Horman 106559e0350eSSimon Horman static inline int sysctl_sync_threshold(struct netns_ipvs *ipvs) 106659e0350eSSimon Horman { 106759e0350eSSimon Horman return DEFAULT_SYNC_THRESHOLD; 106859e0350eSSimon Horman } 106959e0350eSSimon Horman 107059e0350eSSimon Horman static inline int sysctl_sync_period(struct netns_ipvs *ipvs) 107159e0350eSSimon Horman { 107259e0350eSSimon Horman return DEFAULT_SYNC_PERIOD; 107359e0350eSSimon Horman } 107459e0350eSSimon Horman 1075749c42b6SJulian Anastasov static inline unsigned int sysctl_sync_refresh_period(struct netns_ipvs *ipvs) 1076749c42b6SJulian Anastasov { 1077749c42b6SJulian Anastasov return DEFAULT_SYNC_REFRESH_PERIOD; 1078749c42b6SJulian Anastasov } 1079749c42b6SJulian Anastasov 1080749c42b6SJulian Anastasov static inline int sysctl_sync_retries(struct netns_ipvs *ipvs) 1081749c42b6SJulian Anastasov { 1082749c42b6SJulian Anastasov return DEFAULT_SYNC_RETRIES & 3; 1083749c42b6SJulian Anastasov } 1084749c42b6SJulian Anastasov 10857532e8d4SSimon Horman static inline int sysctl_sync_ver(struct netns_ipvs *ipvs) 10867532e8d4SSimon Horman { 10877532e8d4SSimon Horman return DEFAULT_SYNC_VER; 10887532e8d4SSimon Horman } 10897532e8d4SSimon Horman 1090c6c96c18SAlexander Frolkin static inline int sysctl_sloppy_tcp(struct netns_ipvs *ipvs) 1091c6c96c18SAlexander Frolkin { 1092c6c96c18SAlexander Frolkin return DEFAULT_SLOPPY_TCP; 1093c6c96c18SAlexander Frolkin } 1094c6c96c18SAlexander Frolkin 1095c6c96c18SAlexander Frolkin static inline int sysctl_sloppy_sctp(struct netns_ipvs *ipvs) 1096c6c96c18SAlexander Frolkin { 1097c6c96c18SAlexander 
Frolkin return DEFAULT_SLOPPY_SCTP; 1098c6c96c18SAlexander Frolkin } 1099c6c96c18SAlexander Frolkin 1100f73181c8SPablo Neira Ayuso static inline int sysctl_sync_ports(struct netns_ipvs *ipvs) 1101f73181c8SPablo Neira Ayuso { 1102f73181c8SPablo Neira Ayuso return 1; 1103f73181c8SPablo Neira Ayuso } 1104f73181c8SPablo Neira Ayuso 11054d0c875dSJulian Anastasov static inline int sysctl_sync_persist_mode(struct netns_ipvs *ipvs) 11064d0c875dSJulian Anastasov { 11074d0c875dSJulian Anastasov return 0; 11084d0c875dSJulian Anastasov } 11094d0c875dSJulian Anastasov 111007995674SZhang Yanfei static inline unsigned long sysctl_sync_qlen_max(struct netns_ipvs *ipvs) 11111c003b15SPablo Neira Ayuso { 11121c003b15SPablo Neira Ayuso return IPVS_SYNC_QLEN_MAX; 11131c003b15SPablo Neira Ayuso } 11141c003b15SPablo Neira Ayuso 11151c003b15SPablo Neira Ayuso static inline int sysctl_sync_sock_size(struct netns_ipvs *ipvs) 11161c003b15SPablo Neira Ayuso { 11171c003b15SPablo Neira Ayuso return 0; 11181c003b15SPablo Neira Ayuso } 11191c003b15SPablo Neira Ayuso 11203654e611SJulian Anastasov static inline int sysctl_pmtu_disc(struct netns_ipvs *ipvs) 11213654e611SJulian Anastasov { 11223654e611SJulian Anastasov return 1; 11233654e611SJulian Anastasov } 11243654e611SJulian Anastasov 11250c12582fSJulian Anastasov static inline int sysctl_backup_only(struct netns_ipvs *ipvs) 11260c12582fSJulian Anastasov { 11270c12582fSJulian Anastasov return 0; 11280c12582fSJulian Anastasov } 11290c12582fSJulian Anastasov 1130d752c364SMarcelo Ricardo Leitner static inline int sysctl_conn_reuse_mode(struct netns_ipvs *ipvs) 1131d752c364SMarcelo Ricardo Leitner { 1132d752c364SMarcelo Ricardo Leitner return 1; 1133d752c364SMarcelo Ricardo Leitner } 1134d752c364SMarcelo Ricardo Leitner 113594485fedSAlex Gartrell static inline int sysctl_schedule_icmp(struct netns_ipvs *ipvs) 113694485fedSAlex Gartrell { 113794485fedSAlex Gartrell return 0; 113894485fedSAlex Gartrell } 113994485fedSAlex Gartrell 11404e478098SAlex 
Gartrell static inline int sysctl_ignore_tunneled(struct netns_ipvs *ipvs) 11414e478098SAlex Gartrell { 11424e478098SAlex Gartrell return 0; 11434e478098SAlex Gartrell } 11444e478098SAlex Gartrell 114557032948SEric W. Biederman static inline int sysctl_cache_bypass(struct netns_ipvs *ipvs) 114657032948SEric W. Biederman { 114757032948SEric W. Biederman return 0; 114857032948SEric W. Biederman } 114957032948SEric W. Biederman 115059e0350eSSimon Horman #endif 115159e0350eSSimon Horman 115207dcc686SSimon Horman /* IPVS core functions 11531da177e4SLinus Torvalds * (from ip_vs_core.c) 11541da177e4SLinus Torvalds */ 11555c3a0fd7SJoe Perches const char *ip_vs_proto_name(unsigned int proto); 11565c3a0fd7SJoe Perches void ip_vs_init_hash_table(struct list_head *table, int rows); 115739b97223SMarco Angaroni struct ip_vs_conn *ip_vs_new_conn_out(struct ip_vs_service *svc, 115839b97223SMarco Angaroni struct ip_vs_dest *dest, 115939b97223SMarco Angaroni struct sk_buff *skb, 116039b97223SMarco Angaroni const struct ip_vs_iphdr *iph, 116139b97223SMarco Angaroni __be16 dport, 116239b97223SMarco Angaroni __be16 cport); 1163afdd6140SSven Wegener #define IP_VS_INIT_HASH_TABLE(t) ip_vs_init_hash_table((t), ARRAY_SIZE((t))) 11641da177e4SLinus Torvalds 11651da177e4SLinus Torvalds #define IP_VS_APP_TYPE_FTP 1 11661da177e4SLinus Torvalds 116707dcc686SSimon Horman /* ip_vs_conn handling functions 11681da177e4SLinus Torvalds * (from ip_vs_conn.c) 11691da177e4SLinus Torvalds */ 11701da177e4SLinus Torvalds enum { 11711da177e4SLinus Torvalds IP_VS_DIR_INPUT = 0, 11721da177e4SLinus Torvalds IP_VS_DIR_OUTPUT, 11731da177e4SLinus Torvalds IP_VS_DIR_INPUT_ONLY, 11741da177e4SLinus Torvalds IP_VS_DIR_LAST, 11751da177e4SLinus Torvalds }; 11761da177e4SLinus Torvalds 117719913decSEric W. 
Biederman static inline void ip_vs_conn_fill_param(struct netns_ipvs *ipvs, int af, int protocol, 1178f11017ecSSimon Horman const union nf_inet_addr *caddr, 1179f11017ecSSimon Horman __be16 cport, 1180f11017ecSSimon Horman const union nf_inet_addr *vaddr, 1181f11017ecSSimon Horman __be16 vport, 1182f11017ecSSimon Horman struct ip_vs_conn_param *p) 1183f11017ecSSimon Horman { 118419913decSEric W. Biederman p->ipvs = ipvs; 1185f11017ecSSimon Horman p->af = af; 1186f11017ecSSimon Horman p->protocol = protocol; 1187f11017ecSSimon Horman p->caddr = caddr; 1188f11017ecSSimon Horman p->cport = cport; 1189f11017ecSSimon Horman p->vaddr = vaddr; 1190f11017ecSSimon Horman p->vport = vport; 119185999283SSimon Horman p->pe = NULL; 119285999283SSimon Horman p->pe_data = NULL; 1193f11017ecSSimon Horman } 119428364a59SJulius Volz 1195f11017ecSSimon Horman struct ip_vs_conn *ip_vs_conn_in_get(const struct ip_vs_conn_param *p); 1196f11017ecSSimon Horman struct ip_vs_conn *ip_vs_ct_in_get(const struct ip_vs_conn_param *p); 119728364a59SJulius Volz 1198ab161976SEric W. Biederman struct ip_vs_conn * ip_vs_conn_in_get_proto(struct netns_ipvs *ipvs, int af, 1199ab161976SEric W. Biederman const struct sk_buff *skb, 1200802c41adSAlex Gartrell const struct ip_vs_iphdr *iph); 12015c0d2374SSimon Horman 1202f11017ecSSimon Horman struct ip_vs_conn *ip_vs_conn_out_get(const struct ip_vs_conn_param *p); 12031da177e4SLinus Torvalds 12040cf705c8SEric W. Biederman struct ip_vs_conn * ip_vs_conn_out_get_proto(struct netns_ipvs *ipvs, int af, 12050cf705c8SEric W. Biederman const struct sk_buff *skb, 1206802c41adSAlex Gartrell const struct ip_vs_iphdr *iph); 12075c0d2374SSimon Horman 1208088339a5SJulian Anastasov /* Get reference to gain full access to conn. 1209088339a5SJulian Anastasov * By default, RCU read-side critical sections have access only to 1210088339a5SJulian Anastasov * conn fields and its PE data, see ip_vs_conn_rcu_free() for reference. 
1211088339a5SJulian Anastasov */ 1212088339a5SJulian Anastasov static inline bool __ip_vs_conn_get(struct ip_vs_conn *cp) 1213088339a5SJulian Anastasov { 1214088339a5SJulian Anastasov return atomic_inc_not_zero(&cp->refcnt); 1215088339a5SJulian Anastasov } 1216088339a5SJulian Anastasov 12171da177e4SLinus Torvalds /* put back the conn without restarting its timer */ 12181da177e4SLinus Torvalds static inline void __ip_vs_conn_put(struct ip_vs_conn *cp) 12191da177e4SLinus Torvalds { 12204e857c58SPeter Zijlstra smp_mb__before_atomic(); 12211da177e4SLinus Torvalds atomic_dec(&cp->refcnt); 12221da177e4SLinus Torvalds } 12235c3a0fd7SJoe Perches void ip_vs_conn_put(struct ip_vs_conn *cp); 12245c3a0fd7SJoe Perches void ip_vs_conn_fill_cport(struct ip_vs_conn *cp, __be16 cport); 12251da177e4SLinus Torvalds 1226ba38528aSAlex Gartrell struct ip_vs_conn *ip_vs_conn_new(const struct ip_vs_conn_param *p, int dest_af, 1227f11017ecSSimon Horman const union nf_inet_addr *daddr, 122895c96174SEric Dumazet __be16 dport, unsigned int flags, 12290e051e68SHans Schillstrom struct ip_vs_dest *dest, __u32 fwmark); 12305c3a0fd7SJoe Perches void ip_vs_conn_expire_now(struct ip_vs_conn *cp); 12311da177e4SLinus Torvalds 12325c3a0fd7SJoe Perches const char *ip_vs_state_name(__u16 proto, int state); 12331da177e4SLinus Torvalds 123469f39093SEric W. Biederman void ip_vs_tcp_conn_listen(struct ip_vs_conn *cp); 12353ec10d3aSMarco Angaroni int ip_vs_check_template(struct ip_vs_conn *ct, struct ip_vs_dest *cdest); 1236423b5595SEric W. 
Biederman void ip_vs_random_dropentry(struct netns_ipvs *ipvs); 12375c3a0fd7SJoe Perches int ip_vs_conn_init(void); 12385c3a0fd7SJoe Perches void ip_vs_conn_cleanup(void); 12391da177e4SLinus Torvalds 12401da177e4SLinus Torvalds static inline void ip_vs_control_del(struct ip_vs_conn *cp) 12411da177e4SLinus Torvalds { 12421da177e4SLinus Torvalds struct ip_vs_conn *ctl_cp = cp->control; 12431da177e4SLinus Torvalds if (!ctl_cp) { 1244cfc78c5aSJulius Volz IP_VS_ERR_BUF("request control DEL for uncontrolled: " 1245cfc78c5aSJulius Volz "%s:%d to %s:%d\n", 1246cfc78c5aSJulius Volz IP_VS_DBG_ADDR(cp->af, &cp->caddr), 1247cfc78c5aSJulius Volz ntohs(cp->cport), 1248cfc78c5aSJulius Volz IP_VS_DBG_ADDR(cp->af, &cp->vaddr), 1249cfc78c5aSJulius Volz ntohs(cp->vport)); 1250cfc78c5aSJulius Volz 12511da177e4SLinus Torvalds return; 12521da177e4SLinus Torvalds } 12531da177e4SLinus Torvalds 1254cfc78c5aSJulius Volz IP_VS_DBG_BUF(7, "DELeting control for: " 1255cfc78c5aSJulius Volz "cp.dst=%s:%d ctl_cp.dst=%s:%d\n", 1256cfc78c5aSJulius Volz IP_VS_DBG_ADDR(cp->af, &cp->caddr), 1257cfc78c5aSJulius Volz ntohs(cp->cport), 1258cfc78c5aSJulius Volz IP_VS_DBG_ADDR(cp->af, &ctl_cp->caddr), 1259cfc78c5aSJulius Volz ntohs(ctl_cp->cport)); 12601da177e4SLinus Torvalds 12611da177e4SLinus Torvalds cp->control = NULL; 12621da177e4SLinus Torvalds if (atomic_read(&ctl_cp->n_control) == 0) { 1263cfc78c5aSJulius Volz IP_VS_ERR_BUF("BUG control DEL with n=0 : " 1264cfc78c5aSJulius Volz "%s:%d to %s:%d\n", 1265cfc78c5aSJulius Volz IP_VS_DBG_ADDR(cp->af, &cp->caddr), 1266cfc78c5aSJulius Volz ntohs(cp->cport), 1267cfc78c5aSJulius Volz IP_VS_DBG_ADDR(cp->af, &cp->vaddr), 1268cfc78c5aSJulius Volz ntohs(cp->vport)); 1269cfc78c5aSJulius Volz 12701da177e4SLinus Torvalds return; 12711da177e4SLinus Torvalds } 12721da177e4SLinus Torvalds atomic_dec(&ctl_cp->n_control); 12731da177e4SLinus Torvalds } 12741da177e4SLinus Torvalds 12751da177e4SLinus Torvalds static inline void 12761da177e4SLinus Torvalds 
ip_vs_control_add(struct ip_vs_conn *cp, struct ip_vs_conn *ctl_cp) 12771da177e4SLinus Torvalds { 12781da177e4SLinus Torvalds if (cp->control) { 1279cfc78c5aSJulius Volz IP_VS_ERR_BUF("request control ADD for already controlled: " 1280cfc78c5aSJulius Volz "%s:%d to %s:%d\n", 1281cfc78c5aSJulius Volz IP_VS_DBG_ADDR(cp->af, &cp->caddr), 1282cfc78c5aSJulius Volz ntohs(cp->cport), 1283cfc78c5aSJulius Volz IP_VS_DBG_ADDR(cp->af, &cp->vaddr), 1284cfc78c5aSJulius Volz ntohs(cp->vport)); 1285cfc78c5aSJulius Volz 12861da177e4SLinus Torvalds ip_vs_control_del(cp); 12871da177e4SLinus Torvalds } 12881da177e4SLinus Torvalds 1289cfc78c5aSJulius Volz IP_VS_DBG_BUF(7, "ADDing control for: " 1290cfc78c5aSJulius Volz "cp.dst=%s:%d ctl_cp.dst=%s:%d\n", 1291cfc78c5aSJulius Volz IP_VS_DBG_ADDR(cp->af, &cp->caddr), 1292cfc78c5aSJulius Volz ntohs(cp->cport), 1293cfc78c5aSJulius Volz IP_VS_DBG_ADDR(cp->af, &ctl_cp->caddr), 1294cfc78c5aSJulius Volz ntohs(ctl_cp->cport)); 12951da177e4SLinus Torvalds 12961da177e4SLinus Torvalds cp->control = ctl_cp; 12971da177e4SLinus Torvalds atomic_inc(&ctl_cp->n_control); 12981da177e4SLinus Torvalds } 12991da177e4SLinus Torvalds 130007dcc686SSimon Horman /* IPVS netns init & cleanup functions */ 1301a4dd0360SEric W. Biederman int ip_vs_estimator_net_init(struct netns_ipvs *ipvs); 13023d993766SEric W. Biederman int ip_vs_control_net_init(struct netns_ipvs *ipvs); 13037d1f88ecSEric W. Biederman int ip_vs_protocol_net_init(struct netns_ipvs *ipvs); 1304b5dd212cSEric W. Biederman int ip_vs_app_net_init(struct netns_ipvs *ipvs); 13052f3edc6aSEric W. Biederman int ip_vs_conn_net_init(struct netns_ipvs *ipvs); 1306802cb437SEric W. Biederman int ip_vs_sync_net_init(struct netns_ipvs *ipvs); 13072f3edc6aSEric W. Biederman void ip_vs_conn_net_cleanup(struct netns_ipvs *ipvs); 1308b5dd212cSEric W. Biederman void ip_vs_app_net_cleanup(struct netns_ipvs *ipvs); 13097d1f88ecSEric W. 
void ip_vs_protocol_net_cleanup(struct netns_ipvs *ipvs);
void ip_vs_control_net_cleanup(struct netns_ipvs *ipvs);
void ip_vs_estimator_net_cleanup(struct netns_ipvs *ipvs);
void ip_vs_sync_net_cleanup(struct netns_ipvs *ipvs);
void ip_vs_service_net_cleanup(struct netns_ipvs *ipvs);

/* IPVS application functions
 * (from ip_vs_app.c)
 */
#define IP_VS_APP_MAX_PORTS  8
struct ip_vs_app *register_ip_vs_app(struct netns_ipvs *ipvs, struct ip_vs_app *app);
void unregister_ip_vs_app(struct netns_ipvs *ipvs, struct ip_vs_app *app);
int ip_vs_bind_app(struct ip_vs_conn *cp, struct ip_vs_protocol *pp);
void ip_vs_unbind_app(struct ip_vs_conn *cp);
int register_ip_vs_app_inc(struct netns_ipvs *ipvs, struct ip_vs_app *app, __u16 proto,
			   __u16 port);
int ip_vs_app_inc_get(struct ip_vs_app *inc);
void ip_vs_app_inc_put(struct ip_vs_app *inc);

int ip_vs_app_pkt_out(struct ip_vs_conn *cp, struct sk_buff *skb);
int ip_vs_app_pkt_in(struct ip_vs_conn *cp, struct sk_buff *skb);

int register_ip_vs_pe(struct ip_vs_pe *pe);
int unregister_ip_vs_pe(struct ip_vs_pe *pe);
struct ip_vs_pe *ip_vs_pe_getbyname(const char *name);
struct ip_vs_pe *__ip_vs_pe_getbyname(const char *pe_name);

/* Use a #define to avoid all of module.h just for these trivial ops.
 *
 * Each macro takes (get) or drops (put) a reference on pe->module when
 * both pe and pe->module are non-NULL.  They are wrapped in
 * do { } while (0) so that "ip_vs_pe_get(pe);" is exactly one statement
 * and is safe inside an unbraced if/else.  The argument is parenthesized
 * but still evaluated more than once, so it must have no side effects.
 */
#define ip_vs_pe_get(pe)				\
	do {						\
		if ((pe) && (pe)->module)		\
			__module_get((pe)->module);	\
	} while (0)

#define ip_vs_pe_put(pe)				\
	do {						\
		if ((pe) && (pe)->module)		\
			module_put((pe)->module);	\
	} while (0)

/* IPVS protocol functions (from ip_vs_proto.c) */
int ip_vs_protocol_init(void);
void ip_vs_protocol_cleanup(void);
void ip_vs_protocol_timeout_change(struct netns_ipvs *ipvs, int flags);
int *ip_vs_create_timeout_table(int *table, int size);
int ip_vs_set_state_timeout(int *table, int num, const char *const *names,
			    const char *name, int to);
void ip_vs_tcpudp_debug_packet(int af, struct ip_vs_protocol *pp,
			       const struct sk_buff *skb, int offset,
			       const char *msg);

extern struct ip_vs_protocol ip_vs_protocol_tcp;
extern struct ip_vs_protocol ip_vs_protocol_udp;
extern struct ip_vs_protocol ip_vs_protocol_icmp;
extern struct ip_vs_protocol ip_vs_protocol_esp;
extern struct ip_vs_protocol ip_vs_protocol_ah;
extern struct ip_vs_protocol ip_vs_protocol_sctp;

/* Registering/unregistering scheduler functions
 * (from ip_vs_sched.c)
 */
int register_ip_vs_scheduler(struct ip_vs_scheduler *scheduler);
int unregister_ip_vs_scheduler(struct ip_vs_scheduler *scheduler);
int ip_vs_bind_scheduler(struct ip_vs_service *svc,
			 struct ip_vs_scheduler *scheduler);
void ip_vs_unbind_scheduler(struct ip_vs_service *svc,
			    struct ip_vs_scheduler *sched);
struct ip_vs_scheduler *ip_vs_scheduler_get(const char *sched_name);
void ip_vs_scheduler_put(struct ip_vs_scheduler *scheduler);
struct ip_vs_conn *
ip_vs_schedule(struct ip_vs_service *svc, struct sk_buff *skb,
	       struct ip_vs_proto_data *pd, int *ignored,
	       struct ip_vs_iphdr *iph);
int ip_vs_leave(struct ip_vs_service *svc, struct sk_buff *skb,
		struct ip_vs_proto_data *pd, struct ip_vs_iphdr *iph);

void ip_vs_scheduler_err(struct ip_vs_service *svc, const char *msg);
138307dcc686SSimon Horman /* IPVS control data and functions (from ip_vs_ctl.c) */ 13841da177e4SLinus Torvalds extern struct ip_vs_stats ip_vs_stats; 1385b880c1f0SHans Schillstrom extern int sysctl_ip_vs_sync_ver; 13861da177e4SLinus Torvalds 13875c3a0fd7SJoe Perches struct ip_vs_service * 13880a4fd6ceSEric W. Biederman ip_vs_service_find(struct netns_ipvs *ipvs, int af, __u32 fwmark, __u16 protocol, 13893c2e0505SJulius Volz const union nf_inet_addr *vaddr, __be16 vport); 13901da177e4SLinus Torvalds 139148aed1b0SEric W. Biederman bool ip_vs_has_real_service(struct netns_ipvs *ipvs, int af, __u16 protocol, 13927937df15SJulius Volz const union nf_inet_addr *daddr, __be16 dport); 13937937df15SJulius Volz 139439b97223SMarco Angaroni struct ip_vs_dest * 139539b97223SMarco Angaroni ip_vs_find_real_service(struct netns_ipvs *ipvs, int af, __u16 protocol, 139639b97223SMarco Angaroni const union nf_inet_addr *daddr, __be16 dport); 139739b97223SMarco Angaroni 13985c3a0fd7SJoe Perches int ip_vs_use_count_inc(void); 13995c3a0fd7SJoe Perches void ip_vs_use_count_dec(void); 14005c3a0fd7SJoe Perches int ip_vs_register_nl_ioctl(void); 14015c3a0fd7SJoe Perches void ip_vs_unregister_nl_ioctl(void); 14025c3a0fd7SJoe Perches int ip_vs_control_init(void); 14035c3a0fd7SJoe Perches void ip_vs_control_cleanup(void); 14045c3a0fd7SJoe Perches struct ip_vs_dest * 1405dc2add6fSEric W. 
Biederman ip_vs_find_dest(struct netns_ipvs *ipvs, int svc_af, int dest_af, 1406655eef10SAlex Gartrell const union nf_inet_addr *daddr, __be16 dport, 1407655eef10SAlex Gartrell const union nf_inet_addr *vaddr, __be16 vport, 140852793dbeSJulian Anastasov __u16 protocol, __u32 fwmark, __u32 flags); 14095c3a0fd7SJoe Perches void ip_vs_try_bind_dest(struct ip_vs_conn *cp); 14101da177e4SLinus Torvalds 1411fca9c20aSJulian Anastasov static inline void ip_vs_dest_hold(struct ip_vs_dest *dest) 1412fca9c20aSJulian Anastasov { 1413fca9c20aSJulian Anastasov atomic_inc(&dest->refcnt); 1414fca9c20aSJulian Anastasov } 1415fca9c20aSJulian Anastasov 1416fca9c20aSJulian Anastasov static inline void ip_vs_dest_put(struct ip_vs_dest *dest) 1417fca9c20aSJulian Anastasov { 14184e857c58SPeter Zijlstra smp_mb__before_atomic(); 1419fca9c20aSJulian Anastasov atomic_dec(&dest->refcnt); 1420fca9c20aSJulian Anastasov } 14211da177e4SLinus Torvalds 14229e4e948aSJulian Anastasov static inline void ip_vs_dest_put_and_free(struct ip_vs_dest *dest) 14239e4e948aSJulian Anastasov { 14249e4e948aSJulian Anastasov if (atomic_dec_return(&dest->refcnt) < 0) 14259e4e948aSJulian Anastasov kfree(dest); 14269e4e948aSJulian Anastasov } 14279e4e948aSJulian Anastasov 142807dcc686SSimon Horman /* IPVS sync daemon data and function prototypes 14291da177e4SLinus Torvalds * (from ip_vs_sync.c) 14301da177e4SLinus Torvalds */ 14316ac121d7SEric W. Biederman int start_sync_thread(struct netns_ipvs *ipvs, struct ipvs_sync_daemon_cfg *cfg, 1432e4ff6751SJulian Anastasov int state); 1433b3cf3cbfSEric W. Biederman int stop_sync_thread(struct netns_ipvs *ipvs, int state); 1434b61a8c1aSEric W. Biederman void ip_vs_sync_conn(struct netns_ipvs *ipvs, struct ip_vs_conn *cp, int pkts); 14351da177e4SLinus Torvalds 143607dcc686SSimon Horman /* IPVS rate estimator prototypes (from ip_vs_est.c) */ 14370f34d54bSEric W. Biederman void ip_vs_start_estimator(struct netns_ipvs *ipvs, struct ip_vs_stats *stats); 14380f34d54bSEric W. 
Biederman void ip_vs_stop_estimator(struct netns_ipvs *ipvs, struct ip_vs_stats *stats); 14395c3a0fd7SJoe Perches void ip_vs_zero_estimator(struct ip_vs_stats *stats); 1440cd67cd5eSJulian Anastasov void ip_vs_read_estimator(struct ip_vs_kstats *dst, struct ip_vs_stats *stats); 14411da177e4SLinus Torvalds 144207dcc686SSimon Horman /* Various IPVS packet transmitters (from ip_vs_xmit.c) */ 14435c3a0fd7SJoe Perches int ip_vs_null_xmit(struct sk_buff *skb, struct ip_vs_conn *cp, 1444d4383f04SJesper Dangaard Brouer struct ip_vs_protocol *pp, struct ip_vs_iphdr *iph); 14455c3a0fd7SJoe Perches int ip_vs_bypass_xmit(struct sk_buff *skb, struct ip_vs_conn *cp, 1446d4383f04SJesper Dangaard Brouer struct ip_vs_protocol *pp, struct ip_vs_iphdr *iph); 14475c3a0fd7SJoe Perches int ip_vs_nat_xmit(struct sk_buff *skb, struct ip_vs_conn *cp, 1448d4383f04SJesper Dangaard Brouer struct ip_vs_protocol *pp, struct ip_vs_iphdr *iph); 14495c3a0fd7SJoe Perches int ip_vs_tunnel_xmit(struct sk_buff *skb, struct ip_vs_conn *cp, 14505c3a0fd7SJoe Perches struct ip_vs_protocol *pp, struct ip_vs_iphdr *iph); 14515c3a0fd7SJoe Perches int ip_vs_dr_xmit(struct sk_buff *skb, struct ip_vs_conn *cp, 14525c3a0fd7SJoe Perches struct ip_vs_protocol *pp, struct ip_vs_iphdr *iph); 14535c3a0fd7SJoe Perches int ip_vs_icmp_xmit(struct sk_buff *skb, struct ip_vs_conn *cp, 1454d4383f04SJesper Dangaard Brouer struct ip_vs_protocol *pp, int offset, 1455d4383f04SJesper Dangaard Brouer unsigned int hooknum, struct ip_vs_iphdr *iph); 14565c3a0fd7SJoe Perches void ip_vs_dest_dst_rcu_free(struct rcu_head *head); 14571da177e4SLinus Torvalds 1458b3cdd2a7SJulius Volz #ifdef CONFIG_IP_VS_IPV6 14595c3a0fd7SJoe Perches int ip_vs_bypass_xmit_v6(struct sk_buff *skb, struct ip_vs_conn *cp, 1460d4383f04SJesper Dangaard Brouer struct ip_vs_protocol *pp, struct ip_vs_iphdr *iph); 14615c3a0fd7SJoe Perches int ip_vs_nat_xmit_v6(struct sk_buff *skb, struct ip_vs_conn *cp, 14625c3a0fd7SJoe Perches struct ip_vs_protocol *pp, struct 
ip_vs_iphdr *iph); 14635c3a0fd7SJoe Perches int ip_vs_tunnel_xmit_v6(struct sk_buff *skb, struct ip_vs_conn *cp, 14645c3a0fd7SJoe Perches struct ip_vs_protocol *pp, struct ip_vs_iphdr *iph); 14655c3a0fd7SJoe Perches int ip_vs_dr_xmit_v6(struct sk_buff *skb, struct ip_vs_conn *cp, 14665c3a0fd7SJoe Perches struct ip_vs_protocol *pp, struct ip_vs_iphdr *iph); 14675c3a0fd7SJoe Perches int ip_vs_icmp_xmit_v6(struct sk_buff *skb, struct ip_vs_conn *cp, 1468d4383f04SJesper Dangaard Brouer struct ip_vs_protocol *pp, int offset, 1469d4383f04SJesper Dangaard Brouer unsigned int hooknum, struct ip_vs_iphdr *iph); 1470b3cdd2a7SJulius Volz #endif 14711da177e4SLinus Torvalds 14723a1bbf18SSimon Horman #ifdef CONFIG_SYSCTL 147307dcc686SSimon Horman /* This is a simple mechanism to ignore packets when 14741da177e4SLinus Torvalds * we are loaded. Just set ip_vs_drop_rate to 'n' and 14751da177e4SLinus Torvalds * we start to drop 1/rate of the packets 14761da177e4SLinus Torvalds */ 1477a0840e2eSHans Schillstrom static inline int ip_vs_todrop(struct netns_ipvs *ipvs) 14781da177e4SLinus Torvalds { 1479a0840e2eSHans Schillstrom if (!ipvs->drop_rate) 1480a0840e2eSHans Schillstrom return 0; 1481a0840e2eSHans Schillstrom if (--ipvs->drop_counter > 0) 1482a0840e2eSHans Schillstrom return 0; 1483a0840e2eSHans Schillstrom ipvs->drop_counter = ipvs->drop_rate; 14841da177e4SLinus Torvalds return 1; 14851da177e4SLinus Torvalds } 14863a1bbf18SSimon Horman #else 14873a1bbf18SSimon Horman static inline int ip_vs_todrop(struct netns_ipvs *ipvs) { return 0; } 14883a1bbf18SSimon Horman #endif 14891da177e4SLinus Torvalds 149007dcc686SSimon Horman /* ip_vs_fwd_tag returns the forwarding tag of the connection */ 14911da177e4SLinus Torvalds #define IP_VS_FWD_METHOD(cp) (cp->flags & IP_VS_CONN_F_FWD_MASK) 14921da177e4SLinus Torvalds 1493732db659SAdrian Bunk static inline char ip_vs_fwd_tag(struct ip_vs_conn *cp) 14941da177e4SLinus Torvalds { 14951da177e4SLinus Torvalds char fwd; 14961da177e4SLinus Torvalds 
14971da177e4SLinus Torvalds switch (IP_VS_FWD_METHOD(cp)) { 14981da177e4SLinus Torvalds case IP_VS_CONN_F_MASQ: 14991da177e4SLinus Torvalds fwd = 'M'; break; 15001da177e4SLinus Torvalds case IP_VS_CONN_F_LOCALNODE: 15011da177e4SLinus Torvalds fwd = 'L'; break; 15021da177e4SLinus Torvalds case IP_VS_CONN_F_TUNNEL: 15031da177e4SLinus Torvalds fwd = 'T'; break; 15041da177e4SLinus Torvalds case IP_VS_CONN_F_DROUTE: 15051da177e4SLinus Torvalds fwd = 'R'; break; 15061da177e4SLinus Torvalds case IP_VS_CONN_F_BYPASS: 15071da177e4SLinus Torvalds fwd = 'B'; break; 15081da177e4SLinus Torvalds default: 15091da177e4SLinus Torvalds fwd = '?'; break; 15101da177e4SLinus Torvalds } 15111da177e4SLinus Torvalds return fwd; 15121da177e4SLinus Torvalds } 15131da177e4SLinus Torvalds 15145c3a0fd7SJoe Perches void ip_vs_nat_icmp(struct sk_buff *skb, struct ip_vs_protocol *pp, 15151da177e4SLinus Torvalds struct ip_vs_conn *cp, int dir); 15161da177e4SLinus Torvalds 1517b3cdd2a7SJulius Volz #ifdef CONFIG_IP_VS_IPV6 15185c3a0fd7SJoe Perches void ip_vs_nat_icmp_v6(struct sk_buff *skb, struct ip_vs_protocol *pp, 1519b3cdd2a7SJulius Volz struct ip_vs_conn *cp, int dir); 1520b3cdd2a7SJulius Volz #endif 1521b3cdd2a7SJulius Volz 15225c3a0fd7SJoe Perches __sum16 ip_vs_checksum_complete(struct sk_buff *skb, int offset); 15231da177e4SLinus Torvalds 1524f9214b26SAl Viro static inline __wsum ip_vs_check_diff4(__be32 old, __be32 new, __wsum oldsum) 15251da177e4SLinus Torvalds { 1526f9214b26SAl Viro __be32 diff[2] = { ~old, new }; 15271da177e4SLinus Torvalds 152807f0757aSJoe Perches return csum_partial(diff, sizeof(diff), oldsum); 1529f9214b26SAl Viro } 1530f9214b26SAl Viro 15310bbdd42bSJulius Volz #ifdef CONFIG_IP_VS_IPV6 15320bbdd42bSJulius Volz static inline __wsum ip_vs_check_diff16(const __be32 *old, const __be32 *new, 15330bbdd42bSJulius Volz __wsum oldsum) 15340bbdd42bSJulius Volz { 15350bbdd42bSJulius Volz __be32 diff[8] = { ~old[3], ~old[2], ~old[1], ~old[0], 15360bbdd42bSJulius Volz new[3], 
new[2], new[1], new[0] }; 15370bbdd42bSJulius Volz 153807f0757aSJoe Perches return csum_partial(diff, sizeof(diff), oldsum); 15390bbdd42bSJulius Volz } 15400bbdd42bSJulius Volz #endif 15410bbdd42bSJulius Volz 1542f9214b26SAl Viro static inline __wsum ip_vs_check_diff2(__be16 old, __be16 new, __wsum oldsum) 1543f9214b26SAl Viro { 1544f9214b26SAl Viro __be16 diff[2] = { ~old, new }; 1545f9214b26SAl Viro 154607f0757aSJoe Perches return csum_partial(diff, sizeof(diff), oldsum); 15471da177e4SLinus Torvalds } 15481da177e4SLinus Torvalds 154907dcc686SSimon Horman /* Forget current conntrack (unconfirmed) and attach notrack entry */ 1550cf356d69SJulian Anastasov static inline void ip_vs_notrack(struct sk_buff *skb) 1551cf356d69SJulian Anastasov { 1552cf356d69SJulian Anastasov #if defined(CONFIG_NF_CONNTRACK) || defined(CONFIG_NF_CONNTRACK_MODULE) 1553cf356d69SJulian Anastasov enum ip_conntrack_info ctinfo; 155406b69390SJesper Juhl struct nf_conn *ct = nf_ct_get(skb, &ctinfo); 1555cf356d69SJulian Anastasov 1556cf356d69SJulian Anastasov if (!ct || !nf_ct_is_untracked(ct)) { 1557*97a6ad13SFlorian Westphal struct nf_conn *untracked; 1558*97a6ad13SFlorian Westphal 1559*97a6ad13SFlorian Westphal nf_conntrack_put(&ct->ct_general); 1560*97a6ad13SFlorian Westphal untracked = nf_ct_untracked_get(); 1561*97a6ad13SFlorian Westphal nf_conntrack_get(&untracked->ct_general); 1562*97a6ad13SFlorian Westphal skb->nfct = &untracked->ct_general; 1563cf356d69SJulian Anastasov skb->nfctinfo = IP_CT_NEW; 1564cf356d69SJulian Anastasov } 1565cf356d69SJulian Anastasov #endif 1566cf356d69SJulian Anastasov } 1567cf356d69SJulian Anastasov 1568f4bc17cdSJulian Anastasov #ifdef CONFIG_IP_VS_NFCT 156907dcc686SSimon Horman /* Netfilter connection tracking 1570f4bc17cdSJulian Anastasov * (from ip_vs_nfct.c) 1571f4bc17cdSJulian Anastasov */ 1572a0840e2eSHans Schillstrom static inline int ip_vs_conntrack_enabled(struct netns_ipvs *ipvs) 1573f4bc17cdSJulian Anastasov { 1574a4e2f5a7SSimon Horman #ifdef 
CONFIG_SYSCTL 1575a0840e2eSHans Schillstrom return ipvs->sysctl_conntrack; 1576a4e2f5a7SSimon Horman #else 1577a4e2f5a7SSimon Horman return 0; 1578a4e2f5a7SSimon Horman #endif 1579f4bc17cdSJulian Anastasov } 1580f4bc17cdSJulian Anastasov 15815c3a0fd7SJoe Perches void ip_vs_update_conntrack(struct sk_buff *skb, struct ip_vs_conn *cp, 15826523ce15SJulian Anastasov int outin); 15835c3a0fd7SJoe Perches int ip_vs_confirm_conntrack(struct sk_buff *skb); 15845c3a0fd7SJoe Perches void ip_vs_nfct_expect_related(struct sk_buff *skb, struct nf_conn *ct, 1585f4bc17cdSJulian Anastasov struct ip_vs_conn *cp, u_int8_t proto, 1586f4bc17cdSJulian Anastasov const __be16 port, int from_rs); 15875c3a0fd7SJoe Perches void ip_vs_conn_drop_conntrack(struct ip_vs_conn *cp); 1588f4bc17cdSJulian Anastasov 1589f4bc17cdSJulian Anastasov #else 1590f4bc17cdSJulian Anastasov 1591a0840e2eSHans Schillstrom static inline int ip_vs_conntrack_enabled(struct netns_ipvs *ipvs) 1592f4bc17cdSJulian Anastasov { 1593f4bc17cdSJulian Anastasov return 0; 1594f4bc17cdSJulian Anastasov } 1595f4bc17cdSJulian Anastasov 1596f4bc17cdSJulian Anastasov static inline void ip_vs_update_conntrack(struct sk_buff *skb, 1597f4bc17cdSJulian Anastasov struct ip_vs_conn *cp, int outin) 1598f4bc17cdSJulian Anastasov { 1599f4bc17cdSJulian Anastasov } 1600f4bc17cdSJulian Anastasov 1601e23ebf0fSKrzysztof Wilczynski static inline int ip_vs_confirm_conntrack(struct sk_buff *skb) 1602f4bc17cdSJulian Anastasov { 1603f4bc17cdSJulian Anastasov return NF_ACCEPT; 1604f4bc17cdSJulian Anastasov } 1605f4bc17cdSJulian Anastasov 1606f4bc17cdSJulian Anastasov static inline void ip_vs_conn_drop_conntrack(struct ip_vs_conn *cp) 1607f4bc17cdSJulian Anastasov { 1608f4bc17cdSJulian Anastasov } 160907dcc686SSimon Horman #endif /* CONFIG_IP_VS_NFCT */ 16106523ce15SJulian Anastasov 1611f719e375SJulian Anastasov /* Really using conntrack? 
*/ 1612f719e375SJulian Anastasov static inline bool ip_vs_conn_uses_conntrack(struct ip_vs_conn *cp, 1613f719e375SJulian Anastasov struct sk_buff *skb) 1614f719e375SJulian Anastasov { 1615f719e375SJulian Anastasov #ifdef CONFIG_IP_VS_NFCT 1616f719e375SJulian Anastasov enum ip_conntrack_info ctinfo; 1617f719e375SJulian Anastasov struct nf_conn *ct; 1618f719e375SJulian Anastasov 1619f719e375SJulian Anastasov if (!(cp->flags & IP_VS_CONN_F_NFCT)) 1620f719e375SJulian Anastasov return false; 1621f719e375SJulian Anastasov ct = nf_ct_get(skb, &ctinfo); 1622f719e375SJulian Anastasov if (ct && !nf_ct_is_untracked(ct)) 1623f719e375SJulian Anastasov return true; 1624f719e375SJulian Anastasov #endif 1625f719e375SJulian Anastasov return false; 1626f719e375SJulian Anastasov } 1627f719e375SJulian Anastasov 1628c16526a7SSimon Kirby static inline int 1629b552f7e3SChangli Gao ip_vs_dest_conn_overhead(struct ip_vs_dest *dest) 1630b552f7e3SChangli Gao { 163107dcc686SSimon Horman /* We think the overhead of processing active connections is 256 1632b552f7e3SChangli Gao * times higher than that of inactive connections in average. (This 1633b552f7e3SChangli Gao * 256 times might not be accurate, we will change it later) We 1634b552f7e3SChangli Gao * use the following formula to estimate the overhead now: 1635b552f7e3SChangli Gao * dest->activeconns*256 + dest->inactconns 1636b552f7e3SChangli Gao */ 1637b552f7e3SChangli Gao return (atomic_read(&dest->activeconns) << 8) + 1638b552f7e3SChangli Gao atomic_read(&dest->inactconns); 1639b552f7e3SChangli Gao } 1640b552f7e3SChangli Gao 1641bc4768ebSJulius Volz #endif /* _NET_IP_VS_H */ 1642