1b2441318SGreg Kroah-Hartman /* SPDX-License-Identifier: GPL-2.0 */ 207dcc686SSimon Horman /* IP Virtual Server 31da177e4SLinus Torvalds * data structure and functionality definitions 41da177e4SLinus Torvalds */ 51da177e4SLinus Torvalds 6bc4768ebSJulius Volz #ifndef _NET_IP_VS_H 7bc4768ebSJulius Volz #define _NET_IP_VS_H 81da177e4SLinus Torvalds 9bc4768ebSJulius Volz #include <linux/ip_vs.h> /* definitions shared with userland */ 101da177e4SLinus Torvalds 11bc4768ebSJulius Volz #include <asm/types.h> /* for __uXX types */ 12bc4768ebSJulius Volz 131da177e4SLinus Torvalds #include <linux/list.h> /* for struct list_head */ 141da177e4SLinus Torvalds #include <linux/spinlock.h> /* for struct rwlock_t */ 1560063497SArun Sharma #include <linux/atomic.h> /* for struct atomic_t */ 16b54ab92bSReshetova, Elena #include <linux/refcount.h> /* for struct refcount_t */ 1735dfb013SAndrew Sy Kim #include <linux/workqueue.h> 18b54ab92bSReshetova, Elena 191da177e4SLinus Torvalds #include <linux/compiler.h> 2014c85021SArnaldo Carvalho de Melo #include <linux/timer.h> 21187f1882SPaul Gortmaker #include <linux/bug.h> 221da177e4SLinus Torvalds 2314c85021SArnaldo Carvalho de Melo #include <net/checksum.h> 24e7ade46aSJulius Volz #include <linux/netfilter.h> /* for union nf_inet_addr */ 251668e010SKOVACS Krisztian #include <linux/ip.h> 26e7ade46aSJulius Volz #include <linux/ipv6.h> /* for struct ipv6hdr */ 274e3fd7a0SAlexey Dobriyan #include <net/ipv6.h> 28a638e514SJesper Dangaard Brouer #if IS_ENABLED(CONFIG_NF_CONNTRACK) 29f4bc17cdSJulian Anastasov #include <net/netfilter/nf_conntrack.h> 30f4bc17cdSJulian Anastasov #endif 3161b1ab45SHans Schillstrom #include <net/net_namespace.h> /* Netw namespace */ 32f0be83d5SJulian Anastasov #include <linux/sched/isolation.h> 3361b1ab45SHans Schillstrom 344fd9beefSAlex Gartrell #define IP_VS_HDR_INVERSE 1 354fd9beefSAlex Gartrell #define IP_VS_HDR_ICMP 2 364fd9beefSAlex Gartrell 3707dcc686SSimon Horman /* Generic access of ipvs struct */ 
3861b1ab45SHans Schillstrom static inline struct netns_ipvs *net_ipvs(struct net* net) 3961b1ab45SHans Schillstrom { 4061b1ab45SHans Schillstrom return net->ipvs; 4161b1ab45SHans Schillstrom } 4207dcc686SSimon Horman 436f7edb48SCatalin(ux) M. BOIE /* Connections' size value needed by ip_vs_ctl.c */ 446f7edb48SCatalin(ux) M. BOIE extern int ip_vs_conn_tab_size; 456f7edb48SCatalin(ux) M. BOIE 46705dd344SJulian Anastasov extern struct mutex __ip_vs_mutex; 47705dd344SJulian Anastasov 4864aae3cbSJulius Volz struct ip_vs_iphdr { 494fd9beefSAlex Gartrell int hdr_flags; /* ipvs flags */ 50b0e010c5SAlex Gartrell __u32 off; /* Where IP or IPv4 header starts */ 5163dca2c0SJesper Dangaard Brouer __u32 len; /* IPv4 simply where L4 starts 5207dcc686SSimon Horman * IPv6 where L4 Transport Header starts */ 5363dca2c0SJesper Dangaard Brouer __u16 fragoffs; /* IPv6 fragment offset, 0 if first frag (or not frag)*/ 5463dca2c0SJesper Dangaard Brouer __s16 protocol; 5563dca2c0SJesper Dangaard Brouer __s32 flags; 5664aae3cbSJulius Volz union nf_inet_addr saddr; 5764aae3cbSJulius Volz union nf_inet_addr daddr; 5864aae3cbSJulius Volz }; 5964aae3cbSJulius Volz 602f74713dSJesper Dangaard Brouer static inline void *frag_safe_skb_hp(const struct sk_buff *skb, int offset, 616b3d9330SGao Feng int len, void *buffer) 622f74713dSJesper Dangaard Brouer { 632f74713dSJesper Dangaard Brouer return skb_header_pointer(skb, offset, len, buffer); 642f74713dSJesper Dangaard Brouer } 652f74713dSJesper Dangaard Brouer 6663dca2c0SJesper Dangaard Brouer /* This function handles filling *ip_vs_iphdr, both for IPv4 and IPv6. 6763dca2c0SJesper Dangaard Brouer * IPv6 requires some extra work, as finding proper header position, 6863dca2c0SJesper Dangaard Brouer * depend on the IPv6 extension headers. 
6963dca2c0SJesper Dangaard Brouer */ 70b0e010c5SAlex Gartrell static inline int 71b0e010c5SAlex Gartrell ip_vs_fill_iph_skb_off(int af, const struct sk_buff *skb, int offset, 724fd9beefSAlex Gartrell int hdr_flags, struct ip_vs_iphdr *iphdr) 7364aae3cbSJulius Volz { 744fd9beefSAlex Gartrell iphdr->hdr_flags = hdr_flags; 75b0e010c5SAlex Gartrell iphdr->off = offset; 764fd9beefSAlex Gartrell 7764aae3cbSJulius Volz #ifdef CONFIG_IP_VS_IPV6 7864aae3cbSJulius Volz if (af == AF_INET6) { 79b0e010c5SAlex Gartrell struct ipv6hdr _iph; 80b0e010c5SAlex Gartrell const struct ipv6hdr *iph = skb_header_pointer( 81b0e010c5SAlex Gartrell skb, offset, sizeof(_iph), &_iph); 82b0e010c5SAlex Gartrell if (!iph) 83b0e010c5SAlex Gartrell return 0; 84b0e010c5SAlex Gartrell 854e3fd7a0SAlexey Dobriyan iphdr->saddr.in6 = iph->saddr; 864e3fd7a0SAlexey Dobriyan iphdr->daddr.in6 = iph->daddr; 876aafeef0SJiri Pirko /* ipv6_find_hdr() updates len, flags */ 88b0e010c5SAlex Gartrell iphdr->len = offset; 8963dca2c0SJesper Dangaard Brouer iphdr->flags = 0; 9063dca2c0SJesper Dangaard Brouer iphdr->protocol = ipv6_find_hdr(skb, &iphdr->len, -1, 9163dca2c0SJesper Dangaard Brouer &iphdr->fragoffs, 9263dca2c0SJesper Dangaard Brouer &iphdr->flags); 93b0e010c5SAlex Gartrell if (iphdr->protocol < 0) 94b0e010c5SAlex Gartrell return 0; 9564aae3cbSJulius Volz } else 9664aae3cbSJulius Volz #endif 9764aae3cbSJulius Volz { 98b0e010c5SAlex Gartrell struct iphdr _iph; 99b0e010c5SAlex Gartrell const struct iphdr *iph = skb_header_pointer( 100b0e010c5SAlex Gartrell skb, offset, sizeof(_iph), &_iph); 101b0e010c5SAlex Gartrell if (!iph) 102b0e010c5SAlex Gartrell return 0; 103b0e010c5SAlex Gartrell 104b0e010c5SAlex Gartrell iphdr->len = offset + iph->ihl * 4; 10563dca2c0SJesper Dangaard Brouer iphdr->fragoffs = 0; 10664aae3cbSJulius Volz iphdr->protocol = iph->protocol; 10764aae3cbSJulius Volz iphdr->saddr.ip = iph->saddr; 10864aae3cbSJulius Volz iphdr->daddr.ip = iph->daddr; 10964aae3cbSJulius Volz } 110b0e010c5SAlex 
Gartrell 111b0e010c5SAlex Gartrell return 1; 112b0e010c5SAlex Gartrell } 113b0e010c5SAlex Gartrell 114b0e010c5SAlex Gartrell static inline int 1154fd9beefSAlex Gartrell ip_vs_fill_iph_skb_icmp(int af, const struct sk_buff *skb, int offset, 1164fd9beefSAlex Gartrell bool inverse, struct ip_vs_iphdr *iphdr) 117b0e010c5SAlex Gartrell { 1184fd9beefSAlex Gartrell int hdr_flags = IP_VS_HDR_ICMP; 1194fd9beefSAlex Gartrell 1204fd9beefSAlex Gartrell if (inverse) 1214fd9beefSAlex Gartrell hdr_flags |= IP_VS_HDR_INVERSE; 1224fd9beefSAlex Gartrell 1234fd9beefSAlex Gartrell return ip_vs_fill_iph_skb_off(af, skb, offset, hdr_flags, iphdr); 1244fd9beefSAlex Gartrell } 1254fd9beefSAlex Gartrell 1264fd9beefSAlex Gartrell static inline int 1274fd9beefSAlex Gartrell ip_vs_fill_iph_skb(int af, const struct sk_buff *skb, bool inverse, 1284fd9beefSAlex Gartrell struct ip_vs_iphdr *iphdr) 1294fd9beefSAlex Gartrell { 1304fd9beefSAlex Gartrell int hdr_flags = 0; 1314fd9beefSAlex Gartrell 1324fd9beefSAlex Gartrell if (inverse) 1334fd9beefSAlex Gartrell hdr_flags |= IP_VS_HDR_INVERSE; 1344fd9beefSAlex Gartrell 1354fd9beefSAlex Gartrell return ip_vs_fill_iph_skb_off(af, skb, skb_network_offset(skb), 1364fd9beefSAlex Gartrell hdr_flags, iphdr); 1374fd9beefSAlex Gartrell } 1384fd9beefSAlex Gartrell 1394fd9beefSAlex Gartrell static inline bool 1404fd9beefSAlex Gartrell ip_vs_iph_inverse(const struct ip_vs_iphdr *iph) 1414fd9beefSAlex Gartrell { 1424fd9beefSAlex Gartrell return !!(iph->hdr_flags & IP_VS_HDR_INVERSE); 1434fd9beefSAlex Gartrell } 1444fd9beefSAlex Gartrell 1454fd9beefSAlex Gartrell static inline bool 1464fd9beefSAlex Gartrell ip_vs_iph_icmp(const struct ip_vs_iphdr *iph) 1474fd9beefSAlex Gartrell { 1484fd9beefSAlex Gartrell return !!(iph->hdr_flags & IP_VS_HDR_ICMP); 14964aae3cbSJulius Volz } 15064aae3cbSJulius Volz 15164aae3cbSJulius Volz static inline void ip_vs_addr_copy(int af, union nf_inet_addr *dst, 15264aae3cbSJulius Volz const union nf_inet_addr *src) 15364aae3cbSJulius 
Volz { 15464aae3cbSJulius Volz #ifdef CONFIG_IP_VS_IPV6 15564aae3cbSJulius Volz if (af == AF_INET6) 1564e3fd7a0SAlexey Dobriyan dst->in6 = src->in6; 15764aae3cbSJulius Volz else 15864aae3cbSJulius Volz #endif 15964aae3cbSJulius Volz dst->ip = src->ip; 16064aae3cbSJulius Volz } 16164aae3cbSJulius Volz 1629a05475cSJulian Anastasov static inline void ip_vs_addr_set(int af, union nf_inet_addr *dst, 1639a05475cSJulian Anastasov const union nf_inet_addr *src) 1649a05475cSJulian Anastasov { 1659a05475cSJulian Anastasov #ifdef CONFIG_IP_VS_IPV6 1669a05475cSJulian Anastasov if (af == AF_INET6) { 1679a05475cSJulian Anastasov dst->in6 = src->in6; 1689a05475cSJulian Anastasov return; 1699a05475cSJulian Anastasov } 1709a05475cSJulian Anastasov #endif 1719a05475cSJulian Anastasov dst->ip = src->ip; 1729a05475cSJulian Anastasov dst->all[1] = 0; 1739a05475cSJulian Anastasov dst->all[2] = 0; 1749a05475cSJulian Anastasov dst->all[3] = 0; 1759a05475cSJulian Anastasov } 1769a05475cSJulian Anastasov 17764aae3cbSJulius Volz static inline int ip_vs_addr_equal(int af, const union nf_inet_addr *a, 17864aae3cbSJulius Volz const union nf_inet_addr *b) 17964aae3cbSJulius Volz { 18064aae3cbSJulius Volz #ifdef CONFIG_IP_VS_IPV6 18164aae3cbSJulius Volz if (af == AF_INET6) 18264aae3cbSJulius Volz return ipv6_addr_equal(&a->in6, &b->in6); 18364aae3cbSJulius Volz #endif 18464aae3cbSJulius Volz return a->ip == b->ip; 18564aae3cbSJulius Volz } 18664aae3cbSJulius Volz 1871da177e4SLinus Torvalds #ifdef CONFIG_IP_VS_DEBUG 18814c85021SArnaldo Carvalho de Melo #include <linux/net.h> 18914c85021SArnaldo Carvalho de Melo 1905c3a0fd7SJoe Perches int ip_vs_get_debug_level(void); 191c842a3adSJulius Volz 192c842a3adSJulius Volz static inline const char *ip_vs_dbg_addr(int af, char *buf, size_t buf_len, 193c842a3adSJulius Volz const union nf_inet_addr *addr, 194c842a3adSJulius Volz int *idx) 195c842a3adSJulius Volz { 196c842a3adSJulius Volz int len; 197c842a3adSJulius Volz #ifdef CONFIG_IP_VS_IPV6 
198c842a3adSJulius Volz if (af == AF_INET6) 199120b9c14SJesper Dangaard Brouer len = snprintf(&buf[*idx], buf_len - *idx, "[%pI6c]", 2000c6ce78aSHarvey Harrison &addr->in6) + 1; 201c842a3adSJulius Volz else 202c842a3adSJulius Volz #endif 2033685f25dSHarvey Harrison len = snprintf(&buf[*idx], buf_len - *idx, "%pI4", 2043685f25dSHarvey Harrison &addr->ip) + 1; 205c842a3adSJulius Volz 206c842a3adSJulius Volz *idx += len; 207c842a3adSJulius Volz BUG_ON(*idx > buf_len + 1); 208c842a3adSJulius Volz return &buf[*idx - len]; 209c842a3adSJulius Volz } 210c842a3adSJulius Volz 2119aada7acSHannes Eder #define IP_VS_DBG_BUF(level, msg, ...) \ 212c842a3adSJulius Volz do { \ 213c842a3adSJulius Volz char ip_vs_dbg_buf[160]; \ 214c842a3adSJulius Volz int ip_vs_dbg_idx = 0; \ 215c842a3adSJulius Volz if (level <= ip_vs_get_debug_level()) \ 2169aada7acSHannes Eder printk(KERN_DEBUG pr_fmt(msg), ##__VA_ARGS__); \ 217c842a3adSJulius Volz } while (0) 218c842a3adSJulius Volz #define IP_VS_ERR_BUF(msg...) \ 219c842a3adSJulius Volz do { \ 220c842a3adSJulius Volz char ip_vs_dbg_buf[160]; \ 221c842a3adSJulius Volz int ip_vs_dbg_idx = 0; \ 2229aada7acSHannes Eder pr_err(msg); \ 223c842a3adSJulius Volz } while (0) 224c842a3adSJulius Volz 225c842a3adSJulius Volz /* Only use from within IP_VS_DBG_BUF() or IP_VS_ERR_BUF macros */ 226c842a3adSJulius Volz #define IP_VS_DBG_ADDR(af, addr) \ 227c842a3adSJulius Volz ip_vs_dbg_addr(af, ip_vs_dbg_buf, \ 228c842a3adSJulius Volz sizeof(ip_vs_dbg_buf), addr, \ 229c842a3adSJulius Volz &ip_vs_dbg_idx) 230c842a3adSJulius Volz 2319aada7acSHannes Eder #define IP_VS_DBG(level, msg, ...) \ 2321da177e4SLinus Torvalds do { \ 2331da177e4SLinus Torvalds if (level <= ip_vs_get_debug_level()) \ 2349aada7acSHannes Eder printk(KERN_DEBUG pr_fmt(msg), ##__VA_ARGS__); \ 2351da177e4SLinus Torvalds } while (0) 2369aada7acSHannes Eder #define IP_VS_DBG_RL(msg, ...) 
\ 2371da177e4SLinus Torvalds do { \ 2381da177e4SLinus Torvalds if (net_ratelimit()) \ 2399aada7acSHannes Eder printk(KERN_DEBUG pr_fmt(msg), ##__VA_ARGS__); \ 2401da177e4SLinus Torvalds } while (0) 2410d79641aSJulian Anastasov #define IP_VS_DBG_PKT(level, af, pp, skb, ofs, msg) \ 2421da177e4SLinus Torvalds do { \ 2431da177e4SLinus Torvalds if (level <= ip_vs_get_debug_level()) \ 2440d79641aSJulian Anastasov pp->debug_packet(af, pp, skb, ofs, msg); \ 2451da177e4SLinus Torvalds } while (0) 2460d79641aSJulian Anastasov #define IP_VS_DBG_RL_PKT(level, af, pp, skb, ofs, msg) \ 2471da177e4SLinus Torvalds do { \ 2481da177e4SLinus Torvalds if (level <= ip_vs_get_debug_level() && \ 2491da177e4SLinus Torvalds net_ratelimit()) \ 2500d79641aSJulian Anastasov pp->debug_packet(af, pp, skb, ofs, msg); \ 2511da177e4SLinus Torvalds } while (0) 2521da177e4SLinus Torvalds #else /* NO DEBUGGING at ALL */ 253c842a3adSJulius Volz #define IP_VS_DBG_BUF(level, msg...) do {} while (0) 254c842a3adSJulius Volz #define IP_VS_ERR_BUF(msg...) do {} while (0) 2551da177e4SLinus Torvalds #define IP_VS_DBG(level, msg...) do {} while (0) 2561da177e4SLinus Torvalds #define IP_VS_DBG_RL(msg...) do {} while (0) 2570d79641aSJulian Anastasov #define IP_VS_DBG_PKT(level, af, pp, skb, ofs, msg) do {} while (0) 2580d79641aSJulian Anastasov #define IP_VS_DBG_RL_PKT(level, af, pp, skb, ofs, msg) do {} while (0) 2591da177e4SLinus Torvalds #endif 2601da177e4SLinus Torvalds 2611da177e4SLinus Torvalds #define IP_VS_BUG() BUG() 2621e3e238eSHannes Eder #define IP_VS_ERR_RL(msg, ...) 
\ 2631da177e4SLinus Torvalds do { \ 2641da177e4SLinus Torvalds if (net_ratelimit()) \ 2651e3e238eSHannes Eder pr_err(msg, ##__VA_ARGS__); \ 2661da177e4SLinus Torvalds } while (0) 2671da177e4SLinus Torvalds 2681da177e4SLinus Torvalds #ifdef CONFIG_IP_VS_DEBUG 2691da177e4SLinus Torvalds #define EnterFunction(level) \ 2701da177e4SLinus Torvalds do { \ 2711da177e4SLinus Torvalds if (level <= ip_vs_get_debug_level()) \ 2729aada7acSHannes Eder printk(KERN_DEBUG \ 2739aada7acSHannes Eder pr_fmt("Enter: %s, %s line %i\n"), \ 274d5c003b4SHarvey Harrison __func__, __FILE__, __LINE__); \ 2751da177e4SLinus Torvalds } while (0) 2761da177e4SLinus Torvalds #define LeaveFunction(level) \ 2771da177e4SLinus Torvalds do { \ 2781da177e4SLinus Torvalds if (level <= ip_vs_get_debug_level()) \ 2799aada7acSHannes Eder printk(KERN_DEBUG \ 2809aada7acSHannes Eder pr_fmt("Leave: %s, %s line %i\n"), \ 281d5c003b4SHarvey Harrison __func__, __FILE__, __LINE__); \ 2821da177e4SLinus Torvalds } while (0) 2831da177e4SLinus Torvalds #else 2841da177e4SLinus Torvalds #define EnterFunction(level) do {} while (0) 2851da177e4SLinus Torvalds #define LeaveFunction(level) do {} while (0) 2861da177e4SLinus Torvalds #endif 2871da177e4SLinus Torvalds 28807dcc686SSimon Horman /* The port number of FTP service (in network order). 
*/ 289f3a7c66bSHarvey Harrison #define FTPPORT cpu_to_be16(21) 290f3a7c66bSHarvey Harrison #define FTPDATA cpu_to_be16(20) 2911da177e4SLinus Torvalds 29207dcc686SSimon Horman /* TCP State Values */ 2931da177e4SLinus Torvalds enum { 2941da177e4SLinus Torvalds IP_VS_TCP_S_NONE = 0, 2951da177e4SLinus Torvalds IP_VS_TCP_S_ESTABLISHED, 2961da177e4SLinus Torvalds IP_VS_TCP_S_SYN_SENT, 2971da177e4SLinus Torvalds IP_VS_TCP_S_SYN_RECV, 2981da177e4SLinus Torvalds IP_VS_TCP_S_FIN_WAIT, 2991da177e4SLinus Torvalds IP_VS_TCP_S_TIME_WAIT, 3001da177e4SLinus Torvalds IP_VS_TCP_S_CLOSE, 3011da177e4SLinus Torvalds IP_VS_TCP_S_CLOSE_WAIT, 3021da177e4SLinus Torvalds IP_VS_TCP_S_LAST_ACK, 3031da177e4SLinus Torvalds IP_VS_TCP_S_LISTEN, 3041da177e4SLinus Torvalds IP_VS_TCP_S_SYNACK, 3051da177e4SLinus Torvalds IP_VS_TCP_S_LAST 3061da177e4SLinus Torvalds }; 3071da177e4SLinus Torvalds 30807dcc686SSimon Horman /* UDP State Values */ 3091da177e4SLinus Torvalds enum { 3101da177e4SLinus Torvalds IP_VS_UDP_S_NORMAL, 3111da177e4SLinus Torvalds IP_VS_UDP_S_LAST, 3121da177e4SLinus Torvalds }; 3131da177e4SLinus Torvalds 31407dcc686SSimon Horman /* ICMP State Values */ 3151da177e4SLinus Torvalds enum { 3161da177e4SLinus Torvalds IP_VS_ICMP_S_NORMAL, 3171da177e4SLinus Torvalds IP_VS_ICMP_S_LAST, 3181da177e4SLinus Torvalds }; 3191da177e4SLinus Torvalds 32007dcc686SSimon Horman /* SCTP State Values */ 3212906f66aSVenkata Mohan Reddy enum ip_vs_sctp_states { 3222906f66aSVenkata Mohan Reddy IP_VS_SCTP_S_NONE, 32361e7c420SJulian Anastasov IP_VS_SCTP_S_INIT1, 32461e7c420SJulian Anastasov IP_VS_SCTP_S_INIT, 32561e7c420SJulian Anastasov IP_VS_SCTP_S_COOKIE_SENT, 32661e7c420SJulian Anastasov IP_VS_SCTP_S_COOKIE_REPLIED, 32761e7c420SJulian Anastasov IP_VS_SCTP_S_COOKIE_WAIT, 32861e7c420SJulian Anastasov IP_VS_SCTP_S_COOKIE, 32961e7c420SJulian Anastasov IP_VS_SCTP_S_COOKIE_ECHOED, 3302906f66aSVenkata Mohan Reddy IP_VS_SCTP_S_ESTABLISHED, 33161e7c420SJulian Anastasov IP_VS_SCTP_S_SHUTDOWN_SENT, 33261e7c420SJulian 
Anastasov IP_VS_SCTP_S_SHUTDOWN_RECEIVED, 33361e7c420SJulian Anastasov IP_VS_SCTP_S_SHUTDOWN_ACK_SENT, 33461e7c420SJulian Anastasov IP_VS_SCTP_S_REJECTED, 3352906f66aSVenkata Mohan Reddy IP_VS_SCTP_S_CLOSED, 3362906f66aSVenkata Mohan Reddy IP_VS_SCTP_S_LAST 3372906f66aSVenkata Mohan Reddy }; 3382906f66aSVenkata Mohan Reddy 33927541143SJulian Anastasov /* Connection templates use bits from state */ 34027541143SJulian Anastasov #define IP_VS_CTPL_S_NONE 0x0000 34127541143SJulian Anastasov #define IP_VS_CTPL_S_ASSURED 0x0001 34227541143SJulian Anastasov #define IP_VS_CTPL_S_LAST 0x0002 34327541143SJulian Anastasov 34407dcc686SSimon Horman /* Delta sequence info structure 3451da177e4SLinus Torvalds * Each ip_vs_conn has 2 (output AND input seq. changes). 3461da177e4SLinus Torvalds * Only used in the VS/NAT. 3471da177e4SLinus Torvalds */ 3481da177e4SLinus Torvalds struct ip_vs_seq { 3491da177e4SLinus Torvalds __u32 init_seq; /* Add delta from this seq */ 3501da177e4SLinus Torvalds __u32 delta; /* Delta in sequence numbers */ 3511da177e4SLinus Torvalds __u32 previous_delta; /* Delta in sequence numbers 35207dcc686SSimon Horman * before last resized pkt */ 3531da177e4SLinus Torvalds }; 3541da177e4SLinus Torvalds 35507dcc686SSimon Horman /* counters per cpu */ 356b17fc996SHans Schillstrom struct ip_vs_counters { 3571dbd8d9aSJulian Anastasov u64_stats_t conns; /* connections scheduled */ 3581dbd8d9aSJulian Anastasov u64_stats_t inpkts; /* incoming packets */ 3591dbd8d9aSJulian Anastasov u64_stats_t outpkts; /* outgoing packets */ 3601dbd8d9aSJulian Anastasov u64_stats_t inbytes; /* incoming bytes */ 3611dbd8d9aSJulian Anastasov u64_stats_t outbytes; /* outgoing bytes */ 362b17fc996SHans Schillstrom }; 36307dcc686SSimon Horman /* Stats per cpu */ 364b17fc996SHans Schillstrom struct ip_vs_cpu_stats { 365cd67cd5eSJulian Anastasov struct ip_vs_counters cnt; 366b17fc996SHans Schillstrom struct u64_stats_sync syncp; 367b17fc996SHans Schillstrom }; 3681da177e4SLinus Torvalds 
369f0be83d5SJulian Anastasov /* Default nice for estimator kthreads */ 370f0be83d5SJulian Anastasov #define IPVS_EST_NICE 0 371f0be83d5SJulian Anastasov 37207dcc686SSimon Horman /* IPVS statistics objects */ 3733a14a313SSven Wegener struct ip_vs_estimator { 374705dd344SJulian Anastasov struct hlist_node list; 3753a14a313SSven Wegener 3763a14a313SSven Wegener u64 last_inbytes; 3773a14a313SSven Wegener u64 last_outbytes; 378cd67cd5eSJulian Anastasov u64 last_conns; 379cd67cd5eSJulian Anastasov u64 last_inpkts; 380cd67cd5eSJulian Anastasov u64 last_outpkts; 3813a14a313SSven Wegener 382cd67cd5eSJulian Anastasov u64 cps; 383cd67cd5eSJulian Anastasov u64 inpps; 384cd67cd5eSJulian Anastasov u64 outpps; 385cd67cd5eSJulian Anastasov u64 inbps; 386cd67cd5eSJulian Anastasov u64 outbps; 387705dd344SJulian Anastasov 388705dd344SJulian Anastasov s32 ktid:16, /* kthread ID, -1=temp list */ 389705dd344SJulian Anastasov ktrow:8, /* row/tick ID for kthread */ 390705dd344SJulian Anastasov ktcid:8; /* chain ID for kthread tick */ 391cd67cd5eSJulian Anastasov }; 392cd67cd5eSJulian Anastasov 393cd67cd5eSJulian Anastasov /* 394cd67cd5eSJulian Anastasov * IPVS statistics object, 64-bit kernel version of struct ip_vs_stats_user 395cd67cd5eSJulian Anastasov */ 396cd67cd5eSJulian Anastasov struct ip_vs_kstats { 397cd67cd5eSJulian Anastasov u64 conns; /* connections scheduled */ 398cd67cd5eSJulian Anastasov u64 inpkts; /* incoming packets */ 399cd67cd5eSJulian Anastasov u64 outpkts; /* outgoing packets */ 400cd67cd5eSJulian Anastasov u64 inbytes; /* incoming bytes */ 401cd67cd5eSJulian Anastasov u64 outbytes; /* outgoing bytes */ 402cd67cd5eSJulian Anastasov 403cd67cd5eSJulian Anastasov u64 cps; /* current connection rate */ 404cd67cd5eSJulian Anastasov u64 inpps; /* current in packet rate */ 405cd67cd5eSJulian Anastasov u64 outpps; /* current out packet rate */ 406cd67cd5eSJulian Anastasov u64 inbps; /* current in byte rate */ 407cd67cd5eSJulian Anastasov u64 outbps; /* current out byte rate 
*/ 4083a14a313SSven Wegener }; 4093a14a313SSven Wegener 410fd2c3ef7SEric Dumazet struct ip_vs_stats { 411cd67cd5eSJulian Anastasov struct ip_vs_kstats kstats; /* kernel statistics */ 412e9c0ce23SSven Wegener struct ip_vs_estimator est; /* estimator */ 413b962abdcSJulian Anastasov struct ip_vs_cpu_stats __percpu *cpustats; /* per cpu counters */ 4141da177e4SLinus Torvalds spinlock_t lock; /* spin lock */ 415cd67cd5eSJulian Anastasov struct ip_vs_kstats kstats0; /* reset values */ 4161da177e4SLinus Torvalds }; 4171da177e4SLinus Torvalds 4185df7d714SJulian Anastasov struct ip_vs_stats_rcu { 4195df7d714SJulian Anastasov struct ip_vs_stats s; 4205df7d714SJulian Anastasov struct rcu_head rcu_head; 4215df7d714SJulian Anastasov }; 4225df7d714SJulian Anastasov 423de39afb3SJulian Anastasov int ip_vs_stats_init_alloc(struct ip_vs_stats *s); 424de39afb3SJulian Anastasov struct ip_vs_stats *ip_vs_stats_alloc(void); 425de39afb3SJulian Anastasov void ip_vs_stats_release(struct ip_vs_stats *stats); 426de39afb3SJulian Anastasov void ip_vs_stats_free(struct ip_vs_stats *stats); 427de39afb3SJulian Anastasov 428705dd344SJulian Anastasov /* Process estimators in multiple timer ticks (20/50/100, see ktrow) */ 429705dd344SJulian Anastasov #define IPVS_EST_NTICKS 50 430705dd344SJulian Anastasov /* Estimation uses a 2-second period containing ticks (in jiffies) */ 431705dd344SJulian Anastasov #define IPVS_EST_TICK ((2 * HZ) / IPVS_EST_NTICKS) 432705dd344SJulian Anastasov 433705dd344SJulian Anastasov /* Limit of CPU load per kthread (8 for 12.5%), ratio of CPU capacity (1/C). 434705dd344SJulian Anastasov * Value of 4 and above ensures kthreads will take work without exceeding 435705dd344SJulian Anastasov * the CPU capacity under different circumstances. 
436705dd344SJulian Anastasov */ 437705dd344SJulian Anastasov #define IPVS_EST_LOAD_DIVISOR 8 438705dd344SJulian Anastasov 439705dd344SJulian Anastasov /* Kthreads should not have work that exceeds the CPU load above 50% */ 440705dd344SJulian Anastasov #define IPVS_EST_CPU_KTHREADS (IPVS_EST_LOAD_DIVISOR / 2) 441705dd344SJulian Anastasov 442705dd344SJulian Anastasov /* Desired number of chains per timer tick (chain load factor in 100us units), 443705dd344SJulian Anastasov * 48=4.8ms of 40ms tick (12% CPU usage): 444705dd344SJulian Anastasov * 2 sec * 1000 ms in sec * 10 (100us in ms) / 8 (12.5%) / 50 445705dd344SJulian Anastasov */ 446705dd344SJulian Anastasov #define IPVS_EST_CHAIN_FACTOR \ 447705dd344SJulian Anastasov ALIGN_DOWN(2 * 1000 * 10 / IPVS_EST_LOAD_DIVISOR / IPVS_EST_NTICKS, 8) 448705dd344SJulian Anastasov 449705dd344SJulian Anastasov /* Compiled number of chains per tick 450705dd344SJulian Anastasov * The defines should match cond_resched_rcu 451705dd344SJulian Anastasov */ 452705dd344SJulian Anastasov #if defined(CONFIG_DEBUG_ATOMIC_SLEEP) || !defined(CONFIG_PREEMPT_RCU) 453705dd344SJulian Anastasov #define IPVS_EST_TICK_CHAINS IPVS_EST_CHAIN_FACTOR 454705dd344SJulian Anastasov #else 455705dd344SJulian Anastasov #define IPVS_EST_TICK_CHAINS 1 456705dd344SJulian Anastasov #endif 457705dd344SJulian Anastasov 458705dd344SJulian Anastasov #if IPVS_EST_NTICKS > 127 459705dd344SJulian Anastasov #error Too many timer ticks for ktrow 460705dd344SJulian Anastasov #endif 461705dd344SJulian Anastasov 462705dd344SJulian Anastasov /* Multiple chains processed in same tick */ 463705dd344SJulian Anastasov struct ip_vs_est_tick_data { 464*e4d0fe71SJulian Anastasov struct rcu_head rcu_head; 465705dd344SJulian Anastasov struct hlist_head chains[IPVS_EST_TICK_CHAINS]; 466705dd344SJulian Anastasov DECLARE_BITMAP(present, IPVS_EST_TICK_CHAINS); 467705dd344SJulian Anastasov DECLARE_BITMAP(full, IPVS_EST_TICK_CHAINS); 468705dd344SJulian Anastasov int 
chain_len[IPVS_EST_TICK_CHAINS]; 469705dd344SJulian Anastasov }; 470705dd344SJulian Anastasov 471705dd344SJulian Anastasov /* Context for estimation kthread */ 472705dd344SJulian Anastasov struct ip_vs_est_kt_data { 473705dd344SJulian Anastasov struct netns_ipvs *ipvs; 474705dd344SJulian Anastasov struct task_struct *task; /* task if running */ 475705dd344SJulian Anastasov struct ip_vs_est_tick_data __rcu *ticks[IPVS_EST_NTICKS]; 476705dd344SJulian Anastasov DECLARE_BITMAP(avail, IPVS_EST_NTICKS); /* tick has space for ests */ 477705dd344SJulian Anastasov unsigned long est_timer; /* estimation timer (jiffies) */ 478705dd344SJulian Anastasov struct ip_vs_stats *calc_stats; /* Used for calculation */ 479705dd344SJulian Anastasov int tick_len[IPVS_EST_NTICKS]; /* est count */ 480705dd344SJulian Anastasov int id; /* ktid per netns */ 481705dd344SJulian Anastasov int chain_max; /* max ests per tick chain */ 482705dd344SJulian Anastasov int tick_max; /* max ests per tick */ 483705dd344SJulian Anastasov int est_count; /* attached ests to kthread */ 484705dd344SJulian Anastasov int est_max_count; /* max ests per kthread */ 485705dd344SJulian Anastasov int add_row; /* row for new ests */ 486705dd344SJulian Anastasov int est_row; /* estimated row */ 487705dd344SJulian Anastasov }; 488705dd344SJulian Anastasov 48914c85021SArnaldo Carvalho de Melo struct dst_entry; 49014c85021SArnaldo Carvalho de Melo struct iphdr; 4911da177e4SLinus Torvalds struct ip_vs_conn; 4921da177e4SLinus Torvalds struct ip_vs_app; 49314c85021SArnaldo Carvalho de Melo struct sk_buff; 494252c6410SHans Schillstrom struct ip_vs_proto_data; 4951da177e4SLinus Torvalds 4961da177e4SLinus Torvalds struct ip_vs_protocol { 4971da177e4SLinus Torvalds struct ip_vs_protocol *next; 4981da177e4SLinus Torvalds char *name; 4992ad17defSJulian Anastasov u16 protocol; 5002ad17defSJulian Anastasov u16 num_states; 5011da177e4SLinus Torvalds int dont_defrag; 5021da177e4SLinus Torvalds 5031da177e4SLinus Torvalds void 
(*init)(struct ip_vs_protocol *pp); 5041da177e4SLinus Torvalds 5051da177e4SLinus Torvalds void (*exit)(struct ip_vs_protocol *pp); 5061da177e4SLinus Torvalds 5071281a9c2SEric W. Biederman int (*init_netns)(struct netns_ipvs *ipvs, struct ip_vs_proto_data *pd); 508252c6410SHans Schillstrom 5091281a9c2SEric W. Biederman void (*exit_netns)(struct netns_ipvs *ipvs, struct ip_vs_proto_data *pd); 510252c6410SHans Schillstrom 511d8f44c33SEric W. Biederman int (*conn_schedule)(struct netns_ipvs *ipvs, 512d8f44c33SEric W. Biederman int af, struct sk_buff *skb, 5139330419dSHans Schillstrom struct ip_vs_proto_data *pd, 514d4383f04SJesper Dangaard Brouer int *verdict, struct ip_vs_conn **cpp, 515d4383f04SJesper Dangaard Brouer struct ip_vs_iphdr *iph); 5161da177e4SLinus Torvalds 5171da177e4SLinus Torvalds struct ip_vs_conn * 518ab161976SEric W. Biederman (*conn_in_get)(struct netns_ipvs *ipvs, 519ab161976SEric W. Biederman int af, 52051ef348bSJulius Volz const struct sk_buff *skb, 521802c41adSAlex Gartrell const struct ip_vs_iphdr *iph); 5221da177e4SLinus Torvalds 5231da177e4SLinus Torvalds struct ip_vs_conn * 5240cf705c8SEric W. Biederman (*conn_out_get)(struct netns_ipvs *ipvs, 5250cf705c8SEric W. 
Biederman int af, 52651ef348bSJulius Volz const struct sk_buff *skb, 527802c41adSAlex Gartrell const struct ip_vs_iphdr *iph); 5281da177e4SLinus Torvalds 529d4383f04SJesper Dangaard Brouer int (*snat_handler)(struct sk_buff *skb, struct ip_vs_protocol *pp, 530d4383f04SJesper Dangaard Brouer struct ip_vs_conn *cp, struct ip_vs_iphdr *iph); 5311da177e4SLinus Torvalds 532d4383f04SJesper Dangaard Brouer int (*dnat_handler)(struct sk_buff *skb, struct ip_vs_protocol *pp, 533d4383f04SJesper Dangaard Brouer struct ip_vs_conn *cp, struct ip_vs_iphdr *iph); 5341da177e4SLinus Torvalds 5351da177e4SLinus Torvalds const char *(*state_name)(int state); 5361da177e4SLinus Torvalds 5374a516f11SSimon Horman void (*state_transition)(struct ip_vs_conn *cp, int direction, 5381da177e4SLinus Torvalds const struct sk_buff *skb, 5399330419dSHans Schillstrom struct ip_vs_proto_data *pd); 5401da177e4SLinus Torvalds 54119648918SEric W. Biederman int (*register_app)(struct netns_ipvs *ipvs, struct ip_vs_app *inc); 5421da177e4SLinus Torvalds 54319648918SEric W. 
Biederman void (*unregister_app)(struct netns_ipvs *ipvs, struct ip_vs_app *inc); 5441da177e4SLinus Torvalds 5451da177e4SLinus Torvalds int (*app_conn_bind)(struct ip_vs_conn *cp); 5461da177e4SLinus Torvalds 5470d79641aSJulian Anastasov void (*debug_packet)(int af, struct ip_vs_protocol *pp, 5481da177e4SLinus Torvalds const struct sk_buff *skb, 5491da177e4SLinus Torvalds int offset, 5501da177e4SLinus Torvalds const char *msg); 5511da177e4SLinus Torvalds 5529330419dSHans Schillstrom void (*timeout_change)(struct ip_vs_proto_data *pd, int flags); 5531da177e4SLinus Torvalds }; 5541da177e4SLinus Torvalds 55507dcc686SSimon Horman /* protocol data per netns */ 556252c6410SHans Schillstrom struct ip_vs_proto_data { 557252c6410SHans Schillstrom struct ip_vs_proto_data *next; 558252c6410SHans Schillstrom struct ip_vs_protocol *pp; 559252c6410SHans Schillstrom int *timeout_table; /* protocol timeout table */ 560252c6410SHans Schillstrom atomic_t appcnt; /* counter of proto app incs. */ 561252c6410SHans Schillstrom struct tcp_states_t *tcp_state_table; 562252c6410SHans Schillstrom }; 563252c6410SHans Schillstrom 5645c3a0fd7SJoe Perches struct ip_vs_protocol *ip_vs_proto_get(unsigned short proto); 56518d6ade6SEric W. Biederman struct ip_vs_proto_data *ip_vs_proto_data_get(struct netns_ipvs *ipvs, 566252c6410SHans Schillstrom unsigned short proto); 5671da177e4SLinus Torvalds 568f11017ecSSimon Horman struct ip_vs_conn_param { 569e64e2b46SEric W. 
Biederman struct netns_ipvs *ipvs; 570f11017ecSSimon Horman const union nf_inet_addr *caddr; 571f11017ecSSimon Horman const union nf_inet_addr *vaddr; 572f11017ecSSimon Horman __be16 cport; 573f11017ecSSimon Horman __be16 vport; 574f11017ecSSimon Horman __u16 protocol; 575f11017ecSSimon Horman u16 af; 57685999283SSimon Horman 57785999283SSimon Horman const struct ip_vs_pe *pe; 57885999283SSimon Horman char *pe_data; 57985999283SSimon Horman __u8 pe_data_len; 580f11017ecSSimon Horman }; 581f11017ecSSimon Horman 58207dcc686SSimon Horman /* IP_VS structure allocated for each dynamically scheduled connection */ 5831da177e4SLinus Torvalds struct ip_vs_conn { 584731109e7SChangli Gao struct hlist_node c_list; /* hashed list heads */ 5851da177e4SLinus Torvalds /* Protocol, addresses and port numbers */ 5866e67e586SHans Schillstrom __be16 cport; 5876e67e586SHans Schillstrom __be16 dport; 5881845ed0bSJulian Anastasov __be16 vport; 5891845ed0bSJulian Anastasov u16 af; /* address family */ 590e7ade46aSJulius Volz union nf_inet_addr caddr; /* client address */ 591e7ade46aSJulius Volz union nf_inet_addr vaddr; /* virtual address */ 592e7ade46aSJulius Volz union nf_inet_addr daddr; /* destination address */ 5933575792eSJulian Anastasov volatile __u32 flags; /* status flags */ 5941da177e4SLinus Torvalds __u16 protocol; /* Which protocol (TCP/UDP) */ 595ba38528aSAlex Gartrell __u16 daf; /* Address family of the dest */ 59658dbc6f2SEric W. 
Biederman struct netns_ipvs *ipvs; 5971da177e4SLinus Torvalds 5981da177e4SLinus Torvalds /* counter and timer */ 599b54ab92bSReshetova, Elena refcount_t refcnt; /* reference count */ 6001da177e4SLinus Torvalds struct timer_list timer; /* Expiration timer */ 6011da177e4SLinus Torvalds volatile unsigned long timeout; /* timeout */ 6021da177e4SLinus Torvalds 6031da177e4SLinus Torvalds /* Flags and state transition */ 6041da177e4SLinus Torvalds spinlock_t lock; /* lock for state transition */ 6051da177e4SLinus Torvalds volatile __u16 state; /* state info */ 606efac5276SRumen G. Bogdanovski volatile __u16 old_state; /* old state, to be used for 607efac5276SRumen G. Bogdanovski * state transition triggerd 608efac5276SRumen G. Bogdanovski * synchronization 609efac5276SRumen G. Bogdanovski */ 6101845ed0bSJulian Anastasov __u32 fwmark; /* Fire wall mark from skb */ 611749c42b6SJulian Anastasov unsigned long sync_endtime; /* jiffies + sent_retries */ 6121da177e4SLinus Torvalds 6131da177e4SLinus Torvalds /* Control members */ 6141da177e4SLinus Torvalds struct ip_vs_conn *control; /* Master control connection */ 6151da177e4SLinus Torvalds atomic_t n_control; /* Number of controlled ones */ 6161da177e4SLinus Torvalds struct ip_vs_dest *dest; /* real server */ 6171da177e4SLinus Torvalds atomic_t in_pkts; /* incoming packet counter */ 6181da177e4SLinus Torvalds 61907dcc686SSimon Horman /* Packet transmitter for different forwarding methods. If it 62007dcc686SSimon Horman * mangles the packet, it must return NF_DROP or better NF_STOLEN, 62107dcc686SSimon Horman * otherwise this must be changed to a sk_buff **. 62207dcc686SSimon Horman * NF_ACCEPT can be returned when destination is local. 
6231da177e4SLinus Torvalds */ 6241da177e4SLinus Torvalds int (*packet_xmit)(struct sk_buff *skb, struct ip_vs_conn *cp, 625d4383f04SJesper Dangaard Brouer struct ip_vs_protocol *pp, struct ip_vs_iphdr *iph); 6261da177e4SLinus Torvalds 6271da177e4SLinus Torvalds /* Note: we can group the following members into a structure, 62807dcc686SSimon Horman * in order to save more space, and the following members are 62907dcc686SSimon Horman * only used in VS/NAT anyway 63007dcc686SSimon Horman */ 6311da177e4SLinus Torvalds struct ip_vs_app *app; /* bound ip_vs_app object */ 6321da177e4SLinus Torvalds void *app_data; /* Application private data */ 6331da177e4SLinus Torvalds struct ip_vs_seq in_seq; /* incoming seq. struct */ 6341da177e4SLinus Torvalds struct ip_vs_seq out_seq; /* outgoing seq. struct */ 63585999283SSimon Horman 636e9e5eee8SSimon Horman const struct ip_vs_pe *pe; 63785999283SSimon Horman char *pe_data; 63885999283SSimon Horman __u8 pe_data_len; 639088339a5SJulian Anastasov 640088339a5SJulian Anastasov struct rcu_head rcu_head; 6411da177e4SLinus Torvalds }; 6421da177e4SLinus Torvalds 64307dcc686SSimon Horman /* Extended internal versions of struct ip_vs_service_user and ip_vs_dest_user 64407dcc686SSimon Horman * for IPv6 support. 645c860c6b1SJulius Volz * 646c860c6b1SJulius Volz * We need these to conveniently pass around service and destination 647c860c6b1SJulius Volz * options, but unfortunately, we also need to keep the old definitions to 648c860c6b1SJulius Volz * maintain userspace backwards compatibility for the setsockopt interface. 
649c860c6b1SJulius Volz */ 650c860c6b1SJulius Volz struct ip_vs_service_user_kern { 651c860c6b1SJulius Volz /* virtual service addresses */ 652c860c6b1SJulius Volz u16 af; 653c860c6b1SJulius Volz u16 protocol; 654c860c6b1SJulius Volz union nf_inet_addr addr; /* virtual ip address */ 6550a925864SJulian Anastasov __be16 port; 656c860c6b1SJulius Volz u32 fwmark; /* firwall mark of service */ 657c860c6b1SJulius Volz 658c860c6b1SJulius Volz /* virtual service options */ 659c860c6b1SJulius Volz char *sched_name; 6600d1e71b0SSimon Horman char *pe_name; 66195c96174SEric Dumazet unsigned int flags; /* virtual service flags */ 66295c96174SEric Dumazet unsigned int timeout; /* persistent timeout in sec */ 6630a925864SJulian Anastasov __be32 netmask; /* persistent netmask or plen */ 664c860c6b1SJulius Volz }; 665c860c6b1SJulius Volz 666c860c6b1SJulius Volz 667c860c6b1SJulius Volz struct ip_vs_dest_user_kern { 668c860c6b1SJulius Volz /* destination server address */ 669c860c6b1SJulius Volz union nf_inet_addr addr; 6700a925864SJulian Anastasov __be16 port; 671c860c6b1SJulius Volz 672c860c6b1SJulius Volz /* real server options */ 67395c96174SEric Dumazet unsigned int conn_flags; /* connection flags */ 674c860c6b1SJulius Volz int weight; /* destination weight */ 675c860c6b1SJulius Volz 676c860c6b1SJulius Volz /* thresholds for active connections */ 677c860c6b1SJulius Volz u32 u_threshold; /* upper threshold */ 678c860c6b1SJulius Volz u32 l_threshold; /* lower threshold */ 6796cff339bSAlex Gartrell 6806cff339bSAlex Gartrell /* Address family of addr */ 6816cff339bSAlex Gartrell u16 af; 68284c0d5e9SJacky Hu 68384c0d5e9SJacky Hu u16 tun_type; /* tunnel type */ 68484c0d5e9SJacky Hu __be16 tun_port; /* tunnel port */ 68529930e31SJacky Hu u16 tun_flags; /* tunnel flags */ 686c860c6b1SJulius Volz }; 687c860c6b1SJulius Volz 688c860c6b1SJulius Volz 689c860c6b1SJulius Volz /* 69007dcc686SSimon Horman * The information about the virtual service offered to the net and the 69107dcc686SSimon 
Horman * forwarding entries. 6921da177e4SLinus Torvalds */ 6931da177e4SLinus Torvalds struct ip_vs_service { 694ceec4c38SJulian Anastasov struct hlist_node s_list; /* for normal service table */ 695ceec4c38SJulian Anastasov struct hlist_node f_list; /* for fwmark-based service table */ 6961da177e4SLinus Torvalds atomic_t refcnt; /* reference counter */ 6971da177e4SLinus Torvalds 698e7ade46aSJulius Volz u16 af; /* address family */ 6991da177e4SLinus Torvalds __u16 protocol; /* which protocol (TCP/UDP) */ 700e7ade46aSJulius Volz union nf_inet_addr addr; /* IP address for virtual service */ 701014d730dSAl Viro __be16 port; /* port number for the service */ 7021da177e4SLinus Torvalds __u32 fwmark; /* firewall mark of the service */ 70395c96174SEric Dumazet unsigned int flags; /* service status flags */ 70495c96174SEric Dumazet unsigned int timeout; /* persistent timeout in ticks */ 7050a925864SJulian Anastasov __be32 netmask; /* grouping granularity, mask/plen */ 7063109d2f2SEric W. Biederman struct netns_ipvs *ipvs; 7071da177e4SLinus Torvalds 7081da177e4SLinus Torvalds struct list_head destinations; /* real server d-linked list */ 7091da177e4SLinus Torvalds __u32 num_dests; /* number of servers */ 7101da177e4SLinus Torvalds struct ip_vs_stats stats; /* statistics for the service */ 7111da177e4SLinus Torvalds 7121da177e4SLinus Torvalds /* for scheduling */ 713ceec4c38SJulian Anastasov struct ip_vs_scheduler __rcu *scheduler; /* bound scheduler object */ 714ba3a3ce1SJulian Anastasov spinlock_t sched_lock; /* lock sched_data */ 7151da177e4SLinus Torvalds void *sched_data; /* scheduler application data */ 71685999283SSimon Horman 71785999283SSimon Horman /* alternate persistence engine */ 718ceec4c38SJulian Anastasov struct ip_vs_pe __rcu *pe; 71931875d49SJulian Anastasov int conntrack_afmask; 720ceec4c38SJulian Anastasov 721ceec4c38SJulian Anastasov struct rcu_head rcu_head; 7221da177e4SLinus Torvalds }; 7231da177e4SLinus Torvalds 724026ace06SJulian Anastasov /* 
Information for cached dst */ 725026ace06SJulian Anastasov struct ip_vs_dest_dst { 726026ace06SJulian Anastasov struct dst_entry *dst_cache; /* destination cache entry */ 727026ace06SJulian Anastasov u32 dst_cookie; 728026ace06SJulian Anastasov union nf_inet_addr dst_saddr; 729026ace06SJulian Anastasov struct rcu_head rcu_head; 730026ace06SJulian Anastasov }; 7311da177e4SLinus Torvalds 73207dcc686SSimon Horman /* The real server destination forwarding entry with ip address, port number, 73307dcc686SSimon Horman * and so on. 7341da177e4SLinus Torvalds */ 7351da177e4SLinus Torvalds struct ip_vs_dest { 7361da177e4SLinus Torvalds struct list_head n_list; /* for the dests in the service */ 737276472eaSJulian Anastasov struct hlist_node d_list; /* for table with all the dests */ 7381da177e4SLinus Torvalds 739e7ade46aSJulius Volz u16 af; /* address family */ 740014d730dSAl Viro __be16 port; /* port number of the server */ 741f2431e6eSHans Schillstrom union nf_inet_addr addr; /* IP address of the server */ 74295c96174SEric Dumazet volatile unsigned int flags; /* dest status flags */ 7431da177e4SLinus Torvalds atomic_t conn_flags; /* flags to copy to conn */ 7441da177e4SLinus Torvalds atomic_t weight; /* server weight */ 745a2c09ac0SInju Song atomic_t last_weight; /* server latest weight */ 74684c0d5e9SJacky Hu __u16 tun_type; /* tunnel type */ 74784c0d5e9SJacky Hu __be16 tun_port; /* tunnel port */ 74829930e31SJacky Hu __u16 tun_flags; /* tunnel flags */ 7491da177e4SLinus Torvalds 750b54ab92bSReshetova, Elena refcount_t refcnt; /* reference counter */ 7511da177e4SLinus Torvalds struct ip_vs_stats stats; /* statistics */ 752bcbde4c0SJulian Anastasov unsigned long idle_start; /* start time, jiffies */ 7531da177e4SLinus Torvalds 7541da177e4SLinus Torvalds /* connection counters and thresholds */ 7551da177e4SLinus Torvalds atomic_t activeconns; /* active connections */ 7561da177e4SLinus Torvalds atomic_t inactconns; /* inactive connections */ 7571da177e4SLinus Torvalds 
atomic_t persistconns; /* persistent connections */ 7581da177e4SLinus Torvalds __u32 u_threshold; /* upper threshold */ 7591da177e4SLinus Torvalds __u32 l_threshold; /* lower threshold */ 7601da177e4SLinus Torvalds 7611da177e4SLinus Torvalds /* for destination cache */ 7621da177e4SLinus Torvalds spinlock_t dst_lock; /* lock of dst_cache */ 763026ace06SJulian Anastasov struct ip_vs_dest_dst __rcu *dest_dst; /* cached dst info */ 7641da177e4SLinus Torvalds 7651da177e4SLinus Torvalds /* for virtual service */ 766bcbde4c0SJulian Anastasov struct ip_vs_service __rcu *svc; /* service it belongs to */ 7671da177e4SLinus Torvalds __u16 protocol; /* which protocol (TCP/UDP) */ 768014d730dSAl Viro __be16 vport; /* virtual port number */ 769f2431e6eSHans Schillstrom union nf_inet_addr vaddr; /* virtual IP address */ 7701da177e4SLinus Torvalds __u32 vfwmark; /* firewall mark of service */ 771276472eaSJulian Anastasov 7725df7d714SJulian Anastasov struct rcu_head rcu_head; 773578bc3efSJulian Anastasov struct list_head t_list; /* in dest_trash */ 774276472eaSJulian Anastasov unsigned int in_rs_table:1; /* we are in rs_table */ 7751da177e4SLinus Torvalds }; 7761da177e4SLinus Torvalds 77707dcc686SSimon Horman /* The scheduler object */ 7781da177e4SLinus Torvalds struct ip_vs_scheduler { 7791da177e4SLinus Torvalds struct list_head n_list; /* d-linked list head */ 7801da177e4SLinus Torvalds char *name; /* scheduler name */ 7811da177e4SLinus Torvalds atomic_t refcnt; /* reference counter */ 7821da177e4SLinus Torvalds struct module *module; /* THIS_MODULE/NULL */ 7831da177e4SLinus Torvalds 7841da177e4SLinus Torvalds /* scheduler initializing service */ 7851da177e4SLinus Torvalds int (*init_service)(struct ip_vs_service *svc); 7861da177e4SLinus Torvalds /* scheduling service finish */ 787ed3ffc4eSJulian Anastasov void (*done_service)(struct ip_vs_service *svc); 7886b6df466SJulian Anastasov /* dest is linked */ 7896b6df466SJulian Anastasov int (*add_dest)(struct ip_vs_service *svc, struct 
ip_vs_dest *dest); 7906b6df466SJulian Anastasov /* dest is unlinked */ 7916b6df466SJulian Anastasov int (*del_dest)(struct ip_vs_service *svc, struct ip_vs_dest *dest); 7926b6df466SJulian Anastasov /* dest is updated */ 7936b6df466SJulian Anastasov int (*upd_dest)(struct ip_vs_service *svc, struct ip_vs_dest *dest); 7941da177e4SLinus Torvalds 7951da177e4SLinus Torvalds /* selecting a server from the given service */ 7961da177e4SLinus Torvalds struct ip_vs_dest* (*schedule)(struct ip_vs_service *svc, 797bba54de5SJulian Anastasov const struct sk_buff *skb, 798bba54de5SJulian Anastasov struct ip_vs_iphdr *iph); 7991da177e4SLinus Torvalds }; 8001da177e4SLinus Torvalds 80185999283SSimon Horman /* The persistence engine object */ 80285999283SSimon Horman struct ip_vs_pe { 80385999283SSimon Horman struct list_head n_list; /* d-linked list head */ 80485999283SSimon Horman char *name; /* scheduler name */ 80585999283SSimon Horman atomic_t refcnt; /* reference counter */ 80685999283SSimon Horman struct module *module; /* THIS_MODULE/NULL */ 80785999283SSimon Horman 80885999283SSimon Horman /* get the connection template, if any */ 80985999283SSimon Horman int (*fill_param)(struct ip_vs_conn_param *p, struct sk_buff *skb); 81085999283SSimon Horman bool (*ct_match)(const struct ip_vs_conn_param *p, 81185999283SSimon Horman struct ip_vs_conn *ct); 81285999283SSimon Horman u32 (*hashkey_raw)(const struct ip_vs_conn_param *p, u32 initval, 81385999283SSimon Horman bool inverse); 814a3c918acSSimon Horman int (*show_pe_data)(const struct ip_vs_conn *cp, char *buf); 81539b97223SMarco Angaroni /* create connections for real-server outgoing packets */ 81639b97223SMarco Angaroni struct ip_vs_conn* (*conn_out)(struct ip_vs_service *svc, 81739b97223SMarco Angaroni struct ip_vs_dest *dest, 81839b97223SMarco Angaroni struct sk_buff *skb, 81939b97223SMarco Angaroni const struct ip_vs_iphdr *iph, 82039b97223SMarco Angaroni __be16 dport, __be16 cport); 82185999283SSimon Horman }; 
8221da177e4SLinus Torvalds 82307dcc686SSimon Horman /* The application module object (a.k.a. app incarnation) */ 824fd2c3ef7SEric Dumazet struct ip_vs_app { 8251da177e4SLinus Torvalds struct list_head a_list; /* member in app list */ 8261da177e4SLinus Torvalds int type; /* IP_VS_APP_TYPE_xxx */ 8271da177e4SLinus Torvalds char *name; /* application module name */ 8281da177e4SLinus Torvalds __u16 protocol; 8291da177e4SLinus Torvalds struct module *module; /* THIS_MODULE/NULL */ 8301da177e4SLinus Torvalds struct list_head incs_list; /* list of incarnations */ 8311da177e4SLinus Torvalds 8321da177e4SLinus Torvalds /* members for application incarnations */ 8331da177e4SLinus Torvalds struct list_head p_list; /* member in proto app list */ 8341da177e4SLinus Torvalds struct ip_vs_app *app; /* its real application */ 835014d730dSAl Viro __be16 port; /* port number in net order */ 8361da177e4SLinus Torvalds atomic_t usecnt; /* usage counter */ 837363c97d7SJulian Anastasov struct rcu_head rcu_head; 8381da177e4SLinus Torvalds 83907dcc686SSimon Horman /* output hook: Process packet in inout direction, diff set for TCP. 8408b27b10fSJulian Anastasov * Return: 0=Error, 1=Payload Not Mangled/Mangled but checksum is ok, 8418b27b10fSJulian Anastasov * 2=Mangled but checksum was not updated 8428b27b10fSJulian Anastasov */ 8431da177e4SLinus Torvalds int (*pkt_out)(struct ip_vs_app *, struct ip_vs_conn *, 844d12e1229SJulian Anastasov struct sk_buff *, int *diff, struct ip_vs_iphdr *ipvsh); 8451da177e4SLinus Torvalds 84607dcc686SSimon Horman /* input hook: Process packet in outin direction, diff set for TCP. 
8478b27b10fSJulian Anastasov * Return: 0=Error, 1=Payload Not Mangled/Mangled but checksum is ok, 8488b27b10fSJulian Anastasov * 2=Mangled but checksum was not updated 8498b27b10fSJulian Anastasov */ 8501da177e4SLinus Torvalds int (*pkt_in)(struct ip_vs_app *, struct ip_vs_conn *, 851d12e1229SJulian Anastasov struct sk_buff *, int *diff, struct ip_vs_iphdr *ipvsh); 8521da177e4SLinus Torvalds 8531da177e4SLinus Torvalds /* ip_vs_app initializer */ 8541da177e4SLinus Torvalds int (*init_conn)(struct ip_vs_app *, struct ip_vs_conn *); 8551da177e4SLinus Torvalds 8561da177e4SLinus Torvalds /* ip_vs_app finish */ 8571da177e4SLinus Torvalds int (*done_conn)(struct ip_vs_app *, struct ip_vs_conn *); 8581da177e4SLinus Torvalds 8591da177e4SLinus Torvalds 8601da177e4SLinus Torvalds /* not used now */ 8611da177e4SLinus Torvalds int (*bind_conn)(struct ip_vs_app *, struct ip_vs_conn *, 8621da177e4SLinus Torvalds struct ip_vs_protocol *); 8631da177e4SLinus Torvalds 8641da177e4SLinus Torvalds void (*unbind_conn)(struct ip_vs_app *, struct ip_vs_conn *); 8651da177e4SLinus Torvalds 8661da177e4SLinus Torvalds int * timeout_table; 8671da177e4SLinus Torvalds int * timeouts; 8681da177e4SLinus Torvalds int timeouts_size; 8691da177e4SLinus Torvalds 8701da177e4SLinus Torvalds int (*conn_schedule)(struct sk_buff *skb, struct ip_vs_app *app, 8711da177e4SLinus Torvalds int *verdict, struct ip_vs_conn **cpp); 8721da177e4SLinus Torvalds 8731da177e4SLinus Torvalds struct ip_vs_conn * 8741da177e4SLinus Torvalds (*conn_in_get)(const struct sk_buff *skb, struct ip_vs_app *app, 875d4383f04SJesper Dangaard Brouer const struct iphdr *iph, int inverse); 8761da177e4SLinus Torvalds 8771da177e4SLinus Torvalds struct ip_vs_conn * 8781da177e4SLinus Torvalds (*conn_out_get)(const struct sk_buff *skb, struct ip_vs_app *app, 879d4383f04SJesper Dangaard Brouer const struct iphdr *iph, int inverse); 8801da177e4SLinus Torvalds 8811da177e4SLinus Torvalds int (*state_transition)(struct ip_vs_conn *cp, int direction, 
8821da177e4SLinus Torvalds const struct sk_buff *skb, 8831da177e4SLinus Torvalds struct ip_vs_app *app); 8841da177e4SLinus Torvalds 8851da177e4SLinus Torvalds void (*timeout_change)(struct ip_vs_app *app, int flags); 8861da177e4SLinus Torvalds }; 8871da177e4SLinus Torvalds 888f73181c8SPablo Neira Ayuso struct ipvs_master_sync_state { 889f73181c8SPablo Neira Ayuso struct list_head sync_queue; 890f73181c8SPablo Neira Ayuso struct ip_vs_sync_buff *sync_buff; 89107995674SZhang Yanfei unsigned long sync_queue_len; 892f73181c8SPablo Neira Ayuso unsigned int sync_queue_delay; 893f73181c8SPablo Neira Ayuso struct delayed_work master_wakeup_work; 894f73181c8SPablo Neira Ayuso struct netns_ipvs *ipvs; 895f73181c8SPablo Neira Ayuso }; 896f73181c8SPablo Neira Ayuso 8975db7c8b9SJulian Anastasov struct ip_vs_sync_thread_data; 8985db7c8b9SJulian Anastasov 899578bc3efSJulian Anastasov /* How much time to keep dests in trash */ 900578bc3efSJulian Anastasov #define IP_VS_DEST_TRASH_PERIOD (120 * HZ) 901578bc3efSJulian Anastasov 902e4ff6751SJulian Anastasov struct ipvs_sync_daemon_cfg { 903d3328817SJulian Anastasov union nf_inet_addr mcast_group; 904e4ff6751SJulian Anastasov int syncid; 905e4ff6751SJulian Anastasov u16 sync_maxlen; 906d3328817SJulian Anastasov u16 mcast_port; 907d3328817SJulian Anastasov u8 mcast_af; 908d3328817SJulian Anastasov u8 mcast_ttl; 909e4ff6751SJulian Anastasov /* multicast interface name */ 910e4ff6751SJulian Anastasov char mcast_ifn[IP_VS_IFNAME_MAXLEN]; 911e4ff6751SJulian Anastasov }; 912e4ff6751SJulian Anastasov 9132553d064SJulian Anastasov /* IPVS in network namespace */ 9142553d064SJulian Anastasov struct netns_ipvs { 9152553d064SJulian Anastasov int gen; /* Generation */ 9167a4f0761SHans Schillstrom int enable; /* enable like nf_hooks do */ 91707dcc686SSimon Horman /* Hash table: for real service lookups */ 9182553d064SJulian Anastasov #define IP_VS_RTAB_BITS 4 9192553d064SJulian Anastasov #define IP_VS_RTAB_SIZE (1 << IP_VS_RTAB_BITS) 
9202553d064SJulian Anastasov #define IP_VS_RTAB_MASK (IP_VS_RTAB_SIZE - 1) 9212553d064SJulian Anastasov 922276472eaSJulian Anastasov struct hlist_head rs_table[IP_VS_RTAB_SIZE]; 9232553d064SJulian Anastasov /* ip_vs_app */ 9242553d064SJulian Anastasov struct list_head app_list; 9252553d064SJulian Anastasov /* ip_vs_proto */ 9262553d064SJulian Anastasov #define IP_VS_PROTO_TAB_SIZE 32 /* must be power of 2 */ 9272553d064SJulian Anastasov struct ip_vs_proto_data *proto_data_table[IP_VS_PROTO_TAB_SIZE]; 9282553d064SJulian Anastasov /* ip_vs_proto_tcp */ 9292553d064SJulian Anastasov #ifdef CONFIG_IP_VS_PROTO_TCP 9302553d064SJulian Anastasov #define TCP_APP_TAB_BITS 4 9312553d064SJulian Anastasov #define TCP_APP_TAB_SIZE (1 << TCP_APP_TAB_BITS) 9322553d064SJulian Anastasov #define TCP_APP_TAB_MASK (TCP_APP_TAB_SIZE - 1) 9332553d064SJulian Anastasov struct list_head tcp_apps[TCP_APP_TAB_SIZE]; 9342553d064SJulian Anastasov #endif 9352553d064SJulian Anastasov /* ip_vs_proto_udp */ 9362553d064SJulian Anastasov #ifdef CONFIG_IP_VS_PROTO_UDP 9372553d064SJulian Anastasov #define UDP_APP_TAB_BITS 4 9382553d064SJulian Anastasov #define UDP_APP_TAB_SIZE (1 << UDP_APP_TAB_BITS) 9392553d064SJulian Anastasov #define UDP_APP_TAB_MASK (UDP_APP_TAB_SIZE - 1) 9402553d064SJulian Anastasov struct list_head udp_apps[UDP_APP_TAB_SIZE]; 9412553d064SJulian Anastasov #endif 9422553d064SJulian Anastasov /* ip_vs_proto_sctp */ 9432553d064SJulian Anastasov #ifdef CONFIG_IP_VS_PROTO_SCTP 9442553d064SJulian Anastasov #define SCTP_APP_TAB_BITS 4 9452553d064SJulian Anastasov #define SCTP_APP_TAB_SIZE (1 << SCTP_APP_TAB_BITS) 9462553d064SJulian Anastasov #define SCTP_APP_TAB_MASK (SCTP_APP_TAB_SIZE - 1) 9472553d064SJulian Anastasov /* Hash table for SCTP application incarnations */ 9482553d064SJulian Anastasov struct list_head sctp_apps[SCTP_APP_TAB_SIZE]; 9492553d064SJulian Anastasov #endif 9502553d064SJulian Anastasov /* ip_vs_conn */ 9512553d064SJulian Anastasov atomic_t conn_count; /* connection 
counter */ 9522553d064SJulian Anastasov 9532553d064SJulian Anastasov /* ip_vs_ctl */ 9545df7d714SJulian Anastasov struct ip_vs_stats_rcu *tot_stats; /* Statistics & est. */ 9552553d064SJulian Anastasov 9562553d064SJulian Anastasov int num_services; /* no of virtual services */ 957857ca897SJulian Anastasov int num_services6; /* IPv6 virtual services */ 958f2247fbdSSimon Horman 9592553d064SJulian Anastasov /* Trash for destinations */ 9602553d064SJulian Anastasov struct list_head dest_trash; 961578bc3efSJulian Anastasov spinlock_t dest_trash_lock; 962578bc3efSJulian Anastasov struct timer_list dest_trash_timer; /* expiration timer */ 9632553d064SJulian Anastasov /* Service counters */ 9642553d064SJulian Anastasov atomic_t ftpsvc_counter; 9652553d064SJulian Anastasov atomic_t nullsvc_counter; 96639b97223SMarco Angaroni atomic_t conn_out_counter; 9672553d064SJulian Anastasov 968f2247fbdSSimon Horman #ifdef CONFIG_SYSCTL 96935dfb013SAndrew Sy Kim /* delayed work for expiring no dest connections */ 97035dfb013SAndrew Sy Kim struct delayed_work expire_nodest_conn_work; 971f2247fbdSSimon Horman /* 1/rate drop and drop-entry variables */ 972f2247fbdSSimon Horman struct delayed_work defense_work; /* Work handler */ 973f2247fbdSSimon Horman int drop_rate; 974f2247fbdSSimon Horman int drop_counter; 975c24b75e0SEric Dumazet int old_secure_tcp; 976f2247fbdSSimon Horman atomic_t dropentry; 977f2247fbdSSimon Horman /* locks in ctl.c */ 978f2247fbdSSimon Horman spinlock_t dropentry_lock; /* drop entry handling */ 979f2247fbdSSimon Horman spinlock_t droppacket_lock; /* drop packet handling */ 980f2247fbdSSimon Horman spinlock_t securetcp_lock; /* state and timeout tables */ 981f2247fbdSSimon Horman 9822553d064SJulian Anastasov /* sys-ctl struct */ 9832553d064SJulian Anastasov struct ctl_table_header *sysctl_hdr; 9842553d064SJulian Anastasov struct ctl_table *sysctl_tbl; 985f2247fbdSSimon Horman #endif 986f2247fbdSSimon Horman 9872553d064SJulian Anastasov /* sysctl variables */ 
9882553d064SJulian Anastasov int sysctl_amemthresh; 9892553d064SJulian Anastasov int sysctl_am_droprate; 9902553d064SJulian Anastasov int sysctl_drop_entry; 9912553d064SJulian Anastasov int sysctl_drop_packet; 9922553d064SJulian Anastasov int sysctl_secure_tcp; 9932553d064SJulian Anastasov #ifdef CONFIG_IP_VS_NFCT 9942553d064SJulian Anastasov int sysctl_conntrack; 9952553d064SJulian Anastasov #endif 9962553d064SJulian Anastasov int sysctl_snat_reroute; 9972553d064SJulian Anastasov int sysctl_sync_ver; 998f73181c8SPablo Neira Ayuso int sysctl_sync_ports; 9994d0c875dSJulian Anastasov int sysctl_sync_persist_mode; 100007995674SZhang Yanfei unsigned long sysctl_sync_qlen_max; 10011c003b15SPablo Neira Ayuso int sysctl_sync_sock_size; 10022553d064SJulian Anastasov int sysctl_cache_bypass; 10032553d064SJulian Anastasov int sysctl_expire_nodest_conn; 1004c6c96c18SAlexander Frolkin int sysctl_sloppy_tcp; 1005c6c96c18SAlexander Frolkin int sysctl_sloppy_sctp; 10062553d064SJulian Anastasov int sysctl_expire_quiescent_template; 10072553d064SJulian Anastasov int sysctl_sync_threshold[2]; 1008749c42b6SJulian Anastasov unsigned int sysctl_sync_refresh_period; 1009749c42b6SJulian Anastasov int sysctl_sync_retries; 10102553d064SJulian Anastasov int sysctl_nat_icmp_send; 10113654e611SJulian Anastasov int sysctl_pmtu_disc; 10120c12582fSJulian Anastasov int sysctl_backup_only; 1013d752c364SMarcelo Ricardo Leitner int sysctl_conn_reuse_mode; 101494485fedSAlex Gartrell int sysctl_schedule_icmp; 10154e478098SAlex Gartrell int sysctl_ignore_tunneled; 10162232642eSDust Li int sysctl_run_estimation; 1017f0be83d5SJulian Anastasov #ifdef CONFIG_SYSCTL 1018f0be83d5SJulian Anastasov cpumask_var_t sysctl_est_cpulist; /* kthread cpumask */ 1019f0be83d5SJulian Anastasov int est_cpulist_valid; /* cpulist set */ 1020f0be83d5SJulian Anastasov int sysctl_est_nice; /* kthread nice */ 1021f0be83d5SJulian Anastasov int est_stopped; /* stop tasks */ 1022f0be83d5SJulian Anastasov #endif 10232553d064SJulian 
Anastasov 10242553d064SJulian Anastasov /* ip_vs_lblc */ 10252553d064SJulian Anastasov int sysctl_lblc_expiration; 10262553d064SJulian Anastasov struct ctl_table_header *lblc_ctl_header; 10272553d064SJulian Anastasov struct ctl_table *lblc_ctl_table; 10282553d064SJulian Anastasov /* ip_vs_lblcr */ 10292553d064SJulian Anastasov int sysctl_lblcr_expiration; 10302553d064SJulian Anastasov struct ctl_table_header *lblcr_ctl_header; 10312553d064SJulian Anastasov struct ctl_table *lblcr_ctl_table; 10322553d064SJulian Anastasov /* ip_vs_est */ 1033705dd344SJulian Anastasov struct delayed_work est_reload_work;/* Reload kthread tasks */ 1034705dd344SJulian Anastasov struct mutex est_mutex; /* protect kthread tasks */ 1035705dd344SJulian Anastasov struct hlist_head est_temp_list; /* Ests during calc phase */ 1036705dd344SJulian Anastasov struct ip_vs_est_kt_data **est_kt_arr; /* Array of kthread data ptrs */ 1037705dd344SJulian Anastasov unsigned long est_max_threads;/* Hard limit of kthreads */ 1038705dd344SJulian Anastasov int est_calc_phase; /* Calculation phase */ 1039705dd344SJulian Anastasov int est_chain_max; /* Calculated chain_max */ 1040705dd344SJulian Anastasov int est_kt_count; /* Allocated ptrs */ 1041705dd344SJulian Anastasov int est_add_ktid; /* ktid where to add ests */ 1042705dd344SJulian Anastasov atomic_t est_genid; /* kthreads reload genid */ 1043705dd344SJulian Anastasov atomic_t est_genid_done; /* applied genid */ 10442553d064SJulian Anastasov /* ip_vs_sync */ 10452553d064SJulian Anastasov spinlock_t sync_lock; 1046f73181c8SPablo Neira Ayuso struct ipvs_master_sync_state *ms; 10472553d064SJulian Anastasov spinlock_t sync_buff_lock; 10485db7c8b9SJulian Anastasov struct ip_vs_sync_thread_data *master_tinfo; 10495db7c8b9SJulian Anastasov struct ip_vs_sync_thread_data *backup_tinfo; 1050f73181c8SPablo Neira Ayuso int threads_mask; 10512553d064SJulian Anastasov volatile int sync_state; 1052ae1d48b2SHans Schillstrom struct mutex sync_mutex; 1053e4ff6751SJulian 
Anastasov struct ipvs_sync_daemon_cfg mcfg; /* Master Configuration */ 1054e4ff6751SJulian Anastasov struct ipvs_sync_daemon_cfg bcfg; /* Backup Configuration */ 10552553d064SJulian Anastasov /* net name space ptr */ 10562553d064SJulian Anastasov struct net *net; /* Needed by timer routines */ 105707dcc686SSimon Horman /* Number of heterogeneous destinations, needed becaus heterogeneous 105807dcc686SSimon Horman * are not supported when synchronization is enabled. 105907dcc686SSimon Horman */ 1060391f503dSAlex Gartrell unsigned int mixed_address_family_dests; 1061857ca897SJulian Anastasov unsigned int hooks_afmask; /* &1=AF_INET, &2=AF_INET6 */ 10622553d064SJulian Anastasov }; 10631da177e4SLinus Torvalds 106459e0350eSSimon Horman #define DEFAULT_SYNC_THRESHOLD 3 106559e0350eSSimon Horman #define DEFAULT_SYNC_PERIOD 50 10667532e8d4SSimon Horman #define DEFAULT_SYNC_VER 1 1067c6c96c18SAlexander Frolkin #define DEFAULT_SLOPPY_TCP 0 1068c6c96c18SAlexander Frolkin #define DEFAULT_SLOPPY_SCTP 0 1069749c42b6SJulian Anastasov #define DEFAULT_SYNC_REFRESH_PERIOD (0U * HZ) 1070749c42b6SJulian Anastasov #define DEFAULT_SYNC_RETRIES 0 10711c003b15SPablo Neira Ayuso #define IPVS_SYNC_WAKEUP_RATE 8 10721c003b15SPablo Neira Ayuso #define IPVS_SYNC_QLEN_MAX (IPVS_SYNC_WAKEUP_RATE * 4) 10731c003b15SPablo Neira Ayuso #define IPVS_SYNC_SEND_DELAY (HZ / 50) 10741c003b15SPablo Neira Ayuso #define IPVS_SYNC_CHECK_PERIOD HZ 1075749c42b6SJulian Anastasov #define IPVS_SYNC_FLUSH_TIME (HZ * 2) 1076f73181c8SPablo Neira Ayuso #define IPVS_SYNC_PORTS_MAX (1 << 6) 107759e0350eSSimon Horman 107859e0350eSSimon Horman #ifdef CONFIG_SYSCTL 107959e0350eSSimon Horman 108059e0350eSSimon Horman static inline int sysctl_sync_threshold(struct netns_ipvs *ipvs) 108159e0350eSSimon Horman { 108259e0350eSSimon Horman return ipvs->sysctl_sync_threshold[0]; 108359e0350eSSimon Horman } 108459e0350eSSimon Horman 108559e0350eSSimon Horman static inline int sysctl_sync_period(struct netns_ipvs *ipvs) 
108659e0350eSSimon Horman { 10876aa7de05SMark Rutland return READ_ONCE(ipvs->sysctl_sync_threshold[1]); 1088749c42b6SJulian Anastasov } 1089749c42b6SJulian Anastasov 1090749c42b6SJulian Anastasov static inline unsigned int sysctl_sync_refresh_period(struct netns_ipvs *ipvs) 1091749c42b6SJulian Anastasov { 10926aa7de05SMark Rutland return READ_ONCE(ipvs->sysctl_sync_refresh_period); 1093749c42b6SJulian Anastasov } 1094749c42b6SJulian Anastasov 1095749c42b6SJulian Anastasov static inline int sysctl_sync_retries(struct netns_ipvs *ipvs) 1096749c42b6SJulian Anastasov { 1097749c42b6SJulian Anastasov return ipvs->sysctl_sync_retries; 109859e0350eSSimon Horman } 109959e0350eSSimon Horman 11007532e8d4SSimon Horman static inline int sysctl_sync_ver(struct netns_ipvs *ipvs) 11017532e8d4SSimon Horman { 11027532e8d4SSimon Horman return ipvs->sysctl_sync_ver; 11037532e8d4SSimon Horman } 11047532e8d4SSimon Horman 1105c6c96c18SAlexander Frolkin static inline int sysctl_sloppy_tcp(struct netns_ipvs *ipvs) 1106c6c96c18SAlexander Frolkin { 1107c6c96c18SAlexander Frolkin return ipvs->sysctl_sloppy_tcp; 1108c6c96c18SAlexander Frolkin } 1109c6c96c18SAlexander Frolkin 1110c6c96c18SAlexander Frolkin static inline int sysctl_sloppy_sctp(struct netns_ipvs *ipvs) 1111c6c96c18SAlexander Frolkin { 1112c6c96c18SAlexander Frolkin return ipvs->sysctl_sloppy_sctp; 1113c6c96c18SAlexander Frolkin } 1114c6c96c18SAlexander Frolkin 1115f73181c8SPablo Neira Ayuso static inline int sysctl_sync_ports(struct netns_ipvs *ipvs) 1116f73181c8SPablo Neira Ayuso { 11176aa7de05SMark Rutland return READ_ONCE(ipvs->sysctl_sync_ports); 1118f73181c8SPablo Neira Ayuso } 1119f73181c8SPablo Neira Ayuso 11204d0c875dSJulian Anastasov static inline int sysctl_sync_persist_mode(struct netns_ipvs *ipvs) 11214d0c875dSJulian Anastasov { 11224d0c875dSJulian Anastasov return ipvs->sysctl_sync_persist_mode; 11234d0c875dSJulian Anastasov } 11244d0c875dSJulian Anastasov 112507995674SZhang Yanfei static inline unsigned long 
sysctl_sync_qlen_max(struct netns_ipvs *ipvs) 11261c003b15SPablo Neira Ayuso { 11271c003b15SPablo Neira Ayuso return ipvs->sysctl_sync_qlen_max; 11281c003b15SPablo Neira Ayuso } 11291c003b15SPablo Neira Ayuso 11301c003b15SPablo Neira Ayuso static inline int sysctl_sync_sock_size(struct netns_ipvs *ipvs) 11311c003b15SPablo Neira Ayuso { 11321c003b15SPablo Neira Ayuso return ipvs->sysctl_sync_sock_size; 11331c003b15SPablo Neira Ayuso } 11341c003b15SPablo Neira Ayuso 11353654e611SJulian Anastasov static inline int sysctl_pmtu_disc(struct netns_ipvs *ipvs) 11363654e611SJulian Anastasov { 11373654e611SJulian Anastasov return ipvs->sysctl_pmtu_disc; 11383654e611SJulian Anastasov } 11393654e611SJulian Anastasov 11400c12582fSJulian Anastasov static inline int sysctl_backup_only(struct netns_ipvs *ipvs) 11410c12582fSJulian Anastasov { 11420c12582fSJulian Anastasov return ipvs->sync_state & IP_VS_STATE_BACKUP && 11430c12582fSJulian Anastasov ipvs->sysctl_backup_only; 11440c12582fSJulian Anastasov } 11450c12582fSJulian Anastasov 1146d752c364SMarcelo Ricardo Leitner static inline int sysctl_conn_reuse_mode(struct netns_ipvs *ipvs) 1147d752c364SMarcelo Ricardo Leitner { 1148d752c364SMarcelo Ricardo Leitner return ipvs->sysctl_conn_reuse_mode; 1149d752c364SMarcelo Ricardo Leitner } 1150d752c364SMarcelo Ricardo Leitner 115135dfb013SAndrew Sy Kim static inline int sysctl_expire_nodest_conn(struct netns_ipvs *ipvs) 115235dfb013SAndrew Sy Kim { 115335dfb013SAndrew Sy Kim return ipvs->sysctl_expire_nodest_conn; 115435dfb013SAndrew Sy Kim } 115535dfb013SAndrew Sy Kim 115694485fedSAlex Gartrell static inline int sysctl_schedule_icmp(struct netns_ipvs *ipvs) 115794485fedSAlex Gartrell { 115894485fedSAlex Gartrell return ipvs->sysctl_schedule_icmp; 115994485fedSAlex Gartrell } 116094485fedSAlex Gartrell 11614e478098SAlex Gartrell static inline int sysctl_ignore_tunneled(struct netns_ipvs *ipvs) 11624e478098SAlex Gartrell { 11634e478098SAlex Gartrell return ipvs->sysctl_ignore_tunneled; 
11644e478098SAlex Gartrell } 11654e478098SAlex Gartrell 116657032948SEric W. Biederman static inline int sysctl_cache_bypass(struct netns_ipvs *ipvs) 116757032948SEric W. Biederman { 116857032948SEric W. Biederman return ipvs->sysctl_cache_bypass; 116957032948SEric W. Biederman } 117057032948SEric W. Biederman 11712232642eSDust Li static inline int sysctl_run_estimation(struct netns_ipvs *ipvs) 11722232642eSDust Li { 11732232642eSDust Li return ipvs->sysctl_run_estimation; 11742232642eSDust Li } 11752232642eSDust Li 1176f0be83d5SJulian Anastasov static inline const struct cpumask *sysctl_est_cpulist(struct netns_ipvs *ipvs) 1177f0be83d5SJulian Anastasov { 1178f0be83d5SJulian Anastasov if (ipvs->est_cpulist_valid) 1179f0be83d5SJulian Anastasov return ipvs->sysctl_est_cpulist; 1180f0be83d5SJulian Anastasov else 1181f0be83d5SJulian Anastasov return housekeeping_cpumask(HK_TYPE_KTHREAD); 1182f0be83d5SJulian Anastasov } 1183f0be83d5SJulian Anastasov 1184f0be83d5SJulian Anastasov static inline int sysctl_est_nice(struct netns_ipvs *ipvs) 1185f0be83d5SJulian Anastasov { 1186f0be83d5SJulian Anastasov return ipvs->sysctl_est_nice; 1187f0be83d5SJulian Anastasov } 1188f0be83d5SJulian Anastasov 118959e0350eSSimon Horman #else 119059e0350eSSimon Horman 119159e0350eSSimon Horman static inline int sysctl_sync_threshold(struct netns_ipvs *ipvs) 119259e0350eSSimon Horman { 119359e0350eSSimon Horman return DEFAULT_SYNC_THRESHOLD; 119459e0350eSSimon Horman } 119559e0350eSSimon Horman 119659e0350eSSimon Horman static inline int sysctl_sync_period(struct netns_ipvs *ipvs) 119759e0350eSSimon Horman { 119859e0350eSSimon Horman return DEFAULT_SYNC_PERIOD; 119959e0350eSSimon Horman } 120059e0350eSSimon Horman 1201749c42b6SJulian Anastasov static inline unsigned int sysctl_sync_refresh_period(struct netns_ipvs *ipvs) 1202749c42b6SJulian Anastasov { 1203749c42b6SJulian Anastasov return DEFAULT_SYNC_REFRESH_PERIOD; 1204749c42b6SJulian Anastasov } 1205749c42b6SJulian Anastasov 
1206749c42b6SJulian Anastasov static inline int sysctl_sync_retries(struct netns_ipvs *ipvs) 1207749c42b6SJulian Anastasov { 1208749c42b6SJulian Anastasov return DEFAULT_SYNC_RETRIES & 3; 1209749c42b6SJulian Anastasov } 1210749c42b6SJulian Anastasov 12117532e8d4SSimon Horman static inline int sysctl_sync_ver(struct netns_ipvs *ipvs) 12127532e8d4SSimon Horman { 12137532e8d4SSimon Horman return DEFAULT_SYNC_VER; 12147532e8d4SSimon Horman } 12157532e8d4SSimon Horman 1216c6c96c18SAlexander Frolkin static inline int sysctl_sloppy_tcp(struct netns_ipvs *ipvs) 1217c6c96c18SAlexander Frolkin { 1218c6c96c18SAlexander Frolkin return DEFAULT_SLOPPY_TCP; 1219c6c96c18SAlexander Frolkin } 1220c6c96c18SAlexander Frolkin 1221c6c96c18SAlexander Frolkin static inline int sysctl_sloppy_sctp(struct netns_ipvs *ipvs) 1222c6c96c18SAlexander Frolkin { 1223c6c96c18SAlexander Frolkin return DEFAULT_SLOPPY_SCTP; 1224c6c96c18SAlexander Frolkin } 1225c6c96c18SAlexander Frolkin 1226f73181c8SPablo Neira Ayuso static inline int sysctl_sync_ports(struct netns_ipvs *ipvs) 1227f73181c8SPablo Neira Ayuso { 1228f73181c8SPablo Neira Ayuso return 1; 1229f73181c8SPablo Neira Ayuso } 1230f73181c8SPablo Neira Ayuso 12314d0c875dSJulian Anastasov static inline int sysctl_sync_persist_mode(struct netns_ipvs *ipvs) 12324d0c875dSJulian Anastasov { 12334d0c875dSJulian Anastasov return 0; 12344d0c875dSJulian Anastasov } 12354d0c875dSJulian Anastasov 123607995674SZhang Yanfei static inline unsigned long sysctl_sync_qlen_max(struct netns_ipvs *ipvs) 12371c003b15SPablo Neira Ayuso { 12381c003b15SPablo Neira Ayuso return IPVS_SYNC_QLEN_MAX; 12391c003b15SPablo Neira Ayuso } 12401c003b15SPablo Neira Ayuso 12411c003b15SPablo Neira Ayuso static inline int sysctl_sync_sock_size(struct netns_ipvs *ipvs) 12421c003b15SPablo Neira Ayuso { 12431c003b15SPablo Neira Ayuso return 0; 12441c003b15SPablo Neira Ayuso } 12451c003b15SPablo Neira Ayuso 12463654e611SJulian Anastasov static inline int sysctl_pmtu_disc(struct netns_ipvs 
*ipvs) 12473654e611SJulian Anastasov { 12483654e611SJulian Anastasov return 1; 12493654e611SJulian Anastasov } 12503654e611SJulian Anastasov 12510c12582fSJulian Anastasov static inline int sysctl_backup_only(struct netns_ipvs *ipvs) 12520c12582fSJulian Anastasov { 12530c12582fSJulian Anastasov return 0; 12540c12582fSJulian Anastasov } 12550c12582fSJulian Anastasov 1256d752c364SMarcelo Ricardo Leitner static inline int sysctl_conn_reuse_mode(struct netns_ipvs *ipvs) 1257d752c364SMarcelo Ricardo Leitner { 1258d752c364SMarcelo Ricardo Leitner return 1; 1259d752c364SMarcelo Ricardo Leitner } 1260d752c364SMarcelo Ricardo Leitner 126135dfb013SAndrew Sy Kim static inline int sysctl_expire_nodest_conn(struct netns_ipvs *ipvs) 126235dfb013SAndrew Sy Kim { 126335dfb013SAndrew Sy Kim return 0; 126435dfb013SAndrew Sy Kim } 126535dfb013SAndrew Sy Kim 126694485fedSAlex Gartrell static inline int sysctl_schedule_icmp(struct netns_ipvs *ipvs) 126794485fedSAlex Gartrell { 126894485fedSAlex Gartrell return 0; 126994485fedSAlex Gartrell } 127094485fedSAlex Gartrell 12714e478098SAlex Gartrell static inline int sysctl_ignore_tunneled(struct netns_ipvs *ipvs) 12724e478098SAlex Gartrell { 12734e478098SAlex Gartrell return 0; 12744e478098SAlex Gartrell } 12754e478098SAlex Gartrell 127657032948SEric W. Biederman static inline int sysctl_cache_bypass(struct netns_ipvs *ipvs) 127757032948SEric W. Biederman { 127857032948SEric W. Biederman return 0; 127957032948SEric W. Biederman } 128057032948SEric W. 
Biederman 12812232642eSDust Li static inline int sysctl_run_estimation(struct netns_ipvs *ipvs) 12822232642eSDust Li { 12832232642eSDust Li return 1; 12842232642eSDust Li } 12852232642eSDust Li 1286f0be83d5SJulian Anastasov static inline const struct cpumask *sysctl_est_cpulist(struct netns_ipvs *ipvs) 1287f0be83d5SJulian Anastasov { 1288f0be83d5SJulian Anastasov return housekeeping_cpumask(HK_TYPE_KTHREAD); 1289f0be83d5SJulian Anastasov } 1290f0be83d5SJulian Anastasov 1291f0be83d5SJulian Anastasov static inline int sysctl_est_nice(struct netns_ipvs *ipvs) 1292f0be83d5SJulian Anastasov { 1293f0be83d5SJulian Anastasov return IPVS_EST_NICE; 1294f0be83d5SJulian Anastasov } 1295f0be83d5SJulian Anastasov 129659e0350eSSimon Horman #endif 129759e0350eSSimon Horman 129807dcc686SSimon Horman /* IPVS core functions 12991da177e4SLinus Torvalds * (from ip_vs_core.c) 13001da177e4SLinus Torvalds */ 13015c3a0fd7SJoe Perches const char *ip_vs_proto_name(unsigned int proto); 13025c3a0fd7SJoe Perches void ip_vs_init_hash_table(struct list_head *table, int rows); 130339b97223SMarco Angaroni struct ip_vs_conn *ip_vs_new_conn_out(struct ip_vs_service *svc, 130439b97223SMarco Angaroni struct ip_vs_dest *dest, 130539b97223SMarco Angaroni struct sk_buff *skb, 130639b97223SMarco Angaroni const struct ip_vs_iphdr *iph, 130739b97223SMarco Angaroni __be16 dport, 130839b97223SMarco Angaroni __be16 cport); 1309afdd6140SSven Wegener #define IP_VS_INIT_HASH_TABLE(t) ip_vs_init_hash_table((t), ARRAY_SIZE((t))) 13101da177e4SLinus Torvalds 13111da177e4SLinus Torvalds #define IP_VS_APP_TYPE_FTP 1 13121da177e4SLinus Torvalds 131307dcc686SSimon Horman /* ip_vs_conn handling functions 13141da177e4SLinus Torvalds * (from ip_vs_conn.c) 13151da177e4SLinus Torvalds */ 13161da177e4SLinus Torvalds enum { 13171da177e4SLinus Torvalds IP_VS_DIR_INPUT = 0, 13181da177e4SLinus Torvalds IP_VS_DIR_OUTPUT, 13191da177e4SLinus Torvalds IP_VS_DIR_INPUT_ONLY, 13201da177e4SLinus Torvalds IP_VS_DIR_LAST, 13211da177e4SLinus 
Torvalds }; 13221da177e4SLinus Torvalds 132319913decSEric W. Biederman static inline void ip_vs_conn_fill_param(struct netns_ipvs *ipvs, int af, int protocol, 1324f11017ecSSimon Horman const union nf_inet_addr *caddr, 1325f11017ecSSimon Horman __be16 cport, 1326f11017ecSSimon Horman const union nf_inet_addr *vaddr, 1327f11017ecSSimon Horman __be16 vport, 1328f11017ecSSimon Horman struct ip_vs_conn_param *p) 1329f11017ecSSimon Horman { 133019913decSEric W. Biederman p->ipvs = ipvs; 1331f11017ecSSimon Horman p->af = af; 1332f11017ecSSimon Horman p->protocol = protocol; 1333f11017ecSSimon Horman p->caddr = caddr; 1334f11017ecSSimon Horman p->cport = cport; 1335f11017ecSSimon Horman p->vaddr = vaddr; 1336f11017ecSSimon Horman p->vport = vport; 133785999283SSimon Horman p->pe = NULL; 133885999283SSimon Horman p->pe_data = NULL; 1339f11017ecSSimon Horman } 134028364a59SJulius Volz 1341f11017ecSSimon Horman struct ip_vs_conn *ip_vs_conn_in_get(const struct ip_vs_conn_param *p); 1342f11017ecSSimon Horman struct ip_vs_conn *ip_vs_ct_in_get(const struct ip_vs_conn_param *p); 134328364a59SJulius Volz 1344ab161976SEric W. Biederman struct ip_vs_conn * ip_vs_conn_in_get_proto(struct netns_ipvs *ipvs, int af, 1345ab161976SEric W. Biederman const struct sk_buff *skb, 1346802c41adSAlex Gartrell const struct ip_vs_iphdr *iph); 13475c0d2374SSimon Horman 1348f11017ecSSimon Horman struct ip_vs_conn *ip_vs_conn_out_get(const struct ip_vs_conn_param *p); 13491da177e4SLinus Torvalds 13500cf705c8SEric W. Biederman struct ip_vs_conn * ip_vs_conn_out_get_proto(struct netns_ipvs *ipvs, int af, 13510cf705c8SEric W. Biederman const struct sk_buff *skb, 1352802c41adSAlex Gartrell const struct ip_vs_iphdr *iph); 13535c0d2374SSimon Horman 1354088339a5SJulian Anastasov /* Get reference to gain full access to conn. 
1355088339a5SJulian Anastasov * By default, RCU read-side critical sections have access only to 1356088339a5SJulian Anastasov * conn fields and its PE data, see ip_vs_conn_rcu_free() for reference. 1357088339a5SJulian Anastasov */ 1358088339a5SJulian Anastasov static inline bool __ip_vs_conn_get(struct ip_vs_conn *cp) 1359088339a5SJulian Anastasov { 1360b54ab92bSReshetova, Elena return refcount_inc_not_zero(&cp->refcnt); 1361088339a5SJulian Anastasov } 1362088339a5SJulian Anastasov 13631da177e4SLinus Torvalds /* put back the conn without restarting its timer */ 13641da177e4SLinus Torvalds static inline void __ip_vs_conn_put(struct ip_vs_conn *cp) 13651da177e4SLinus Torvalds { 13664e857c58SPeter Zijlstra smp_mb__before_atomic(); 1367b54ab92bSReshetova, Elena refcount_dec(&cp->refcnt); 13681da177e4SLinus Torvalds } 13695c3a0fd7SJoe Perches void ip_vs_conn_put(struct ip_vs_conn *cp); 13705c3a0fd7SJoe Perches void ip_vs_conn_fill_cport(struct ip_vs_conn *cp, __be16 cport); 13711da177e4SLinus Torvalds 1372ba38528aSAlex Gartrell struct ip_vs_conn *ip_vs_conn_new(const struct ip_vs_conn_param *p, int dest_af, 1373f11017ecSSimon Horman const union nf_inet_addr *daddr, 137495c96174SEric Dumazet __be16 dport, unsigned int flags, 13750e051e68SHans Schillstrom struct ip_vs_dest *dest, __u32 fwmark); 13765c3a0fd7SJoe Perches void ip_vs_conn_expire_now(struct ip_vs_conn *cp); 13771da177e4SLinus Torvalds 1378ec1b28caSJulian Anastasov const char *ip_vs_state_name(const struct ip_vs_conn *cp); 13791da177e4SLinus Torvalds 138069f39093SEric W. Biederman void ip_vs_tcp_conn_listen(struct ip_vs_conn *cp); 13813ec10d3aSMarco Angaroni int ip_vs_check_template(struct ip_vs_conn *ct, struct ip_vs_dest *cdest); 1382423b5595SEric W. 
Biederman void ip_vs_random_dropentry(struct netns_ipvs *ipvs); 13835c3a0fd7SJoe Perches int ip_vs_conn_init(void); 13845c3a0fd7SJoe Perches void ip_vs_conn_cleanup(void); 13851da177e4SLinus Torvalds 13861da177e4SLinus Torvalds static inline void ip_vs_control_del(struct ip_vs_conn *cp) 13871da177e4SLinus Torvalds { 13881da177e4SLinus Torvalds struct ip_vs_conn *ctl_cp = cp->control; 13891da177e4SLinus Torvalds if (!ctl_cp) { 1390cfc78c5aSJulius Volz IP_VS_ERR_BUF("request control DEL for uncontrolled: " 1391cfc78c5aSJulius Volz "%s:%d to %s:%d\n", 1392cfc78c5aSJulius Volz IP_VS_DBG_ADDR(cp->af, &cp->caddr), 1393cfc78c5aSJulius Volz ntohs(cp->cport), 1394cfc78c5aSJulius Volz IP_VS_DBG_ADDR(cp->af, &cp->vaddr), 1395cfc78c5aSJulius Volz ntohs(cp->vport)); 1396cfc78c5aSJulius Volz 13971da177e4SLinus Torvalds return; 13981da177e4SLinus Torvalds } 13991da177e4SLinus Torvalds 1400cfc78c5aSJulius Volz IP_VS_DBG_BUF(7, "DELeting control for: " 1401cfc78c5aSJulius Volz "cp.dst=%s:%d ctl_cp.dst=%s:%d\n", 1402cfc78c5aSJulius Volz IP_VS_DBG_ADDR(cp->af, &cp->caddr), 1403cfc78c5aSJulius Volz ntohs(cp->cport), 1404cfc78c5aSJulius Volz IP_VS_DBG_ADDR(cp->af, &ctl_cp->caddr), 1405cfc78c5aSJulius Volz ntohs(ctl_cp->cport)); 14061da177e4SLinus Torvalds 14071da177e4SLinus Torvalds cp->control = NULL; 14081da177e4SLinus Torvalds if (atomic_read(&ctl_cp->n_control) == 0) { 1409cfc78c5aSJulius Volz IP_VS_ERR_BUF("BUG control DEL with n=0 : " 1410cfc78c5aSJulius Volz "%s:%d to %s:%d\n", 1411cfc78c5aSJulius Volz IP_VS_DBG_ADDR(cp->af, &cp->caddr), 1412cfc78c5aSJulius Volz ntohs(cp->cport), 1413cfc78c5aSJulius Volz IP_VS_DBG_ADDR(cp->af, &cp->vaddr), 1414cfc78c5aSJulius Volz ntohs(cp->vport)); 1415cfc78c5aSJulius Volz 14161da177e4SLinus Torvalds return; 14171da177e4SLinus Torvalds } 14181da177e4SLinus Torvalds atomic_dec(&ctl_cp->n_control); 14191da177e4SLinus Torvalds } 14201da177e4SLinus Torvalds 14211da177e4SLinus Torvalds static inline void 14221da177e4SLinus Torvalds 
ip_vs_control_add(struct ip_vs_conn *cp, struct ip_vs_conn *ctl_cp) 14231da177e4SLinus Torvalds { 14241da177e4SLinus Torvalds if (cp->control) { 1425cfc78c5aSJulius Volz IP_VS_ERR_BUF("request control ADD for already controlled: " 1426cfc78c5aSJulius Volz "%s:%d to %s:%d\n", 1427cfc78c5aSJulius Volz IP_VS_DBG_ADDR(cp->af, &cp->caddr), 1428cfc78c5aSJulius Volz ntohs(cp->cport), 1429cfc78c5aSJulius Volz IP_VS_DBG_ADDR(cp->af, &cp->vaddr), 1430cfc78c5aSJulius Volz ntohs(cp->vport)); 1431cfc78c5aSJulius Volz 14321da177e4SLinus Torvalds ip_vs_control_del(cp); 14331da177e4SLinus Torvalds } 14341da177e4SLinus Torvalds 1435cfc78c5aSJulius Volz IP_VS_DBG_BUF(7, "ADDing control for: " 1436cfc78c5aSJulius Volz "cp.dst=%s:%d ctl_cp.dst=%s:%d\n", 1437cfc78c5aSJulius Volz IP_VS_DBG_ADDR(cp->af, &cp->caddr), 1438cfc78c5aSJulius Volz ntohs(cp->cport), 1439cfc78c5aSJulius Volz IP_VS_DBG_ADDR(cp->af, &ctl_cp->caddr), 1440cfc78c5aSJulius Volz ntohs(ctl_cp->cport)); 14411da177e4SLinus Torvalds 14421da177e4SLinus Torvalds cp->control = ctl_cp; 14431da177e4SLinus Torvalds atomic_inc(&ctl_cp->n_control); 14441da177e4SLinus Torvalds } 14451da177e4SLinus Torvalds 144627541143SJulian Anastasov /* Mark our template as assured */ 144727541143SJulian Anastasov static inline void 144827541143SJulian Anastasov ip_vs_control_assure_ct(struct ip_vs_conn *cp) 144927541143SJulian Anastasov { 145027541143SJulian Anastasov struct ip_vs_conn *ct = cp->control; 145127541143SJulian Anastasov 145227541143SJulian Anastasov if (ct && !(ct->state & IP_VS_CTPL_S_ASSURED) && 145327541143SJulian Anastasov (ct->flags & IP_VS_CONN_F_TEMPLATE)) 145427541143SJulian Anastasov ct->state |= IP_VS_CTPL_S_ASSURED; 145527541143SJulian Anastasov } 145627541143SJulian Anastasov 145707dcc686SSimon Horman /* IPVS netns init & cleanup functions */ 1458a4dd0360SEric W. Biederman int ip_vs_estimator_net_init(struct netns_ipvs *ipvs); 14593d993766SEric W. 
/* Per-netns init and cleanup entry points of the IPVS subsystems */
int ip_vs_control_net_init(struct netns_ipvs *ipvs);
int ip_vs_protocol_net_init(struct netns_ipvs *ipvs);
int ip_vs_app_net_init(struct netns_ipvs *ipvs);
int ip_vs_conn_net_init(struct netns_ipvs *ipvs);
int ip_vs_sync_net_init(struct netns_ipvs *ipvs);
void ip_vs_conn_net_cleanup(struct netns_ipvs *ipvs);
void ip_vs_app_net_cleanup(struct netns_ipvs *ipvs);
void ip_vs_protocol_net_cleanup(struct netns_ipvs *ipvs);
void ip_vs_control_net_cleanup(struct netns_ipvs *ipvs);
void ip_vs_estimator_net_cleanup(struct netns_ipvs *ipvs);
void ip_vs_sync_net_cleanup(struct netns_ipvs *ipvs);
void ip_vs_service_nets_cleanup(struct list_head *net_list);

/* IPVS application functions
 * (from ip_vs_app.c)
 */
#define IP_VS_APP_MAX_PORTS  8
struct ip_vs_app *register_ip_vs_app(struct netns_ipvs *ipvs, struct ip_vs_app *app);
void unregister_ip_vs_app(struct netns_ipvs *ipvs, struct ip_vs_app *app);
int ip_vs_bind_app(struct ip_vs_conn *cp, struct ip_vs_protocol *pp);
void ip_vs_unbind_app(struct ip_vs_conn *cp);
Biederman int register_ip_vs_app_inc(struct netns_ipvs *ipvs, struct ip_vs_app *app, __u16 proto, 14815c3a0fd7SJoe Perches __u16 port); 14825c3a0fd7SJoe Perches int ip_vs_app_inc_get(struct ip_vs_app *inc); 14835c3a0fd7SJoe Perches void ip_vs_app_inc_put(struct ip_vs_app *inc); 14841da177e4SLinus Torvalds 1485d12e1229SJulian Anastasov int ip_vs_app_pkt_out(struct ip_vs_conn *, struct sk_buff *skb, 1486d12e1229SJulian Anastasov struct ip_vs_iphdr *ipvsh); 1487d12e1229SJulian Anastasov int ip_vs_app_pkt_in(struct ip_vs_conn *, struct sk_buff *skb, 1488d12e1229SJulian Anastasov struct ip_vs_iphdr *ipvsh); 14891da177e4SLinus Torvalds 14908be67a66SSimon Horman int register_ip_vs_pe(struct ip_vs_pe *pe); 14918be67a66SSimon Horman int unregister_ip_vs_pe(struct ip_vs_pe *pe); 1492e9e5eee8SSimon Horman struct ip_vs_pe *ip_vs_pe_getbyname(const char *name); 1493fe5e7a1eSHans Schillstrom struct ip_vs_pe *__ip_vs_pe_getbyname(const char *pe_name); 1494e9e5eee8SSimon Horman 149507dcc686SSimon Horman /* Use a #define to avoid all of module.h just for these trivial ops */ 149669e7dae4SPaul Gortmaker #define ip_vs_pe_get(pe) \ 149769e7dae4SPaul Gortmaker if (pe && pe->module) \ 1498e9e5eee8SSimon Horman __module_get(pe->module); 1499e9e5eee8SSimon Horman 150069e7dae4SPaul Gortmaker #define ip_vs_pe_put(pe) \ 150169e7dae4SPaul Gortmaker if (pe && pe->module) \ 1502e9e5eee8SSimon Horman module_put(pe->module); 15031da177e4SLinus Torvalds 150407dcc686SSimon Horman /* IPVS protocol functions (from ip_vs_proto.c) */ 15055c3a0fd7SJoe Perches int ip_vs_protocol_init(void); 15065c3a0fd7SJoe Perches void ip_vs_protocol_cleanup(void); 15075c3a0fd7SJoe Perches void ip_vs_protocol_timeout_change(struct netns_ipvs *ipvs, int flags); 15085c3a0fd7SJoe Perches int *ip_vs_create_timeout_table(int *table, int size); 15095c3a0fd7SJoe Perches void ip_vs_tcpudp_debug_packet(int af, struct ip_vs_protocol *pp, 15105c3a0fd7SJoe Perches const struct sk_buff *skb, int offset, 15115c3a0fd7SJoe Perches 
const char *msg); 15121da177e4SLinus Torvalds 15131da177e4SLinus Torvalds extern struct ip_vs_protocol ip_vs_protocol_tcp; 15141da177e4SLinus Torvalds extern struct ip_vs_protocol ip_vs_protocol_udp; 15151da177e4SLinus Torvalds extern struct ip_vs_protocol ip_vs_protocol_icmp; 15161da177e4SLinus Torvalds extern struct ip_vs_protocol ip_vs_protocol_esp; 15171da177e4SLinus Torvalds extern struct ip_vs_protocol ip_vs_protocol_ah; 15182906f66aSVenkata Mohan Reddy extern struct ip_vs_protocol ip_vs_protocol_sctp; 15191da177e4SLinus Torvalds 152007dcc686SSimon Horman /* Registering/unregistering scheduler functions 15211da177e4SLinus Torvalds * (from ip_vs_sched.c) 15221da177e4SLinus Torvalds */ 15235c3a0fd7SJoe Perches int register_ip_vs_scheduler(struct ip_vs_scheduler *scheduler); 15245c3a0fd7SJoe Perches int unregister_ip_vs_scheduler(struct ip_vs_scheduler *scheduler); 15255c3a0fd7SJoe Perches int ip_vs_bind_scheduler(struct ip_vs_service *svc, 15261da177e4SLinus Torvalds struct ip_vs_scheduler *scheduler); 15275c3a0fd7SJoe Perches void ip_vs_unbind_scheduler(struct ip_vs_service *svc, 1528ceec4c38SJulian Anastasov struct ip_vs_scheduler *sched); 15295c3a0fd7SJoe Perches struct ip_vs_scheduler *ip_vs_scheduler_get(const char *sched_name); 15305c3a0fd7SJoe Perches void ip_vs_scheduler_put(struct ip_vs_scheduler *scheduler); 15315c3a0fd7SJoe Perches struct ip_vs_conn * 1532190ecd27SJulian Anastasov ip_vs_schedule(struct ip_vs_service *svc, struct sk_buff *skb, 1533d4383f04SJesper Dangaard Brouer struct ip_vs_proto_data *pd, int *ignored, 1534d4383f04SJesper Dangaard Brouer struct ip_vs_iphdr *iph); 15355c3a0fd7SJoe Perches int ip_vs_leave(struct ip_vs_service *svc, struct sk_buff *skb, 1536d4383f04SJesper Dangaard Brouer struct ip_vs_proto_data *pd, struct ip_vs_iphdr *iph); 15371da177e4SLinus Torvalds 15385c3a0fd7SJoe Perches void ip_vs_scheduler_err(struct ip_vs_service *svc, const char *msg); 153941ac51eeSPatrick Schaaf 154007dcc686SSimon Horman /* IPVS control 
data and functions (from ip_vs_ctl.c) */ 15411da177e4SLinus Torvalds extern struct ip_vs_stats ip_vs_stats; 1542b880c1f0SHans Schillstrom extern int sysctl_ip_vs_sync_ver; 15431da177e4SLinus Torvalds 15445c3a0fd7SJoe Perches struct ip_vs_service * 15450a4fd6ceSEric W. Biederman ip_vs_service_find(struct netns_ipvs *ipvs, int af, __u32 fwmark, __u16 protocol, 15463c2e0505SJulius Volz const union nf_inet_addr *vaddr, __be16 vport); 15471da177e4SLinus Torvalds 154848aed1b0SEric W. Biederman bool ip_vs_has_real_service(struct netns_ipvs *ipvs, int af, __u16 protocol, 15497937df15SJulius Volz const union nf_inet_addr *daddr, __be16 dport); 15507937df15SJulius Volz 155139b97223SMarco Angaroni struct ip_vs_dest * 155239b97223SMarco Angaroni ip_vs_find_real_service(struct netns_ipvs *ipvs, int af, __u16 protocol, 155339b97223SMarco Angaroni const union nf_inet_addr *daddr, __be16 dport); 15542aa3c9f4SJulian Anastasov struct ip_vs_dest *ip_vs_find_tunnel(struct netns_ipvs *ipvs, int af, 15552aa3c9f4SJulian Anastasov const union nf_inet_addr *daddr, 15562aa3c9f4SJulian Anastasov __be16 tun_port); 155739b97223SMarco Angaroni 15585c3a0fd7SJoe Perches int ip_vs_use_count_inc(void); 15595c3a0fd7SJoe Perches void ip_vs_use_count_dec(void); 15605c3a0fd7SJoe Perches int ip_vs_register_nl_ioctl(void); 15615c3a0fd7SJoe Perches void ip_vs_unregister_nl_ioctl(void); 15625c3a0fd7SJoe Perches int ip_vs_control_init(void); 15635c3a0fd7SJoe Perches void ip_vs_control_cleanup(void); 15645c3a0fd7SJoe Perches struct ip_vs_dest * 1565dc2add6fSEric W. 
Biederman ip_vs_find_dest(struct netns_ipvs *ipvs, int svc_af, int dest_af, 1566655eef10SAlex Gartrell const union nf_inet_addr *daddr, __be16 dport, 1567655eef10SAlex Gartrell const union nf_inet_addr *vaddr, __be16 vport, 156852793dbeSJulian Anastasov __u16 protocol, __u32 fwmark, __u32 flags); 15695c3a0fd7SJoe Perches void ip_vs_try_bind_dest(struct ip_vs_conn *cp); 15701da177e4SLinus Torvalds 1571fca9c20aSJulian Anastasov static inline void ip_vs_dest_hold(struct ip_vs_dest *dest) 1572fca9c20aSJulian Anastasov { 1573b54ab92bSReshetova, Elena refcount_inc(&dest->refcnt); 1574fca9c20aSJulian Anastasov } 1575fca9c20aSJulian Anastasov 1576fca9c20aSJulian Anastasov static inline void ip_vs_dest_put(struct ip_vs_dest *dest) 1577fca9c20aSJulian Anastasov { 15784e857c58SPeter Zijlstra smp_mb__before_atomic(); 1579b54ab92bSReshetova, Elena refcount_dec(&dest->refcnt); 1580fca9c20aSJulian Anastasov } 15811da177e4SLinus Torvalds 15829e4e948aSJulian Anastasov static inline void ip_vs_dest_put_and_free(struct ip_vs_dest *dest) 15839e4e948aSJulian Anastasov { 1584b54ab92bSReshetova, Elena if (refcount_dec_and_test(&dest->refcnt)) 15859e4e948aSJulian Anastasov kfree(dest); 15869e4e948aSJulian Anastasov } 15879e4e948aSJulian Anastasov 158807dcc686SSimon Horman /* IPVS sync daemon data and function prototypes 15891da177e4SLinus Torvalds * (from ip_vs_sync.c) 15901da177e4SLinus Torvalds */ 15916ac121d7SEric W. Biederman int start_sync_thread(struct netns_ipvs *ipvs, struct ipvs_sync_daemon_cfg *cfg, 1592e4ff6751SJulian Anastasov int state); 1593b3cf3cbfSEric W. Biederman int stop_sync_thread(struct netns_ipvs *ipvs, int state); 1594b61a8c1aSEric W. Biederman void ip_vs_sync_conn(struct netns_ipvs *ipvs, struct ip_vs_conn *cp, int pkts); 15951da177e4SLinus Torvalds 159607dcc686SSimon Horman /* IPVS rate estimator prototypes (from ip_vs_est.c) */ 1597705dd344SJulian Anastasov int ip_vs_start_estimator(struct netns_ipvs *ipvs, struct ip_vs_stats *stats); 15980f34d54bSEric W. 
Biederman void ip_vs_stop_estimator(struct netns_ipvs *ipvs, struct ip_vs_stats *stats); 15995c3a0fd7SJoe Perches void ip_vs_zero_estimator(struct ip_vs_stats *stats); 1600cd67cd5eSJulian Anastasov void ip_vs_read_estimator(struct ip_vs_kstats *dst, struct ip_vs_stats *stats); 1601705dd344SJulian Anastasov void ip_vs_est_reload_start(struct netns_ipvs *ipvs); 1602705dd344SJulian Anastasov int ip_vs_est_kthread_start(struct netns_ipvs *ipvs, 1603705dd344SJulian Anastasov struct ip_vs_est_kt_data *kd); 1604705dd344SJulian Anastasov void ip_vs_est_kthread_stop(struct ip_vs_est_kt_data *kd); 16051da177e4SLinus Torvalds 1606f0be83d5SJulian Anastasov static inline void ip_vs_est_stopped_recalc(struct netns_ipvs *ipvs) 1607f0be83d5SJulian Anastasov { 1608f0be83d5SJulian Anastasov #ifdef CONFIG_SYSCTL 1609144361c1SJulian Anastasov /* Stop tasks while cpulist is empty or if disabled with flag */ 1610144361c1SJulian Anastasov ipvs->est_stopped = !sysctl_run_estimation(ipvs) || 1611144361c1SJulian Anastasov (ipvs->est_cpulist_valid && 1612144361c1SJulian Anastasov cpumask_empty(sysctl_est_cpulist(ipvs))); 1613f0be83d5SJulian Anastasov #endif 1614f0be83d5SJulian Anastasov } 1615f0be83d5SJulian Anastasov 1616f0be83d5SJulian Anastasov static inline bool ip_vs_est_stopped(struct netns_ipvs *ipvs) 1617f0be83d5SJulian Anastasov { 1618f0be83d5SJulian Anastasov #ifdef CONFIG_SYSCTL 1619f0be83d5SJulian Anastasov return ipvs->est_stopped; 1620f0be83d5SJulian Anastasov #else 1621f0be83d5SJulian Anastasov return false; 1622f0be83d5SJulian Anastasov #endif 1623f0be83d5SJulian Anastasov } 1624f0be83d5SJulian Anastasov 1625f0be83d5SJulian Anastasov static inline int ip_vs_est_max_threads(struct netns_ipvs *ipvs) 1626f0be83d5SJulian Anastasov { 1627f0be83d5SJulian Anastasov unsigned int limit = IPVS_EST_CPU_KTHREADS * 1628f0be83d5SJulian Anastasov cpumask_weight(sysctl_est_cpulist(ipvs)); 1629f0be83d5SJulian Anastasov 1630f0be83d5SJulian Anastasov return max(1U, limit); 1631f0be83d5SJulian 
Anastasov } 1632f0be83d5SJulian Anastasov 163307dcc686SSimon Horman /* Various IPVS packet transmitters (from ip_vs_xmit.c) */ 16345c3a0fd7SJoe Perches int ip_vs_null_xmit(struct sk_buff *skb, struct ip_vs_conn *cp, 1635d4383f04SJesper Dangaard Brouer struct ip_vs_protocol *pp, struct ip_vs_iphdr *iph); 16365c3a0fd7SJoe Perches int ip_vs_bypass_xmit(struct sk_buff *skb, struct ip_vs_conn *cp, 1637d4383f04SJesper Dangaard Brouer struct ip_vs_protocol *pp, struct ip_vs_iphdr *iph); 16385c3a0fd7SJoe Perches int ip_vs_nat_xmit(struct sk_buff *skb, struct ip_vs_conn *cp, 1639d4383f04SJesper Dangaard Brouer struct ip_vs_protocol *pp, struct ip_vs_iphdr *iph); 16405c3a0fd7SJoe Perches int ip_vs_tunnel_xmit(struct sk_buff *skb, struct ip_vs_conn *cp, 16415c3a0fd7SJoe Perches struct ip_vs_protocol *pp, struct ip_vs_iphdr *iph); 16425c3a0fd7SJoe Perches int ip_vs_dr_xmit(struct sk_buff *skb, struct ip_vs_conn *cp, 16435c3a0fd7SJoe Perches struct ip_vs_protocol *pp, struct ip_vs_iphdr *iph); 16445c3a0fd7SJoe Perches int ip_vs_icmp_xmit(struct sk_buff *skb, struct ip_vs_conn *cp, 1645d4383f04SJesper Dangaard Brouer struct ip_vs_protocol *pp, int offset, 1646d4383f04SJesper Dangaard Brouer unsigned int hooknum, struct ip_vs_iphdr *iph); 16475c3a0fd7SJoe Perches void ip_vs_dest_dst_rcu_free(struct rcu_head *head); 16481da177e4SLinus Torvalds 1649b3cdd2a7SJulius Volz #ifdef CONFIG_IP_VS_IPV6 16505c3a0fd7SJoe Perches int ip_vs_bypass_xmit_v6(struct sk_buff *skb, struct ip_vs_conn *cp, 1651d4383f04SJesper Dangaard Brouer struct ip_vs_protocol *pp, struct ip_vs_iphdr *iph); 16525c3a0fd7SJoe Perches int ip_vs_nat_xmit_v6(struct sk_buff *skb, struct ip_vs_conn *cp, 16535c3a0fd7SJoe Perches struct ip_vs_protocol *pp, struct ip_vs_iphdr *iph); 16545c3a0fd7SJoe Perches int ip_vs_tunnel_xmit_v6(struct sk_buff *skb, struct ip_vs_conn *cp, 16555c3a0fd7SJoe Perches struct ip_vs_protocol *pp, struct ip_vs_iphdr *iph); 16565c3a0fd7SJoe Perches int ip_vs_dr_xmit_v6(struct sk_buff *skb, struct 
ip_vs_conn *cp, 16575c3a0fd7SJoe Perches struct ip_vs_protocol *pp, struct ip_vs_iphdr *iph); 16585c3a0fd7SJoe Perches int ip_vs_icmp_xmit_v6(struct sk_buff *skb, struct ip_vs_conn *cp, 1659d4383f04SJesper Dangaard Brouer struct ip_vs_protocol *pp, int offset, 1660d4383f04SJesper Dangaard Brouer unsigned int hooknum, struct ip_vs_iphdr *iph); 1661b3cdd2a7SJulius Volz #endif 16621da177e4SLinus Torvalds 16633a1bbf18SSimon Horman #ifdef CONFIG_SYSCTL 166407dcc686SSimon Horman /* This is a simple mechanism to ignore packets when 16651da177e4SLinus Torvalds * we are loaded. Just set ip_vs_drop_rate to 'n' and 16661da177e4SLinus Torvalds * we start to drop 1/rate of the packets 16671da177e4SLinus Torvalds */ 1668a0840e2eSHans Schillstrom static inline int ip_vs_todrop(struct netns_ipvs *ipvs) 16691da177e4SLinus Torvalds { 1670a0840e2eSHans Schillstrom if (!ipvs->drop_rate) 1671a0840e2eSHans Schillstrom return 0; 1672a0840e2eSHans Schillstrom if (--ipvs->drop_counter > 0) 1673a0840e2eSHans Schillstrom return 0; 1674a0840e2eSHans Schillstrom ipvs->drop_counter = ipvs->drop_rate; 16751da177e4SLinus Torvalds return 1; 16761da177e4SLinus Torvalds } 16773a1bbf18SSimon Horman #else 16783a1bbf18SSimon Horman static inline int ip_vs_todrop(struct netns_ipvs *ipvs) { return 0; } 16793a1bbf18SSimon Horman #endif 16801da177e4SLinus Torvalds 168135dfb013SAndrew Sy Kim #ifdef CONFIG_SYSCTL 168235dfb013SAndrew Sy Kim /* Enqueue delayed work for expiring no dest connections 168335dfb013SAndrew Sy Kim * Only run when sysctl_expire_nodest=1 168435dfb013SAndrew Sy Kim */ 168535dfb013SAndrew Sy Kim static inline void ip_vs_enqueue_expire_nodest_conns(struct netns_ipvs *ipvs) 168635dfb013SAndrew Sy Kim { 168735dfb013SAndrew Sy Kim if (sysctl_expire_nodest_conn(ipvs)) 168835dfb013SAndrew Sy Kim queue_delayed_work(system_long_wq, 168935dfb013SAndrew Sy Kim &ipvs->expire_nodest_conn_work, 1); 169035dfb013SAndrew Sy Kim } 169135dfb013SAndrew Sy Kim 169235dfb013SAndrew Sy Kim void 
ip_vs_expire_nodest_conn_flush(struct netns_ipvs *ipvs); 169335dfb013SAndrew Sy Kim #else 169435dfb013SAndrew Sy Kim static inline void ip_vs_enqueue_expire_nodest_conns(struct netns_ipvs *ipvs) {} 169535dfb013SAndrew Sy Kim #endif 169635dfb013SAndrew Sy Kim 16971da40ab6SJulian Anastasov #define IP_VS_DFWD_METHOD(dest) (atomic_read(&(dest)->conn_flags) & \ 16981da40ab6SJulian Anastasov IP_VS_CONN_F_FWD_MASK) 16991da40ab6SJulian Anastasov 170007dcc686SSimon Horman /* ip_vs_fwd_tag returns the forwarding tag of the connection */ 17011da177e4SLinus Torvalds #define IP_VS_FWD_METHOD(cp) (cp->flags & IP_VS_CONN_F_FWD_MASK) 17021da177e4SLinus Torvalds 1703732db659SAdrian Bunk static inline char ip_vs_fwd_tag(struct ip_vs_conn *cp) 17041da177e4SLinus Torvalds { 17051da177e4SLinus Torvalds char fwd; 17061da177e4SLinus Torvalds 17071da177e4SLinus Torvalds switch (IP_VS_FWD_METHOD(cp)) { 17081da177e4SLinus Torvalds case IP_VS_CONN_F_MASQ: 17091da177e4SLinus Torvalds fwd = 'M'; break; 17101da177e4SLinus Torvalds case IP_VS_CONN_F_LOCALNODE: 17111da177e4SLinus Torvalds fwd = 'L'; break; 17121da177e4SLinus Torvalds case IP_VS_CONN_F_TUNNEL: 17131da177e4SLinus Torvalds fwd = 'T'; break; 17141da177e4SLinus Torvalds case IP_VS_CONN_F_DROUTE: 17151da177e4SLinus Torvalds fwd = 'R'; break; 17161da177e4SLinus Torvalds case IP_VS_CONN_F_BYPASS: 17171da177e4SLinus Torvalds fwd = 'B'; break; 17181da177e4SLinus Torvalds default: 17191da177e4SLinus Torvalds fwd = '?'; break; 17201da177e4SLinus Torvalds } 17211da177e4SLinus Torvalds return fwd; 17221da177e4SLinus Torvalds } 17231da177e4SLinus Torvalds 17245c3a0fd7SJoe Perches void ip_vs_nat_icmp(struct sk_buff *skb, struct ip_vs_protocol *pp, 17251da177e4SLinus Torvalds struct ip_vs_conn *cp, int dir); 17261da177e4SLinus Torvalds 1727b3cdd2a7SJulius Volz #ifdef CONFIG_IP_VS_IPV6 17285c3a0fd7SJoe Perches void ip_vs_nat_icmp_v6(struct sk_buff *skb, struct ip_vs_protocol *pp, 1729b3cdd2a7SJulius Volz struct ip_vs_conn *cp, int dir); 
1730b3cdd2a7SJulius Volz #endif 1731b3cdd2a7SJulius Volz 17325c3a0fd7SJoe Perches __sum16 ip_vs_checksum_complete(struct sk_buff *skb, int offset); 17331da177e4SLinus Torvalds 1734f9214b26SAl Viro static inline __wsum ip_vs_check_diff4(__be32 old, __be32 new, __wsum oldsum) 17351da177e4SLinus Torvalds { 1736f9214b26SAl Viro __be32 diff[2] = { ~old, new }; 17371da177e4SLinus Torvalds 173807f0757aSJoe Perches return csum_partial(diff, sizeof(diff), oldsum); 1739f9214b26SAl Viro } 1740f9214b26SAl Viro 17410bbdd42bSJulius Volz #ifdef CONFIG_IP_VS_IPV6 17420bbdd42bSJulius Volz static inline __wsum ip_vs_check_diff16(const __be32 *old, const __be32 *new, 17430bbdd42bSJulius Volz __wsum oldsum) 17440bbdd42bSJulius Volz { 17450bbdd42bSJulius Volz __be32 diff[8] = { ~old[3], ~old[2], ~old[1], ~old[0], 17460bbdd42bSJulius Volz new[3], new[2], new[1], new[0] }; 17470bbdd42bSJulius Volz 174807f0757aSJoe Perches return csum_partial(diff, sizeof(diff), oldsum); 17490bbdd42bSJulius Volz } 17500bbdd42bSJulius Volz #endif 17510bbdd42bSJulius Volz 1752f9214b26SAl Viro static inline __wsum ip_vs_check_diff2(__be16 old, __be16 new, __wsum oldsum) 1753f9214b26SAl Viro { 1754f9214b26SAl Viro __be16 diff[2] = { ~old, new }; 1755f9214b26SAl Viro 175607f0757aSJoe Perches return csum_partial(diff, sizeof(diff), oldsum); 17571da177e4SLinus Torvalds } 17581da177e4SLinus Torvalds 175907dcc686SSimon Horman /* Forget current conntrack (unconfirmed) and attach notrack entry */ 1760cf356d69SJulian Anastasov static inline void ip_vs_notrack(struct sk_buff *skb) 1761cf356d69SJulian Anastasov { 1762cf356d69SJulian Anastasov #if defined(CONFIG_NF_CONNTRACK) || defined(CONFIG_NF_CONNTRACK_MODULE) 1763cf356d69SJulian Anastasov enum ip_conntrack_info ctinfo; 176406b69390SJesper Juhl struct nf_conn *ct = nf_ct_get(skb, &ctinfo); 1765cf356d69SJulian Anastasov 1766ab8bc7edSFlorian Westphal if (ct) { 176797a6ad13SFlorian Westphal nf_conntrack_put(&ct->ct_general); 1768cc41c84bSFlorian Westphal nf_ct_set(skb, 
NULL, IP_CT_UNTRACKED); 1769cf356d69SJulian Anastasov } 1770cf356d69SJulian Anastasov #endif 1771cf356d69SJulian Anastasov } 1772cf356d69SJulian Anastasov 1773f4bc17cdSJulian Anastasov #ifdef CONFIG_IP_VS_NFCT 177407dcc686SSimon Horman /* Netfilter connection tracking 1775f4bc17cdSJulian Anastasov * (from ip_vs_nfct.c) 1776f4bc17cdSJulian Anastasov */ 1777a0840e2eSHans Schillstrom static inline int ip_vs_conntrack_enabled(struct netns_ipvs *ipvs) 1778f4bc17cdSJulian Anastasov { 1779a4e2f5a7SSimon Horman #ifdef CONFIG_SYSCTL 1780a0840e2eSHans Schillstrom return ipvs->sysctl_conntrack; 1781a4e2f5a7SSimon Horman #else 1782a4e2f5a7SSimon Horman return 0; 1783a4e2f5a7SSimon Horman #endif 1784f4bc17cdSJulian Anastasov } 1785f4bc17cdSJulian Anastasov 17865c3a0fd7SJoe Perches void ip_vs_update_conntrack(struct sk_buff *skb, struct ip_vs_conn *cp, 17876523ce15SJulian Anastasov int outin); 17885c3a0fd7SJoe Perches int ip_vs_confirm_conntrack(struct sk_buff *skb); 17895c3a0fd7SJoe Perches void ip_vs_nfct_expect_related(struct sk_buff *skb, struct nf_conn *ct, 1790f4bc17cdSJulian Anastasov struct ip_vs_conn *cp, u_int8_t proto, 1791f4bc17cdSJulian Anastasov const __be16 port, int from_rs); 17925c3a0fd7SJoe Perches void ip_vs_conn_drop_conntrack(struct ip_vs_conn *cp); 1793f4bc17cdSJulian Anastasov 1794f4bc17cdSJulian Anastasov #else 1795f4bc17cdSJulian Anastasov 1796a0840e2eSHans Schillstrom static inline int ip_vs_conntrack_enabled(struct netns_ipvs *ipvs) 1797f4bc17cdSJulian Anastasov { 1798f4bc17cdSJulian Anastasov return 0; 1799f4bc17cdSJulian Anastasov } 1800f4bc17cdSJulian Anastasov 1801f4bc17cdSJulian Anastasov static inline void ip_vs_update_conntrack(struct sk_buff *skb, 1802f4bc17cdSJulian Anastasov struct ip_vs_conn *cp, int outin) 1803f4bc17cdSJulian Anastasov { 1804f4bc17cdSJulian Anastasov } 1805f4bc17cdSJulian Anastasov 1806e23ebf0fSKrzysztof Wilczynski static inline int ip_vs_confirm_conntrack(struct sk_buff *skb) 1807f4bc17cdSJulian Anastasov { 
1808f4bc17cdSJulian Anastasov return NF_ACCEPT; 1809f4bc17cdSJulian Anastasov } 1810f4bc17cdSJulian Anastasov 1811f4bc17cdSJulian Anastasov static inline void ip_vs_conn_drop_conntrack(struct ip_vs_conn *cp) 1812f4bc17cdSJulian Anastasov { 1813f4bc17cdSJulian Anastasov } 181407dcc686SSimon Horman #endif /* CONFIG_IP_VS_NFCT */ 18156523ce15SJulian Anastasov 1816f0a5e4d7SJulian Anastasov /* Using old conntrack that can not be redirected to another real server? */ 1817f0a5e4d7SJulian Anastasov static inline bool ip_vs_conn_uses_old_conntrack(struct ip_vs_conn *cp, 1818f719e375SJulian Anastasov struct sk_buff *skb) 1819f719e375SJulian Anastasov { 1820f719e375SJulian Anastasov #ifdef CONFIG_IP_VS_NFCT 1821f719e375SJulian Anastasov enum ip_conntrack_info ctinfo; 1822f719e375SJulian Anastasov struct nf_conn *ct; 1823f719e375SJulian Anastasov 1824f719e375SJulian Anastasov ct = nf_ct_get(skb, &ctinfo); 1825f0a5e4d7SJulian Anastasov if (ct && nf_ct_is_confirmed(ct)) 1826f719e375SJulian Anastasov return true; 1827f719e375SJulian Anastasov #endif 1828f719e375SJulian Anastasov return false; 1829f719e375SJulian Anastasov } 1830f719e375SJulian Anastasov 183131875d49SJulian Anastasov static inline int ip_vs_register_conntrack(struct ip_vs_service *svc) 183231875d49SJulian Anastasov { 183331875d49SJulian Anastasov #if IS_ENABLED(CONFIG_NF_CONNTRACK) 183431875d49SJulian Anastasov int afmask = (svc->af == AF_INET6) ? 
2 : 1; 183531875d49SJulian Anastasov int ret = 0; 183631875d49SJulian Anastasov 183731875d49SJulian Anastasov if (!(svc->conntrack_afmask & afmask)) { 183831875d49SJulian Anastasov ret = nf_ct_netns_get(svc->ipvs->net, svc->af); 183931875d49SJulian Anastasov if (ret >= 0) 184031875d49SJulian Anastasov svc->conntrack_afmask |= afmask; 184131875d49SJulian Anastasov } 184231875d49SJulian Anastasov return ret; 184331875d49SJulian Anastasov #else 184431875d49SJulian Anastasov return 0; 184531875d49SJulian Anastasov #endif 184631875d49SJulian Anastasov } 184731875d49SJulian Anastasov 184831875d49SJulian Anastasov static inline void ip_vs_unregister_conntrack(struct ip_vs_service *svc) 184931875d49SJulian Anastasov { 185031875d49SJulian Anastasov #if IS_ENABLED(CONFIG_NF_CONNTRACK) 185131875d49SJulian Anastasov int afmask = (svc->af == AF_INET6) ? 2 : 1; 185231875d49SJulian Anastasov 185331875d49SJulian Anastasov if (svc->conntrack_afmask & afmask) { 185431875d49SJulian Anastasov nf_ct_netns_put(svc->ipvs->net, svc->af); 185531875d49SJulian Anastasov svc->conntrack_afmask &= ~afmask; 185631875d49SJulian Anastasov } 185731875d49SJulian Anastasov #endif 185831875d49SJulian Anastasov } 185931875d49SJulian Anastasov 1860857ca897SJulian Anastasov int ip_vs_register_hooks(struct netns_ipvs *ipvs, unsigned int af); 1861857ca897SJulian Anastasov void ip_vs_unregister_hooks(struct netns_ipvs *ipvs, unsigned int af); 1862857ca897SJulian Anastasov 1863c16526a7SSimon Kirby static inline int 1864b552f7e3SChangli Gao ip_vs_dest_conn_overhead(struct ip_vs_dest *dest) 1865b552f7e3SChangli Gao { 186607dcc686SSimon Horman /* We think the overhead of processing active connections is 256 1867b552f7e3SChangli Gao * times higher than that of inactive connections in average. 
(This 1868b552f7e3SChangli Gao * 256 times might not be accurate, we will change it later) We 1869b552f7e3SChangli Gao * use the following formula to estimate the overhead now: 1870b552f7e3SChangli Gao * dest->activeconns*256 + dest->inactconns 1871b552f7e3SChangli Gao */ 1872b552f7e3SChangli Gao return (atomic_read(&dest->activeconns) << 8) + 1873b552f7e3SChangli Gao atomic_read(&dest->inactconns); 1874b552f7e3SChangli Gao } 1875b552f7e3SChangli Gao 1876edf597daSLeon Romanovsky #ifdef CONFIG_IP_VS_PROTO_TCP 1877edf597daSLeon Romanovsky INDIRECT_CALLABLE_DECLARE(int 1878edf597daSLeon Romanovsky tcp_snat_handler(struct sk_buff *skb, struct ip_vs_protocol *pp, 1879edf597daSLeon Romanovsky struct ip_vs_conn *cp, struct ip_vs_iphdr *iph)); 1880edf597daSLeon Romanovsky #endif 1881edf597daSLeon Romanovsky 1882edf597daSLeon Romanovsky #ifdef CONFIG_IP_VS_PROTO_UDP 1883edf597daSLeon Romanovsky INDIRECT_CALLABLE_DECLARE(int 1884edf597daSLeon Romanovsky udp_snat_handler(struct sk_buff *skb, struct ip_vs_protocol *pp, 1885edf597daSLeon Romanovsky struct ip_vs_conn *cp, struct ip_vs_iphdr *iph)); 1886edf597daSLeon Romanovsky #endif 1887bc4768ebSJulius Volz #endif /* _NET_IP_VS_H */ 1888