107dcc686SSimon Horman /* IP Virtual Server 21da177e4SLinus Torvalds * data structure and functionality definitions 31da177e4SLinus Torvalds */ 41da177e4SLinus Torvalds 5bc4768ebSJulius Volz #ifndef _NET_IP_VS_H 6bc4768ebSJulius Volz #define _NET_IP_VS_H 71da177e4SLinus Torvalds 8bc4768ebSJulius Volz #include <linux/ip_vs.h> /* definitions shared with userland */ 91da177e4SLinus Torvalds 10bc4768ebSJulius Volz #include <asm/types.h> /* for __uXX types */ 11bc4768ebSJulius Volz 121da177e4SLinus Torvalds #include <linux/list.h> /* for struct list_head */ 131da177e4SLinus Torvalds #include <linux/spinlock.h> /* for struct rwlock_t */ 1460063497SArun Sharma #include <linux/atomic.h> /* for struct atomic_t */ 151da177e4SLinus Torvalds #include <linux/compiler.h> 1614c85021SArnaldo Carvalho de Melo #include <linux/timer.h> 17187f1882SPaul Gortmaker #include <linux/bug.h> 181da177e4SLinus Torvalds 1914c85021SArnaldo Carvalho de Melo #include <net/checksum.h> 20e7ade46aSJulius Volz #include <linux/netfilter.h> /* for union nf_inet_addr */ 211668e010SKOVACS Krisztian #include <linux/ip.h> 22e7ade46aSJulius Volz #include <linux/ipv6.h> /* for struct ipv6hdr */ 234e3fd7a0SAlexey Dobriyan #include <net/ipv6.h> 2454d83efaSJesper Dangaard Brouer #if IS_ENABLED(CONFIG_IP_VS_IPV6) 2563dca2c0SJesper Dangaard Brouer #include <linux/netfilter_ipv6/ip6_tables.h> 2663dca2c0SJesper Dangaard Brouer #endif 27a638e514SJesper Dangaard Brouer #if IS_ENABLED(CONFIG_NF_CONNTRACK) 28f4bc17cdSJulian Anastasov #include <net/netfilter/nf_conntrack.h> 29f4bc17cdSJulian Anastasov #endif 3061b1ab45SHans Schillstrom #include <net/net_namespace.h> /* Netw namespace */ 3161b1ab45SHans Schillstrom 324fd9beefSAlex Gartrell #define IP_VS_HDR_INVERSE 1 334fd9beefSAlex Gartrell #define IP_VS_HDR_ICMP 2 344fd9beefSAlex Gartrell 3507dcc686SSimon Horman /* Generic access of ipvs struct */ 3661b1ab45SHans Schillstrom static inline struct netns_ipvs *net_ipvs(struct net* net) 3761b1ab45SHans Schillstrom { 
3861b1ab45SHans Schillstrom return net->ipvs; 3961b1ab45SHans Schillstrom } 4007dcc686SSimon Horman 4107dcc686SSimon Horman /* Get net ptr from skb in traffic cases 42fc723250SHans Schillstrom * use skb_sknet when call is from userland (ioctl or netlink) 43fc723250SHans Schillstrom */ 44a0840e2eSHans Schillstrom static inline struct net *skb_net(const struct sk_buff *skb) 45fc723250SHans Schillstrom { 46fc723250SHans Schillstrom #ifdef CONFIG_NET_NS 47fc723250SHans Schillstrom #ifdef CONFIG_IP_VS_DEBUG 48fc723250SHans Schillstrom /* 49fc723250SHans Schillstrom * This is used for debug only. 50fc723250SHans Schillstrom * Start with the most likely hit 51fc723250SHans Schillstrom * End with BUG 52fc723250SHans Schillstrom */ 530c5c9fb5SEric W. Biederman if (likely(skb->dev && dev_net(skb->dev))) 54fc723250SHans Schillstrom return dev_net(skb->dev); 55a09d1977SHans Schillstrom if (skb_dst(skb) && skb_dst(skb)->dev) 56fc723250SHans Schillstrom return dev_net(skb_dst(skb)->dev); 57fc723250SHans Schillstrom WARN(skb->sk, "Maybe skb_sknet should be used in %s() at line:%d\n", 58fc723250SHans Schillstrom __func__, __LINE__); 590c5c9fb5SEric W. Biederman if (likely(skb->sk && sock_net(skb->sk))) 60fc723250SHans Schillstrom return sock_net(skb->sk); 61fc723250SHans Schillstrom pr_err("There is no net ptr to find in the skb in %s() line:%d\n", 62fc723250SHans Schillstrom __func__, __LINE__); 63fc723250SHans Schillstrom BUG(); 64fc723250SHans Schillstrom #else 65fc723250SHans Schillstrom return dev_net(skb->dev ? 
: skb_dst(skb)->dev); 66fc723250SHans Schillstrom #endif 67fc723250SHans Schillstrom #else 68fc723250SHans Schillstrom return &init_net; 69fc723250SHans Schillstrom #endif 70fc723250SHans Schillstrom } 71fc723250SHans Schillstrom 72a0840e2eSHans Schillstrom static inline struct net *skb_sknet(const struct sk_buff *skb) 73fc723250SHans Schillstrom { 74fc723250SHans Schillstrom #ifdef CONFIG_NET_NS 75fc723250SHans Schillstrom #ifdef CONFIG_IP_VS_DEBUG 76fc723250SHans Schillstrom /* Start with the most likely hit */ 770c5c9fb5SEric W. Biederman if (likely(skb->sk && sock_net(skb->sk))) 78fc723250SHans Schillstrom return sock_net(skb->sk); 79fc723250SHans Schillstrom WARN(skb->dev, "Maybe skb_net should be used instead in %s() line:%d\n", 80fc723250SHans Schillstrom __func__, __LINE__); 810c5c9fb5SEric W. Biederman if (likely(skb->dev && dev_net(skb->dev))) 82fc723250SHans Schillstrom return dev_net(skb->dev); 83fc723250SHans Schillstrom pr_err("There is no net ptr to find in the skb in %s() line:%d\n", 84fc723250SHans Schillstrom __func__, __LINE__); 85fc723250SHans Schillstrom BUG(); 86fc723250SHans Schillstrom #else 87fc723250SHans Schillstrom return sock_net(skb->sk); 88fc723250SHans Schillstrom #endif 89fc723250SHans Schillstrom #else 90fc723250SHans Schillstrom return &init_net; 91fc723250SHans Schillstrom #endif 92fc723250SHans Schillstrom } 9307dcc686SSimon Horman 9407dcc686SSimon Horman /* This one needed for single_open_net since net is stored directly in 9525985edcSLucas De Marchi * private not as a struct i.e. seq_file_net can't be used. 
96b17fc996SHans Schillstrom */ 97b17fc996SHans Schillstrom static inline struct net *seq_file_single_net(struct seq_file *seq) 98b17fc996SHans Schillstrom { 99b17fc996SHans Schillstrom #ifdef CONFIG_NET_NS 100b17fc996SHans Schillstrom return (struct net *)seq->private; 101b17fc996SHans Schillstrom #else 102b17fc996SHans Schillstrom return &init_net; 103b17fc996SHans Schillstrom #endif 104b17fc996SHans Schillstrom } 1056f7edb48SCatalin(ux) M. BOIE 1066f7edb48SCatalin(ux) M. BOIE /* Connections' size value needed by ip_vs_ctl.c */ 1076f7edb48SCatalin(ux) M. BOIE extern int ip_vs_conn_tab_size; 1086f7edb48SCatalin(ux) M. BOIE 10964aae3cbSJulius Volz struct ip_vs_iphdr { 1104fd9beefSAlex Gartrell int hdr_flags; /* ipvs flags */ 111b0e010c5SAlex Gartrell __u32 off; /* Where IP or IPv4 header starts */ 11263dca2c0SJesper Dangaard Brouer __u32 len; /* IPv4 simply where L4 starts 11307dcc686SSimon Horman * IPv6 where L4 Transport Header starts */ 11463dca2c0SJesper Dangaard Brouer __u16 fragoffs; /* IPv6 fragment offset, 0 if first frag (or not frag)*/ 11563dca2c0SJesper Dangaard Brouer __s16 protocol; 11663dca2c0SJesper Dangaard Brouer __s32 flags; 11764aae3cbSJulius Volz union nf_inet_addr saddr; 11864aae3cbSJulius Volz union nf_inet_addr daddr; 11964aae3cbSJulius Volz }; 12064aae3cbSJulius Volz 1212f74713dSJesper Dangaard Brouer static inline void *frag_safe_skb_hp(const struct sk_buff *skb, int offset, 1222f74713dSJesper Dangaard Brouer int len, void *buffer, 1232f74713dSJesper Dangaard Brouer const struct ip_vs_iphdr *ipvsh) 1242f74713dSJesper Dangaard Brouer { 1252f74713dSJesper Dangaard Brouer return skb_header_pointer(skb, offset, len, buffer); 1262f74713dSJesper Dangaard Brouer } 1272f74713dSJesper Dangaard Brouer 12863dca2c0SJesper Dangaard Brouer /* This function handles filling *ip_vs_iphdr, both for IPv4 and IPv6. 
12963dca2c0SJesper Dangaard Brouer * IPv6 requires some extra work, as finding proper header position, 13063dca2c0SJesper Dangaard Brouer * depend on the IPv6 extension headers. 13163dca2c0SJesper Dangaard Brouer */ 132b0e010c5SAlex Gartrell static inline int 133b0e010c5SAlex Gartrell ip_vs_fill_iph_skb_off(int af, const struct sk_buff *skb, int offset, 1344fd9beefSAlex Gartrell int hdr_flags, struct ip_vs_iphdr *iphdr) 13564aae3cbSJulius Volz { 1364fd9beefSAlex Gartrell iphdr->hdr_flags = hdr_flags; 137b0e010c5SAlex Gartrell iphdr->off = offset; 1384fd9beefSAlex Gartrell 13964aae3cbSJulius Volz #ifdef CONFIG_IP_VS_IPV6 14064aae3cbSJulius Volz if (af == AF_INET6) { 141b0e010c5SAlex Gartrell struct ipv6hdr _iph; 142b0e010c5SAlex Gartrell const struct ipv6hdr *iph = skb_header_pointer( 143b0e010c5SAlex Gartrell skb, offset, sizeof(_iph), &_iph); 144b0e010c5SAlex Gartrell if (!iph) 145b0e010c5SAlex Gartrell return 0; 146b0e010c5SAlex Gartrell 1474e3fd7a0SAlexey Dobriyan iphdr->saddr.in6 = iph->saddr; 1484e3fd7a0SAlexey Dobriyan iphdr->daddr.in6 = iph->daddr; 1496aafeef0SJiri Pirko /* ipv6_find_hdr() updates len, flags */ 150b0e010c5SAlex Gartrell iphdr->len = offset; 15163dca2c0SJesper Dangaard Brouer iphdr->flags = 0; 15263dca2c0SJesper Dangaard Brouer iphdr->protocol = ipv6_find_hdr(skb, &iphdr->len, -1, 15363dca2c0SJesper Dangaard Brouer &iphdr->fragoffs, 15463dca2c0SJesper Dangaard Brouer &iphdr->flags); 155b0e010c5SAlex Gartrell if (iphdr->protocol < 0) 156b0e010c5SAlex Gartrell return 0; 15764aae3cbSJulius Volz } else 15864aae3cbSJulius Volz #endif 15964aae3cbSJulius Volz { 160b0e010c5SAlex Gartrell struct iphdr _iph; 161b0e010c5SAlex Gartrell const struct iphdr *iph = skb_header_pointer( 162b0e010c5SAlex Gartrell skb, offset, sizeof(_iph), &_iph); 163b0e010c5SAlex Gartrell if (!iph) 164b0e010c5SAlex Gartrell return 0; 165b0e010c5SAlex Gartrell 166b0e010c5SAlex Gartrell iphdr->len = offset + iph->ihl * 4; 16763dca2c0SJesper Dangaard Brouer iphdr->fragoffs = 0; 
16864aae3cbSJulius Volz iphdr->protocol = iph->protocol; 16964aae3cbSJulius Volz iphdr->saddr.ip = iph->saddr; 17064aae3cbSJulius Volz iphdr->daddr.ip = iph->daddr; 17164aae3cbSJulius Volz } 172b0e010c5SAlex Gartrell 173b0e010c5SAlex Gartrell return 1; 174b0e010c5SAlex Gartrell } 175b0e010c5SAlex Gartrell 176b0e010c5SAlex Gartrell static inline int 1774fd9beefSAlex Gartrell ip_vs_fill_iph_skb_icmp(int af, const struct sk_buff *skb, int offset, 1784fd9beefSAlex Gartrell bool inverse, struct ip_vs_iphdr *iphdr) 179b0e010c5SAlex Gartrell { 1804fd9beefSAlex Gartrell int hdr_flags = IP_VS_HDR_ICMP; 1814fd9beefSAlex Gartrell 1824fd9beefSAlex Gartrell if (inverse) 1834fd9beefSAlex Gartrell hdr_flags |= IP_VS_HDR_INVERSE; 1844fd9beefSAlex Gartrell 1854fd9beefSAlex Gartrell return ip_vs_fill_iph_skb_off(af, skb, offset, hdr_flags, iphdr); 1864fd9beefSAlex Gartrell } 1874fd9beefSAlex Gartrell 1884fd9beefSAlex Gartrell static inline int 1894fd9beefSAlex Gartrell ip_vs_fill_iph_skb(int af, const struct sk_buff *skb, bool inverse, 1904fd9beefSAlex Gartrell struct ip_vs_iphdr *iphdr) 1914fd9beefSAlex Gartrell { 1924fd9beefSAlex Gartrell int hdr_flags = 0; 1934fd9beefSAlex Gartrell 1944fd9beefSAlex Gartrell if (inverse) 1954fd9beefSAlex Gartrell hdr_flags |= IP_VS_HDR_INVERSE; 1964fd9beefSAlex Gartrell 1974fd9beefSAlex Gartrell return ip_vs_fill_iph_skb_off(af, skb, skb_network_offset(skb), 1984fd9beefSAlex Gartrell hdr_flags, iphdr); 1994fd9beefSAlex Gartrell } 2004fd9beefSAlex Gartrell 2014fd9beefSAlex Gartrell static inline bool 2024fd9beefSAlex Gartrell ip_vs_iph_inverse(const struct ip_vs_iphdr *iph) 2034fd9beefSAlex Gartrell { 2044fd9beefSAlex Gartrell return !!(iph->hdr_flags & IP_VS_HDR_INVERSE); 2054fd9beefSAlex Gartrell } 2064fd9beefSAlex Gartrell 2074fd9beefSAlex Gartrell static inline bool 2084fd9beefSAlex Gartrell ip_vs_iph_icmp(const struct ip_vs_iphdr *iph) 2094fd9beefSAlex Gartrell { 2104fd9beefSAlex Gartrell return !!(iph->hdr_flags & IP_VS_HDR_ICMP); 
21164aae3cbSJulius Volz } 21264aae3cbSJulius Volz 21364aae3cbSJulius Volz static inline void ip_vs_addr_copy(int af, union nf_inet_addr *dst, 21464aae3cbSJulius Volz const union nf_inet_addr *src) 21564aae3cbSJulius Volz { 21664aae3cbSJulius Volz #ifdef CONFIG_IP_VS_IPV6 21764aae3cbSJulius Volz if (af == AF_INET6) 2184e3fd7a0SAlexey Dobriyan dst->in6 = src->in6; 21964aae3cbSJulius Volz else 22064aae3cbSJulius Volz #endif 22164aae3cbSJulius Volz dst->ip = src->ip; 22264aae3cbSJulius Volz } 22364aae3cbSJulius Volz 2249a05475cSJulian Anastasov static inline void ip_vs_addr_set(int af, union nf_inet_addr *dst, 2259a05475cSJulian Anastasov const union nf_inet_addr *src) 2269a05475cSJulian Anastasov { 2279a05475cSJulian Anastasov #ifdef CONFIG_IP_VS_IPV6 2289a05475cSJulian Anastasov if (af == AF_INET6) { 2299a05475cSJulian Anastasov dst->in6 = src->in6; 2309a05475cSJulian Anastasov return; 2319a05475cSJulian Anastasov } 2329a05475cSJulian Anastasov #endif 2339a05475cSJulian Anastasov dst->ip = src->ip; 2349a05475cSJulian Anastasov dst->all[1] = 0; 2359a05475cSJulian Anastasov dst->all[2] = 0; 2369a05475cSJulian Anastasov dst->all[3] = 0; 2379a05475cSJulian Anastasov } 2389a05475cSJulian Anastasov 23964aae3cbSJulius Volz static inline int ip_vs_addr_equal(int af, const union nf_inet_addr *a, 24064aae3cbSJulius Volz const union nf_inet_addr *b) 24164aae3cbSJulius Volz { 24264aae3cbSJulius Volz #ifdef CONFIG_IP_VS_IPV6 24364aae3cbSJulius Volz if (af == AF_INET6) 24464aae3cbSJulius Volz return ipv6_addr_equal(&a->in6, &b->in6); 24564aae3cbSJulius Volz #endif 24664aae3cbSJulius Volz return a->ip == b->ip; 24764aae3cbSJulius Volz } 24864aae3cbSJulius Volz 2491da177e4SLinus Torvalds #ifdef CONFIG_IP_VS_DEBUG 25014c85021SArnaldo Carvalho de Melo #include <linux/net.h> 25114c85021SArnaldo Carvalho de Melo 2525c3a0fd7SJoe Perches int ip_vs_get_debug_level(void); 253c842a3adSJulius Volz 254c842a3adSJulius Volz static inline const char *ip_vs_dbg_addr(int af, char *buf, size_t 
buf_len, 255c842a3adSJulius Volz const union nf_inet_addr *addr, 256c842a3adSJulius Volz int *idx) 257c842a3adSJulius Volz { 258c842a3adSJulius Volz int len; 259c842a3adSJulius Volz #ifdef CONFIG_IP_VS_IPV6 260c842a3adSJulius Volz if (af == AF_INET6) 261120b9c14SJesper Dangaard Brouer len = snprintf(&buf[*idx], buf_len - *idx, "[%pI6c]", 2620c6ce78aSHarvey Harrison &addr->in6) + 1; 263c842a3adSJulius Volz else 264c842a3adSJulius Volz #endif 2653685f25dSHarvey Harrison len = snprintf(&buf[*idx], buf_len - *idx, "%pI4", 2663685f25dSHarvey Harrison &addr->ip) + 1; 267c842a3adSJulius Volz 268c842a3adSJulius Volz *idx += len; 269c842a3adSJulius Volz BUG_ON(*idx > buf_len + 1); 270c842a3adSJulius Volz return &buf[*idx - len]; 271c842a3adSJulius Volz } 272c842a3adSJulius Volz 2739aada7acSHannes Eder #define IP_VS_DBG_BUF(level, msg, ...) \ 274c842a3adSJulius Volz do { \ 275c842a3adSJulius Volz char ip_vs_dbg_buf[160]; \ 276c842a3adSJulius Volz int ip_vs_dbg_idx = 0; \ 277c842a3adSJulius Volz if (level <= ip_vs_get_debug_level()) \ 2789aada7acSHannes Eder printk(KERN_DEBUG pr_fmt(msg), ##__VA_ARGS__); \ 279c842a3adSJulius Volz } while (0) 280c842a3adSJulius Volz #define IP_VS_ERR_BUF(msg...) \ 281c842a3adSJulius Volz do { \ 282c842a3adSJulius Volz char ip_vs_dbg_buf[160]; \ 283c842a3adSJulius Volz int ip_vs_dbg_idx = 0; \ 2849aada7acSHannes Eder pr_err(msg); \ 285c842a3adSJulius Volz } while (0) 286c842a3adSJulius Volz 287c842a3adSJulius Volz /* Only use from within IP_VS_DBG_BUF() or IP_VS_ERR_BUF macros */ 288c842a3adSJulius Volz #define IP_VS_DBG_ADDR(af, addr) \ 289c842a3adSJulius Volz ip_vs_dbg_addr(af, ip_vs_dbg_buf, \ 290c842a3adSJulius Volz sizeof(ip_vs_dbg_buf), addr, \ 291c842a3adSJulius Volz &ip_vs_dbg_idx) 292c842a3adSJulius Volz 2939aada7acSHannes Eder #define IP_VS_DBG(level, msg, ...) 
\ 2941da177e4SLinus Torvalds do { \ 2951da177e4SLinus Torvalds if (level <= ip_vs_get_debug_level()) \ 2969aada7acSHannes Eder printk(KERN_DEBUG pr_fmt(msg), ##__VA_ARGS__); \ 2971da177e4SLinus Torvalds } while (0) 2989aada7acSHannes Eder #define IP_VS_DBG_RL(msg, ...) \ 2991da177e4SLinus Torvalds do { \ 3001da177e4SLinus Torvalds if (net_ratelimit()) \ 3019aada7acSHannes Eder printk(KERN_DEBUG pr_fmt(msg), ##__VA_ARGS__); \ 3021da177e4SLinus Torvalds } while (0) 3030d79641aSJulian Anastasov #define IP_VS_DBG_PKT(level, af, pp, skb, ofs, msg) \ 3041da177e4SLinus Torvalds do { \ 3051da177e4SLinus Torvalds if (level <= ip_vs_get_debug_level()) \ 3060d79641aSJulian Anastasov pp->debug_packet(af, pp, skb, ofs, msg); \ 3071da177e4SLinus Torvalds } while (0) 3080d79641aSJulian Anastasov #define IP_VS_DBG_RL_PKT(level, af, pp, skb, ofs, msg) \ 3091da177e4SLinus Torvalds do { \ 3101da177e4SLinus Torvalds if (level <= ip_vs_get_debug_level() && \ 3111da177e4SLinus Torvalds net_ratelimit()) \ 3120d79641aSJulian Anastasov pp->debug_packet(af, pp, skb, ofs, msg); \ 3131da177e4SLinus Torvalds } while (0) 3141da177e4SLinus Torvalds #else /* NO DEBUGGING at ALL */ 315c842a3adSJulius Volz #define IP_VS_DBG_BUF(level, msg...) do {} while (0) 316c842a3adSJulius Volz #define IP_VS_ERR_BUF(msg...) do {} while (0) 3171da177e4SLinus Torvalds #define IP_VS_DBG(level, msg...) do {} while (0) 3181da177e4SLinus Torvalds #define IP_VS_DBG_RL(msg...) do {} while (0) 3190d79641aSJulian Anastasov #define IP_VS_DBG_PKT(level, af, pp, skb, ofs, msg) do {} while (0) 3200d79641aSJulian Anastasov #define IP_VS_DBG_RL_PKT(level, af, pp, skb, ofs, msg) do {} while (0) 3211da177e4SLinus Torvalds #endif 3221da177e4SLinus Torvalds 3231da177e4SLinus Torvalds #define IP_VS_BUG() BUG() 3241e3e238eSHannes Eder #define IP_VS_ERR_RL(msg, ...) 
\ 3251da177e4SLinus Torvalds do { \ 3261da177e4SLinus Torvalds if (net_ratelimit()) \ 3271e3e238eSHannes Eder pr_err(msg, ##__VA_ARGS__); \ 3281da177e4SLinus Torvalds } while (0) 3291da177e4SLinus Torvalds 3301da177e4SLinus Torvalds #ifdef CONFIG_IP_VS_DEBUG 3311da177e4SLinus Torvalds #define EnterFunction(level) \ 3321da177e4SLinus Torvalds do { \ 3331da177e4SLinus Torvalds if (level <= ip_vs_get_debug_level()) \ 3349aada7acSHannes Eder printk(KERN_DEBUG \ 3359aada7acSHannes Eder pr_fmt("Enter: %s, %s line %i\n"), \ 336d5c003b4SHarvey Harrison __func__, __FILE__, __LINE__); \ 3371da177e4SLinus Torvalds } while (0) 3381da177e4SLinus Torvalds #define LeaveFunction(level) \ 3391da177e4SLinus Torvalds do { \ 3401da177e4SLinus Torvalds if (level <= ip_vs_get_debug_level()) \ 3419aada7acSHannes Eder printk(KERN_DEBUG \ 3429aada7acSHannes Eder pr_fmt("Leave: %s, %s line %i\n"), \ 343d5c003b4SHarvey Harrison __func__, __FILE__, __LINE__); \ 3441da177e4SLinus Torvalds } while (0) 3451da177e4SLinus Torvalds #else 3461da177e4SLinus Torvalds #define EnterFunction(level) do {} while (0) 3471da177e4SLinus Torvalds #define LeaveFunction(level) do {} while (0) 3481da177e4SLinus Torvalds #endif 3491da177e4SLinus Torvalds 35007dcc686SSimon Horman /* The port number of FTP service (in network order). 
*/ 351f3a7c66bSHarvey Harrison #define FTPPORT cpu_to_be16(21) 352f3a7c66bSHarvey Harrison #define FTPDATA cpu_to_be16(20) 3531da177e4SLinus Torvalds 35407dcc686SSimon Horman /* TCP State Values */ 3551da177e4SLinus Torvalds enum { 3561da177e4SLinus Torvalds IP_VS_TCP_S_NONE = 0, 3571da177e4SLinus Torvalds IP_VS_TCP_S_ESTABLISHED, 3581da177e4SLinus Torvalds IP_VS_TCP_S_SYN_SENT, 3591da177e4SLinus Torvalds IP_VS_TCP_S_SYN_RECV, 3601da177e4SLinus Torvalds IP_VS_TCP_S_FIN_WAIT, 3611da177e4SLinus Torvalds IP_VS_TCP_S_TIME_WAIT, 3621da177e4SLinus Torvalds IP_VS_TCP_S_CLOSE, 3631da177e4SLinus Torvalds IP_VS_TCP_S_CLOSE_WAIT, 3641da177e4SLinus Torvalds IP_VS_TCP_S_LAST_ACK, 3651da177e4SLinus Torvalds IP_VS_TCP_S_LISTEN, 3661da177e4SLinus Torvalds IP_VS_TCP_S_SYNACK, 3671da177e4SLinus Torvalds IP_VS_TCP_S_LAST 3681da177e4SLinus Torvalds }; 3691da177e4SLinus Torvalds 37007dcc686SSimon Horman /* UDP State Values */ 3711da177e4SLinus Torvalds enum { 3721da177e4SLinus Torvalds IP_VS_UDP_S_NORMAL, 3731da177e4SLinus Torvalds IP_VS_UDP_S_LAST, 3741da177e4SLinus Torvalds }; 3751da177e4SLinus Torvalds 37607dcc686SSimon Horman /* ICMP State Values */ 3771da177e4SLinus Torvalds enum { 3781da177e4SLinus Torvalds IP_VS_ICMP_S_NORMAL, 3791da177e4SLinus Torvalds IP_VS_ICMP_S_LAST, 3801da177e4SLinus Torvalds }; 3811da177e4SLinus Torvalds 38207dcc686SSimon Horman /* SCTP State Values */ 3832906f66aSVenkata Mohan Reddy enum ip_vs_sctp_states { 3842906f66aSVenkata Mohan Reddy IP_VS_SCTP_S_NONE, 38561e7c420SJulian Anastasov IP_VS_SCTP_S_INIT1, 38661e7c420SJulian Anastasov IP_VS_SCTP_S_INIT, 38761e7c420SJulian Anastasov IP_VS_SCTP_S_COOKIE_SENT, 38861e7c420SJulian Anastasov IP_VS_SCTP_S_COOKIE_REPLIED, 38961e7c420SJulian Anastasov IP_VS_SCTP_S_COOKIE_WAIT, 39061e7c420SJulian Anastasov IP_VS_SCTP_S_COOKIE, 39161e7c420SJulian Anastasov IP_VS_SCTP_S_COOKIE_ECHOED, 3922906f66aSVenkata Mohan Reddy IP_VS_SCTP_S_ESTABLISHED, 39361e7c420SJulian Anastasov IP_VS_SCTP_S_SHUTDOWN_SENT, 39461e7c420SJulian 
Anastasov IP_VS_SCTP_S_SHUTDOWN_RECEIVED, 39561e7c420SJulian Anastasov IP_VS_SCTP_S_SHUTDOWN_ACK_SENT, 39661e7c420SJulian Anastasov IP_VS_SCTP_S_REJECTED, 3972906f66aSVenkata Mohan Reddy IP_VS_SCTP_S_CLOSED, 3982906f66aSVenkata Mohan Reddy IP_VS_SCTP_S_LAST 3992906f66aSVenkata Mohan Reddy }; 4002906f66aSVenkata Mohan Reddy 40107dcc686SSimon Horman /* Delta sequence info structure 4021da177e4SLinus Torvalds * Each ip_vs_conn has 2 (output AND input seq. changes). 4031da177e4SLinus Torvalds * Only used in the VS/NAT. 4041da177e4SLinus Torvalds */ 4051da177e4SLinus Torvalds struct ip_vs_seq { 4061da177e4SLinus Torvalds __u32 init_seq; /* Add delta from this seq */ 4071da177e4SLinus Torvalds __u32 delta; /* Delta in sequence numbers */ 4081da177e4SLinus Torvalds __u32 previous_delta; /* Delta in sequence numbers 40907dcc686SSimon Horman * before last resized pkt */ 4101da177e4SLinus Torvalds }; 4111da177e4SLinus Torvalds 41207dcc686SSimon Horman /* counters per cpu */ 413b17fc996SHans Schillstrom struct ip_vs_counters { 414cd67cd5eSJulian Anastasov __u64 conns; /* connections scheduled */ 415cd67cd5eSJulian Anastasov __u64 inpkts; /* incoming packets */ 416cd67cd5eSJulian Anastasov __u64 outpkts; /* outgoing packets */ 417b17fc996SHans Schillstrom __u64 inbytes; /* incoming bytes */ 418b17fc996SHans Schillstrom __u64 outbytes; /* outgoing bytes */ 419b17fc996SHans Schillstrom }; 42007dcc686SSimon Horman /* Stats per cpu */ 421b17fc996SHans Schillstrom struct ip_vs_cpu_stats { 422cd67cd5eSJulian Anastasov struct ip_vs_counters cnt; 423b17fc996SHans Schillstrom struct u64_stats_sync syncp; 424b17fc996SHans Schillstrom }; 4251da177e4SLinus Torvalds 42607dcc686SSimon Horman /* IPVS statistics objects */ 4273a14a313SSven Wegener struct ip_vs_estimator { 4283a14a313SSven Wegener struct list_head list; 4293a14a313SSven Wegener 4303a14a313SSven Wegener u64 last_inbytes; 4313a14a313SSven Wegener u64 last_outbytes; 432cd67cd5eSJulian Anastasov u64 last_conns; 433cd67cd5eSJulian 
Anastasov u64 last_inpkts; 434cd67cd5eSJulian Anastasov u64 last_outpkts; 4353a14a313SSven Wegener 436cd67cd5eSJulian Anastasov u64 cps; 437cd67cd5eSJulian Anastasov u64 inpps; 438cd67cd5eSJulian Anastasov u64 outpps; 439cd67cd5eSJulian Anastasov u64 inbps; 440cd67cd5eSJulian Anastasov u64 outbps; 441cd67cd5eSJulian Anastasov }; 442cd67cd5eSJulian Anastasov 443cd67cd5eSJulian Anastasov /* 444cd67cd5eSJulian Anastasov * IPVS statistics object, 64-bit kernel version of struct ip_vs_stats_user 445cd67cd5eSJulian Anastasov */ 446cd67cd5eSJulian Anastasov struct ip_vs_kstats { 447cd67cd5eSJulian Anastasov u64 conns; /* connections scheduled */ 448cd67cd5eSJulian Anastasov u64 inpkts; /* incoming packets */ 449cd67cd5eSJulian Anastasov u64 outpkts; /* outgoing packets */ 450cd67cd5eSJulian Anastasov u64 inbytes; /* incoming bytes */ 451cd67cd5eSJulian Anastasov u64 outbytes; /* outgoing bytes */ 452cd67cd5eSJulian Anastasov 453cd67cd5eSJulian Anastasov u64 cps; /* current connection rate */ 454cd67cd5eSJulian Anastasov u64 inpps; /* current in packet rate */ 455cd67cd5eSJulian Anastasov u64 outpps; /* current out packet rate */ 456cd67cd5eSJulian Anastasov u64 inbps; /* current in byte rate */ 457cd67cd5eSJulian Anastasov u64 outbps; /* current out byte rate */ 4583a14a313SSven Wegener }; 4593a14a313SSven Wegener 460fd2c3ef7SEric Dumazet struct ip_vs_stats { 461cd67cd5eSJulian Anastasov struct ip_vs_kstats kstats; /* kernel statistics */ 462e9c0ce23SSven Wegener struct ip_vs_estimator est; /* estimator */ 463b962abdcSJulian Anastasov struct ip_vs_cpu_stats __percpu *cpustats; /* per cpu counters */ 4641da177e4SLinus Torvalds spinlock_t lock; /* spin lock */ 465cd67cd5eSJulian Anastasov struct ip_vs_kstats kstats0; /* reset values */ 4661da177e4SLinus Torvalds }; 4671da177e4SLinus Torvalds 46814c85021SArnaldo Carvalho de Melo struct dst_entry; 46914c85021SArnaldo Carvalho de Melo struct iphdr; 4701da177e4SLinus Torvalds struct ip_vs_conn; 4711da177e4SLinus Torvalds struct 
ip_vs_app; 47214c85021SArnaldo Carvalho de Melo struct sk_buff; 473252c6410SHans Schillstrom struct ip_vs_proto_data; 4741da177e4SLinus Torvalds 4751da177e4SLinus Torvalds struct ip_vs_protocol { 4761da177e4SLinus Torvalds struct ip_vs_protocol *next; 4771da177e4SLinus Torvalds char *name; 4782ad17defSJulian Anastasov u16 protocol; 4792ad17defSJulian Anastasov u16 num_states; 4801da177e4SLinus Torvalds int dont_defrag; 4811da177e4SLinus Torvalds 4821da177e4SLinus Torvalds void (*init)(struct ip_vs_protocol *pp); 4831da177e4SLinus Torvalds 4841da177e4SLinus Torvalds void (*exit)(struct ip_vs_protocol *pp); 4851da177e4SLinus Torvalds 4861281a9c2SEric W. Biederman int (*init_netns)(struct netns_ipvs *ipvs, struct ip_vs_proto_data *pd); 487252c6410SHans Schillstrom 4881281a9c2SEric W. Biederman void (*exit_netns)(struct netns_ipvs *ipvs, struct ip_vs_proto_data *pd); 489252c6410SHans Schillstrom 490d8f44c33SEric W. Biederman int (*conn_schedule)(struct netns_ipvs *ipvs, 491d8f44c33SEric W. Biederman int af, struct sk_buff *skb, 4929330419dSHans Schillstrom struct ip_vs_proto_data *pd, 493d4383f04SJesper Dangaard Brouer int *verdict, struct ip_vs_conn **cpp, 494d4383f04SJesper Dangaard Brouer struct ip_vs_iphdr *iph); 4951da177e4SLinus Torvalds 4961da177e4SLinus Torvalds struct ip_vs_conn * 497ab161976SEric W. Biederman (*conn_in_get)(struct netns_ipvs *ipvs, 498ab161976SEric W. Biederman int af, 49951ef348bSJulius Volz const struct sk_buff *skb, 500802c41adSAlex Gartrell const struct ip_vs_iphdr *iph); 5011da177e4SLinus Torvalds 5021da177e4SLinus Torvalds struct ip_vs_conn * 5030cf705c8SEric W. Biederman (*conn_out_get)(struct netns_ipvs *ipvs, 5040cf705c8SEric W. 
Biederman int af, 50551ef348bSJulius Volz const struct sk_buff *skb, 506802c41adSAlex Gartrell const struct ip_vs_iphdr *iph); 5071da177e4SLinus Torvalds 508d4383f04SJesper Dangaard Brouer int (*snat_handler)(struct sk_buff *skb, struct ip_vs_protocol *pp, 509d4383f04SJesper Dangaard Brouer struct ip_vs_conn *cp, struct ip_vs_iphdr *iph); 5101da177e4SLinus Torvalds 511d4383f04SJesper Dangaard Brouer int (*dnat_handler)(struct sk_buff *skb, struct ip_vs_protocol *pp, 512d4383f04SJesper Dangaard Brouer struct ip_vs_conn *cp, struct ip_vs_iphdr *iph); 5131da177e4SLinus Torvalds 51451ef348bSJulius Volz int (*csum_check)(int af, struct sk_buff *skb, 51551ef348bSJulius Volz struct ip_vs_protocol *pp); 5161da177e4SLinus Torvalds 5171da177e4SLinus Torvalds const char *(*state_name)(int state); 5181da177e4SLinus Torvalds 5194a516f11SSimon Horman void (*state_transition)(struct ip_vs_conn *cp, int direction, 5201da177e4SLinus Torvalds const struct sk_buff *skb, 5219330419dSHans Schillstrom struct ip_vs_proto_data *pd); 5221da177e4SLinus Torvalds 52319648918SEric W. Biederman int (*register_app)(struct netns_ipvs *ipvs, struct ip_vs_app *inc); 5241da177e4SLinus Torvalds 52519648918SEric W. 
Biederman void (*unregister_app)(struct netns_ipvs *ipvs, struct ip_vs_app *inc); 5261da177e4SLinus Torvalds 5271da177e4SLinus Torvalds int (*app_conn_bind)(struct ip_vs_conn *cp); 5281da177e4SLinus Torvalds 5290d79641aSJulian Anastasov void (*debug_packet)(int af, struct ip_vs_protocol *pp, 5301da177e4SLinus Torvalds const struct sk_buff *skb, 5311da177e4SLinus Torvalds int offset, 5321da177e4SLinus Torvalds const char *msg); 5331da177e4SLinus Torvalds 5349330419dSHans Schillstrom void (*timeout_change)(struct ip_vs_proto_data *pd, int flags); 5351da177e4SLinus Torvalds }; 5361da177e4SLinus Torvalds 53707dcc686SSimon Horman /* protocol data per netns */ 538252c6410SHans Schillstrom struct ip_vs_proto_data { 539252c6410SHans Schillstrom struct ip_vs_proto_data *next; 540252c6410SHans Schillstrom struct ip_vs_protocol *pp; 541252c6410SHans Schillstrom int *timeout_table; /* protocol timeout table */ 542252c6410SHans Schillstrom atomic_t appcnt; /* counter of proto app incs. */ 543252c6410SHans Schillstrom struct tcp_states_t *tcp_state_table; 544252c6410SHans Schillstrom }; 545252c6410SHans Schillstrom 5465c3a0fd7SJoe Perches struct ip_vs_protocol *ip_vs_proto_get(unsigned short proto); 54718d6ade6SEric W. Biederman struct ip_vs_proto_data *ip_vs_proto_data_get(struct netns_ipvs *ipvs, 548252c6410SHans Schillstrom unsigned short proto); 5491da177e4SLinus Torvalds 550f11017ecSSimon Horman struct ip_vs_conn_param { 551e64e2b46SEric W. 
Biederman struct netns_ipvs *ipvs; 552f11017ecSSimon Horman const union nf_inet_addr *caddr; 553f11017ecSSimon Horman const union nf_inet_addr *vaddr; 554f11017ecSSimon Horman __be16 cport; 555f11017ecSSimon Horman __be16 vport; 556f11017ecSSimon Horman __u16 protocol; 557f11017ecSSimon Horman u16 af; 55885999283SSimon Horman 55985999283SSimon Horman const struct ip_vs_pe *pe; 56085999283SSimon Horman char *pe_data; 56185999283SSimon Horman __u8 pe_data_len; 562f11017ecSSimon Horman }; 563f11017ecSSimon Horman 56407dcc686SSimon Horman /* IP_VS structure allocated for each dynamically scheduled connection */ 5651da177e4SLinus Torvalds struct ip_vs_conn { 566731109e7SChangli Gao struct hlist_node c_list; /* hashed list heads */ 5671da177e4SLinus Torvalds /* Protocol, addresses and port numbers */ 5686e67e586SHans Schillstrom __be16 cport; 5696e67e586SHans Schillstrom __be16 dport; 5701845ed0bSJulian Anastasov __be16 vport; 5711845ed0bSJulian Anastasov u16 af; /* address family */ 572e7ade46aSJulius Volz union nf_inet_addr caddr; /* client address */ 573e7ade46aSJulius Volz union nf_inet_addr vaddr; /* virtual address */ 574e7ade46aSJulius Volz union nf_inet_addr daddr; /* destination address */ 5753575792eSJulian Anastasov volatile __u32 flags; /* status flags */ 5761da177e4SLinus Torvalds __u16 protocol; /* Which protocol (TCP/UDP) */ 577ba38528aSAlex Gartrell __u16 daf; /* Address family of the dest */ 57858dbc6f2SEric W. 
Biederman struct netns_ipvs *ipvs; 5791da177e4SLinus Torvalds 5801da177e4SLinus Torvalds /* counter and timer */ 5811da177e4SLinus Torvalds atomic_t refcnt; /* reference count */ 5821da177e4SLinus Torvalds struct timer_list timer; /* Expiration timer */ 5831da177e4SLinus Torvalds volatile unsigned long timeout; /* timeout */ 5841da177e4SLinus Torvalds 5851da177e4SLinus Torvalds /* Flags and state transition */ 5861da177e4SLinus Torvalds spinlock_t lock; /* lock for state transition */ 5871da177e4SLinus Torvalds volatile __u16 state; /* state info */ 588efac5276SRumen G. Bogdanovski volatile __u16 old_state; /* old state, to be used for 589efac5276SRumen G. Bogdanovski * state transition triggerd 590efac5276SRumen G. Bogdanovski * synchronization 591efac5276SRumen G. Bogdanovski */ 5921845ed0bSJulian Anastasov __u32 fwmark; /* Fire wall mark from skb */ 593749c42b6SJulian Anastasov unsigned long sync_endtime; /* jiffies + sent_retries */ 5941da177e4SLinus Torvalds 5951da177e4SLinus Torvalds /* Control members */ 5961da177e4SLinus Torvalds struct ip_vs_conn *control; /* Master control connection */ 5971da177e4SLinus Torvalds atomic_t n_control; /* Number of controlled ones */ 5981da177e4SLinus Torvalds struct ip_vs_dest *dest; /* real server */ 5991da177e4SLinus Torvalds atomic_t in_pkts; /* incoming packet counter */ 6001da177e4SLinus Torvalds 60107dcc686SSimon Horman /* Packet transmitter for different forwarding methods. If it 60207dcc686SSimon Horman * mangles the packet, it must return NF_DROP or better NF_STOLEN, 60307dcc686SSimon Horman * otherwise this must be changed to a sk_buff **. 60407dcc686SSimon Horman * NF_ACCEPT can be returned when destination is local. 
6051da177e4SLinus Torvalds */ 6061da177e4SLinus Torvalds int (*packet_xmit)(struct sk_buff *skb, struct ip_vs_conn *cp, 607d4383f04SJesper Dangaard Brouer struct ip_vs_protocol *pp, struct ip_vs_iphdr *iph); 6081da177e4SLinus Torvalds 6091da177e4SLinus Torvalds /* Note: we can group the following members into a structure, 61007dcc686SSimon Horman * in order to save more space, and the following members are 61107dcc686SSimon Horman * only used in VS/NAT anyway 61207dcc686SSimon Horman */ 6131da177e4SLinus Torvalds struct ip_vs_app *app; /* bound ip_vs_app object */ 6141da177e4SLinus Torvalds void *app_data; /* Application private data */ 6151da177e4SLinus Torvalds struct ip_vs_seq in_seq; /* incoming seq. struct */ 6161da177e4SLinus Torvalds struct ip_vs_seq out_seq; /* outgoing seq. struct */ 61785999283SSimon Horman 618e9e5eee8SSimon Horman const struct ip_vs_pe *pe; 61985999283SSimon Horman char *pe_data; 62085999283SSimon Horman __u8 pe_data_len; 621088339a5SJulian Anastasov 622088339a5SJulian Anastasov struct rcu_head rcu_head; 6231da177e4SLinus Torvalds }; 6241da177e4SLinus Torvalds 62507dcc686SSimon Horman /* Extended internal versions of struct ip_vs_service_user and ip_vs_dest_user 62607dcc686SSimon Horman * for IPv6 support. 627c860c6b1SJulius Volz * 628c860c6b1SJulius Volz * We need these to conveniently pass around service and destination 629c860c6b1SJulius Volz * options, but unfortunately, we also need to keep the old definitions to 630c860c6b1SJulius Volz * maintain userspace backwards compatibility for the setsockopt interface. 
631c860c6b1SJulius Volz */ 632c860c6b1SJulius Volz struct ip_vs_service_user_kern { 633c860c6b1SJulius Volz /* virtual service addresses */ 634c860c6b1SJulius Volz u16 af; 635c860c6b1SJulius Volz u16 protocol; 636c860c6b1SJulius Volz union nf_inet_addr addr; /* virtual ip address */ 6370a925864SJulian Anastasov __be16 port; 638c860c6b1SJulius Volz u32 fwmark; /* firwall mark of service */ 639c860c6b1SJulius Volz 640c860c6b1SJulius Volz /* virtual service options */ 641c860c6b1SJulius Volz char *sched_name; 6420d1e71b0SSimon Horman char *pe_name; 64395c96174SEric Dumazet unsigned int flags; /* virtual service flags */ 64495c96174SEric Dumazet unsigned int timeout; /* persistent timeout in sec */ 6450a925864SJulian Anastasov __be32 netmask; /* persistent netmask or plen */ 646c860c6b1SJulius Volz }; 647c860c6b1SJulius Volz 648c860c6b1SJulius Volz 649c860c6b1SJulius Volz struct ip_vs_dest_user_kern { 650c860c6b1SJulius Volz /* destination server address */ 651c860c6b1SJulius Volz union nf_inet_addr addr; 6520a925864SJulian Anastasov __be16 port; 653c860c6b1SJulius Volz 654c860c6b1SJulius Volz /* real server options */ 65595c96174SEric Dumazet unsigned int conn_flags; /* connection flags */ 656c860c6b1SJulius Volz int weight; /* destination weight */ 657c860c6b1SJulius Volz 658c860c6b1SJulius Volz /* thresholds for active connections */ 659c860c6b1SJulius Volz u32 u_threshold; /* upper threshold */ 660c860c6b1SJulius Volz u32 l_threshold; /* lower threshold */ 6616cff339bSAlex Gartrell 6626cff339bSAlex Gartrell /* Address family of addr */ 6636cff339bSAlex Gartrell u16 af; 664c860c6b1SJulius Volz }; 665c860c6b1SJulius Volz 666c860c6b1SJulius Volz 667c860c6b1SJulius Volz /* 66807dcc686SSimon Horman * The information about the virtual service offered to the net and the 66907dcc686SSimon Horman * forwarding entries. 
6701da177e4SLinus Torvalds */ 6711da177e4SLinus Torvalds struct ip_vs_service { 672ceec4c38SJulian Anastasov struct hlist_node s_list; /* for normal service table */ 673ceec4c38SJulian Anastasov struct hlist_node f_list; /* for fwmark-based service table */ 6741da177e4SLinus Torvalds atomic_t refcnt; /* reference counter */ 6751da177e4SLinus Torvalds 676e7ade46aSJulius Volz u16 af; /* address family */ 6771da177e4SLinus Torvalds __u16 protocol; /* which protocol (TCP/UDP) */ 678e7ade46aSJulius Volz union nf_inet_addr addr; /* IP address for virtual service */ 679014d730dSAl Viro __be16 port; /* port number for the service */ 6801da177e4SLinus Torvalds __u32 fwmark; /* firewall mark of the service */ 68195c96174SEric Dumazet unsigned int flags; /* service status flags */ 68295c96174SEric Dumazet unsigned int timeout; /* persistent timeout in ticks */ 6830a925864SJulian Anastasov __be32 netmask; /* grouping granularity, mask/plen */ 6843109d2f2SEric W. Biederman struct netns_ipvs *ipvs; 6851da177e4SLinus Torvalds 6861da177e4SLinus Torvalds struct list_head destinations; /* real server d-linked list */ 6871da177e4SLinus Torvalds __u32 num_dests; /* number of servers */ 6881da177e4SLinus Torvalds struct ip_vs_stats stats; /* statistics for the service */ 6891da177e4SLinus Torvalds 6901da177e4SLinus Torvalds /* for scheduling */ 691ceec4c38SJulian Anastasov struct ip_vs_scheduler __rcu *scheduler; /* bound scheduler object */ 692ba3a3ce1SJulian Anastasov spinlock_t sched_lock; /* lock sched_data */ 6931da177e4SLinus Torvalds void *sched_data; /* scheduler application data */ 69485999283SSimon Horman 69585999283SSimon Horman /* alternate persistence engine */ 696ceec4c38SJulian Anastasov struct ip_vs_pe __rcu *pe; 697ceec4c38SJulian Anastasov 698ceec4c38SJulian Anastasov struct rcu_head rcu_head; 6991da177e4SLinus Torvalds }; 7001da177e4SLinus Torvalds 701026ace06SJulian Anastasov /* Information for cached dst */ 702026ace06SJulian Anastasov struct ip_vs_dest_dst { 
703026ace06SJulian Anastasov struct dst_entry *dst_cache; /* destination cache entry */ 704026ace06SJulian Anastasov u32 dst_cookie; 705026ace06SJulian Anastasov union nf_inet_addr dst_saddr; 706026ace06SJulian Anastasov struct rcu_head rcu_head; 707026ace06SJulian Anastasov }; 7081da177e4SLinus Torvalds 70907dcc686SSimon Horman /* The real server destination forwarding entry with ip address, port number, 71007dcc686SSimon Horman * and so on. 7111da177e4SLinus Torvalds */ 7121da177e4SLinus Torvalds struct ip_vs_dest { 7131da177e4SLinus Torvalds struct list_head n_list; /* for the dests in the service */ 714276472eaSJulian Anastasov struct hlist_node d_list; /* for table with all the dests */ 7151da177e4SLinus Torvalds 716e7ade46aSJulius Volz u16 af; /* address family */ 717014d730dSAl Viro __be16 port; /* port number of the server */ 718f2431e6eSHans Schillstrom union nf_inet_addr addr; /* IP address of the server */ 71995c96174SEric Dumazet volatile unsigned int flags; /* dest status flags */ 7201da177e4SLinus Torvalds atomic_t conn_flags; /* flags to copy to conn */ 7211da177e4SLinus Torvalds atomic_t weight; /* server weight */ 7221da177e4SLinus Torvalds 7231da177e4SLinus Torvalds atomic_t refcnt; /* reference counter */ 7241da177e4SLinus Torvalds struct ip_vs_stats stats; /* statistics */ 725bcbde4c0SJulian Anastasov unsigned long idle_start; /* start time, jiffies */ 7261da177e4SLinus Torvalds 7271da177e4SLinus Torvalds /* connection counters and thresholds */ 7281da177e4SLinus Torvalds atomic_t activeconns; /* active connections */ 7291da177e4SLinus Torvalds atomic_t inactconns; /* inactive connections */ 7301da177e4SLinus Torvalds atomic_t persistconns; /* persistent connections */ 7311da177e4SLinus Torvalds __u32 u_threshold; /* upper threshold */ 7321da177e4SLinus Torvalds __u32 l_threshold; /* lower threshold */ 7331da177e4SLinus Torvalds 7341da177e4SLinus Torvalds /* for destination cache */ 7351da177e4SLinus Torvalds spinlock_t dst_lock; /* lock of 
dst_cache */ 736026ace06SJulian Anastasov struct ip_vs_dest_dst __rcu *dest_dst; /* cached dst info */ 7371da177e4SLinus Torvalds 7381da177e4SLinus Torvalds /* for virtual service */ 739bcbde4c0SJulian Anastasov struct ip_vs_service __rcu *svc; /* service it belongs to */ 7401da177e4SLinus Torvalds __u16 protocol; /* which protocol (TCP/UDP) */ 741014d730dSAl Viro __be16 vport; /* virtual port number */ 742f2431e6eSHans Schillstrom union nf_inet_addr vaddr; /* virtual IP address */ 7431da177e4SLinus Torvalds __u32 vfwmark; /* firewall mark of service */ 744276472eaSJulian Anastasov 745578bc3efSJulian Anastasov struct list_head t_list; /* in dest_trash */ 746276472eaSJulian Anastasov unsigned int in_rs_table:1; /* we are in rs_table */ 7471da177e4SLinus Torvalds }; 7481da177e4SLinus Torvalds 74907dcc686SSimon Horman /* The scheduler object */ 7501da177e4SLinus Torvalds struct ip_vs_scheduler { 7511da177e4SLinus Torvalds struct list_head n_list; /* d-linked list head */ 7521da177e4SLinus Torvalds char *name; /* scheduler name */ 7531da177e4SLinus Torvalds atomic_t refcnt; /* reference counter */ 7541da177e4SLinus Torvalds struct module *module; /* THIS_MODULE/NULL */ 7551da177e4SLinus Torvalds 7561da177e4SLinus Torvalds /* scheduler initializing service */ 7571da177e4SLinus Torvalds int (*init_service)(struct ip_vs_service *svc); 7581da177e4SLinus Torvalds /* scheduling service finish */ 759ed3ffc4eSJulian Anastasov void (*done_service)(struct ip_vs_service *svc); 7606b6df466SJulian Anastasov /* dest is linked */ 7616b6df466SJulian Anastasov int (*add_dest)(struct ip_vs_service *svc, struct ip_vs_dest *dest); 7626b6df466SJulian Anastasov /* dest is unlinked */ 7636b6df466SJulian Anastasov int (*del_dest)(struct ip_vs_service *svc, struct ip_vs_dest *dest); 7646b6df466SJulian Anastasov /* dest is updated */ 7656b6df466SJulian Anastasov int (*upd_dest)(struct ip_vs_service *svc, struct ip_vs_dest *dest); 7661da177e4SLinus Torvalds 7671da177e4SLinus Torvalds /* 
selecting a server from the given service */ 7681da177e4SLinus Torvalds struct ip_vs_dest* (*schedule)(struct ip_vs_service *svc, 769bba54de5SJulian Anastasov const struct sk_buff *skb, 770bba54de5SJulian Anastasov struct ip_vs_iphdr *iph); 7711da177e4SLinus Torvalds }; 7721da177e4SLinus Torvalds 77385999283SSimon Horman /* The persistence engine object */ 77485999283SSimon Horman struct ip_vs_pe { 77585999283SSimon Horman struct list_head n_list; /* d-linked list head */ 77685999283SSimon Horman char *name; /* scheduler name */ 77785999283SSimon Horman atomic_t refcnt; /* reference counter */ 77885999283SSimon Horman struct module *module; /* THIS_MODULE/NULL */ 77985999283SSimon Horman 78085999283SSimon Horman /* get the connection template, if any */ 78185999283SSimon Horman int (*fill_param)(struct ip_vs_conn_param *p, struct sk_buff *skb); 78285999283SSimon Horman bool (*ct_match)(const struct ip_vs_conn_param *p, 78385999283SSimon Horman struct ip_vs_conn *ct); 78485999283SSimon Horman u32 (*hashkey_raw)(const struct ip_vs_conn_param *p, u32 initval, 78585999283SSimon Horman bool inverse); 786a3c918acSSimon Horman int (*show_pe_data)(const struct ip_vs_conn *cp, char *buf); 78785999283SSimon Horman }; 7881da177e4SLinus Torvalds 78907dcc686SSimon Horman /* The application module object (a.k.a. 
app incarnation) */ 790fd2c3ef7SEric Dumazet struct ip_vs_app { 7911da177e4SLinus Torvalds struct list_head a_list; /* member in app list */ 7921da177e4SLinus Torvalds int type; /* IP_VS_APP_TYPE_xxx */ 7931da177e4SLinus Torvalds char *name; /* application module name */ 7941da177e4SLinus Torvalds __u16 protocol; 7951da177e4SLinus Torvalds struct module *module; /* THIS_MODULE/NULL */ 7961da177e4SLinus Torvalds struct list_head incs_list; /* list of incarnations */ 7971da177e4SLinus Torvalds 7981da177e4SLinus Torvalds /* members for application incarnations */ 7991da177e4SLinus Torvalds struct list_head p_list; /* member in proto app list */ 8001da177e4SLinus Torvalds struct ip_vs_app *app; /* its real application */ 801014d730dSAl Viro __be16 port; /* port number in net order */ 8021da177e4SLinus Torvalds atomic_t usecnt; /* usage counter */ 803363c97d7SJulian Anastasov struct rcu_head rcu_head; 8041da177e4SLinus Torvalds 80507dcc686SSimon Horman /* output hook: Process packet in inout direction, diff set for TCP. 8068b27b10fSJulian Anastasov * Return: 0=Error, 1=Payload Not Mangled/Mangled but checksum is ok, 8078b27b10fSJulian Anastasov * 2=Mangled but checksum was not updated 8088b27b10fSJulian Anastasov */ 8091da177e4SLinus Torvalds int (*pkt_out)(struct ip_vs_app *, struct ip_vs_conn *, 8103db05feaSHerbert Xu struct sk_buff *, int *diff); 8111da177e4SLinus Torvalds 81207dcc686SSimon Horman /* input hook: Process packet in outin direction, diff set for TCP. 
8138b27b10fSJulian Anastasov * Return: 0=Error, 1=Payload Not Mangled/Mangled but checksum is ok, 8148b27b10fSJulian Anastasov * 2=Mangled but checksum was not updated 8158b27b10fSJulian Anastasov */ 8161da177e4SLinus Torvalds int (*pkt_in)(struct ip_vs_app *, struct ip_vs_conn *, 8173db05feaSHerbert Xu struct sk_buff *, int *diff); 8181da177e4SLinus Torvalds 8191da177e4SLinus Torvalds /* ip_vs_app initializer */ 8201da177e4SLinus Torvalds int (*init_conn)(struct ip_vs_app *, struct ip_vs_conn *); 8211da177e4SLinus Torvalds 8221da177e4SLinus Torvalds /* ip_vs_app finish */ 8231da177e4SLinus Torvalds int (*done_conn)(struct ip_vs_app *, struct ip_vs_conn *); 8241da177e4SLinus Torvalds 8251da177e4SLinus Torvalds 8261da177e4SLinus Torvalds /* not used now */ 8271da177e4SLinus Torvalds int (*bind_conn)(struct ip_vs_app *, struct ip_vs_conn *, 8281da177e4SLinus Torvalds struct ip_vs_protocol *); 8291da177e4SLinus Torvalds 8301da177e4SLinus Torvalds void (*unbind_conn)(struct ip_vs_app *, struct ip_vs_conn *); 8311da177e4SLinus Torvalds 8321da177e4SLinus Torvalds int * timeout_table; 8331da177e4SLinus Torvalds int * timeouts; 8341da177e4SLinus Torvalds int timeouts_size; 8351da177e4SLinus Torvalds 8361da177e4SLinus Torvalds int (*conn_schedule)(struct sk_buff *skb, struct ip_vs_app *app, 8371da177e4SLinus Torvalds int *verdict, struct ip_vs_conn **cpp); 8381da177e4SLinus Torvalds 8391da177e4SLinus Torvalds struct ip_vs_conn * 8401da177e4SLinus Torvalds (*conn_in_get)(const struct sk_buff *skb, struct ip_vs_app *app, 841d4383f04SJesper Dangaard Brouer const struct iphdr *iph, int inverse); 8421da177e4SLinus Torvalds 8431da177e4SLinus Torvalds struct ip_vs_conn * 8441da177e4SLinus Torvalds (*conn_out_get)(const struct sk_buff *skb, struct ip_vs_app *app, 845d4383f04SJesper Dangaard Brouer const struct iphdr *iph, int inverse); 8461da177e4SLinus Torvalds 8471da177e4SLinus Torvalds int (*state_transition)(struct ip_vs_conn *cp, int direction, 8481da177e4SLinus Torvalds const 
struct sk_buff *skb, 8491da177e4SLinus Torvalds struct ip_vs_app *app); 8501da177e4SLinus Torvalds 8511da177e4SLinus Torvalds void (*timeout_change)(struct ip_vs_app *app, int flags); 8521da177e4SLinus Torvalds }; 8531da177e4SLinus Torvalds 854f73181c8SPablo Neira Ayuso struct ipvs_master_sync_state { 855f73181c8SPablo Neira Ayuso struct list_head sync_queue; 856f73181c8SPablo Neira Ayuso struct ip_vs_sync_buff *sync_buff; 85707995674SZhang Yanfei unsigned long sync_queue_len; 858f73181c8SPablo Neira Ayuso unsigned int sync_queue_delay; 859f73181c8SPablo Neira Ayuso struct task_struct *master_thread; 860f73181c8SPablo Neira Ayuso struct delayed_work master_wakeup_work; 861f73181c8SPablo Neira Ayuso struct netns_ipvs *ipvs; 862f73181c8SPablo Neira Ayuso }; 863f73181c8SPablo Neira Ayuso 864578bc3efSJulian Anastasov /* How much time to keep dests in trash */ 865578bc3efSJulian Anastasov #define IP_VS_DEST_TRASH_PERIOD (120 * HZ) 866578bc3efSJulian Anastasov 867e4ff6751SJulian Anastasov struct ipvs_sync_daemon_cfg { 868d3328817SJulian Anastasov union nf_inet_addr mcast_group; 869e4ff6751SJulian Anastasov int syncid; 870e4ff6751SJulian Anastasov u16 sync_maxlen; 871d3328817SJulian Anastasov u16 mcast_port; 872d3328817SJulian Anastasov u8 mcast_af; 873d3328817SJulian Anastasov u8 mcast_ttl; 874e4ff6751SJulian Anastasov /* multicast interface name */ 875e4ff6751SJulian Anastasov char mcast_ifn[IP_VS_IFNAME_MAXLEN]; 876e4ff6751SJulian Anastasov }; 877e4ff6751SJulian Anastasov 8782553d064SJulian Anastasov /* IPVS in network namespace */ 8792553d064SJulian Anastasov struct netns_ipvs { 8802553d064SJulian Anastasov int gen; /* Generation */ 8817a4f0761SHans Schillstrom int enable; /* enable like nf_hooks do */ 88207dcc686SSimon Horman /* Hash table: for real service lookups */ 8832553d064SJulian Anastasov #define IP_VS_RTAB_BITS 4 8842553d064SJulian Anastasov #define IP_VS_RTAB_SIZE (1 << IP_VS_RTAB_BITS) 8852553d064SJulian Anastasov #define IP_VS_RTAB_MASK (IP_VS_RTAB_SIZE - 
1) 8862553d064SJulian Anastasov 887276472eaSJulian Anastasov struct hlist_head rs_table[IP_VS_RTAB_SIZE]; 8882553d064SJulian Anastasov /* ip_vs_app */ 8892553d064SJulian Anastasov struct list_head app_list; 8902553d064SJulian Anastasov /* ip_vs_proto */ 8912553d064SJulian Anastasov #define IP_VS_PROTO_TAB_SIZE 32 /* must be power of 2 */ 8922553d064SJulian Anastasov struct ip_vs_proto_data *proto_data_table[IP_VS_PROTO_TAB_SIZE]; 8932553d064SJulian Anastasov /* ip_vs_proto_tcp */ 8942553d064SJulian Anastasov #ifdef CONFIG_IP_VS_PROTO_TCP 8952553d064SJulian Anastasov #define TCP_APP_TAB_BITS 4 8962553d064SJulian Anastasov #define TCP_APP_TAB_SIZE (1 << TCP_APP_TAB_BITS) 8972553d064SJulian Anastasov #define TCP_APP_TAB_MASK (TCP_APP_TAB_SIZE - 1) 8982553d064SJulian Anastasov struct list_head tcp_apps[TCP_APP_TAB_SIZE]; 8992553d064SJulian Anastasov #endif 9002553d064SJulian Anastasov /* ip_vs_proto_udp */ 9012553d064SJulian Anastasov #ifdef CONFIG_IP_VS_PROTO_UDP 9022553d064SJulian Anastasov #define UDP_APP_TAB_BITS 4 9032553d064SJulian Anastasov #define UDP_APP_TAB_SIZE (1 << UDP_APP_TAB_BITS) 9042553d064SJulian Anastasov #define UDP_APP_TAB_MASK (UDP_APP_TAB_SIZE - 1) 9052553d064SJulian Anastasov struct list_head udp_apps[UDP_APP_TAB_SIZE]; 9062553d064SJulian Anastasov #endif 9072553d064SJulian Anastasov /* ip_vs_proto_sctp */ 9082553d064SJulian Anastasov #ifdef CONFIG_IP_VS_PROTO_SCTP 9092553d064SJulian Anastasov #define SCTP_APP_TAB_BITS 4 9102553d064SJulian Anastasov #define SCTP_APP_TAB_SIZE (1 << SCTP_APP_TAB_BITS) 9112553d064SJulian Anastasov #define SCTP_APP_TAB_MASK (SCTP_APP_TAB_SIZE - 1) 9122553d064SJulian Anastasov /* Hash table for SCTP application incarnations */ 9132553d064SJulian Anastasov struct list_head sctp_apps[SCTP_APP_TAB_SIZE]; 9142553d064SJulian Anastasov #endif 9152553d064SJulian Anastasov /* ip_vs_conn */ 9162553d064SJulian Anastasov atomic_t conn_count; /* connection counter */ 9172553d064SJulian Anastasov 9182553d064SJulian Anastasov /* 
ip_vs_ctl */ 9192a0751afSJulian Anastasov struct ip_vs_stats tot_stats; /* Statistics & est. */ 9202553d064SJulian Anastasov 9212553d064SJulian Anastasov int num_services; /* no of virtual services */ 922f2247fbdSSimon Horman 9232553d064SJulian Anastasov /* Trash for destinations */ 9242553d064SJulian Anastasov struct list_head dest_trash; 925578bc3efSJulian Anastasov spinlock_t dest_trash_lock; 926578bc3efSJulian Anastasov struct timer_list dest_trash_timer; /* expiration timer */ 9272553d064SJulian Anastasov /* Service counters */ 9282553d064SJulian Anastasov atomic_t ftpsvc_counter; 9292553d064SJulian Anastasov atomic_t nullsvc_counter; 9302553d064SJulian Anastasov 931f2247fbdSSimon Horman #ifdef CONFIG_SYSCTL 932f2247fbdSSimon Horman /* 1/rate drop and drop-entry variables */ 933f2247fbdSSimon Horman struct delayed_work defense_work; /* Work handler */ 934f2247fbdSSimon Horman int drop_rate; 935f2247fbdSSimon Horman int drop_counter; 936f2247fbdSSimon Horman atomic_t dropentry; 937f2247fbdSSimon Horman /* locks in ctl.c */ 938f2247fbdSSimon Horman spinlock_t dropentry_lock; /* drop entry handling */ 939f2247fbdSSimon Horman spinlock_t droppacket_lock; /* drop packet handling */ 940f2247fbdSSimon Horman spinlock_t securetcp_lock; /* state and timeout tables */ 941f2247fbdSSimon Horman 9422553d064SJulian Anastasov /* sys-ctl struct */ 9432553d064SJulian Anastasov struct ctl_table_header *sysctl_hdr; 9442553d064SJulian Anastasov struct ctl_table *sysctl_tbl; 945f2247fbdSSimon Horman #endif 946f2247fbdSSimon Horman 9472553d064SJulian Anastasov /* sysctl variables */ 9482553d064SJulian Anastasov int sysctl_amemthresh; 9492553d064SJulian Anastasov int sysctl_am_droprate; 9502553d064SJulian Anastasov int sysctl_drop_entry; 9512553d064SJulian Anastasov int sysctl_drop_packet; 9522553d064SJulian Anastasov int sysctl_secure_tcp; 9532553d064SJulian Anastasov #ifdef CONFIG_IP_VS_NFCT 9542553d064SJulian Anastasov int sysctl_conntrack; 9552553d064SJulian Anastasov #endif 
9562553d064SJulian Anastasov int sysctl_snat_reroute; 9572553d064SJulian Anastasov int sysctl_sync_ver; 958f73181c8SPablo Neira Ayuso int sysctl_sync_ports; 9594d0c875dSJulian Anastasov int sysctl_sync_persist_mode; 96007995674SZhang Yanfei unsigned long sysctl_sync_qlen_max; 9611c003b15SPablo Neira Ayuso int sysctl_sync_sock_size; 9622553d064SJulian Anastasov int sysctl_cache_bypass; 9632553d064SJulian Anastasov int sysctl_expire_nodest_conn; 964c6c96c18SAlexander Frolkin int sysctl_sloppy_tcp; 965c6c96c18SAlexander Frolkin int sysctl_sloppy_sctp; 9662553d064SJulian Anastasov int sysctl_expire_quiescent_template; 9672553d064SJulian Anastasov int sysctl_sync_threshold[2]; 968749c42b6SJulian Anastasov unsigned int sysctl_sync_refresh_period; 969749c42b6SJulian Anastasov int sysctl_sync_retries; 9702553d064SJulian Anastasov int sysctl_nat_icmp_send; 9713654e611SJulian Anastasov int sysctl_pmtu_disc; 9720c12582fSJulian Anastasov int sysctl_backup_only; 973d752c364SMarcelo Ricardo Leitner int sysctl_conn_reuse_mode; 97494485fedSAlex Gartrell int sysctl_schedule_icmp; 9754e478098SAlex Gartrell int sysctl_ignore_tunneled; 9762553d064SJulian Anastasov 9772553d064SJulian Anastasov /* ip_vs_lblc */ 9782553d064SJulian Anastasov int sysctl_lblc_expiration; 9792553d064SJulian Anastasov struct ctl_table_header *lblc_ctl_header; 9802553d064SJulian Anastasov struct ctl_table *lblc_ctl_table; 9812553d064SJulian Anastasov /* ip_vs_lblcr */ 9822553d064SJulian Anastasov int sysctl_lblcr_expiration; 9832553d064SJulian Anastasov struct ctl_table_header *lblcr_ctl_header; 9842553d064SJulian Anastasov struct ctl_table *lblcr_ctl_table; 9852553d064SJulian Anastasov /* ip_vs_est */ 9862553d064SJulian Anastasov struct list_head est_list; /* estimator list */ 9872553d064SJulian Anastasov spinlock_t est_lock; 9882553d064SJulian Anastasov struct timer_list est_timer; /* Estimation timer */ 9892553d064SJulian Anastasov /* ip_vs_sync */ 9902553d064SJulian Anastasov spinlock_t sync_lock; 
991f73181c8SPablo Neira Ayuso struct ipvs_master_sync_state *ms; 9922553d064SJulian Anastasov spinlock_t sync_buff_lock; 993f73181c8SPablo Neira Ayuso struct task_struct **backup_threads; 994f73181c8SPablo Neira Ayuso int threads_mask; 9952553d064SJulian Anastasov volatile int sync_state; 996ae1d48b2SHans Schillstrom struct mutex sync_mutex; 997e4ff6751SJulian Anastasov struct ipvs_sync_daemon_cfg mcfg; /* Master Configuration */ 998e4ff6751SJulian Anastasov struct ipvs_sync_daemon_cfg bcfg; /* Backup Configuration */ 9992553d064SJulian Anastasov /* net name space ptr */ 10002553d064SJulian Anastasov struct net *net; /* Needed by timer routines */ 100107dcc686SSimon Horman /* Number of heterogeneous destinations, needed becaus heterogeneous 100207dcc686SSimon Horman * are not supported when synchronization is enabled. 100307dcc686SSimon Horman */ 1004391f503dSAlex Gartrell unsigned int mixed_address_family_dests; 10052553d064SJulian Anastasov }; 10061da177e4SLinus Torvalds 100759e0350eSSimon Horman #define DEFAULT_SYNC_THRESHOLD 3 100859e0350eSSimon Horman #define DEFAULT_SYNC_PERIOD 50 10097532e8d4SSimon Horman #define DEFAULT_SYNC_VER 1 1010c6c96c18SAlexander Frolkin #define DEFAULT_SLOPPY_TCP 0 1011c6c96c18SAlexander Frolkin #define DEFAULT_SLOPPY_SCTP 0 1012749c42b6SJulian Anastasov #define DEFAULT_SYNC_REFRESH_PERIOD (0U * HZ) 1013749c42b6SJulian Anastasov #define DEFAULT_SYNC_RETRIES 0 10141c003b15SPablo Neira Ayuso #define IPVS_SYNC_WAKEUP_RATE 8 10151c003b15SPablo Neira Ayuso #define IPVS_SYNC_QLEN_MAX (IPVS_SYNC_WAKEUP_RATE * 4) 10161c003b15SPablo Neira Ayuso #define IPVS_SYNC_SEND_DELAY (HZ / 50) 10171c003b15SPablo Neira Ayuso #define IPVS_SYNC_CHECK_PERIOD HZ 1018749c42b6SJulian Anastasov #define IPVS_SYNC_FLUSH_TIME (HZ * 2) 1019f73181c8SPablo Neira Ayuso #define IPVS_SYNC_PORTS_MAX (1 << 6) 102059e0350eSSimon Horman 102159e0350eSSimon Horman #ifdef CONFIG_SYSCTL 102259e0350eSSimon Horman 102359e0350eSSimon Horman static inline int 
sysctl_sync_threshold(struct netns_ipvs *ipvs) 102459e0350eSSimon Horman { 102559e0350eSSimon Horman return ipvs->sysctl_sync_threshold[0]; 102659e0350eSSimon Horman } 102759e0350eSSimon Horman 102859e0350eSSimon Horman static inline int sysctl_sync_period(struct netns_ipvs *ipvs) 102959e0350eSSimon Horman { 1030749c42b6SJulian Anastasov return ACCESS_ONCE(ipvs->sysctl_sync_threshold[1]); 1031749c42b6SJulian Anastasov } 1032749c42b6SJulian Anastasov 1033749c42b6SJulian Anastasov static inline unsigned int sysctl_sync_refresh_period(struct netns_ipvs *ipvs) 1034749c42b6SJulian Anastasov { 1035749c42b6SJulian Anastasov return ACCESS_ONCE(ipvs->sysctl_sync_refresh_period); 1036749c42b6SJulian Anastasov } 1037749c42b6SJulian Anastasov 1038749c42b6SJulian Anastasov static inline int sysctl_sync_retries(struct netns_ipvs *ipvs) 1039749c42b6SJulian Anastasov { 1040749c42b6SJulian Anastasov return ipvs->sysctl_sync_retries; 104159e0350eSSimon Horman } 104259e0350eSSimon Horman 10437532e8d4SSimon Horman static inline int sysctl_sync_ver(struct netns_ipvs *ipvs) 10447532e8d4SSimon Horman { 10457532e8d4SSimon Horman return ipvs->sysctl_sync_ver; 10467532e8d4SSimon Horman } 10477532e8d4SSimon Horman 1048c6c96c18SAlexander Frolkin static inline int sysctl_sloppy_tcp(struct netns_ipvs *ipvs) 1049c6c96c18SAlexander Frolkin { 1050c6c96c18SAlexander Frolkin return ipvs->sysctl_sloppy_tcp; 1051c6c96c18SAlexander Frolkin } 1052c6c96c18SAlexander Frolkin 1053c6c96c18SAlexander Frolkin static inline int sysctl_sloppy_sctp(struct netns_ipvs *ipvs) 1054c6c96c18SAlexander Frolkin { 1055c6c96c18SAlexander Frolkin return ipvs->sysctl_sloppy_sctp; 1056c6c96c18SAlexander Frolkin } 1057c6c96c18SAlexander Frolkin 1058f73181c8SPablo Neira Ayuso static inline int sysctl_sync_ports(struct netns_ipvs *ipvs) 1059f73181c8SPablo Neira Ayuso { 1060f73181c8SPablo Neira Ayuso return ACCESS_ONCE(ipvs->sysctl_sync_ports); 1061f73181c8SPablo Neira Ayuso } 1062f73181c8SPablo Neira Ayuso 10634d0c875dSJulian 
Anastasov static inline int sysctl_sync_persist_mode(struct netns_ipvs *ipvs) 10644d0c875dSJulian Anastasov { 10654d0c875dSJulian Anastasov return ipvs->sysctl_sync_persist_mode; 10664d0c875dSJulian Anastasov } 10674d0c875dSJulian Anastasov 106807995674SZhang Yanfei static inline unsigned long sysctl_sync_qlen_max(struct netns_ipvs *ipvs) 10691c003b15SPablo Neira Ayuso { 10701c003b15SPablo Neira Ayuso return ipvs->sysctl_sync_qlen_max; 10711c003b15SPablo Neira Ayuso } 10721c003b15SPablo Neira Ayuso 10731c003b15SPablo Neira Ayuso static inline int sysctl_sync_sock_size(struct netns_ipvs *ipvs) 10741c003b15SPablo Neira Ayuso { 10751c003b15SPablo Neira Ayuso return ipvs->sysctl_sync_sock_size; 10761c003b15SPablo Neira Ayuso } 10771c003b15SPablo Neira Ayuso 10783654e611SJulian Anastasov static inline int sysctl_pmtu_disc(struct netns_ipvs *ipvs) 10793654e611SJulian Anastasov { 10803654e611SJulian Anastasov return ipvs->sysctl_pmtu_disc; 10813654e611SJulian Anastasov } 10823654e611SJulian Anastasov 10830c12582fSJulian Anastasov static inline int sysctl_backup_only(struct netns_ipvs *ipvs) 10840c12582fSJulian Anastasov { 10850c12582fSJulian Anastasov return ipvs->sync_state & IP_VS_STATE_BACKUP && 10860c12582fSJulian Anastasov ipvs->sysctl_backup_only; 10870c12582fSJulian Anastasov } 10880c12582fSJulian Anastasov 1089d752c364SMarcelo Ricardo Leitner static inline int sysctl_conn_reuse_mode(struct netns_ipvs *ipvs) 1090d752c364SMarcelo Ricardo Leitner { 1091d752c364SMarcelo Ricardo Leitner return ipvs->sysctl_conn_reuse_mode; 1092d752c364SMarcelo Ricardo Leitner } 1093d752c364SMarcelo Ricardo Leitner 109494485fedSAlex Gartrell static inline int sysctl_schedule_icmp(struct netns_ipvs *ipvs) 109594485fedSAlex Gartrell { 109694485fedSAlex Gartrell return ipvs->sysctl_schedule_icmp; 109794485fedSAlex Gartrell } 109894485fedSAlex Gartrell 10994e478098SAlex Gartrell static inline int sysctl_ignore_tunneled(struct netns_ipvs *ipvs) 11004e478098SAlex Gartrell { 11014e478098SAlex 
Gartrell return ipvs->sysctl_ignore_tunneled; 11024e478098SAlex Gartrell } 11034e478098SAlex Gartrell 110457032948SEric W. Biederman static inline int sysctl_cache_bypass(struct netns_ipvs *ipvs) 110557032948SEric W. Biederman { 110657032948SEric W. Biederman return ipvs->sysctl_cache_bypass; 110757032948SEric W. Biederman } 110857032948SEric W. Biederman 110959e0350eSSimon Horman #else 111059e0350eSSimon Horman 111159e0350eSSimon Horman static inline int sysctl_sync_threshold(struct netns_ipvs *ipvs) 111259e0350eSSimon Horman { 111359e0350eSSimon Horman return DEFAULT_SYNC_THRESHOLD; 111459e0350eSSimon Horman } 111559e0350eSSimon Horman 111659e0350eSSimon Horman static inline int sysctl_sync_period(struct netns_ipvs *ipvs) 111759e0350eSSimon Horman { 111859e0350eSSimon Horman return DEFAULT_SYNC_PERIOD; 111959e0350eSSimon Horman } 112059e0350eSSimon Horman 1121749c42b6SJulian Anastasov static inline unsigned int sysctl_sync_refresh_period(struct netns_ipvs *ipvs) 1122749c42b6SJulian Anastasov { 1123749c42b6SJulian Anastasov return DEFAULT_SYNC_REFRESH_PERIOD; 1124749c42b6SJulian Anastasov } 1125749c42b6SJulian Anastasov 1126749c42b6SJulian Anastasov static inline int sysctl_sync_retries(struct netns_ipvs *ipvs) 1127749c42b6SJulian Anastasov { 1128749c42b6SJulian Anastasov return DEFAULT_SYNC_RETRIES & 3; 1129749c42b6SJulian Anastasov } 1130749c42b6SJulian Anastasov 11317532e8d4SSimon Horman static inline int sysctl_sync_ver(struct netns_ipvs *ipvs) 11327532e8d4SSimon Horman { 11337532e8d4SSimon Horman return DEFAULT_SYNC_VER; 11347532e8d4SSimon Horman } 11357532e8d4SSimon Horman 1136c6c96c18SAlexander Frolkin static inline int sysctl_sloppy_tcp(struct netns_ipvs *ipvs) 1137c6c96c18SAlexander Frolkin { 1138c6c96c18SAlexander Frolkin return DEFAULT_SLOPPY_TCP; 1139c6c96c18SAlexander Frolkin } 1140c6c96c18SAlexander Frolkin 1141c6c96c18SAlexander Frolkin static inline int sysctl_sloppy_sctp(struct netns_ipvs *ipvs) 1142c6c96c18SAlexander Frolkin { 
1143c6c96c18SAlexander Frolkin return DEFAULT_SLOPPY_SCTP; 1144c6c96c18SAlexander Frolkin } 1145c6c96c18SAlexander Frolkin 1146f73181c8SPablo Neira Ayuso static inline int sysctl_sync_ports(struct netns_ipvs *ipvs) 1147f73181c8SPablo Neira Ayuso { 1148f73181c8SPablo Neira Ayuso return 1; 1149f73181c8SPablo Neira Ayuso } 1150f73181c8SPablo Neira Ayuso 11514d0c875dSJulian Anastasov static inline int sysctl_sync_persist_mode(struct netns_ipvs *ipvs) 11524d0c875dSJulian Anastasov { 11534d0c875dSJulian Anastasov return 0; 11544d0c875dSJulian Anastasov } 11554d0c875dSJulian Anastasov 115607995674SZhang Yanfei static inline unsigned long sysctl_sync_qlen_max(struct netns_ipvs *ipvs) 11571c003b15SPablo Neira Ayuso { 11581c003b15SPablo Neira Ayuso return IPVS_SYNC_QLEN_MAX; 11591c003b15SPablo Neira Ayuso } 11601c003b15SPablo Neira Ayuso 11611c003b15SPablo Neira Ayuso static inline int sysctl_sync_sock_size(struct netns_ipvs *ipvs) 11621c003b15SPablo Neira Ayuso { 11631c003b15SPablo Neira Ayuso return 0; 11641c003b15SPablo Neira Ayuso } 11651c003b15SPablo Neira Ayuso 11663654e611SJulian Anastasov static inline int sysctl_pmtu_disc(struct netns_ipvs *ipvs) 11673654e611SJulian Anastasov { 11683654e611SJulian Anastasov return 1; 11693654e611SJulian Anastasov } 11703654e611SJulian Anastasov 11710c12582fSJulian Anastasov static inline int sysctl_backup_only(struct netns_ipvs *ipvs) 11720c12582fSJulian Anastasov { 11730c12582fSJulian Anastasov return 0; 11740c12582fSJulian Anastasov } 11750c12582fSJulian Anastasov 1176d752c364SMarcelo Ricardo Leitner static inline int sysctl_conn_reuse_mode(struct netns_ipvs *ipvs) 1177d752c364SMarcelo Ricardo Leitner { 1178d752c364SMarcelo Ricardo Leitner return 1; 1179d752c364SMarcelo Ricardo Leitner } 1180d752c364SMarcelo Ricardo Leitner 118194485fedSAlex Gartrell static inline int sysctl_schedule_icmp(struct netns_ipvs *ipvs) 118294485fedSAlex Gartrell { 118394485fedSAlex Gartrell return 0; 118494485fedSAlex Gartrell } 118594485fedSAlex 
Gartrell 11864e478098SAlex Gartrell static inline int sysctl_ignore_tunneled(struct netns_ipvs *ipvs) 11874e478098SAlex Gartrell { 11884e478098SAlex Gartrell return 0; 11894e478098SAlex Gartrell } 11904e478098SAlex Gartrell 119157032948SEric W. Biederman static inline int sysctl_cache_bypass(struct netns_ipvs *ipvs) 119257032948SEric W. Biederman { 119357032948SEric W. Biederman return 0; 119457032948SEric W. Biederman } 119557032948SEric W. Biederman 119659e0350eSSimon Horman #endif 119759e0350eSSimon Horman 119807dcc686SSimon Horman /* IPVS core functions 11991da177e4SLinus Torvalds * (from ip_vs_core.c) 12001da177e4SLinus Torvalds */ 12015c3a0fd7SJoe Perches const char *ip_vs_proto_name(unsigned int proto); 12025c3a0fd7SJoe Perches void ip_vs_init_hash_table(struct list_head *table, int rows); 1203afdd6140SSven Wegener #define IP_VS_INIT_HASH_TABLE(t) ip_vs_init_hash_table((t), ARRAY_SIZE((t))) 12041da177e4SLinus Torvalds 12051da177e4SLinus Torvalds #define IP_VS_APP_TYPE_FTP 1 12061da177e4SLinus Torvalds 120707dcc686SSimon Horman /* ip_vs_conn handling functions 12081da177e4SLinus Torvalds * (from ip_vs_conn.c) 12091da177e4SLinus Torvalds */ 12101da177e4SLinus Torvalds enum { 12111da177e4SLinus Torvalds IP_VS_DIR_INPUT = 0, 12121da177e4SLinus Torvalds IP_VS_DIR_OUTPUT, 12131da177e4SLinus Torvalds IP_VS_DIR_INPUT_ONLY, 12141da177e4SLinus Torvalds IP_VS_DIR_LAST, 12151da177e4SLinus Torvalds }; 12161da177e4SLinus Torvalds 121719913decSEric W. Biederman static inline void ip_vs_conn_fill_param(struct netns_ipvs *ipvs, int af, int protocol, 1218f11017ecSSimon Horman const union nf_inet_addr *caddr, 1219f11017ecSSimon Horman __be16 cport, 1220f11017ecSSimon Horman const union nf_inet_addr *vaddr, 1221f11017ecSSimon Horman __be16 vport, 1222f11017ecSSimon Horman struct ip_vs_conn_param *p) 1223f11017ecSSimon Horman { 122419913decSEric W. 
Biederman p->ipvs = ipvs; 1225f11017ecSSimon Horman p->af = af; 1226f11017ecSSimon Horman p->protocol = protocol; 1227f11017ecSSimon Horman p->caddr = caddr; 1228f11017ecSSimon Horman p->cport = cport; 1229f11017ecSSimon Horman p->vaddr = vaddr; 1230f11017ecSSimon Horman p->vport = vport; 123185999283SSimon Horman p->pe = NULL; 123285999283SSimon Horman p->pe_data = NULL; 1233f11017ecSSimon Horman } 123428364a59SJulius Volz 1235f11017ecSSimon Horman struct ip_vs_conn *ip_vs_conn_in_get(const struct ip_vs_conn_param *p); 1236f11017ecSSimon Horman struct ip_vs_conn *ip_vs_ct_in_get(const struct ip_vs_conn_param *p); 123728364a59SJulius Volz 1238ab161976SEric W. Biederman struct ip_vs_conn * ip_vs_conn_in_get_proto(struct netns_ipvs *ipvs, int af, 1239ab161976SEric W. Biederman const struct sk_buff *skb, 1240802c41adSAlex Gartrell const struct ip_vs_iphdr *iph); 12415c0d2374SSimon Horman 1242f11017ecSSimon Horman struct ip_vs_conn *ip_vs_conn_out_get(const struct ip_vs_conn_param *p); 12431da177e4SLinus Torvalds 12440cf705c8SEric W. Biederman struct ip_vs_conn * ip_vs_conn_out_get_proto(struct netns_ipvs *ipvs, int af, 12450cf705c8SEric W. Biederman const struct sk_buff *skb, 1246802c41adSAlex Gartrell const struct ip_vs_iphdr *iph); 12475c0d2374SSimon Horman 1248088339a5SJulian Anastasov /* Get reference to gain full access to conn. 1249088339a5SJulian Anastasov * By default, RCU read-side critical sections have access only to 1250088339a5SJulian Anastasov * conn fields and its PE data, see ip_vs_conn_rcu_free() for reference. 
1251088339a5SJulian Anastasov */ 1252088339a5SJulian Anastasov static inline bool __ip_vs_conn_get(struct ip_vs_conn *cp) 1253088339a5SJulian Anastasov { 1254088339a5SJulian Anastasov return atomic_inc_not_zero(&cp->refcnt); 1255088339a5SJulian Anastasov } 1256088339a5SJulian Anastasov 12571da177e4SLinus Torvalds /* put back the conn without restarting its timer */ 12581da177e4SLinus Torvalds static inline void __ip_vs_conn_put(struct ip_vs_conn *cp) 12591da177e4SLinus Torvalds { 12604e857c58SPeter Zijlstra smp_mb__before_atomic(); 12611da177e4SLinus Torvalds atomic_dec(&cp->refcnt); 12621da177e4SLinus Torvalds } 12635c3a0fd7SJoe Perches void ip_vs_conn_put(struct ip_vs_conn *cp); 12645c3a0fd7SJoe Perches void ip_vs_conn_fill_cport(struct ip_vs_conn *cp, __be16 cport); 12651da177e4SLinus Torvalds 1266ba38528aSAlex Gartrell struct ip_vs_conn *ip_vs_conn_new(const struct ip_vs_conn_param *p, int dest_af, 1267f11017ecSSimon Horman const union nf_inet_addr *daddr, 126895c96174SEric Dumazet __be16 dport, unsigned int flags, 12690e051e68SHans Schillstrom struct ip_vs_dest *dest, __u32 fwmark); 12705c3a0fd7SJoe Perches void ip_vs_conn_expire_now(struct ip_vs_conn *cp); 12711da177e4SLinus Torvalds 12725c3a0fd7SJoe Perches const char *ip_vs_state_name(__u16 proto, int state); 12731da177e4SLinus Torvalds 127469f39093SEric W. Biederman void ip_vs_tcp_conn_listen(struct ip_vs_conn *cp); 12755c3a0fd7SJoe Perches int ip_vs_check_template(struct ip_vs_conn *ct); 1276423b5595SEric W. 
Biederman void ip_vs_random_dropentry(struct netns_ipvs *ipvs); 12775c3a0fd7SJoe Perches int ip_vs_conn_init(void); 12785c3a0fd7SJoe Perches void ip_vs_conn_cleanup(void); 12791da177e4SLinus Torvalds 12801da177e4SLinus Torvalds static inline void ip_vs_control_del(struct ip_vs_conn *cp) 12811da177e4SLinus Torvalds { 12821da177e4SLinus Torvalds struct ip_vs_conn *ctl_cp = cp->control; 12831da177e4SLinus Torvalds if (!ctl_cp) { 1284cfc78c5aSJulius Volz IP_VS_ERR_BUF("request control DEL for uncontrolled: " 1285cfc78c5aSJulius Volz "%s:%d to %s:%d\n", 1286cfc78c5aSJulius Volz IP_VS_DBG_ADDR(cp->af, &cp->caddr), 1287cfc78c5aSJulius Volz ntohs(cp->cport), 1288cfc78c5aSJulius Volz IP_VS_DBG_ADDR(cp->af, &cp->vaddr), 1289cfc78c5aSJulius Volz ntohs(cp->vport)); 1290cfc78c5aSJulius Volz 12911da177e4SLinus Torvalds return; 12921da177e4SLinus Torvalds } 12931da177e4SLinus Torvalds 1294cfc78c5aSJulius Volz IP_VS_DBG_BUF(7, "DELeting control for: " 1295cfc78c5aSJulius Volz "cp.dst=%s:%d ctl_cp.dst=%s:%d\n", 1296cfc78c5aSJulius Volz IP_VS_DBG_ADDR(cp->af, &cp->caddr), 1297cfc78c5aSJulius Volz ntohs(cp->cport), 1298cfc78c5aSJulius Volz IP_VS_DBG_ADDR(cp->af, &ctl_cp->caddr), 1299cfc78c5aSJulius Volz ntohs(ctl_cp->cport)); 13001da177e4SLinus Torvalds 13011da177e4SLinus Torvalds cp->control = NULL; 13021da177e4SLinus Torvalds if (atomic_read(&ctl_cp->n_control) == 0) { 1303cfc78c5aSJulius Volz IP_VS_ERR_BUF("BUG control DEL with n=0 : " 1304cfc78c5aSJulius Volz "%s:%d to %s:%d\n", 1305cfc78c5aSJulius Volz IP_VS_DBG_ADDR(cp->af, &cp->caddr), 1306cfc78c5aSJulius Volz ntohs(cp->cport), 1307cfc78c5aSJulius Volz IP_VS_DBG_ADDR(cp->af, &cp->vaddr), 1308cfc78c5aSJulius Volz ntohs(cp->vport)); 1309cfc78c5aSJulius Volz 13101da177e4SLinus Torvalds return; 13111da177e4SLinus Torvalds } 13121da177e4SLinus Torvalds atomic_dec(&ctl_cp->n_control); 13131da177e4SLinus Torvalds } 13141da177e4SLinus Torvalds 13151da177e4SLinus Torvalds static inline void 13161da177e4SLinus Torvalds 
ip_vs_control_add(struct ip_vs_conn *cp, struct ip_vs_conn *ctl_cp) 13171da177e4SLinus Torvalds { 13181da177e4SLinus Torvalds if (cp->control) { 1319cfc78c5aSJulius Volz IP_VS_ERR_BUF("request control ADD for already controlled: " 1320cfc78c5aSJulius Volz "%s:%d to %s:%d\n", 1321cfc78c5aSJulius Volz IP_VS_DBG_ADDR(cp->af, &cp->caddr), 1322cfc78c5aSJulius Volz ntohs(cp->cport), 1323cfc78c5aSJulius Volz IP_VS_DBG_ADDR(cp->af, &cp->vaddr), 1324cfc78c5aSJulius Volz ntohs(cp->vport)); 1325cfc78c5aSJulius Volz 13261da177e4SLinus Torvalds ip_vs_control_del(cp); 13271da177e4SLinus Torvalds } 13281da177e4SLinus Torvalds 1329cfc78c5aSJulius Volz IP_VS_DBG_BUF(7, "ADDing control for: " 1330cfc78c5aSJulius Volz "cp.dst=%s:%d ctl_cp.dst=%s:%d\n", 1331cfc78c5aSJulius Volz IP_VS_DBG_ADDR(cp->af, &cp->caddr), 1332cfc78c5aSJulius Volz ntohs(cp->cport), 1333cfc78c5aSJulius Volz IP_VS_DBG_ADDR(cp->af, &ctl_cp->caddr), 1334cfc78c5aSJulius Volz ntohs(ctl_cp->cport)); 13351da177e4SLinus Torvalds 13361da177e4SLinus Torvalds cp->control = ctl_cp; 13371da177e4SLinus Torvalds atomic_inc(&ctl_cp->n_control); 13381da177e4SLinus Torvalds } 13391da177e4SLinus Torvalds 134007dcc686SSimon Horman /* IPVS netns init & cleanup functions */ 1341a4dd0360SEric W. Biederman int ip_vs_estimator_net_init(struct netns_ipvs *ipvs); 13423d993766SEric W. Biederman int ip_vs_control_net_init(struct netns_ipvs *ipvs); 1343*7d1f88ecSEric W. Biederman int ip_vs_protocol_net_init(struct netns_ipvs *ipvs); 1344b5dd212cSEric W. Biederman int ip_vs_app_net_init(struct netns_ipvs *ipvs); 13452f3edc6aSEric W. Biederman int ip_vs_conn_net_init(struct netns_ipvs *ipvs); 1346802cb437SEric W. Biederman int ip_vs_sync_net_init(struct netns_ipvs *ipvs); 13472f3edc6aSEric W. Biederman void ip_vs_conn_net_cleanup(struct netns_ipvs *ipvs); 1348b5dd212cSEric W. Biederman void ip_vs_app_net_cleanup(struct netns_ipvs *ipvs); 1349*7d1f88ecSEric W. 
/* Per-netns cleanup prototypes; each takes the netns_ipvs to clean up. */
void ip_vs_protocol_net_cleanup(struct netns_ipvs *ipvs);
void ip_vs_control_net_cleanup(struct netns_ipvs *ipvs);
void ip_vs_estimator_net_cleanup(struct netns_ipvs *ipvs);
void ip_vs_sync_net_cleanup(struct netns_ipvs *ipvs);
void ip_vs_service_net_cleanup(struct netns_ipvs *ipvs);

/* IPVS application functions
 * (from ip_vs_app.c)
 */
#define IP_VS_APP_MAX_PORTS	8

struct ip_vs_app *register_ip_vs_app(struct netns_ipvs *ipvs,
				     struct ip_vs_app *app);
void unregister_ip_vs_app(struct netns_ipvs *ipvs, struct ip_vs_app *app);
int ip_vs_bind_app(struct ip_vs_conn *cp, struct ip_vs_protocol *pp);
void ip_vs_unbind_app(struct ip_vs_conn *cp);
int register_ip_vs_app_inc(struct netns_ipvs *ipvs, struct ip_vs_app *app,
			   __u16 proto, __u16 port);
int ip_vs_app_inc_get(struct ip_vs_app *inc);
void ip_vs_app_inc_put(struct ip_vs_app *inc);

int ip_vs_app_pkt_out(struct ip_vs_conn *cp, struct sk_buff *skb);
int ip_vs_app_pkt_in(struct ip_vs_conn *cp, struct sk_buff *skb);

int register_ip_vs_pe(struct ip_vs_pe *pe);
int unregister_ip_vs_pe(struct ip_vs_pe *pe);
struct ip_vs_pe *ip_vs_pe_getbyname(const char *name);
struct ip_vs_pe *__ip_vs_pe_getbyname(const char *pe_name);

/* Take (ip_vs_pe_get) or drop (ip_vs_pe_put) a reference on @pe's module.
 *
 * Use a #define to avoid all of module.h just for these trivial ops.
 * A NULL @pe, or a @pe whose module pointer is NULL, is a no-op.
 *
 * Each macro expands to one do { } while (0) statement, so it behaves
 * like a function call inside unbraced if/else bodies, and the argument
 * is parenthesised so any pointer expression can be passed.  The caller
 * writes the terminating semicolon.  @pe is evaluated more than once:
 * do not pass an expression with side effects.
 */
#define ip_vs_pe_get(pe)					\
	do {							\
		if ((pe) && (pe)->module)			\
			__module_get((pe)->module);		\
	} while (0)

#define ip_vs_pe_put(pe)					\
	do {							\
		if ((pe) && (pe)->module)			\
			module_put((pe)->module);		\
	} while (0)

/* IPVS protocol functions (from ip_vs_proto.c) */
int ip_vs_protocol_init(void);
void ip_vs_protocol_cleanup(void);
void ip_vs_protocol_timeout_change(struct netns_ipvs *ipvs, int flags);
int *ip_vs_create_timeout_table(int *table, int size);
int ip_vs_set_state_timeout(int *table, int num, const char *const *names,
			    const char *name, int to);
void ip_vs_tcpudp_debug_packet(int af, struct ip_vs_protocol *pp,
			       const struct sk_buff *skb, int offset,
			       const char *msg);

extern struct ip_vs_protocol ip_vs_protocol_tcp;
extern struct ip_vs_protocol ip_vs_protocol_udp;
extern struct ip_vs_protocol ip_vs_protocol_icmp;
extern struct ip_vs_protocol ip_vs_protocol_esp;
extern struct ip_vs_protocol ip_vs_protocol_ah;
extern struct ip_vs_protocol ip_vs_protocol_sctp;

/* Registering/unregistering scheduler functions
 * (from ip_vs_sched.c)
 */
int register_ip_vs_scheduler(struct ip_vs_scheduler *scheduler);
int unregister_ip_vs_scheduler(struct ip_vs_scheduler *scheduler);
int ip_vs_bind_scheduler(struct ip_vs_service *svc,
			 struct ip_vs_scheduler *scheduler);
void ip_vs_unbind_scheduler(struct ip_vs_service *svc,
			    struct ip_vs_scheduler *sched);
struct ip_vs_scheduler *ip_vs_scheduler_get(const char *sched_name);
void ip_vs_scheduler_put(struct ip_vs_scheduler *scheduler);
struct ip_vs_conn *
ip_vs_schedule(struct ip_vs_service *svc, struct sk_buff *skb,
	       struct ip_vs_proto_data *pd, int *ignored,
	       struct ip_vs_iphdr *iph);
int ip_vs_leave(struct ip_vs_service *svc, struct sk_buff *skb,
		struct ip_vs_proto_data *pd, struct ip_vs_iphdr *iph);

void ip_vs_scheduler_err(struct ip_vs_service *svc, const char *msg);
142307dcc686SSimon Horman /* IPVS control data and functions (from ip_vs_ctl.c) */ 14241da177e4SLinus Torvalds extern struct ip_vs_stats ip_vs_stats; 1425b880c1f0SHans Schillstrom extern int sysctl_ip_vs_sync_ver; 14261da177e4SLinus Torvalds 14275c3a0fd7SJoe Perches struct ip_vs_service * 14280a4fd6ceSEric W. Biederman ip_vs_service_find(struct netns_ipvs *ipvs, int af, __u32 fwmark, __u16 protocol, 14293c2e0505SJulius Volz const union nf_inet_addr *vaddr, __be16 vport); 14301da177e4SLinus Torvalds 143148aed1b0SEric W. Biederman bool ip_vs_has_real_service(struct netns_ipvs *ipvs, int af, __u16 protocol, 14327937df15SJulius Volz const union nf_inet_addr *daddr, __be16 dport); 14337937df15SJulius Volz 14345c3a0fd7SJoe Perches int ip_vs_use_count_inc(void); 14355c3a0fd7SJoe Perches void ip_vs_use_count_dec(void); 14365c3a0fd7SJoe Perches int ip_vs_register_nl_ioctl(void); 14375c3a0fd7SJoe Perches void ip_vs_unregister_nl_ioctl(void); 14385c3a0fd7SJoe Perches int ip_vs_control_init(void); 14395c3a0fd7SJoe Perches void ip_vs_control_cleanup(void); 14405c3a0fd7SJoe Perches struct ip_vs_dest * 1441dc2add6fSEric W. 
Biederman ip_vs_find_dest(struct netns_ipvs *ipvs, int svc_af, int dest_af, 1442655eef10SAlex Gartrell const union nf_inet_addr *daddr, __be16 dport, 1443655eef10SAlex Gartrell const union nf_inet_addr *vaddr, __be16 vport, 144452793dbeSJulian Anastasov __u16 protocol, __u32 fwmark, __u32 flags); 14455c3a0fd7SJoe Perches void ip_vs_try_bind_dest(struct ip_vs_conn *cp); 14461da177e4SLinus Torvalds 1447fca9c20aSJulian Anastasov static inline void ip_vs_dest_hold(struct ip_vs_dest *dest) 1448fca9c20aSJulian Anastasov { 1449fca9c20aSJulian Anastasov atomic_inc(&dest->refcnt); 1450fca9c20aSJulian Anastasov } 1451fca9c20aSJulian Anastasov 1452fca9c20aSJulian Anastasov static inline void ip_vs_dest_put(struct ip_vs_dest *dest) 1453fca9c20aSJulian Anastasov { 14544e857c58SPeter Zijlstra smp_mb__before_atomic(); 1455fca9c20aSJulian Anastasov atomic_dec(&dest->refcnt); 1456fca9c20aSJulian Anastasov } 14571da177e4SLinus Torvalds 14589e4e948aSJulian Anastasov static inline void ip_vs_dest_put_and_free(struct ip_vs_dest *dest) 14599e4e948aSJulian Anastasov { 14609e4e948aSJulian Anastasov if (atomic_dec_return(&dest->refcnt) < 0) 14619e4e948aSJulian Anastasov kfree(dest); 14629e4e948aSJulian Anastasov } 14639e4e948aSJulian Anastasov 146407dcc686SSimon Horman /* IPVS sync daemon data and function prototypes 14651da177e4SLinus Torvalds * (from ip_vs_sync.c) 14661da177e4SLinus Torvalds */ 14676ac121d7SEric W. Biederman int start_sync_thread(struct netns_ipvs *ipvs, struct ipvs_sync_daemon_cfg *cfg, 1468e4ff6751SJulian Anastasov int state); 1469b3cf3cbfSEric W. Biederman int stop_sync_thread(struct netns_ipvs *ipvs, int state); 1470b61a8c1aSEric W. Biederman void ip_vs_sync_conn(struct netns_ipvs *ipvs, struct ip_vs_conn *cp, int pkts); 14711da177e4SLinus Torvalds 147207dcc686SSimon Horman /* IPVS rate estimator prototypes (from ip_vs_est.c) */ 14730f34d54bSEric W. Biederman void ip_vs_start_estimator(struct netns_ipvs *ipvs, struct ip_vs_stats *stats); 14740f34d54bSEric W. 
Biederman void ip_vs_stop_estimator(struct netns_ipvs *ipvs, struct ip_vs_stats *stats); 14755c3a0fd7SJoe Perches void ip_vs_zero_estimator(struct ip_vs_stats *stats); 1476cd67cd5eSJulian Anastasov void ip_vs_read_estimator(struct ip_vs_kstats *dst, struct ip_vs_stats *stats); 14771da177e4SLinus Torvalds 147807dcc686SSimon Horman /* Various IPVS packet transmitters (from ip_vs_xmit.c) */ 14795c3a0fd7SJoe Perches int ip_vs_null_xmit(struct sk_buff *skb, struct ip_vs_conn *cp, 1480d4383f04SJesper Dangaard Brouer struct ip_vs_protocol *pp, struct ip_vs_iphdr *iph); 14815c3a0fd7SJoe Perches int ip_vs_bypass_xmit(struct sk_buff *skb, struct ip_vs_conn *cp, 1482d4383f04SJesper Dangaard Brouer struct ip_vs_protocol *pp, struct ip_vs_iphdr *iph); 14835c3a0fd7SJoe Perches int ip_vs_nat_xmit(struct sk_buff *skb, struct ip_vs_conn *cp, 1484d4383f04SJesper Dangaard Brouer struct ip_vs_protocol *pp, struct ip_vs_iphdr *iph); 14855c3a0fd7SJoe Perches int ip_vs_tunnel_xmit(struct sk_buff *skb, struct ip_vs_conn *cp, 14865c3a0fd7SJoe Perches struct ip_vs_protocol *pp, struct ip_vs_iphdr *iph); 14875c3a0fd7SJoe Perches int ip_vs_dr_xmit(struct sk_buff *skb, struct ip_vs_conn *cp, 14885c3a0fd7SJoe Perches struct ip_vs_protocol *pp, struct ip_vs_iphdr *iph); 14895c3a0fd7SJoe Perches int ip_vs_icmp_xmit(struct sk_buff *skb, struct ip_vs_conn *cp, 1490d4383f04SJesper Dangaard Brouer struct ip_vs_protocol *pp, int offset, 1491d4383f04SJesper Dangaard Brouer unsigned int hooknum, struct ip_vs_iphdr *iph); 14925c3a0fd7SJoe Perches void ip_vs_dest_dst_rcu_free(struct rcu_head *head); 14931da177e4SLinus Torvalds 1494b3cdd2a7SJulius Volz #ifdef CONFIG_IP_VS_IPV6 14955c3a0fd7SJoe Perches int ip_vs_bypass_xmit_v6(struct sk_buff *skb, struct ip_vs_conn *cp, 1496d4383f04SJesper Dangaard Brouer struct ip_vs_protocol *pp, struct ip_vs_iphdr *iph); 14975c3a0fd7SJoe Perches int ip_vs_nat_xmit_v6(struct sk_buff *skb, struct ip_vs_conn *cp, 14985c3a0fd7SJoe Perches struct ip_vs_protocol *pp, struct 
ip_vs_iphdr *iph); 14995c3a0fd7SJoe Perches int ip_vs_tunnel_xmit_v6(struct sk_buff *skb, struct ip_vs_conn *cp, 15005c3a0fd7SJoe Perches struct ip_vs_protocol *pp, struct ip_vs_iphdr *iph); 15015c3a0fd7SJoe Perches int ip_vs_dr_xmit_v6(struct sk_buff *skb, struct ip_vs_conn *cp, 15025c3a0fd7SJoe Perches struct ip_vs_protocol *pp, struct ip_vs_iphdr *iph); 15035c3a0fd7SJoe Perches int ip_vs_icmp_xmit_v6(struct sk_buff *skb, struct ip_vs_conn *cp, 1504d4383f04SJesper Dangaard Brouer struct ip_vs_protocol *pp, int offset, 1505d4383f04SJesper Dangaard Brouer unsigned int hooknum, struct ip_vs_iphdr *iph); 1506b3cdd2a7SJulius Volz #endif 15071da177e4SLinus Torvalds 15083a1bbf18SSimon Horman #ifdef CONFIG_SYSCTL 150907dcc686SSimon Horman /* This is a simple mechanism to ignore packets when 15101da177e4SLinus Torvalds * we are loaded. Just set ip_vs_drop_rate to 'n' and 15111da177e4SLinus Torvalds * we start to drop 1/rate of the packets 15121da177e4SLinus Torvalds */ 1513a0840e2eSHans Schillstrom static inline int ip_vs_todrop(struct netns_ipvs *ipvs) 15141da177e4SLinus Torvalds { 1515a0840e2eSHans Schillstrom if (!ipvs->drop_rate) 1516a0840e2eSHans Schillstrom return 0; 1517a0840e2eSHans Schillstrom if (--ipvs->drop_counter > 0) 1518a0840e2eSHans Schillstrom return 0; 1519a0840e2eSHans Schillstrom ipvs->drop_counter = ipvs->drop_rate; 15201da177e4SLinus Torvalds return 1; 15211da177e4SLinus Torvalds } 15223a1bbf18SSimon Horman #else 15233a1bbf18SSimon Horman static inline int ip_vs_todrop(struct netns_ipvs *ipvs) { return 0; } 15243a1bbf18SSimon Horman #endif 15251da177e4SLinus Torvalds 152607dcc686SSimon Horman /* ip_vs_fwd_tag returns the forwarding tag of the connection */ 15271da177e4SLinus Torvalds #define IP_VS_FWD_METHOD(cp) (cp->flags & IP_VS_CONN_F_FWD_MASK) 15281da177e4SLinus Torvalds 1529732db659SAdrian Bunk static inline char ip_vs_fwd_tag(struct ip_vs_conn *cp) 15301da177e4SLinus Torvalds { 15311da177e4SLinus Torvalds char fwd; 15321da177e4SLinus Torvalds 
15331da177e4SLinus Torvalds switch (IP_VS_FWD_METHOD(cp)) { 15341da177e4SLinus Torvalds case IP_VS_CONN_F_MASQ: 15351da177e4SLinus Torvalds fwd = 'M'; break; 15361da177e4SLinus Torvalds case IP_VS_CONN_F_LOCALNODE: 15371da177e4SLinus Torvalds fwd = 'L'; break; 15381da177e4SLinus Torvalds case IP_VS_CONN_F_TUNNEL: 15391da177e4SLinus Torvalds fwd = 'T'; break; 15401da177e4SLinus Torvalds case IP_VS_CONN_F_DROUTE: 15411da177e4SLinus Torvalds fwd = 'R'; break; 15421da177e4SLinus Torvalds case IP_VS_CONN_F_BYPASS: 15431da177e4SLinus Torvalds fwd = 'B'; break; 15441da177e4SLinus Torvalds default: 15451da177e4SLinus Torvalds fwd = '?'; break; 15461da177e4SLinus Torvalds } 15471da177e4SLinus Torvalds return fwd; 15481da177e4SLinus Torvalds } 15491da177e4SLinus Torvalds 15505c3a0fd7SJoe Perches void ip_vs_nat_icmp(struct sk_buff *skb, struct ip_vs_protocol *pp, 15511da177e4SLinus Torvalds struct ip_vs_conn *cp, int dir); 15521da177e4SLinus Torvalds 1553b3cdd2a7SJulius Volz #ifdef CONFIG_IP_VS_IPV6 15545c3a0fd7SJoe Perches void ip_vs_nat_icmp_v6(struct sk_buff *skb, struct ip_vs_protocol *pp, 1555b3cdd2a7SJulius Volz struct ip_vs_conn *cp, int dir); 1556b3cdd2a7SJulius Volz #endif 1557b3cdd2a7SJulius Volz 15585c3a0fd7SJoe Perches __sum16 ip_vs_checksum_complete(struct sk_buff *skb, int offset); 15591da177e4SLinus Torvalds 1560f9214b26SAl Viro static inline __wsum ip_vs_check_diff4(__be32 old, __be32 new, __wsum oldsum) 15611da177e4SLinus Torvalds { 1562f9214b26SAl Viro __be32 diff[2] = { ~old, new }; 15631da177e4SLinus Torvalds 156407f0757aSJoe Perches return csum_partial(diff, sizeof(diff), oldsum); 1565f9214b26SAl Viro } 1566f9214b26SAl Viro 15670bbdd42bSJulius Volz #ifdef CONFIG_IP_VS_IPV6 15680bbdd42bSJulius Volz static inline __wsum ip_vs_check_diff16(const __be32 *old, const __be32 *new, 15690bbdd42bSJulius Volz __wsum oldsum) 15700bbdd42bSJulius Volz { 15710bbdd42bSJulius Volz __be32 diff[8] = { ~old[3], ~old[2], ~old[1], ~old[0], 15720bbdd42bSJulius Volz new[3], 
new[2], new[1], new[0] }; 15730bbdd42bSJulius Volz 157407f0757aSJoe Perches return csum_partial(diff, sizeof(diff), oldsum); 15750bbdd42bSJulius Volz } 15760bbdd42bSJulius Volz #endif 15770bbdd42bSJulius Volz 1578f9214b26SAl Viro static inline __wsum ip_vs_check_diff2(__be16 old, __be16 new, __wsum oldsum) 1579f9214b26SAl Viro { 1580f9214b26SAl Viro __be16 diff[2] = { ~old, new }; 1581f9214b26SAl Viro 158207f0757aSJoe Perches return csum_partial(diff, sizeof(diff), oldsum); 15831da177e4SLinus Torvalds } 15841da177e4SLinus Torvalds 158507dcc686SSimon Horman /* Forget current conntrack (unconfirmed) and attach notrack entry */ 1586cf356d69SJulian Anastasov static inline void ip_vs_notrack(struct sk_buff *skb) 1587cf356d69SJulian Anastasov { 1588cf356d69SJulian Anastasov #if defined(CONFIG_NF_CONNTRACK) || defined(CONFIG_NF_CONNTRACK_MODULE) 1589cf356d69SJulian Anastasov enum ip_conntrack_info ctinfo; 159006b69390SJesper Juhl struct nf_conn *ct = nf_ct_get(skb, &ctinfo); 1591cf356d69SJulian Anastasov 1592cf356d69SJulian Anastasov if (!ct || !nf_ct_is_untracked(ct)) { 15939e33ce45SLin Ming nf_conntrack_put(skb->nfct); 1594cf356d69SJulian Anastasov skb->nfct = &nf_ct_untracked_get()->ct_general; 1595cf356d69SJulian Anastasov skb->nfctinfo = IP_CT_NEW; 1596cf356d69SJulian Anastasov nf_conntrack_get(skb->nfct); 1597cf356d69SJulian Anastasov } 1598cf356d69SJulian Anastasov #endif 1599cf356d69SJulian Anastasov } 1600cf356d69SJulian Anastasov 1601f4bc17cdSJulian Anastasov #ifdef CONFIG_IP_VS_NFCT 160207dcc686SSimon Horman /* Netfilter connection tracking 1603f4bc17cdSJulian Anastasov * (from ip_vs_nfct.c) 1604f4bc17cdSJulian Anastasov */ 1605a0840e2eSHans Schillstrom static inline int ip_vs_conntrack_enabled(struct netns_ipvs *ipvs) 1606f4bc17cdSJulian Anastasov { 1607a4e2f5a7SSimon Horman #ifdef CONFIG_SYSCTL 1608a0840e2eSHans Schillstrom return ipvs->sysctl_conntrack; 1609a4e2f5a7SSimon Horman #else 1610a4e2f5a7SSimon Horman return 0; 1611a4e2f5a7SSimon Horman #endif 
1612f4bc17cdSJulian Anastasov } 1613f4bc17cdSJulian Anastasov 16145c3a0fd7SJoe Perches void ip_vs_update_conntrack(struct sk_buff *skb, struct ip_vs_conn *cp, 16156523ce15SJulian Anastasov int outin); 16165c3a0fd7SJoe Perches int ip_vs_confirm_conntrack(struct sk_buff *skb); 16175c3a0fd7SJoe Perches void ip_vs_nfct_expect_related(struct sk_buff *skb, struct nf_conn *ct, 1618f4bc17cdSJulian Anastasov struct ip_vs_conn *cp, u_int8_t proto, 1619f4bc17cdSJulian Anastasov const __be16 port, int from_rs); 16205c3a0fd7SJoe Perches void ip_vs_conn_drop_conntrack(struct ip_vs_conn *cp); 1621f4bc17cdSJulian Anastasov 1622f4bc17cdSJulian Anastasov #else 1623f4bc17cdSJulian Anastasov 1624a0840e2eSHans Schillstrom static inline int ip_vs_conntrack_enabled(struct netns_ipvs *ipvs) 1625f4bc17cdSJulian Anastasov { 1626f4bc17cdSJulian Anastasov return 0; 1627f4bc17cdSJulian Anastasov } 1628f4bc17cdSJulian Anastasov 1629f4bc17cdSJulian Anastasov static inline void ip_vs_update_conntrack(struct sk_buff *skb, 1630f4bc17cdSJulian Anastasov struct ip_vs_conn *cp, int outin) 1631f4bc17cdSJulian Anastasov { 1632f4bc17cdSJulian Anastasov } 1633f4bc17cdSJulian Anastasov 1634e23ebf0fSKrzysztof Wilczynski static inline int ip_vs_confirm_conntrack(struct sk_buff *skb) 1635f4bc17cdSJulian Anastasov { 1636f4bc17cdSJulian Anastasov return NF_ACCEPT; 1637f4bc17cdSJulian Anastasov } 1638f4bc17cdSJulian Anastasov 1639f4bc17cdSJulian Anastasov static inline void ip_vs_conn_drop_conntrack(struct ip_vs_conn *cp) 1640f4bc17cdSJulian Anastasov { 1641f4bc17cdSJulian Anastasov } 164207dcc686SSimon Horman #endif /* CONFIG_IP_VS_NFCT */ 16436523ce15SJulian Anastasov 1644c16526a7SSimon Kirby static inline int 1645b552f7e3SChangli Gao ip_vs_dest_conn_overhead(struct ip_vs_dest *dest) 1646b552f7e3SChangli Gao { 164707dcc686SSimon Horman /* We think the overhead of processing active connections is 256 1648b552f7e3SChangli Gao * times higher than that of inactive connections in average. 
(This 1649b552f7e3SChangli Gao * 256 times might not be accurate, we will change it later) We 1650b552f7e3SChangli Gao * use the following formula to estimate the overhead now: 1651b552f7e3SChangli Gao * dest->activeconns*256 + dest->inactconns 1652b552f7e3SChangli Gao */ 1653b552f7e3SChangli Gao return (atomic_read(&dest->activeconns) << 8) + 1654b552f7e3SChangli Gao atomic_read(&dest->inactconns); 1655b552f7e3SChangli Gao } 1656b552f7e3SChangli Gao 1657bc4768ebSJulius Volz #endif /* _NET_IP_VS_H */ 1658