11da177e4SLinus Torvalds /* 21da177e4SLinus Torvalds * IP Virtual Server 31da177e4SLinus Torvalds * data structure and functionality definitions 41da177e4SLinus Torvalds */ 51da177e4SLinus Torvalds 6bc4768ebSJulius Volz #ifndef _NET_IP_VS_H 7bc4768ebSJulius Volz #define _NET_IP_VS_H 81da177e4SLinus Torvalds 9bc4768ebSJulius Volz #include <linux/ip_vs.h> /* definitions shared with userland */ 101da177e4SLinus Torvalds 11bc4768ebSJulius Volz #include <asm/types.h> /* for __uXX types */ 12bc4768ebSJulius Volz 131da177e4SLinus Torvalds #include <linux/list.h> /* for struct list_head */ 141da177e4SLinus Torvalds #include <linux/spinlock.h> /* for struct rwlock_t */ 1560063497SArun Sharma #include <linux/atomic.h> /* for struct atomic_t */ 161da177e4SLinus Torvalds #include <linux/compiler.h> 1714c85021SArnaldo Carvalho de Melo #include <linux/timer.h> 18187f1882SPaul Gortmaker #include <linux/bug.h> 191da177e4SLinus Torvalds 2014c85021SArnaldo Carvalho de Melo #include <net/checksum.h> 21e7ade46aSJulius Volz #include <linux/netfilter.h> /* for union nf_inet_addr */ 221668e010SKOVACS Krisztian #include <linux/ip.h> 23e7ade46aSJulius Volz #include <linux/ipv6.h> /* for struct ipv6hdr */ 244e3fd7a0SAlexey Dobriyan #include <net/ipv6.h> 2554d83efaSJesper Dangaard Brouer #if IS_ENABLED(CONFIG_IP_VS_IPV6) 2663dca2c0SJesper Dangaard Brouer #include <linux/netfilter_ipv6/ip6_tables.h> 2763dca2c0SJesper Dangaard Brouer #endif 28a638e514SJesper Dangaard Brouer #if IS_ENABLED(CONFIG_NF_CONNTRACK) 29f4bc17cdSJulian Anastasov #include <net/netfilter/nf_conntrack.h> 30f4bc17cdSJulian Anastasov #endif 3161b1ab45SHans Schillstrom #include <net/net_namespace.h> /* Netw namespace */ 3261b1ab45SHans Schillstrom 3361b1ab45SHans Schillstrom /* 3461b1ab45SHans Schillstrom * Generic access of ipvs struct 3561b1ab45SHans Schillstrom */ 3661b1ab45SHans Schillstrom static inline struct netns_ipvs *net_ipvs(struct net* net) 3761b1ab45SHans Schillstrom { 3861b1ab45SHans Schillstrom return net->ipvs; 3961b1ab45SHans Schillstrom } 40fc723250SHans Schillstrom /* 41fc723250SHans Schillstrom * Get net ptr from skb in traffic cases 42fc723250SHans Schillstrom * use skb_sknet when call is from userland (ioctl or netlink) 43fc723250SHans Schillstrom */ 44a0840e2eSHans Schillstrom static inline struct net *skb_net(const struct sk_buff *skb) 45fc723250SHans Schillstrom { 46fc723250SHans Schillstrom #ifdef CONFIG_NET_NS 47fc723250SHans Schillstrom #ifdef CONFIG_IP_VS_DEBUG 48fc723250SHans Schillstrom /* 49fc723250SHans Schillstrom * This is used for debug only. 50fc723250SHans Schillstrom * Start with the most likely hit 51fc723250SHans Schillstrom * End with BUG 52fc723250SHans Schillstrom */ 53fc723250SHans Schillstrom if (likely(skb->dev && skb->dev->nd_net)) 54fc723250SHans Schillstrom return dev_net(skb->dev); 55a09d1977SHans Schillstrom if (skb_dst(skb) && skb_dst(skb)->dev) 56fc723250SHans Schillstrom return dev_net(skb_dst(skb)->dev); 57fc723250SHans Schillstrom WARN(skb->sk, "Maybe skb_sknet should be used in %s() at line:%d\n", 58fc723250SHans Schillstrom __func__, __LINE__); 59fc723250SHans Schillstrom if (likely(skb->sk && skb->sk->sk_net)) 60fc723250SHans Schillstrom return sock_net(skb->sk); 61fc723250SHans Schillstrom pr_err("There is no net ptr to find in the skb in %s() line:%d\n", 62fc723250SHans Schillstrom __func__, __LINE__); 63fc723250SHans Schillstrom BUG(); 64fc723250SHans Schillstrom #else 65fc723250SHans Schillstrom return dev_net(skb->dev ? : skb_dst(skb)->dev); 66fc723250SHans Schillstrom #endif 67fc723250SHans Schillstrom #else 68fc723250SHans Schillstrom return &init_net; 69fc723250SHans Schillstrom #endif 70fc723250SHans Schillstrom } 71fc723250SHans Schillstrom 72a0840e2eSHans Schillstrom static inline struct net *skb_sknet(const struct sk_buff *skb) 73fc723250SHans Schillstrom { 74fc723250SHans Schillstrom #ifdef CONFIG_NET_NS 75fc723250SHans Schillstrom #ifdef CONFIG_IP_VS_DEBUG 76fc723250SHans Schillstrom /* Start with the most likely hit */ 77fc723250SHans Schillstrom if (likely(skb->sk && skb->sk->sk_net)) 78fc723250SHans Schillstrom return sock_net(skb->sk); 79fc723250SHans Schillstrom WARN(skb->dev, "Maybe skb_net should be used instead in %s() line:%d\n", 80fc723250SHans Schillstrom __func__, __LINE__); 81fc723250SHans Schillstrom if (likely(skb->dev && skb->dev->nd_net)) 82fc723250SHans Schillstrom return dev_net(skb->dev); 83fc723250SHans Schillstrom pr_err("There is no net ptr to find in the skb in %s() line:%d\n", 84fc723250SHans Schillstrom __func__, __LINE__); 85fc723250SHans Schillstrom BUG(); 86fc723250SHans Schillstrom #else 87fc723250SHans Schillstrom return sock_net(skb->sk); 88fc723250SHans Schillstrom #endif 89fc723250SHans Schillstrom #else 90fc723250SHans Schillstrom return &init_net; 91fc723250SHans Schillstrom #endif 92fc723250SHans Schillstrom } 93b17fc996SHans Schillstrom /* 94b17fc996SHans Schillstrom * This one needed for single_open_net since net is stored directly in 9525985edcSLucas De Marchi * private not as a struct i.e. seq_file_net can't be used. 96b17fc996SHans Schillstrom */ 97b17fc996SHans Schillstrom static inline struct net *seq_file_single_net(struct seq_file *seq) 98b17fc996SHans Schillstrom { 99b17fc996SHans Schillstrom #ifdef CONFIG_NET_NS 100b17fc996SHans Schillstrom return (struct net *)seq->private; 101b17fc996SHans Schillstrom #else 102b17fc996SHans Schillstrom return &init_net; 103b17fc996SHans Schillstrom #endif 104b17fc996SHans Schillstrom } 1056f7edb48SCatalin(ux) M. BOIE 1066f7edb48SCatalin(ux) M. BOIE /* Connections' size value needed by ip_vs_ctl.c */ 1076f7edb48SCatalin(ux) M. BOIE extern int ip_vs_conn_tab_size; 1086f7edb48SCatalin(ux) M. BOIE 10964aae3cbSJulius Volz struct ip_vs_iphdr { 11063dca2c0SJesper Dangaard Brouer __u32 len; /* IPv4 simply where L4 starts 11163dca2c0SJesper Dangaard Brouer IPv6 where L4 Transport Header starts */ 1122f74713dSJesper Dangaard Brouer __u32 thoff_reasm; /* Transport Header Offset in nfct_reasm skb */ 11363dca2c0SJesper Dangaard Brouer __u16 fragoffs; /* IPv6 fragment offset, 0 if first frag (or not frag)*/ 11463dca2c0SJesper Dangaard Brouer __s16 protocol; 11563dca2c0SJesper Dangaard Brouer __s32 flags; 11664aae3cbSJulius Volz union nf_inet_addr saddr; 11764aae3cbSJulius Volz union nf_inet_addr daddr; 11864aae3cbSJulius Volz }; 11964aae3cbSJulius Volz 1202f74713dSJesper Dangaard Brouer /* Dependency to module: nf_defrag_ipv6 */ 1212f74713dSJesper Dangaard Brouer #if defined(CONFIG_NF_DEFRAG_IPV6) || defined(CONFIG_NF_DEFRAG_IPV6_MODULE) 1222f74713dSJesper Dangaard Brouer static inline struct sk_buff *skb_nfct_reasm(const struct sk_buff *skb) 1232f74713dSJesper Dangaard Brouer { 1242f74713dSJesper Dangaard Brouer return skb->nfct_reasm; 1252f74713dSJesper Dangaard Brouer } 1262f74713dSJesper Dangaard Brouer static inline void *frag_safe_skb_hp(const struct sk_buff *skb, int offset, 1272f74713dSJesper Dangaard Brouer int len, void *buffer, 1282f74713dSJesper Dangaard Brouer const struct ip_vs_iphdr *ipvsh) 1292f74713dSJesper Dangaard Brouer { 1302f74713dSJesper Dangaard Brouer if (unlikely(ipvsh->fragoffs && skb_nfct_reasm(skb))) 1312f74713dSJesper Dangaard Brouer return skb_header_pointer(skb_nfct_reasm(skb), 1322f74713dSJesper Dangaard Brouer ipvsh->thoff_reasm, len, buffer); 1332f74713dSJesper Dangaard Brouer 1342f74713dSJesper Dangaard Brouer return skb_header_pointer(skb, offset, len, buffer); 1352f74713dSJesper Dangaard Brouer } 1362f74713dSJesper Dangaard Brouer #else 1372f74713dSJesper Dangaard Brouer static inline struct sk_buff *skb_nfct_reasm(const struct sk_buff *skb) 1382f74713dSJesper Dangaard Brouer { 1392f74713dSJesper Dangaard Brouer return NULL; 1402f74713dSJesper Dangaard Brouer } 1412f74713dSJesper Dangaard Brouer static inline void *frag_safe_skb_hp(const struct sk_buff *skb, int offset, 1422f74713dSJesper Dangaard Brouer int len, void *buffer, 1432f74713dSJesper Dangaard Brouer const struct ip_vs_iphdr *ipvsh) 1442f74713dSJesper Dangaard Brouer { 1452f74713dSJesper Dangaard Brouer return skb_header_pointer(skb, offset, len, buffer); 1462f74713dSJesper Dangaard Brouer } 1472f74713dSJesper Dangaard Brouer #endif 1482f74713dSJesper Dangaard Brouer 14964aae3cbSJulius Volz static inline void 15063dca2c0SJesper Dangaard Brouer ip_vs_fill_ip4hdr(const void *nh, struct ip_vs_iphdr *iphdr) 15163dca2c0SJesper Dangaard Brouer { 15263dca2c0SJesper Dangaard Brouer const struct iphdr *iph = nh; 15363dca2c0SJesper Dangaard Brouer 15463dca2c0SJesper Dangaard Brouer iphdr->len = iph->ihl * 4; 15563dca2c0SJesper Dangaard Brouer iphdr->fragoffs = 0; 15663dca2c0SJesper Dangaard Brouer iphdr->protocol = iph->protocol; 15763dca2c0SJesper Dangaard Brouer iphdr->saddr.ip = iph->saddr; 15863dca2c0SJesper Dangaard Brouer iphdr->daddr.ip = iph->daddr; 15963dca2c0SJesper Dangaard Brouer } 16063dca2c0SJesper Dangaard Brouer 16163dca2c0SJesper Dangaard Brouer /* This function handles filling *ip_vs_iphdr, both for IPv4 and IPv6. 16263dca2c0SJesper Dangaard Brouer * IPv6 requires some extra work, as finding proper header position, 16363dca2c0SJesper Dangaard Brouer * depend on the IPv6 extension headers. 16463dca2c0SJesper Dangaard Brouer */ 16563dca2c0SJesper Dangaard Brouer static inline void 16663dca2c0SJesper Dangaard Brouer ip_vs_fill_iph_skb(int af, const struct sk_buff *skb, struct ip_vs_iphdr *iphdr) 16764aae3cbSJulius Volz { 16864aae3cbSJulius Volz #ifdef CONFIG_IP_VS_IPV6 16964aae3cbSJulius Volz if (af == AF_INET6) { 17063dca2c0SJesper Dangaard Brouer const struct ipv6hdr *iph = 17163dca2c0SJesper Dangaard Brouer (struct ipv6hdr *)skb_network_header(skb); 1724e3fd7a0SAlexey Dobriyan iphdr->saddr.in6 = iph->saddr; 1734e3fd7a0SAlexey Dobriyan iphdr->daddr.in6 = iph->daddr; 1742f74713dSJesper Dangaard Brouer /* ipv6_find_hdr() updates len, flags, thoff_reasm */ 1752f74713dSJesper Dangaard Brouer iphdr->thoff_reasm = 0; 17663dca2c0SJesper Dangaard Brouer iphdr->len = 0; 17763dca2c0SJesper Dangaard Brouer iphdr->flags = 0; 17863dca2c0SJesper Dangaard Brouer iphdr->protocol = ipv6_find_hdr(skb, &iphdr->len, -1, 17963dca2c0SJesper Dangaard Brouer &iphdr->fragoffs, 18063dca2c0SJesper Dangaard Brouer &iphdr->flags); 1812f74713dSJesper Dangaard Brouer /* get proto from re-assembled packet and it's offset */ 1822f74713dSJesper Dangaard Brouer if (skb_nfct_reasm(skb)) 1832f74713dSJesper Dangaard Brouer iphdr->protocol = ipv6_find_hdr(skb_nfct_reasm(skb), 1842f74713dSJesper Dangaard Brouer &iphdr->thoff_reasm, 1852f74713dSJesper Dangaard Brouer -1, NULL, NULL); 1862f74713dSJesper Dangaard Brouer 18764aae3cbSJulius Volz } else 18864aae3cbSJulius Volz #endif 18964aae3cbSJulius Volz { 19063dca2c0SJesper Dangaard Brouer const struct iphdr *iph = 19163dca2c0SJesper Dangaard Brouer (struct iphdr *)skb_network_header(skb); 19264aae3cbSJulius Volz iphdr->len = iph->ihl * 4; 19363dca2c0SJesper Dangaard Brouer iphdr->fragoffs = 0; 19464aae3cbSJulius Volz iphdr->protocol = iph->protocol; 19564aae3cbSJulius Volz iphdr->saddr.ip = iph->saddr; 19664aae3cbSJulius Volz iphdr->daddr.ip = iph->daddr; 19764aae3cbSJulius Volz } 19864aae3cbSJulius Volz } 19964aae3cbSJulius Volz 20063dca2c0SJesper Dangaard Brouer /* This function is a faster version of ip_vs_fill_iph_skb(). 20163dca2c0SJesper Dangaard Brouer * Where we only populate {s,d}addr (and avoid calling ipv6_find_hdr()). 20263dca2c0SJesper Dangaard Brouer * This is used by the some of the ip_vs_*_schedule() functions. 20363dca2c0SJesper Dangaard Brouer * (Mostly done to avoid ABI breakage of external schedulers) 20463dca2c0SJesper Dangaard Brouer */ 20563dca2c0SJesper Dangaard Brouer static inline void 20663dca2c0SJesper Dangaard Brouer ip_vs_fill_iph_addr_only(int af, const struct sk_buff *skb, 20763dca2c0SJesper Dangaard Brouer struct ip_vs_iphdr *iphdr) 20863dca2c0SJesper Dangaard Brouer { 20963dca2c0SJesper Dangaard Brouer #ifdef CONFIG_IP_VS_IPV6 21063dca2c0SJesper Dangaard Brouer if (af == AF_INET6) { 21163dca2c0SJesper Dangaard Brouer const struct ipv6hdr *iph = 21263dca2c0SJesper Dangaard Brouer (struct ipv6hdr *)skb_network_header(skb); 21363dca2c0SJesper Dangaard Brouer iphdr->saddr.in6 = iph->saddr; 21463dca2c0SJesper Dangaard Brouer iphdr->daddr.in6 = iph->daddr; 21554d83efaSJesper Dangaard Brouer } else 21663dca2c0SJesper Dangaard Brouer #endif 21754d83efaSJesper Dangaard Brouer { 21863dca2c0SJesper Dangaard Brouer const struct iphdr *iph = 21963dca2c0SJesper Dangaard Brouer (struct iphdr *)skb_network_header(skb); 22063dca2c0SJesper Dangaard Brouer iphdr->saddr.ip = iph->saddr; 22163dca2c0SJesper Dangaard Brouer iphdr->daddr.ip = iph->daddr; 22263dca2c0SJesper Dangaard Brouer } 22363dca2c0SJesper Dangaard Brouer } 22463dca2c0SJesper Dangaard Brouer 22564aae3cbSJulius Volz static inline void ip_vs_addr_copy(int af, union nf_inet_addr *dst, 22664aae3cbSJulius Volz const union nf_inet_addr *src) 22764aae3cbSJulius Volz { 22864aae3cbSJulius Volz #ifdef CONFIG_IP_VS_IPV6 22964aae3cbSJulius Volz if (af == AF_INET6) 2304e3fd7a0SAlexey Dobriyan dst->in6 = src->in6; 23164aae3cbSJulius Volz else 23264aae3cbSJulius Volz #endif 23364aae3cbSJulius Volz dst->ip = src->ip; 23464aae3cbSJulius Volz } 23564aae3cbSJulius Volz 2369a05475cSJulian Anastasov static inline void ip_vs_addr_set(int af, union nf_inet_addr *dst, 2379a05475cSJulian Anastasov const union nf_inet_addr *src) 2389a05475cSJulian Anastasov { 2399a05475cSJulian Anastasov #ifdef CONFIG_IP_VS_IPV6 2409a05475cSJulian Anastasov if (af == AF_INET6) { 2419a05475cSJulian Anastasov dst->in6 = src->in6; 2429a05475cSJulian Anastasov return; 2439a05475cSJulian Anastasov } 2449a05475cSJulian Anastasov #endif 2459a05475cSJulian Anastasov dst->ip = src->ip; 2469a05475cSJulian Anastasov dst->all[1] = 0; 2479a05475cSJulian Anastasov dst->all[2] = 0; 2489a05475cSJulian Anastasov dst->all[3] = 0; 2499a05475cSJulian Anastasov } 2509a05475cSJulian Anastasov 25164aae3cbSJulius Volz static inline int ip_vs_addr_equal(int af, const union nf_inet_addr *a, 25264aae3cbSJulius Volz const union nf_inet_addr *b) 25364aae3cbSJulius Volz { 25464aae3cbSJulius Volz #ifdef CONFIG_IP_VS_IPV6 25564aae3cbSJulius Volz if (af == AF_INET6) 25664aae3cbSJulius Volz return ipv6_addr_equal(&a->in6, &b->in6); 25764aae3cbSJulius Volz #endif 25864aae3cbSJulius Volz return a->ip == b->ip; 25964aae3cbSJulius Volz } 26064aae3cbSJulius Volz 2611da177e4SLinus Torvalds #ifdef CONFIG_IP_VS_DEBUG 26214c85021SArnaldo Carvalho de Melo #include <linux/net.h> 26314c85021SArnaldo Carvalho de Melo 2641da177e4SLinus Torvalds extern int ip_vs_get_debug_level(void); 265c842a3adSJulius Volz 266c842a3adSJulius Volz static inline const char *ip_vs_dbg_addr(int af, char *buf, size_t buf_len, 267c842a3adSJulius Volz const union nf_inet_addr *addr, 268c842a3adSJulius Volz int *idx) 269c842a3adSJulius Volz { 270c842a3adSJulius Volz int len; 271c842a3adSJulius Volz #ifdef CONFIG_IP_VS_IPV6 272c842a3adSJulius Volz if (af == AF_INET6) 273120b9c14SJesper Dangaard Brouer len = snprintf(&buf[*idx], buf_len - *idx, "[%pI6c]", 2740c6ce78aSHarvey Harrison &addr->in6) + 1; 275c842a3adSJulius Volz else 276c842a3adSJulius Volz #endif 2773685f25dSHarvey Harrison len = snprintf(&buf[*idx], buf_len - *idx, "%pI4", 2783685f25dSHarvey Harrison &addr->ip) + 1; 279c842a3adSJulius Volz 280c842a3adSJulius Volz *idx += len; 281c842a3adSJulius Volz BUG_ON(*idx > buf_len + 1); 282c842a3adSJulius Volz return &buf[*idx - len]; 283c842a3adSJulius Volz } 284c842a3adSJulius Volz 2859aada7acSHannes Eder #define IP_VS_DBG_BUF(level, msg, ...) \ 286c842a3adSJulius Volz do { \ 287c842a3adSJulius Volz char ip_vs_dbg_buf[160]; \ 288c842a3adSJulius Volz int ip_vs_dbg_idx = 0; \ 289c842a3adSJulius Volz if (level <= ip_vs_get_debug_level()) \ 2909aada7acSHannes Eder printk(KERN_DEBUG pr_fmt(msg), ##__VA_ARGS__); \ 291c842a3adSJulius Volz } while (0) 292c842a3adSJulius Volz #define IP_VS_ERR_BUF(msg...) \ 293c842a3adSJulius Volz do { \ 294c842a3adSJulius Volz char ip_vs_dbg_buf[160]; \ 295c842a3adSJulius Volz int ip_vs_dbg_idx = 0; \ 2969aada7acSHannes Eder pr_err(msg); \ 297c842a3adSJulius Volz } while (0) 298c842a3adSJulius Volz 299c842a3adSJulius Volz /* Only use from within IP_VS_DBG_BUF() or IP_VS_ERR_BUF macros */ 300c842a3adSJulius Volz #define IP_VS_DBG_ADDR(af, addr) \ 301c842a3adSJulius Volz ip_vs_dbg_addr(af, ip_vs_dbg_buf, \ 302c842a3adSJulius Volz sizeof(ip_vs_dbg_buf), addr, \ 303c842a3adSJulius Volz &ip_vs_dbg_idx) 304c842a3adSJulius Volz 3059aada7acSHannes Eder #define IP_VS_DBG(level, msg, ...) \ 3061da177e4SLinus Torvalds do { \ 3071da177e4SLinus Torvalds if (level <= ip_vs_get_debug_level()) \ 3089aada7acSHannes Eder printk(KERN_DEBUG pr_fmt(msg), ##__VA_ARGS__); \ 3091da177e4SLinus Torvalds } while (0) 3109aada7acSHannes Eder #define IP_VS_DBG_RL(msg, ...) \ 3111da177e4SLinus Torvalds do { \ 3121da177e4SLinus Torvalds if (net_ratelimit()) \ 3139aada7acSHannes Eder printk(KERN_DEBUG pr_fmt(msg), ##__VA_ARGS__); \ 3141da177e4SLinus Torvalds } while (0) 3150d79641aSJulian Anastasov #define IP_VS_DBG_PKT(level, af, pp, skb, ofs, msg) \ 3161da177e4SLinus Torvalds do { \ 3171da177e4SLinus Torvalds if (level <= ip_vs_get_debug_level()) \ 3180d79641aSJulian Anastasov pp->debug_packet(af, pp, skb, ofs, msg); \ 3191da177e4SLinus Torvalds } while (0) 3200d79641aSJulian Anastasov #define IP_VS_DBG_RL_PKT(level, af, pp, skb, ofs, msg) \ 3211da177e4SLinus Torvalds do { \ 3221da177e4SLinus Torvalds if (level <= ip_vs_get_debug_level() && \ 3231da177e4SLinus Torvalds net_ratelimit()) \ 3240d79641aSJulian Anastasov pp->debug_packet(af, pp, skb, ofs, msg); \ 3251da177e4SLinus Torvalds } while (0) 3261da177e4SLinus Torvalds #else /* NO DEBUGGING at ALL */ 327c842a3adSJulius Volz #define IP_VS_DBG_BUF(level, msg...) do {} while (0) 328c842a3adSJulius Volz #define IP_VS_ERR_BUF(msg...) do {} while (0) 3291da177e4SLinus Torvalds #define IP_VS_DBG(level, msg...) do {} while (0) 3301da177e4SLinus Torvalds #define IP_VS_DBG_RL(msg...) do {} while (0) 3310d79641aSJulian Anastasov #define IP_VS_DBG_PKT(level, af, pp, skb, ofs, msg) do {} while (0) 3320d79641aSJulian Anastasov #define IP_VS_DBG_RL_PKT(level, af, pp, skb, ofs, msg) do {} while (0) 3331da177e4SLinus Torvalds #endif 3341da177e4SLinus Torvalds 3351da177e4SLinus Torvalds #define IP_VS_BUG() BUG() 3361e3e238eSHannes Eder #define IP_VS_ERR_RL(msg, ...) \ 3371da177e4SLinus Torvalds do { \ 3381da177e4SLinus Torvalds if (net_ratelimit()) \ 3391e3e238eSHannes Eder pr_err(msg, ##__VA_ARGS__); \ 3401da177e4SLinus Torvalds } while (0) 3411da177e4SLinus Torvalds 3421da177e4SLinus Torvalds #ifdef CONFIG_IP_VS_DEBUG 3431da177e4SLinus Torvalds #define EnterFunction(level) \ 3441da177e4SLinus Torvalds do { \ 3451da177e4SLinus Torvalds if (level <= ip_vs_get_debug_level()) \ 3469aada7acSHannes Eder printk(KERN_DEBUG \ 3479aada7acSHannes Eder pr_fmt("Enter: %s, %s line %i\n"), \ 348d5c003b4SHarvey Harrison __func__, __FILE__, __LINE__); \ 3491da177e4SLinus Torvalds } while (0) 3501da177e4SLinus Torvalds #define LeaveFunction(level) \ 3511da177e4SLinus Torvalds do { \ 3521da177e4SLinus Torvalds if (level <= ip_vs_get_debug_level()) \ 3539aada7acSHannes Eder printk(KERN_DEBUG \ 3549aada7acSHannes Eder pr_fmt("Leave: %s, %s line %i\n"), \ 355d5c003b4SHarvey Harrison __func__, __FILE__, __LINE__); \ 3561da177e4SLinus Torvalds } while (0) 3571da177e4SLinus Torvalds #else 3581da177e4SLinus Torvalds #define EnterFunction(level) do {} while (0) 3591da177e4SLinus Torvalds #define LeaveFunction(level) do {} while (0) 3601da177e4SLinus Torvalds #endif 3611da177e4SLinus Torvalds 3621da177e4SLinus Torvalds #define IP_VS_WAIT_WHILE(expr) while (expr) { cpu_relax(); } 3631da177e4SLinus Torvalds 3641da177e4SLinus Torvalds 3651da177e4SLinus Torvalds /* 3661da177e4SLinus Torvalds * The port number of FTP service (in network order). 3671da177e4SLinus Torvalds */ 368f3a7c66bSHarvey Harrison #define FTPPORT cpu_to_be16(21) 369f3a7c66bSHarvey Harrison #define FTPDATA cpu_to_be16(20) 3701da177e4SLinus Torvalds 3711da177e4SLinus Torvalds /* 3721da177e4SLinus Torvalds * TCP State Values 3731da177e4SLinus Torvalds */ 3741da177e4SLinus Torvalds enum { 3751da177e4SLinus Torvalds IP_VS_TCP_S_NONE = 0, 3761da177e4SLinus Torvalds IP_VS_TCP_S_ESTABLISHED, 3771da177e4SLinus Torvalds IP_VS_TCP_S_SYN_SENT, 3781da177e4SLinus Torvalds IP_VS_TCP_S_SYN_RECV, 3791da177e4SLinus Torvalds IP_VS_TCP_S_FIN_WAIT, 3801da177e4SLinus Torvalds IP_VS_TCP_S_TIME_WAIT, 3811da177e4SLinus Torvalds IP_VS_TCP_S_CLOSE, 3821da177e4SLinus Torvalds IP_VS_TCP_S_CLOSE_WAIT, 3831da177e4SLinus Torvalds IP_VS_TCP_S_LAST_ACK, 3841da177e4SLinus Torvalds IP_VS_TCP_S_LISTEN, 3851da177e4SLinus Torvalds IP_VS_TCP_S_SYNACK, 3861da177e4SLinus Torvalds IP_VS_TCP_S_LAST 3871da177e4SLinus Torvalds }; 3881da177e4SLinus Torvalds 3891da177e4SLinus Torvalds /* 3901da177e4SLinus Torvalds * UDP State Values 3911da177e4SLinus Torvalds */ 3921da177e4SLinus Torvalds enum { 3931da177e4SLinus Torvalds IP_VS_UDP_S_NORMAL, 3941da177e4SLinus Torvalds IP_VS_UDP_S_LAST, 3951da177e4SLinus Torvalds }; 3961da177e4SLinus Torvalds 3971da177e4SLinus Torvalds /* 3981da177e4SLinus Torvalds * ICMP State Values 3991da177e4SLinus Torvalds */ 4001da177e4SLinus Torvalds enum { 4011da177e4SLinus Torvalds IP_VS_ICMP_S_NORMAL, 4021da177e4SLinus Torvalds IP_VS_ICMP_S_LAST, 4031da177e4SLinus Torvalds }; 4041da177e4SLinus Torvalds 4051da177e4SLinus Torvalds /* 4062906f66aSVenkata Mohan Reddy * SCTP State Values 4072906f66aSVenkata Mohan Reddy */ 4082906f66aSVenkata Mohan Reddy enum ip_vs_sctp_states { 4092906f66aSVenkata Mohan Reddy IP_VS_SCTP_S_NONE, 4102906f66aSVenkata Mohan Reddy IP_VS_SCTP_S_INIT_CLI, 4112906f66aSVenkata Mohan Reddy IP_VS_SCTP_S_INIT_SER, 4122906f66aSVenkata Mohan Reddy IP_VS_SCTP_S_INIT_ACK_CLI, 4132906f66aSVenkata Mohan Reddy IP_VS_SCTP_S_INIT_ACK_SER, 4142906f66aSVenkata Mohan Reddy IP_VS_SCTP_S_ECHO_CLI, 4152906f66aSVenkata Mohan Reddy IP_VS_SCTP_S_ECHO_SER, 4162906f66aSVenkata Mohan Reddy IP_VS_SCTP_S_ESTABLISHED, 4172906f66aSVenkata Mohan Reddy IP_VS_SCTP_S_SHUT_CLI, 4182906f66aSVenkata Mohan Reddy IP_VS_SCTP_S_SHUT_SER, 4192906f66aSVenkata Mohan Reddy IP_VS_SCTP_S_SHUT_ACK_CLI, 4202906f66aSVenkata Mohan Reddy IP_VS_SCTP_S_SHUT_ACK_SER, 4212906f66aSVenkata Mohan Reddy IP_VS_SCTP_S_CLOSED, 4222906f66aSVenkata Mohan Reddy IP_VS_SCTP_S_LAST 4232906f66aSVenkata Mohan Reddy }; 4242906f66aSVenkata Mohan Reddy 4252906f66aSVenkata Mohan Reddy /* 4261da177e4SLinus Torvalds * Delta sequence info structure 4271da177e4SLinus Torvalds * Each ip_vs_conn has 2 (output AND input seq. changes). 4281da177e4SLinus Torvalds * Only used in the VS/NAT. 4291da177e4SLinus Torvalds */ 4301da177e4SLinus Torvalds struct ip_vs_seq { 4311da177e4SLinus Torvalds __u32 init_seq; /* Add delta from this seq */ 4321da177e4SLinus Torvalds __u32 delta; /* Delta in sequence numbers */ 4331da177e4SLinus Torvalds __u32 previous_delta; /* Delta in sequence numbers 4341da177e4SLinus Torvalds before last resized pkt */ 4351da177e4SLinus Torvalds }; 4361da177e4SLinus Torvalds 437b17fc996SHans Schillstrom /* 438b17fc996SHans Schillstrom * counters per cpu 439b17fc996SHans Schillstrom */ 440b17fc996SHans Schillstrom struct ip_vs_counters { 441b17fc996SHans Schillstrom __u32 conns; /* connections scheduled */ 442b17fc996SHans Schillstrom __u32 inpkts; /* incoming packets */ 443b17fc996SHans Schillstrom __u32 outpkts; /* outgoing packets */ 444b17fc996SHans Schillstrom __u64 inbytes; /* incoming bytes */ 445b17fc996SHans Schillstrom __u64 outbytes; /* outgoing bytes */ 446b17fc996SHans Schillstrom }; 447b17fc996SHans Schillstrom /* 448b17fc996SHans Schillstrom * Stats per cpu 449b17fc996SHans Schillstrom */ 450b17fc996SHans Schillstrom struct ip_vs_cpu_stats { 451b17fc996SHans Schillstrom struct ip_vs_counters ustats; 452b17fc996SHans Schillstrom struct u64_stats_sync syncp; 453b17fc996SHans Schillstrom }; 4541da177e4SLinus Torvalds 4551da177e4SLinus Torvalds /* 4563a14a313SSven Wegener * IPVS statistics objects 4571da177e4SLinus Torvalds */ 4583a14a313SSven Wegener struct ip_vs_estimator { 4593a14a313SSven Wegener struct list_head list; 4603a14a313SSven Wegener 4613a14a313SSven Wegener u64 last_inbytes; 4623a14a313SSven Wegener u64 last_outbytes; 4633a14a313SSven Wegener u32 last_conns; 4643a14a313SSven Wegener u32 last_inpkts; 4653a14a313SSven Wegener u32 last_outpkts; 4663a14a313SSven Wegener 4673a14a313SSven Wegener u32 cps; 4683a14a313SSven Wegener u32 inpps; 4693a14a313SSven Wegener u32 outpps; 4703a14a313SSven Wegener u32 inbps; 4713a14a313SSven Wegener u32 outbps; 4723a14a313SSven Wegener }; 4733a14a313SSven Wegener 474fd2c3ef7SEric Dumazet struct ip_vs_stats { 475e9c0ce23SSven Wegener struct ip_vs_stats_user ustats; /* statistics */ 476e9c0ce23SSven Wegener struct ip_vs_estimator est; /* estimator */ 477b962abdcSJulian Anastasov struct ip_vs_cpu_stats __percpu *cpustats; /* per cpu counters */ 4781da177e4SLinus Torvalds spinlock_t lock; /* spin lock */ 47955a3d4e1SJulian Anastasov struct ip_vs_stats_user ustats0; /* reset values */ 4801da177e4SLinus Torvalds }; 4811da177e4SLinus Torvalds 48214c85021SArnaldo Carvalho de Melo struct dst_entry; 48314c85021SArnaldo Carvalho de Melo struct iphdr; 4841da177e4SLinus Torvalds struct ip_vs_conn; 4851da177e4SLinus Torvalds struct ip_vs_app; 48614c85021SArnaldo Carvalho de Melo struct sk_buff; 487252c6410SHans Schillstrom struct ip_vs_proto_data; 4881da177e4SLinus Torvalds 4891da177e4SLinus Torvalds struct ip_vs_protocol { 4901da177e4SLinus Torvalds struct ip_vs_protocol *next; 4911da177e4SLinus Torvalds char *name; 4922ad17defSJulian Anastasov u16 protocol; 4932ad17defSJulian Anastasov u16 num_states; 4941da177e4SLinus Torvalds int dont_defrag; 4951da177e4SLinus Torvalds 4961da177e4SLinus Torvalds void (*init)(struct ip_vs_protocol *pp); 4971da177e4SLinus Torvalds 4981da177e4SLinus Torvalds void (*exit)(struct ip_vs_protocol *pp); 4991da177e4SLinus Torvalds 500582b8e3eSHans Schillstrom int (*init_netns)(struct net *net, struct ip_vs_proto_data *pd); 501252c6410SHans Schillstrom 502252c6410SHans Schillstrom void (*exit_netns)(struct net *net, struct ip_vs_proto_data *pd); 503252c6410SHans Schillstrom 50451ef348bSJulius Volz int (*conn_schedule)(int af, struct sk_buff *skb, 5059330419dSHans Schillstrom struct ip_vs_proto_data *pd, 506d4383f04SJesper Dangaard Brouer int *verdict, struct ip_vs_conn **cpp, 507d4383f04SJesper Dangaard Brouer struct ip_vs_iphdr *iph); 5081da177e4SLinus Torvalds 5091da177e4SLinus Torvalds struct ip_vs_conn * 51051ef348bSJulius Volz (*conn_in_get)(int af, 51151ef348bSJulius Volz const struct sk_buff *skb, 51251ef348bSJulius Volz const struct ip_vs_iphdr *iph, 5131da177e4SLinus Torvalds int inverse); 5141da177e4SLinus Torvalds 5151da177e4SLinus Torvalds struct ip_vs_conn * 51651ef348bSJulius Volz (*conn_out_get)(int af, 51751ef348bSJulius Volz const struct sk_buff *skb, 51851ef348bSJulius Volz const struct ip_vs_iphdr *iph, 5191da177e4SLinus Torvalds int inverse); 5201da177e4SLinus Torvalds 521d4383f04SJesper Dangaard Brouer int (*snat_handler)(struct sk_buff *skb, struct ip_vs_protocol *pp, 522d4383f04SJesper Dangaard Brouer struct ip_vs_conn *cp, struct ip_vs_iphdr *iph); 5231da177e4SLinus Torvalds 524d4383f04SJesper Dangaard Brouer int (*dnat_handler)(struct sk_buff *skb, struct ip_vs_protocol *pp, 525d4383f04SJesper Dangaard Brouer struct ip_vs_conn *cp, struct ip_vs_iphdr *iph); 5261da177e4SLinus Torvalds 52751ef348bSJulius Volz int (*csum_check)(int af, struct sk_buff *skb, 52851ef348bSJulius Volz struct ip_vs_protocol *pp); 5291da177e4SLinus Torvalds 5301da177e4SLinus Torvalds const char *(*state_name)(int state); 5311da177e4SLinus Torvalds 5324a516f11SSimon Horman void (*state_transition)(struct ip_vs_conn *cp, int direction, 5331da177e4SLinus Torvalds const struct sk_buff *skb, 5349330419dSHans Schillstrom struct ip_vs_proto_data *pd); 5351da177e4SLinus Torvalds 536ab8a5e84SHans Schillstrom int (*register_app)(struct net *net, struct ip_vs_app *inc); 5371da177e4SLinus Torvalds 538ab8a5e84SHans Schillstrom void (*unregister_app)(struct net *net, struct ip_vs_app *inc); 5391da177e4SLinus Torvalds 5401da177e4SLinus Torvalds int (*app_conn_bind)(struct ip_vs_conn *cp); 5411da177e4SLinus Torvalds 5420d79641aSJulian Anastasov void (*debug_packet)(int af, struct ip_vs_protocol *pp, 5431da177e4SLinus Torvalds const struct sk_buff *skb, 5441da177e4SLinus Torvalds int offset, 5451da177e4SLinus Torvalds const char *msg); 5461da177e4SLinus Torvalds 5479330419dSHans Schillstrom void (*timeout_change)(struct ip_vs_proto_data *pd, int flags); 5481da177e4SLinus Torvalds }; 5491da177e4SLinus Torvalds 550252c6410SHans Schillstrom /* 551252c6410SHans Schillstrom * protocol data per netns 552252c6410SHans Schillstrom */ 553252c6410SHans Schillstrom struct ip_vs_proto_data { 554252c6410SHans Schillstrom struct ip_vs_proto_data *next; 555252c6410SHans Schillstrom struct ip_vs_protocol *pp; 556252c6410SHans Schillstrom int *timeout_table; /* protocol timeout table */ 557252c6410SHans Schillstrom atomic_t appcnt; /* counter of proto app incs. */ 558252c6410SHans Schillstrom struct tcp_states_t *tcp_state_table; 559252c6410SHans Schillstrom }; 560252c6410SHans Schillstrom 5611da177e4SLinus Torvalds extern struct ip_vs_protocol *ip_vs_proto_get(unsigned short proto); 562252c6410SHans Schillstrom extern struct ip_vs_proto_data *ip_vs_proto_data_get(struct net *net, 563252c6410SHans Schillstrom unsigned short proto); 5641da177e4SLinus Torvalds 565f11017ecSSimon Horman struct ip_vs_conn_param { 5666e67e586SHans Schillstrom struct net *net; 567f11017ecSSimon Horman const union nf_inet_addr *caddr; 568f11017ecSSimon Horman const union nf_inet_addr *vaddr; 569f11017ecSSimon Horman __be16 cport; 570f11017ecSSimon Horman __be16 vport; 571f11017ecSSimon Horman __u16 protocol; 572f11017ecSSimon Horman u16 af; 57385999283SSimon Horman 57485999283SSimon Horman const struct ip_vs_pe *pe; 57585999283SSimon Horman char *pe_data; 57685999283SSimon Horman __u8 pe_data_len; 577f11017ecSSimon Horman }; 578f11017ecSSimon Horman 5791da177e4SLinus Torvalds /* 5801da177e4SLinus Torvalds * IP_VS structure allocated for each dynamically scheduled connection 5811da177e4SLinus Torvalds */ 5821da177e4SLinus Torvalds struct ip_vs_conn { 583731109e7SChangli Gao struct hlist_node c_list; /* hashed list heads */ 5841da177e4SLinus Torvalds /* Protocol, addresses and port numbers */ 5856e67e586SHans Schillstrom __be16 cport; 5866e67e586SHans Schillstrom __be16 dport; 5871845ed0bSJulian Anastasov __be16 vport; 5881845ed0bSJulian Anastasov u16 af; /* address family */ 589e7ade46aSJulius Volz union nf_inet_addr caddr; /* client address */ 590e7ade46aSJulius Volz union nf_inet_addr vaddr; /* virtual address */ 591e7ade46aSJulius Volz union nf_inet_addr daddr; /* destination address */ 5923575792eSJulian Anastasov volatile __u32 flags; /* status flags */ 5931da177e4SLinus Torvalds __u16 protocol; /* Which protocol (TCP/UDP) */ 5941845ed0bSJulian Anastasov #ifdef CONFIG_NET_NS 5951845ed0bSJulian Anastasov struct net *net; /* Name space */ 5961845ed0bSJulian Anastasov #endif 5971da177e4SLinus Torvalds 5981da177e4SLinus Torvalds /* counter and timer */ 5991da177e4SLinus Torvalds atomic_t refcnt; /* reference count */ 6001da177e4SLinus Torvalds struct timer_list timer; /* Expiration timer */ 6011da177e4SLinus Torvalds volatile unsigned long timeout; /* timeout */ 6021da177e4SLinus Torvalds 6031da177e4SLinus Torvalds /* Flags and state transition */ 6041da177e4SLinus Torvalds spinlock_t lock; /* lock for state transition */ 6051da177e4SLinus Torvalds volatile __u16 state; /* state info */ 606efac5276SRumen G. Bogdanovski volatile __u16 old_state; /* old state, to be used for 607efac5276SRumen G. Bogdanovski * state transition triggerd 608efac5276SRumen G. Bogdanovski * synchronization 609efac5276SRumen G. Bogdanovski */ 6101845ed0bSJulian Anastasov __u32 fwmark; /* Fire wall mark from skb */ 611749c42b6SJulian Anastasov unsigned long sync_endtime; /* jiffies + sent_retries */ 6121da177e4SLinus Torvalds 6131da177e4SLinus Torvalds /* Control members */ 6141da177e4SLinus Torvalds struct ip_vs_conn *control; /* Master control connection */ 6151da177e4SLinus Torvalds atomic_t n_control; /* Number of controlled ones */ 6161da177e4SLinus Torvalds struct ip_vs_dest *dest; /* real server */ 6171da177e4SLinus Torvalds atomic_t in_pkts; /* incoming packet counter */ 6181da177e4SLinus Torvalds 6191da177e4SLinus Torvalds /* packet transmitter for different forwarding methods. If it 6201da177e4SLinus Torvalds mangles the packet, it must return NF_DROP or better NF_STOLEN, 6211da177e4SLinus Torvalds otherwise this must be changed to a sk_buff **. 622fc604767SJulian Anastasov NF_ACCEPT can be returned when destination is local. 6231da177e4SLinus Torvalds */ 6241da177e4SLinus Torvalds int (*packet_xmit)(struct sk_buff *skb, struct ip_vs_conn *cp, 625d4383f04SJesper Dangaard Brouer struct ip_vs_protocol *pp, struct ip_vs_iphdr *iph); 6261da177e4SLinus Torvalds 6271da177e4SLinus Torvalds /* Note: we can group the following members into a structure, 6281da177e4SLinus Torvalds in order to save more space, and the following members are 6291da177e4SLinus Torvalds only used in VS/NAT anyway */ 6301da177e4SLinus Torvalds struct ip_vs_app *app; /* bound ip_vs_app object */ 6311da177e4SLinus Torvalds void *app_data; /* Application private data */ 6321da177e4SLinus Torvalds struct ip_vs_seq in_seq; /* incoming seq. struct */ 6331da177e4SLinus Torvalds struct ip_vs_seq out_seq; /* outgoing seq. struct */ 63485999283SSimon Horman 635e9e5eee8SSimon Horman const struct ip_vs_pe *pe; 63685999283SSimon Horman char *pe_data; 63785999283SSimon Horman __u8 pe_data_len; 638088339a5SJulian Anastasov 639088339a5SJulian Anastasov struct rcu_head rcu_head; 6401da177e4SLinus Torvalds }; 6411da177e4SLinus Torvalds 6426e67e586SHans Schillstrom /* 6436e67e586SHans Schillstrom * To save some memory in conn table when name space is disabled. 6446e67e586SHans Schillstrom */ 6456e67e586SHans Schillstrom static inline struct net *ip_vs_conn_net(const struct ip_vs_conn *cp) 6466e67e586SHans Schillstrom { 6476e67e586SHans Schillstrom #ifdef CONFIG_NET_NS 6486e67e586SHans Schillstrom return cp->net; 6496e67e586SHans Schillstrom #else 6506e67e586SHans Schillstrom return &init_net; 6516e67e586SHans Schillstrom #endif 6526e67e586SHans Schillstrom } 6536e67e586SHans Schillstrom static inline void ip_vs_conn_net_set(struct ip_vs_conn *cp, struct net *net) 6546e67e586SHans Schillstrom { 6556e67e586SHans Schillstrom #ifdef CONFIG_NET_NS 6566e67e586SHans Schillstrom cp->net = net; 6576e67e586SHans Schillstrom #endif 6586e67e586SHans Schillstrom } 6596e67e586SHans Schillstrom 6606e67e586SHans Schillstrom static inline int ip_vs_conn_net_eq(const struct ip_vs_conn *cp, 6616e67e586SHans Schillstrom struct net *net) 6626e67e586SHans Schillstrom { 6636e67e586SHans Schillstrom #ifdef CONFIG_NET_NS 6646e67e586SHans Schillstrom return cp->net == net; 6656e67e586SHans Schillstrom #else 6666e67e586SHans Schillstrom return 1; 6676e67e586SHans Schillstrom #endif 6686e67e586SHans Schillstrom } 6691da177e4SLinus Torvalds 6701da177e4SLinus Torvalds /* 671c860c6b1SJulius Volz * Extended internal versions of struct ip_vs_service_user and 672c860c6b1SJulius Volz * ip_vs_dest_user for IPv6 support. 673c860c6b1SJulius Volz * 674c860c6b1SJulius Volz * We need these to conveniently pass around service and destination 675c860c6b1SJulius Volz * options, but unfortunately, we also need to keep the old definitions to 676c860c6b1SJulius Volz * maintain userspace backwards compatibility for the setsockopt interface. 677c860c6b1SJulius Volz */ 678c860c6b1SJulius Volz struct ip_vs_service_user_kern { 679c860c6b1SJulius Volz /* virtual service addresses */ 680c860c6b1SJulius Volz u16 af; 681c860c6b1SJulius Volz u16 protocol; 682c860c6b1SJulius Volz union nf_inet_addr addr; /* virtual ip address */ 683c860c6b1SJulius Volz u16 port; 684c860c6b1SJulius Volz u32 fwmark; /* firwall mark of service */ 685c860c6b1SJulius Volz 686c860c6b1SJulius Volz /* virtual service options */ 687c860c6b1SJulius Volz char *sched_name; 6880d1e71b0SSimon Horman char *pe_name; 68995c96174SEric Dumazet unsigned int flags; /* virtual service flags */ 69095c96174SEric Dumazet unsigned int timeout; /* persistent timeout in sec */ 691c860c6b1SJulius Volz u32 netmask; /* persistent netmask */ 692c860c6b1SJulius Volz }; 693c860c6b1SJulius Volz 694c860c6b1SJulius Volz 695c860c6b1SJulius Volz struct ip_vs_dest_user_kern { 696c860c6b1SJulius Volz /* destination server address */ 697c860c6b1SJulius Volz union nf_inet_addr addr; 698c860c6b1SJulius Volz u16 port; 699c860c6b1SJulius Volz 700c860c6b1SJulius Volz /* real server options */ 70195c96174SEric Dumazet unsigned int conn_flags; /* connection flags */ 702c860c6b1SJulius Volz int weight; /* destination weight */ 703c860c6b1SJulius Volz 704c860c6b1SJulius Volz /* thresholds for active connections */ 705c860c6b1SJulius Volz u32 u_threshold; /* upper threshold */ 706c860c6b1SJulius Volz u32 l_threshold; /* lower threshold */ 707c860c6b1SJulius Volz }; 708c860c6b1SJulius Volz 709c860c6b1SJulius Volz 710c860c6b1SJulius Volz /* 7111da177e4SLinus Torvalds * The information about the virtual service offered to the net 7121da177e4SLinus Torvalds * and the forwarding entries 7131da177e4SLinus Torvalds */ 7141da177e4SLinus Torvalds struct ip_vs_service { 7151da177e4SLinus Torvalds struct list_head s_list; /* for normal service table */ 7161da177e4SLinus Torvalds struct list_head f_list; /* for fwmark-based service table */ 7171da177e4SLinus Torvalds atomic_t refcnt; /* reference counter */ 7181da177e4SLinus Torvalds atomic_t usecnt; /* use counter */ 7191da177e4SLinus Torvalds 720e7ade46aSJulius Volz u16 af; /* address family */ 7211da177e4SLinus Torvalds __u16 protocol; /* which protocol (TCP/UDP) */ 722e7ade46aSJulius Volz union nf_inet_addr addr; /* IP address for virtual service */ 723014d730dSAl Viro __be16 port; /* port number for the service */ 7241da177e4SLinus Torvalds __u32 fwmark; /* firewall mark of the service */ 72595c96174SEric Dumazet unsigned int flags; /* service status flags */ 72695c96174SEric Dumazet unsigned int timeout; /* persistent timeout in ticks */ 727014d730dSAl Viro __be32 netmask; /* grouping granularity */ 728fc723250SHans Schillstrom struct net *net; 7291da177e4SLinus Torvalds 7301da177e4SLinus Torvalds struct list_head destinations; /* real server d-linked list */ 7311da177e4SLinus Torvalds __u32 num_dests; /* number of servers */ 7321da177e4SLinus Torvalds struct ip_vs_stats stats; /* statistics for the service */ 7331da177e4SLinus Torvalds struct ip_vs_app *inc; /* bind conns to this app inc */ 7341da177e4SLinus Torvalds 7351da177e4SLinus Torvalds /* for scheduling */ 7361da177e4SLinus Torvalds struct ip_vs_scheduler *scheduler; /* bound scheduler object */ 7371da177e4SLinus Torvalds rwlock_t sched_lock; /* lock sched_data */ 7381da177e4SLinus Torvalds void *sched_data; /* scheduler application data */ 73985999283SSimon Horman 74085999283SSimon Horman /* alternate persistence engine */ 74185999283SSimon Horman struct ip_vs_pe *pe; 7421da177e4SLinus Torvalds }; 7431da177e4SLinus Torvalds 744026ace06SJulian Anastasov /* Information for cached dst */ 745026ace06SJulian Anastasov struct ip_vs_dest_dst { 746026ace06SJulian Anastasov struct dst_entry *dst_cache; /* destination cache entry */ 747026ace06SJulian Anastasov u32 dst_cookie; 748026ace06SJulian Anastasov union nf_inet_addr dst_saddr; 749026ace06SJulian Anastasov struct rcu_head rcu_head; 750026ace06SJulian Anastasov }; 7511da177e4SLinus Torvalds 752578bc3efSJulian Anastasov /* In grace period after removing */ 753578bc3efSJulian Anastasov #define IP_VS_DEST_STATE_REMOVING 0x01 7541da177e4SLinus Torvalds /* 7551da177e4SLinus Torvalds * The real server destination forwarding entry 7561da177e4SLinus Torvalds * with ip address, port number, and so on. 7571da177e4SLinus Torvalds */ 7581da177e4SLinus Torvalds struct ip_vs_dest { 7591da177e4SLinus Torvalds struct list_head n_list; /* for the dests in the service */ 760276472eaSJulian Anastasov struct hlist_node d_list; /* for table with all the dests */ 7611da177e4SLinus Torvalds 762e7ade46aSJulius Volz u16 af; /* address family */ 763014d730dSAl Viro __be16 port; /* port number of the server */ 764f2431e6eSHans Schillstrom union nf_inet_addr addr; /* IP address of the server */ 76595c96174SEric Dumazet volatile unsigned int flags; /* dest status flags */ 7661da177e4SLinus Torvalds atomic_t conn_flags; /* flags to copy to conn */ 7671da177e4SLinus Torvalds atomic_t weight; /* server weight */ 7681da177e4SLinus Torvalds 7691da177e4SLinus Torvalds atomic_t refcnt; /* reference counter */ 7701da177e4SLinus Torvalds struct ip_vs_stats stats; /* statistics */ 771578bc3efSJulian Anastasov unsigned long state; /* state flags */ 7721da177e4SLinus Torvalds 7731da177e4SLinus Torvalds /* connection counters and thresholds */ 7741da177e4SLinus Torvalds atomic_t activeconns; /* active connections */ 7751da177e4SLinus Torvalds atomic_t inactconns; /* inactive connections */ 7761da177e4SLinus Torvalds atomic_t persistconns; /* persistent connections */ 7771da177e4SLinus Torvalds __u32 u_threshold; /* upper threshold */ 7781da177e4SLinus Torvalds __u32 l_threshold; /* lower threshold */ 7791da177e4SLinus Torvalds 7801da177e4SLinus Torvalds /* for destination cache */ 7811da177e4SLinus Torvalds spinlock_t dst_lock; /* lock of dst_cache */ 782026ace06SJulian Anastasov struct ip_vs_dest_dst __rcu *dest_dst; /* cached dst info */ 7831da177e4SLinus Torvalds 7841da177e4SLinus Torvalds /* for virtual service */ 7851da177e4SLinus Torvalds struct ip_vs_service *svc; /* service it belongs to */ 7861da177e4SLinus Torvalds __u16 protocol; /* which protocol (TCP/UDP) */ 787014d730dSAl Viro __be16 vport; /* virtual port number */ 788f2431e6eSHans Schillstrom union nf_inet_addr vaddr; /* virtual IP address */ 7891da177e4SLinus Torvalds __u32 vfwmark; /* firewall mark of service */ 790276472eaSJulian Anastasov 791578bc3efSJulian Anastasov struct list_head t_list; /* in dest_trash */ 792276472eaSJulian Anastasov struct rcu_head rcu_head; 793276472eaSJulian Anastasov unsigned int in_rs_table:1; /* we are in rs_table */ 7941da177e4SLinus Torvalds }; 7951da177e4SLinus Torvalds 7961da177e4SLinus Torvalds 7971da177e4SLinus Torvalds /* 7981da177e4SLinus Torvalds * The scheduler object 7991da177e4SLinus Torvalds */ 8001da177e4SLinus Torvalds struct ip_vs_scheduler { 8011da177e4SLinus Torvalds struct list_head n_list; /* d-linked list head */ 8021da177e4SLinus Torvalds char *name; /* scheduler name */ 8031da177e4SLinus Torvalds atomic_t refcnt; /* reference counter */ 8041da177e4SLinus Torvalds struct module *module; /* THIS_MODULE/NULL */ 8051da177e4SLinus Torvalds 8061da177e4SLinus Torvalds /* scheduler initializing service */ 8071da177e4SLinus Torvalds int (*init_service)(struct ip_vs_service *svc); 8081da177e4SLinus Torvalds /* scheduling service finish */ 809*ed3ffc4eSJulian Anastasov void (*done_service)(struct ip_vs_service *svc); 8101da177e4SLinus Torvalds /* scheduler updating service */ 8111da177e4SLinus Torvalds int (*update_service)(struct ip_vs_service *svc); 8126b6df466SJulian Anastasov /* dest is linked */ 8136b6df466SJulian Anastasov int (*add_dest)(struct ip_vs_service *svc, struct ip_vs_dest *dest); 8146b6df466SJulian Anastasov /* dest is unlinked */ 8156b6df466SJulian Anastasov int (*del_dest)(struct ip_vs_service *svc, struct ip_vs_dest *dest); 8166b6df466SJulian Anastasov /* dest is updated */ 8176b6df466SJulian Anastasov int (*upd_dest)(struct ip_vs_service *svc, struct ip_vs_dest *dest); 8181da177e4SLinus Torvalds 8191da177e4SLinus Torvalds /* selecting a server from the given service */ 8201da177e4SLinus Torvalds struct ip_vs_dest* (*schedule)(struct ip_vs_service *svc, 8211da177e4SLinus Torvalds const struct sk_buff *skb); 8221da177e4SLinus Torvalds }; 8231da177e4SLinus Torvalds 82485999283SSimon Horman /* The persistence engine object */ 82585999283SSimon Horman struct ip_vs_pe { 82685999283SSimon Horman struct list_head n_list; /* d-linked list head */ 82785999283SSimon Horman char *name; /* scheduler name */ 82885999283SSimon Horman atomic_t refcnt; /* reference counter */ 82985999283SSimon Horman struct module *module; /* THIS_MODULE/NULL */ 83085999283SSimon Horman 83185999283SSimon Horman /* get the connection template, if any */ 83285999283SSimon Horman int (*fill_param)(struct ip_vs_conn_param *p, struct sk_buff *skb); 83385999283SSimon Horman bool (*ct_match)(const struct ip_vs_conn_param *p, 83485999283SSimon Horman struct ip_vs_conn *ct); 83585999283SSimon Horman u32 (*hashkey_raw)(const struct ip_vs_conn_param *p, u32 initval, 83685999283SSimon Horman bool inverse); 837a3c918acSSimon Horman int (*show_pe_data)(const struct ip_vs_conn *cp, char *buf); 83885999283SSimon Horman }; 8391da177e4SLinus Torvalds 8401da177e4SLinus Torvalds /* 8411da177e4SLinus Torvalds * The application module object (a.k.a. app incarnation) 8421da177e4SLinus Torvalds */ 843fd2c3ef7SEric Dumazet struct ip_vs_app { 8441da177e4SLinus Torvalds struct list_head a_list; /* member in app list */ 8451da177e4SLinus Torvalds int type; /* IP_VS_APP_TYPE_xxx */ 8461da177e4SLinus Torvalds char *name; /* application module name */ 8471da177e4SLinus Torvalds __u16 protocol; 8481da177e4SLinus Torvalds struct module *module; /* THIS_MODULE/NULL */ 8491da177e4SLinus Torvalds struct list_head incs_list; /* list of incarnations */ 8501da177e4SLinus Torvalds 8511da177e4SLinus Torvalds /* members for application incarnations */ 8521da177e4SLinus Torvalds struct list_head p_list; /* member in proto app list */ 8531da177e4SLinus Torvalds struct ip_vs_app *app; /* its real application */ 854014d730dSAl Viro __be16 port; /* port number in net order */ 8551da177e4SLinus Torvalds atomic_t usecnt; /* usage counter */ 856363c97d7SJulian Anastasov struct rcu_head rcu_head; 8571da177e4SLinus Torvalds 8588b27b10fSJulian Anastasov /* 8598b27b10fSJulian Anastasov * output hook: Process packet in inout direction, diff set for TCP. 8608b27b10fSJulian Anastasov * Return: 0=Error, 1=Payload Not Mangled/Mangled but checksum is ok, 8618b27b10fSJulian Anastasov * 2=Mangled but checksum was not updated 8628b27b10fSJulian Anastasov */ 8631da177e4SLinus Torvalds int (*pkt_out)(struct ip_vs_app *, struct ip_vs_conn *, 8643db05feaSHerbert Xu struct sk_buff *, int *diff); 8651da177e4SLinus Torvalds 8668b27b10fSJulian Anastasov /* 8678b27b10fSJulian Anastasov * input hook: Process packet in outin direction, diff set for TCP. 8688b27b10fSJulian Anastasov * Return: 0=Error, 1=Payload Not Mangled/Mangled but checksum is ok, 8698b27b10fSJulian Anastasov * 2=Mangled but checksum was not updated 8708b27b10fSJulian Anastasov */ 8711da177e4SLinus Torvalds int (*pkt_in)(struct ip_vs_app *, struct ip_vs_conn *, 8723db05feaSHerbert Xu struct sk_buff *, int *diff); 8731da177e4SLinus Torvalds 8741da177e4SLinus Torvalds /* ip_vs_app initializer */ 8751da177e4SLinus Torvalds int (*init_conn)(struct ip_vs_app *, struct ip_vs_conn *); 8761da177e4SLinus Torvalds 8771da177e4SLinus Torvalds /* ip_vs_app finish */ 8781da177e4SLinus Torvalds int (*done_conn)(struct ip_vs_app *, struct ip_vs_conn *); 8791da177e4SLinus Torvalds 8801da177e4SLinus Torvalds 8811da177e4SLinus Torvalds /* not used now */ 8821da177e4SLinus Torvalds int (*bind_conn)(struct ip_vs_app *, struct ip_vs_conn *, 8831da177e4SLinus Torvalds struct ip_vs_protocol *); 8841da177e4SLinus Torvalds 8851da177e4SLinus Torvalds void (*unbind_conn)(struct ip_vs_app *, struct ip_vs_conn *); 8861da177e4SLinus Torvalds 8871da177e4SLinus Torvalds int * timeout_table; 8881da177e4SLinus Torvalds int * timeouts; 8891da177e4SLinus Torvalds int timeouts_size; 8901da177e4SLinus Torvalds 8911da177e4SLinus Torvalds int (*conn_schedule)(struct sk_buff *skb, struct ip_vs_app *app, 8921da177e4SLinus Torvalds int *verdict, struct ip_vs_conn **cpp); 8931da177e4SLinus Torvalds 8941da177e4SLinus Torvalds struct ip_vs_conn * 8951da177e4SLinus Torvalds (*conn_in_get)(const struct sk_buff *skb, struct ip_vs_app *app, 896d4383f04SJesper Dangaard Brouer const struct iphdr *iph, int inverse); 8971da177e4SLinus Torvalds 8981da177e4SLinus Torvalds struct ip_vs_conn * 8991da177e4SLinus Torvalds (*conn_out_get)(const struct sk_buff *skb, struct ip_vs_app *app, 900d4383f04SJesper Dangaard Brouer const struct iphdr *iph, int inverse); 9011da177e4SLinus Torvalds 9021da177e4SLinus Torvalds int (*state_transition)(struct ip_vs_conn *cp, int direction, 9031da177e4SLinus Torvalds const struct sk_buff *skb, 9041da177e4SLinus Torvalds struct ip_vs_app *app); 9051da177e4SLinus Torvalds 9061da177e4SLinus Torvalds void (*timeout_change)(struct ip_vs_app *app, int flags); 9071da177e4SLinus Torvalds }; 9081da177e4SLinus Torvalds 909f73181c8SPablo Neira Ayuso struct ipvs_master_sync_state { 910f73181c8SPablo Neira Ayuso struct list_head sync_queue; 911f73181c8SPablo Neira Ayuso struct ip_vs_sync_buff *sync_buff; 912f73181c8SPablo Neira Ayuso int sync_queue_len; 913f73181c8SPablo Neira Ayuso unsigned int sync_queue_delay; 914f73181c8SPablo Neira Ayuso struct task_struct *master_thread; 915f73181c8SPablo Neira Ayuso struct delayed_work master_wakeup_work; 916f73181c8SPablo Neira Ayuso struct netns_ipvs *ipvs; 917f73181c8SPablo Neira Ayuso }; 918f73181c8SPablo Neira Ayuso 919578bc3efSJulian Anastasov /* How much time to keep dests in trash */ 920578bc3efSJulian Anastasov #define IP_VS_DEST_TRASH_PERIOD (120 * HZ) 921578bc3efSJulian Anastasov 9222553d064SJulian Anastasov /* IPVS in network namespace */ 9232553d064SJulian Anastasov struct netns_ipvs { 9242553d064SJulian Anastasov int gen; /* Generation */ 9257a4f0761SHans Schillstrom int enable; /* enable like nf_hooks do */ 9262553d064SJulian Anastasov /* 9272553d064SJulian Anastasov * Hash table: for real service lookups 9282553d064SJulian Anastasov */ 9292553d064SJulian Anastasov #define IP_VS_RTAB_BITS 4 9302553d064SJulian Anastasov #define IP_VS_RTAB_SIZE (1 << IP_VS_RTAB_BITS) 9312553d064SJulian Anastasov #define IP_VS_RTAB_MASK (IP_VS_RTAB_SIZE - 1) 9322553d064SJulian Anastasov 933276472eaSJulian Anastasov struct hlist_head rs_table[IP_VS_RTAB_SIZE]; 9342553d064SJulian Anastasov /* ip_vs_app */ 9352553d064SJulian Anastasov struct list_head app_list; 9362553d064SJulian Anastasov /* ip_vs_proto */ 9372553d064SJulian Anastasov #define IP_VS_PROTO_TAB_SIZE 32 /* must be power of 2 */ 9382553d064SJulian Anastasov struct ip_vs_proto_data *proto_data_table[IP_VS_PROTO_TAB_SIZE]; 9392553d064SJulian Anastasov /* ip_vs_proto_tcp */ 9402553d064SJulian Anastasov #ifdef CONFIG_IP_VS_PROTO_TCP 9412553d064SJulian Anastasov #define TCP_APP_TAB_BITS 4 9422553d064SJulian Anastasov #define TCP_APP_TAB_SIZE (1 << TCP_APP_TAB_BITS) 9432553d064SJulian Anastasov #define TCP_APP_TAB_MASK (TCP_APP_TAB_SIZE - 1) 9442553d064SJulian Anastasov struct list_head tcp_apps[TCP_APP_TAB_SIZE]; 9452553d064SJulian Anastasov #endif 9462553d064SJulian Anastasov /* ip_vs_proto_udp */ 9472553d064SJulian Anastasov #ifdef CONFIG_IP_VS_PROTO_UDP 9482553d064SJulian Anastasov #define UDP_APP_TAB_BITS 4 9492553d064SJulian Anastasov #define UDP_APP_TAB_SIZE (1 << UDP_APP_TAB_BITS) 9502553d064SJulian Anastasov #define UDP_APP_TAB_MASK (UDP_APP_TAB_SIZE - 1) 9512553d064SJulian Anastasov struct list_head udp_apps[UDP_APP_TAB_SIZE]; 9522553d064SJulian Anastasov #endif 9532553d064SJulian Anastasov /* ip_vs_proto_sctp */ 9542553d064SJulian Anastasov #ifdef CONFIG_IP_VS_PROTO_SCTP 9552553d064SJulian Anastasov #define SCTP_APP_TAB_BITS 4 9562553d064SJulian Anastasov #define SCTP_APP_TAB_SIZE (1 << SCTP_APP_TAB_BITS) 9572553d064SJulian Anastasov #define SCTP_APP_TAB_MASK (SCTP_APP_TAB_SIZE - 1) 9582553d064SJulian Anastasov /* Hash table for SCTP application incarnations */ 9592553d064SJulian Anastasov struct list_head sctp_apps[SCTP_APP_TAB_SIZE]; 9602553d064SJulian Anastasov #endif 9612553d064SJulian Anastasov /* ip_vs_conn */ 9622553d064SJulian Anastasov atomic_t conn_count; /* connection counter */ 9632553d064SJulian Anastasov 9642553d064SJulian Anastasov /* ip_vs_ctl */ 9652a0751afSJulian Anastasov struct ip_vs_stats tot_stats; /* Statistics & est. */ 9662553d064SJulian Anastasov 9672553d064SJulian Anastasov int num_services; /* no of virtual services */ 968f2247fbdSSimon Horman 9692553d064SJulian Anastasov /* Trash for destinations */ 9702553d064SJulian Anastasov struct list_head dest_trash; 971578bc3efSJulian Anastasov spinlock_t dest_trash_lock; 972578bc3efSJulian Anastasov struct timer_list dest_trash_timer; /* expiration timer */ 9732553d064SJulian Anastasov /* Service counters */ 9742553d064SJulian Anastasov atomic_t ftpsvc_counter; 9752553d064SJulian Anastasov atomic_t nullsvc_counter; 9762553d064SJulian Anastasov 977f2247fbdSSimon Horman #ifdef CONFIG_SYSCTL 978f2247fbdSSimon Horman /* 1/rate drop and drop-entry variables */ 979f2247fbdSSimon Horman struct delayed_work defense_work; /* Work handler */ 980f2247fbdSSimon Horman int drop_rate; 981f2247fbdSSimon Horman int drop_counter; 982f2247fbdSSimon Horman atomic_t dropentry; 983f2247fbdSSimon Horman /* locks in ctl.c */ 984f2247fbdSSimon Horman spinlock_t dropentry_lock; /* drop entry handling */ 985f2247fbdSSimon Horman spinlock_t droppacket_lock; /* drop packet handling */ 986f2247fbdSSimon Horman spinlock_t securetcp_lock; /* state and timeout tables */ 987f2247fbdSSimon Horman 9882553d064SJulian Anastasov /* sys-ctl struct */ 9892553d064SJulian Anastasov struct ctl_table_header *sysctl_hdr; 9902553d064SJulian Anastasov struct ctl_table *sysctl_tbl; 991f2247fbdSSimon Horman #endif 992f2247fbdSSimon Horman 9932553d064SJulian Anastasov /* sysctl variables */ 9942553d064SJulian Anastasov int sysctl_amemthresh; 9952553d064SJulian Anastasov int sysctl_am_droprate; 9962553d064SJulian Anastasov int sysctl_drop_entry; 9972553d064SJulian Anastasov int sysctl_drop_packet; 9982553d064SJulian Anastasov int sysctl_secure_tcp; 9992553d064SJulian Anastasov #ifdef CONFIG_IP_VS_NFCT 10002553d064SJulian Anastasov int sysctl_conntrack; 10012553d064SJulian Anastasov #endif 10022553d064SJulian Anastasov int sysctl_snat_reroute; 10032553d064SJulian Anastasov int sysctl_sync_ver; 1004f73181c8SPablo Neira Ayuso int sysctl_sync_ports; 10051c003b15SPablo Neira Ayuso int sysctl_sync_qlen_max; 10061c003b15SPablo Neira Ayuso int sysctl_sync_sock_size; 10072553d064SJulian Anastasov int sysctl_cache_bypass; 10082553d064SJulian Anastasov int sysctl_expire_nodest_conn; 10092553d064SJulian Anastasov int sysctl_expire_quiescent_template; 10102553d064SJulian Anastasov int sysctl_sync_threshold[2]; 1011749c42b6SJulian Anastasov unsigned int sysctl_sync_refresh_period; 1012749c42b6SJulian Anastasov int sysctl_sync_retries; 10132553d064SJulian Anastasov int sysctl_nat_icmp_send; 10143654e611SJulian Anastasov int sysctl_pmtu_disc; 10150c12582fSJulian Anastasov int sysctl_backup_only; 10162553d064SJulian Anastasov 10172553d064SJulian Anastasov /* ip_vs_lblc */ 10182553d064SJulian Anastasov int sysctl_lblc_expiration; 10192553d064SJulian Anastasov struct ctl_table_header *lblc_ctl_header; 10202553d064SJulian Anastasov struct ctl_table *lblc_ctl_table; 10212553d064SJulian Anastasov /* ip_vs_lblcr */ 10222553d064SJulian Anastasov int sysctl_lblcr_expiration; 10232553d064SJulian Anastasov struct ctl_table_header *lblcr_ctl_header; 10242553d064SJulian Anastasov struct ctl_table *lblcr_ctl_table; 10252553d064SJulian Anastasov /* ip_vs_est */ 10262553d064SJulian Anastasov struct list_head est_list; /* estimator list */ 10272553d064SJulian Anastasov spinlock_t est_lock; 10282553d064SJulian Anastasov struct timer_list est_timer; /* Estimation timer */ 10292553d064SJulian Anastasov /* ip_vs_sync */ 10302553d064SJulian Anastasov spinlock_t sync_lock; 1031f73181c8SPablo Neira Ayuso struct ipvs_master_sync_state *ms; 10322553d064SJulian Anastasov spinlock_t sync_buff_lock; 1033f73181c8SPablo Neira Ayuso struct task_struct **backup_threads; 1034f73181c8SPablo Neira Ayuso int threads_mask; 10352553d064SJulian Anastasov int send_mesg_maxlen; 10362553d064SJulian Anastasov int recv_mesg_maxlen; 10372553d064SJulian Anastasov volatile int sync_state; 10382553d064SJulian Anastasov volatile int master_syncid; 10392553d064SJulian Anastasov volatile int backup_syncid; 1040ae1d48b2SHans Schillstrom struct mutex sync_mutex; 10412553d064SJulian Anastasov /* multicast interface name */ 10422553d064SJulian Anastasov char master_mcast_ifn[IP_VS_IFNAME_MAXLEN]; 10432553d064SJulian Anastasov char backup_mcast_ifn[IP_VS_IFNAME_MAXLEN]; 10442553d064SJulian Anastasov /* net name space ptr */ 10452553d064SJulian Anastasov struct net *net; /* Needed by timer routines */ 10462553d064SJulian Anastasov }; 10471da177e4SLinus Torvalds 104859e0350eSSimon Horman #define DEFAULT_SYNC_THRESHOLD 3 104959e0350eSSimon Horman #define DEFAULT_SYNC_PERIOD 50 10507532e8d4SSimon Horman #define DEFAULT_SYNC_VER 1 1051749c42b6SJulian Anastasov #define DEFAULT_SYNC_REFRESH_PERIOD (0U * HZ) 1052749c42b6SJulian Anastasov #define DEFAULT_SYNC_RETRIES 0 10531c003b15SPablo Neira Ayuso #define IPVS_SYNC_WAKEUP_RATE 8 10541c003b15SPablo Neira Ayuso #define IPVS_SYNC_QLEN_MAX (IPVS_SYNC_WAKEUP_RATE * 4) 10551c003b15SPablo Neira Ayuso #define IPVS_SYNC_SEND_DELAY (HZ / 50) 10561c003b15SPablo Neira Ayuso #define IPVS_SYNC_CHECK_PERIOD HZ 1057749c42b6SJulian Anastasov #define IPVS_SYNC_FLUSH_TIME (HZ * 2) 1058f73181c8SPablo Neira Ayuso #define IPVS_SYNC_PORTS_MAX (1 << 6) 105959e0350eSSimon Horman 106059e0350eSSimon Horman #ifdef CONFIG_SYSCTL 106159e0350eSSimon Horman 106259e0350eSSimon Horman static inline int sysctl_sync_threshold(struct netns_ipvs *ipvs) 106359e0350eSSimon Horman { 106459e0350eSSimon Horman return ipvs->sysctl_sync_threshold[0]; 106559e0350eSSimon Horman } 106659e0350eSSimon Horman 106759e0350eSSimon Horman static inline int sysctl_sync_period(struct netns_ipvs *ipvs) 106859e0350eSSimon Horman { 1069749c42b6SJulian Anastasov return ACCESS_ONCE(ipvs->sysctl_sync_threshold[1]); 1070749c42b6SJulian Anastasov } 1071749c42b6SJulian Anastasov 1072749c42b6SJulian Anastasov static inline unsigned int sysctl_sync_refresh_period(struct netns_ipvs *ipvs) 1073749c42b6SJulian Anastasov { 1074749c42b6SJulian Anastasov return ACCESS_ONCE(ipvs->sysctl_sync_refresh_period); 1075749c42b6SJulian Anastasov } 1076749c42b6SJulian Anastasov 1077749c42b6SJulian Anastasov static inline int sysctl_sync_retries(struct netns_ipvs *ipvs) 1078749c42b6SJulian Anastasov { 1079749c42b6SJulian Anastasov return ipvs->sysctl_sync_retries; 108059e0350eSSimon Horman } 108159e0350eSSimon Horman 10827532e8d4SSimon Horman static inline int sysctl_sync_ver(struct netns_ipvs *ipvs) 10837532e8d4SSimon Horman { 10847532e8d4SSimon Horman return ipvs->sysctl_sync_ver; 10857532e8d4SSimon Horman } 10867532e8d4SSimon Horman 1087f73181c8SPablo Neira Ayuso static inline int sysctl_sync_ports(struct netns_ipvs *ipvs) 1088f73181c8SPablo Neira Ayuso { 1089f73181c8SPablo Neira Ayuso return ACCESS_ONCE(ipvs->sysctl_sync_ports); 1090f73181c8SPablo Neira Ayuso } 1091f73181c8SPablo Neira Ayuso 10921c003b15SPablo Neira Ayuso static inline int sysctl_sync_qlen_max(struct netns_ipvs *ipvs) 10931c003b15SPablo Neira Ayuso { 10941c003b15SPablo Neira Ayuso return ipvs->sysctl_sync_qlen_max; 10951c003b15SPablo Neira Ayuso } 10961c003b15SPablo Neira Ayuso 10971c003b15SPablo Neira Ayuso static inline int sysctl_sync_sock_size(struct netns_ipvs *ipvs) 10981c003b15SPablo Neira Ayuso { 10991c003b15SPablo Neira Ayuso return ipvs->sysctl_sync_sock_size; 11001c003b15SPablo Neira Ayuso } 11011c003b15SPablo Neira Ayuso 11023654e611SJulian Anastasov static inline int sysctl_pmtu_disc(struct netns_ipvs *ipvs) 11033654e611SJulian Anastasov { 11043654e611SJulian Anastasov return ipvs->sysctl_pmtu_disc; 11053654e611SJulian Anastasov } 11063654e611SJulian Anastasov 11070c12582fSJulian Anastasov static inline int sysctl_backup_only(struct netns_ipvs *ipvs) 11080c12582fSJulian Anastasov { 11090c12582fSJulian Anastasov return ipvs->sync_state & IP_VS_STATE_BACKUP && 11100c12582fSJulian Anastasov ipvs->sysctl_backup_only; 11110c12582fSJulian Anastasov } 11120c12582fSJulian Anastasov 111359e0350eSSimon Horman #else 111459e0350eSSimon Horman 111559e0350eSSimon Horman static inline int sysctl_sync_threshold(struct netns_ipvs *ipvs) 111659e0350eSSimon Horman { 111759e0350eSSimon Horman return DEFAULT_SYNC_THRESHOLD; 111859e0350eSSimon Horman } 111959e0350eSSimon Horman 112059e0350eSSimon Horman static inline int sysctl_sync_period(struct netns_ipvs *ipvs) 112159e0350eSSimon Horman { 112259e0350eSSimon Horman return DEFAULT_SYNC_PERIOD; 112359e0350eSSimon Horman } 112459e0350eSSimon Horman 1125749c42b6SJulian Anastasov static inline unsigned int sysctl_sync_refresh_period(struct netns_ipvs *ipvs) 1126749c42b6SJulian Anastasov { 1127749c42b6SJulian Anastasov return DEFAULT_SYNC_REFRESH_PERIOD; 1128749c42b6SJulian Anastasov } 1129749c42b6SJulian Anastasov 1130749c42b6SJulian Anastasov static inline int sysctl_sync_retries(struct netns_ipvs *ipvs) 1131749c42b6SJulian Anastasov { 1132749c42b6SJulian Anastasov return DEFAULT_SYNC_RETRIES & 3; 1133749c42b6SJulian Anastasov } 1134749c42b6SJulian Anastasov 11357532e8d4SSimon Horman static inline int sysctl_sync_ver(struct netns_ipvs *ipvs) 11367532e8d4SSimon Horman { 11377532e8d4SSimon Horman return DEFAULT_SYNC_VER; 11387532e8d4SSimon Horman } 11397532e8d4SSimon Horman 1140f73181c8SPablo Neira Ayuso static inline int sysctl_sync_ports(struct netns_ipvs *ipvs) 1141f73181c8SPablo Neira Ayuso { 1142f73181c8SPablo Neira Ayuso return 1; 1143f73181c8SPablo Neira Ayuso } 1144f73181c8SPablo Neira Ayuso 11451c003b15SPablo Neira Ayuso static inline int sysctl_sync_qlen_max(struct netns_ipvs *ipvs) 11461c003b15SPablo Neira Ayuso { 11471c003b15SPablo Neira Ayuso return IPVS_SYNC_QLEN_MAX; 11481c003b15SPablo Neira Ayuso } 11491c003b15SPablo Neira Ayuso 11501c003b15SPablo Neira Ayuso static inline int sysctl_sync_sock_size(struct netns_ipvs *ipvs) 11511c003b15SPablo Neira Ayuso { 11521c003b15SPablo Neira Ayuso return 0; 11531c003b15SPablo Neira Ayuso } 11541c003b15SPablo Neira Ayuso 11553654e611SJulian Anastasov static inline int sysctl_pmtu_disc(struct netns_ipvs *ipvs) 11563654e611SJulian Anastasov { 11573654e611SJulian Anastasov return 1; 11583654e611SJulian Anastasov } 11593654e611SJulian Anastasov 11600c12582fSJulian Anastasov static inline int sysctl_backup_only(struct netns_ipvs *ipvs) 11610c12582fSJulian Anastasov { 11620c12582fSJulian Anastasov return 0; 11630c12582fSJulian Anastasov } 11640c12582fSJulian Anastasov 116559e0350eSSimon Horman #endif 116659e0350eSSimon Horman 11671da177e4SLinus Torvalds /* 11681da177e4SLinus Torvalds * IPVS core functions 11691da177e4SLinus Torvalds * (from ip_vs_core.c) 11701da177e4SLinus Torvalds */ 117195c96174SEric Dumazet extern const char *ip_vs_proto_name(unsigned int proto); 11721da177e4SLinus Torvalds extern void ip_vs_init_hash_table(struct list_head *table, int rows); 1173afdd6140SSven Wegener #define IP_VS_INIT_HASH_TABLE(t) ip_vs_init_hash_table((t), ARRAY_SIZE((t))) 11741da177e4SLinus Torvalds 11751da177e4SLinus Torvalds #define IP_VS_APP_TYPE_FTP 1 11761da177e4SLinus Torvalds 11771da177e4SLinus Torvalds /* 11781da177e4SLinus Torvalds * ip_vs_conn handling functions 11791da177e4SLinus Torvalds * (from ip_vs_conn.c) 11801da177e4SLinus Torvalds */ 11811da177e4SLinus Torvalds 11821da177e4SLinus Torvalds enum { 11831da177e4SLinus Torvalds IP_VS_DIR_INPUT = 0, 11841da177e4SLinus Torvalds IP_VS_DIR_OUTPUT, 11851da177e4SLinus Torvalds IP_VS_DIR_INPUT_ONLY, 11861da177e4SLinus Torvalds IP_VS_DIR_LAST, 11871da177e4SLinus Torvalds }; 11881da177e4SLinus Torvalds 11896e67e586SHans Schillstrom static inline void ip_vs_conn_fill_param(struct net *net, int af, int protocol, 1190f11017ecSSimon Horman const union nf_inet_addr *caddr, 1191f11017ecSSimon Horman __be16 cport, 1192f11017ecSSimon Horman const union nf_inet_addr *vaddr, 1193f11017ecSSimon Horman __be16 vport, 1194f11017ecSSimon Horman struct ip_vs_conn_param *p) 1195f11017ecSSimon Horman { 11966e67e586SHans Schillstrom p->net = net; 1197f11017ecSSimon Horman p->af = af; 1198f11017ecSSimon Horman p->protocol = protocol; 1199f11017ecSSimon Horman p->caddr = caddr; 1200f11017ecSSimon Horman p->cport = cport; 1201f11017ecSSimon Horman p->vaddr = vaddr; 1202f11017ecSSimon Horman p->vport = vport; 120385999283SSimon Horman p->pe = NULL; 120485999283SSimon Horman p->pe_data = NULL; 1205f11017ecSSimon Horman } 120628364a59SJulius Volz 1207f11017ecSSimon Horman struct ip_vs_conn *ip_vs_conn_in_get(const struct ip_vs_conn_param *p); 1208f11017ecSSimon Horman struct ip_vs_conn *ip_vs_ct_in_get(const struct ip_vs_conn_param *p); 120928364a59SJulius Volz 12105c0d2374SSimon Horman struct ip_vs_conn * ip_vs_conn_in_get_proto(int af, const struct sk_buff *skb, 12115c0d2374SSimon Horman const struct ip_vs_iphdr *iph, 12125c0d2374SSimon Horman int inverse); 12135c0d2374SSimon Horman 1214f11017ecSSimon Horman struct ip_vs_conn *ip_vs_conn_out_get(const struct ip_vs_conn_param *p); 12151da177e4SLinus Torvalds 12165c0d2374SSimon Horman struct ip_vs_conn * ip_vs_conn_out_get_proto(int af, const struct sk_buff *skb, 12175c0d2374SSimon Horman const struct ip_vs_iphdr *iph, 12185c0d2374SSimon Horman int inverse); 12195c0d2374SSimon Horman 1220088339a5SJulian Anastasov /* Get reference to gain full access to conn. 1221088339a5SJulian Anastasov * By default, RCU read-side critical sections have access only to 1222088339a5SJulian Anastasov * conn fields and its PE data, see ip_vs_conn_rcu_free() for reference. 1223088339a5SJulian Anastasov */ 1224088339a5SJulian Anastasov static inline bool __ip_vs_conn_get(struct ip_vs_conn *cp) 1225088339a5SJulian Anastasov { 1226088339a5SJulian Anastasov return atomic_inc_not_zero(&cp->refcnt); 1227088339a5SJulian Anastasov } 1228088339a5SJulian Anastasov 12291da177e4SLinus Torvalds /* put back the conn without restarting its timer */ 12301da177e4SLinus Torvalds static inline void __ip_vs_conn_put(struct ip_vs_conn *cp) 12311da177e4SLinus Torvalds { 1232088339a5SJulian Anastasov smp_mb__before_atomic_dec(); 12331da177e4SLinus Torvalds atomic_dec(&cp->refcnt); 12341da177e4SLinus Torvalds } 12351da177e4SLinus Torvalds extern void ip_vs_conn_put(struct ip_vs_conn *cp); 1236014d730dSAl Viro extern void ip_vs_conn_fill_cport(struct ip_vs_conn *cp, __be16 cport); 12371da177e4SLinus Torvalds 1238f11017ecSSimon Horman struct ip_vs_conn *ip_vs_conn_new(const struct ip_vs_conn_param *p, 1239f11017ecSSimon Horman const union nf_inet_addr *daddr, 124095c96174SEric Dumazet __be16 dport, unsigned int flags, 12410e051e68SHans Schillstrom struct ip_vs_dest *dest, __u32 fwmark); 12421da177e4SLinus Torvalds extern void ip_vs_conn_expire_now(struct ip_vs_conn *cp); 12431da177e4SLinus Torvalds 12441da177e4SLinus Torvalds extern const char * ip_vs_state_name(__u16 proto, int state); 12451da177e4SLinus Torvalds 12464a85b96cSHans Schillstrom extern void ip_vs_tcp_conn_listen(struct net *net, struct ip_vs_conn *cp); 12471da177e4SLinus Torvalds extern int ip_vs_check_template(struct ip_vs_conn *ct); 1248f6340ee0SHans Schillstrom extern void ip_vs_random_dropentry(struct net *net); 12491da177e4SLinus Torvalds extern int ip_vs_conn_init(void); 12501da177e4SLinus Torvalds extern void ip_vs_conn_cleanup(void); 12511da177e4SLinus Torvalds 12521da177e4SLinus Torvalds static inline void ip_vs_control_del(struct ip_vs_conn *cp) 12531da177e4SLinus Torvalds { 12541da177e4SLinus Torvalds struct ip_vs_conn *ctl_cp = cp->control; 12551da177e4SLinus Torvalds if (!ctl_cp) { 1256cfc78c5aSJulius Volz IP_VS_ERR_BUF("request control DEL for uncontrolled: " 1257cfc78c5aSJulius Volz "%s:%d to %s:%d\n", 1258cfc78c5aSJulius Volz IP_VS_DBG_ADDR(cp->af, &cp->caddr), 1259cfc78c5aSJulius Volz ntohs(cp->cport), 1260cfc78c5aSJulius Volz IP_VS_DBG_ADDR(cp->af, &cp->vaddr), 1261cfc78c5aSJulius Volz ntohs(cp->vport)); 1262cfc78c5aSJulius Volz 12631da177e4SLinus Torvalds return; 12641da177e4SLinus Torvalds } 12651da177e4SLinus Torvalds 1266cfc78c5aSJulius Volz IP_VS_DBG_BUF(7, "DELeting control for: " 1267cfc78c5aSJulius Volz "cp.dst=%s:%d ctl_cp.dst=%s:%d\n", 1268cfc78c5aSJulius Volz IP_VS_DBG_ADDR(cp->af, &cp->caddr), 1269cfc78c5aSJulius Volz ntohs(cp->cport), 1270cfc78c5aSJulius Volz IP_VS_DBG_ADDR(cp->af, &ctl_cp->caddr), 1271cfc78c5aSJulius Volz ntohs(ctl_cp->cport)); 12721da177e4SLinus Torvalds 12731da177e4SLinus Torvalds cp->control = NULL; 12741da177e4SLinus Torvalds if (atomic_read(&ctl_cp->n_control) == 0) { 1275cfc78c5aSJulius Volz IP_VS_ERR_BUF("BUG control DEL with n=0 : " 1276cfc78c5aSJulius Volz "%s:%d to %s:%d\n", 1277cfc78c5aSJulius Volz IP_VS_DBG_ADDR(cp->af, &cp->caddr), 1278cfc78c5aSJulius Volz ntohs(cp->cport), 1279cfc78c5aSJulius Volz IP_VS_DBG_ADDR(cp->af, &cp->vaddr), 1280cfc78c5aSJulius Volz ntohs(cp->vport)); 1281cfc78c5aSJulius Volz 12821da177e4SLinus Torvalds return; 12831da177e4SLinus Torvalds } 12841da177e4SLinus Torvalds atomic_dec(&ctl_cp->n_control); 12851da177e4SLinus Torvalds } 12861da177e4SLinus Torvalds 12871da177e4SLinus Torvalds static inline void 12881da177e4SLinus Torvalds ip_vs_control_add(struct ip_vs_conn *cp, struct ip_vs_conn *ctl_cp) 12891da177e4SLinus Torvalds { 12901da177e4SLinus Torvalds if (cp->control) { 1291cfc78c5aSJulius Volz IP_VS_ERR_BUF("request control ADD for already controlled: " 1292cfc78c5aSJulius Volz "%s:%d to %s:%d\n", 1293cfc78c5aSJulius Volz IP_VS_DBG_ADDR(cp->af, &cp->caddr), 1294cfc78c5aSJulius Volz ntohs(cp->cport), 1295cfc78c5aSJulius Volz IP_VS_DBG_ADDR(cp->af, &cp->vaddr), 1296cfc78c5aSJulius Volz ntohs(cp->vport)); 1297cfc78c5aSJulius Volz 12981da177e4SLinus Torvalds ip_vs_control_del(cp); 12991da177e4SLinus Torvalds } 13001da177e4SLinus Torvalds 1301cfc78c5aSJulius Volz IP_VS_DBG_BUF(7, "ADDing control for: " 1302cfc78c5aSJulius Volz "cp.dst=%s:%d ctl_cp.dst=%s:%d\n", 1303cfc78c5aSJulius Volz IP_VS_DBG_ADDR(cp->af, &cp->caddr), 1304cfc78c5aSJulius Volz ntohs(cp->cport), 1305cfc78c5aSJulius Volz IP_VS_DBG_ADDR(cp->af, &ctl_cp->caddr), 1306cfc78c5aSJulius Volz ntohs(ctl_cp->cport)); 13071da177e4SLinus Torvalds 13081da177e4SLinus Torvalds cp->control = ctl_cp; 13091da177e4SLinus Torvalds atomic_inc(&ctl_cp->n_control); 13101da177e4SLinus Torvalds } 13111da177e4SLinus Torvalds 13127a4f0761SHans Schillstrom /* 13137a4f0761SHans Schillstrom * IPVS netns init & cleanup functions 13147a4f0761SHans Schillstrom */ 1315503cf15aSHans Schillstrom extern int ip_vs_estimator_net_init(struct net *net); 1316503cf15aSHans Schillstrom extern int ip_vs_control_net_init(struct net *net); 1317503cf15aSHans Schillstrom extern int ip_vs_protocol_net_init(struct net *net); 1318503cf15aSHans Schillstrom extern int ip_vs_app_net_init(struct net *net); 1319503cf15aSHans Schillstrom extern int ip_vs_conn_net_init(struct net *net); 1320503cf15aSHans Schillstrom extern int ip_vs_sync_net_init(struct net *net); 1321503cf15aSHans Schillstrom extern void ip_vs_conn_net_cleanup(struct net *net); 1322503cf15aSHans Schillstrom extern void ip_vs_app_net_cleanup(struct net *net); 1323503cf15aSHans Schillstrom extern void ip_vs_protocol_net_cleanup(struct net *net); 1324503cf15aSHans Schillstrom extern void ip_vs_control_net_cleanup(struct net *net); 1325503cf15aSHans Schillstrom extern void ip_vs_estimator_net_cleanup(struct net *net); 1326503cf15aSHans Schillstrom extern void ip_vs_sync_net_cleanup(struct net *net); 1327503cf15aSHans Schillstrom extern void ip_vs_service_net_cleanup(struct net *net); 13281da177e4SLinus Torvalds 13291da177e4SLinus Torvalds /* 13301da177e4SLinus Torvalds * IPVS application functions 13311da177e4SLinus Torvalds * (from ip_vs_app.c) 13321da177e4SLinus Torvalds */ 13331da177e4SLinus Torvalds #define IP_VS_APP_MAX_PORTS 8 1334be97fdb5SJulian Anastasov extern struct ip_vs_app *register_ip_vs_app(struct net *net, 1335be97fdb5SJulian Anastasov struct ip_vs_app *app); 1336ab8a5e84SHans Schillstrom extern void unregister_ip_vs_app(struct net *net, struct ip_vs_app *app); 13371da177e4SLinus Torvalds extern int ip_vs_bind_app(struct ip_vs_conn *cp, struct ip_vs_protocol *pp); 13381da177e4SLinus Torvalds extern void ip_vs_unbind_app(struct ip_vs_conn *cp); 1339ab8a5e84SHans Schillstrom extern int register_ip_vs_app_inc(struct net *net, struct ip_vs_app *app, 1340ab8a5e84SHans Schillstrom __u16 proto, __u16 port); 13411da177e4SLinus Torvalds extern int ip_vs_app_inc_get(struct ip_vs_app *inc); 13421da177e4SLinus Torvalds extern void ip_vs_app_inc_put(struct ip_vs_app *inc); 13431da177e4SLinus Torvalds 13443db05feaSHerbert Xu extern int ip_vs_app_pkt_out(struct ip_vs_conn *, struct sk_buff *skb); 13453db05feaSHerbert Xu extern int ip_vs_app_pkt_in(struct ip_vs_conn *, struct sk_buff *skb); 13461da177e4SLinus Torvalds 13478be67a66SSimon Horman void ip_vs_bind_pe(struct ip_vs_service *svc, struct ip_vs_pe *pe); 13488be67a66SSimon Horman void ip_vs_unbind_pe(struct ip_vs_service *svc); 13498be67a66SSimon Horman int register_ip_vs_pe(struct ip_vs_pe *pe); 13508be67a66SSimon Horman int unregister_ip_vs_pe(struct ip_vs_pe *pe); 1351e9e5eee8SSimon Horman struct ip_vs_pe *ip_vs_pe_getbyname(const char *name); 1352fe5e7a1eSHans Schillstrom struct ip_vs_pe *__ip_vs_pe_getbyname(const char *pe_name); 1353e9e5eee8SSimon Horman 135469e7dae4SPaul Gortmaker /* 135569e7dae4SPaul Gortmaker * Use a #define to avoid all of module.h just for these trivial ops 135669e7dae4SPaul Gortmaker */ 135769e7dae4SPaul Gortmaker #define ip_vs_pe_get(pe) \ 135869e7dae4SPaul Gortmaker if (pe && pe->module) \ 1359e9e5eee8SSimon Horman __module_get(pe->module); 1360e9e5eee8SSimon Horman 136169e7dae4SPaul Gortmaker #define ip_vs_pe_put(pe) \ 136269e7dae4SPaul Gortmaker if (pe && pe->module) \ 1363e9e5eee8SSimon Horman module_put(pe->module); 13641da177e4SLinus Torvalds 13651da177e4SLinus Torvalds /* 13661da177e4SLinus Torvalds * IPVS protocol functions (from ip_vs_proto.c) 13671da177e4SLinus Torvalds */ 13681da177e4SLinus Torvalds extern int ip_vs_protocol_init(void); 13691da177e4SLinus Torvalds extern void ip_vs_protocol_cleanup(void); 13709330419dSHans Schillstrom extern void ip_vs_protocol_timeout_change(struct netns_ipvs *ipvs, int flags); 13711da177e4SLinus Torvalds extern int *ip_vs_create_timeout_table(int *table, int size); 13721da177e4SLinus Torvalds extern int 137336cbd3dcSJan Engelhardt ip_vs_set_state_timeout(int *table, int num, const char *const *names, 137436cbd3dcSJan Engelhardt const char *name, int to); 13751da177e4SLinus Torvalds extern void 13760d79641aSJulian Anastasov ip_vs_tcpudp_debug_packet(int af, struct ip_vs_protocol *pp, 13770d79641aSJulian Anastasov const struct sk_buff *skb, 13781da177e4SLinus Torvalds int offset, const char *msg); 13791da177e4SLinus Torvalds 13801da177e4SLinus Torvalds extern struct ip_vs_protocol ip_vs_protocol_tcp; 13811da177e4SLinus Torvalds extern struct ip_vs_protocol ip_vs_protocol_udp; 13821da177e4SLinus Torvalds extern struct ip_vs_protocol ip_vs_protocol_icmp; 13831da177e4SLinus Torvalds extern struct ip_vs_protocol ip_vs_protocol_esp; 13841da177e4SLinus Torvalds extern struct ip_vs_protocol ip_vs_protocol_ah; 13852906f66aSVenkata Mohan Reddy extern struct ip_vs_protocol ip_vs_protocol_sctp; 13861da177e4SLinus Torvalds 13871da177e4SLinus Torvalds /* 13881da177e4SLinus Torvalds * Registering/unregistering scheduler functions 13891da177e4SLinus Torvalds * (from ip_vs_sched.c) 13901da177e4SLinus Torvalds */ 13911da177e4SLinus Torvalds extern int register_ip_vs_scheduler(struct ip_vs_scheduler *scheduler); 13921da177e4SLinus Torvalds extern int unregister_ip_vs_scheduler(struct ip_vs_scheduler *scheduler); 13931da177e4SLinus Torvalds extern int ip_vs_bind_scheduler(struct ip_vs_service *svc, 13941da177e4SLinus Torvalds struct ip_vs_scheduler *scheduler); 1395*ed3ffc4eSJulian Anastasov extern void ip_vs_unbind_scheduler(struct ip_vs_service *svc); 13961da177e4SLinus Torvalds extern struct ip_vs_scheduler *ip_vs_scheduler_get(const char *sched_name); 13971da177e4SLinus Torvalds extern void ip_vs_scheduler_put(struct ip_vs_scheduler *scheduler); 13981da177e4SLinus Torvalds extern struct ip_vs_conn * 1399190ecd27SJulian Anastasov ip_vs_schedule(struct ip_vs_service *svc, struct sk_buff *skb, 1400d4383f04SJesper Dangaard Brouer struct ip_vs_proto_data *pd, int *ignored, 1401d4383f04SJesper Dangaard Brouer struct ip_vs_iphdr *iph); 14021da177e4SLinus Torvalds extern int ip_vs_leave(struct ip_vs_service *svc, struct sk_buff *skb, 1403d4383f04SJesper Dangaard Brouer struct ip_vs_proto_data *pd, struct ip_vs_iphdr *iph); 14041da177e4SLinus Torvalds 140541ac51eeSPatrick Schaaf extern void ip_vs_scheduler_err(struct ip_vs_service *svc, const char *msg); 140641ac51eeSPatrick Schaaf 14071da177e4SLinus Torvalds 14081da177e4SLinus Torvalds /* 14091da177e4SLinus Torvalds * IPVS control data and functions (from ip_vs_ctl.c) 14101da177e4SLinus Torvalds */ 14111da177e4SLinus Torvalds extern struct ip_vs_stats ip_vs_stats; 1412b880c1f0SHans Schillstrom extern int sysctl_ip_vs_sync_ver; 14131da177e4SLinus Torvalds 14141da177e4SLinus Torvalds extern struct ip_vs_service * 1415fc723250SHans Schillstrom ip_vs_service_get(struct net *net, int af, __u32 fwmark, __u16 protocol, 14163c2e0505SJulius Volz const union nf_inet_addr *vaddr, __be16 vport); 14171da177e4SLinus Torvalds 14181da177e4SLinus Torvalds static inline void ip_vs_service_put(struct ip_vs_service *svc) 14191da177e4SLinus Torvalds { 14201da177e4SLinus Torvalds atomic_dec(&svc->usecnt); 14211da177e4SLinus Torvalds } 14221da177e4SLinus Torvalds 1423276472eaSJulian Anastasov extern bool 1424276472eaSJulian Anastasov ip_vs_has_real_service(struct net *net, int af, __u16 protocol, 14257937df15SJulius Volz const union nf_inet_addr *daddr, __be16 dport); 14267937df15SJulius Volz 14271da177e4SLinus Torvalds extern int ip_vs_use_count_inc(void); 14281da177e4SLinus Torvalds extern void ip_vs_use_count_dec(void); 14298537de8aSHans Schillstrom extern int ip_vs_register_nl_ioctl(void); 14308537de8aSHans Schillstrom extern void ip_vs_unregister_nl_ioctl(void); 14311da177e4SLinus Torvalds extern int ip_vs_control_init(void); 14321da177e4SLinus Torvalds extern void ip_vs_control_cleanup(void); 14331e356f9cSRumen G. Bogdanovski extern struct ip_vs_dest * 1434fc723250SHans Schillstrom ip_vs_find_dest(struct net *net, int af, const union nf_inet_addr *daddr, 1435fc723250SHans Schillstrom __be16 dport, const union nf_inet_addr *vaddr, __be16 vport, 143652793dbeSJulian Anastasov __u16 protocol, __u32 fwmark, __u32 flags); 14371e356f9cSRumen G. Bogdanovski extern struct ip_vs_dest *ip_vs_try_bind_dest(struct ip_vs_conn *cp); 14381da177e4SLinus Torvalds 1439fca9c20aSJulian Anastasov static inline void ip_vs_dest_hold(struct ip_vs_dest *dest) 1440fca9c20aSJulian Anastasov { 1441fca9c20aSJulian Anastasov atomic_inc(&dest->refcnt); 1442fca9c20aSJulian Anastasov } 1443fca9c20aSJulian Anastasov 1444fca9c20aSJulian Anastasov static inline void ip_vs_dest_put(struct ip_vs_dest *dest) 1445fca9c20aSJulian Anastasov { 1446fca9c20aSJulian Anastasov smp_mb__before_atomic_dec(); 1447fca9c20aSJulian Anastasov atomic_dec(&dest->refcnt); 1448fca9c20aSJulian Anastasov } 14491da177e4SLinus Torvalds 14501da177e4SLinus Torvalds /* 14511da177e4SLinus Torvalds * IPVS sync daemon data and function prototypes 14521da177e4SLinus Torvalds * (from ip_vs_sync.c) 14531da177e4SLinus Torvalds */ 1454f131315fSHans Schillstrom extern int start_sync_thread(struct net *net, int state, char *mcast_ifn, 1455f131315fSHans Schillstrom __u8 syncid); 1456f131315fSHans Schillstrom extern int stop_sync_thread(struct net *net, int state); 1457749c42b6SJulian Anastasov extern void ip_vs_sync_conn(struct net *net, struct ip_vs_conn *cp, int pkts); 14581da177e4SLinus Torvalds 14591da177e4SLinus Torvalds 14601da177e4SLinus Torvalds /* 14611da177e4SLinus Torvalds * IPVS rate estimator prototypes (from ip_vs_est.c) 14621da177e4SLinus Torvalds */ 14636ef757f9SJulian Anastasov extern void ip_vs_start_estimator(struct net *net, struct ip_vs_stats *stats); 14646ef757f9SJulian Anastasov extern void ip_vs_stop_estimator(struct net *net, struct ip_vs_stats *stats); 14651da177e4SLinus Torvalds extern void ip_vs_zero_estimator(struct ip_vs_stats *stats); 1466ea9f22ccSJulian Anastasov extern void ip_vs_read_estimator(struct ip_vs_stats_user *dst, 1467ea9f22ccSJulian Anastasov struct ip_vs_stats *stats); 14681da177e4SLinus Torvalds 14691da177e4SLinus Torvalds /* 14701da177e4SLinus Torvalds * Various IPVS packet transmitters (from ip_vs_xmit.c) 14711da177e4SLinus Torvalds */ 1472d4383f04SJesper Dangaard Brouer extern int ip_vs_null_xmit(struct sk_buff *skb, struct ip_vs_conn *cp, 1473d4383f04SJesper Dangaard Brouer struct ip_vs_protocol *pp, struct ip_vs_iphdr *iph); 1474d4383f04SJesper Dangaard Brouer extern int ip_vs_bypass_xmit(struct sk_buff *skb, struct ip_vs_conn *cp, 1475d4383f04SJesper Dangaard Brouer struct ip_vs_protocol *pp, 1476d4383f04SJesper Dangaard Brouer struct ip_vs_iphdr *iph); 1477d4383f04SJesper Dangaard Brouer extern int ip_vs_nat_xmit(struct sk_buff *skb, struct ip_vs_conn *cp, 1478d4383f04SJesper Dangaard Brouer struct ip_vs_protocol *pp, struct ip_vs_iphdr *iph); 1479d4383f04SJesper Dangaard Brouer extern int ip_vs_tunnel_xmit(struct sk_buff *skb, struct ip_vs_conn *cp, 1480d4383f04SJesper Dangaard Brouer struct ip_vs_protocol *pp, 1481d4383f04SJesper Dangaard Brouer struct ip_vs_iphdr *iph); 1482d4383f04SJesper Dangaard Brouer extern int ip_vs_dr_xmit(struct sk_buff *skb, struct ip_vs_conn *cp, 1483d4383f04SJesper Dangaard Brouer struct ip_vs_protocol *pp, struct ip_vs_iphdr *iph); 1484d4383f04SJesper Dangaard Brouer extern int ip_vs_icmp_xmit(struct sk_buff *skb, struct ip_vs_conn *cp, 1485d4383f04SJesper Dangaard Brouer struct ip_vs_protocol *pp, int offset, 1486d4383f04SJesper Dangaard Brouer unsigned int hooknum, struct ip_vs_iphdr *iph); 1487026ace06SJulian Anastasov extern void ip_vs_dest_dst_rcu_free(struct rcu_head *head); 14881da177e4SLinus Torvalds 1489b3cdd2a7SJulius Volz #ifdef CONFIG_IP_VS_IPV6 1490d4383f04SJesper Dangaard Brouer extern int ip_vs_bypass_xmit_v6(struct sk_buff *skb, struct ip_vs_conn *cp, 1491d4383f04SJesper Dangaard Brouer struct ip_vs_protocol *pp, 1492d4383f04SJesper Dangaard Brouer struct ip_vs_iphdr *iph); 1493d4383f04SJesper Dangaard Brouer extern int ip_vs_nat_xmit_v6(struct sk_buff *skb, struct ip_vs_conn *cp, 1494d4383f04SJesper Dangaard Brouer struct ip_vs_protocol *pp, 1495d4383f04SJesper Dangaard Brouer struct ip_vs_iphdr *iph); 1496d4383f04SJesper Dangaard Brouer extern int ip_vs_tunnel_xmit_v6(struct sk_buff *skb, struct ip_vs_conn *cp, 1497d4383f04SJesper Dangaard Brouer struct ip_vs_protocol *pp, 1498d4383f04SJesper Dangaard Brouer struct ip_vs_iphdr *iph); 1499d4383f04SJesper Dangaard Brouer extern int ip_vs_dr_xmit_v6(struct sk_buff *skb, struct ip_vs_conn *cp, 1500d4383f04SJesper Dangaard Brouer struct ip_vs_protocol *pp, struct ip_vs_iphdr *iph); 1501d4383f04SJesper Dangaard Brouer extern int ip_vs_icmp_xmit_v6(struct sk_buff *skb, struct ip_vs_conn *cp, 1502d4383f04SJesper Dangaard Brouer struct ip_vs_protocol *pp, int offset, 1503d4383f04SJesper Dangaard Brouer unsigned int hooknum, struct ip_vs_iphdr *iph); 1504b3cdd2a7SJulius Volz #endif 15051da177e4SLinus Torvalds 15063a1bbf18SSimon Horman #ifdef CONFIG_SYSCTL 15071da177e4SLinus Torvalds /* 15081da177e4SLinus Torvalds * This is a simple mechanism to ignore packets when 15091da177e4SLinus Torvalds * we are loaded. Just set ip_vs_drop_rate to 'n' and 15101da177e4SLinus Torvalds * we start to drop 1/rate of the packets 15111da177e4SLinus Torvalds */ 15121da177e4SLinus Torvalds 1513a0840e2eSHans Schillstrom static inline int ip_vs_todrop(struct netns_ipvs *ipvs) 15141da177e4SLinus Torvalds { 1515a0840e2eSHans Schillstrom if (!ipvs->drop_rate) 1516a0840e2eSHans Schillstrom return 0; 1517a0840e2eSHans Schillstrom if (--ipvs->drop_counter > 0) 1518a0840e2eSHans Schillstrom return 0; 1519a0840e2eSHans Schillstrom ipvs->drop_counter = ipvs->drop_rate; 15201da177e4SLinus Torvalds return 1; 15211da177e4SLinus Torvalds } 15223a1bbf18SSimon Horman #else 15233a1bbf18SSimon Horman static inline int ip_vs_todrop(struct netns_ipvs *ipvs) { return 0; } 15243a1bbf18SSimon Horman #endif 15251da177e4SLinus Torvalds 15261da177e4SLinus Torvalds /* 15271da177e4SLinus Torvalds * ip_vs_fwd_tag returns the forwarding tag of the connection 15281da177e4SLinus Torvalds */ 15291da177e4SLinus Torvalds #define IP_VS_FWD_METHOD(cp) (cp->flags & IP_VS_CONN_F_FWD_MASK) 15301da177e4SLinus Torvalds 1531732db659SAdrian Bunk static inline char ip_vs_fwd_tag(struct ip_vs_conn *cp) 15321da177e4SLinus Torvalds { 15331da177e4SLinus Torvalds char fwd; 15341da177e4SLinus Torvalds 15351da177e4SLinus Torvalds switch (IP_VS_FWD_METHOD(cp)) { 15361da177e4SLinus Torvalds case IP_VS_CONN_F_MASQ: 15371da177e4SLinus Torvalds fwd = 'M'; break; 15381da177e4SLinus Torvalds case IP_VS_CONN_F_LOCALNODE: 15391da177e4SLinus Torvalds fwd = 'L'; break; 15401da177e4SLinus Torvalds case IP_VS_CONN_F_TUNNEL: 15411da177e4SLinus Torvalds fwd = 'T'; break; 15421da177e4SLinus Torvalds case IP_VS_CONN_F_DROUTE: 15431da177e4SLinus Torvalds fwd = 'R'; break; 15441da177e4SLinus Torvalds case IP_VS_CONN_F_BYPASS: 15451da177e4SLinus Torvalds fwd = 'B'; break; 15461da177e4SLinus Torvalds default: 15471da177e4SLinus Torvalds fwd = '?'; break; 15481da177e4SLinus Torvalds } 15491da177e4SLinus Torvalds return fwd; 15501da177e4SLinus Torvalds } 15511da177e4SLinus Torvalds 15521da177e4SLinus Torvalds extern void ip_vs_nat_icmp(struct sk_buff *skb, struct ip_vs_protocol *pp, 15531da177e4SLinus Torvalds struct ip_vs_conn *cp, int dir); 15541da177e4SLinus Torvalds 1555b3cdd2a7SJulius Volz #ifdef CONFIG_IP_VS_IPV6 1556b3cdd2a7SJulius Volz extern void ip_vs_nat_icmp_v6(struct sk_buff *skb, struct ip_vs_protocol *pp, 1557b3cdd2a7SJulius Volz struct ip_vs_conn *cp, int dir); 1558b3cdd2a7SJulius Volz #endif 1559b3cdd2a7SJulius Volz 1560b1550f22SAl Viro extern __sum16 ip_vs_checksum_complete(struct sk_buff *skb, int offset); 15611da177e4SLinus Torvalds 1562f9214b26SAl Viro static inline __wsum ip_vs_check_diff4(__be32 old, __be32 new, __wsum oldsum) 15631da177e4SLinus Torvalds { 1564f9214b26SAl Viro __be32 diff[2] = { ~old, new }; 15651da177e4SLinus Torvalds 156607f0757aSJoe Perches return csum_partial(diff, sizeof(diff), oldsum); 1567f9214b26SAl Viro } 1568f9214b26SAl Viro 15690bbdd42bSJulius Volz #ifdef CONFIG_IP_VS_IPV6 15700bbdd42bSJulius Volz static inline __wsum ip_vs_check_diff16(const __be32 *old, const __be32 *new, 15710bbdd42bSJulius Volz __wsum oldsum) 15720bbdd42bSJulius Volz { 15730bbdd42bSJulius Volz __be32 diff[8] = { ~old[3], ~old[2], ~old[1], ~old[0], 15740bbdd42bSJulius Volz new[3], new[2], new[1], new[0] }; 15750bbdd42bSJulius Volz 157607f0757aSJoe Perches return csum_partial(diff, sizeof(diff), oldsum); 15770bbdd42bSJulius Volz } 15780bbdd42bSJulius Volz #endif 15790bbdd42bSJulius Volz 1580f9214b26SAl Viro static inline __wsum ip_vs_check_diff2(__be16 old, __be16 new, __wsum oldsum) 1581f9214b26SAl Viro { 1582f9214b26SAl Viro __be16 diff[2] = { ~old, new }; 1583f9214b26SAl Viro 158407f0757aSJoe Perches return csum_partial(diff, sizeof(diff), oldsum); 15851da177e4SLinus Torvalds } 15861da177e4SLinus Torvalds 1587cf356d69SJulian Anastasov /* 1588cf356d69SJulian Anastasov * Forget current conntrack (unconfirmed) and attach notrack entry 1589cf356d69SJulian Anastasov */ 1590cf356d69SJulian Anastasov static inline void ip_vs_notrack(struct sk_buff *skb) 1591cf356d69SJulian Anastasov { 1592cf356d69SJulian Anastasov #if defined(CONFIG_NF_CONNTRACK) || defined(CONFIG_NF_CONNTRACK_MODULE) 1593cf356d69SJulian Anastasov enum ip_conntrack_info ctinfo; 159406b69390SJesper Juhl struct nf_conn *ct = nf_ct_get(skb, &ctinfo); 1595cf356d69SJulian Anastasov 1596cf356d69SJulian Anastasov if (!ct || !nf_ct_is_untracked(ct)) { 15979e33ce45SLin Ming nf_conntrack_put(skb->nfct); 1598cf356d69SJulian Anastasov skb->nfct = &nf_ct_untracked_get()->ct_general; 1599cf356d69SJulian Anastasov skb->nfctinfo = IP_CT_NEW; 1600cf356d69SJulian Anastasov nf_conntrack_get(skb->nfct); 1601cf356d69SJulian Anastasov } 1602cf356d69SJulian Anastasov #endif 1603cf356d69SJulian Anastasov } 1604cf356d69SJulian Anastasov 1605f4bc17cdSJulian Anastasov #ifdef CONFIG_IP_VS_NFCT 1606f4bc17cdSJulian Anastasov /* 1607f4bc17cdSJulian Anastasov * Netfilter connection tracking 1608f4bc17cdSJulian Anastasov * (from ip_vs_nfct.c) 1609f4bc17cdSJulian Anastasov */ 1610a0840e2eSHans Schillstrom static inline int ip_vs_conntrack_enabled(struct netns_ipvs *ipvs) 1611f4bc17cdSJulian Anastasov { 1612a4e2f5a7SSimon Horman #ifdef CONFIG_SYSCTL 1613a0840e2eSHans Schillstrom return ipvs->sysctl_conntrack; 1614a4e2f5a7SSimon Horman #else 1615a4e2f5a7SSimon Horman return 0; 1616a4e2f5a7SSimon Horman #endif 1617f4bc17cdSJulian Anastasov } 1618f4bc17cdSJulian Anastasov 16196523ce15SJulian Anastasov extern void ip_vs_update_conntrack(struct sk_buff *skb, struct ip_vs_conn *cp, 16206523ce15SJulian Anastasov int outin); 16213c2de2aeSSimon Horman extern int ip_vs_confirm_conntrack(struct sk_buff *skb); 1622f4bc17cdSJulian Anastasov extern void ip_vs_nfct_expect_related(struct sk_buff *skb, struct nf_conn *ct, 1623f4bc17cdSJulian Anastasov struct ip_vs_conn *cp, u_int8_t proto, 1624f4bc17cdSJulian Anastasov const __be16 port, int from_rs); 1625f4bc17cdSJulian Anastasov extern void ip_vs_conn_drop_conntrack(struct ip_vs_conn *cp); 1626f4bc17cdSJulian Anastasov 1627f4bc17cdSJulian Anastasov #else 1628f4bc17cdSJulian Anastasov 1629a0840e2eSHans Schillstrom static inline int ip_vs_conntrack_enabled(struct netns_ipvs *ipvs) 1630f4bc17cdSJulian Anastasov { 1631f4bc17cdSJulian Anastasov return 0; 1632f4bc17cdSJulian Anastasov } 1633f4bc17cdSJulian Anastasov 1634f4bc17cdSJulian Anastasov static inline void ip_vs_update_conntrack(struct sk_buff *skb, 1635f4bc17cdSJulian Anastasov struct ip_vs_conn *cp, int outin) 1636f4bc17cdSJulian Anastasov { 1637f4bc17cdSJulian Anastasov } 1638f4bc17cdSJulian Anastasov 1639e23ebf0fSKrzysztof Wilczynski static inline int ip_vs_confirm_conntrack(struct sk_buff *skb) 1640f4bc17cdSJulian Anastasov { 1641f4bc17cdSJulian Anastasov return NF_ACCEPT; 1642f4bc17cdSJulian Anastasov } 1643f4bc17cdSJulian Anastasov 1644f4bc17cdSJulian Anastasov static inline void ip_vs_conn_drop_conntrack(struct ip_vs_conn *cp) 1645f4bc17cdSJulian Anastasov { 1646f4bc17cdSJulian Anastasov } 1647f4bc17cdSJulian Anastasov /* CONFIG_IP_VS_NFCT */ 1648f4bc17cdSJulian Anastasov #endif 16496523ce15SJulian Anastasov 1650b552f7e3SChangli Gao static inline unsigned int 1651b552f7e3SChangli Gao ip_vs_dest_conn_overhead(struct ip_vs_dest *dest) 1652b552f7e3SChangli Gao { 1653b552f7e3SChangli Gao /* 1654b552f7e3SChangli Gao * We think the overhead of processing active connections is 256 1655b552f7e3SChangli Gao * times higher than that of inactive connections in average. (This 1656b552f7e3SChangli Gao * 256 times might not be accurate, we will change it later) We 1657b552f7e3SChangli Gao * use the following formula to estimate the overhead now: 1658b552f7e3SChangli Gao * dest->activeconns*256 + dest->inactconns 1659b552f7e3SChangli Gao */ 1660b552f7e3SChangli Gao return (atomic_read(&dest->activeconns) << 8) + 1661b552f7e3SChangli Gao atomic_read(&dest->inactconns); 1662b552f7e3SChangli Gao } 1663b552f7e3SChangli Gao 1664bc4768ebSJulius Volz #endif /* _NET_IP_VS_H */ 1665