11da177e4SLinus Torvalds /* 21da177e4SLinus Torvalds * IP Virtual Server 31da177e4SLinus Torvalds * data structure and functionality definitions 41da177e4SLinus Torvalds */ 51da177e4SLinus Torvalds 6bc4768ebSJulius Volz #ifndef _NET_IP_VS_H 7bc4768ebSJulius Volz #define _NET_IP_VS_H 81da177e4SLinus Torvalds 9bc4768ebSJulius Volz #include <linux/ip_vs.h> /* definitions shared with userland */ 101da177e4SLinus Torvalds 11bc4768ebSJulius Volz /* old ipvsadm versions still include this file directly */ 121da177e4SLinus Torvalds #ifdef __KERNEL__ 131da177e4SLinus Torvalds 14bc4768ebSJulius Volz #include <asm/types.h> /* for __uXX types */ 15bc4768ebSJulius Volz 16bc4768ebSJulius Volz #include <linux/sysctl.h> /* for ctl_path */ 171da177e4SLinus Torvalds #include <linux/list.h> /* for struct list_head */ 181da177e4SLinus Torvalds #include <linux/spinlock.h> /* for struct rwlock_t */ 191da177e4SLinus Torvalds #include <asm/atomic.h> /* for struct atomic_t */ 201da177e4SLinus Torvalds #include <linux/compiler.h> 2114c85021SArnaldo Carvalho de Melo #include <linux/timer.h> 221da177e4SLinus Torvalds 2314c85021SArnaldo Carvalho de Melo #include <net/checksum.h> 24e7ade46aSJulius Volz #include <linux/netfilter.h> /* for union nf_inet_addr */ 251668e010SKOVACS Krisztian #include <linux/ip.h> 26e7ade46aSJulius Volz #include <linux/ipv6.h> /* for struct ipv6hdr */ 27e7ade46aSJulius Volz #include <net/ipv6.h> /* for ipv6_addr_copy */ 28cf356d69SJulian Anastasov #if defined(CONFIG_NF_CONNTRACK) || defined(CONFIG_NF_CONNTRACK_MODULE) 29f4bc17cdSJulian Anastasov #include <net/netfilter/nf_conntrack.h> 30f4bc17cdSJulian Anastasov #endif 3161b1ab45SHans Schillstrom #include <net/net_namespace.h> /* Netw namespace */ 3261b1ab45SHans Schillstrom 3361b1ab45SHans Schillstrom /* 3461b1ab45SHans Schillstrom * Generic access of ipvs struct 3561b1ab45SHans Schillstrom */ 3661b1ab45SHans Schillstrom static inline struct netns_ipvs *net_ipvs(struct net* net) 3761b1ab45SHans Schillstrom { 
3861b1ab45SHans Schillstrom return net->ipvs; 3961b1ab45SHans Schillstrom } 40fc723250SHans Schillstrom /* 41fc723250SHans Schillstrom * Get net ptr from skb in traffic cases 42fc723250SHans Schillstrom * use skb_sknet when call is from userland (ioctl or netlink) 43fc723250SHans Schillstrom */ 44a0840e2eSHans Schillstrom static inline struct net *skb_net(const struct sk_buff *skb) 45fc723250SHans Schillstrom { 46fc723250SHans Schillstrom #ifdef CONFIG_NET_NS 47fc723250SHans Schillstrom #ifdef CONFIG_IP_VS_DEBUG 48fc723250SHans Schillstrom /* 49fc723250SHans Schillstrom * This is used for debug only. 50fc723250SHans Schillstrom * Start with the most likely hit 51fc723250SHans Schillstrom * End with BUG 52fc723250SHans Schillstrom */ 53fc723250SHans Schillstrom if (likely(skb->dev && skb->dev->nd_net)) 54fc723250SHans Schillstrom return dev_net(skb->dev); 55fc723250SHans Schillstrom if (skb_dst(skb)->dev) 56fc723250SHans Schillstrom return dev_net(skb_dst(skb)->dev); 57fc723250SHans Schillstrom WARN(skb->sk, "Maybe skb_sknet should be used in %s() at line:%d\n", 58fc723250SHans Schillstrom __func__, __LINE__); 59fc723250SHans Schillstrom if (likely(skb->sk && skb->sk->sk_net)) 60fc723250SHans Schillstrom return sock_net(skb->sk); 61fc723250SHans Schillstrom pr_err("There is no net ptr to find in the skb in %s() line:%d\n", 62fc723250SHans Schillstrom __func__, __LINE__); 63fc723250SHans Schillstrom BUG(); 64fc723250SHans Schillstrom #else 65fc723250SHans Schillstrom return dev_net(skb->dev ? 
: skb_dst(skb)->dev); 66fc723250SHans Schillstrom #endif 67fc723250SHans Schillstrom #else 68fc723250SHans Schillstrom return &init_net; 69fc723250SHans Schillstrom #endif 70fc723250SHans Schillstrom } 71fc723250SHans Schillstrom 72a0840e2eSHans Schillstrom static inline struct net *skb_sknet(const struct sk_buff *skb) 73fc723250SHans Schillstrom { 74fc723250SHans Schillstrom #ifdef CONFIG_NET_NS 75fc723250SHans Schillstrom #ifdef CONFIG_IP_VS_DEBUG 76fc723250SHans Schillstrom /* Start with the most likely hit */ 77fc723250SHans Schillstrom if (likely(skb->sk && skb->sk->sk_net)) 78fc723250SHans Schillstrom return sock_net(skb->sk); 79fc723250SHans Schillstrom WARN(skb->dev, "Maybe skb_net should be used instead in %s() line:%d\n", 80fc723250SHans Schillstrom __func__, __LINE__); 81fc723250SHans Schillstrom if (likely(skb->dev && skb->dev->nd_net)) 82fc723250SHans Schillstrom return dev_net(skb->dev); 83fc723250SHans Schillstrom pr_err("There is no net ptr to find in the skb in %s() line:%d\n", 84fc723250SHans Schillstrom __func__, __LINE__); 85fc723250SHans Schillstrom BUG(); 86fc723250SHans Schillstrom #else 87fc723250SHans Schillstrom return sock_net(skb->sk); 88fc723250SHans Schillstrom #endif 89fc723250SHans Schillstrom #else 90fc723250SHans Schillstrom return &init_net; 91fc723250SHans Schillstrom #endif 92fc723250SHans Schillstrom } 93b17fc996SHans Schillstrom /* 94b17fc996SHans Schillstrom * This one needed for single_open_net since net is stored directly in 95b17fc996SHans Schillstrom * private not as a struct i.e. seq_file_net cant be used. 
96b17fc996SHans Schillstrom */ 97b17fc996SHans Schillstrom static inline struct net *seq_file_single_net(struct seq_file *seq) 98b17fc996SHans Schillstrom { 99b17fc996SHans Schillstrom #ifdef CONFIG_NET_NS 100b17fc996SHans Schillstrom return (struct net *)seq->private; 101b17fc996SHans Schillstrom #else 102b17fc996SHans Schillstrom return &init_net; 103b17fc996SHans Schillstrom #endif 104b17fc996SHans Schillstrom } 1056f7edb48SCatalin(ux) M. BOIE 1066f7edb48SCatalin(ux) M. BOIE /* Connections' size value needed by ip_vs_ctl.c */ 1076f7edb48SCatalin(ux) M. BOIE extern int ip_vs_conn_tab_size; 1086f7edb48SCatalin(ux) M. BOIE 1096f7edb48SCatalin(ux) M. BOIE 11064aae3cbSJulius Volz struct ip_vs_iphdr { 11164aae3cbSJulius Volz int len; 11264aae3cbSJulius Volz __u8 protocol; 11364aae3cbSJulius Volz union nf_inet_addr saddr; 11464aae3cbSJulius Volz union nf_inet_addr daddr; 11564aae3cbSJulius Volz }; 11664aae3cbSJulius Volz 11764aae3cbSJulius Volz static inline void 11864aae3cbSJulius Volz ip_vs_fill_iphdr(int af, const void *nh, struct ip_vs_iphdr *iphdr) 11964aae3cbSJulius Volz { 12064aae3cbSJulius Volz #ifdef CONFIG_IP_VS_IPV6 12164aae3cbSJulius Volz if (af == AF_INET6) { 12264aae3cbSJulius Volz const struct ipv6hdr *iph = nh; 12364aae3cbSJulius Volz iphdr->len = sizeof(struct ipv6hdr); 12464aae3cbSJulius Volz iphdr->protocol = iph->nexthdr; 12564aae3cbSJulius Volz ipv6_addr_copy(&iphdr->saddr.in6, &iph->saddr); 12664aae3cbSJulius Volz ipv6_addr_copy(&iphdr->daddr.in6, &iph->daddr); 12764aae3cbSJulius Volz } else 12864aae3cbSJulius Volz #endif 12964aae3cbSJulius Volz { 13064aae3cbSJulius Volz const struct iphdr *iph = nh; 13164aae3cbSJulius Volz iphdr->len = iph->ihl * 4; 13264aae3cbSJulius Volz iphdr->protocol = iph->protocol; 13364aae3cbSJulius Volz iphdr->saddr.ip = iph->saddr; 13464aae3cbSJulius Volz iphdr->daddr.ip = iph->daddr; 13564aae3cbSJulius Volz } 13664aae3cbSJulius Volz } 13764aae3cbSJulius Volz 13864aae3cbSJulius Volz static inline void 
ip_vs_addr_copy(int af, union nf_inet_addr *dst, 13964aae3cbSJulius Volz const union nf_inet_addr *src) 14064aae3cbSJulius Volz { 14164aae3cbSJulius Volz #ifdef CONFIG_IP_VS_IPV6 14264aae3cbSJulius Volz if (af == AF_INET6) 14364aae3cbSJulius Volz ipv6_addr_copy(&dst->in6, &src->in6); 14464aae3cbSJulius Volz else 14564aae3cbSJulius Volz #endif 14664aae3cbSJulius Volz dst->ip = src->ip; 14764aae3cbSJulius Volz } 14864aae3cbSJulius Volz 14964aae3cbSJulius Volz static inline int ip_vs_addr_equal(int af, const union nf_inet_addr *a, 15064aae3cbSJulius Volz const union nf_inet_addr *b) 15164aae3cbSJulius Volz { 15264aae3cbSJulius Volz #ifdef CONFIG_IP_VS_IPV6 15364aae3cbSJulius Volz if (af == AF_INET6) 15464aae3cbSJulius Volz return ipv6_addr_equal(&a->in6, &b->in6); 15564aae3cbSJulius Volz #endif 15664aae3cbSJulius Volz return a->ip == b->ip; 15764aae3cbSJulius Volz } 15864aae3cbSJulius Volz 1591da177e4SLinus Torvalds #ifdef CONFIG_IP_VS_DEBUG 16014c85021SArnaldo Carvalho de Melo #include <linux/net.h> 16114c85021SArnaldo Carvalho de Melo 1621da177e4SLinus Torvalds extern int ip_vs_get_debug_level(void); 163c842a3adSJulius Volz 164c842a3adSJulius Volz static inline const char *ip_vs_dbg_addr(int af, char *buf, size_t buf_len, 165c842a3adSJulius Volz const union nf_inet_addr *addr, 166c842a3adSJulius Volz int *idx) 167c842a3adSJulius Volz { 168c842a3adSJulius Volz int len; 169c842a3adSJulius Volz #ifdef CONFIG_IP_VS_IPV6 170c842a3adSJulius Volz if (af == AF_INET6) 1715b095d98SHarvey Harrison len = snprintf(&buf[*idx], buf_len - *idx, "[%pI6]", 1720c6ce78aSHarvey Harrison &addr->in6) + 1; 173c842a3adSJulius Volz else 174c842a3adSJulius Volz #endif 1753685f25dSHarvey Harrison len = snprintf(&buf[*idx], buf_len - *idx, "%pI4", 1763685f25dSHarvey Harrison &addr->ip) + 1; 177c842a3adSJulius Volz 178c842a3adSJulius Volz *idx += len; 179c842a3adSJulius Volz BUG_ON(*idx > buf_len + 1); 180c842a3adSJulius Volz return &buf[*idx - len]; 181c842a3adSJulius Volz } 182c842a3adSJulius 
Volz 1839aada7acSHannes Eder #define IP_VS_DBG_BUF(level, msg, ...) \ 184c842a3adSJulius Volz do { \ 185c842a3adSJulius Volz char ip_vs_dbg_buf[160]; \ 186c842a3adSJulius Volz int ip_vs_dbg_idx = 0; \ 187c842a3adSJulius Volz if (level <= ip_vs_get_debug_level()) \ 1889aada7acSHannes Eder printk(KERN_DEBUG pr_fmt(msg), ##__VA_ARGS__); \ 189c842a3adSJulius Volz } while (0) 190c842a3adSJulius Volz #define IP_VS_ERR_BUF(msg...) \ 191c842a3adSJulius Volz do { \ 192c842a3adSJulius Volz char ip_vs_dbg_buf[160]; \ 193c842a3adSJulius Volz int ip_vs_dbg_idx = 0; \ 1949aada7acSHannes Eder pr_err(msg); \ 195c842a3adSJulius Volz } while (0) 196c842a3adSJulius Volz 197c842a3adSJulius Volz /* Only use from within IP_VS_DBG_BUF() or IP_VS_ERR_BUF macros */ 198c842a3adSJulius Volz #define IP_VS_DBG_ADDR(af, addr) \ 199c842a3adSJulius Volz ip_vs_dbg_addr(af, ip_vs_dbg_buf, \ 200c842a3adSJulius Volz sizeof(ip_vs_dbg_buf), addr, \ 201c842a3adSJulius Volz &ip_vs_dbg_idx) 202c842a3adSJulius Volz 2039aada7acSHannes Eder #define IP_VS_DBG(level, msg, ...) \ 2041da177e4SLinus Torvalds do { \ 2051da177e4SLinus Torvalds if (level <= ip_vs_get_debug_level()) \ 2069aada7acSHannes Eder printk(KERN_DEBUG pr_fmt(msg), ##__VA_ARGS__); \ 2071da177e4SLinus Torvalds } while (0) 2089aada7acSHannes Eder #define IP_VS_DBG_RL(msg, ...) 
\ 2091da177e4SLinus Torvalds do { \ 2101da177e4SLinus Torvalds if (net_ratelimit()) \ 2119aada7acSHannes Eder printk(KERN_DEBUG pr_fmt(msg), ##__VA_ARGS__); \ 2121da177e4SLinus Torvalds } while (0) 2130d79641aSJulian Anastasov #define IP_VS_DBG_PKT(level, af, pp, skb, ofs, msg) \ 2141da177e4SLinus Torvalds do { \ 2151da177e4SLinus Torvalds if (level <= ip_vs_get_debug_level()) \ 2160d79641aSJulian Anastasov pp->debug_packet(af, pp, skb, ofs, msg); \ 2171da177e4SLinus Torvalds } while (0) 2180d79641aSJulian Anastasov #define IP_VS_DBG_RL_PKT(level, af, pp, skb, ofs, msg) \ 2191da177e4SLinus Torvalds do { \ 2201da177e4SLinus Torvalds if (level <= ip_vs_get_debug_level() && \ 2211da177e4SLinus Torvalds net_ratelimit()) \ 2220d79641aSJulian Anastasov pp->debug_packet(af, pp, skb, ofs, msg); \ 2231da177e4SLinus Torvalds } while (0) 2241da177e4SLinus Torvalds #else /* NO DEBUGGING at ALL */ 225c842a3adSJulius Volz #define IP_VS_DBG_BUF(level, msg...) do {} while (0) 226c842a3adSJulius Volz #define IP_VS_ERR_BUF(msg...) do {} while (0) 2271da177e4SLinus Torvalds #define IP_VS_DBG(level, msg...) do {} while (0) 2281da177e4SLinus Torvalds #define IP_VS_DBG_RL(msg...) do {} while (0) 2290d79641aSJulian Anastasov #define IP_VS_DBG_PKT(level, af, pp, skb, ofs, msg) do {} while (0) 2300d79641aSJulian Anastasov #define IP_VS_DBG_RL_PKT(level, af, pp, skb, ofs, msg) do {} while (0) 2311da177e4SLinus Torvalds #endif 2321da177e4SLinus Torvalds 2331da177e4SLinus Torvalds #define IP_VS_BUG() BUG() 2341e3e238eSHannes Eder #define IP_VS_ERR_RL(msg, ...) 
\ 2351da177e4SLinus Torvalds do { \ 2361da177e4SLinus Torvalds if (net_ratelimit()) \ 2371e3e238eSHannes Eder pr_err(msg, ##__VA_ARGS__); \ 2381da177e4SLinus Torvalds } while (0) 2391da177e4SLinus Torvalds 2401da177e4SLinus Torvalds #ifdef CONFIG_IP_VS_DEBUG 2411da177e4SLinus Torvalds #define EnterFunction(level) \ 2421da177e4SLinus Torvalds do { \ 2431da177e4SLinus Torvalds if (level <= ip_vs_get_debug_level()) \ 2449aada7acSHannes Eder printk(KERN_DEBUG \ 2459aada7acSHannes Eder pr_fmt("Enter: %s, %s line %i\n"), \ 246d5c003b4SHarvey Harrison __func__, __FILE__, __LINE__); \ 2471da177e4SLinus Torvalds } while (0) 2481da177e4SLinus Torvalds #define LeaveFunction(level) \ 2491da177e4SLinus Torvalds do { \ 2501da177e4SLinus Torvalds if (level <= ip_vs_get_debug_level()) \ 2519aada7acSHannes Eder printk(KERN_DEBUG \ 2529aada7acSHannes Eder pr_fmt("Leave: %s, %s line %i\n"), \ 253d5c003b4SHarvey Harrison __func__, __FILE__, __LINE__); \ 2541da177e4SLinus Torvalds } while (0) 2551da177e4SLinus Torvalds #else 2561da177e4SLinus Torvalds #define EnterFunction(level) do {} while (0) 2571da177e4SLinus Torvalds #define LeaveFunction(level) do {} while (0) 2581da177e4SLinus Torvalds #endif 2591da177e4SLinus Torvalds 2601da177e4SLinus Torvalds #define IP_VS_WAIT_WHILE(expr) while (expr) { cpu_relax(); } 2611da177e4SLinus Torvalds 2621da177e4SLinus Torvalds 2631da177e4SLinus Torvalds /* 2641da177e4SLinus Torvalds * The port number of FTP service (in network order). 
 */
#define FTPPORT  cpu_to_be16(21)
#define FTPDATA  cpu_to_be16(20)

/*
 *      TCP State Values
 *      (IP_VS_TCP_S_LAST is the terminating entry of the enumeration)
 */
enum {
	IP_VS_TCP_S_NONE = 0,
	IP_VS_TCP_S_ESTABLISHED,
	IP_VS_TCP_S_SYN_SENT,
	IP_VS_TCP_S_SYN_RECV,
	IP_VS_TCP_S_FIN_WAIT,
	IP_VS_TCP_S_TIME_WAIT,
	IP_VS_TCP_S_CLOSE,
	IP_VS_TCP_S_CLOSE_WAIT,
	IP_VS_TCP_S_LAST_ACK,
	IP_VS_TCP_S_LISTEN,
	IP_VS_TCP_S_SYNACK,
	IP_VS_TCP_S_LAST
};

/*
 *	UDP State Values
 */
enum {
	IP_VS_UDP_S_NORMAL,
	IP_VS_UDP_S_LAST,
};

/*
 *	ICMP State Values
 */
enum {
	IP_VS_ICMP_S_NORMAL,
	IP_VS_ICMP_S_LAST,
};

/*
 *	SCTP State Values
 */
enum ip_vs_sctp_states {
	IP_VS_SCTP_S_NONE,
	IP_VS_SCTP_S_INIT_CLI,
	IP_VS_SCTP_S_INIT_SER,
	IP_VS_SCTP_S_INIT_ACK_CLI,
	IP_VS_SCTP_S_INIT_ACK_SER,
	IP_VS_SCTP_S_ECHO_CLI,
	IP_VS_SCTP_S_ECHO_SER,
	IP_VS_SCTP_S_ESTABLISHED,
	IP_VS_SCTP_S_SHUT_CLI,
	IP_VS_SCTP_S_SHUT_SER,
	IP_VS_SCTP_S_SHUT_ACK_CLI,
	IP_VS_SCTP_S_SHUT_ACK_SER,
	IP_VS_SCTP_S_CLOSED,
	IP_VS_SCTP_S_LAST
};

/*
 *	Delta sequence info structure
 *	Each ip_vs_conn has 2 (output AND input seq. changes).
 *      Only used in the VS/NAT.
 */
struct ip_vs_seq {
	__u32			init_seq;	/* Add delta from this seq */
	__u32			delta;		/* Delta in sequence numbers */
	__u32			previous_delta;	/* Delta in sequence numbers
						   before last resized pkt */
};

/*
 * counters per cpu
 */
struct ip_vs_counters {
	__u32		conns;		/* connections scheduled */
	__u32		inpkts;		/* incoming packets */
	__u32		outpkts;	/* outgoing packets */
	__u64		inbytes;	/* incoming bytes */
	__u64		outbytes;	/* outgoing bytes */
};
/*
 * Stats per cpu: the counters plus the u64_stats_sync object kept
 * alongside them.
 */
struct ip_vs_cpu_stats {
	struct ip_vs_counters   ustats;
	struct u64_stats_sync   syncp;
};

/*
 *	IPVS statistics objects
 */
struct ip_vs_estimator {
	struct list_head	list;

	/* last_* : previously sampled counter values */
	u64			last_inbytes;
	u64			last_outbytes;
	u32			last_conns;
	u32			last_inpkts;
	u32			last_outpkts;

	/* NOTE(review): presumably the estimated rates - confirm in ip_vs_est.c */
	u32			cps;
	u32			inpps;
	u32			outpps;
	u32			inbps;
	u32			outbps;
};

struct ip_vs_stats {
	struct ip_vs_stats_user	ustats;		/* statistics */
	struct ip_vs_estimator	est;		/* estimator */
	struct ip_vs_cpu_stats	*cpustats;	/* per cpu counters */
	spinlock_t		lock;		/* spin lock */
	struct ip_vs_stats_user	ustats0;	/* reset values */
};

/*
 * Helper Macros for per cpu
 * ipvs->tot_stats->ustats.count
 *
 * NOTE(review): the macros below dereference (ipvs)->ustats and
 * (ipvs)->ustats_seq, not ->tot_stats as the line above says - confirm
 * which member names are current.
 */
#define IPVS_STAT_INC(ipvs, count)	\
	__this_cpu_inc((ipvs)->ustats->count)

/* Same as IPVS_STAT_INC but adds value, bracketed by a seqcount write section */
#define IPVS_STAT_ADD(ipvs, count, value) \
	do {\
		write_seqcount_begin(per_cpu_ptr((ipvs)->ustats_seq, \
				     raw_smp_processor_id())); \
		__this_cpu_add((ipvs)->ustats->count, value); \
		write_seqcount_end(per_cpu_ptr((ipvs)->ustats_seq, \
				   raw_smp_processor_id())); \
	} while (0)

/* Forward declarations for types only used through pointers below */
struct dst_entry;
struct iphdr;
struct ip_vs_conn;
struct ip_vs_app;
struct sk_buff;
struct ip_vs_proto_data;

/*
 * Per-protocol description: identification fields followed by a table of
 * callbacks.
 */
struct ip_vs_protocol {
	struct ip_vs_protocol	*next;
	char			*name;
	u16			protocol;
	u16			num_states;
	int			dont_defrag;

	void (*init)(struct ip_vs_protocol *pp);

	void (*exit)(struct ip_vs_protocol *pp);

	/* per network namespace counterparts of init/exit */
	void (*init_netns)(struct net *net, struct ip_vs_proto_data *pd);

	void (*exit_netns)(struct net *net, struct ip_vs_proto_data *pd);

	int (*conn_schedule)(int af, struct sk_buff *skb,
			     struct ip_vs_proto_data *pd,
			     int *verdict, struct ip_vs_conn **cpp);

	struct ip_vs_conn *
	(*conn_in_get)(int af,
		       const struct sk_buff *skb,
		       const struct ip_vs_iphdr *iph,
		       unsigned int proto_off,
		       int inverse);

	struct ip_vs_conn *
	(*conn_out_get)(int af,
			const struct sk_buff *skb,
			const struct ip_vs_iphdr *iph,
			unsigned int proto_off,
			int inverse);

	int (*snat_handler)(struct sk_buff *skb,
			    struct ip_vs_protocol *pp, struct ip_vs_conn *cp);

	int (*dnat_handler)(struct sk_buff *skb,
			    struct ip_vs_protocol *pp, struct ip_vs_conn *cp);

	int (*csum_check)(int af, struct sk_buff *skb,
			  struct ip_vs_protocol *pp);

	const char *(*state_name)(int state);

	int (*state_transition)(struct ip_vs_conn *cp, int direction,
				const struct sk_buff *skb,
				struct ip_vs_proto_data *pd);

	int (*register_app)(struct net *net, struct ip_vs_app *inc);

	void (*unregister_app)(struct net *net, struct ip_vs_app *inc);

	int (*app_conn_bind)(struct ip_vs_conn *cp);

	/* invoked by IP_VS_DBG_PKT() / IP_VS_DBG_RL_PKT() */
	void (*debug_packet)(int af, struct ip_vs_protocol *pp,
			     const struct sk_buff *skb,
			     int offset,
			     const char *msg);

	void (*timeout_change)(struct ip_vs_proto_data *pd, int flags);
};

/*
 * protocol data per netns
 */
struct ip_vs_proto_data {
	struct ip_vs_proto_data	*next;
	struct ip_vs_protocol	*pp;
	int			*timeout_table;	/* protocol timeout table */
	atomic_t		appcnt;		/* counter of proto app incs. */
	struct tcp_states_t	*tcp_state_table;
};

extern struct ip_vs_protocol   *ip_vs_proto_get(unsigned short proto);
extern struct ip_vs_proto_data *ip_vs_proto_data_get(struct net *net,
						     unsigned short proto);

/*
 * Connection parameters bundled for passing around: namespace, client and
 * virtual address/port, protocol, address family and persistence-engine
 * data.
 */
struct ip_vs_conn_param {
	struct net			*net;
	const union nf_inet_addr	*caddr;
	const union nf_inet_addr	*vaddr;
	__be16				cport;
	__be16				vport;
	__u16				protocol;
	u16				af;

	const struct ip_vs_pe		*pe;
	char				*pe_data;
	__u8				pe_data_len;
};

/*
 *	IP_VS structure allocated for each dynamically scheduled connection
 */
struct ip_vs_conn {
	struct hlist_node	c_list;         /* hashed list heads */
#ifdef CONFIG_NET_NS
	struct net              *net;           /* Name space */
#endif
	/* Protocol, addresses and port numbers */
	u16                     af;             /* address family */
	__be16                  cport;
	__be16                  vport;
	__be16                  dport;
	__u32                   fwmark;         /* Fire wall mark from skb */
	union nf_inet_addr      caddr;          /* client address */
	union nf_inet_addr      vaddr;          /* virtual address */
	union nf_inet_addr      daddr;          /* destination address */
	volatile __u32          flags;          /* status flags */
	__u16                   protocol;       /* Which protocol (TCP/UDP) */

	/* counter and timer */
	atomic_t		refcnt;		/* reference count */
	struct timer_list	timer;		/* Expiration timer */
	volatile unsigned long	timeout;	/* timeout */

	/* Flags and state transition */
	spinlock_t              lock;           /* lock for state transition */
	volatile __u16          state;          /* state info */
	volatile __u16          old_state;      /* old state, to be used for
						 * state transition triggered
						 * synchronization
						 */

	/* Control members */
	struct ip_vs_conn       *control;       /* Master control connection */
	atomic_t                n_control;      /* Number of controlled ones */
	struct ip_vs_dest       *dest;          /* real server */
	atomic_t                in_pkts;        /* incoming packet counter */

	/* packet transmitter for different forwarding methods.  If it
	   mangles the packet, it must return NF_DROP or better NF_STOLEN,
	   otherwise this must be changed to a sk_buff **.
	   NF_ACCEPT can be returned when destination is local.
	 */
	int (*packet_xmit)(struct sk_buff *skb, struct ip_vs_conn *cp,
			   struct ip_vs_protocol *pp);

	/* Note: we can group the following members into a structure,
	   in order to save more space, and the following members are
	   only used in VS/NAT anyway */
	struct ip_vs_app        *app;           /* bound ip_vs_app object */
	void                    *app_data;      /* Application private data */
	struct ip_vs_seq        in_seq;         /* incoming seq. struct */
	struct ip_vs_seq        out_seq;        /* outgoing seq. struct */

	/* persistence engine and its private data (pe_data_len bytes) */
	const struct ip_vs_pe	*pe;
	char			*pe_data;
	__u8			pe_data_len;
};

/*
 *  To save some memory in conn table when name space is disabled.
5566e67e586SHans Schillstrom */ 5576e67e586SHans Schillstrom static inline struct net *ip_vs_conn_net(const struct ip_vs_conn *cp) 5586e67e586SHans Schillstrom { 5596e67e586SHans Schillstrom #ifdef CONFIG_NET_NS 5606e67e586SHans Schillstrom return cp->net; 5616e67e586SHans Schillstrom #else 5626e67e586SHans Schillstrom return &init_net; 5636e67e586SHans Schillstrom #endif 5646e67e586SHans Schillstrom } 5656e67e586SHans Schillstrom static inline void ip_vs_conn_net_set(struct ip_vs_conn *cp, struct net *net) 5666e67e586SHans Schillstrom { 5676e67e586SHans Schillstrom #ifdef CONFIG_NET_NS 5686e67e586SHans Schillstrom cp->net = net; 5696e67e586SHans Schillstrom #endif 5706e67e586SHans Schillstrom } 5716e67e586SHans Schillstrom 5726e67e586SHans Schillstrom static inline int ip_vs_conn_net_eq(const struct ip_vs_conn *cp, 5736e67e586SHans Schillstrom struct net *net) 5746e67e586SHans Schillstrom { 5756e67e586SHans Schillstrom #ifdef CONFIG_NET_NS 5766e67e586SHans Schillstrom return cp->net == net; 5776e67e586SHans Schillstrom #else 5786e67e586SHans Schillstrom return 1; 5796e67e586SHans Schillstrom #endif 5806e67e586SHans Schillstrom } 5811da177e4SLinus Torvalds 5821da177e4SLinus Torvalds /* 583c860c6b1SJulius Volz * Extended internal versions of struct ip_vs_service_user and 584c860c6b1SJulius Volz * ip_vs_dest_user for IPv6 support. 585c860c6b1SJulius Volz * 586c860c6b1SJulius Volz * We need these to conveniently pass around service and destination 587c860c6b1SJulius Volz * options, but unfortunately, we also need to keep the old definitions to 588c860c6b1SJulius Volz * maintain userspace backwards compatibility for the setsockopt interface. 
589c860c6b1SJulius Volz */ 590c860c6b1SJulius Volz struct ip_vs_service_user_kern { 591c860c6b1SJulius Volz /* virtual service addresses */ 592c860c6b1SJulius Volz u16 af; 593c860c6b1SJulius Volz u16 protocol; 594c860c6b1SJulius Volz union nf_inet_addr addr; /* virtual ip address */ 595c860c6b1SJulius Volz u16 port; 596c860c6b1SJulius Volz u32 fwmark; /* firwall mark of service */ 597c860c6b1SJulius Volz 598c860c6b1SJulius Volz /* virtual service options */ 599c860c6b1SJulius Volz char *sched_name; 6000d1e71b0SSimon Horman char *pe_name; 601c860c6b1SJulius Volz unsigned flags; /* virtual service flags */ 602c860c6b1SJulius Volz unsigned timeout; /* persistent timeout in sec */ 603c860c6b1SJulius Volz u32 netmask; /* persistent netmask */ 604c860c6b1SJulius Volz }; 605c860c6b1SJulius Volz 606c860c6b1SJulius Volz 607c860c6b1SJulius Volz struct ip_vs_dest_user_kern { 608c860c6b1SJulius Volz /* destination server address */ 609c860c6b1SJulius Volz union nf_inet_addr addr; 610c860c6b1SJulius Volz u16 port; 611c860c6b1SJulius Volz 612c860c6b1SJulius Volz /* real server options */ 613c860c6b1SJulius Volz unsigned conn_flags; /* connection flags */ 614c860c6b1SJulius Volz int weight; /* destination weight */ 615c860c6b1SJulius Volz 616c860c6b1SJulius Volz /* thresholds for active connections */ 617c860c6b1SJulius Volz u32 u_threshold; /* upper threshold */ 618c860c6b1SJulius Volz u32 l_threshold; /* lower threshold */ 619c860c6b1SJulius Volz }; 620c860c6b1SJulius Volz 621c860c6b1SJulius Volz 622c860c6b1SJulius Volz /* 6231da177e4SLinus Torvalds * The information about the virtual service offered to the net 6241da177e4SLinus Torvalds * and the forwarding entries 6251da177e4SLinus Torvalds */ 6261da177e4SLinus Torvalds struct ip_vs_service { 6271da177e4SLinus Torvalds struct list_head s_list; /* for normal service table */ 6281da177e4SLinus Torvalds struct list_head f_list; /* for fwmark-based service table */ 6291da177e4SLinus Torvalds atomic_t refcnt; /* reference counter 
*/ 6301da177e4SLinus Torvalds atomic_t usecnt; /* use counter */ 6311da177e4SLinus Torvalds 632e7ade46aSJulius Volz u16 af; /* address family */ 6331da177e4SLinus Torvalds __u16 protocol; /* which protocol (TCP/UDP) */ 634e7ade46aSJulius Volz union nf_inet_addr addr; /* IP address for virtual service */ 635014d730dSAl Viro __be16 port; /* port number for the service */ 6361da177e4SLinus Torvalds __u32 fwmark; /* firewall mark of the service */ 6371da177e4SLinus Torvalds unsigned flags; /* service status flags */ 6381da177e4SLinus Torvalds unsigned timeout; /* persistent timeout in ticks */ 639014d730dSAl Viro __be32 netmask; /* grouping granularity */ 640fc723250SHans Schillstrom struct net *net; 6411da177e4SLinus Torvalds 6421da177e4SLinus Torvalds struct list_head destinations; /* real server d-linked list */ 6431da177e4SLinus Torvalds __u32 num_dests; /* number of servers */ 6441da177e4SLinus Torvalds struct ip_vs_stats stats; /* statistics for the service */ 6451da177e4SLinus Torvalds struct ip_vs_app *inc; /* bind conns to this app inc */ 6461da177e4SLinus Torvalds 6471da177e4SLinus Torvalds /* for scheduling */ 6481da177e4SLinus Torvalds struct ip_vs_scheduler *scheduler; /* bound scheduler object */ 6491da177e4SLinus Torvalds rwlock_t sched_lock; /* lock sched_data */ 6501da177e4SLinus Torvalds void *sched_data; /* scheduler application data */ 65185999283SSimon Horman 65285999283SSimon Horman /* alternate persistence engine */ 65385999283SSimon Horman struct ip_vs_pe *pe; 6541da177e4SLinus Torvalds }; 6551da177e4SLinus Torvalds 6561da177e4SLinus Torvalds 6571da177e4SLinus Torvalds /* 6581da177e4SLinus Torvalds * The real server destination forwarding entry 6591da177e4SLinus Torvalds * with ip address, port number, and so on. 
6601da177e4SLinus Torvalds */ 6611da177e4SLinus Torvalds struct ip_vs_dest { 6621da177e4SLinus Torvalds struct list_head n_list; /* for the dests in the service */ 6631da177e4SLinus Torvalds struct list_head d_list; /* for table with all the dests */ 6641da177e4SLinus Torvalds 665e7ade46aSJulius Volz u16 af; /* address family */ 666014d730dSAl Viro __be16 port; /* port number of the server */ 667f2431e6eSHans Schillstrom union nf_inet_addr addr; /* IP address of the server */ 6681da177e4SLinus Torvalds volatile unsigned flags; /* dest status flags */ 6691da177e4SLinus Torvalds atomic_t conn_flags; /* flags to copy to conn */ 6701da177e4SLinus Torvalds atomic_t weight; /* server weight */ 6711da177e4SLinus Torvalds 6721da177e4SLinus Torvalds atomic_t refcnt; /* reference counter */ 6731da177e4SLinus Torvalds struct ip_vs_stats stats; /* statistics */ 6741da177e4SLinus Torvalds 6751da177e4SLinus Torvalds /* connection counters and thresholds */ 6761da177e4SLinus Torvalds atomic_t activeconns; /* active connections */ 6771da177e4SLinus Torvalds atomic_t inactconns; /* inactive connections */ 6781da177e4SLinus Torvalds atomic_t persistconns; /* persistent connections */ 6791da177e4SLinus Torvalds __u32 u_threshold; /* upper threshold */ 6801da177e4SLinus Torvalds __u32 l_threshold; /* lower threshold */ 6811da177e4SLinus Torvalds 6821da177e4SLinus Torvalds /* for destination cache */ 6831da177e4SLinus Torvalds spinlock_t dst_lock; /* lock of dst_cache */ 6841da177e4SLinus Torvalds struct dst_entry *dst_cache; /* destination cache entry */ 6851da177e4SLinus Torvalds u32 dst_rtos; /* RT_TOS(tos) for dst */ 686714f095fSHans Schillstrom u32 dst_cookie; 687714f095fSHans Schillstrom #ifdef CONFIG_IP_VS_IPV6 688714f095fSHans Schillstrom struct in6_addr dst_saddr; 689714f095fSHans Schillstrom #endif 6901da177e4SLinus Torvalds 6911da177e4SLinus Torvalds /* for virtual service */ 6921da177e4SLinus Torvalds struct ip_vs_service *svc; /* service it belongs to */ 6931da177e4SLinus 
Torvalds __u16 protocol; /* which protocol (TCP/UDP) */ 694014d730dSAl Viro __be16 vport; /* virtual port number */ 695f2431e6eSHans Schillstrom union nf_inet_addr vaddr; /* virtual IP address */ 6961da177e4SLinus Torvalds __u32 vfwmark; /* firewall mark of service */ 6971da177e4SLinus Torvalds }; 6981da177e4SLinus Torvalds 6991da177e4SLinus Torvalds 7001da177e4SLinus Torvalds /* 7011da177e4SLinus Torvalds * The scheduler object 7021da177e4SLinus Torvalds */ 7031da177e4SLinus Torvalds struct ip_vs_scheduler { 7041da177e4SLinus Torvalds struct list_head n_list; /* d-linked list head */ 7051da177e4SLinus Torvalds char *name; /* scheduler name */ 7061da177e4SLinus Torvalds atomic_t refcnt; /* reference counter */ 7071da177e4SLinus Torvalds struct module *module; /* THIS_MODULE/NULL */ 7081da177e4SLinus Torvalds 7091da177e4SLinus Torvalds /* scheduler initializing service */ 7101da177e4SLinus Torvalds int (*init_service)(struct ip_vs_service *svc); 7111da177e4SLinus Torvalds /* scheduling service finish */ 7121da177e4SLinus Torvalds int (*done_service)(struct ip_vs_service *svc); 7131da177e4SLinus Torvalds /* scheduler updating service */ 7141da177e4SLinus Torvalds int (*update_service)(struct ip_vs_service *svc); 7151da177e4SLinus Torvalds 7161da177e4SLinus Torvalds /* selecting a server from the given service */ 7171da177e4SLinus Torvalds struct ip_vs_dest* (*schedule)(struct ip_vs_service *svc, 7181da177e4SLinus Torvalds const struct sk_buff *skb); 7191da177e4SLinus Torvalds }; 7201da177e4SLinus Torvalds 72185999283SSimon Horman /* The persistence engine object */ 72285999283SSimon Horman struct ip_vs_pe { 72385999283SSimon Horman struct list_head n_list; /* d-linked list head */ 72485999283SSimon Horman char *name; /* scheduler name */ 72585999283SSimon Horman atomic_t refcnt; /* reference counter */ 72685999283SSimon Horman struct module *module; /* THIS_MODULE/NULL */ 72785999283SSimon Horman 72885999283SSimon Horman /* get the connection template, if any */ 
72985999283SSimon Horman int (*fill_param)(struct ip_vs_conn_param *p, struct sk_buff *skb); 73085999283SSimon Horman bool (*ct_match)(const struct ip_vs_conn_param *p, 73185999283SSimon Horman struct ip_vs_conn *ct); 73285999283SSimon Horman u32 (*hashkey_raw)(const struct ip_vs_conn_param *p, u32 initval, 73385999283SSimon Horman bool inverse); 734a3c918acSSimon Horman int (*show_pe_data)(const struct ip_vs_conn *cp, char *buf); 73585999283SSimon Horman }; 7361da177e4SLinus Torvalds 7371da177e4SLinus Torvalds /* 7381da177e4SLinus Torvalds * The application module object (a.k.a. app incarnation) 7391da177e4SLinus Torvalds */ 740fd2c3ef7SEric Dumazet struct ip_vs_app { 7411da177e4SLinus Torvalds struct list_head a_list; /* member in app list */ 7421da177e4SLinus Torvalds int type; /* IP_VS_APP_TYPE_xxx */ 7431da177e4SLinus Torvalds char *name; /* application module name */ 7441da177e4SLinus Torvalds __u16 protocol; 7451da177e4SLinus Torvalds struct module *module; /* THIS_MODULE/NULL */ 7461da177e4SLinus Torvalds struct list_head incs_list; /* list of incarnations */ 7471da177e4SLinus Torvalds 7481da177e4SLinus Torvalds /* members for application incarnations */ 7491da177e4SLinus Torvalds struct list_head p_list; /* member in proto app list */ 7501da177e4SLinus Torvalds struct ip_vs_app *app; /* its real application */ 751014d730dSAl Viro __be16 port; /* port number in net order */ 7521da177e4SLinus Torvalds atomic_t usecnt; /* usage counter */ 7531da177e4SLinus Torvalds 7548b27b10fSJulian Anastasov /* 7558b27b10fSJulian Anastasov * output hook: Process packet in inout direction, diff set for TCP. 
7568b27b10fSJulian Anastasov * Return: 0=Error, 1=Payload Not Mangled/Mangled but checksum is ok, 7578b27b10fSJulian Anastasov * 2=Mangled but checksum was not updated 7588b27b10fSJulian Anastasov */ 7591da177e4SLinus Torvalds int (*pkt_out)(struct ip_vs_app *, struct ip_vs_conn *, 7603db05feaSHerbert Xu struct sk_buff *, int *diff); 7611da177e4SLinus Torvalds 7628b27b10fSJulian Anastasov /* 7638b27b10fSJulian Anastasov * input hook: Process packet in outin direction, diff set for TCP. 7648b27b10fSJulian Anastasov * Return: 0=Error, 1=Payload Not Mangled/Mangled but checksum is ok, 7658b27b10fSJulian Anastasov * 2=Mangled but checksum was not updated 7668b27b10fSJulian Anastasov */ 7671da177e4SLinus Torvalds int (*pkt_in)(struct ip_vs_app *, struct ip_vs_conn *, 7683db05feaSHerbert Xu struct sk_buff *, int *diff); 7691da177e4SLinus Torvalds 7701da177e4SLinus Torvalds /* ip_vs_app initializer */ 7711da177e4SLinus Torvalds int (*init_conn)(struct ip_vs_app *, struct ip_vs_conn *); 7721da177e4SLinus Torvalds 7731da177e4SLinus Torvalds /* ip_vs_app finish */ 7741da177e4SLinus Torvalds int (*done_conn)(struct ip_vs_app *, struct ip_vs_conn *); 7751da177e4SLinus Torvalds 7761da177e4SLinus Torvalds 7771da177e4SLinus Torvalds /* not used now */ 7781da177e4SLinus Torvalds int (*bind_conn)(struct ip_vs_app *, struct ip_vs_conn *, 7791da177e4SLinus Torvalds struct ip_vs_protocol *); 7801da177e4SLinus Torvalds 7811da177e4SLinus Torvalds void (*unbind_conn)(struct ip_vs_app *, struct ip_vs_conn *); 7821da177e4SLinus Torvalds 7831da177e4SLinus Torvalds int * timeout_table; 7841da177e4SLinus Torvalds int * timeouts; 7851da177e4SLinus Torvalds int timeouts_size; 7861da177e4SLinus Torvalds 7871da177e4SLinus Torvalds int (*conn_schedule)(struct sk_buff *skb, struct ip_vs_app *app, 7881da177e4SLinus Torvalds int *verdict, struct ip_vs_conn **cpp); 7891da177e4SLinus Torvalds 7901da177e4SLinus Torvalds struct ip_vs_conn * 7911da177e4SLinus Torvalds (*conn_in_get)(const struct sk_buff 
*skb, struct ip_vs_app *app, 7921da177e4SLinus Torvalds const struct iphdr *iph, unsigned int proto_off, 7931da177e4SLinus Torvalds int inverse); 7941da177e4SLinus Torvalds 7951da177e4SLinus Torvalds struct ip_vs_conn * 7961da177e4SLinus Torvalds (*conn_out_get)(const struct sk_buff *skb, struct ip_vs_app *app, 7971da177e4SLinus Torvalds const struct iphdr *iph, unsigned int proto_off, 7981da177e4SLinus Torvalds int inverse); 7991da177e4SLinus Torvalds 8001da177e4SLinus Torvalds int (*state_transition)(struct ip_vs_conn *cp, int direction, 8011da177e4SLinus Torvalds const struct sk_buff *skb, 8021da177e4SLinus Torvalds struct ip_vs_app *app); 8031da177e4SLinus Torvalds 8041da177e4SLinus Torvalds void (*timeout_change)(struct ip_vs_app *app, int flags); 8051da177e4SLinus Torvalds }; 8061da177e4SLinus Torvalds 8072553d064SJulian Anastasov /* IPVS in network namespace */ 8082553d064SJulian Anastasov struct netns_ipvs { 8092553d064SJulian Anastasov int gen; /* Generation */ 8102553d064SJulian Anastasov /* 8112553d064SJulian Anastasov * Hash table: for real service lookups 8122553d064SJulian Anastasov */ 8132553d064SJulian Anastasov #define IP_VS_RTAB_BITS 4 8142553d064SJulian Anastasov #define IP_VS_RTAB_SIZE (1 << IP_VS_RTAB_BITS) 8152553d064SJulian Anastasov #define IP_VS_RTAB_MASK (IP_VS_RTAB_SIZE - 1) 8162553d064SJulian Anastasov 8172553d064SJulian Anastasov struct list_head rs_table[IP_VS_RTAB_SIZE]; 8182553d064SJulian Anastasov /* ip_vs_app */ 8192553d064SJulian Anastasov struct list_head app_list; 8202553d064SJulian Anastasov struct mutex app_mutex; 8212553d064SJulian Anastasov struct lock_class_key app_key; /* mutex debuging */ 8222553d064SJulian Anastasov 8232553d064SJulian Anastasov /* ip_vs_proto */ 8242553d064SJulian Anastasov #define IP_VS_PROTO_TAB_SIZE 32 /* must be power of 2 */ 8252553d064SJulian Anastasov struct ip_vs_proto_data *proto_data_table[IP_VS_PROTO_TAB_SIZE]; 8262553d064SJulian Anastasov /* ip_vs_proto_tcp */ 8272553d064SJulian Anastasov 
#ifdef CONFIG_IP_VS_PROTO_TCP 8282553d064SJulian Anastasov #define TCP_APP_TAB_BITS 4 8292553d064SJulian Anastasov #define TCP_APP_TAB_SIZE (1 << TCP_APP_TAB_BITS) 8302553d064SJulian Anastasov #define TCP_APP_TAB_MASK (TCP_APP_TAB_SIZE - 1) 8312553d064SJulian Anastasov struct list_head tcp_apps[TCP_APP_TAB_SIZE]; 8322553d064SJulian Anastasov spinlock_t tcp_app_lock; 8332553d064SJulian Anastasov #endif 8342553d064SJulian Anastasov /* ip_vs_proto_udp */ 8352553d064SJulian Anastasov #ifdef CONFIG_IP_VS_PROTO_UDP 8362553d064SJulian Anastasov #define UDP_APP_TAB_BITS 4 8372553d064SJulian Anastasov #define UDP_APP_TAB_SIZE (1 << UDP_APP_TAB_BITS) 8382553d064SJulian Anastasov #define UDP_APP_TAB_MASK (UDP_APP_TAB_SIZE - 1) 8392553d064SJulian Anastasov struct list_head udp_apps[UDP_APP_TAB_SIZE]; 8402553d064SJulian Anastasov spinlock_t udp_app_lock; 8412553d064SJulian Anastasov #endif 8422553d064SJulian Anastasov /* ip_vs_proto_sctp */ 8432553d064SJulian Anastasov #ifdef CONFIG_IP_VS_PROTO_SCTP 8442553d064SJulian Anastasov #define SCTP_APP_TAB_BITS 4 8452553d064SJulian Anastasov #define SCTP_APP_TAB_SIZE (1 << SCTP_APP_TAB_BITS) 8462553d064SJulian Anastasov #define SCTP_APP_TAB_MASK (SCTP_APP_TAB_SIZE - 1) 8472553d064SJulian Anastasov /* Hash table for SCTP application incarnations */ 8482553d064SJulian Anastasov struct list_head sctp_apps[SCTP_APP_TAB_SIZE]; 8492553d064SJulian Anastasov spinlock_t sctp_app_lock; 8502553d064SJulian Anastasov #endif 8512553d064SJulian Anastasov /* ip_vs_conn */ 8522553d064SJulian Anastasov atomic_t conn_count; /* connection counter */ 8532553d064SJulian Anastasov 8542553d064SJulian Anastasov /* ip_vs_ctl */ 8552a0751afSJulian Anastasov struct ip_vs_stats tot_stats; /* Statistics & est. 
*/ 8562553d064SJulian Anastasov seqcount_t *ustats_seq; /* u64 read retry */ 8572553d064SJulian Anastasov 8582553d064SJulian Anastasov int num_services; /* no of virtual services */ 8592553d064SJulian Anastasov /* 1/rate drop and drop-entry variables */ 8602553d064SJulian Anastasov struct delayed_work defense_work; /* Work handler */ 8612553d064SJulian Anastasov int drop_rate; 8622553d064SJulian Anastasov int drop_counter; 8632553d064SJulian Anastasov atomic_t dropentry; 8642553d064SJulian Anastasov /* locks in ctl.c */ 8652553d064SJulian Anastasov spinlock_t dropentry_lock; /* drop entry handling */ 8662553d064SJulian Anastasov spinlock_t droppacket_lock; /* drop packet handling */ 8672553d064SJulian Anastasov spinlock_t securetcp_lock; /* state and timeout tables */ 8682553d064SJulian Anastasov rwlock_t rs_lock; /* real services table */ 8692553d064SJulian Anastasov /* semaphore for IPVS sockopts. And, [gs]etsockopt may sleep. */ 8702553d064SJulian Anastasov struct lock_class_key ctl_key; /* ctl_mutex debuging */ 8712553d064SJulian Anastasov /* Trash for destinations */ 8722553d064SJulian Anastasov struct list_head dest_trash; 8732553d064SJulian Anastasov /* Service counters */ 8742553d064SJulian Anastasov atomic_t ftpsvc_counter; 8752553d064SJulian Anastasov atomic_t nullsvc_counter; 8762553d064SJulian Anastasov 8772553d064SJulian Anastasov /* sys-ctl struct */ 8782553d064SJulian Anastasov struct ctl_table_header *sysctl_hdr; 8792553d064SJulian Anastasov struct ctl_table *sysctl_tbl; 8802553d064SJulian Anastasov /* sysctl variables */ 8812553d064SJulian Anastasov int sysctl_amemthresh; 8822553d064SJulian Anastasov int sysctl_am_droprate; 8832553d064SJulian Anastasov int sysctl_drop_entry; 8842553d064SJulian Anastasov int sysctl_drop_packet; 8852553d064SJulian Anastasov int sysctl_secure_tcp; 8862553d064SJulian Anastasov #ifdef CONFIG_IP_VS_NFCT 8872553d064SJulian Anastasov int sysctl_conntrack; 8882553d064SJulian Anastasov #endif 8892553d064SJulian Anastasov int 
sysctl_snat_reroute; 8902553d064SJulian Anastasov int sysctl_sync_ver; 8912553d064SJulian Anastasov int sysctl_cache_bypass; 8922553d064SJulian Anastasov int sysctl_expire_nodest_conn; 8932553d064SJulian Anastasov int sysctl_expire_quiescent_template; 8942553d064SJulian Anastasov int sysctl_sync_threshold[2]; 8952553d064SJulian Anastasov int sysctl_nat_icmp_send; 8962553d064SJulian Anastasov 8972553d064SJulian Anastasov /* ip_vs_lblc */ 8982553d064SJulian Anastasov int sysctl_lblc_expiration; 8992553d064SJulian Anastasov struct ctl_table_header *lblc_ctl_header; 9002553d064SJulian Anastasov struct ctl_table *lblc_ctl_table; 9012553d064SJulian Anastasov /* ip_vs_lblcr */ 9022553d064SJulian Anastasov int sysctl_lblcr_expiration; 9032553d064SJulian Anastasov struct ctl_table_header *lblcr_ctl_header; 9042553d064SJulian Anastasov struct ctl_table *lblcr_ctl_table; 9052553d064SJulian Anastasov /* ip_vs_est */ 9062553d064SJulian Anastasov struct list_head est_list; /* estimator list */ 9072553d064SJulian Anastasov spinlock_t est_lock; 9082553d064SJulian Anastasov struct timer_list est_timer; /* Estimation timer */ 9092553d064SJulian Anastasov /* ip_vs_sync */ 9102553d064SJulian Anastasov struct list_head sync_queue; 9112553d064SJulian Anastasov spinlock_t sync_lock; 9122553d064SJulian Anastasov struct ip_vs_sync_buff *sync_buff; 9132553d064SJulian Anastasov spinlock_t sync_buff_lock; 9142553d064SJulian Anastasov struct sockaddr_in sync_mcast_addr; 9152553d064SJulian Anastasov struct task_struct *master_thread; 9162553d064SJulian Anastasov struct task_struct *backup_thread; 9172553d064SJulian Anastasov int send_mesg_maxlen; 9182553d064SJulian Anastasov int recv_mesg_maxlen; 9192553d064SJulian Anastasov volatile int sync_state; 9202553d064SJulian Anastasov volatile int master_syncid; 9212553d064SJulian Anastasov volatile int backup_syncid; 9222553d064SJulian Anastasov /* multicast interface name */ 9232553d064SJulian Anastasov char master_mcast_ifn[IP_VS_IFNAME_MAXLEN]; 
9242553d064SJulian Anastasov char backup_mcast_ifn[IP_VS_IFNAME_MAXLEN]; 9252553d064SJulian Anastasov /* net name space ptr */ 9262553d064SJulian Anastasov struct net *net; /* Needed by timer routines */ 9272553d064SJulian Anastasov }; 9281da177e4SLinus Torvalds 9291da177e4SLinus Torvalds /* 9301da177e4SLinus Torvalds * IPVS core functions 9311da177e4SLinus Torvalds * (from ip_vs_core.c) 9321da177e4SLinus Torvalds */ 9331da177e4SLinus Torvalds extern const char *ip_vs_proto_name(unsigned proto); 9341da177e4SLinus Torvalds extern void ip_vs_init_hash_table(struct list_head *table, int rows); 935afdd6140SSven Wegener #define IP_VS_INIT_HASH_TABLE(t) ip_vs_init_hash_table((t), ARRAY_SIZE((t))) 9361da177e4SLinus Torvalds 9371da177e4SLinus Torvalds #define IP_VS_APP_TYPE_FTP 1 9381da177e4SLinus Torvalds 9391da177e4SLinus Torvalds /* 9401da177e4SLinus Torvalds * ip_vs_conn handling functions 9411da177e4SLinus Torvalds * (from ip_vs_conn.c) 9421da177e4SLinus Torvalds */ 9431da177e4SLinus Torvalds 9441da177e4SLinus Torvalds enum { 9451da177e4SLinus Torvalds IP_VS_DIR_INPUT = 0, 9461da177e4SLinus Torvalds IP_VS_DIR_OUTPUT, 9471da177e4SLinus Torvalds IP_VS_DIR_INPUT_ONLY, 9481da177e4SLinus Torvalds IP_VS_DIR_LAST, 9491da177e4SLinus Torvalds }; 9501da177e4SLinus Torvalds 9516e67e586SHans Schillstrom static inline void ip_vs_conn_fill_param(struct net *net, int af, int protocol, 952f11017ecSSimon Horman const union nf_inet_addr *caddr, 953f11017ecSSimon Horman __be16 cport, 954f11017ecSSimon Horman const union nf_inet_addr *vaddr, 955f11017ecSSimon Horman __be16 vport, 956f11017ecSSimon Horman struct ip_vs_conn_param *p) 957f11017ecSSimon Horman { 9586e67e586SHans Schillstrom p->net = net; 959f11017ecSSimon Horman p->af = af; 960f11017ecSSimon Horman p->protocol = protocol; 961f11017ecSSimon Horman p->caddr = caddr; 962f11017ecSSimon Horman p->cport = cport; 963f11017ecSSimon Horman p->vaddr = vaddr; 964f11017ecSSimon Horman p->vport = vport; 96585999283SSimon Horman p->pe = 
NULL; 96685999283SSimon Horman p->pe_data = NULL; 967f11017ecSSimon Horman } 96828364a59SJulius Volz 969f11017ecSSimon Horman struct ip_vs_conn *ip_vs_conn_in_get(const struct ip_vs_conn_param *p); 970f11017ecSSimon Horman struct ip_vs_conn *ip_vs_ct_in_get(const struct ip_vs_conn_param *p); 97128364a59SJulius Volz 9725c0d2374SSimon Horman struct ip_vs_conn * ip_vs_conn_in_get_proto(int af, const struct sk_buff *skb, 9735c0d2374SSimon Horman const struct ip_vs_iphdr *iph, 9745c0d2374SSimon Horman unsigned int proto_off, 9755c0d2374SSimon Horman int inverse); 9765c0d2374SSimon Horman 977f11017ecSSimon Horman struct ip_vs_conn *ip_vs_conn_out_get(const struct ip_vs_conn_param *p); 9781da177e4SLinus Torvalds 9795c0d2374SSimon Horman struct ip_vs_conn * ip_vs_conn_out_get_proto(int af, const struct sk_buff *skb, 9805c0d2374SSimon Horman const struct ip_vs_iphdr *iph, 9815c0d2374SSimon Horman unsigned int proto_off, 9825c0d2374SSimon Horman int inverse); 9835c0d2374SSimon Horman 9841da177e4SLinus Torvalds /* put back the conn without restarting its timer */ 9851da177e4SLinus Torvalds static inline void __ip_vs_conn_put(struct ip_vs_conn *cp) 9861da177e4SLinus Torvalds { 9871da177e4SLinus Torvalds atomic_dec(&cp->refcnt); 9881da177e4SLinus Torvalds } 9891da177e4SLinus Torvalds extern void ip_vs_conn_put(struct ip_vs_conn *cp); 990014d730dSAl Viro extern void ip_vs_conn_fill_cport(struct ip_vs_conn *cp, __be16 cport); 9911da177e4SLinus Torvalds 992f11017ecSSimon Horman struct ip_vs_conn *ip_vs_conn_new(const struct ip_vs_conn_param *p, 993f11017ecSSimon Horman const union nf_inet_addr *daddr, 994f11017ecSSimon Horman __be16 dport, unsigned flags, 9950e051e68SHans Schillstrom struct ip_vs_dest *dest, __u32 fwmark); 9961da177e4SLinus Torvalds extern void ip_vs_conn_expire_now(struct ip_vs_conn *cp); 9971da177e4SLinus Torvalds 9981da177e4SLinus Torvalds extern const char * ip_vs_state_name(__u16 proto, int state); 9991da177e4SLinus Torvalds 10004a85b96cSHans Schillstrom 
extern void ip_vs_tcp_conn_listen(struct net *net, struct ip_vs_conn *cp); 10011da177e4SLinus Torvalds extern int ip_vs_check_template(struct ip_vs_conn *ct); 1002f6340ee0SHans Schillstrom extern void ip_vs_random_dropentry(struct net *net); 10031da177e4SLinus Torvalds extern int ip_vs_conn_init(void); 10041da177e4SLinus Torvalds extern void ip_vs_conn_cleanup(void); 10051da177e4SLinus Torvalds 10061da177e4SLinus Torvalds static inline void ip_vs_control_del(struct ip_vs_conn *cp) 10071da177e4SLinus Torvalds { 10081da177e4SLinus Torvalds struct ip_vs_conn *ctl_cp = cp->control; 10091da177e4SLinus Torvalds if (!ctl_cp) { 1010cfc78c5aSJulius Volz IP_VS_ERR_BUF("request control DEL for uncontrolled: " 1011cfc78c5aSJulius Volz "%s:%d to %s:%d\n", 1012cfc78c5aSJulius Volz IP_VS_DBG_ADDR(cp->af, &cp->caddr), 1013cfc78c5aSJulius Volz ntohs(cp->cport), 1014cfc78c5aSJulius Volz IP_VS_DBG_ADDR(cp->af, &cp->vaddr), 1015cfc78c5aSJulius Volz ntohs(cp->vport)); 1016cfc78c5aSJulius Volz 10171da177e4SLinus Torvalds return; 10181da177e4SLinus Torvalds } 10191da177e4SLinus Torvalds 1020cfc78c5aSJulius Volz IP_VS_DBG_BUF(7, "DELeting control for: " 1021cfc78c5aSJulius Volz "cp.dst=%s:%d ctl_cp.dst=%s:%d\n", 1022cfc78c5aSJulius Volz IP_VS_DBG_ADDR(cp->af, &cp->caddr), 1023cfc78c5aSJulius Volz ntohs(cp->cport), 1024cfc78c5aSJulius Volz IP_VS_DBG_ADDR(cp->af, &ctl_cp->caddr), 1025cfc78c5aSJulius Volz ntohs(ctl_cp->cport)); 10261da177e4SLinus Torvalds 10271da177e4SLinus Torvalds cp->control = NULL; 10281da177e4SLinus Torvalds if (atomic_read(&ctl_cp->n_control) == 0) { 1029cfc78c5aSJulius Volz IP_VS_ERR_BUF("BUG control DEL with n=0 : " 1030cfc78c5aSJulius Volz "%s:%d to %s:%d\n", 1031cfc78c5aSJulius Volz IP_VS_DBG_ADDR(cp->af, &cp->caddr), 1032cfc78c5aSJulius Volz ntohs(cp->cport), 1033cfc78c5aSJulius Volz IP_VS_DBG_ADDR(cp->af, &cp->vaddr), 1034cfc78c5aSJulius Volz ntohs(cp->vport)); 1035cfc78c5aSJulius Volz 10361da177e4SLinus Torvalds return; 10371da177e4SLinus Torvalds } 
10381da177e4SLinus Torvalds atomic_dec(&ctl_cp->n_control); 10391da177e4SLinus Torvalds } 10401da177e4SLinus Torvalds 10411da177e4SLinus Torvalds static inline void 10421da177e4SLinus Torvalds ip_vs_control_add(struct ip_vs_conn *cp, struct ip_vs_conn *ctl_cp) 10431da177e4SLinus Torvalds { 10441da177e4SLinus Torvalds if (cp->control) { 1045cfc78c5aSJulius Volz IP_VS_ERR_BUF("request control ADD for already controlled: " 1046cfc78c5aSJulius Volz "%s:%d to %s:%d\n", 1047cfc78c5aSJulius Volz IP_VS_DBG_ADDR(cp->af, &cp->caddr), 1048cfc78c5aSJulius Volz ntohs(cp->cport), 1049cfc78c5aSJulius Volz IP_VS_DBG_ADDR(cp->af, &cp->vaddr), 1050cfc78c5aSJulius Volz ntohs(cp->vport)); 1051cfc78c5aSJulius Volz 10521da177e4SLinus Torvalds ip_vs_control_del(cp); 10531da177e4SLinus Torvalds } 10541da177e4SLinus Torvalds 1055cfc78c5aSJulius Volz IP_VS_DBG_BUF(7, "ADDing control for: " 1056cfc78c5aSJulius Volz "cp.dst=%s:%d ctl_cp.dst=%s:%d\n", 1057cfc78c5aSJulius Volz IP_VS_DBG_ADDR(cp->af, &cp->caddr), 1058cfc78c5aSJulius Volz ntohs(cp->cport), 1059cfc78c5aSJulius Volz IP_VS_DBG_ADDR(cp->af, &ctl_cp->caddr), 1060cfc78c5aSJulius Volz ntohs(ctl_cp->cport)); 10611da177e4SLinus Torvalds 10621da177e4SLinus Torvalds cp->control = ctl_cp; 10631da177e4SLinus Torvalds atomic_inc(&ctl_cp->n_control); 10641da177e4SLinus Torvalds } 10651da177e4SLinus Torvalds 10661da177e4SLinus Torvalds 10671da177e4SLinus Torvalds /* 10681da177e4SLinus Torvalds * IPVS application functions 10691da177e4SLinus Torvalds * (from ip_vs_app.c) 10701da177e4SLinus Torvalds */ 10711da177e4SLinus Torvalds #define IP_VS_APP_MAX_PORTS 8 1072ab8a5e84SHans Schillstrom extern int register_ip_vs_app(struct net *net, struct ip_vs_app *app); 1073ab8a5e84SHans Schillstrom extern void unregister_ip_vs_app(struct net *net, struct ip_vs_app *app); 10741da177e4SLinus Torvalds extern int ip_vs_bind_app(struct ip_vs_conn *cp, struct ip_vs_protocol *pp); 10751da177e4SLinus Torvalds extern void ip_vs_unbind_app(struct ip_vs_conn *cp); 
1076ab8a5e84SHans Schillstrom extern int register_ip_vs_app_inc(struct net *net, struct ip_vs_app *app, 1077ab8a5e84SHans Schillstrom __u16 proto, __u16 port); 10781da177e4SLinus Torvalds extern int ip_vs_app_inc_get(struct ip_vs_app *inc); 10791da177e4SLinus Torvalds extern void ip_vs_app_inc_put(struct ip_vs_app *inc); 10801da177e4SLinus Torvalds 10813db05feaSHerbert Xu extern int ip_vs_app_pkt_out(struct ip_vs_conn *, struct sk_buff *skb); 10823db05feaSHerbert Xu extern int ip_vs_app_pkt_in(struct ip_vs_conn *, struct sk_buff *skb); 10831da177e4SLinus Torvalds extern int ip_vs_app_init(void); 10841da177e4SLinus Torvalds extern void ip_vs_app_cleanup(void); 10851da177e4SLinus Torvalds 10868be67a66SSimon Horman void ip_vs_bind_pe(struct ip_vs_service *svc, struct ip_vs_pe *pe); 10878be67a66SSimon Horman void ip_vs_unbind_pe(struct ip_vs_service *svc); 10888be67a66SSimon Horman int register_ip_vs_pe(struct ip_vs_pe *pe); 10898be67a66SSimon Horman int unregister_ip_vs_pe(struct ip_vs_pe *pe); 1090e9e5eee8SSimon Horman struct ip_vs_pe *ip_vs_pe_getbyname(const char *name); 1091fe5e7a1eSHans Schillstrom struct ip_vs_pe *__ip_vs_pe_getbyname(const char *pe_name); 1092e9e5eee8SSimon Horman 1093e9e5eee8SSimon Horman static inline void ip_vs_pe_get(const struct ip_vs_pe *pe) 1094e9e5eee8SSimon Horman { 1095e9e5eee8SSimon Horman if (pe && pe->module) 1096e9e5eee8SSimon Horman __module_get(pe->module); 1097e9e5eee8SSimon Horman } 1098e9e5eee8SSimon Horman 1099e9e5eee8SSimon Horman static inline void ip_vs_pe_put(const struct ip_vs_pe *pe) 1100e9e5eee8SSimon Horman { 1101e9e5eee8SSimon Horman if (pe && pe->module) 1102e9e5eee8SSimon Horman module_put(pe->module); 1103e9e5eee8SSimon Horman } 11041da177e4SLinus Torvalds 11051da177e4SLinus Torvalds /* 11061da177e4SLinus Torvalds * IPVS protocol functions (from ip_vs_proto.c) 11071da177e4SLinus Torvalds */ 11081da177e4SLinus Torvalds extern int ip_vs_protocol_init(void); 11091da177e4SLinus Torvalds extern void 
ip_vs_protocol_cleanup(void); 11109330419dSHans Schillstrom extern void ip_vs_protocol_timeout_change(struct netns_ipvs *ipvs, int flags); 11111da177e4SLinus Torvalds extern int *ip_vs_create_timeout_table(int *table, int size); 11121da177e4SLinus Torvalds extern int 111336cbd3dcSJan Engelhardt ip_vs_set_state_timeout(int *table, int num, const char *const *names, 111436cbd3dcSJan Engelhardt const char *name, int to); 11151da177e4SLinus Torvalds extern void 11160d79641aSJulian Anastasov ip_vs_tcpudp_debug_packet(int af, struct ip_vs_protocol *pp, 11170d79641aSJulian Anastasov const struct sk_buff *skb, 11181da177e4SLinus Torvalds int offset, const char *msg); 11191da177e4SLinus Torvalds 11201da177e4SLinus Torvalds extern struct ip_vs_protocol ip_vs_protocol_tcp; 11211da177e4SLinus Torvalds extern struct ip_vs_protocol ip_vs_protocol_udp; 11221da177e4SLinus Torvalds extern struct ip_vs_protocol ip_vs_protocol_icmp; 11231da177e4SLinus Torvalds extern struct ip_vs_protocol ip_vs_protocol_esp; 11241da177e4SLinus Torvalds extern struct ip_vs_protocol ip_vs_protocol_ah; 11252906f66aSVenkata Mohan Reddy extern struct ip_vs_protocol ip_vs_protocol_sctp; 11261da177e4SLinus Torvalds 11271da177e4SLinus Torvalds /* 11281da177e4SLinus Torvalds * Registering/unregistering scheduler functions 11291da177e4SLinus Torvalds * (from ip_vs_sched.c) 11301da177e4SLinus Torvalds */ 11311da177e4SLinus Torvalds extern int register_ip_vs_scheduler(struct ip_vs_scheduler *scheduler); 11321da177e4SLinus Torvalds extern int unregister_ip_vs_scheduler(struct ip_vs_scheduler *scheduler); 11331da177e4SLinus Torvalds extern int ip_vs_bind_scheduler(struct ip_vs_service *svc, 11341da177e4SLinus Torvalds struct ip_vs_scheduler *scheduler); 11351da177e4SLinus Torvalds extern int ip_vs_unbind_scheduler(struct ip_vs_service *svc); 11361da177e4SLinus Torvalds extern struct ip_vs_scheduler *ip_vs_scheduler_get(const char *sched_name); 11371da177e4SLinus Torvalds extern void ip_vs_scheduler_put(struct 
ip_vs_scheduler *scheduler); 11381da177e4SLinus Torvalds extern struct ip_vs_conn * 1139190ecd27SJulian Anastasov ip_vs_schedule(struct ip_vs_service *svc, struct sk_buff *skb, 11409330419dSHans Schillstrom struct ip_vs_proto_data *pd, int *ignored); 11411da177e4SLinus Torvalds extern int ip_vs_leave(struct ip_vs_service *svc, struct sk_buff *skb, 11429330419dSHans Schillstrom struct ip_vs_proto_data *pd); 11431da177e4SLinus Torvalds 114441ac51eeSPatrick Schaaf extern void ip_vs_scheduler_err(struct ip_vs_service *svc, const char *msg); 114541ac51eeSPatrick Schaaf 11461da177e4SLinus Torvalds 11471da177e4SLinus Torvalds /* 11481da177e4SLinus Torvalds * IPVS control data and functions (from ip_vs_ctl.c) 11491da177e4SLinus Torvalds */ 11501da177e4SLinus Torvalds extern struct ip_vs_stats ip_vs_stats; 11515587da55SSven Wegener extern const struct ctl_path net_vs_ctl_path[]; 1152b880c1f0SHans Schillstrom extern int sysctl_ip_vs_sync_ver; 11531da177e4SLinus Torvalds 1154f131315fSHans Schillstrom extern void ip_vs_sync_switch_mode(struct net *net, int mode); 11551da177e4SLinus Torvalds extern struct ip_vs_service * 1156fc723250SHans Schillstrom ip_vs_service_get(struct net *net, int af, __u32 fwmark, __u16 protocol, 11573c2e0505SJulius Volz const union nf_inet_addr *vaddr, __be16 vport); 11581da177e4SLinus Torvalds 11591da177e4SLinus Torvalds static inline void ip_vs_service_put(struct ip_vs_service *svc) 11601da177e4SLinus Torvalds { 11611da177e4SLinus Torvalds atomic_dec(&svc->usecnt); 11621da177e4SLinus Torvalds } 11631da177e4SLinus Torvalds 11641da177e4SLinus Torvalds extern struct ip_vs_dest * 1165fc723250SHans Schillstrom ip_vs_lookup_real_service(struct net *net, int af, __u16 protocol, 11667937df15SJulius Volz const union nf_inet_addr *daddr, __be16 dport); 11677937df15SJulius Volz 11681da177e4SLinus Torvalds extern int ip_vs_use_count_inc(void); 11691da177e4SLinus Torvalds extern void ip_vs_use_count_dec(void); 11701da177e4SLinus Torvalds extern int 
ip_vs_control_init(void); 11711da177e4SLinus Torvalds extern void ip_vs_control_cleanup(void); 11721e356f9cSRumen G. Bogdanovski extern struct ip_vs_dest * 1173fc723250SHans Schillstrom ip_vs_find_dest(struct net *net, int af, const union nf_inet_addr *daddr, 1174fc723250SHans Schillstrom __be16 dport, const union nf_inet_addr *vaddr, __be16 vport, 1175fc723250SHans Schillstrom __u16 protocol, __u32 fwmark); 11761e356f9cSRumen G. Bogdanovski extern struct ip_vs_dest *ip_vs_try_bind_dest(struct ip_vs_conn *cp); 11771da177e4SLinus Torvalds 11781da177e4SLinus Torvalds 11791da177e4SLinus Torvalds /* 11801da177e4SLinus Torvalds * IPVS sync daemon data and function prototypes 11811da177e4SLinus Torvalds * (from ip_vs_sync.c) 11821da177e4SLinus Torvalds */ 1183f131315fSHans Schillstrom extern int start_sync_thread(struct net *net, int state, char *mcast_ifn, 1184f131315fSHans Schillstrom __u8 syncid); 1185f131315fSHans Schillstrom extern int stop_sync_thread(struct net *net, int state); 1186f131315fSHans Schillstrom extern void ip_vs_sync_conn(struct net *net, struct ip_vs_conn *cp); 118761b1ab45SHans Schillstrom extern int ip_vs_sync_init(void); 118861b1ab45SHans Schillstrom extern void ip_vs_sync_cleanup(void); 11891da177e4SLinus Torvalds 11901da177e4SLinus Torvalds 11911da177e4SLinus Torvalds /* 11921da177e4SLinus Torvalds * IPVS rate estimator prototypes (from ip_vs_est.c) 11931da177e4SLinus Torvalds */ 1194a919cf4bSSven Wegener extern int ip_vs_estimator_init(void); 1195a919cf4bSSven Wegener extern void ip_vs_estimator_cleanup(void); 119629c2026fSHans Schillstrom extern void ip_vs_new_estimator(struct net *net, struct ip_vs_stats *stats); 119729c2026fSHans Schillstrom extern void ip_vs_kill_estimator(struct net *net, struct ip_vs_stats *stats); 11981da177e4SLinus Torvalds extern void ip_vs_zero_estimator(struct ip_vs_stats *stats); 11991da177e4SLinus Torvalds 12001da177e4SLinus Torvalds /* 12011da177e4SLinus Torvalds * Various IPVS packet transmitters (from 
ip_vs_xmit.c) 12021da177e4SLinus Torvalds */ 12031da177e4SLinus Torvalds extern int ip_vs_null_xmit 12041da177e4SLinus Torvalds (struct sk_buff *skb, struct ip_vs_conn *cp, struct ip_vs_protocol *pp); 12051da177e4SLinus Torvalds extern int ip_vs_bypass_xmit 12061da177e4SLinus Torvalds (struct sk_buff *skb, struct ip_vs_conn *cp, struct ip_vs_protocol *pp); 12071da177e4SLinus Torvalds extern int ip_vs_nat_xmit 12081da177e4SLinus Torvalds (struct sk_buff *skb, struct ip_vs_conn *cp, struct ip_vs_protocol *pp); 12091da177e4SLinus Torvalds extern int ip_vs_tunnel_xmit 12101da177e4SLinus Torvalds (struct sk_buff *skb, struct ip_vs_conn *cp, struct ip_vs_protocol *pp); 12111da177e4SLinus Torvalds extern int ip_vs_dr_xmit 12121da177e4SLinus Torvalds (struct sk_buff *skb, struct ip_vs_conn *cp, struct ip_vs_protocol *pp); 12131da177e4SLinus Torvalds extern int ip_vs_icmp_xmit 12141da177e4SLinus Torvalds (struct sk_buff *skb, struct ip_vs_conn *cp, struct ip_vs_protocol *pp, int offset); 12151da177e4SLinus Torvalds extern void ip_vs_dst_reset(struct ip_vs_dest *dest); 12161da177e4SLinus Torvalds 1217b3cdd2a7SJulius Volz #ifdef CONFIG_IP_VS_IPV6 1218b3cdd2a7SJulius Volz extern int ip_vs_bypass_xmit_v6 1219b3cdd2a7SJulius Volz (struct sk_buff *skb, struct ip_vs_conn *cp, struct ip_vs_protocol *pp); 1220b3cdd2a7SJulius Volz extern int ip_vs_nat_xmit_v6 1221b3cdd2a7SJulius Volz (struct sk_buff *skb, struct ip_vs_conn *cp, struct ip_vs_protocol *pp); 1222b3cdd2a7SJulius Volz extern int ip_vs_tunnel_xmit_v6 1223b3cdd2a7SJulius Volz (struct sk_buff *skb, struct ip_vs_conn *cp, struct ip_vs_protocol *pp); 1224b3cdd2a7SJulius Volz extern int ip_vs_dr_xmit_v6 1225b3cdd2a7SJulius Volz (struct sk_buff *skb, struct ip_vs_conn *cp, struct ip_vs_protocol *pp); 1226b3cdd2a7SJulius Volz extern int ip_vs_icmp_xmit_v6 1227b3cdd2a7SJulius Volz (struct sk_buff *skb, struct ip_vs_conn *cp, struct ip_vs_protocol *pp, 1228b3cdd2a7SJulius Volz int offset); 1229b3cdd2a7SJulius Volz #endif 
12301da177e4SLinus Torvalds 12311da177e4SLinus Torvalds /* 12321da177e4SLinus Torvalds * This is a simple mechanism to ignore packets when 12331da177e4SLinus Torvalds * we are loaded. Just set ip_vs_drop_rate to 'n' and 12341da177e4SLinus Torvalds * we start to drop 1/rate of the packets 12351da177e4SLinus Torvalds */ 12361da177e4SLinus Torvalds 1237a0840e2eSHans Schillstrom static inline int ip_vs_todrop(struct netns_ipvs *ipvs) 12381da177e4SLinus Torvalds { 1239a0840e2eSHans Schillstrom if (!ipvs->drop_rate) 1240a0840e2eSHans Schillstrom return 0; 1241a0840e2eSHans Schillstrom if (--ipvs->drop_counter > 0) 1242a0840e2eSHans Schillstrom return 0; 1243a0840e2eSHans Schillstrom ipvs->drop_counter = ipvs->drop_rate; 12441da177e4SLinus Torvalds return 1; 12451da177e4SLinus Torvalds } 12461da177e4SLinus Torvalds 12471da177e4SLinus Torvalds /* 12481da177e4SLinus Torvalds * ip_vs_fwd_tag returns the forwarding tag of the connection 12491da177e4SLinus Torvalds */ 12501da177e4SLinus Torvalds #define IP_VS_FWD_METHOD(cp) (cp->flags & IP_VS_CONN_F_FWD_MASK) 12511da177e4SLinus Torvalds 1252732db659SAdrian Bunk static inline char ip_vs_fwd_tag(struct ip_vs_conn *cp) 12531da177e4SLinus Torvalds { 12541da177e4SLinus Torvalds char fwd; 12551da177e4SLinus Torvalds 12561da177e4SLinus Torvalds switch (IP_VS_FWD_METHOD(cp)) { 12571da177e4SLinus Torvalds case IP_VS_CONN_F_MASQ: 12581da177e4SLinus Torvalds fwd = 'M'; break; 12591da177e4SLinus Torvalds case IP_VS_CONN_F_LOCALNODE: 12601da177e4SLinus Torvalds fwd = 'L'; break; 12611da177e4SLinus Torvalds case IP_VS_CONN_F_TUNNEL: 12621da177e4SLinus Torvalds fwd = 'T'; break; 12631da177e4SLinus Torvalds case IP_VS_CONN_F_DROUTE: 12641da177e4SLinus Torvalds fwd = 'R'; break; 12651da177e4SLinus Torvalds case IP_VS_CONN_F_BYPASS: 12661da177e4SLinus Torvalds fwd = 'B'; break; 12671da177e4SLinus Torvalds default: 12681da177e4SLinus Torvalds fwd = '?'; break; 12691da177e4SLinus Torvalds } 12701da177e4SLinus Torvalds return fwd; 
12711da177e4SLinus Torvalds } 12721da177e4SLinus Torvalds 12731da177e4SLinus Torvalds extern void ip_vs_nat_icmp(struct sk_buff *skb, struct ip_vs_protocol *pp, 12741da177e4SLinus Torvalds struct ip_vs_conn *cp, int dir); 12751da177e4SLinus Torvalds 1276b3cdd2a7SJulius Volz #ifdef CONFIG_IP_VS_IPV6 1277b3cdd2a7SJulius Volz extern void ip_vs_nat_icmp_v6(struct sk_buff *skb, struct ip_vs_protocol *pp, 1278b3cdd2a7SJulius Volz struct ip_vs_conn *cp, int dir); 1279b3cdd2a7SJulius Volz #endif 1280b3cdd2a7SJulius Volz 1281b1550f22SAl Viro extern __sum16 ip_vs_checksum_complete(struct sk_buff *skb, int offset); 12821da177e4SLinus Torvalds 1283f9214b26SAl Viro static inline __wsum ip_vs_check_diff4(__be32 old, __be32 new, __wsum oldsum) 12841da177e4SLinus Torvalds { 1285f9214b26SAl Viro __be32 diff[2] = { ~old, new }; 12861da177e4SLinus Torvalds 128707f0757aSJoe Perches return csum_partial(diff, sizeof(diff), oldsum); 1288f9214b26SAl Viro } 1289f9214b26SAl Viro 12900bbdd42bSJulius Volz #ifdef CONFIG_IP_VS_IPV6 12910bbdd42bSJulius Volz static inline __wsum ip_vs_check_diff16(const __be32 *old, const __be32 *new, 12920bbdd42bSJulius Volz __wsum oldsum) 12930bbdd42bSJulius Volz { 12940bbdd42bSJulius Volz __be32 diff[8] = { ~old[3], ~old[2], ~old[1], ~old[0], 12950bbdd42bSJulius Volz new[3], new[2], new[1], new[0] }; 12960bbdd42bSJulius Volz 129707f0757aSJoe Perches return csum_partial(diff, sizeof(diff), oldsum); 12980bbdd42bSJulius Volz } 12990bbdd42bSJulius Volz #endif 13000bbdd42bSJulius Volz 1301f9214b26SAl Viro static inline __wsum ip_vs_check_diff2(__be16 old, __be16 new, __wsum oldsum) 1302f9214b26SAl Viro { 1303f9214b26SAl Viro __be16 diff[2] = { ~old, new }; 1304f9214b26SAl Viro 130507f0757aSJoe Perches return csum_partial(diff, sizeof(diff), oldsum); 13061da177e4SLinus Torvalds } 13071da177e4SLinus Torvalds 1308cf356d69SJulian Anastasov /* 1309cf356d69SJulian Anastasov * Forget current conntrack (unconfirmed) and attach notrack entry 1310cf356d69SJulian Anastasov */ 
1311cf356d69SJulian Anastasov static inline void ip_vs_notrack(struct sk_buff *skb) 1312cf356d69SJulian Anastasov { 1313cf356d69SJulian Anastasov #if defined(CONFIG_NF_CONNTRACK) || defined(CONFIG_NF_CONNTRACK_MODULE) 1314cf356d69SJulian Anastasov enum ip_conntrack_info ctinfo; 131506b69390SJesper Juhl struct nf_conn *ct = nf_ct_get(skb, &ctinfo); 1316cf356d69SJulian Anastasov 1317cf356d69SJulian Anastasov if (!ct || !nf_ct_is_untracked(ct)) { 1318cf356d69SJulian Anastasov nf_reset(skb); 1319cf356d69SJulian Anastasov skb->nfct = &nf_ct_untracked_get()->ct_general; 1320cf356d69SJulian Anastasov skb->nfctinfo = IP_CT_NEW; 1321cf356d69SJulian Anastasov nf_conntrack_get(skb->nfct); 1322cf356d69SJulian Anastasov } 1323cf356d69SJulian Anastasov #endif 1324cf356d69SJulian Anastasov } 1325cf356d69SJulian Anastasov 1326f4bc17cdSJulian Anastasov #ifdef CONFIG_IP_VS_NFCT 1327f4bc17cdSJulian Anastasov /* 1328f4bc17cdSJulian Anastasov * Netfilter connection tracking 1329f4bc17cdSJulian Anastasov * (from ip_vs_nfct.c) 1330f4bc17cdSJulian Anastasov */ 1331a0840e2eSHans Schillstrom static inline int ip_vs_conntrack_enabled(struct netns_ipvs *ipvs) 1332f4bc17cdSJulian Anastasov { 1333a0840e2eSHans Schillstrom return ipvs->sysctl_conntrack; 1334f4bc17cdSJulian Anastasov } 1335f4bc17cdSJulian Anastasov 13366523ce15SJulian Anastasov extern void ip_vs_update_conntrack(struct sk_buff *skb, struct ip_vs_conn *cp, 13376523ce15SJulian Anastasov int outin); 1338f4bc17cdSJulian Anastasov extern int ip_vs_confirm_conntrack(struct sk_buff *skb, struct ip_vs_conn *cp); 1339f4bc17cdSJulian Anastasov extern void ip_vs_nfct_expect_related(struct sk_buff *skb, struct nf_conn *ct, 1340f4bc17cdSJulian Anastasov struct ip_vs_conn *cp, u_int8_t proto, 1341f4bc17cdSJulian Anastasov const __be16 port, int from_rs); 1342f4bc17cdSJulian Anastasov extern void ip_vs_conn_drop_conntrack(struct ip_vs_conn *cp); 1343f4bc17cdSJulian Anastasov 1344f4bc17cdSJulian Anastasov #else 1345f4bc17cdSJulian Anastasov 
1346a0840e2eSHans Schillstrom static inline int ip_vs_conntrack_enabled(struct netns_ipvs *ipvs) 1347f4bc17cdSJulian Anastasov { 1348f4bc17cdSJulian Anastasov return 0; 1349f4bc17cdSJulian Anastasov } 1350f4bc17cdSJulian Anastasov 1351f4bc17cdSJulian Anastasov static inline void ip_vs_update_conntrack(struct sk_buff *skb, 1352f4bc17cdSJulian Anastasov struct ip_vs_conn *cp, int outin) 1353f4bc17cdSJulian Anastasov { 1354f4bc17cdSJulian Anastasov } 1355f4bc17cdSJulian Anastasov 1356f4bc17cdSJulian Anastasov static inline int ip_vs_confirm_conntrack(struct sk_buff *skb, 1357f4bc17cdSJulian Anastasov struct ip_vs_conn *cp) 1358f4bc17cdSJulian Anastasov { 1359f4bc17cdSJulian Anastasov return NF_ACCEPT; 1360f4bc17cdSJulian Anastasov } 1361f4bc17cdSJulian Anastasov 1362f4bc17cdSJulian Anastasov static inline void ip_vs_conn_drop_conntrack(struct ip_vs_conn *cp) 1363f4bc17cdSJulian Anastasov { 1364f4bc17cdSJulian Anastasov } 1365f4bc17cdSJulian Anastasov /* CONFIG_IP_VS_NFCT */ 1366f4bc17cdSJulian Anastasov #endif 13676523ce15SJulian Anastasov 1368b552f7e3SChangli Gao static inline unsigned int 1369b552f7e3SChangli Gao ip_vs_dest_conn_overhead(struct ip_vs_dest *dest) 1370b552f7e3SChangli Gao { 1371b552f7e3SChangli Gao /* 1372b552f7e3SChangli Gao * We think the overhead of processing active connections is 256 1373b552f7e3SChangli Gao * times higher than that of inactive connections in average. (This 1374b552f7e3SChangli Gao * 256 times might not be accurate, we will change it later) We 1375b552f7e3SChangli Gao * use the following formula to estimate the overhead now: 1376b552f7e3SChangli Gao * dest->activeconns*256 + dest->inactconns 1377b552f7e3SChangli Gao */ 1378b552f7e3SChangli Gao return (atomic_read(&dest->activeconns) << 8) + 1379b552f7e3SChangli Gao atomic_read(&dest->inactconns); 1380b552f7e3SChangli Gao } 1381b552f7e3SChangli Gao 13821da177e4SLinus Torvalds #endif /* __KERNEL__ */ 13831da177e4SLinus Torvalds 1384bc4768ebSJulius Volz #endif /* _NET_IP_VS_H */ 1385