11da177e4SLinus Torvalds /* 21da177e4SLinus Torvalds * IP Virtual Server 31da177e4SLinus Torvalds * data structure and functionality definitions 41da177e4SLinus Torvalds */ 51da177e4SLinus Torvalds 6bc4768ebSJulius Volz #ifndef _NET_IP_VS_H 7bc4768ebSJulius Volz #define _NET_IP_VS_H 81da177e4SLinus Torvalds 9bc4768ebSJulius Volz #include <linux/ip_vs.h> /* definitions shared with userland */ 101da177e4SLinus Torvalds 11bc4768ebSJulius Volz /* old ipvsadm versions still include this file directly */ 121da177e4SLinus Torvalds #ifdef __KERNEL__ 131da177e4SLinus Torvalds 14bc4768ebSJulius Volz #include <asm/types.h> /* for __uXX types */ 15bc4768ebSJulius Volz 16bc4768ebSJulius Volz #include <linux/sysctl.h> /* for ctl_path */ 171da177e4SLinus Torvalds #include <linux/list.h> /* for struct list_head */ 181da177e4SLinus Torvalds #include <linux/spinlock.h> /* for struct rwlock_t */ 191da177e4SLinus Torvalds #include <asm/atomic.h> /* for struct atomic_t */ 201da177e4SLinus Torvalds #include <linux/compiler.h> 2114c85021SArnaldo Carvalho de Melo #include <linux/timer.h> 221da177e4SLinus Torvalds 2314c85021SArnaldo Carvalho de Melo #include <net/checksum.h> 24e7ade46aSJulius Volz #include <linux/netfilter.h> /* for union nf_inet_addr */ 251668e010SKOVACS Krisztian #include <linux/ip.h> 26e7ade46aSJulius Volz #include <linux/ipv6.h> /* for struct ipv6hdr */ 27e7ade46aSJulius Volz #include <net/ipv6.h> /* for ipv6_addr_copy */ 28cf356d69SJulian Anastasov #if defined(CONFIG_NF_CONNTRACK) || defined(CONFIG_NF_CONNTRACK_MODULE) 29f4bc17cdSJulian Anastasov #include <net/netfilter/nf_conntrack.h> 30f4bc17cdSJulian Anastasov #endif 3161b1ab45SHans Schillstrom #include <net/net_namespace.h> /* Netw namespace */ 3261b1ab45SHans Schillstrom 3361b1ab45SHans Schillstrom /* 3461b1ab45SHans Schillstrom * Generic access of ipvs struct 3561b1ab45SHans Schillstrom */ 3661b1ab45SHans Schillstrom static inline struct netns_ipvs *net_ipvs(struct net* net) 3761b1ab45SHans Schillstrom { 3861b1ab45SHans Schillstrom return net->ipvs; 3961b1ab45SHans Schillstrom } 40fc723250SHans Schillstrom /* 41fc723250SHans Schillstrom * Get net ptr from skb in traffic cases 42fc723250SHans Schillstrom * use skb_sknet when call is from userland (ioctl or netlink) 43fc723250SHans Schillstrom */ 44a0840e2eSHans Schillstrom static inline struct net *skb_net(const struct sk_buff *skb) 45fc723250SHans Schillstrom { 46fc723250SHans Schillstrom #ifdef CONFIG_NET_NS 47fc723250SHans Schillstrom #ifdef CONFIG_IP_VS_DEBUG 48fc723250SHans Schillstrom /* 49fc723250SHans Schillstrom * This is used for debug only. 50fc723250SHans Schillstrom * Start with the most likely hit 51fc723250SHans Schillstrom * End with BUG 52fc723250SHans Schillstrom */ 53fc723250SHans Schillstrom if (likely(skb->dev && skb->dev->nd_net)) 54fc723250SHans Schillstrom return dev_net(skb->dev); 55fc723250SHans Schillstrom if (skb_dst(skb)->dev) 56fc723250SHans Schillstrom return dev_net(skb_dst(skb)->dev); 57fc723250SHans Schillstrom WARN(skb->sk, "Maybe skb_sknet should be used in %s() at line:%d\n", 58fc723250SHans Schillstrom __func__, __LINE__); 59fc723250SHans Schillstrom if (likely(skb->sk && skb->sk->sk_net)) 60fc723250SHans Schillstrom return sock_net(skb->sk); 61fc723250SHans Schillstrom pr_err("There is no net ptr to find in the skb in %s() line:%d\n", 62fc723250SHans Schillstrom __func__, __LINE__); 63fc723250SHans Schillstrom BUG(); 64fc723250SHans Schillstrom #else 65fc723250SHans Schillstrom return dev_net(skb->dev ? : skb_dst(skb)->dev); 66fc723250SHans Schillstrom #endif 67fc723250SHans Schillstrom #else 68fc723250SHans Schillstrom return &init_net; 69fc723250SHans Schillstrom #endif 70fc723250SHans Schillstrom } 71fc723250SHans Schillstrom 72a0840e2eSHans Schillstrom static inline struct net *skb_sknet(const struct sk_buff *skb) 73fc723250SHans Schillstrom { 74fc723250SHans Schillstrom #ifdef CONFIG_NET_NS 75fc723250SHans Schillstrom #ifdef CONFIG_IP_VS_DEBUG 76fc723250SHans Schillstrom /* Start with the most likely hit */ 77fc723250SHans Schillstrom if (likely(skb->sk && skb->sk->sk_net)) 78fc723250SHans Schillstrom return sock_net(skb->sk); 79fc723250SHans Schillstrom WARN(skb->dev, "Maybe skb_net should be used instead in %s() line:%d\n", 80fc723250SHans Schillstrom __func__, __LINE__); 81fc723250SHans Schillstrom if (likely(skb->dev && skb->dev->nd_net)) 82fc723250SHans Schillstrom return dev_net(skb->dev); 83fc723250SHans Schillstrom pr_err("There is no net ptr to find in the skb in %s() line:%d\n", 84fc723250SHans Schillstrom __func__, __LINE__); 85fc723250SHans Schillstrom BUG(); 86fc723250SHans Schillstrom #else 87fc723250SHans Schillstrom return sock_net(skb->sk); 88fc723250SHans Schillstrom #endif 89fc723250SHans Schillstrom #else 90fc723250SHans Schillstrom return &init_net; 91fc723250SHans Schillstrom #endif 92fc723250SHans Schillstrom } 93b17fc996SHans Schillstrom /* 94b17fc996SHans Schillstrom * This one needed for single_open_net since net is stored directly in 95b17fc996SHans Schillstrom * private not as a struct i.e. seq_file_net cant be used. 96b17fc996SHans Schillstrom */ 97b17fc996SHans Schillstrom static inline struct net *seq_file_single_net(struct seq_file *seq) 98b17fc996SHans Schillstrom { 99b17fc996SHans Schillstrom #ifdef CONFIG_NET_NS 100b17fc996SHans Schillstrom return (struct net *)seq->private; 101b17fc996SHans Schillstrom #else 102b17fc996SHans Schillstrom return &init_net; 103b17fc996SHans Schillstrom #endif 104b17fc996SHans Schillstrom } 1056f7edb48SCatalin(ux) M. BOIE 1066f7edb48SCatalin(ux) M. BOIE /* Connections' size value needed by ip_vs_ctl.c */ 1076f7edb48SCatalin(ux) M. BOIE extern int ip_vs_conn_tab_size; 1086f7edb48SCatalin(ux) M. BOIE 1096f7edb48SCatalin(ux) M. BOIE 11064aae3cbSJulius Volz struct ip_vs_iphdr { 11164aae3cbSJulius Volz int len; 11264aae3cbSJulius Volz __u8 protocol; 11364aae3cbSJulius Volz union nf_inet_addr saddr; 11464aae3cbSJulius Volz union nf_inet_addr daddr; 11564aae3cbSJulius Volz }; 11664aae3cbSJulius Volz 11764aae3cbSJulius Volz static inline void 11864aae3cbSJulius Volz ip_vs_fill_iphdr(int af, const void *nh, struct ip_vs_iphdr *iphdr) 11964aae3cbSJulius Volz { 12064aae3cbSJulius Volz #ifdef CONFIG_IP_VS_IPV6 12164aae3cbSJulius Volz if (af == AF_INET6) { 12264aae3cbSJulius Volz const struct ipv6hdr *iph = nh; 12364aae3cbSJulius Volz iphdr->len = sizeof(struct ipv6hdr); 12464aae3cbSJulius Volz iphdr->protocol = iph->nexthdr; 12564aae3cbSJulius Volz ipv6_addr_copy(&iphdr->saddr.in6, &iph->saddr); 12664aae3cbSJulius Volz ipv6_addr_copy(&iphdr->daddr.in6, &iph->daddr); 12764aae3cbSJulius Volz } else 12864aae3cbSJulius Volz #endif 12964aae3cbSJulius Volz { 13064aae3cbSJulius Volz const struct iphdr *iph = nh; 13164aae3cbSJulius Volz iphdr->len = iph->ihl * 4; 13264aae3cbSJulius Volz iphdr->protocol = iph->protocol; 13364aae3cbSJulius Volz iphdr->saddr.ip = iph->saddr; 13464aae3cbSJulius Volz iphdr->daddr.ip = iph->daddr; 13564aae3cbSJulius Volz } 13664aae3cbSJulius Volz } 13764aae3cbSJulius Volz 13864aae3cbSJulius Volz static inline void ip_vs_addr_copy(int af, union nf_inet_addr *dst, 13964aae3cbSJulius Volz const union nf_inet_addr *src) 14064aae3cbSJulius Volz { 14164aae3cbSJulius Volz #ifdef CONFIG_IP_VS_IPV6 14264aae3cbSJulius Volz if (af == AF_INET6) 14364aae3cbSJulius Volz ipv6_addr_copy(&dst->in6, &src->in6); 14464aae3cbSJulius Volz else 14564aae3cbSJulius Volz #endif 14664aae3cbSJulius Volz dst->ip = src->ip; 14764aae3cbSJulius Volz } 14864aae3cbSJulius Volz 14964aae3cbSJulius Volz static inline int ip_vs_addr_equal(int af, const union nf_inet_addr *a, 15064aae3cbSJulius Volz const union nf_inet_addr *b) 15164aae3cbSJulius Volz { 15264aae3cbSJulius Volz #ifdef CONFIG_IP_VS_IPV6 15364aae3cbSJulius Volz if (af == AF_INET6) 15464aae3cbSJulius Volz return ipv6_addr_equal(&a->in6, &b->in6); 15564aae3cbSJulius Volz #endif 15664aae3cbSJulius Volz return a->ip == b->ip; 15764aae3cbSJulius Volz } 15864aae3cbSJulius Volz 1591da177e4SLinus Torvalds #ifdef CONFIG_IP_VS_DEBUG 16014c85021SArnaldo Carvalho de Melo #include <linux/net.h> 16114c85021SArnaldo Carvalho de Melo 1621da177e4SLinus Torvalds extern int ip_vs_get_debug_level(void); 163c842a3adSJulius Volz 164c842a3adSJulius Volz static inline const char *ip_vs_dbg_addr(int af, char *buf, size_t buf_len, 165c842a3adSJulius Volz const union nf_inet_addr *addr, 166c842a3adSJulius Volz int *idx) 167c842a3adSJulius Volz { 168c842a3adSJulius Volz int len; 169c842a3adSJulius Volz #ifdef CONFIG_IP_VS_IPV6 170c842a3adSJulius Volz if (af == AF_INET6) 1715b095d98SHarvey Harrison len = snprintf(&buf[*idx], buf_len - *idx, "[%pI6]", 1720c6ce78aSHarvey Harrison &addr->in6) + 1; 173c842a3adSJulius Volz else 174c842a3adSJulius Volz #endif 1753685f25dSHarvey Harrison len = snprintf(&buf[*idx], buf_len - *idx, "%pI4", 1763685f25dSHarvey Harrison &addr->ip) + 1; 177c842a3adSJulius Volz 178c842a3adSJulius Volz *idx += len; 179c842a3adSJulius Volz BUG_ON(*idx > buf_len + 1); 180c842a3adSJulius Volz return &buf[*idx - len]; 181c842a3adSJulius Volz } 182c842a3adSJulius Volz 1839aada7acSHannes Eder #define IP_VS_DBG_BUF(level, msg, ...) \ 184c842a3adSJulius Volz do { \ 185c842a3adSJulius Volz char ip_vs_dbg_buf[160]; \ 186c842a3adSJulius Volz int ip_vs_dbg_idx = 0; \ 187c842a3adSJulius Volz if (level <= ip_vs_get_debug_level()) \ 1889aada7acSHannes Eder printk(KERN_DEBUG pr_fmt(msg), ##__VA_ARGS__); \ 189c842a3adSJulius Volz } while (0) 190c842a3adSJulius Volz #define IP_VS_ERR_BUF(msg...) \ 191c842a3adSJulius Volz do { \ 192c842a3adSJulius Volz char ip_vs_dbg_buf[160]; \ 193c842a3adSJulius Volz int ip_vs_dbg_idx = 0; \ 1949aada7acSHannes Eder pr_err(msg); \ 195c842a3adSJulius Volz } while (0) 196c842a3adSJulius Volz 197c842a3adSJulius Volz /* Only use from within IP_VS_DBG_BUF() or IP_VS_ERR_BUF macros */ 198c842a3adSJulius Volz #define IP_VS_DBG_ADDR(af, addr) \ 199c842a3adSJulius Volz ip_vs_dbg_addr(af, ip_vs_dbg_buf, \ 200c842a3adSJulius Volz sizeof(ip_vs_dbg_buf), addr, \ 201c842a3adSJulius Volz &ip_vs_dbg_idx) 202c842a3adSJulius Volz 2039aada7acSHannes Eder #define IP_VS_DBG(level, msg, ...) \ 2041da177e4SLinus Torvalds do { \ 2051da177e4SLinus Torvalds if (level <= ip_vs_get_debug_level()) \ 2069aada7acSHannes Eder printk(KERN_DEBUG pr_fmt(msg), ##__VA_ARGS__); \ 2071da177e4SLinus Torvalds } while (0) 2089aada7acSHannes Eder #define IP_VS_DBG_RL(msg, ...) \ 2091da177e4SLinus Torvalds do { \ 2101da177e4SLinus Torvalds if (net_ratelimit()) \ 2119aada7acSHannes Eder printk(KERN_DEBUG pr_fmt(msg), ##__VA_ARGS__); \ 2121da177e4SLinus Torvalds } while (0) 2130d79641aSJulian Anastasov #define IP_VS_DBG_PKT(level, af, pp, skb, ofs, msg) \ 2141da177e4SLinus Torvalds do { \ 2151da177e4SLinus Torvalds if (level <= ip_vs_get_debug_level()) \ 2160d79641aSJulian Anastasov pp->debug_packet(af, pp, skb, ofs, msg); \ 2171da177e4SLinus Torvalds } while (0) 2180d79641aSJulian Anastasov #define IP_VS_DBG_RL_PKT(level, af, pp, skb, ofs, msg) \ 2191da177e4SLinus Torvalds do { \ 2201da177e4SLinus Torvalds if (level <= ip_vs_get_debug_level() && \ 2211da177e4SLinus Torvalds net_ratelimit()) \ 2220d79641aSJulian Anastasov pp->debug_packet(af, pp, skb, ofs, msg); \ 2231da177e4SLinus Torvalds } while (0) 2241da177e4SLinus Torvalds #else /* NO DEBUGGING at ALL */ 225c842a3adSJulius Volz #define IP_VS_DBG_BUF(level, msg...) do {} while (0) 226c842a3adSJulius Volz #define IP_VS_ERR_BUF(msg...) do {} while (0) 2271da177e4SLinus Torvalds #define IP_VS_DBG(level, msg...) do {} while (0) 2281da177e4SLinus Torvalds #define IP_VS_DBG_RL(msg...) do {} while (0) 2290d79641aSJulian Anastasov #define IP_VS_DBG_PKT(level, af, pp, skb, ofs, msg) do {} while (0) 2300d79641aSJulian Anastasov #define IP_VS_DBG_RL_PKT(level, af, pp, skb, ofs, msg) do {} while (0) 2311da177e4SLinus Torvalds #endif 2321da177e4SLinus Torvalds 2331da177e4SLinus Torvalds #define IP_VS_BUG() BUG() 2341e3e238eSHannes Eder #define IP_VS_ERR_RL(msg, ...) \ 2351da177e4SLinus Torvalds do { \ 2361da177e4SLinus Torvalds if (net_ratelimit()) \ 2371e3e238eSHannes Eder pr_err(msg, ##__VA_ARGS__); \ 2381da177e4SLinus Torvalds } while (0) 2391da177e4SLinus Torvalds 2401da177e4SLinus Torvalds #ifdef CONFIG_IP_VS_DEBUG 2411da177e4SLinus Torvalds #define EnterFunction(level) \ 2421da177e4SLinus Torvalds do { \ 2431da177e4SLinus Torvalds if (level <= ip_vs_get_debug_level()) \ 2449aada7acSHannes Eder printk(KERN_DEBUG \ 2459aada7acSHannes Eder pr_fmt("Enter: %s, %s line %i\n"), \ 246d5c003b4SHarvey Harrison __func__, __FILE__, __LINE__); \ 2471da177e4SLinus Torvalds } while (0) 2481da177e4SLinus Torvalds #define LeaveFunction(level) \ 2491da177e4SLinus Torvalds do { \ 2501da177e4SLinus Torvalds if (level <= ip_vs_get_debug_level()) \ 2519aada7acSHannes Eder printk(KERN_DEBUG \ 2529aada7acSHannes Eder pr_fmt("Leave: %s, %s line %i\n"), \ 253d5c003b4SHarvey Harrison __func__, __FILE__, __LINE__); \ 2541da177e4SLinus Torvalds } while (0) 2551da177e4SLinus Torvalds #else 2561da177e4SLinus Torvalds #define EnterFunction(level) do {} while (0) 2571da177e4SLinus Torvalds #define LeaveFunction(level) do {} while (0) 2581da177e4SLinus Torvalds #endif 2591da177e4SLinus Torvalds 2601da177e4SLinus Torvalds #define IP_VS_WAIT_WHILE(expr) while (expr) { cpu_relax(); } 2611da177e4SLinus Torvalds 2621da177e4SLinus Torvalds 2631da177e4SLinus Torvalds /* 2641da177e4SLinus Torvalds * The port number of FTP service (in network order). 2651da177e4SLinus Torvalds */ 266f3a7c66bSHarvey Harrison #define FTPPORT cpu_to_be16(21) 267f3a7c66bSHarvey Harrison #define FTPDATA cpu_to_be16(20) 2681da177e4SLinus Torvalds 2691da177e4SLinus Torvalds /* 2701da177e4SLinus Torvalds * TCP State Values 2711da177e4SLinus Torvalds */ 2721da177e4SLinus Torvalds enum { 2731da177e4SLinus Torvalds IP_VS_TCP_S_NONE = 0, 2741da177e4SLinus Torvalds IP_VS_TCP_S_ESTABLISHED, 2751da177e4SLinus Torvalds IP_VS_TCP_S_SYN_SENT, 2761da177e4SLinus Torvalds IP_VS_TCP_S_SYN_RECV, 2771da177e4SLinus Torvalds IP_VS_TCP_S_FIN_WAIT, 2781da177e4SLinus Torvalds IP_VS_TCP_S_TIME_WAIT, 2791da177e4SLinus Torvalds IP_VS_TCP_S_CLOSE, 2801da177e4SLinus Torvalds IP_VS_TCP_S_CLOSE_WAIT, 2811da177e4SLinus Torvalds IP_VS_TCP_S_LAST_ACK, 2821da177e4SLinus Torvalds IP_VS_TCP_S_LISTEN, 2831da177e4SLinus Torvalds IP_VS_TCP_S_SYNACK, 2841da177e4SLinus Torvalds IP_VS_TCP_S_LAST 2851da177e4SLinus Torvalds }; 2861da177e4SLinus Torvalds 2871da177e4SLinus Torvalds /* 2881da177e4SLinus Torvalds * UDP State Values 2891da177e4SLinus Torvalds */ 2901da177e4SLinus Torvalds enum { 2911da177e4SLinus Torvalds IP_VS_UDP_S_NORMAL, 2921da177e4SLinus Torvalds IP_VS_UDP_S_LAST, 2931da177e4SLinus Torvalds }; 2941da177e4SLinus Torvalds 2951da177e4SLinus Torvalds /* 2961da177e4SLinus Torvalds * ICMP State Values 2971da177e4SLinus Torvalds */ 2981da177e4SLinus Torvalds enum { 2991da177e4SLinus Torvalds IP_VS_ICMP_S_NORMAL, 3001da177e4SLinus Torvalds IP_VS_ICMP_S_LAST, 3011da177e4SLinus Torvalds }; 3021da177e4SLinus Torvalds 3031da177e4SLinus Torvalds /* 3042906f66aSVenkata Mohan Reddy * SCTP State Values 3052906f66aSVenkata Mohan Reddy */ 3062906f66aSVenkata Mohan Reddy enum ip_vs_sctp_states { 3072906f66aSVenkata Mohan Reddy IP_VS_SCTP_S_NONE, 3082906f66aSVenkata Mohan Reddy IP_VS_SCTP_S_INIT_CLI, 3092906f66aSVenkata Mohan Reddy IP_VS_SCTP_S_INIT_SER, 3102906f66aSVenkata Mohan Reddy IP_VS_SCTP_S_INIT_ACK_CLI, 3112906f66aSVenkata Mohan Reddy IP_VS_SCTP_S_INIT_ACK_SER, 3122906f66aSVenkata Mohan Reddy IP_VS_SCTP_S_ECHO_CLI, 3132906f66aSVenkata Mohan Reddy IP_VS_SCTP_S_ECHO_SER, 3142906f66aSVenkata Mohan Reddy IP_VS_SCTP_S_ESTABLISHED, 3152906f66aSVenkata Mohan Reddy IP_VS_SCTP_S_SHUT_CLI, 3162906f66aSVenkata Mohan Reddy IP_VS_SCTP_S_SHUT_SER, 3172906f66aSVenkata Mohan Reddy IP_VS_SCTP_S_SHUT_ACK_CLI, 3182906f66aSVenkata Mohan Reddy IP_VS_SCTP_S_SHUT_ACK_SER, 3192906f66aSVenkata Mohan Reddy IP_VS_SCTP_S_CLOSED, 3202906f66aSVenkata Mohan Reddy IP_VS_SCTP_S_LAST 3212906f66aSVenkata Mohan Reddy }; 3222906f66aSVenkata Mohan Reddy 3232906f66aSVenkata Mohan Reddy /* 3241da177e4SLinus Torvalds * Delta sequence info structure 3251da177e4SLinus Torvalds * Each ip_vs_conn has 2 (output AND input seq. changes). 3261da177e4SLinus Torvalds * Only used in the VS/NAT. 3271da177e4SLinus Torvalds */ 3281da177e4SLinus Torvalds struct ip_vs_seq { 3291da177e4SLinus Torvalds __u32 init_seq; /* Add delta from this seq */ 3301da177e4SLinus Torvalds __u32 delta; /* Delta in sequence numbers */ 3311da177e4SLinus Torvalds __u32 previous_delta; /* Delta in sequence numbers 3321da177e4SLinus Torvalds before last resized pkt */ 3331da177e4SLinus Torvalds }; 3341da177e4SLinus Torvalds 335b17fc996SHans Schillstrom /* 336b17fc996SHans Schillstrom * counters per cpu 337b17fc996SHans Schillstrom */ 338b17fc996SHans Schillstrom struct ip_vs_counters { 339b17fc996SHans Schillstrom __u32 conns; /* connections scheduled */ 340b17fc996SHans Schillstrom __u32 inpkts; /* incoming packets */ 341b17fc996SHans Schillstrom __u32 outpkts; /* outgoing packets */ 342b17fc996SHans Schillstrom __u64 inbytes; /* incoming bytes */ 343b17fc996SHans Schillstrom __u64 outbytes; /* outgoing bytes */ 344b17fc996SHans Schillstrom }; 345b17fc996SHans Schillstrom /* 346b17fc996SHans Schillstrom * Stats per cpu 347b17fc996SHans Schillstrom */ 348b17fc996SHans Schillstrom struct ip_vs_cpu_stats { 349b17fc996SHans Schillstrom struct ip_vs_counters ustats; 350b17fc996SHans Schillstrom struct u64_stats_sync syncp; 351b17fc996SHans Schillstrom }; 3521da177e4SLinus Torvalds 3531da177e4SLinus Torvalds /* 3543a14a313SSven Wegener * IPVS statistics objects 3551da177e4SLinus Torvalds */ 3563a14a313SSven Wegener struct ip_vs_estimator { 3573a14a313SSven Wegener struct list_head list; 3583a14a313SSven Wegener 3593a14a313SSven Wegener u64 last_inbytes; 3603a14a313SSven Wegener u64 last_outbytes; 3613a14a313SSven Wegener u32 last_conns; 3623a14a313SSven Wegener u32 last_inpkts; 3633a14a313SSven Wegener u32 last_outpkts; 3643a14a313SSven Wegener 3653a14a313SSven Wegener u32 cps; 3663a14a313SSven Wegener u32 inpps; 3673a14a313SSven Wegener u32 outpps; 3683a14a313SSven Wegener u32 inbps; 3693a14a313SSven Wegener u32 outbps; 3703a14a313SSven Wegener }; 3713a14a313SSven Wegener 372fd2c3ef7SEric Dumazet struct ip_vs_stats { 373e9c0ce23SSven Wegener struct ip_vs_stats_user ustats; /* statistics */ 374e9c0ce23SSven Wegener struct ip_vs_estimator est; /* estimator */ 375b17fc996SHans Schillstrom struct ip_vs_cpu_stats *cpustats; /* per cpu counters */ 3761da177e4SLinus Torvalds spinlock_t lock; /* spin lock */ 3771da177e4SLinus Torvalds }; 3781da177e4SLinus Torvalds 379b17fc996SHans Schillstrom /* 380b17fc996SHans Schillstrom * Helper Macros for per cpu 381b17fc996SHans Schillstrom * ipvs->tot_stats->ustats.count 382b17fc996SHans Schillstrom */ 383b17fc996SHans Schillstrom #define IPVS_STAT_INC(ipvs, count) \ 384b17fc996SHans Schillstrom __this_cpu_inc((ipvs)->ustats->count) 385b17fc996SHans Schillstrom 386b17fc996SHans Schillstrom #define IPVS_STAT_ADD(ipvs, count, value) \ 387b17fc996SHans Schillstrom do {\ 388b17fc996SHans Schillstrom write_seqcount_begin(per_cpu_ptr((ipvs)->ustats_seq, \ 389b17fc996SHans Schillstrom raw_smp_processor_id())); \ 390b17fc996SHans Schillstrom __this_cpu_add((ipvs)->ustats->count, value); \ 391b17fc996SHans Schillstrom write_seqcount_end(per_cpu_ptr((ipvs)->ustats_seq, \ 392b17fc996SHans Schillstrom raw_smp_processor_id())); \ 393b17fc996SHans Schillstrom } while (0) 394b17fc996SHans Schillstrom 39514c85021SArnaldo Carvalho de Melo struct dst_entry; 39614c85021SArnaldo Carvalho de Melo struct iphdr; 3971da177e4SLinus Torvalds struct ip_vs_conn; 3981da177e4SLinus Torvalds struct ip_vs_app; 39914c85021SArnaldo Carvalho de Melo struct sk_buff; 400252c6410SHans Schillstrom struct ip_vs_proto_data; 4011da177e4SLinus Torvalds 4021da177e4SLinus Torvalds struct ip_vs_protocol { 4031da177e4SLinus Torvalds struct ip_vs_protocol *next; 4041da177e4SLinus Torvalds char *name; 4052ad17defSJulian Anastasov u16 protocol; 4062ad17defSJulian Anastasov u16 num_states; 4071da177e4SLinus Torvalds int dont_defrag; 4081da177e4SLinus Torvalds 4091da177e4SLinus Torvalds void (*init)(struct ip_vs_protocol *pp); 4101da177e4SLinus Torvalds 4111da177e4SLinus Torvalds void (*exit)(struct ip_vs_protocol *pp); 4121da177e4SLinus Torvalds 413252c6410SHans Schillstrom void (*init_netns)(struct net *net, struct ip_vs_proto_data *pd); 414252c6410SHans Schillstrom 415252c6410SHans Schillstrom void (*exit_netns)(struct net *net, struct ip_vs_proto_data *pd); 416252c6410SHans Schillstrom 41751ef348bSJulius Volz int (*conn_schedule)(int af, struct sk_buff *skb, 4189330419dSHans Schillstrom struct ip_vs_proto_data *pd, 4191da177e4SLinus Torvalds int *verdict, struct ip_vs_conn **cpp); 4201da177e4SLinus Torvalds 4211da177e4SLinus Torvalds struct ip_vs_conn * 42251ef348bSJulius Volz (*conn_in_get)(int af, 42351ef348bSJulius Volz const struct sk_buff *skb, 42451ef348bSJulius Volz const struct ip_vs_iphdr *iph, 4251da177e4SLinus Torvalds unsigned int proto_off, 4261da177e4SLinus Torvalds int inverse); 4271da177e4SLinus Torvalds 4281da177e4SLinus Torvalds struct ip_vs_conn * 42951ef348bSJulius Volz (*conn_out_get)(int af, 43051ef348bSJulius Volz const struct sk_buff *skb, 43151ef348bSJulius Volz const struct ip_vs_iphdr *iph, 4321da177e4SLinus Torvalds unsigned int proto_off, 4331da177e4SLinus Torvalds int inverse); 4341da177e4SLinus Torvalds 4353db05feaSHerbert Xu int (*snat_handler)(struct sk_buff *skb, 4361da177e4SLinus Torvalds struct ip_vs_protocol *pp, struct ip_vs_conn *cp); 4371da177e4SLinus Torvalds 4383db05feaSHerbert Xu int (*dnat_handler)(struct sk_buff *skb, 4391da177e4SLinus Torvalds struct ip_vs_protocol *pp, struct ip_vs_conn *cp); 4401da177e4SLinus Torvalds 44151ef348bSJulius Volz int (*csum_check)(int af, struct sk_buff *skb, 44251ef348bSJulius Volz struct ip_vs_protocol *pp); 4431da177e4SLinus Torvalds 4441da177e4SLinus Torvalds const char *(*state_name)(int state); 4451da177e4SLinus Torvalds 4461da177e4SLinus Torvalds int (*state_transition)(struct ip_vs_conn *cp, int direction, 4471da177e4SLinus Torvalds const struct sk_buff *skb, 4489330419dSHans Schillstrom struct ip_vs_proto_data *pd); 4491da177e4SLinus Torvalds 450ab8a5e84SHans Schillstrom int (*register_app)(struct net *net, struct ip_vs_app *inc); 4511da177e4SLinus Torvalds 452ab8a5e84SHans Schillstrom void (*unregister_app)(struct net *net, struct ip_vs_app *inc); 4531da177e4SLinus Torvalds 4541da177e4SLinus Torvalds int (*app_conn_bind)(struct ip_vs_conn *cp); 4551da177e4SLinus Torvalds 4560d79641aSJulian Anastasov void (*debug_packet)(int af, struct ip_vs_protocol *pp, 4571da177e4SLinus Torvalds const struct sk_buff *skb, 4581da177e4SLinus Torvalds int offset, 4591da177e4SLinus Torvalds const char *msg); 4601da177e4SLinus Torvalds 4619330419dSHans Schillstrom void (*timeout_change)(struct ip_vs_proto_data *pd, int flags); 4621da177e4SLinus Torvalds }; 4631da177e4SLinus Torvalds 464252c6410SHans Schillstrom /* 465252c6410SHans Schillstrom * protocol data per netns 466252c6410SHans Schillstrom */ 467252c6410SHans Schillstrom struct ip_vs_proto_data { 468252c6410SHans Schillstrom struct ip_vs_proto_data *next; 469252c6410SHans Schillstrom struct ip_vs_protocol *pp; 470252c6410SHans Schillstrom int *timeout_table; /* protocol timeout table */ 471252c6410SHans Schillstrom atomic_t appcnt; /* counter of proto app incs. */ 472252c6410SHans Schillstrom struct tcp_states_t *tcp_state_table; 473252c6410SHans Schillstrom }; 474252c6410SHans Schillstrom 4751da177e4SLinus Torvalds extern struct ip_vs_protocol *ip_vs_proto_get(unsigned short proto); 476252c6410SHans Schillstrom extern struct ip_vs_proto_data *ip_vs_proto_data_get(struct net *net, 477252c6410SHans Schillstrom unsigned short proto); 4781da177e4SLinus Torvalds 479f11017ecSSimon Horman struct ip_vs_conn_param { 4806e67e586SHans Schillstrom struct net *net; 481f11017ecSSimon Horman const union nf_inet_addr *caddr; 482f11017ecSSimon Horman const union nf_inet_addr *vaddr; 483f11017ecSSimon Horman __be16 cport; 484f11017ecSSimon Horman __be16 vport; 485f11017ecSSimon Horman __u16 protocol; 486f11017ecSSimon Horman u16 af; 48785999283SSimon Horman 48885999283SSimon Horman const struct ip_vs_pe *pe; 48985999283SSimon Horman char *pe_data; 49085999283SSimon Horman __u8 pe_data_len; 491f11017ecSSimon Horman }; 492f11017ecSSimon Horman 4931da177e4SLinus Torvalds /* 4941da177e4SLinus Torvalds * IP_VS structure allocated for each dynamically scheduled connection 4951da177e4SLinus Torvalds */ 4961da177e4SLinus Torvalds struct ip_vs_conn { 497731109e7SChangli Gao struct hlist_node c_list; /* hashed list heads */ 4986e67e586SHans Schillstrom #ifdef CONFIG_NET_NS 4996e67e586SHans Schillstrom struct net *net; /* Name space */ 5006e67e586SHans Schillstrom #endif 5011da177e4SLinus Torvalds /* Protocol, addresses and port numbers */ 502e7ade46aSJulius Volz u16 af; /* address family */ 5036e67e586SHans Schillstrom __be16 cport; 5046e67e586SHans Schillstrom __be16 vport; 5056e67e586SHans Schillstrom __be16 dport; 5066e67e586SHans Schillstrom __u32 fwmark; /* Fire wall mark from skb */ 507e7ade46aSJulius Volz union nf_inet_addr caddr; /* client address */ 508e7ade46aSJulius Volz union nf_inet_addr vaddr; /* virtual address */ 509e7ade46aSJulius Volz union nf_inet_addr daddr; /* destination address */ 5103575792eSJulian Anastasov volatile __u32 flags; /* status flags */ 5111da177e4SLinus Torvalds __u16 protocol; /* Which protocol (TCP/UDP) */ 5121da177e4SLinus Torvalds 5131da177e4SLinus Torvalds /* counter and timer */ 5141da177e4SLinus Torvalds atomic_t refcnt; /* reference count */ 5151da177e4SLinus Torvalds struct timer_list timer; /* Expiration timer */ 5161da177e4SLinus Torvalds volatile unsigned long timeout; /* timeout */ 5171da177e4SLinus Torvalds 5181da177e4SLinus Torvalds /* Flags and state transition */ 5191da177e4SLinus Torvalds spinlock_t lock; /* lock for state transition */ 5201da177e4SLinus Torvalds volatile __u16 state; /* state info */ 521efac5276SRumen G. Bogdanovski volatile __u16 old_state; /* old state, to be used for 522efac5276SRumen G. Bogdanovski * state transition triggerd 523efac5276SRumen G. Bogdanovski * synchronization 524efac5276SRumen G. Bogdanovski */ 5251da177e4SLinus Torvalds 5261da177e4SLinus Torvalds /* Control members */ 5271da177e4SLinus Torvalds struct ip_vs_conn *control; /* Master control connection */ 5281da177e4SLinus Torvalds atomic_t n_control; /* Number of controlled ones */ 5291da177e4SLinus Torvalds struct ip_vs_dest *dest; /* real server */ 5301da177e4SLinus Torvalds atomic_t in_pkts; /* incoming packet counter */ 5311da177e4SLinus Torvalds 5321da177e4SLinus Torvalds /* packet transmitter for different forwarding methods. If it 5331da177e4SLinus Torvalds mangles the packet, it must return NF_DROP or better NF_STOLEN, 5341da177e4SLinus Torvalds otherwise this must be changed to a sk_buff **. 535fc604767SJulian Anastasov NF_ACCEPT can be returned when destination is local. 5361da177e4SLinus Torvalds */ 5371da177e4SLinus Torvalds int (*packet_xmit)(struct sk_buff *skb, struct ip_vs_conn *cp, 5381da177e4SLinus Torvalds struct ip_vs_protocol *pp); 5391da177e4SLinus Torvalds 5401da177e4SLinus Torvalds /* Note: we can group the following members into a structure, 5411da177e4SLinus Torvalds in order to save more space, and the following members are 5421da177e4SLinus Torvalds only used in VS/NAT anyway */ 5431da177e4SLinus Torvalds struct ip_vs_app *app; /* bound ip_vs_app object */ 5441da177e4SLinus Torvalds void *app_data; /* Application private data */ 5451da177e4SLinus Torvalds struct ip_vs_seq in_seq; /* incoming seq. struct */ 5461da177e4SLinus Torvalds struct ip_vs_seq out_seq; /* outgoing seq. struct */ 54785999283SSimon Horman 548e9e5eee8SSimon Horman const struct ip_vs_pe *pe; 54985999283SSimon Horman char *pe_data; 55085999283SSimon Horman __u8 pe_data_len; 5511da177e4SLinus Torvalds }; 5521da177e4SLinus Torvalds 5536e67e586SHans Schillstrom /* 5546e67e586SHans Schillstrom * To save some memory in conn table when name space is disabled. 5556e67e586SHans Schillstrom */ 5566e67e586SHans Schillstrom static inline struct net *ip_vs_conn_net(const struct ip_vs_conn *cp) 5576e67e586SHans Schillstrom { 5586e67e586SHans Schillstrom #ifdef CONFIG_NET_NS 5596e67e586SHans Schillstrom return cp->net; 5606e67e586SHans Schillstrom #else 5616e67e586SHans Schillstrom return &init_net; 5626e67e586SHans Schillstrom #endif 5636e67e586SHans Schillstrom } 5646e67e586SHans Schillstrom static inline void ip_vs_conn_net_set(struct ip_vs_conn *cp, struct net *net) 5656e67e586SHans Schillstrom { 5666e67e586SHans Schillstrom #ifdef CONFIG_NET_NS 5676e67e586SHans Schillstrom cp->net = net; 5686e67e586SHans Schillstrom #endif 5696e67e586SHans Schillstrom } 5706e67e586SHans Schillstrom 5716e67e586SHans Schillstrom static inline int ip_vs_conn_net_eq(const struct ip_vs_conn *cp, 5726e67e586SHans Schillstrom struct net *net) 5736e67e586SHans Schillstrom { 5746e67e586SHans Schillstrom #ifdef CONFIG_NET_NS 5756e67e586SHans Schillstrom return cp->net == net; 5766e67e586SHans Schillstrom #else 5776e67e586SHans Schillstrom return 1; 5786e67e586SHans Schillstrom #endif 5796e67e586SHans Schillstrom } 5801da177e4SLinus Torvalds 5811da177e4SLinus Torvalds /* 582c860c6b1SJulius Volz * Extended internal versions of struct ip_vs_service_user and 583c860c6b1SJulius Volz * ip_vs_dest_user for IPv6 support. 584c860c6b1SJulius Volz * 585c860c6b1SJulius Volz * We need these to conveniently pass around service and destination 586c860c6b1SJulius Volz * options, but unfortunately, we also need to keep the old definitions to 587c860c6b1SJulius Volz * maintain userspace backwards compatibility for the setsockopt interface. 588c860c6b1SJulius Volz */ 589c860c6b1SJulius Volz struct ip_vs_service_user_kern { 590c860c6b1SJulius Volz /* virtual service addresses */ 591c860c6b1SJulius Volz u16 af; 592c860c6b1SJulius Volz u16 protocol; 593c860c6b1SJulius Volz union nf_inet_addr addr; /* virtual ip address */ 594c860c6b1SJulius Volz u16 port; 595c860c6b1SJulius Volz u32 fwmark; /* firwall mark of service */ 596c860c6b1SJulius Volz 597c860c6b1SJulius Volz /* virtual service options */ 598c860c6b1SJulius Volz char *sched_name; 5990d1e71b0SSimon Horman char *pe_name; 600c860c6b1SJulius Volz unsigned flags; /* virtual service flags */ 601c860c6b1SJulius Volz unsigned timeout; /* persistent timeout in sec */ 602c860c6b1SJulius Volz u32 netmask; /* persistent netmask */ 603c860c6b1SJulius Volz }; 604c860c6b1SJulius Volz 605c860c6b1SJulius Volz 606c860c6b1SJulius Volz struct ip_vs_dest_user_kern { 607c860c6b1SJulius Volz /* destination server address */ 608c860c6b1SJulius Volz union nf_inet_addr addr; 609c860c6b1SJulius Volz u16 port; 610c860c6b1SJulius Volz 611c860c6b1SJulius Volz /* real server options */ 612c860c6b1SJulius Volz unsigned conn_flags; /* connection flags */ 613c860c6b1SJulius Volz int weight; /* destination weight */ 614c860c6b1SJulius Volz 615c860c6b1SJulius Volz /* thresholds for active connections */ 616c860c6b1SJulius Volz u32 u_threshold; /* upper threshold */ 617c860c6b1SJulius Volz u32 l_threshold; /* lower threshold */ 618c860c6b1SJulius Volz }; 619c860c6b1SJulius Volz 620c860c6b1SJulius Volz 621c860c6b1SJulius Volz /* 6221da177e4SLinus Torvalds * The information about the virtual service offered to the net 6231da177e4SLinus Torvalds * and the forwarding entries 6241da177e4SLinus Torvalds */ 6251da177e4SLinus Torvalds struct ip_vs_service { 6261da177e4SLinus Torvalds struct list_head s_list; /* for normal service table */ 6271da177e4SLinus Torvalds struct list_head f_list; /* for fwmark-based service table */ 6281da177e4SLinus Torvalds atomic_t refcnt; /* reference counter */ 6291da177e4SLinus Torvalds atomic_t usecnt; /* use counter */ 6301da177e4SLinus Torvalds 631e7ade46aSJulius Volz u16 af; /* address family */ 6321da177e4SLinus Torvalds __u16 protocol; /* which protocol (TCP/UDP) */ 633e7ade46aSJulius Volz union nf_inet_addr addr; /* IP address for virtual service */ 634014d730dSAl Viro __be16 port; /* port number for the service */ 6351da177e4SLinus Torvalds __u32 fwmark; /* firewall mark of the service */ 6361da177e4SLinus Torvalds unsigned flags; /* service status flags */ 6371da177e4SLinus Torvalds unsigned timeout; /* persistent timeout in ticks */ 638014d730dSAl Viro __be32 netmask; /* grouping granularity */ 639fc723250SHans Schillstrom struct net *net; 6401da177e4SLinus Torvalds 6411da177e4SLinus Torvalds struct list_head destinations; /* real server d-linked list */ 6421da177e4SLinus Torvalds __u32 num_dests; /* number of servers */ 6431da177e4SLinus Torvalds struct ip_vs_stats stats; /* statistics for the service */ 6441da177e4SLinus Torvalds struct ip_vs_app *inc; /* bind conns to this app inc */ 6451da177e4SLinus Torvalds 6461da177e4SLinus Torvalds /* for scheduling */ 6471da177e4SLinus Torvalds struct ip_vs_scheduler *scheduler; /* bound scheduler object */ 6481da177e4SLinus Torvalds rwlock_t sched_lock; /* lock sched_data */ 6491da177e4SLinus Torvalds void *sched_data; /* scheduler application data */ 65085999283SSimon Horman 65185999283SSimon Horman /* alternate persistence engine */ 65285999283SSimon Horman struct ip_vs_pe *pe; 6531da177e4SLinus Torvalds }; 6541da177e4SLinus Torvalds 6551da177e4SLinus Torvalds 6561da177e4SLinus Torvalds /* 6571da177e4SLinus Torvalds * The real server destination forwarding entry 6581da177e4SLinus Torvalds * with ip address, port number, and so on. 6591da177e4SLinus Torvalds */ 6601da177e4SLinus Torvalds struct ip_vs_dest { 6611da177e4SLinus Torvalds struct list_head n_list; /* for the dests in the service */ 6621da177e4SLinus Torvalds struct list_head d_list; /* for table with all the dests */ 6631da177e4SLinus Torvalds 664e7ade46aSJulius Volz u16 af; /* address family */ 665014d730dSAl Viro __be16 port; /* port number of the server */ 666f2431e6eSHans Schillstrom union nf_inet_addr addr; /* IP address of the server */ 6671da177e4SLinus Torvalds volatile unsigned flags; /* dest status flags */ 6681da177e4SLinus Torvalds atomic_t conn_flags; /* flags to copy to conn */ 6691da177e4SLinus Torvalds atomic_t weight; /* server weight */ 6701da177e4SLinus Torvalds 6711da177e4SLinus Torvalds atomic_t refcnt; /* reference counter */ 6721da177e4SLinus Torvalds struct ip_vs_stats stats; /* statistics */ 6731da177e4SLinus Torvalds 6741da177e4SLinus Torvalds /* connection counters and thresholds */ 6751da177e4SLinus Torvalds atomic_t activeconns; /* active connections */ 6761da177e4SLinus Torvalds atomic_t inactconns; /* inactive connections */ 6771da177e4SLinus Torvalds atomic_t persistconns; /* persistent connections */ 6781da177e4SLinus Torvalds __u32 u_threshold; /* upper threshold */ 6791da177e4SLinus Torvalds __u32 l_threshold; /* lower threshold */ 6801da177e4SLinus Torvalds 6811da177e4SLinus Torvalds /* for destination cache */ 6821da177e4SLinus Torvalds spinlock_t dst_lock; /* lock of dst_cache */ 6831da177e4SLinus Torvalds struct dst_entry *dst_cache; /* destination cache entry */ 6841da177e4SLinus Torvalds u32 dst_rtos; /* RT_TOS(tos) for dst */ 685714f095fSHans Schillstrom u32 dst_cookie; 686714f095fSHans Schillstrom #ifdef CONFIG_IP_VS_IPV6 687714f095fSHans Schillstrom struct in6_addr dst_saddr; 688714f095fSHans Schillstrom #endif 6891da177e4SLinus Torvalds 6901da177e4SLinus Torvalds /* for virtual service */ 6911da177e4SLinus Torvalds struct ip_vs_service *svc; /* service it belongs to */ 6921da177e4SLinus Torvalds __u16 protocol; /* which protocol (TCP/UDP) */ 693014d730dSAl Viro __be16 vport; /* virtual port number */ 694f2431e6eSHans Schillstrom union nf_inet_addr vaddr; /* virtual IP address */ 6951da177e4SLinus Torvalds __u32 vfwmark; /* firewall mark of service */ 6961da177e4SLinus Torvalds }; 6971da177e4SLinus Torvalds 6981da177e4SLinus Torvalds 6991da177e4SLinus Torvalds /* 7001da177e4SLinus Torvalds * The scheduler object 7011da177e4SLinus Torvalds */ 7021da177e4SLinus Torvalds struct ip_vs_scheduler { 7031da177e4SLinus Torvalds struct list_head n_list; /* d-linked list head */ 7041da177e4SLinus Torvalds char *name; /* scheduler name */ 7051da177e4SLinus Torvalds atomic_t refcnt; /* reference counter */ 7061da177e4SLinus Torvalds struct module *module; /* THIS_MODULE/NULL */ 7071da177e4SLinus Torvalds 7081da177e4SLinus Torvalds /* scheduler initializing service */ 7091da177e4SLinus Torvalds int (*init_service)(struct ip_vs_service *svc); 7101da177e4SLinus Torvalds /* scheduling service finish */ 7111da177e4SLinus Torvalds int (*done_service)(struct ip_vs_service *svc); 7121da177e4SLinus Torvalds /* scheduler updating service */ 7131da177e4SLinus Torvalds int (*update_service)(struct ip_vs_service *svc); 7141da177e4SLinus Torvalds 7151da177e4SLinus Torvalds /* selecting a server from the given service */ 7161da177e4SLinus Torvalds struct ip_vs_dest* (*schedule)(struct ip_vs_service *svc, 7171da177e4SLinus Torvalds const struct sk_buff *skb); 7181da177e4SLinus Torvalds }; 7191da177e4SLinus Torvalds 72085999283SSimon Horman /* The persistence engine object */ 72185999283SSimon Horman struct ip_vs_pe { 72285999283SSimon Horman struct list_head n_list; /* d-linked list head */ 72385999283SSimon Horman char *name; /* scheduler name */ 72485999283SSimon Horman atomic_t refcnt; /* reference counter */ 72585999283SSimon Horman struct module *module; /* THIS_MODULE/NULL */ 72685999283SSimon Horman 72785999283SSimon Horman /* get the connection template, if any */ 72885999283SSimon Horman int (*fill_param)(struct ip_vs_conn_param *p, struct sk_buff *skb); 72985999283SSimon Horman bool (*ct_match)(const struct ip_vs_conn_param *p, 73085999283SSimon Horman struct ip_vs_conn *ct); 73185999283SSimon Horman u32 (*hashkey_raw)(const struct ip_vs_conn_param *p, u32 initval, 73285999283SSimon Horman bool inverse); 733a3c918acSSimon Horman int (*show_pe_data)(const struct ip_vs_conn *cp, char *buf); 73485999283SSimon Horman }; 7351da177e4SLinus Torvalds 7361da177e4SLinus Torvalds /* 7371da177e4SLinus Torvalds * The application module object (a.k.a. app incarnation) 7381da177e4SLinus Torvalds */ 739fd2c3ef7SEric Dumazet struct ip_vs_app { 7401da177e4SLinus Torvalds struct list_head a_list; /* member in app list */ 7411da177e4SLinus Torvalds int type; /* IP_VS_APP_TYPE_xxx */ 7421da177e4SLinus Torvalds char *name; /* application module name */ 7431da177e4SLinus Torvalds __u16 protocol; 7441da177e4SLinus Torvalds struct module *module; /* THIS_MODULE/NULL */ 7451da177e4SLinus Torvalds struct list_head incs_list; /* list of incarnations */ 7461da177e4SLinus Torvalds 7471da177e4SLinus Torvalds /* members for application incarnations */ 7481da177e4SLinus Torvalds struct list_head p_list; /* member in proto app list */ 7491da177e4SLinus Torvalds struct ip_vs_app *app; /* its real application */ 750014d730dSAl Viro __be16 port; /* port number in net order */ 7511da177e4SLinus Torvalds atomic_t usecnt; /* usage counter */ 7521da177e4SLinus Torvalds 7538b27b10fSJulian Anastasov /* 7548b27b10fSJulian Anastasov * output hook: Process packet in inout direction, diff set for TCP. 7558b27b10fSJulian Anastasov * Return: 0=Error, 1=Payload Not Mangled/Mangled but checksum is ok, 7568b27b10fSJulian Anastasov * 2=Mangled but checksum was not updated 7578b27b10fSJulian Anastasov */ 7581da177e4SLinus Torvalds int (*pkt_out)(struct ip_vs_app *, struct ip_vs_conn *, 7593db05feaSHerbert Xu struct sk_buff *, int *diff); 7601da177e4SLinus Torvalds 7618b27b10fSJulian Anastasov /* 7628b27b10fSJulian Anastasov * input hook: Process packet in outin direction, diff set for TCP. 7638b27b10fSJulian Anastasov * Return: 0=Error, 1=Payload Not Mangled/Mangled but checksum is ok, 7648b27b10fSJulian Anastasov * 2=Mangled but checksum was not updated 7658b27b10fSJulian Anastasov */ 7661da177e4SLinus Torvalds int (*pkt_in)(struct ip_vs_app *, struct ip_vs_conn *, 7673db05feaSHerbert Xu struct sk_buff *, int *diff); 7681da177e4SLinus Torvalds 7691da177e4SLinus Torvalds /* ip_vs_app initializer */ 7701da177e4SLinus Torvalds int (*init_conn)(struct ip_vs_app *, struct ip_vs_conn *); 7711da177e4SLinus Torvalds 7721da177e4SLinus Torvalds /* ip_vs_app finish */ 7731da177e4SLinus Torvalds int (*done_conn)(struct ip_vs_app *, struct ip_vs_conn *); 7741da177e4SLinus Torvalds 7751da177e4SLinus Torvalds 7761da177e4SLinus Torvalds /* not used now */ 7771da177e4SLinus Torvalds int (*bind_conn)(struct ip_vs_app *, struct ip_vs_conn *, 7781da177e4SLinus Torvalds struct ip_vs_protocol *); 7791da177e4SLinus Torvalds 7801da177e4SLinus Torvalds void (*unbind_conn)(struct ip_vs_app *, struct ip_vs_conn *); 7811da177e4SLinus Torvalds 7821da177e4SLinus Torvalds int * timeout_table; 7831da177e4SLinus Torvalds int * timeouts; 7841da177e4SLinus Torvalds int timeouts_size; 7851da177e4SLinus Torvalds 7861da177e4SLinus Torvalds int (*conn_schedule)(struct sk_buff *skb, struct ip_vs_app *app, 7871da177e4SLinus Torvalds int *verdict, struct ip_vs_conn **cpp); 7881da177e4SLinus Torvalds 7891da177e4SLinus Torvalds struct ip_vs_conn * 7901da177e4SLinus Torvalds (*conn_in_get)(const struct sk_buff *skb, struct ip_vs_app *app, 7911da177e4SLinus Torvalds const struct iphdr *iph, unsigned int proto_off, 7921da177e4SLinus Torvalds int inverse); 7931da177e4SLinus Torvalds 7941da177e4SLinus Torvalds struct ip_vs_conn * 7951da177e4SLinus Torvalds (*conn_out_get)(const struct sk_buff *skb, struct ip_vs_app *app, 7961da177e4SLinus Torvalds const struct iphdr *iph, unsigned int proto_off, 7971da177e4SLinus Torvalds int inverse); 7981da177e4SLinus Torvalds 7991da177e4SLinus Torvalds int (*state_transition)(struct ip_vs_conn *cp, int direction, 8001da177e4SLinus Torvalds const struct sk_buff *skb, 8011da177e4SLinus Torvalds struct ip_vs_app *app); 8021da177e4SLinus Torvalds 8031da177e4SLinus Torvalds void (*timeout_change)(struct ip_vs_app *app, int flags); 8041da177e4SLinus Torvalds }; 8051da177e4SLinus Torvalds 8062553d064SJulian Anastasov /* IPVS in network namespace */ 8072553d064SJulian Anastasov struct netns_ipvs { 8082553d064SJulian Anastasov int gen; /* Generation */ 8092553d064SJulian Anastasov /* 8102553d064SJulian Anastasov * Hash table: for real service lookups 8112553d064SJulian Anastasov */ 8122553d064SJulian Anastasov #define IP_VS_RTAB_BITS 4 8132553d064SJulian Anastasov #define IP_VS_RTAB_SIZE (1 << IP_VS_RTAB_BITS) 8142553d064SJulian Anastasov #define IP_VS_RTAB_MASK (IP_VS_RTAB_SIZE - 1) 8152553d064SJulian Anastasov 8162553d064SJulian Anastasov struct list_head rs_table[IP_VS_RTAB_SIZE]; 8172553d064SJulian Anastasov /* ip_vs_app */ 8182553d064SJulian Anastasov struct list_head app_list; 8192553d064SJulian Anastasov struct mutex app_mutex; 8202553d064SJulian Anastasov struct lock_class_key app_key; /* mutex debuging */ 8212553d064SJulian Anastasov 8222553d064SJulian Anastasov /* ip_vs_proto */ 8232553d064SJulian Anastasov #define IP_VS_PROTO_TAB_SIZE 32 /* must be power of 2 */ 8242553d064SJulian Anastasov struct ip_vs_proto_data *proto_data_table[IP_VS_PROTO_TAB_SIZE]; 8252553d064SJulian Anastasov /* ip_vs_proto_tcp */ 8262553d064SJulian Anastasov #ifdef CONFIG_IP_VS_PROTO_TCP 8272553d064SJulian Anastasov #define TCP_APP_TAB_BITS 4 8282553d064SJulian Anastasov #define TCP_APP_TAB_SIZE (1 << TCP_APP_TAB_BITS) 8292553d064SJulian Anastasov #define TCP_APP_TAB_MASK (TCP_APP_TAB_SIZE - 1) 8302553d064SJulian Anastasov struct list_head tcp_apps[TCP_APP_TAB_SIZE]; 8312553d064SJulian Anastasov spinlock_t tcp_app_lock; 8322553d064SJulian Anastasov #endif 8332553d064SJulian Anastasov /* ip_vs_proto_udp */ 8342553d064SJulian Anastasov #ifdef CONFIG_IP_VS_PROTO_UDP 8352553d064SJulian Anastasov #define UDP_APP_TAB_BITS 4 8362553d064SJulian Anastasov #define UDP_APP_TAB_SIZE (1 << UDP_APP_TAB_BITS) 8372553d064SJulian Anastasov #define UDP_APP_TAB_MASK (UDP_APP_TAB_SIZE - 1) 8382553d064SJulian Anastasov struct list_head udp_apps[UDP_APP_TAB_SIZE]; 8392553d064SJulian Anastasov spinlock_t udp_app_lock; 8402553d064SJulian Anastasov #endif 8412553d064SJulian Anastasov /* ip_vs_proto_sctp */ 8422553d064SJulian Anastasov #ifdef CONFIG_IP_VS_PROTO_SCTP 8432553d064SJulian Anastasov #define SCTP_APP_TAB_BITS 4 8442553d064SJulian Anastasov #define SCTP_APP_TAB_SIZE (1 << SCTP_APP_TAB_BITS) 8452553d064SJulian Anastasov #define SCTP_APP_TAB_MASK (SCTP_APP_TAB_SIZE - 1) 8462553d064SJulian Anastasov /* Hash table for SCTP application incarnations */ 8472553d064SJulian Anastasov struct list_head sctp_apps[SCTP_APP_TAB_SIZE]; 8482553d064SJulian Anastasov spinlock_t sctp_app_lock; 8492553d064SJulian Anastasov #endif 8502553d064SJulian Anastasov /* ip_vs_conn */ 8512553d064SJulian Anastasov atomic_t conn_count; /* connection counter */ 8522553d064SJulian Anastasov 8532553d064SJulian Anastasov /* ip_vs_ctl */ 854*2a0751afSJulian Anastasov struct ip_vs_stats tot_stats; /* Statistics & est. */ 8552553d064SJulian Anastasov seqcount_t *ustats_seq; /* u64 read retry */ 8562553d064SJulian Anastasov 8572553d064SJulian Anastasov int num_services; /* no of virtual services */ 8582553d064SJulian Anastasov /* 1/rate drop and drop-entry variables */ 8592553d064SJulian Anastasov struct delayed_work defense_work; /* Work handler */ 8602553d064SJulian Anastasov int drop_rate; 8612553d064SJulian Anastasov int drop_counter; 8622553d064SJulian Anastasov atomic_t dropentry; 8632553d064SJulian Anastasov /* locks in ctl.c */ 8642553d064SJulian Anastasov spinlock_t dropentry_lock; /* drop entry handling */ 8652553d064SJulian Anastasov spinlock_t droppacket_lock; /* drop packet handling */ 8662553d064SJulian Anastasov spinlock_t securetcp_lock; /* state and timeout tables */ 8672553d064SJulian Anastasov rwlock_t rs_lock; /* real services table */ 8682553d064SJulian Anastasov /* semaphore for IPVS sockopts. And, [gs]etsockopt may sleep. */ 8692553d064SJulian Anastasov struct lock_class_key ctl_key; /* ctl_mutex debuging */ 8702553d064SJulian Anastasov /* Trash for destinations */ 8712553d064SJulian Anastasov struct list_head dest_trash; 8722553d064SJulian Anastasov /* Service counters */ 8732553d064SJulian Anastasov atomic_t ftpsvc_counter; 8742553d064SJulian Anastasov atomic_t nullsvc_counter; 8752553d064SJulian Anastasov 8762553d064SJulian Anastasov /* sys-ctl struct */ 8772553d064SJulian Anastasov struct ctl_table_header *sysctl_hdr; 8782553d064SJulian Anastasov struct ctl_table *sysctl_tbl; 8792553d064SJulian Anastasov /* sysctl variables */ 8802553d064SJulian Anastasov int sysctl_amemthresh; 8812553d064SJulian Anastasov int sysctl_am_droprate; 8822553d064SJulian Anastasov int sysctl_drop_entry; 8832553d064SJulian Anastasov int sysctl_drop_packet; 8842553d064SJulian Anastasov int sysctl_secure_tcp; 8852553d064SJulian Anastasov #ifdef CONFIG_IP_VS_NFCT 8862553d064SJulian Anastasov int sysctl_conntrack; 8872553d064SJulian Anastasov #endif 8882553d064SJulian Anastasov int sysctl_snat_reroute; 8892553d064SJulian Anastasov int sysctl_sync_ver; 8902553d064SJulian Anastasov int sysctl_cache_bypass; 8912553d064SJulian Anastasov int sysctl_expire_nodest_conn; 8922553d064SJulian Anastasov int sysctl_expire_quiescent_template; 8932553d064SJulian Anastasov int sysctl_sync_threshold[2]; 8942553d064SJulian Anastasov int sysctl_nat_icmp_send; 8952553d064SJulian Anastasov 8962553d064SJulian Anastasov /* ip_vs_lblc */ 8972553d064SJulian Anastasov int sysctl_lblc_expiration; 8982553d064SJulian Anastasov struct ctl_table_header *lblc_ctl_header; 8992553d064SJulian Anastasov struct ctl_table *lblc_ctl_table; 9002553d064SJulian Anastasov /* ip_vs_lblcr */ 9012553d064SJulian Anastasov int sysctl_lblcr_expiration; 9022553d064SJulian Anastasov struct ctl_table_header *lblcr_ctl_header; 9032553d064SJulian Anastasov struct ctl_table *lblcr_ctl_table; 9042553d064SJulian Anastasov /* ip_vs_est */ 9052553d064SJulian Anastasov struct list_head est_list; /* estimator list */ 9062553d064SJulian Anastasov spinlock_t est_lock; 9072553d064SJulian Anastasov struct timer_list est_timer; /* Estimation timer */ 9082553d064SJulian Anastasov /* ip_vs_sync */ 9092553d064SJulian Anastasov struct list_head sync_queue; 9102553d064SJulian Anastasov spinlock_t sync_lock; 9112553d064SJulian Anastasov struct ip_vs_sync_buff *sync_buff; 9122553d064SJulian Anastasov spinlock_t sync_buff_lock; 9132553d064SJulian Anastasov struct sockaddr_in sync_mcast_addr; 9142553d064SJulian Anastasov struct task_struct *master_thread; 9152553d064SJulian Anastasov struct task_struct *backup_thread; 9162553d064SJulian Anastasov int send_mesg_maxlen; 9172553d064SJulian Anastasov int recv_mesg_maxlen; 9182553d064SJulian Anastasov volatile int sync_state; 9192553d064SJulian Anastasov volatile int master_syncid; 9202553d064SJulian Anastasov volatile int backup_syncid; 9212553d064SJulian Anastasov /* multicast interface name */ 9222553d064SJulian Anastasov char master_mcast_ifn[IP_VS_IFNAME_MAXLEN]; 9232553d064SJulian Anastasov char backup_mcast_ifn[IP_VS_IFNAME_MAXLEN]; 9242553d064SJulian Anastasov /* net name space ptr */ 9252553d064SJulian Anastasov struct net *net; /* Needed by timer routines */ 9262553d064SJulian Anastasov }; 9271da177e4SLinus Torvalds 9281da177e4SLinus Torvalds /* 9291da177e4SLinus Torvalds * IPVS core functions 9301da177e4SLinus Torvalds * (from ip_vs_core.c) 9311da177e4SLinus Torvalds */ 9321da177e4SLinus Torvalds extern const char *ip_vs_proto_name(unsigned proto); 9331da177e4SLinus Torvalds extern void ip_vs_init_hash_table(struct list_head *table, int rows); 934afdd6140SSven Wegener #define IP_VS_INIT_HASH_TABLE(t) ip_vs_init_hash_table((t), ARRAY_SIZE((t))) 9351da177e4SLinus Torvalds 9361da177e4SLinus Torvalds #define IP_VS_APP_TYPE_FTP 1 9371da177e4SLinus Torvalds 9381da177e4SLinus Torvalds /* 9391da177e4SLinus Torvalds * ip_vs_conn handling functions 9401da177e4SLinus Torvalds * (from ip_vs_conn.c) 9411da177e4SLinus Torvalds */ 9421da177e4SLinus Torvalds 9431da177e4SLinus Torvalds enum { 9441da177e4SLinus Torvalds IP_VS_DIR_INPUT = 0, 9451da177e4SLinus Torvalds IP_VS_DIR_OUTPUT, 9461da177e4SLinus Torvalds IP_VS_DIR_INPUT_ONLY, 9471da177e4SLinus Torvalds IP_VS_DIR_LAST, 9481da177e4SLinus Torvalds }; 9491da177e4SLinus Torvalds 9506e67e586SHans Schillstrom static inline void ip_vs_conn_fill_param(struct net *net, int af, int protocol, 951f11017ecSSimon Horman const union nf_inet_addr *caddr, 952f11017ecSSimon Horman __be16 cport, 953f11017ecSSimon Horman const union nf_inet_addr *vaddr, 954f11017ecSSimon Horman __be16 vport, 955f11017ecSSimon Horman struct ip_vs_conn_param *p) 956f11017ecSSimon Horman { 9576e67e586SHans Schillstrom p->net = net; 958f11017ecSSimon Horman p->af = af; 959f11017ecSSimon Horman p->protocol = protocol; 960f11017ecSSimon Horman p->caddr = caddr; 961f11017ecSSimon Horman p->cport = cport; 962f11017ecSSimon Horman p->vaddr = vaddr; 963f11017ecSSimon Horman p->vport = vport; 96485999283SSimon Horman p->pe = NULL; 96585999283SSimon Horman p->pe_data = NULL; 966f11017ecSSimon Horman } 96728364a59SJulius Volz 968f11017ecSSimon Horman struct ip_vs_conn *ip_vs_conn_in_get(const struct ip_vs_conn_param *p); 969f11017ecSSimon Horman struct ip_vs_conn *ip_vs_ct_in_get(const struct ip_vs_conn_param *p); 97028364a59SJulius Volz 9715c0d2374SSimon Horman struct ip_vs_conn * ip_vs_conn_in_get_proto(int af, const struct sk_buff *skb, 9725c0d2374SSimon Horman const struct ip_vs_iphdr *iph, 9735c0d2374SSimon Horman unsigned int proto_off, 9745c0d2374SSimon Horman int inverse); 9755c0d2374SSimon Horman 976f11017ecSSimon Horman struct ip_vs_conn *ip_vs_conn_out_get(const struct ip_vs_conn_param *p); 9771da177e4SLinus Torvalds 9785c0d2374SSimon Horman struct ip_vs_conn * ip_vs_conn_out_get_proto(int af, const struct sk_buff *skb, 9795c0d2374SSimon Horman const struct ip_vs_iphdr *iph, 9805c0d2374SSimon Horman unsigned int proto_off, 9815c0d2374SSimon Horman int inverse); 9825c0d2374SSimon Horman 9831da177e4SLinus Torvalds /* put back the conn without restarting its timer */ 9841da177e4SLinus Torvalds static inline void __ip_vs_conn_put(struct ip_vs_conn *cp) 9851da177e4SLinus Torvalds { 9861da177e4SLinus Torvalds atomic_dec(&cp->refcnt); 9871da177e4SLinus Torvalds } 9881da177e4SLinus Torvalds extern void ip_vs_conn_put(struct ip_vs_conn *cp); 989014d730dSAl Viro extern void ip_vs_conn_fill_cport(struct ip_vs_conn *cp, __be16 cport); 9901da177e4SLinus Torvalds 991f11017ecSSimon Horman struct ip_vs_conn *ip_vs_conn_new(const struct ip_vs_conn_param *p, 992f11017ecSSimon Horman const union nf_inet_addr *daddr, 993f11017ecSSimon Horman __be16 dport, unsigned flags, 9940e051e68SHans Schillstrom struct ip_vs_dest *dest, __u32 fwmark); 9951da177e4SLinus Torvalds extern void ip_vs_conn_expire_now(struct ip_vs_conn *cp); 9961da177e4SLinus Torvalds 9971da177e4SLinus Torvalds extern const char * ip_vs_state_name(__u16 proto, int state); 9981da177e4SLinus Torvalds 9994a85b96cSHans Schillstrom extern void ip_vs_tcp_conn_listen(struct net *net, struct ip_vs_conn *cp); 10001da177e4SLinus Torvalds extern int ip_vs_check_template(struct ip_vs_conn *ct); 1001f6340ee0SHans Schillstrom extern void ip_vs_random_dropentry(struct net *net); 10021da177e4SLinus Torvalds extern int ip_vs_conn_init(void); 10031da177e4SLinus Torvalds extern void ip_vs_conn_cleanup(void); 10041da177e4SLinus Torvalds 10051da177e4SLinus Torvalds static inline void ip_vs_control_del(struct ip_vs_conn *cp) 10061da177e4SLinus Torvalds { 10071da177e4SLinus Torvalds struct ip_vs_conn *ctl_cp = cp->control; 10081da177e4SLinus Torvalds if (!ctl_cp) { 1009cfc78c5aSJulius Volz IP_VS_ERR_BUF("request control DEL for uncontrolled: " 1010cfc78c5aSJulius Volz "%s:%d to %s:%d\n", 1011cfc78c5aSJulius Volz IP_VS_DBG_ADDR(cp->af, &cp->caddr), 1012cfc78c5aSJulius Volz ntohs(cp->cport), 1013cfc78c5aSJulius Volz IP_VS_DBG_ADDR(cp->af, &cp->vaddr), 1014cfc78c5aSJulius Volz ntohs(cp->vport)); 1015cfc78c5aSJulius Volz 10161da177e4SLinus Torvalds return; 10171da177e4SLinus Torvalds } 10181da177e4SLinus Torvalds 1019cfc78c5aSJulius Volz IP_VS_DBG_BUF(7, "DELeting control for: " 1020cfc78c5aSJulius Volz "cp.dst=%s:%d ctl_cp.dst=%s:%d\n", 1021cfc78c5aSJulius Volz IP_VS_DBG_ADDR(cp->af, &cp->caddr), 1022cfc78c5aSJulius Volz ntohs(cp->cport), 1023cfc78c5aSJulius Volz IP_VS_DBG_ADDR(cp->af, &ctl_cp->caddr), 1024cfc78c5aSJulius Volz ntohs(ctl_cp->cport)); 10251da177e4SLinus Torvalds 10261da177e4SLinus Torvalds cp->control = NULL; 10271da177e4SLinus Torvalds if (atomic_read(&ctl_cp->n_control) == 0) { 1028cfc78c5aSJulius Volz IP_VS_ERR_BUF("BUG control DEL with n=0 : " 1029cfc78c5aSJulius Volz "%s:%d to %s:%d\n", 1030cfc78c5aSJulius Volz IP_VS_DBG_ADDR(cp->af, &cp->caddr), 1031cfc78c5aSJulius Volz ntohs(cp->cport), 1032cfc78c5aSJulius Volz IP_VS_DBG_ADDR(cp->af, &cp->vaddr), 1033cfc78c5aSJulius Volz ntohs(cp->vport)); 1034cfc78c5aSJulius Volz 10351da177e4SLinus Torvalds return; 10361da177e4SLinus Torvalds } 10371da177e4SLinus Torvalds atomic_dec(&ctl_cp->n_control); 10381da177e4SLinus Torvalds } 10391da177e4SLinus Torvalds 10401da177e4SLinus Torvalds static inline void 10411da177e4SLinus Torvalds ip_vs_control_add(struct ip_vs_conn *cp, struct ip_vs_conn *ctl_cp) 10421da177e4SLinus Torvalds { 10431da177e4SLinus Torvalds if (cp->control) { 1044cfc78c5aSJulius Volz IP_VS_ERR_BUF("request control ADD for already controlled: " 1045cfc78c5aSJulius Volz "%s:%d to %s:%d\n", 1046cfc78c5aSJulius Volz IP_VS_DBG_ADDR(cp->af, &cp->caddr), 1047cfc78c5aSJulius Volz ntohs(cp->cport), 1048cfc78c5aSJulius Volz IP_VS_DBG_ADDR(cp->af, &cp->vaddr), 1049cfc78c5aSJulius Volz ntohs(cp->vport)); 1050cfc78c5aSJulius Volz 10511da177e4SLinus Torvalds ip_vs_control_del(cp); 10521da177e4SLinus Torvalds } 10531da177e4SLinus Torvalds 1054cfc78c5aSJulius Volz IP_VS_DBG_BUF(7, "ADDing control for: " 1055cfc78c5aSJulius Volz "cp.dst=%s:%d ctl_cp.dst=%s:%d\n", 1056cfc78c5aSJulius Volz IP_VS_DBG_ADDR(cp->af, &cp->caddr), 1057cfc78c5aSJulius Volz ntohs(cp->cport), 1058cfc78c5aSJulius Volz IP_VS_DBG_ADDR(cp->af, &ctl_cp->caddr), 1059cfc78c5aSJulius Volz ntohs(ctl_cp->cport)); 10601da177e4SLinus Torvalds 10611da177e4SLinus Torvalds cp->control = ctl_cp; 10621da177e4SLinus Torvalds atomic_inc(&ctl_cp->n_control); 10631da177e4SLinus Torvalds } 10641da177e4SLinus Torvalds 10651da177e4SLinus Torvalds 10661da177e4SLinus Torvalds /* 10671da177e4SLinus Torvalds * IPVS application functions 10681da177e4SLinus Torvalds * (from ip_vs_app.c) 10691da177e4SLinus Torvalds */ 10701da177e4SLinus Torvalds #define IP_VS_APP_MAX_PORTS 8 1071ab8a5e84SHans Schillstrom extern int register_ip_vs_app(struct net *net, struct ip_vs_app *app); 1072ab8a5e84SHans Schillstrom extern void unregister_ip_vs_app(struct net *net, struct ip_vs_app *app); 10731da177e4SLinus Torvalds extern int ip_vs_bind_app(struct ip_vs_conn *cp, struct ip_vs_protocol *pp); 10741da177e4SLinus Torvalds extern void ip_vs_unbind_app(struct ip_vs_conn *cp); 1075ab8a5e84SHans Schillstrom extern int register_ip_vs_app_inc(struct net *net, struct ip_vs_app *app, 1076ab8a5e84SHans Schillstrom __u16 proto, __u16 port); 10771da177e4SLinus Torvalds extern int ip_vs_app_inc_get(struct ip_vs_app *inc); 10781da177e4SLinus Torvalds extern void ip_vs_app_inc_put(struct ip_vs_app *inc); 10791da177e4SLinus Torvalds 10803db05feaSHerbert Xu extern int ip_vs_app_pkt_out(struct ip_vs_conn *, struct sk_buff *skb); 10813db05feaSHerbert Xu extern int ip_vs_app_pkt_in(struct ip_vs_conn *, struct sk_buff *skb); 10821da177e4SLinus Torvalds extern int ip_vs_app_init(void); 10831da177e4SLinus Torvalds extern void ip_vs_app_cleanup(void); 10841da177e4SLinus Torvalds 10858be67a66SSimon Horman void ip_vs_bind_pe(struct ip_vs_service *svc, struct ip_vs_pe *pe); 10868be67a66SSimon Horman void ip_vs_unbind_pe(struct ip_vs_service *svc); 10878be67a66SSimon Horman int register_ip_vs_pe(struct ip_vs_pe *pe); 10888be67a66SSimon Horman int unregister_ip_vs_pe(struct ip_vs_pe *pe); 1089e9e5eee8SSimon Horman struct ip_vs_pe *ip_vs_pe_getbyname(const char *name); 1090fe5e7a1eSHans Schillstrom struct ip_vs_pe *__ip_vs_pe_getbyname(const char *pe_name); 1091e9e5eee8SSimon Horman 1092e9e5eee8SSimon Horman static inline void ip_vs_pe_get(const struct ip_vs_pe *pe) 1093e9e5eee8SSimon Horman { 1094e9e5eee8SSimon Horman if (pe && pe->module) 1095e9e5eee8SSimon Horman __module_get(pe->module); 1096e9e5eee8SSimon Horman } 1097e9e5eee8SSimon Horman 1098e9e5eee8SSimon Horman static inline void ip_vs_pe_put(const struct ip_vs_pe *pe) 1099e9e5eee8SSimon Horman { 1100e9e5eee8SSimon Horman if (pe && pe->module) 1101e9e5eee8SSimon Horman module_put(pe->module); 1102e9e5eee8SSimon Horman } 11031da177e4SLinus Torvalds 11041da177e4SLinus Torvalds /* 11051da177e4SLinus Torvalds * IPVS protocol functions (from ip_vs_proto.c) 11061da177e4SLinus Torvalds */ 11071da177e4SLinus Torvalds extern int ip_vs_protocol_init(void); 11081da177e4SLinus Torvalds extern void ip_vs_protocol_cleanup(void); 11099330419dSHans Schillstrom extern void ip_vs_protocol_timeout_change(struct netns_ipvs *ipvs, int flags); 11101da177e4SLinus Torvalds extern int *ip_vs_create_timeout_table(int *table, int size); 11111da177e4SLinus Torvalds extern int 111236cbd3dcSJan Engelhardt ip_vs_set_state_timeout(int *table, int num, const char *const *names, 111336cbd3dcSJan Engelhardt const char *name, int to); 11141da177e4SLinus Torvalds extern void 11150d79641aSJulian Anastasov ip_vs_tcpudp_debug_packet(int af, struct ip_vs_protocol *pp, 11160d79641aSJulian Anastasov const struct sk_buff *skb, 11171da177e4SLinus Torvalds int offset, const char *msg); 11181da177e4SLinus Torvalds 11191da177e4SLinus Torvalds extern struct ip_vs_protocol ip_vs_protocol_tcp; 11201da177e4SLinus Torvalds extern struct ip_vs_protocol ip_vs_protocol_udp; 11211da177e4SLinus Torvalds extern struct ip_vs_protocol ip_vs_protocol_icmp; 11221da177e4SLinus Torvalds extern struct ip_vs_protocol ip_vs_protocol_esp; 11231da177e4SLinus Torvalds extern struct ip_vs_protocol ip_vs_protocol_ah; 11242906f66aSVenkata Mohan Reddy extern struct ip_vs_protocol ip_vs_protocol_sctp; 11251da177e4SLinus Torvalds 11261da177e4SLinus Torvalds /* 11271da177e4SLinus Torvalds * Registering/unregistering scheduler functions 11281da177e4SLinus Torvalds * (from ip_vs_sched.c) 11291da177e4SLinus Torvalds */ 11301da177e4SLinus Torvalds extern int register_ip_vs_scheduler(struct ip_vs_scheduler *scheduler); 11311da177e4SLinus Torvalds extern int unregister_ip_vs_scheduler(struct ip_vs_scheduler *scheduler); 11321da177e4SLinus Torvalds extern int ip_vs_bind_scheduler(struct ip_vs_service *svc, 11331da177e4SLinus Torvalds struct ip_vs_scheduler *scheduler); 11341da177e4SLinus Torvalds extern int ip_vs_unbind_scheduler(struct ip_vs_service *svc); 11351da177e4SLinus Torvalds extern struct ip_vs_scheduler *ip_vs_scheduler_get(const char *sched_name); 11361da177e4SLinus Torvalds extern void ip_vs_scheduler_put(struct ip_vs_scheduler *scheduler); 11371da177e4SLinus Torvalds extern struct ip_vs_conn * 1138190ecd27SJulian Anastasov ip_vs_schedule(struct ip_vs_service *svc, struct sk_buff *skb, 11399330419dSHans Schillstrom struct ip_vs_proto_data *pd, int *ignored); 11401da177e4SLinus Torvalds extern int ip_vs_leave(struct ip_vs_service *svc, struct sk_buff *skb, 11419330419dSHans Schillstrom struct ip_vs_proto_data *pd); 11421da177e4SLinus Torvalds 114341ac51eeSPatrick Schaaf extern void ip_vs_scheduler_err(struct ip_vs_service *svc, const char *msg); 114441ac51eeSPatrick Schaaf 11451da177e4SLinus Torvalds 11461da177e4SLinus Torvalds /* 11471da177e4SLinus Torvalds * IPVS control data and functions (from ip_vs_ctl.c) 11481da177e4SLinus Torvalds */ 11491da177e4SLinus Torvalds extern struct ip_vs_stats ip_vs_stats; 11505587da55SSven Wegener extern const struct ctl_path net_vs_ctl_path[]; 1151b880c1f0SHans Schillstrom extern int sysctl_ip_vs_sync_ver; 11521da177e4SLinus Torvalds 1153f131315fSHans Schillstrom extern void ip_vs_sync_switch_mode(struct net *net, int mode); 11541da177e4SLinus Torvalds extern struct ip_vs_service * 1155fc723250SHans Schillstrom ip_vs_service_get(struct net *net, int af, __u32 fwmark, __u16 protocol, 11563c2e0505SJulius Volz const union nf_inet_addr *vaddr, __be16 vport); 11571da177e4SLinus Torvalds 11581da177e4SLinus Torvalds static inline void ip_vs_service_put(struct ip_vs_service *svc) 11591da177e4SLinus Torvalds { 11601da177e4SLinus Torvalds atomic_dec(&svc->usecnt); 11611da177e4SLinus Torvalds } 11621da177e4SLinus Torvalds 11631da177e4SLinus Torvalds extern struct ip_vs_dest * 1164fc723250SHans Schillstrom ip_vs_lookup_real_service(struct net *net, int af, __u16 protocol, 11657937df15SJulius Volz const union nf_inet_addr *daddr, __be16 dport); 11667937df15SJulius Volz 11671da177e4SLinus Torvalds extern int ip_vs_use_count_inc(void); 11681da177e4SLinus Torvalds extern void ip_vs_use_count_dec(void); 11691da177e4SLinus Torvalds extern int ip_vs_control_init(void); 11701da177e4SLinus Torvalds extern void ip_vs_control_cleanup(void); 11711e356f9cSRumen G. Bogdanovski extern struct ip_vs_dest * 1172fc723250SHans Schillstrom ip_vs_find_dest(struct net *net, int af, const union nf_inet_addr *daddr, 1173fc723250SHans Schillstrom __be16 dport, const union nf_inet_addr *vaddr, __be16 vport, 1174fc723250SHans Schillstrom __u16 protocol, __u32 fwmark); 11751e356f9cSRumen G. Bogdanovski extern struct ip_vs_dest *ip_vs_try_bind_dest(struct ip_vs_conn *cp); 11761da177e4SLinus Torvalds 11771da177e4SLinus Torvalds 11781da177e4SLinus Torvalds /* 11791da177e4SLinus Torvalds * IPVS sync daemon data and function prototypes 11801da177e4SLinus Torvalds * (from ip_vs_sync.c) 11811da177e4SLinus Torvalds */ 1182f131315fSHans Schillstrom extern int start_sync_thread(struct net *net, int state, char *mcast_ifn, 1183f131315fSHans Schillstrom __u8 syncid); 1184f131315fSHans Schillstrom extern int stop_sync_thread(struct net *net, int state); 1185f131315fSHans Schillstrom extern void ip_vs_sync_conn(struct net *net, struct ip_vs_conn *cp); 118661b1ab45SHans Schillstrom extern int ip_vs_sync_init(void); 118761b1ab45SHans Schillstrom extern void ip_vs_sync_cleanup(void); 11881da177e4SLinus Torvalds 11891da177e4SLinus Torvalds 11901da177e4SLinus Torvalds /* 11911da177e4SLinus Torvalds * IPVS rate estimator prototypes (from ip_vs_est.c) 11921da177e4SLinus Torvalds */ 1193a919cf4bSSven Wegener extern int ip_vs_estimator_init(void); 1194a919cf4bSSven Wegener extern void ip_vs_estimator_cleanup(void); 119529c2026fSHans Schillstrom extern void ip_vs_new_estimator(struct net *net, struct ip_vs_stats *stats); 119629c2026fSHans Schillstrom extern void ip_vs_kill_estimator(struct net *net, struct ip_vs_stats *stats); 11971da177e4SLinus Torvalds extern void ip_vs_zero_estimator(struct ip_vs_stats *stats); 11981da177e4SLinus Torvalds 11991da177e4SLinus Torvalds /* 12001da177e4SLinus Torvalds * Various IPVS packet transmitters (from ip_vs_xmit.c) 12011da177e4SLinus Torvalds */ 12021da177e4SLinus Torvalds extern int ip_vs_null_xmit 12031da177e4SLinus Torvalds (struct sk_buff *skb, struct ip_vs_conn *cp, struct ip_vs_protocol *pp); 12041da177e4SLinus Torvalds extern int ip_vs_bypass_xmit 12051da177e4SLinus Torvalds (struct sk_buff *skb, struct ip_vs_conn *cp, struct ip_vs_protocol *pp); 12061da177e4SLinus Torvalds extern int ip_vs_nat_xmit 12071da177e4SLinus Torvalds (struct sk_buff *skb, struct ip_vs_conn *cp, struct ip_vs_protocol *pp); 12081da177e4SLinus Torvalds extern int ip_vs_tunnel_xmit 12091da177e4SLinus Torvalds (struct sk_buff *skb, struct ip_vs_conn *cp, struct ip_vs_protocol *pp); 12101da177e4SLinus Torvalds extern int ip_vs_dr_xmit 12111da177e4SLinus Torvalds (struct sk_buff *skb, struct ip_vs_conn *cp, struct ip_vs_protocol *pp); 12121da177e4SLinus Torvalds extern int ip_vs_icmp_xmit 12131da177e4SLinus Torvalds (struct sk_buff *skb, struct ip_vs_conn *cp, struct ip_vs_protocol *pp, int offset); 12141da177e4SLinus Torvalds extern void ip_vs_dst_reset(struct ip_vs_dest *dest); 12151da177e4SLinus Torvalds 1216b3cdd2a7SJulius Volz #ifdef CONFIG_IP_VS_IPV6 1217b3cdd2a7SJulius Volz extern int ip_vs_bypass_xmit_v6 1218b3cdd2a7SJulius Volz (struct sk_buff *skb, struct ip_vs_conn *cp, struct ip_vs_protocol *pp); 1219b3cdd2a7SJulius Volz extern int ip_vs_nat_xmit_v6 1220b3cdd2a7SJulius Volz (struct sk_buff *skb, struct ip_vs_conn *cp, struct ip_vs_protocol *pp); 1221b3cdd2a7SJulius Volz extern int ip_vs_tunnel_xmit_v6 1222b3cdd2a7SJulius Volz (struct sk_buff *skb, struct ip_vs_conn *cp, struct ip_vs_protocol *pp); 1223b3cdd2a7SJulius Volz extern int ip_vs_dr_xmit_v6 1224b3cdd2a7SJulius Volz (struct sk_buff *skb, struct ip_vs_conn *cp, struct ip_vs_protocol *pp); 1225b3cdd2a7SJulius Volz extern int ip_vs_icmp_xmit_v6 1226b3cdd2a7SJulius Volz (struct sk_buff *skb, struct ip_vs_conn *cp, struct ip_vs_protocol *pp, 1227b3cdd2a7SJulius Volz int offset); 1228b3cdd2a7SJulius Volz #endif 12291da177e4SLinus Torvalds 12301da177e4SLinus Torvalds /* 12311da177e4SLinus Torvalds * This is a simple mechanism to ignore packets when 12321da177e4SLinus Torvalds * we are loaded. Just set ip_vs_drop_rate to 'n' and 12331da177e4SLinus Torvalds * we start to drop 1/rate of the packets 12341da177e4SLinus Torvalds */ 12351da177e4SLinus Torvalds 1236a0840e2eSHans Schillstrom static inline int ip_vs_todrop(struct netns_ipvs *ipvs) 12371da177e4SLinus Torvalds { 1238a0840e2eSHans Schillstrom if (!ipvs->drop_rate) 1239a0840e2eSHans Schillstrom return 0; 1240a0840e2eSHans Schillstrom if (--ipvs->drop_counter > 0) 1241a0840e2eSHans Schillstrom return 0; 1242a0840e2eSHans Schillstrom ipvs->drop_counter = ipvs->drop_rate; 12431da177e4SLinus Torvalds return 1; 12441da177e4SLinus Torvalds } 12451da177e4SLinus Torvalds 12461da177e4SLinus Torvalds /* 12471da177e4SLinus Torvalds * ip_vs_fwd_tag returns the forwarding tag of the connection 12481da177e4SLinus Torvalds */ 12491da177e4SLinus Torvalds #define IP_VS_FWD_METHOD(cp) (cp->flags & IP_VS_CONN_F_FWD_MASK) 12501da177e4SLinus Torvalds 1251732db659SAdrian Bunk static inline char ip_vs_fwd_tag(struct ip_vs_conn *cp) 12521da177e4SLinus Torvalds { 12531da177e4SLinus Torvalds char fwd; 12541da177e4SLinus Torvalds 12551da177e4SLinus Torvalds switch (IP_VS_FWD_METHOD(cp)) { 12561da177e4SLinus Torvalds case IP_VS_CONN_F_MASQ: 12571da177e4SLinus Torvalds fwd = 'M'; break; 12581da177e4SLinus Torvalds case IP_VS_CONN_F_LOCALNODE: 12591da177e4SLinus Torvalds fwd = 'L'; break; 12601da177e4SLinus Torvalds case IP_VS_CONN_F_TUNNEL: 12611da177e4SLinus Torvalds fwd = 'T'; break; 12621da177e4SLinus Torvalds case IP_VS_CONN_F_DROUTE: 12631da177e4SLinus Torvalds fwd = 'R'; break; 12641da177e4SLinus Torvalds case IP_VS_CONN_F_BYPASS: 12651da177e4SLinus Torvalds fwd = 'B'; break; 12661da177e4SLinus Torvalds default: 12671da177e4SLinus Torvalds fwd = '?'; break; 12681da177e4SLinus Torvalds } 12691da177e4SLinus Torvalds return fwd; 12701da177e4SLinus Torvalds } 12711da177e4SLinus Torvalds 12721da177e4SLinus Torvalds extern void ip_vs_nat_icmp(struct sk_buff *skb, struct ip_vs_protocol *pp, 12731da177e4SLinus Torvalds struct ip_vs_conn *cp, int dir); 12741da177e4SLinus Torvalds 1275b3cdd2a7SJulius Volz #ifdef CONFIG_IP_VS_IPV6 1276b3cdd2a7SJulius Volz extern void ip_vs_nat_icmp_v6(struct sk_buff *skb, struct ip_vs_protocol *pp, 1277b3cdd2a7SJulius Volz struct ip_vs_conn *cp, int dir); 1278b3cdd2a7SJulius Volz #endif 1279b3cdd2a7SJulius Volz 1280b1550f22SAl Viro extern __sum16 ip_vs_checksum_complete(struct sk_buff *skb, int offset); 12811da177e4SLinus Torvalds 1282f9214b26SAl Viro static inline __wsum ip_vs_check_diff4(__be32 old, __be32 new, __wsum oldsum) 12831da177e4SLinus Torvalds { 1284f9214b26SAl Viro __be32 diff[2] = { ~old, new }; 12851da177e4SLinus Torvalds 128607f0757aSJoe Perches return csum_partial(diff, sizeof(diff), oldsum); 1287f9214b26SAl Viro } 1288f9214b26SAl Viro 12890bbdd42bSJulius Volz #ifdef CONFIG_IP_VS_IPV6 12900bbdd42bSJulius Volz static inline __wsum ip_vs_check_diff16(const __be32 *old, const __be32 *new, 12910bbdd42bSJulius Volz __wsum oldsum) 12920bbdd42bSJulius Volz { 12930bbdd42bSJulius Volz __be32 diff[8] = { ~old[3], ~old[2], ~old[1], ~old[0], 12940bbdd42bSJulius Volz new[3], new[2], new[1], new[0] }; 12950bbdd42bSJulius Volz 129607f0757aSJoe Perches return csum_partial(diff, sizeof(diff), oldsum); 12970bbdd42bSJulius Volz } 12980bbdd42bSJulius Volz #endif 12990bbdd42bSJulius Volz 1300f9214b26SAl Viro static inline __wsum ip_vs_check_diff2(__be16 old, __be16 new, __wsum oldsum) 1301f9214b26SAl Viro { 1302f9214b26SAl Viro __be16 diff[2] = { ~old, new }; 1303f9214b26SAl Viro 130407f0757aSJoe Perches return csum_partial(diff, sizeof(diff), oldsum); 13051da177e4SLinus Torvalds } 13061da177e4SLinus Torvalds 1307cf356d69SJulian Anastasov /* 1308cf356d69SJulian Anastasov * Forget current conntrack (unconfirmed) and attach notrack entry 1309cf356d69SJulian Anastasov */ 1310cf356d69SJulian Anastasov static inline void ip_vs_notrack(struct sk_buff *skb) 1311cf356d69SJulian Anastasov { 1312cf356d69SJulian Anastasov #if defined(CONFIG_NF_CONNTRACK) || defined(CONFIG_NF_CONNTRACK_MODULE) 1313cf356d69SJulian Anastasov enum ip_conntrack_info ctinfo; 131406b69390SJesper Juhl struct nf_conn *ct = nf_ct_get(skb, &ctinfo); 1315cf356d69SJulian Anastasov 1316cf356d69SJulian Anastasov if (!ct || !nf_ct_is_untracked(ct)) { 1317cf356d69SJulian Anastasov nf_reset(skb); 1318cf356d69SJulian Anastasov skb->nfct = &nf_ct_untracked_get()->ct_general; 1319cf356d69SJulian Anastasov skb->nfctinfo = IP_CT_NEW; 1320cf356d69SJulian Anastasov nf_conntrack_get(skb->nfct); 1321cf356d69SJulian Anastasov } 1322cf356d69SJulian Anastasov #endif 1323cf356d69SJulian Anastasov } 1324cf356d69SJulian Anastasov 1325f4bc17cdSJulian Anastasov #ifdef CONFIG_IP_VS_NFCT 1326f4bc17cdSJulian Anastasov /* 1327f4bc17cdSJulian Anastasov * Netfilter connection tracking 1328f4bc17cdSJulian Anastasov * (from ip_vs_nfct.c) 1329f4bc17cdSJulian Anastasov */ 1330a0840e2eSHans Schillstrom static inline int ip_vs_conntrack_enabled(struct netns_ipvs *ipvs) 1331f4bc17cdSJulian Anastasov { 1332a0840e2eSHans Schillstrom return ipvs->sysctl_conntrack; 1333f4bc17cdSJulian Anastasov } 1334f4bc17cdSJulian Anastasov 13356523ce15SJulian Anastasov extern void ip_vs_update_conntrack(struct sk_buff *skb, struct ip_vs_conn *cp, 13366523ce15SJulian Anastasov int outin); 1337f4bc17cdSJulian Anastasov extern int ip_vs_confirm_conntrack(struct sk_buff *skb, struct ip_vs_conn *cp); 1338f4bc17cdSJulian Anastasov extern void ip_vs_nfct_expect_related(struct sk_buff *skb, struct nf_conn *ct, 1339f4bc17cdSJulian Anastasov struct ip_vs_conn *cp, u_int8_t proto, 1340f4bc17cdSJulian Anastasov const __be16 port, int from_rs); 1341f4bc17cdSJulian Anastasov extern void ip_vs_conn_drop_conntrack(struct ip_vs_conn *cp); 1342f4bc17cdSJulian Anastasov 1343f4bc17cdSJulian Anastasov #else 1344f4bc17cdSJulian Anastasov 1345a0840e2eSHans Schillstrom static inline int ip_vs_conntrack_enabled(struct netns_ipvs *ipvs) 1346f4bc17cdSJulian Anastasov { 1347f4bc17cdSJulian Anastasov return 0; 1348f4bc17cdSJulian Anastasov } 1349f4bc17cdSJulian Anastasov 1350f4bc17cdSJulian Anastasov static inline void ip_vs_update_conntrack(struct sk_buff *skb, 1351f4bc17cdSJulian Anastasov struct ip_vs_conn *cp, int outin) 1352f4bc17cdSJulian Anastasov { 1353f4bc17cdSJulian Anastasov } 1354f4bc17cdSJulian Anastasov 1355f4bc17cdSJulian Anastasov static inline int ip_vs_confirm_conntrack(struct sk_buff *skb, 1356f4bc17cdSJulian Anastasov struct ip_vs_conn *cp) 1357f4bc17cdSJulian Anastasov { 1358f4bc17cdSJulian Anastasov return NF_ACCEPT; 1359f4bc17cdSJulian Anastasov } 1360f4bc17cdSJulian Anastasov 1361f4bc17cdSJulian Anastasov static inline void ip_vs_conn_drop_conntrack(struct ip_vs_conn *cp) 1362f4bc17cdSJulian Anastasov { 1363f4bc17cdSJulian Anastasov } 1364f4bc17cdSJulian Anastasov /* CONFIG_IP_VS_NFCT */ 1365f4bc17cdSJulian Anastasov #endif 13666523ce15SJulian Anastasov 1367b552f7e3SChangli Gao static inline unsigned int 1368b552f7e3SChangli Gao ip_vs_dest_conn_overhead(struct ip_vs_dest *dest) 1369b552f7e3SChangli Gao { 1370b552f7e3SChangli Gao /* 1371b552f7e3SChangli Gao * We think the overhead of processing active connections is 256 1372b552f7e3SChangli Gao * times higher than that of inactive connections in average. (This 1373b552f7e3SChangli Gao * 256 times might not be accurate, we will change it later) We 1374b552f7e3SChangli Gao * use the following formula to estimate the overhead now: 1375b552f7e3SChangli Gao * dest->activeconns*256 + dest->inactconns 1376b552f7e3SChangli Gao */ 1377b552f7e3SChangli Gao return (atomic_read(&dest->activeconns) << 8) + 1378b552f7e3SChangli Gao atomic_read(&dest->inactconns); 1379b552f7e3SChangli Gao } 1380b552f7e3SChangli Gao 13811da177e4SLinus Torvalds #endif /* __KERNEL__ */ 13821da177e4SLinus Torvalds 1383bc4768ebSJulius Volz #endif /* _NET_IP_VS_H */ 1384