xref: /OK3568_Linux_fs/kernel/include/net/ip_vs.h (revision 4882a59341e53eb6f0b4789bf948001014eff981)
1*4882a593Smuzhiyun /* SPDX-License-Identifier: GPL-2.0 */
2*4882a593Smuzhiyun /* IP Virtual Server
3*4882a593Smuzhiyun  * data structure and functionality definitions
4*4882a593Smuzhiyun  */
5*4882a593Smuzhiyun 
6*4882a593Smuzhiyun #ifndef _NET_IP_VS_H
7*4882a593Smuzhiyun #define _NET_IP_VS_H
8*4882a593Smuzhiyun 
9*4882a593Smuzhiyun #include <linux/ip_vs.h>                /* definitions shared with userland */
10*4882a593Smuzhiyun 
11*4882a593Smuzhiyun #include <asm/types.h>                  /* for __uXX types */
12*4882a593Smuzhiyun 
13*4882a593Smuzhiyun #include <linux/list.h>                 /* for struct list_head */
14*4882a593Smuzhiyun #include <linux/spinlock.h>             /* for struct rwlock_t */
15*4882a593Smuzhiyun #include <linux/atomic.h>               /* for struct atomic_t */
16*4882a593Smuzhiyun #include <linux/refcount.h>             /* for struct refcount_t */
17*4882a593Smuzhiyun #include <linux/workqueue.h>
18*4882a593Smuzhiyun 
19*4882a593Smuzhiyun #include <linux/compiler.h>
20*4882a593Smuzhiyun #include <linux/timer.h>
21*4882a593Smuzhiyun #include <linux/bug.h>
22*4882a593Smuzhiyun 
23*4882a593Smuzhiyun #include <net/checksum.h>
24*4882a593Smuzhiyun #include <linux/netfilter.h>		/* for union nf_inet_addr */
25*4882a593Smuzhiyun #include <linux/ip.h>
26*4882a593Smuzhiyun #include <linux/ipv6.h>			/* for struct ipv6hdr */
27*4882a593Smuzhiyun #include <net/ipv6.h>
28*4882a593Smuzhiyun #if IS_ENABLED(CONFIG_NF_CONNTRACK)
29*4882a593Smuzhiyun #include <net/netfilter/nf_conntrack.h>
30*4882a593Smuzhiyun #endif
31*4882a593Smuzhiyun #include <net/net_namespace.h>		/* Netw namespace */
32*4882a593Smuzhiyun 
/* Bit flags kept in ip_vs_iphdr.hdr_flags */
#define IP_VS_HDR_INVERSE	0x1	/* caller requested inverse handling */
#define IP_VS_HDR_ICMP		0x2	/* header was filled via the ICMP helper */
35*4882a593Smuzhiyun 
36*4882a593Smuzhiyun /* Generic access of ipvs struct */
net_ipvs(struct net * net)37*4882a593Smuzhiyun static inline struct netns_ipvs *net_ipvs(struct net* net)
38*4882a593Smuzhiyun {
39*4882a593Smuzhiyun 	return net->ipvs;
40*4882a593Smuzhiyun }
41*4882a593Smuzhiyun 
42*4882a593Smuzhiyun /* Connections' size value needed by ip_vs_ctl.c */
43*4882a593Smuzhiyun extern int ip_vs_conn_tab_size;
44*4882a593Smuzhiyun 
45*4882a593Smuzhiyun struct ip_vs_iphdr {
46*4882a593Smuzhiyun 	int hdr_flags;	/* ipvs flags */
47*4882a593Smuzhiyun 	__u32 off;	/* Where IP or IPv4 header starts */
48*4882a593Smuzhiyun 	__u32 len;	/* IPv4 simply where L4 starts
49*4882a593Smuzhiyun 			 * IPv6 where L4 Transport Header starts */
50*4882a593Smuzhiyun 	__u16 fragoffs; /* IPv6 fragment offset, 0 if first frag (or not frag)*/
51*4882a593Smuzhiyun 	__s16 protocol;
52*4882a593Smuzhiyun 	__s32 flags;
53*4882a593Smuzhiyun 	union nf_inet_addr saddr;
54*4882a593Smuzhiyun 	union nf_inet_addr daddr;
55*4882a593Smuzhiyun };
56*4882a593Smuzhiyun 
/* Forward all arguments unchanged to skb_header_pointer() and return its
 * result.
 */
static inline void *frag_safe_skb_hp(const struct sk_buff *skb, int offset,
				      int len, void *buffer)
{
	void *hdr = skb_header_pointer(skb, offset, len, buffer);

	return hdr;
}
62*4882a593Smuzhiyun 
63*4882a593Smuzhiyun /* This function handles filling *ip_vs_iphdr, both for IPv4 and IPv6.
64*4882a593Smuzhiyun  * IPv6 requires some extra work, as finding proper header position,
65*4882a593Smuzhiyun  * depend on the IPv6 extension headers.
66*4882a593Smuzhiyun  */
67*4882a593Smuzhiyun static inline int
ip_vs_fill_iph_skb_off(int af,const struct sk_buff * skb,int offset,int hdr_flags,struct ip_vs_iphdr * iphdr)68*4882a593Smuzhiyun ip_vs_fill_iph_skb_off(int af, const struct sk_buff *skb, int offset,
69*4882a593Smuzhiyun 		       int hdr_flags, struct ip_vs_iphdr *iphdr)
70*4882a593Smuzhiyun {
71*4882a593Smuzhiyun 	iphdr->hdr_flags = hdr_flags;
72*4882a593Smuzhiyun 	iphdr->off = offset;
73*4882a593Smuzhiyun 
74*4882a593Smuzhiyun #ifdef CONFIG_IP_VS_IPV6
75*4882a593Smuzhiyun 	if (af == AF_INET6) {
76*4882a593Smuzhiyun 		struct ipv6hdr _iph;
77*4882a593Smuzhiyun 		const struct ipv6hdr *iph = skb_header_pointer(
78*4882a593Smuzhiyun 			skb, offset, sizeof(_iph), &_iph);
79*4882a593Smuzhiyun 		if (!iph)
80*4882a593Smuzhiyun 			return 0;
81*4882a593Smuzhiyun 
82*4882a593Smuzhiyun 		iphdr->saddr.in6 = iph->saddr;
83*4882a593Smuzhiyun 		iphdr->daddr.in6 = iph->daddr;
84*4882a593Smuzhiyun 		/* ipv6_find_hdr() updates len, flags */
85*4882a593Smuzhiyun 		iphdr->len	 = offset;
86*4882a593Smuzhiyun 		iphdr->flags	 = 0;
87*4882a593Smuzhiyun 		iphdr->protocol  = ipv6_find_hdr(skb, &iphdr->len, -1,
88*4882a593Smuzhiyun 						 &iphdr->fragoffs,
89*4882a593Smuzhiyun 						 &iphdr->flags);
90*4882a593Smuzhiyun 		if (iphdr->protocol < 0)
91*4882a593Smuzhiyun 			return 0;
92*4882a593Smuzhiyun 	} else
93*4882a593Smuzhiyun #endif
94*4882a593Smuzhiyun 	{
95*4882a593Smuzhiyun 		struct iphdr _iph;
96*4882a593Smuzhiyun 		const struct iphdr *iph = skb_header_pointer(
97*4882a593Smuzhiyun 			skb, offset, sizeof(_iph), &_iph);
98*4882a593Smuzhiyun 		if (!iph)
99*4882a593Smuzhiyun 			return 0;
100*4882a593Smuzhiyun 
101*4882a593Smuzhiyun 		iphdr->len	= offset + iph->ihl * 4;
102*4882a593Smuzhiyun 		iphdr->fragoffs	= 0;
103*4882a593Smuzhiyun 		iphdr->protocol	= iph->protocol;
104*4882a593Smuzhiyun 		iphdr->saddr.ip	= iph->saddr;
105*4882a593Smuzhiyun 		iphdr->daddr.ip	= iph->daddr;
106*4882a593Smuzhiyun 	}
107*4882a593Smuzhiyun 
108*4882a593Smuzhiyun 	return 1;
109*4882a593Smuzhiyun }
110*4882a593Smuzhiyun 
111*4882a593Smuzhiyun static inline int
ip_vs_fill_iph_skb_icmp(int af,const struct sk_buff * skb,int offset,bool inverse,struct ip_vs_iphdr * iphdr)112*4882a593Smuzhiyun ip_vs_fill_iph_skb_icmp(int af, const struct sk_buff *skb, int offset,
113*4882a593Smuzhiyun 			bool inverse, struct ip_vs_iphdr *iphdr)
114*4882a593Smuzhiyun {
115*4882a593Smuzhiyun 	int hdr_flags = IP_VS_HDR_ICMP;
116*4882a593Smuzhiyun 
117*4882a593Smuzhiyun 	if (inverse)
118*4882a593Smuzhiyun 		hdr_flags |= IP_VS_HDR_INVERSE;
119*4882a593Smuzhiyun 
120*4882a593Smuzhiyun 	return ip_vs_fill_iph_skb_off(af, skb, offset, hdr_flags, iphdr);
121*4882a593Smuzhiyun }
122*4882a593Smuzhiyun 
123*4882a593Smuzhiyun static inline int
ip_vs_fill_iph_skb(int af,const struct sk_buff * skb,bool inverse,struct ip_vs_iphdr * iphdr)124*4882a593Smuzhiyun ip_vs_fill_iph_skb(int af, const struct sk_buff *skb, bool inverse,
125*4882a593Smuzhiyun 		   struct ip_vs_iphdr *iphdr)
126*4882a593Smuzhiyun {
127*4882a593Smuzhiyun 	int hdr_flags = 0;
128*4882a593Smuzhiyun 
129*4882a593Smuzhiyun 	if (inverse)
130*4882a593Smuzhiyun 		hdr_flags |= IP_VS_HDR_INVERSE;
131*4882a593Smuzhiyun 
132*4882a593Smuzhiyun 	return ip_vs_fill_iph_skb_off(af, skb, skb_network_offset(skb),
133*4882a593Smuzhiyun 				      hdr_flags, iphdr);
134*4882a593Smuzhiyun }
135*4882a593Smuzhiyun 
136*4882a593Smuzhiyun static inline bool
ip_vs_iph_inverse(const struct ip_vs_iphdr * iph)137*4882a593Smuzhiyun ip_vs_iph_inverse(const struct ip_vs_iphdr *iph)
138*4882a593Smuzhiyun {
139*4882a593Smuzhiyun 	return !!(iph->hdr_flags & IP_VS_HDR_INVERSE);
140*4882a593Smuzhiyun }
141*4882a593Smuzhiyun 
142*4882a593Smuzhiyun static inline bool
ip_vs_iph_icmp(const struct ip_vs_iphdr * iph)143*4882a593Smuzhiyun ip_vs_iph_icmp(const struct ip_vs_iphdr *iph)
144*4882a593Smuzhiyun {
145*4882a593Smuzhiyun 	return !!(iph->hdr_flags & IP_VS_HDR_ICMP);
146*4882a593Smuzhiyun }
147*4882a593Smuzhiyun 
ip_vs_addr_copy(int af,union nf_inet_addr * dst,const union nf_inet_addr * src)148*4882a593Smuzhiyun static inline void ip_vs_addr_copy(int af, union nf_inet_addr *dst,
149*4882a593Smuzhiyun 				   const union nf_inet_addr *src)
150*4882a593Smuzhiyun {
151*4882a593Smuzhiyun #ifdef CONFIG_IP_VS_IPV6
152*4882a593Smuzhiyun 	if (af == AF_INET6)
153*4882a593Smuzhiyun 		dst->in6 = src->in6;
154*4882a593Smuzhiyun 	else
155*4882a593Smuzhiyun #endif
156*4882a593Smuzhiyun 	dst->ip = src->ip;
157*4882a593Smuzhiyun }
158*4882a593Smuzhiyun 
ip_vs_addr_set(int af,union nf_inet_addr * dst,const union nf_inet_addr * src)159*4882a593Smuzhiyun static inline void ip_vs_addr_set(int af, union nf_inet_addr *dst,
160*4882a593Smuzhiyun 				  const union nf_inet_addr *src)
161*4882a593Smuzhiyun {
162*4882a593Smuzhiyun #ifdef CONFIG_IP_VS_IPV6
163*4882a593Smuzhiyun 	if (af == AF_INET6) {
164*4882a593Smuzhiyun 		dst->in6 = src->in6;
165*4882a593Smuzhiyun 		return;
166*4882a593Smuzhiyun 	}
167*4882a593Smuzhiyun #endif
168*4882a593Smuzhiyun 	dst->ip = src->ip;
169*4882a593Smuzhiyun 	dst->all[1] = 0;
170*4882a593Smuzhiyun 	dst->all[2] = 0;
171*4882a593Smuzhiyun 	dst->all[3] = 0;
172*4882a593Smuzhiyun }
173*4882a593Smuzhiyun 
ip_vs_addr_equal(int af,const union nf_inet_addr * a,const union nf_inet_addr * b)174*4882a593Smuzhiyun static inline int ip_vs_addr_equal(int af, const union nf_inet_addr *a,
175*4882a593Smuzhiyun 				   const union nf_inet_addr *b)
176*4882a593Smuzhiyun {
177*4882a593Smuzhiyun #ifdef CONFIG_IP_VS_IPV6
178*4882a593Smuzhiyun 	if (af == AF_INET6)
179*4882a593Smuzhiyun 		return ipv6_addr_equal(&a->in6, &b->in6);
180*4882a593Smuzhiyun #endif
181*4882a593Smuzhiyun 	return a->ip == b->ip;
182*4882a593Smuzhiyun }
183*4882a593Smuzhiyun 
184*4882a593Smuzhiyun #ifdef CONFIG_IP_VS_DEBUG
185*4882a593Smuzhiyun #include <linux/net.h>
186*4882a593Smuzhiyun 
187*4882a593Smuzhiyun int ip_vs_get_debug_level(void);
188*4882a593Smuzhiyun 
/* Format @addr as text into @buf starting at position *@idx and return a
 * pointer to the start of the formatted string.
 *
 * IPv6 addresses (with CONFIG_IP_VS_IPV6) are printed as "[%pI6c]", all
 * others as "%pI4".  *@idx is advanced by the snprintf() result plus one,
 * i.e. past the terminating NUL, so several addresses can share one buffer.
 *
 * NOTE(review): the BUG_ON() tolerates *idx == buf_len + 1, which looks like
 * it lets a truncation by one character through - confirm intent.
 */
static inline const char *ip_vs_dbg_addr(int af, char *buf, size_t buf_len,
					 const union nf_inet_addr *addr,
					 int *idx)
{
	char *start = &buf[*idx];
	size_t room = buf_len - *idx;
	int used;

#ifdef CONFIG_IP_VS_IPV6
	if (af == AF_INET6)
		used = snprintf(start, room, "[%pI6c]", &addr->in6) + 1;
	else
#endif
		used = snprintf(start, room, "%pI4", &addr->ip) + 1;

	*idx += used;
	BUG_ON(*idx > buf_len + 1);
	return start;
}
207*4882a593Smuzhiyun 
/* Print a KERN_DEBUG message when @level does not exceed the value returned
 * by ip_vs_get_debug_level().  Declares the scratch buffer and index that
 * IP_VS_DBG_ADDR() relies on, so addresses can be formatted in the argument
 * list.  Macro parameters used in expressions are parenthesised so that
 * expression arguments keep their intended precedence.
 */
#define IP_VS_DBG_BUF(level, msg, ...)					\
	do {								\
		char ip_vs_dbg_buf[160];				\
		int ip_vs_dbg_idx = 0;					\
		if ((level) <= ip_vs_get_debug_level())			\
			printk(KERN_DEBUG pr_fmt(msg), ##__VA_ARGS__);	\
	} while (0)
/* Unconditional pr_err() variant that also provides the scratch buffer */
#define IP_VS_ERR_BUF(msg...)						\
	do {								\
		char ip_vs_dbg_buf[160];				\
		int ip_vs_dbg_idx = 0;					\
		pr_err(msg);						\
	} while (0)

/* Only use from within IP_VS_DBG_BUF() or IP_VS_ERR_BUF macros */
#define IP_VS_DBG_ADDR(af, addr)					\
	ip_vs_dbg_addr(af, ip_vs_dbg_buf,				\
		       sizeof(ip_vs_dbg_buf), addr,			\
		       &ip_vs_dbg_idx)

/* Level-gated KERN_DEBUG message without the address scratch buffer */
#define IP_VS_DBG(level, msg, ...)					\
	do {								\
		if ((level) <= ip_vs_get_debug_level())			\
			printk(KERN_DEBUG pr_fmt(msg), ##__VA_ARGS__);	\
	} while (0)
/* KERN_DEBUG message gated by net_ratelimit() only (no level check) */
#define IP_VS_DBG_RL(msg, ...)						\
	do {								\
		if (net_ratelimit())					\
			printk(KERN_DEBUG pr_fmt(msg), ##__VA_ARGS__);	\
	} while (0)
/* Level-gated call of the protocol's debug_packet() hook */
#define IP_VS_DBG_PKT(level, af, pp, skb, ofs, msg)			\
	do {								\
		if ((level) <= ip_vs_get_debug_level())			\
			(pp)->debug_packet(af, pp, skb, ofs, msg);	\
	} while (0)
/* As IP_VS_DBG_PKT(), additionally gated by net_ratelimit() */
#define IP_VS_DBG_RL_PKT(level, af, pp, skb, ofs, msg)			\
	do {								\
		if ((level) <= ip_vs_get_debug_level() &&		\
		    net_ratelimit())					\
			(pp)->debug_packet(af, pp, skb, ofs, msg);	\
	} while (0)
249*4882a593Smuzhiyun #else	/* NO DEBUGGING at ALL */
/* Debugging compiled out: each macro expands to an empty statement, so its
 * arguments are never evaluated.
 */
#define IP_VS_DBG_BUF(level, msg...)			do { } while (0)
#define IP_VS_ERR_BUF(msg...)				do { } while (0)
#define IP_VS_DBG(level, msg...)			do { } while (0)
#define IP_VS_DBG_RL(msg...)				do { } while (0)
#define IP_VS_DBG_PKT(level, af, pp, skb, ofs, msg)	do { } while (0)
#define IP_VS_DBG_RL_PKT(level, af, pp, skb, ofs, msg)	do { } while (0)
256*4882a593Smuzhiyun #endif
257*4882a593Smuzhiyun 
/* IP_VS_BUG() is a plain alias for BUG(). */
#define IP_VS_BUG() BUG()
/* pr_err() that is emitted only when net_ratelimit() allows it; available
 * regardless of CONFIG_IP_VS_DEBUG.
 */
#define IP_VS_ERR_RL(msg, ...)						\
	do {								\
		if (net_ratelimit())					\
			pr_err(msg, ##__VA_ARGS__);			\
	} while (0)
264*4882a593Smuzhiyun 
/* Function entry/exit tracing.  With CONFIG_IP_VS_DEBUG each macro prints
 * the function name, file and line at KERN_DEBUG when @level does not exceed
 * ip_vs_get_debug_level(); otherwise both expand to empty statements.
 * @level is parenthesised so expression arguments keep their precedence.
 */
#ifdef CONFIG_IP_VS_DEBUG
#define EnterFunction(level)						\
	do {								\
		if ((level) <= ip_vs_get_debug_level())			\
			printk(KERN_DEBUG				\
			       pr_fmt("Enter: %s, %s line %i\n"),	\
			       __func__, __FILE__, __LINE__);		\
	} while (0)
#define LeaveFunction(level)						\
	do {								\
		if ((level) <= ip_vs_get_debug_level())			\
			printk(KERN_DEBUG				\
			       pr_fmt("Leave: %s, %s line %i\n"),	\
			       __func__, __FILE__, __LINE__);		\
	} while (0)
#else
#define EnterFunction(level)   do {} while (0)
#define LeaveFunction(level)   do {} while (0)
#endif
284*4882a593Smuzhiyun 
/* FTP service port numbers, converted to network byte order. */
#define FTPPORT  cpu_to_be16(21)	/* value 21 */
#define FTPDATA  cpu_to_be16(20)	/* value 20 */
288*4882a593Smuzhiyun 
/* TCP connection states; values are consecutive starting at 0 */
enum {
	IP_VS_TCP_S_NONE	= 0,
	IP_VS_TCP_S_ESTABLISHED	= 1,
	IP_VS_TCP_S_SYN_SENT	= 2,
	IP_VS_TCP_S_SYN_RECV	= 3,
	IP_VS_TCP_S_FIN_WAIT	= 4,
	IP_VS_TCP_S_TIME_WAIT	= 5,
	IP_VS_TCP_S_CLOSE	= 6,
	IP_VS_TCP_S_CLOSE_WAIT	= 7,
	IP_VS_TCP_S_LAST_ACK	= 8,
	IP_VS_TCP_S_LISTEN	= 9,
	IP_VS_TCP_S_SYNACK	= 10,
	IP_VS_TCP_S_LAST	= 11	/* one past the highest state value */
};
304*4882a593Smuzhiyun 
/* UDP connection states */
enum {
	IP_VS_UDP_S_NORMAL	= 0,
	IP_VS_UDP_S_LAST	= 1,	/* one past the highest state value */
};
310*4882a593Smuzhiyun 
/* ICMP connection states */
enum {
	IP_VS_ICMP_S_NORMAL	= 0,
	IP_VS_ICMP_S_LAST	= 1,	/* one past the highest state value */
};
316*4882a593Smuzhiyun 
/* SCTP connection states; values are consecutive starting at 0 */
enum ip_vs_sctp_states {
	IP_VS_SCTP_S_NONE		= 0,
	IP_VS_SCTP_S_INIT1		= 1,
	IP_VS_SCTP_S_INIT		= 2,
	IP_VS_SCTP_S_COOKIE_SENT	= 3,
	IP_VS_SCTP_S_COOKIE_REPLIED	= 4,
	IP_VS_SCTP_S_COOKIE_WAIT	= 5,
	IP_VS_SCTP_S_COOKIE		= 6,
	IP_VS_SCTP_S_COOKIE_ECHOED	= 7,
	IP_VS_SCTP_S_ESTABLISHED	= 8,
	IP_VS_SCTP_S_SHUTDOWN_SENT	= 9,
	IP_VS_SCTP_S_SHUTDOWN_RECEIVED	= 10,
	IP_VS_SCTP_S_SHUTDOWN_ACK_SENT	= 11,
	IP_VS_SCTP_S_REJECTED		= 12,
	IP_VS_SCTP_S_CLOSED		= 13,
	IP_VS_SCTP_S_LAST		= 14	/* one past the highest state value */
};
335*4882a593Smuzhiyun 
/* State bits used by connection templates */
#define IP_VS_CTPL_S_NONE		0x0000
#define IP_VS_CTPL_S_ASSURED		0x0001
#define IP_VS_CTPL_S_LAST		0x0002	/* first value past the ones above */
340*4882a593Smuzhiyun 
341*4882a593Smuzhiyun /* Delta sequence info structure
342*4882a593Smuzhiyun  * Each ip_vs_conn has 2 (output AND input seq. changes).
343*4882a593Smuzhiyun  * Only used in the VS/NAT.
344*4882a593Smuzhiyun  */
345*4882a593Smuzhiyun struct ip_vs_seq {
346*4882a593Smuzhiyun 	__u32			init_seq;	/* Add delta from this seq */
347*4882a593Smuzhiyun 	__u32			delta;		/* Delta in sequence numbers */
348*4882a593Smuzhiyun 	__u32			previous_delta;	/* Delta in sequence numbers
349*4882a593Smuzhiyun 						 * before last resized pkt */
350*4882a593Smuzhiyun };
351*4882a593Smuzhiyun 
352*4882a593Smuzhiyun /* counters per cpu */
353*4882a593Smuzhiyun struct ip_vs_counters {
354*4882a593Smuzhiyun 	__u64		conns;		/* connections scheduled */
355*4882a593Smuzhiyun 	__u64		inpkts;		/* incoming packets */
356*4882a593Smuzhiyun 	__u64		outpkts;	/* outgoing packets */
357*4882a593Smuzhiyun 	__u64		inbytes;	/* incoming bytes */
358*4882a593Smuzhiyun 	__u64		outbytes;	/* outgoing bytes */
359*4882a593Smuzhiyun };
360*4882a593Smuzhiyun /* Stats per cpu */
361*4882a593Smuzhiyun struct ip_vs_cpu_stats {
362*4882a593Smuzhiyun 	struct ip_vs_counters   cnt;
363*4882a593Smuzhiyun 	struct u64_stats_sync   syncp;
364*4882a593Smuzhiyun };
365*4882a593Smuzhiyun 
366*4882a593Smuzhiyun /* IPVS statistics objects */
367*4882a593Smuzhiyun struct ip_vs_estimator {
368*4882a593Smuzhiyun 	struct list_head	list;
369*4882a593Smuzhiyun 
370*4882a593Smuzhiyun 	u64			last_inbytes;
371*4882a593Smuzhiyun 	u64			last_outbytes;
372*4882a593Smuzhiyun 	u64			last_conns;
373*4882a593Smuzhiyun 	u64			last_inpkts;
374*4882a593Smuzhiyun 	u64			last_outpkts;
375*4882a593Smuzhiyun 
376*4882a593Smuzhiyun 	u64			cps;
377*4882a593Smuzhiyun 	u64			inpps;
378*4882a593Smuzhiyun 	u64			outpps;
379*4882a593Smuzhiyun 	u64			inbps;
380*4882a593Smuzhiyun 	u64			outbps;
381*4882a593Smuzhiyun };
382*4882a593Smuzhiyun 
383*4882a593Smuzhiyun /*
384*4882a593Smuzhiyun  * IPVS statistics object, 64-bit kernel version of struct ip_vs_stats_user
385*4882a593Smuzhiyun  */
386*4882a593Smuzhiyun struct ip_vs_kstats {
387*4882a593Smuzhiyun 	u64			conns;		/* connections scheduled */
388*4882a593Smuzhiyun 	u64			inpkts;		/* incoming packets */
389*4882a593Smuzhiyun 	u64			outpkts;	/* outgoing packets */
390*4882a593Smuzhiyun 	u64			inbytes;	/* incoming bytes */
391*4882a593Smuzhiyun 	u64			outbytes;	/* outgoing bytes */
392*4882a593Smuzhiyun 
393*4882a593Smuzhiyun 	u64			cps;		/* current connection rate */
394*4882a593Smuzhiyun 	u64			inpps;		/* current in packet rate */
395*4882a593Smuzhiyun 	u64			outpps;		/* current out packet rate */
396*4882a593Smuzhiyun 	u64			inbps;		/* current in byte rate */
397*4882a593Smuzhiyun 	u64			outbps;		/* current out byte rate */
398*4882a593Smuzhiyun };
399*4882a593Smuzhiyun 
400*4882a593Smuzhiyun struct ip_vs_stats {
401*4882a593Smuzhiyun 	struct ip_vs_kstats	kstats;		/* kernel statistics */
402*4882a593Smuzhiyun 	struct ip_vs_estimator	est;		/* estimator */
403*4882a593Smuzhiyun 	struct ip_vs_cpu_stats __percpu	*cpustats;	/* per cpu counters */
404*4882a593Smuzhiyun 	spinlock_t		lock;		/* spin lock */
405*4882a593Smuzhiyun 	struct ip_vs_kstats	kstats0;	/* reset values */
406*4882a593Smuzhiyun };
407*4882a593Smuzhiyun 
408*4882a593Smuzhiyun struct dst_entry;
409*4882a593Smuzhiyun struct iphdr;
410*4882a593Smuzhiyun struct ip_vs_conn;
411*4882a593Smuzhiyun struct ip_vs_app;
412*4882a593Smuzhiyun struct sk_buff;
413*4882a593Smuzhiyun struct ip_vs_proto_data;
414*4882a593Smuzhiyun 
415*4882a593Smuzhiyun struct ip_vs_protocol {
416*4882a593Smuzhiyun 	struct ip_vs_protocol	*next;
417*4882a593Smuzhiyun 	char			*name;
418*4882a593Smuzhiyun 	u16			protocol;
419*4882a593Smuzhiyun 	u16			num_states;
420*4882a593Smuzhiyun 	int			dont_defrag;
421*4882a593Smuzhiyun 
422*4882a593Smuzhiyun 	void (*init)(struct ip_vs_protocol *pp);
423*4882a593Smuzhiyun 
424*4882a593Smuzhiyun 	void (*exit)(struct ip_vs_protocol *pp);
425*4882a593Smuzhiyun 
426*4882a593Smuzhiyun 	int (*init_netns)(struct netns_ipvs *ipvs, struct ip_vs_proto_data *pd);
427*4882a593Smuzhiyun 
428*4882a593Smuzhiyun 	void (*exit_netns)(struct netns_ipvs *ipvs, struct ip_vs_proto_data *pd);
429*4882a593Smuzhiyun 
430*4882a593Smuzhiyun 	int (*conn_schedule)(struct netns_ipvs *ipvs,
431*4882a593Smuzhiyun 			     int af, struct sk_buff *skb,
432*4882a593Smuzhiyun 			     struct ip_vs_proto_data *pd,
433*4882a593Smuzhiyun 			     int *verdict, struct ip_vs_conn **cpp,
434*4882a593Smuzhiyun 			     struct ip_vs_iphdr *iph);
435*4882a593Smuzhiyun 
436*4882a593Smuzhiyun 	struct ip_vs_conn *
437*4882a593Smuzhiyun 	(*conn_in_get)(struct netns_ipvs *ipvs,
438*4882a593Smuzhiyun 		       int af,
439*4882a593Smuzhiyun 		       const struct sk_buff *skb,
440*4882a593Smuzhiyun 		       const struct ip_vs_iphdr *iph);
441*4882a593Smuzhiyun 
442*4882a593Smuzhiyun 	struct ip_vs_conn *
443*4882a593Smuzhiyun 	(*conn_out_get)(struct netns_ipvs *ipvs,
444*4882a593Smuzhiyun 			int af,
445*4882a593Smuzhiyun 			const struct sk_buff *skb,
446*4882a593Smuzhiyun 			const struct ip_vs_iphdr *iph);
447*4882a593Smuzhiyun 
448*4882a593Smuzhiyun 	int (*snat_handler)(struct sk_buff *skb, struct ip_vs_protocol *pp,
449*4882a593Smuzhiyun 			    struct ip_vs_conn *cp, struct ip_vs_iphdr *iph);
450*4882a593Smuzhiyun 
451*4882a593Smuzhiyun 	int (*dnat_handler)(struct sk_buff *skb, struct ip_vs_protocol *pp,
452*4882a593Smuzhiyun 			    struct ip_vs_conn *cp, struct ip_vs_iphdr *iph);
453*4882a593Smuzhiyun 
454*4882a593Smuzhiyun 	const char *(*state_name)(int state);
455*4882a593Smuzhiyun 
456*4882a593Smuzhiyun 	void (*state_transition)(struct ip_vs_conn *cp, int direction,
457*4882a593Smuzhiyun 				 const struct sk_buff *skb,
458*4882a593Smuzhiyun 				 struct ip_vs_proto_data *pd);
459*4882a593Smuzhiyun 
460*4882a593Smuzhiyun 	int (*register_app)(struct netns_ipvs *ipvs, struct ip_vs_app *inc);
461*4882a593Smuzhiyun 
462*4882a593Smuzhiyun 	void (*unregister_app)(struct netns_ipvs *ipvs, struct ip_vs_app *inc);
463*4882a593Smuzhiyun 
464*4882a593Smuzhiyun 	int (*app_conn_bind)(struct ip_vs_conn *cp);
465*4882a593Smuzhiyun 
466*4882a593Smuzhiyun 	void (*debug_packet)(int af, struct ip_vs_protocol *pp,
467*4882a593Smuzhiyun 			     const struct sk_buff *skb,
468*4882a593Smuzhiyun 			     int offset,
469*4882a593Smuzhiyun 			     const char *msg);
470*4882a593Smuzhiyun 
471*4882a593Smuzhiyun 	void (*timeout_change)(struct ip_vs_proto_data *pd, int flags);
472*4882a593Smuzhiyun };
473*4882a593Smuzhiyun 
474*4882a593Smuzhiyun /* protocol data per netns */
475*4882a593Smuzhiyun struct ip_vs_proto_data {
476*4882a593Smuzhiyun 	struct ip_vs_proto_data	*next;
477*4882a593Smuzhiyun 	struct ip_vs_protocol	*pp;
478*4882a593Smuzhiyun 	int			*timeout_table;	/* protocol timeout table */
479*4882a593Smuzhiyun 	atomic_t		appcnt;		/* counter of proto app incs. */
480*4882a593Smuzhiyun 	struct tcp_states_t	*tcp_state_table;
481*4882a593Smuzhiyun };
482*4882a593Smuzhiyun 
483*4882a593Smuzhiyun struct ip_vs_protocol   *ip_vs_proto_get(unsigned short proto);
484*4882a593Smuzhiyun struct ip_vs_proto_data *ip_vs_proto_data_get(struct netns_ipvs *ipvs,
485*4882a593Smuzhiyun 					      unsigned short proto);
486*4882a593Smuzhiyun 
487*4882a593Smuzhiyun struct ip_vs_conn_param {
488*4882a593Smuzhiyun 	struct netns_ipvs		*ipvs;
489*4882a593Smuzhiyun 	const union nf_inet_addr	*caddr;
490*4882a593Smuzhiyun 	const union nf_inet_addr	*vaddr;
491*4882a593Smuzhiyun 	__be16				cport;
492*4882a593Smuzhiyun 	__be16				vport;
493*4882a593Smuzhiyun 	__u16				protocol;
494*4882a593Smuzhiyun 	u16				af;
495*4882a593Smuzhiyun 
496*4882a593Smuzhiyun 	const struct ip_vs_pe		*pe;
497*4882a593Smuzhiyun 	char				*pe_data;
498*4882a593Smuzhiyun 	__u8				pe_data_len;
499*4882a593Smuzhiyun };
500*4882a593Smuzhiyun 
501*4882a593Smuzhiyun /* IP_VS structure allocated for each dynamically scheduled connection */
502*4882a593Smuzhiyun struct ip_vs_conn {
503*4882a593Smuzhiyun 	struct hlist_node	c_list;         /* hashed list heads */
504*4882a593Smuzhiyun 	/* Protocol, addresses and port numbers */
505*4882a593Smuzhiyun 	__be16                  cport;
506*4882a593Smuzhiyun 	__be16                  dport;
507*4882a593Smuzhiyun 	__be16                  vport;
508*4882a593Smuzhiyun 	u16			af;		/* address family */
509*4882a593Smuzhiyun 	union nf_inet_addr      caddr;          /* client address */
510*4882a593Smuzhiyun 	union nf_inet_addr      vaddr;          /* virtual address */
511*4882a593Smuzhiyun 	union nf_inet_addr      daddr;          /* destination address */
512*4882a593Smuzhiyun 	volatile __u32          flags;          /* status flags */
513*4882a593Smuzhiyun 	__u16                   protocol;       /* Which protocol (TCP/UDP) */
514*4882a593Smuzhiyun 	__u16			daf;		/* Address family of the dest */
515*4882a593Smuzhiyun 	struct netns_ipvs	*ipvs;
516*4882a593Smuzhiyun 
517*4882a593Smuzhiyun 	/* counter and timer */
518*4882a593Smuzhiyun 	refcount_t		refcnt;		/* reference count */
519*4882a593Smuzhiyun 	struct timer_list	timer;		/* Expiration timer */
520*4882a593Smuzhiyun 	volatile unsigned long	timeout;	/* timeout */
521*4882a593Smuzhiyun 
522*4882a593Smuzhiyun 	/* Flags and state transition */
523*4882a593Smuzhiyun 	spinlock_t              lock;           /* lock for state transition */
524*4882a593Smuzhiyun 	volatile __u16          state;          /* state info */
525*4882a593Smuzhiyun 	volatile __u16          old_state;      /* old state, to be used for
526*4882a593Smuzhiyun 						 * state transition triggerd
527*4882a593Smuzhiyun 						 * synchronization
528*4882a593Smuzhiyun 						 */
529*4882a593Smuzhiyun 	__u32			fwmark;		/* Fire wall mark from skb */
530*4882a593Smuzhiyun 	unsigned long		sync_endtime;	/* jiffies + sent_retries */
531*4882a593Smuzhiyun 
532*4882a593Smuzhiyun 	/* Control members */
533*4882a593Smuzhiyun 	struct ip_vs_conn       *control;       /* Master control connection */
534*4882a593Smuzhiyun 	atomic_t                n_control;      /* Number of controlled ones */
535*4882a593Smuzhiyun 	struct ip_vs_dest       *dest;          /* real server */
536*4882a593Smuzhiyun 	atomic_t                in_pkts;        /* incoming packet counter */
537*4882a593Smuzhiyun 
538*4882a593Smuzhiyun 	/* Packet transmitter for different forwarding methods.  If it
539*4882a593Smuzhiyun 	 * mangles the packet, it must return NF_DROP or better NF_STOLEN,
540*4882a593Smuzhiyun 	 * otherwise this must be changed to a sk_buff **.
541*4882a593Smuzhiyun 	 * NF_ACCEPT can be returned when destination is local.
542*4882a593Smuzhiyun 	 */
543*4882a593Smuzhiyun 	int (*packet_xmit)(struct sk_buff *skb, struct ip_vs_conn *cp,
544*4882a593Smuzhiyun 			   struct ip_vs_protocol *pp, struct ip_vs_iphdr *iph);
545*4882a593Smuzhiyun 
546*4882a593Smuzhiyun 	/* Note: we can group the following members into a structure,
547*4882a593Smuzhiyun 	 * in order to save more space, and the following members are
548*4882a593Smuzhiyun 	 * only used in VS/NAT anyway
549*4882a593Smuzhiyun 	 */
550*4882a593Smuzhiyun 	struct ip_vs_app        *app;           /* bound ip_vs_app object */
551*4882a593Smuzhiyun 	void                    *app_data;      /* Application private data */
552*4882a593Smuzhiyun 	struct ip_vs_seq        in_seq;         /* incoming seq. struct */
553*4882a593Smuzhiyun 	struct ip_vs_seq        out_seq;        /* outgoing seq. struct */
554*4882a593Smuzhiyun 
555*4882a593Smuzhiyun 	const struct ip_vs_pe	*pe;
556*4882a593Smuzhiyun 	char			*pe_data;
557*4882a593Smuzhiyun 	__u8			pe_data_len;
558*4882a593Smuzhiyun 
559*4882a593Smuzhiyun 	struct rcu_head		rcu_head;
560*4882a593Smuzhiyun };
561*4882a593Smuzhiyun 
562*4882a593Smuzhiyun /* Extended internal versions of struct ip_vs_service_user and ip_vs_dest_user
563*4882a593Smuzhiyun  * for IPv6 support.
564*4882a593Smuzhiyun  *
565*4882a593Smuzhiyun  * We need these to conveniently pass around service and destination
566*4882a593Smuzhiyun  * options, but unfortunately, we also need to keep the old definitions to
567*4882a593Smuzhiyun  * maintain userspace backwards compatibility for the setsockopt interface.
568*4882a593Smuzhiyun  */
569*4882a593Smuzhiyun struct ip_vs_service_user_kern {
570*4882a593Smuzhiyun 	/* virtual service addresses */
571*4882a593Smuzhiyun 	u16			af;
572*4882a593Smuzhiyun 	u16			protocol;
573*4882a593Smuzhiyun 	union nf_inet_addr	addr;		/* virtual ip address */
574*4882a593Smuzhiyun 	__be16			port;
575*4882a593Smuzhiyun 	u32			fwmark;		/* firwall mark of service */
576*4882a593Smuzhiyun 
577*4882a593Smuzhiyun 	/* virtual service options */
578*4882a593Smuzhiyun 	char			*sched_name;
579*4882a593Smuzhiyun 	char			*pe_name;
580*4882a593Smuzhiyun 	unsigned int		flags;		/* virtual service flags */
581*4882a593Smuzhiyun 	unsigned int		timeout;	/* persistent timeout in sec */
582*4882a593Smuzhiyun 	__be32			netmask;	/* persistent netmask or plen */
583*4882a593Smuzhiyun };
584*4882a593Smuzhiyun 
585*4882a593Smuzhiyun 
586*4882a593Smuzhiyun struct ip_vs_dest_user_kern {
587*4882a593Smuzhiyun 	/* destination server address */
588*4882a593Smuzhiyun 	union nf_inet_addr	addr;
589*4882a593Smuzhiyun 	__be16			port;
590*4882a593Smuzhiyun 
591*4882a593Smuzhiyun 	/* real server options */
592*4882a593Smuzhiyun 	unsigned int		conn_flags;	/* connection flags */
593*4882a593Smuzhiyun 	int			weight;		/* destination weight */
594*4882a593Smuzhiyun 
595*4882a593Smuzhiyun 	/* thresholds for active connections */
596*4882a593Smuzhiyun 	u32			u_threshold;	/* upper threshold */
597*4882a593Smuzhiyun 	u32			l_threshold;	/* lower threshold */
598*4882a593Smuzhiyun 
599*4882a593Smuzhiyun 	/* Address family of addr */
600*4882a593Smuzhiyun 	u16			af;
601*4882a593Smuzhiyun 
602*4882a593Smuzhiyun 	u16			tun_type;	/* tunnel type */
603*4882a593Smuzhiyun 	__be16			tun_port;	/* tunnel port */
604*4882a593Smuzhiyun 	u16			tun_flags;	/* tunnel flags */
605*4882a593Smuzhiyun };
606*4882a593Smuzhiyun 
607*4882a593Smuzhiyun 
608*4882a593Smuzhiyun /*
609*4882a593Smuzhiyun  * The information about the virtual service offered to the net and the
610*4882a593Smuzhiyun  * forwarding entries.
611*4882a593Smuzhiyun  */
612*4882a593Smuzhiyun struct ip_vs_service {
613*4882a593Smuzhiyun 	struct hlist_node	s_list;   /* for normal service table */
614*4882a593Smuzhiyun 	struct hlist_node	f_list;   /* for fwmark-based service table */
615*4882a593Smuzhiyun 	atomic_t		refcnt;   /* reference counter */
616*4882a593Smuzhiyun 
617*4882a593Smuzhiyun 	u16			af;       /* address family */
618*4882a593Smuzhiyun 	__u16			protocol; /* which protocol (TCP/UDP) */
619*4882a593Smuzhiyun 	union nf_inet_addr	addr;	  /* IP address for virtual service */
620*4882a593Smuzhiyun 	__be16			port;	  /* port number for the service */
621*4882a593Smuzhiyun 	__u32                   fwmark;   /* firewall mark of the service */
622*4882a593Smuzhiyun 	unsigned int		flags;	  /* service status flags */
623*4882a593Smuzhiyun 	unsigned int		timeout;  /* persistent timeout in ticks */
624*4882a593Smuzhiyun 	__be32			netmask;  /* grouping granularity, mask/plen */
625*4882a593Smuzhiyun 	struct netns_ipvs	*ipvs;
626*4882a593Smuzhiyun 
627*4882a593Smuzhiyun 	struct list_head	destinations;  /* real server d-linked list */
628*4882a593Smuzhiyun 	__u32			num_dests;     /* number of servers */
629*4882a593Smuzhiyun 	struct ip_vs_stats      stats;         /* statistics for the service */
630*4882a593Smuzhiyun 
631*4882a593Smuzhiyun 	/* for scheduling */
632*4882a593Smuzhiyun 	struct ip_vs_scheduler __rcu *scheduler; /* bound scheduler object */
633*4882a593Smuzhiyun 	spinlock_t		sched_lock;    /* lock sched_data */
634*4882a593Smuzhiyun 	void			*sched_data;   /* scheduler application data */
635*4882a593Smuzhiyun 
636*4882a593Smuzhiyun 	/* alternate persistence engine */
637*4882a593Smuzhiyun 	struct ip_vs_pe __rcu	*pe;
638*4882a593Smuzhiyun 	int			conntrack_afmask;
639*4882a593Smuzhiyun 
640*4882a593Smuzhiyun 	struct rcu_head		rcu_head;
641*4882a593Smuzhiyun };
642*4882a593Smuzhiyun 
643*4882a593Smuzhiyun /* Information for cached dst */
644*4882a593Smuzhiyun struct ip_vs_dest_dst {
645*4882a593Smuzhiyun 	struct dst_entry	*dst_cache;	/* destination cache entry */
646*4882a593Smuzhiyun 	u32			dst_cookie;
647*4882a593Smuzhiyun 	union nf_inet_addr	dst_saddr;
648*4882a593Smuzhiyun 	struct rcu_head		rcu_head;
649*4882a593Smuzhiyun };
650*4882a593Smuzhiyun 
651*4882a593Smuzhiyun /* The real server destination forwarding entry with ip address, port number,
652*4882a593Smuzhiyun  * and so on.
653*4882a593Smuzhiyun  */
654*4882a593Smuzhiyun struct ip_vs_dest {
655*4882a593Smuzhiyun 	struct list_head	n_list;   /* for the dests in the service */
656*4882a593Smuzhiyun 	struct hlist_node	d_list;   /* for table with all the dests */
657*4882a593Smuzhiyun 
658*4882a593Smuzhiyun 	u16			af;		/* address family */
659*4882a593Smuzhiyun 	__be16			port;		/* port number of the server */
660*4882a593Smuzhiyun 	union nf_inet_addr	addr;		/* IP address of the server */
661*4882a593Smuzhiyun 	volatile unsigned int	flags;		/* dest status flags */
662*4882a593Smuzhiyun 	atomic_t		conn_flags;	/* flags to copy to conn */
663*4882a593Smuzhiyun 	atomic_t		weight;		/* server weight */
664*4882a593Smuzhiyun 	atomic_t		last_weight;	/* server latest weight */
665*4882a593Smuzhiyun 	__u16			tun_type;	/* tunnel type */
666*4882a593Smuzhiyun 	__be16			tun_port;	/* tunnel port */
667*4882a593Smuzhiyun 	__u16			tun_flags;	/* tunnel flags */
668*4882a593Smuzhiyun 
669*4882a593Smuzhiyun 	refcount_t		refcnt;		/* reference counter */
670*4882a593Smuzhiyun 	struct ip_vs_stats      stats;          /* statistics */
671*4882a593Smuzhiyun 	unsigned long		idle_start;	/* start time, jiffies */
672*4882a593Smuzhiyun 
673*4882a593Smuzhiyun 	/* connection counters and thresholds */
674*4882a593Smuzhiyun 	atomic_t		activeconns;	/* active connections */
675*4882a593Smuzhiyun 	atomic_t		inactconns;	/* inactive connections */
676*4882a593Smuzhiyun 	atomic_t		persistconns;	/* persistent connections */
677*4882a593Smuzhiyun 	__u32			u_threshold;	/* upper threshold */
678*4882a593Smuzhiyun 	__u32			l_threshold;	/* lower threshold */
679*4882a593Smuzhiyun 
680*4882a593Smuzhiyun 	/* for destination cache */
681*4882a593Smuzhiyun 	spinlock_t		dst_lock;	/* lock of dst_cache */
682*4882a593Smuzhiyun 	struct ip_vs_dest_dst __rcu *dest_dst;	/* cached dst info */
683*4882a593Smuzhiyun 
684*4882a593Smuzhiyun 	/* for virtual service */
685*4882a593Smuzhiyun 	struct ip_vs_service __rcu *svc;	/* service it belongs to */
686*4882a593Smuzhiyun 	__u16			protocol;	/* which protocol (TCP/UDP) */
687*4882a593Smuzhiyun 	__be16			vport;		/* virtual port number */
688*4882a593Smuzhiyun 	union nf_inet_addr	vaddr;		/* virtual IP address */
689*4882a593Smuzhiyun 	__u32			vfwmark;	/* firewall mark of service */
690*4882a593Smuzhiyun 
691*4882a593Smuzhiyun 	struct list_head	t_list;		/* in dest_trash */
692*4882a593Smuzhiyun 	unsigned int		in_rs_table:1;	/* we are in rs_table */
693*4882a593Smuzhiyun };
694*4882a593Smuzhiyun 
695*4882a593Smuzhiyun /* The scheduler object */
696*4882a593Smuzhiyun struct ip_vs_scheduler {
697*4882a593Smuzhiyun 	struct list_head	n_list;		/* d-linked list head */
698*4882a593Smuzhiyun 	char			*name;		/* scheduler name */
699*4882a593Smuzhiyun 	atomic_t		refcnt;		/* reference counter */
700*4882a593Smuzhiyun 	struct module		*module;	/* THIS_MODULE/NULL */
701*4882a593Smuzhiyun 
702*4882a593Smuzhiyun 	/* scheduler initializing service */
703*4882a593Smuzhiyun 	int (*init_service)(struct ip_vs_service *svc);
704*4882a593Smuzhiyun 	/* scheduling service finish */
705*4882a593Smuzhiyun 	void (*done_service)(struct ip_vs_service *svc);
706*4882a593Smuzhiyun 	/* dest is linked */
707*4882a593Smuzhiyun 	int (*add_dest)(struct ip_vs_service *svc, struct ip_vs_dest *dest);
708*4882a593Smuzhiyun 	/* dest is unlinked */
709*4882a593Smuzhiyun 	int (*del_dest)(struct ip_vs_service *svc, struct ip_vs_dest *dest);
710*4882a593Smuzhiyun 	/* dest is updated */
711*4882a593Smuzhiyun 	int (*upd_dest)(struct ip_vs_service *svc, struct ip_vs_dest *dest);
712*4882a593Smuzhiyun 
713*4882a593Smuzhiyun 	/* selecting a server from the given service */
714*4882a593Smuzhiyun 	struct ip_vs_dest* (*schedule)(struct ip_vs_service *svc,
715*4882a593Smuzhiyun 				       const struct sk_buff *skb,
716*4882a593Smuzhiyun 				       struct ip_vs_iphdr *iph);
717*4882a593Smuzhiyun };
718*4882a593Smuzhiyun 
719*4882a593Smuzhiyun /* The persistence engine object */
720*4882a593Smuzhiyun struct ip_vs_pe {
721*4882a593Smuzhiyun 	struct list_head	n_list;		/* d-linked list head */
722*4882a593Smuzhiyun 	char			*name;		/* scheduler name */
723*4882a593Smuzhiyun 	atomic_t		refcnt;		/* reference counter */
724*4882a593Smuzhiyun 	struct module		*module;	/* THIS_MODULE/NULL */
725*4882a593Smuzhiyun 
726*4882a593Smuzhiyun 	/* get the connection template, if any */
727*4882a593Smuzhiyun 	int (*fill_param)(struct ip_vs_conn_param *p, struct sk_buff *skb);
728*4882a593Smuzhiyun 	bool (*ct_match)(const struct ip_vs_conn_param *p,
729*4882a593Smuzhiyun 			 struct ip_vs_conn *ct);
730*4882a593Smuzhiyun 	u32 (*hashkey_raw)(const struct ip_vs_conn_param *p, u32 initval,
731*4882a593Smuzhiyun 			   bool inverse);
732*4882a593Smuzhiyun 	int (*show_pe_data)(const struct ip_vs_conn *cp, char *buf);
733*4882a593Smuzhiyun 	/* create connections for real-server outgoing packets */
734*4882a593Smuzhiyun 	struct ip_vs_conn* (*conn_out)(struct ip_vs_service *svc,
735*4882a593Smuzhiyun 				       struct ip_vs_dest *dest,
736*4882a593Smuzhiyun 				       struct sk_buff *skb,
737*4882a593Smuzhiyun 				       const struct ip_vs_iphdr *iph,
738*4882a593Smuzhiyun 				       __be16 dport, __be16 cport);
739*4882a593Smuzhiyun };
740*4882a593Smuzhiyun 
741*4882a593Smuzhiyun /* The application module object (a.k.a. app incarnation) */
742*4882a593Smuzhiyun struct ip_vs_app {
743*4882a593Smuzhiyun 	struct list_head	a_list;		/* member in app list */
744*4882a593Smuzhiyun 	int			type;		/* IP_VS_APP_TYPE_xxx */
745*4882a593Smuzhiyun 	char			*name;		/* application module name */
746*4882a593Smuzhiyun 	__u16			protocol;
747*4882a593Smuzhiyun 	struct module		*module;	/* THIS_MODULE/NULL */
748*4882a593Smuzhiyun 	struct list_head	incs_list;	/* list of incarnations */
749*4882a593Smuzhiyun 
750*4882a593Smuzhiyun 	/* members for application incarnations */
751*4882a593Smuzhiyun 	struct list_head	p_list;		/* member in proto app list */
752*4882a593Smuzhiyun 	struct ip_vs_app	*app;		/* its real application */
753*4882a593Smuzhiyun 	__be16			port;		/* port number in net order */
754*4882a593Smuzhiyun 	atomic_t		usecnt;		/* usage counter */
755*4882a593Smuzhiyun 	struct rcu_head		rcu_head;
756*4882a593Smuzhiyun 
757*4882a593Smuzhiyun 	/* output hook: Process packet in inout direction, diff set for TCP.
758*4882a593Smuzhiyun 	 * Return: 0=Error, 1=Payload Not Mangled/Mangled but checksum is ok,
759*4882a593Smuzhiyun 	 *	   2=Mangled but checksum was not updated
760*4882a593Smuzhiyun 	 */
761*4882a593Smuzhiyun 	int (*pkt_out)(struct ip_vs_app *, struct ip_vs_conn *,
762*4882a593Smuzhiyun 		       struct sk_buff *, int *diff, struct ip_vs_iphdr *ipvsh);
763*4882a593Smuzhiyun 
764*4882a593Smuzhiyun 	/* input hook: Process packet in outin direction, diff set for TCP.
765*4882a593Smuzhiyun 	 * Return: 0=Error, 1=Payload Not Mangled/Mangled but checksum is ok,
766*4882a593Smuzhiyun 	 *	   2=Mangled but checksum was not updated
767*4882a593Smuzhiyun 	 */
768*4882a593Smuzhiyun 	int (*pkt_in)(struct ip_vs_app *, struct ip_vs_conn *,
769*4882a593Smuzhiyun 		      struct sk_buff *, int *diff, struct ip_vs_iphdr *ipvsh);
770*4882a593Smuzhiyun 
771*4882a593Smuzhiyun 	/* ip_vs_app initializer */
772*4882a593Smuzhiyun 	int (*init_conn)(struct ip_vs_app *, struct ip_vs_conn *);
773*4882a593Smuzhiyun 
774*4882a593Smuzhiyun 	/* ip_vs_app finish */
775*4882a593Smuzhiyun 	int (*done_conn)(struct ip_vs_app *, struct ip_vs_conn *);
776*4882a593Smuzhiyun 
777*4882a593Smuzhiyun 
778*4882a593Smuzhiyun 	/* not used now */
779*4882a593Smuzhiyun 	int (*bind_conn)(struct ip_vs_app *, struct ip_vs_conn *,
780*4882a593Smuzhiyun 			 struct ip_vs_protocol *);
781*4882a593Smuzhiyun 
782*4882a593Smuzhiyun 	void (*unbind_conn)(struct ip_vs_app *, struct ip_vs_conn *);
783*4882a593Smuzhiyun 
784*4882a593Smuzhiyun 	int *			timeout_table;
785*4882a593Smuzhiyun 	int *			timeouts;
786*4882a593Smuzhiyun 	int			timeouts_size;
787*4882a593Smuzhiyun 
788*4882a593Smuzhiyun 	int (*conn_schedule)(struct sk_buff *skb, struct ip_vs_app *app,
789*4882a593Smuzhiyun 			     int *verdict, struct ip_vs_conn **cpp);
790*4882a593Smuzhiyun 
791*4882a593Smuzhiyun 	struct ip_vs_conn *
792*4882a593Smuzhiyun 	(*conn_in_get)(const struct sk_buff *skb, struct ip_vs_app *app,
793*4882a593Smuzhiyun 		       const struct iphdr *iph, int inverse);
794*4882a593Smuzhiyun 
795*4882a593Smuzhiyun 	struct ip_vs_conn *
796*4882a593Smuzhiyun 	(*conn_out_get)(const struct sk_buff *skb, struct ip_vs_app *app,
797*4882a593Smuzhiyun 			const struct iphdr *iph, int inverse);
798*4882a593Smuzhiyun 
799*4882a593Smuzhiyun 	int (*state_transition)(struct ip_vs_conn *cp, int direction,
800*4882a593Smuzhiyun 				const struct sk_buff *skb,
801*4882a593Smuzhiyun 				struct ip_vs_app *app);
802*4882a593Smuzhiyun 
803*4882a593Smuzhiyun 	void (*timeout_change)(struct ip_vs_app *app, int flags);
804*4882a593Smuzhiyun };
805*4882a593Smuzhiyun 
806*4882a593Smuzhiyun struct ipvs_master_sync_state {
807*4882a593Smuzhiyun 	struct list_head	sync_queue;
808*4882a593Smuzhiyun 	struct ip_vs_sync_buff	*sync_buff;
809*4882a593Smuzhiyun 	unsigned long		sync_queue_len;
810*4882a593Smuzhiyun 	unsigned int		sync_queue_delay;
811*4882a593Smuzhiyun 	struct delayed_work	master_wakeup_work;
812*4882a593Smuzhiyun 	struct netns_ipvs	*ipvs;
813*4882a593Smuzhiyun };
814*4882a593Smuzhiyun 
/* Only pointers to this type are needed here, so a forward declaration suffices */
struct ip_vs_sync_thread_data;

/* How long dests are kept in the trash: 120 * HZ */
#define IP_VS_DEST_TRASH_PERIOD		(120 * HZ)
819*4882a593Smuzhiyun 
820*4882a593Smuzhiyun struct ipvs_sync_daemon_cfg {
821*4882a593Smuzhiyun 	union nf_inet_addr	mcast_group;
822*4882a593Smuzhiyun 	int			syncid;
823*4882a593Smuzhiyun 	u16			sync_maxlen;
824*4882a593Smuzhiyun 	u16			mcast_port;
825*4882a593Smuzhiyun 	u8			mcast_af;
826*4882a593Smuzhiyun 	u8			mcast_ttl;
827*4882a593Smuzhiyun 	/* multicast interface name */
828*4882a593Smuzhiyun 	char			mcast_ifn[IP_VS_IFNAME_MAXLEN];
829*4882a593Smuzhiyun };
830*4882a593Smuzhiyun 
831*4882a593Smuzhiyun /* IPVS in network namespace */
832*4882a593Smuzhiyun struct netns_ipvs {
833*4882a593Smuzhiyun 	int			gen;		/* Generation */
834*4882a593Smuzhiyun 	int			enable;		/* enable like nf_hooks do */
835*4882a593Smuzhiyun 	/* Hash table: for real service lookups */
836*4882a593Smuzhiyun 	#define IP_VS_RTAB_BITS 4
837*4882a593Smuzhiyun 	#define IP_VS_RTAB_SIZE (1 << IP_VS_RTAB_BITS)
838*4882a593Smuzhiyun 	#define IP_VS_RTAB_MASK (IP_VS_RTAB_SIZE - 1)
839*4882a593Smuzhiyun 
840*4882a593Smuzhiyun 	struct hlist_head	rs_table[IP_VS_RTAB_SIZE];
841*4882a593Smuzhiyun 	/* ip_vs_app */
842*4882a593Smuzhiyun 	struct list_head	app_list;
843*4882a593Smuzhiyun 	/* ip_vs_proto */
844*4882a593Smuzhiyun 	#define IP_VS_PROTO_TAB_SIZE	32	/* must be power of 2 */
845*4882a593Smuzhiyun 	struct ip_vs_proto_data *proto_data_table[IP_VS_PROTO_TAB_SIZE];
846*4882a593Smuzhiyun 	/* ip_vs_proto_tcp */
847*4882a593Smuzhiyun #ifdef CONFIG_IP_VS_PROTO_TCP
848*4882a593Smuzhiyun 	#define	TCP_APP_TAB_BITS	4
849*4882a593Smuzhiyun 	#define	TCP_APP_TAB_SIZE	(1 << TCP_APP_TAB_BITS)
850*4882a593Smuzhiyun 	#define	TCP_APP_TAB_MASK	(TCP_APP_TAB_SIZE - 1)
851*4882a593Smuzhiyun 	struct list_head	tcp_apps[TCP_APP_TAB_SIZE];
852*4882a593Smuzhiyun #endif
853*4882a593Smuzhiyun 	/* ip_vs_proto_udp */
854*4882a593Smuzhiyun #ifdef CONFIG_IP_VS_PROTO_UDP
855*4882a593Smuzhiyun 	#define	UDP_APP_TAB_BITS	4
856*4882a593Smuzhiyun 	#define	UDP_APP_TAB_SIZE	(1 << UDP_APP_TAB_BITS)
857*4882a593Smuzhiyun 	#define	UDP_APP_TAB_MASK	(UDP_APP_TAB_SIZE - 1)
858*4882a593Smuzhiyun 	struct list_head	udp_apps[UDP_APP_TAB_SIZE];
859*4882a593Smuzhiyun #endif
860*4882a593Smuzhiyun 	/* ip_vs_proto_sctp */
861*4882a593Smuzhiyun #ifdef CONFIG_IP_VS_PROTO_SCTP
862*4882a593Smuzhiyun 	#define SCTP_APP_TAB_BITS	4
863*4882a593Smuzhiyun 	#define SCTP_APP_TAB_SIZE	(1 << SCTP_APP_TAB_BITS)
864*4882a593Smuzhiyun 	#define SCTP_APP_TAB_MASK	(SCTP_APP_TAB_SIZE - 1)
865*4882a593Smuzhiyun 	/* Hash table for SCTP application incarnations	 */
866*4882a593Smuzhiyun 	struct list_head	sctp_apps[SCTP_APP_TAB_SIZE];
867*4882a593Smuzhiyun #endif
868*4882a593Smuzhiyun 	/* ip_vs_conn */
869*4882a593Smuzhiyun 	atomic_t		conn_count;      /* connection counter */
870*4882a593Smuzhiyun 
871*4882a593Smuzhiyun 	/* ip_vs_ctl */
872*4882a593Smuzhiyun 	struct ip_vs_stats		tot_stats;  /* Statistics & est. */
873*4882a593Smuzhiyun 
874*4882a593Smuzhiyun 	int			num_services;    /* no of virtual services */
875*4882a593Smuzhiyun 	int			num_services6;   /* IPv6 virtual services */
876*4882a593Smuzhiyun 
877*4882a593Smuzhiyun 	/* Trash for destinations */
878*4882a593Smuzhiyun 	struct list_head	dest_trash;
879*4882a593Smuzhiyun 	spinlock_t		dest_trash_lock;
880*4882a593Smuzhiyun 	struct timer_list	dest_trash_timer; /* expiration timer */
881*4882a593Smuzhiyun 	/* Service counters */
882*4882a593Smuzhiyun 	atomic_t		ftpsvc_counter;
883*4882a593Smuzhiyun 	atomic_t		nullsvc_counter;
884*4882a593Smuzhiyun 	atomic_t		conn_out_counter;
885*4882a593Smuzhiyun 
886*4882a593Smuzhiyun #ifdef CONFIG_SYSCTL
887*4882a593Smuzhiyun 	/* delayed work for expiring no dest connections */
888*4882a593Smuzhiyun 	struct delayed_work	expire_nodest_conn_work;
889*4882a593Smuzhiyun 	/* 1/rate drop and drop-entry variables */
890*4882a593Smuzhiyun 	struct delayed_work	defense_work;   /* Work handler */
891*4882a593Smuzhiyun 	int			drop_rate;
892*4882a593Smuzhiyun 	int			drop_counter;
893*4882a593Smuzhiyun 	int			old_secure_tcp;
894*4882a593Smuzhiyun 	atomic_t		dropentry;
895*4882a593Smuzhiyun 	/* locks in ctl.c */
896*4882a593Smuzhiyun 	spinlock_t		dropentry_lock;  /* drop entry handling */
897*4882a593Smuzhiyun 	spinlock_t		droppacket_lock; /* drop packet handling */
898*4882a593Smuzhiyun 	spinlock_t		securetcp_lock;  /* state and timeout tables */
899*4882a593Smuzhiyun 
900*4882a593Smuzhiyun 	/* sys-ctl struct */
901*4882a593Smuzhiyun 	struct ctl_table_header	*sysctl_hdr;
902*4882a593Smuzhiyun 	struct ctl_table	*sysctl_tbl;
903*4882a593Smuzhiyun #endif
904*4882a593Smuzhiyun 
905*4882a593Smuzhiyun 	/* sysctl variables */
906*4882a593Smuzhiyun 	int			sysctl_amemthresh;
907*4882a593Smuzhiyun 	int			sysctl_am_droprate;
908*4882a593Smuzhiyun 	int			sysctl_drop_entry;
909*4882a593Smuzhiyun 	int			sysctl_drop_packet;
910*4882a593Smuzhiyun 	int			sysctl_secure_tcp;
911*4882a593Smuzhiyun #ifdef CONFIG_IP_VS_NFCT
912*4882a593Smuzhiyun 	int			sysctl_conntrack;
913*4882a593Smuzhiyun #endif
914*4882a593Smuzhiyun 	int			sysctl_snat_reroute;
915*4882a593Smuzhiyun 	int			sysctl_sync_ver;
916*4882a593Smuzhiyun 	int			sysctl_sync_ports;
917*4882a593Smuzhiyun 	int			sysctl_sync_persist_mode;
918*4882a593Smuzhiyun 	unsigned long		sysctl_sync_qlen_max;
919*4882a593Smuzhiyun 	int			sysctl_sync_sock_size;
920*4882a593Smuzhiyun 	int			sysctl_cache_bypass;
921*4882a593Smuzhiyun 	int			sysctl_expire_nodest_conn;
922*4882a593Smuzhiyun 	int			sysctl_sloppy_tcp;
923*4882a593Smuzhiyun 	int			sysctl_sloppy_sctp;
924*4882a593Smuzhiyun 	int			sysctl_expire_quiescent_template;
925*4882a593Smuzhiyun 	int			sysctl_sync_threshold[2];
926*4882a593Smuzhiyun 	unsigned int		sysctl_sync_refresh_period;
927*4882a593Smuzhiyun 	int			sysctl_sync_retries;
928*4882a593Smuzhiyun 	int			sysctl_nat_icmp_send;
929*4882a593Smuzhiyun 	int			sysctl_pmtu_disc;
930*4882a593Smuzhiyun 	int			sysctl_backup_only;
931*4882a593Smuzhiyun 	int			sysctl_conn_reuse_mode;
932*4882a593Smuzhiyun 	int			sysctl_schedule_icmp;
933*4882a593Smuzhiyun 	int			sysctl_ignore_tunneled;
934*4882a593Smuzhiyun 
935*4882a593Smuzhiyun 	/* ip_vs_lblc */
936*4882a593Smuzhiyun 	int			sysctl_lblc_expiration;
937*4882a593Smuzhiyun 	struct ctl_table_header	*lblc_ctl_header;
938*4882a593Smuzhiyun 	struct ctl_table	*lblc_ctl_table;
939*4882a593Smuzhiyun 	/* ip_vs_lblcr */
940*4882a593Smuzhiyun 	int			sysctl_lblcr_expiration;
941*4882a593Smuzhiyun 	struct ctl_table_header	*lblcr_ctl_header;
942*4882a593Smuzhiyun 	struct ctl_table	*lblcr_ctl_table;
943*4882a593Smuzhiyun 	/* ip_vs_est */
944*4882a593Smuzhiyun 	struct list_head	est_list;	/* estimator list */
945*4882a593Smuzhiyun 	spinlock_t		est_lock;
946*4882a593Smuzhiyun 	struct timer_list	est_timer;	/* Estimation timer */
947*4882a593Smuzhiyun 	/* ip_vs_sync */
948*4882a593Smuzhiyun 	spinlock_t		sync_lock;
949*4882a593Smuzhiyun 	struct ipvs_master_sync_state *ms;
950*4882a593Smuzhiyun 	spinlock_t		sync_buff_lock;
951*4882a593Smuzhiyun 	struct ip_vs_sync_thread_data *master_tinfo;
952*4882a593Smuzhiyun 	struct ip_vs_sync_thread_data *backup_tinfo;
953*4882a593Smuzhiyun 	int			threads_mask;
954*4882a593Smuzhiyun 	volatile int		sync_state;
955*4882a593Smuzhiyun 	struct mutex		sync_mutex;
956*4882a593Smuzhiyun 	struct ipvs_sync_daemon_cfg	mcfg;	/* Master Configuration */
957*4882a593Smuzhiyun 	struct ipvs_sync_daemon_cfg	bcfg;	/* Backup Configuration */
958*4882a593Smuzhiyun 	/* net name space ptr */
959*4882a593Smuzhiyun 	struct net		*net;            /* Needed by timer routines */
960*4882a593Smuzhiyun 	/* Number of heterogeneous destinations, needed becaus heterogeneous
961*4882a593Smuzhiyun 	 * are not supported when synchronization is enabled.
962*4882a593Smuzhiyun 	 */
963*4882a593Smuzhiyun 	unsigned int		mixed_address_family_dests;
964*4882a593Smuzhiyun 	unsigned int		hooks_afmask;	/* &1=AF_INET, &2=AF_INET6 */
965*4882a593Smuzhiyun };
966*4882a593Smuzhiyun 
/* Defaults for the sync settings; the sysctl_*() stubs return these when CONFIG_SYSCTL is off */
#define DEFAULT_SYNC_THRESHOLD		3
#define DEFAULT_SYNC_PERIOD		50
#define DEFAULT_SYNC_VER		1
#define DEFAULT_SLOPPY_TCP		0
#define DEFAULT_SLOPPY_SCTP		0
#define DEFAULT_SYNC_REFRESH_PERIOD	(0U * HZ)
#define DEFAULT_SYNC_RETRIES		0

/* Sync tunables; the time-based ones are expressed in terms of HZ */
#define IPVS_SYNC_WAKEUP_RATE		8
#define IPVS_SYNC_QLEN_MAX		(IPVS_SYNC_WAKEUP_RATE * 4)
#define IPVS_SYNC_SEND_DELAY		(HZ / 50)
#define IPVS_SYNC_CHECK_PERIOD		HZ
#define IPVS_SYNC_FLUSH_TIME		(HZ * 2)
#define IPVS_SYNC_PORTS_MAX		(1 << 6)
980*4882a593Smuzhiyun 
981*4882a593Smuzhiyun #ifdef CONFIG_SYSCTL
982*4882a593Smuzhiyun 
sysctl_sync_threshold(struct netns_ipvs * ipvs)983*4882a593Smuzhiyun static inline int sysctl_sync_threshold(struct netns_ipvs *ipvs)
984*4882a593Smuzhiyun {
985*4882a593Smuzhiyun 	return ipvs->sysctl_sync_threshold[0];
986*4882a593Smuzhiyun }
987*4882a593Smuzhiyun 
sysctl_sync_period(struct netns_ipvs * ipvs)988*4882a593Smuzhiyun static inline int sysctl_sync_period(struct netns_ipvs *ipvs)
989*4882a593Smuzhiyun {
990*4882a593Smuzhiyun 	return READ_ONCE(ipvs->sysctl_sync_threshold[1]);
991*4882a593Smuzhiyun }
992*4882a593Smuzhiyun 
sysctl_sync_refresh_period(struct netns_ipvs * ipvs)993*4882a593Smuzhiyun static inline unsigned int sysctl_sync_refresh_period(struct netns_ipvs *ipvs)
994*4882a593Smuzhiyun {
995*4882a593Smuzhiyun 	return READ_ONCE(ipvs->sysctl_sync_refresh_period);
996*4882a593Smuzhiyun }
997*4882a593Smuzhiyun 
sysctl_sync_retries(struct netns_ipvs * ipvs)998*4882a593Smuzhiyun static inline int sysctl_sync_retries(struct netns_ipvs *ipvs)
999*4882a593Smuzhiyun {
1000*4882a593Smuzhiyun 	return ipvs->sysctl_sync_retries;
1001*4882a593Smuzhiyun }
1002*4882a593Smuzhiyun 
sysctl_sync_ver(struct netns_ipvs * ipvs)1003*4882a593Smuzhiyun static inline int sysctl_sync_ver(struct netns_ipvs *ipvs)
1004*4882a593Smuzhiyun {
1005*4882a593Smuzhiyun 	return ipvs->sysctl_sync_ver;
1006*4882a593Smuzhiyun }
1007*4882a593Smuzhiyun 
sysctl_sloppy_tcp(struct netns_ipvs * ipvs)1008*4882a593Smuzhiyun static inline int sysctl_sloppy_tcp(struct netns_ipvs *ipvs)
1009*4882a593Smuzhiyun {
1010*4882a593Smuzhiyun 	return ipvs->sysctl_sloppy_tcp;
1011*4882a593Smuzhiyun }
1012*4882a593Smuzhiyun 
sysctl_sloppy_sctp(struct netns_ipvs * ipvs)1013*4882a593Smuzhiyun static inline int sysctl_sloppy_sctp(struct netns_ipvs *ipvs)
1014*4882a593Smuzhiyun {
1015*4882a593Smuzhiyun 	return ipvs->sysctl_sloppy_sctp;
1016*4882a593Smuzhiyun }
1017*4882a593Smuzhiyun 
sysctl_sync_ports(struct netns_ipvs * ipvs)1018*4882a593Smuzhiyun static inline int sysctl_sync_ports(struct netns_ipvs *ipvs)
1019*4882a593Smuzhiyun {
1020*4882a593Smuzhiyun 	return READ_ONCE(ipvs->sysctl_sync_ports);
1021*4882a593Smuzhiyun }
1022*4882a593Smuzhiyun 
sysctl_sync_persist_mode(struct netns_ipvs * ipvs)1023*4882a593Smuzhiyun static inline int sysctl_sync_persist_mode(struct netns_ipvs *ipvs)
1024*4882a593Smuzhiyun {
1025*4882a593Smuzhiyun 	return ipvs->sysctl_sync_persist_mode;
1026*4882a593Smuzhiyun }
1027*4882a593Smuzhiyun 
sysctl_sync_qlen_max(struct netns_ipvs * ipvs)1028*4882a593Smuzhiyun static inline unsigned long sysctl_sync_qlen_max(struct netns_ipvs *ipvs)
1029*4882a593Smuzhiyun {
1030*4882a593Smuzhiyun 	return ipvs->sysctl_sync_qlen_max;
1031*4882a593Smuzhiyun }
1032*4882a593Smuzhiyun 
sysctl_sync_sock_size(struct netns_ipvs * ipvs)1033*4882a593Smuzhiyun static inline int sysctl_sync_sock_size(struct netns_ipvs *ipvs)
1034*4882a593Smuzhiyun {
1035*4882a593Smuzhiyun 	return ipvs->sysctl_sync_sock_size;
1036*4882a593Smuzhiyun }
1037*4882a593Smuzhiyun 
sysctl_pmtu_disc(struct netns_ipvs * ipvs)1038*4882a593Smuzhiyun static inline int sysctl_pmtu_disc(struct netns_ipvs *ipvs)
1039*4882a593Smuzhiyun {
1040*4882a593Smuzhiyun 	return ipvs->sysctl_pmtu_disc;
1041*4882a593Smuzhiyun }
1042*4882a593Smuzhiyun 
sysctl_backup_only(struct netns_ipvs * ipvs)1043*4882a593Smuzhiyun static inline int sysctl_backup_only(struct netns_ipvs *ipvs)
1044*4882a593Smuzhiyun {
1045*4882a593Smuzhiyun 	return ipvs->sync_state & IP_VS_STATE_BACKUP &&
1046*4882a593Smuzhiyun 	       ipvs->sysctl_backup_only;
1047*4882a593Smuzhiyun }
1048*4882a593Smuzhiyun 
sysctl_conn_reuse_mode(struct netns_ipvs * ipvs)1049*4882a593Smuzhiyun static inline int sysctl_conn_reuse_mode(struct netns_ipvs *ipvs)
1050*4882a593Smuzhiyun {
1051*4882a593Smuzhiyun 	return ipvs->sysctl_conn_reuse_mode;
1052*4882a593Smuzhiyun }
1053*4882a593Smuzhiyun 
sysctl_expire_nodest_conn(struct netns_ipvs * ipvs)1054*4882a593Smuzhiyun static inline int sysctl_expire_nodest_conn(struct netns_ipvs *ipvs)
1055*4882a593Smuzhiyun {
1056*4882a593Smuzhiyun 	return ipvs->sysctl_expire_nodest_conn;
1057*4882a593Smuzhiyun }
1058*4882a593Smuzhiyun 
sysctl_schedule_icmp(struct netns_ipvs * ipvs)1059*4882a593Smuzhiyun static inline int sysctl_schedule_icmp(struct netns_ipvs *ipvs)
1060*4882a593Smuzhiyun {
1061*4882a593Smuzhiyun 	return ipvs->sysctl_schedule_icmp;
1062*4882a593Smuzhiyun }
1063*4882a593Smuzhiyun 
sysctl_ignore_tunneled(struct netns_ipvs * ipvs)1064*4882a593Smuzhiyun static inline int sysctl_ignore_tunneled(struct netns_ipvs *ipvs)
1065*4882a593Smuzhiyun {
1066*4882a593Smuzhiyun 	return ipvs->sysctl_ignore_tunneled;
1067*4882a593Smuzhiyun }
1068*4882a593Smuzhiyun 
sysctl_cache_bypass(struct netns_ipvs * ipvs)1069*4882a593Smuzhiyun static inline int sysctl_cache_bypass(struct netns_ipvs *ipvs)
1070*4882a593Smuzhiyun {
1071*4882a593Smuzhiyun 	return ipvs->sysctl_cache_bypass;
1072*4882a593Smuzhiyun }
1073*4882a593Smuzhiyun 
1074*4882a593Smuzhiyun #else
1075*4882a593Smuzhiyun 
sysctl_sync_threshold(struct netns_ipvs * ipvs)1076*4882a593Smuzhiyun static inline int sysctl_sync_threshold(struct netns_ipvs *ipvs)
1077*4882a593Smuzhiyun {
1078*4882a593Smuzhiyun 	return DEFAULT_SYNC_THRESHOLD;
1079*4882a593Smuzhiyun }
1080*4882a593Smuzhiyun 
sysctl_sync_period(struct netns_ipvs * ipvs)1081*4882a593Smuzhiyun static inline int sysctl_sync_period(struct netns_ipvs *ipvs)
1082*4882a593Smuzhiyun {
1083*4882a593Smuzhiyun 	return DEFAULT_SYNC_PERIOD;
1084*4882a593Smuzhiyun }
1085*4882a593Smuzhiyun 
sysctl_sync_refresh_period(struct netns_ipvs * ipvs)1086*4882a593Smuzhiyun static inline unsigned int sysctl_sync_refresh_period(struct netns_ipvs *ipvs)
1087*4882a593Smuzhiyun {
1088*4882a593Smuzhiyun 	return DEFAULT_SYNC_REFRESH_PERIOD;
1089*4882a593Smuzhiyun }
1090*4882a593Smuzhiyun 
sysctl_sync_retries(struct netns_ipvs * ipvs)1091*4882a593Smuzhiyun static inline int sysctl_sync_retries(struct netns_ipvs *ipvs)
1092*4882a593Smuzhiyun {
1093*4882a593Smuzhiyun 	return DEFAULT_SYNC_RETRIES & 3;
1094*4882a593Smuzhiyun }
1095*4882a593Smuzhiyun 
sysctl_sync_ver(struct netns_ipvs * ipvs)1096*4882a593Smuzhiyun static inline int sysctl_sync_ver(struct netns_ipvs *ipvs)
1097*4882a593Smuzhiyun {
1098*4882a593Smuzhiyun 	return DEFAULT_SYNC_VER;
1099*4882a593Smuzhiyun }
1100*4882a593Smuzhiyun 
sysctl_sloppy_tcp(struct netns_ipvs * ipvs)1101*4882a593Smuzhiyun static inline int sysctl_sloppy_tcp(struct netns_ipvs *ipvs)
1102*4882a593Smuzhiyun {
1103*4882a593Smuzhiyun 	return DEFAULT_SLOPPY_TCP;
1104*4882a593Smuzhiyun }
1105*4882a593Smuzhiyun 
sysctl_sloppy_sctp(struct netns_ipvs * ipvs)1106*4882a593Smuzhiyun static inline int sysctl_sloppy_sctp(struct netns_ipvs *ipvs)
1107*4882a593Smuzhiyun {
1108*4882a593Smuzhiyun 	return DEFAULT_SLOPPY_SCTP;
1109*4882a593Smuzhiyun }
1110*4882a593Smuzhiyun 
/* !CONFIG_SYSCTL variant: sync_ports is fixed at 1; @ipvs is not read. */
static inline int sysctl_sync_ports(struct netns_ipvs *ipvs)
{
	return 1;
}
1115*4882a593Smuzhiyun 
/* !CONFIG_SYSCTL variant: sync_persist_mode is fixed at 0; @ipvs is not read. */
static inline int sysctl_sync_persist_mode(struct netns_ipvs *ipvs)
{
	return 0;
}
1120*4882a593Smuzhiyun 
sysctl_sync_qlen_max(struct netns_ipvs * ipvs)1121*4882a593Smuzhiyun static inline unsigned long sysctl_sync_qlen_max(struct netns_ipvs *ipvs)
1122*4882a593Smuzhiyun {
1123*4882a593Smuzhiyun 	return IPVS_SYNC_QLEN_MAX;
1124*4882a593Smuzhiyun }
1125*4882a593Smuzhiyun 
/* !CONFIG_SYSCTL variant: sync_sock_size is fixed at 0; @ipvs is not read. */
static inline int sysctl_sync_sock_size(struct netns_ipvs *ipvs)
{
	return 0;
}
1130*4882a593Smuzhiyun 
/* !CONFIG_SYSCTL variant: pmtu_disc is fixed at 1; @ipvs is not read. */
static inline int sysctl_pmtu_disc(struct netns_ipvs *ipvs)
{
	return 1;
}
1135*4882a593Smuzhiyun 
/* !CONFIG_SYSCTL variant: backup_only is fixed at 0; @ipvs is not read. */
static inline int sysctl_backup_only(struct netns_ipvs *ipvs)
{
	return 0;
}
1140*4882a593Smuzhiyun 
/* !CONFIG_SYSCTL variant: conn_reuse_mode is fixed at 1; @ipvs is not read. */
static inline int sysctl_conn_reuse_mode(struct netns_ipvs *ipvs)
{
	return 1;
}
1145*4882a593Smuzhiyun 
/* !CONFIG_SYSCTL variant: expire_nodest_conn is fixed at 0; @ipvs is not read. */
static inline int sysctl_expire_nodest_conn(struct netns_ipvs *ipvs)
{
	return 0;
}
1150*4882a593Smuzhiyun 
/* !CONFIG_SYSCTL variant: schedule_icmp is fixed at 0; @ipvs is not read. */
static inline int sysctl_schedule_icmp(struct netns_ipvs *ipvs)
{
	return 0;
}
1155*4882a593Smuzhiyun 
/* !CONFIG_SYSCTL variant: ignore_tunneled is fixed at 0; @ipvs is not read. */
static inline int sysctl_ignore_tunneled(struct netns_ipvs *ipvs)
{
	return 0;
}
1160*4882a593Smuzhiyun 
/* !CONFIG_SYSCTL variant: cache_bypass is fixed at 0; @ipvs is not read. */
static inline int sysctl_cache_bypass(struct netns_ipvs *ipvs)
{
	return 0;
}
1165*4882a593Smuzhiyun 
1166*4882a593Smuzhiyun #endif
1167*4882a593Smuzhiyun 
1168*4882a593Smuzhiyun /* IPVS core functions
1169*4882a593Smuzhiyun  * (from ip_vs_core.c)
1170*4882a593Smuzhiyun  */
1171*4882a593Smuzhiyun const char *ip_vs_proto_name(unsigned int proto);
1172*4882a593Smuzhiyun void ip_vs_init_hash_table(struct list_head *table, int rows);
1173*4882a593Smuzhiyun struct ip_vs_conn *ip_vs_new_conn_out(struct ip_vs_service *svc,
1174*4882a593Smuzhiyun 				      struct ip_vs_dest *dest,
1175*4882a593Smuzhiyun 				      struct sk_buff *skb,
1176*4882a593Smuzhiyun 				      const struct ip_vs_iphdr *iph,
1177*4882a593Smuzhiyun 				      __be16 dport,
1178*4882a593Smuzhiyun 				      __be16 cport);
1179*4882a593Smuzhiyun #define IP_VS_INIT_HASH_TABLE(t) ip_vs_init_hash_table((t), ARRAY_SIZE((t)))
1180*4882a593Smuzhiyun 
1181*4882a593Smuzhiyun #define IP_VS_APP_TYPE_FTP	1
1182*4882a593Smuzhiyun 
/*
 * ip_vs_conn handling functions
 * (from ip_vs_conn.c)
 */

/* Direction values; IP_VS_DIR_LAST equals the number of values before it */
enum {
	IP_VS_DIR_INPUT		= 0,
	IP_VS_DIR_OUTPUT	= 1,
	IP_VS_DIR_INPUT_ONLY	= 2,
	IP_VS_DIR_LAST		= 3,
};
1192*4882a593Smuzhiyun 
/*
 * Fill connection parameter block @p from the given arguments.
 *
 * The address pointers @caddr and @vaddr are stored as given (not copied),
 * and the persistence engine fields pe/pe_data are reset to NULL.
 */
static inline void ip_vs_conn_fill_param(struct netns_ipvs *ipvs, int af,
					 int protocol,
					 const union nf_inet_addr *caddr,
					 __be16 cport,
					 const union nf_inet_addr *vaddr,
					 __be16 vport,
					 struct ip_vs_conn_param *p)
{
	/* namespace and protocol identification */
	p->ipvs = ipvs;
	p->af = af;
	p->protocol = protocol;

	/* client side */
	p->caddr = caddr;
	p->cport = cport;

	/* virtual side */
	p->vaddr = vaddr;
	p->vport = vport;

	/* no persistence engine data yet */
	p->pe = NULL;
	p->pe_data = NULL;
}
1210*4882a593Smuzhiyun 
/* Connection lookups taking a filled-in parameter block */
struct ip_vs_conn *ip_vs_conn_in_get(const struct ip_vs_conn_param *p);
struct ip_vs_conn *ip_vs_ct_in_get(const struct ip_vs_conn_param *p);
struct ip_vs_conn *ip_vs_conn_out_get(const struct ip_vs_conn_param *p);

/* Connection lookups taking an skb and its parsed IPVS header */
struct ip_vs_conn *ip_vs_conn_in_get_proto(struct netns_ipvs *ipvs, int af,
					   const struct sk_buff *skb,
					   const struct ip_vs_iphdr *iph);

struct ip_vs_conn *ip_vs_conn_out_get_proto(struct netns_ipvs *ipvs, int af,
					    const struct sk_buff *skb,
					    const struct ip_vs_iphdr *iph);
1223*4882a593Smuzhiyun 
1224*4882a593Smuzhiyun /* Get reference to gain full access to conn.
1225*4882a593Smuzhiyun  * By default, RCU read-side critical sections have access only to
1226*4882a593Smuzhiyun  * conn fields and its PE data, see ip_vs_conn_rcu_free() for reference.
1227*4882a593Smuzhiyun  */
__ip_vs_conn_get(struct ip_vs_conn * cp)1228*4882a593Smuzhiyun static inline bool __ip_vs_conn_get(struct ip_vs_conn *cp)
1229*4882a593Smuzhiyun {
1230*4882a593Smuzhiyun 	return refcount_inc_not_zero(&cp->refcnt);
1231*4882a593Smuzhiyun }
1232*4882a593Smuzhiyun 
1233*4882a593Smuzhiyun /* put back the conn without restarting its timer */
__ip_vs_conn_put(struct ip_vs_conn * cp)1234*4882a593Smuzhiyun static inline void __ip_vs_conn_put(struct ip_vs_conn *cp)
1235*4882a593Smuzhiyun {
1236*4882a593Smuzhiyun 	smp_mb__before_atomic();
1237*4882a593Smuzhiyun 	refcount_dec(&cp->refcnt);
1238*4882a593Smuzhiyun }
1239*4882a593Smuzhiyun void ip_vs_conn_put(struct ip_vs_conn *cp);
1240*4882a593Smuzhiyun void ip_vs_conn_fill_cport(struct ip_vs_conn *cp, __be16 cport);
1241*4882a593Smuzhiyun 
1242*4882a593Smuzhiyun struct ip_vs_conn *ip_vs_conn_new(const struct ip_vs_conn_param *p, int dest_af,
1243*4882a593Smuzhiyun 				  const union nf_inet_addr *daddr,
1244*4882a593Smuzhiyun 				  __be16 dport, unsigned int flags,
1245*4882a593Smuzhiyun 				  struct ip_vs_dest *dest, __u32 fwmark);
1246*4882a593Smuzhiyun void ip_vs_conn_expire_now(struct ip_vs_conn *cp);
1247*4882a593Smuzhiyun 
1248*4882a593Smuzhiyun const char *ip_vs_state_name(const struct ip_vs_conn *cp);
1249*4882a593Smuzhiyun 
1250*4882a593Smuzhiyun void ip_vs_tcp_conn_listen(struct ip_vs_conn *cp);
1251*4882a593Smuzhiyun int ip_vs_check_template(struct ip_vs_conn *ct, struct ip_vs_dest *cdest);
1252*4882a593Smuzhiyun void ip_vs_random_dropentry(struct netns_ipvs *ipvs);
1253*4882a593Smuzhiyun int ip_vs_conn_init(void);
1254*4882a593Smuzhiyun void ip_vs_conn_cleanup(void);
1255*4882a593Smuzhiyun 
ip_vs_control_del(struct ip_vs_conn * cp)1256*4882a593Smuzhiyun static inline void ip_vs_control_del(struct ip_vs_conn *cp)
1257*4882a593Smuzhiyun {
1258*4882a593Smuzhiyun 	struct ip_vs_conn *ctl_cp = cp->control;
1259*4882a593Smuzhiyun 	if (!ctl_cp) {
1260*4882a593Smuzhiyun 		IP_VS_ERR_BUF("request control DEL for uncontrolled: "
1261*4882a593Smuzhiyun 			      "%s:%d to %s:%d\n",
1262*4882a593Smuzhiyun 			      IP_VS_DBG_ADDR(cp->af, &cp->caddr),
1263*4882a593Smuzhiyun 			      ntohs(cp->cport),
1264*4882a593Smuzhiyun 			      IP_VS_DBG_ADDR(cp->af, &cp->vaddr),
1265*4882a593Smuzhiyun 			      ntohs(cp->vport));
1266*4882a593Smuzhiyun 
1267*4882a593Smuzhiyun 		return;
1268*4882a593Smuzhiyun 	}
1269*4882a593Smuzhiyun 
1270*4882a593Smuzhiyun 	IP_VS_DBG_BUF(7, "DELeting control for: "
1271*4882a593Smuzhiyun 		      "cp.dst=%s:%d ctl_cp.dst=%s:%d\n",
1272*4882a593Smuzhiyun 		      IP_VS_DBG_ADDR(cp->af, &cp->caddr),
1273*4882a593Smuzhiyun 		      ntohs(cp->cport),
1274*4882a593Smuzhiyun 		      IP_VS_DBG_ADDR(cp->af, &ctl_cp->caddr),
1275*4882a593Smuzhiyun 		      ntohs(ctl_cp->cport));
1276*4882a593Smuzhiyun 
1277*4882a593Smuzhiyun 	cp->control = NULL;
1278*4882a593Smuzhiyun 	if (atomic_read(&ctl_cp->n_control) == 0) {
1279*4882a593Smuzhiyun 		IP_VS_ERR_BUF("BUG control DEL with n=0 : "
1280*4882a593Smuzhiyun 			      "%s:%d to %s:%d\n",
1281*4882a593Smuzhiyun 			      IP_VS_DBG_ADDR(cp->af, &cp->caddr),
1282*4882a593Smuzhiyun 			      ntohs(cp->cport),
1283*4882a593Smuzhiyun 			      IP_VS_DBG_ADDR(cp->af, &cp->vaddr),
1284*4882a593Smuzhiyun 			      ntohs(cp->vport));
1285*4882a593Smuzhiyun 
1286*4882a593Smuzhiyun 		return;
1287*4882a593Smuzhiyun 	}
1288*4882a593Smuzhiyun 	atomic_dec(&ctl_cp->n_control);
1289*4882a593Smuzhiyun }
1290*4882a593Smuzhiyun 
1291*4882a593Smuzhiyun static inline void
ip_vs_control_add(struct ip_vs_conn * cp,struct ip_vs_conn * ctl_cp)1292*4882a593Smuzhiyun ip_vs_control_add(struct ip_vs_conn *cp, struct ip_vs_conn *ctl_cp)
1293*4882a593Smuzhiyun {
1294*4882a593Smuzhiyun 	if (cp->control) {
1295*4882a593Smuzhiyun 		IP_VS_ERR_BUF("request control ADD for already controlled: "
1296*4882a593Smuzhiyun 			      "%s:%d to %s:%d\n",
1297*4882a593Smuzhiyun 			      IP_VS_DBG_ADDR(cp->af, &cp->caddr),
1298*4882a593Smuzhiyun 			      ntohs(cp->cport),
1299*4882a593Smuzhiyun 			      IP_VS_DBG_ADDR(cp->af, &cp->vaddr),
1300*4882a593Smuzhiyun 			      ntohs(cp->vport));
1301*4882a593Smuzhiyun 
1302*4882a593Smuzhiyun 		ip_vs_control_del(cp);
1303*4882a593Smuzhiyun 	}
1304*4882a593Smuzhiyun 
1305*4882a593Smuzhiyun 	IP_VS_DBG_BUF(7, "ADDing control for: "
1306*4882a593Smuzhiyun 		      "cp.dst=%s:%d ctl_cp.dst=%s:%d\n",
1307*4882a593Smuzhiyun 		      IP_VS_DBG_ADDR(cp->af, &cp->caddr),
1308*4882a593Smuzhiyun 		      ntohs(cp->cport),
1309*4882a593Smuzhiyun 		      IP_VS_DBG_ADDR(cp->af, &ctl_cp->caddr),
1310*4882a593Smuzhiyun 		      ntohs(ctl_cp->cport));
1311*4882a593Smuzhiyun 
1312*4882a593Smuzhiyun 	cp->control = ctl_cp;
1313*4882a593Smuzhiyun 	atomic_inc(&ctl_cp->n_control);
1314*4882a593Smuzhiyun }
1315*4882a593Smuzhiyun 
1316*4882a593Smuzhiyun /* Mark our template as assured */
1317*4882a593Smuzhiyun static inline void
ip_vs_control_assure_ct(struct ip_vs_conn * cp)1318*4882a593Smuzhiyun ip_vs_control_assure_ct(struct ip_vs_conn *cp)
1319*4882a593Smuzhiyun {
1320*4882a593Smuzhiyun 	struct ip_vs_conn *ct = cp->control;
1321*4882a593Smuzhiyun 
1322*4882a593Smuzhiyun 	if (ct && !(ct->state & IP_VS_CTPL_S_ASSURED) &&
1323*4882a593Smuzhiyun 	    (ct->flags & IP_VS_CONN_F_TEMPLATE))
1324*4882a593Smuzhiyun 		ct->state |= IP_VS_CTPL_S_ASSURED;
1325*4882a593Smuzhiyun }
1326*4882a593Smuzhiyun 
1327*4882a593Smuzhiyun /* IPVS netns init & cleanup functions */
1328*4882a593Smuzhiyun int ip_vs_estimator_net_init(struct netns_ipvs *ipvs);
1329*4882a593Smuzhiyun int ip_vs_control_net_init(struct netns_ipvs *ipvs);
1330*4882a593Smuzhiyun int ip_vs_protocol_net_init(struct netns_ipvs *ipvs);
1331*4882a593Smuzhiyun int ip_vs_app_net_init(struct netns_ipvs *ipvs);
1332*4882a593Smuzhiyun int ip_vs_conn_net_init(struct netns_ipvs *ipvs);
1333*4882a593Smuzhiyun int ip_vs_sync_net_init(struct netns_ipvs *ipvs);
1334*4882a593Smuzhiyun void ip_vs_conn_net_cleanup(struct netns_ipvs *ipvs);
1335*4882a593Smuzhiyun void ip_vs_app_net_cleanup(struct netns_ipvs *ipvs);
1336*4882a593Smuzhiyun void ip_vs_protocol_net_cleanup(struct netns_ipvs *ipvs);
1337*4882a593Smuzhiyun void ip_vs_control_net_cleanup(struct netns_ipvs *ipvs);
1338*4882a593Smuzhiyun void ip_vs_estimator_net_cleanup(struct netns_ipvs *ipvs);
1339*4882a593Smuzhiyun void ip_vs_sync_net_cleanup(struct netns_ipvs *ipvs);
1340*4882a593Smuzhiyun void ip_vs_service_nets_cleanup(struct list_head *net_list);
1341*4882a593Smuzhiyun 
1342*4882a593Smuzhiyun /* IPVS application functions
1343*4882a593Smuzhiyun  * (from ip_vs_app.c)
1344*4882a593Smuzhiyun  */
1345*4882a593Smuzhiyun #define IP_VS_APP_MAX_PORTS  8
1346*4882a593Smuzhiyun struct ip_vs_app *register_ip_vs_app(struct netns_ipvs *ipvs, struct ip_vs_app *app);
1347*4882a593Smuzhiyun void unregister_ip_vs_app(struct netns_ipvs *ipvs, struct ip_vs_app *app);
1348*4882a593Smuzhiyun int ip_vs_bind_app(struct ip_vs_conn *cp, struct ip_vs_protocol *pp);
1349*4882a593Smuzhiyun void ip_vs_unbind_app(struct ip_vs_conn *cp);
1350*4882a593Smuzhiyun int register_ip_vs_app_inc(struct netns_ipvs *ipvs, struct ip_vs_app *app, __u16 proto,
1351*4882a593Smuzhiyun 			   __u16 port);
1352*4882a593Smuzhiyun int ip_vs_app_inc_get(struct ip_vs_app *inc);
1353*4882a593Smuzhiyun void ip_vs_app_inc_put(struct ip_vs_app *inc);
1354*4882a593Smuzhiyun 
1355*4882a593Smuzhiyun int ip_vs_app_pkt_out(struct ip_vs_conn *, struct sk_buff *skb,
1356*4882a593Smuzhiyun 		      struct ip_vs_iphdr *ipvsh);
1357*4882a593Smuzhiyun int ip_vs_app_pkt_in(struct ip_vs_conn *, struct sk_buff *skb,
1358*4882a593Smuzhiyun 		     struct ip_vs_iphdr *ipvsh);
1359*4882a593Smuzhiyun 
1360*4882a593Smuzhiyun int register_ip_vs_pe(struct ip_vs_pe *pe);
1361*4882a593Smuzhiyun int unregister_ip_vs_pe(struct ip_vs_pe *pe);
1362*4882a593Smuzhiyun struct ip_vs_pe *ip_vs_pe_getbyname(const char *name);
1363*4882a593Smuzhiyun struct ip_vs_pe *__ip_vs_pe_getbyname(const char *pe_name);
1364*4882a593Smuzhiyun 
/* Use a #define to avoid all of module.h just for these trivial ops.
 *
 * ip_vs_pe_get(pe) calls __module_get() and ip_vs_pe_put(pe) calls
 * module_put() on pe->module; both do nothing when @pe or pe->module is
 * NULL.
 *
 * Each macro is a single statement wrapped in do { } while (0), so it
 * must be followed by ';' and is safe as the body of an un-braced
 * if/else.  The argument is parenthesized but evaluated more than once,
 * so it must not have side effects.
 */
#define ip_vs_pe_get(pe)				\
	do {						\
		if ((pe) && (pe)->module)		\
			__module_get((pe)->module);	\
	} while (0)

#define ip_vs_pe_put(pe)				\
	do {						\
		if ((pe) && (pe)->module)		\
			module_put((pe)->module);	\
	} while (0)
1373*4882a593Smuzhiyun 
1374*4882a593Smuzhiyun /* IPVS protocol functions (from ip_vs_proto.c) */
1375*4882a593Smuzhiyun int ip_vs_protocol_init(void);
1376*4882a593Smuzhiyun void ip_vs_protocol_cleanup(void);
1377*4882a593Smuzhiyun void ip_vs_protocol_timeout_change(struct netns_ipvs *ipvs, int flags);
1378*4882a593Smuzhiyun int *ip_vs_create_timeout_table(int *table, int size);
1379*4882a593Smuzhiyun void ip_vs_tcpudp_debug_packet(int af, struct ip_vs_protocol *pp,
1380*4882a593Smuzhiyun 			       const struct sk_buff *skb, int offset,
1381*4882a593Smuzhiyun 			       const char *msg);
1382*4882a593Smuzhiyun 
1383*4882a593Smuzhiyun extern struct ip_vs_protocol ip_vs_protocol_tcp;
1384*4882a593Smuzhiyun extern struct ip_vs_protocol ip_vs_protocol_udp;
1385*4882a593Smuzhiyun extern struct ip_vs_protocol ip_vs_protocol_icmp;
1386*4882a593Smuzhiyun extern struct ip_vs_protocol ip_vs_protocol_esp;
1387*4882a593Smuzhiyun extern struct ip_vs_protocol ip_vs_protocol_ah;
1388*4882a593Smuzhiyun extern struct ip_vs_protocol ip_vs_protocol_sctp;
1389*4882a593Smuzhiyun 
1390*4882a593Smuzhiyun /* Registering/unregistering scheduler functions
1391*4882a593Smuzhiyun  * (from ip_vs_sched.c)
1392*4882a593Smuzhiyun  */
1393*4882a593Smuzhiyun int register_ip_vs_scheduler(struct ip_vs_scheduler *scheduler);
1394*4882a593Smuzhiyun int unregister_ip_vs_scheduler(struct ip_vs_scheduler *scheduler);
1395*4882a593Smuzhiyun int ip_vs_bind_scheduler(struct ip_vs_service *svc,
1396*4882a593Smuzhiyun 			 struct ip_vs_scheduler *scheduler);
1397*4882a593Smuzhiyun void ip_vs_unbind_scheduler(struct ip_vs_service *svc,
1398*4882a593Smuzhiyun 			    struct ip_vs_scheduler *sched);
1399*4882a593Smuzhiyun struct ip_vs_scheduler *ip_vs_scheduler_get(const char *sched_name);
1400*4882a593Smuzhiyun void ip_vs_scheduler_put(struct ip_vs_scheduler *scheduler);
1401*4882a593Smuzhiyun struct ip_vs_conn *
1402*4882a593Smuzhiyun ip_vs_schedule(struct ip_vs_service *svc, struct sk_buff *skb,
1403*4882a593Smuzhiyun 	       struct ip_vs_proto_data *pd, int *ignored,
1404*4882a593Smuzhiyun 	       struct ip_vs_iphdr *iph);
1405*4882a593Smuzhiyun int ip_vs_leave(struct ip_vs_service *svc, struct sk_buff *skb,
1406*4882a593Smuzhiyun 		struct ip_vs_proto_data *pd, struct ip_vs_iphdr *iph);
1407*4882a593Smuzhiyun 
1408*4882a593Smuzhiyun void ip_vs_scheduler_err(struct ip_vs_service *svc, const char *msg);
1409*4882a593Smuzhiyun 
1410*4882a593Smuzhiyun /* IPVS control data and functions (from ip_vs_ctl.c) */
1411*4882a593Smuzhiyun extern struct ip_vs_stats ip_vs_stats;
1412*4882a593Smuzhiyun extern int sysctl_ip_vs_sync_ver;
1413*4882a593Smuzhiyun 
1414*4882a593Smuzhiyun struct ip_vs_service *
1415*4882a593Smuzhiyun ip_vs_service_find(struct netns_ipvs *ipvs, int af, __u32 fwmark, __u16 protocol,
1416*4882a593Smuzhiyun 		  const union nf_inet_addr *vaddr, __be16 vport);
1417*4882a593Smuzhiyun 
1418*4882a593Smuzhiyun bool ip_vs_has_real_service(struct netns_ipvs *ipvs, int af, __u16 protocol,
1419*4882a593Smuzhiyun 			    const union nf_inet_addr *daddr, __be16 dport);
1420*4882a593Smuzhiyun 
1421*4882a593Smuzhiyun struct ip_vs_dest *
1422*4882a593Smuzhiyun ip_vs_find_real_service(struct netns_ipvs *ipvs, int af, __u16 protocol,
1423*4882a593Smuzhiyun 			const union nf_inet_addr *daddr, __be16 dport);
1424*4882a593Smuzhiyun struct ip_vs_dest *ip_vs_find_tunnel(struct netns_ipvs *ipvs, int af,
1425*4882a593Smuzhiyun 				     const union nf_inet_addr *daddr,
1426*4882a593Smuzhiyun 				     __be16 tun_port);
1427*4882a593Smuzhiyun 
1428*4882a593Smuzhiyun int ip_vs_use_count_inc(void);
1429*4882a593Smuzhiyun void ip_vs_use_count_dec(void);
1430*4882a593Smuzhiyun int ip_vs_register_nl_ioctl(void);
1431*4882a593Smuzhiyun void ip_vs_unregister_nl_ioctl(void);
1432*4882a593Smuzhiyun int ip_vs_control_init(void);
1433*4882a593Smuzhiyun void ip_vs_control_cleanup(void);
1434*4882a593Smuzhiyun struct ip_vs_dest *
1435*4882a593Smuzhiyun ip_vs_find_dest(struct netns_ipvs *ipvs, int svc_af, int dest_af,
1436*4882a593Smuzhiyun 		const union nf_inet_addr *daddr, __be16 dport,
1437*4882a593Smuzhiyun 		const union nf_inet_addr *vaddr, __be16 vport,
1438*4882a593Smuzhiyun 		__u16 protocol, __u32 fwmark, __u32 flags);
1439*4882a593Smuzhiyun void ip_vs_try_bind_dest(struct ip_vs_conn *cp);
1440*4882a593Smuzhiyun 
ip_vs_dest_hold(struct ip_vs_dest * dest)1441*4882a593Smuzhiyun static inline void ip_vs_dest_hold(struct ip_vs_dest *dest)
1442*4882a593Smuzhiyun {
1443*4882a593Smuzhiyun 	refcount_inc(&dest->refcnt);
1444*4882a593Smuzhiyun }
1445*4882a593Smuzhiyun 
ip_vs_dest_put(struct ip_vs_dest * dest)1446*4882a593Smuzhiyun static inline void ip_vs_dest_put(struct ip_vs_dest *dest)
1447*4882a593Smuzhiyun {
1448*4882a593Smuzhiyun 	smp_mb__before_atomic();
1449*4882a593Smuzhiyun 	refcount_dec(&dest->refcnt);
1450*4882a593Smuzhiyun }
1451*4882a593Smuzhiyun 
ip_vs_dest_put_and_free(struct ip_vs_dest * dest)1452*4882a593Smuzhiyun static inline void ip_vs_dest_put_and_free(struct ip_vs_dest *dest)
1453*4882a593Smuzhiyun {
1454*4882a593Smuzhiyun 	if (refcount_dec_and_test(&dest->refcnt))
1455*4882a593Smuzhiyun 		kfree(dest);
1456*4882a593Smuzhiyun }
1457*4882a593Smuzhiyun 
1458*4882a593Smuzhiyun /* IPVS sync daemon data and function prototypes
1459*4882a593Smuzhiyun  * (from ip_vs_sync.c)
1460*4882a593Smuzhiyun  */
1461*4882a593Smuzhiyun int start_sync_thread(struct netns_ipvs *ipvs, struct ipvs_sync_daemon_cfg *cfg,
1462*4882a593Smuzhiyun 		      int state);
1463*4882a593Smuzhiyun int stop_sync_thread(struct netns_ipvs *ipvs, int state);
1464*4882a593Smuzhiyun void ip_vs_sync_conn(struct netns_ipvs *ipvs, struct ip_vs_conn *cp, int pkts);
1465*4882a593Smuzhiyun 
1466*4882a593Smuzhiyun /* IPVS rate estimator prototypes (from ip_vs_est.c) */
1467*4882a593Smuzhiyun void ip_vs_start_estimator(struct netns_ipvs *ipvs, struct ip_vs_stats *stats);
1468*4882a593Smuzhiyun void ip_vs_stop_estimator(struct netns_ipvs *ipvs, struct ip_vs_stats *stats);
1469*4882a593Smuzhiyun void ip_vs_zero_estimator(struct ip_vs_stats *stats);
1470*4882a593Smuzhiyun void ip_vs_read_estimator(struct ip_vs_kstats *dst, struct ip_vs_stats *stats);
1471*4882a593Smuzhiyun 
1472*4882a593Smuzhiyun /* Various IPVS packet transmitters (from ip_vs_xmit.c) */
1473*4882a593Smuzhiyun int ip_vs_null_xmit(struct sk_buff *skb, struct ip_vs_conn *cp,
1474*4882a593Smuzhiyun 		    struct ip_vs_protocol *pp, struct ip_vs_iphdr *iph);
1475*4882a593Smuzhiyun int ip_vs_bypass_xmit(struct sk_buff *skb, struct ip_vs_conn *cp,
1476*4882a593Smuzhiyun 		      struct ip_vs_protocol *pp, struct ip_vs_iphdr *iph);
1477*4882a593Smuzhiyun int ip_vs_nat_xmit(struct sk_buff *skb, struct ip_vs_conn *cp,
1478*4882a593Smuzhiyun 		   struct ip_vs_protocol *pp, struct ip_vs_iphdr *iph);
1479*4882a593Smuzhiyun int ip_vs_tunnel_xmit(struct sk_buff *skb, struct ip_vs_conn *cp,
1480*4882a593Smuzhiyun 		      struct ip_vs_protocol *pp, struct ip_vs_iphdr *iph);
1481*4882a593Smuzhiyun int ip_vs_dr_xmit(struct sk_buff *skb, struct ip_vs_conn *cp,
1482*4882a593Smuzhiyun 		  struct ip_vs_protocol *pp, struct ip_vs_iphdr *iph);
1483*4882a593Smuzhiyun int ip_vs_icmp_xmit(struct sk_buff *skb, struct ip_vs_conn *cp,
1484*4882a593Smuzhiyun 		    struct ip_vs_protocol *pp, int offset,
1485*4882a593Smuzhiyun 		    unsigned int hooknum, struct ip_vs_iphdr *iph);
1486*4882a593Smuzhiyun void ip_vs_dest_dst_rcu_free(struct rcu_head *head);
1487*4882a593Smuzhiyun 
1488*4882a593Smuzhiyun #ifdef CONFIG_IP_VS_IPV6
1489*4882a593Smuzhiyun int ip_vs_bypass_xmit_v6(struct sk_buff *skb, struct ip_vs_conn *cp,
1490*4882a593Smuzhiyun 			 struct ip_vs_protocol *pp, struct ip_vs_iphdr *iph);
1491*4882a593Smuzhiyun int ip_vs_nat_xmit_v6(struct sk_buff *skb, struct ip_vs_conn *cp,
1492*4882a593Smuzhiyun 		      struct ip_vs_protocol *pp, struct ip_vs_iphdr *iph);
1493*4882a593Smuzhiyun int ip_vs_tunnel_xmit_v6(struct sk_buff *skb, struct ip_vs_conn *cp,
1494*4882a593Smuzhiyun 			 struct ip_vs_protocol *pp, struct ip_vs_iphdr *iph);
1495*4882a593Smuzhiyun int ip_vs_dr_xmit_v6(struct sk_buff *skb, struct ip_vs_conn *cp,
1496*4882a593Smuzhiyun 		     struct ip_vs_protocol *pp, struct ip_vs_iphdr *iph);
1497*4882a593Smuzhiyun int ip_vs_icmp_xmit_v6(struct sk_buff *skb, struct ip_vs_conn *cp,
1498*4882a593Smuzhiyun 		       struct ip_vs_protocol *pp, int offset,
1499*4882a593Smuzhiyun 		       unsigned int hooknum, struct ip_vs_iphdr *iph);
1500*4882a593Smuzhiyun #endif
1501*4882a593Smuzhiyun 
#ifdef CONFIG_SYSCTL
/* Simple mechanism to ignore packets when we are loaded.
 *
 * With ipvs->drop_rate set to 'n', ipvs->drop_counter is decremented on
 * every call; once it is no longer positive it is reloaded from
 * drop_rate and 1 is returned, so about one call in 'n' returns 1.
 * Returns 0 in all other cases, including drop_rate == 0.
 */
static inline int ip_vs_todrop(struct netns_ipvs *ipvs)
{
	if (ipvs->drop_rate == 0)
		return 0;

	ipvs->drop_counter--;
	if (ipvs->drop_counter > 0)
		return 0;

	/* counter exhausted: re-arm it and report a drop */
	ipvs->drop_counter = ipvs->drop_rate;
	return 1;
}
#else
/* Without CONFIG_SYSCTL this always returns 0. */
static inline int ip_vs_todrop(struct netns_ipvs *ipvs)
{
	return 0;
}
#endif
1519*4882a593Smuzhiyun 
#ifdef CONFIG_SYSCTL
/* Enqueue the delayed work for expiring connections without destination.
 *
 * Nothing is queued unless sysctl_expire_nodest_conn(ipvs) is non-zero.
 * The work item is ipvs->expire_nodest_conn_work, queued on
 * system_long_wq with a delay argument of 1.
 */
static inline void ip_vs_enqueue_expire_nodest_conns(struct netns_ipvs *ipvs)
{
	if (!sysctl_expire_nodest_conn(ipvs))
		return;

	queue_delayed_work(system_long_wq, &ipvs->expire_nodest_conn_work, 1);
}

void ip_vs_expire_nodest_conn_flush(struct netns_ipvs *ipvs);
#else
/* Without CONFIG_SYSCTL there is nothing to enqueue. */
static inline void ip_vs_enqueue_expire_nodest_conns(struct netns_ipvs *ipvs)
{
}
#endif
1535*4882a593Smuzhiyun 
/* IP_VS_DFWD_METHOD(dest): the IP_VS_CONN_F_FWD_MASK bits of the
 * conn_flags of destination @dest, read with atomic_read().
 */
#define IP_VS_DFWD_METHOD(dest) (atomic_read(&(dest)->conn_flags) & \
				 IP_VS_CONN_F_FWD_MASK)

/* IP_VS_FWD_METHOD(cp): the IP_VS_CONN_F_FWD_MASK bits of the flags of
 * connection @cp.  The argument is parenthesized so any pointer
 * expression may be passed.  ip_vs_fwd_tag() below returns the
 * forwarding tag of the connection derived from this value.
 */
#define IP_VS_FWD_METHOD(cp)  ((cp)->flags & IP_VS_CONN_F_FWD_MASK)
1541*4882a593Smuzhiyun 
ip_vs_fwd_tag(struct ip_vs_conn * cp)1542*4882a593Smuzhiyun static inline char ip_vs_fwd_tag(struct ip_vs_conn *cp)
1543*4882a593Smuzhiyun {
1544*4882a593Smuzhiyun 	char fwd;
1545*4882a593Smuzhiyun 
1546*4882a593Smuzhiyun 	switch (IP_VS_FWD_METHOD(cp)) {
1547*4882a593Smuzhiyun 	case IP_VS_CONN_F_MASQ:
1548*4882a593Smuzhiyun 		fwd = 'M'; break;
1549*4882a593Smuzhiyun 	case IP_VS_CONN_F_LOCALNODE:
1550*4882a593Smuzhiyun 		fwd = 'L'; break;
1551*4882a593Smuzhiyun 	case IP_VS_CONN_F_TUNNEL:
1552*4882a593Smuzhiyun 		fwd = 'T'; break;
1553*4882a593Smuzhiyun 	case IP_VS_CONN_F_DROUTE:
1554*4882a593Smuzhiyun 		fwd = 'R'; break;
1555*4882a593Smuzhiyun 	case IP_VS_CONN_F_BYPASS:
1556*4882a593Smuzhiyun 		fwd = 'B'; break;
1557*4882a593Smuzhiyun 	default:
1558*4882a593Smuzhiyun 		fwd = '?'; break;
1559*4882a593Smuzhiyun 	}
1560*4882a593Smuzhiyun 	return fwd;
1561*4882a593Smuzhiyun }
1562*4882a593Smuzhiyun 
1563*4882a593Smuzhiyun void ip_vs_nat_icmp(struct sk_buff *skb, struct ip_vs_protocol *pp,
1564*4882a593Smuzhiyun 		    struct ip_vs_conn *cp, int dir);
1565*4882a593Smuzhiyun 
1566*4882a593Smuzhiyun #ifdef CONFIG_IP_VS_IPV6
1567*4882a593Smuzhiyun void ip_vs_nat_icmp_v6(struct sk_buff *skb, struct ip_vs_protocol *pp,
1568*4882a593Smuzhiyun 		       struct ip_vs_conn *cp, int dir);
1569*4882a593Smuzhiyun #endif
1570*4882a593Smuzhiyun 
1571*4882a593Smuzhiyun __sum16 ip_vs_checksum_complete(struct sk_buff *skb, int offset);
1572*4882a593Smuzhiyun 
/* Fold the replacement of one 32-bit value into a checksum.
 *
 * Builds the pair { ~old, new } and returns csum_partial() over it,
 * seeded with @oldsum.
 */
static inline __wsum ip_vs_check_diff4(__be32 old, __be32 new, __wsum oldsum)
{
	__be32 delta[2];

	delta[0] = ~old;
	delta[1] = new;

	return csum_partial(delta, sizeof(delta), oldsum);
}
1579*4882a593Smuzhiyun 
#ifdef CONFIG_IP_VS_IPV6
/* Fold the replacement of a 16-byte value (four 32-bit words) into a
 * checksum.
 *
 * The scratch buffer holds the complemented words of @old in reverse
 * index order (3..0) followed by the words of @new in the same order;
 * the result is csum_partial() over that buffer seeded with @oldsum.
 */
static inline __wsum ip_vs_check_diff16(const __be32 *old, const __be32 *new,
					__wsum oldsum)
{
	__be32 delta[8];
	int i;

	for (i = 0; i < 4; i++) {
		delta[i]     = ~old[3 - i];
		delta[4 + i] =  new[3 - i];
	}

	return csum_partial(delta, sizeof(delta), oldsum);
}
#endif
1590*4882a593Smuzhiyun 
/* Fold the replacement of one 16-bit value into a checksum.
 *
 * Builds the pair { ~old, new } and returns csum_partial() over it,
 * seeded with @oldsum.
 */
static inline __wsum ip_vs_check_diff2(__be16 old, __be16 new, __wsum oldsum)
{
	__be16 delta[2];

	delta[0] = ~old;
	delta[1] = new;

	return csum_partial(delta, sizeof(delta), oldsum);
}
1597*4882a593Smuzhiyun 
1598*4882a593Smuzhiyun /* Forget current conntrack (unconfirmed) and attach notrack entry */
ip_vs_notrack(struct sk_buff * skb)1599*4882a593Smuzhiyun static inline void ip_vs_notrack(struct sk_buff *skb)
1600*4882a593Smuzhiyun {
1601*4882a593Smuzhiyun #if defined(CONFIG_NF_CONNTRACK) || defined(CONFIG_NF_CONNTRACK_MODULE)
1602*4882a593Smuzhiyun 	enum ip_conntrack_info ctinfo;
1603*4882a593Smuzhiyun 	struct nf_conn *ct = nf_ct_get(skb, &ctinfo);
1604*4882a593Smuzhiyun 
1605*4882a593Smuzhiyun 	if (ct) {
1606*4882a593Smuzhiyun 		nf_conntrack_put(&ct->ct_general);
1607*4882a593Smuzhiyun 		nf_ct_set(skb, NULL, IP_CT_UNTRACKED);
1608*4882a593Smuzhiyun 	}
1609*4882a593Smuzhiyun #endif
1610*4882a593Smuzhiyun }
1611*4882a593Smuzhiyun 
1612*4882a593Smuzhiyun #ifdef CONFIG_IP_VS_NFCT
1613*4882a593Smuzhiyun /* Netfilter connection tracking
1614*4882a593Smuzhiyun  * (from ip_vs_nfct.c)
1615*4882a593Smuzhiyun  */
ip_vs_conntrack_enabled(struct netns_ipvs * ipvs)1616*4882a593Smuzhiyun static inline int ip_vs_conntrack_enabled(struct netns_ipvs *ipvs)
1617*4882a593Smuzhiyun {
1618*4882a593Smuzhiyun #ifdef CONFIG_SYSCTL
1619*4882a593Smuzhiyun 	return ipvs->sysctl_conntrack;
1620*4882a593Smuzhiyun #else
1621*4882a593Smuzhiyun 	return 0;
1622*4882a593Smuzhiyun #endif
1623*4882a593Smuzhiyun }
1624*4882a593Smuzhiyun 
1625*4882a593Smuzhiyun void ip_vs_update_conntrack(struct sk_buff *skb, struct ip_vs_conn *cp,
1626*4882a593Smuzhiyun 			    int outin);
1627*4882a593Smuzhiyun int ip_vs_confirm_conntrack(struct sk_buff *skb);
1628*4882a593Smuzhiyun void ip_vs_nfct_expect_related(struct sk_buff *skb, struct nf_conn *ct,
1629*4882a593Smuzhiyun 			       struct ip_vs_conn *cp, u_int8_t proto,
1630*4882a593Smuzhiyun 			       const __be16 port, int from_rs);
1631*4882a593Smuzhiyun void ip_vs_conn_drop_conntrack(struct ip_vs_conn *cp);
1632*4882a593Smuzhiyun 
1633*4882a593Smuzhiyun #else
1634*4882a593Smuzhiyun 
ip_vs_conntrack_enabled(struct netns_ipvs * ipvs)1635*4882a593Smuzhiyun static inline int ip_vs_conntrack_enabled(struct netns_ipvs *ipvs)
1636*4882a593Smuzhiyun {
1637*4882a593Smuzhiyun 	return 0;
1638*4882a593Smuzhiyun }
1639*4882a593Smuzhiyun 
ip_vs_update_conntrack(struct sk_buff * skb,struct ip_vs_conn * cp,int outin)1640*4882a593Smuzhiyun static inline void ip_vs_update_conntrack(struct sk_buff *skb,
1641*4882a593Smuzhiyun 					  struct ip_vs_conn *cp, int outin)
1642*4882a593Smuzhiyun {
1643*4882a593Smuzhiyun }
1644*4882a593Smuzhiyun 
ip_vs_confirm_conntrack(struct sk_buff * skb)1645*4882a593Smuzhiyun static inline int ip_vs_confirm_conntrack(struct sk_buff *skb)
1646*4882a593Smuzhiyun {
1647*4882a593Smuzhiyun 	return NF_ACCEPT;
1648*4882a593Smuzhiyun }
1649*4882a593Smuzhiyun 
ip_vs_conn_drop_conntrack(struct ip_vs_conn * cp)1650*4882a593Smuzhiyun static inline void ip_vs_conn_drop_conntrack(struct ip_vs_conn *cp)
1651*4882a593Smuzhiyun {
1652*4882a593Smuzhiyun }
1653*4882a593Smuzhiyun #endif /* CONFIG_IP_VS_NFCT */
1654*4882a593Smuzhiyun 
/* Using old conntrack that can not be redirected to another real server?
 *
 * With CONFIG_IP_VS_NFCT, returns true when @skb carries a conntrack
 * entry for which nf_ct_is_confirmed() holds, false otherwise.  Without
 * CONFIG_IP_VS_NFCT the answer is always false.  @cp is not consulted.
 */
static inline bool ip_vs_conn_uses_old_conntrack(struct ip_vs_conn *cp,
						 struct sk_buff *skb)
{
#ifdef CONFIG_IP_VS_NFCT
	enum ip_conntrack_info ctinfo;
	struct nf_conn *ct = nf_ct_get(skb, &ctinfo);

	return ct != NULL && nf_ct_is_confirmed(ct);
#else
	return false;
#endif
}
1669*4882a593Smuzhiyun 
ip_vs_register_conntrack(struct ip_vs_service * svc)1670*4882a593Smuzhiyun static inline int ip_vs_register_conntrack(struct ip_vs_service *svc)
1671*4882a593Smuzhiyun {
1672*4882a593Smuzhiyun #if IS_ENABLED(CONFIG_NF_CONNTRACK)
1673*4882a593Smuzhiyun 	int afmask = (svc->af == AF_INET6) ? 2 : 1;
1674*4882a593Smuzhiyun 	int ret = 0;
1675*4882a593Smuzhiyun 
1676*4882a593Smuzhiyun 	if (!(svc->conntrack_afmask & afmask)) {
1677*4882a593Smuzhiyun 		ret = nf_ct_netns_get(svc->ipvs->net, svc->af);
1678*4882a593Smuzhiyun 		if (ret >= 0)
1679*4882a593Smuzhiyun 			svc->conntrack_afmask |= afmask;
1680*4882a593Smuzhiyun 	}
1681*4882a593Smuzhiyun 	return ret;
1682*4882a593Smuzhiyun #else
1683*4882a593Smuzhiyun 	return 0;
1684*4882a593Smuzhiyun #endif
1685*4882a593Smuzhiyun }
1686*4882a593Smuzhiyun 
ip_vs_unregister_conntrack(struct ip_vs_service * svc)1687*4882a593Smuzhiyun static inline void ip_vs_unregister_conntrack(struct ip_vs_service *svc)
1688*4882a593Smuzhiyun {
1689*4882a593Smuzhiyun #if IS_ENABLED(CONFIG_NF_CONNTRACK)
1690*4882a593Smuzhiyun 	int afmask = (svc->af == AF_INET6) ? 2 : 1;
1691*4882a593Smuzhiyun 
1692*4882a593Smuzhiyun 	if (svc->conntrack_afmask & afmask) {
1693*4882a593Smuzhiyun 		nf_ct_netns_put(svc->ipvs->net, svc->af);
1694*4882a593Smuzhiyun 		svc->conntrack_afmask &= ~afmask;
1695*4882a593Smuzhiyun 	}
1696*4882a593Smuzhiyun #endif
1697*4882a593Smuzhiyun }
1698*4882a593Smuzhiyun 
1699*4882a593Smuzhiyun int ip_vs_register_hooks(struct netns_ipvs *ipvs, unsigned int af);
1700*4882a593Smuzhiyun void ip_vs_unregister_hooks(struct netns_ipvs *ipvs, unsigned int af);
1701*4882a593Smuzhiyun 
1702*4882a593Smuzhiyun static inline int
ip_vs_dest_conn_overhead(struct ip_vs_dest * dest)1703*4882a593Smuzhiyun ip_vs_dest_conn_overhead(struct ip_vs_dest *dest)
1704*4882a593Smuzhiyun {
1705*4882a593Smuzhiyun 	/* We think the overhead of processing active connections is 256
1706*4882a593Smuzhiyun 	 * times higher than that of inactive connections in average. (This
1707*4882a593Smuzhiyun 	 * 256 times might not be accurate, we will change it later) We
1708*4882a593Smuzhiyun 	 * use the following formula to estimate the overhead now:
1709*4882a593Smuzhiyun 	 *		  dest->activeconns*256 + dest->inactconns
1710*4882a593Smuzhiyun 	 */
1711*4882a593Smuzhiyun 	return (atomic_read(&dest->activeconns) << 8) +
1712*4882a593Smuzhiyun 		atomic_read(&dest->inactconns);
1713*4882a593Smuzhiyun }
1714*4882a593Smuzhiyun 
1715*4882a593Smuzhiyun #endif	/* _NET_IP_VS_H */
1716