/*
 *      IP Virtual Server
 *      data structure and functionality definitions
 */

Julius Volzbc4768e2008-07-31 20:45:24 -07006#ifndef _NET_IP_VS_H
7#define _NET_IP_VS_H
Linus Torvalds1da177e2005-04-16 15:20:36 -07008
Julius Volzbc4768e2008-07-31 20:45:24 -07009#include <linux/ip_vs.h> /* definitions shared with userland */
Linus Torvalds1da177e2005-04-16 15:20:36 -070010
Julius Volzbc4768e2008-07-31 20:45:24 -070011/* old ipvsadm versions still include this file directly */
Linus Torvalds1da177e2005-04-16 15:20:36 -070012#ifdef __KERNEL__
13
Julius Volzbc4768e2008-07-31 20:45:24 -070014#include <asm/types.h> /* for __uXX types */
15
16#include <linux/sysctl.h> /* for ctl_path */
Linus Torvalds1da177e2005-04-16 15:20:36 -070017#include <linux/list.h> /* for struct list_head */
18#include <linux/spinlock.h> /* for struct rwlock_t */
Linus Torvalds1da177e2005-04-16 15:20:36 -070019#include <asm/atomic.h> /* for struct atomic_t */
Linus Torvalds1da177e2005-04-16 15:20:36 -070020#include <linux/compiler.h>
Arnaldo Carvalho de Melo14c85022005-12-27 02:43:12 -020021#include <linux/timer.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070022
Arnaldo Carvalho de Melo14c85022005-12-27 02:43:12 -020023#include <net/checksum.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070024
/*
 * Debug logging helpers.
 *
 * With CONFIG_IP_VS_DEBUG set, messages are printed at KERN_DEBUG with an
 * "IPVS: " prefix; without it every macro below expands to an empty
 * statement and none of its arguments are evaluated.
 */
#ifdef CONFIG_IP_VS_DEBUG
#include <linux/net.h>

extern int ip_vs_get_debug_level(void);

/* Print msg when level does not exceed the current debug level. */
#define IP_VS_DBG(level, msg...)					\
	do {								\
		if ((level) <= ip_vs_get_debug_level())			\
			printk(KERN_DEBUG "IPVS: " msg);		\
	} while (0)

/* Print msg whenever net_ratelimit() allows it (no level check). */
#define IP_VS_DBG_RL(msg...)						\
	do {								\
		if (net_ratelimit())					\
			printk(KERN_DEBUG "IPVS: " msg);		\
	} while (0)

/* Call pp->debug_packet() when level does not exceed the debug level. */
#define IP_VS_DBG_PKT(level, pp, skb, ofs, msg)				\
	do {								\
		if ((level) <= ip_vs_get_debug_level())			\
			(pp)->debug_packet(pp, skb, ofs, msg);		\
	} while (0)

/* As IP_VS_DBG_PKT, additionally gated by net_ratelimit(). */
#define IP_VS_DBG_RL_PKT(level, pp, skb, ofs, msg)			\
	do {								\
		if ((level) <= ip_vs_get_debug_level() &&		\
		    net_ratelimit())					\
			(pp)->debug_packet(pp, skb, ofs, msg);		\
	} while (0)
#else	/* NO DEBUGGING at ALL */
#define IP_VS_DBG(level, msg...)			do {} while (0)
#define IP_VS_DBG_RL(msg...)				do {} while (0)
#define IP_VS_DBG_PKT(level, pp, skb, ofs, msg)		do {} while (0)
#define IP_VS_DBG_RL_PKT(level, pp, skb, ofs, msg)	do {} while (0)
#endif

/*
 * Unconditional logging helpers.  Each printing macro prefixes the message
 * with "IPVS: " and forwards it to printk() at the named log level.
 */
#define IP_VS_BUG() BUG()
#define IP_VS_ERR(msg...) printk(KERN_ERR "IPVS: " msg)
#define IP_VS_INFO(msg...) printk(KERN_INFO "IPVS: " msg)
#define IP_VS_WARNING(msg...) \
	printk(KERN_WARNING "IPVS: " msg)

/* KERN_ERR message that is only printed when net_ratelimit() allows it. */
#define IP_VS_ERR_RL(msg...)						\
	do {								\
		if (net_ratelimit())					\
			printk(KERN_ERR "IPVS: " msg);			\
	} while (0)

/*
 * Function entry/exit tracing.
 *
 * With CONFIG_IP_VS_DEBUG set, a KERN_DEBUG line naming the function, file
 * and line is printed when level does not exceed the current debug level.
 * Otherwise both macros are empty statements and level is not evaluated.
 */
#ifdef CONFIG_IP_VS_DEBUG
#define EnterFunction(level)						\
	do {								\
		if ((level) <= ip_vs_get_debug_level())			\
			printk(KERN_DEBUG "Enter: %s, %s line %i\n",	\
			       __func__, __FILE__, __LINE__);		\
	} while (0)
#define LeaveFunction(level)						\
	do {								\
		if ((level) <= ip_vs_get_debug_level())			\
			printk(KERN_DEBUG "Leave: %s, %s line %i\n",	\
			       __func__, __FILE__, __LINE__);		\
	} while (0)
#else
#define EnterFunction(level)   do {} while (0)
#define LeaveFunction(level)   do {} while (0)
#endif

/*
 * Busy-wait, calling cpu_relax() on each iteration, for as long as expr
 * evaluates true.  The do { } while (0) wrapper makes the macro plus its
 * trailing semicolon a single statement, so it is safe in an unbraced
 * if/else.
 */
#define IP_VS_WAIT_WHILE(expr)		\
	do {				\
		while (expr)		\
			cpu_relax();	\
	} while (0)


/*
 *      The port numbers of the FTP service, control (21) and data (20),
 *      in network order.
 */
#define FTPPORT  __constant_htons(21)
#define FTPDATA  __constant_htons(20)

/*
 *      TCP State Values
 *
 *      Numbered consecutively from 0; IP_VS_TCP_S_LAST is the terminating
 *      entry and therefore equals the number of states before it.
 */
enum {
	IP_VS_TCP_S_NONE = 0,
	IP_VS_TCP_S_ESTABLISHED,
	IP_VS_TCP_S_SYN_SENT,
	IP_VS_TCP_S_SYN_RECV,
	IP_VS_TCP_S_FIN_WAIT,
	IP_VS_TCP_S_TIME_WAIT,
	IP_VS_TCP_S_CLOSE,
	IP_VS_TCP_S_CLOSE_WAIT,
	IP_VS_TCP_S_LAST_ACK,
	IP_VS_TCP_S_LISTEN,
	IP_VS_TCP_S_SYNACK,
	IP_VS_TCP_S_LAST
};

/*
 *	UDP State Values
 *
 *	IP_VS_UDP_S_LAST is the terminating entry, not a real state.
 */
enum {
	IP_VS_UDP_S_NORMAL,
	IP_VS_UDP_S_LAST,
};

/*
 *	ICMP State Values
 *
 *	IP_VS_ICMP_S_LAST is the terminating entry, not a real state.
 */
enum {
	IP_VS_ICMP_S_NORMAL,
	IP_VS_ICMP_S_LAST,
};

129/*
130 * Delta sequence info structure
131 * Each ip_vs_conn has 2 (output AND input seq. changes).
132 * Only used in the VS/NAT.
133 */
134struct ip_vs_seq {
135 __u32 init_seq; /* Add delta from this seq */
136 __u32 delta; /* Delta in sequence numbers */
137 __u32 previous_delta; /* Delta in sequence numbers
138 before last resized pkt */
139};
140
141
142/*
143 * IPVS statistics object
144 */
145struct ip_vs_stats
146{
147 __u32 conns; /* connections scheduled */
148 __u32 inpkts; /* incoming packets */
149 __u32 outpkts; /* outgoing packets */
150 __u64 inbytes; /* incoming bytes */
151 __u64 outbytes; /* outgoing bytes */
152
153 __u32 cps; /* current connection rate */
154 __u32 inpps; /* current in packet rate */
155 __u32 outpps; /* current out packet rate */
156 __u32 inbps; /* current in byte rate */
157 __u32 outbps; /* current out byte rate */
158
159 spinlock_t lock; /* spin lock */
160};
161
Arnaldo Carvalho de Melo14c85022005-12-27 02:43:12 -0200162struct dst_entry;
163struct iphdr;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700164struct ip_vs_conn;
165struct ip_vs_app;
Arnaldo Carvalho de Melo14c85022005-12-27 02:43:12 -0200166struct sk_buff;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700167
168struct ip_vs_protocol {
169 struct ip_vs_protocol *next;
170 char *name;
Julian Anastasov2ad17de2008-04-29 03:21:23 -0700171 u16 protocol;
172 u16 num_states;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700173 int dont_defrag;
174 atomic_t appcnt; /* counter of proto app incs */
175 int *timeout_table; /* protocol timeout table */
176
177 void (*init)(struct ip_vs_protocol *pp);
178
179 void (*exit)(struct ip_vs_protocol *pp);
180
181 int (*conn_schedule)(struct sk_buff *skb,
182 struct ip_vs_protocol *pp,
183 int *verdict, struct ip_vs_conn **cpp);
184
185 struct ip_vs_conn *
186 (*conn_in_get)(const struct sk_buff *skb,
187 struct ip_vs_protocol *pp,
188 const struct iphdr *iph,
189 unsigned int proto_off,
190 int inverse);
191
192 struct ip_vs_conn *
193 (*conn_out_get)(const struct sk_buff *skb,
194 struct ip_vs_protocol *pp,
195 const struct iphdr *iph,
196 unsigned int proto_off,
197 int inverse);
198
Herbert Xu3db05fe2007-10-15 00:53:15 -0700199 int (*snat_handler)(struct sk_buff *skb,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700200 struct ip_vs_protocol *pp, struct ip_vs_conn *cp);
201
Herbert Xu3db05fe2007-10-15 00:53:15 -0700202 int (*dnat_handler)(struct sk_buff *skb,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700203 struct ip_vs_protocol *pp, struct ip_vs_conn *cp);
204
205 int (*csum_check)(struct sk_buff *skb, struct ip_vs_protocol *pp);
206
207 const char *(*state_name)(int state);
208
209 int (*state_transition)(struct ip_vs_conn *cp, int direction,
210 const struct sk_buff *skb,
211 struct ip_vs_protocol *pp);
212
213 int (*register_app)(struct ip_vs_app *inc);
214
215 void (*unregister_app)(struct ip_vs_app *inc);
216
217 int (*app_conn_bind)(struct ip_vs_conn *cp);
218
219 void (*debug_packet)(struct ip_vs_protocol *pp,
220 const struct sk_buff *skb,
221 int offset,
222 const char *msg);
223
224 void (*timeout_change)(struct ip_vs_protocol *pp, int flags);
225
226 int (*set_state_timeout)(struct ip_vs_protocol *pp, char *sname, int to);
227};
228
229extern struct ip_vs_protocol * ip_vs_proto_get(unsigned short proto);
230
231/*
232 * IP_VS structure allocated for each dynamically scheduled connection
233 */
234struct ip_vs_conn {
235 struct list_head c_list; /* hashed list heads */
236
237 /* Protocol, addresses and port numbers */
Al Viro014d7302006-09-28 14:29:52 -0700238 __be32 caddr; /* client address */
239 __be32 vaddr; /* virtual address */
240 __be32 daddr; /* destination address */
241 __be16 cport;
242 __be16 vport;
243 __be16 dport;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700244 __u16 protocol; /* Which protocol (TCP/UDP) */
245
246 /* counter and timer */
247 atomic_t refcnt; /* reference count */
248 struct timer_list timer; /* Expiration timer */
249 volatile unsigned long timeout; /* timeout */
250
251 /* Flags and state transition */
252 spinlock_t lock; /* lock for state transition */
253 volatile __u16 flags; /* status flags */
254 volatile __u16 state; /* state info */
Rumen G. Bogdanovskiefac5272007-11-07 02:36:55 -0800255 volatile __u16 old_state; /* old state, to be used for
256 * state transition triggerd
257 * synchronization
258 */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700259
260 /* Control members */
261 struct ip_vs_conn *control; /* Master control connection */
262 atomic_t n_control; /* Number of controlled ones */
263 struct ip_vs_dest *dest; /* real server */
264 atomic_t in_pkts; /* incoming packet counter */
265
266 /* packet transmitter for different forwarding methods. If it
267 mangles the packet, it must return NF_DROP or better NF_STOLEN,
268 otherwise this must be changed to a sk_buff **.
269 */
270 int (*packet_xmit)(struct sk_buff *skb, struct ip_vs_conn *cp,
271 struct ip_vs_protocol *pp);
272
273 /* Note: we can group the following members into a structure,
274 in order to save more space, and the following members are
275 only used in VS/NAT anyway */
276 struct ip_vs_app *app; /* bound ip_vs_app object */
277 void *app_data; /* Application private data */
278 struct ip_vs_seq in_seq; /* incoming seq. struct */
279 struct ip_vs_seq out_seq; /* outgoing seq. struct */
280};
281
282
283/*
284 * The information about the virtual service offered to the net
285 * and the forwarding entries
286 */
287struct ip_vs_service {
288 struct list_head s_list; /* for normal service table */
289 struct list_head f_list; /* for fwmark-based service table */
290 atomic_t refcnt; /* reference counter */
291 atomic_t usecnt; /* use counter */
292
293 __u16 protocol; /* which protocol (TCP/UDP) */
Al Viro014d7302006-09-28 14:29:52 -0700294 __be32 addr; /* IP address for virtual service */
295 __be16 port; /* port number for the service */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700296 __u32 fwmark; /* firewall mark of the service */
297 unsigned flags; /* service status flags */
298 unsigned timeout; /* persistent timeout in ticks */
Al Viro014d7302006-09-28 14:29:52 -0700299 __be32 netmask; /* grouping granularity */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700300
301 struct list_head destinations; /* real server d-linked list */
302 __u32 num_dests; /* number of servers */
303 struct ip_vs_stats stats; /* statistics for the service */
304 struct ip_vs_app *inc; /* bind conns to this app inc */
305
306 /* for scheduling */
307 struct ip_vs_scheduler *scheduler; /* bound scheduler object */
308 rwlock_t sched_lock; /* lock sched_data */
309 void *sched_data; /* scheduler application data */
310};
311
312
313/*
314 * The real server destination forwarding entry
315 * with ip address, port number, and so on.
316 */
317struct ip_vs_dest {
318 struct list_head n_list; /* for the dests in the service */
319 struct list_head d_list; /* for table with all the dests */
320
Al Viro014d7302006-09-28 14:29:52 -0700321 __be32 addr; /* IP address of the server */
322 __be16 port; /* port number of the server */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700323 volatile unsigned flags; /* dest status flags */
324 atomic_t conn_flags; /* flags to copy to conn */
325 atomic_t weight; /* server weight */
326
327 atomic_t refcnt; /* reference counter */
328 struct ip_vs_stats stats; /* statistics */
329
330 /* connection counters and thresholds */
331 atomic_t activeconns; /* active connections */
332 atomic_t inactconns; /* inactive connections */
333 atomic_t persistconns; /* persistent connections */
334 __u32 u_threshold; /* upper threshold */
335 __u32 l_threshold; /* lower threshold */
336
337 /* for destination cache */
338 spinlock_t dst_lock; /* lock of dst_cache */
339 struct dst_entry *dst_cache; /* destination cache entry */
340 u32 dst_rtos; /* RT_TOS(tos) for dst */
341
342 /* for virtual service */
343 struct ip_vs_service *svc; /* service it belongs to */
344 __u16 protocol; /* which protocol (TCP/UDP) */
Al Viro014d7302006-09-28 14:29:52 -0700345 __be32 vaddr; /* virtual IP address */
346 __be16 vport; /* virtual port number */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700347 __u32 vfwmark; /* firewall mark of service */
348};
349
350
351/*
352 * The scheduler object
353 */
354struct ip_vs_scheduler {
355 struct list_head n_list; /* d-linked list head */
356 char *name; /* scheduler name */
357 atomic_t refcnt; /* reference counter */
358 struct module *module; /* THIS_MODULE/NULL */
359
360 /* scheduler initializing service */
361 int (*init_service)(struct ip_vs_service *svc);
362 /* scheduling service finish */
363 int (*done_service)(struct ip_vs_service *svc);
364 /* scheduler updating service */
365 int (*update_service)(struct ip_vs_service *svc);
366
367 /* selecting a server from the given service */
368 struct ip_vs_dest* (*schedule)(struct ip_vs_service *svc,
369 const struct sk_buff *skb);
370};
371
372
373/*
374 * The application module object (a.k.a. app incarnation)
375 */
376struct ip_vs_app
377{
378 struct list_head a_list; /* member in app list */
379 int type; /* IP_VS_APP_TYPE_xxx */
380 char *name; /* application module name */
381 __u16 protocol;
382 struct module *module; /* THIS_MODULE/NULL */
383 struct list_head incs_list; /* list of incarnations */
384
385 /* members for application incarnations */
386 struct list_head p_list; /* member in proto app list */
387 struct ip_vs_app *app; /* its real application */
Al Viro014d7302006-09-28 14:29:52 -0700388 __be16 port; /* port number in net order */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700389 atomic_t usecnt; /* usage counter */
390
391 /* output hook: return false if can't linearize. diff set for TCP. */
392 int (*pkt_out)(struct ip_vs_app *, struct ip_vs_conn *,
Herbert Xu3db05fe2007-10-15 00:53:15 -0700393 struct sk_buff *, int *diff);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700394
395 /* input hook: return false if can't linearize. diff set for TCP. */
396 int (*pkt_in)(struct ip_vs_app *, struct ip_vs_conn *,
Herbert Xu3db05fe2007-10-15 00:53:15 -0700397 struct sk_buff *, int *diff);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700398
399 /* ip_vs_app initializer */
400 int (*init_conn)(struct ip_vs_app *, struct ip_vs_conn *);
401
402 /* ip_vs_app finish */
403 int (*done_conn)(struct ip_vs_app *, struct ip_vs_conn *);
404
405
406 /* not used now */
407 int (*bind_conn)(struct ip_vs_app *, struct ip_vs_conn *,
408 struct ip_vs_protocol *);
409
410 void (*unbind_conn)(struct ip_vs_app *, struct ip_vs_conn *);
411
412 int * timeout_table;
413 int * timeouts;
414 int timeouts_size;
415
416 int (*conn_schedule)(struct sk_buff *skb, struct ip_vs_app *app,
417 int *verdict, struct ip_vs_conn **cpp);
418
419 struct ip_vs_conn *
420 (*conn_in_get)(const struct sk_buff *skb, struct ip_vs_app *app,
421 const struct iphdr *iph, unsigned int proto_off,
422 int inverse);
423
424 struct ip_vs_conn *
425 (*conn_out_get)(const struct sk_buff *skb, struct ip_vs_app *app,
426 const struct iphdr *iph, unsigned int proto_off,
427 int inverse);
428
429 int (*state_transition)(struct ip_vs_conn *cp, int direction,
430 const struct sk_buff *skb,
431 struct ip_vs_app *app);
432
433 void (*timeout_change)(struct ip_vs_app *app, int flags);
434};
435
436
/*
 *      IPVS core functions
 *      (from ip_vs_core.c)
 */
extern const char *ip_vs_proto_name(unsigned proto);
extern void ip_vs_init_hash_table(struct list_head *table, int rows);

/*
 * Initialise every row of the list_head array t.  t must be a real array
 * (not a pointer) because the row count is taken with ARRAY_SIZE().
 */
#define IP_VS_INIT_HASH_TABLE(t) ip_vs_init_hash_table((t), ARRAY_SIZE((t)))

#define IP_VS_APP_TYPE_FTP	1

/*
 *     ip_vs_conn handling functions
 *     (from ip_vs_conn.c)
 */

/*
 *     IPVS connection entry hash table
 *
 *     CONFIG_IP_VS_TAB_BITS defaults to 12 when it is not defined.
 */
#ifndef CONFIG_IP_VS_TAB_BITS
#define CONFIG_IP_VS_TAB_BITS   12
#endif

/* make sure that IP_VS_CONN_TAB_BITS is located in [8, 20] */
#if CONFIG_IP_VS_TAB_BITS < 8
#define IP_VS_CONN_TAB_BITS	8
#elif CONFIG_IP_VS_TAB_BITS > 20
#define IP_VS_CONN_TAB_BITS	20
#else
#define IP_VS_CONN_TAB_BITS	CONFIG_IP_VS_TAB_BITS
#endif

/* number of hash rows, and the mask reducing a hash value to a row index */
#define IP_VS_CONN_TAB_SIZE     (1 << IP_VS_CONN_TAB_BITS)
#define IP_VS_CONN_TAB_MASK     (IP_VS_CONN_TAB_SIZE - 1)

/*
 * Packet direction values; IP_VS_DIR_LAST is the terminating entry.
 */
enum {
	IP_VS_DIR_INPUT = 0,
	IP_VS_DIR_OUTPUT,
	IP_VS_DIR_INPUT_ONLY,
	IP_VS_DIR_LAST,
};

478extern struct ip_vs_conn *ip_vs_conn_in_get
Al Viro014d7302006-09-28 14:29:52 -0700479(int protocol, __be32 s_addr, __be16 s_port, __be32 d_addr, __be16 d_port);
Julian Anastasov87375ab2005-09-14 21:08:51 -0700480extern struct ip_vs_conn *ip_vs_ct_in_get
Al Viro014d7302006-09-28 14:29:52 -0700481(int protocol, __be32 s_addr, __be16 s_port, __be32 d_addr, __be16 d_port);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700482extern struct ip_vs_conn *ip_vs_conn_out_get
Al Viro014d7302006-09-28 14:29:52 -0700483(int protocol, __be32 s_addr, __be16 s_port, __be32 d_addr, __be16 d_port);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700484
485/* put back the conn without restarting its timer */
486static inline void __ip_vs_conn_put(struct ip_vs_conn *cp)
487{
488 atomic_dec(&cp->refcnt);
489}
490extern void ip_vs_conn_put(struct ip_vs_conn *cp);
Al Viro014d7302006-09-28 14:29:52 -0700491extern void ip_vs_conn_fill_cport(struct ip_vs_conn *cp, __be16 cport);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700492
493extern struct ip_vs_conn *
Al Viro014d7302006-09-28 14:29:52 -0700494ip_vs_conn_new(int proto, __be32 caddr, __be16 cport, __be32 vaddr, __be16 vport,
495 __be32 daddr, __be16 dport, unsigned flags,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700496 struct ip_vs_dest *dest);
497extern void ip_vs_conn_expire_now(struct ip_vs_conn *cp);
498
499extern const char * ip_vs_state_name(__u16 proto, int state);
500
501extern void ip_vs_tcp_conn_listen(struct ip_vs_conn *cp);
502extern int ip_vs_check_template(struct ip_vs_conn *ct);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700503extern void ip_vs_random_dropentry(void);
504extern int ip_vs_conn_init(void);
505extern void ip_vs_conn_cleanup(void);
506
507static inline void ip_vs_control_del(struct ip_vs_conn *cp)
508{
509 struct ip_vs_conn *ctl_cp = cp->control;
510 if (!ctl_cp) {
511 IP_VS_ERR("request control DEL for uncontrolled: "
512 "%d.%d.%d.%d:%d to %d.%d.%d.%d:%d\n",
513 NIPQUAD(cp->caddr),ntohs(cp->cport),
514 NIPQUAD(cp->vaddr),ntohs(cp->vport));
515 return;
516 }
517
518 IP_VS_DBG(7, "DELeting control for: "
519 "cp.dst=%d.%d.%d.%d:%d ctl_cp.dst=%d.%d.%d.%d:%d\n",
520 NIPQUAD(cp->caddr),ntohs(cp->cport),
521 NIPQUAD(ctl_cp->caddr),ntohs(ctl_cp->cport));
522
523 cp->control = NULL;
524 if (atomic_read(&ctl_cp->n_control) == 0) {
525 IP_VS_ERR("BUG control DEL with n=0 : "
526 "%d.%d.%d.%d:%d to %d.%d.%d.%d:%d\n",
527 NIPQUAD(cp->caddr),ntohs(cp->cport),
528 NIPQUAD(cp->vaddr),ntohs(cp->vport));
529 return;
530 }
531 atomic_dec(&ctl_cp->n_control);
532}
533
534static inline void
535ip_vs_control_add(struct ip_vs_conn *cp, struct ip_vs_conn *ctl_cp)
536{
537 if (cp->control) {
538 IP_VS_ERR("request control ADD for already controlled: "
539 "%d.%d.%d.%d:%d to %d.%d.%d.%d:%d\n",
540 NIPQUAD(cp->caddr),ntohs(cp->cport),
541 NIPQUAD(cp->vaddr),ntohs(cp->vport));
542 ip_vs_control_del(cp);
543 }
544
545 IP_VS_DBG(7, "ADDing control for: "
546 "cp.dst=%d.%d.%d.%d:%d ctl_cp.dst=%d.%d.%d.%d:%d\n",
547 NIPQUAD(cp->caddr),ntohs(cp->cport),
548 NIPQUAD(ctl_cp->caddr),ntohs(ctl_cp->cport));
549
550 cp->control = ctl_cp;
551 atomic_inc(&ctl_cp->n_control);
552}
553
554
555/*
556 * IPVS application functions
557 * (from ip_vs_app.c)
558 */
559#define IP_VS_APP_MAX_PORTS 8
560extern int register_ip_vs_app(struct ip_vs_app *app);
561extern void unregister_ip_vs_app(struct ip_vs_app *app);
562extern int ip_vs_bind_app(struct ip_vs_conn *cp, struct ip_vs_protocol *pp);
563extern void ip_vs_unbind_app(struct ip_vs_conn *cp);
564extern int
565register_ip_vs_app_inc(struct ip_vs_app *app, __u16 proto, __u16 port);
566extern int ip_vs_app_inc_get(struct ip_vs_app *inc);
567extern void ip_vs_app_inc_put(struct ip_vs_app *inc);
568
Herbert Xu3db05fe2007-10-15 00:53:15 -0700569extern int ip_vs_app_pkt_out(struct ip_vs_conn *, struct sk_buff *skb);
570extern int ip_vs_app_pkt_in(struct ip_vs_conn *, struct sk_buff *skb);
Al Virodd0fc662005-10-07 07:46:04 +0100571extern int ip_vs_skb_replace(struct sk_buff *skb, gfp_t pri,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700572 char *o_buf, int o_len, char *n_buf, int n_len);
573extern int ip_vs_app_init(void);
574extern void ip_vs_app_cleanup(void);
575
576
/*
 *	IPVS protocol functions (from ip_vs_proto.c)
 */
extern int ip_vs_protocol_init(void);
extern void ip_vs_protocol_cleanup(void);
extern void ip_vs_protocol_timeout_change(int flags);
extern int *ip_vs_create_timeout_table(int *table, int size);
extern int
ip_vs_set_state_timeout(int *table, int num, char **names, char *name, int to);
extern void
ip_vs_tcpudp_debug_packet(struct ip_vs_protocol *pp, const struct sk_buff *skb,
			  int offset, const char *msg);

/* protocol objects declared here and defined elsewhere */
extern struct ip_vs_protocol ip_vs_protocol_tcp;
extern struct ip_vs_protocol ip_vs_protocol_udp;
extern struct ip_vs_protocol ip_vs_protocol_icmp;
extern struct ip_vs_protocol ip_vs_protocol_esp;
extern struct ip_vs_protocol ip_vs_protocol_ah;


/*
 *      Registering/unregistering scheduler functions
 *      (from ip_vs_sched.c)
 */
extern int register_ip_vs_scheduler(struct ip_vs_scheduler *scheduler);
extern int unregister_ip_vs_scheduler(struct ip_vs_scheduler *scheduler);
extern int ip_vs_bind_scheduler(struct ip_vs_service *svc,
				struct ip_vs_scheduler *scheduler);
extern int ip_vs_unbind_scheduler(struct ip_vs_service *svc);
extern struct ip_vs_scheduler *ip_vs_scheduler_get(const char *sched_name);
extern void ip_vs_scheduler_put(struct ip_vs_scheduler *scheduler);
extern struct ip_vs_conn *
ip_vs_schedule(struct ip_vs_service *svc, const struct sk_buff *skb);
extern int ip_vs_leave(struct ip_vs_service *svc, struct sk_buff *skb,
			struct ip_vs_protocol *pp);


614/*
615 * IPVS control data and functions (from ip_vs_ctl.c)
616 */
617extern int sysctl_ip_vs_cache_bypass;
618extern int sysctl_ip_vs_expire_nodest_conn;
619extern int sysctl_ip_vs_expire_quiescent_template;
620extern int sysctl_ip_vs_sync_threshold[2];
621extern int sysctl_ip_vs_nat_icmp_send;
622extern struct ip_vs_stats ip_vs_stats;
Sven Wegener5587da52008-08-10 18:24:40 +0000623extern const struct ctl_path net_vs_ctl_path[];
Linus Torvalds1da177e2005-04-16 15:20:36 -0700624
625extern struct ip_vs_service *
Al Viro014d7302006-09-28 14:29:52 -0700626ip_vs_service_get(__u32 fwmark, __u16 protocol, __be32 vaddr, __be16 vport);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700627
628static inline void ip_vs_service_put(struct ip_vs_service *svc)
629{
630 atomic_dec(&svc->usecnt);
631}
632
633extern struct ip_vs_dest *
Al Viro014d7302006-09-28 14:29:52 -0700634ip_vs_lookup_real_service(__u16 protocol, __be32 daddr, __be16 dport);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700635extern int ip_vs_use_count_inc(void);
636extern void ip_vs_use_count_dec(void);
637extern int ip_vs_control_init(void);
638extern void ip_vs_control_cleanup(void);
Rumen G. Bogdanovski1e356f92007-11-07 02:35:54 -0800639extern struct ip_vs_dest *
640ip_vs_find_dest(__be32 daddr, __be16 dport,
641 __be32 vaddr, __be16 vport, __u16 protocol);
642extern struct ip_vs_dest *ip_vs_try_bind_dest(struct ip_vs_conn *cp);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700643
644
645/*
646 * IPVS sync daemon data and function prototypes
647 * (from ip_vs_sync.c)
648 */
649extern volatile int ip_vs_sync_state;
650extern volatile int ip_vs_master_syncid;
651extern volatile int ip_vs_backup_syncid;
652extern char ip_vs_master_mcast_ifn[IP_VS_IFNAME_MAXLEN];
653extern char ip_vs_backup_mcast_ifn[IP_VS_IFNAME_MAXLEN];
654extern int start_sync_thread(int state, char *mcast_ifn, __u8 syncid);
655extern int stop_sync_thread(int state);
656extern void ip_vs_sync_conn(struct ip_vs_conn *cp);
657
658
/*
 *      IPVS rate estimator prototypes (from ip_vs_est.c)
 */
extern int ip_vs_new_estimator(struct ip_vs_stats *stats);
extern void ip_vs_kill_estimator(struct ip_vs_stats *stats);
extern void ip_vs_zero_estimator(struct ip_vs_stats *stats);

/*
 *	Various IPVS packet transmitters (from ip_vs_xmit.c)
 *
 *	All but ip_vs_icmp_xmit() share the signature of the packet_xmit
 *	member of struct ip_vs_conn; ip_vs_icmp_xmit() takes an extra offset.
 */
extern int ip_vs_null_xmit
(struct sk_buff *skb, struct ip_vs_conn *cp, struct ip_vs_protocol *pp);
extern int ip_vs_bypass_xmit
(struct sk_buff *skb, struct ip_vs_conn *cp, struct ip_vs_protocol *pp);
extern int ip_vs_nat_xmit
(struct sk_buff *skb, struct ip_vs_conn *cp, struct ip_vs_protocol *pp);
extern int ip_vs_tunnel_xmit
(struct sk_buff *skb, struct ip_vs_conn *cp, struct ip_vs_protocol *pp);
extern int ip_vs_dr_xmit
(struct sk_buff *skb, struct ip_vs_conn *cp, struct ip_vs_protocol *pp);
extern int ip_vs_icmp_xmit
(struct sk_buff *skb, struct ip_vs_conn *cp, struct ip_vs_protocol *pp, int offset);
extern void ip_vs_dst_reset(struct ip_vs_dest *dest);


/*
 *	This is a simple mechanism to ignore packets when
 *	we are loaded. Just set ip_vs_drop_rate to 'n' and
 *	we start to drop 1/rate of the packets
 */
extern int ip_vs_drop_rate;
extern int ip_vs_drop_counter;

/*
 * Decide whether the current packet should be dropped.
 *
 * Returns 0 when ip_vs_drop_rate is zero.  Otherwise ip_vs_drop_counter is
 * decremented on every call; when it is no longer positive it is reloaded
 * from ip_vs_drop_rate and 1 is returned, else 0.
 */
static __inline__ int ip_vs_todrop(void)
{
	if (!ip_vs_drop_rate)
		return 0;
	if (--ip_vs_drop_counter > 0)
		return 0;

	ip_vs_drop_counter = ip_vs_drop_rate;
	return 1;
}

/*
 *      IP_VS_FWD_METHOD extracts the forwarding-method bits
 *      (IP_VS_CONN_F_FWD_MASK) from the flags of the connection cp.
 *      cp may be any pointer expression; it is evaluated once.
 */
#define IP_VS_FWD_METHOD(cp)  ((cp)->flags & IP_VS_CONN_F_FWD_MASK)

Adrian Bunk732db652005-09-01 17:40:26 -0700705static inline char ip_vs_fwd_tag(struct ip_vs_conn *cp)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700706{
707 char fwd;
708
709 switch (IP_VS_FWD_METHOD(cp)) {
710 case IP_VS_CONN_F_MASQ:
711 fwd = 'M'; break;
712 case IP_VS_CONN_F_LOCALNODE:
713 fwd = 'L'; break;
714 case IP_VS_CONN_F_TUNNEL:
715 fwd = 'T'; break;
716 case IP_VS_CONN_F_DROUTE:
717 fwd = 'R'; break;
718 case IP_VS_CONN_F_BYPASS:
719 fwd = 'B'; break;
720 default:
721 fwd = '?'; break;
722 }
723 return fwd;
724}
725
Linus Torvalds1da177e2005-04-16 15:20:36 -0700726extern void ip_vs_nat_icmp(struct sk_buff *skb, struct ip_vs_protocol *pp,
727 struct ip_vs_conn *cp, int dir);
728
Al Virob1550f22006-11-14 21:37:50 -0800729extern __sum16 ip_vs_checksum_complete(struct sk_buff *skb, int offset);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700730
Al Virof9214b22006-11-16 02:41:18 -0800731static inline __wsum ip_vs_check_diff4(__be32 old, __be32 new, __wsum oldsum)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700732{
Al Virof9214b22006-11-16 02:41:18 -0800733 __be32 diff[2] = { ~old, new };
Linus Torvalds1da177e2005-04-16 15:20:36 -0700734
Al Virof9214b22006-11-16 02:41:18 -0800735 return csum_partial((char *) diff, sizeof(diff), oldsum);
736}
737
738static inline __wsum ip_vs_check_diff2(__be16 old, __be16 new, __wsum oldsum)
739{
740 __be16 diff[2] = { ~old, new };
741
742 return csum_partial((char *) diff, sizeof(diff), oldsum);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700743}
744
745#endif /* __KERNEL__ */
746
Julius Volzbc4768e2008-07-31 20:45:24 -0700747#endif /* _NET_IP_VS_H */