blob: b5ccf2b4b2e729d6ba31c959cc34c43efbe784df [file] [log] [blame]
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -08001/* (C) 1999-2001 Paul `Rusty' Russell
2 * (C) 2002-2004 Netfilter Core Team <coreteam@netfilter.org>
3 *
4 * This program is free software; you can redistribute it and/or modify
5 * it under the terms of the GNU General Public License version 2 as
6 * published by the Free Software Foundation.
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -08007 */
8
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -08009#include <linux/types.h>
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -080010#include <linux/timer.h>
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -080011#include <linux/module.h>
12#include <linux/in.h>
13#include <linux/tcp.h>
14#include <linux/spinlock.h>
15#include <linux/skbuff.h>
16#include <linux/ipv6.h>
17#include <net/ip6_checksum.h>
Mark H. Weaver534f81a2009-03-23 13:46:12 +010018#include <asm/unaligned.h>
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -080019
20#include <net/tcp.h>
21
22#include <linux/netfilter.h>
23#include <linux/netfilter_ipv4.h>
24#include <linux/netfilter_ipv6.h>
25#include <net/netfilter/nf_conntrack.h>
Martin Josefsson605dcad2006-11-29 02:35:06 +010026#include <net/netfilter/nf_conntrack_l4proto.h>
Martin Josefssonf6180122006-11-29 02:35:01 +010027#include <net/netfilter/nf_conntrack_ecache.h>
Patrick McHardyf01ffbd2007-12-17 22:38:49 -080028#include <net/netfilter/nf_log.h>
Christoph Paasch9d2493f2009-03-16 15:15:35 +010029#include <net/netfilter/ipv4/nf_conntrack_ipv4.h>
30#include <net/netfilter/ipv6/nf_conntrack_ipv6.h>
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -080031
/*
 * Serializes access to the per-connection TCP tracking state
 * kept in ct->proto.tcp.
 */
static DEFINE_RWLOCK(tcp_lock);
34
YOSHIFUJI Hideaki601e68e2007-02-12 11:15:49 -080035/* "Be conservative in what you do,
36 be liberal in what you accept from others."
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -080037 If it's non-zero, we mark only out of window RST segments as INVALID. */
Patrick McHardy3aef0fd2007-02-12 11:16:58 -080038static int nf_ct_tcp_be_liberal __read_mostly = 0;
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -080039
Patrick McHardya09113c2007-02-07 15:05:33 -080040/* If it is set to zero, we disable picking up already established
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -080041 connections. */
Patrick McHardy3aef0fd2007-02-12 11:16:58 -080042static int nf_ct_tcp_loose __read_mostly = 1;
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -080043
YOSHIFUJI Hideaki601e68e2007-02-12 11:15:49 -080044/* Max number of the retransmitted packets without receiving an (acceptable)
45 ACK from the destination. If this number is reached, a shorter timer
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -080046 will be started. */
Patrick McHardy3aef0fd2007-02-12 11:16:58 -080047static int nf_ct_tcp_max_retrans __read_mostly = 3;
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -080048
49 /* FIXME: Examine ipfilter's timeouts and conntrack transitions more
50 closely. They're more complex. --RR */
51
/*
 * Printable names of the TCP conntrack states.  The array is indexed
 * with the numeric state value, so the order of the entries matters.
 */
static const char *const tcp_conntrack_names[] = {
	/* 0 */ "NONE",
	/* 1 */ "SYN_SENT",
	/* 2 */ "SYN_RECV",
	/* 3 */ "ESTABLISHED",
	/* 4 */ "FIN_WAIT",
	/* 5 */ "CLOSE_WAIT",
	/* 6 */ "LAST_ACK",
	/* 7 */ "TIME_WAIT",
	/* 8 */ "CLOSE",
	/* 9 */ "LISTEN"
};
YOSHIFUJI Hideaki601e68e2007-02-12 11:15:49 -080064
/*
 * Postfix-style time unit helpers: a number followed by one of these
 * expands to a multiplication chain ending in HZ, e.g. "2 MINS" becomes
 * "2 * 60 * HZ".  Each unit is defined in terms of the next smaller one.
 */
#define SECS	* HZ
#define MINS	* 60 SECS
#define HOURS	* 60 MINS
#define DAYS	* 24 HOURS
69
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -080070/* RFC1122 says the R2 limit should be at least 100 seconds.
YOSHIFUJI Hideaki601e68e2007-02-12 11:15:49 -080071 Linux uses 15 packets as limit, which corresponds
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -080072 to ~13-30min depending on RTO. */
Patrick McHardyae375042008-07-31 00:38:01 -070073static unsigned int nf_ct_tcp_timeout_max_retrans __read_mostly = 5 MINS;
74static unsigned int nf_ct_tcp_timeout_unacknowledged __read_mostly = 5 MINS;
YOSHIFUJI Hideaki601e68e2007-02-12 11:15:49 -080075
Patrick McHardy2d646282008-01-14 23:45:32 -080076static unsigned int tcp_timeouts[TCP_CONNTRACK_MAX] __read_mostly = {
77 [TCP_CONNTRACK_SYN_SENT] = 2 MINS,
78 [TCP_CONNTRACK_SYN_RECV] = 60 SECS,
79 [TCP_CONNTRACK_ESTABLISHED] = 5 DAYS,
80 [TCP_CONNTRACK_FIN_WAIT] = 2 MINS,
81 [TCP_CONNTRACK_CLOSE_WAIT] = 60 SECS,
82 [TCP_CONNTRACK_LAST_ACK] = 30 SECS,
83 [TCP_CONNTRACK_TIME_WAIT] = 2 MINS,
84 [TCP_CONNTRACK_CLOSE] = 10 SECS,
85};
YOSHIFUJI Hideaki601e68e2007-02-12 11:15:49 -080086
/*
 * Short aliases for the conntrack states, used to keep the state
 * transition table readable.  sIV (invalid) and sIG (ignore) are
 * pseudo-states that only appear as table results.
 */
#define sNO	TCP_CONNTRACK_NONE
#define sSS	TCP_CONNTRACK_SYN_SENT
#define sSR	TCP_CONNTRACK_SYN_RECV
#define sES	TCP_CONNTRACK_ESTABLISHED
#define sFW	TCP_CONNTRACK_FIN_WAIT
#define sCW	TCP_CONNTRACK_CLOSE_WAIT
#define sLA	TCP_CONNTRACK_LAST_ACK
#define sTW	TCP_CONNTRACK_TIME_WAIT
#define sCL	TCP_CONNTRACK_CLOSE
#define sLI	TCP_CONNTRACK_LISTEN
#define sIV	TCP_CONNTRACK_MAX
#define sIG	TCP_CONNTRACK_IGNORE
99
/*
 * Classification of a segment by its RST/SYN/FIN/ACK flags.  The values
 * are used as the second index of the state transition table, so they
 * must stay dense and start at zero.
 */
enum tcp_bit_set {
	TCP_SYN_SET	= 0,
	TCP_SYNACK_SET	= 1,
	TCP_FIN_SET	= 2,
	TCP_ACK_SET	= 3,
	TCP_RST_SET	= 4,
	TCP_NONE_SET	= 5,
};
YOSHIFUJI Hideaki601e68e2007-02-12 11:15:49 -0800109
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800110/*
111 * The TCP state transition table needs a few words...
112 *
113 * We are the man in the middle. All the packets go through us
114 * but might get lost in transit to the destination.
YOSHIFUJI Hideaki601e68e2007-02-12 11:15:49 -0800115 * It is assumed that the destinations can't receive segments
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800116 * we haven't seen.
117 *
118 * The checked segment is in window, but our windows are *not*
119 * equivalent with the ones of the sender/receiver. We always
120 * try to guess the state of the current sender.
121 *
122 * The meaning of the states are:
123 *
124 * NONE: initial state
YOSHIFUJI Hideaki601e68e2007-02-12 11:15:49 -0800125 * SYN_SENT: SYN-only packet seen
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800126 * SYN_RECV: SYN-ACK packet seen
127 * ESTABLISHED: ACK packet seen
128 * FIN_WAIT: FIN packet seen
YOSHIFUJI Hideaki601e68e2007-02-12 11:15:49 -0800129 * CLOSE_WAIT: ACK seen (after FIN)
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800130 * LAST_ACK: FIN seen (after FIN)
131 * TIME_WAIT: last ACK seen
Jozsef Kadlecsikb2155e72008-02-07 17:54:56 -0800132 * CLOSE: closed connection (RST)
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800133 *
134 * LISTEN state is not used.
135 *
136 * Packets marked as IGNORED (sIG):
YOSHIFUJI Hideaki601e68e2007-02-12 11:15:49 -0800137 * if they may be either invalid or valid
138 * and the receiver may send back a connection
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800139 * closing RST or a SYN/ACK.
140 *
141 * Packets marked as INVALID (sIV):
142 * if they are invalid
143 * or we do not support the request (simultaneous open)
144 */
Patrick McHardya5e73c22008-01-14 23:45:11 -0800145static const u8 tcp_conntracks[2][6][TCP_CONNTRACK_MAX] = {
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800146 {
147/* ORIGINAL */
148/* sNO, sSS, sSR, sES, sFW, sCW, sLA, sTW, sCL, sLI */
149/*syn*/ { sSS, sSS, sIG, sIG, sIG, sIG, sIG, sSS, sSS, sIV },
150/*
151 * sNO -> sSS Initialize a new connection
152 * sSS -> sSS Retransmitted SYN
153 * sSR -> sIG Late retransmitted SYN?
154 * sES -> sIG Error: SYNs in window outside the SYN_SENT state
YOSHIFUJI Hideaki601e68e2007-02-12 11:15:49 -0800155 * are errors. Receiver will reply with RST
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800156 * and close the connection.
157 * Or we are not in sync and hold a dead connection.
158 * sFW -> sIG
159 * sCW -> sIG
160 * sLA -> sIG
161 * sTW -> sSS Reopened connection (RFC 1122).
162 * sCL -> sSS
163 */
164/* sNO, sSS, sSR, sES, sFW, sCW, sLA, sTW, sCL, sLI */
165/*synack*/ { sIV, sIV, sIV, sIV, sIV, sIV, sIV, sIV, sIV, sIV },
166/*
167 * A SYN/ACK from the client is always invalid:
YOSHIFUJI Hideaki601e68e2007-02-12 11:15:49 -0800168 * - either it tries to set up a simultaneous open, which is
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800169 * not supported;
170 * - or the firewall has just been inserted between the two hosts
YOSHIFUJI Hideaki601e68e2007-02-12 11:15:49 -0800171 * during the session set-up. The SYN will be retransmitted
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800172 * by the true client (or it'll time out).
173 */
174/* sNO, sSS, sSR, sES, sFW, sCW, sLA, sTW, sCL, sLI */
175/*fin*/ { sIV, sIV, sFW, sFW, sLA, sLA, sLA, sTW, sCL, sIV },
176/*
177 * sNO -> sIV Too late and no reason to do anything...
178 * sSS -> sIV Client migth not send FIN in this state:
179 * we enforce waiting for a SYN/ACK reply first.
180 * sSR -> sFW Close started.
181 * sES -> sFW
182 * sFW -> sLA FIN seen in both directions, waiting for
YOSHIFUJI Hideaki601e68e2007-02-12 11:15:49 -0800183 * the last ACK.
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800184 * Migth be a retransmitted FIN as well...
185 * sCW -> sLA
186 * sLA -> sLA Retransmitted FIN. Remain in the same state.
187 * sTW -> sTW
188 * sCL -> sCL
189 */
190/* sNO, sSS, sSR, sES, sFW, sCW, sLA, sTW, sCL, sLI */
191/*ack*/ { sES, sIV, sES, sES, sCW, sCW, sTW, sTW, sCL, sIV },
192/*
193 * sNO -> sES Assumed.
194 * sSS -> sIV ACK is invalid: we haven't seen a SYN/ACK yet.
195 * sSR -> sES Established state is reached.
196 * sES -> sES :-)
197 * sFW -> sCW Normal close request answered by ACK.
198 * sCW -> sCW
199 * sLA -> sTW Last ACK detected.
200 * sTW -> sTW Retransmitted last ACK. Remain in the same state.
201 * sCL -> sCL
202 */
203/* sNO, sSS, sSR, sES, sFW, sCW, sLA, sTW, sCL, sLI */
204/*rst*/ { sIV, sCL, sCL, sCL, sCL, sCL, sCL, sCL, sCL, sIV },
205/*none*/ { sIV, sIV, sIV, sIV, sIV, sIV, sIV, sIV, sIV, sIV }
206 },
207 {
208/* REPLY */
209/* sNO, sSS, sSR, sES, sFW, sCW, sLA, sTW, sCL, sLI */
210/*syn*/ { sIV, sIV, sIV, sIV, sIV, sIV, sIV, sIV, sIV, sIV },
211/*
212 * sNO -> sIV Never reached.
213 * sSS -> sIV Simultaneous open, not supported
214 * sSR -> sIV Simultaneous open, not supported.
215 * sES -> sIV Server may not initiate a connection.
216 * sFW -> sIV
217 * sCW -> sIV
218 * sLA -> sIV
219 * sTW -> sIV Reopened connection, but server may not do it.
220 * sCL -> sIV
221 */
222/* sNO, sSS, sSR, sES, sFW, sCW, sLA, sTW, sCL, sLI */
223/*synack*/ { sIV, sSR, sSR, sIG, sIG, sIG, sIG, sIG, sIG, sIV },
224/*
225 * sSS -> sSR Standard open.
226 * sSR -> sSR Retransmitted SYN/ACK.
227 * sES -> sIG Late retransmitted SYN/ACK?
228 * sFW -> sIG Might be SYN/ACK answering ignored SYN
229 * sCW -> sIG
230 * sLA -> sIG
231 * sTW -> sIG
232 * sCL -> sIG
233 */
234/* sNO, sSS, sSR, sES, sFW, sCW, sLA, sTW, sCL, sLI */
235/*fin*/ { sIV, sIV, sFW, sFW, sLA, sLA, sLA, sTW, sCL, sIV },
236/*
237 * sSS -> sIV Server might not send FIN in this state.
238 * sSR -> sFW Close started.
239 * sES -> sFW
240 * sFW -> sLA FIN seen in both directions.
241 * sCW -> sLA
242 * sLA -> sLA Retransmitted FIN.
243 * sTW -> sTW
244 * sCL -> sCL
245 */
246/* sNO, sSS, sSR, sES, sFW, sCW, sLA, sTW, sCL, sLI */
Jozsef Kadlecsik73f30602005-12-01 14:28:58 -0800247/*ack*/ { sIV, sIG, sSR, sES, sCW, sCW, sTW, sTW, sCL, sIV },
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800248/*
Jozsef Kadlecsik73f30602005-12-01 14:28:58 -0800249 * sSS -> sIG Might be a half-open connection.
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800250 * sSR -> sSR Might answer late resent SYN.
251 * sES -> sES :-)
252 * sFW -> sCW Normal close request answered by ACK.
253 * sCW -> sCW
254 * sLA -> sTW Last ACK detected.
255 * sTW -> sTW Retransmitted last ACK.
256 * sCL -> sCL
257 */
258/* sNO, sSS, sSR, sES, sFW, sCW, sLA, sTW, sCL, sLI */
259/*rst*/ { sIV, sCL, sCL, sCL, sCL, sCL, sCL, sCL, sCL, sIV },
260/*none*/ { sIV, sIV, sIV, sIV, sIV, sIV, sIV, sIV, sIV, sIV }
YOSHIFUJI Hideaki601e68e2007-02-12 11:15:49 -0800261 }
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800262};
263
Jan Engelhardt09f263c2008-04-14 11:15:53 +0200264static bool tcp_pkt_to_tuple(const struct sk_buff *skb, unsigned int dataoff,
265 struct nf_conntrack_tuple *tuple)
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800266{
Jan Engelhardt82f568f2008-01-31 04:52:07 -0800267 const struct tcphdr *hp;
268 struct tcphdr _hdr;
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800269
270 /* Actually only need first 8 bytes. */
271 hp = skb_header_pointer(skb, dataoff, 8, &_hdr);
272 if (hp == NULL)
Jan Engelhardt09f263c2008-04-14 11:15:53 +0200273 return false;
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800274
275 tuple->src.u.tcp.port = hp->source;
276 tuple->dst.u.tcp.port = hp->dest;
277
Jan Engelhardt09f263c2008-04-14 11:15:53 +0200278 return true;
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800279}
280
Jan Engelhardt09f263c2008-04-14 11:15:53 +0200281static bool tcp_invert_tuple(struct nf_conntrack_tuple *tuple,
282 const struct nf_conntrack_tuple *orig)
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800283{
284 tuple->src.u.tcp.port = orig->dst.u.tcp.port;
285 tuple->dst.u.tcp.port = orig->src.u.tcp.port;
Jan Engelhardt09f263c2008-04-14 11:15:53 +0200286 return true;
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800287}
288
289/* Print out the per-protocol part of the tuple. */
290static int tcp_print_tuple(struct seq_file *s,
291 const struct nf_conntrack_tuple *tuple)
292{
293 return seq_printf(s, "sport=%hu dport=%hu ",
294 ntohs(tuple->src.u.tcp.port),
295 ntohs(tuple->dst.u.tcp.port));
296}
297
298/* Print out the private part of the conntrack. */
Patrick McHardyc88130b2008-01-31 04:42:11 -0800299static int tcp_print_conntrack(struct seq_file *s, const struct nf_conn *ct)
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800300{
301 enum tcp_conntrack state;
302
303 read_lock_bh(&tcp_lock);
Patrick McHardyc88130b2008-01-31 04:42:11 -0800304 state = ct->proto.tcp.state;
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800305 read_unlock_bh(&tcp_lock);
306
307 return seq_printf(s, "%s ", tcp_conntrack_names[state]);
308}
309
310static unsigned int get_conntrack_index(const struct tcphdr *tcph)
311{
312 if (tcph->rst) return TCP_RST_SET;
313 else if (tcph->syn) return (tcph->ack ? TCP_SYNACK_SET : TCP_SYN_SET);
314 else if (tcph->fin) return TCP_FIN_SET;
315 else if (tcph->ack) return TCP_ACK_SET;
316 else return TCP_NONE_SET;
317}
318
319/* TCP connection tracking based on 'Real Stateful TCP Packet Filtering
320 in IP Filter' by Guido van Rooij.
YOSHIFUJI Hideaki601e68e2007-02-12 11:15:49 -0800321
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800322 http://www.nluug.nl/events/sane2000/papers.html
323 http://www.iae.nl/users/guido/papers/tcp_filtering.ps.gz
YOSHIFUJI Hideaki601e68e2007-02-12 11:15:49 -0800324
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800325 The boundaries and the conditions are changed according to RFC793:
326 the packet must intersect the window (i.e. segments may be
327 after the right or before the left edge) and thus receivers may ACK
328 segments after the right edge of the window.
329
YOSHIFUJI Hideaki601e68e2007-02-12 11:15:49 -0800330 td_maxend = max(sack + max(win,1)) seen in reply packets
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800331 td_maxwin = max(max(win, 1)) + (sack - ack) seen in sent packets
332 td_maxwin += seq + len - sender.td_maxend
333 if seq + len > sender.td_maxend
334 td_end = max(seq + len) seen in sent packets
YOSHIFUJI Hideaki601e68e2007-02-12 11:15:49 -0800335
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800336 I. Upper bound for valid data: seq <= sender.td_maxend
337 II. Lower bound for valid data: seq + len >= sender.td_end - receiver.td_maxwin
Jozsef Kadlecsik84ebe1c2008-06-30 12:41:30 -0700338 III. Upper bound for valid (s)ack: sack <= receiver.td_end
339 IV. Lower bound for valid (s)ack: sack >= receiver.td_end - MAXACKWINDOW
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800340
Jozsef Kadlecsik84ebe1c2008-06-30 12:41:30 -0700341 where sack is the highest right edge of sack block found in the packet
342 or ack in the case of packet without SACK option.
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800343
	The upper bound limit for a valid (s)ack is not ignored -
	we don't have to deal with fragments.
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800346*/
347
348static inline __u32 segment_seq_plus_len(__u32 seq,
349 size_t len,
350 unsigned int dataoff,
Jan Engelhardt82f568f2008-01-31 04:52:07 -0800351 const struct tcphdr *tcph)
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800352{
353 /* XXX Should I use payload length field in IP/IPv6 header ?
354 * - YK */
355 return (seq + len - dataoff - tcph->doff*4
356 + (tcph->syn ? 1 : 0) + (tcph->fin ? 1 : 0));
357}
YOSHIFUJI Hideaki601e68e2007-02-12 11:15:49 -0800358
/* Fixme: what about big packets? */
#define MAXACKWINCONST			66000
/*
 * Width of the window in which (s)ack values are accepted: the larger
 * of the sender's td_maxwin and MAXACKWINCONST.
 */
#define MAXACKWINDOW(sender)						\
	(MAXACKWINCONST < (sender)->td_maxwin ? (sender)->td_maxwin	\
					      : MAXACKWINCONST)
YOSHIFUJI Hideaki601e68e2007-02-12 11:15:49 -0800364
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800365/*
366 * Simplified tcp_parse_options routine from tcp_input.c
367 */
368static void tcp_options(const struct sk_buff *skb,
369 unsigned int dataoff,
Jan Engelhardt82f568f2008-01-31 04:52:07 -0800370 const struct tcphdr *tcph,
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800371 struct ip_ct_tcp_state *state)
372{
373 unsigned char buff[(15 * 4) - sizeof(struct tcphdr)];
Jan Engelhardt82f568f2008-01-31 04:52:07 -0800374 const unsigned char *ptr;
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800375 int length = (tcph->doff*4) - sizeof(struct tcphdr);
376
377 if (!length)
378 return;
379
380 ptr = skb_header_pointer(skb, dataoff + sizeof(struct tcphdr),
381 length, buff);
382 BUG_ON(ptr == NULL);
383
YOSHIFUJI Hideaki601e68e2007-02-12 11:15:49 -0800384 state->td_scale =
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800385 state->flags = 0;
386
387 while (length > 0) {
388 int opcode=*ptr++;
389 int opsize;
390
391 switch (opcode) {
392 case TCPOPT_EOL:
393 return;
394 case TCPOPT_NOP: /* Ref: RFC 793 section 3.1 */
395 length--;
396 continue;
397 default:
398 opsize=*ptr++;
399 if (opsize < 2) /* "silly options" */
400 return;
401 if (opsize > length)
402 break; /* don't parse partial options */
403
YOSHIFUJI Hideaki601e68e2007-02-12 11:15:49 -0800404 if (opcode == TCPOPT_SACK_PERM
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800405 && opsize == TCPOLEN_SACK_PERM)
406 state->flags |= IP_CT_TCP_FLAG_SACK_PERM;
407 else if (opcode == TCPOPT_WINDOW
408 && opsize == TCPOLEN_WINDOW) {
409 state->td_scale = *(u_int8_t *)ptr;
410
411 if (state->td_scale > 14) {
412 /* See RFC1323 */
413 state->td_scale = 14;
414 }
415 state->flags |=
416 IP_CT_TCP_FLAG_WINDOW_SCALE;
417 }
418 ptr += opsize - 2;
419 length -= opsize;
420 }
421 }
422}
423
424static void tcp_sack(const struct sk_buff *skb, unsigned int dataoff,
Jan Engelhardt82f568f2008-01-31 04:52:07 -0800425 const struct tcphdr *tcph, __u32 *sack)
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800426{
YOSHIFUJI Hideaki601e68e2007-02-12 11:15:49 -0800427 unsigned char buff[(15 * 4) - sizeof(struct tcphdr)];
Jan Engelhardt82f568f2008-01-31 04:52:07 -0800428 const unsigned char *ptr;
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800429 int length = (tcph->doff*4) - sizeof(struct tcphdr);
430 __u32 tmp;
431
432 if (!length)
433 return;
434
435 ptr = skb_header_pointer(skb, dataoff + sizeof(struct tcphdr),
436 length, buff);
437 BUG_ON(ptr == NULL);
438
439 /* Fast path for timestamp-only option */
440 if (length == TCPOLEN_TSTAMP_ALIGNED*4
YOSHIFUJI Hideaki8f05ce92007-03-07 14:21:00 +0900441 && *(__be32 *)ptr == htonl((TCPOPT_NOP << 24)
442 | (TCPOPT_NOP << 16)
443 | (TCPOPT_TIMESTAMP << 8)
444 | TCPOLEN_TIMESTAMP))
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800445 return;
446
447 while (length > 0) {
448 int opcode = *ptr++;
449 int opsize, i;
450
451 switch (opcode) {
452 case TCPOPT_EOL:
453 return;
454 case TCPOPT_NOP: /* Ref: RFC 793 section 3.1 */
455 length--;
456 continue;
457 default:
458 opsize = *ptr++;
459 if (opsize < 2) /* "silly options" */
460 return;
461 if (opsize > length)
462 break; /* don't parse partial options */
463
YOSHIFUJI Hideaki601e68e2007-02-12 11:15:49 -0800464 if (opcode == TCPOPT_SACK
465 && opsize >= (TCPOLEN_SACK_BASE
466 + TCPOLEN_SACK_PERBLOCK)
467 && !((opsize - TCPOLEN_SACK_BASE)
468 % TCPOLEN_SACK_PERBLOCK)) {
469 for (i = 0;
470 i < (opsize - TCPOLEN_SACK_BASE);
471 i += TCPOLEN_SACK_PERBLOCK) {
Mark H. Weaver534f81a2009-03-23 13:46:12 +0100472 tmp = get_unaligned_be32((__be32 *)(ptr+i)+1);
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800473
474 if (after(tmp, *sack))
475 *sack = tmp;
476 }
477 return;
478 }
479 ptr += opsize - 2;
480 length -= opsize;
481 }
482 }
483}
484
Jan Engelhardt09f263c2008-04-14 11:15:53 +0200485static bool tcp_in_window(const struct nf_conn *ct,
486 struct ip_ct_tcp *state,
487 enum ip_conntrack_dir dir,
488 unsigned int index,
489 const struct sk_buff *skb,
490 unsigned int dataoff,
491 const struct tcphdr *tcph,
Jan Engelhardt76108ce2008-10-08 11:35:00 +0200492 u_int8_t pf)
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800493{
Alexey Dobriyanc2a2c7e2008-10-08 11:35:08 +0200494 struct net *net = nf_ct_net(ct);
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800495 struct ip_ct_tcp_state *sender = &state->seen[dir];
496 struct ip_ct_tcp_state *receiver = &state->seen[!dir];
Jan Engelhardt82f568f2008-01-31 04:52:07 -0800497 const struct nf_conntrack_tuple *tuple = &ct->tuplehash[dir].tuple;
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800498 __u32 seq, ack, sack, end, win, swin;
Jan Engelhardt09f263c2008-04-14 11:15:53 +0200499 bool res;
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800500
501 /*
502 * Get the required data from the packet.
503 */
504 seq = ntohl(tcph->seq);
505 ack = sack = ntohl(tcph->ack_seq);
506 win = ntohs(tcph->window);
507 end = segment_seq_plus_len(seq, skb->len, dataoff, tcph);
508
509 if (receiver->flags & IP_CT_TCP_FLAG_SACK_PERM)
510 tcp_sack(skb, dataoff, tcph, &sack);
511
Patrick McHardy0d537782007-07-07 22:39:38 -0700512 pr_debug("tcp_in_window: START\n");
513 pr_debug("tcp_in_window: ");
Jan Engelhardt3c9fba62008-04-14 11:15:54 +0200514 nf_ct_dump_tuple(tuple);
Patrick McHardy0d537782007-07-07 22:39:38 -0700515 pr_debug("seq=%u ack=%u sack=%u win=%u end=%u\n",
516 seq, ack, sack, win, end);
517 pr_debug("tcp_in_window: sender end=%u maxend=%u maxwin=%u scale=%i "
518 "receiver end=%u maxend=%u maxwin=%u scale=%i\n",
519 sender->td_end, sender->td_maxend, sender->td_maxwin,
520 sender->td_scale,
521 receiver->td_end, receiver->td_maxend, receiver->td_maxwin,
522 receiver->td_scale);
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800523
524 if (sender->td_end == 0) {
525 /*
526 * Initialize sender data.
527 */
528 if (tcph->syn && tcph->ack) {
529 /*
530 * Outgoing SYN-ACK in reply to a SYN.
531 */
YOSHIFUJI Hideaki601e68e2007-02-12 11:15:49 -0800532 sender->td_end =
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800533 sender->td_maxend = end;
534 sender->td_maxwin = (win == 0 ? 1 : win);
535
536 tcp_options(skb, dataoff, tcph, sender);
YOSHIFUJI Hideaki601e68e2007-02-12 11:15:49 -0800537 /*
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800538 * RFC 1323:
539 * Both sides must send the Window Scale option
540 * to enable window scaling in either direction.
541 */
542 if (!(sender->flags & IP_CT_TCP_FLAG_WINDOW_SCALE
543 && receiver->flags & IP_CT_TCP_FLAG_WINDOW_SCALE))
YOSHIFUJI Hideaki601e68e2007-02-12 11:15:49 -0800544 sender->td_scale =
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800545 receiver->td_scale = 0;
546 } else {
547 /*
548 * We are in the middle of a connection,
549 * its history is lost for us.
550 * Let's try to use the data from the packet.
YOSHIFUJI Hideaki601e68e2007-02-12 11:15:49 -0800551 */
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800552 sender->td_end = end;
553 sender->td_maxwin = (win == 0 ? 1 : win);
554 sender->td_maxend = end + sender->td_maxwin;
555 }
556 } else if (((state->state == TCP_CONNTRACK_SYN_SENT
557 && dir == IP_CT_DIR_ORIGINAL)
558 || (state->state == TCP_CONNTRACK_SYN_RECV
559 && dir == IP_CT_DIR_REPLY))
560 && after(end, sender->td_end)) {
561 /*
562 * RFC 793: "if a TCP is reinitialized ... then it need
YOSHIFUJI Hideaki601e68e2007-02-12 11:15:49 -0800563 * not wait at all; it must only be sure to use sequence
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800564 * numbers larger than those recently used."
565 */
566 sender->td_end =
567 sender->td_maxend = end;
568 sender->td_maxwin = (win == 0 ? 1 : win);
569
570 tcp_options(skb, dataoff, tcph, sender);
571 }
572
573 if (!(tcph->ack)) {
574 /*
575 * If there is no ACK, just pretend it was set and OK.
576 */
577 ack = sack = receiver->td_end;
YOSHIFUJI Hideaki601e68e2007-02-12 11:15:49 -0800578 } else if (((tcp_flag_word(tcph) & (TCP_FLAG_ACK|TCP_FLAG_RST)) ==
579 (TCP_FLAG_ACK|TCP_FLAG_RST))
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800580 && (ack == 0)) {
581 /*
582 * Broken TCP stacks, that set ACK in RST packets as well
583 * with zero ack value.
584 */
585 ack = sack = receiver->td_end;
586 }
587
588 if (seq == end
589 && (!tcph->rst
590 || (seq == 0 && state->state == TCP_CONNTRACK_SYN_SENT)))
591 /*
592 * Packets contains no data: we assume it is valid
593 * and check the ack value only.
594 * However RST segments are always validated by their
595 * SEQ number, except when seq == 0 (reset sent answering
596 * SYN.
597 */
598 seq = end = sender->td_end;
599
Patrick McHardy0d537782007-07-07 22:39:38 -0700600 pr_debug("tcp_in_window: ");
Jan Engelhardt3c9fba62008-04-14 11:15:54 +0200601 nf_ct_dump_tuple(tuple);
Patrick McHardy0d537782007-07-07 22:39:38 -0700602 pr_debug("seq=%u ack=%u sack =%u win=%u end=%u\n",
603 seq, ack, sack, win, end);
604 pr_debug("tcp_in_window: sender end=%u maxend=%u maxwin=%u scale=%i "
605 "receiver end=%u maxend=%u maxwin=%u scale=%i\n",
606 sender->td_end, sender->td_maxend, sender->td_maxwin,
607 sender->td_scale,
608 receiver->td_end, receiver->td_maxend, receiver->td_maxwin,
609 receiver->td_scale);
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800610
Patrick McHardy0d537782007-07-07 22:39:38 -0700611 pr_debug("tcp_in_window: I=%i II=%i III=%i IV=%i\n",
612 before(seq, sender->td_maxend + 1),
613 after(end, sender->td_end - receiver->td_maxwin - 1),
614 before(sack, receiver->td_end + 1),
Jozsef Kadlecsik84ebe1c2008-06-30 12:41:30 -0700615 after(sack, receiver->td_end - MAXACKWINDOW(sender) - 1));
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800616
Patrick McHardya09113c2007-02-07 15:05:33 -0800617 if (before(seq, sender->td_maxend + 1) &&
618 after(end, sender->td_end - receiver->td_maxwin - 1) &&
619 before(sack, receiver->td_end + 1) &&
Jozsef Kadlecsik84ebe1c2008-06-30 12:41:30 -0700620 after(sack, receiver->td_end - MAXACKWINDOW(sender) - 1)) {
YOSHIFUJI Hideaki601e68e2007-02-12 11:15:49 -0800621 /*
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800622 * Take into account window scaling (RFC 1323).
623 */
624 if (!tcph->syn)
625 win <<= sender->td_scale;
626
627 /*
628 * Update sender data.
629 */
630 swin = win + (sack - ack);
631 if (sender->td_maxwin < swin)
632 sender->td_maxwin = swin;
Patrick McHardyae375042008-07-31 00:38:01 -0700633 if (after(end, sender->td_end)) {
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800634 sender->td_end = end;
Patrick McHardyae375042008-07-31 00:38:01 -0700635 sender->flags |= IP_CT_TCP_FLAG_DATA_UNACKNOWLEDGED;
636 }
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800637 /*
638 * Update receiver data.
639 */
640 if (after(end, sender->td_maxend))
641 receiver->td_maxwin += end - sender->td_maxend;
642 if (after(sack + win, receiver->td_maxend - 1)) {
643 receiver->td_maxend = sack + win;
644 if (win == 0)
645 receiver->td_maxend++;
646 }
Patrick McHardyae375042008-07-31 00:38:01 -0700647 if (ack == receiver->td_end)
648 receiver->flags &= ~IP_CT_TCP_FLAG_DATA_UNACKNOWLEDGED;
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800649
YOSHIFUJI Hideaki601e68e2007-02-12 11:15:49 -0800650 /*
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800651 * Check retransmissions.
652 */
653 if (index == TCP_ACK_SET) {
654 if (state->last_dir == dir
655 && state->last_seq == seq
656 && state->last_ack == ack
George Hansperc1fe3ca2006-09-20 12:03:23 -0700657 && state->last_end == end
658 && state->last_win == win)
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800659 state->retrans++;
660 else {
661 state->last_dir = dir;
662 state->last_seq = seq;
663 state->last_ack = ack;
664 state->last_end = end;
George Hansperc1fe3ca2006-09-20 12:03:23 -0700665 state->last_win = win;
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800666 state->retrans = 0;
667 }
668 }
Jan Engelhardt09f263c2008-04-14 11:15:53 +0200669 res = true;
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800670 } else {
Jan Engelhardt09f263c2008-04-14 11:15:53 +0200671 res = false;
Patrick McHardya09113c2007-02-07 15:05:33 -0800672 if (sender->flags & IP_CT_TCP_FLAG_BE_LIBERAL ||
673 nf_ct_tcp_be_liberal)
Jan Engelhardt09f263c2008-04-14 11:15:53 +0200674 res = true;
Alexey Dobriyanc2a2c7e2008-10-08 11:35:08 +0200675 if (!res && LOG_INVALID(net, IPPROTO_TCP))
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800676 nf_log_packet(pf, 0, skb, NULL, NULL, NULL,
677 "nf_ct_tcp: %s ",
678 before(seq, sender->td_maxend + 1) ?
679 after(end, sender->td_end - receiver->td_maxwin - 1) ?
680 before(sack, receiver->td_end + 1) ?
681 after(ack, receiver->td_end - MAXACKWINDOW(sender)) ? "BUG"
682 : "ACK is under the lower bound (possible overly delayed ACK)"
683 : "ACK is over the upper bound (ACKed data not seen yet)"
684 : "SEQ is under the lower bound (already ACKed data retransmitted)"
685 : "SEQ is over the upper bound (over the window of the receiver)");
YOSHIFUJI Hideaki601e68e2007-02-12 11:15:49 -0800686 }
687
Jan Engelhardt09f263c2008-04-14 11:15:53 +0200688 pr_debug("tcp_in_window: res=%u sender end=%u maxend=%u maxwin=%u "
Patrick McHardy0d537782007-07-07 22:39:38 -0700689 "receiver end=%u maxend=%u maxwin=%u\n",
690 res, sender->td_end, sender->td_maxend, sender->td_maxwin,
691 receiver->td_end, receiver->td_maxend, receiver->td_maxwin);
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800692
693 return res;
694}
695
#ifdef CONFIG_NF_NAT_NEEDED
/*
 * Update sender->td_end after NAT successfully mangled the packet.
 *
 * The end of the (mangled) segment is recomputed from the TCP header at
 * @dataoff; td_end of direction @dir is only ever moved forward, while
 * last_end is always overwritten.
 *
 * Caller must linearize skb at tcp header.
 */
void nf_conntrack_tcp_update(const struct sk_buff *skb,
			     unsigned int dataoff,
			     struct nf_conn *ct,
			     int dir)
{
	const struct tcphdr *tcph = (const void *)skb->data + dataoff;
	const struct ip_ct_tcp_state *sender = &ct->proto.tcp.seen[dir];
	const struct ip_ct_tcp_state *receiver = &ct->proto.tcp.seen[!dir];
	__u32 seg_end = segment_seq_plus_len(ntohl(tcph->seq), skb->len,
					     dataoff, tcph);

	write_lock_bh(&tcp_lock);
	/*
	 * We have to worry for the ack in the reply packet only...
	 */
	if (after(seg_end, ct->proto.tcp.seen[dir].td_end))
		ct->proto.tcp.seen[dir].td_end = seg_end;
	ct->proto.tcp.last_end = seg_end;
	write_unlock_bh(&tcp_lock);

	pr_debug("tcp_update: sender end=%u maxend=%u maxwin=%u scale=%i "
		 "receiver end=%u maxend=%u maxwin=%u scale=%i\n",
		 sender->td_end, sender->td_maxend, sender->td_maxwin,
		 sender->td_scale,
		 receiver->td_end, receiver->td_maxend, receiver->td_maxwin,
		 receiver->td_scale);
}
EXPORT_SYMBOL_GPL(nf_conntrack_tcp_update);
#endif
728
729#define TH_FIN 0x01
730#define TH_SYN 0x02
731#define TH_RST 0x04
732#define TH_PUSH 0x08
733#define TH_ACK 0x10
734#define TH_URG 0x20
735#define TH_ECE 0x40
736#define TH_CWR 0x80
737
Willy Tarreau5c8ce7c2007-03-14 16:44:53 -0700738/* table of valid flag combinations - PUSH, ECE and CWR are always valid */
Jan Engelhardt82f568f2008-01-31 04:52:07 -0800739static const u8 tcp_valid_flags[(TH_FIN|TH_SYN|TH_RST|TH_ACK|TH_URG) + 1] =
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800740{
741 [TH_SYN] = 1,
Patrick McHardyd3ab4292007-03-04 15:57:46 -0800742 [TH_SYN|TH_URG] = 1,
Patrick McHardyd3ab4292007-03-04 15:57:46 -0800743 [TH_SYN|TH_ACK] = 1,
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800744 [TH_RST] = 1,
745 [TH_RST|TH_ACK] = 1,
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800746 [TH_FIN|TH_ACK] = 1,
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800747 [TH_FIN|TH_ACK|TH_URG] = 1,
Willy Tarreau5c8ce7c2007-03-14 16:44:53 -0700748 [TH_ACK] = 1,
749 [TH_ACK|TH_URG] = 1,
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800750};
751
752/* Protect conntrack agaist broken packets. Code taken from ipt_unclean.c. */
Alexey Dobriyan74c51a12008-10-08 11:35:05 +0200753static int tcp_error(struct net *net,
754 struct sk_buff *skb,
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800755 unsigned int dataoff,
756 enum ip_conntrack_info *ctinfo,
Jan Engelhardt76108ce2008-10-08 11:35:00 +0200757 u_int8_t pf,
Patrick McHardy96f6bf82006-04-06 14:19:24 -0700758 unsigned int hooknum)
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800759{
Jan Engelhardt82f568f2008-01-31 04:52:07 -0800760 const struct tcphdr *th;
761 struct tcphdr _tcph;
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800762 unsigned int tcplen = skb->len - dataoff;
763 u_int8_t tcpflags;
764
765 /* Smaller that minimal TCP header? */
766 th = skb_header_pointer(skb, dataoff, sizeof(_tcph), &_tcph);
767 if (th == NULL) {
Alexey Dobriyanc2a2c7e2008-10-08 11:35:08 +0200768 if (LOG_INVALID(net, IPPROTO_TCP))
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800769 nf_log_packet(pf, 0, skb, NULL, NULL, NULL,
770 "nf_ct_tcp: short packet ");
771 return -NF_ACCEPT;
YOSHIFUJI Hideaki601e68e2007-02-12 11:15:49 -0800772 }
773
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800774 /* Not whole TCP header or malformed packet */
775 if (th->doff*4 < sizeof(struct tcphdr) || tcplen < th->doff*4) {
Alexey Dobriyanc2a2c7e2008-10-08 11:35:08 +0200776 if (LOG_INVALID(net, IPPROTO_TCP))
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800777 nf_log_packet(pf, 0, skb, NULL, NULL, NULL,
778 "nf_ct_tcp: truncated/malformed packet ");
779 return -NF_ACCEPT;
780 }
YOSHIFUJI Hideaki601e68e2007-02-12 11:15:49 -0800781
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800782 /* Checksum invalid? Ignore.
783 * We skip checking packets on the outgoing path
Patrick McHardy84fa7932006-08-29 16:44:56 -0700784 * because the checksum is assumed to be correct.
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800785 */
786 /* FIXME: Source route IP option packets --RR */
Alexey Dobriyanc04d0552008-10-08 11:35:08 +0200787 if (net->ct.sysctl_checksum && hooknum == NF_INET_PRE_ROUTING &&
Patrick McHardy96f6bf82006-04-06 14:19:24 -0700788 nf_checksum(skb, hooknum, dataoff, IPPROTO_TCP, pf)) {
Alexey Dobriyanc2a2c7e2008-10-08 11:35:08 +0200789 if (LOG_INVALID(net, IPPROTO_TCP))
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800790 nf_log_packet(pf, 0, skb, NULL, NULL, NULL,
791 "nf_ct_tcp: bad TCP checksum ");
792 return -NF_ACCEPT;
793 }
794
795 /* Check TCP flags. */
Willy Tarreau5c8ce7c2007-03-14 16:44:53 -0700796 tcpflags = (((u_int8_t *)th)[13] & ~(TH_ECE|TH_CWR|TH_PUSH));
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800797 if (!tcp_valid_flags[tcpflags]) {
Alexey Dobriyanc2a2c7e2008-10-08 11:35:08 +0200798 if (LOG_INVALID(net, IPPROTO_TCP))
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800799 nf_log_packet(pf, 0, skb, NULL, NULL, NULL,
800 "nf_ct_tcp: invalid TCP flag combination ");
801 return -NF_ACCEPT;
802 }
803
804 return NF_ACCEPT;
805}
806
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800807/* Returns verdict for packet, or -1 for invalid. */
Patrick McHardyc88130b2008-01-31 04:42:11 -0800808static int tcp_packet(struct nf_conn *ct,
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800809 const struct sk_buff *skb,
810 unsigned int dataoff,
811 enum ip_conntrack_info ctinfo,
Jan Engelhardt76108ce2008-10-08 11:35:00 +0200812 u_int8_t pf,
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800813 unsigned int hooknum)
814{
Alexey Dobriyanc2a2c7e2008-10-08 11:35:08 +0200815 struct net *net = nf_ct_net(ct);
Patrick McHardy0d537782007-07-07 22:39:38 -0700816 struct nf_conntrack_tuple *tuple;
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800817 enum tcp_conntrack new_state, old_state;
818 enum ip_conntrack_dir dir;
Jan Engelhardt82f568f2008-01-31 04:52:07 -0800819 const struct tcphdr *th;
820 struct tcphdr _tcph;
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800821 unsigned long timeout;
822 unsigned int index;
823
824 th = skb_header_pointer(skb, dataoff, sizeof(_tcph), &_tcph);
825 BUG_ON(th == NULL);
826
827 write_lock_bh(&tcp_lock);
Patrick McHardyc88130b2008-01-31 04:42:11 -0800828 old_state = ct->proto.tcp.state;
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800829 dir = CTINFO2DIR(ctinfo);
830 index = get_conntrack_index(th);
831 new_state = tcp_conntracks[dir][index][old_state];
Patrick McHardyc88130b2008-01-31 04:42:11 -0800832 tuple = &ct->tuplehash[dir].tuple;
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800833
834 switch (new_state) {
Jozsef Kadlecsik17311392007-10-11 14:35:52 -0700835 case TCP_CONNTRACK_SYN_SENT:
836 if (old_state < TCP_CONNTRACK_TIME_WAIT)
837 break;
Jozsef Kadlecsikb2155e72008-02-07 17:54:56 -0800838 /* RFC 1122: "When a connection is closed actively,
839 * it MUST linger in TIME-WAIT state for a time 2xMSL
840 * (Maximum Segment Lifetime). However, it MAY accept
841 * a new SYN from the remote TCP to reopen the connection
842 * directly from TIME-WAIT state, if..."
843 * We ignore the conditions because we are in the
844 * TIME-WAIT state anyway.
845 *
846 * Handle aborted connections: we and the server
847 * think there is an existing connection but the client
848 * aborts it and starts a new one.
849 */
850 if (((ct->proto.tcp.seen[dir].flags
851 | ct->proto.tcp.seen[!dir].flags)
852 & IP_CT_TCP_FLAG_CLOSE_INIT)
Patrick McHardyc88130b2008-01-31 04:42:11 -0800853 || (ct->proto.tcp.last_dir == dir
854 && ct->proto.tcp.last_index == TCP_RST_SET)) {
Jozsef Kadlecsikbc34b842007-10-18 05:20:12 -0700855 /* Attempt to reopen a closed/aborted connection.
856 * Delete this connection and look up again. */
Jozsef Kadlecsik17311392007-10-11 14:35:52 -0700857 write_unlock_bh(&tcp_lock);
David S. Miller2aec6092008-07-14 20:23:54 -0700858
Patrick McHardy6b69fe02008-07-09 15:06:12 -0700859 /* Only repeat if we can actually remove the timer.
860 * Destruction may already be in progress in process
861 * context and we must give it a chance to terminate.
862 */
David S. Miller2aec6092008-07-14 20:23:54 -0700863 if (nf_ct_kill(ct))
Patrick McHardy6b69fe02008-07-09 15:06:12 -0700864 return -NF_REPEAT;
Christoph Paaschec8d5402009-03-16 15:51:29 +0100865 return NF_DROP;
Jozsef Kadlecsik17311392007-10-11 14:35:52 -0700866 }
867 /* Fall through */
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800868 case TCP_CONNTRACK_IGNORE:
Jozsef Kadlecsik73f30602005-12-01 14:28:58 -0800869 /* Ignored packets:
870 *
Jozsef Kadlecsikb2155e72008-02-07 17:54:56 -0800871 * Our connection entry may be out of sync, so ignore
872 * packets which may signal the real connection between
873 * the client and the server.
874 *
Jozsef Kadlecsik73f30602005-12-01 14:28:58 -0800875 * a) SYN in ORIGINAL
876 * b) SYN/ACK in REPLY
YOSHIFUJI Hideaki601e68e2007-02-12 11:15:49 -0800877 * c) ACK in reply direction after initial SYN in original.
Jozsef Kadlecsikb2155e72008-02-07 17:54:56 -0800878 *
879 * If the ignored packet is invalid, the receiver will send
880 * a RST we'll catch below.
Jozsef Kadlecsik73f30602005-12-01 14:28:58 -0800881 */
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800882 if (index == TCP_SYNACK_SET
Patrick McHardyc88130b2008-01-31 04:42:11 -0800883 && ct->proto.tcp.last_index == TCP_SYN_SET
884 && ct->proto.tcp.last_dir != dir
885 && ntohl(th->ack_seq) == ct->proto.tcp.last_end) {
Jozsef Kadlecsikb2155e72008-02-07 17:54:56 -0800886 /* b) This SYN/ACK acknowledges a SYN that we earlier
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800887 * ignored as invalid. This means that the client and
888 * the server are both in sync, while the firewall is
889 * not. We kill this session and block the SYN/ACK so
YOSHIFUJI Hideaki601e68e2007-02-12 11:15:49 -0800890 * that the client cannot but retransmit its SYN and
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800891 * thus initiate a clean new session.
892 */
YOSHIFUJI Hideaki601e68e2007-02-12 11:15:49 -0800893 write_unlock_bh(&tcp_lock);
Alexey Dobriyanc2a2c7e2008-10-08 11:35:08 +0200894 if (LOG_INVALID(net, IPPROTO_TCP))
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800895 nf_log_packet(pf, 0, skb, NULL, NULL, NULL,
896 "nf_ct_tcp: killing out of sync session ");
Patrick McHardy51091762008-06-09 15:59:06 -0700897 nf_ct_kill(ct);
Christoph Paaschec8d5402009-03-16 15:51:29 +0100898 return NF_DROP;
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800899 }
Patrick McHardyc88130b2008-01-31 04:42:11 -0800900 ct->proto.tcp.last_index = index;
901 ct->proto.tcp.last_dir = dir;
902 ct->proto.tcp.last_seq = ntohl(th->seq);
903 ct->proto.tcp.last_end =
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800904 segment_seq_plus_len(ntohl(th->seq), skb->len, dataoff, th);
905
906 write_unlock_bh(&tcp_lock);
Alexey Dobriyanc2a2c7e2008-10-08 11:35:08 +0200907 if (LOG_INVALID(net, IPPROTO_TCP))
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800908 nf_log_packet(pf, 0, skb, NULL, NULL, NULL,
Jozsef Kadlecsikb2155e72008-02-07 17:54:56 -0800909 "nf_ct_tcp: invalid packet ignored ");
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800910 return NF_ACCEPT;
911 case TCP_CONNTRACK_MAX:
912 /* Invalid packet */
Patrick McHardy0d537782007-07-07 22:39:38 -0700913 pr_debug("nf_ct_tcp: Invalid dir=%i index=%u ostate=%u\n",
914 dir, get_conntrack_index(th), old_state);
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800915 write_unlock_bh(&tcp_lock);
Alexey Dobriyanc2a2c7e2008-10-08 11:35:08 +0200916 if (LOG_INVALID(net, IPPROTO_TCP))
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800917 nf_log_packet(pf, 0, skb, NULL, NULL, NULL,
918 "nf_ct_tcp: invalid state ");
919 return -NF_ACCEPT;
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800920 case TCP_CONNTRACK_CLOSE:
921 if (index == TCP_RST_SET
Patrick McHardyc88130b2008-01-31 04:42:11 -0800922 && ((test_bit(IPS_SEEN_REPLY_BIT, &ct->status)
923 && ct->proto.tcp.last_index == TCP_SYN_SET)
924 || (!test_bit(IPS_ASSURED_BIT, &ct->status)
925 && ct->proto.tcp.last_index == TCP_ACK_SET))
926 && ntohl(th->ack_seq) == ct->proto.tcp.last_end) {
Adrian Bunk93b1fae2006-01-10 00:13:33 +0100927 /* RST sent to invalid SYN or ACK we had let through
Jozsef Kadlecsik73f30602005-12-01 14:28:58 -0800928 * at a) and c) above:
929 *
930 * a) SYN was in window then
931 * c) we hold a half-open connection.
932 *
933 * Delete our connection entry.
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800934 * We skip window checking, because packet might ACK
Jozsef Kadlecsik73f30602005-12-01 14:28:58 -0800935 * segments we ignored. */
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800936 goto in_window;
937 }
Adrian Bunk93b1fae2006-01-10 00:13:33 +0100938 /* Just fall through */
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800939 default:
940 /* Keep compilers happy. */
941 break;
942 }
943
Patrick McHardyc88130b2008-01-31 04:42:11 -0800944 if (!tcp_in_window(ct, &ct->proto.tcp, dir, index,
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800945 skb, dataoff, th, pf)) {
946 write_unlock_bh(&tcp_lock);
947 return -NF_ACCEPT;
948 }
949 in_window:
950 /* From now on we have got in-window packets */
Patrick McHardyc88130b2008-01-31 04:42:11 -0800951 ct->proto.tcp.last_index = index;
952 ct->proto.tcp.last_dir = dir;
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800953
Patrick McHardy0d537782007-07-07 22:39:38 -0700954 pr_debug("tcp_conntracks: ");
Jan Engelhardt3c9fba62008-04-14 11:15:54 +0200955 nf_ct_dump_tuple(tuple);
Patrick McHardy0d537782007-07-07 22:39:38 -0700956 pr_debug("syn=%i ack=%i fin=%i rst=%i old=%i new=%i\n",
957 (th->syn ? 1 : 0), (th->ack ? 1 : 0),
958 (th->fin ? 1 : 0), (th->rst ? 1 : 0),
959 old_state, new_state);
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800960
Patrick McHardyc88130b2008-01-31 04:42:11 -0800961 ct->proto.tcp.state = new_state;
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800962 if (old_state != new_state
Jozsef Kadlecsikd0c1fd72008-02-14 14:50:21 -0800963 && new_state == TCP_CONNTRACK_FIN_WAIT)
Patrick McHardyc88130b2008-01-31 04:42:11 -0800964 ct->proto.tcp.seen[dir].flags |= IP_CT_TCP_FLAG_CLOSE_INIT;
Patrick McHardyae375042008-07-31 00:38:01 -0700965
966 if (ct->proto.tcp.retrans >= nf_ct_tcp_max_retrans &&
967 tcp_timeouts[new_state] > nf_ct_tcp_timeout_max_retrans)
968 timeout = nf_ct_tcp_timeout_max_retrans;
969 else if ((ct->proto.tcp.seen[0].flags | ct->proto.tcp.seen[1].flags) &
970 IP_CT_TCP_FLAG_DATA_UNACKNOWLEDGED &&
971 tcp_timeouts[new_state] > nf_ct_tcp_timeout_unacknowledged)
972 timeout = nf_ct_tcp_timeout_unacknowledged;
973 else
974 timeout = tcp_timeouts[new_state];
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800975 write_unlock_bh(&tcp_lock);
976
Alexey Dobriyana71996f2008-10-08 11:35:07 +0200977 nf_conntrack_event_cache(IPCT_PROTOINFO_VOLATILE, ct);
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800978 if (new_state != old_state)
Alexey Dobriyana71996f2008-10-08 11:35:07 +0200979 nf_conntrack_event_cache(IPCT_PROTOINFO, ct);
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800980
Patrick McHardyc88130b2008-01-31 04:42:11 -0800981 if (!test_bit(IPS_SEEN_REPLY_BIT, &ct->status)) {
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800982 /* If only reply is a RST, we can consider ourselves not to
983 have an established connection: this is a fairly common
984 problem case, so we can delete the conntrack
985 immediately. --RR */
986 if (th->rst) {
Fabian Hugelshofer718d4ad2008-06-09 15:59:40 -0700987 nf_ct_kill_acct(ct, ctinfo, skb);
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800988 return NF_ACCEPT;
989 }
Patrick McHardyc88130b2008-01-31 04:42:11 -0800990 } else if (!test_bit(IPS_ASSURED_BIT, &ct->status)
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800991 && (old_state == TCP_CONNTRACK_SYN_RECV
992 || old_state == TCP_CONNTRACK_ESTABLISHED)
993 && new_state == TCP_CONNTRACK_ESTABLISHED) {
YOSHIFUJI Hideaki601e68e2007-02-12 11:15:49 -0800994 /* Set ASSURED if we see see valid ack in ESTABLISHED
995 after SYN_RECV or a valid answer for a picked up
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800996 connection. */
Patrick McHardyc88130b2008-01-31 04:42:11 -0800997 set_bit(IPS_ASSURED_BIT, &ct->status);
Alexey Dobriyana71996f2008-10-08 11:35:07 +0200998 nf_conntrack_event_cache(IPCT_STATUS, ct);
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -0800999 }
Patrick McHardyc88130b2008-01-31 04:42:11 -08001000 nf_ct_refresh_acct(ct, ctinfo, skb, timeout);
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -08001001
1002 return NF_ACCEPT;
1003}
YOSHIFUJI Hideaki601e68e2007-02-12 11:15:49 -08001004
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -08001005/* Called when a new connection for this protocol found. */
Jan Engelhardt09f263c2008-04-14 11:15:53 +02001006static bool tcp_new(struct nf_conn *ct, const struct sk_buff *skb,
1007 unsigned int dataoff)
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -08001008{
1009 enum tcp_conntrack new_state;
Jan Engelhardt82f568f2008-01-31 04:52:07 -08001010 const struct tcphdr *th;
1011 struct tcphdr _tcph;
1012 const struct ip_ct_tcp_state *sender = &ct->proto.tcp.seen[0];
1013 const struct ip_ct_tcp_state *receiver = &ct->proto.tcp.seen[1];
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -08001014
1015 th = skb_header_pointer(skb, dataoff, sizeof(_tcph), &_tcph);
1016 BUG_ON(th == NULL);
1017
1018 /* Don't need lock here: this conntrack not in circulation yet */
1019 new_state
1020 = tcp_conntracks[0][get_conntrack_index(th)]
1021 [TCP_CONNTRACK_NONE];
1022
1023 /* Invalid: delete conntrack */
1024 if (new_state >= TCP_CONNTRACK_MAX) {
Patrick McHardy0d537782007-07-07 22:39:38 -07001025 pr_debug("nf_ct_tcp: invalid new deleting.\n");
Jan Engelhardt09f263c2008-04-14 11:15:53 +02001026 return false;
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -08001027 }
1028
1029 if (new_state == TCP_CONNTRACK_SYN_SENT) {
1030 /* SYN packet */
Patrick McHardyc88130b2008-01-31 04:42:11 -08001031 ct->proto.tcp.seen[0].td_end =
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -08001032 segment_seq_plus_len(ntohl(th->seq), skb->len,
1033 dataoff, th);
Patrick McHardyc88130b2008-01-31 04:42:11 -08001034 ct->proto.tcp.seen[0].td_maxwin = ntohs(th->window);
1035 if (ct->proto.tcp.seen[0].td_maxwin == 0)
1036 ct->proto.tcp.seen[0].td_maxwin = 1;
1037 ct->proto.tcp.seen[0].td_maxend =
1038 ct->proto.tcp.seen[0].td_end;
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -08001039
Patrick McHardyc88130b2008-01-31 04:42:11 -08001040 tcp_options(skb, dataoff, th, &ct->proto.tcp.seen[0]);
1041 ct->proto.tcp.seen[1].flags = 0;
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -08001042 } else if (nf_ct_tcp_loose == 0) {
1043 /* Don't try to pick up connections. */
Jan Engelhardt09f263c2008-04-14 11:15:53 +02001044 return false;
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -08001045 } else {
1046 /*
1047 * We are in the middle of a connection,
1048 * its history is lost for us.
1049 * Let's try to use the data from the packet.
1050 */
Patrick McHardyc88130b2008-01-31 04:42:11 -08001051 ct->proto.tcp.seen[0].td_end =
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -08001052 segment_seq_plus_len(ntohl(th->seq), skb->len,
1053 dataoff, th);
Patrick McHardyc88130b2008-01-31 04:42:11 -08001054 ct->proto.tcp.seen[0].td_maxwin = ntohs(th->window);
1055 if (ct->proto.tcp.seen[0].td_maxwin == 0)
1056 ct->proto.tcp.seen[0].td_maxwin = 1;
1057 ct->proto.tcp.seen[0].td_maxend =
1058 ct->proto.tcp.seen[0].td_end +
1059 ct->proto.tcp.seen[0].td_maxwin;
1060 ct->proto.tcp.seen[0].td_scale = 0;
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -08001061
Patrick McHardya09113c2007-02-07 15:05:33 -08001062 /* We assume SACK and liberal window checking to handle
1063 * window scaling */
Patrick McHardyc88130b2008-01-31 04:42:11 -08001064 ct->proto.tcp.seen[0].flags =
1065 ct->proto.tcp.seen[1].flags = IP_CT_TCP_FLAG_SACK_PERM |
1066 IP_CT_TCP_FLAG_BE_LIBERAL;
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -08001067 }
YOSHIFUJI Hideaki601e68e2007-02-12 11:15:49 -08001068
Patrick McHardyc88130b2008-01-31 04:42:11 -08001069 ct->proto.tcp.seen[1].td_end = 0;
1070 ct->proto.tcp.seen[1].td_maxend = 0;
1071 ct->proto.tcp.seen[1].td_maxwin = 1;
1072 ct->proto.tcp.seen[1].td_scale = 0;
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -08001073
1074 /* tcp_packet will set them */
Patrick McHardyc88130b2008-01-31 04:42:11 -08001075 ct->proto.tcp.state = TCP_CONNTRACK_NONE;
1076 ct->proto.tcp.last_index = TCP_NONE_SET;
YOSHIFUJI Hideaki601e68e2007-02-12 11:15:49 -08001077
Patrick McHardy0d537782007-07-07 22:39:38 -07001078 pr_debug("tcp_new: sender end=%u maxend=%u maxwin=%u scale=%i "
1079 "receiver end=%u maxend=%u maxwin=%u scale=%i\n",
1080 sender->td_end, sender->td_maxend, sender->td_maxwin,
1081 sender->td_scale,
1082 receiver->td_end, receiver->td_maxend, receiver->td_maxwin,
1083 receiver->td_scale);
Jan Engelhardt09f263c2008-04-14 11:15:53 +02001084 return true;
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -08001085}
Pablo Neira Ayusoc1d10ad2006-01-05 12:19:05 -08001086
Patrick McHardye281db5c2007-03-04 15:57:25 -08001087#if defined(CONFIG_NF_CT_NETLINK) || defined(CONFIG_NF_CT_NETLINK_MODULE)
Pablo Neira Ayusoc1d10ad2006-01-05 12:19:05 -08001088
1089#include <linux/netfilter/nfnetlink.h>
1090#include <linux/netfilter/nfnetlink_conntrack.h>
1091
Patrick McHardyfdf70832007-09-28 14:37:41 -07001092static int tcp_to_nlattr(struct sk_buff *skb, struct nlattr *nla,
Pablo Neira Ayusoc1d10ad2006-01-05 12:19:05 -08001093 const struct nf_conn *ct)
1094{
Patrick McHardydf6fb862007-09-28 14:37:03 -07001095 struct nlattr *nest_parms;
Pablo Neira Ayusoc8e20782007-03-14 16:45:19 -07001096 struct nf_ct_tcp_flags tmp = {};
YOSHIFUJI Hideaki601e68e2007-02-12 11:15:49 -08001097
Pablo Neira Ayusoc1d10ad2006-01-05 12:19:05 -08001098 read_lock_bh(&tcp_lock);
Patrick McHardydf6fb862007-09-28 14:37:03 -07001099 nest_parms = nla_nest_start(skb, CTA_PROTOINFO_TCP | NLA_F_NESTED);
1100 if (!nest_parms)
1101 goto nla_put_failure;
1102
Patrick McHardy77236b62007-12-17 22:29:45 -08001103 NLA_PUT_U8(skb, CTA_PROTOINFO_TCP_STATE, ct->proto.tcp.state);
Pablo Neira Ayusoc8e20782007-03-14 16:45:19 -07001104
Patrick McHardy77236b62007-12-17 22:29:45 -08001105 NLA_PUT_U8(skb, CTA_PROTOINFO_TCP_WSCALE_ORIGINAL,
1106 ct->proto.tcp.seen[0].td_scale);
Pablo Neira Ayusoc8e20782007-03-14 16:45:19 -07001107
Patrick McHardy77236b62007-12-17 22:29:45 -08001108 NLA_PUT_U8(skb, CTA_PROTOINFO_TCP_WSCALE_REPLY,
1109 ct->proto.tcp.seen[1].td_scale);
Pablo Neira Ayusoc8e20782007-03-14 16:45:19 -07001110
1111 tmp.flags = ct->proto.tcp.seen[0].flags;
Patrick McHardydf6fb862007-09-28 14:37:03 -07001112 NLA_PUT(skb, CTA_PROTOINFO_TCP_FLAGS_ORIGINAL,
Pablo Neira Ayusoc8e20782007-03-14 16:45:19 -07001113 sizeof(struct nf_ct_tcp_flags), &tmp);
1114
1115 tmp.flags = ct->proto.tcp.seen[1].flags;
Patrick McHardydf6fb862007-09-28 14:37:03 -07001116 NLA_PUT(skb, CTA_PROTOINFO_TCP_FLAGS_REPLY,
Pablo Neira Ayusoc8e20782007-03-14 16:45:19 -07001117 sizeof(struct nf_ct_tcp_flags), &tmp);
Pablo Neira Ayusoc1d10ad2006-01-05 12:19:05 -08001118 read_unlock_bh(&tcp_lock);
1119
Patrick McHardydf6fb862007-09-28 14:37:03 -07001120 nla_nest_end(skb, nest_parms);
Pablo Neira Ayusoc1d10ad2006-01-05 12:19:05 -08001121
1122 return 0;
1123
Patrick McHardydf6fb862007-09-28 14:37:03 -07001124nla_put_failure:
Pablo Neira Ayusoc1d10ad2006-01-05 12:19:05 -08001125 read_unlock_bh(&tcp_lock);
1126 return -1;
1127}
1128
Patrick McHardyf73e9242007-09-28 14:39:55 -07001129static const struct nla_policy tcp_nla_policy[CTA_PROTOINFO_TCP_MAX+1] = {
1130 [CTA_PROTOINFO_TCP_STATE] = { .type = NLA_U8 },
1131 [CTA_PROTOINFO_TCP_WSCALE_ORIGINAL] = { .type = NLA_U8 },
1132 [CTA_PROTOINFO_TCP_WSCALE_REPLY] = { .type = NLA_U8 },
1133 [CTA_PROTOINFO_TCP_FLAGS_ORIGINAL] = { .len = sizeof(struct nf_ct_tcp_flags) },
1134 [CTA_PROTOINFO_TCP_FLAGS_REPLY] = { .len = sizeof(struct nf_ct_tcp_flags) },
Pablo Neira Ayusoc1d10ad2006-01-05 12:19:05 -08001135};
1136
Patrick McHardyfdf70832007-09-28 14:37:41 -07001137static int nlattr_to_tcp(struct nlattr *cda[], struct nf_conn *ct)
Pablo Neira Ayusoc1d10ad2006-01-05 12:19:05 -08001138{
Stephen Hemminger2f0d2f12008-01-31 04:08:10 -08001139 struct nlattr *pattr = cda[CTA_PROTOINFO_TCP];
Patrick McHardydf6fb862007-09-28 14:37:03 -07001140 struct nlattr *tb[CTA_PROTOINFO_TCP_MAX+1];
Patrick McHardyf73e9242007-09-28 14:39:55 -07001141 int err;
Pablo Neira Ayusoc1d10ad2006-01-05 12:19:05 -08001142
1143 /* updates could not contain anything about the private
1144 * protocol info, in that case skip the parsing */
Stephen Hemminger2f0d2f12008-01-31 04:08:10 -08001145 if (!pattr)
Pablo Neira Ayusoc1d10ad2006-01-05 12:19:05 -08001146 return 0;
1147
Stephen Hemminger2f0d2f12008-01-31 04:08:10 -08001148 err = nla_parse_nested(tb, CTA_PROTOINFO_TCP_MAX, pattr, tcp_nla_policy);
Patrick McHardyf73e9242007-09-28 14:39:55 -07001149 if (err < 0)
1150 return err;
Pablo Neira Ayusoc1d10ad2006-01-05 12:19:05 -08001151
Patrick McHardy5f7da4d2008-04-14 11:15:52 +02001152 if (tb[CTA_PROTOINFO_TCP_STATE] &&
1153 nla_get_u8(tb[CTA_PROTOINFO_TCP_STATE]) >= TCP_CONNTRACK_MAX)
Pablo Neira Ayusoc1d10ad2006-01-05 12:19:05 -08001154 return -EINVAL;
1155
1156 write_lock_bh(&tcp_lock);
Patrick McHardy5f7da4d2008-04-14 11:15:52 +02001157 if (tb[CTA_PROTOINFO_TCP_STATE])
1158 ct->proto.tcp.state = nla_get_u8(tb[CTA_PROTOINFO_TCP_STATE]);
Pablo Neira Ayusoc8e20782007-03-14 16:45:19 -07001159
Patrick McHardydf6fb862007-09-28 14:37:03 -07001160 if (tb[CTA_PROTOINFO_TCP_FLAGS_ORIGINAL]) {
Pablo Neira Ayusoc8e20782007-03-14 16:45:19 -07001161 struct nf_ct_tcp_flags *attr =
Patrick McHardydf6fb862007-09-28 14:37:03 -07001162 nla_data(tb[CTA_PROTOINFO_TCP_FLAGS_ORIGINAL]);
Pablo Neira Ayusoc8e20782007-03-14 16:45:19 -07001163 ct->proto.tcp.seen[0].flags &= ~attr->mask;
1164 ct->proto.tcp.seen[0].flags |= attr->flags & attr->mask;
1165 }
1166
Patrick McHardydf6fb862007-09-28 14:37:03 -07001167 if (tb[CTA_PROTOINFO_TCP_FLAGS_REPLY]) {
Pablo Neira Ayusoc8e20782007-03-14 16:45:19 -07001168 struct nf_ct_tcp_flags *attr =
Patrick McHardydf6fb862007-09-28 14:37:03 -07001169 nla_data(tb[CTA_PROTOINFO_TCP_FLAGS_REPLY]);
Pablo Neira Ayusoc8e20782007-03-14 16:45:19 -07001170 ct->proto.tcp.seen[1].flags &= ~attr->mask;
1171 ct->proto.tcp.seen[1].flags |= attr->flags & attr->mask;
1172 }
1173
Patrick McHardydf6fb862007-09-28 14:37:03 -07001174 if (tb[CTA_PROTOINFO_TCP_WSCALE_ORIGINAL] &&
1175 tb[CTA_PROTOINFO_TCP_WSCALE_REPLY] &&
Pablo Neira Ayusoc8e20782007-03-14 16:45:19 -07001176 ct->proto.tcp.seen[0].flags & IP_CT_TCP_FLAG_WINDOW_SCALE &&
1177 ct->proto.tcp.seen[1].flags & IP_CT_TCP_FLAG_WINDOW_SCALE) {
Patrick McHardy77236b62007-12-17 22:29:45 -08001178 ct->proto.tcp.seen[0].td_scale =
1179 nla_get_u8(tb[CTA_PROTOINFO_TCP_WSCALE_ORIGINAL]);
1180 ct->proto.tcp.seen[1].td_scale =
1181 nla_get_u8(tb[CTA_PROTOINFO_TCP_WSCALE_REPLY]);
Pablo Neira Ayusoc8e20782007-03-14 16:45:19 -07001182 }
Pablo Neira Ayusoc1d10ad2006-01-05 12:19:05 -08001183 write_unlock_bh(&tcp_lock);
1184
1185 return 0;
1186}
Holger Eitzenbergera400c302009-03-25 21:53:39 +01001187
1188static int tcp_nlattr_size(void)
1189{
1190 return nla_total_size(0) /* CTA_PROTOINFO_TCP */
1191 + nla_policy_len(tcp_nla_policy, CTA_PROTOINFO_TCP_MAX + 1);
1192}
1193
1194static int tcp_nlattr_tuple_size(void)
1195{
1196 return nla_policy_len(nf_ct_port_nla_policy, CTA_PROTO_MAX + 1);
1197}
Pablo Neira Ayusoc1d10ad2006-01-05 12:19:05 -08001198#endif
Patrick McHardy933a41e2006-11-29 02:35:18 +01001199
1200#ifdef CONFIG_SYSCTL
1201static unsigned int tcp_sysctl_table_users;
1202static struct ctl_table_header *tcp_sysctl_header;
1203static struct ctl_table tcp_sysctl_table[] = {
1204 {
Patrick McHardy933a41e2006-11-29 02:35:18 +01001205 .procname = "nf_conntrack_tcp_timeout_syn_sent",
Patrick McHardy2d646282008-01-14 23:45:32 -08001206 .data = &tcp_timeouts[TCP_CONNTRACK_SYN_SENT],
Patrick McHardy933a41e2006-11-29 02:35:18 +01001207 .maxlen = sizeof(unsigned int),
1208 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -08001209 .proc_handler = proc_dointvec_jiffies,
Patrick McHardy933a41e2006-11-29 02:35:18 +01001210 },
1211 {
Patrick McHardy933a41e2006-11-29 02:35:18 +01001212 .procname = "nf_conntrack_tcp_timeout_syn_recv",
Patrick McHardy2d646282008-01-14 23:45:32 -08001213 .data = &tcp_timeouts[TCP_CONNTRACK_SYN_RECV],
Patrick McHardy933a41e2006-11-29 02:35:18 +01001214 .maxlen = sizeof(unsigned int),
1215 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -08001216 .proc_handler = proc_dointvec_jiffies,
Patrick McHardy933a41e2006-11-29 02:35:18 +01001217 },
1218 {
Patrick McHardy933a41e2006-11-29 02:35:18 +01001219 .procname = "nf_conntrack_tcp_timeout_established",
Patrick McHardy2d646282008-01-14 23:45:32 -08001220 .data = &tcp_timeouts[TCP_CONNTRACK_ESTABLISHED],
Patrick McHardy933a41e2006-11-29 02:35:18 +01001221 .maxlen = sizeof(unsigned int),
1222 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -08001223 .proc_handler = proc_dointvec_jiffies,
Patrick McHardy933a41e2006-11-29 02:35:18 +01001224 },
1225 {
Patrick McHardy933a41e2006-11-29 02:35:18 +01001226 .procname = "nf_conntrack_tcp_timeout_fin_wait",
Patrick McHardy2d646282008-01-14 23:45:32 -08001227 .data = &tcp_timeouts[TCP_CONNTRACK_FIN_WAIT],
Patrick McHardy933a41e2006-11-29 02:35:18 +01001228 .maxlen = sizeof(unsigned int),
1229 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -08001230 .proc_handler = proc_dointvec_jiffies,
Patrick McHardy933a41e2006-11-29 02:35:18 +01001231 },
1232 {
Patrick McHardy933a41e2006-11-29 02:35:18 +01001233 .procname = "nf_conntrack_tcp_timeout_close_wait",
Patrick McHardy2d646282008-01-14 23:45:32 -08001234 .data = &tcp_timeouts[TCP_CONNTRACK_CLOSE_WAIT],
Patrick McHardy933a41e2006-11-29 02:35:18 +01001235 .maxlen = sizeof(unsigned int),
1236 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -08001237 .proc_handler = proc_dointvec_jiffies,
Patrick McHardy933a41e2006-11-29 02:35:18 +01001238 },
1239 {
Patrick McHardy933a41e2006-11-29 02:35:18 +01001240 .procname = "nf_conntrack_tcp_timeout_last_ack",
Patrick McHardy2d646282008-01-14 23:45:32 -08001241 .data = &tcp_timeouts[TCP_CONNTRACK_LAST_ACK],
Patrick McHardy933a41e2006-11-29 02:35:18 +01001242 .maxlen = sizeof(unsigned int),
1243 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -08001244 .proc_handler = proc_dointvec_jiffies,
Patrick McHardy933a41e2006-11-29 02:35:18 +01001245 },
1246 {
Patrick McHardy933a41e2006-11-29 02:35:18 +01001247 .procname = "nf_conntrack_tcp_timeout_time_wait",
Patrick McHardy2d646282008-01-14 23:45:32 -08001248 .data = &tcp_timeouts[TCP_CONNTRACK_TIME_WAIT],
Patrick McHardy933a41e2006-11-29 02:35:18 +01001249 .maxlen = sizeof(unsigned int),
1250 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -08001251 .proc_handler = proc_dointvec_jiffies,
Patrick McHardy933a41e2006-11-29 02:35:18 +01001252 },
1253 {
Patrick McHardy933a41e2006-11-29 02:35:18 +01001254 .procname = "nf_conntrack_tcp_timeout_close",
Patrick McHardy2d646282008-01-14 23:45:32 -08001255 .data = &tcp_timeouts[TCP_CONNTRACK_CLOSE],
Patrick McHardy933a41e2006-11-29 02:35:18 +01001256 .maxlen = sizeof(unsigned int),
1257 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -08001258 .proc_handler = proc_dointvec_jiffies,
Patrick McHardy933a41e2006-11-29 02:35:18 +01001259 },
1260 {
Patrick McHardy933a41e2006-11-29 02:35:18 +01001261 .procname = "nf_conntrack_tcp_timeout_max_retrans",
1262 .data = &nf_ct_tcp_timeout_max_retrans,
1263 .maxlen = sizeof(unsigned int),
1264 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -08001265 .proc_handler = proc_dointvec_jiffies,
Patrick McHardy933a41e2006-11-29 02:35:18 +01001266 },
1267 {
Patrick McHardyae375042008-07-31 00:38:01 -07001268 .procname = "nf_conntrack_tcp_timeout_unacknowledged",
1269 .data = &nf_ct_tcp_timeout_unacknowledged,
1270 .maxlen = sizeof(unsigned int),
1271 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -08001272 .proc_handler = proc_dointvec_jiffies,
Patrick McHardyae375042008-07-31 00:38:01 -07001273 },
1274 {
Patrick McHardy933a41e2006-11-29 02:35:18 +01001275 .ctl_name = NET_NF_CONNTRACK_TCP_LOOSE,
1276 .procname = "nf_conntrack_tcp_loose",
1277 .data = &nf_ct_tcp_loose,
1278 .maxlen = sizeof(unsigned int),
1279 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -08001280 .proc_handler = proc_dointvec,
Patrick McHardy933a41e2006-11-29 02:35:18 +01001281 },
1282 {
1283 .ctl_name = NET_NF_CONNTRACK_TCP_BE_LIBERAL,
1284 .procname = "nf_conntrack_tcp_be_liberal",
1285 .data = &nf_ct_tcp_be_liberal,
1286 .maxlen = sizeof(unsigned int),
1287 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -08001288 .proc_handler = proc_dointvec,
Patrick McHardy933a41e2006-11-29 02:35:18 +01001289 },
1290 {
1291 .ctl_name = NET_NF_CONNTRACK_TCP_MAX_RETRANS,
1292 .procname = "nf_conntrack_tcp_max_retrans",
1293 .data = &nf_ct_tcp_max_retrans,
1294 .maxlen = sizeof(unsigned int),
1295 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -08001296 .proc_handler = proc_dointvec,
Patrick McHardy933a41e2006-11-29 02:35:18 +01001297 },
1298 {
1299 .ctl_name = 0
1300 }
1301};
Patrick McHardya999e682006-11-29 02:35:20 +01001302
1303#ifdef CONFIG_NF_CONNTRACK_PROC_COMPAT
1304static struct ctl_table tcp_compat_sysctl_table[] = {
1305 {
Patrick McHardya999e682006-11-29 02:35:20 +01001306 .procname = "ip_conntrack_tcp_timeout_syn_sent",
Patrick McHardy2d646282008-01-14 23:45:32 -08001307 .data = &tcp_timeouts[TCP_CONNTRACK_SYN_SENT],
Patrick McHardya999e682006-11-29 02:35:20 +01001308 .maxlen = sizeof(unsigned int),
1309 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -08001310 .proc_handler = proc_dointvec_jiffies,
Patrick McHardya999e682006-11-29 02:35:20 +01001311 },
1312 {
Patrick McHardya999e682006-11-29 02:35:20 +01001313 .procname = "ip_conntrack_tcp_timeout_syn_recv",
Patrick McHardy2d646282008-01-14 23:45:32 -08001314 .data = &tcp_timeouts[TCP_CONNTRACK_SYN_RECV],
Patrick McHardya999e682006-11-29 02:35:20 +01001315 .maxlen = sizeof(unsigned int),
1316 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -08001317 .proc_handler = proc_dointvec_jiffies,
Patrick McHardya999e682006-11-29 02:35:20 +01001318 },
1319 {
Patrick McHardya999e682006-11-29 02:35:20 +01001320 .procname = "ip_conntrack_tcp_timeout_established",
Patrick McHardy2d646282008-01-14 23:45:32 -08001321 .data = &tcp_timeouts[TCP_CONNTRACK_ESTABLISHED],
Patrick McHardya999e682006-11-29 02:35:20 +01001322 .maxlen = sizeof(unsigned int),
1323 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -08001324 .proc_handler = proc_dointvec_jiffies,
Patrick McHardya999e682006-11-29 02:35:20 +01001325 },
1326 {
Patrick McHardya999e682006-11-29 02:35:20 +01001327 .procname = "ip_conntrack_tcp_timeout_fin_wait",
Patrick McHardy2d646282008-01-14 23:45:32 -08001328 .data = &tcp_timeouts[TCP_CONNTRACK_FIN_WAIT],
Patrick McHardya999e682006-11-29 02:35:20 +01001329 .maxlen = sizeof(unsigned int),
1330 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -08001331 .proc_handler = proc_dointvec_jiffies,
Patrick McHardya999e682006-11-29 02:35:20 +01001332 },
1333 {
Patrick McHardya999e682006-11-29 02:35:20 +01001334 .procname = "ip_conntrack_tcp_timeout_close_wait",
Patrick McHardy2d646282008-01-14 23:45:32 -08001335 .data = &tcp_timeouts[TCP_CONNTRACK_CLOSE_WAIT],
Patrick McHardya999e682006-11-29 02:35:20 +01001336 .maxlen = sizeof(unsigned int),
1337 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -08001338 .proc_handler = proc_dointvec_jiffies,
Patrick McHardya999e682006-11-29 02:35:20 +01001339 },
1340 {
Patrick McHardya999e682006-11-29 02:35:20 +01001341 .procname = "ip_conntrack_tcp_timeout_last_ack",
Patrick McHardy2d646282008-01-14 23:45:32 -08001342 .data = &tcp_timeouts[TCP_CONNTRACK_LAST_ACK],
Patrick McHardya999e682006-11-29 02:35:20 +01001343 .maxlen = sizeof(unsigned int),
1344 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -08001345 .proc_handler = proc_dointvec_jiffies,
Patrick McHardya999e682006-11-29 02:35:20 +01001346 },
1347 {
Patrick McHardya999e682006-11-29 02:35:20 +01001348 .procname = "ip_conntrack_tcp_timeout_time_wait",
Patrick McHardy2d646282008-01-14 23:45:32 -08001349 .data = &tcp_timeouts[TCP_CONNTRACK_TIME_WAIT],
Patrick McHardya999e682006-11-29 02:35:20 +01001350 .maxlen = sizeof(unsigned int),
1351 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -08001352 .proc_handler = proc_dointvec_jiffies,
Patrick McHardya999e682006-11-29 02:35:20 +01001353 },
1354 {
Patrick McHardya999e682006-11-29 02:35:20 +01001355 .procname = "ip_conntrack_tcp_timeout_close",
Patrick McHardy2d646282008-01-14 23:45:32 -08001356 .data = &tcp_timeouts[TCP_CONNTRACK_CLOSE],
Patrick McHardya999e682006-11-29 02:35:20 +01001357 .maxlen = sizeof(unsigned int),
1358 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -08001359 .proc_handler = proc_dointvec_jiffies,
Patrick McHardya999e682006-11-29 02:35:20 +01001360 },
1361 {
Patrick McHardya999e682006-11-29 02:35:20 +01001362 .procname = "ip_conntrack_tcp_timeout_max_retrans",
1363 .data = &nf_ct_tcp_timeout_max_retrans,
1364 .maxlen = sizeof(unsigned int),
1365 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -08001366 .proc_handler = proc_dointvec_jiffies,
Patrick McHardya999e682006-11-29 02:35:20 +01001367 },
1368 {
1369 .ctl_name = NET_IPV4_NF_CONNTRACK_TCP_LOOSE,
1370 .procname = "ip_conntrack_tcp_loose",
1371 .data = &nf_ct_tcp_loose,
1372 .maxlen = sizeof(unsigned int),
1373 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -08001374 .proc_handler = proc_dointvec,
Patrick McHardya999e682006-11-29 02:35:20 +01001375 },
1376 {
1377 .ctl_name = NET_IPV4_NF_CONNTRACK_TCP_BE_LIBERAL,
1378 .procname = "ip_conntrack_tcp_be_liberal",
1379 .data = &nf_ct_tcp_be_liberal,
1380 .maxlen = sizeof(unsigned int),
1381 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -08001382 .proc_handler = proc_dointvec,
Patrick McHardya999e682006-11-29 02:35:20 +01001383 },
1384 {
1385 .ctl_name = NET_IPV4_NF_CONNTRACK_TCP_MAX_RETRANS,
1386 .procname = "ip_conntrack_tcp_max_retrans",
1387 .data = &nf_ct_tcp_max_retrans,
1388 .maxlen = sizeof(unsigned int),
1389 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -08001390 .proc_handler = proc_dointvec,
Patrick McHardya999e682006-11-29 02:35:20 +01001391 },
1392 {
1393 .ctl_name = 0
1394 }
1395};
1396#endif /* CONFIG_NF_CONNTRACK_PROC_COMPAT */
Patrick McHardy933a41e2006-11-29 02:35:18 +01001397#endif /* CONFIG_SYSCTL */
1398
Patrick McHardy61075af2007-07-14 20:48:19 -07001399struct nf_conntrack_l4proto nf_conntrack_l4proto_tcp4 __read_mostly =
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -08001400{
1401 .l3proto = PF_INET,
Martin Josefsson605dcad2006-11-29 02:35:06 +01001402 .l4proto = IPPROTO_TCP,
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -08001403 .name = "tcp",
1404 .pkt_to_tuple = tcp_pkt_to_tuple,
1405 .invert_tuple = tcp_invert_tuple,
1406 .print_tuple = tcp_print_tuple,
1407 .print_conntrack = tcp_print_conntrack,
1408 .packet = tcp_packet,
1409 .new = tcp_new,
Patrick McHardy96f6bf82006-04-06 14:19:24 -07001410 .error = tcp_error,
Patrick McHardye281db5c2007-03-04 15:57:25 -08001411#if defined(CONFIG_NF_CT_NETLINK) || defined(CONFIG_NF_CT_NETLINK_MODULE)
Patrick McHardyfdf70832007-09-28 14:37:41 -07001412 .to_nlattr = tcp_to_nlattr,
Holger Eitzenbergera400c302009-03-25 21:53:39 +01001413 .nlattr_size = tcp_nlattr_size,
Patrick McHardyfdf70832007-09-28 14:37:41 -07001414 .from_nlattr = nlattr_to_tcp,
1415 .tuple_to_nlattr = nf_ct_port_tuple_to_nlattr,
1416 .nlattr_to_tuple = nf_ct_port_nlattr_to_tuple,
Holger Eitzenbergera400c302009-03-25 21:53:39 +01001417 .nlattr_tuple_size = tcp_nlattr_tuple_size,
Patrick McHardyf73e9242007-09-28 14:39:55 -07001418 .nla_policy = nf_ct_port_nla_policy,
Pablo Neira Ayusoc1d10ad2006-01-05 12:19:05 -08001419#endif
Patrick McHardy933a41e2006-11-29 02:35:18 +01001420#ifdef CONFIG_SYSCTL
1421 .ctl_table_users = &tcp_sysctl_table_users,
1422 .ctl_table_header = &tcp_sysctl_header,
1423 .ctl_table = tcp_sysctl_table,
Patrick McHardya999e682006-11-29 02:35:20 +01001424#ifdef CONFIG_NF_CONNTRACK_PROC_COMPAT
1425 .ctl_compat_table = tcp_compat_sysctl_table,
1426#endif
Patrick McHardy933a41e2006-11-29 02:35:18 +01001427#endif
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -08001428};
Patrick McHardy13b18332006-12-02 22:11:25 -08001429EXPORT_SYMBOL_GPL(nf_conntrack_l4proto_tcp4);
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -08001430
Patrick McHardy61075af2007-07-14 20:48:19 -07001431struct nf_conntrack_l4proto nf_conntrack_l4proto_tcp6 __read_mostly =
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -08001432{
1433 .l3proto = PF_INET6,
Martin Josefsson605dcad2006-11-29 02:35:06 +01001434 .l4proto = IPPROTO_TCP,
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -08001435 .name = "tcp",
1436 .pkt_to_tuple = tcp_pkt_to_tuple,
1437 .invert_tuple = tcp_invert_tuple,
1438 .print_tuple = tcp_print_tuple,
1439 .print_conntrack = tcp_print_conntrack,
1440 .packet = tcp_packet,
1441 .new = tcp_new,
Patrick McHardy96f6bf82006-04-06 14:19:24 -07001442 .error = tcp_error,
Patrick McHardye281db5c2007-03-04 15:57:25 -08001443#if defined(CONFIG_NF_CT_NETLINK) || defined(CONFIG_NF_CT_NETLINK_MODULE)
Patrick McHardyfdf70832007-09-28 14:37:41 -07001444 .to_nlattr = tcp_to_nlattr,
Holger Eitzenbergera400c302009-03-25 21:53:39 +01001445 .nlattr_size = tcp_nlattr_size,
Patrick McHardyfdf70832007-09-28 14:37:41 -07001446 .from_nlattr = nlattr_to_tcp,
1447 .tuple_to_nlattr = nf_ct_port_tuple_to_nlattr,
1448 .nlattr_to_tuple = nf_ct_port_nlattr_to_tuple,
Holger Eitzenbergera400c302009-03-25 21:53:39 +01001449 .nlattr_tuple_size = tcp_nlattr_tuple_size,
Patrick McHardyf73e9242007-09-28 14:39:55 -07001450 .nla_policy = nf_ct_port_nla_policy,
Pablo Neira Ayusoc1d10ad2006-01-05 12:19:05 -08001451#endif
Patrick McHardy933a41e2006-11-29 02:35:18 +01001452#ifdef CONFIG_SYSCTL
1453 .ctl_table_users = &tcp_sysctl_table_users,
1454 .ctl_table_header = &tcp_sysctl_header,
1455 .ctl_table = tcp_sysctl_table,
1456#endif
Yasuyuki Kozakai9fb9cbb2005-11-09 16:38:16 -08001457};
Patrick McHardy13b18332006-12-02 22:11:25 -08001458EXPORT_SYMBOL_GPL(nf_conntrack_l4proto_tcp6);