blob: 217e2b6863225acf4353e7cd6f4869df3ce1da56 [file] [log] [blame]
/*
 * This is a module which is used for setting the MSS option in TCP packets.
 *
 * Copyright (C) 2000 Marc Boucher <marc@mbsi.ca>
 *
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License version 2 as
 * published by the Free Software Foundation.
 */
10
11#include <linux/module.h>
12#include <linux/skbuff.h>
13#include <linux/ip.h>
14#include <linux/ipv6.h>
15#include <linux/tcp.h>
Jan Engelhardt37c08382008-01-31 04:06:10 -080016#include <net/dst.h>
17#include <net/flow.h>
Patrick McHardycdd289a2007-02-07 15:09:46 -080018#include <net/ipv6.h>
Jan Engelhardt37c08382008-01-31 04:06:10 -080019#include <net/route.h>
Patrick McHardycdd289a2007-02-07 15:09:46 -080020#include <net/tcp.h>
21
22#include <linux/netfilter_ipv4/ip_tables.h>
23#include <linux/netfilter_ipv6/ip6_tables.h>
24#include <linux/netfilter/x_tables.h>
25#include <linux/netfilter/xt_tcpudp.h>
26#include <linux/netfilter/xt_TCPMSS.h>
27
28MODULE_LICENSE("GPL");
29MODULE_AUTHOR("Marc Boucher <marc@mbsi.ca>");
Jan Engelhardt2ae15b62008-01-14 23:42:28 -080030MODULE_DESCRIPTION("Xtables: TCP Maximum Segment Size (MSS) adjustment");
Patrick McHardycdd289a2007-02-07 15:09:46 -080031MODULE_ALIAS("ipt_TCPMSS");
32MODULE_ALIAS("ip6t_TCPMSS");
33
34static inline unsigned int
35optlen(const u_int8_t *opt, unsigned int offset)
36{
37 /* Beware zero-length options: make finite progress */
38 if (opt[offset] <= TCPOPT_NOP || opt[offset+1] == 0)
39 return 1;
40 else
41 return opt[offset+1];
42}
43
44static int
Herbert Xu3db05fe2007-10-15 00:53:15 -070045tcpmss_mangle_packet(struct sk_buff *skb,
Patrick McHardycdd289a2007-02-07 15:09:46 -080046 const struct xt_tcpmss_info *info,
Jan Engelhardt37c08382008-01-31 04:06:10 -080047 unsigned int in_mtu,
Patrick McHardycdd289a2007-02-07 15:09:46 -080048 unsigned int tcphoff,
49 unsigned int minlen)
50{
51 struct tcphdr *tcph;
52 unsigned int tcplen, i;
53 __be16 oldval;
54 u16 newmss;
55 u8 *opt;
56
Herbert Xu3db05fe2007-10-15 00:53:15 -070057 if (!skb_make_writable(skb, skb->len))
Patrick McHardycdd289a2007-02-07 15:09:46 -080058 return -1;
59
Herbert Xu3db05fe2007-10-15 00:53:15 -070060 tcplen = skb->len - tcphoff;
61 tcph = (struct tcphdr *)(skb_network_header(skb) + tcphoff);
Patrick McHardycdd289a2007-02-07 15:09:46 -080062
63 /* Since it passed flags test in tcp match, we know it is is
64 not a fragment, and has data >= tcp header length. SYN
65 packets should not contain data: if they did, then we risk
66 running over MTU, sending Frag Needed and breaking things
67 badly. --RR */
68 if (tcplen != tcph->doff*4) {
69 if (net_ratelimit())
70 printk(KERN_ERR "xt_TCPMSS: bad length (%u bytes)\n",
Herbert Xu3db05fe2007-10-15 00:53:15 -070071 skb->len);
Patrick McHardycdd289a2007-02-07 15:09:46 -080072 return -1;
73 }
74
75 if (info->mss == XT_TCPMSS_CLAMP_PMTU) {
Herbert Xu3db05fe2007-10-15 00:53:15 -070076 if (dst_mtu(skb->dst) <= minlen) {
Patrick McHardycdd289a2007-02-07 15:09:46 -080077 if (net_ratelimit())
78 printk(KERN_ERR "xt_TCPMSS: "
79 "unknown or invalid path-MTU (%u)\n",
Herbert Xu3db05fe2007-10-15 00:53:15 -070080 dst_mtu(skb->dst));
Patrick McHardycdd289a2007-02-07 15:09:46 -080081 return -1;
82 }
Jan Engelhardt37c08382008-01-31 04:06:10 -080083 if (in_mtu <= minlen) {
84 if (net_ratelimit())
85 printk(KERN_ERR "xt_TCPMSS: unknown or "
86 "invalid path-MTU (%u)\n", in_mtu);
87 return -1;
88 }
89 newmss = min(dst_mtu(skb->dst), in_mtu) - minlen;
Patrick McHardycdd289a2007-02-07 15:09:46 -080090 } else
91 newmss = info->mss;
92
93 opt = (u_int8_t *)tcph;
94 for (i = sizeof(struct tcphdr); i < tcph->doff*4; i += optlen(opt, i)) {
95 if (opt[i] == TCPOPT_MSS && tcph->doff*4 - i >= TCPOLEN_MSS &&
96 opt[i+1] == TCPOLEN_MSS) {
97 u_int16_t oldmss;
98
99 oldmss = (opt[i+2] << 8) | opt[i+3];
100
Benjamin LaHaise17008062007-12-17 22:27:36 -0800101 /* Never increase MSS, even when setting it, as
102 * doing so results in problems for hosts that rely
103 * on MSS being set correctly.
104 */
105 if (oldmss <= newmss)
Patrick McHardycdd289a2007-02-07 15:09:46 -0800106 return 0;
107
108 opt[i+2] = (newmss & 0xff00) >> 8;
Jan Engelhardt7c4e36b2007-07-07 22:19:08 -0700109 opt[i+3] = newmss & 0x00ff;
Patrick McHardycdd289a2007-02-07 15:09:46 -0800110
Patrick McHardybe0ea7d2007-11-30 01:17:11 +1100111 inet_proto_csum_replace2(&tcph->check, skb,
112 htons(oldmss), htons(newmss),
113 0);
Patrick McHardycdd289a2007-02-07 15:09:46 -0800114 return 0;
115 }
116 }
117
118 /*
119 * MSS Option not found ?! add it..
120 */
Herbert Xu3db05fe2007-10-15 00:53:15 -0700121 if (skb_tailroom(skb) < TCPOLEN_MSS) {
122 if (pskb_expand_head(skb, 0,
123 TCPOLEN_MSS - skb_tailroom(skb),
Herbert Xu2ca7b0a2007-10-14 00:39:55 -0700124 GFP_ATOMIC))
Patrick McHardycdd289a2007-02-07 15:09:46 -0800125 return -1;
Herbert Xu3db05fe2007-10-15 00:53:15 -0700126 tcph = (struct tcphdr *)(skb_network_header(skb) + tcphoff);
Patrick McHardycdd289a2007-02-07 15:09:46 -0800127 }
128
Herbert Xu3db05fe2007-10-15 00:53:15 -0700129 skb_put(skb, TCPOLEN_MSS);
Patrick McHardycdd289a2007-02-07 15:09:46 -0800130
131 opt = (u_int8_t *)tcph + sizeof(struct tcphdr);
132 memmove(opt + TCPOLEN_MSS, opt, tcplen - sizeof(struct tcphdr));
133
Patrick McHardybe0ea7d2007-11-30 01:17:11 +1100134 inet_proto_csum_replace2(&tcph->check, skb,
135 htons(tcplen), htons(tcplen + TCPOLEN_MSS), 1);
Patrick McHardycdd289a2007-02-07 15:09:46 -0800136 opt[0] = TCPOPT_MSS;
137 opt[1] = TCPOLEN_MSS;
138 opt[2] = (newmss & 0xff00) >> 8;
Jan Engelhardt7c4e36b2007-07-07 22:19:08 -0700139 opt[3] = newmss & 0x00ff;
Patrick McHardycdd289a2007-02-07 15:09:46 -0800140
Patrick McHardybe0ea7d2007-11-30 01:17:11 +1100141 inet_proto_csum_replace4(&tcph->check, skb, 0, *((__be32 *)opt), 0);
Patrick McHardycdd289a2007-02-07 15:09:46 -0800142
143 oldval = ((__be16 *)tcph)[6];
144 tcph->doff += TCPOLEN_MSS/4;
Patrick McHardybe0ea7d2007-11-30 01:17:11 +1100145 inet_proto_csum_replace2(&tcph->check, skb,
146 oldval, ((__be16 *)tcph)[6], 0);
Patrick McHardycdd289a2007-02-07 15:09:46 -0800147 return TCPOLEN_MSS;
148}
149
Jan Engelhardt37c08382008-01-31 04:06:10 -0800150static u_int32_t tcpmss_reverse_mtu4(const struct iphdr *iph)
151{
152 struct flowi fl = {
153 .fl4_dst = iph->saddr,
154 };
155 const struct nf_afinfo *ai;
156 struct rtable *rt = NULL;
157 u_int32_t mtu = ~0U;
158
159 rcu_read_lock();
160 ai = nf_get_afinfo(AF_INET);
161 if (ai != NULL)
162 ai->route((struct dst_entry **)&rt, &fl);
163 rcu_read_unlock();
164
165 if (rt != NULL) {
166 mtu = dst_mtu(&rt->u.dst);
167 dst_release(&rt->u.dst);
168 }
169 return mtu;
170}
171
Patrick McHardycdd289a2007-02-07 15:09:46 -0800172static unsigned int
Jan Engelhardtd3c5ee62007-12-04 23:24:03 -0800173tcpmss_tg4(struct sk_buff *skb, const struct net_device *in,
174 const struct net_device *out, unsigned int hooknum,
175 const struct xt_target *target, const void *targinfo)
Patrick McHardycdd289a2007-02-07 15:09:46 -0800176{
Herbert Xu3db05fe2007-10-15 00:53:15 -0700177 struct iphdr *iph = ip_hdr(skb);
Patrick McHardycdd289a2007-02-07 15:09:46 -0800178 __be16 newlen;
179 int ret;
180
Jan Engelhardt37c08382008-01-31 04:06:10 -0800181 ret = tcpmss_mangle_packet(skb, targinfo, tcpmss_reverse_mtu4(iph),
182 iph->ihl * 4,
Patrick McHardycdd289a2007-02-07 15:09:46 -0800183 sizeof(*iph) + sizeof(struct tcphdr));
184 if (ret < 0)
185 return NF_DROP;
186 if (ret > 0) {
Herbert Xu3db05fe2007-10-15 00:53:15 -0700187 iph = ip_hdr(skb);
Patrick McHardycdd289a2007-02-07 15:09:46 -0800188 newlen = htons(ntohs(iph->tot_len) + ret);
Patrick McHardybe0ea7d2007-11-30 01:17:11 +1100189 csum_replace2(&iph->check, iph->tot_len, newlen);
Patrick McHardycdd289a2007-02-07 15:09:46 -0800190 iph->tot_len = newlen;
191 }
192 return XT_CONTINUE;
193}
194
195#if defined(CONFIG_IP6_NF_IPTABLES) || defined(CONFIG_IP6_NF_IPTABLES_MODULE)
Jan Engelhardt37c08382008-01-31 04:06:10 -0800196static u_int32_t tcpmss_reverse_mtu6(const struct ipv6hdr *iph)
197{
198 struct flowi fl = {
199 .fl6_dst = iph->saddr,
200 };
201 const struct nf_afinfo *ai;
202 struct rtable *rt = NULL;
203 u_int32_t mtu = ~0U;
204
205 rcu_read_lock();
206 ai = nf_get_afinfo(AF_INET6);
207 if (ai != NULL)
208 ai->route((struct dst_entry **)&rt, &fl);
209 rcu_read_unlock();
210
211 if (rt != NULL) {
212 mtu = dst_mtu(&rt->u.dst);
213 dst_release(&rt->u.dst);
214 }
215 return mtu;
216}
217
Patrick McHardycdd289a2007-02-07 15:09:46 -0800218static unsigned int
Jan Engelhardtd3c5ee62007-12-04 23:24:03 -0800219tcpmss_tg6(struct sk_buff *skb, const struct net_device *in,
220 const struct net_device *out, unsigned int hooknum,
221 const struct xt_target *target, const void *targinfo)
Patrick McHardycdd289a2007-02-07 15:09:46 -0800222{
Herbert Xu3db05fe2007-10-15 00:53:15 -0700223 struct ipv6hdr *ipv6h = ipv6_hdr(skb);
Patrick McHardycdd289a2007-02-07 15:09:46 -0800224 u8 nexthdr;
225 int tcphoff;
226 int ret;
227
228 nexthdr = ipv6h->nexthdr;
Herbert Xu3db05fe2007-10-15 00:53:15 -0700229 tcphoff = ipv6_skip_exthdr(skb, sizeof(*ipv6h), &nexthdr);
Patrick McHardy9dc05642007-11-30 23:58:03 +1100230 if (tcphoff < 0)
Patrick McHardycdd289a2007-02-07 15:09:46 -0800231 return NF_DROP;
Jan Engelhardt37c08382008-01-31 04:06:10 -0800232 ret = tcpmss_mangle_packet(skb, targinfo, tcpmss_reverse_mtu6(ipv6h),
233 tcphoff,
Patrick McHardycdd289a2007-02-07 15:09:46 -0800234 sizeof(*ipv6h) + sizeof(struct tcphdr));
235 if (ret < 0)
236 return NF_DROP;
237 if (ret > 0) {
Herbert Xu3db05fe2007-10-15 00:53:15 -0700238 ipv6h = ipv6_hdr(skb);
Patrick McHardycdd289a2007-02-07 15:09:46 -0800239 ipv6h->payload_len = htons(ntohs(ipv6h->payload_len) + ret);
240 }
241 return XT_CONTINUE;
242}
243#endif
244
245#define TH_SYN 0x02
246
247/* Must specify -p tcp --syn */
Jan Engelhardte1931b72007-07-07 22:16:26 -0700248static inline bool find_syn_match(const struct xt_entry_match *m)
Patrick McHardycdd289a2007-02-07 15:09:46 -0800249{
250 const struct xt_tcp *tcpinfo = (const struct xt_tcp *)m->data;
251
252 if (strcmp(m->u.kernel.match->name, "tcp") == 0 &&
253 tcpinfo->flg_cmp & TH_SYN &&
254 !(tcpinfo->invflags & XT_TCP_INV_FLAGS))
Jan Engelhardte1931b72007-07-07 22:16:26 -0700255 return true;
Patrick McHardycdd289a2007-02-07 15:09:46 -0800256
Jan Engelhardte1931b72007-07-07 22:16:26 -0700257 return false;
Patrick McHardycdd289a2007-02-07 15:09:46 -0800258}
259
Jan Engelhardte1931b72007-07-07 22:16:26 -0700260static bool
Jan Engelhardtd3c5ee62007-12-04 23:24:03 -0800261tcpmss_tg4_check(const char *tablename, const void *entry,
262 const struct xt_target *target, void *targinfo,
263 unsigned int hook_mask)
Patrick McHardycdd289a2007-02-07 15:09:46 -0800264{
265 const struct xt_tcpmss_info *info = targinfo;
266 const struct ipt_entry *e = entry;
267
268 if (info->mss == XT_TCPMSS_CLAMP_PMTU &&
Patrick McHardy6e23ae22007-11-19 18:53:30 -0800269 (hook_mask & ~((1 << NF_INET_FORWARD) |
270 (1 << NF_INET_LOCAL_OUT) |
271 (1 << NF_INET_POST_ROUTING))) != 0) {
Patrick McHardycdd289a2007-02-07 15:09:46 -0800272 printk("xt_TCPMSS: path-MTU clamping only supported in "
273 "FORWARD, OUTPUT and POSTROUTING hooks\n");
Jan Engelhardte1931b72007-07-07 22:16:26 -0700274 return false;
Patrick McHardycdd289a2007-02-07 15:09:46 -0800275 }
276 if (IPT_MATCH_ITERATE(e, find_syn_match))
Jan Engelhardte1931b72007-07-07 22:16:26 -0700277 return true;
Patrick McHardycdd289a2007-02-07 15:09:46 -0800278 printk("xt_TCPMSS: Only works on TCP SYN packets\n");
Jan Engelhardte1931b72007-07-07 22:16:26 -0700279 return false;
Patrick McHardycdd289a2007-02-07 15:09:46 -0800280}
281
282#if defined(CONFIG_IP6_NF_IPTABLES) || defined(CONFIG_IP6_NF_IPTABLES_MODULE)
Jan Engelhardte1931b72007-07-07 22:16:26 -0700283static bool
Jan Engelhardtd3c5ee62007-12-04 23:24:03 -0800284tcpmss_tg6_check(const char *tablename, const void *entry,
285 const struct xt_target *target, void *targinfo,
286 unsigned int hook_mask)
Patrick McHardycdd289a2007-02-07 15:09:46 -0800287{
288 const struct xt_tcpmss_info *info = targinfo;
289 const struct ip6t_entry *e = entry;
290
291 if (info->mss == XT_TCPMSS_CLAMP_PMTU &&
Patrick McHardy6e23ae22007-11-19 18:53:30 -0800292 (hook_mask & ~((1 << NF_INET_FORWARD) |
293 (1 << NF_INET_LOCAL_OUT) |
294 (1 << NF_INET_POST_ROUTING))) != 0) {
Patrick McHardycdd289a2007-02-07 15:09:46 -0800295 printk("xt_TCPMSS: path-MTU clamping only supported in "
296 "FORWARD, OUTPUT and POSTROUTING hooks\n");
Jan Engelhardte1931b72007-07-07 22:16:26 -0700297 return false;
Patrick McHardycdd289a2007-02-07 15:09:46 -0800298 }
299 if (IP6T_MATCH_ITERATE(e, find_syn_match))
Jan Engelhardte1931b72007-07-07 22:16:26 -0700300 return true;
Patrick McHardycdd289a2007-02-07 15:09:46 -0800301 printk("xt_TCPMSS: Only works on TCP SYN packets\n");
Jan Engelhardte1931b72007-07-07 22:16:26 -0700302 return false;
Patrick McHardycdd289a2007-02-07 15:09:46 -0800303}
304#endif
305
Jan Engelhardtd3c5ee62007-12-04 23:24:03 -0800306static struct xt_target tcpmss_tg_reg[] __read_mostly = {
Patrick McHardycdd289a2007-02-07 15:09:46 -0800307 {
308 .family = AF_INET,
309 .name = "TCPMSS",
Jan Engelhardtd3c5ee62007-12-04 23:24:03 -0800310 .checkentry = tcpmss_tg4_check,
311 .target = tcpmss_tg4,
Patrick McHardycdd289a2007-02-07 15:09:46 -0800312 .targetsize = sizeof(struct xt_tcpmss_info),
313 .proto = IPPROTO_TCP,
314 .me = THIS_MODULE,
315 },
316#if defined(CONFIG_IP6_NF_IPTABLES) || defined(CONFIG_IP6_NF_IPTABLES_MODULE)
317 {
318 .family = AF_INET6,
319 .name = "TCPMSS",
Jan Engelhardtd3c5ee62007-12-04 23:24:03 -0800320 .checkentry = tcpmss_tg6_check,
321 .target = tcpmss_tg6,
Patrick McHardycdd289a2007-02-07 15:09:46 -0800322 .targetsize = sizeof(struct xt_tcpmss_info),
323 .proto = IPPROTO_TCP,
324 .me = THIS_MODULE,
325 },
326#endif
327};
328
Jan Engelhardtd3c5ee62007-12-04 23:24:03 -0800329static int __init tcpmss_tg_init(void)
Patrick McHardycdd289a2007-02-07 15:09:46 -0800330{
Jan Engelhardtd3c5ee62007-12-04 23:24:03 -0800331 return xt_register_targets(tcpmss_tg_reg, ARRAY_SIZE(tcpmss_tg_reg));
Patrick McHardycdd289a2007-02-07 15:09:46 -0800332}
333
Jan Engelhardtd3c5ee62007-12-04 23:24:03 -0800334static void __exit tcpmss_tg_exit(void)
Patrick McHardycdd289a2007-02-07 15:09:46 -0800335{
Jan Engelhardtd3c5ee62007-12-04 23:24:03 -0800336 xt_unregister_targets(tcpmss_tg_reg, ARRAY_SIZE(tcpmss_tg_reg));
Patrick McHardycdd289a2007-02-07 15:09:46 -0800337}
338
/* Hook the registration and unregistration routines into module load/unload. */
module_init(tcpmss_tg_init);
module_exit(tcpmss_tg_exit);