blob: 3277680186b4894a62f3791f3fcca9aa7ed99a23 [file] [log] [blame]
/*
 *	TCP over IPv6
 *	Linux INET6 implementation
 *
 *	Authors:
 *	Pedro Roque		<roque@di.fc.ul.pt>
 *
 *	Based on:
 *	linux/net/ipv4/tcp.c
 *	linux/net/ipv4/tcp_input.c
 *	linux/net/ipv4/tcp_output.c
 *
 *	Fixes:
 *	Hideaki YOSHIFUJI	:	sin6_scope_id support
 *	YOSHIFUJI Hideaki @USAGI and:	Support IPV6_V6ONLY socket option, which
 *	Alexey Kuznetsov		allows both IPv4 and IPv6 sockets to bind
 *					a single port at the same time.
 *	YOSHIFUJI Hideaki @USAGI:	convert /proc/net/tcp6 to seq_file.
 *
 *	This program is free software; you can redistribute it and/or
 *      modify it under the terms of the GNU General Public License
 *      as published by the Free Software Foundation; either version
 *      2 of the License, or (at your option) any later version.
 */
25
Herbert Xueb4dea52008-12-29 23:04:08 -080026#include <linux/bottom_half.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070027#include <linux/module.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070028#include <linux/errno.h>
29#include <linux/types.h>
30#include <linux/socket.h>
31#include <linux/sockios.h>
32#include <linux/net.h>
33#include <linux/jiffies.h>
34#include <linux/in.h>
35#include <linux/in6.h>
36#include <linux/netdevice.h>
37#include <linux/init.h>
38#include <linux/jhash.h>
39#include <linux/ipsec.h>
40#include <linux/times.h>
Tejun Heo5a0e3ad2010-03-24 17:04:11 +090041#include <linux/slab.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070042
43#include <linux/ipv6.h>
44#include <linux/icmpv6.h>
45#include <linux/random.h>
46
47#include <net/tcp.h>
48#include <net/ndisc.h>
Arnaldo Carvalho de Melo5324a042005-08-12 09:26:18 -030049#include <net/inet6_hashtables.h>
Arnaldo Carvalho de Melo81297652005-12-13 23:15:24 -080050#include <net/inet6_connection_sock.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070051#include <net/ipv6.h>
52#include <net/transp_v6.h>
53#include <net/addrconf.h>
54#include <net/ip6_route.h>
55#include <net/ip6_checksum.h>
56#include <net/inet_ecn.h>
57#include <net/protocol.h>
58#include <net/xfrm.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070059#include <net/snmp.h>
60#include <net/dsfield.h>
Arnaldo Carvalho de Melo6d6ee432005-12-13 23:25:19 -080061#include <net/timewait_sock.h>
Jeff Garzik18134be2007-10-26 22:53:14 -070062#include <net/netdma.h>
Denis V. Lunev3d58b5f2008-04-03 14:22:32 -070063#include <net/inet_common.h>
David S. Miller6e5714e2011-08-03 20:50:44 -070064#include <net/secure_seq.h>
Glauber Costad1a4c0b2011-12-11 21:47:04 +000065#include <net/tcp_memcontrol.h>
Eliezer Tamir076bb0c2013-07-10 17:13:17 +030066#include <net/busy_poll.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070067
68#include <asm/uaccess.h>
69
70#include <linux/proc_fs.h>
71#include <linux/seq_file.h>
72
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -080073#include <linux/crypto.h>
74#include <linux/scatterlist.h>
75
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -080076static void tcp_v6_send_reset(struct sock *sk, struct sk_buff *skb);
Gui Jianfeng6edafaa2008-08-06 23:50:04 -070077static void tcp_v6_reqsk_send_ack(struct sock *sk, struct sk_buff *skb,
78 struct request_sock *req);
Linus Torvalds1da177e2005-04-16 15:20:36 -070079
80static int tcp_v6_do_rcv(struct sock *sk, struct sk_buff *skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -070081
Stephen Hemminger3b401a82009-09-01 19:25:04 +000082static const struct inet_connection_sock_af_ops ipv6_mapped;
83static const struct inet_connection_sock_af_ops ipv6_specific;
David S. Millera9286302006-11-14 19:53:22 -080084#ifdef CONFIG_TCP_MD5SIG
Stephen Hemmingerb2e4b3d2009-09-01 19:25:03 +000085static const struct tcp_sock_af_ops tcp_sock_ipv6_specific;
86static const struct tcp_sock_af_ops tcp_sock_ipv6_mapped_specific;
YOSHIFUJI Hideaki9501f972008-04-18 12:45:16 +090087#else
88static struct tcp_md5sig_key *tcp_v6_md5_do_lookup(struct sock *sk,
Eric Dumazetb71d1d42011-04-22 04:53:02 +000089 const struct in6_addr *addr)
YOSHIFUJI Hideaki9501f972008-04-18 12:45:16 +090090{
91 return NULL;
92}
David S. Millera9286302006-11-14 19:53:22 -080093#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -070094
Neal Cardwellfae6ef82012-08-19 03:30:38 +000095static void inet6_sk_rx_dst_set(struct sock *sk, const struct sk_buff *skb)
96{
97 struct dst_entry *dst = skb_dst(skb);
98 const struct rt6_info *rt = (const struct rt6_info *)dst;
99
100 dst_hold(dst);
101 sk->sk_rx_dst = dst;
102 inet_sk(sk)->rx_dst_ifindex = skb->skb_iif;
103 if (rt->rt6i_node)
104 inet6_sk(sk)->rx_dst_cookie = rt->rt6i_node->fn_sernum;
105}
106
Linus Torvalds1da177e2005-04-16 15:20:36 -0700107static void tcp_v6_hash(struct sock *sk)
108{
109 if (sk->sk_state != TCP_CLOSE) {
Arnaldo Carvalho de Melo8292a172005-12-13 23:15:52 -0800110 if (inet_csk(sk)->icsk_af_ops == &ipv6_mapped) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700111 tcp_prot.hash(sk);
112 return;
113 }
114 local_bh_disable();
Eric Dumazet9327f702009-12-04 03:46:54 +0000115 __inet6_hash(sk, NULL);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700116 local_bh_enable();
117 }
118}
119
Eric Dumazetcf533ea2011-10-21 05:22:42 -0400120static __u32 tcp_v6_init_sequence(const struct sk_buff *skb)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700121{
Arnaldo Carvalho de Melo0660e032007-04-25 17:54:47 -0700122 return secure_tcpv6_sequence_number(ipv6_hdr(skb)->daddr.s6_addr32,
123 ipv6_hdr(skb)->saddr.s6_addr32,
Arnaldo Carvalho de Meloaa8223c2007-04-10 21:04:22 -0700124 tcp_hdr(skb)->dest,
125 tcp_hdr(skb)->source);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700126}
127
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +0900128static int tcp_v6_connect(struct sock *sk, struct sockaddr *uaddr,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700129 int addr_len)
130{
131 struct sockaddr_in6 *usin = (struct sockaddr_in6 *) uaddr;
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +0900132 struct inet_sock *inet = inet_sk(sk);
Arnaldo Carvalho de Melod83d8462005-12-13 23:26:10 -0800133 struct inet_connection_sock *icsk = inet_csk(sk);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700134 struct ipv6_pinfo *np = inet6_sk(sk);
135 struct tcp_sock *tp = tcp_sk(sk);
Arnaud Ebalard20c59de2010-06-01 21:35:01 +0000136 struct in6_addr *saddr = NULL, *final_p, final;
David S. Miller493f3772010-12-02 12:14:29 -0800137 struct rt6_info *rt;
David S. Miller4c9483b2011-03-12 16:22:43 -0500138 struct flowi6 fl6;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700139 struct dst_entry *dst;
140 int addr_type;
141 int err;
142
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +0900143 if (addr_len < SIN6_LEN_RFC2133)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700144 return -EINVAL;
145
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +0900146 if (usin->sin6_family != AF_INET6)
Eric Dumazeta02cec22010-09-22 20:43:57 +0000147 return -EAFNOSUPPORT;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700148
David S. Miller4c9483b2011-03-12 16:22:43 -0500149 memset(&fl6, 0, sizeof(fl6));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700150
151 if (np->sndflow) {
David S. Miller4c9483b2011-03-12 16:22:43 -0500152 fl6.flowlabel = usin->sin6_flowinfo&IPV6_FLOWINFO_MASK;
153 IP6_ECN_flow_init(fl6.flowlabel);
154 if (fl6.flowlabel&IPV6_FLOWLABEL_MASK) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700155 struct ip6_flowlabel *flowlabel;
David S. Miller4c9483b2011-03-12 16:22:43 -0500156 flowlabel = fl6_sock_lookup(sk, fl6.flowlabel);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700157 if (flowlabel == NULL)
158 return -EINVAL;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700159 fl6_sock_release(flowlabel);
160 }
161 }
162
163 /*
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +0900164 * connect() to INADDR_ANY means loopback (BSD'ism).
165 */
166
Weilong Chen4c99aa42013-12-19 18:44:34 +0800167 if (ipv6_addr_any(&usin->sin6_addr))
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +0900168 usin->sin6_addr.s6_addr[15] = 0x1;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700169
170 addr_type = ipv6_addr_type(&usin->sin6_addr);
171
Weilong Chen4c99aa42013-12-19 18:44:34 +0800172 if (addr_type & IPV6_ADDR_MULTICAST)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700173 return -ENETUNREACH;
174
175 if (addr_type&IPV6_ADDR_LINKLOCAL) {
176 if (addr_len >= sizeof(struct sockaddr_in6) &&
177 usin->sin6_scope_id) {
178 /* If interface is set while binding, indices
179 * must coincide.
180 */
181 if (sk->sk_bound_dev_if &&
182 sk->sk_bound_dev_if != usin->sin6_scope_id)
183 return -EINVAL;
184
185 sk->sk_bound_dev_if = usin->sin6_scope_id;
186 }
187
188 /* Connect to link-local address requires an interface */
189 if (!sk->sk_bound_dev_if)
190 return -EINVAL;
191 }
192
193 if (tp->rx_opt.ts_recent_stamp &&
Eric Dumazetefe42082013-10-03 15:42:29 -0700194 !ipv6_addr_equal(&sk->sk_v6_daddr, &usin->sin6_addr)) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700195 tp->rx_opt.ts_recent = 0;
196 tp->rx_opt.ts_recent_stamp = 0;
197 tp->write_seq = 0;
198 }
199
Eric Dumazetefe42082013-10-03 15:42:29 -0700200 sk->sk_v6_daddr = usin->sin6_addr;
David S. Miller4c9483b2011-03-12 16:22:43 -0500201 np->flow_label = fl6.flowlabel;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700202
203 /*
204 * TCP over IPv4
205 */
206
207 if (addr_type == IPV6_ADDR_MAPPED) {
Arnaldo Carvalho de Melod83d8462005-12-13 23:26:10 -0800208 u32 exthdrlen = icsk->icsk_ext_hdr_len;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700209 struct sockaddr_in sin;
210
211 SOCK_DEBUG(sk, "connect: ipv4 mapped\n");
212
213 if (__ipv6_only_sock(sk))
214 return -ENETUNREACH;
215
216 sin.sin_family = AF_INET;
217 sin.sin_port = usin->sin6_port;
218 sin.sin_addr.s_addr = usin->sin6_addr.s6_addr32[3];
219
Arnaldo Carvalho de Melod83d8462005-12-13 23:26:10 -0800220 icsk->icsk_af_ops = &ipv6_mapped;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700221 sk->sk_backlog_rcv = tcp_v4_do_rcv;
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800222#ifdef CONFIG_TCP_MD5SIG
223 tp->af_specific = &tcp_sock_ipv6_mapped_specific;
224#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -0700225
226 err = tcp_v4_connect(sk, (struct sockaddr *)&sin, sizeof(sin));
227
228 if (err) {
Arnaldo Carvalho de Melod83d8462005-12-13 23:26:10 -0800229 icsk->icsk_ext_hdr_len = exthdrlen;
230 icsk->icsk_af_ops = &ipv6_specific;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700231 sk->sk_backlog_rcv = tcp_v6_do_rcv;
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800232#ifdef CONFIG_TCP_MD5SIG
233 tp->af_specific = &tcp_sock_ipv6_specific;
234#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -0700235 goto failure;
236 } else {
Eric Dumazetc720c7e2009-10-15 06:30:45 +0000237 ipv6_addr_set_v4mapped(inet->inet_saddr, &np->saddr);
238 ipv6_addr_set_v4mapped(inet->inet_rcv_saddr,
Eric Dumazetefe42082013-10-03 15:42:29 -0700239 &sk->sk_v6_rcv_saddr);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700240 }
241
242 return err;
243 }
244
Eric Dumazetefe42082013-10-03 15:42:29 -0700245 if (!ipv6_addr_any(&sk->sk_v6_rcv_saddr))
246 saddr = &sk->sk_v6_rcv_saddr;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700247
David S. Miller4c9483b2011-03-12 16:22:43 -0500248 fl6.flowi6_proto = IPPROTO_TCP;
Eric Dumazetefe42082013-10-03 15:42:29 -0700249 fl6.daddr = sk->sk_v6_daddr;
Alexey Dobriyan4e3fd7a2011-11-21 03:39:03 +0000250 fl6.saddr = saddr ? *saddr : np->saddr;
David S. Miller4c9483b2011-03-12 16:22:43 -0500251 fl6.flowi6_oif = sk->sk_bound_dev_if;
252 fl6.flowi6_mark = sk->sk_mark;
David S. Miller1958b852011-03-12 16:36:19 -0500253 fl6.fl6_dport = usin->sin6_port;
254 fl6.fl6_sport = inet->inet_sport;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700255
David S. Miller4c9483b2011-03-12 16:22:43 -0500256 final_p = fl6_update_dst(&fl6, np->opt, &final);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700257
David S. Miller4c9483b2011-03-12 16:22:43 -0500258 security_sk_classify_flow(sk, flowi6_to_flowi(&fl6));
Venkat Yekkiralabeb8d132006-08-04 23:12:42 -0700259
Steffen Klassert0e0d44a2013-08-28 08:04:14 +0200260 dst = ip6_dst_lookup_flow(sk, &fl6, final_p);
David S. Miller68d0c6d2011-03-01 13:19:07 -0800261 if (IS_ERR(dst)) {
262 err = PTR_ERR(dst);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700263 goto failure;
David S. Miller14e50e52007-05-24 18:17:54 -0700264 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700265
266 if (saddr == NULL) {
David S. Miller4c9483b2011-03-12 16:22:43 -0500267 saddr = &fl6.saddr;
Eric Dumazetefe42082013-10-03 15:42:29 -0700268 sk->sk_v6_rcv_saddr = *saddr;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700269 }
270
271 /* set the source address */
Alexey Dobriyan4e3fd7a2011-11-21 03:39:03 +0000272 np->saddr = *saddr;
Eric Dumazetc720c7e2009-10-15 06:30:45 +0000273 inet->inet_rcv_saddr = LOOPBACK4_IPV6;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700274
Herbert Xuf83ef8c2006-06-30 13:37:03 -0700275 sk->sk_gso_type = SKB_GSO_TCPV6;
YOSHIFUJI Hideaki8e1ef0a2006-08-29 17:15:09 -0700276 __ip6_dst_store(sk, dst, NULL, NULL);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700277
David S. Miller493f3772010-12-02 12:14:29 -0800278 rt = (struct rt6_info *) dst;
279 if (tcp_death_row.sysctl_tw_recycle &&
280 !tp->rx_opt.ts_recent_stamp &&
Eric Dumazetefe42082013-10-03 15:42:29 -0700281 ipv6_addr_equal(&rt->rt6i_dst.addr, &sk->sk_v6_daddr))
David S. Miller81166dd2012-07-10 03:14:24 -0700282 tcp_fetch_timewait_stamp(sk, dst);
David S. Miller493f3772010-12-02 12:14:29 -0800283
Arnaldo Carvalho de Melod83d8462005-12-13 23:26:10 -0800284 icsk->icsk_ext_hdr_len = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700285 if (np->opt)
Arnaldo Carvalho de Melod83d8462005-12-13 23:26:10 -0800286 icsk->icsk_ext_hdr_len = (np->opt->opt_flen +
287 np->opt->opt_nflen);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700288
289 tp->rx_opt.mss_clamp = IPV6_MIN_MTU - sizeof(struct tcphdr) - sizeof(struct ipv6hdr);
290
Eric Dumazetc720c7e2009-10-15 06:30:45 +0000291 inet->inet_dport = usin->sin6_port;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700292
293 tcp_set_state(sk, TCP_SYN_SENT);
Arnaldo Carvalho de Melod8313f52005-12-13 23:25:44 -0800294 err = inet6_hash_connect(&tcp_death_row, sk);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700295 if (err)
296 goto late_failure;
297
Andrey Vagin2b916472012-11-22 01:13:58 +0000298 if (!tp->write_seq && likely(!tp->repair))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700299 tp->write_seq = secure_tcpv6_sequence_number(np->saddr.s6_addr32,
Eric Dumazetefe42082013-10-03 15:42:29 -0700300 sk->sk_v6_daddr.s6_addr32,
Eric Dumazetc720c7e2009-10-15 06:30:45 +0000301 inet->inet_sport,
302 inet->inet_dport);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700303
304 err = tcp_connect(sk);
305 if (err)
306 goto late_failure;
307
308 return 0;
309
310late_failure:
311 tcp_set_state(sk, TCP_CLOSE);
312 __sk_dst_reset(sk);
313failure:
Eric Dumazetc720c7e2009-10-15 06:30:45 +0000314 inet->inet_dport = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700315 sk->sk_route_caps = 0;
316 return err;
317}
318
Eric Dumazet563d34d2012-07-23 09:48:52 +0200319static void tcp_v6_mtu_reduced(struct sock *sk)
320{
321 struct dst_entry *dst;
322
323 if ((1 << sk->sk_state) & (TCPF_LISTEN | TCPF_CLOSE))
324 return;
325
326 dst = inet6_csk_update_pmtu(sk, tcp_sk(sk)->mtu_info);
327 if (!dst)
328 return;
329
330 if (inet_csk(sk)->icsk_pmtu_cookie > dst_mtu(dst)) {
331 tcp_sync_mss(sk, dst_mtu(dst));
332 tcp_simple_retransmit(sk);
333 }
334}
335
Linus Torvalds1da177e2005-04-16 15:20:36 -0700336static void tcp_v6_err(struct sk_buff *skb, struct inet6_skb_parm *opt,
Brian Haleyd5fdd6b2009-06-23 04:31:07 -0700337 u8 type, u8 code, int offset, __be32 info)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700338{
Weilong Chen4c99aa42013-12-19 18:44:34 +0800339 const struct ipv6hdr *hdr = (const struct ipv6hdr *)skb->data;
Arnaldo Carvalho de Melo505cbfc2005-08-12 09:19:38 -0300340 const struct tcphdr *th = (struct tcphdr *)(skb->data+offset);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700341 struct ipv6_pinfo *np;
342 struct sock *sk;
343 int err;
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +0900344 struct tcp_sock *tp;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700345 __u32 seq;
Pavel Emelyanovca12a1a2008-07-16 20:28:42 -0700346 struct net *net = dev_net(skb->dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700347
Pavel Emelyanovca12a1a2008-07-16 20:28:42 -0700348 sk = inet6_lookup(net, &tcp_hashinfo, &hdr->daddr,
Pavel Emelyanovd86e0da2008-01-31 05:07:21 -0800349 th->dest, &hdr->saddr, th->source, skb->dev->ifindex);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700350
351 if (sk == NULL) {
Denis V. Luneve41b5362008-10-08 10:33:26 -0700352 ICMP6_INC_STATS_BH(net, __in6_dev_get(skb->dev),
353 ICMP6_MIB_INERRORS);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700354 return;
355 }
356
357 if (sk->sk_state == TCP_TIME_WAIT) {
YOSHIFUJI Hideaki9469c7b2006-10-10 19:41:46 -0700358 inet_twsk_put(inet_twsk(sk));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700359 return;
360 }
361
362 bh_lock_sock(sk);
Eric Dumazet563d34d2012-07-23 09:48:52 +0200363 if (sock_owned_by_user(sk) && type != ICMPV6_PKT_TOOBIG)
Pavel Emelyanovde0744a2008-07-16 20:31:16 -0700364 NET_INC_STATS_BH(net, LINUX_MIB_LOCKDROPPEDICMPS);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700365
366 if (sk->sk_state == TCP_CLOSE)
367 goto out;
368
Stephen Hemmingere802af92010-04-22 15:24:53 -0700369 if (ipv6_hdr(skb)->hop_limit < inet6_sk(sk)->min_hopcount) {
370 NET_INC_STATS_BH(net, LINUX_MIB_TCPMINTTLDROP);
371 goto out;
372 }
373
Linus Torvalds1da177e2005-04-16 15:20:36 -0700374 tp = tcp_sk(sk);
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +0900375 seq = ntohl(th->seq);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700376 if (sk->sk_state != TCP_LISTEN &&
377 !between(seq, tp->snd_una, tp->snd_nxt)) {
Pavel Emelyanovde0744a2008-07-16 20:31:16 -0700378 NET_INC_STATS_BH(net, LINUX_MIB_OUTOFWINDOWICMPS);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700379 goto out;
380 }
381
382 np = inet6_sk(sk);
383
David S. Millerec18d9a2012-07-12 00:25:15 -0700384 if (type == NDISC_REDIRECT) {
385 struct dst_entry *dst = __sk_dst_check(sk, np->dst_cookie);
386
David S. Miller1ed5c482012-07-12 00:41:25 -0700387 if (dst)
David S. Miller6700c272012-07-17 03:29:28 -0700388 dst->ops->redirect(dst, sk, skb);
Christoph Paasch50a75a82013-04-07 04:53:15 +0000389 goto out;
David S. Millerec18d9a2012-07-12 00:25:15 -0700390 }
391
Linus Torvalds1da177e2005-04-16 15:20:36 -0700392 if (type == ICMPV6_PKT_TOOBIG) {
Eric Dumazet0d4f0602013-03-18 07:01:28 +0000393 /* We are not interested in TCP_LISTEN and open_requests
394 * (SYN-ACKs send out by Linux are always <576bytes so
395 * they should go through unfragmented).
396 */
397 if (sk->sk_state == TCP_LISTEN)
398 goto out;
399
Hannes Frederic Sowa93b36cf2013-12-15 03:41:14 +0100400 if (!ip6_sk_accept_pmtu(sk))
401 goto out;
402
Eric Dumazet563d34d2012-07-23 09:48:52 +0200403 tp->mtu_info = ntohl(info);
404 if (!sock_owned_by_user(sk))
405 tcp_v6_mtu_reduced(sk);
Julian Anastasovd013ef2a2012-09-05 10:53:18 +0000406 else if (!test_and_set_bit(TCP_MTU_REDUCED_DEFERRED,
407 &tp->tsq_flags))
408 sock_hold(sk);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700409 goto out;
410 }
411
412 icmpv6_err_convert(type, code, &err);
413
Arnaldo Carvalho de Melo60236fd2005-06-18 22:47:21 -0700414 /* Might be for an request_sock */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700415 switch (sk->sk_state) {
Arnaldo Carvalho de Melo60236fd2005-06-18 22:47:21 -0700416 struct request_sock *req, **prev;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700417 case TCP_LISTEN:
418 if (sock_owned_by_user(sk))
419 goto out;
420
Arnaldo Carvalho de Melo81297652005-12-13 23:15:24 -0800421 req = inet6_csk_search_req(sk, &prev, th->dest, &hdr->daddr,
422 &hdr->saddr, inet6_iif(skb));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700423 if (!req)
424 goto out;
425
426 /* ICMPs are not backlogged, hence we cannot get
427 * an established socket here.
428 */
Ilpo Järvinen547b7922008-07-25 21:43:18 -0700429 WARN_ON(req->sk != NULL);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700430
Arnaldo Carvalho de Melo2e6599c2005-06-18 22:46:52 -0700431 if (seq != tcp_rsk(req)->snt_isn) {
Pavel Emelyanovde0744a2008-07-16 20:31:16 -0700432 NET_INC_STATS_BH(net, LINUX_MIB_OUTOFWINDOWICMPS);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700433 goto out;
434 }
435
Arnaldo Carvalho de Melo463c84b2005-08-09 20:10:42 -0700436 inet_csk_reqsk_queue_drop(sk, req, prev);
Vijay Subramanian5f1e9422013-01-31 08:24:19 +0000437 NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_LISTENDROPS);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700438 goto out;
439
440 case TCP_SYN_SENT:
441 case TCP_SYN_RECV: /* Cannot happen.
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +0900442 It can, it SYNs are crossed. --ANK */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700443 if (!sock_owned_by_user(sk)) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700444 sk->sk_err = err;
445 sk->sk_error_report(sk); /* Wake people up to see the error (see connect in sock.c) */
446
447 tcp_done(sk);
448 } else
449 sk->sk_err_soft = err;
450 goto out;
451 }
452
453 if (!sock_owned_by_user(sk) && np->recverr) {
454 sk->sk_err = err;
455 sk->sk_error_report(sk);
456 } else
457 sk->sk_err_soft = err;
458
459out:
460 bh_unlock_sock(sk);
461 sock_put(sk);
462}
463
464
Neal Cardwell9f10d3f2012-06-28 12:34:21 +0000465static int tcp_v6_send_synack(struct sock *sk, struct dst_entry *dst,
466 struct flowi6 *fl6,
Neal Cardwell3840a062012-06-28 12:34:19 +0000467 struct request_sock *req,
Eric Dumazetfff32692012-06-01 01:47:50 +0000468 u16 queue_mapping)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700469{
Eric Dumazet634fb9792013-10-09 15:21:29 -0700470 struct inet_request_sock *ireq = inet_rsk(req);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700471 struct ipv6_pinfo *np = inet6_sk(sk);
Weilong Chen4c99aa42013-12-19 18:44:34 +0800472 struct sk_buff *skb;
Neal Cardwell94942182012-06-28 12:34:20 +0000473 int err = -ENOMEM;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700474
Neal Cardwell9f10d3f2012-06-28 12:34:21 +0000475 /* First, grab a route. */
476 if (!dst && (dst = inet6_csk_route_req(sk, fl6, req)) == NULL)
Denis V. Lunevfd80eb92008-02-29 11:43:03 -0800477 goto done;
Neal Cardwell94942182012-06-28 12:34:20 +0000478
Christoph Paasch1a2c6182013-03-17 08:23:34 +0000479 skb = tcp_make_synack(sk, dst, req, NULL);
Neal Cardwell94942182012-06-28 12:34:20 +0000480
Linus Torvalds1da177e2005-04-16 15:20:36 -0700481 if (skb) {
Eric Dumazet634fb9792013-10-09 15:21:29 -0700482 __tcp_v6_send_check(skb, &ireq->ir_v6_loc_addr,
483 &ireq->ir_v6_rmt_addr);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700484
Eric Dumazet634fb9792013-10-09 15:21:29 -0700485 fl6->daddr = ireq->ir_v6_rmt_addr;
Florent Fourcotdf3687f2014-01-17 17:15:03 +0100486 if (np->repflow && (ireq->pktopts != NULL))
487 fl6->flowlabel = ip6_flowlabel(ipv6_hdr(ireq->pktopts));
488
Eric Dumazetfff32692012-06-01 01:47:50 +0000489 skb_set_queue_mapping(skb, queue_mapping);
RongQing.Li43264e02012-07-01 17:18:59 +0000490 err = ip6_xmit(sk, skb, fl6, np->opt, np->tclass);
Gerrit Renkerb9df3cb2006-11-14 11:21:36 -0200491 err = net_xmit_eval(err);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700492 }
493
494done:
Linus Torvalds1da177e2005-04-16 15:20:36 -0700495 return err;
496}
497
Christoph Paasch1a2c6182013-03-17 08:23:34 +0000498static int tcp_v6_rtx_synack(struct sock *sk, struct request_sock *req)
Octavian Purdila72659ec2010-01-17 19:09:39 -0800499{
Neal Cardwell9f10d3f2012-06-28 12:34:21 +0000500 struct flowi6 fl6;
Eric Dumazete6c022a2012-10-27 23:16:46 +0000501 int res;
Neal Cardwell9f10d3f2012-06-28 12:34:21 +0000502
Christoph Paasch1a2c6182013-03-17 08:23:34 +0000503 res = tcp_v6_send_synack(sk, NULL, &fl6, req, 0);
Yuchung Chengf19c29e2014-03-03 12:31:36 -0800504 if (!res) {
Eric Dumazete6c022a2012-10-27 23:16:46 +0000505 TCP_INC_STATS_BH(sock_net(sk), TCP_MIB_RETRANSSEGS);
Yuchung Chengf19c29e2014-03-03 12:31:36 -0800506 NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_TCPSYNRETRANS);
507 }
Eric Dumazete6c022a2012-10-27 23:16:46 +0000508 return res;
Octavian Purdila72659ec2010-01-17 19:09:39 -0800509}
510
Arnaldo Carvalho de Melo60236fd2005-06-18 22:47:21 -0700511static void tcp_v6_reqsk_destructor(struct request_sock *req)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700512{
Eric Dumazet634fb9792013-10-09 15:21:29 -0700513 kfree_skb(inet_rsk(req)->pktopts);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700514}
515
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800516#ifdef CONFIG_TCP_MD5SIG
517static struct tcp_md5sig_key *tcp_v6_md5_do_lookup(struct sock *sk,
Eric Dumazetb71d1d42011-04-22 04:53:02 +0000518 const struct in6_addr *addr)
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800519{
Eric Dumazeta915da9b2012-01-31 05:18:33 +0000520 return tcp_md5_do_lookup(sk, (union tcp_md5_addr *)addr, AF_INET6);
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800521}
522
523static struct tcp_md5sig_key *tcp_v6_md5_lookup(struct sock *sk,
524 struct sock *addr_sk)
525{
Eric Dumazetefe42082013-10-03 15:42:29 -0700526 return tcp_v6_md5_do_lookup(sk, &addr_sk->sk_v6_daddr);
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800527}
528
529static struct tcp_md5sig_key *tcp_v6_reqsk_md5_lookup(struct sock *sk,
530 struct request_sock *req)
531{
Eric Dumazet634fb9792013-10-09 15:21:29 -0700532 return tcp_v6_md5_do_lookup(sk, &inet_rsk(req)->ir_v6_rmt_addr);
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800533}
534
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800535static int tcp_v6_parse_md5_keys (struct sock *sk, char __user *optval,
536 int optlen)
537{
538 struct tcp_md5sig cmd;
539 struct sockaddr_in6 *sin6 = (struct sockaddr_in6 *)&cmd.tcpm_addr;
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800540
541 if (optlen < sizeof(cmd))
542 return -EINVAL;
543
544 if (copy_from_user(&cmd, optval, sizeof(cmd)))
545 return -EFAULT;
546
547 if (sin6->sin6_family != AF_INET6)
548 return -EINVAL;
549
550 if (!cmd.tcpm_keylen) {
Brian Haleye773e4f2007-08-24 23:16:08 -0700551 if (ipv6_addr_v4mapped(&sin6->sin6_addr))
Eric Dumazeta915da9b2012-01-31 05:18:33 +0000552 return tcp_md5_do_del(sk, (union tcp_md5_addr *)&sin6->sin6_addr.s6_addr32[3],
553 AF_INET);
554 return tcp_md5_do_del(sk, (union tcp_md5_addr *)&sin6->sin6_addr,
555 AF_INET6);
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800556 }
557
558 if (cmd.tcpm_keylen > TCP_MD5SIG_MAXKEYLEN)
559 return -EINVAL;
560
Eric Dumazeta915da9b2012-01-31 05:18:33 +0000561 if (ipv6_addr_v4mapped(&sin6->sin6_addr))
562 return tcp_md5_do_add(sk, (union tcp_md5_addr *)&sin6->sin6_addr.s6_addr32[3],
563 AF_INET, cmd.tcpm_key, cmd.tcpm_keylen, GFP_KERNEL);
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800564
Eric Dumazeta915da9b2012-01-31 05:18:33 +0000565 return tcp_md5_do_add(sk, (union tcp_md5_addr *)&sin6->sin6_addr,
566 AF_INET6, cmd.tcpm_key, cmd.tcpm_keylen, GFP_KERNEL);
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800567}
568
Adam Langley49a72df2008-07-19 00:01:42 -0700569static int tcp_v6_md5_hash_pseudoheader(struct tcp_md5sig_pool *hp,
Eric Dumazetb71d1d42011-04-22 04:53:02 +0000570 const struct in6_addr *daddr,
571 const struct in6_addr *saddr, int nbytes)
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800572{
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800573 struct tcp6_pseudohdr *bp;
Adam Langley49a72df2008-07-19 00:01:42 -0700574 struct scatterlist sg;
YOSHIFUJI Hideaki8d26d762008-04-17 13:19:16 +0900575
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800576 bp = &hp->md5_blk.ip6;
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800577 /* 1. TCP pseudo-header (RFC2460) */
Alexey Dobriyan4e3fd7a2011-11-21 03:39:03 +0000578 bp->saddr = *saddr;
579 bp->daddr = *daddr;
Adam Langley49a72df2008-07-19 00:01:42 -0700580 bp->protocol = cpu_to_be32(IPPROTO_TCP);
Adam Langley00b13042008-07-31 21:36:07 -0700581 bp->len = cpu_to_be32(nbytes);
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800582
Adam Langley49a72df2008-07-19 00:01:42 -0700583 sg_init_one(&sg, bp, sizeof(*bp));
584 return crypto_hash_update(&hp->md5_desc, &sg, sizeof(*bp));
585}
David S. Millerc7da57a2007-10-26 00:41:21 -0700586
Adam Langley49a72df2008-07-19 00:01:42 -0700587static int tcp_v6_md5_hash_hdr(char *md5_hash, struct tcp_md5sig_key *key,
Eric Dumazetb71d1d42011-04-22 04:53:02 +0000588 const struct in6_addr *daddr, struct in6_addr *saddr,
Eric Dumazet318cf7a2011-10-24 02:46:04 -0400589 const struct tcphdr *th)
Adam Langley49a72df2008-07-19 00:01:42 -0700590{
591 struct tcp_md5sig_pool *hp;
592 struct hash_desc *desc;
593
594 hp = tcp_get_md5sig_pool();
595 if (!hp)
596 goto clear_hash_noput;
597 desc = &hp->md5_desc;
598
599 if (crypto_hash_init(desc))
600 goto clear_hash;
601 if (tcp_v6_md5_hash_pseudoheader(hp, daddr, saddr, th->doff << 2))
602 goto clear_hash;
603 if (tcp_md5_hash_header(hp, th))
604 goto clear_hash;
605 if (tcp_md5_hash_key(hp, key))
606 goto clear_hash;
607 if (crypto_hash_final(desc, md5_hash))
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800608 goto clear_hash;
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800609
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800610 tcp_put_md5sig_pool();
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800611 return 0;
Adam Langley49a72df2008-07-19 00:01:42 -0700612
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800613clear_hash:
614 tcp_put_md5sig_pool();
615clear_hash_noput:
616 memset(md5_hash, 0, 16);
Adam Langley49a72df2008-07-19 00:01:42 -0700617 return 1;
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800618}
619
Adam Langley49a72df2008-07-19 00:01:42 -0700620static int tcp_v6_md5_hash_skb(char *md5_hash, struct tcp_md5sig_key *key,
Eric Dumazet318cf7a2011-10-24 02:46:04 -0400621 const struct sock *sk,
622 const struct request_sock *req,
623 const struct sk_buff *skb)
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800624{
Eric Dumazetb71d1d42011-04-22 04:53:02 +0000625 const struct in6_addr *saddr, *daddr;
Adam Langley49a72df2008-07-19 00:01:42 -0700626 struct tcp_md5sig_pool *hp;
627 struct hash_desc *desc;
Eric Dumazet318cf7a2011-10-24 02:46:04 -0400628 const struct tcphdr *th = tcp_hdr(skb);
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800629
630 if (sk) {
631 saddr = &inet6_sk(sk)->saddr;
Eric Dumazetefe42082013-10-03 15:42:29 -0700632 daddr = &sk->sk_v6_daddr;
Adam Langley49a72df2008-07-19 00:01:42 -0700633 } else if (req) {
Eric Dumazet634fb9792013-10-09 15:21:29 -0700634 saddr = &inet_rsk(req)->ir_v6_loc_addr;
635 daddr = &inet_rsk(req)->ir_v6_rmt_addr;
Adam Langley49a72df2008-07-19 00:01:42 -0700636 } else {
Eric Dumazetb71d1d42011-04-22 04:53:02 +0000637 const struct ipv6hdr *ip6h = ipv6_hdr(skb);
Adam Langley49a72df2008-07-19 00:01:42 -0700638 saddr = &ip6h->saddr;
639 daddr = &ip6h->daddr;
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800640 }
Adam Langley49a72df2008-07-19 00:01:42 -0700641
642 hp = tcp_get_md5sig_pool();
643 if (!hp)
644 goto clear_hash_noput;
645 desc = &hp->md5_desc;
646
647 if (crypto_hash_init(desc))
648 goto clear_hash;
649
650 if (tcp_v6_md5_hash_pseudoheader(hp, daddr, saddr, skb->len))
651 goto clear_hash;
652 if (tcp_md5_hash_header(hp, th))
653 goto clear_hash;
654 if (tcp_md5_hash_skb_data(hp, skb, th->doff << 2))
655 goto clear_hash;
656 if (tcp_md5_hash_key(hp, key))
657 goto clear_hash;
658 if (crypto_hash_final(desc, md5_hash))
659 goto clear_hash;
660
661 tcp_put_md5sig_pool();
662 return 0;
663
664clear_hash:
665 tcp_put_md5sig_pool();
666clear_hash_noput:
667 memset(md5_hash, 0, 16);
668 return 1;
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800669}
670
Eric Dumazet318cf7a2011-10-24 02:46:04 -0400671static int tcp_v6_inbound_md5_hash(struct sock *sk, const struct sk_buff *skb)
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800672{
Eric Dumazetcf533ea2011-10-21 05:22:42 -0400673 const __u8 *hash_location = NULL;
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800674 struct tcp_md5sig_key *hash_expected;
Eric Dumazetb71d1d42011-04-22 04:53:02 +0000675 const struct ipv6hdr *ip6h = ipv6_hdr(skb);
Eric Dumazet318cf7a2011-10-24 02:46:04 -0400676 const struct tcphdr *th = tcp_hdr(skb);
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800677 int genhash;
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800678 u8 newhash[16];
679
680 hash_expected = tcp_v6_md5_do_lookup(sk, &ip6h->saddr);
YOSHIFUJI Hideaki7d5d5522008-04-17 12:29:53 +0900681 hash_location = tcp_parse_md5sig_option(th);
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800682
David S. Miller785957d2008-07-30 03:03:15 -0700683 /* We've parsed the options - do we have a hash? */
684 if (!hash_expected && !hash_location)
685 return 0;
686
687 if (hash_expected && !hash_location) {
688 NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_TCPMD5NOTFOUND);
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800689 return 1;
690 }
691
David S. Miller785957d2008-07-30 03:03:15 -0700692 if (!hash_expected && hash_location) {
693 NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_TCPMD5UNEXPECTED);
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800694 return 1;
695 }
696
697 /* check the signature */
Adam Langley49a72df2008-07-19 00:01:42 -0700698 genhash = tcp_v6_md5_hash_skb(newhash,
699 hash_expected,
700 NULL, NULL, skb);
701
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800702 if (genhash || memcmp(hash_location, newhash, 16) != 0) {
Joe Perchese87cc472012-05-13 21:56:26 +0000703 net_info_ratelimited("MD5 Hash %s for [%pI6c]:%u->[%pI6c]:%u\n",
704 genhash ? "failed" : "mismatch",
705 &ip6h->saddr, ntohs(th->source),
706 &ip6h->daddr, ntohs(th->dest));
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800707 return 1;
708 }
709 return 0;
710}
711#endif
712
Glenn Griffinc6aefaf2008-02-07 21:49:26 -0800713struct request_sock_ops tcp6_request_sock_ops __read_mostly = {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700714 .family = AF_INET6,
Arnaldo Carvalho de Melo2e6599c2005-06-18 22:46:52 -0700715 .obj_size = sizeof(struct tcp6_request_sock),
Octavian Purdila72659ec2010-01-17 19:09:39 -0800716 .rtx_syn_ack = tcp_v6_rtx_synack,
Arnaldo Carvalho de Melo60236fd2005-06-18 22:47:21 -0700717 .send_ack = tcp_v6_reqsk_send_ack,
718 .destructor = tcp_v6_reqsk_destructor,
Octavian Purdila72659ec2010-01-17 19:09:39 -0800719 .send_reset = tcp_v6_send_reset,
720 .syn_ack_timeout = tcp_syn_ack_timeout,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700721};
722
#ifdef CONFIG_TCP_MD5SIG
/* MD5 signature callbacks attached to IPv6 TCP request socks. */
static const struct tcp_request_sock_ops tcp_request_sock_ipv6_ops = {
	.calc_md5_hash	= tcp_v6_md5_hash_skb,
	.md5_lookup	= tcp_v6_reqsk_md5_lookup,
};
#endif
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800729
Ilpo Järvinen626e2642008-10-09 14:42:40 -0700730static void tcp_v6_send_response(struct sk_buff *skb, u32 seq, u32 ack, u32 win,
Andrey Vaginee684b62013-02-11 05:50:19 +0000731 u32 tsval, u32 tsecr,
Florent Fourcot1d13a962014-01-16 17:21:22 +0100732 struct tcp_md5sig_key *key, int rst, u8 tclass,
733 u32 label)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700734{
Eric Dumazetcf533ea2011-10-21 05:22:42 -0400735 const struct tcphdr *th = tcp_hdr(skb);
736 struct tcphdr *t1;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700737 struct sk_buff *buff;
David S. Miller4c9483b2011-03-12 16:22:43 -0500738 struct flowi6 fl6;
Eric Dumazetadf30902009-06-02 05:19:30 +0000739 struct net *net = dev_net(skb_dst(skb)->dev);
Daniel Lezcanoe5047992008-03-07 11:16:26 -0800740 struct sock *ctl_sk = net->ipv6.tcp_sk;
YOSHIFUJI Hideaki9cb57342008-01-12 02:16:03 -0800741 unsigned int tot_len = sizeof(struct tcphdr);
Eric Dumazetadf30902009-06-02 05:19:30 +0000742 struct dst_entry *dst;
Al Viroe69a4adc2006-11-14 20:56:00 -0800743 __be32 *topt;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700744
Andrey Vaginee684b62013-02-11 05:50:19 +0000745 if (tsecr)
YOSHIFUJI Hideaki4244f8a2006-10-10 19:40:50 -0700746 tot_len += TCPOLEN_TSTAMP_ALIGNED;
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800747#ifdef CONFIG_TCP_MD5SIG
748 if (key)
749 tot_len += TCPOLEN_MD5SIG_ALIGNED;
750#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -0700751
752 buff = alloc_skb(MAX_HEADER + sizeof(struct ipv6hdr) + tot_len,
753 GFP_ATOMIC);
754 if (buff == NULL)
755 return;
756
757 skb_reserve(buff, MAX_HEADER + sizeof(struct ipv6hdr) + tot_len);
758
Ilpo Järvinen77c676d2008-10-09 14:41:38 -0700759 t1 = (struct tcphdr *) skb_push(buff, tot_len);
Herbert Xu6651ffc2010-04-21 00:47:15 -0700760 skb_reset_transport_header(buff);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700761
762 /* Swap the send and the receive. */
763 memset(t1, 0, sizeof(*t1));
764 t1->dest = th->source;
765 t1->source = th->dest;
Ilpo Järvinen77c676d2008-10-09 14:41:38 -0700766 t1->doff = tot_len / 4;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700767 t1->seq = htonl(seq);
768 t1->ack_seq = htonl(ack);
Ilpo Järvinen626e2642008-10-09 14:42:40 -0700769 t1->ack = !rst || !th->ack;
770 t1->rst = rst;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700771 t1->window = htons(win);
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800772
Al Viroe69a4adc2006-11-14 20:56:00 -0800773 topt = (__be32 *)(t1 + 1);
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +0900774
Andrey Vaginee684b62013-02-11 05:50:19 +0000775 if (tsecr) {
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800776 *topt++ = htonl((TCPOPT_NOP << 24) | (TCPOPT_NOP << 16) |
777 (TCPOPT_TIMESTAMP << 8) | TCPOLEN_TIMESTAMP);
Andrey Vaginee684b62013-02-11 05:50:19 +0000778 *topt++ = htonl(tsval);
779 *topt++ = htonl(tsecr);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700780 }
781
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800782#ifdef CONFIG_TCP_MD5SIG
783 if (key) {
784 *topt++ = htonl((TCPOPT_NOP << 24) | (TCPOPT_NOP << 16) |
785 (TCPOPT_MD5SIG << 8) | TCPOLEN_MD5SIG);
Adam Langley49a72df2008-07-19 00:01:42 -0700786 tcp_v6_md5_hash_hdr((__u8 *)topt, key,
Adam Langley90b7e112008-07-31 20:49:48 -0700787 &ipv6_hdr(skb)->saddr,
788 &ipv6_hdr(skb)->daddr, t1);
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800789 }
790#endif
791
David S. Miller4c9483b2011-03-12 16:22:43 -0500792 memset(&fl6, 0, sizeof(fl6));
Alexey Dobriyan4e3fd7a2011-11-21 03:39:03 +0000793 fl6.daddr = ipv6_hdr(skb)->saddr;
794 fl6.saddr = ipv6_hdr(skb)->daddr;
Florent Fourcot1d13a962014-01-16 17:21:22 +0100795 fl6.flowlabel = label;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700796
David S. Millere5700af2010-04-21 14:59:20 -0700797 buff->ip_summed = CHECKSUM_PARTIAL;
798 buff->csum = 0;
799
David S. Miller4c9483b2011-03-12 16:22:43 -0500800 __tcp_v6_send_check(buff, &fl6.saddr, &fl6.daddr);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700801
David S. Miller4c9483b2011-03-12 16:22:43 -0500802 fl6.flowi6_proto = IPPROTO_TCP;
Alexey Kuznetsov4c675252012-10-12 04:34:17 +0000803 if (ipv6_addr_type(&fl6.daddr) & IPV6_ADDR_LINKLOCAL)
804 fl6.flowi6_oif = inet6_iif(skb);
David S. Miller1958b852011-03-12 16:36:19 -0500805 fl6.fl6_dport = t1->dest;
806 fl6.fl6_sport = t1->source;
David S. Miller4c9483b2011-03-12 16:22:43 -0500807 security_skb_classify_flow(skb, flowi6_to_flowi(&fl6));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700808
Ilpo Järvinen626e2642008-10-09 14:42:40 -0700809 /* Pass a socket to ip6_dst_lookup either it is for RST
810 * Underlying function will use this to retrieve the network
811 * namespace
812 */
Steffen Klassert0e0d44a2013-08-28 08:04:14 +0200813 dst = ip6_dst_lookup_flow(ctl_sk, &fl6, NULL);
David S. Miller68d0c6d2011-03-01 13:19:07 -0800814 if (!IS_ERR(dst)) {
815 skb_dst_set(buff, dst);
Eric Dumazetb903d322011-10-27 00:44:35 -0400816 ip6_xmit(ctl_sk, buff, &fl6, NULL, tclass);
David S. Miller68d0c6d2011-03-01 13:19:07 -0800817 TCP_INC_STATS_BH(net, TCP_MIB_OUTSEGS);
818 if (rst)
819 TCP_INC_STATS_BH(net, TCP_MIB_OUTRSTS);
820 return;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700821 }
822
823 kfree_skb(buff);
824}
825
Ilpo Järvinen626e2642008-10-09 14:42:40 -0700826static void tcp_v6_send_reset(struct sock *sk, struct sk_buff *skb)
827{
Eric Dumazetcf533ea2011-10-21 05:22:42 -0400828 const struct tcphdr *th = tcp_hdr(skb);
Ilpo Järvinen626e2642008-10-09 14:42:40 -0700829 u32 seq = 0, ack_seq = 0;
Guo-Fu Tsengfa3e5b42008-10-09 21:11:56 -0700830 struct tcp_md5sig_key *key = NULL;
Shawn Lu658ddaa2012-01-31 22:35:48 +0000831#ifdef CONFIG_TCP_MD5SIG
832 const __u8 *hash_location = NULL;
833 struct ipv6hdr *ipv6h = ipv6_hdr(skb);
834 unsigned char newhash[16];
835 int genhash;
836 struct sock *sk1 = NULL;
837#endif
Ilpo Järvinen626e2642008-10-09 14:42:40 -0700838
839 if (th->rst)
840 return;
841
842 if (!ipv6_unicast_destination(skb))
843 return;
844
845#ifdef CONFIG_TCP_MD5SIG
Shawn Lu658ddaa2012-01-31 22:35:48 +0000846 hash_location = tcp_parse_md5sig_option(th);
847 if (!sk && hash_location) {
848 /*
849 * active side is lost. Try to find listening socket through
850 * source port, and then find md5 key through listening socket.
851 * we are not loose security here:
852 * Incoming packet is checked with md5 hash with finding key,
853 * no RST generated if md5 hash doesn't match.
854 */
855 sk1 = inet6_lookup_listener(dev_net(skb_dst(skb)->dev),
Tom Herbert5ba24952013-01-22 09:50:39 +0000856 &tcp_hashinfo, &ipv6h->saddr,
857 th->source, &ipv6h->daddr,
Shawn Lu658ddaa2012-01-31 22:35:48 +0000858 ntohs(th->source), inet6_iif(skb));
859 if (!sk1)
860 return;
861
862 rcu_read_lock();
863 key = tcp_v6_md5_do_lookup(sk1, &ipv6h->saddr);
864 if (!key)
865 goto release_sk1;
866
867 genhash = tcp_v6_md5_hash_skb(newhash, key, NULL, NULL, skb);
868 if (genhash || memcmp(hash_location, newhash, 16) != 0)
869 goto release_sk1;
870 } else {
871 key = sk ? tcp_v6_md5_do_lookup(sk, &ipv6h->saddr) : NULL;
872 }
Ilpo Järvinen626e2642008-10-09 14:42:40 -0700873#endif
874
875 if (th->ack)
876 seq = ntohl(th->ack_seq);
877 else
878 ack_seq = ntohl(th->seq) + th->syn + th->fin + skb->len -
879 (th->doff << 2);
880
Florent Fourcot1d13a962014-01-16 17:21:22 +0100881 tcp_v6_send_response(skb, seq, ack_seq, 0, 0, 0, key, 1, 0, 0);
Shawn Lu658ddaa2012-01-31 22:35:48 +0000882
883#ifdef CONFIG_TCP_MD5SIG
884release_sk1:
885 if (sk1) {
886 rcu_read_unlock();
887 sock_put(sk1);
888 }
889#endif
Ilpo Järvinen626e2642008-10-09 14:42:40 -0700890}
891
Andrey Vaginee684b62013-02-11 05:50:19 +0000892static void tcp_v6_send_ack(struct sk_buff *skb, u32 seq, u32 ack,
893 u32 win, u32 tsval, u32 tsecr,
Florent Fourcot1d13a962014-01-16 17:21:22 +0100894 struct tcp_md5sig_key *key, u8 tclass,
895 u32 label)
Ilpo Järvinen626e2642008-10-09 14:42:40 -0700896{
Florent Fourcot1d13a962014-01-16 17:21:22 +0100897 tcp_v6_send_response(skb, seq, ack, win, tsval, tsecr, key, 0, tclass,
898 label);
Ilpo Järvinen626e2642008-10-09 14:42:40 -0700899}
900
Linus Torvalds1da177e2005-04-16 15:20:36 -0700901static void tcp_v6_timewait_ack(struct sock *sk, struct sk_buff *skb)
902{
Arnaldo Carvalho de Melo8feaf0c02005-08-09 20:09:30 -0700903 struct inet_timewait_sock *tw = inet_twsk(sk);
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800904 struct tcp_timewait_sock *tcptw = tcp_twsk(sk);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700905
YOSHIFUJI Hideaki9501f972008-04-18 12:45:16 +0900906 tcp_v6_send_ack(skb, tcptw->tw_snd_nxt, tcptw->tw_rcv_nxt,
Arnaldo Carvalho de Melo8feaf0c02005-08-09 20:09:30 -0700907 tcptw->tw_rcv_wnd >> tw->tw_rcv_wscale,
Andrey Vaginee684b62013-02-11 05:50:19 +0000908 tcp_time_stamp + tcptw->tw_ts_offset,
Eric Dumazetb903d322011-10-27 00:44:35 -0400909 tcptw->tw_ts_recent, tcp_twsk_md5_key(tcptw),
Florent Fourcot1d13a962014-01-16 17:21:22 +0100910 tw->tw_tclass, (tw->tw_flowlabel << 12));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700911
Arnaldo Carvalho de Melo8feaf0c02005-08-09 20:09:30 -0700912 inet_twsk_put(tw);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700913}
914
Gui Jianfeng6edafaa2008-08-06 23:50:04 -0700915static void tcp_v6_reqsk_send_ack(struct sock *sk, struct sk_buff *skb,
916 struct request_sock *req)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700917{
Andrey Vaginee684b62013-02-11 05:50:19 +0000918 tcp_v6_send_ack(skb, tcp_rsk(req)->snt_isn + 1, tcp_rsk(req)->rcv_isn + 1,
919 req->rcv_wnd, tcp_time_stamp, req->ts_recent,
Florent Fourcot1d13a962014-01-16 17:21:22 +0100920 tcp_v6_md5_do_lookup(sk, &ipv6_hdr(skb)->daddr),
921 0, 0);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700922}
923
924
Weilong Chen4c99aa42013-12-19 18:44:34 +0800925static struct sock *tcp_v6_hnd_req(struct sock *sk, struct sk_buff *skb)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700926{
Arnaldo Carvalho de Melo60236fd2005-06-18 22:47:21 -0700927 struct request_sock *req, **prev;
Arnaldo Carvalho de Meloaa8223c2007-04-10 21:04:22 -0700928 const struct tcphdr *th = tcp_hdr(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700929 struct sock *nsk;
930
931 /* Find possible connection requests. */
Arnaldo Carvalho de Melo81297652005-12-13 23:15:24 -0800932 req = inet6_csk_search_req(sk, &prev, th->source,
Arnaldo Carvalho de Melo0660e032007-04-25 17:54:47 -0700933 &ipv6_hdr(skb)->saddr,
934 &ipv6_hdr(skb)->daddr, inet6_iif(skb));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700935 if (req)
Jerry Chu83368862012-08-31 12:29:12 +0000936 return tcp_check_req(sk, skb, req, prev, false);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700937
YOSHIFUJI Hideaki3b1e0a62008-03-26 02:26:21 +0900938 nsk = __inet6_lookup_established(sock_net(sk), &tcp_hashinfo,
Pavel Emelyanovd86e0da2008-01-31 05:07:21 -0800939 &ipv6_hdr(skb)->saddr, th->source,
940 &ipv6_hdr(skb)->daddr, ntohs(th->dest), inet6_iif(skb));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700941
942 if (nsk) {
943 if (nsk->sk_state != TCP_TIME_WAIT) {
944 bh_lock_sock(nsk);
945 return nsk;
946 }
YOSHIFUJI Hideaki9469c7b2006-10-10 19:41:46 -0700947 inet_twsk_put(inet_twsk(nsk));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700948 return NULL;
949 }
950
Glenn Griffinc6aefaf2008-02-07 21:49:26 -0800951#ifdef CONFIG_SYN_COOKIES
Florian Westphalaf9b4732010-06-03 00:43:44 +0000952 if (!th->syn)
Glenn Griffinc6aefaf2008-02-07 21:49:26 -0800953 sk = cookie_v6_check(sk, skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700954#endif
955 return sk;
956}
957
Linus Torvalds1da177e2005-04-16 15:20:36 -0700958/* FIXME: this is substantially similar to the ipv4 code.
959 * Can some kind of merge be done? -- erics
960 */
961static int tcp_v6_conn_request(struct sock *sk, struct sk_buff *skb)
962{
William Allen Simpsone6b4d112009-12-02 18:07:39 +0000963 struct tcp_options_received tmp_opt;
964 struct request_sock *req;
Eric Dumazet634fb9792013-10-09 15:21:29 -0700965 struct inet_request_sock *ireq;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700966 struct ipv6_pinfo *np = inet6_sk(sk);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700967 struct tcp_sock *tp = tcp_sk(sk);
William Allen Simpsone6b4d112009-12-02 18:07:39 +0000968 __u32 isn = TCP_SKB_CB(skb)->when;
David S. Miller493f3772010-12-02 12:14:29 -0800969 struct dst_entry *dst = NULL;
Neal Cardwell3840a062012-06-28 12:34:19 +0000970 struct flowi6 fl6;
Eric Dumazeta2a385d2012-05-16 23:15:34 +0000971 bool want_cookie = false;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700972
973 if (skb->protocol == htons(ETH_P_IP))
974 return tcp_v4_conn_request(sk, skb);
975
976 if (!ipv6_unicast_destination(skb))
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +0900977 goto drop;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700978
Hannes Frederic Sowa5ad37d52013-07-26 17:43:23 +0200979 if ((sysctl_tcp_syncookies == 2 ||
980 inet_csk_reqsk_queue_is_full(sk)) && !isn) {
Eric Dumazet946cedc2011-08-30 03:21:44 +0000981 want_cookie = tcp_syn_flood_action(sk, skb, "TCPv6");
982 if (!want_cookie)
983 goto drop;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700984 }
985
Vijay Subramanian5f1e9422013-01-31 08:24:19 +0000986 if (sk_acceptq_is_full(sk) && inet_csk_reqsk_queue_young(sk) > 1) {
987 NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_LISTENOVERFLOWS);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700988 goto drop;
Vijay Subramanian5f1e9422013-01-31 08:24:19 +0000989 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700990
Arnaldo Carvalho de Meloca304b62005-12-13 23:15:40 -0800991 req = inet6_reqsk_alloc(&tcp6_request_sock_ops);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700992 if (req == NULL)
993 goto drop;
994
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -0800995#ifdef CONFIG_TCP_MD5SIG
996 tcp_rsk(req)->af_specific = &tcp_request_sock_ipv6_ops;
997#endif
998
Linus Torvalds1da177e2005-04-16 15:20:36 -0700999 tcp_clear_options(&tmp_opt);
1000 tmp_opt.mss_clamp = IPV6_MIN_MTU - sizeof(struct tcphdr) - sizeof(struct ipv6hdr);
1001 tmp_opt.user_mss = tp->rx_opt.user_mss;
Christoph Paasch1a2c6182013-03-17 08:23:34 +00001002 tcp_parse_options(skb, &tmp_opt, 0, NULL);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001003
Florian Westphal4dfc2812008-04-10 03:12:40 -07001004 if (want_cookie && !tmp_opt.saw_tstamp)
Glenn Griffinc6aefaf2008-02-07 21:49:26 -08001005 tcp_clear_options(&tmp_opt);
Glenn Griffinc6aefaf2008-02-07 21:49:26 -08001006
Linus Torvalds1da177e2005-04-16 15:20:36 -07001007 tmp_opt.tstamp_ok = tmp_opt.saw_tstamp;
1008 tcp_openreq_init(req, &tmp_opt, skb);
1009
Eric Dumazet634fb9792013-10-09 15:21:29 -07001010 ireq = inet_rsk(req);
1011 ireq->ir_v6_rmt_addr = ipv6_hdr(skb)->saddr;
1012 ireq->ir_v6_loc_addr = ipv6_hdr(skb)->daddr;
Florian Westphal172d69e2010-06-21 11:48:45 +00001013 if (!want_cookie || tmp_opt.tstamp_ok)
Hannes Frederic Sowa5d134f12013-01-05 16:10:48 +00001014 TCP_ECN_create_request(req, skb, sock_net(sk));
Linus Torvalds1da177e2005-04-16 15:20:36 -07001015
Eric Dumazet634fb9792013-10-09 15:21:29 -07001016 ireq->ir_iif = sk->sk_bound_dev_if;
Eric Dumazet4d0fe502011-11-23 17:29:23 -05001017
1018 /* So that link locals have meaning */
1019 if (!sk->sk_bound_dev_if &&
Eric Dumazet634fb9792013-10-09 15:21:29 -07001020 ipv6_addr_type(&ireq->ir_v6_rmt_addr) & IPV6_ADDR_LINKLOCAL)
1021 ireq->ir_iif = inet6_iif(skb);
Eric Dumazet4d0fe502011-11-23 17:29:23 -05001022
Florian Westphal2bbdf382010-06-13 11:29:39 +00001023 if (!isn) {
Glenn Griffinc6aefaf2008-02-07 21:49:26 -08001024 if (ipv6_opt_accepted(sk, skb) ||
1025 np->rxopt.bits.rxinfo || np->rxopt.bits.rxoinfo ||
Florent Fourcotdf3687f2014-01-17 17:15:03 +01001026 np->rxopt.bits.rxhlim || np->rxopt.bits.rxohlim ||
1027 np->repflow) {
Glenn Griffinc6aefaf2008-02-07 21:49:26 -08001028 atomic_inc(&skb->users);
Eric Dumazet634fb9792013-10-09 15:21:29 -07001029 ireq->pktopts = skb;
Glenn Griffinc6aefaf2008-02-07 21:49:26 -08001030 }
David S. Miller493f3772010-12-02 12:14:29 -08001031
1032 if (want_cookie) {
Florian Westphal2bbdf382010-06-13 11:29:39 +00001033 isn = cookie_v6_init_sequence(sk, skb, &req->mss);
1034 req->cookie_ts = tmp_opt.tstamp_ok;
David S. Miller493f3772010-12-02 12:14:29 -08001035 goto have_isn;
Florian Westphal2bbdf382010-06-13 11:29:39 +00001036 }
David S. Miller493f3772010-12-02 12:14:29 -08001037
1038 /* VJ's idea. We save last timestamp seen
1039 * from the destination in peer table, when entering
1040 * state TIME-WAIT, and check against it before
1041 * accepting new connection request.
1042 *
1043 * If "isn" is not zero, this request hit alive
1044 * timewait bucket, so that all the necessary checks
1045 * are made in the function processing timewait state.
1046 */
1047 if (tmp_opt.saw_tstamp &&
1048 tcp_death_row.sysctl_tw_recycle &&
David S. Miller81166dd2012-07-10 03:14:24 -07001049 (dst = inet6_csk_route_req(sk, &fl6, req)) != NULL) {
1050 if (!tcp_peer_is_proven(req, dst, true)) {
David S. Miller493f3772010-12-02 12:14:29 -08001051 NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_PAWSPASSIVEREJECTED);
1052 goto drop_and_release;
1053 }
1054 }
1055 /* Kill the following clause, if you dislike this way. */
1056 else if (!sysctl_tcp_syncookies &&
1057 (sysctl_max_syn_backlog - inet_csk_reqsk_queue_len(sk) <
1058 (sysctl_max_syn_backlog >> 2)) &&
David S. Miller81166dd2012-07-10 03:14:24 -07001059 !tcp_peer_is_proven(req, dst, false)) {
David S. Miller493f3772010-12-02 12:14:29 -08001060 /* Without syncookies last quarter of
1061 * backlog is filled with destinations,
1062 * proven to be alive.
1063 * It means that we continue to communicate
1064 * to destinations, already remembered
1065 * to the moment of synflood.
1066 */
1067 LIMIT_NETDEBUG(KERN_DEBUG "TCP: drop open request from %pI6/%u\n",
Eric Dumazet634fb9792013-10-09 15:21:29 -07001068 &ireq->ir_v6_rmt_addr, ntohs(tcp_hdr(skb)->source));
David S. Miller493f3772010-12-02 12:14:29 -08001069 goto drop_and_release;
1070 }
1071
1072 isn = tcp_v6_init_sequence(skb);
Glenn Griffinc6aefaf2008-02-07 21:49:26 -08001073 }
David S. Miller493f3772010-12-02 12:14:29 -08001074have_isn:
Arnaldo Carvalho de Melo2e6599c2005-06-18 22:46:52 -07001075 tcp_rsk(req)->snt_isn = isn;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001076
Neal Cardwell437c5b52012-06-23 19:22:00 +00001077 if (security_inet_conn_request(sk, skb, req))
1078 goto drop_and_release;
Venkat Yekkirala4237c752006-07-24 23:32:50 -07001079
Neal Cardwell9f10d3f2012-06-28 12:34:21 +00001080 if (tcp_v6_send_synack(sk, dst, &fl6, req,
Eric Dumazetfff32692012-06-01 01:47:50 +00001081 skb_get_queue_mapping(skb)) ||
William Allen Simpson4957faade2009-12-02 18:25:27 +00001082 want_cookie)
William Allen Simpsone6b4d112009-12-02 18:07:39 +00001083 goto drop_and_free;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001084
Neal Cardwell016818d2012-09-22 04:18:55 +00001085 tcp_rsk(req)->snt_synack = tcp_time_stamp;
Jerry Chu83368862012-08-31 12:29:12 +00001086 tcp_rsk(req)->listener = NULL;
William Allen Simpsone6b4d112009-12-02 18:07:39 +00001087 inet6_csk_reqsk_queue_hash_add(sk, req, TCP_TIMEOUT_INIT);
1088 return 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001089
David S. Miller493f3772010-12-02 12:14:29 -08001090drop_and_release:
1091 dst_release(dst);
William Allen Simpsone6b4d112009-12-02 18:07:39 +00001092drop_and_free:
1093 reqsk_free(req);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001094drop:
Vijay Subramanian5f1e9422013-01-31 08:24:19 +00001095 NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_LISTENDROPS);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001096 return 0; /* don't send reset */
1097}
1098
Weilong Chen4c99aa42013-12-19 18:44:34 +08001099static struct sock *tcp_v6_syn_recv_sock(struct sock *sk, struct sk_buff *skb,
1100 struct request_sock *req,
1101 struct dst_entry *dst)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001102{
Eric Dumazet634fb9792013-10-09 15:21:29 -07001103 struct inet_request_sock *ireq;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001104 struct ipv6_pinfo *newnp, *np = inet6_sk(sk);
1105 struct tcp6_sock *newtcp6sk;
1106 struct inet_sock *newinet;
1107 struct tcp_sock *newtp;
1108 struct sock *newsk;
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -08001109#ifdef CONFIG_TCP_MD5SIG
1110 struct tcp_md5sig_key *key;
1111#endif
Neal Cardwell3840a062012-06-28 12:34:19 +00001112 struct flowi6 fl6;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001113
1114 if (skb->protocol == htons(ETH_P_IP)) {
1115 /*
1116 * v6 mapped
1117 */
1118
1119 newsk = tcp_v4_syn_recv_sock(sk, skb, req, dst);
1120
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +09001121 if (newsk == NULL)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001122 return NULL;
1123
1124 newtcp6sk = (struct tcp6_sock *)newsk;
1125 inet_sk(newsk)->pinet6 = &newtcp6sk->inet6;
1126
1127 newinet = inet_sk(newsk);
1128 newnp = inet6_sk(newsk);
1129 newtp = tcp_sk(newsk);
1130
1131 memcpy(newnp, np, sizeof(struct ipv6_pinfo));
1132
Eric Dumazetefe42082013-10-03 15:42:29 -07001133 ipv6_addr_set_v4mapped(newinet->inet_daddr, &newsk->sk_v6_daddr);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001134
Eric Dumazetc720c7e2009-10-15 06:30:45 +00001135 ipv6_addr_set_v4mapped(newinet->inet_saddr, &newnp->saddr);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001136
Eric Dumazetefe42082013-10-03 15:42:29 -07001137 newsk->sk_v6_rcv_saddr = newnp->saddr;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001138
Arnaldo Carvalho de Melo8292a172005-12-13 23:15:52 -08001139 inet_csk(newsk)->icsk_af_ops = &ipv6_mapped;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001140 newsk->sk_backlog_rcv = tcp_v4_do_rcv;
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -08001141#ifdef CONFIG_TCP_MD5SIG
1142 newtp->af_specific = &tcp_sock_ipv6_mapped_specific;
1143#endif
1144
Yan, Zheng676a1182011-09-25 02:21:30 +00001145 newnp->ipv6_ac_list = NULL;
1146 newnp->ipv6_fl_list = NULL;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001147 newnp->pktoptions = NULL;
1148 newnp->opt = NULL;
Arnaldo Carvalho de Melo505cbfc2005-08-12 09:19:38 -03001149 newnp->mcast_oif = inet6_iif(skb);
Arnaldo Carvalho de Melo0660e032007-04-25 17:54:47 -07001150 newnp->mcast_hops = ipv6_hdr(skb)->hop_limit;
Florent Fourcot1397ed32013-12-08 15:46:57 +01001151 newnp->rcv_flowinfo = ip6_flowinfo(ipv6_hdr(skb));
Florent Fourcotdf3687f2014-01-17 17:15:03 +01001152 if (np->repflow)
1153 newnp->flow_label = ip6_flowlabel(ipv6_hdr(skb));
Linus Torvalds1da177e2005-04-16 15:20:36 -07001154
Arnaldo Carvalho de Meloe6848972005-08-09 19:45:38 -07001155 /*
1156 * No need to charge this sock to the relevant IPv6 refcnt debug socks count
1157 * here, tcp_create_openreq_child now does this for us, see the comment in
1158 * that function for the gory details. -acme
Linus Torvalds1da177e2005-04-16 15:20:36 -07001159 */
Linus Torvalds1da177e2005-04-16 15:20:36 -07001160
1161 /* It is tricky place. Until this moment IPv4 tcp
Arnaldo Carvalho de Melo8292a172005-12-13 23:15:52 -08001162 worked with IPv6 icsk.icsk_af_ops.
Linus Torvalds1da177e2005-04-16 15:20:36 -07001163 Sync it now.
1164 */
Arnaldo Carvalho de Melod83d8462005-12-13 23:26:10 -08001165 tcp_sync_mss(newsk, inet_csk(newsk)->icsk_pmtu_cookie);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001166
1167 return newsk;
1168 }
1169
Eric Dumazet634fb9792013-10-09 15:21:29 -07001170 ireq = inet_rsk(req);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001171
1172 if (sk_acceptq_is_full(sk))
1173 goto out_overflow;
1174
David S. Miller493f3772010-12-02 12:14:29 -08001175 if (!dst) {
Neal Cardwell3840a062012-06-28 12:34:19 +00001176 dst = inet6_csk_route_req(sk, &fl6, req);
David S. Miller493f3772010-12-02 12:14:29 -08001177 if (!dst)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001178 goto out;
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +09001179 }
Linus Torvalds1da177e2005-04-16 15:20:36 -07001180
1181 newsk = tcp_create_openreq_child(sk, req, skb);
1182 if (newsk == NULL)
Balazs Scheidler093d2822010-10-21 13:06:43 +02001183 goto out_nonewsk;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001184
Arnaldo Carvalho de Meloe6848972005-08-09 19:45:38 -07001185 /*
1186 * No need to charge this sock to the relevant IPv6 refcnt debug socks
1187 * count here, tcp_create_openreq_child now does this for us, see the
1188 * comment in that function for the gory details. -acme
1189 */
Linus Torvalds1da177e2005-04-16 15:20:36 -07001190
Stephen Hemminger59eed272006-08-25 15:55:43 -07001191 newsk->sk_gso_type = SKB_GSO_TCPV6;
YOSHIFUJI Hideaki8e1ef0a2006-08-29 17:15:09 -07001192 __ip6_dst_store(newsk, dst, NULL, NULL);
Neal Cardwellfae6ef82012-08-19 03:30:38 +00001193 inet6_sk_rx_dst_set(newsk, skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001194
1195 newtcp6sk = (struct tcp6_sock *)newsk;
1196 inet_sk(newsk)->pinet6 = &newtcp6sk->inet6;
1197
1198 newtp = tcp_sk(newsk);
1199 newinet = inet_sk(newsk);
1200 newnp = inet6_sk(newsk);
1201
1202 memcpy(newnp, np, sizeof(struct ipv6_pinfo));
1203
Eric Dumazet634fb9792013-10-09 15:21:29 -07001204 newsk->sk_v6_daddr = ireq->ir_v6_rmt_addr;
1205 newnp->saddr = ireq->ir_v6_loc_addr;
1206 newsk->sk_v6_rcv_saddr = ireq->ir_v6_loc_addr;
1207 newsk->sk_bound_dev_if = ireq->ir_iif;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001208
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +09001209 /* Now IPv6 options...
Linus Torvalds1da177e2005-04-16 15:20:36 -07001210
1211 First: no IPv4 options.
1212 */
Eric Dumazetf6d8bd02011-04-21 09:45:37 +00001213 newinet->inet_opt = NULL;
Yan, Zheng676a1182011-09-25 02:21:30 +00001214 newnp->ipv6_ac_list = NULL;
Masayuki Nakagawad35690b2007-03-16 16:14:03 -07001215 newnp->ipv6_fl_list = NULL;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001216
1217 /* Clone RX bits */
1218 newnp->rxopt.all = np->rxopt.all;
1219
1220 /* Clone pktoptions received with SYN */
1221 newnp->pktoptions = NULL;
Eric Dumazet634fb9792013-10-09 15:21:29 -07001222 if (ireq->pktopts != NULL) {
1223 newnp->pktoptions = skb_clone(ireq->pktopts,
Mel Gorman99a1dec2012-07-31 16:44:14 -07001224 sk_gfp_atomic(sk, GFP_ATOMIC));
Eric Dumazet634fb9792013-10-09 15:21:29 -07001225 consume_skb(ireq->pktopts);
1226 ireq->pktopts = NULL;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001227 if (newnp->pktoptions)
1228 skb_set_owner_r(newnp->pktoptions, newsk);
1229 }
1230 newnp->opt = NULL;
Arnaldo Carvalho de Melo505cbfc2005-08-12 09:19:38 -03001231 newnp->mcast_oif = inet6_iif(skb);
Arnaldo Carvalho de Melo0660e032007-04-25 17:54:47 -07001232 newnp->mcast_hops = ipv6_hdr(skb)->hop_limit;
Florent Fourcot1397ed32013-12-08 15:46:57 +01001233 newnp->rcv_flowinfo = ip6_flowinfo(ipv6_hdr(skb));
Florent Fourcotdf3687f2014-01-17 17:15:03 +01001234 if (np->repflow)
1235 newnp->flow_label = ip6_flowlabel(ipv6_hdr(skb));
Linus Torvalds1da177e2005-04-16 15:20:36 -07001236
1237 /* Clone native IPv6 options from listening socket (if any)
1238
1239 Yes, keeping reference count would be much more clever,
1240 but we make one more one thing there: reattach optmem
1241 to newsk.
1242 */
RongQing.Li43264e02012-07-01 17:18:59 +00001243 if (np->opt)
1244 newnp->opt = ipv6_dup_options(newsk, np->opt);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001245
Arnaldo Carvalho de Melod83d8462005-12-13 23:26:10 -08001246 inet_csk(newsk)->icsk_ext_hdr_len = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001247 if (newnp->opt)
Arnaldo Carvalho de Melod83d8462005-12-13 23:26:10 -08001248 inet_csk(newsk)->icsk_ext_hdr_len = (newnp->opt->opt_nflen +
1249 newnp->opt->opt_flen);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001250
1251 tcp_sync_mss(newsk, dst_mtu(dst));
David S. Miller0dbaee32010-12-13 12:52:14 -08001252 newtp->advmss = dst_metric_advmss(dst);
Neal Cardwelld135c522012-04-22 09:45:47 +00001253 if (tcp_sk(sk)->rx_opt.user_mss &&
1254 tcp_sk(sk)->rx_opt.user_mss < newtp->advmss)
1255 newtp->advmss = tcp_sk(sk)->rx_opt.user_mss;
1256
Linus Torvalds1da177e2005-04-16 15:20:36 -07001257 tcp_initialize_rcv_mss(newsk);
1258
Eric Dumazetc720c7e2009-10-15 06:30:45 +00001259 newinet->inet_daddr = newinet->inet_saddr = LOOPBACK4_IPV6;
1260 newinet->inet_rcv_saddr = LOOPBACK4_IPV6;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001261
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -08001262#ifdef CONFIG_TCP_MD5SIG
1263 /* Copy over the MD5 key from the original socket */
Eric Dumazetefe42082013-10-03 15:42:29 -07001264 if ((key = tcp_v6_md5_do_lookup(sk, &newsk->sk_v6_daddr)) != NULL) {
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -08001265 /* We're using one, so create a matching key
1266 * on the newsk structure. If we fail to get
1267 * memory, then we end up not copying the key
1268 * across. Shucks.
1269 */
Eric Dumazetefe42082013-10-03 15:42:29 -07001270 tcp_md5_do_add(newsk, (union tcp_md5_addr *)&newsk->sk_v6_daddr,
Mel Gorman99a1dec2012-07-31 16:44:14 -07001271 AF_INET6, key->key, key->keylen,
1272 sk_gfp_atomic(sk, GFP_ATOMIC));
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -08001273 }
1274#endif
1275
Balazs Scheidler093d2822010-10-21 13:06:43 +02001276 if (__inet_inherit_port(sk, newsk) < 0) {
Christoph Paasche337e242012-12-14 04:07:58 +00001277 inet_csk_prepare_forced_close(newsk);
1278 tcp_done(newsk);
Balazs Scheidler093d2822010-10-21 13:06:43 +02001279 goto out;
1280 }
Eric Dumazet9327f702009-12-04 03:46:54 +00001281 __inet6_hash(newsk, NULL);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001282
1283 return newsk;
1284
1285out_overflow:
Pavel Emelyanovde0744a2008-07-16 20:31:16 -07001286 NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_LISTENOVERFLOWS);
Balazs Scheidler093d2822010-10-21 13:06:43 +02001287out_nonewsk:
Linus Torvalds1da177e2005-04-16 15:20:36 -07001288 dst_release(dst);
Balazs Scheidler093d2822010-10-21 13:06:43 +02001289out:
1290 NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_LISTENDROPS);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001291 return NULL;
1292}
1293
Al Virob51655b2006-11-14 21:40:42 -08001294static __sum16 tcp_v6_checksum_init(struct sk_buff *skb)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001295{
Patrick McHardy84fa7932006-08-29 16:44:56 -07001296 if (skb->ip_summed == CHECKSUM_COMPLETE) {
Herbert Xu684f2172009-01-08 10:41:23 -08001297 if (!tcp_v6_check(skb->len, &ipv6_hdr(skb)->saddr,
Arnaldo Carvalho de Melo0660e032007-04-25 17:54:47 -07001298 &ipv6_hdr(skb)->daddr, skb->csum)) {
Herbert Xufb286bb2005-11-10 13:01:24 -08001299 skb->ip_summed = CHECKSUM_UNNECESSARY;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001300 return 0;
Herbert Xufb286bb2005-11-10 13:01:24 -08001301 }
Linus Torvalds1da177e2005-04-16 15:20:36 -07001302 }
Herbert Xufb286bb2005-11-10 13:01:24 -08001303
Herbert Xu684f2172009-01-08 10:41:23 -08001304 skb->csum = ~csum_unfold(tcp_v6_check(skb->len,
Arnaldo Carvalho de Melo0660e032007-04-25 17:54:47 -07001305 &ipv6_hdr(skb)->saddr,
1306 &ipv6_hdr(skb)->daddr, 0));
Herbert Xufb286bb2005-11-10 13:01:24 -08001307
Linus Torvalds1da177e2005-04-16 15:20:36 -07001308 if (skb->len <= 76) {
Herbert Xufb286bb2005-11-10 13:01:24 -08001309 return __skb_checksum_complete(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001310 }
1311 return 0;
1312}
1313
1314/* The socket must have it's spinlock held when we get
1315 * here.
1316 *
1317 * We have a potential double-lock case here, so even when
1318 * doing backlog processing we use the BH locking scheme.
1319 * This is because we cannot sleep with the original spinlock
1320 * held.
1321 */
1322static int tcp_v6_do_rcv(struct sock *sk, struct sk_buff *skb)
1323{
1324 struct ipv6_pinfo *np = inet6_sk(sk);
1325 struct tcp_sock *tp;
1326 struct sk_buff *opt_skb = NULL;
1327
1328 /* Imagine: socket is IPv6. IPv4 packet arrives,
1329 goes to IPv4 receive handler and backlogged.
1330 From backlog it always goes here. Kerboom...
1331 Fortunately, tcp_rcv_established and rcv_established
1332 handle them correctly, but it is not case with
1333 tcp_v6_hnd_req and tcp_v6_send_reset(). --ANK
1334 */
1335
1336 if (skb->protocol == htons(ETH_P_IP))
1337 return tcp_v4_do_rcv(sk, skb);
1338
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -08001339#ifdef CONFIG_TCP_MD5SIG
1340 if (tcp_v6_inbound_md5_hash (sk, skb))
1341 goto discard;
1342#endif
1343
Dmitry Mishinfda9ef52006-08-31 15:28:39 -07001344 if (sk_filter(sk, skb))
Linus Torvalds1da177e2005-04-16 15:20:36 -07001345 goto discard;
1346
1347 /*
1348 * socket locking is here for SMP purposes as backlog rcv
1349 * is currently called with bh processing disabled.
1350 */
1351
1352 /* Do Stevens' IPV6_PKTOPTIONS.
1353
1354 Yes, guys, it is the only place in our code, where we
1355 may make it not affecting IPv4.
1356 The rest of code is protocol independent,
1357 and I do not like idea to uglify IPv4.
1358
1359 Actually, all the idea behind IPV6_PKTOPTIONS
1360 looks not very well thought. For now we latch
1361 options, received in the last packet, enqueued
1362 by tcp. Feel free to propose better solution.
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +09001363 --ANK (980728)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001364 */
1365 if (np->rxopt.all)
Mel Gorman99a1dec2012-07-31 16:44:14 -07001366 opt_skb = skb_clone(skb, sk_gfp_atomic(sk, GFP_ATOMIC));
Linus Torvalds1da177e2005-04-16 15:20:36 -07001367
1368 if (sk->sk_state == TCP_ESTABLISHED) { /* Fast path */
Eric Dumazet5d299f32012-08-06 05:09:33 +00001369 struct dst_entry *dst = sk->sk_rx_dst;
1370
Tom Herbertbdeab992011-08-14 19:45:55 +00001371 sock_rps_save_rxhash(sk, skb);
Eric Dumazet5d299f32012-08-06 05:09:33 +00001372 if (dst) {
1373 if (inet_sk(sk)->rx_dst_ifindex != skb->skb_iif ||
1374 dst->ops->check(dst, np->rx_dst_cookie) == NULL) {
1375 dst_release(dst);
1376 sk->sk_rx_dst = NULL;
1377 }
1378 }
1379
Vijay Subramanianc995ae22013-09-03 12:23:22 -07001380 tcp_rcv_established(sk, skb, tcp_hdr(skb), skb->len);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001381 if (opt_skb)
1382 goto ipv6_pktoptions;
1383 return 0;
1384 }
1385
Arnaldo Carvalho de Meloab6a5bb2007-03-18 17:43:48 -07001386 if (skb->len < tcp_hdrlen(skb) || tcp_checksum_complete(skb))
Linus Torvalds1da177e2005-04-16 15:20:36 -07001387 goto csum_err;
1388
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +09001389 if (sk->sk_state == TCP_LISTEN) {
Linus Torvalds1da177e2005-04-16 15:20:36 -07001390 struct sock *nsk = tcp_v6_hnd_req(sk, skb);
1391 if (!nsk)
1392 goto discard;
1393
1394 /*
1395 * Queue it on the new socket if the new socket is active,
1396 * otherwise we just shortcircuit this and continue with
1397 * the new socket..
1398 */
Weilong Chen4c99aa42013-12-19 18:44:34 +08001399 if (nsk != sk) {
Tom Herbertbdeab992011-08-14 19:45:55 +00001400 sock_rps_save_rxhash(nsk, skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001401 if (tcp_child_process(sk, nsk, skb))
1402 goto reset;
1403 if (opt_skb)
1404 __kfree_skb(opt_skb);
1405 return 0;
1406 }
Neil Horman47482f12011-04-06 13:07:09 -07001407 } else
Tom Herbertbdeab992011-08-14 19:45:55 +00001408 sock_rps_save_rxhash(sk, skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001409
Arnaldo Carvalho de Meloaa8223c2007-04-10 21:04:22 -07001410 if (tcp_rcv_state_process(sk, skb, tcp_hdr(skb), skb->len))
Linus Torvalds1da177e2005-04-16 15:20:36 -07001411 goto reset;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001412 if (opt_skb)
1413 goto ipv6_pktoptions;
1414 return 0;
1415
1416reset:
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -08001417 tcp_v6_send_reset(sk, skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001418discard:
1419 if (opt_skb)
1420 __kfree_skb(opt_skb);
1421 kfree_skb(skb);
1422 return 0;
1423csum_err:
Eric Dumazet6a5dc9e2013-04-29 08:39:56 +00001424 TCP_INC_STATS_BH(sock_net(sk), TCP_MIB_CSUMERRORS);
Pavel Emelyanov63231bd2008-07-16 20:22:25 -07001425 TCP_INC_STATS_BH(sock_net(sk), TCP_MIB_INERRS);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001426 goto discard;
1427
1428
1429ipv6_pktoptions:
1430 /* Do you ask, what is it?
1431
1432 1. skb was enqueued by tcp.
1433 2. skb is added to tail of read queue, rather than out of order.
1434 3. socket is not in passive state.
1435 4. Finally, it really contains options, which user wants to receive.
1436 */
1437 tp = tcp_sk(sk);
1438 if (TCP_SKB_CB(opt_skb)->end_seq == tp->rcv_nxt &&
1439 !((1 << sk->sk_state) & (TCPF_CLOSE | TCPF_LISTEN))) {
YOSHIFUJI Hideaki333fad52005-09-08 09:59:17 +09001440 if (np->rxopt.bits.rxinfo || np->rxopt.bits.rxoinfo)
Arnaldo Carvalho de Melo505cbfc2005-08-12 09:19:38 -03001441 np->mcast_oif = inet6_iif(opt_skb);
YOSHIFUJI Hideaki333fad52005-09-08 09:59:17 +09001442 if (np->rxopt.bits.rxhlim || np->rxopt.bits.rxohlim)
Arnaldo Carvalho de Melo0660e032007-04-25 17:54:47 -07001443 np->mcast_hops = ipv6_hdr(opt_skb)->hop_limit;
Florent Fourcot82e9f102013-12-08 15:46:59 +01001444 if (np->rxopt.bits.rxflow || np->rxopt.bits.rxtclass)
Florent Fourcot1397ed32013-12-08 15:46:57 +01001445 np->rcv_flowinfo = ip6_flowinfo(ipv6_hdr(opt_skb));
Florent Fourcotdf3687f2014-01-17 17:15:03 +01001446 if (np->repflow)
1447 np->flow_label = ip6_flowlabel(ipv6_hdr(opt_skb));
Linus Torvalds1da177e2005-04-16 15:20:36 -07001448 if (ipv6_opt_accepted(sk, opt_skb)) {
1449 skb_set_owner_r(opt_skb, sk);
1450 opt_skb = xchg(&np->pktoptions, opt_skb);
1451 } else {
1452 __kfree_skb(opt_skb);
1453 opt_skb = xchg(&np->pktoptions, NULL);
1454 }
1455 }
1456
Wei Yongjun800d55f2009-02-23 21:45:33 +00001457 kfree_skb(opt_skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001458 return 0;
1459}
1460
Herbert Xue5bbef22007-10-15 12:50:28 -07001461static int tcp_v6_rcv(struct sk_buff *skb)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001462{
Eric Dumazetcf533ea2011-10-21 05:22:42 -04001463 const struct tcphdr *th;
Eric Dumazetb71d1d42011-04-22 04:53:02 +00001464 const struct ipv6hdr *hdr;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001465 struct sock *sk;
1466 int ret;
Pavel Emelyanova86b1e32008-07-16 20:20:58 -07001467 struct net *net = dev_net(skb->dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001468
1469 if (skb->pkt_type != PACKET_HOST)
1470 goto discard_it;
1471
1472 /*
1473 * Count it even if it's bad.
1474 */
Pavel Emelyanov63231bd2008-07-16 20:22:25 -07001475 TCP_INC_STATS_BH(net, TCP_MIB_INSEGS);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001476
1477 if (!pskb_may_pull(skb, sizeof(struct tcphdr)))
1478 goto discard_it;
1479
Arnaldo Carvalho de Meloaa8223c2007-04-10 21:04:22 -07001480 th = tcp_hdr(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001481
1482 if (th->doff < sizeof(struct tcphdr)/4)
1483 goto bad_packet;
1484 if (!pskb_may_pull(skb, th->doff*4))
1485 goto discard_it;
1486
Herbert Xu60476372007-04-09 11:59:39 -07001487 if (!skb_csum_unnecessary(skb) && tcp_v6_checksum_init(skb))
Eric Dumazet6a5dc9e2013-04-29 08:39:56 +00001488 goto csum_error;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001489
Arnaldo Carvalho de Meloaa8223c2007-04-10 21:04:22 -07001490 th = tcp_hdr(skb);
Stephen Hemmingere802af92010-04-22 15:24:53 -07001491 hdr = ipv6_hdr(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001492 TCP_SKB_CB(skb)->seq = ntohl(th->seq);
1493 TCP_SKB_CB(skb)->end_seq = (TCP_SKB_CB(skb)->seq + th->syn + th->fin +
1494 skb->len - th->doff*4);
1495 TCP_SKB_CB(skb)->ack_seq = ntohl(th->ack_seq);
1496 TCP_SKB_CB(skb)->when = 0;
Eric Dumazetb82d1bb2011-09-27 02:20:08 -04001497 TCP_SKB_CB(skb)->ip_dsfield = ipv6_get_dsfield(hdr);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001498 TCP_SKB_CB(skb)->sacked = 0;
1499
Arnaldo Carvalho de Melo9a1f27c2008-10-07 11:41:57 -07001500 sk = __inet6_lookup_skb(&tcp_hashinfo, skb, th->source, th->dest);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001501 if (!sk)
1502 goto no_tcp_socket;
1503
1504process:
1505 if (sk->sk_state == TCP_TIME_WAIT)
1506 goto do_time_wait;
1507
Stephen Hemmingere802af92010-04-22 15:24:53 -07001508 if (hdr->hop_limit < inet6_sk(sk)->min_hopcount) {
1509 NET_INC_STATS_BH(net, LINUX_MIB_TCPMINTTLDROP);
1510 goto discard_and_relse;
1511 }
1512
Linus Torvalds1da177e2005-04-16 15:20:36 -07001513 if (!xfrm6_policy_check(sk, XFRM_POLICY_IN, skb))
1514 goto discard_and_relse;
1515
Dmitry Mishinfda9ef52006-08-31 15:28:39 -07001516 if (sk_filter(sk, skb))
Linus Torvalds1da177e2005-04-16 15:20:36 -07001517 goto discard_and_relse;
1518
Eliezer Tamir8b80cda2013-07-10 17:13:26 +03001519 sk_mark_napi_id(sk, skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001520 skb->dev = NULL;
1521
Fabio Olive Leite293b9c42006-09-25 22:28:47 -07001522 bh_lock_sock_nested(sk);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001523 ret = 0;
1524 if (!sock_owned_by_user(sk)) {
Chris Leech1a2449a2006-05-23 18:05:53 -07001525#ifdef CONFIG_NET_DMA
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +09001526 struct tcp_sock *tp = tcp_sk(sk);
David S. Millerb4caea82007-10-26 04:20:13 -07001527 if (!tp->ucopy.dma_chan && tp->ucopy.pinned_list)
Dave Jianga2bd1142012-04-04 16:10:46 -07001528 tp->ucopy.dma_chan = net_dma_find_channel();
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +09001529 if (tp->ucopy.dma_chan)
1530 ret = tcp_v6_do_rcv(sk, skb);
1531 else
Chris Leech1a2449a2006-05-23 18:05:53 -07001532#endif
1533 {
1534 if (!tcp_prequeue(sk, skb))
1535 ret = tcp_v6_do_rcv(sk, skb);
1536 }
Eric Dumazetda882c12012-04-22 23:38:54 +00001537 } else if (unlikely(sk_add_backlog(sk, skb,
1538 sk->sk_rcvbuf + sk->sk_sndbuf))) {
Zhu Yi6b03a532010-03-04 18:01:41 +00001539 bh_unlock_sock(sk);
Eric Dumazet6cce09f2010-03-07 23:21:57 +00001540 NET_INC_STATS_BH(net, LINUX_MIB_TCPBACKLOGDROP);
Zhu Yi6b03a532010-03-04 18:01:41 +00001541 goto discard_and_relse;
1542 }
Linus Torvalds1da177e2005-04-16 15:20:36 -07001543 bh_unlock_sock(sk);
1544
1545 sock_put(sk);
1546 return ret ? -1 : 0;
1547
1548no_tcp_socket:
1549 if (!xfrm6_policy_check(NULL, XFRM_POLICY_IN, skb))
1550 goto discard_it;
1551
1552 if (skb->len < (th->doff<<2) || tcp_checksum_complete(skb)) {
Eric Dumazet6a5dc9e2013-04-29 08:39:56 +00001553csum_error:
1554 TCP_INC_STATS_BH(net, TCP_MIB_CSUMERRORS);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001555bad_packet:
Pavel Emelyanov63231bd2008-07-16 20:22:25 -07001556 TCP_INC_STATS_BH(net, TCP_MIB_INERRS);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001557 } else {
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -08001558 tcp_v6_send_reset(NULL, skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001559 }
1560
1561discard_it:
Linus Torvalds1da177e2005-04-16 15:20:36 -07001562 kfree_skb(skb);
1563 return 0;
1564
1565discard_and_relse:
1566 sock_put(sk);
1567 goto discard_it;
1568
1569do_time_wait:
1570 if (!xfrm6_policy_check(NULL, XFRM_POLICY_IN, skb)) {
YOSHIFUJI Hideaki9469c7b2006-10-10 19:41:46 -07001571 inet_twsk_put(inet_twsk(sk));
Linus Torvalds1da177e2005-04-16 15:20:36 -07001572 goto discard_it;
1573 }
1574
Eric Dumazet6a5dc9e2013-04-29 08:39:56 +00001575 if (skb->len < (th->doff<<2)) {
YOSHIFUJI Hideaki9469c7b2006-10-10 19:41:46 -07001576 inet_twsk_put(inet_twsk(sk));
Eric Dumazet6a5dc9e2013-04-29 08:39:56 +00001577 goto bad_packet;
1578 }
1579 if (tcp_checksum_complete(skb)) {
1580 inet_twsk_put(inet_twsk(sk));
1581 goto csum_error;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001582 }
1583
YOSHIFUJI Hideaki9469c7b2006-10-10 19:41:46 -07001584 switch (tcp_timewait_state_process(inet_twsk(sk), skb, th)) {
Linus Torvalds1da177e2005-04-16 15:20:36 -07001585 case TCP_TW_SYN:
1586 {
1587 struct sock *sk2;
1588
YOSHIFUJI Hideakic346dca2008-03-25 21:47:49 +09001589 sk2 = inet6_lookup_listener(dev_net(skb->dev), &tcp_hashinfo,
Tom Herbert5ba24952013-01-22 09:50:39 +00001590 &ipv6_hdr(skb)->saddr, th->source,
Arnaldo Carvalho de Melo0660e032007-04-25 17:54:47 -07001591 &ipv6_hdr(skb)->daddr,
Arnaldo Carvalho de Melo505cbfc2005-08-12 09:19:38 -03001592 ntohs(th->dest), inet6_iif(skb));
Linus Torvalds1da177e2005-04-16 15:20:36 -07001593 if (sk2 != NULL) {
Arnaldo Carvalho de Melo295ff7e2005-08-09 20:44:40 -07001594 struct inet_timewait_sock *tw = inet_twsk(sk);
1595 inet_twsk_deschedule(tw, &tcp_death_row);
1596 inet_twsk_put(tw);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001597 sk = sk2;
1598 goto process;
1599 }
1600 /* Fall through to ACK */
1601 }
1602 case TCP_TW_ACK:
1603 tcp_v6_timewait_ack(sk, skb);
1604 break;
1605 case TCP_TW_RST:
1606 goto no_tcp_socket;
1607 case TCP_TW_SUCCESS:;
1608 }
1609 goto discard_it;
1610}
1611
Eric Dumazetc7109982012-07-26 12:18:11 +00001612static void tcp_v6_early_demux(struct sk_buff *skb)
1613{
1614 const struct ipv6hdr *hdr;
1615 const struct tcphdr *th;
1616 struct sock *sk;
1617
1618 if (skb->pkt_type != PACKET_HOST)
1619 return;
1620
1621 if (!pskb_may_pull(skb, skb_transport_offset(skb) + sizeof(struct tcphdr)))
1622 return;
1623
1624 hdr = ipv6_hdr(skb);
1625 th = tcp_hdr(skb);
1626
1627 if (th->doff < sizeof(struct tcphdr) / 4)
1628 return;
1629
1630 sk = __inet6_lookup_established(dev_net(skb->dev), &tcp_hashinfo,
1631 &hdr->saddr, th->source,
1632 &hdr->daddr, ntohs(th->dest),
1633 inet6_iif(skb));
1634 if (sk) {
1635 skb->sk = sk;
1636 skb->destructor = sock_edemux;
1637 if (sk->sk_state != TCP_TIME_WAIT) {
1638 struct dst_entry *dst = sk->sk_rx_dst;
Neal Cardwellf3f12132012-10-22 21:41:48 +00001639
Eric Dumazetc7109982012-07-26 12:18:11 +00001640 if (dst)
Eric Dumazet5d299f32012-08-06 05:09:33 +00001641 dst = dst_check(dst, inet6_sk(sk)->rx_dst_cookie);
Eric Dumazetc7109982012-07-26 12:18:11 +00001642 if (dst &&
Neal Cardwellf3f12132012-10-22 21:41:48 +00001643 inet_sk(sk)->rx_dst_ifindex == skb->skb_iif)
Eric Dumazetc7109982012-07-26 12:18:11 +00001644 skb_dst_set_noref(skb, dst);
1645 }
1646 }
1647}
1648
David S. Millerccb7c412010-12-01 18:09:13 -08001649static struct timewait_sock_ops tcp6_timewait_sock_ops = {
1650 .twsk_obj_size = sizeof(struct tcp6_timewait_sock),
1651 .twsk_unique = tcp_twsk_unique,
1652 .twsk_destructor= tcp_twsk_destructor,
David S. Millerccb7c412010-12-01 18:09:13 -08001653};
1654
Stephen Hemminger3b401a82009-09-01 19:25:04 +00001655static const struct inet_connection_sock_af_ops ipv6_specific = {
Arnaldo Carvalho de Melo543d9cf2006-03-20 22:48:35 -08001656 .queue_xmit = inet6_csk_xmit,
1657 .send_check = tcp_v6_send_check,
1658 .rebuild_header = inet6_sk_rebuild_header,
Eric Dumazet5d299f32012-08-06 05:09:33 +00001659 .sk_rx_dst_set = inet6_sk_rx_dst_set,
Arnaldo Carvalho de Melo543d9cf2006-03-20 22:48:35 -08001660 .conn_request = tcp_v6_conn_request,
1661 .syn_recv_sock = tcp_v6_syn_recv_sock,
Arnaldo Carvalho de Melo543d9cf2006-03-20 22:48:35 -08001662 .net_header_len = sizeof(struct ipv6hdr),
Eric Dumazet67469602012-04-24 07:37:38 +00001663 .net_frag_header_len = sizeof(struct frag_hdr),
Arnaldo Carvalho de Melo543d9cf2006-03-20 22:48:35 -08001664 .setsockopt = ipv6_setsockopt,
1665 .getsockopt = ipv6_getsockopt,
1666 .addr2sockaddr = inet6_csk_addr2sockaddr,
1667 .sockaddr_len = sizeof(struct sockaddr_in6),
Arnaldo Carvalho de Meloab1e0a12008-02-03 04:06:04 -08001668 .bind_conflict = inet6_csk_bind_conflict,
Dmitry Mishin3fdadf72006-03-20 22:45:21 -08001669#ifdef CONFIG_COMPAT
Arnaldo Carvalho de Melo543d9cf2006-03-20 22:48:35 -08001670 .compat_setsockopt = compat_ipv6_setsockopt,
1671 .compat_getsockopt = compat_ipv6_getsockopt,
Dmitry Mishin3fdadf72006-03-20 22:45:21 -08001672#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -07001673};
1674
#ifdef CONFIG_TCP_MD5SIG
/*
 * TCP MD5 signature hooks for native IPv6 sockets.
 * Installed by tcp_v6_init_sock() when CONFIG_TCP_MD5SIG is set.
 */
static const struct tcp_sock_af_ops tcp_sock_ipv6_specific = {
	.md5_lookup	= tcp_v6_md5_lookup,
	.calc_md5_hash	= tcp_v6_md5_hash_skb,
	.md5_parse	= tcp_v6_parse_md5_keys,
};
#endif
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -08001682
Linus Torvalds1da177e2005-04-16 15:20:36 -07001683/*
1684 * TCP over IPv4 via INET6 API
1685 */
1686
Stephen Hemminger3b401a82009-09-01 19:25:04 +00001687static const struct inet_connection_sock_af_ops ipv6_mapped = {
Arnaldo Carvalho de Melo543d9cf2006-03-20 22:48:35 -08001688 .queue_xmit = ip_queue_xmit,
1689 .send_check = tcp_v4_send_check,
1690 .rebuild_header = inet_sk_rebuild_header,
Eric Dumazet63d02d12012-08-09 14:11:00 +00001691 .sk_rx_dst_set = inet_sk_rx_dst_set,
Arnaldo Carvalho de Melo543d9cf2006-03-20 22:48:35 -08001692 .conn_request = tcp_v6_conn_request,
1693 .syn_recv_sock = tcp_v6_syn_recv_sock,
Arnaldo Carvalho de Melo543d9cf2006-03-20 22:48:35 -08001694 .net_header_len = sizeof(struct iphdr),
1695 .setsockopt = ipv6_setsockopt,
1696 .getsockopt = ipv6_getsockopt,
1697 .addr2sockaddr = inet6_csk_addr2sockaddr,
1698 .sockaddr_len = sizeof(struct sockaddr_in6),
Arnaldo Carvalho de Meloab1e0a12008-02-03 04:06:04 -08001699 .bind_conflict = inet6_csk_bind_conflict,
Dmitry Mishin3fdadf72006-03-20 22:45:21 -08001700#ifdef CONFIG_COMPAT
Arnaldo Carvalho de Melo543d9cf2006-03-20 22:48:35 -08001701 .compat_setsockopt = compat_ipv6_setsockopt,
1702 .compat_getsockopt = compat_ipv6_getsockopt,
Dmitry Mishin3fdadf72006-03-20 22:45:21 -08001703#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -07001704};
1705
#ifdef CONFIG_TCP_MD5SIG
/*
 * TCP MD5 signature hooks for the v4-mapped case: lookup and hashing
 * use the IPv4 helpers, key parsing uses the IPv6 one.
 */
static const struct tcp_sock_af_ops tcp_sock_ipv6_mapped_specific = {
	.md5_lookup	= tcp_v4_md5_lookup,
	.calc_md5_hash	= tcp_v4_md5_hash_skb,
	.md5_parse	= tcp_v6_parse_md5_keys,
};
#endif
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -08001713
Linus Torvalds1da177e2005-04-16 15:20:36 -07001714/* NOTE: A lot of things set to zero explicitly by call to
1715 * sk_alloc() so need not be done here.
1716 */
1717static int tcp_v6_init_sock(struct sock *sk)
1718{
Arnaldo Carvalho de Melo6687e982005-08-10 04:03:31 -03001719 struct inet_connection_sock *icsk = inet_csk(sk);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001720
Neal Cardwell900f65d2012-04-19 09:55:21 +00001721 tcp_init_sock(sk);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001722
Arnaldo Carvalho de Melo8292a172005-12-13 23:15:52 -08001723 icsk->icsk_af_ops = &ipv6_specific;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001724
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -08001725#ifdef CONFIG_TCP_MD5SIG
David S. Millerac807fa2012-04-23 03:21:58 -04001726 tcp_sk(sk)->af_specific = &tcp_sock_ipv6_specific;
YOSHIFUJI Hideakicfb6eeb2006-11-14 19:07:45 -08001727#endif
1728
Linus Torvalds1da177e2005-04-16 15:20:36 -07001729 return 0;
1730}
1731
/*
 * Tear down a TCPv6 socket: run the shared TCP destructor first, then
 * the IPv6-level socket destructor.
 */
static void tcp_v6_destroy_sock(struct sock *sk)
{
	tcp_v4_destroy_sock(sk);
	inet6_destroy_sock(sk);
}
1737
YOSHIFUJI Hideaki952a10b2007-04-21 20:13:44 +09001738#ifdef CONFIG_PROC_FS
Linus Torvalds1da177e2005-04-16 15:20:36 -07001739/* Proc filesystem TCPv6 sock list dumping. */
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +09001740static void get_openreq6(struct seq_file *seq,
Eric W. Biedermana7cb5a42012-05-24 01:10:10 -06001741 const struct sock *sk, struct request_sock *req, int i, kuid_t uid)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001742{
Linus Torvalds1da177e2005-04-16 15:20:36 -07001743 int ttd = req->expires - jiffies;
Eric Dumazet634fb9792013-10-09 15:21:29 -07001744 const struct in6_addr *src = &inet_rsk(req)->ir_v6_loc_addr;
1745 const struct in6_addr *dest = &inet_rsk(req)->ir_v6_rmt_addr;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001746
1747 if (ttd < 0)
1748 ttd = 0;
1749
Linus Torvalds1da177e2005-04-16 15:20:36 -07001750 seq_printf(seq,
1751 "%4d: %08X%08X%08X%08X:%04X %08X%08X%08X%08X:%04X "
Francesco Fuscod14c5ab2013-08-15 13:42:14 +02001752 "%02X %08X:%08X %02X:%08lX %08X %5u %8d %d %d %pK\n",
Linus Torvalds1da177e2005-04-16 15:20:36 -07001753 i,
1754 src->s6_addr32[0], src->s6_addr32[1],
1755 src->s6_addr32[2], src->s6_addr32[3],
Eric Dumazetb44084c2013-10-10 00:04:37 -07001756 inet_rsk(req)->ir_num,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001757 dest->s6_addr32[0], dest->s6_addr32[1],
1758 dest->s6_addr32[2], dest->s6_addr32[3],
Eric Dumazet634fb9792013-10-09 15:21:29 -07001759 ntohs(inet_rsk(req)->ir_rmt_port),
Linus Torvalds1da177e2005-04-16 15:20:36 -07001760 TCP_SYN_RECV,
Weilong Chen4c99aa42013-12-19 18:44:34 +08001761 0, 0, /* could print option size, but that is af dependent. */
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +09001762 1, /* timers active (only the expire timer) */
1763 jiffies_to_clock_t(ttd),
Eric Dumazete6c022a2012-10-27 23:16:46 +00001764 req->num_timeout,
Eric W. Biedermana7cb5a42012-05-24 01:10:10 -06001765 from_kuid_munged(seq_user_ns(seq), uid),
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +09001766 0, /* non standard timer */
Linus Torvalds1da177e2005-04-16 15:20:36 -07001767 0, /* open_requests have no inode */
1768 0, req);
1769}
1770
1771static void get_tcp6_sock(struct seq_file *seq, struct sock *sp, int i)
1772{
Eric Dumazetb71d1d42011-04-22 04:53:02 +00001773 const struct in6_addr *dest, *src;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001774 __u16 destp, srcp;
1775 int timer_active;
1776 unsigned long timer_expires;
Eric Dumazetcf533ea2011-10-21 05:22:42 -04001777 const struct inet_sock *inet = inet_sk(sp);
1778 const struct tcp_sock *tp = tcp_sk(sp);
Arnaldo Carvalho de Melo463c84b2005-08-09 20:10:42 -07001779 const struct inet_connection_sock *icsk = inet_csk(sp);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001780
Eric Dumazetefe42082013-10-03 15:42:29 -07001781 dest = &sp->sk_v6_daddr;
1782 src = &sp->sk_v6_rcv_saddr;
Eric Dumazetc720c7e2009-10-15 06:30:45 +00001783 destp = ntohs(inet->inet_dport);
1784 srcp = ntohs(inet->inet_sport);
Arnaldo Carvalho de Melo463c84b2005-08-09 20:10:42 -07001785
1786 if (icsk->icsk_pending == ICSK_TIME_RETRANS) {
Linus Torvalds1da177e2005-04-16 15:20:36 -07001787 timer_active = 1;
Arnaldo Carvalho de Melo463c84b2005-08-09 20:10:42 -07001788 timer_expires = icsk->icsk_timeout;
1789 } else if (icsk->icsk_pending == ICSK_TIME_PROBE0) {
Linus Torvalds1da177e2005-04-16 15:20:36 -07001790 timer_active = 4;
Arnaldo Carvalho de Melo463c84b2005-08-09 20:10:42 -07001791 timer_expires = icsk->icsk_timeout;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001792 } else if (timer_pending(&sp->sk_timer)) {
1793 timer_active = 2;
1794 timer_expires = sp->sk_timer.expires;
1795 } else {
1796 timer_active = 0;
1797 timer_expires = jiffies;
1798 }
1799
1800 seq_printf(seq,
1801 "%4d: %08X%08X%08X%08X:%04X %08X%08X%08X%08X:%04X "
Francesco Fuscod14c5ab2013-08-15 13:42:14 +02001802 "%02X %08X:%08X %02X:%08lX %08X %5u %8d %lu %d %pK %lu %lu %u %u %d\n",
Linus Torvalds1da177e2005-04-16 15:20:36 -07001803 i,
1804 src->s6_addr32[0], src->s6_addr32[1],
1805 src->s6_addr32[2], src->s6_addr32[3], srcp,
1806 dest->s6_addr32[0], dest->s6_addr32[1],
1807 dest->s6_addr32[2], dest->s6_addr32[3], destp,
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +09001808 sp->sk_state,
Sridhar Samudrala47da8ee2006-06-27 13:29:00 -07001809 tp->write_seq-tp->snd_una,
1810 (sp->sk_state == TCP_LISTEN) ? sp->sk_ack_backlog : (tp->rcv_nxt - tp->copied_seq),
Linus Torvalds1da177e2005-04-16 15:20:36 -07001811 timer_active,
Eric Dumazeta399a802012-08-08 21:13:53 +00001812 jiffies_delta_to_clock_t(timer_expires - jiffies),
Arnaldo Carvalho de Melo463c84b2005-08-09 20:10:42 -07001813 icsk->icsk_retransmits,
Eric W. Biedermana7cb5a42012-05-24 01:10:10 -06001814 from_kuid_munged(seq_user_ns(seq), sock_i_uid(sp)),
Arnaldo Carvalho de Melo6687e982005-08-10 04:03:31 -03001815 icsk->icsk_probes_out,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001816 sock_i_ino(sp),
1817 atomic_read(&sp->sk_refcnt), sp,
Stephen Hemminger7be87352008-06-27 20:00:19 -07001818 jiffies_to_clock_t(icsk->icsk_rto),
1819 jiffies_to_clock_t(icsk->icsk_ack.ato),
Weilong Chen4c99aa42013-12-19 18:44:34 +08001820 (icsk->icsk_ack.quick << 1) | icsk->icsk_ack.pingpong,
Ilpo Järvinen0b6a05c2009-09-15 01:30:10 -07001821 tp->snd_cwnd,
1822 tcp_in_initial_slowstart(tp) ? -1 : tp->snd_ssthresh
Linus Torvalds1da177e2005-04-16 15:20:36 -07001823 );
1824}
1825
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +09001826static void get_timewait6_sock(struct seq_file *seq,
Arnaldo Carvalho de Melo8feaf0c02005-08-09 20:09:30 -07001827 struct inet_timewait_sock *tw, int i)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001828{
Eric Dumazetb71d1d42011-04-22 04:53:02 +00001829 const struct in6_addr *dest, *src;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001830 __u16 destp, srcp;
Eric Dumazet96f817f2013-10-03 14:27:25 -07001831 s32 delta = tw->tw_ttd - inet_tw_time_stamp();
Linus Torvalds1da177e2005-04-16 15:20:36 -07001832
Eric Dumazetefe42082013-10-03 15:42:29 -07001833 dest = &tw->tw_v6_daddr;
1834 src = &tw->tw_v6_rcv_saddr;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001835 destp = ntohs(tw->tw_dport);
1836 srcp = ntohs(tw->tw_sport);
1837
1838 seq_printf(seq,
1839 "%4d: %08X%08X%08X%08X:%04X %08X%08X%08X%08X:%04X "
Dan Rosenberg71338aa2011-05-23 12:17:35 +00001840 "%02X %08X:%08X %02X:%08lX %08X %5d %8d %d %d %pK\n",
Linus Torvalds1da177e2005-04-16 15:20:36 -07001841 i,
1842 src->s6_addr32[0], src->s6_addr32[1],
1843 src->s6_addr32[2], src->s6_addr32[3], srcp,
1844 dest->s6_addr32[0], dest->s6_addr32[1],
1845 dest->s6_addr32[2], dest->s6_addr32[3], destp,
1846 tw->tw_substate, 0, 0,
Eric Dumazeta399a802012-08-08 21:13:53 +00001847 3, jiffies_delta_to_clock_t(delta), 0, 0, 0, 0,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001848 atomic_read(&tw->tw_refcnt), tw);
1849}
1850
Linus Torvalds1da177e2005-04-16 15:20:36 -07001851static int tcp6_seq_show(struct seq_file *seq, void *v)
1852{
1853 struct tcp_iter_state *st;
Eric Dumazet05dbc7b2013-10-03 00:22:02 -07001854 struct sock *sk = v;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001855
1856 if (v == SEQ_START_TOKEN) {
1857 seq_puts(seq,
1858 " sl "
1859 "local_address "
1860 "remote_address "
1861 "st tx_queue rx_queue tr tm->when retrnsmt"
1862 " uid timeout inode\n");
1863 goto out;
1864 }
1865 st = seq->private;
1866
1867 switch (st->state) {
1868 case TCP_SEQ_STATE_LISTENING:
1869 case TCP_SEQ_STATE_ESTABLISHED:
Eric Dumazet05dbc7b2013-10-03 00:22:02 -07001870 if (sk->sk_state == TCP_TIME_WAIT)
1871 get_timewait6_sock(seq, v, st->num);
1872 else
1873 get_tcp6_sock(seq, v, st->num);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001874 break;
1875 case TCP_SEQ_STATE_OPENREQ:
1876 get_openreq6(seq, st->syn_wait_sk, v, st->num, st->uid);
1877 break;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001878 }
1879out:
1880 return 0;
1881}
1882
Arjan van de Ven73cb88e2011-10-30 06:46:30 +00001883static const struct file_operations tcp6_afinfo_seq_fops = {
1884 .owner = THIS_MODULE,
1885 .open = tcp_seq_open,
1886 .read = seq_read,
1887 .llseek = seq_lseek,
1888 .release = seq_release_net
1889};
1890
Linus Torvalds1da177e2005-04-16 15:20:36 -07001891static struct tcp_seq_afinfo tcp6_seq_afinfo = {
Linus Torvalds1da177e2005-04-16 15:20:36 -07001892 .name = "tcp6",
1893 .family = AF_INET6,
Arjan van de Ven73cb88e2011-10-30 06:46:30 +00001894 .seq_fops = &tcp6_afinfo_seq_fops,
Denis V. Lunev9427c4b2008-04-13 22:12:13 -07001895 .seq_ops = {
1896 .show = tcp6_seq_show,
1897 },
Linus Torvalds1da177e2005-04-16 15:20:36 -07001898};
1899
Alexey Dobriyan2c8c1e72010-01-17 03:35:32 +00001900int __net_init tcp6_proc_init(struct net *net)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001901{
Daniel Lezcano6f8b13b2008-03-21 04:14:45 -07001902 return tcp_proc_register(net, &tcp6_seq_afinfo);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001903}
1904
Daniel Lezcano6f8b13b2008-03-21 04:14:45 -07001905void tcp6_proc_exit(struct net *net)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001906{
Daniel Lezcano6f8b13b2008-03-21 04:14:45 -07001907 tcp_proc_unregister(net, &tcp6_seq_afinfo);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001908}
1909#endif
1910
Eric Dumazetf77d6022013-05-09 10:28:16 +00001911static void tcp_v6_clear_sk(struct sock *sk, int size)
1912{
1913 struct inet_sock *inet = inet_sk(sk);
1914
1915 /* we do not want to clear pinet6 field, because of RCU lookups */
1916 sk_prot_clear_nulls(sk, offsetof(struct inet_sock, pinet6));
1917
1918 size -= offsetof(struct inet_sock, pinet6) + sizeof(inet->pinet6);
1919 memset(&inet->pinet6 + 1, 0, size);
1920}
1921
Linus Torvalds1da177e2005-04-16 15:20:36 -07001922struct proto tcpv6_prot = {
1923 .name = "TCPv6",
1924 .owner = THIS_MODULE,
1925 .close = tcp_close,
1926 .connect = tcp_v6_connect,
1927 .disconnect = tcp_disconnect,
Arnaldo Carvalho de Melo463c84b2005-08-09 20:10:42 -07001928 .accept = inet_csk_accept,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001929 .ioctl = tcp_ioctl,
1930 .init = tcp_v6_init_sock,
1931 .destroy = tcp_v6_destroy_sock,
1932 .shutdown = tcp_shutdown,
1933 .setsockopt = tcp_setsockopt,
1934 .getsockopt = tcp_getsockopt,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001935 .recvmsg = tcp_recvmsg,
Changli Gao7ba42912010-07-10 20:41:55 +00001936 .sendmsg = tcp_sendmsg,
1937 .sendpage = tcp_sendpage,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001938 .backlog_rcv = tcp_v6_do_rcv,
Eric Dumazet46d3cea2012-07-11 05:50:31 +00001939 .release_cb = tcp_release_cb,
Eric Dumazet563d34d2012-07-23 09:48:52 +02001940 .mtu_reduced = tcp_v6_mtu_reduced,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001941 .hash = tcp_v6_hash,
Arnaldo Carvalho de Meloab1e0a12008-02-03 04:06:04 -08001942 .unhash = inet_unhash,
1943 .get_port = inet_csk_get_port,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001944 .enter_memory_pressure = tcp_enter_memory_pressure,
Eric Dumazetc9bee3b72013-07-22 20:27:07 -07001945 .stream_memory_free = tcp_stream_memory_free,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001946 .sockets_allocated = &tcp_sockets_allocated,
1947 .memory_allocated = &tcp_memory_allocated,
1948 .memory_pressure = &tcp_memory_pressure,
Arnaldo Carvalho de Melo0a5578c2005-08-09 20:11:41 -07001949 .orphan_count = &tcp_orphan_count,
Eric W. Biedermana4fe34b2013-10-19 16:25:36 -07001950 .sysctl_mem = sysctl_tcp_mem,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001951 .sysctl_wmem = sysctl_tcp_wmem,
1952 .sysctl_rmem = sysctl_tcp_rmem,
1953 .max_header = MAX_TCP_HEADER,
1954 .obj_size = sizeof(struct tcp6_sock),
Eric Dumazet3ab5aee2008-11-16 19:40:17 -08001955 .slab_flags = SLAB_DESTROY_BY_RCU,
Arnaldo Carvalho de Melo6d6ee432005-12-13 23:25:19 -08001956 .twsk_prot = &tcp6_timewait_sock_ops,
Arnaldo Carvalho de Melo60236fd2005-06-18 22:47:21 -07001957 .rsk_prot = &tcp6_request_sock_ops,
Pavel Emelyanov39d8cda2008-03-22 16:50:58 -07001958 .h.hashinfo = &tcp_hashinfo,
Changli Gao7ba42912010-07-10 20:41:55 +00001959 .no_autobind = true,
Arnaldo Carvalho de Melo543d9cf2006-03-20 22:48:35 -08001960#ifdef CONFIG_COMPAT
1961 .compat_setsockopt = compat_tcp_setsockopt,
1962 .compat_getsockopt = compat_tcp_getsockopt,
1963#endif
Andrew Mortonc255a452012-07-31 16:43:02 -07001964#ifdef CONFIG_MEMCG_KMEM
Glauber Costad1a4c0b2011-12-11 21:47:04 +00001965 .proto_cgroup = tcp_proto_cgroup,
1966#endif
Eric Dumazetf77d6022013-05-09 10:28:16 +00001967 .clear_sk = tcp_v6_clear_sk,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001968};
1969
Alexey Dobriyan41135cc2009-09-14 12:22:28 +00001970static const struct inet6_protocol tcpv6_protocol = {
Eric Dumazetc7109982012-07-26 12:18:11 +00001971 .early_demux = tcp_v6_early_demux,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001972 .handler = tcp_v6_rcv,
1973 .err_handler = tcp_v6_err,
1974 .flags = INET6_PROTO_NOPOLICY|INET6_PROTO_FINAL,
1975};
1976
Linus Torvalds1da177e2005-04-16 15:20:36 -07001977static struct inet_protosw tcpv6_protosw = {
1978 .type = SOCK_STREAM,
1979 .protocol = IPPROTO_TCP,
1980 .prot = &tcpv6_prot,
1981 .ops = &inet6_stream_ops,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001982 .no_check = 0,
Arnaldo Carvalho de Melod83d8462005-12-13 23:26:10 -08001983 .flags = INET_PROTOSW_PERMANENT |
1984 INET_PROTOSW_ICSK,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001985};
1986
Alexey Dobriyan2c8c1e72010-01-17 03:35:32 +00001987static int __net_init tcpv6_net_init(struct net *net)
Daniel Lezcano93ec9262008-03-07 11:16:02 -08001988{
Denis V. Lunev56772422008-04-03 14:28:30 -07001989 return inet_ctl_sock_create(&net->ipv6.tcp_sk, PF_INET6,
1990 SOCK_RAW, IPPROTO_TCP, net);
Daniel Lezcano93ec9262008-03-07 11:16:02 -08001991}
1992
Alexey Dobriyan2c8c1e72010-01-17 03:35:32 +00001993static void __net_exit tcpv6_net_exit(struct net *net)
Daniel Lezcano93ec9262008-03-07 11:16:02 -08001994{
Denis V. Lunev56772422008-04-03 14:28:30 -07001995 inet_ctl_sock_destroy(net->ipv6.tcp_sk);
Eric W. Biedermanb099ce22009-12-03 02:29:09 +00001996}
1997
Alexey Dobriyan2c8c1e72010-01-17 03:35:32 +00001998static void __net_exit tcpv6_net_exit_batch(struct list_head *net_exit_list)
Eric W. Biedermanb099ce22009-12-03 02:29:09 +00001999{
2000 inet_twsk_purge(&tcp_hashinfo, &tcp_death_row, AF_INET6);
Daniel Lezcano93ec9262008-03-07 11:16:02 -08002001}
2002
2003static struct pernet_operations tcpv6_net_ops = {
Eric W. Biedermanb099ce22009-12-03 02:29:09 +00002004 .init = tcpv6_net_init,
2005 .exit = tcpv6_net_exit,
2006 .exit_batch = tcpv6_net_exit_batch,
Daniel Lezcano93ec9262008-03-07 11:16:02 -08002007};
2008
Daniel Lezcano7f4e4862007-12-11 02:25:35 -08002009int __init tcpv6_init(void)
Linus Torvalds1da177e2005-04-16 15:20:36 -07002010{
Daniel Lezcano7f4e4862007-12-11 02:25:35 -08002011 int ret;
David Woodhouseae0f7d52006-01-11 15:53:04 -08002012
Vlad Yasevich33362882012-11-15 08:49:15 +00002013 ret = inet6_add_protocol(&tcpv6_protocol, IPPROTO_TCP);
2014 if (ret)
Vlad Yasevichc6b641a2012-11-15 08:49:22 +00002015 goto out;
Vlad Yasevich33362882012-11-15 08:49:15 +00002016
Daniel Lezcano7f4e4862007-12-11 02:25:35 -08002017 /* register inet6 protocol */
2018 ret = inet6_register_protosw(&tcpv6_protosw);
2019 if (ret)
2020 goto out_tcpv6_protocol;
2021
Daniel Lezcano93ec9262008-03-07 11:16:02 -08002022 ret = register_pernet_subsys(&tcpv6_net_ops);
Daniel Lezcano7f4e4862007-12-11 02:25:35 -08002023 if (ret)
2024 goto out_tcpv6_protosw;
2025out:
2026 return ret;
2027
Daniel Lezcano7f4e4862007-12-11 02:25:35 -08002028out_tcpv6_protosw:
2029 inet6_unregister_protosw(&tcpv6_protosw);
Vlad Yasevich33362882012-11-15 08:49:15 +00002030out_tcpv6_protocol:
2031 inet6_del_protocol(&tcpv6_protocol, IPPROTO_TCP);
Daniel Lezcano7f4e4862007-12-11 02:25:35 -08002032 goto out;
2033}
2034
Daniel Lezcano09f77092007-12-13 05:34:58 -08002035void tcpv6_exit(void)
Daniel Lezcano7f4e4862007-12-11 02:25:35 -08002036{
Daniel Lezcano93ec9262008-03-07 11:16:02 -08002037 unregister_pernet_subsys(&tcpv6_net_ops);
Daniel Lezcano7f4e4862007-12-11 02:25:35 -08002038 inet6_unregister_protosw(&tcpv6_protosw);
2039 inet6_del_protocol(&tcpv6_protocol, IPPROTO_TCP);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002040}