blob: 9bb031fa1c2f538c827402e3ecc8f90774fd6a55 [file] [log] [blame]
Linus Torvalds1da177e2005-04-16 15:20:36 -07001/*
2 * Internet Control Message Protocol (ICMPv6)
3 * Linux INET6 implementation
4 *
5 * Authors:
6 * Pedro Roque <roque@di.fc.ul.pt>
7 *
8 * $Id: icmp.c,v 1.38 2002/02/08 03:57:19 davem Exp $
9 *
10 * Based on net/ipv4/icmp.c
11 *
12 * RFC 1885
13 *
14 * This program is free software; you can redistribute it and/or
15 * modify it under the terms of the GNU General Public License
16 * as published by the Free Software Foundation; either version
17 * 2 of the License, or (at your option) any later version.
18 */
19
20/*
21 * Changes:
22 *
23 * Andi Kleen : exception handling
24 * Andi Kleen add rate limits. never reply to a icmp.
25 * add more length checks and other fixes.
26 * yoshfuji : ensure to sent parameter problem for
27 * fragments.
28 * YOSHIFUJI Hideaki @USAGI: added sysctl for icmp rate limit.
29 * Randy Dunlap and
30 * YOSHIFUJI Hideaki @USAGI: Per-interface statistics support
31 * Kazunori MIYAZAWA @USAGI: change output process to use ip6_append_data
32 */
33
34#include <linux/module.h>
35#include <linux/errno.h>
36#include <linux/types.h>
37#include <linux/socket.h>
38#include <linux/in.h>
39#include <linux/kernel.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070040#include <linux/sockios.h>
41#include <linux/net.h>
42#include <linux/skbuff.h>
43#include <linux/init.h>
Yasuyuki Kozakai763ecff2006-02-15 15:24:15 -080044#include <linux/netfilter.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070045
46#ifdef CONFIG_SYSCTL
47#include <linux/sysctl.h>
48#endif
49
50#include <linux/inet.h>
51#include <linux/netdevice.h>
52#include <linux/icmpv6.h>
53
54#include <net/ip.h>
55#include <net/sock.h>
56
57#include <net/ipv6.h>
58#include <net/ip6_checksum.h>
59#include <net/protocol.h>
60#include <net/raw.h>
61#include <net/rawv6.h>
62#include <net/transp_v6.h>
63#include <net/ip6_route.h>
64#include <net/addrconf.h>
65#include <net/icmp.h>
66
67#include <asm/uaccess.h>
68#include <asm/system.h>
69
Eric Dumazetba899662005-08-26 12:05:31 -070070DEFINE_SNMP_STAT(struct icmpv6_mib, icmpv6_statistics) __read_mostly;
YOSHIFUJI Hideaki71590392007-02-22 22:05:40 +090071EXPORT_SYMBOL(icmpv6_statistics);
David L Stevens14878f72007-09-16 16:52:35 -070072DEFINE_SNMP_STAT(struct icmpv6msg_mib, icmpv6msg_statistics) __read_mostly;
73EXPORT_SYMBOL(icmpv6msg_statistics);
Linus Torvalds1da177e2005-04-16 15:20:36 -070074
75/*
76 * The ICMP socket(s). This is the most convenient way to flow control
77 * our ICMP output as well as maintain a clean interface throughout
78 * all layers. All Socketless IP sends will soon be gone.
79 *
80 * On SMP we have one ICMP socket per-cpu.
81 */
82static DEFINE_PER_CPU(struct socket *, __icmpv6_socket) = NULL;
83#define icmpv6_socket __get_cpu_var(__icmpv6_socket)
84
Herbert Xue5bbef22007-10-15 12:50:28 -070085static int icmpv6_rcv(struct sk_buff *skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -070086
87static struct inet6_protocol icmpv6_protocol = {
88 .handler = icmpv6_rcv,
89 .flags = INET6_PROTO_FINAL,
90};
91
92static __inline__ int icmpv6_xmit_lock(void)
93{
94 local_bh_disable();
95
96 if (unlikely(!spin_trylock(&icmpv6_socket->sk->sk_lock.slock))) {
97 /* This can happen if the output path (f.e. SIT or
98 * ip6ip6 tunnel) signals dst_link_failure() for an
99 * outgoing ICMP6 packet.
100 */
101 local_bh_enable();
102 return 1;
103 }
104 return 0;
105}
106
107static __inline__ void icmpv6_xmit_unlock(void)
108{
109 spin_unlock_bh(&icmpv6_socket->sk->sk_lock.slock);
110}
111
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +0900112/*
Linus Torvalds1da177e2005-04-16 15:20:36 -0700113 * Slightly more convenient version of icmpv6_send.
114 */
115void icmpv6_param_prob(struct sk_buff *skb, int code, int pos)
116{
117 icmpv6_send(skb, ICMPV6_PARAMPROB, code, pos, skb->dev);
118 kfree_skb(skb);
119}
120
121/*
122 * Figure out, may we reply to this packet with icmp error.
123 *
124 * We do not reply, if:
125 * - it was icmp error message.
126 * - it is truncated, so that it is known, that protocol is ICMPV6
127 * (i.e. in the middle of some exthdr)
128 *
129 * --ANK (980726)
130 */
131
132static int is_ineligible(struct sk_buff *skb)
133{
Arnaldo Carvalho de Melo0660e032007-04-25 17:54:47 -0700134 int ptr = (u8 *)(ipv6_hdr(skb) + 1) - skb->data;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700135 int len = skb->len - ptr;
Arnaldo Carvalho de Melo0660e032007-04-25 17:54:47 -0700136 __u8 nexthdr = ipv6_hdr(skb)->nexthdr;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700137
138 if (len < 0)
139 return 1;
140
Herbert Xu0d3d0772005-04-24 20:16:19 -0700141 ptr = ipv6_skip_exthdr(skb, ptr, &nexthdr);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700142 if (ptr < 0)
143 return 0;
144 if (nexthdr == IPPROTO_ICMPV6) {
145 u8 _type, *tp;
146 tp = skb_header_pointer(skb,
147 ptr+offsetof(struct icmp6hdr, icmp6_type),
148 sizeof(_type), &_type);
149 if (tp == NULL ||
150 !(*tp & ICMPV6_INFOMSG_MASK))
151 return 1;
152 }
153 return 0;
154}
155
Brian Haleyab32ea52006-09-22 14:15:41 -0700156static int sysctl_icmpv6_time __read_mostly = 1*HZ;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700157
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +0900158/*
159 * Check the ICMP output rate limit
Linus Torvalds1da177e2005-04-16 15:20:36 -0700160 */
161static inline int icmpv6_xrlim_allow(struct sock *sk, int type,
162 struct flowi *fl)
163{
164 struct dst_entry *dst;
165 int res = 0;
166
167 /* Informational messages are not limited. */
168 if (type & ICMPV6_INFOMSG_MASK)
169 return 1;
170
171 /* Do not limit pmtu discovery, it would break it. */
172 if (type == ICMPV6_PKT_TOOBIG)
173 return 1;
174
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +0900175 /*
Linus Torvalds1da177e2005-04-16 15:20:36 -0700176 * Look up the output route.
177 * XXX: perhaps the expire for routing entries cloned by
178 * this lookup should be more aggressive (not longer than timeout).
179 */
180 dst = ip6_route_output(sk, fl);
181 if (dst->error) {
YOSHIFUJI Hideakia11d2062006-11-04 20:11:37 +0900182 IP6_INC_STATS(ip6_dst_idev(dst),
183 IPSTATS_MIB_OUTNOROUTES);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700184 } else if (dst->dev && (dst->dev->flags&IFF_LOOPBACK)) {
185 res = 1;
186 } else {
187 struct rt6_info *rt = (struct rt6_info *)dst;
188 int tmo = sysctl_icmpv6_time;
189
190 /* Give more bandwidth to wider prefixes. */
191 if (rt->rt6i_dst.plen < 128)
192 tmo >>= ((128 - rt->rt6i_dst.plen)>>5);
193
194 res = xrlim_allow(dst, tmo);
195 }
196 dst_release(dst);
197 return res;
198}
199
200/*
201 * an inline helper for the "simple" if statement below
202 * checks if parameter problem report is caused by an
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +0900203 * unrecognized IPv6 option that has the Option Type
Linus Torvalds1da177e2005-04-16 15:20:36 -0700204 * highest-order two bits set to 10
205 */
206
207static __inline__ int opt_unrec(struct sk_buff *skb, __u32 offset)
208{
209 u8 _optval, *op;
210
Arnaldo Carvalho de Melobbe735e2007-03-10 22:16:10 -0300211 offset += skb_network_offset(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700212 op = skb_header_pointer(skb, offset, sizeof(_optval), &_optval);
213 if (op == NULL)
214 return 1;
215 return (*op & 0xC0) == 0x80;
216}
217
218static int icmpv6_push_pending_frames(struct sock *sk, struct flowi *fl, struct icmp6hdr *thdr, int len)
219{
220 struct sk_buff *skb;
221 struct icmp6hdr *icmp6h;
222 int err = 0;
223
224 if ((skb = skb_peek(&sk->sk_write_queue)) == NULL)
225 goto out;
226
Arnaldo Carvalho de Melocc70ab22007-03-13 14:03:22 -0300227 icmp6h = icmp6_hdr(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700228 memcpy(icmp6h, thdr, sizeof(struct icmp6hdr));
229 icmp6h->icmp6_cksum = 0;
230
231 if (skb_queue_len(&sk->sk_write_queue) == 1) {
232 skb->csum = csum_partial((char *)icmp6h,
233 sizeof(struct icmp6hdr), skb->csum);
234 icmp6h->icmp6_cksum = csum_ipv6_magic(&fl->fl6_src,
235 &fl->fl6_dst,
236 len, fl->proto,
237 skb->csum);
238 } else {
Al Viro868c86b2006-11-14 21:35:48 -0800239 __wsum tmp_csum = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700240
241 skb_queue_walk(&sk->sk_write_queue, skb) {
242 tmp_csum = csum_add(tmp_csum, skb->csum);
243 }
244
245 tmp_csum = csum_partial((char *)icmp6h,
246 sizeof(struct icmp6hdr), tmp_csum);
Al Viro868c86b2006-11-14 21:35:48 -0800247 icmp6h->icmp6_cksum = csum_ipv6_magic(&fl->fl6_src,
248 &fl->fl6_dst,
249 len, fl->proto,
250 tmp_csum);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700251 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700252 ip6_push_pending_frames(sk);
253out:
254 return err;
255}
256
/* Context handed to icmpv6_getfrag() through ip6_append_data(). */
struct icmpv6_msg {
	struct sk_buff	*skb;		/* packet whose bytes are copied into the message */
	int		offset;		/* offset in skb at which copying starts */
	uint8_t		type;		/* ICMPv6 type of the message being built */
};
262
263static int icmpv6_getfrag(void *from, char *to, int offset, int len, int odd, struct sk_buff *skb)
264{
265 struct icmpv6_msg *msg = (struct icmpv6_msg *) from;
266 struct sk_buff *org_skb = msg->skb;
Al Viro5f92a732006-11-14 21:36:54 -0800267 __wsum csum = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700268
269 csum = skb_copy_and_csum_bits(org_skb, msg->offset + offset,
270 to, len, csum);
271 skb->csum = csum_block_add(skb->csum, csum, odd);
Yasuyuki Kozakai763ecff2006-02-15 15:24:15 -0800272 if (!(msg->type & ICMPV6_INFOMSG_MASK))
273 nf_ct_attach(skb, org_skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700274 return 0;
275}
276
#if defined(CONFIG_IPV6_MIP6) || defined(CONFIG_IPV6_MIP6_MODULE)
/*
 *	If the packet carried a Home Address destination option (recorded
 *	in IP6CB(skb)->dsthao), exchange the IPv6 source address with the
 *	address stored in that option. A no-op when the option is absent
 *	or cannot be located.
 */
static void mip6_addr_swap(struct sk_buff *skb)
{
	struct inet6_skb_parm *cb = IP6CB(skb);
	struct ipv6hdr *iph = ipv6_hdr(skb);
	struct ipv6_destopt_hao *hao;
	struct in6_addr saved;
	int off;

	if (!cb->dsthao)
		return;

	off = ipv6_find_tlv(skb, cb->dsthao, IPV6_TLV_HAO);
	if (unlikely(off < 0))
		return;

	hao = (struct ipv6_destopt_hao *)(skb_network_header(skb) + off);

	ipv6_addr_copy(&saved, &iph->saddr);
	ipv6_addr_copy(&iph->saddr, &hao->addr);
	ipv6_addr_copy(&hao->addr, &saved);
}
#else
/* Mobile IPv6 not configured: nothing to swap. */
static inline void mip6_addr_swap(struct sk_buff *skb) {}
#endif
300
Linus Torvalds1da177e2005-04-16 15:20:36 -0700301/*
302 * Send an ICMP message in response to a packet in error
303 */
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +0900304void icmpv6_send(struct sk_buff *skb, int type, int code, __u32 info,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700305 struct net_device *dev)
306{
307 struct inet6_dev *idev = NULL;
Arnaldo Carvalho de Melo0660e032007-04-25 17:54:47 -0700308 struct ipv6hdr *hdr = ipv6_hdr(skb);
YOSHIFUJI Hideaki84427d52005-06-13 14:59:44 -0700309 struct sock *sk;
310 struct ipv6_pinfo *np;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700311 struct in6_addr *saddr = NULL;
312 struct dst_entry *dst;
313 struct icmp6hdr tmp_hdr;
314 struct flowi fl;
315 struct icmpv6_msg msg;
316 int iif = 0;
317 int addr_type = 0;
318 int len;
YOSHIFUJI Hideaki41a1f8e2005-09-08 10:19:03 +0900319 int hlimit, tclass;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700320 int err = 0;
321
Arnaldo Carvalho de Melo27a884d2007-04-19 20:29:13 -0700322 if ((u8 *)hdr < skb->head ||
323 (skb->network_header + sizeof(*hdr)) > skb->tail)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700324 return;
325
326 /*
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +0900327 * Make sure we respect the rules
Linus Torvalds1da177e2005-04-16 15:20:36 -0700328 * i.e. RFC 1885 2.4(e)
329 * Rule (e.1) is enforced by not using icmpv6_send
330 * in any code that processes icmp errors.
331 */
332 addr_type = ipv6_addr_type(&hdr->daddr);
333
334 if (ipv6_chk_addr(&hdr->daddr, skb->dev, 0))
335 saddr = &hdr->daddr;
336
337 /*
338 * Dest addr check
339 */
340
341 if ((addr_type & IPV6_ADDR_MULTICAST || skb->pkt_type != PACKET_HOST)) {
342 if (type != ICMPV6_PKT_TOOBIG &&
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +0900343 !(type == ICMPV6_PARAMPROB &&
344 code == ICMPV6_UNK_OPTION &&
Linus Torvalds1da177e2005-04-16 15:20:36 -0700345 (opt_unrec(skb, info))))
346 return;
347
348 saddr = NULL;
349 }
350
351 addr_type = ipv6_addr_type(&hdr->saddr);
352
353 /*
354 * Source addr check
355 */
356
357 if (addr_type & IPV6_ADDR_LINKLOCAL)
358 iif = skb->dev->ifindex;
359
360 /*
YOSHIFUJI Hideaki8de33512005-12-21 22:57:06 +0900361 * Must not send error if the source does not uniquely
362 * identify a single node (RFC2463 Section 2.4).
363 * We check unspecified / multicast addresses here,
364 * and anycast addresses will be checked later.
Linus Torvalds1da177e2005-04-16 15:20:36 -0700365 */
366 if ((addr_type == IPV6_ADDR_ANY) || (addr_type & IPV6_ADDR_MULTICAST)) {
Patrick McHardy64ce2072005-08-09 20:50:53 -0700367 LIMIT_NETDEBUG(KERN_DEBUG "icmpv6_send: addr_any/mcast source\n");
Linus Torvalds1da177e2005-04-16 15:20:36 -0700368 return;
369 }
370
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +0900371 /*
Linus Torvalds1da177e2005-04-16 15:20:36 -0700372 * Never answer to a ICMP packet.
373 */
374 if (is_ineligible(skb)) {
Patrick McHardy64ce2072005-08-09 20:50:53 -0700375 LIMIT_NETDEBUG(KERN_DEBUG "icmpv6_send: no reply to icmp error\n");
Linus Torvalds1da177e2005-04-16 15:20:36 -0700376 return;
377 }
378
Masahide NAKAMURA79383232006-08-23 19:27:25 -0700379 mip6_addr_swap(skb);
380
Linus Torvalds1da177e2005-04-16 15:20:36 -0700381 memset(&fl, 0, sizeof(fl));
382 fl.proto = IPPROTO_ICMPV6;
383 ipv6_addr_copy(&fl.fl6_dst, &hdr->saddr);
384 if (saddr)
385 ipv6_addr_copy(&fl.fl6_src, saddr);
386 fl.oif = iif;
387 fl.fl_icmp_type = type;
388 fl.fl_icmp_code = code;
Venkat Yekkiralabeb8d132006-08-04 23:12:42 -0700389 security_skb_classify_flow(skb, &fl);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700390
391 if (icmpv6_xmit_lock())
392 return;
393
YOSHIFUJI Hideaki84427d52005-06-13 14:59:44 -0700394 sk = icmpv6_socket->sk;
395 np = inet6_sk(sk);
396
Linus Torvalds1da177e2005-04-16 15:20:36 -0700397 if (!icmpv6_xrlim_allow(sk, type, &fl))
398 goto out;
399
400 tmp_hdr.icmp6_type = type;
401 tmp_hdr.icmp6_code = code;
402 tmp_hdr.icmp6_cksum = 0;
403 tmp_hdr.icmp6_pointer = htonl(info);
404
405 if (!fl.oif && ipv6_addr_is_multicast(&fl.fl6_dst))
406 fl.oif = np->mcast_oif;
407
408 err = ip6_dst_lookup(sk, &dst, &fl);
409 if (err)
410 goto out;
YOSHIFUJI Hideaki8de33512005-12-21 22:57:06 +0900411
412 /*
413 * We won't send icmp if the destination is known
414 * anycast.
415 */
416 if (((struct rt6_info *)dst)->rt6i_flags & RTF_ANYCAST) {
417 LIMIT_NETDEBUG(KERN_DEBUG "icmpv6_send: acast source\n");
418 goto out_dst_release;
419 }
420
Linus Torvalds1da177e2005-04-16 15:20:36 -0700421 if ((err = xfrm_lookup(&dst, &fl, sk, 0)) < 0)
Patrick McHardye1044112005-09-08 15:11:55 -0700422 goto out;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700423
424 if (ipv6_addr_is_multicast(&fl.fl6_dst))
425 hlimit = np->mcast_hops;
426 else
427 hlimit = np->hop_limit;
428 if (hlimit < 0)
429 hlimit = dst_metric(dst, RTAX_HOPLIMIT);
430 if (hlimit < 0)
431 hlimit = ipv6_get_hoplimit(dst->dev);
432
YOSHIFUJI Hideakie012d512006-09-13 20:01:28 -0700433 tclass = np->tclass;
YOSHIFUJI Hideaki41a1f8e2005-09-08 10:19:03 +0900434 if (tclass < 0)
435 tclass = 0;
436
Linus Torvalds1da177e2005-04-16 15:20:36 -0700437 msg.skb = skb;
Arnaldo Carvalho de Melobbe735e2007-03-10 22:16:10 -0300438 msg.offset = skb_network_offset(skb);
Yasuyuki Kozakai763ecff2006-02-15 15:24:15 -0800439 msg.type = type;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700440
441 len = skb->len - msg.offset;
442 len = min_t(unsigned int, len, IPV6_MIN_MTU - sizeof(struct ipv6hdr) -sizeof(struct icmp6hdr));
443 if (len < 0) {
Patrick McHardy64ce2072005-08-09 20:50:53 -0700444 LIMIT_NETDEBUG(KERN_DEBUG "icmp: len problem\n");
Linus Torvalds1da177e2005-04-16 15:20:36 -0700445 goto out_dst_release;
446 }
447
448 idev = in6_dev_get(skb->dev);
449
450 err = ip6_append_data(sk, icmpv6_getfrag, &msg,
451 len + sizeof(struct icmp6hdr),
452 sizeof(struct icmp6hdr),
YOSHIFUJI Hideaki41a1f8e2005-09-08 10:19:03 +0900453 hlimit, tclass, NULL, &fl, (struct rt6_info*)dst,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700454 MSG_DONTWAIT);
455 if (err) {
456 ip6_flush_pending_frames(sk);
457 goto out_put;
458 }
459 err = icmpv6_push_pending_frames(sk, &fl, &tmp_hdr, len + sizeof(struct icmp6hdr));
460
Linus Torvalds1da177e2005-04-16 15:20:36 -0700461 ICMP6_INC_STATS_BH(idev, ICMP6_MIB_OUTMSGS);
462
463out_put:
464 if (likely(idev != NULL))
465 in6_dev_put(idev);
466out_dst_release:
467 dst_release(dst);
468out:
469 icmpv6_xmit_unlock();
470}
471
YOSHIFUJI Hideaki71590392007-02-22 22:05:40 +0900472EXPORT_SYMBOL(icmpv6_send);
473
Linus Torvalds1da177e2005-04-16 15:20:36 -0700474static void icmpv6_echo_reply(struct sk_buff *skb)
475{
YOSHIFUJI Hideaki84427d52005-06-13 14:59:44 -0700476 struct sock *sk;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700477 struct inet6_dev *idev;
YOSHIFUJI Hideaki84427d52005-06-13 14:59:44 -0700478 struct ipv6_pinfo *np;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700479 struct in6_addr *saddr = NULL;
Arnaldo Carvalho de Melocc70ab22007-03-13 14:03:22 -0300480 struct icmp6hdr *icmph = icmp6_hdr(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700481 struct icmp6hdr tmp_hdr;
482 struct flowi fl;
483 struct icmpv6_msg msg;
484 struct dst_entry *dst;
485 int err = 0;
486 int hlimit;
YOSHIFUJI Hideaki41a1f8e2005-09-08 10:19:03 +0900487 int tclass;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700488
Arnaldo Carvalho de Melo0660e032007-04-25 17:54:47 -0700489 saddr = &ipv6_hdr(skb)->daddr;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700490
491 if (!ipv6_unicast_destination(skb))
492 saddr = NULL;
493
494 memcpy(&tmp_hdr, icmph, sizeof(tmp_hdr));
495 tmp_hdr.icmp6_type = ICMPV6_ECHO_REPLY;
496
497 memset(&fl, 0, sizeof(fl));
498 fl.proto = IPPROTO_ICMPV6;
Arnaldo Carvalho de Melo0660e032007-04-25 17:54:47 -0700499 ipv6_addr_copy(&fl.fl6_dst, &ipv6_hdr(skb)->saddr);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700500 if (saddr)
501 ipv6_addr_copy(&fl.fl6_src, saddr);
502 fl.oif = skb->dev->ifindex;
503 fl.fl_icmp_type = ICMPV6_ECHO_REPLY;
Venkat Yekkiralabeb8d132006-08-04 23:12:42 -0700504 security_skb_classify_flow(skb, &fl);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700505
506 if (icmpv6_xmit_lock())
507 return;
508
YOSHIFUJI Hideaki84427d52005-06-13 14:59:44 -0700509 sk = icmpv6_socket->sk;
510 np = inet6_sk(sk);
511
Linus Torvalds1da177e2005-04-16 15:20:36 -0700512 if (!fl.oif && ipv6_addr_is_multicast(&fl.fl6_dst))
513 fl.oif = np->mcast_oif;
514
515 err = ip6_dst_lookup(sk, &dst, &fl);
516 if (err)
517 goto out;
518 if ((err = xfrm_lookup(&dst, &fl, sk, 0)) < 0)
Patrick McHardye1044112005-09-08 15:11:55 -0700519 goto out;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700520
521 if (ipv6_addr_is_multicast(&fl.fl6_dst))
522 hlimit = np->mcast_hops;
523 else
524 hlimit = np->hop_limit;
525 if (hlimit < 0)
526 hlimit = dst_metric(dst, RTAX_HOPLIMIT);
527 if (hlimit < 0)
528 hlimit = ipv6_get_hoplimit(dst->dev);
529
YOSHIFUJI Hideakie012d512006-09-13 20:01:28 -0700530 tclass = np->tclass;
YOSHIFUJI Hideaki41a1f8e2005-09-08 10:19:03 +0900531 if (tclass < 0)
532 tclass = 0;
533
Linus Torvalds1da177e2005-04-16 15:20:36 -0700534 idev = in6_dev_get(skb->dev);
535
536 msg.skb = skb;
537 msg.offset = 0;
Yasuyuki Kozakai763ecff2006-02-15 15:24:15 -0800538 msg.type = ICMPV6_ECHO_REPLY;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700539
540 err = ip6_append_data(sk, icmpv6_getfrag, &msg, skb->len + sizeof(struct icmp6hdr),
YOSHIFUJI Hideaki41a1f8e2005-09-08 10:19:03 +0900541 sizeof(struct icmp6hdr), hlimit, tclass, NULL, &fl,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700542 (struct rt6_info*)dst, MSG_DONTWAIT);
543
544 if (err) {
545 ip6_flush_pending_frames(sk);
546 goto out_put;
547 }
548 err = icmpv6_push_pending_frames(sk, &fl, &tmp_hdr, skb->len + sizeof(struct icmp6hdr));
549
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +0900550out_put:
Linus Torvalds1da177e2005-04-16 15:20:36 -0700551 if (likely(idev != NULL))
552 in6_dev_put(idev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700553 dst_release(dst);
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +0900554out:
Linus Torvalds1da177e2005-04-16 15:20:36 -0700555 icmpv6_xmit_unlock();
556}
557
Al Viro04ce6902006-11-08 00:21:01 -0800558static void icmpv6_notify(struct sk_buff *skb, int type, int code, __be32 info)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700559{
560 struct in6_addr *saddr, *daddr;
561 struct inet6_protocol *ipprot;
562 struct sock *sk;
563 int inner_offset;
564 int hash;
565 u8 nexthdr;
566
567 if (!pskb_may_pull(skb, sizeof(struct ipv6hdr)))
568 return;
569
570 nexthdr = ((struct ipv6hdr *)skb->data)->nexthdr;
571 if (ipv6_ext_hdr(nexthdr)) {
572 /* now skip over extension headers */
Herbert Xu0d3d0772005-04-24 20:16:19 -0700573 inner_offset = ipv6_skip_exthdr(skb, sizeof(struct ipv6hdr), &nexthdr);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700574 if (inner_offset<0)
575 return;
576 } else {
577 inner_offset = sizeof(struct ipv6hdr);
578 }
579
580 /* Checkin header including 8 bytes of inner protocol header. */
581 if (!pskb_may_pull(skb, inner_offset+8))
582 return;
583
Arnaldo Carvalho de Melo0660e032007-04-25 17:54:47 -0700584 saddr = &ipv6_hdr(skb)->saddr;
585 daddr = &ipv6_hdr(skb)->daddr;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700586
587 /* BUGGG_FUTURE: we should try to parse exthdrs in this packet.
588 Without this we will not able f.e. to make source routed
589 pmtu discovery.
590 Corresponding argument (opt) to notifiers is already added.
591 --ANK (980726)
592 */
593
594 hash = nexthdr & (MAX_INET_PROTOS - 1);
595
596 rcu_read_lock();
597 ipprot = rcu_dereference(inet6_protos[hash]);
598 if (ipprot && ipprot->err_handler)
599 ipprot->err_handler(skb, NULL, type, code, inner_offset, info);
600 rcu_read_unlock();
601
602 read_lock(&raw_v6_lock);
603 if ((sk = sk_head(&raw_v6_htable[hash])) != NULL) {
Dmitry Butskoyf13ec932007-07-14 23:53:08 -0700604 while ((sk = __raw_v6_lookup(sk, nexthdr, saddr, daddr,
YOSHIFUJI Hideaki2dac4b92005-09-01 17:44:49 -0700605 IP6CB(skb)->iif))) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700606 rawv6_err(sk, skb, NULL, type, code, inner_offset, info);
607 sk = sk_next(sk);
608 }
609 }
610 read_unlock(&raw_v6_lock);
611}
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +0900612
Linus Torvalds1da177e2005-04-16 15:20:36 -0700613/*
614 * Handle icmp messages
615 */
616
Herbert Xue5bbef22007-10-15 12:50:28 -0700617static int icmpv6_rcv(struct sk_buff *skb)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700618{
Linus Torvalds1da177e2005-04-16 15:20:36 -0700619 struct net_device *dev = skb->dev;
620 struct inet6_dev *idev = __in6_dev_get(dev);
621 struct in6_addr *saddr, *daddr;
622 struct ipv6hdr *orig_hdr;
623 struct icmp6hdr *hdr;
624 int type;
625
626 ICMP6_INC_STATS_BH(idev, ICMP6_MIB_INMSGS);
627
Arnaldo Carvalho de Melo0660e032007-04-25 17:54:47 -0700628 saddr = &ipv6_hdr(skb)->saddr;
629 daddr = &ipv6_hdr(skb)->daddr;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700630
631 /* Perform checksum. */
Herbert Xufb286bb2005-11-10 13:01:24 -0800632 switch (skb->ip_summed) {
Patrick McHardy84fa7932006-08-29 16:44:56 -0700633 case CHECKSUM_COMPLETE:
Herbert Xufb286bb2005-11-10 13:01:24 -0800634 if (!csum_ipv6_magic(saddr, daddr, skb->len, IPPROTO_ICMPV6,
635 skb->csum))
636 break;
637 /* fall through */
638 case CHECKSUM_NONE:
Al Viro868c86b2006-11-14 21:35:48 -0800639 skb->csum = ~csum_unfold(csum_ipv6_magic(saddr, daddr, skb->len,
640 IPPROTO_ICMPV6, 0));
Herbert Xufb286bb2005-11-10 13:01:24 -0800641 if (__skb_checksum_complete(skb)) {
Joe Perches46b86a22006-01-13 14:29:07 -0800642 LIMIT_NETDEBUG(KERN_DEBUG "ICMPv6 checksum failed [" NIP6_FMT " > " NIP6_FMT "]\n",
Patrick McHardy64ce2072005-08-09 20:50:53 -0700643 NIP6(*saddr), NIP6(*daddr));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700644 goto discard_it;
645 }
646 }
647
648 if (!pskb_pull(skb, sizeof(struct icmp6hdr)))
649 goto discard_it;
650
Arnaldo Carvalho de Melocc70ab22007-03-13 14:03:22 -0300651 hdr = icmp6_hdr(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700652
653 type = hdr->icmp6_type;
654
David L Stevens14878f72007-09-16 16:52:35 -0700655 ICMP6MSGIN_INC_STATS_BH(idev, type);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700656
657 switch (type) {
658 case ICMPV6_ECHO_REQUEST:
659 icmpv6_echo_reply(skb);
660 break;
661
662 case ICMPV6_ECHO_REPLY:
663 /* we couldn't care less */
664 break;
665
666 case ICMPV6_PKT_TOOBIG:
667 /* BUGGG_FUTURE: if packet contains rthdr, we cannot update
668 standard destination cache. Seems, only "advanced"
669 destination cache will allow to solve this problem
670 --ANK (980726)
671 */
672 if (!pskb_may_pull(skb, sizeof(struct ipv6hdr)))
673 goto discard_it;
Arnaldo Carvalho de Melocc70ab22007-03-13 14:03:22 -0300674 hdr = icmp6_hdr(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700675 orig_hdr = (struct ipv6hdr *) (hdr + 1);
676 rt6_pmtu_discovery(&orig_hdr->daddr, &orig_hdr->saddr, dev,
677 ntohl(hdr->icmp6_mtu));
678
679 /*
680 * Drop through to notify
681 */
682
683 case ICMPV6_DEST_UNREACH:
684 case ICMPV6_TIME_EXCEED:
685 case ICMPV6_PARAMPROB:
686 icmpv6_notify(skb, type, hdr->icmp6_code, hdr->icmp6_mtu);
687 break;
688
689 case NDISC_ROUTER_SOLICITATION:
690 case NDISC_ROUTER_ADVERTISEMENT:
691 case NDISC_NEIGHBOUR_SOLICITATION:
692 case NDISC_NEIGHBOUR_ADVERTISEMENT:
693 case NDISC_REDIRECT:
694 ndisc_rcv(skb);
695 break;
696
697 case ICMPV6_MGM_QUERY:
698 igmp6_event_query(skb);
699 break;
700
701 case ICMPV6_MGM_REPORT:
702 igmp6_event_report(skb);
703 break;
704
705 case ICMPV6_MGM_REDUCTION:
706 case ICMPV6_NI_QUERY:
707 case ICMPV6_NI_REPLY:
708 case ICMPV6_MLD2_REPORT:
709 case ICMPV6_DHAAD_REQUEST:
710 case ICMPV6_DHAAD_REPLY:
711 case ICMPV6_MOBILE_PREFIX_SOL:
712 case ICMPV6_MOBILE_PREFIX_ADV:
713 break;
714
715 default:
Patrick McHardy64ce2072005-08-09 20:50:53 -0700716 LIMIT_NETDEBUG(KERN_DEBUG "icmpv6: msg of unknown type\n");
Linus Torvalds1da177e2005-04-16 15:20:36 -0700717
718 /* informational */
719 if (type & ICMPV6_INFOMSG_MASK)
720 break;
721
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +0900722 /*
723 * error of unknown type.
724 * must pass to upper level
Linus Torvalds1da177e2005-04-16 15:20:36 -0700725 */
726
727 icmpv6_notify(skb, type, hdr->icmp6_code, hdr->icmp6_mtu);
Stephen Hemminger3ff50b72007-04-20 17:09:22 -0700728 }
729
Linus Torvalds1da177e2005-04-16 15:20:36 -0700730 kfree_skb(skb);
731 return 0;
732
733discard_it:
734 ICMP6_INC_STATS_BH(idev, ICMP6_MIB_INERRORS);
735 kfree_skb(skb);
736 return 0;
737}
738
Ingo Molnar640c41c2006-08-15 00:06:56 -0700739/*
740 * Special lock-class for __icmpv6_socket:
741 */
742static struct lock_class_key icmpv6_socket_sk_dst_lock_key;
743
Linus Torvalds1da177e2005-04-16 15:20:36 -0700744int __init icmpv6_init(struct net_proto_family *ops)
745{
746 struct sock *sk;
747 int err, i, j;
748
KAMEZAWA Hiroyuki6f912042006-04-10 22:52:50 -0700749 for_each_possible_cpu(i) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700750 err = sock_create_kern(PF_INET6, SOCK_RAW, IPPROTO_ICMPV6,
751 &per_cpu(__icmpv6_socket, i));
752 if (err < 0) {
753 printk(KERN_ERR
754 "Failed to initialize the ICMP6 control socket "
755 "(err %d).\n",
756 err);
757 goto fail;
758 }
759
760 sk = per_cpu(__icmpv6_socket, i)->sk;
761 sk->sk_allocation = GFP_ATOMIC;
Ingo Molnar640c41c2006-08-15 00:06:56 -0700762 /*
763 * Split off their lock-class, because sk->sk_dst_lock
764 * gets used from softirqs, which is safe for
765 * __icmpv6_socket (because those never get directly used
766 * via userspace syscalls), but unsafe for normal sockets.
767 */
768 lockdep_set_class(&sk->sk_dst_lock,
769 &icmpv6_socket_sk_dst_lock_key);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700770
771 /* Enough space for 2 64K ICMP packets, including
772 * sk_buff struct overhead.
773 */
774 sk->sk_sndbuf =
775 (2 * ((64 * 1024) + sizeof(struct sk_buff)));
776
777 sk->sk_prot->unhash(sk);
778 }
779
780
781 if (inet6_add_protocol(&icmpv6_protocol, IPPROTO_ICMPV6) < 0) {
782 printk(KERN_ERR "Failed to register ICMP6 protocol\n");
783 err = -EAGAIN;
784 goto fail;
785 }
786
787 return 0;
788
789 fail:
790 for (j = 0; j < i; j++) {
791 if (!cpu_possible(j))
792 continue;
793 sock_release(per_cpu(__icmpv6_socket, j));
794 }
795
796 return err;
797}
798
799void icmpv6_cleanup(void)
800{
801 int i;
802
KAMEZAWA Hiroyuki6f912042006-04-10 22:52:50 -0700803 for_each_possible_cpu(i) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700804 sock_release(per_cpu(__icmpv6_socket, i));
805 }
806 inet6_del_protocol(&icmpv6_protocol, IPPROTO_ICMPV6);
807}
808
/*
 *	Translation of Destination Unreachable codes, indexed by the
 *	ICMPv6 code: the errno value to report and whether the error is
 *	fatal. Used by icmpv6_err_convert().
 */
static const struct icmp6_err {
	int err;
	int fatal;
} tab_unreach[] = {
	/*  err            fatal */
	{ ENETUNREACH,	0 },	/* NOROUTE */
	{ EACCES,	1 },	/* ADM_PROHIBITED */
	{ EHOSTUNREACH,	0 },	/* Was NOT_NEIGHBOUR, now reserved */
	{ EHOSTUNREACH,	0 },	/* ADDR_UNREACH */
	{ ECONNREFUSED,	1 },	/* PORT_UNREACH */
};
834
835int icmpv6_err_convert(int type, int code, int *err)
836{
837 int fatal = 0;
838
839 *err = EPROTO;
840
841 switch (type) {
842 case ICMPV6_DEST_UNREACH:
843 fatal = 1;
844 if (code <= ICMPV6_PORT_UNREACH) {
845 *err = tab_unreach[code].err;
846 fatal = tab_unreach[code].fatal;
847 }
848 break;
849
850 case ICMPV6_PKT_TOOBIG:
851 *err = EMSGSIZE;
852 break;
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +0900853
Linus Torvalds1da177e2005-04-16 15:20:36 -0700854 case ICMPV6_PARAMPROB:
855 *err = EPROTO;
856 fatal = 1;
857 break;
858
859 case ICMPV6_TIME_EXCEED:
860 *err = EHOSTUNREACH;
861 break;
Stephen Hemminger3ff50b72007-04-20 17:09:22 -0700862 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700863
864 return fatal;
865}
866
YOSHIFUJI Hideaki71590392007-02-22 22:05:40 +0900867EXPORT_SYMBOL(icmpv6_err_convert);
868
#ifdef CONFIG_SYSCTL
/*
 * sysctl entries for ICMPv6: "ratelimit" exposes sysctl_icmpv6_time as
 * a read/write (0644) integer. The table ends with a zero ctl_name entry.
 */
ctl_table ipv6_icmp_table[] = {
	{
		.ctl_name	= NET_IPV6_ICMP_RATELIMIT,
		.procname	= "ratelimit",
		.data		= &sysctl_icmpv6_time,
		.maxlen		= sizeof(int),
		.mode		= 0644,
		.proc_handler	= proc_dointvec
	},
	{ .ctl_name = 0 },
};
#endif
882