blob: 53b546019fd58f9c3565b98f71b9b022324454f8 [file] [log] [blame]
/*
 *	Neighbour Discovery for IPv6
 *	Linux INET6 implementation
 *
 *	Authors:
 *	Pedro Roque		<roque@di.fc.ul.pt>
 *	Mike Shaver		<shaver@ingenia.com>
 *
 *	This program is free software; you can redistribute it and/or
 *	modify it under the terms of the GNU General Public License
 *	as published by the Free Software Foundation; either version
 *	2 of the License, or (at your option) any later version.
 */
14
/*
 *	Changes:
 *
 *	Pierre Ynard			:	export userland ND options
 *						through netlink (RDNSS support)
 *	Lars Fenneberg			:	fixed MTU setting on receipt
 *						of an RA.
 *	Janos Farkas			:	kmalloc failure checks
 *	Alexey Kuznetsov		:	state machine reworked
 *						and moved to net/core.
 *	Pekka Savola			:	RFC2461 validation
 *	YOSHIFUJI Hideaki @USAGI	:	Verify ND options properly
 */
28
/*
 * Debug verbosity of the Neighbour Discovery code.
 *
 * ND_PRINTKn expands to the rate-limited ND_PRINTK when ND_DEBUG >= n
 * and to an empty statement otherwise; ND_PRINTK0 is always active.
 * Set to 3 to get tracing...
 */
#define ND_DEBUG 1

/* printk() guarded by net_ratelimit(). */
#define ND_PRINTK(fmt, args...) do { if (net_ratelimit()) { printk(fmt, ## args); } } while(0)
/* Discards its arguments; they are never evaluated. */
#define ND_NOPRINTK(x...) do { ; } while(0)

#define ND_PRINTK0 ND_PRINTK

#if ND_DEBUG >= 1
#define ND_PRINTK1 ND_PRINTK
#else
#define ND_PRINTK1 ND_NOPRINTK
#endif

#if ND_DEBUG >= 2
#define ND_PRINTK2 ND_PRINTK
#else
#define ND_PRINTK2 ND_NOPRINTK
#endif

#if ND_DEBUG >= 3
#define ND_PRINTK3 ND_PRINTK
#else
#define ND_PRINTK3 ND_NOPRINTK
#endif
50
51#include <linux/module.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070052#include <linux/errno.h>
53#include <linux/types.h>
54#include <linux/socket.h>
55#include <linux/sockios.h>
56#include <linux/sched.h>
57#include <linux/net.h>
58#include <linux/in6.h>
59#include <linux/route.h>
60#include <linux/init.h>
61#include <linux/rcupdate.h>
62#ifdef CONFIG_SYSCTL
63#include <linux/sysctl.h>
64#endif
65
Thomas Graf18237302006-08-04 23:04:54 -070066#include <linux/if_addr.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070067#include <linux/if_arp.h>
68#include <linux/ipv6.h>
69#include <linux/icmpv6.h>
70#include <linux/jhash.h>
71
72#include <net/sock.h>
73#include <net/snmp.h>
74
75#include <net/ipv6.h>
76#include <net/protocol.h>
77#include <net/ndisc.h>
78#include <net/ip6_route.h>
79#include <net/addrconf.h>
80#include <net/icmp.h>
81
Pierre Ynard31910572007-10-10 21:22:05 -070082#include <net/netlink.h>
83#include <linux/rtnetlink.h>
84
Linus Torvalds1da177e2005-04-16 15:20:36 -070085#include <net/flow.h>
86#include <net/ip6_checksum.h>
87#include <linux/proc_fs.h>
88
89#include <linux/netfilter.h>
90#include <linux/netfilter_ipv6.h>
91
Linus Torvalds1da177e2005-04-16 15:20:36 -070092static u32 ndisc_hash(const void *pkey, const struct net_device *dev);
93static int ndisc_constructor(struct neighbour *neigh);
94static void ndisc_solicit(struct neighbour *neigh, struct sk_buff *skb);
95static void ndisc_error_report(struct neighbour *neigh, struct sk_buff *skb);
96static int pndisc_constructor(struct pneigh_entry *n);
97static void pndisc_destructor(struct pneigh_entry *n);
98static void pndisc_redo(struct sk_buff *skb);
99
100static struct neigh_ops ndisc_generic_ops = {
101 .family = AF_INET6,
102 .solicit = ndisc_solicit,
103 .error_report = ndisc_error_report,
104 .output = neigh_resolve_output,
105 .connected_output = neigh_connected_output,
106 .hh_output = dev_queue_xmit,
107 .queue_xmit = dev_queue_xmit,
108};
109
110static struct neigh_ops ndisc_hh_ops = {
111 .family = AF_INET6,
112 .solicit = ndisc_solicit,
113 .error_report = ndisc_error_report,
114 .output = neigh_resolve_output,
115 .connected_output = neigh_resolve_output,
116 .hh_output = dev_queue_xmit,
117 .queue_xmit = dev_queue_xmit,
118};
119
120
121static struct neigh_ops ndisc_direct_ops = {
122 .family = AF_INET6,
123 .output = dev_queue_xmit,
124 .connected_output = dev_queue_xmit,
125 .hh_output = dev_queue_xmit,
126 .queue_xmit = dev_queue_xmit,
127};
128
129struct neigh_table nd_tbl = {
130 .family = AF_INET6,
131 .entry_size = sizeof(struct neighbour) + sizeof(struct in6_addr),
132 .key_len = sizeof(struct in6_addr),
133 .hash = ndisc_hash,
134 .constructor = ndisc_constructor,
135 .pconstructor = pndisc_constructor,
136 .pdestructor = pndisc_destructor,
137 .proxy_redo = pndisc_redo,
138 .id = "ndisc_cache",
139 .parms = {
140 .tbl = &nd_tbl,
141 .base_reachable_time = 30 * HZ,
142 .retrans_time = 1 * HZ,
143 .gc_staletime = 60 * HZ,
144 .reachable_time = 30 * HZ,
145 .delay_probe_time = 5 * HZ,
146 .queue_len = 3,
147 .ucast_probes = 3,
148 .mcast_probes = 3,
149 .anycast_delay = 1 * HZ,
150 .proxy_delay = (8 * HZ) / 10,
151 .proxy_qlen = 64,
152 },
153 .gc_interval = 30 * HZ,
154 .gc_thresh1 = 128,
155 .gc_thresh2 = 512,
156 .gc_thresh3 = 1024,
157};
158
159/* ND options */
160struct ndisc_options {
YOSHIFUJI Hideaki70ceb4f2006-03-20 17:06:24 -0800161 struct nd_opt_hdr *nd_opt_array[__ND_OPT_ARRAY_MAX];
162#ifdef CONFIG_IPV6_ROUTE_INFO
163 struct nd_opt_hdr *nd_opts_ri;
164 struct nd_opt_hdr *nd_opts_ri_end;
165#endif
Pierre Ynard31910572007-10-10 21:22:05 -0700166 struct nd_opt_hdr *nd_useropts;
167 struct nd_opt_hdr *nd_useropts_end;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700168};
169
/* Named accessors for the per-type slots of ndisc_options.nd_opt_array. */
#define nd_opts_src_lladdr	nd_opt_array[ND_OPT_SOURCE_LL_ADDR]
#define nd_opts_tgt_lladdr	nd_opt_array[ND_OPT_TARGET_LL_ADDR]
#define nd_opts_pi		nd_opt_array[ND_OPT_PREFIX_INFO]
#define nd_opts_pi_end		nd_opt_array[__ND_OPT_PREFIX_INFO_END]
#define nd_opts_rh		nd_opt_array[ND_OPT_REDIRECT_HDR]
#define nd_opts_mtu		nd_opt_array[ND_OPT_MTU]
176
/*
 * Size in bytes of an ND option carrying @len bytes of payload: two
 * bytes are added for the type/length header and the sum is rounded up
 * to a multiple of 8.
 */
#define NDISC_OPT_SPACE(len)	(((len) + 2 + 7) & ~7)
178
/*
 * Number of padding bytes between the option length byte and the start
 * of the link-layer address for the given ARPHRD_* device type.
 * Only IP-over-InfiniBand currently needs padding (2 bytes); if RFC 3831
 * IPv6-over-Fibre Channel is ever implemented it may also need 2.
 */
static int ndisc_addr_option_pad(unsigned short type)
{
	if (type == ARPHRD_INFINIBAND)
		return 2;

	return 0;
}
192
193static inline int ndisc_opt_addr_space(struct net_device *dev)
194{
195 return NDISC_OPT_SPACE(dev->addr_len + ndisc_addr_option_pad(dev->type));
196}
197
198static u8 *ndisc_fill_addr_option(u8 *opt, int type, void *data, int data_len,
199 unsigned short addr_type)
200{
201 int space = NDISC_OPT_SPACE(data_len);
202 int pad = ndisc_addr_option_pad(addr_type);
203
204 opt[0] = type;
205 opt[1] = space>>3;
206
207 memset(opt + 2, 0, pad);
208 opt += pad;
209 space -= pad;
210
211 memcpy(opt+2, data, data_len);
212 data_len += 2;
213 opt += data_len;
214 if ((space -= data_len) > 0)
215 memset(opt, 0, space);
216 return opt + space;
217}
218
219static struct nd_opt_hdr *ndisc_next_option(struct nd_opt_hdr *cur,
220 struct nd_opt_hdr *end)
221{
222 int type;
223 if (!cur || !end || cur >= end)
224 return NULL;
225 type = cur->nd_opt_type;
226 do {
227 cur = ((void *)cur) + (cur->nd_opt_len << 3);
228 } while(cur < end && cur->nd_opt_type != type);
229 return (cur <= end && cur->nd_opt_type == type ? cur : NULL);
230}
231
Pierre Ynard31910572007-10-10 21:22:05 -0700232static inline int ndisc_is_useropt(struct nd_opt_hdr *opt)
233{
234 return (opt->nd_opt_type == ND_OPT_RDNSS);
235}
236
237static struct nd_opt_hdr *ndisc_next_useropt(struct nd_opt_hdr *cur,
238 struct nd_opt_hdr *end)
239{
240 if (!cur || !end || cur >= end)
241 return NULL;
242 do {
243 cur = ((void *)cur) + (cur->nd_opt_len << 3);
244 } while(cur < end && !ndisc_is_useropt(cur));
245 return (cur <= end && ndisc_is_useropt(cur) ? cur : NULL);
246}
247
Linus Torvalds1da177e2005-04-16 15:20:36 -0700248static struct ndisc_options *ndisc_parse_options(u8 *opt, int opt_len,
249 struct ndisc_options *ndopts)
250{
251 struct nd_opt_hdr *nd_opt = (struct nd_opt_hdr *)opt;
252
253 if (!nd_opt || opt_len < 0 || !ndopts)
254 return NULL;
255 memset(ndopts, 0, sizeof(*ndopts));
256 while (opt_len) {
257 int l;
258 if (opt_len < sizeof(struct nd_opt_hdr))
259 return NULL;
260 l = nd_opt->nd_opt_len << 3;
261 if (opt_len < l || l == 0)
262 return NULL;
263 switch (nd_opt->nd_opt_type) {
264 case ND_OPT_SOURCE_LL_ADDR:
265 case ND_OPT_TARGET_LL_ADDR:
266 case ND_OPT_MTU:
267 case ND_OPT_REDIRECT_HDR:
268 if (ndopts->nd_opt_array[nd_opt->nd_opt_type]) {
269 ND_PRINTK2(KERN_WARNING
270 "%s(): duplicated ND6 option found: type=%d\n",
Harvey Harrison0dc47872008-03-05 20:47:47 -0800271 __func__,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700272 nd_opt->nd_opt_type);
273 } else {
274 ndopts->nd_opt_array[nd_opt->nd_opt_type] = nd_opt;
275 }
276 break;
277 case ND_OPT_PREFIX_INFO:
278 ndopts->nd_opts_pi_end = nd_opt;
Stephen Hemmingercfcabdc2007-10-09 01:59:42 -0700279 if (!ndopts->nd_opt_array[nd_opt->nd_opt_type])
Linus Torvalds1da177e2005-04-16 15:20:36 -0700280 ndopts->nd_opt_array[nd_opt->nd_opt_type] = nd_opt;
281 break;
YOSHIFUJI Hideaki70ceb4f2006-03-20 17:06:24 -0800282#ifdef CONFIG_IPV6_ROUTE_INFO
283 case ND_OPT_ROUTE_INFO:
284 ndopts->nd_opts_ri_end = nd_opt;
285 if (!ndopts->nd_opts_ri)
286 ndopts->nd_opts_ri = nd_opt;
287 break;
288#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -0700289 default:
Pierre Ynard31910572007-10-10 21:22:05 -0700290 if (ndisc_is_useropt(nd_opt)) {
291 ndopts->nd_useropts_end = nd_opt;
292 if (!ndopts->nd_useropts)
293 ndopts->nd_useropts = nd_opt;
294 } else {
295 /*
296 * Unknown options must be silently ignored,
297 * to accommodate future extension to the
298 * protocol.
299 */
300 ND_PRINTK2(KERN_NOTICE
301 "%s(): ignored unsupported option; type=%d, len=%d\n",
Harvey Harrison0dc47872008-03-05 20:47:47 -0800302 __func__,
Pierre Ynard31910572007-10-10 21:22:05 -0700303 nd_opt->nd_opt_type, nd_opt->nd_opt_len);
304 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700305 }
306 opt_len -= l;
307 nd_opt = ((void *)nd_opt) + l;
308 }
309 return ndopts;
310}
311
312static inline u8 *ndisc_opt_addr_data(struct nd_opt_hdr *p,
313 struct net_device *dev)
314{
315 u8 *lladdr = (u8 *)(p + 1);
316 int lladdrlen = p->nd_opt_len << 3;
317 int prepad = ndisc_addr_option_pad(dev->type);
318 if (lladdrlen != NDISC_OPT_SPACE(dev->addr_len + prepad))
319 return NULL;
320 return (lladdr + prepad);
321}
322
323int ndisc_mc_map(struct in6_addr *addr, char *buf, struct net_device *dev, int dir)
324{
325 switch (dev->type) {
326 case ARPHRD_ETHER:
327 case ARPHRD_IEEE802: /* Not sure. Check it later. --ANK */
328 case ARPHRD_FDDI:
329 ipv6_eth_mc_map(addr, buf);
330 return 0;
331 case ARPHRD_IEEE802_TR:
332 ipv6_tr_mc_map(addr,buf);
333 return 0;
334 case ARPHRD_ARCNET:
335 ipv6_arcnet_mc_map(addr, buf);
336 return 0;
337 case ARPHRD_INFINIBAND:
Rolf Manderscheida9e527e2007-12-10 13:38:41 -0700338 ipv6_ib_mc_map(addr, dev->broadcast, buf);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700339 return 0;
340 default:
341 if (dir) {
342 memcpy(buf, dev->broadcast, dev->addr_len);
343 return 0;
344 }
345 }
346 return -EINVAL;
347}
348
YOSHIFUJI Hideaki71590392007-02-22 22:05:40 +0900349EXPORT_SYMBOL(ndisc_mc_map);
350
Linus Torvalds1da177e2005-04-16 15:20:36 -0700351static u32 ndisc_hash(const void *pkey, const struct net_device *dev)
352{
353 const u32 *p32 = pkey;
354 u32 addr_hash, i;
355
356 addr_hash = 0;
357 for (i = 0; i < (sizeof(struct in6_addr) / sizeof(u32)); i++)
358 addr_hash ^= *p32++;
359
360 return jhash_2words(addr_hash, dev->ifindex, nd_tbl.hash_rnd);
361}
362
363static int ndisc_constructor(struct neighbour *neigh)
364{
365 struct in6_addr *addr = (struct in6_addr*)&neigh->primary_key;
366 struct net_device *dev = neigh->dev;
367 struct inet6_dev *in6_dev;
368 struct neigh_parms *parms;
369 int is_multicast = ipv6_addr_is_multicast(addr);
370
371 rcu_read_lock();
372 in6_dev = in6_dev_get(dev);
373 if (in6_dev == NULL) {
374 rcu_read_unlock();
375 return -EINVAL;
376 }
377
378 parms = in6_dev->nd_parms;
379 __neigh_parms_put(neigh->parms);
380 neigh->parms = neigh_parms_clone(parms);
381 rcu_read_unlock();
382
383 neigh->type = is_multicast ? RTN_MULTICAST : RTN_UNICAST;
Stephen Hemminger3b04ddd2007-10-09 01:40:57 -0700384 if (!dev->header_ops) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700385 neigh->nud_state = NUD_NOARP;
386 neigh->ops = &ndisc_direct_ops;
387 neigh->output = neigh->ops->queue_xmit;
388 } else {
389 if (is_multicast) {
390 neigh->nud_state = NUD_NOARP;
391 ndisc_mc_map(addr, neigh->ha, dev, 1);
392 } else if (dev->flags&(IFF_NOARP|IFF_LOOPBACK)) {
393 neigh->nud_state = NUD_NOARP;
394 memcpy(neigh->ha, dev->dev_addr, dev->addr_len);
395 if (dev->flags&IFF_LOOPBACK)
396 neigh->type = RTN_LOCAL;
397 } else if (dev->flags&IFF_POINTOPOINT) {
398 neigh->nud_state = NUD_NOARP;
399 memcpy(neigh->ha, dev->broadcast, dev->addr_len);
400 }
Stephen Hemminger3b04ddd2007-10-09 01:40:57 -0700401 if (dev->header_ops->cache)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700402 neigh->ops = &ndisc_hh_ops;
403 else
404 neigh->ops = &ndisc_generic_ops;
405 if (neigh->nud_state&NUD_VALID)
406 neigh->output = neigh->ops->connected_output;
407 else
408 neigh->output = neigh->ops->output;
409 }
410 in6_dev_put(in6_dev);
411 return 0;
412}
413
414static int pndisc_constructor(struct pneigh_entry *n)
415{
416 struct in6_addr *addr = (struct in6_addr*)&n->key;
417 struct in6_addr maddr;
418 struct net_device *dev = n->dev;
419
420 if (dev == NULL || __in6_dev_get(dev) == NULL)
421 return -EINVAL;
422 addrconf_addr_solict_mult(addr, &maddr);
423 ipv6_dev_mc_inc(dev, &maddr);
424 return 0;
425}
426
427static void pndisc_destructor(struct pneigh_entry *n)
428{
429 struct in6_addr *addr = (struct in6_addr*)&n->key;
430 struct in6_addr maddr;
431 struct net_device *dev = n->dev;
432
433 if (dev == NULL || __in6_dev_get(dev) == NULL)
434 return;
435 addrconf_addr_solict_mult(addr, &maddr);
436 ipv6_dev_mc_dec(dev, &maddr);
437}
438
439/*
440 * Send a Neighbour Advertisement
441 */
YOSHIFUJI Hideakie1ec7842007-04-24 20:44:52 +0900442static void __ndisc_send(struct net_device *dev,
443 struct neighbour *neigh,
444 struct in6_addr *daddr, struct in6_addr *saddr,
445 struct icmp6hdr *icmp6h, struct in6_addr *target,
David L Stevens14878f72007-09-16 16:52:35 -0700446 int llinfo)
YOSHIFUJI Hideakie1ec7842007-04-24 20:44:52 +0900447{
448 struct flowi fl;
449 struct dst_entry *dst;
YOSHIFUJI Hideakic346dca2008-03-25 21:47:49 +0900450 struct net *net = dev_net(dev);
Daniel Lezcano1762f7e2008-03-07 11:15:34 -0800451 struct sock *sk = net->ipv6.ndisc_sk;
YOSHIFUJI Hideakie1ec7842007-04-24 20:44:52 +0900452 struct sk_buff *skb;
453 struct icmp6hdr *hdr;
454 struct inet6_dev *idev;
455 int len;
456 int err;
David L Stevens14878f72007-09-16 16:52:35 -0700457 u8 *opt, type;
YOSHIFUJI Hideakie1ec7842007-04-24 20:44:52 +0900458
David L Stevens14878f72007-09-16 16:52:35 -0700459 type = icmp6h->icmp6_type;
460
Daniel Lezcano1762f7e2008-03-07 11:15:34 -0800461 icmpv6_flow_init(sk, &fl, type, saddr, daddr, dev->ifindex);
YOSHIFUJI Hideakie1ec7842007-04-24 20:44:52 +0900462
YOSHIFUJI Hideaki3b009442007-12-06 16:11:48 -0800463 dst = icmp6_dst_alloc(dev, neigh, daddr);
YOSHIFUJI Hideakie1ec7842007-04-24 20:44:52 +0900464 if (!dst)
465 return;
466
467 err = xfrm_lookup(&dst, &fl, NULL, 0);
468 if (err < 0)
469 return;
470
471 if (!dev->addr_len)
472 llinfo = 0;
473
474 len = sizeof(struct icmp6hdr) + (target ? sizeof(*target) : 0);
475 if (llinfo)
476 len += ndisc_opt_addr_space(dev);
477
478 skb = sock_alloc_send_skb(sk,
479 (MAX_HEADER + sizeof(struct ipv6hdr) +
480 len + LL_RESERVED_SPACE(dev)),
481 1, &err);
482 if (!skb) {
483 ND_PRINTK0(KERN_ERR
484 "ICMPv6 ND: %s() failed to allocate an skb.\n",
Harvey Harrison0dc47872008-03-05 20:47:47 -0800485 __func__);
YOSHIFUJI Hideakie1ec7842007-04-24 20:44:52 +0900486 dst_release(dst);
487 return;
488 }
489
490 skb_reserve(skb, LL_RESERVED_SPACE(dev));
491 ip6_nd_hdr(sk, skb, dev, saddr, daddr, IPPROTO_ICMPV6, len);
492
493 skb->transport_header = skb->tail;
494 skb_put(skb, len);
495
496 hdr = (struct icmp6hdr *)skb_transport_header(skb);
497 memcpy(hdr, icmp6h, sizeof(*hdr));
498
499 opt = skb_transport_header(skb) + sizeof(struct icmp6hdr);
500 if (target) {
501 ipv6_addr_copy((struct in6_addr *)opt, target);
502 opt += sizeof(*target);
503 }
504
505 if (llinfo)
506 ndisc_fill_addr_option(opt, llinfo, dev->dev_addr,
507 dev->addr_len, dev->type);
508
509 hdr->icmp6_cksum = csum_ipv6_magic(saddr, daddr, len,
510 IPPROTO_ICMPV6,
511 csum_partial((__u8 *) hdr,
512 len, 0));
513
514 skb->dst = dst;
515
516 idev = in6_dev_get(dst->dev);
517 IP6_INC_STATS(idev, IPSTATS_MIB_OUTREQUESTS);
518
Patrick McHardy6e23ae22007-11-19 18:53:30 -0800519 err = NF_HOOK(PF_INET6, NF_INET_LOCAL_OUT, skb, NULL, dst->dev,
520 dst_output);
YOSHIFUJI Hideakie1ec7842007-04-24 20:44:52 +0900521 if (!err) {
David L Stevens14878f72007-09-16 16:52:35 -0700522 ICMP6MSGOUT_INC_STATS(idev, type);
YOSHIFUJI Hideakie1ec7842007-04-24 20:44:52 +0900523 ICMP6_INC_STATS(idev, ICMP6_MIB_OUTMSGS);
524 }
525
526 if (likely(idev != NULL))
527 in6_dev_put(idev);
528}
529
Linus Torvalds1da177e2005-04-16 15:20:36 -0700530static void ndisc_send_na(struct net_device *dev, struct neighbour *neigh,
531 struct in6_addr *daddr, struct in6_addr *solicited_addr,
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +0900532 int router, int solicited, int override, int inc_opt)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700533{
534 struct in6_addr tmpaddr;
535 struct inet6_ifaddr *ifp;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700536 struct in6_addr *src_addr;
YOSHIFUJI Hideakie1ec7842007-04-24 20:44:52 +0900537 struct icmp6hdr icmp6h = {
538 .icmp6_type = NDISC_NEIGHBOUR_ADVERTISEMENT,
539 };
Linus Torvalds1da177e2005-04-16 15:20:36 -0700540
541 /* for anycast or proxy, solicited_addr != src_addr */
YOSHIFUJI Hideakic346dca2008-03-25 21:47:49 +0900542 ifp = ipv6_get_ifaddr(dev_net(dev), solicited_addr, dev, 1);
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +0900543 if (ifp) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700544 src_addr = solicited_addr;
Neil Horman95c385b2007-04-25 17:08:10 -0700545 if (ifp->flags & IFA_F_OPTIMISTIC)
546 override = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700547 in6_ifa_put(ifp);
548 } else {
YOSHIFUJI Hideaki7cbca672008-03-25 09:37:42 +0900549 if (ipv6_dev_get_saddr(dev, daddr,
YOSHIFUJI Hideakic346dca2008-03-25 21:47:49 +0900550 inet6_sk(dev_net(dev)->ipv6.ndisc_sk)->srcprefs,
YOSHIFUJI Hideaki7cbca672008-03-25 09:37:42 +0900551 &tmpaddr))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700552 return;
553 src_addr = &tmpaddr;
554 }
555
YOSHIFUJI Hideakie1ec7842007-04-24 20:44:52 +0900556 icmp6h.icmp6_router = router;
557 icmp6h.icmp6_solicited = solicited;
558 icmp6h.icmp6_override = override;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700559
YOSHIFUJI Hideakie1ec7842007-04-24 20:44:52 +0900560 __ndisc_send(dev, neigh, daddr, src_addr,
561 &icmp6h, solicited_addr,
David L Stevens14878f72007-09-16 16:52:35 -0700562 inc_opt ? ND_OPT_TARGET_LL_ADDR : 0);
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +0900563}
Linus Torvalds1da177e2005-04-16 15:20:36 -0700564
565void ndisc_send_ns(struct net_device *dev, struct neighbour *neigh,
566 struct in6_addr *solicit,
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +0900567 struct in6_addr *daddr, struct in6_addr *saddr)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700568{
Linus Torvalds1da177e2005-04-16 15:20:36 -0700569 struct in6_addr addr_buf;
YOSHIFUJI Hideakie1ec7842007-04-24 20:44:52 +0900570 struct icmp6hdr icmp6h = {
571 .icmp6_type = NDISC_NEIGHBOUR_SOLICITATION,
572 };
Linus Torvalds1da177e2005-04-16 15:20:36 -0700573
574 if (saddr == NULL) {
Neil Horman95c385b2007-04-25 17:08:10 -0700575 if (ipv6_get_lladdr(dev, &addr_buf,
576 (IFA_F_TENTATIVE|IFA_F_OPTIMISTIC)))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700577 return;
578 saddr = &addr_buf;
579 }
580
YOSHIFUJI Hideakie1ec7842007-04-24 20:44:52 +0900581 __ndisc_send(dev, neigh, daddr, saddr,
582 &icmp6h, solicit,
David L Stevens14878f72007-09-16 16:52:35 -0700583 !ipv6_addr_any(saddr) ? ND_OPT_SOURCE_LL_ADDR : 0);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700584}
585
586void ndisc_send_rs(struct net_device *dev, struct in6_addr *saddr,
587 struct in6_addr *daddr)
588{
YOSHIFUJI Hideakie1ec7842007-04-24 20:44:52 +0900589 struct icmp6hdr icmp6h = {
590 .icmp6_type = NDISC_ROUTER_SOLICITATION,
591 };
Neil Horman95c385b2007-04-25 17:08:10 -0700592 int send_sllao = dev->addr_len;
Neil Horman95c385b2007-04-25 17:08:10 -0700593
594#ifdef CONFIG_IPV6_OPTIMISTIC_DAD
595 /*
596 * According to section 2.2 of RFC 4429, we must not
597 * send router solicitations with a sllao from
598 * optimistic addresses, but we may send the solicitation
599 * if we don't include the sllao. So here we check
600 * if our address is optimistic, and if so, we
Joe Perchesbea85192007-12-20 14:01:35 -0800601 * suppress the inclusion of the sllao.
Neil Horman95c385b2007-04-25 17:08:10 -0700602 */
603 if (send_sllao) {
YOSHIFUJI Hideakic346dca2008-03-25 21:47:49 +0900604 struct inet6_ifaddr *ifp = ipv6_get_ifaddr(dev_net(dev), saddr,
Daniel Lezcano1cab3da2008-01-10 22:44:09 -0800605 dev, 1);
Neil Horman95c385b2007-04-25 17:08:10 -0700606 if (ifp) {
607 if (ifp->flags & IFA_F_OPTIMISTIC) {
YOSHIFUJI Hideakica043562007-02-28 23:13:20 +0900608 send_sllao = 0;
Neil Horman95c385b2007-04-25 17:08:10 -0700609 }
YOSHIFUJI Hideakica043562007-02-28 23:13:20 +0900610 in6_ifa_put(ifp);
Neil Horman95c385b2007-04-25 17:08:10 -0700611 } else {
612 send_sllao = 0;
613 }
614 }
615#endif
YOSHIFUJI Hideakie1ec7842007-04-24 20:44:52 +0900616 __ndisc_send(dev, NULL, daddr, saddr,
617 &icmp6h, NULL,
David L Stevens14878f72007-09-16 16:52:35 -0700618 send_sllao ? ND_OPT_SOURCE_LL_ADDR : 0);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700619}
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +0900620
Linus Torvalds1da177e2005-04-16 15:20:36 -0700621
/*
 * error_report callback of the ndisc neigh_ops: signal a link failure
 * for the packet's route and free the packet.
 *
 *	"The sender MUST return an ICMP
 *	 destination unreachable"
 */
static void ndisc_error_report(struct neighbour *neigh, struct sk_buff *skb)
{
	dst_link_failure(skb);
	kfree_skb(skb);
}
631
632/* Called with locked neigh: either read or both */
633
634static void ndisc_solicit(struct neighbour *neigh, struct sk_buff *skb)
635{
636 struct in6_addr *saddr = NULL;
637 struct in6_addr mcaddr;
638 struct net_device *dev = neigh->dev;
639 struct in6_addr *target = (struct in6_addr *)&neigh->primary_key;
640 int probes = atomic_read(&neigh->probes);
641
YOSHIFUJI Hideakic346dca2008-03-25 21:47:49 +0900642 if (skb && ipv6_chk_addr(dev_net(dev), &ipv6_hdr(skb)->saddr, dev, 1))
Arnaldo Carvalho de Melo0660e032007-04-25 17:54:47 -0700643 saddr = &ipv6_hdr(skb)->saddr;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700644
645 if ((probes -= neigh->parms->ucast_probes) < 0) {
646 if (!(neigh->nud_state & NUD_VALID)) {
647 ND_PRINTK1(KERN_DEBUG
648 "%s(): trying to ucast probe in NUD_INVALID: "
Joe Perches46b86a22006-01-13 14:29:07 -0800649 NIP6_FMT "\n",
Harvey Harrison0dc47872008-03-05 20:47:47 -0800650 __func__,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700651 NIP6(*target));
652 }
653 ndisc_send_ns(dev, neigh, target, target, saddr);
654 } else if ((probes -= neigh->parms->app_probes) < 0) {
655#ifdef CONFIG_ARPD
656 neigh_app_ns(neigh);
657#endif
658 } else {
659 addrconf_addr_solict_mult(target, &mcaddr);
660 ndisc_send_ns(dev, NULL, target, &mcaddr, saddr);
661 }
662}
663
YOSHIFUJI Hideaki0736ffc2008-03-28 13:37:58 +0900664static int pndisc_is_router(const void *pkey,
665 struct net_device *dev)
Pavel Emelyanovfa86d322008-03-24 14:48:59 -0700666{
667 struct pneigh_entry *n;
YOSHIFUJI Hideaki0736ffc2008-03-28 13:37:58 +0900668 int ret = -1;
Pavel Emelyanovfa86d322008-03-24 14:48:59 -0700669
670 read_lock_bh(&nd_tbl.lock);
YOSHIFUJI Hideaki0736ffc2008-03-28 13:37:58 +0900671 n = __pneigh_lookup(&nd_tbl, dev_net(dev), pkey, dev);
672 if (n)
673 ret = !!(n->flags & NTF_ROUTER);
Pavel Emelyanovfa86d322008-03-24 14:48:59 -0700674 read_unlock_bh(&nd_tbl.lock);
675
YOSHIFUJI Hideaki0736ffc2008-03-28 13:37:58 +0900676 return ret;
Pavel Emelyanovfa86d322008-03-24 14:48:59 -0700677}
678
Linus Torvalds1da177e2005-04-16 15:20:36 -0700679static void ndisc_recv_ns(struct sk_buff *skb)
680{
Arnaldo Carvalho de Melo9c702202007-04-25 18:04:18 -0700681 struct nd_msg *msg = (struct nd_msg *)skb_transport_header(skb);
Arnaldo Carvalho de Melo0660e032007-04-25 17:54:47 -0700682 struct in6_addr *saddr = &ipv6_hdr(skb)->saddr;
683 struct in6_addr *daddr = &ipv6_hdr(skb)->daddr;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700684 u8 *lladdr = NULL;
Arnaldo Carvalho de Melo27a884d2007-04-19 20:29:13 -0700685 u32 ndoptlen = skb->tail - (skb->transport_header +
686 offsetof(struct nd_msg, opt));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700687 struct ndisc_options ndopts;
688 struct net_device *dev = skb->dev;
689 struct inet6_ifaddr *ifp;
690 struct inet6_dev *idev = NULL;
691 struct neighbour *neigh;
692 int dad = ipv6_addr_any(saddr);
693 int inc;
YOSHIFUJI Hideaki0736ffc2008-03-28 13:37:58 +0900694 int is_router = -1;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700695
696 if (ipv6_addr_is_multicast(&msg->target)) {
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +0900697 ND_PRINTK2(KERN_WARNING
Linus Torvalds1da177e2005-04-16 15:20:36 -0700698 "ICMPv6 NS: multicast target address");
699 return;
700 }
701
702 /*
703 * RFC2461 7.1.1:
704 * DAD has to be destined for solicited node multicast address.
705 */
706 if (dad &&
707 !(daddr->s6_addr32[0] == htonl(0xff020000) &&
708 daddr->s6_addr32[1] == htonl(0x00000000) &&
709 daddr->s6_addr32[2] == htonl(0x00000001) &&
710 daddr->s6_addr [12] == 0xff )) {
711 ND_PRINTK2(KERN_WARNING
712 "ICMPv6 NS: bad DAD packet (wrong destination)\n");
713 return;
714 }
715
716 if (!ndisc_parse_options(msg->opt, ndoptlen, &ndopts)) {
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +0900717 ND_PRINTK2(KERN_WARNING
Linus Torvalds1da177e2005-04-16 15:20:36 -0700718 "ICMPv6 NS: invalid ND options\n");
719 return;
720 }
721
722 if (ndopts.nd_opts_src_lladdr) {
723 lladdr = ndisc_opt_addr_data(ndopts.nd_opts_src_lladdr, dev);
724 if (!lladdr) {
725 ND_PRINTK2(KERN_WARNING
726 "ICMPv6 NS: invalid link-layer address length\n");
727 return;
728 }
729
730 /* RFC2461 7.1.1:
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +0900731 * If the IP source address is the unspecified address,
732 * there MUST NOT be source link-layer address option
Linus Torvalds1da177e2005-04-16 15:20:36 -0700733 * in the message.
734 */
735 if (dad) {
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +0900736 ND_PRINTK2(KERN_WARNING
Linus Torvalds1da177e2005-04-16 15:20:36 -0700737 "ICMPv6 NS: bad DAD packet (link-layer address option)\n");
738 return;
739 }
740 }
741
742 inc = ipv6_addr_is_multicast(daddr);
743
YOSHIFUJI Hideakic346dca2008-03-25 21:47:49 +0900744 ifp = ipv6_get_ifaddr(dev_net(dev), &msg->target, dev, 1);
Daniel Lezcanoa18bc692008-03-07 11:14:49 -0800745 if (ifp) {
Neil Horman95c385b2007-04-25 17:08:10 -0700746
747 if (ifp->flags & (IFA_F_TENTATIVE|IFA_F_OPTIMISTIC)) {
748 if (dad) {
749 if (dev->type == ARPHRD_IEEE802_TR) {
Arnaldo Carvalho de Melo98e399f2007-03-19 15:33:04 -0700750 const unsigned char *sadr;
751 sadr = skb_mac_header(skb);
Neil Horman95c385b2007-04-25 17:08:10 -0700752 if (((sadr[8] ^ dev->dev_addr[0]) & 0x7f) == 0 &&
753 sadr[9] == dev->dev_addr[1] &&
754 sadr[10] == dev->dev_addr[2] &&
755 sadr[11] == dev->dev_addr[3] &&
756 sadr[12] == dev->dev_addr[4] &&
757 sadr[13] == dev->dev_addr[5]) {
758 /* looped-back to us */
759 goto out;
760 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700761 }
Neil Horman95c385b2007-04-25 17:08:10 -0700762
763 /*
764 * We are colliding with another node
765 * who is doing DAD
766 * so fail our DAD process
767 */
768 addrconf_dad_failure(ifp);
Denis V. Lunev9e3be4b2007-09-11 11:04:49 +0200769 return;
Neil Horman95c385b2007-04-25 17:08:10 -0700770 } else {
771 /*
772 * This is not a dad solicitation.
773 * If we are an optimistic node,
774 * we should respond.
775 * Otherwise, we should ignore it.
776 */
777 if (!(ifp->flags & IFA_F_OPTIMISTIC))
778 goto out;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700779 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700780 }
781
782 idev = ifp->idev;
783 } else {
784 idev = in6_dev_get(dev);
785 if (!idev) {
786 /* XXX: count this drop? */
787 return;
788 }
789
Daniel Lezcano6ab57e72008-03-26 16:52:32 -0700790 if (ipv6_chk_acast_addr(dev_net(dev), dev, &msg->target) ||
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +0900791 (idev->cnf.forwarding &&
YOSHIFUJI Hideakifbea49e2006-09-22 14:43:49 -0700792 (ipv6_devconf.proxy_ndp || idev->cnf.proxy_ndp) &&
YOSHIFUJI Hideaki0736ffc2008-03-28 13:37:58 +0900793 (is_router = pndisc_is_router(&msg->target, dev)) >= 0)) {
Patrick McHardya61bbcf2005-08-14 17:24:31 -0700794 if (!(NEIGH_CB(skb)->flags & LOCALLY_ENQUEUED) &&
Linus Torvalds1da177e2005-04-16 15:20:36 -0700795 skb->pkt_type != PACKET_HOST &&
796 inc != 0 &&
797 idev->nd_parms->proxy_delay != 0) {
798 /*
799 * for anycast or proxy,
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +0900800 * sender should delay its response
801 * by a random time between 0 and
Linus Torvalds1da177e2005-04-16 15:20:36 -0700802 * MAX_ANYCAST_DELAY_TIME seconds.
803 * (RFC2461) -- yoshfuji
804 */
805 struct sk_buff *n = skb_clone(skb, GFP_ATOMIC);
806 if (n)
807 pneigh_enqueue(&nd_tbl, idev->nd_parms, n);
808 goto out;
809 }
810 } else
811 goto out;
812 }
813
YOSHIFUJI Hideaki0736ffc2008-03-28 13:37:58 +0900814 if (is_router < 0)
815 is_router = !!idev->cnf.forwarding;
Ville Nuorvala62dd9312006-09-22 14:43:19 -0700816
Linus Torvalds1da177e2005-04-16 15:20:36 -0700817 if (dad) {
818 struct in6_addr maddr;
819
820 ipv6_addr_all_nodes(&maddr);
821 ndisc_send_na(dev, NULL, &maddr, &msg->target,
Ville Nuorvala62dd9312006-09-22 14:43:19 -0700822 is_router, 0, (ifp != NULL), 1);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700823 goto out;
824 }
825
826 if (inc)
827 NEIGH_CACHE_STAT_INC(&nd_tbl, rcv_probes_mcast);
828 else
829 NEIGH_CACHE_STAT_INC(&nd_tbl, rcv_probes_ucast);
830
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +0900831 /*
Linus Torvalds1da177e2005-04-16 15:20:36 -0700832 * update / create cache entry
833 * for the source address
834 */
835 neigh = __neigh_lookup(&nd_tbl, saddr, dev,
836 !inc || lladdr || !dev->addr_len);
837 if (neigh)
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +0900838 neigh_update(neigh, lladdr, NUD_STALE,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700839 NEIGH_UPDATE_F_WEAK_OVERRIDE|
840 NEIGH_UPDATE_F_OVERRIDE);
Stephen Hemminger3b04ddd2007-10-09 01:40:57 -0700841 if (neigh || !dev->header_ops) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700842 ndisc_send_na(dev, neigh, saddr, &msg->target,
Ville Nuorvala62dd9312006-09-22 14:43:19 -0700843 is_router,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700844 1, (ifp != NULL && inc), inc);
845 if (neigh)
846 neigh_release(neigh);
847 }
848
849out:
850 if (ifp)
851 in6_ifa_put(ifp);
852 else
853 in6_dev_put(idev);
854
855 return;
856}
857
858static void ndisc_recv_na(struct sk_buff *skb)
859{
Arnaldo Carvalho de Melo9c702202007-04-25 18:04:18 -0700860 struct nd_msg *msg = (struct nd_msg *)skb_transport_header(skb);
Arnaldo Carvalho de Melo0660e032007-04-25 17:54:47 -0700861 struct in6_addr *saddr = &ipv6_hdr(skb)->saddr;
862 struct in6_addr *daddr = &ipv6_hdr(skb)->daddr;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700863 u8 *lladdr = NULL;
Arnaldo Carvalho de Melo27a884d2007-04-19 20:29:13 -0700864 u32 ndoptlen = skb->tail - (skb->transport_header +
865 offsetof(struct nd_msg, opt));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700866 struct ndisc_options ndopts;
867 struct net_device *dev = skb->dev;
868 struct inet6_ifaddr *ifp;
869 struct neighbour *neigh;
870
871 if (skb->len < sizeof(struct nd_msg)) {
872 ND_PRINTK2(KERN_WARNING
873 "ICMPv6 NA: packet too short\n");
874 return;
875 }
876
877 if (ipv6_addr_is_multicast(&msg->target)) {
878 ND_PRINTK2(KERN_WARNING
879 "ICMPv6 NA: target address is multicast.\n");
880 return;
881 }
882
883 if (ipv6_addr_is_multicast(daddr) &&
884 msg->icmph.icmp6_solicited) {
885 ND_PRINTK2(KERN_WARNING
886 "ICMPv6 NA: solicited NA is multicasted.\n");
887 return;
888 }
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +0900889
Linus Torvalds1da177e2005-04-16 15:20:36 -0700890 if (!ndisc_parse_options(msg->opt, ndoptlen, &ndopts)) {
891 ND_PRINTK2(KERN_WARNING
892 "ICMPv6 NS: invalid ND option\n");
893 return;
894 }
895 if (ndopts.nd_opts_tgt_lladdr) {
896 lladdr = ndisc_opt_addr_data(ndopts.nd_opts_tgt_lladdr, dev);
897 if (!lladdr) {
898 ND_PRINTK2(KERN_WARNING
899 "ICMPv6 NA: invalid link-layer address length\n");
900 return;
901 }
902 }
YOSHIFUJI Hideakic346dca2008-03-25 21:47:49 +0900903 ifp = ipv6_get_ifaddr(dev_net(dev), &msg->target, dev, 1);
Daniel Lezcanoa18bc692008-03-07 11:14:49 -0800904 if (ifp) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700905 if (ifp->flags & IFA_F_TENTATIVE) {
906 addrconf_dad_failure(ifp);
907 return;
908 }
909 /* What should we make now? The advertisement
910 is invalid, but ndisc specs say nothing
911 about it. It could be misconfiguration, or
912 an smart proxy agent tries to help us :-)
913 */
914 ND_PRINTK1(KERN_WARNING
915 "ICMPv6 NA: someone advertises our address on %s!\n",
916 ifp->idev->dev->name);
917 in6_ifa_put(ifp);
918 return;
919 }
920 neigh = neigh_lookup(&nd_tbl, &msg->target, dev);
921
922 if (neigh) {
923 u8 old_flags = neigh->flags;
924
925 if (neigh->nud_state & NUD_FAILED)
926 goto out;
927
Ville Nuorvala5f3e6e92006-09-22 14:42:46 -0700928 /*
929 * Don't update the neighbor cache entry on a proxy NA from
930 * ourselves because either the proxied node is off link or it
931 * has already sent a NA to us.
932 */
933 if (lladdr && !memcmp(lladdr, dev->dev_addr, dev->addr_len) &&
YOSHIFUJI Hideakifbea49e2006-09-22 14:43:49 -0700934 ipv6_devconf.forwarding && ipv6_devconf.proxy_ndp &&
YOSHIFUJI Hideakic346dca2008-03-25 21:47:49 +0900935 pneigh_lookup(&nd_tbl, dev_net(dev), &msg->target, dev, 0)) {
YOSHIFUJI Hideakifbea49e2006-09-22 14:43:49 -0700936 /* XXX: idev->cnf.prixy_ndp */
Ville Nuorvala5f3e6e92006-09-22 14:42:46 -0700937 goto out;
YOSHIFUJI Hideakifbea49e2006-09-22 14:43:49 -0700938 }
Ville Nuorvala5f3e6e92006-09-22 14:42:46 -0700939
Linus Torvalds1da177e2005-04-16 15:20:36 -0700940 neigh_update(neigh, lladdr,
941 msg->icmph.icmp6_solicited ? NUD_REACHABLE : NUD_STALE,
942 NEIGH_UPDATE_F_WEAK_OVERRIDE|
943 (msg->icmph.icmp6_override ? NEIGH_UPDATE_F_OVERRIDE : 0)|
944 NEIGH_UPDATE_F_OVERRIDE_ISROUTER|
945 (msg->icmph.icmp6_router ? NEIGH_UPDATE_F_ISROUTER : 0));
946
947 if ((old_flags & ~neigh->flags) & NTF_ROUTER) {
948 /*
949 * Change: router to host
950 */
951 struct rt6_info *rt;
952 rt = rt6_get_dflt_router(saddr, dev);
953 if (rt)
Thomas Grafe0a1ad732006-08-22 00:00:21 -0700954 ip6_del_rt(rt);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700955 }
956
957out:
958 neigh_release(neigh);
959 }
960}
961
962static void ndisc_recv_rs(struct sk_buff *skb)
963{
Arnaldo Carvalho de Melo9c702202007-04-25 18:04:18 -0700964 struct rs_msg *rs_msg = (struct rs_msg *)skb_transport_header(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700965 unsigned long ndoptlen = skb->len - sizeof(*rs_msg);
966 struct neighbour *neigh;
967 struct inet6_dev *idev;
Arnaldo Carvalho de Melo0660e032007-04-25 17:54:47 -0700968 struct in6_addr *saddr = &ipv6_hdr(skb)->saddr;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700969 struct ndisc_options ndopts;
970 u8 *lladdr = NULL;
971
972 if (skb->len < sizeof(*rs_msg))
973 return;
974
975 idev = in6_dev_get(skb->dev);
976 if (!idev) {
977 if (net_ratelimit())
978 ND_PRINTK1("ICMP6 RS: can't find in6 device\n");
979 return;
980 }
981
982 /* Don't accept RS if we're not in router mode */
983 if (!idev->cnf.forwarding)
984 goto out;
985
986 /*
987 * Don't update NCE if src = ::;
988 * this implies that the source node has no ip address assigned yet.
989 */
990 if (ipv6_addr_any(saddr))
991 goto out;
992
993 /* Parse ND options */
994 if (!ndisc_parse_options(rs_msg->opt, ndoptlen, &ndopts)) {
995 if (net_ratelimit())
996 ND_PRINTK2("ICMP6 NS: invalid ND option, ignored\n");
997 goto out;
998 }
999
1000 if (ndopts.nd_opts_src_lladdr) {
1001 lladdr = ndisc_opt_addr_data(ndopts.nd_opts_src_lladdr,
1002 skb->dev);
1003 if (!lladdr)
1004 goto out;
1005 }
1006
1007 neigh = __neigh_lookup(&nd_tbl, saddr, skb->dev, 1);
1008 if (neigh) {
1009 neigh_update(neigh, lladdr, NUD_STALE,
1010 NEIGH_UPDATE_F_WEAK_OVERRIDE|
1011 NEIGH_UPDATE_F_OVERRIDE|
1012 NEIGH_UPDATE_F_OVERRIDE_ISROUTER);
1013 neigh_release(neigh);
1014 }
1015out:
1016 in6_dev_put(idev);
1017}
1018
Pierre Ynard31910572007-10-10 21:22:05 -07001019static void ndisc_ra_useropt(struct sk_buff *ra, struct nd_opt_hdr *opt)
1020{
1021 struct icmp6hdr *icmp6h = (struct icmp6hdr *)skb_transport_header(ra);
1022 struct sk_buff *skb;
1023 struct nlmsghdr *nlh;
1024 struct nduseroptmsg *ndmsg;
YOSHIFUJI Hideakic346dca2008-03-25 21:47:49 +09001025 struct net *net = dev_net(ra->dev);
Pierre Ynard31910572007-10-10 21:22:05 -07001026 int err;
1027 int base_size = NLMSG_ALIGN(sizeof(struct nduseroptmsg)
1028 + (opt->nd_opt_len << 3));
1029 size_t msg_size = base_size + nla_total_size(sizeof(struct in6_addr));
1030
1031 skb = nlmsg_new(msg_size, GFP_ATOMIC);
1032 if (skb == NULL) {
1033 err = -ENOBUFS;
1034 goto errout;
1035 }
1036
1037 nlh = nlmsg_put(skb, 0, 0, RTM_NEWNDUSEROPT, base_size, 0);
1038 if (nlh == NULL) {
1039 goto nla_put_failure;
1040 }
1041
1042 ndmsg = nlmsg_data(nlh);
1043 ndmsg->nduseropt_family = AF_INET6;
Pierre Ynarddbb2ed22007-11-12 17:58:35 -08001044 ndmsg->nduseropt_ifindex = ra->dev->ifindex;
Pierre Ynard31910572007-10-10 21:22:05 -07001045 ndmsg->nduseropt_icmp_type = icmp6h->icmp6_type;
1046 ndmsg->nduseropt_icmp_code = icmp6h->icmp6_code;
1047 ndmsg->nduseropt_opts_len = opt->nd_opt_len << 3;
1048
1049 memcpy(ndmsg + 1, opt, opt->nd_opt_len << 3);
1050
1051 NLA_PUT(skb, NDUSEROPT_SRCADDR, sizeof(struct in6_addr),
1052 &ipv6_hdr(ra)->saddr);
1053 nlmsg_end(skb, nlh);
1054
Daniel Lezcanoa18bc692008-03-07 11:14:49 -08001055 err = rtnl_notify(skb, net, 0, RTNLGRP_ND_USEROPT, NULL,
Denis V. Lunev97c53ca2007-11-19 22:26:51 -08001056 GFP_ATOMIC);
Pierre Ynard31910572007-10-10 21:22:05 -07001057 if (err < 0)
1058 goto errout;
1059
1060 return;
1061
1062nla_put_failure:
1063 nlmsg_free(skb);
1064 err = -EMSGSIZE;
1065errout:
Daniel Lezcanoa18bc692008-03-07 11:14:49 -08001066 rtnl_set_sk_err(net, RTNLGRP_ND_USEROPT, err);
Pierre Ynard31910572007-10-10 21:22:05 -07001067}
1068
Linus Torvalds1da177e2005-04-16 15:20:36 -07001069static void ndisc_router_discovery(struct sk_buff *skb)
1070{
Arnaldo Carvalho de Melo9c702202007-04-25 18:04:18 -07001071 struct ra_msg *ra_msg = (struct ra_msg *)skb_transport_header(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001072 struct neighbour *neigh = NULL;
1073 struct inet6_dev *in6_dev;
YOSHIFUJI Hideaki65f5c7c2006-03-20 16:55:08 -08001074 struct rt6_info *rt = NULL;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001075 int lifetime;
1076 struct ndisc_options ndopts;
1077 int optlen;
YOSHIFUJI Hideakiebacaaa2006-03-20 17:04:53 -08001078 unsigned int pref = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001079
1080 __u8 * opt = (__u8 *)(ra_msg + 1);
1081
Arnaldo Carvalho de Melo27a884d2007-04-19 20:29:13 -07001082 optlen = (skb->tail - skb->transport_header) - sizeof(struct ra_msg);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001083
Arnaldo Carvalho de Melo0660e032007-04-25 17:54:47 -07001084 if (!(ipv6_addr_type(&ipv6_hdr(skb)->saddr) & IPV6_ADDR_LINKLOCAL)) {
Linus Torvalds1da177e2005-04-16 15:20:36 -07001085 ND_PRINTK2(KERN_WARNING
1086 "ICMPv6 RA: source address is not link-local.\n");
1087 return;
1088 }
1089 if (optlen < 0) {
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +09001090 ND_PRINTK2(KERN_WARNING
Linus Torvalds1da177e2005-04-16 15:20:36 -07001091 "ICMPv6 RA: packet too short\n");
1092 return;
1093 }
1094
Templin, Fred Lfadf6bf2008-03-11 18:35:59 -04001095 if (skb->ndisc_nodetype == NDISC_NODETYPE_HOST) {
1096 ND_PRINTK2(KERN_WARNING
1097 "ICMPv6 RA: from host or unauthorized router\n");
1098 return;
1099 }
1100
Linus Torvalds1da177e2005-04-16 15:20:36 -07001101 /*
1102 * set the RA_RECV flag in the interface
1103 */
1104
1105 in6_dev = in6_dev_get(skb->dev);
1106 if (in6_dev == NULL) {
1107 ND_PRINTK0(KERN_ERR
1108 "ICMPv6 RA: can't find inet6 device for %s.\n",
1109 skb->dev->name);
1110 return;
1111 }
1112 if (in6_dev->cnf.forwarding || !in6_dev->cnf.accept_ra) {
1113 in6_dev_put(in6_dev);
1114 return;
1115 }
1116
1117 if (!ndisc_parse_options(opt, optlen, &ndopts)) {
1118 in6_dev_put(in6_dev);
1119 ND_PRINTK2(KERN_WARNING
1120 "ICMP6 RA: invalid ND options\n");
1121 return;
1122 }
1123
Templin, Fred Lfadf6bf2008-03-11 18:35:59 -04001124 /* skip link-specific parameters from interior routers */
1125 if (skb->ndisc_nodetype == NDISC_NODETYPE_NODEFAULT)
1126 goto skip_linkparms;
1127
Linus Torvalds1da177e2005-04-16 15:20:36 -07001128 if (in6_dev->if_flags & IF_RS_SENT) {
1129 /*
1130 * flag that an RA was received after an RS was sent
1131 * out on this interface.
1132 */
1133 in6_dev->if_flags |= IF_RA_RCVD;
1134 }
1135
1136 /*
1137 * Remember the managed/otherconf flags from most recently
1138 * received RA message (RFC 2462) -- yoshfuji
1139 */
1140 in6_dev->if_flags = (in6_dev->if_flags & ~(IF_RA_MANAGED |
1141 IF_RA_OTHERCONF)) |
1142 (ra_msg->icmph.icmp6_addrconf_managed ?
1143 IF_RA_MANAGED : 0) |
1144 (ra_msg->icmph.icmp6_addrconf_other ?
1145 IF_RA_OTHERCONF : 0);
1146
YOSHIFUJI Hideaki65f5c7c2006-03-20 16:55:08 -08001147 if (!in6_dev->cnf.accept_ra_defrtr)
1148 goto skip_defrtr;
1149
Linus Torvalds1da177e2005-04-16 15:20:36 -07001150 lifetime = ntohs(ra_msg->icmph.icmp6_rt_lifetime);
1151
YOSHIFUJI Hideakiebacaaa2006-03-20 17:04:53 -08001152#ifdef CONFIG_IPV6_ROUTER_PREF
1153 pref = ra_msg->icmph.icmp6_router_pref;
1154 /* 10b is handled as if it were 00b (medium) */
YOSHIFUJI Hideaki930d6ff2006-03-20 17:05:30 -08001155 if (pref == ICMPV6_ROUTER_PREF_INVALID ||
YOSHIFUJI Hideaki6d5b78c2007-06-22 16:07:04 -07001156 !in6_dev->cnf.accept_ra_rtr_pref)
YOSHIFUJI Hideakiebacaaa2006-03-20 17:04:53 -08001157 pref = ICMPV6_ROUTER_PREF_MEDIUM;
1158#endif
1159
Arnaldo Carvalho de Melo0660e032007-04-25 17:54:47 -07001160 rt = rt6_get_dflt_router(&ipv6_hdr(skb)->saddr, skb->dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001161
1162 if (rt)
1163 neigh = rt->rt6i_nexthop;
1164
1165 if (rt && lifetime == 0) {
1166 neigh_clone(neigh);
Thomas Grafe0a1ad732006-08-22 00:00:21 -07001167 ip6_del_rt(rt);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001168 rt = NULL;
1169 }
1170
1171 if (rt == NULL && lifetime) {
1172 ND_PRINTK3(KERN_DEBUG
1173 "ICMPv6 RA: adding default router.\n");
1174
Arnaldo Carvalho de Melo0660e032007-04-25 17:54:47 -07001175 rt = rt6_add_dflt_router(&ipv6_hdr(skb)->saddr, skb->dev, pref);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001176 if (rt == NULL) {
1177 ND_PRINTK0(KERN_ERR
1178 "ICMPv6 RA: %s() failed to add default route.\n",
Harvey Harrison0dc47872008-03-05 20:47:47 -08001179 __func__);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001180 in6_dev_put(in6_dev);
1181 return;
1182 }
1183
1184 neigh = rt->rt6i_nexthop;
1185 if (neigh == NULL) {
1186 ND_PRINTK0(KERN_ERR
1187 "ICMPv6 RA: %s() got default router without neighbour.\n",
Harvey Harrison0dc47872008-03-05 20:47:47 -08001188 __func__);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001189 dst_release(&rt->u.dst);
1190 in6_dev_put(in6_dev);
1191 return;
1192 }
1193 neigh->flags |= NTF_ROUTER;
YOSHIFUJI Hideakiebacaaa2006-03-20 17:04:53 -08001194 } else if (rt) {
1195 rt->rt6i_flags |= (rt->rt6i_flags & ~RTF_PREF_MASK) | RTF_PREF(pref);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001196 }
1197
1198 if (rt)
1199 rt->rt6i_expires = jiffies + (HZ * lifetime);
1200
1201 if (ra_msg->icmph.icmp6_hop_limit) {
1202 in6_dev->cnf.hop_limit = ra_msg->icmph.icmp6_hop_limit;
1203 if (rt)
1204 rt->u.dst.metrics[RTAX_HOPLIMIT-1] = ra_msg->icmph.icmp6_hop_limit;
1205 }
1206
YOSHIFUJI Hideaki65f5c7c2006-03-20 16:55:08 -08001207skip_defrtr:
1208
Linus Torvalds1da177e2005-04-16 15:20:36 -07001209 /*
1210 * Update Reachable Time and Retrans Timer
1211 */
1212
1213 if (in6_dev->nd_parms) {
1214 unsigned long rtime = ntohl(ra_msg->retrans_timer);
1215
1216 if (rtime && rtime/1000 < MAX_SCHEDULE_TIMEOUT/HZ) {
1217 rtime = (rtime*HZ)/1000;
1218 if (rtime < HZ/10)
1219 rtime = HZ/10;
1220 in6_dev->nd_parms->retrans_time = rtime;
1221 in6_dev->tstamp = jiffies;
1222 inet6_ifinfo_notify(RTM_NEWLINK, in6_dev);
1223 }
1224
1225 rtime = ntohl(ra_msg->reachable_time);
1226 if (rtime && rtime/1000 < MAX_SCHEDULE_TIMEOUT/(3*HZ)) {
1227 rtime = (rtime*HZ)/1000;
1228
1229 if (rtime < HZ/10)
1230 rtime = HZ/10;
1231
1232 if (rtime != in6_dev->nd_parms->base_reachable_time) {
1233 in6_dev->nd_parms->base_reachable_time = rtime;
1234 in6_dev->nd_parms->gc_staletime = 3 * rtime;
1235 in6_dev->nd_parms->reachable_time = neigh_rand_reach_time(rtime);
1236 in6_dev->tstamp = jiffies;
1237 inet6_ifinfo_notify(RTM_NEWLINK, in6_dev);
1238 }
1239 }
1240 }
1241
Templin, Fred Lfadf6bf2008-03-11 18:35:59 -04001242skip_linkparms:
1243
Linus Torvalds1da177e2005-04-16 15:20:36 -07001244 /*
1245 * Process options.
1246 */
1247
1248 if (!neigh)
Arnaldo Carvalho de Melo0660e032007-04-25 17:54:47 -07001249 neigh = __neigh_lookup(&nd_tbl, &ipv6_hdr(skb)->saddr,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001250 skb->dev, 1);
1251 if (neigh) {
1252 u8 *lladdr = NULL;
1253 if (ndopts.nd_opts_src_lladdr) {
1254 lladdr = ndisc_opt_addr_data(ndopts.nd_opts_src_lladdr,
1255 skb->dev);
1256 if (!lladdr) {
1257 ND_PRINTK2(KERN_WARNING
1258 "ICMPv6 RA: invalid link-layer address length\n");
1259 goto out;
1260 }
1261 }
1262 neigh_update(neigh, lladdr, NUD_STALE,
1263 NEIGH_UPDATE_F_WEAK_OVERRIDE|
1264 NEIGH_UPDATE_F_OVERRIDE|
1265 NEIGH_UPDATE_F_OVERRIDE_ISROUTER|
1266 NEIGH_UPDATE_F_ISROUTER);
1267 }
1268
YOSHIFUJI Hideaki70ceb4f2006-03-20 17:06:24 -08001269#ifdef CONFIG_IPV6_ROUTE_INFO
YOSHIFUJI Hideaki09c884d2006-03-20 17:07:03 -08001270 if (in6_dev->cnf.accept_ra_rtr_pref && ndopts.nd_opts_ri) {
YOSHIFUJI Hideaki70ceb4f2006-03-20 17:06:24 -08001271 struct nd_opt_hdr *p;
1272 for (p = ndopts.nd_opts_ri;
1273 p;
1274 p = ndisc_next_option(p, ndopts.nd_opts_ri_end)) {
YOSHIFUJI Hideaki09c884d2006-03-20 17:07:03 -08001275 if (((struct route_info *)p)->prefix_len > in6_dev->cnf.accept_ra_rt_info_max_plen)
1276 continue;
YOSHIFUJI Hideaki70ceb4f2006-03-20 17:06:24 -08001277 rt6_route_rcv(skb->dev, (u8*)p, (p->nd_opt_len) << 3,
Arnaldo Carvalho de Melo0660e032007-04-25 17:54:47 -07001278 &ipv6_hdr(skb)->saddr);
YOSHIFUJI Hideaki70ceb4f2006-03-20 17:06:24 -08001279 }
1280 }
1281#endif
1282
Templin, Fred Lfadf6bf2008-03-11 18:35:59 -04001283 /* skip link-specific ndopts from interior routers */
1284 if (skb->ndisc_nodetype == NDISC_NODETYPE_NODEFAULT)
1285 goto out;
1286
YOSHIFUJI Hideakic4fd30e2006-03-20 16:55:26 -08001287 if (in6_dev->cnf.accept_ra_pinfo && ndopts.nd_opts_pi) {
Linus Torvalds1da177e2005-04-16 15:20:36 -07001288 struct nd_opt_hdr *p;
1289 for (p = ndopts.nd_opts_pi;
1290 p;
1291 p = ndisc_next_option(p, ndopts.nd_opts_pi_end)) {
1292 addrconf_prefix_rcv(skb->dev, (u8*)p, (p->nd_opt_len) << 3);
1293 }
1294 }
1295
1296 if (ndopts.nd_opts_mtu) {
Al Viroe69a4ad2006-11-14 20:56:00 -08001297 __be32 n;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001298 u32 mtu;
1299
Al Viroe69a4ad2006-11-14 20:56:00 -08001300 memcpy(&n, ((u8*)(ndopts.nd_opts_mtu+1))+2, sizeof(mtu));
1301 mtu = ntohl(n);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001302
1303 if (mtu < IPV6_MIN_MTU || mtu > skb->dev->mtu) {
1304 ND_PRINTK2(KERN_WARNING
1305 "ICMPv6 RA: invalid mtu: %d\n",
1306 mtu);
1307 } else if (in6_dev->cnf.mtu6 != mtu) {
1308 in6_dev->cnf.mtu6 = mtu;
1309
1310 if (rt)
1311 rt->u.dst.metrics[RTAX_MTU-1] = mtu;
1312
1313 rt6_mtu_change(skb->dev, mtu);
1314 }
1315 }
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +09001316
Pierre Ynard31910572007-10-10 21:22:05 -07001317 if (ndopts.nd_useropts) {
YOSHIFUJI Hideaki61cf46a2008-01-22 17:32:53 +09001318 struct nd_opt_hdr *p;
1319 for (p = ndopts.nd_useropts;
1320 p;
1321 p = ndisc_next_useropt(p, ndopts.nd_useropts_end)) {
1322 ndisc_ra_useropt(skb, p);
Pierre Ynard31910572007-10-10 21:22:05 -07001323 }
1324 }
1325
Linus Torvalds1da177e2005-04-16 15:20:36 -07001326 if (ndopts.nd_opts_tgt_lladdr || ndopts.nd_opts_rh) {
1327 ND_PRINTK2(KERN_WARNING
1328 "ICMPv6 RA: invalid RA options");
1329 }
1330out:
1331 if (rt)
1332 dst_release(&rt->u.dst);
1333 else if (neigh)
1334 neigh_release(neigh);
1335 in6_dev_put(in6_dev);
1336}
1337
1338static void ndisc_redirect_rcv(struct sk_buff *skb)
1339{
1340 struct inet6_dev *in6_dev;
1341 struct icmp6hdr *icmph;
1342 struct in6_addr *dest;
1343 struct in6_addr *target; /* new first hop to destination */
1344 struct neighbour *neigh;
1345 int on_link = 0;
1346 struct ndisc_options ndopts;
1347 int optlen;
1348 u8 *lladdr = NULL;
1349
Templin, Fred Lfadf6bf2008-03-11 18:35:59 -04001350 switch (skb->ndisc_nodetype) {
1351 case NDISC_NODETYPE_HOST:
1352 case NDISC_NODETYPE_NODEFAULT:
1353 ND_PRINTK2(KERN_WARNING
1354 "ICMPv6 Redirect: from host or unauthorized router\n");
1355 return;
1356 }
1357
Arnaldo Carvalho de Melo0660e032007-04-25 17:54:47 -07001358 if (!(ipv6_addr_type(&ipv6_hdr(skb)->saddr) & IPV6_ADDR_LINKLOCAL)) {
Linus Torvalds1da177e2005-04-16 15:20:36 -07001359 ND_PRINTK2(KERN_WARNING
1360 "ICMPv6 Redirect: source address is not link-local.\n");
1361 return;
1362 }
1363
Arnaldo Carvalho de Melo27a884d2007-04-19 20:29:13 -07001364 optlen = skb->tail - skb->transport_header;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001365 optlen -= sizeof(struct icmp6hdr) + 2 * sizeof(struct in6_addr);
1366
1367 if (optlen < 0) {
1368 ND_PRINTK2(KERN_WARNING
1369 "ICMPv6 Redirect: packet too short\n");
1370 return;
1371 }
1372
Arnaldo Carvalho de Melocc70ab22007-03-13 14:03:22 -03001373 icmph = icmp6_hdr(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001374 target = (struct in6_addr *) (icmph + 1);
1375 dest = target + 1;
1376
1377 if (ipv6_addr_is_multicast(dest)) {
1378 ND_PRINTK2(KERN_WARNING
1379 "ICMPv6 Redirect: destination address is multicast.\n");
1380 return;
1381 }
1382
1383 if (ipv6_addr_equal(dest, target)) {
1384 on_link = 1;
Brian Haleybf0b48d2007-10-08 00:12:05 -07001385 } else if (ipv6_addr_type(target) !=
1386 (IPV6_ADDR_UNICAST|IPV6_ADDR_LINKLOCAL)) {
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +09001387 ND_PRINTK2(KERN_WARNING
Brian Haleybf0b48d2007-10-08 00:12:05 -07001388 "ICMPv6 Redirect: target address is not link-local unicast.\n");
Linus Torvalds1da177e2005-04-16 15:20:36 -07001389 return;
1390 }
1391
1392 in6_dev = in6_dev_get(skb->dev);
1393 if (!in6_dev)
1394 return;
1395 if (in6_dev->cnf.forwarding || !in6_dev->cnf.accept_redirects) {
1396 in6_dev_put(in6_dev);
1397 return;
1398 }
1399
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +09001400 /* RFC2461 8.1:
Linus Torvalds1da177e2005-04-16 15:20:36 -07001401 * The IP source address of the Redirect MUST be the same as the current
1402 * first-hop router for the specified ICMP Destination Address.
1403 */
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +09001404
Linus Torvalds1da177e2005-04-16 15:20:36 -07001405 if (!ndisc_parse_options((u8*)(dest + 1), optlen, &ndopts)) {
1406 ND_PRINTK2(KERN_WARNING
1407 "ICMPv6 Redirect: invalid ND options\n");
1408 in6_dev_put(in6_dev);
1409 return;
1410 }
1411 if (ndopts.nd_opts_tgt_lladdr) {
1412 lladdr = ndisc_opt_addr_data(ndopts.nd_opts_tgt_lladdr,
1413 skb->dev);
1414 if (!lladdr) {
1415 ND_PRINTK2(KERN_WARNING
1416 "ICMPv6 Redirect: invalid link-layer address length\n");
1417 in6_dev_put(in6_dev);
1418 return;
1419 }
1420 }
1421
1422 neigh = __neigh_lookup(&nd_tbl, target, skb->dev, 1);
1423 if (neigh) {
Arnaldo Carvalho de Melo0660e032007-04-25 17:54:47 -07001424 rt6_redirect(dest, &ipv6_hdr(skb)->daddr,
1425 &ipv6_hdr(skb)->saddr, neigh, lladdr,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001426 on_link);
1427 neigh_release(neigh);
1428 }
1429 in6_dev_put(in6_dev);
1430}
1431
1432void ndisc_send_redirect(struct sk_buff *skb, struct neighbour *neigh,
1433 struct in6_addr *target)
1434{
Daniel Lezcano1762f7e2008-03-07 11:15:34 -08001435 struct net_device *dev = skb->dev;
YOSHIFUJI Hideakic346dca2008-03-25 21:47:49 +09001436 struct net *net = dev_net(dev);
Daniel Lezcano1762f7e2008-03-07 11:15:34 -08001437 struct sock *sk = net->ipv6.ndisc_sk;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001438 int len = sizeof(struct icmp6hdr) + 2 * sizeof(struct in6_addr);
1439 struct sk_buff *buff;
1440 struct icmp6hdr *icmph;
1441 struct in6_addr saddr_buf;
1442 struct in6_addr *addrp;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001443 struct rt6_info *rt;
1444 struct dst_entry *dst;
1445 struct inet6_dev *idev;
1446 struct flowi fl;
1447 u8 *opt;
1448 int rd_len;
1449 int err;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001450 u8 ha_buf[MAX_ADDR_LEN], *ha = NULL;
1451
Neil Horman95c385b2007-04-25 17:08:10 -07001452 if (ipv6_get_lladdr(dev, &saddr_buf, IFA_F_TENTATIVE)) {
Linus Torvalds1da177e2005-04-16 15:20:36 -07001453 ND_PRINTK2(KERN_WARNING
1454 "ICMPv6 Redirect: no link-local address on %s\n",
1455 dev->name);
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +09001456 return;
1457 }
Linus Torvalds1da177e2005-04-16 15:20:36 -07001458
Arnaldo Carvalho de Melo0660e032007-04-25 17:54:47 -07001459 if (!ipv6_addr_equal(&ipv6_hdr(skb)->daddr, target) &&
Brian Haleybf0b48d2007-10-08 00:12:05 -07001460 ipv6_addr_type(target) != (IPV6_ADDR_UNICAST|IPV6_ADDR_LINKLOCAL)) {
Li Yewang29556522007-01-30 14:33:20 -08001461 ND_PRINTK2(KERN_WARNING
Brian Haleybf0b48d2007-10-08 00:12:05 -07001462 "ICMPv6 Redirect: target address is not link-local unicast.\n");
Li Yewang29556522007-01-30 14:33:20 -08001463 return;
1464 }
1465
Daniel Lezcano1762f7e2008-03-07 11:15:34 -08001466 icmpv6_flow_init(sk, &fl, NDISC_REDIRECT,
YOSHIFUJI Hideaki95e41e92007-12-06 15:43:30 -08001467 &saddr_buf, &ipv6_hdr(skb)->saddr, dev->ifindex);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001468
Daniel Lezcano1762f7e2008-03-07 11:15:34 -08001469 dst = ip6_route_output(net, NULL, &fl);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001470 if (dst == NULL)
1471 return;
1472
1473 err = xfrm_lookup(&dst, &fl, NULL, 0);
Patrick McHardye1044112005-09-08 15:11:55 -07001474 if (err)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001475 return;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001476
1477 rt = (struct rt6_info *) dst;
1478
1479 if (rt->rt6i_flags & RTF_GATEWAY) {
1480 ND_PRINTK2(KERN_WARNING
1481 "ICMPv6 Redirect: destination is not a neighbour.\n");
1482 dst_release(dst);
1483 return;
1484 }
1485 if (!xrlim_allow(dst, 1*HZ)) {
1486 dst_release(dst);
1487 return;
1488 }
1489
1490 if (dev->addr_len) {
1491 read_lock_bh(&neigh->lock);
1492 if (neigh->nud_state & NUD_VALID) {
1493 memcpy(ha_buf, neigh->ha, dev->addr_len);
1494 read_unlock_bh(&neigh->lock);
1495 ha = ha_buf;
1496 len += ndisc_opt_addr_space(dev);
1497 } else
1498 read_unlock_bh(&neigh->lock);
1499 }
1500
1501 rd_len = min_t(unsigned int,
1502 IPV6_MIN_MTU-sizeof(struct ipv6hdr)-len, skb->len + 8);
1503 rd_len &= ~0x7;
1504 len += rd_len;
1505
David S. Millerd54a81d2006-12-02 21:00:06 -08001506 buff = sock_alloc_send_skb(sk,
1507 (MAX_HEADER + sizeof(struct ipv6hdr) +
1508 len + LL_RESERVED_SPACE(dev)),
Linus Torvalds1da177e2005-04-16 15:20:36 -07001509 1, &err);
1510 if (buff == NULL) {
1511 ND_PRINTK0(KERN_ERR
1512 "ICMPv6 Redirect: %s() failed to allocate an skb.\n",
Harvey Harrison0dc47872008-03-05 20:47:47 -08001513 __func__);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001514 dst_release(dst);
1515 return;
1516 }
1517
Linus Torvalds1da177e2005-04-16 15:20:36 -07001518 skb_reserve(buff, LL_RESERVED_SPACE(dev));
Arnaldo Carvalho de Melo0660e032007-04-25 17:54:47 -07001519 ip6_nd_hdr(sk, buff, dev, &saddr_buf, &ipv6_hdr(skb)->saddr,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001520 IPPROTO_ICMPV6, len);
1521
Arnaldo Carvalho de Melo27a884d2007-04-19 20:29:13 -07001522 skb_set_transport_header(buff, skb_tail_pointer(buff) - buff->data);
Arnaldo Carvalho de Melod10ba342007-03-14 21:05:37 -03001523 skb_put(buff, len);
1524 icmph = icmp6_hdr(buff);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001525
1526 memset(icmph, 0, sizeof(struct icmp6hdr));
1527 icmph->icmp6_type = NDISC_REDIRECT;
1528
1529 /*
1530 * copy target and destination addresses
1531 */
1532
1533 addrp = (struct in6_addr *)(icmph + 1);
1534 ipv6_addr_copy(addrp, target);
1535 addrp++;
Arnaldo Carvalho de Melo0660e032007-04-25 17:54:47 -07001536 ipv6_addr_copy(addrp, &ipv6_hdr(skb)->daddr);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001537
1538 opt = (u8*) (addrp + 1);
1539
1540 /*
1541 * include target_address option
1542 */
1543
1544 if (ha)
1545 opt = ndisc_fill_addr_option(opt, ND_OPT_TARGET_LL_ADDR, ha,
1546 dev->addr_len, dev->type);
1547
1548 /*
1549 * build redirect option and copy skb over to the new packet.
1550 */
1551
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +09001552 memset(opt, 0, 8);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001553 *(opt++) = ND_OPT_REDIRECT_HDR;
1554 *(opt++) = (rd_len >> 3);
1555 opt += 6;
1556
Arnaldo Carvalho de Melo0660e032007-04-25 17:54:47 -07001557 memcpy(opt, ipv6_hdr(skb), rd_len - 8);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001558
Arnaldo Carvalho de Melo0660e032007-04-25 17:54:47 -07001559 icmph->icmp6_cksum = csum_ipv6_magic(&saddr_buf, &ipv6_hdr(skb)->saddr,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001560 len, IPPROTO_ICMPV6,
1561 csum_partial((u8 *) icmph, len, 0));
1562
1563 buff->dst = dst;
1564 idev = in6_dev_get(dst->dev);
YOSHIFUJI Hideakia11d2062006-11-04 20:11:37 +09001565 IP6_INC_STATS(idev, IPSTATS_MIB_OUTREQUESTS);
Patrick McHardy6e23ae22007-11-19 18:53:30 -08001566 err = NF_HOOK(PF_INET6, NF_INET_LOCAL_OUT, buff, NULL, dst->dev,
1567 dst_output);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001568 if (!err) {
David L Stevens14878f72007-09-16 16:52:35 -07001569 ICMP6MSGOUT_INC_STATS(idev, NDISC_REDIRECT);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001570 ICMP6_INC_STATS(idev, ICMP6_MIB_OUTMSGS);
1571 }
1572
1573 if (likely(idev != NULL))
1574 in6_dev_put(idev);
1575}
1576
/*
 * Run a buffered packet through the Neighbour Solicitation handler and
 * then free it; unlike ndisc_rcv(), this function drops the skb itself.
 */
static void pndisc_redo(struct sk_buff *skb)
{
	ndisc_recv_ns(skb);
	kfree_skb(skb);
}
1582
1583int ndisc_rcv(struct sk_buff *skb)
1584{
1585 struct nd_msg *msg;
1586
1587 if (!pskb_may_pull(skb, skb->len))
1588 return 0;
1589
Arnaldo Carvalho de Melo9c702202007-04-25 18:04:18 -07001590 msg = (struct nd_msg *)skb_transport_header(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001591
Arnaldo Carvalho de Melo9c702202007-04-25 18:04:18 -07001592 __skb_push(skb, skb->data - skb_transport_header(skb));
Linus Torvalds1da177e2005-04-16 15:20:36 -07001593
Arnaldo Carvalho de Melo0660e032007-04-25 17:54:47 -07001594 if (ipv6_hdr(skb)->hop_limit != 255) {
Linus Torvalds1da177e2005-04-16 15:20:36 -07001595 ND_PRINTK2(KERN_WARNING
1596 "ICMPv6 NDISC: invalid hop-limit: %d\n",
Arnaldo Carvalho de Melo0660e032007-04-25 17:54:47 -07001597 ipv6_hdr(skb)->hop_limit);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001598 return 0;
1599 }
1600
1601 if (msg->icmph.icmp6_code != 0) {
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +09001602 ND_PRINTK2(KERN_WARNING
Linus Torvalds1da177e2005-04-16 15:20:36 -07001603 "ICMPv6 NDISC: invalid ICMPv6 code: %d\n",
1604 msg->icmph.icmp6_code);
1605 return 0;
1606 }
1607
Patrick McHardya61bbcf2005-08-14 17:24:31 -07001608 memset(NEIGH_CB(skb), 0, sizeof(struct neighbour_cb));
1609
Linus Torvalds1da177e2005-04-16 15:20:36 -07001610 switch (msg->icmph.icmp6_type) {
1611 case NDISC_NEIGHBOUR_SOLICITATION:
1612 ndisc_recv_ns(skb);
1613 break;
1614
1615 case NDISC_NEIGHBOUR_ADVERTISEMENT:
1616 ndisc_recv_na(skb);
1617 break;
1618
1619 case NDISC_ROUTER_SOLICITATION:
1620 ndisc_recv_rs(skb);
1621 break;
1622
1623 case NDISC_ROUTER_ADVERTISEMENT:
1624 ndisc_router_discovery(skb);
1625 break;
1626
1627 case NDISC_REDIRECT:
1628 ndisc_redirect_rcv(skb);
1629 break;
Stephen Hemminger3ff50b72007-04-20 17:09:22 -07001630 }
Linus Torvalds1da177e2005-04-16 15:20:36 -07001631
1632 return 0;
1633}
1634
1635static int ndisc_netdev_event(struct notifier_block *this, unsigned long event, void *ptr)
1636{
1637 struct net_device *dev = ptr;
YOSHIFUJI Hideakic346dca2008-03-25 21:47:49 +09001638 struct net *net = dev_net(dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001639
1640 switch (event) {
1641 case NETDEV_CHANGEADDR:
1642 neigh_changeaddr(&nd_tbl, dev);
Daniel Lezcano5b7c9312008-03-03 23:28:58 -08001643 fib6_run_gc(~0UL, net);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001644 break;
1645 case NETDEV_DOWN:
1646 neigh_ifdown(&nd_tbl, dev);
Daniel Lezcano5b7c9312008-03-03 23:28:58 -08001647 fib6_run_gc(~0UL, net);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001648 break;
1649 default:
1650 break;
1651 }
1652
1653 return NOTIFY_DONE;
1654}
1655
1656static struct notifier_block ndisc_netdev_notifier = {
1657 .notifier_call = ndisc_netdev_event,
1658};
1659
1660#ifdef CONFIG_SYSCTL
1661static void ndisc_warn_deprecated_sysctl(struct ctl_table *ctl,
1662 const char *func, const char *dev_name)
1663{
1664 static char warncomm[TASK_COMM_LEN];
1665 static int warned;
1666 if (strcmp(warncomm, current->comm) && warned < 5) {
1667 strcpy(warncomm, current->comm);
1668 printk(KERN_WARNING
1669 "process `%s' is using deprecated sysctl (%s) "
1670 "net.ipv6.neigh.%s.%s; "
1671 "Use net.ipv6.neigh.%s.%s_ms "
1672 "instead.\n",
1673 warncomm, func,
1674 dev_name, ctl->procname,
1675 dev_name, ctl->procname);
1676 warned++;
1677 }
1678}
1679
1680int ndisc_ifinfo_sysctl_change(struct ctl_table *ctl, int write, struct file * filp, void __user *buffer, size_t *lenp, loff_t *ppos)
1681{
1682 struct net_device *dev = ctl->extra1;
1683 struct inet6_dev *idev;
1684 int ret;
1685
Eric W. Biedermand12af672007-10-18 03:05:25 -07001686 if ((strcmp(ctl->procname, "retrans_time") == 0) ||
1687 (strcmp(ctl->procname, "base_reachable_time") == 0))
Linus Torvalds1da177e2005-04-16 15:20:36 -07001688 ndisc_warn_deprecated_sysctl(ctl, "syscall", dev ? dev->name : "default");
1689
Eric W. Biedermand12af672007-10-18 03:05:25 -07001690 if (strcmp(ctl->procname, "retrans_time") == 0)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001691 ret = proc_dointvec(ctl, write, filp, buffer, lenp, ppos);
Eric W. Biedermand12af672007-10-18 03:05:25 -07001692
1693 else if (strcmp(ctl->procname, "base_reachable_time") == 0)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001694 ret = proc_dointvec_jiffies(ctl, write,
1695 filp, buffer, lenp, ppos);
Eric W. Biedermand12af672007-10-18 03:05:25 -07001696
1697 else if ((strcmp(ctl->procname, "retrans_time_ms") == 0) ||
YOSHIFUJI Hideakiad02ac12007-10-29 01:32:23 -07001698 (strcmp(ctl->procname, "base_reachable_time_ms") == 0))
Linus Torvalds1da177e2005-04-16 15:20:36 -07001699 ret = proc_dointvec_ms_jiffies(ctl, write,
1700 filp, buffer, lenp, ppos);
Eric W. Biedermand12af672007-10-18 03:05:25 -07001701 else
Linus Torvalds1da177e2005-04-16 15:20:36 -07001702 ret = -1;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001703
1704 if (write && ret == 0 && dev && (idev = in6_dev_get(dev)) != NULL) {
Eric W. Biedermand12af672007-10-18 03:05:25 -07001705 if (ctl->data == &idev->nd_parms->base_reachable_time)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001706 idev->nd_parms->reachable_time = neigh_rand_reach_time(idev->nd_parms->base_reachable_time);
1707 idev->tstamp = jiffies;
1708 inet6_ifinfo_notify(RTM_NEWLINK, idev);
1709 in6_dev_put(idev);
1710 }
1711 return ret;
1712}
1713
1714static int ndisc_ifinfo_sysctl_strategy(ctl_table *ctl, int __user *name,
1715 int nlen, void __user *oldval,
1716 size_t __user *oldlenp,
Alexey Dobriyan1f29bcd2006-12-10 02:19:10 -08001717 void __user *newval, size_t newlen)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001718{
1719 struct net_device *dev = ctl->extra1;
1720 struct inet6_dev *idev;
1721 int ret;
1722
1723 if (ctl->ctl_name == NET_NEIGH_RETRANS_TIME ||
1724 ctl->ctl_name == NET_NEIGH_REACHABLE_TIME)
1725 ndisc_warn_deprecated_sysctl(ctl, "procfs", dev ? dev->name : "default");
1726
1727 switch (ctl->ctl_name) {
1728 case NET_NEIGH_REACHABLE_TIME:
1729 ret = sysctl_jiffies(ctl, name, nlen,
Alexey Dobriyan1f29bcd2006-12-10 02:19:10 -08001730 oldval, oldlenp, newval, newlen);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001731 break;
1732 case NET_NEIGH_RETRANS_TIME_MS:
1733 case NET_NEIGH_REACHABLE_TIME_MS:
1734 ret = sysctl_ms_jiffies(ctl, name, nlen,
Alexey Dobriyan1f29bcd2006-12-10 02:19:10 -08001735 oldval, oldlenp, newval, newlen);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001736 break;
1737 default:
1738 ret = 0;
1739 }
1740
1741 if (newval && newlen && ret > 0 &&
1742 dev && (idev = in6_dev_get(dev)) != NULL) {
1743 if (ctl->ctl_name == NET_NEIGH_REACHABLE_TIME ||
1744 ctl->ctl_name == NET_NEIGH_REACHABLE_TIME_MS)
1745 idev->nd_parms->reachable_time = neigh_rand_reach_time(idev->nd_parms->base_reachable_time);
1746 idev->tstamp = jiffies;
1747 inet6_ifinfo_notify(RTM_NEWLINK, idev);
1748 in6_dev_put(idev);
1749 }
1750
1751 return ret;
1752}
1753
1754#endif
1755
Daniel Lezcano1762f7e2008-03-07 11:15:34 -08001756static int ndisc_net_init(struct net *net)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001757{
Daniel Lezcano1762f7e2008-03-07 11:15:34 -08001758 struct socket *sock;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001759 struct ipv6_pinfo *np;
1760 struct sock *sk;
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +09001761 int err;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001762
Daniel Lezcano1762f7e2008-03-07 11:15:34 -08001763 err = sock_create_kern(PF_INET6, SOCK_RAW, IPPROTO_ICMPV6, &sock);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001764 if (err < 0) {
1765 ND_PRINTK0(KERN_ERR
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +09001766 "ICMPv6 NDISC: Failed to initialize the control socket (err %d).\n",
Linus Torvalds1da177e2005-04-16 15:20:36 -07001767 err);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001768 return err;
1769 }
1770
Daniel Lezcano1762f7e2008-03-07 11:15:34 -08001771 net->ipv6.ndisc_sk = sk = sock->sk;
1772 sk_change_net(sk, net);
1773
Linus Torvalds1da177e2005-04-16 15:20:36 -07001774 np = inet6_sk(sk);
1775 sk->sk_allocation = GFP_ATOMIC;
1776 np->hop_limit = 255;
1777 /* Do not loopback ndisc messages */
1778 np->mc_loop = 0;
1779 sk->sk_prot->unhash(sk);
1780
Daniel Lezcano1762f7e2008-03-07 11:15:34 -08001781 return 0;
1782}
1783
1784static void ndisc_net_exit(struct net *net)
1785{
1786 sk_release_kernel(net->ipv6.ndisc_sk);
1787}
1788
1789static struct pernet_operations ndisc_net_ops = {
1790 .init = ndisc_net_init,
1791 .exit = ndisc_net_exit,
1792};
1793
1794int __init ndisc_init(void)
1795{
1796 int err;
1797
1798 err = register_pernet_subsys(&ndisc_net_ops);
1799 if (err)
1800 return err;
YOSHIFUJI Hideaki1ab14572007-02-09 23:24:49 +09001801 /*
1802 * Initialize the neighbour table
1803 */
Linus Torvalds1da177e2005-04-16 15:20:36 -07001804 neigh_table_init(&nd_tbl);
1805
1806#ifdef CONFIG_SYSCTL
Daniel Lezcano1762f7e2008-03-07 11:15:34 -08001807 err = neigh_sysctl_register(NULL, &nd_tbl.parms, NET_IPV6,
1808 NET_IPV6_NEIGH, "ipv6",
1809 &ndisc_ifinfo_sysctl_change,
1810 &ndisc_ifinfo_sysctl_strategy);
1811 if (err)
1812 goto out_unregister_pernet;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001813#endif
Daniel Lezcano1762f7e2008-03-07 11:15:34 -08001814 err = register_netdevice_notifier(&ndisc_netdev_notifier);
1815 if (err)
1816 goto out_unregister_sysctl;
1817out:
1818 return err;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001819
Daniel Lezcano1762f7e2008-03-07 11:15:34 -08001820out_unregister_sysctl:
1821#ifdef CONFIG_SYSCTL
1822 neigh_sysctl_unregister(&nd_tbl.parms);
1823out_unregister_pernet:
1824#endif
1825 unregister_pernet_subsys(&ndisc_net_ops);
1826 goto out;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001827}
1828
1829void ndisc_cleanup(void)
1830{
Dmitry Mishin36f73d02006-11-03 16:08:19 -08001831 unregister_netdevice_notifier(&ndisc_netdev_notifier);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001832#ifdef CONFIG_SYSCTL
1833 neigh_sysctl_unregister(&nd_tbl.parms);
1834#endif
1835 neigh_table_clear(&nd_tbl);
Daniel Lezcano1762f7e2008-03-07 11:15:34 -08001836 unregister_pernet_subsys(&ndisc_net_ops);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001837}