blob: 25c8a42965dff1d3eeea77f8ac8dad2809c33e28 [file] [log] [blame]
Linus Torvalds1da177e2005-04-16 15:20:36 -07001/*
2 * NET3 IP device support routines.
3 *
4 * Version: $Id: devinet.c,v 1.44 2001/10/31 21:55:54 davem Exp $
5 *
6 * This program is free software; you can redistribute it and/or
7 * modify it under the terms of the GNU General Public License
8 * as published by the Free Software Foundation; either version
9 * 2 of the License, or (at your option) any later version.
10 *
11 * Derived from the IP parts of dev.c 1.0.19
Jesper Juhl02c30a82005-05-05 16:16:16 -070012 * Authors: Ross Biro
Linus Torvalds1da177e2005-04-16 15:20:36 -070013 * Fred N. van Kempen, <waltje@uWalt.NL.Mugnet.ORG>
14 * Mark Evans, <evansmp@uhura.aston.ac.uk>
15 *
16 * Additional Authors:
17 * Alan Cox, <gw4pts@gw4pts.ampr.org>
18 * Alexey Kuznetsov, <kuznet@ms2.inr.ac.ru>
19 *
20 * Changes:
21 * Alexey Kuznetsov: pa_* fields are replaced with ifaddr
22 * lists.
23 * Cyrus Durgin: updated for kmod
24 * Matthias Andree: in devinet_ioctl, compare label and
25 * address (4.4BSD alias style support),
26 * fall back to comparing just the label
27 * if no match found.
28 */
29
Linus Torvalds1da177e2005-04-16 15:20:36 -070030
31#include <asm/uaccess.h>
32#include <asm/system.h>
33#include <linux/bitops.h>
Randy Dunlap4fc268d2006-01-11 12:17:47 -080034#include <linux/capability.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070035#include <linux/module.h>
36#include <linux/types.h>
37#include <linux/kernel.h>
38#include <linux/sched.h>
39#include <linux/string.h>
40#include <linux/mm.h>
41#include <linux/socket.h>
42#include <linux/sockios.h>
43#include <linux/in.h>
44#include <linux/errno.h>
45#include <linux/interrupt.h>
Thomas Graf18237302006-08-04 23:04:54 -070046#include <linux/if_addr.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070047#include <linux/if_ether.h>
48#include <linux/inet.h>
49#include <linux/netdevice.h>
50#include <linux/etherdevice.h>
51#include <linux/skbuff.h>
52#include <linux/rtnetlink.h>
53#include <linux/init.h>
54#include <linux/notifier.h>
55#include <linux/inetdevice.h>
56#include <linux/igmp.h>
57#ifdef CONFIG_SYSCTL
58#include <linux/sysctl.h>
59#endif
60#include <linux/kmod.h>
61
Arnaldo Carvalho de Melo14c85022005-12-27 02:43:12 -020062#include <net/arp.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070063#include <net/ip.h>
64#include <net/route.h>
65#include <net/ip_fib.h>
Thomas Graf5c753972006-08-04 23:03:53 -070066#include <net/netlink.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070067
68struct ipv4_devconf ipv4_devconf = {
69 .accept_redirects = 1,
70 .send_redirects = 1,
71 .secure_redirects = 1,
72 .shared_media = 1,
73};
74
75static struct ipv4_devconf ipv4_devconf_dflt = {
76 .accept_redirects = 1,
77 .send_redirects = 1,
78 .secure_redirects = 1,
79 .shared_media = 1,
80 .accept_source_route = 1,
81};
82
Thomas Graf5c753972006-08-04 23:03:53 -070083static struct nla_policy ifa_ipv4_policy[IFA_MAX+1] __read_mostly = {
84 [IFA_LOCAL] = { .type = NLA_U32 },
85 [IFA_ADDRESS] = { .type = NLA_U32 },
86 [IFA_BROADCAST] = { .type = NLA_U32 },
87 [IFA_ANYCAST] = { .type = NLA_U32 },
Thomas Graf5176f912006-08-26 20:13:18 -070088 [IFA_LABEL] = { .type = NLA_STRING, .len = IFNAMSIZ - 1 },
Thomas Graf5c753972006-08-04 23:03:53 -070089};
90
Thomas Grafd6062cb2006-08-15 00:33:59 -070091static void rtmsg_ifa(int event, struct in_ifaddr *, struct nlmsghdr *, u32);
Linus Torvalds1da177e2005-04-16 15:20:36 -070092
Alan Sterne041c682006-03-27 01:16:30 -080093static BLOCKING_NOTIFIER_HEAD(inetaddr_chain);
Linus Torvalds1da177e2005-04-16 15:20:36 -070094static void inet_del_ifa(struct in_device *in_dev, struct in_ifaddr **ifap,
95 int destroy);
96#ifdef CONFIG_SYSCTL
97static void devinet_sysctl_register(struct in_device *in_dev,
98 struct ipv4_devconf *p);
99static void devinet_sysctl_unregister(struct ipv4_devconf *p);
100#endif
101
102/* Locks all the inet devices. */
103
104static struct in_ifaddr *inet_alloc_ifa(void)
105{
Panagiotis Issaris0da974f2006-07-21 14:51:30 -0700106 struct in_ifaddr *ifa = kzalloc(sizeof(*ifa), GFP_KERNEL);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700107
108 if (ifa) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700109 INIT_RCU_HEAD(&ifa->rcu_head);
110 }
111
112 return ifa;
113}
114
115static void inet_rcu_free_ifa(struct rcu_head *head)
116{
117 struct in_ifaddr *ifa = container_of(head, struct in_ifaddr, rcu_head);
118 if (ifa->ifa_dev)
119 in_dev_put(ifa->ifa_dev);
120 kfree(ifa);
121}
122
123static inline void inet_free_ifa(struct in_ifaddr *ifa)
124{
125 call_rcu(&ifa->rcu_head, inet_rcu_free_ifa);
126}
127
128void in_dev_finish_destroy(struct in_device *idev)
129{
130 struct net_device *dev = idev->dev;
131
132 BUG_TRAP(!idev->ifa_list);
133 BUG_TRAP(!idev->mc_list);
134#ifdef NET_REFCNT_DEBUG
135 printk(KERN_DEBUG "in_dev_finish_destroy: %p=%s\n",
136 idev, dev ? dev->name : "NIL");
137#endif
138 dev_put(dev);
139 if (!idev->dead)
140 printk("Freeing alive in_device %p\n", idev);
141 else {
142 kfree(idev);
143 }
144}
145
146struct in_device *inetdev_init(struct net_device *dev)
147{
148 struct in_device *in_dev;
149
150 ASSERT_RTNL();
151
Panagiotis Issaris0da974f2006-07-21 14:51:30 -0700152 in_dev = kzalloc(sizeof(*in_dev), GFP_KERNEL);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700153 if (!in_dev)
154 goto out;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700155 INIT_RCU_HEAD(&in_dev->rcu_head);
156 memcpy(&in_dev->cnf, &ipv4_devconf_dflt, sizeof(in_dev->cnf));
157 in_dev->cnf.sysctl = NULL;
158 in_dev->dev = dev;
159 if ((in_dev->arp_parms = neigh_parms_alloc(dev, &arp_tbl)) == NULL)
160 goto out_kfree;
161 /* Reference in_dev->dev */
162 dev_hold(dev);
163#ifdef CONFIG_SYSCTL
164 neigh_sysctl_register(dev, in_dev->arp_parms, NET_IPV4,
165 NET_IPV4_NEIGH, "ipv4", NULL, NULL);
166#endif
167
David L Stevens30c4cf52007-01-04 12:31:14 -0800168 /* Account for reference dev->ip_ptr (below) */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700169 in_dev_hold(in_dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700170
171#ifdef CONFIG_SYSCTL
172 devinet_sysctl_register(in_dev, &in_dev->cnf);
173#endif
174 ip_mc_init_dev(in_dev);
175 if (dev->flags & IFF_UP)
176 ip_mc_up(in_dev);
177out:
David L Stevens30c4cf52007-01-04 12:31:14 -0800178 /* we can receive as soon as ip_ptr is set -- do this last */
179 rcu_assign_pointer(dev->ip_ptr, in_dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700180 return in_dev;
181out_kfree:
182 kfree(in_dev);
183 in_dev = NULL;
184 goto out;
185}
186
187static void in_dev_rcu_put(struct rcu_head *head)
188{
189 struct in_device *idev = container_of(head, struct in_device, rcu_head);
190 in_dev_put(idev);
191}
192
193static void inetdev_destroy(struct in_device *in_dev)
194{
195 struct in_ifaddr *ifa;
196 struct net_device *dev;
197
198 ASSERT_RTNL();
199
200 dev = in_dev->dev;
201 if (dev == &loopback_dev)
202 return;
203
204 in_dev->dead = 1;
205
206 ip_mc_destroy_dev(in_dev);
207
208 while ((ifa = in_dev->ifa_list) != NULL) {
209 inet_del_ifa(in_dev, &in_dev->ifa_list, 0);
210 inet_free_ifa(ifa);
211 }
212
213#ifdef CONFIG_SYSCTL
214 devinet_sysctl_unregister(&in_dev->cnf);
215#endif
216
217 dev->ip_ptr = NULL;
218
219#ifdef CONFIG_SYSCTL
220 neigh_sysctl_unregister(in_dev->arp_parms);
221#endif
222 neigh_parms_release(&arp_tbl, in_dev->arp_parms);
223 arp_ifdown(dev);
224
225 call_rcu(&in_dev->rcu_head, in_dev_rcu_put);
226}
227
Al Viroff428d72006-09-26 22:13:35 -0700228int inet_addr_onlink(struct in_device *in_dev, __be32 a, __be32 b)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700229{
230 rcu_read_lock();
231 for_primary_ifa(in_dev) {
232 if (inet_ifa_match(a, ifa)) {
233 if (!b || inet_ifa_match(b, ifa)) {
234 rcu_read_unlock();
235 return 1;
236 }
237 }
238 } endfor_ifa(in_dev);
239 rcu_read_unlock();
240 return 0;
241}
242
Thomas Grafd6062cb2006-08-15 00:33:59 -0700243static void __inet_del_ifa(struct in_device *in_dev, struct in_ifaddr **ifap,
244 int destroy, struct nlmsghdr *nlh, u32 pid)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700245{
Harald Welte8f937c62005-05-29 20:23:46 -0700246 struct in_ifaddr *promote = NULL;
Jamal Hadi Salim0ff60a42005-11-22 14:47:37 -0800247 struct in_ifaddr *ifa, *ifa1 = *ifap;
248 struct in_ifaddr *last_prim = in_dev->ifa_list;
249 struct in_ifaddr *prev_prom = NULL;
250 int do_promote = IN_DEV_PROMOTE_SECONDARIES(in_dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700251
252 ASSERT_RTNL();
253
Harald Welte8f937c62005-05-29 20:23:46 -0700254 /* 1. Deleting primary ifaddr forces deletion all secondaries
255 * unless alias promotion is set
256 **/
Linus Torvalds1da177e2005-04-16 15:20:36 -0700257
258 if (!(ifa1->ifa_flags & IFA_F_SECONDARY)) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700259 struct in_ifaddr **ifap1 = &ifa1->ifa_next;
260
261 while ((ifa = *ifap1) != NULL) {
Jamal Hadi Salim0ff60a42005-11-22 14:47:37 -0800262 if (!(ifa->ifa_flags & IFA_F_SECONDARY) &&
263 ifa1->ifa_scope <= ifa->ifa_scope)
264 last_prim = ifa;
265
Linus Torvalds1da177e2005-04-16 15:20:36 -0700266 if (!(ifa->ifa_flags & IFA_F_SECONDARY) ||
267 ifa1->ifa_mask != ifa->ifa_mask ||
268 !inet_ifa_match(ifa1->ifa_address, ifa)) {
269 ifap1 = &ifa->ifa_next;
Jamal Hadi Salim0ff60a42005-11-22 14:47:37 -0800270 prev_prom = ifa;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700271 continue;
272 }
273
Jamal Hadi Salim0ff60a42005-11-22 14:47:37 -0800274 if (!do_promote) {
Harald Welte8f937c62005-05-29 20:23:46 -0700275 *ifap1 = ifa->ifa_next;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700276
Thomas Grafd6062cb2006-08-15 00:33:59 -0700277 rtmsg_ifa(RTM_DELADDR, ifa, nlh, pid);
Alan Sterne041c682006-03-27 01:16:30 -0800278 blocking_notifier_call_chain(&inetaddr_chain,
279 NETDEV_DOWN, ifa);
Harald Welte8f937c62005-05-29 20:23:46 -0700280 inet_free_ifa(ifa);
281 } else {
282 promote = ifa;
283 break;
284 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700285 }
286 }
287
288 /* 2. Unlink it */
289
290 *ifap = ifa1->ifa_next;
291
292 /* 3. Announce address deletion */
293
294 /* Send message first, then call notifier.
295 At first sight, FIB update triggered by notifier
296 will refer to already deleted ifaddr, that could confuse
297 netlink listeners. It is not true: look, gated sees
298 that route deleted and if it still thinks that ifaddr
299 is valid, it will try to restore deleted routes... Grr.
300 So that, this order is correct.
301 */
Thomas Grafd6062cb2006-08-15 00:33:59 -0700302 rtmsg_ifa(RTM_DELADDR, ifa1, nlh, pid);
Alan Sterne041c682006-03-27 01:16:30 -0800303 blocking_notifier_call_chain(&inetaddr_chain, NETDEV_DOWN, ifa1);
Jamal Hadi Salim0ff60a42005-11-22 14:47:37 -0800304
305 if (promote) {
306
307 if (prev_prom) {
308 prev_prom->ifa_next = promote->ifa_next;
309 promote->ifa_next = last_prim->ifa_next;
310 last_prim->ifa_next = promote;
311 }
312
313 promote->ifa_flags &= ~IFA_F_SECONDARY;
Thomas Grafd6062cb2006-08-15 00:33:59 -0700314 rtmsg_ifa(RTM_NEWADDR, promote, nlh, pid);
Alan Sterne041c682006-03-27 01:16:30 -0800315 blocking_notifier_call_chain(&inetaddr_chain,
316 NETDEV_UP, promote);
Jamal Hadi Salim0ff60a42005-11-22 14:47:37 -0800317 for (ifa = promote->ifa_next; ifa; ifa = ifa->ifa_next) {
318 if (ifa1->ifa_mask != ifa->ifa_mask ||
319 !inet_ifa_match(ifa1->ifa_address, ifa))
320 continue;
321 fib_add_ifaddr(ifa);
322 }
323
324 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700325 if (destroy) {
326 inet_free_ifa(ifa1);
327
328 if (!in_dev->ifa_list)
329 inetdev_destroy(in_dev);
330 }
331}
332
Thomas Grafd6062cb2006-08-15 00:33:59 -0700333static void inet_del_ifa(struct in_device *in_dev, struct in_ifaddr **ifap,
334 int destroy)
335{
336 __inet_del_ifa(in_dev, ifap, destroy, NULL, 0);
337}
338
339static int __inet_insert_ifa(struct in_ifaddr *ifa, struct nlmsghdr *nlh,
340 u32 pid)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700341{
342 struct in_device *in_dev = ifa->ifa_dev;
343 struct in_ifaddr *ifa1, **ifap, **last_primary;
344
345 ASSERT_RTNL();
346
347 if (!ifa->ifa_local) {
348 inet_free_ifa(ifa);
349 return 0;
350 }
351
352 ifa->ifa_flags &= ~IFA_F_SECONDARY;
353 last_primary = &in_dev->ifa_list;
354
355 for (ifap = &in_dev->ifa_list; (ifa1 = *ifap) != NULL;
356 ifap = &ifa1->ifa_next) {
357 if (!(ifa1->ifa_flags & IFA_F_SECONDARY) &&
358 ifa->ifa_scope <= ifa1->ifa_scope)
359 last_primary = &ifa1->ifa_next;
360 if (ifa1->ifa_mask == ifa->ifa_mask &&
361 inet_ifa_match(ifa1->ifa_address, ifa)) {
362 if (ifa1->ifa_local == ifa->ifa_local) {
363 inet_free_ifa(ifa);
364 return -EEXIST;
365 }
366 if (ifa1->ifa_scope != ifa->ifa_scope) {
367 inet_free_ifa(ifa);
368 return -EINVAL;
369 }
370 ifa->ifa_flags |= IFA_F_SECONDARY;
371 }
372 }
373
374 if (!(ifa->ifa_flags & IFA_F_SECONDARY)) {
375 net_srandom(ifa->ifa_local);
376 ifap = last_primary;
377 }
378
379 ifa->ifa_next = *ifap;
380 *ifap = ifa;
381
382 /* Send message first, then call notifier.
383 Notifier will trigger FIB update, so that
384 listeners of netlink will know about new ifaddr */
Thomas Grafd6062cb2006-08-15 00:33:59 -0700385 rtmsg_ifa(RTM_NEWADDR, ifa, nlh, pid);
Alan Sterne041c682006-03-27 01:16:30 -0800386 blocking_notifier_call_chain(&inetaddr_chain, NETDEV_UP, ifa);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700387
388 return 0;
389}
390
Thomas Grafd6062cb2006-08-15 00:33:59 -0700391static int inet_insert_ifa(struct in_ifaddr *ifa)
392{
393 return __inet_insert_ifa(ifa, NULL, 0);
394}
395
Linus Torvalds1da177e2005-04-16 15:20:36 -0700396static int inet_set_ifa(struct net_device *dev, struct in_ifaddr *ifa)
397{
Herbert Xue5ed6392005-10-03 14:35:55 -0700398 struct in_device *in_dev = __in_dev_get_rtnl(dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700399
400 ASSERT_RTNL();
401
402 if (!in_dev) {
403 in_dev = inetdev_init(dev);
404 if (!in_dev) {
405 inet_free_ifa(ifa);
406 return -ENOBUFS;
407 }
408 }
409 if (ifa->ifa_dev != in_dev) {
410 BUG_TRAP(!ifa->ifa_dev);
411 in_dev_hold(in_dev);
412 ifa->ifa_dev = in_dev;
413 }
414 if (LOOPBACK(ifa->ifa_local))
415 ifa->ifa_scope = RT_SCOPE_HOST;
416 return inet_insert_ifa(ifa);
417}
418
419struct in_device *inetdev_by_index(int ifindex)
420{
421 struct net_device *dev;
422 struct in_device *in_dev = NULL;
423 read_lock(&dev_base_lock);
424 dev = __dev_get_by_index(ifindex);
425 if (dev)
426 in_dev = in_dev_get(dev);
427 read_unlock(&dev_base_lock);
428 return in_dev;
429}
430
431/* Called only from RTNL semaphored context. No locks. */
432
Al Viro60cad5d2006-09-26 22:17:09 -0700433struct in_ifaddr *inet_ifa_byprefix(struct in_device *in_dev, __be32 prefix,
434 __be32 mask)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700435{
436 ASSERT_RTNL();
437
438 for_primary_ifa(in_dev) {
439 if (ifa->ifa_mask == mask && inet_ifa_match(prefix, ifa))
440 return ifa;
441 } endfor_ifa(in_dev);
442 return NULL;
443}
444
445static int inet_rtm_deladdr(struct sk_buff *skb, struct nlmsghdr *nlh, void *arg)
446{
Thomas Grafdfdd5fd2006-08-04 23:04:17 -0700447 struct nlattr *tb[IFA_MAX+1];
Linus Torvalds1da177e2005-04-16 15:20:36 -0700448 struct in_device *in_dev;
Thomas Grafdfdd5fd2006-08-04 23:04:17 -0700449 struct ifaddrmsg *ifm;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700450 struct in_ifaddr *ifa, **ifap;
Thomas Grafdfdd5fd2006-08-04 23:04:17 -0700451 int err = -EINVAL;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700452
453 ASSERT_RTNL();
454
Thomas Grafdfdd5fd2006-08-04 23:04:17 -0700455 err = nlmsg_parse(nlh, sizeof(*ifm), tb, IFA_MAX, ifa_ipv4_policy);
456 if (err < 0)
457 goto errout;
458
459 ifm = nlmsg_data(nlh);
460 in_dev = inetdev_by_index(ifm->ifa_index);
461 if (in_dev == NULL) {
462 err = -ENODEV;
463 goto errout;
464 }
465
Linus Torvalds1da177e2005-04-16 15:20:36 -0700466 __in_dev_put(in_dev);
467
468 for (ifap = &in_dev->ifa_list; (ifa = *ifap) != NULL;
469 ifap = &ifa->ifa_next) {
Thomas Grafdfdd5fd2006-08-04 23:04:17 -0700470 if (tb[IFA_LOCAL] &&
Al Viroa7a628c2006-09-26 22:16:43 -0700471 ifa->ifa_local != nla_get_be32(tb[IFA_LOCAL]))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700472 continue;
Thomas Grafdfdd5fd2006-08-04 23:04:17 -0700473
474 if (tb[IFA_LABEL] && nla_strcmp(tb[IFA_LABEL], ifa->ifa_label))
475 continue;
476
477 if (tb[IFA_ADDRESS] &&
478 (ifm->ifa_prefixlen != ifa->ifa_prefixlen ||
Al Viroa7a628c2006-09-26 22:16:43 -0700479 !inet_ifa_match(nla_get_be32(tb[IFA_ADDRESS]), ifa)))
Thomas Grafdfdd5fd2006-08-04 23:04:17 -0700480 continue;
481
Thomas Grafd6062cb2006-08-15 00:33:59 -0700482 __inet_del_ifa(in_dev, ifap, 1, nlh, NETLINK_CB(skb).pid);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700483 return 0;
484 }
Thomas Grafdfdd5fd2006-08-04 23:04:17 -0700485
486 err = -EADDRNOTAVAIL;
487errout:
488 return err;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700489}
490
Thomas Graf5c753972006-08-04 23:03:53 -0700491static struct in_ifaddr *rtm_to_ifaddr(struct nlmsghdr *nlh)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700492{
Thomas Graf5c753972006-08-04 23:03:53 -0700493 struct nlattr *tb[IFA_MAX+1];
494 struct in_ifaddr *ifa;
495 struct ifaddrmsg *ifm;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700496 struct net_device *dev;
497 struct in_device *in_dev;
Thomas Graf5c753972006-08-04 23:03:53 -0700498 int err = -EINVAL;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700499
Thomas Graf5c753972006-08-04 23:03:53 -0700500 err = nlmsg_parse(nlh, sizeof(*ifm), tb, IFA_MAX, ifa_ipv4_policy);
501 if (err < 0)
502 goto errout;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700503
Thomas Graf5c753972006-08-04 23:03:53 -0700504 ifm = nlmsg_data(nlh);
505 if (ifm->ifa_prefixlen > 32 || tb[IFA_LOCAL] == NULL)
506 goto errout;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700507
Thomas Graf5c753972006-08-04 23:03:53 -0700508 dev = __dev_get_by_index(ifm->ifa_index);
509 if (dev == NULL) {
510 err = -ENODEV;
511 goto errout;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700512 }
513
Thomas Graf5c753972006-08-04 23:03:53 -0700514 in_dev = __in_dev_get_rtnl(dev);
515 if (in_dev == NULL) {
516 in_dev = inetdev_init(dev);
517 if (in_dev == NULL) {
518 err = -ENOBUFS;
519 goto errout;
520 }
521 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700522
Thomas Graf5c753972006-08-04 23:03:53 -0700523 ifa = inet_alloc_ifa();
524 if (ifa == NULL) {
525 /*
526 * A potential indev allocation can be left alive, it stays
527 * assigned to its device and is destroy with it.
528 */
529 err = -ENOBUFS;
530 goto errout;
531 }
532
533 in_dev_hold(in_dev);
534
535 if (tb[IFA_ADDRESS] == NULL)
536 tb[IFA_ADDRESS] = tb[IFA_LOCAL];
537
Linus Torvalds1da177e2005-04-16 15:20:36 -0700538 ifa->ifa_prefixlen = ifm->ifa_prefixlen;
539 ifa->ifa_mask = inet_make_mask(ifm->ifa_prefixlen);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700540 ifa->ifa_flags = ifm->ifa_flags;
541 ifa->ifa_scope = ifm->ifa_scope;
Thomas Graf5c753972006-08-04 23:03:53 -0700542 ifa->ifa_dev = in_dev;
543
Al Viroa7a628c2006-09-26 22:16:43 -0700544 ifa->ifa_local = nla_get_be32(tb[IFA_LOCAL]);
545 ifa->ifa_address = nla_get_be32(tb[IFA_ADDRESS]);
Thomas Graf5c753972006-08-04 23:03:53 -0700546
547 if (tb[IFA_BROADCAST])
Al Viroa7a628c2006-09-26 22:16:43 -0700548 ifa->ifa_broadcast = nla_get_be32(tb[IFA_BROADCAST]);
Thomas Graf5c753972006-08-04 23:03:53 -0700549
550 if (tb[IFA_ANYCAST])
Al Viroa7a628c2006-09-26 22:16:43 -0700551 ifa->ifa_anycast = nla_get_be32(tb[IFA_ANYCAST]);
Thomas Graf5c753972006-08-04 23:03:53 -0700552
553 if (tb[IFA_LABEL])
554 nla_strlcpy(ifa->ifa_label, tb[IFA_LABEL], IFNAMSIZ);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700555 else
556 memcpy(ifa->ifa_label, dev->name, IFNAMSIZ);
557
Thomas Graf5c753972006-08-04 23:03:53 -0700558 return ifa;
559
560errout:
561 return ERR_PTR(err);
562}
563
564static int inet_rtm_newaddr(struct sk_buff *skb, struct nlmsghdr *nlh, void *arg)
565{
566 struct in_ifaddr *ifa;
567
568 ASSERT_RTNL();
569
570 ifa = rtm_to_ifaddr(nlh);
571 if (IS_ERR(ifa))
572 return PTR_ERR(ifa);
573
Thomas Grafd6062cb2006-08-15 00:33:59 -0700574 return __inet_insert_ifa(ifa, nlh, NETLINK_CB(skb).pid);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700575}
576
577/*
578 * Determine a default network mask, based on the IP address.
579 */
580
Al Viro714e85b2006-11-14 20:51:49 -0800581static __inline__ int inet_abc_len(__be32 addr)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700582{
583 int rc = -1; /* Something else, probably a multicast. */
584
585 if (ZERONET(addr))
586 rc = 0;
587 else {
Al Viro714e85b2006-11-14 20:51:49 -0800588 __u32 haddr = ntohl(addr);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700589
Al Viro714e85b2006-11-14 20:51:49 -0800590 if (IN_CLASSA(haddr))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700591 rc = 8;
Al Viro714e85b2006-11-14 20:51:49 -0800592 else if (IN_CLASSB(haddr))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700593 rc = 16;
Al Viro714e85b2006-11-14 20:51:49 -0800594 else if (IN_CLASSC(haddr))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700595 rc = 24;
596 }
597
598 return rc;
599}
600
601
602int devinet_ioctl(unsigned int cmd, void __user *arg)
603{
604 struct ifreq ifr;
605 struct sockaddr_in sin_orig;
606 struct sockaddr_in *sin = (struct sockaddr_in *)&ifr.ifr_addr;
607 struct in_device *in_dev;
608 struct in_ifaddr **ifap = NULL;
609 struct in_ifaddr *ifa = NULL;
610 struct net_device *dev;
611 char *colon;
612 int ret = -EFAULT;
613 int tryaddrmatch = 0;
614
615 /*
616 * Fetch the caller's info block into kernel space
617 */
618
619 if (copy_from_user(&ifr, arg, sizeof(struct ifreq)))
620 goto out;
621 ifr.ifr_name[IFNAMSIZ - 1] = 0;
622
623 /* save original address for comparison */
624 memcpy(&sin_orig, sin, sizeof(*sin));
625
626 colon = strchr(ifr.ifr_name, ':');
627 if (colon)
628 *colon = 0;
629
630#ifdef CONFIG_KMOD
631 dev_load(ifr.ifr_name);
632#endif
633
634 switch(cmd) {
635 case SIOCGIFADDR: /* Get interface address */
636 case SIOCGIFBRDADDR: /* Get the broadcast address */
637 case SIOCGIFDSTADDR: /* Get the destination address */
638 case SIOCGIFNETMASK: /* Get the netmask for the interface */
639 /* Note that these ioctls will not sleep,
640 so that we do not impose a lock.
641 One day we will be forced to put shlock here (I mean SMP)
642 */
643 tryaddrmatch = (sin_orig.sin_family == AF_INET);
644 memset(sin, 0, sizeof(*sin));
645 sin->sin_family = AF_INET;
646 break;
647
648 case SIOCSIFFLAGS:
649 ret = -EACCES;
650 if (!capable(CAP_NET_ADMIN))
651 goto out;
652 break;
653 case SIOCSIFADDR: /* Set interface address (and family) */
654 case SIOCSIFBRDADDR: /* Set the broadcast address */
655 case SIOCSIFDSTADDR: /* Set the destination address */
656 case SIOCSIFNETMASK: /* Set the netmask for the interface */
657 ret = -EACCES;
658 if (!capable(CAP_NET_ADMIN))
659 goto out;
660 ret = -EINVAL;
661 if (sin->sin_family != AF_INET)
662 goto out;
663 break;
664 default:
665 ret = -EINVAL;
666 goto out;
667 }
668
669 rtnl_lock();
670
671 ret = -ENODEV;
672 if ((dev = __dev_get_by_name(ifr.ifr_name)) == NULL)
673 goto done;
674
675 if (colon)
676 *colon = ':';
677
Herbert Xue5ed6392005-10-03 14:35:55 -0700678 if ((in_dev = __in_dev_get_rtnl(dev)) != NULL) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700679 if (tryaddrmatch) {
680 /* Matthias Andree */
681 /* compare label and address (4.4BSD style) */
682 /* note: we only do this for a limited set of ioctls
683 and only if the original address family was AF_INET.
684 This is checked above. */
685 for (ifap = &in_dev->ifa_list; (ifa = *ifap) != NULL;
686 ifap = &ifa->ifa_next) {
687 if (!strcmp(ifr.ifr_name, ifa->ifa_label) &&
688 sin_orig.sin_addr.s_addr ==
689 ifa->ifa_address) {
690 break; /* found */
691 }
692 }
693 }
694 /* we didn't get a match, maybe the application is
695 4.3BSD-style and passed in junk so we fall back to
696 comparing just the label */
697 if (!ifa) {
698 for (ifap = &in_dev->ifa_list; (ifa = *ifap) != NULL;
699 ifap = &ifa->ifa_next)
700 if (!strcmp(ifr.ifr_name, ifa->ifa_label))
701 break;
702 }
703 }
704
705 ret = -EADDRNOTAVAIL;
706 if (!ifa && cmd != SIOCSIFADDR && cmd != SIOCSIFFLAGS)
707 goto done;
708
709 switch(cmd) {
710 case SIOCGIFADDR: /* Get interface address */
711 sin->sin_addr.s_addr = ifa->ifa_local;
712 goto rarok;
713
714 case SIOCGIFBRDADDR: /* Get the broadcast address */
715 sin->sin_addr.s_addr = ifa->ifa_broadcast;
716 goto rarok;
717
718 case SIOCGIFDSTADDR: /* Get the destination address */
719 sin->sin_addr.s_addr = ifa->ifa_address;
720 goto rarok;
721
722 case SIOCGIFNETMASK: /* Get the netmask for the interface */
723 sin->sin_addr.s_addr = ifa->ifa_mask;
724 goto rarok;
725
726 case SIOCSIFFLAGS:
727 if (colon) {
728 ret = -EADDRNOTAVAIL;
729 if (!ifa)
730 break;
731 ret = 0;
732 if (!(ifr.ifr_flags & IFF_UP))
733 inet_del_ifa(in_dev, ifap, 1);
734 break;
735 }
736 ret = dev_change_flags(dev, ifr.ifr_flags);
737 break;
738
739 case SIOCSIFADDR: /* Set interface address (and family) */
740 ret = -EINVAL;
741 if (inet_abc_len(sin->sin_addr.s_addr) < 0)
742 break;
743
744 if (!ifa) {
745 ret = -ENOBUFS;
746 if ((ifa = inet_alloc_ifa()) == NULL)
747 break;
748 if (colon)
749 memcpy(ifa->ifa_label, ifr.ifr_name, IFNAMSIZ);
750 else
751 memcpy(ifa->ifa_label, dev->name, IFNAMSIZ);
752 } else {
753 ret = 0;
754 if (ifa->ifa_local == sin->sin_addr.s_addr)
755 break;
756 inet_del_ifa(in_dev, ifap, 0);
757 ifa->ifa_broadcast = 0;
758 ifa->ifa_anycast = 0;
759 }
760
761 ifa->ifa_address = ifa->ifa_local = sin->sin_addr.s_addr;
762
763 if (!(dev->flags & IFF_POINTOPOINT)) {
764 ifa->ifa_prefixlen = inet_abc_len(ifa->ifa_address);
765 ifa->ifa_mask = inet_make_mask(ifa->ifa_prefixlen);
766 if ((dev->flags & IFF_BROADCAST) &&
767 ifa->ifa_prefixlen < 31)
768 ifa->ifa_broadcast = ifa->ifa_address |
769 ~ifa->ifa_mask;
770 } else {
771 ifa->ifa_prefixlen = 32;
772 ifa->ifa_mask = inet_make_mask(32);
773 }
774 ret = inet_set_ifa(dev, ifa);
775 break;
776
777 case SIOCSIFBRDADDR: /* Set the broadcast address */
778 ret = 0;
779 if (ifa->ifa_broadcast != sin->sin_addr.s_addr) {
780 inet_del_ifa(in_dev, ifap, 0);
781 ifa->ifa_broadcast = sin->sin_addr.s_addr;
782 inet_insert_ifa(ifa);
783 }
784 break;
785
786 case SIOCSIFDSTADDR: /* Set the destination address */
787 ret = 0;
788 if (ifa->ifa_address == sin->sin_addr.s_addr)
789 break;
790 ret = -EINVAL;
791 if (inet_abc_len(sin->sin_addr.s_addr) < 0)
792 break;
793 ret = 0;
794 inet_del_ifa(in_dev, ifap, 0);
795 ifa->ifa_address = sin->sin_addr.s_addr;
796 inet_insert_ifa(ifa);
797 break;
798
799 case SIOCSIFNETMASK: /* Set the netmask for the interface */
800
801 /*
802 * The mask we set must be legal.
803 */
804 ret = -EINVAL;
805 if (bad_mask(sin->sin_addr.s_addr, 0))
806 break;
807 ret = 0;
808 if (ifa->ifa_mask != sin->sin_addr.s_addr) {
Al Viroa144ea42006-09-28 18:00:55 -0700809 __be32 old_mask = ifa->ifa_mask;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700810 inet_del_ifa(in_dev, ifap, 0);
811 ifa->ifa_mask = sin->sin_addr.s_addr;
812 ifa->ifa_prefixlen = inet_mask_len(ifa->ifa_mask);
813
814 /* See if current broadcast address matches
815 * with current netmask, then recalculate
816 * the broadcast address. Otherwise it's a
817 * funny address, so don't touch it since
818 * the user seems to know what (s)he's doing...
819 */
820 if ((dev->flags & IFF_BROADCAST) &&
821 (ifa->ifa_prefixlen < 31) &&
822 (ifa->ifa_broadcast ==
David Engeldcab5e12005-10-21 22:09:16 -0500823 (ifa->ifa_local|~old_mask))) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700824 ifa->ifa_broadcast = (ifa->ifa_local |
825 ~sin->sin_addr.s_addr);
826 }
827 inet_insert_ifa(ifa);
828 }
829 break;
830 }
831done:
832 rtnl_unlock();
833out:
834 return ret;
835rarok:
836 rtnl_unlock();
837 ret = copy_to_user(arg, &ifr, sizeof(struct ifreq)) ? -EFAULT : 0;
838 goto out;
839}
840
841static int inet_gifconf(struct net_device *dev, char __user *buf, int len)
842{
Herbert Xue5ed6392005-10-03 14:35:55 -0700843 struct in_device *in_dev = __in_dev_get_rtnl(dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700844 struct in_ifaddr *ifa;
845 struct ifreq ifr;
846 int done = 0;
847
848 if (!in_dev || (ifa = in_dev->ifa_list) == NULL)
849 goto out;
850
851 for (; ifa; ifa = ifa->ifa_next) {
852 if (!buf) {
853 done += sizeof(ifr);
854 continue;
855 }
856 if (len < (int) sizeof(ifr))
857 break;
858 memset(&ifr, 0, sizeof(struct ifreq));
859 if (ifa->ifa_label)
860 strcpy(ifr.ifr_name, ifa->ifa_label);
861 else
862 strcpy(ifr.ifr_name, dev->name);
863
864 (*(struct sockaddr_in *)&ifr.ifr_addr).sin_family = AF_INET;
865 (*(struct sockaddr_in *)&ifr.ifr_addr).sin_addr.s_addr =
866 ifa->ifa_local;
867
868 if (copy_to_user(buf, &ifr, sizeof(struct ifreq))) {
869 done = -EFAULT;
870 break;
871 }
872 buf += sizeof(struct ifreq);
873 len -= sizeof(struct ifreq);
874 done += sizeof(struct ifreq);
875 }
876out:
877 return done;
878}
879
Al Viroa61ced52006-09-26 21:27:54 -0700880__be32 inet_select_addr(const struct net_device *dev, __be32 dst, int scope)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700881{
Al Viroa61ced52006-09-26 21:27:54 -0700882 __be32 addr = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700883 struct in_device *in_dev;
884
885 rcu_read_lock();
Herbert Xue5ed6392005-10-03 14:35:55 -0700886 in_dev = __in_dev_get_rcu(dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700887 if (!in_dev)
888 goto no_in_dev;
889
890 for_primary_ifa(in_dev) {
891 if (ifa->ifa_scope > scope)
892 continue;
893 if (!dst || inet_ifa_match(dst, ifa)) {
894 addr = ifa->ifa_local;
895 break;
896 }
897 if (!addr)
898 addr = ifa->ifa_local;
899 } endfor_ifa(in_dev);
900no_in_dev:
901 rcu_read_unlock();
902
903 if (addr)
904 goto out;
905
906 /* Not loopback addresses on loopback should be preferred
907 in this case. It is importnat that lo is the first interface
908 in dev_base list.
909 */
910 read_lock(&dev_base_lock);
911 rcu_read_lock();
912 for (dev = dev_base; dev; dev = dev->next) {
Herbert Xue5ed6392005-10-03 14:35:55 -0700913 if ((in_dev = __in_dev_get_rcu(dev)) == NULL)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700914 continue;
915
916 for_primary_ifa(in_dev) {
917 if (ifa->ifa_scope != RT_SCOPE_LINK &&
918 ifa->ifa_scope <= scope) {
919 addr = ifa->ifa_local;
920 goto out_unlock_both;
921 }
922 } endfor_ifa(in_dev);
923 }
924out_unlock_both:
925 read_unlock(&dev_base_lock);
926 rcu_read_unlock();
927out:
928 return addr;
929}
930
Al Viro60cad5d2006-09-26 22:17:09 -0700931static __be32 confirm_addr_indev(struct in_device *in_dev, __be32 dst,
932 __be32 local, int scope)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700933{
934 int same = 0;
Al Viroa144ea42006-09-28 18:00:55 -0700935 __be32 addr = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700936
937 for_ifa(in_dev) {
938 if (!addr &&
939 (local == ifa->ifa_local || !local) &&
940 ifa->ifa_scope <= scope) {
941 addr = ifa->ifa_local;
942 if (same)
943 break;
944 }
945 if (!same) {
946 same = (!local || inet_ifa_match(local, ifa)) &&
947 (!dst || inet_ifa_match(dst, ifa));
948 if (same && addr) {
949 if (local || !dst)
950 break;
951 /* Is the selected addr into dst subnet? */
952 if (inet_ifa_match(addr, ifa))
953 break;
954 /* No, then can we use new local src? */
955 if (ifa->ifa_scope <= scope) {
956 addr = ifa->ifa_local;
957 break;
958 }
959 /* search for large dst subnet for addr */
960 same = 0;
961 }
962 }
963 } endfor_ifa(in_dev);
964
965 return same? addr : 0;
966}
967
968/*
969 * Confirm that local IP address exists using wildcards:
970 * - dev: only on this interface, 0=any interface
971 * - dst: only in the same subnet as dst, 0=any dst
972 * - local: address, 0=autoselect the local address
973 * - scope: maximum allowed scope value for the local address
974 */
Al Viro60cad5d2006-09-26 22:17:09 -0700975__be32 inet_confirm_addr(const struct net_device *dev, __be32 dst, __be32 local, int scope)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700976{
Al Viro60cad5d2006-09-26 22:17:09 -0700977 __be32 addr = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700978 struct in_device *in_dev;
979
980 if (dev) {
981 rcu_read_lock();
Herbert Xue5ed6392005-10-03 14:35:55 -0700982 if ((in_dev = __in_dev_get_rcu(dev)))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700983 addr = confirm_addr_indev(in_dev, dst, local, scope);
984 rcu_read_unlock();
985
986 return addr;
987 }
988
989 read_lock(&dev_base_lock);
990 rcu_read_lock();
991 for (dev = dev_base; dev; dev = dev->next) {
Herbert Xue5ed6392005-10-03 14:35:55 -0700992 if ((in_dev = __in_dev_get_rcu(dev))) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700993 addr = confirm_addr_indev(in_dev, dst, local, scope);
994 if (addr)
995 break;
996 }
997 }
998 rcu_read_unlock();
999 read_unlock(&dev_base_lock);
1000
1001 return addr;
1002}
1003
1004/*
1005 * Device notifier
1006 */
1007
1008int register_inetaddr_notifier(struct notifier_block *nb)
1009{
Alan Sterne041c682006-03-27 01:16:30 -08001010 return blocking_notifier_chain_register(&inetaddr_chain, nb);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001011}
1012
1013int unregister_inetaddr_notifier(struct notifier_block *nb)
1014{
Alan Sterne041c682006-03-27 01:16:30 -08001015 return blocking_notifier_chain_unregister(&inetaddr_chain, nb);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001016}
1017
1018/* Rename ifa_labels for a device name change. Make some effort to preserve existing
1019 * alias numbering and to create unique labels if possible.
1020*/
1021static void inetdev_changename(struct net_device *dev, struct in_device *in_dev)
1022{
1023 struct in_ifaddr *ifa;
1024 int named = 0;
1025
1026 for (ifa = in_dev->ifa_list; ifa; ifa = ifa->ifa_next) {
1027 char old[IFNAMSIZ], *dot;
1028
1029 memcpy(old, ifa->ifa_label, IFNAMSIZ);
1030 memcpy(ifa->ifa_label, dev->name, IFNAMSIZ);
1031 if (named++ == 0)
1032 continue;
1033 dot = strchr(ifa->ifa_label, ':');
1034 if (dot == NULL) {
1035 sprintf(old, ":%d", named);
1036 dot = old;
1037 }
1038 if (strlen(dot) + strlen(dev->name) < IFNAMSIZ) {
1039 strcat(ifa->ifa_label, dot);
1040 } else {
1041 strcpy(ifa->ifa_label + (IFNAMSIZ - strlen(dot) - 1), dot);
1042 }
1043 }
1044}
1045
1046/* Called only under RTNL semaphore */
1047
1048static int inetdev_event(struct notifier_block *this, unsigned long event,
1049 void *ptr)
1050{
1051 struct net_device *dev = ptr;
Herbert Xue5ed6392005-10-03 14:35:55 -07001052 struct in_device *in_dev = __in_dev_get_rtnl(dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001053
1054 ASSERT_RTNL();
1055
1056 if (!in_dev) {
1057 if (event == NETDEV_REGISTER && dev == &loopback_dev) {
1058 in_dev = inetdev_init(dev);
1059 if (!in_dev)
1060 panic("devinet: Failed to create loopback\n");
1061 in_dev->cnf.no_xfrm = 1;
1062 in_dev->cnf.no_policy = 1;
1063 }
1064 goto out;
1065 }
1066
1067 switch (event) {
1068 case NETDEV_REGISTER:
1069 printk(KERN_DEBUG "inetdev_event: bug\n");
1070 dev->ip_ptr = NULL;
1071 break;
1072 case NETDEV_UP:
1073 if (dev->mtu < 68)
1074 break;
1075 if (dev == &loopback_dev) {
1076 struct in_ifaddr *ifa;
1077 if ((ifa = inet_alloc_ifa()) != NULL) {
1078 ifa->ifa_local =
1079 ifa->ifa_address = htonl(INADDR_LOOPBACK);
1080 ifa->ifa_prefixlen = 8;
1081 ifa->ifa_mask = inet_make_mask(8);
1082 in_dev_hold(in_dev);
1083 ifa->ifa_dev = in_dev;
1084 ifa->ifa_scope = RT_SCOPE_HOST;
1085 memcpy(ifa->ifa_label, dev->name, IFNAMSIZ);
1086 inet_insert_ifa(ifa);
1087 }
1088 }
1089 ip_mc_up(in_dev);
1090 break;
1091 case NETDEV_DOWN:
1092 ip_mc_down(in_dev);
1093 break;
1094 case NETDEV_CHANGEMTU:
1095 if (dev->mtu >= 68)
1096 break;
1097 /* MTU falled under 68, disable IP */
1098 case NETDEV_UNREGISTER:
1099 inetdev_destroy(in_dev);
1100 break;
1101 case NETDEV_CHANGENAME:
1102 /* Do not notify about label change, this event is
1103 * not interesting to applications using netlink.
1104 */
1105 inetdev_changename(dev, in_dev);
1106
1107#ifdef CONFIG_SYSCTL
1108 devinet_sysctl_unregister(&in_dev->cnf);
1109 neigh_sysctl_unregister(in_dev->arp_parms);
1110 neigh_sysctl_register(dev, in_dev->arp_parms, NET_IPV4,
1111 NET_IPV4_NEIGH, "ipv4", NULL, NULL);
1112 devinet_sysctl_register(in_dev, &in_dev->cnf);
1113#endif
1114 break;
1115 }
1116out:
1117 return NOTIFY_DONE;
1118}
1119
1120static struct notifier_block ip_netdev_notifier = {
1121 .notifier_call =inetdev_event,
1122};
1123
Thomas Graf339bf982006-11-10 14:10:15 -08001124static inline size_t inet_nlmsg_size(void)
1125{
1126 return NLMSG_ALIGN(sizeof(struct ifaddrmsg))
1127 + nla_total_size(4) /* IFA_ADDRESS */
1128 + nla_total_size(4) /* IFA_LOCAL */
1129 + nla_total_size(4) /* IFA_BROADCAST */
1130 + nla_total_size(4) /* IFA_ANYCAST */
1131 + nla_total_size(IFNAMSIZ); /* IFA_LABEL */
1132}
1133
Linus Torvalds1da177e2005-04-16 15:20:36 -07001134static int inet_fill_ifaddr(struct sk_buff *skb, struct in_ifaddr *ifa,
Jamal Hadi Salimb6544c02005-06-18 22:54:12 -07001135 u32 pid, u32 seq, int event, unsigned int flags)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001136{
1137 struct ifaddrmsg *ifm;
1138 struct nlmsghdr *nlh;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001139
Thomas Graf47f68512006-08-04 23:04:36 -07001140 nlh = nlmsg_put(skb, pid, seq, event, sizeof(*ifm), flags);
1141 if (nlh == NULL)
1142 return -ENOBUFS;
1143
1144 ifm = nlmsg_data(nlh);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001145 ifm->ifa_family = AF_INET;
1146 ifm->ifa_prefixlen = ifa->ifa_prefixlen;
1147 ifm->ifa_flags = ifa->ifa_flags|IFA_F_PERMANENT;
1148 ifm->ifa_scope = ifa->ifa_scope;
1149 ifm->ifa_index = ifa->ifa_dev->dev->ifindex;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001150
Thomas Graf47f68512006-08-04 23:04:36 -07001151 if (ifa->ifa_address)
Al Viroa7a628c2006-09-26 22:16:43 -07001152 NLA_PUT_BE32(skb, IFA_ADDRESS, ifa->ifa_address);
Thomas Graf47f68512006-08-04 23:04:36 -07001153
1154 if (ifa->ifa_local)
Al Viroa7a628c2006-09-26 22:16:43 -07001155 NLA_PUT_BE32(skb, IFA_LOCAL, ifa->ifa_local);
Thomas Graf47f68512006-08-04 23:04:36 -07001156
1157 if (ifa->ifa_broadcast)
Al Viroa7a628c2006-09-26 22:16:43 -07001158 NLA_PUT_BE32(skb, IFA_BROADCAST, ifa->ifa_broadcast);
Thomas Graf47f68512006-08-04 23:04:36 -07001159
1160 if (ifa->ifa_anycast)
Al Viroa7a628c2006-09-26 22:16:43 -07001161 NLA_PUT_BE32(skb, IFA_ANYCAST, ifa->ifa_anycast);
Thomas Graf47f68512006-08-04 23:04:36 -07001162
1163 if (ifa->ifa_label[0])
1164 NLA_PUT_STRING(skb, IFA_LABEL, ifa->ifa_label);
1165
1166 return nlmsg_end(skb, nlh);
1167
1168nla_put_failure:
1169 return nlmsg_cancel(skb, nlh);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001170}
1171
1172static int inet_dump_ifaddr(struct sk_buff *skb, struct netlink_callback *cb)
1173{
1174 int idx, ip_idx;
1175 struct net_device *dev;
1176 struct in_device *in_dev;
1177 struct in_ifaddr *ifa;
1178 int s_ip_idx, s_idx = cb->args[0];
1179
1180 s_ip_idx = ip_idx = cb->args[1];
1181 read_lock(&dev_base_lock);
1182 for (dev = dev_base, idx = 0; dev; dev = dev->next, idx++) {
1183 if (idx < s_idx)
1184 continue;
1185 if (idx > s_idx)
1186 s_ip_idx = 0;
1187 rcu_read_lock();
Herbert Xue5ed6392005-10-03 14:35:55 -07001188 if ((in_dev = __in_dev_get_rcu(dev)) == NULL) {
Linus Torvalds1da177e2005-04-16 15:20:36 -07001189 rcu_read_unlock();
1190 continue;
1191 }
1192
1193 for (ifa = in_dev->ifa_list, ip_idx = 0; ifa;
1194 ifa = ifa->ifa_next, ip_idx++) {
1195 if (ip_idx < s_ip_idx)
1196 continue;
1197 if (inet_fill_ifaddr(skb, ifa, NETLINK_CB(cb->skb).pid,
1198 cb->nlh->nlmsg_seq,
Jamal Hadi Salimb6544c02005-06-18 22:54:12 -07001199 RTM_NEWADDR, NLM_F_MULTI) <= 0) {
Linus Torvalds1da177e2005-04-16 15:20:36 -07001200 rcu_read_unlock();
1201 goto done;
1202 }
1203 }
1204 rcu_read_unlock();
1205 }
1206
1207done:
1208 read_unlock(&dev_base_lock);
1209 cb->args[0] = idx;
1210 cb->args[1] = ip_idx;
1211
1212 return skb->len;
1213}
1214
Thomas Grafd6062cb2006-08-15 00:33:59 -07001215static void rtmsg_ifa(int event, struct in_ifaddr* ifa, struct nlmsghdr *nlh,
1216 u32 pid)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001217{
Thomas Graf47f68512006-08-04 23:04:36 -07001218 struct sk_buff *skb;
Thomas Grafd6062cb2006-08-15 00:33:59 -07001219 u32 seq = nlh ? nlh->nlmsg_seq : 0;
1220 int err = -ENOBUFS;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001221
Thomas Graf339bf982006-11-10 14:10:15 -08001222 skb = nlmsg_new(inet_nlmsg_size(), GFP_KERNEL);
Thomas Graf47f68512006-08-04 23:04:36 -07001223 if (skb == NULL)
Thomas Grafd6062cb2006-08-15 00:33:59 -07001224 goto errout;
1225
1226 err = inet_fill_ifaddr(skb, ifa, pid, seq, event, 0);
Thomas Graf339bf982006-11-10 14:10:15 -08001227 /* failure implies BUG in inet_nlmsg_size() */
1228 BUG_ON(err < 0);
Thomas Grafd6062cb2006-08-15 00:33:59 -07001229
1230 err = rtnl_notify(skb, pid, RTNLGRP_IPV4_IFADDR, nlh, GFP_KERNEL);
1231errout:
1232 if (err < 0)
1233 rtnl_set_sk_err(RTNLGRP_IPV4_IFADDR, err);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001234}
1235
Thomas Grafdb46edc2005-05-03 14:29:39 -07001236static struct rtnetlink_link inet_rtnetlink_table[RTM_NR_MSGTYPES] = {
1237 [RTM_NEWADDR - RTM_BASE] = { .doit = inet_rtm_newaddr, },
1238 [RTM_DELADDR - RTM_BASE] = { .doit = inet_rtm_deladdr, },
1239 [RTM_GETADDR - RTM_BASE] = { .dumpit = inet_dump_ifaddr, },
1240 [RTM_NEWROUTE - RTM_BASE] = { .doit = inet_rtm_newroute, },
1241 [RTM_DELROUTE - RTM_BASE] = { .doit = inet_rtm_delroute, },
1242 [RTM_GETROUTE - RTM_BASE] = { .doit = inet_rtm_getroute,
1243 .dumpit = inet_dump_fib, },
Linus Torvalds1da177e2005-04-16 15:20:36 -07001244#ifdef CONFIG_IP_MULTIPLE_TABLES
Thomas Grafe1ef4bf2006-08-04 03:39:22 -07001245 [RTM_GETRULE - RTM_BASE] = { .dumpit = fib4_rules_dump, },
Linus Torvalds1da177e2005-04-16 15:20:36 -07001246#endif
1247};
1248
1249#ifdef CONFIG_SYSCTL
1250
1251void inet_forward_change(void)
1252{
1253 struct net_device *dev;
1254 int on = ipv4_devconf.forwarding;
1255
1256 ipv4_devconf.accept_redirects = !on;
1257 ipv4_devconf_dflt.forwarding = on;
1258
1259 read_lock(&dev_base_lock);
1260 for (dev = dev_base; dev; dev = dev->next) {
1261 struct in_device *in_dev;
1262 rcu_read_lock();
Herbert Xue5ed6392005-10-03 14:35:55 -07001263 in_dev = __in_dev_get_rcu(dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001264 if (in_dev)
1265 in_dev->cnf.forwarding = on;
1266 rcu_read_unlock();
1267 }
1268 read_unlock(&dev_base_lock);
1269
1270 rt_cache_flush(0);
1271}
1272
1273static int devinet_sysctl_forward(ctl_table *ctl, int write,
1274 struct file* filp, void __user *buffer,
1275 size_t *lenp, loff_t *ppos)
1276{
1277 int *valp = ctl->data;
1278 int val = *valp;
1279 int ret = proc_dointvec(ctl, write, filp, buffer, lenp, ppos);
1280
1281 if (write && *valp != val) {
1282 if (valp == &ipv4_devconf.forwarding)
1283 inet_forward_change();
1284 else if (valp != &ipv4_devconf_dflt.forwarding)
1285 rt_cache_flush(0);
1286 }
1287
1288 return ret;
1289}
1290
1291int ipv4_doint_and_flush(ctl_table *ctl, int write,
1292 struct file* filp, void __user *buffer,
1293 size_t *lenp, loff_t *ppos)
1294{
1295 int *valp = ctl->data;
1296 int val = *valp;
1297 int ret = proc_dointvec(ctl, write, filp, buffer, lenp, ppos);
1298
1299 if (write && *valp != val)
1300 rt_cache_flush(0);
1301
1302 return ret;
1303}
1304
1305int ipv4_doint_and_flush_strategy(ctl_table *table, int __user *name, int nlen,
1306 void __user *oldval, size_t __user *oldlenp,
Alexey Dobriyan1f29bcd2006-12-10 02:19:10 -08001307 void __user *newval, size_t newlen)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001308{
1309 int *valp = table->data;
1310 int new;
1311
1312 if (!newval || !newlen)
1313 return 0;
1314
1315 if (newlen != sizeof(int))
1316 return -EINVAL;
1317
1318 if (get_user(new, (int __user *)newval))
1319 return -EFAULT;
1320
1321 if (new == *valp)
1322 return 0;
1323
1324 if (oldval && oldlenp) {
1325 size_t len;
1326
1327 if (get_user(len, oldlenp))
1328 return -EFAULT;
1329
1330 if (len) {
1331 if (len > table->maxlen)
1332 len = table->maxlen;
1333 if (copy_to_user(oldval, valp, len))
1334 return -EFAULT;
1335 if (put_user(len, oldlenp))
1336 return -EFAULT;
1337 }
1338 }
1339
1340 *valp = new;
1341 rt_cache_flush(0);
1342 return 1;
1343}
1344
1345
1346static struct devinet_sysctl_table {
1347 struct ctl_table_header *sysctl_header;
1348 ctl_table devinet_vars[__NET_IPV4_CONF_MAX];
1349 ctl_table devinet_dev[2];
1350 ctl_table devinet_conf_dir[2];
1351 ctl_table devinet_proto_dir[2];
1352 ctl_table devinet_root_dir[2];
1353} devinet_sysctl = {
1354 .devinet_vars = {
1355 {
1356 .ctl_name = NET_IPV4_CONF_FORWARDING,
1357 .procname = "forwarding",
1358 .data = &ipv4_devconf.forwarding,
1359 .maxlen = sizeof(int),
1360 .mode = 0644,
1361 .proc_handler = &devinet_sysctl_forward,
1362 },
1363 {
1364 .ctl_name = NET_IPV4_CONF_MC_FORWARDING,
1365 .procname = "mc_forwarding",
1366 .data = &ipv4_devconf.mc_forwarding,
1367 .maxlen = sizeof(int),
1368 .mode = 0444,
1369 .proc_handler = &proc_dointvec,
1370 },
1371 {
1372 .ctl_name = NET_IPV4_CONF_ACCEPT_REDIRECTS,
1373 .procname = "accept_redirects",
1374 .data = &ipv4_devconf.accept_redirects,
1375 .maxlen = sizeof(int),
1376 .mode = 0644,
1377 .proc_handler = &proc_dointvec,
1378 },
1379 {
1380 .ctl_name = NET_IPV4_CONF_SECURE_REDIRECTS,
1381 .procname = "secure_redirects",
1382 .data = &ipv4_devconf.secure_redirects,
1383 .maxlen = sizeof(int),
1384 .mode = 0644,
1385 .proc_handler = &proc_dointvec,
1386 },
1387 {
1388 .ctl_name = NET_IPV4_CONF_SHARED_MEDIA,
1389 .procname = "shared_media",
1390 .data = &ipv4_devconf.shared_media,
1391 .maxlen = sizeof(int),
1392 .mode = 0644,
1393 .proc_handler = &proc_dointvec,
1394 },
1395 {
1396 .ctl_name = NET_IPV4_CONF_RP_FILTER,
1397 .procname = "rp_filter",
1398 .data = &ipv4_devconf.rp_filter,
1399 .maxlen = sizeof(int),
1400 .mode = 0644,
1401 .proc_handler = &proc_dointvec,
1402 },
1403 {
1404 .ctl_name = NET_IPV4_CONF_SEND_REDIRECTS,
1405 .procname = "send_redirects",
1406 .data = &ipv4_devconf.send_redirects,
1407 .maxlen = sizeof(int),
1408 .mode = 0644,
1409 .proc_handler = &proc_dointvec,
1410 },
1411 {
1412 .ctl_name = NET_IPV4_CONF_ACCEPT_SOURCE_ROUTE,
1413 .procname = "accept_source_route",
1414 .data = &ipv4_devconf.accept_source_route,
1415 .maxlen = sizeof(int),
1416 .mode = 0644,
1417 .proc_handler = &proc_dointvec,
1418 },
1419 {
1420 .ctl_name = NET_IPV4_CONF_PROXY_ARP,
1421 .procname = "proxy_arp",
1422 .data = &ipv4_devconf.proxy_arp,
1423 .maxlen = sizeof(int),
1424 .mode = 0644,
1425 .proc_handler = &proc_dointvec,
1426 },
1427 {
1428 .ctl_name = NET_IPV4_CONF_MEDIUM_ID,
1429 .procname = "medium_id",
1430 .data = &ipv4_devconf.medium_id,
1431 .maxlen = sizeof(int),
1432 .mode = 0644,
1433 .proc_handler = &proc_dointvec,
1434 },
1435 {
1436 .ctl_name = NET_IPV4_CONF_BOOTP_RELAY,
1437 .procname = "bootp_relay",
1438 .data = &ipv4_devconf.bootp_relay,
1439 .maxlen = sizeof(int),
1440 .mode = 0644,
1441 .proc_handler = &proc_dointvec,
1442 },
1443 {
1444 .ctl_name = NET_IPV4_CONF_LOG_MARTIANS,
1445 .procname = "log_martians",
1446 .data = &ipv4_devconf.log_martians,
1447 .maxlen = sizeof(int),
1448 .mode = 0644,
1449 .proc_handler = &proc_dointvec,
1450 },
1451 {
1452 .ctl_name = NET_IPV4_CONF_TAG,
1453 .procname = "tag",
1454 .data = &ipv4_devconf.tag,
1455 .maxlen = sizeof(int),
1456 .mode = 0644,
1457 .proc_handler = &proc_dointvec,
1458 },
1459 {
1460 .ctl_name = NET_IPV4_CONF_ARPFILTER,
1461 .procname = "arp_filter",
1462 .data = &ipv4_devconf.arp_filter,
1463 .maxlen = sizeof(int),
1464 .mode = 0644,
1465 .proc_handler = &proc_dointvec,
1466 },
1467 {
1468 .ctl_name = NET_IPV4_CONF_ARP_ANNOUNCE,
1469 .procname = "arp_announce",
1470 .data = &ipv4_devconf.arp_announce,
1471 .maxlen = sizeof(int),
1472 .mode = 0644,
1473 .proc_handler = &proc_dointvec,
1474 },
1475 {
1476 .ctl_name = NET_IPV4_CONF_ARP_IGNORE,
1477 .procname = "arp_ignore",
1478 .data = &ipv4_devconf.arp_ignore,
1479 .maxlen = sizeof(int),
1480 .mode = 0644,
1481 .proc_handler = &proc_dointvec,
1482 },
1483 {
Neil Hormanabd596a2006-03-20 22:39:47 -08001484 .ctl_name = NET_IPV4_CONF_ARP_ACCEPT,
1485 .procname = "arp_accept",
1486 .data = &ipv4_devconf.arp_accept,
1487 .maxlen = sizeof(int),
1488 .mode = 0644,
1489 .proc_handler = &proc_dointvec,
1490 },
1491 {
Linus Torvalds1da177e2005-04-16 15:20:36 -07001492 .ctl_name = NET_IPV4_CONF_NOXFRM,
1493 .procname = "disable_xfrm",
1494 .data = &ipv4_devconf.no_xfrm,
1495 .maxlen = sizeof(int),
1496 .mode = 0644,
1497 .proc_handler = &ipv4_doint_and_flush,
1498 .strategy = &ipv4_doint_and_flush_strategy,
1499 },
1500 {
1501 .ctl_name = NET_IPV4_CONF_NOPOLICY,
1502 .procname = "disable_policy",
1503 .data = &ipv4_devconf.no_policy,
1504 .maxlen = sizeof(int),
1505 .mode = 0644,
1506 .proc_handler = &ipv4_doint_and_flush,
1507 .strategy = &ipv4_doint_and_flush_strategy,
1508 },
1509 {
1510 .ctl_name = NET_IPV4_CONF_FORCE_IGMP_VERSION,
1511 .procname = "force_igmp_version",
1512 .data = &ipv4_devconf.force_igmp_version,
1513 .maxlen = sizeof(int),
1514 .mode = 0644,
1515 .proc_handler = &ipv4_doint_and_flush,
1516 .strategy = &ipv4_doint_and_flush_strategy,
1517 },
Harald Welte8f937c62005-05-29 20:23:46 -07001518 {
1519 .ctl_name = NET_IPV4_CONF_PROMOTE_SECONDARIES,
1520 .procname = "promote_secondaries",
1521 .data = &ipv4_devconf.promote_secondaries,
1522 .maxlen = sizeof(int),
1523 .mode = 0644,
1524 .proc_handler = &ipv4_doint_and_flush,
1525 .strategy = &ipv4_doint_and_flush_strategy,
1526 },
Linus Torvalds1da177e2005-04-16 15:20:36 -07001527 },
1528 .devinet_dev = {
1529 {
1530 .ctl_name = NET_PROTO_CONF_ALL,
1531 .procname = "all",
1532 .mode = 0555,
1533 .child = devinet_sysctl.devinet_vars,
1534 },
1535 },
1536 .devinet_conf_dir = {
1537 {
1538 .ctl_name = NET_IPV4_CONF,
1539 .procname = "conf",
1540 .mode = 0555,
1541 .child = devinet_sysctl.devinet_dev,
1542 },
1543 },
1544 .devinet_proto_dir = {
1545 {
1546 .ctl_name = NET_IPV4,
1547 .procname = "ipv4",
1548 .mode = 0555,
1549 .child = devinet_sysctl.devinet_conf_dir,
1550 },
1551 },
1552 .devinet_root_dir = {
1553 {
1554 .ctl_name = CTL_NET,
1555 .procname = "net",
1556 .mode = 0555,
1557 .child = devinet_sysctl.devinet_proto_dir,
1558 },
1559 },
1560};
1561
1562static void devinet_sysctl_register(struct in_device *in_dev,
1563 struct ipv4_devconf *p)
1564{
1565 int i;
1566 struct net_device *dev = in_dev ? in_dev->dev : NULL;
Arnaldo Carvalho de Melo42e5ea462006-11-17 11:18:20 -02001567 struct devinet_sysctl_table *t = kmemdup(&devinet_sysctl, sizeof(*t),
1568 GFP_KERNEL);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001569 char *dev_name = NULL;
1570
1571 if (!t)
1572 return;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001573 for (i = 0; i < ARRAY_SIZE(t->devinet_vars) - 1; i++) {
1574 t->devinet_vars[i].data += (char *)p - (char *)&ipv4_devconf;
1575 t->devinet_vars[i].de = NULL;
1576 }
1577
1578 if (dev) {
1579 dev_name = dev->name;
1580 t->devinet_dev[0].ctl_name = dev->ifindex;
1581 } else {
1582 dev_name = "default";
1583 t->devinet_dev[0].ctl_name = NET_PROTO_CONF_DEFAULT;
1584 }
1585
1586 /*
1587 * Make a copy of dev_name, because '.procname' is regarded as const
1588 * by sysctl and we wouldn't want anyone to change it under our feet
1589 * (see SIOCSIFNAME).
1590 */
Paulo Marques543537b2005-06-23 00:09:02 -07001591 dev_name = kstrdup(dev_name, GFP_KERNEL);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001592 if (!dev_name)
1593 goto free;
1594
1595 t->devinet_dev[0].procname = dev_name;
1596 t->devinet_dev[0].child = t->devinet_vars;
1597 t->devinet_dev[0].de = NULL;
1598 t->devinet_conf_dir[0].child = t->devinet_dev;
1599 t->devinet_conf_dir[0].de = NULL;
1600 t->devinet_proto_dir[0].child = t->devinet_conf_dir;
1601 t->devinet_proto_dir[0].de = NULL;
1602 t->devinet_root_dir[0].child = t->devinet_proto_dir;
1603 t->devinet_root_dir[0].de = NULL;
1604
1605 t->sysctl_header = register_sysctl_table(t->devinet_root_dir, 0);
1606 if (!t->sysctl_header)
1607 goto free_procname;
1608
1609 p->sysctl = t;
1610 return;
1611
1612 /* error path */
1613 free_procname:
1614 kfree(dev_name);
1615 free:
1616 kfree(t);
1617 return;
1618}
1619
1620static void devinet_sysctl_unregister(struct ipv4_devconf *p)
1621{
1622 if (p->sysctl) {
1623 struct devinet_sysctl_table *t = p->sysctl;
1624 p->sysctl = NULL;
1625 unregister_sysctl_table(t->sysctl_header);
1626 kfree(t->devinet_dev[0].procname);
1627 kfree(t);
1628 }
1629}
1630#endif
1631
1632void __init devinet_init(void)
1633{
1634 register_gifconf(PF_INET, inet_gifconf);
1635 register_netdevice_notifier(&ip_netdev_notifier);
1636 rtnetlink_links[PF_INET] = inet_rtnetlink_table;
1637#ifdef CONFIG_SYSCTL
1638 devinet_sysctl.sysctl_header =
1639 register_sysctl_table(devinet_sysctl.devinet_root_dir, 0);
1640 devinet_sysctl_register(NULL, &ipv4_devconf_dflt);
1641#endif
1642}
1643
Linus Torvalds1da177e2005-04-16 15:20:36 -07001644EXPORT_SYMBOL(in_dev_finish_destroy);
1645EXPORT_SYMBOL(inet_select_addr);
1646EXPORT_SYMBOL(inetdev_by_index);
1647EXPORT_SYMBOL(register_inetaddr_notifier);
1648EXPORT_SYMBOL(unregister_inetaddr_notifier);