blob: 82def2c1c65050db75ea0a7163d00d0bfa72582c [file] [log] [blame]
Linus Torvalds1da177e2005-04-16 15:20:36 -07001/*
2 * NET3 IP device support routines.
3 *
4 * Version: $Id: devinet.c,v 1.44 2001/10/31 21:55:54 davem Exp $
5 *
6 * This program is free software; you can redistribute it and/or
7 * modify it under the terms of the GNU General Public License
8 * as published by the Free Software Foundation; either version
9 * 2 of the License, or (at your option) any later version.
10 *
11 * Derived from the IP parts of dev.c 1.0.19
Jesper Juhl02c30a82005-05-05 16:16:16 -070012 * Authors: Ross Biro
Linus Torvalds1da177e2005-04-16 15:20:36 -070013 * Fred N. van Kempen, <waltje@uWalt.NL.Mugnet.ORG>
14 * Mark Evans, <evansmp@uhura.aston.ac.uk>
15 *
16 * Additional Authors:
17 * Alan Cox, <gw4pts@gw4pts.ampr.org>
18 * Alexey Kuznetsov, <kuznet@ms2.inr.ac.ru>
19 *
20 * Changes:
21 * Alexey Kuznetsov: pa_* fields are replaced with ifaddr
22 * lists.
23 * Cyrus Durgin: updated for kmod
24 * Matthias Andree: in devinet_ioctl, compare label and
25 * address (4.4BSD alias style support),
26 * fall back to comparing just the label
27 * if no match found.
28 */
29
Linus Torvalds1da177e2005-04-16 15:20:36 -070030
31#include <asm/uaccess.h>
32#include <asm/system.h>
33#include <linux/bitops.h>
Randy Dunlap4fc268d2006-01-11 12:17:47 -080034#include <linux/capability.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070035#include <linux/module.h>
36#include <linux/types.h>
37#include <linux/kernel.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070038#include <linux/string.h>
39#include <linux/mm.h>
40#include <linux/socket.h>
41#include <linux/sockios.h>
42#include <linux/in.h>
43#include <linux/errno.h>
44#include <linux/interrupt.h>
Thomas Graf18237302006-08-04 23:04:54 -070045#include <linux/if_addr.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070046#include <linux/if_ether.h>
47#include <linux/inet.h>
48#include <linux/netdevice.h>
49#include <linux/etherdevice.h>
50#include <linux/skbuff.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070051#include <linux/init.h>
52#include <linux/notifier.h>
53#include <linux/inetdevice.h>
54#include <linux/igmp.h>
55#ifdef CONFIG_SYSCTL
56#include <linux/sysctl.h>
57#endif
58#include <linux/kmod.h>
59
Arnaldo Carvalho de Melo14c85022005-12-27 02:43:12 -020060#include <net/arp.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070061#include <net/ip.h>
62#include <net/route.h>
63#include <net/ip_fib.h>
Thomas Graf63f34442007-03-22 11:55:17 -070064#include <net/rtnetlink.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070065
66struct ipv4_devconf ipv4_devconf = {
Herbert Xu42f811b2007-06-04 23:34:44 -070067 .data = {
68 [NET_IPV4_CONF_ACCEPT_REDIRECTS - 1] = 1,
69 [NET_IPV4_CONF_SEND_REDIRECTS - 1] = 1,
70 [NET_IPV4_CONF_SECURE_REDIRECTS - 1] = 1,
71 [NET_IPV4_CONF_SHARED_MEDIA - 1] = 1,
72 },
Linus Torvalds1da177e2005-04-16 15:20:36 -070073};
74
75static struct ipv4_devconf ipv4_devconf_dflt = {
Herbert Xu42f811b2007-06-04 23:34:44 -070076 .data = {
77 [NET_IPV4_CONF_ACCEPT_REDIRECTS - 1] = 1,
78 [NET_IPV4_CONF_SEND_REDIRECTS - 1] = 1,
79 [NET_IPV4_CONF_SECURE_REDIRECTS - 1] = 1,
80 [NET_IPV4_CONF_SHARED_MEDIA - 1] = 1,
81 [NET_IPV4_CONF_ACCEPT_SOURCE_ROUTE - 1] = 1,
82 },
Linus Torvalds1da177e2005-04-16 15:20:36 -070083};
84
/* Shorthand for IPV4_DEVCONF() applied to the ipv4_devconf_dflt template. */
#define IPV4_DEVCONF_DFLT(attr)	IPV4_DEVCONF(ipv4_devconf_dflt, attr)
86
Patrick McHardyef7c79e2007-06-05 12:38:30 -070087static const struct nla_policy ifa_ipv4_policy[IFA_MAX+1] = {
Thomas Graf5c753972006-08-04 23:03:53 -070088 [IFA_LOCAL] = { .type = NLA_U32 },
89 [IFA_ADDRESS] = { .type = NLA_U32 },
90 [IFA_BROADCAST] = { .type = NLA_U32 },
91 [IFA_ANYCAST] = { .type = NLA_U32 },
Thomas Graf5176f912006-08-26 20:13:18 -070092 [IFA_LABEL] = { .type = NLA_STRING, .len = IFNAMSIZ - 1 },
Thomas Graf5c753972006-08-04 23:03:53 -070093};
94
Thomas Grafd6062cb2006-08-15 00:33:59 -070095static void rtmsg_ifa(int event, struct in_ifaddr *, struct nlmsghdr *, u32);
Linus Torvalds1da177e2005-04-16 15:20:36 -070096
Alan Sterne041c682006-03-27 01:16:30 -080097static BLOCKING_NOTIFIER_HEAD(inetaddr_chain);
Linus Torvalds1da177e2005-04-16 15:20:36 -070098static void inet_del_ifa(struct in_device *in_dev, struct in_ifaddr **ifap,
99 int destroy);
100#ifdef CONFIG_SYSCTL
Pavel Emelyanov66f27a52007-12-02 00:55:54 +1100101static void devinet_sysctl_register(struct in_device *idev);
Pavel Emelyanov51602b22007-12-11 02:17:40 -0800102static void devinet_sysctl_unregister(struct in_device *idev);
103#else
104static inline void devinet_sysctl_register(struct in_device *idev)
105{
106}
107static inline void devinet_sysctl_unregister(struct in_device *idev)
108{
109}
Linus Torvalds1da177e2005-04-16 15:20:36 -0700110#endif
111
112/* Locks all the inet devices. */
113
114static struct in_ifaddr *inet_alloc_ifa(void)
115{
Panagiotis Issaris0da974f2006-07-21 14:51:30 -0700116 struct in_ifaddr *ifa = kzalloc(sizeof(*ifa), GFP_KERNEL);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700117
118 if (ifa) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700119 INIT_RCU_HEAD(&ifa->rcu_head);
120 }
121
122 return ifa;
123}
124
125static void inet_rcu_free_ifa(struct rcu_head *head)
126{
127 struct in_ifaddr *ifa = container_of(head, struct in_ifaddr, rcu_head);
128 if (ifa->ifa_dev)
129 in_dev_put(ifa->ifa_dev);
130 kfree(ifa);
131}
132
133static inline void inet_free_ifa(struct in_ifaddr *ifa)
134{
135 call_rcu(&ifa->rcu_head, inet_rcu_free_ifa);
136}
137
138void in_dev_finish_destroy(struct in_device *idev)
139{
140 struct net_device *dev = idev->dev;
141
142 BUG_TRAP(!idev->ifa_list);
143 BUG_TRAP(!idev->mc_list);
144#ifdef NET_REFCNT_DEBUG
145 printk(KERN_DEBUG "in_dev_finish_destroy: %p=%s\n",
146 idev, dev ? dev->name : "NIL");
147#endif
148 dev_put(dev);
149 if (!idev->dead)
150 printk("Freeing alive in_device %p\n", idev);
151 else {
152 kfree(idev);
153 }
154}
155
Herbert Xu71e27da2007-06-04 23:36:06 -0700156static struct in_device *inetdev_init(struct net_device *dev)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700157{
158 struct in_device *in_dev;
159
160 ASSERT_RTNL();
161
Panagiotis Issaris0da974f2006-07-21 14:51:30 -0700162 in_dev = kzalloc(sizeof(*in_dev), GFP_KERNEL);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700163 if (!in_dev)
164 goto out;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700165 INIT_RCU_HEAD(&in_dev->rcu_head);
166 memcpy(&in_dev->cnf, &ipv4_devconf_dflt, sizeof(in_dev->cnf));
167 in_dev->cnf.sysctl = NULL;
168 in_dev->dev = dev;
169 if ((in_dev->arp_parms = neigh_parms_alloc(dev, &arp_tbl)) == NULL)
170 goto out_kfree;
171 /* Reference in_dev->dev */
172 dev_hold(dev);
David L Stevens30c4cf52007-01-04 12:31:14 -0800173 /* Account for reference dev->ip_ptr (below) */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700174 in_dev_hold(in_dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700175
Pavel Emelyanov66f27a52007-12-02 00:55:54 +1100176 devinet_sysctl_register(in_dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700177 ip_mc_init_dev(in_dev);
178 if (dev->flags & IFF_UP)
179 ip_mc_up(in_dev);
Jarek Poplawski483479e2007-01-09 14:38:31 -0800180
David L Stevens30c4cf52007-01-04 12:31:14 -0800181 /* we can receive as soon as ip_ptr is set -- do this last */
182 rcu_assign_pointer(dev->ip_ptr, in_dev);
Jarek Poplawski483479e2007-01-09 14:38:31 -0800183out:
Linus Torvalds1da177e2005-04-16 15:20:36 -0700184 return in_dev;
185out_kfree:
186 kfree(in_dev);
187 in_dev = NULL;
188 goto out;
189}
190
191static void in_dev_rcu_put(struct rcu_head *head)
192{
193 struct in_device *idev = container_of(head, struct in_device, rcu_head);
194 in_dev_put(idev);
195}
196
197static void inetdev_destroy(struct in_device *in_dev)
198{
199 struct in_ifaddr *ifa;
200 struct net_device *dev;
201
202 ASSERT_RTNL();
203
204 dev = in_dev->dev;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700205
206 in_dev->dead = 1;
207
208 ip_mc_destroy_dev(in_dev);
209
210 while ((ifa = in_dev->ifa_list) != NULL) {
211 inet_del_ifa(in_dev, &in_dev->ifa_list, 0);
212 inet_free_ifa(ifa);
213 }
214
Linus Torvalds1da177e2005-04-16 15:20:36 -0700215 dev->ip_ptr = NULL;
216
Pavel Emelyanov51602b22007-12-11 02:17:40 -0800217 devinet_sysctl_unregister(in_dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700218 neigh_parms_release(&arp_tbl, in_dev->arp_parms);
219 arp_ifdown(dev);
220
221 call_rcu(&in_dev->rcu_head, in_dev_rcu_put);
222}
223
Al Viroff428d72006-09-26 22:13:35 -0700224int inet_addr_onlink(struct in_device *in_dev, __be32 a, __be32 b)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700225{
226 rcu_read_lock();
227 for_primary_ifa(in_dev) {
228 if (inet_ifa_match(a, ifa)) {
229 if (!b || inet_ifa_match(b, ifa)) {
230 rcu_read_unlock();
231 return 1;
232 }
233 }
234 } endfor_ifa(in_dev);
235 rcu_read_unlock();
236 return 0;
237}
238
/*
 * __inet_del_ifa - unlink the address *ifap from in_dev and announce it.
 *
 * in_dev:   device whose address list is modified
 * ifap:     the link (list head or some ->ifa_next) that currently points
 *           at the address to remove
 * destroy:  non-zero to also release the removed address with
 *           inet_free_ifa()
 * nlh, pid: handed unchanged to rtmsg_ifa() for the netlink messages
 *
 * When the removed address is a primary, its secondaries (same mask and
 * same subnet) are either all deleted or, if IN_DEV_PROMOTE_SECONDARIES()
 * is set for the device, the first one found is promoted to primary.
 * Asserts that RTNL is held.
 */
Thomas Grafd6062cb2006-08-15 00:33:59 -0700239static void __inet_del_ifa(struct in_device *in_dev, struct in_ifaddr **ifap,
240 int destroy, struct nlmsghdr *nlh, u32 pid)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700241{
Harald Welte8f937c62005-05-29 20:23:46 -0700242 struct in_ifaddr *promote = NULL;
Jamal Hadi Salim0ff60a42005-11-22 14:47:37 -0800243 struct in_ifaddr *ifa, *ifa1 = *ifap;
244 struct in_ifaddr *last_prim = in_dev->ifa_list;
245 struct in_ifaddr *prev_prom = NULL;
246 int do_promote = IN_DEV_PROMOTE_SECONDARIES(in_dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700247
248 ASSERT_RTNL();
249
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +0900250 /* 1. Deleting primary ifaddr forces deletion all secondaries
Harald Welte8f937c62005-05-29 20:23:46 -0700251 * unless alias promotion is set
252 **/
Linus Torvalds1da177e2005-04-16 15:20:36 -0700253
254 if (!(ifa1->ifa_flags & IFA_F_SECONDARY)) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700255 struct in_ifaddr **ifap1 = &ifa1->ifa_next;
256
257 while ((ifa = *ifap1) != NULL) {
/* Track the latest primary after ifa1 whose ifa_scope value is
 * >= ifa1's; a promoted address is re-linked right behind it. */
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +0900258 if (!(ifa->ifa_flags & IFA_F_SECONDARY) &&
Jamal Hadi Salim0ff60a42005-11-22 14:47:37 -0800259 ifa1->ifa_scope <= ifa->ifa_scope)
260 last_prim = ifa;
261
/* Entries that are not secondaries of ifa1's subnet are stepped
 * over; prev_prom remembers the last entry skipped this way. */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700262 if (!(ifa->ifa_flags & IFA_F_SECONDARY) ||
263 ifa1->ifa_mask != ifa->ifa_mask ||
264 !inet_ifa_match(ifa1->ifa_address, ifa)) {
265 ifap1 = &ifa->ifa_next;
Jamal Hadi Salim0ff60a42005-11-22 14:47:37 -0800266 prev_prom = ifa;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700267 continue;
268 }
269
/* Without promotion each matching secondary is unlinked, announced
 * and freed here; with promotion the first match is kept as the
 * candidate and the scan stops. */
Jamal Hadi Salim0ff60a42005-11-22 14:47:37 -0800270 if (!do_promote) {
Harald Welte8f937c62005-05-29 20:23:46 -0700271 *ifap1 = ifa->ifa_next;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700272
Thomas Grafd6062cb2006-08-15 00:33:59 -0700273 rtmsg_ifa(RTM_DELADDR, ifa, nlh, pid);
Alan Sterne041c682006-03-27 01:16:30 -0800274 blocking_notifier_call_chain(&inetaddr_chain,
275 NETDEV_DOWN, ifa);
Harald Welte8f937c62005-05-29 20:23:46 -0700276 inet_free_ifa(ifa);
277 } else {
278 promote = ifa;
279 break;
280 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700281 }
282 }
283
284 /* 2. Unlink it */
285
286 *ifap = ifa1->ifa_next;
287
288 /* 3. Announce address deletion */
289
290 /* Send message first, then call notifier.
291 At first sight, FIB update triggered by notifier
292 will refer to already deleted ifaddr, that could confuse
293 netlink listeners. It is not true: look, gated sees
294 that route deleted and if it still thinks that ifaddr
295 is valid, it will try to restore deleted routes... Grr.
296 So that, this order is correct.
297 */
Thomas Grafd6062cb2006-08-15 00:33:59 -0700298 rtmsg_ifa(RTM_DELADDR, ifa1, nlh, pid);
Alan Sterne041c682006-03-27 01:16:30 -0800299 blocking_notifier_call_chain(&inetaddr_chain, NETDEV_DOWN, ifa1);
Jamal Hadi Salim0ff60a42005-11-22 14:47:37 -0800300
301 if (promote) {
302
/* prev_prom is only set when at least one entry was stepped over
 * before the candidate; in that case the candidate is moved so that
 * it directly follows last_prim.  Otherwise it stays where it is. */
303 if (prev_prom) {
304 prev_prom->ifa_next = promote->ifa_next;
305 promote->ifa_next = last_prim->ifa_next;
306 last_prim->ifa_next = promote;
307 }
308
309 promote->ifa_flags &= ~IFA_F_SECONDARY;
Thomas Grafd6062cb2006-08-15 00:33:59 -0700310 rtmsg_ifa(RTM_NEWADDR, promote, nlh, pid);
Alan Sterne041c682006-03-27 01:16:30 -0800311 blocking_notifier_call_chain(&inetaddr_chain,
312 NETDEV_UP, promote);
/* Call fib_add_ifaddr() for every address behind the promoted one
 * that lies in ifa1's subnet (presumably to restore routes dropped
 * by the NETDEV_DOWN above -- confirm against the FIB notifier). */
Jamal Hadi Salim0ff60a42005-11-22 14:47:37 -0800313 for (ifa = promote->ifa_next; ifa; ifa = ifa->ifa_next) {
314 if (ifa1->ifa_mask != ifa->ifa_mask ||
315 !inet_ifa_match(ifa1->ifa_address, ifa))
316 continue;
317 fib_add_ifaddr(ifa);
318 }
319
320 }
Herbert Xu63630972007-06-07 18:35:38 -0700321 if (destroy)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700322 inet_free_ifa(ifa1);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700323}
324
Thomas Grafd6062cb2006-08-15 00:33:59 -0700325static void inet_del_ifa(struct in_device *in_dev, struct in_ifaddr **ifap,
326 int destroy)
327{
328 __inet_del_ifa(in_dev, ifap, destroy, NULL, 0);
329}
330
331static int __inet_insert_ifa(struct in_ifaddr *ifa, struct nlmsghdr *nlh,
332 u32 pid)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700333{
334 struct in_device *in_dev = ifa->ifa_dev;
335 struct in_ifaddr *ifa1, **ifap, **last_primary;
336
337 ASSERT_RTNL();
338
339 if (!ifa->ifa_local) {
340 inet_free_ifa(ifa);
341 return 0;
342 }
343
344 ifa->ifa_flags &= ~IFA_F_SECONDARY;
345 last_primary = &in_dev->ifa_list;
346
347 for (ifap = &in_dev->ifa_list; (ifa1 = *ifap) != NULL;
348 ifap = &ifa1->ifa_next) {
349 if (!(ifa1->ifa_flags & IFA_F_SECONDARY) &&
350 ifa->ifa_scope <= ifa1->ifa_scope)
351 last_primary = &ifa1->ifa_next;
352 if (ifa1->ifa_mask == ifa->ifa_mask &&
353 inet_ifa_match(ifa1->ifa_address, ifa)) {
354 if (ifa1->ifa_local == ifa->ifa_local) {
355 inet_free_ifa(ifa);
356 return -EEXIST;
357 }
358 if (ifa1->ifa_scope != ifa->ifa_scope) {
359 inet_free_ifa(ifa);
360 return -EINVAL;
361 }
362 ifa->ifa_flags |= IFA_F_SECONDARY;
363 }
364 }
365
366 if (!(ifa->ifa_flags & IFA_F_SECONDARY)) {
367 net_srandom(ifa->ifa_local);
368 ifap = last_primary;
369 }
370
371 ifa->ifa_next = *ifap;
372 *ifap = ifa;
373
374 /* Send message first, then call notifier.
375 Notifier will trigger FIB update, so that
376 listeners of netlink will know about new ifaddr */
Thomas Grafd6062cb2006-08-15 00:33:59 -0700377 rtmsg_ifa(RTM_NEWADDR, ifa, nlh, pid);
Alan Sterne041c682006-03-27 01:16:30 -0800378 blocking_notifier_call_chain(&inetaddr_chain, NETDEV_UP, ifa);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700379
380 return 0;
381}
382
Thomas Grafd6062cb2006-08-15 00:33:59 -0700383static int inet_insert_ifa(struct in_ifaddr *ifa)
384{
385 return __inet_insert_ifa(ifa, NULL, 0);
386}
387
Linus Torvalds1da177e2005-04-16 15:20:36 -0700388static int inet_set_ifa(struct net_device *dev, struct in_ifaddr *ifa)
389{
Herbert Xue5ed6392005-10-03 14:35:55 -0700390 struct in_device *in_dev = __in_dev_get_rtnl(dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700391
392 ASSERT_RTNL();
393
394 if (!in_dev) {
Herbert Xu71e27da2007-06-04 23:36:06 -0700395 inet_free_ifa(ifa);
396 return -ENOBUFS;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700397 }
Herbert Xu71e27da2007-06-04 23:36:06 -0700398 ipv4_devconf_setall(in_dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700399 if (ifa->ifa_dev != in_dev) {
400 BUG_TRAP(!ifa->ifa_dev);
401 in_dev_hold(in_dev);
402 ifa->ifa_dev = in_dev;
403 }
404 if (LOOPBACK(ifa->ifa_local))
405 ifa->ifa_scope = RT_SCOPE_HOST;
406 return inet_insert_ifa(ifa);
407}
408
409struct in_device *inetdev_by_index(int ifindex)
410{
411 struct net_device *dev;
412 struct in_device *in_dev = NULL;
413 read_lock(&dev_base_lock);
Eric W. Biederman881d9662007-09-17 11:56:21 -0700414 dev = __dev_get_by_index(&init_net, ifindex);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700415 if (dev)
416 in_dev = in_dev_get(dev);
417 read_unlock(&dev_base_lock);
418 return in_dev;
419}
420
421/* Called only from RTNL semaphored context. No locks. */
422
Al Viro60cad5d2006-09-26 22:17:09 -0700423struct in_ifaddr *inet_ifa_byprefix(struct in_device *in_dev, __be32 prefix,
424 __be32 mask)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700425{
426 ASSERT_RTNL();
427
428 for_primary_ifa(in_dev) {
429 if (ifa->ifa_mask == mask && inet_ifa_match(prefix, ifa))
430 return ifa;
431 } endfor_ifa(in_dev);
432 return NULL;
433}
434
435static int inet_rtm_deladdr(struct sk_buff *skb, struct nlmsghdr *nlh, void *arg)
436{
Denis V. Lunevb8542722007-12-01 00:21:31 +1100437 struct net *net = skb->sk->sk_net;
Thomas Grafdfdd5fd2006-08-04 23:04:17 -0700438 struct nlattr *tb[IFA_MAX+1];
Linus Torvalds1da177e2005-04-16 15:20:36 -0700439 struct in_device *in_dev;
Thomas Grafdfdd5fd2006-08-04 23:04:17 -0700440 struct ifaddrmsg *ifm;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700441 struct in_ifaddr *ifa, **ifap;
Thomas Grafdfdd5fd2006-08-04 23:04:17 -0700442 int err = -EINVAL;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700443
444 ASSERT_RTNL();
445
Denis V. Lunevb8542722007-12-01 00:21:31 +1100446 if (net != &init_net)
447 return -EINVAL;
448
Thomas Grafdfdd5fd2006-08-04 23:04:17 -0700449 err = nlmsg_parse(nlh, sizeof(*ifm), tb, IFA_MAX, ifa_ipv4_policy);
450 if (err < 0)
451 goto errout;
452
453 ifm = nlmsg_data(nlh);
454 in_dev = inetdev_by_index(ifm->ifa_index);
455 if (in_dev == NULL) {
456 err = -ENODEV;
457 goto errout;
458 }
459
Linus Torvalds1da177e2005-04-16 15:20:36 -0700460 __in_dev_put(in_dev);
461
462 for (ifap = &in_dev->ifa_list; (ifa = *ifap) != NULL;
463 ifap = &ifa->ifa_next) {
Thomas Grafdfdd5fd2006-08-04 23:04:17 -0700464 if (tb[IFA_LOCAL] &&
Al Viroa7a628c2006-09-26 22:16:43 -0700465 ifa->ifa_local != nla_get_be32(tb[IFA_LOCAL]))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700466 continue;
Thomas Grafdfdd5fd2006-08-04 23:04:17 -0700467
468 if (tb[IFA_LABEL] && nla_strcmp(tb[IFA_LABEL], ifa->ifa_label))
469 continue;
470
471 if (tb[IFA_ADDRESS] &&
472 (ifm->ifa_prefixlen != ifa->ifa_prefixlen ||
Al Viroa7a628c2006-09-26 22:16:43 -0700473 !inet_ifa_match(nla_get_be32(tb[IFA_ADDRESS]), ifa)))
Thomas Grafdfdd5fd2006-08-04 23:04:17 -0700474 continue;
475
Thomas Grafd6062cb2006-08-15 00:33:59 -0700476 __inet_del_ifa(in_dev, ifap, 1, nlh, NETLINK_CB(skb).pid);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700477 return 0;
478 }
Thomas Grafdfdd5fd2006-08-04 23:04:17 -0700479
480 err = -EADDRNOTAVAIL;
481errout:
482 return err;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700483}
484
Thomas Graf5c753972006-08-04 23:03:53 -0700485static struct in_ifaddr *rtm_to_ifaddr(struct nlmsghdr *nlh)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700486{
Thomas Graf5c753972006-08-04 23:03:53 -0700487 struct nlattr *tb[IFA_MAX+1];
488 struct in_ifaddr *ifa;
489 struct ifaddrmsg *ifm;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700490 struct net_device *dev;
491 struct in_device *in_dev;
Thomas Graf5c753972006-08-04 23:03:53 -0700492 int err = -EINVAL;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700493
Thomas Graf5c753972006-08-04 23:03:53 -0700494 err = nlmsg_parse(nlh, sizeof(*ifm), tb, IFA_MAX, ifa_ipv4_policy);
495 if (err < 0)
496 goto errout;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700497
Thomas Graf5c753972006-08-04 23:03:53 -0700498 ifm = nlmsg_data(nlh);
Evgeniy Polyakovc4e38f42007-03-09 13:43:24 -0800499 if (ifm->ifa_prefixlen > 32 || tb[IFA_LOCAL] == NULL) {
500 err = -EINVAL;
Thomas Graf5c753972006-08-04 23:03:53 -0700501 goto errout;
Evgeniy Polyakovc4e38f42007-03-09 13:43:24 -0800502 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700503
Eric W. Biederman881d9662007-09-17 11:56:21 -0700504 dev = __dev_get_by_index(&init_net, ifm->ifa_index);
Thomas Graf5c753972006-08-04 23:03:53 -0700505 if (dev == NULL) {
506 err = -ENODEV;
507 goto errout;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700508 }
509
Thomas Graf5c753972006-08-04 23:03:53 -0700510 in_dev = __in_dev_get_rtnl(dev);
511 if (in_dev == NULL) {
Herbert Xu71e27da2007-06-04 23:36:06 -0700512 err = -ENOBUFS;
513 goto errout;
Thomas Graf5c753972006-08-04 23:03:53 -0700514 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700515
Thomas Graf5c753972006-08-04 23:03:53 -0700516 ifa = inet_alloc_ifa();
517 if (ifa == NULL) {
518 /*
519 * A potential indev allocation can be left alive, it stays
520 * assigned to its device and is destroy with it.
521 */
522 err = -ENOBUFS;
523 goto errout;
524 }
525
Pavel Emelyanova4e65d32007-12-07 23:55:43 -0800526 ipv4_devconf_setall(in_dev);
Thomas Graf5c753972006-08-04 23:03:53 -0700527 in_dev_hold(in_dev);
528
529 if (tb[IFA_ADDRESS] == NULL)
530 tb[IFA_ADDRESS] = tb[IFA_LOCAL];
531
Linus Torvalds1da177e2005-04-16 15:20:36 -0700532 ifa->ifa_prefixlen = ifm->ifa_prefixlen;
533 ifa->ifa_mask = inet_make_mask(ifm->ifa_prefixlen);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700534 ifa->ifa_flags = ifm->ifa_flags;
535 ifa->ifa_scope = ifm->ifa_scope;
Thomas Graf5c753972006-08-04 23:03:53 -0700536 ifa->ifa_dev = in_dev;
537
Al Viroa7a628c2006-09-26 22:16:43 -0700538 ifa->ifa_local = nla_get_be32(tb[IFA_LOCAL]);
539 ifa->ifa_address = nla_get_be32(tb[IFA_ADDRESS]);
Thomas Graf5c753972006-08-04 23:03:53 -0700540
541 if (tb[IFA_BROADCAST])
Al Viroa7a628c2006-09-26 22:16:43 -0700542 ifa->ifa_broadcast = nla_get_be32(tb[IFA_BROADCAST]);
Thomas Graf5c753972006-08-04 23:03:53 -0700543
544 if (tb[IFA_ANYCAST])
Al Viroa7a628c2006-09-26 22:16:43 -0700545 ifa->ifa_anycast = nla_get_be32(tb[IFA_ANYCAST]);
Thomas Graf5c753972006-08-04 23:03:53 -0700546
547 if (tb[IFA_LABEL])
548 nla_strlcpy(ifa->ifa_label, tb[IFA_LABEL], IFNAMSIZ);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700549 else
550 memcpy(ifa->ifa_label, dev->name, IFNAMSIZ);
551
Thomas Graf5c753972006-08-04 23:03:53 -0700552 return ifa;
553
554errout:
555 return ERR_PTR(err);
556}
557
558static int inet_rtm_newaddr(struct sk_buff *skb, struct nlmsghdr *nlh, void *arg)
559{
Denis V. Lunevb8542722007-12-01 00:21:31 +1100560 struct net *net = skb->sk->sk_net;
Thomas Graf5c753972006-08-04 23:03:53 -0700561 struct in_ifaddr *ifa;
562
563 ASSERT_RTNL();
564
Denis V. Lunevb8542722007-12-01 00:21:31 +1100565 if (net != &init_net)
566 return -EINVAL;
567
Thomas Graf5c753972006-08-04 23:03:53 -0700568 ifa = rtm_to_ifaddr(nlh);
569 if (IS_ERR(ifa))
570 return PTR_ERR(ifa);
571
Thomas Grafd6062cb2006-08-15 00:33:59 -0700572 return __inet_insert_ifa(ifa, nlh, NETLINK_CB(skb).pid);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700573}
574
575/*
576 * Determine a default network mask, based on the IP address.
577 */
578
Al Viro714e85b2006-11-14 20:51:49 -0800579static __inline__ int inet_abc_len(__be32 addr)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700580{
581 int rc = -1; /* Something else, probably a multicast. */
582
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +0900583 if (ZERONET(addr))
584 rc = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700585 else {
Al Viro714e85b2006-11-14 20:51:49 -0800586 __u32 haddr = ntohl(addr);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700587
Al Viro714e85b2006-11-14 20:51:49 -0800588 if (IN_CLASSA(haddr))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700589 rc = 8;
Al Viro714e85b2006-11-14 20:51:49 -0800590 else if (IN_CLASSB(haddr))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700591 rc = 16;
Al Viro714e85b2006-11-14 20:51:49 -0800592 else if (IN_CLASSC(haddr))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700593 rc = 24;
594 }
595
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +0900596 return rc;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700597}
598
599
/*
 * devinet_ioctl - handle the IPv4 interface address ioctls.
 *
 * cmd: one of SIOCGIFADDR, SIOCGIFBRDADDR, SIOCGIFDSTADDR, SIOCGIFNETMASK,
 *      SIOCSIFFLAGS, SIOCSIFADDR, SIOCSIFBRDADDR, SIOCSIFDSTADDR,
 *      SIOCSIFNETMASK; anything else yields -EINVAL
 * arg: user pointer to a struct ifreq; read for every command and written
 *      back for the four "get" commands
 *
 * The set commands and SIOCSIFFLAGS require CAP_NET_ADMIN (-EACCES);
 * the four address-setting commands additionally require an AF_INET
 * address (-EINVAL).
 * Device and address lookup and all modifications run under rtnl_lock().
 *
 * Returns 0 on success or a negative errno: -EFAULT on a failed user copy,
 * -ENODEV for an unknown device, -EADDRNOTAVAIL when no address matches,
 * -ENOBUFS when a new address cannot be allocated or attached.
 */
600int devinet_ioctl(unsigned int cmd, void __user *arg)
601{
602 struct ifreq ifr;
603 struct sockaddr_in sin_orig;
604 struct sockaddr_in *sin = (struct sockaddr_in *)&ifr.ifr_addr;
605 struct in_device *in_dev;
606 struct in_ifaddr **ifap = NULL;
607 struct in_ifaddr *ifa = NULL;
608 struct net_device *dev;
609 char *colon;
610 int ret = -EFAULT;
611 int tryaddrmatch = 0;
612
613 /*
614 * Fetch the caller's info block into kernel space
615 */
616
617 if (copy_from_user(&ifr, arg, sizeof(struct ifreq)))
618 goto out;
/* Force NUL termination of the user-supplied interface name. */
619 ifr.ifr_name[IFNAMSIZ - 1] = 0;
620
621 /* save original address for comparison */
622 memcpy(&sin_orig, sin, sizeof(*sin));
623
/* Cut an alias label ("name:suffix") at the colon so that the device
 * lookup below sees the base name; the colon is put back afterwards. */
624 colon = strchr(ifr.ifr_name, ':');
625 if (colon)
626 *colon = 0;
627
628#ifdef CONFIG_KMOD
Eric W. Biederman881d9662007-09-17 11:56:21 -0700629 dev_load(&init_net, ifr.ifr_name);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700630#endif
631
/* First pass over cmd: permission and argument checks only. */
Stephen Hemminger132adf52007-03-08 20:44:43 -0800632 switch (cmd) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700633 case SIOCGIFADDR: /* Get interface address */
634 case SIOCGIFBRDADDR: /* Get the broadcast address */
635 case SIOCGIFDSTADDR: /* Get the destination address */
636 case SIOCGIFNETMASK: /* Get the netmask for the interface */
637 /* Note that these ioctls will not sleep,
638 so that we do not impose a lock.
639 One day we will be forced to put shlock here (I mean SMP)
640 */
/* Address matching is only attempted if the caller passed AF_INET;
 * the reply buffer is then reset to an empty AF_INET sockaddr. */
641 tryaddrmatch = (sin_orig.sin_family == AF_INET);
642 memset(sin, 0, sizeof(*sin));
643 sin->sin_family = AF_INET;
644 break;
645
646 case SIOCSIFFLAGS:
647 ret = -EACCES;
648 if (!capable(CAP_NET_ADMIN))
649 goto out;
650 break;
651 case SIOCSIFADDR: /* Set interface address (and family) */
652 case SIOCSIFBRDADDR: /* Set the broadcast address */
653 case SIOCSIFDSTADDR: /* Set the destination address */
654 case SIOCSIFNETMASK: /* Set the netmask for the interface */
655 ret = -EACCES;
656 if (!capable(CAP_NET_ADMIN))
657 goto out;
658 ret = -EINVAL;
659 if (sin->sin_family != AF_INET)
660 goto out;
661 break;
662 default:
663 ret = -EINVAL;
664 goto out;
665 }
666
667 rtnl_lock();
668
669 ret = -ENODEV;
Eric W. Biederman881d9662007-09-17 11:56:21 -0700670 if ((dev = __dev_get_by_name(&init_net, ifr.ifr_name)) == NULL)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700671 goto done;
672
/* Restore the full label for the comparisons against ifa_label. */
673 if (colon)
674 *colon = ':';
675
/* Locate the address; ifap is left pointing at the link that holds it
 * so that it can be unlinked later.  Both stay NULL/unmatched if the
 * device has no in_device. */
Herbert Xue5ed6392005-10-03 14:35:55 -0700676 if ((in_dev = __in_dev_get_rtnl(dev)) != NULL) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700677 if (tryaddrmatch) {
678 /* Matthias Andree */
679 /* compare label and address (4.4BSD style) */
680 /* note: we only do this for a limited set of ioctls
681 and only if the original address family was AF_INET.
682 This is checked above. */
683 for (ifap = &in_dev->ifa_list; (ifa = *ifap) != NULL;
684 ifap = &ifa->ifa_next) {
685 if (!strcmp(ifr.ifr_name, ifa->ifa_label) &&
686 sin_orig.sin_addr.s_addr ==
687 ifa->ifa_address) {
688 break; /* found */
689 }
690 }
691 }
692 /* we didn't get a match, maybe the application is
693 4.3BSD-style and passed in junk so we fall back to
694 comparing just the label */
695 if (!ifa) {
696 for (ifap = &in_dev->ifa_list; (ifa = *ifap) != NULL;
697 ifap = &ifa->ifa_next)
698 if (!strcmp(ifr.ifr_name, ifa->ifa_label))
699 break;
700 }
701 }
702
/* Only SIOCSIFADDR (creates the address) and SIOCSIFFLAGS (may act on
 * the device itself) can proceed without an existing address. */
703 ret = -EADDRNOTAVAIL;
704 if (!ifa && cmd != SIOCSIFADDR && cmd != SIOCSIFFLAGS)
705 goto done;
706
/* Second pass over cmd: do the work.  The get commands leave through
 * rarok, which copies ifr back to user space. */
Stephen Hemminger132adf52007-03-08 20:44:43 -0800707 switch (cmd) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700708 case SIOCGIFADDR: /* Get interface address */
709 sin->sin_addr.s_addr = ifa->ifa_local;
710 goto rarok;
711
712 case SIOCGIFBRDADDR: /* Get the broadcast address */
713 sin->sin_addr.s_addr = ifa->ifa_broadcast;
714 goto rarok;
715
716 case SIOCGIFDSTADDR: /* Get the destination address */
717 sin->sin_addr.s_addr = ifa->ifa_address;
718 goto rarok;
719
720 case SIOCGIFNETMASK: /* Get the netmask for the interface */
721 sin->sin_addr.s_addr = ifa->ifa_mask;
722 goto rarok;
723
724 case SIOCSIFFLAGS:
/* With an alias label the flags apply to that address only: clearing
 * IFF_UP deletes it.  Without one the device flags are changed. */
725 if (colon) {
726 ret = -EADDRNOTAVAIL;
727 if (!ifa)
728 break;
729 ret = 0;
730 if (!(ifr.ifr_flags & IFF_UP))
731 inet_del_ifa(in_dev, ifap, 1);
732 break;
733 }
734 ret = dev_change_flags(dev, ifr.ifr_flags);
735 break;
736
737 case SIOCSIFADDR: /* Set interface address (and family) */
738 ret = -EINVAL;
739 if (inet_abc_len(sin->sin_addr.s_addr) < 0)
740 break;
741
/* No address under this label yet: allocate one.  Otherwise unlink the
 * existing one (without freeing it) so that it can be re-inserted with
 * the new value; an unchanged address is a successful no-op. */
742 if (!ifa) {
743 ret = -ENOBUFS;
744 if ((ifa = inet_alloc_ifa()) == NULL)
745 break;
746 if (colon)
747 memcpy(ifa->ifa_label, ifr.ifr_name, IFNAMSIZ);
748 else
749 memcpy(ifa->ifa_label, dev->name, IFNAMSIZ);
750 } else {
751 ret = 0;
752 if (ifa->ifa_local == sin->sin_addr.s_addr)
753 break;
754 inet_del_ifa(in_dev, ifap, 0);
755 ifa->ifa_broadcast = 0;
756 ifa->ifa_anycast = 0;
757 }
758
759 ifa->ifa_address = ifa->ifa_local = sin->sin_addr.s_addr;
760
/* Non point-to-point devices get the classful default mask and, if
 * they are broadcast capable, the matching broadcast address;
 * point-to-point devices get a /32. */
761 if (!(dev->flags & IFF_POINTOPOINT)) {
762 ifa->ifa_prefixlen = inet_abc_len(ifa->ifa_address);
763 ifa->ifa_mask = inet_make_mask(ifa->ifa_prefixlen);
764 if ((dev->flags & IFF_BROADCAST) &&
765 ifa->ifa_prefixlen < 31)
766 ifa->ifa_broadcast = ifa->ifa_address |
767 ~ifa->ifa_mask;
768 } else {
769 ifa->ifa_prefixlen = 32;
770 ifa->ifa_mask = inet_make_mask(32);
771 }
772 ret = inet_set_ifa(dev, ifa);
773 break;
774
775 case SIOCSIFBRDADDR: /* Set the broadcast address */
776 ret = 0;
777 if (ifa->ifa_broadcast != sin->sin_addr.s_addr) {
778 inet_del_ifa(in_dev, ifap, 0);
779 ifa->ifa_broadcast = sin->sin_addr.s_addr;
/* NOTE(review): the result of inet_insert_ifa() is ignored here;
 * ret stays 0 even if the re-insert fails. */
780 inet_insert_ifa(ifa);
781 }
782 break;
783
784 case SIOCSIFDSTADDR: /* Set the destination address */
785 ret = 0;
786 if (ifa->ifa_address == sin->sin_addr.s_addr)
787 break;
788 ret = -EINVAL;
789 if (inet_abc_len(sin->sin_addr.s_addr) < 0)
790 break;
791 ret = 0;
792 inet_del_ifa(in_dev, ifap, 0);
793 ifa->ifa_address = sin->sin_addr.s_addr;
/* NOTE(review): the result of inet_insert_ifa() is ignored here too. */
794 inet_insert_ifa(ifa);
795 break;
796
797 case SIOCSIFNETMASK: /* Set the netmask for the interface */
798
799 /*
800 * The mask we set must be legal.
801 */
802 ret = -EINVAL;
803 if (bad_mask(sin->sin_addr.s_addr, 0))
804 break;
805 ret = 0;
806 if (ifa->ifa_mask != sin->sin_addr.s_addr) {
Al Viroa144ea42006-09-28 18:00:55 -0700807 __be32 old_mask = ifa->ifa_mask;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700808 inet_del_ifa(in_dev, ifap, 0);
809 ifa->ifa_mask = sin->sin_addr.s_addr;
810 ifa->ifa_prefixlen = inet_mask_len(ifa->ifa_mask);
811
812 /* See if current broadcast address matches
813 * with current netmask, then recalculate
814 * the broadcast address. Otherwise it's a
815 * funny address, so don't touch it since
816 * the user seems to know what (s)he's doing...
817 */
818 if ((dev->flags & IFF_BROADCAST) &&
819 (ifa->ifa_prefixlen < 31) &&
820 (ifa->ifa_broadcast ==
David Engeldcab5e12005-10-21 22:09:16 -0500821 (ifa->ifa_local|~old_mask))) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700822 ifa->ifa_broadcast = (ifa->ifa_local |
823 ~sin->sin_addr.s_addr);
824 }
/* NOTE(review): the result of inet_insert_ifa() is ignored here too. */
825 inet_insert_ifa(ifa);
826 }
827 break;
828 }
829done:
830 rtnl_unlock();
831out:
832 return ret;
/* Exit used by the get commands: unlock, then copy the reply out. */
833rarok:
834 rtnl_unlock();
835 ret = copy_to_user(arg, &ifr, sizeof(struct ifreq)) ? -EFAULT : 0;
836 goto out;
837}
838
839static int inet_gifconf(struct net_device *dev, char __user *buf, int len)
840{
Herbert Xue5ed6392005-10-03 14:35:55 -0700841 struct in_device *in_dev = __in_dev_get_rtnl(dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700842 struct in_ifaddr *ifa;
843 struct ifreq ifr;
844 int done = 0;
845
846 if (!in_dev || (ifa = in_dev->ifa_list) == NULL)
847 goto out;
848
849 for (; ifa; ifa = ifa->ifa_next) {
850 if (!buf) {
851 done += sizeof(ifr);
852 continue;
853 }
854 if (len < (int) sizeof(ifr))
855 break;
856 memset(&ifr, 0, sizeof(struct ifreq));
857 if (ifa->ifa_label)
858 strcpy(ifr.ifr_name, ifa->ifa_label);
859 else
860 strcpy(ifr.ifr_name, dev->name);
861
862 (*(struct sockaddr_in *)&ifr.ifr_addr).sin_family = AF_INET;
863 (*(struct sockaddr_in *)&ifr.ifr_addr).sin_addr.s_addr =
864 ifa->ifa_local;
865
866 if (copy_to_user(buf, &ifr, sizeof(struct ifreq))) {
867 done = -EFAULT;
868 break;
869 }
870 buf += sizeof(struct ifreq);
871 len -= sizeof(struct ifreq);
872 done += sizeof(struct ifreq);
873 }
874out:
875 return done;
876}
877
Al Viroa61ced52006-09-26 21:27:54 -0700878__be32 inet_select_addr(const struct net_device *dev, __be32 dst, int scope)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700879{
Al Viroa61ced52006-09-26 21:27:54 -0700880 __be32 addr = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700881 struct in_device *in_dev;
882
883 rcu_read_lock();
Herbert Xue5ed6392005-10-03 14:35:55 -0700884 in_dev = __in_dev_get_rcu(dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700885 if (!in_dev)
886 goto no_in_dev;
887
888 for_primary_ifa(in_dev) {
889 if (ifa->ifa_scope > scope)
890 continue;
891 if (!dst || inet_ifa_match(dst, ifa)) {
892 addr = ifa->ifa_local;
893 break;
894 }
895 if (!addr)
896 addr = ifa->ifa_local;
897 } endfor_ifa(in_dev);
898no_in_dev:
899 rcu_read_unlock();
900
901 if (addr)
902 goto out;
903
904 /* Not loopback addresses on loopback should be preferred
905 in this case. It is importnat that lo is the first interface
906 in dev_base list.
907 */
908 read_lock(&dev_base_lock);
909 rcu_read_lock();
Eric W. Biederman881d9662007-09-17 11:56:21 -0700910 for_each_netdev(&init_net, dev) {
Herbert Xue5ed6392005-10-03 14:35:55 -0700911 if ((in_dev = __in_dev_get_rcu(dev)) == NULL)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700912 continue;
913
914 for_primary_ifa(in_dev) {
915 if (ifa->ifa_scope != RT_SCOPE_LINK &&
916 ifa->ifa_scope <= scope) {
917 addr = ifa->ifa_local;
918 goto out_unlock_both;
919 }
920 } endfor_ifa(in_dev);
921 }
922out_unlock_both:
923 read_unlock(&dev_base_lock);
924 rcu_read_unlock();
925out:
926 return addr;
927}
928
Al Viro60cad5d2006-09-26 22:17:09 -0700929static __be32 confirm_addr_indev(struct in_device *in_dev, __be32 dst,
930 __be32 local, int scope)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700931{
932 int same = 0;
Al Viroa144ea42006-09-28 18:00:55 -0700933 __be32 addr = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700934
935 for_ifa(in_dev) {
936 if (!addr &&
937 (local == ifa->ifa_local || !local) &&
938 ifa->ifa_scope <= scope) {
939 addr = ifa->ifa_local;
940 if (same)
941 break;
942 }
943 if (!same) {
944 same = (!local || inet_ifa_match(local, ifa)) &&
945 (!dst || inet_ifa_match(dst, ifa));
946 if (same && addr) {
947 if (local || !dst)
948 break;
949 /* Is the selected addr into dst subnet? */
950 if (inet_ifa_match(addr, ifa))
951 break;
952 /* No, then can we use new local src? */
953 if (ifa->ifa_scope <= scope) {
954 addr = ifa->ifa_local;
955 break;
956 }
957 /* search for large dst subnet for addr */
958 same = 0;
959 }
960 }
961 } endfor_ifa(in_dev);
962
963 return same? addr : 0;
964}
965
966/*
967 * Confirm that local IP address exists using wildcards:
968 * - dev: only on this interface, 0=any interface
969 * - dst: only in the same subnet as dst, 0=any dst
970 * - local: address, 0=autoselect the local address
971 * - scope: maximum allowed scope value for the local address
972 */
Al Viro60cad5d2006-09-26 22:17:09 -0700973__be32 inet_confirm_addr(const struct net_device *dev, __be32 dst, __be32 local, int scope)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700974{
Al Viro60cad5d2006-09-26 22:17:09 -0700975 __be32 addr = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700976 struct in_device *in_dev;
977
978 if (dev) {
979 rcu_read_lock();
Herbert Xue5ed6392005-10-03 14:35:55 -0700980 if ((in_dev = __in_dev_get_rcu(dev)))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700981 addr = confirm_addr_indev(in_dev, dst, local, scope);
982 rcu_read_unlock();
983
984 return addr;
985 }
986
987 read_lock(&dev_base_lock);
988 rcu_read_lock();
Eric W. Biederman881d9662007-09-17 11:56:21 -0700989 for_each_netdev(&init_net, dev) {
Herbert Xue5ed6392005-10-03 14:35:55 -0700990 if ((in_dev = __in_dev_get_rcu(dev))) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700991 addr = confirm_addr_indev(in_dev, dst, local, scope);
992 if (addr)
993 break;
994 }
995 }
996 rcu_read_unlock();
997 read_unlock(&dev_base_lock);
998
999 return addr;
1000}
1001
1002/*
1003 * Device notifier
1004 */
1005
1006int register_inetaddr_notifier(struct notifier_block *nb)
1007{
Alan Sterne041c682006-03-27 01:16:30 -08001008 return blocking_notifier_chain_register(&inetaddr_chain, nb);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001009}
1010
1011int unregister_inetaddr_notifier(struct notifier_block *nb)
1012{
Alan Sterne041c682006-03-27 01:16:30 -08001013 return blocking_notifier_chain_unregister(&inetaddr_chain, nb);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001014}
1015
1016/* Rename ifa_labels for a device name change. Make some effort to preserve existing
1017 * alias numbering and to create unique labels if possible.
1018*/
1019static void inetdev_changename(struct net_device *dev, struct in_device *in_dev)
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +09001020{
Linus Torvalds1da177e2005-04-16 15:20:36 -07001021 struct in_ifaddr *ifa;
1022 int named = 0;
1023
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +09001024 for (ifa = in_dev->ifa_list; ifa; ifa = ifa->ifa_next) {
1025 char old[IFNAMSIZ], *dot;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001026
1027 memcpy(old, ifa->ifa_label, IFNAMSIZ);
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +09001028 memcpy(ifa->ifa_label, dev->name, IFNAMSIZ);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001029 if (named++ == 0)
1030 continue;
Mark McLoughlin44344b22008-01-04 00:56:25 -08001031 dot = strchr(old, ':');
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +09001032 if (dot == NULL) {
1033 sprintf(old, ":%d", named);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001034 dot = old;
1035 }
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +09001036 if (strlen(dot) + strlen(dev->name) < IFNAMSIZ) {
1037 strcat(ifa->ifa_label, dot);
1038 } else {
1039 strcpy(ifa->ifa_label + (IFNAMSIZ - strlen(dot) - 1), dot);
1040 }
1041 }
1042}
Linus Torvalds1da177e2005-04-16 15:20:36 -07001043
1044/* Called only under RTNL semaphore */
1045
1046static int inetdev_event(struct notifier_block *this, unsigned long event,
1047 void *ptr)
1048{
1049 struct net_device *dev = ptr;
Herbert Xue5ed6392005-10-03 14:35:55 -07001050 struct in_device *in_dev = __in_dev_get_rtnl(dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001051
Eric W. Biedermane9dc8652007-09-12 13:02:17 +02001052 if (dev->nd_net != &init_net)
1053 return NOTIFY_DONE;
1054
Linus Torvalds1da177e2005-04-16 15:20:36 -07001055 ASSERT_RTNL();
1056
1057 if (!in_dev) {
Herbert Xu8030f542007-02-22 01:53:47 +09001058 if (event == NETDEV_REGISTER) {
Linus Torvalds1da177e2005-04-16 15:20:36 -07001059 in_dev = inetdev_init(dev);
Herbert Xub217d612007-07-30 17:04:52 -07001060 if (!in_dev)
1061 return notifier_from_errno(-ENOMEM);
Eric W. Biederman0cc217e2007-09-26 22:10:06 -07001062 if (dev->flags & IFF_LOOPBACK) {
Herbert Xu42f811b2007-06-04 23:34:44 -07001063 IN_DEV_CONF_SET(in_dev, NOXFRM, 1);
1064 IN_DEV_CONF_SET(in_dev, NOPOLICY, 1);
Herbert Xu8030f542007-02-22 01:53:47 +09001065 }
Linus Torvalds1da177e2005-04-16 15:20:36 -07001066 }
1067 goto out;
1068 }
1069
1070 switch (event) {
1071 case NETDEV_REGISTER:
1072 printk(KERN_DEBUG "inetdev_event: bug\n");
1073 dev->ip_ptr = NULL;
1074 break;
1075 case NETDEV_UP:
1076 if (dev->mtu < 68)
1077 break;
Eric W. Biederman0cc217e2007-09-26 22:10:06 -07001078 if (dev->flags & IFF_LOOPBACK) {
Linus Torvalds1da177e2005-04-16 15:20:36 -07001079 struct in_ifaddr *ifa;
1080 if ((ifa = inet_alloc_ifa()) != NULL) {
1081 ifa->ifa_local =
1082 ifa->ifa_address = htonl(INADDR_LOOPBACK);
1083 ifa->ifa_prefixlen = 8;
1084 ifa->ifa_mask = inet_make_mask(8);
1085 in_dev_hold(in_dev);
1086 ifa->ifa_dev = in_dev;
1087 ifa->ifa_scope = RT_SCOPE_HOST;
1088 memcpy(ifa->ifa_label, dev->name, IFNAMSIZ);
1089 inet_insert_ifa(ifa);
1090 }
1091 }
1092 ip_mc_up(in_dev);
1093 break;
1094 case NETDEV_DOWN:
1095 ip_mc_down(in_dev);
1096 break;
1097 case NETDEV_CHANGEMTU:
1098 if (dev->mtu >= 68)
1099 break;
1100 /* MTU falled under 68, disable IP */
1101 case NETDEV_UNREGISTER:
1102 inetdev_destroy(in_dev);
1103 break;
1104 case NETDEV_CHANGENAME:
1105 /* Do not notify about label change, this event is
1106 * not interesting to applications using netlink.
1107 */
1108 inetdev_changename(dev, in_dev);
1109
Pavel Emelyanov51602b22007-12-11 02:17:40 -08001110 devinet_sysctl_unregister(in_dev);
Pavel Emelyanov66f27a52007-12-02 00:55:54 +11001111 devinet_sysctl_register(in_dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001112 break;
1113 }
1114out:
1115 return NOTIFY_DONE;
1116}
1117
1118static struct notifier_block ip_netdev_notifier = {
1119 .notifier_call =inetdev_event,
1120};
1121
Thomas Graf339bf982006-11-10 14:10:15 -08001122static inline size_t inet_nlmsg_size(void)
1123{
1124 return NLMSG_ALIGN(sizeof(struct ifaddrmsg))
1125 + nla_total_size(4) /* IFA_ADDRESS */
1126 + nla_total_size(4) /* IFA_LOCAL */
1127 + nla_total_size(4) /* IFA_BROADCAST */
1128 + nla_total_size(4) /* IFA_ANYCAST */
1129 + nla_total_size(IFNAMSIZ); /* IFA_LABEL */
1130}
1131
Linus Torvalds1da177e2005-04-16 15:20:36 -07001132static int inet_fill_ifaddr(struct sk_buff *skb, struct in_ifaddr *ifa,
Jamal Hadi Salimb6544c02005-06-18 22:54:12 -07001133 u32 pid, u32 seq, int event, unsigned int flags)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001134{
1135 struct ifaddrmsg *ifm;
1136 struct nlmsghdr *nlh;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001137
Thomas Graf47f68512006-08-04 23:04:36 -07001138 nlh = nlmsg_put(skb, pid, seq, event, sizeof(*ifm), flags);
1139 if (nlh == NULL)
Patrick McHardy26932562007-01-31 23:16:40 -08001140 return -EMSGSIZE;
Thomas Graf47f68512006-08-04 23:04:36 -07001141
1142 ifm = nlmsg_data(nlh);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001143 ifm->ifa_family = AF_INET;
1144 ifm->ifa_prefixlen = ifa->ifa_prefixlen;
1145 ifm->ifa_flags = ifa->ifa_flags|IFA_F_PERMANENT;
1146 ifm->ifa_scope = ifa->ifa_scope;
1147 ifm->ifa_index = ifa->ifa_dev->dev->ifindex;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001148
Thomas Graf47f68512006-08-04 23:04:36 -07001149 if (ifa->ifa_address)
Al Viroa7a628c2006-09-26 22:16:43 -07001150 NLA_PUT_BE32(skb, IFA_ADDRESS, ifa->ifa_address);
Thomas Graf47f68512006-08-04 23:04:36 -07001151
1152 if (ifa->ifa_local)
Al Viroa7a628c2006-09-26 22:16:43 -07001153 NLA_PUT_BE32(skb, IFA_LOCAL, ifa->ifa_local);
Thomas Graf47f68512006-08-04 23:04:36 -07001154
1155 if (ifa->ifa_broadcast)
Al Viroa7a628c2006-09-26 22:16:43 -07001156 NLA_PUT_BE32(skb, IFA_BROADCAST, ifa->ifa_broadcast);
Thomas Graf47f68512006-08-04 23:04:36 -07001157
1158 if (ifa->ifa_anycast)
Al Viroa7a628c2006-09-26 22:16:43 -07001159 NLA_PUT_BE32(skb, IFA_ANYCAST, ifa->ifa_anycast);
Thomas Graf47f68512006-08-04 23:04:36 -07001160
1161 if (ifa->ifa_label[0])
1162 NLA_PUT_STRING(skb, IFA_LABEL, ifa->ifa_label);
1163
1164 return nlmsg_end(skb, nlh);
1165
1166nla_put_failure:
Patrick McHardy26932562007-01-31 23:16:40 -08001167 nlmsg_cancel(skb, nlh);
1168 return -EMSGSIZE;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001169}
1170
1171static int inet_dump_ifaddr(struct sk_buff *skb, struct netlink_callback *cb)
1172{
Denis V. Lunevb8542722007-12-01 00:21:31 +11001173 struct net *net = skb->sk->sk_net;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001174 int idx, ip_idx;
1175 struct net_device *dev;
1176 struct in_device *in_dev;
1177 struct in_ifaddr *ifa;
1178 int s_ip_idx, s_idx = cb->args[0];
1179
Denis V. Lunevb8542722007-12-01 00:21:31 +11001180 if (net != &init_net)
1181 return 0;
1182
Linus Torvalds1da177e2005-04-16 15:20:36 -07001183 s_ip_idx = ip_idx = cb->args[1];
Pavel Emelianov7562f872007-05-03 15:13:45 -07001184 idx = 0;
Eric W. Biederman881d9662007-09-17 11:56:21 -07001185 for_each_netdev(&init_net, dev) {
Linus Torvalds1da177e2005-04-16 15:20:36 -07001186 if (idx < s_idx)
Pavel Emelianov7562f872007-05-03 15:13:45 -07001187 goto cont;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001188 if (idx > s_idx)
1189 s_ip_idx = 0;
Patrick McHardy6313c1e2007-04-16 17:00:53 -07001190 if ((in_dev = __in_dev_get_rtnl(dev)) == NULL)
Pavel Emelianov7562f872007-05-03 15:13:45 -07001191 goto cont;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001192
1193 for (ifa = in_dev->ifa_list, ip_idx = 0; ifa;
1194 ifa = ifa->ifa_next, ip_idx++) {
1195 if (ip_idx < s_ip_idx)
Stephen Hemminger596e4152007-09-11 10:41:04 +02001196 continue;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001197 if (inet_fill_ifaddr(skb, ifa, NETLINK_CB(cb->skb).pid,
1198 cb->nlh->nlmsg_seq,
Patrick McHardy6313c1e2007-04-16 17:00:53 -07001199 RTM_NEWADDR, NLM_F_MULTI) <= 0)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001200 goto done;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001201 }
Pavel Emelianov7562f872007-05-03 15:13:45 -07001202cont:
1203 idx++;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001204 }
1205
1206done:
Linus Torvalds1da177e2005-04-16 15:20:36 -07001207 cb->args[0] = idx;
1208 cb->args[1] = ip_idx;
1209
1210 return skb->len;
1211}
1212
Thomas Grafd6062cb2006-08-15 00:33:59 -07001213static void rtmsg_ifa(int event, struct in_ifaddr* ifa, struct nlmsghdr *nlh,
1214 u32 pid)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001215{
Thomas Graf47f68512006-08-04 23:04:36 -07001216 struct sk_buff *skb;
Thomas Grafd6062cb2006-08-15 00:33:59 -07001217 u32 seq = nlh ? nlh->nlmsg_seq : 0;
1218 int err = -ENOBUFS;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001219
Thomas Graf339bf982006-11-10 14:10:15 -08001220 skb = nlmsg_new(inet_nlmsg_size(), GFP_KERNEL);
Thomas Graf47f68512006-08-04 23:04:36 -07001221 if (skb == NULL)
Thomas Grafd6062cb2006-08-15 00:33:59 -07001222 goto errout;
1223
1224 err = inet_fill_ifaddr(skb, ifa, pid, seq, event, 0);
Patrick McHardy26932562007-01-31 23:16:40 -08001225 if (err < 0) {
1226 /* -EMSGSIZE implies BUG in inet_nlmsg_size() */
1227 WARN_ON(err == -EMSGSIZE);
1228 kfree_skb(skb);
1229 goto errout;
1230 }
Denis V. Lunev97c53ca2007-11-19 22:26:51 -08001231 err = rtnl_notify(skb, &init_net, pid, RTNLGRP_IPV4_IFADDR, nlh, GFP_KERNEL);
Thomas Grafd6062cb2006-08-15 00:33:59 -07001232errout:
1233 if (err < 0)
Denis V. Lunev97c53ca2007-11-19 22:26:51 -08001234 rtnl_set_sk_err(&init_net, RTNLGRP_IPV4_IFADDR, err);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001235}
1236
Linus Torvalds1da177e2005-04-16 15:20:36 -07001237#ifdef CONFIG_SYSCTL
1238
Herbert Xu31be3082007-06-04 23:35:37 -07001239static void devinet_copy_dflt_conf(int i)
1240{
1241 struct net_device *dev;
1242
1243 read_lock(&dev_base_lock);
Eric W. Biederman881d9662007-09-17 11:56:21 -07001244 for_each_netdev(&init_net, dev) {
Herbert Xu31be3082007-06-04 23:35:37 -07001245 struct in_device *in_dev;
1246 rcu_read_lock();
1247 in_dev = __in_dev_get_rcu(dev);
1248 if (in_dev && !test_bit(i, in_dev->cnf.state))
1249 in_dev->cnf.data[i] = ipv4_devconf_dflt.data[i];
1250 rcu_read_unlock();
1251 }
1252 read_unlock(&dev_base_lock);
1253}
1254
Pavel Emelyanov68dd2992007-12-05 01:44:58 -08001255static void inet_forward_change(void)
1256{
1257 struct net_device *dev;
1258 int on = IPV4_DEVCONF_ALL(FORWARDING);
1259
1260 IPV4_DEVCONF_ALL(ACCEPT_REDIRECTS) = !on;
1261 IPV4_DEVCONF_DFLT(FORWARDING) = on;
1262
1263 read_lock(&dev_base_lock);
1264 for_each_netdev(&init_net, dev) {
1265 struct in_device *in_dev;
1266 rcu_read_lock();
1267 in_dev = __in_dev_get_rcu(dev);
1268 if (in_dev)
1269 IN_DEV_CONF_SET(in_dev, FORWARDING, on);
1270 rcu_read_unlock();
1271 }
1272 read_unlock(&dev_base_lock);
1273
1274 rt_cache_flush(0);
1275}
1276
Herbert Xu31be3082007-06-04 23:35:37 -07001277static int devinet_conf_proc(ctl_table *ctl, int write,
1278 struct file* filp, void __user *buffer,
1279 size_t *lenp, loff_t *ppos)
1280{
1281 int ret = proc_dointvec(ctl, write, filp, buffer, lenp, ppos);
1282
1283 if (write) {
1284 struct ipv4_devconf *cnf = ctl->extra1;
1285 int i = (int *)ctl->data - cnf->data;
1286
1287 set_bit(i, cnf->state);
1288
1289 if (cnf == &ipv4_devconf_dflt)
1290 devinet_copy_dflt_conf(i);
1291 }
1292
1293 return ret;
1294}
1295
1296static int devinet_conf_sysctl(ctl_table *table, int __user *name, int nlen,
1297 void __user *oldval, size_t __user *oldlenp,
1298 void __user *newval, size_t newlen)
1299{
1300 struct ipv4_devconf *cnf;
1301 int *valp = table->data;
1302 int new;
1303 int i;
1304
1305 if (!newval || !newlen)
1306 return 0;
1307
1308 if (newlen != sizeof(int))
1309 return -EINVAL;
1310
1311 if (get_user(new, (int __user *)newval))
1312 return -EFAULT;
1313
1314 if (new == *valp)
1315 return 0;
1316
1317 if (oldval && oldlenp) {
1318 size_t len;
1319
1320 if (get_user(len, oldlenp))
1321 return -EFAULT;
1322
1323 if (len) {
1324 if (len > table->maxlen)
1325 len = table->maxlen;
1326 if (copy_to_user(oldval, valp, len))
1327 return -EFAULT;
1328 if (put_user(len, oldlenp))
1329 return -EFAULT;
1330 }
1331 }
1332
1333 *valp = new;
1334
1335 cnf = table->extra1;
1336 i = (int *)table->data - cnf->data;
1337
1338 set_bit(i, cnf->state);
1339
1340 if (cnf == &ipv4_devconf_dflt)
1341 devinet_copy_dflt_conf(i);
1342
1343 return 1;
1344}
1345
Linus Torvalds1da177e2005-04-16 15:20:36 -07001346static int devinet_sysctl_forward(ctl_table *ctl, int write,
1347 struct file* filp, void __user *buffer,
1348 size_t *lenp, loff_t *ppos)
1349{
1350 int *valp = ctl->data;
1351 int val = *valp;
1352 int ret = proc_dointvec(ctl, write, filp, buffer, lenp, ppos);
1353
1354 if (write && *valp != val) {
Herbert Xu42f811b2007-06-04 23:34:44 -07001355 if (valp == &IPV4_DEVCONF_ALL(FORWARDING))
Linus Torvalds1da177e2005-04-16 15:20:36 -07001356 inet_forward_change();
Herbert Xu42f811b2007-06-04 23:34:44 -07001357 else if (valp != &IPV4_DEVCONF_DFLT(FORWARDING))
Linus Torvalds1da177e2005-04-16 15:20:36 -07001358 rt_cache_flush(0);
1359 }
1360
1361 return ret;
1362}
1363
1364int ipv4_doint_and_flush(ctl_table *ctl, int write,
1365 struct file* filp, void __user *buffer,
1366 size_t *lenp, loff_t *ppos)
1367{
1368 int *valp = ctl->data;
1369 int val = *valp;
1370 int ret = proc_dointvec(ctl, write, filp, buffer, lenp, ppos);
1371
1372 if (write && *valp != val)
1373 rt_cache_flush(0);
1374
1375 return ret;
1376}
1377
1378int ipv4_doint_and_flush_strategy(ctl_table *table, int __user *name, int nlen,
1379 void __user *oldval, size_t __user *oldlenp,
Alexey Dobriyan1f29bcd2006-12-10 02:19:10 -08001380 void __user *newval, size_t newlen)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001381{
Herbert Xu31be3082007-06-04 23:35:37 -07001382 int ret = devinet_conf_sysctl(table, name, nlen, oldval, oldlenp,
1383 newval, newlen);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001384
Herbert Xu31be3082007-06-04 23:35:37 -07001385 if (ret == 1)
1386 rt_cache_flush(0);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001387
Herbert Xu31be3082007-06-04 23:35:37 -07001388 return ret;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001389}
1390
1391
/*
 * Initializer for one ctl_table entry of the devinet template table.
 * .data points at slot (NET_IPV4_CONF_<attr> - 1) of ipv4_devconf.data and
 * .extra1 at ipv4_devconf itself; __devinet_sysctl_register() rebases both
 * onto the devconf actually being registered.
 */
#define DEVINET_SYSCTL_ENTRY(attr, name, mval, proc, sysctl) \
	{ \
		.ctl_name	= NET_IPV4_CONF_ ## attr, \
		.procname	= name, \
		.data		= ipv4_devconf.data + \
				  NET_IPV4_CONF_ ## attr - 1, \
		.maxlen		= sizeof(int), \
		.mode		= mval, \
		.proc_handler	= proc, \
		.strategy	= sysctl, \
		.extra1		= &ipv4_devconf, \
	}

/* Mode 0644 entry using the generic devinet handlers. */
#define DEVINET_SYSCTL_RW_ENTRY(attr, name) \
	DEVINET_SYSCTL_ENTRY(attr, name, 0644, devinet_conf_proc, \
			     devinet_conf_sysctl)

/* Mode 0444 entry using the generic devinet handlers. */
#define DEVINET_SYSCTL_RO_ENTRY(attr, name) \
	DEVINET_SYSCTL_ENTRY(attr, name, 0444, devinet_conf_proc, \
			     devinet_conf_sysctl)

/* Mode 0644 entry with caller-supplied proc and strategy handlers. */
#define DEVINET_SYSCTL_COMPLEX_ENTRY(attr, name, proc, sysctl) \
	DEVINET_SYSCTL_ENTRY(attr, name, 0644, proc, sysctl)

/* Mode 0644 entry whose handlers flush the routing cache on change. */
#define DEVINET_SYSCTL_FLUSHING_ENTRY(attr, name) \
	DEVINET_SYSCTL_COMPLEX_ENTRY(attr, name, ipv4_doint_and_flush, \
				     ipv4_doint_and_flush_strategy)
1419
Linus Torvalds1da177e2005-04-16 15:20:36 -07001420static struct devinet_sysctl_table {
1421 struct ctl_table_header *sysctl_header;
Pavel Emelyanovbfada692007-12-02 00:57:08 +11001422 struct ctl_table devinet_vars[__NET_IPV4_CONF_MAX];
1423 char *dev_name;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001424} devinet_sysctl = {
1425 .devinet_vars = {
Herbert Xu42f811b2007-06-04 23:34:44 -07001426 DEVINET_SYSCTL_COMPLEX_ENTRY(FORWARDING, "forwarding",
Herbert Xu31be3082007-06-04 23:35:37 -07001427 devinet_sysctl_forward,
1428 devinet_conf_sysctl),
Herbert Xu42f811b2007-06-04 23:34:44 -07001429 DEVINET_SYSCTL_RO_ENTRY(MC_FORWARDING, "mc_forwarding"),
1430
1431 DEVINET_SYSCTL_RW_ENTRY(ACCEPT_REDIRECTS, "accept_redirects"),
1432 DEVINET_SYSCTL_RW_ENTRY(SECURE_REDIRECTS, "secure_redirects"),
1433 DEVINET_SYSCTL_RW_ENTRY(SHARED_MEDIA, "shared_media"),
1434 DEVINET_SYSCTL_RW_ENTRY(RP_FILTER, "rp_filter"),
1435 DEVINET_SYSCTL_RW_ENTRY(SEND_REDIRECTS, "send_redirects"),
1436 DEVINET_SYSCTL_RW_ENTRY(ACCEPT_SOURCE_ROUTE,
1437 "accept_source_route"),
1438 DEVINET_SYSCTL_RW_ENTRY(PROXY_ARP, "proxy_arp"),
1439 DEVINET_SYSCTL_RW_ENTRY(MEDIUM_ID, "medium_id"),
1440 DEVINET_SYSCTL_RW_ENTRY(BOOTP_RELAY, "bootp_relay"),
1441 DEVINET_SYSCTL_RW_ENTRY(LOG_MARTIANS, "log_martians"),
1442 DEVINET_SYSCTL_RW_ENTRY(TAG, "tag"),
1443 DEVINET_SYSCTL_RW_ENTRY(ARPFILTER, "arp_filter"),
1444 DEVINET_SYSCTL_RW_ENTRY(ARP_ANNOUNCE, "arp_announce"),
1445 DEVINET_SYSCTL_RW_ENTRY(ARP_IGNORE, "arp_ignore"),
1446 DEVINET_SYSCTL_RW_ENTRY(ARP_ACCEPT, "arp_accept"),
1447
1448 DEVINET_SYSCTL_FLUSHING_ENTRY(NOXFRM, "disable_xfrm"),
1449 DEVINET_SYSCTL_FLUSHING_ENTRY(NOPOLICY, "disable_policy"),
1450 DEVINET_SYSCTL_FLUSHING_ENTRY(FORCE_IGMP_VERSION,
1451 "force_igmp_version"),
1452 DEVINET_SYSCTL_FLUSHING_ENTRY(PROMOTE_SECONDARIES,
1453 "promote_secondaries"),
Linus Torvalds1da177e2005-04-16 15:20:36 -07001454 },
Linus Torvalds1da177e2005-04-16 15:20:36 -07001455};
1456
Pavel Emelyanovea40b322007-12-16 13:30:07 -08001457static int __devinet_sysctl_register(struct net *net, char *dev_name,
1458 int ctl_name, struct ipv4_devconf *p)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001459{
1460 int i;
Pavel Emelyanov9fa89642007-12-02 00:17:46 +11001461 struct devinet_sysctl_table *t;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001462
Pavel Emelyanovbfada692007-12-02 00:57:08 +11001463#define DEVINET_CTL_PATH_DEV 3
1464
1465 struct ctl_path devinet_ctl_path[] = {
1466 { .procname = "net", .ctl_name = CTL_NET, },
1467 { .procname = "ipv4", .ctl_name = NET_IPV4, },
1468 { .procname = "conf", .ctl_name = NET_IPV4_CONF, },
1469 { /* to be set */ },
1470 { },
1471 };
1472
Pavel Emelyanov9fa89642007-12-02 00:17:46 +11001473 t = kmemdup(&devinet_sysctl, sizeof(*t), GFP_KERNEL);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001474 if (!t)
Pavel Emelyanov9fa89642007-12-02 00:17:46 +11001475 goto out;
1476
Linus Torvalds1da177e2005-04-16 15:20:36 -07001477 for (i = 0; i < ARRAY_SIZE(t->devinet_vars) - 1; i++) {
1478 t->devinet_vars[i].data += (char *)p - (char *)&ipv4_devconf;
Herbert Xu31be3082007-06-04 23:35:37 -07001479 t->devinet_vars[i].extra1 = p;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001480 }
1481
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +09001482 /*
1483 * Make a copy of dev_name, because '.procname' is regarded as const
Linus Torvalds1da177e2005-04-16 15:20:36 -07001484 * by sysctl and we wouldn't want anyone to change it under our feet
1485 * (see SIOCSIFNAME).
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +09001486 */
Pavel Emelyanovbfada692007-12-02 00:57:08 +11001487 t->dev_name = kstrdup(dev_name, GFP_KERNEL);
1488 if (!t->dev_name)
Pavel Emelyanov9fa89642007-12-02 00:17:46 +11001489 goto free;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001490
Pavel Emelyanovbfada692007-12-02 00:57:08 +11001491 devinet_ctl_path[DEVINET_CTL_PATH_DEV].procname = t->dev_name;
1492 devinet_ctl_path[DEVINET_CTL_PATH_DEV].ctl_name = ctl_name;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001493
Pavel Emelyanovbfada692007-12-02 00:57:08 +11001494 t->sysctl_header = register_sysctl_paths(devinet_ctl_path,
1495 t->devinet_vars);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001496 if (!t->sysctl_header)
Pavel Emelyanov9fa89642007-12-02 00:17:46 +11001497 goto free_procname;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001498
1499 p->sysctl = t;
Pavel Emelyanovea40b322007-12-16 13:30:07 -08001500 return 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001501
Pavel Emelyanov9fa89642007-12-02 00:17:46 +11001502free_procname:
Pavel Emelyanovbfada692007-12-02 00:57:08 +11001503 kfree(t->dev_name);
Pavel Emelyanov9fa89642007-12-02 00:17:46 +11001504free:
Linus Torvalds1da177e2005-04-16 15:20:36 -07001505 kfree(t);
Pavel Emelyanov9fa89642007-12-02 00:17:46 +11001506out:
Pavel Emelyanovea40b322007-12-16 13:30:07 -08001507 return -ENOBUFS;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001508}
1509
Pavel Emelyanov51602b22007-12-11 02:17:40 -08001510static void __devinet_sysctl_unregister(struct ipv4_devconf *cnf)
1511{
1512 struct devinet_sysctl_table *t = cnf->sysctl;
1513
1514 if (t == NULL)
1515 return;
1516
1517 cnf->sysctl = NULL;
1518 unregister_sysctl_table(t->sysctl_header);
1519 kfree(t->dev_name);
1520 kfree(t);
1521}
1522
Pavel Emelyanov66f27a52007-12-02 00:55:54 +11001523static void devinet_sysctl_register(struct in_device *idev)
1524{
Pavel Emelyanov51602b22007-12-11 02:17:40 -08001525 neigh_sysctl_register(idev->dev, idev->arp_parms, NET_IPV4,
1526 NET_IPV4_NEIGH, "ipv4", NULL, NULL);
1527 __devinet_sysctl_register(idev->dev->name, idev->dev->ifindex,
Pavel Emelyanov66f27a52007-12-02 00:55:54 +11001528 &idev->cnf);
1529}
1530
Pavel Emelyanov51602b22007-12-11 02:17:40 -08001531static void devinet_sysctl_unregister(struct in_device *idev)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001532{
Pavel Emelyanov51602b22007-12-11 02:17:40 -08001533 __devinet_sysctl_unregister(&idev->cnf);
1534 neigh_sysctl_unregister(idev->arp_parms);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001535}
1536#endif
1537
Pavel Emelyanov68dd2992007-12-05 01:44:58 -08001538static struct ctl_table ctl_forward_entry[] = {
1539 {
1540 .ctl_name = NET_IPV4_FORWARD,
1541 .procname = "ip_forward",
1542 .data = &ipv4_devconf.data[
1543 NET_IPV4_CONF_FORWARDING - 1],
1544 .maxlen = sizeof(int),
1545 .mode = 0644,
1546 .proc_handler = devinet_sysctl_forward,
1547 .strategy = devinet_conf_sysctl,
1548 .extra1 = &ipv4_devconf,
1549 },
1550 { },
1551};
1552
1553static __initdata struct ctl_path net_ipv4_path[] = {
1554 { .procname = "net", .ctl_name = CTL_NET, },
1555 { .procname = "ipv4", .ctl_name = NET_IPV4, },
1556 { },
1557};
1558
Linus Torvalds1da177e2005-04-16 15:20:36 -07001559void __init devinet_init(void)
1560{
1561 register_gifconf(PF_INET, inet_gifconf);
1562 register_netdevice_notifier(&ip_netdev_notifier);
Thomas Graf63f34442007-03-22 11:55:17 -07001563
1564 rtnl_register(PF_INET, RTM_NEWADDR, inet_rtm_newaddr, NULL);
1565 rtnl_register(PF_INET, RTM_DELADDR, inet_rtm_deladdr, NULL);
1566 rtnl_register(PF_INET, RTM_GETADDR, NULL, inet_dump_ifaddr);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001567#ifdef CONFIG_SYSCTL
Pavel Emelyanov66f27a52007-12-02 00:55:54 +11001568 __devinet_sysctl_register("all", NET_PROTO_CONF_ALL,
1569 &ipv4_devconf);
1570 __devinet_sysctl_register("default", NET_PROTO_CONF_DEFAULT,
1571 &ipv4_devconf_dflt);
Pavel Emelyanov68dd2992007-12-05 01:44:58 -08001572 register_sysctl_paths(net_ipv4_path, ctl_forward_entry);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001573#endif
1574}
1575
Linus Torvalds1da177e2005-04-16 15:20:36 -07001576EXPORT_SYMBOL(in_dev_finish_destroy);
1577EXPORT_SYMBOL(inet_select_addr);
1578EXPORT_SYMBOL(inetdev_by_index);
1579EXPORT_SYMBOL(register_inetaddr_notifier);
1580EXPORT_SYMBOL(unregister_inetaddr_notifier);