blob: dfc39d4d48b7471fc83035746026fa14d1dcf497 [file] [log] [blame]
/*
 *	NET3	IP device support routines.
 *
 *		This program is free software; you can redistribute it and/or
 *		modify it under the terms of the GNU General Public License
 *		as published by the Free Software Foundation; either version
 *		2 of the License, or (at your option) any later version.
 *
 *	Derived from the IP parts of dev.c 1.0.19
 *		Authors:	Ross Biro
 *				Fred N. van Kempen, <waltje@uWalt.NL.Mugnet.ORG>
 *				Mark Evans, <evansmp@uhura.aston.ac.uk>
 *
 *	Additional Authors:
 *		Alan Cox, <gw4pts@gw4pts.ampr.org>
 *		Alexey Kuznetsov, <kuznet@ms2.inr.ac.ru>
 *
 *	Changes:
 *		Alexey Kuznetsov:	pa_* fields are replaced with ifaddr
 *					lists.
 *		Cyrus Durgin:		updated for kmod
 *		Matthias Andree:	in devinet_ioctl, compare label and
 *					address (4.4BSD alias style support),
 *					fall back to comparing just the label
 *					if no match found.
 */
27
Linus Torvalds1da177e2005-04-16 15:20:36 -070028
29#include <asm/uaccess.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070030#include <linux/bitops.h>
Randy Dunlap4fc268d2006-01-11 12:17:47 -080031#include <linux/capability.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070032#include <linux/module.h>
33#include <linux/types.h>
34#include <linux/kernel.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070035#include <linux/string.h>
36#include <linux/mm.h>
37#include <linux/socket.h>
38#include <linux/sockios.h>
39#include <linux/in.h>
40#include <linux/errno.h>
41#include <linux/interrupt.h>
Thomas Graf18237302006-08-04 23:04:54 -070042#include <linux/if_addr.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070043#include <linux/if_ether.h>
44#include <linux/inet.h>
45#include <linux/netdevice.h>
46#include <linux/etherdevice.h>
47#include <linux/skbuff.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070048#include <linux/init.h>
49#include <linux/notifier.h>
50#include <linux/inetdevice.h>
51#include <linux/igmp.h>
Tejun Heo5a0e3ad2010-03-24 17:04:11 +090052#include <linux/slab.h>
David S. Millerfd23c3b2011-02-18 12:42:28 -080053#include <linux/hash.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070054#ifdef CONFIG_SYSCTL
55#include <linux/sysctl.h>
56#endif
57#include <linux/kmod.h>
Nicolas Dichteledc9e742012-10-25 22:28:52 +000058#include <linux/netconf.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070059
Arnaldo Carvalho de Melo14c85022005-12-27 02:43:12 -020060#include <net/arp.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070061#include <net/ip.h>
62#include <net/route.h>
63#include <net/ip_fib.h>
Thomas Graf63f34442007-03-22 11:55:17 -070064#include <net/rtnetlink.h>
Pavel Emelyanov752d14d2007-12-16 13:31:47 -080065#include <net/net_namespace.h>
Jiri Pirko5c766d62013-01-24 09:41:41 +000066#include <net/addrconf.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070067
David S. Miller406b6f92011-03-22 21:56:23 -070068#include "fib_lookup.h"
69
Adrian Bunk0027ba82008-01-31 17:17:31 -080070static struct ipv4_devconf ipv4_devconf = {
Herbert Xu42f811b2007-06-04 23:34:44 -070071 .data = {
Eric W. Biederman02291682010-02-14 03:25:51 +000072 [IPV4_DEVCONF_ACCEPT_REDIRECTS - 1] = 1,
73 [IPV4_DEVCONF_SEND_REDIRECTS - 1] = 1,
74 [IPV4_DEVCONF_SECURE_REDIRECTS - 1] = 1,
75 [IPV4_DEVCONF_SHARED_MEDIA - 1] = 1,
Herbert Xu42f811b2007-06-04 23:34:44 -070076 },
Linus Torvalds1da177e2005-04-16 15:20:36 -070077};
78
79static struct ipv4_devconf ipv4_devconf_dflt = {
Herbert Xu42f811b2007-06-04 23:34:44 -070080 .data = {
Eric W. Biederman02291682010-02-14 03:25:51 +000081 [IPV4_DEVCONF_ACCEPT_REDIRECTS - 1] = 1,
82 [IPV4_DEVCONF_SEND_REDIRECTS - 1] = 1,
83 [IPV4_DEVCONF_SECURE_REDIRECTS - 1] = 1,
84 [IPV4_DEVCONF_SHARED_MEDIA - 1] = 1,
85 [IPV4_DEVCONF_ACCEPT_SOURCE_ROUTE - 1] = 1,
Herbert Xu42f811b2007-06-04 23:34:44 -070086 },
Linus Torvalds1da177e2005-04-16 15:20:36 -070087};
88
/*
 * Read attribute @attr from the devconf_dflt block of namespace @net.
 * @net is parenthesized so that any pointer-valued expression (not just
 * a plain identifier) can be passed safely.
 */
#define IPV4_DEVCONF_DFLT(net, attr) \
	IPV4_DEVCONF((*(net)->ipv4.devconf_dflt), attr)
Herbert Xu42f811b2007-06-04 23:34:44 -070091
Patrick McHardyef7c79e2007-06-05 12:38:30 -070092static const struct nla_policy ifa_ipv4_policy[IFA_MAX+1] = {
Thomas Graf5c753972006-08-04 23:03:53 -070093 [IFA_LOCAL] = { .type = NLA_U32 },
94 [IFA_ADDRESS] = { .type = NLA_U32 },
95 [IFA_BROADCAST] = { .type = NLA_U32 },
Thomas Graf5176f912006-08-26 20:13:18 -070096 [IFA_LABEL] = { .type = NLA_STRING, .len = IFNAMSIZ - 1 },
Jiri Pirko5c766d62013-01-24 09:41:41 +000097 [IFA_CACHEINFO] = { .len = sizeof(struct ifa_cacheinfo) },
Thomas Graf5c753972006-08-04 23:03:53 -070098};
99
Eric Dumazet40384992012-08-03 21:06:50 +0000100#define IN4_ADDR_HSIZE_SHIFT 8
101#define IN4_ADDR_HSIZE (1U << IN4_ADDR_HSIZE_SHIFT)
102
David S. Millerfd23c3b2011-02-18 12:42:28 -0800103static struct hlist_head inet_addr_lst[IN4_ADDR_HSIZE];
104static DEFINE_SPINLOCK(inet_addr_hash_lock);
105
Eric Dumazet40384992012-08-03 21:06:50 +0000106static u32 inet_addr_hash(struct net *net, __be32 addr)
David S. Millerfd23c3b2011-02-18 12:42:28 -0800107{
Eric Dumazet40384992012-08-03 21:06:50 +0000108 u32 val = (__force u32) addr ^ net_hash_mix(net);
David S. Millerfd23c3b2011-02-18 12:42:28 -0800109
Eric Dumazet40384992012-08-03 21:06:50 +0000110 return hash_32(val, IN4_ADDR_HSIZE_SHIFT);
David S. Millerfd23c3b2011-02-18 12:42:28 -0800111}
112
113static void inet_hash_insert(struct net *net, struct in_ifaddr *ifa)
114{
Eric Dumazet40384992012-08-03 21:06:50 +0000115 u32 hash = inet_addr_hash(net, ifa->ifa_local);
David S. Millerfd23c3b2011-02-18 12:42:28 -0800116
117 spin_lock(&inet_addr_hash_lock);
118 hlist_add_head_rcu(&ifa->hash, &inet_addr_lst[hash]);
119 spin_unlock(&inet_addr_hash_lock);
120}
121
122static void inet_hash_remove(struct in_ifaddr *ifa)
123{
124 spin_lock(&inet_addr_hash_lock);
125 hlist_del_init_rcu(&ifa->hash);
126 spin_unlock(&inet_addr_hash_lock);
127}
128
David S. Miller9435eb12011-02-18 12:43:09 -0800129/**
130 * __ip_dev_find - find the first device with a given source address.
131 * @net: the net namespace
132 * @addr: the source address
133 * @devref: if true, take a reference on the found device
134 *
135 * If a caller uses devref=false, it should be protected by RCU, or RTNL
136 */
137struct net_device *__ip_dev_find(struct net *net, __be32 addr, bool devref)
138{
Eric Dumazet40384992012-08-03 21:06:50 +0000139 u32 hash = inet_addr_hash(net, addr);
David S. Miller9435eb12011-02-18 12:43:09 -0800140 struct net_device *result = NULL;
141 struct in_ifaddr *ifa;
David S. Miller9435eb12011-02-18 12:43:09 -0800142
143 rcu_read_lock();
Sasha Levinb67bfe02013-02-27 17:06:00 -0800144 hlist_for_each_entry_rcu(ifa, &inet_addr_lst[hash], hash) {
David S. Millere0660082011-03-03 11:24:19 -0800145 if (ifa->ifa_local == addr) {
Eric Dumazet40384992012-08-03 21:06:50 +0000146 struct net_device *dev = ifa->ifa_dev->dev;
147
148 if (!net_eq(dev_net(dev), net))
149 continue;
David S. Miller9435eb12011-02-18 12:43:09 -0800150 result = dev;
151 break;
152 }
153 }
David S. Miller406b6f92011-03-22 21:56:23 -0700154 if (!result) {
155 struct flowi4 fl4 = { .daddr = addr };
156 struct fib_result res = { 0 };
157 struct fib_table *local;
158
159 /* Fallback to FIB local table so that communication
160 * over loopback subnets work.
161 */
162 local = fib_get_table(net, RT_TABLE_LOCAL);
163 if (local &&
164 !fib_table_lookup(local, &fl4, &res, FIB_LOOKUP_NOREF) &&
165 res.type == RTN_LOCAL)
166 result = FIB_RES_DEV(res);
167 }
David S. Miller9435eb12011-02-18 12:43:09 -0800168 if (result && devref)
169 dev_hold(result);
170 rcu_read_unlock();
171 return result;
172}
173EXPORT_SYMBOL(__ip_dev_find);
174
Thomas Grafd6062cb2006-08-15 00:33:59 -0700175static void rtmsg_ifa(int event, struct in_ifaddr *, struct nlmsghdr *, u32);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700176
Alan Sterne041c682006-03-27 01:16:30 -0800177static BLOCKING_NOTIFIER_HEAD(inetaddr_chain);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700178static void inet_del_ifa(struct in_device *in_dev, struct in_ifaddr **ifap,
179 int destroy);
180#ifdef CONFIG_SYSCTL
Pavel Emelyanov66f27a52007-12-02 00:55:54 +1100181static void devinet_sysctl_register(struct in_device *idev);
Pavel Emelyanov51602b22007-12-11 02:17:40 -0800182static void devinet_sysctl_unregister(struct in_device *idev);
183#else
Eric Dumazet40384992012-08-03 21:06:50 +0000184static void devinet_sysctl_register(struct in_device *idev)
Pavel Emelyanov51602b22007-12-11 02:17:40 -0800185{
186}
Eric Dumazet40384992012-08-03 21:06:50 +0000187static void devinet_sysctl_unregister(struct in_device *idev)
Pavel Emelyanov51602b22007-12-11 02:17:40 -0800188{
189}
Linus Torvalds1da177e2005-04-16 15:20:36 -0700190#endif
191
192/* Locks all the inet devices. */
193
194static struct in_ifaddr *inet_alloc_ifa(void)
195{
Alexey Dobriyan93adcc82008-10-28 13:25:09 -0700196 return kzalloc(sizeof(struct in_ifaddr), GFP_KERNEL);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700197}
198
199static void inet_rcu_free_ifa(struct rcu_head *head)
200{
201 struct in_ifaddr *ifa = container_of(head, struct in_ifaddr, rcu_head);
202 if (ifa->ifa_dev)
203 in_dev_put(ifa->ifa_dev);
204 kfree(ifa);
205}
206
Eric Dumazet40384992012-08-03 21:06:50 +0000207static void inet_free_ifa(struct in_ifaddr *ifa)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700208{
209 call_rcu(&ifa->rcu_head, inet_rcu_free_ifa);
210}
211
212void in_dev_finish_destroy(struct in_device *idev)
213{
214 struct net_device *dev = idev->dev;
215
Ilpo Järvinen547b7922008-07-25 21:43:18 -0700216 WARN_ON(idev->ifa_list);
217 WARN_ON(idev->mc_list);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700218#ifdef NET_REFCNT_DEBUG
Joe Perches91df42b2012-05-15 14:11:54 +0000219 pr_debug("%s: %p=%s\n", __func__, idev, dev ? dev->name : "NIL");
Linus Torvalds1da177e2005-04-16 15:20:36 -0700220#endif
221 dev_put(dev);
222 if (!idev->dead)
Eric Dumazet9f9354b2009-11-04 22:05:10 -0800223 pr_err("Freeing alive in_device %p\n", idev);
224 else
Linus Torvalds1da177e2005-04-16 15:20:36 -0700225 kfree(idev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700226}
Eric Dumazet9f9354b2009-11-04 22:05:10 -0800227EXPORT_SYMBOL(in_dev_finish_destroy);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700228
Herbert Xu71e27da2007-06-04 23:36:06 -0700229static struct in_device *inetdev_init(struct net_device *dev)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700230{
231 struct in_device *in_dev;
232
233 ASSERT_RTNL();
234
Panagiotis Issaris0da974f2006-07-21 14:51:30 -0700235 in_dev = kzalloc(sizeof(*in_dev), GFP_KERNEL);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700236 if (!in_dev)
237 goto out;
YOSHIFUJI Hideakic346dca2008-03-25 21:47:49 +0900238 memcpy(&in_dev->cnf, dev_net(dev)->ipv4.devconf_dflt,
Pavel Emelyanov9355bbd2007-12-16 13:32:16 -0800239 sizeof(in_dev->cnf));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700240 in_dev->cnf.sysctl = NULL;
241 in_dev->dev = dev;
Eric Dumazet9f9354b2009-11-04 22:05:10 -0800242 in_dev->arp_parms = neigh_parms_alloc(dev, &arp_tbl);
243 if (!in_dev->arp_parms)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700244 goto out_kfree;
Ben Hutchings0187bdf2008-06-19 16:15:47 -0700245 if (IPV4_DEVCONF(in_dev->cnf, FORWARDING))
246 dev_disable_lro(dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700247 /* Reference in_dev->dev */
248 dev_hold(dev);
David L Stevens30c4cf52007-01-04 12:31:14 -0800249 /* Account for reference dev->ip_ptr (below) */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700250 in_dev_hold(in_dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700251
Pavel Emelyanov66f27a52007-12-02 00:55:54 +1100252 devinet_sysctl_register(in_dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700253 ip_mc_init_dev(in_dev);
254 if (dev->flags & IFF_UP)
255 ip_mc_up(in_dev);
Jarek Poplawski483479e2007-01-09 14:38:31 -0800256
David L Stevens30c4cf52007-01-04 12:31:14 -0800257 /* we can receive as soon as ip_ptr is set -- do this last */
Eric Dumazetcf778b02012-01-12 04:41:32 +0000258 rcu_assign_pointer(dev->ip_ptr, in_dev);
Jarek Poplawski483479e2007-01-09 14:38:31 -0800259out:
Linus Torvalds1da177e2005-04-16 15:20:36 -0700260 return in_dev;
261out_kfree:
262 kfree(in_dev);
263 in_dev = NULL;
264 goto out;
265}
266
267static void in_dev_rcu_put(struct rcu_head *head)
268{
269 struct in_device *idev = container_of(head, struct in_device, rcu_head);
270 in_dev_put(idev);
271}
272
273static void inetdev_destroy(struct in_device *in_dev)
274{
275 struct in_ifaddr *ifa;
276 struct net_device *dev;
277
278 ASSERT_RTNL();
279
280 dev = in_dev->dev;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700281
282 in_dev->dead = 1;
283
284 ip_mc_destroy_dev(in_dev);
285
286 while ((ifa = in_dev->ifa_list) != NULL) {
287 inet_del_ifa(in_dev, &in_dev->ifa_list, 0);
288 inet_free_ifa(ifa);
289 }
290
Stephen Hemmingera9b3cd72011-08-01 16:19:00 +0000291 RCU_INIT_POINTER(dev->ip_ptr, NULL);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700292
Pavel Emelyanov51602b22007-12-11 02:17:40 -0800293 devinet_sysctl_unregister(in_dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700294 neigh_parms_release(&arp_tbl, in_dev->arp_parms);
295 arp_ifdown(dev);
296
297 call_rcu(&in_dev->rcu_head, in_dev_rcu_put);
298}
299
Al Viroff428d72006-09-26 22:13:35 -0700300int inet_addr_onlink(struct in_device *in_dev, __be32 a, __be32 b)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700301{
302 rcu_read_lock();
303 for_primary_ifa(in_dev) {
304 if (inet_ifa_match(a, ifa)) {
305 if (!b || inet_ifa_match(b, ifa)) {
306 rcu_read_unlock();
307 return 1;
308 }
309 }
310 } endfor_ifa(in_dev);
311 rcu_read_unlock();
312 return 0;
313}
314
Thomas Grafd6062cb2006-08-15 00:33:59 -0700315static void __inet_del_ifa(struct in_device *in_dev, struct in_ifaddr **ifap,
Eric W. Biederman15e47302012-09-07 20:12:54 +0000316 int destroy, struct nlmsghdr *nlh, u32 portid)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700317{
Harald Welte8f937c62005-05-29 20:23:46 -0700318 struct in_ifaddr *promote = NULL;
Jamal Hadi Salim0ff60a42005-11-22 14:47:37 -0800319 struct in_ifaddr *ifa, *ifa1 = *ifap;
320 struct in_ifaddr *last_prim = in_dev->ifa_list;
321 struct in_ifaddr *prev_prom = NULL;
322 int do_promote = IN_DEV_PROMOTE_SECONDARIES(in_dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700323
324 ASSERT_RTNL();
325
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +0900326 /* 1. Deleting primary ifaddr forces deletion all secondaries
Harald Welte8f937c62005-05-29 20:23:46 -0700327 * unless alias promotion is set
328 **/
Linus Torvalds1da177e2005-04-16 15:20:36 -0700329
330 if (!(ifa1->ifa_flags & IFA_F_SECONDARY)) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700331 struct in_ifaddr **ifap1 = &ifa1->ifa_next;
332
333 while ((ifa = *ifap1) != NULL) {
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +0900334 if (!(ifa->ifa_flags & IFA_F_SECONDARY) &&
Jamal Hadi Salim0ff60a42005-11-22 14:47:37 -0800335 ifa1->ifa_scope <= ifa->ifa_scope)
336 last_prim = ifa;
337
Linus Torvalds1da177e2005-04-16 15:20:36 -0700338 if (!(ifa->ifa_flags & IFA_F_SECONDARY) ||
339 ifa1->ifa_mask != ifa->ifa_mask ||
340 !inet_ifa_match(ifa1->ifa_address, ifa)) {
341 ifap1 = &ifa->ifa_next;
Jamal Hadi Salim0ff60a42005-11-22 14:47:37 -0800342 prev_prom = ifa;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700343 continue;
344 }
345
Jamal Hadi Salim0ff60a42005-11-22 14:47:37 -0800346 if (!do_promote) {
David S. Millerfd23c3b2011-02-18 12:42:28 -0800347 inet_hash_remove(ifa);
Harald Welte8f937c62005-05-29 20:23:46 -0700348 *ifap1 = ifa->ifa_next;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700349
Eric W. Biederman15e47302012-09-07 20:12:54 +0000350 rtmsg_ifa(RTM_DELADDR, ifa, nlh, portid);
Alan Sterne041c682006-03-27 01:16:30 -0800351 blocking_notifier_call_chain(&inetaddr_chain,
352 NETDEV_DOWN, ifa);
Harald Welte8f937c62005-05-29 20:23:46 -0700353 inet_free_ifa(ifa);
354 } else {
355 promote = ifa;
356 break;
357 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700358 }
359 }
360
Julian Anastasov2d230e22011-03-19 12:13:52 +0000361 /* On promotion all secondaries from subnet are changing
362 * the primary IP, we must remove all their routes silently
363 * and later to add them back with new prefsrc. Do this
364 * while all addresses are on the device list.
365 */
366 for (ifa = promote; ifa; ifa = ifa->ifa_next) {
367 if (ifa1->ifa_mask == ifa->ifa_mask &&
368 inet_ifa_match(ifa1->ifa_address, ifa))
369 fib_del_ifaddr(ifa, ifa1);
370 }
371
Linus Torvalds1da177e2005-04-16 15:20:36 -0700372 /* 2. Unlink it */
373
374 *ifap = ifa1->ifa_next;
David S. Millerfd23c3b2011-02-18 12:42:28 -0800375 inet_hash_remove(ifa1);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700376
377 /* 3. Announce address deletion */
378
379 /* Send message first, then call notifier.
380 At first sight, FIB update triggered by notifier
381 will refer to already deleted ifaddr, that could confuse
382 netlink listeners. It is not true: look, gated sees
383 that route deleted and if it still thinks that ifaddr
384 is valid, it will try to restore deleted routes... Grr.
385 So that, this order is correct.
386 */
Eric W. Biederman15e47302012-09-07 20:12:54 +0000387 rtmsg_ifa(RTM_DELADDR, ifa1, nlh, portid);
Alan Sterne041c682006-03-27 01:16:30 -0800388 blocking_notifier_call_chain(&inetaddr_chain, NETDEV_DOWN, ifa1);
Jamal Hadi Salim0ff60a42005-11-22 14:47:37 -0800389
390 if (promote) {
Julian Anastasov04024b92011-03-19 12:13:54 +0000391 struct in_ifaddr *next_sec = promote->ifa_next;
Jamal Hadi Salim0ff60a42005-11-22 14:47:37 -0800392
393 if (prev_prom) {
394 prev_prom->ifa_next = promote->ifa_next;
395 promote->ifa_next = last_prim->ifa_next;
396 last_prim->ifa_next = promote;
397 }
398
399 promote->ifa_flags &= ~IFA_F_SECONDARY;
Eric W. Biederman15e47302012-09-07 20:12:54 +0000400 rtmsg_ifa(RTM_NEWADDR, promote, nlh, portid);
Alan Sterne041c682006-03-27 01:16:30 -0800401 blocking_notifier_call_chain(&inetaddr_chain,
402 NETDEV_UP, promote);
Julian Anastasov04024b92011-03-19 12:13:54 +0000403 for (ifa = next_sec; ifa; ifa = ifa->ifa_next) {
Jamal Hadi Salim0ff60a42005-11-22 14:47:37 -0800404 if (ifa1->ifa_mask != ifa->ifa_mask ||
405 !inet_ifa_match(ifa1->ifa_address, ifa))
406 continue;
407 fib_add_ifaddr(ifa);
408 }
409
410 }
Herbert Xu63630972007-06-07 18:35:38 -0700411 if (destroy)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700412 inet_free_ifa(ifa1);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700413}
414
Thomas Grafd6062cb2006-08-15 00:33:59 -0700415static void inet_del_ifa(struct in_device *in_dev, struct in_ifaddr **ifap,
416 int destroy)
417{
418 __inet_del_ifa(in_dev, ifap, destroy, NULL, 0);
419}
420
/* Delayed work item whose handler is check_lifetime(). */
static void check_lifetime(struct work_struct *work);
static DECLARE_DELAYED_WORK(check_lifetime_work, check_lifetime);
424
Thomas Grafd6062cb2006-08-15 00:33:59 -0700425static int __inet_insert_ifa(struct in_ifaddr *ifa, struct nlmsghdr *nlh,
Eric W. Biederman15e47302012-09-07 20:12:54 +0000426 u32 portid)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700427{
428 struct in_device *in_dev = ifa->ifa_dev;
429 struct in_ifaddr *ifa1, **ifap, **last_primary;
430
431 ASSERT_RTNL();
432
433 if (!ifa->ifa_local) {
434 inet_free_ifa(ifa);
435 return 0;
436 }
437
438 ifa->ifa_flags &= ~IFA_F_SECONDARY;
439 last_primary = &in_dev->ifa_list;
440
441 for (ifap = &in_dev->ifa_list; (ifa1 = *ifap) != NULL;
442 ifap = &ifa1->ifa_next) {
443 if (!(ifa1->ifa_flags & IFA_F_SECONDARY) &&
444 ifa->ifa_scope <= ifa1->ifa_scope)
445 last_primary = &ifa1->ifa_next;
446 if (ifa1->ifa_mask == ifa->ifa_mask &&
447 inet_ifa_match(ifa1->ifa_address, ifa)) {
448 if (ifa1->ifa_local == ifa->ifa_local) {
449 inet_free_ifa(ifa);
450 return -EEXIST;
451 }
452 if (ifa1->ifa_scope != ifa->ifa_scope) {
453 inet_free_ifa(ifa);
454 return -EINVAL;
455 }
456 ifa->ifa_flags |= IFA_F_SECONDARY;
457 }
458 }
459
460 if (!(ifa->ifa_flags & IFA_F_SECONDARY)) {
461 net_srandom(ifa->ifa_local);
462 ifap = last_primary;
463 }
464
465 ifa->ifa_next = *ifap;
466 *ifap = ifa;
467
David S. Millerfd23c3b2011-02-18 12:42:28 -0800468 inet_hash_insert(dev_net(in_dev->dev), ifa);
469
Jiri Pirko5c766d62013-01-24 09:41:41 +0000470 cancel_delayed_work(&check_lifetime_work);
471 schedule_delayed_work(&check_lifetime_work, 0);
472
Linus Torvalds1da177e2005-04-16 15:20:36 -0700473 /* Send message first, then call notifier.
474 Notifier will trigger FIB update, so that
475 listeners of netlink will know about new ifaddr */
Eric W. Biederman15e47302012-09-07 20:12:54 +0000476 rtmsg_ifa(RTM_NEWADDR, ifa, nlh, portid);
Alan Sterne041c682006-03-27 01:16:30 -0800477 blocking_notifier_call_chain(&inetaddr_chain, NETDEV_UP, ifa);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700478
479 return 0;
480}
481
Thomas Grafd6062cb2006-08-15 00:33:59 -0700482static int inet_insert_ifa(struct in_ifaddr *ifa)
483{
484 return __inet_insert_ifa(ifa, NULL, 0);
485}
486
Linus Torvalds1da177e2005-04-16 15:20:36 -0700487static int inet_set_ifa(struct net_device *dev, struct in_ifaddr *ifa)
488{
Herbert Xue5ed6392005-10-03 14:35:55 -0700489 struct in_device *in_dev = __in_dev_get_rtnl(dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700490
491 ASSERT_RTNL();
492
493 if (!in_dev) {
Herbert Xu71e27da2007-06-04 23:36:06 -0700494 inet_free_ifa(ifa);
495 return -ENOBUFS;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700496 }
Herbert Xu71e27da2007-06-04 23:36:06 -0700497 ipv4_devconf_setall(in_dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700498 if (ifa->ifa_dev != in_dev) {
Ilpo Järvinen547b7922008-07-25 21:43:18 -0700499 WARN_ON(ifa->ifa_dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700500 in_dev_hold(in_dev);
501 ifa->ifa_dev = in_dev;
502 }
Joe Perchesf97c1e02007-12-16 13:45:43 -0800503 if (ipv4_is_loopback(ifa->ifa_local))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700504 ifa->ifa_scope = RT_SCOPE_HOST;
505 return inet_insert_ifa(ifa);
506}
507
Eric Dumazet8723e1b2010-10-19 00:39:26 +0000508/* Caller must hold RCU or RTNL :
509 * We dont take a reference on found in_device
510 */
Denis V. Lunev7fee0ca2008-01-21 17:32:38 -0800511struct in_device *inetdev_by_index(struct net *net, int ifindex)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700512{
513 struct net_device *dev;
514 struct in_device *in_dev = NULL;
Eric Dumazetc148fc22009-11-01 19:23:04 +0000515
516 rcu_read_lock();
517 dev = dev_get_by_index_rcu(net, ifindex);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700518 if (dev)
Eric Dumazet8723e1b2010-10-19 00:39:26 +0000519 in_dev = rcu_dereference_rtnl(dev->ip_ptr);
Eric Dumazetc148fc22009-11-01 19:23:04 +0000520 rcu_read_unlock();
Linus Torvalds1da177e2005-04-16 15:20:36 -0700521 return in_dev;
522}
Eric Dumazet9f9354b2009-11-04 22:05:10 -0800523EXPORT_SYMBOL(inetdev_by_index);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700524
525/* Called only from RTNL semaphored context. No locks. */
526
Al Viro60cad5d2006-09-26 22:17:09 -0700527struct in_ifaddr *inet_ifa_byprefix(struct in_device *in_dev, __be32 prefix,
528 __be32 mask)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700529{
530 ASSERT_RTNL();
531
532 for_primary_ifa(in_dev) {
533 if (ifa->ifa_mask == mask && inet_ifa_match(prefix, ifa))
534 return ifa;
535 } endfor_ifa(in_dev);
536 return NULL;
537}
538
Thomas Graf661d2962013-03-21 07:45:29 +0000539static int inet_rtm_deladdr(struct sk_buff *skb, struct nlmsghdr *nlh)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700540{
YOSHIFUJI Hideaki3b1e0a62008-03-26 02:26:21 +0900541 struct net *net = sock_net(skb->sk);
Thomas Grafdfdd5fd2006-08-04 23:04:17 -0700542 struct nlattr *tb[IFA_MAX+1];
Linus Torvalds1da177e2005-04-16 15:20:36 -0700543 struct in_device *in_dev;
Thomas Grafdfdd5fd2006-08-04 23:04:17 -0700544 struct ifaddrmsg *ifm;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700545 struct in_ifaddr *ifa, **ifap;
Thomas Grafdfdd5fd2006-08-04 23:04:17 -0700546 int err = -EINVAL;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700547
548 ASSERT_RTNL();
549
Thomas Grafdfdd5fd2006-08-04 23:04:17 -0700550 err = nlmsg_parse(nlh, sizeof(*ifm), tb, IFA_MAX, ifa_ipv4_policy);
551 if (err < 0)
552 goto errout;
553
554 ifm = nlmsg_data(nlh);
Denis V. Lunev7fee0ca2008-01-21 17:32:38 -0800555 in_dev = inetdev_by_index(net, ifm->ifa_index);
Thomas Grafdfdd5fd2006-08-04 23:04:17 -0700556 if (in_dev == NULL) {
557 err = -ENODEV;
558 goto errout;
559 }
560
Linus Torvalds1da177e2005-04-16 15:20:36 -0700561 for (ifap = &in_dev->ifa_list; (ifa = *ifap) != NULL;
562 ifap = &ifa->ifa_next) {
Thomas Grafdfdd5fd2006-08-04 23:04:17 -0700563 if (tb[IFA_LOCAL] &&
Al Viroa7a628c2006-09-26 22:16:43 -0700564 ifa->ifa_local != nla_get_be32(tb[IFA_LOCAL]))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700565 continue;
Thomas Grafdfdd5fd2006-08-04 23:04:17 -0700566
567 if (tb[IFA_LABEL] && nla_strcmp(tb[IFA_LABEL], ifa->ifa_label))
568 continue;
569
570 if (tb[IFA_ADDRESS] &&
571 (ifm->ifa_prefixlen != ifa->ifa_prefixlen ||
Al Viroa7a628c2006-09-26 22:16:43 -0700572 !inet_ifa_match(nla_get_be32(tb[IFA_ADDRESS]), ifa)))
Thomas Grafdfdd5fd2006-08-04 23:04:17 -0700573 continue;
574
Eric W. Biederman15e47302012-09-07 20:12:54 +0000575 __inet_del_ifa(in_dev, ifap, 1, nlh, NETLINK_CB(skb).portid);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700576 return 0;
577 }
Thomas Grafdfdd5fd2006-08-04 23:04:17 -0700578
579 err = -EADDRNOTAVAIL;
580errout:
581 return err;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700582}
583
Jiri Pirko5c766d62013-01-24 09:41:41 +0000584#define INFINITY_LIFE_TIME 0xFFFFFFFF
585
586static void check_lifetime(struct work_struct *work)
587{
588 unsigned long now, next, next_sec, next_sched;
589 struct in_ifaddr *ifa;
Jiri Pirkoc988d1e2013-04-04 23:39:39 +0000590 struct hlist_node *n;
Jiri Pirko5c766d62013-01-24 09:41:41 +0000591 int i;
592
593 now = jiffies;
594 next = round_jiffies_up(now + ADDR_CHECK_FREQUENCY);
595
Jiri Pirko5c766d62013-01-24 09:41:41 +0000596 for (i = 0; i < IN4_ADDR_HSIZE; i++) {
Jiri Pirkoc988d1e2013-04-04 23:39:39 +0000597 bool change_needed = false;
598
599 rcu_read_lock();
Sasha Levinb67bfe02013-02-27 17:06:00 -0800600 hlist_for_each_entry_rcu(ifa, &inet_addr_lst[i], hash) {
Jiri Pirko5c766d62013-01-24 09:41:41 +0000601 unsigned long age;
602
603 if (ifa->ifa_flags & IFA_F_PERMANENT)
604 continue;
605
606 /* We try to batch several events at once. */
607 age = (now - ifa->ifa_tstamp +
608 ADDRCONF_TIMER_FUZZ_MINUS) / HZ;
609
610 if (ifa->ifa_valid_lft != INFINITY_LIFE_TIME &&
611 age >= ifa->ifa_valid_lft) {
Jiri Pirkoc988d1e2013-04-04 23:39:39 +0000612 change_needed = true;
Jiri Pirko5c766d62013-01-24 09:41:41 +0000613 } else if (ifa->ifa_preferred_lft ==
614 INFINITY_LIFE_TIME) {
615 continue;
616 } else if (age >= ifa->ifa_preferred_lft) {
617 if (time_before(ifa->ifa_tstamp +
618 ifa->ifa_valid_lft * HZ, next))
619 next = ifa->ifa_tstamp +
620 ifa->ifa_valid_lft * HZ;
621
Jiri Pirkoc988d1e2013-04-04 23:39:39 +0000622 if (!(ifa->ifa_flags & IFA_F_DEPRECATED))
623 change_needed = true;
Jiri Pirko5c766d62013-01-24 09:41:41 +0000624 } else if (time_before(ifa->ifa_tstamp +
625 ifa->ifa_preferred_lft * HZ,
626 next)) {
627 next = ifa->ifa_tstamp +
628 ifa->ifa_preferred_lft * HZ;
629 }
630 }
Jiri Pirkoc988d1e2013-04-04 23:39:39 +0000631 rcu_read_unlock();
632 if (!change_needed)
633 continue;
634 rtnl_lock();
635 hlist_for_each_entry_safe(ifa, n, &inet_addr_lst[i], hash) {
636 unsigned long age;
637
638 if (ifa->ifa_flags & IFA_F_PERMANENT)
639 continue;
640
641 /* We try to batch several events at once. */
642 age = (now - ifa->ifa_tstamp +
643 ADDRCONF_TIMER_FUZZ_MINUS) / HZ;
644
645 if (ifa->ifa_valid_lft != INFINITY_LIFE_TIME &&
646 age >= ifa->ifa_valid_lft) {
647 struct in_ifaddr **ifap;
648
649 for (ifap = &ifa->ifa_dev->ifa_list;
650 *ifap != NULL; ifap = &(*ifap)->ifa_next) {
651 if (*ifap == ifa) {
652 inet_del_ifa(ifa->ifa_dev,
653 ifap, 1);
654 break;
655 }
656 }
657 } else if (ifa->ifa_preferred_lft !=
658 INFINITY_LIFE_TIME &&
659 age >= ifa->ifa_preferred_lft &&
660 !(ifa->ifa_flags & IFA_F_DEPRECATED)) {
661 ifa->ifa_flags |= IFA_F_DEPRECATED;
662 rtmsg_ifa(RTM_NEWADDR, ifa, NULL, 0);
663 }
664 }
665 rtnl_unlock();
Jiri Pirko5c766d62013-01-24 09:41:41 +0000666 }
Jiri Pirko5c766d62013-01-24 09:41:41 +0000667
668 next_sec = round_jiffies_up(next);
669 next_sched = next;
670
671 /* If rounded timeout is accurate enough, accept it. */
672 if (time_before(next_sec, next + ADDRCONF_TIMER_FUZZ))
673 next_sched = next_sec;
674
675 now = jiffies;
676 /* And minimum interval is ADDRCONF_TIMER_FUZZ_MAX. */
677 if (time_before(next_sched, now + ADDRCONF_TIMER_FUZZ_MAX))
678 next_sched = now + ADDRCONF_TIMER_FUZZ_MAX;
679
680 schedule_delayed_work(&check_lifetime_work, next_sched - now);
681}
682
683static void set_ifa_lifetime(struct in_ifaddr *ifa, __u32 valid_lft,
684 __u32 prefered_lft)
685{
686 unsigned long timeout;
687
688 ifa->ifa_flags &= ~(IFA_F_PERMANENT | IFA_F_DEPRECATED);
689
690 timeout = addrconf_timeout_fixup(valid_lft, HZ);
691 if (addrconf_finite_timeout(timeout))
692 ifa->ifa_valid_lft = timeout;
693 else
694 ifa->ifa_flags |= IFA_F_PERMANENT;
695
696 timeout = addrconf_timeout_fixup(prefered_lft, HZ);
697 if (addrconf_finite_timeout(timeout)) {
698 if (timeout == 0)
699 ifa->ifa_flags |= IFA_F_DEPRECATED;
700 ifa->ifa_preferred_lft = timeout;
701 }
702 ifa->ifa_tstamp = jiffies;
703 if (!ifa->ifa_cstamp)
704 ifa->ifa_cstamp = ifa->ifa_tstamp;
705}
706
707static struct in_ifaddr *rtm_to_ifaddr(struct net *net, struct nlmsghdr *nlh,
708 __u32 *pvalid_lft, __u32 *pprefered_lft)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700709{
Thomas Graf5c753972006-08-04 23:03:53 -0700710 struct nlattr *tb[IFA_MAX+1];
711 struct in_ifaddr *ifa;
712 struct ifaddrmsg *ifm;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700713 struct net_device *dev;
714 struct in_device *in_dev;
Denis V. Lunev7b218572008-01-31 18:47:00 -0800715 int err;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700716
Thomas Graf5c753972006-08-04 23:03:53 -0700717 err = nlmsg_parse(nlh, sizeof(*ifm), tb, IFA_MAX, ifa_ipv4_policy);
718 if (err < 0)
719 goto errout;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700720
Thomas Graf5c753972006-08-04 23:03:53 -0700721 ifm = nlmsg_data(nlh);
Denis V. Lunev7b218572008-01-31 18:47:00 -0800722 err = -EINVAL;
723 if (ifm->ifa_prefixlen > 32 || tb[IFA_LOCAL] == NULL)
Thomas Graf5c753972006-08-04 23:03:53 -0700724 goto errout;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700725
Denis V. Lunev4b8aa9a2008-01-31 18:47:40 -0800726 dev = __dev_get_by_index(net, ifm->ifa_index);
Denis V. Lunev7b218572008-01-31 18:47:00 -0800727 err = -ENODEV;
728 if (dev == NULL)
Thomas Graf5c753972006-08-04 23:03:53 -0700729 goto errout;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700730
Thomas Graf5c753972006-08-04 23:03:53 -0700731 in_dev = __in_dev_get_rtnl(dev);
Denis V. Lunev7b218572008-01-31 18:47:00 -0800732 err = -ENOBUFS;
733 if (in_dev == NULL)
Herbert Xu71e27da2007-06-04 23:36:06 -0700734 goto errout;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700735
Thomas Graf5c753972006-08-04 23:03:53 -0700736 ifa = inet_alloc_ifa();
Denis V. Lunev7b218572008-01-31 18:47:00 -0800737 if (ifa == NULL)
Thomas Graf5c753972006-08-04 23:03:53 -0700738 /*
739 * A potential indev allocation can be left alive, it stays
740 * assigned to its device and is destroy with it.
741 */
Thomas Graf5c753972006-08-04 23:03:53 -0700742 goto errout;
Thomas Graf5c753972006-08-04 23:03:53 -0700743
Pavel Emelyanova4e65d32007-12-07 23:55:43 -0800744 ipv4_devconf_setall(in_dev);
Thomas Graf5c753972006-08-04 23:03:53 -0700745 in_dev_hold(in_dev);
746
747 if (tb[IFA_ADDRESS] == NULL)
748 tb[IFA_ADDRESS] = tb[IFA_LOCAL];
749
David S. Millerfd23c3b2011-02-18 12:42:28 -0800750 INIT_HLIST_NODE(&ifa->hash);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700751 ifa->ifa_prefixlen = ifm->ifa_prefixlen;
752 ifa->ifa_mask = inet_make_mask(ifm->ifa_prefixlen);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700753 ifa->ifa_flags = ifm->ifa_flags;
754 ifa->ifa_scope = ifm->ifa_scope;
Thomas Graf5c753972006-08-04 23:03:53 -0700755 ifa->ifa_dev = in_dev;
756
Al Viroa7a628c2006-09-26 22:16:43 -0700757 ifa->ifa_local = nla_get_be32(tb[IFA_LOCAL]);
758 ifa->ifa_address = nla_get_be32(tb[IFA_ADDRESS]);
Thomas Graf5c753972006-08-04 23:03:53 -0700759
760 if (tb[IFA_BROADCAST])
Al Viroa7a628c2006-09-26 22:16:43 -0700761 ifa->ifa_broadcast = nla_get_be32(tb[IFA_BROADCAST]);
Thomas Graf5c753972006-08-04 23:03:53 -0700762
Thomas Graf5c753972006-08-04 23:03:53 -0700763 if (tb[IFA_LABEL])
764 nla_strlcpy(ifa->ifa_label, tb[IFA_LABEL], IFNAMSIZ);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700765 else
766 memcpy(ifa->ifa_label, dev->name, IFNAMSIZ);
767
Jiri Pirko5c766d62013-01-24 09:41:41 +0000768 if (tb[IFA_CACHEINFO]) {
769 struct ifa_cacheinfo *ci;
770
771 ci = nla_data(tb[IFA_CACHEINFO]);
772 if (!ci->ifa_valid || ci->ifa_prefered > ci->ifa_valid) {
773 err = -EINVAL;
774 goto errout;
775 }
776 *pvalid_lft = ci->ifa_valid;
777 *pprefered_lft = ci->ifa_prefered;
778 }
779
Thomas Graf5c753972006-08-04 23:03:53 -0700780 return ifa;
781
782errout:
783 return ERR_PTR(err);
784}
785
Jiri Pirko5c766d62013-01-24 09:41:41 +0000786static struct in_ifaddr *find_matching_ifa(struct in_ifaddr *ifa)
787{
788 struct in_device *in_dev = ifa->ifa_dev;
789 struct in_ifaddr *ifa1, **ifap;
790
791 if (!ifa->ifa_local)
792 return NULL;
793
794 for (ifap = &in_dev->ifa_list; (ifa1 = *ifap) != NULL;
795 ifap = &ifa1->ifa_next) {
796 if (ifa1->ifa_mask == ifa->ifa_mask &&
797 inet_ifa_match(ifa1->ifa_address, ifa) &&
798 ifa1->ifa_local == ifa->ifa_local)
799 return ifa1;
800 }
801 return NULL;
802}
803
Thomas Graf661d2962013-03-21 07:45:29 +0000804static int inet_rtm_newaddr(struct sk_buff *skb, struct nlmsghdr *nlh)
Thomas Graf5c753972006-08-04 23:03:53 -0700805{
YOSHIFUJI Hideaki3b1e0a62008-03-26 02:26:21 +0900806 struct net *net = sock_net(skb->sk);
Thomas Graf5c753972006-08-04 23:03:53 -0700807 struct in_ifaddr *ifa;
Jiri Pirko5c766d62013-01-24 09:41:41 +0000808 struct in_ifaddr *ifa_existing;
809 __u32 valid_lft = INFINITY_LIFE_TIME;
810 __u32 prefered_lft = INFINITY_LIFE_TIME;
Thomas Graf5c753972006-08-04 23:03:53 -0700811
812 ASSERT_RTNL();
813
Jiri Pirko5c766d62013-01-24 09:41:41 +0000814 ifa = rtm_to_ifaddr(net, nlh, &valid_lft, &prefered_lft);
Thomas Graf5c753972006-08-04 23:03:53 -0700815 if (IS_ERR(ifa))
816 return PTR_ERR(ifa);
817
Jiri Pirko5c766d62013-01-24 09:41:41 +0000818 ifa_existing = find_matching_ifa(ifa);
819 if (!ifa_existing) {
820 /* It would be best to check for !NLM_F_CREATE here but
821 * userspace alreay relies on not having to provide this.
822 */
823 set_ifa_lifetime(ifa, valid_lft, prefered_lft);
824 return __inet_insert_ifa(ifa, nlh, NETLINK_CB(skb).portid);
825 } else {
826 inet_free_ifa(ifa);
827
828 if (nlh->nlmsg_flags & NLM_F_EXCL ||
829 !(nlh->nlmsg_flags & NLM_F_REPLACE))
830 return -EEXIST;
Jiri Pirko34e2ed32013-04-04 08:33:00 +0000831 ifa = ifa_existing;
832 set_ifa_lifetime(ifa, valid_lft, prefered_lft);
Jiri Pirko05a324b2013-04-04 23:39:38 +0000833 cancel_delayed_work(&check_lifetime_work);
834 schedule_delayed_work(&check_lifetime_work, 0);
Jiri Pirko34e2ed32013-04-04 08:33:00 +0000835 rtmsg_ifa(RTM_NEWADDR, ifa, nlh, NETLINK_CB(skb).portid);
836 blocking_notifier_call_chain(&inetaddr_chain, NETDEV_UP, ifa);
Jiri Pirko5c766d62013-01-24 09:41:41 +0000837 }
838 return 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700839}
840
841/*
842 * Determine a default network mask, based on the IP address.
843 */
844
Eric Dumazet40384992012-08-03 21:06:50 +0000845static int inet_abc_len(__be32 addr)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700846{
847 int rc = -1; /* Something else, probably a multicast. */
848
Joe Perchesf97c1e02007-12-16 13:45:43 -0800849 if (ipv4_is_zeronet(addr))
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +0900850 rc = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700851 else {
Al Viro714e85b2006-11-14 20:51:49 -0800852 __u32 haddr = ntohl(addr);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700853
Al Viro714e85b2006-11-14 20:51:49 -0800854 if (IN_CLASSA(haddr))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700855 rc = 8;
Al Viro714e85b2006-11-14 20:51:49 -0800856 else if (IN_CLASSB(haddr))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700857 rc = 16;
Al Viro714e85b2006-11-14 20:51:49 -0800858 else if (IN_CLASSC(haddr))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700859 rc = 24;
860 }
861
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +0900862 return rc;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700863}
864
865
/*
 * devinet_ioctl - handle the IPv4 interface-address ioctls.
 *
 * Copies a struct ifreq in from @arg, validates @cmd and then, under the
 * RTNL lock, looks up the device named in the request and the address the
 * request refers to (by label, optionally also by address).
 *
 * The "get" commands (SIOCGIFADDR, SIOCGIFBRDADDR, SIOCGIFDSTADDR,
 * SIOCGIFNETMASK) store the requested value in the ifreq and copy it back
 * to @arg.  The "set" commands (SIOCSIFFLAGS, SIOCSIFADDR, SIOCSIFBRDADDR,
 * SIOCSIFDSTADDR, SIOCSIFNETMASK) require CAP_NET_ADMIN in net->user_ns.
 * Any other @cmd is rejected with -EINVAL.
 *
 * Returns 0 on success or a negative errno: -EFAULT when a user copy
 * fails, -EPERM, -EINVAL, -ENODEV when the device name is unknown,
 * -EADDRNOTAVAIL when no matching address exists, -ENOBUFS when a new
 * address cannot be allocated, or whatever dev_change_flags() /
 * inet_set_ifa() return.
 */
Denis V. Luneve5b13cb2008-02-28 20:51:43 -0800866int devinet_ioctl(struct net *net, unsigned int cmd, void __user *arg)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700867{
868 struct ifreq ifr;
869 struct sockaddr_in sin_orig;
870 struct sockaddr_in *sin = (struct sockaddr_in *)&ifr.ifr_addr;
871 struct in_device *in_dev;
872 struct in_ifaddr **ifap = NULL;
873 struct in_ifaddr *ifa = NULL;
874 struct net_device *dev;
875 char *colon;
876 int ret = -EFAULT;
877 int tryaddrmatch = 0;
878
879 /*
880 * Fetch the caller's info block into kernel space
881 */
882
883 if (copy_from_user(&ifr, arg, sizeof(struct ifreq)))
884 goto out;
/* Force NUL termination: the name came from user space. */
885 ifr.ifr_name[IFNAMSIZ - 1] = 0;
886
887 /* save original address for comparison */
888 memcpy(&sin_orig, sin, sizeof(*sin));
889
/*
 * Temporarily cut the name at an alias separator so that dev_load() and the
 * device lookup below see only the part before the ':'.  The ':' is put
 * back after the lookup.
 */
890 colon = strchr(ifr.ifr_name, ':');
891 if (colon)
892 *colon = 0;
893
Denis V. Luneve5b13cb2008-02-28 20:51:43 -0800894 dev_load(net, ifr.ifr_name);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700895
/* First pass over cmd: permission and argument checks only, no lock held. */
Stephen Hemminger132adf52007-03-08 20:44:43 -0800896 switch (cmd) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700897 case SIOCGIFADDR: /* Get interface address */
898 case SIOCGIFBRDADDR: /* Get the broadcast address */
899 case SIOCGIFDSTADDR: /* Get the destination address */
900 case SIOCGIFNETMASK: /* Get the netmask for the interface */
901 /* Note that these ioctls will not sleep,
902 so that we do not impose a lock.
903 One day we will be forced to put shlock here (I mean SMP)
904 */
/*
 * Only try the label+address match if the caller supplied an AF_INET
 * address; the reply buffer is then cleared (sin_orig keeps the original).
 */
905 tryaddrmatch = (sin_orig.sin_family == AF_INET);
906 memset(sin, 0, sizeof(*sin));
907 sin->sin_family = AF_INET;
908 break;
909
910 case SIOCSIFFLAGS:
Zhao Hongjiangbf5b30b2012-09-20 22:37:25 +0000911 ret = -EPERM;
Eric W. Biederman52e804c2012-11-16 03:03:05 +0000912 if (!ns_capable(net->user_ns, CAP_NET_ADMIN))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700913 goto out;
914 break;
915 case SIOCSIFADDR: /* Set interface address (and family) */
916 case SIOCSIFBRDADDR: /* Set the broadcast address */
917 case SIOCSIFDSTADDR: /* Set the destination address */
918 case SIOCSIFNETMASK: /* Set the netmask for the interface */
Zhao Hongjiangbf5b30b2012-09-20 22:37:25 +0000919 ret = -EPERM;
Eric W. Biederman52e804c2012-11-16 03:03:05 +0000920 if (!ns_capable(net->user_ns, CAP_NET_ADMIN))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700921 goto out;
922 ret = -EINVAL;
923 if (sin->sin_family != AF_INET)
924 goto out;
925 break;
926 default:
927 ret = -EINVAL;
928 goto out;
929 }
930
/* From here on every exit must go through done: or rarok: to drop RTNL. */
931 rtnl_lock();
932
933 ret = -ENODEV;
Eric Dumazet9f9354b2009-11-04 22:05:10 -0800934 dev = __dev_get_by_name(net, ifr.ifr_name);
935 if (!dev)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700936 goto done;
937
/* Restore the full label so the ifa_label comparisons below see it. */
938 if (colon)
939 *colon = ':';
940
/* in_dev may be NULL here; ifa and ifap then stay NULL. */
Eric Dumazet9f9354b2009-11-04 22:05:10 -0800941 in_dev = __in_dev_get_rtnl(dev);
942 if (in_dev) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700943 if (tryaddrmatch) {
944 /* Matthias Andree */
945 /* compare label and address (4.4BSD style) */
946 /* note: we only do this for a limited set of ioctls
947 and only if the original address family was AF_INET.
948 This is checked above. */
949 for (ifap = &in_dev->ifa_list; (ifa = *ifap) != NULL;
950 ifap = &ifa->ifa_next) {
951 if (!strcmp(ifr.ifr_name, ifa->ifa_label) &&
952 sin_orig.sin_addr.s_addr ==
David S. Miller6c91afe2011-03-09 13:27:16 -0800953 ifa->ifa_local) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700954 break; /* found */
955 }
956 }
957 }
958 /* we didn't get a match, maybe the application is
959 4.3BSD-style and passed in junk so we fall back to
960 comparing just the label */
961 if (!ifa) {
962 for (ifap = &in_dev->ifa_list; (ifa = *ifap) != NULL;
963 ifap = &ifa->ifa_next)
964 if (!strcmp(ifr.ifr_name, ifa->ifa_label))
965 break;
966 }
967 }
968
/*
 * Only SIOCSIFADDR (which can create the address) and SIOCSIFFLAGS (which
 * handles a missing address itself) may continue without a matching ifa.
 */
969 ret = -EADDRNOTAVAIL;
970 if (!ifa && cmd != SIOCSIFADDR && cmd != SIOCSIFFLAGS)
971 goto done;
972
/* Second pass over cmd: perform the operation. */
Stephen Hemminger132adf52007-03-08 20:44:43 -0800973 switch (cmd) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700974 case SIOCGIFADDR: /* Get interface address */
975 sin->sin_addr.s_addr = ifa->ifa_local;
976 goto rarok;
977
978 case SIOCGIFBRDADDR: /* Get the broadcast address */
979 sin->sin_addr.s_addr = ifa->ifa_broadcast;
980 goto rarok;
981
982 case SIOCGIFDSTADDR: /* Get the destination address */
983 sin->sin_addr.s_addr = ifa->ifa_address;
984 goto rarok;
985
986 case SIOCGIFNETMASK: /* Get the netmask for the interface */
987 sin->sin_addr.s_addr = ifa->ifa_mask;
988 goto rarok;
989
990 case SIOCSIFFLAGS:
/*
 * With an alias label the request applies to that one address: clearing
 * IFF_UP deletes it, anything else succeeds without doing anything.
 * Without a ':' the flags are applied to the device itself.
 */
991 if (colon) {
992 ret = -EADDRNOTAVAIL;
993 if (!ifa)
994 break;
995 ret = 0;
996 if (!(ifr.ifr_flags & IFF_UP))
997 inet_del_ifa(in_dev, ifap, 1);
998 break;
999 }
1000 ret = dev_change_flags(dev, ifr.ifr_flags);
1001 break;
1002
1003 case SIOCSIFADDR: /* Set interface address (and family) */
/* Reject addresses inet_abc_len() cannot classify (e.g. multicast). */
1004 ret = -EINVAL;
1005 if (inet_abc_len(sin->sin_addr.s_addr) < 0)
1006 break;
1007
1008 if (!ifa) {
/* No address with this label yet: allocate one and label it. */
1009 ret = -ENOBUFS;
Eric Dumazet9f9354b2009-11-04 22:05:10 -08001010 ifa = inet_alloc_ifa();
1011 if (!ifa)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001012 break;
Xi Wangc7e2e1d2013-01-05 11:19:24 +00001013 INIT_HLIST_NODE(&ifa->hash);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001014 if (colon)
1015 memcpy(ifa->ifa_label, ifr.ifr_name, IFNAMSIZ);
1016 else
1017 memcpy(ifa->ifa_label, dev->name, IFNAMSIZ);
1018 } else {
/*
 * Existing address: nothing to do if it is unchanged.  Otherwise it is
 * removed from the list (last argument 0 - presumably "do not destroy";
 * confirm against inet_del_ifa()) and reused below with the new values.
 */
1019 ret = 0;
1020 if (ifa->ifa_local == sin->sin_addr.s_addr)
1021 break;
1022 inet_del_ifa(in_dev, ifap, 0);
1023 ifa->ifa_broadcast = 0;
Bjorn Mork148f9722008-02-26 18:17:53 -08001024 ifa->ifa_scope = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001025 }
1026
1027 ifa->ifa_address = ifa->ifa_local = sin->sin_addr.s_addr;
1028
/*
 * Derive prefix length, mask and broadcast from the address class, except
 * on point-to-point devices, which get a /32.
 */
1029 if (!(dev->flags & IFF_POINTOPOINT)) {
1030 ifa->ifa_prefixlen = inet_abc_len(ifa->ifa_address);
1031 ifa->ifa_mask = inet_make_mask(ifa->ifa_prefixlen);
1032 if ((dev->flags & IFF_BROADCAST) &&
1033 ifa->ifa_prefixlen < 31)
1034 ifa->ifa_broadcast = ifa->ifa_address |
1035 ~ifa->ifa_mask;
1036 } else {
1037 ifa->ifa_prefixlen = 32;
1038 ifa->ifa_mask = inet_make_mask(32);
1039 }
Jiri Pirko5c766d62013-01-24 09:41:41 +00001040 set_ifa_lifetime(ifa, INFINITY_LIFE_TIME, INFINITY_LIFE_TIME);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001041 ret = inet_set_ifa(dev, ifa);
1042 break;
1043
1044 case SIOCSIFBRDADDR: /* Set the broadcast address */
/* Changes are applied by removing the address and inserting it again. */
1045 ret = 0;
1046 if (ifa->ifa_broadcast != sin->sin_addr.s_addr) {
1047 inet_del_ifa(in_dev, ifap, 0);
1048 ifa->ifa_broadcast = sin->sin_addr.s_addr;
1049 inet_insert_ifa(ifa);
1050 }
1051 break;
1052
1053 case SIOCSIFDSTADDR: /* Set the destination address */
1054 ret = 0;
1055 if (ifa->ifa_address == sin->sin_addr.s_addr)
1056 break;
1057 ret = -EINVAL;
1058 if (inet_abc_len(sin->sin_addr.s_addr) < 0)
1059 break;
1060 ret = 0;
1061 inet_del_ifa(in_dev, ifap, 0);
1062 ifa->ifa_address = sin->sin_addr.s_addr;
1063 inet_insert_ifa(ifa);
1064 break;
1065
1066 case SIOCSIFNETMASK: /* Set the netmask for the interface */
1067
1068 /*
1069 * The mask we set must be legal.
1070 */
1071 ret = -EINVAL;
1072 if (bad_mask(sin->sin_addr.s_addr, 0))
1073 break;
1074 ret = 0;
1075 if (ifa->ifa_mask != sin->sin_addr.s_addr) {
Al Viroa144ea42006-09-28 18:00:55 -07001076 __be32 old_mask = ifa->ifa_mask;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001077 inet_del_ifa(in_dev, ifap, 0);
1078 ifa->ifa_mask = sin->sin_addr.s_addr;
1079 ifa->ifa_prefixlen = inet_mask_len(ifa->ifa_mask);
1080
1081 /* See if current broadcast address matches
1082 * with current netmask, then recalculate
1083 * the broadcast address. Otherwise it's a
1084 * funny address, so don't touch it since
1085 * the user seems to know what (s)he's doing...
1086 */
1087 if ((dev->flags & IFF_BROADCAST) &&
1088 (ifa->ifa_prefixlen < 31) &&
1089 (ifa->ifa_broadcast ==
David Engeldcab5e12005-10-21 22:09:16 -05001090 (ifa->ifa_local|~old_mask))) {
Linus Torvalds1da177e2005-04-16 15:20:36 -07001091 ifa->ifa_broadcast = (ifa->ifa_local |
1092 ~sin->sin_addr.s_addr);
1093 }
1094 inet_insert_ifa(ifa);
1095 }
1096 break;
1097 }
/* done: exit with RTNL held; out: exit without it. */
1098done:
1099 rtnl_unlock();
1100out:
1101 return ret;
/* rarok: the "get" commands drop RTNL and then copy the reply to user space. */
1102rarok:
1103 rtnl_unlock();
1104 ret = copy_to_user(arg, &ifr, sizeof(struct ifreq)) ? -EFAULT : 0;
1105 goto out;
1106}
1107
1108static int inet_gifconf(struct net_device *dev, char __user *buf, int len)
1109{
Herbert Xue5ed6392005-10-03 14:35:55 -07001110 struct in_device *in_dev = __in_dev_get_rtnl(dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001111 struct in_ifaddr *ifa;
1112 struct ifreq ifr;
1113 int done = 0;
1114
Eric Dumazet9f9354b2009-11-04 22:05:10 -08001115 if (!in_dev)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001116 goto out;
1117
Eric Dumazet9f9354b2009-11-04 22:05:10 -08001118 for (ifa = in_dev->ifa_list; ifa; ifa = ifa->ifa_next) {
Linus Torvalds1da177e2005-04-16 15:20:36 -07001119 if (!buf) {
1120 done += sizeof(ifr);
1121 continue;
1122 }
1123 if (len < (int) sizeof(ifr))
1124 break;
1125 memset(&ifr, 0, sizeof(struct ifreq));
1126 if (ifa->ifa_label)
1127 strcpy(ifr.ifr_name, ifa->ifa_label);
1128 else
1129 strcpy(ifr.ifr_name, dev->name);
1130
1131 (*(struct sockaddr_in *)&ifr.ifr_addr).sin_family = AF_INET;
1132 (*(struct sockaddr_in *)&ifr.ifr_addr).sin_addr.s_addr =
1133 ifa->ifa_local;
1134
1135 if (copy_to_user(buf, &ifr, sizeof(struct ifreq))) {
1136 done = -EFAULT;
1137 break;
1138 }
1139 buf += sizeof(struct ifreq);
1140 len -= sizeof(struct ifreq);
1141 done += sizeof(struct ifreq);
1142 }
1143out:
1144 return done;
1145}
1146
Al Viroa61ced52006-09-26 21:27:54 -07001147__be32 inet_select_addr(const struct net_device *dev, __be32 dst, int scope)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001148{
Al Viroa61ced52006-09-26 21:27:54 -07001149 __be32 addr = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001150 struct in_device *in_dev;
YOSHIFUJI Hideakic346dca2008-03-25 21:47:49 +09001151 struct net *net = dev_net(dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001152
1153 rcu_read_lock();
Herbert Xue5ed6392005-10-03 14:35:55 -07001154 in_dev = __in_dev_get_rcu(dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001155 if (!in_dev)
1156 goto no_in_dev;
1157
1158 for_primary_ifa(in_dev) {
1159 if (ifa->ifa_scope > scope)
1160 continue;
1161 if (!dst || inet_ifa_match(dst, ifa)) {
1162 addr = ifa->ifa_local;
1163 break;
1164 }
1165 if (!addr)
1166 addr = ifa->ifa_local;
1167 } endfor_ifa(in_dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001168
1169 if (addr)
Eric Dumazetc6d14c82009-11-04 05:43:23 -08001170 goto out_unlock;
Eric Dumazet9f9354b2009-11-04 22:05:10 -08001171no_in_dev:
Linus Torvalds1da177e2005-04-16 15:20:36 -07001172
1173 /* Not loopback addresses on loopback should be preferred
1174 in this case. It is importnat that lo is the first interface
1175 in dev_base list.
1176 */
Eric Dumazetc6d14c82009-11-04 05:43:23 -08001177 for_each_netdev_rcu(net, dev) {
Eric Dumazet9f9354b2009-11-04 22:05:10 -08001178 in_dev = __in_dev_get_rcu(dev);
1179 if (!in_dev)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001180 continue;
1181
1182 for_primary_ifa(in_dev) {
1183 if (ifa->ifa_scope != RT_SCOPE_LINK &&
1184 ifa->ifa_scope <= scope) {
1185 addr = ifa->ifa_local;
Eric Dumazetc6d14c82009-11-04 05:43:23 -08001186 goto out_unlock;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001187 }
1188 } endfor_ifa(in_dev);
1189 }
Eric Dumazetc6d14c82009-11-04 05:43:23 -08001190out_unlock:
Linus Torvalds1da177e2005-04-16 15:20:36 -07001191 rcu_read_unlock();
Linus Torvalds1da177e2005-04-16 15:20:36 -07001192 return addr;
1193}
Eric Dumazet9f9354b2009-11-04 22:05:10 -08001194EXPORT_SYMBOL(inet_select_addr);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001195
/*
 * confirm_addr_indev - look for a usable local address on one in_device.
 *
 * Walks the addresses of @in_dev tracking two things:
 *   addr - the first address whose scope is <= @scope and which equals
 *          @local (any address when @local is 0);
 *   same - whether an address has been seen whose subnet contains @local
 *          and @dst (a zero @local / @dst acts as a wildcard).
 *
 * Returns addr if a subnet match was found, otherwise 0.
 */
Al Viro60cad5d2006-09-26 22:17:09 -07001196static __be32 confirm_addr_indev(struct in_device *in_dev, __be32 dst,
1197 __be32 local, int scope)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001198{
1199 int same = 0;
Al Viroa144ea42006-09-28 18:00:55 -07001200 __be32 addr = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001201
1202 for_ifa(in_dev) {
/* Candidate local address; done at once if the subnet was already matched. */
1203 if (!addr &&
1204 (local == ifa->ifa_local || !local) &&
1205 ifa->ifa_scope <= scope) {
1206 addr = ifa->ifa_local;
1207 if (same)
1208 break;
1209 }
/* Still looking for an entry whose subnet covers both local and dst. */
1210 if (!same) {
1211 same = (!local || inet_ifa_match(local, ifa)) &&
1212 (!dst || inet_ifa_match(dst, ifa));
1213 if (same && addr) {
/* An explicit local, or no dst constraint: addr needs no further check. */
1214 if (local || !dst)
1215 break;
1216 /* Is the selected addr into dst subnet? */
1217 if (inet_ifa_match(addr, ifa))
1218 break;
1219 /* No, then can we use new local src? */
1220 if (ifa->ifa_scope <= scope) {
1221 addr = ifa->ifa_local;
1222 break;
1223 }
1224 /* search for large dst subnet for addr */
1225 same = 0;
1226 }
1227 }
1228 } endfor_ifa(in_dev);
1229
Eric Dumazet9f9354b2009-11-04 22:05:10 -08001230 return same ? addr : 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001231}
1232
1233/*
1234 * Confirm that local IP address exists using wildcards:
Denis V. Lunev9bd85e32008-01-14 23:05:55 -08001235 * - in_dev: only on this interface, 0=any interface
Linus Torvalds1da177e2005-04-16 15:20:36 -07001236 * - dst: only in the same subnet as dst, 0=any dst
1237 * - local: address, 0=autoselect the local address
1238 * - scope: maximum allowed scope value for the local address
1239 */
Denis V. Lunev9bd85e32008-01-14 23:05:55 -08001240__be32 inet_confirm_addr(struct in_device *in_dev,
1241 __be32 dst, __be32 local, int scope)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001242{
Al Viro60cad5d2006-09-26 22:17:09 -07001243 __be32 addr = 0;
Denis V. Lunev9bd85e32008-01-14 23:05:55 -08001244 struct net_device *dev;
Denis V. Lunev39a6d062008-01-14 23:06:19 -08001245 struct net *net;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001246
Denis V. Lunev39a6d062008-01-14 23:06:19 -08001247 if (scope != RT_SCOPE_LINK)
Denis V. Lunev9bd85e32008-01-14 23:05:55 -08001248 return confirm_addr_indev(in_dev, dst, local, scope);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001249
YOSHIFUJI Hideakic346dca2008-03-25 21:47:49 +09001250 net = dev_net(in_dev->dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001251 rcu_read_lock();
Eric Dumazetc6d14c82009-11-04 05:43:23 -08001252 for_each_netdev_rcu(net, dev) {
Eric Dumazet9f9354b2009-11-04 22:05:10 -08001253 in_dev = __in_dev_get_rcu(dev);
1254 if (in_dev) {
Linus Torvalds1da177e2005-04-16 15:20:36 -07001255 addr = confirm_addr_indev(in_dev, dst, local, scope);
1256 if (addr)
1257 break;
1258 }
1259 }
1260 rcu_read_unlock();
Linus Torvalds1da177e2005-04-16 15:20:36 -07001261
1262 return addr;
1263}
Andy Gospodarekeaddcd72012-03-22 16:14:29 +00001264EXPORT_SYMBOL(inet_confirm_addr);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001265
1266/*
1267 * Device notifier
1268 */
1269
1270int register_inetaddr_notifier(struct notifier_block *nb)
1271{
Alan Sterne041c682006-03-27 01:16:30 -08001272 return blocking_notifier_chain_register(&inetaddr_chain, nb);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001273}
Eric Dumazet9f9354b2009-11-04 22:05:10 -08001274EXPORT_SYMBOL(register_inetaddr_notifier);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001275
1276int unregister_inetaddr_notifier(struct notifier_block *nb)
1277{
Alan Sterne041c682006-03-27 01:16:30 -08001278 return blocking_notifier_chain_unregister(&inetaddr_chain, nb);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001279}
Eric Dumazet9f9354b2009-11-04 22:05:10 -08001280EXPORT_SYMBOL(unregister_inetaddr_notifier);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001281
Eric Dumazet9f9354b2009-11-04 22:05:10 -08001282/* Rename ifa_labels for a device name change. Make some effort to preserve
1283 * existing alias numbering and to create unique labels if possible.
Linus Torvalds1da177e2005-04-16 15:20:36 -07001284*/
1285static void inetdev_changename(struct net_device *dev, struct in_device *in_dev)
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +09001286{
Linus Torvalds1da177e2005-04-16 15:20:36 -07001287 struct in_ifaddr *ifa;
1288 int named = 0;
1289
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +09001290 for (ifa = in_dev->ifa_list; ifa; ifa = ifa->ifa_next) {
1291 char old[IFNAMSIZ], *dot;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001292
1293 memcpy(old, ifa->ifa_label, IFNAMSIZ);
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +09001294 memcpy(ifa->ifa_label, dev->name, IFNAMSIZ);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001295 if (named++ == 0)
Thomas Graf573bf472008-06-10 15:40:04 -07001296 goto skip;
Mark McLoughlin44344b22008-01-04 00:56:25 -08001297 dot = strchr(old, ':');
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +09001298 if (dot == NULL) {
1299 sprintf(old, ":%d", named);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001300 dot = old;
1301 }
Eric Dumazet9f9354b2009-11-04 22:05:10 -08001302 if (strlen(dot) + strlen(dev->name) < IFNAMSIZ)
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +09001303 strcat(ifa->ifa_label, dot);
Eric Dumazet9f9354b2009-11-04 22:05:10 -08001304 else
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +09001305 strcpy(ifa->ifa_label + (IFNAMSIZ - strlen(dot) - 1), dot);
Thomas Graf573bf472008-06-10 15:40:04 -07001306skip:
1307 rtmsg_ifa(RTM_NEWADDR, ifa, NULL, 0);
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +09001308 }
1309}
Linus Torvalds1da177e2005-04-16 15:20:36 -07001310
/*
 * Tell whether @mtu is large enough for IPv4 to be enabled on a device.
 * The threshold of 68 bytes is the smallest datagram size every IPv4
 * module must be able to forward (RFC 791).
 */
static bool inetdev_valid_mtu(unsigned int mtu)
{
	const unsigned int min_mtu = 68;

	if (mtu < min_mtu)
		return false;
	return true;
}
1315
Ian Campbelld11327ad2011-02-11 07:44:16 +00001316static void inetdev_send_gratuitous_arp(struct net_device *dev,
1317 struct in_device *in_dev)
1318
1319{
Zoltan Kissb76d0782011-07-24 13:09:30 +00001320 struct in_ifaddr *ifa;
Ian Campbelld11327ad2011-02-11 07:44:16 +00001321
Zoltan Kissb76d0782011-07-24 13:09:30 +00001322 for (ifa = in_dev->ifa_list; ifa;
1323 ifa = ifa->ifa_next) {
1324 arp_send(ARPOP_REQUEST, ETH_P_ARP,
1325 ifa->ifa_local, dev,
1326 ifa->ifa_local, NULL,
1327 dev->dev_addr, NULL);
1328 }
Ian Campbelld11327ad2011-02-11 07:44:16 +00001329}
1330
Linus Torvalds1da177e2005-04-16 15:20:36 -07001331/* Called only under RTNL semaphore */
1332
/*
 * inetdev_event - netdevice notifier callback for the IPv4 layer.
 *
 * @this:  the notifier block (unused here)
 * @event: NETDEV_* event code
 * @ptr:   the struct net_device the event is about
 *
 * If the device has no in_device yet, one is created on NETDEV_REGISTER,
 * or on NETDEV_CHANGEMTU once the MTU is valid again; all other events are
 * ignored for such a device.  Otherwise the event is dispatched in the
 * switch below.
 *
 * Returns NOTIFY_DONE, except when inetdev_init() fails during
 * NETDEV_REGISTER, where notifier_from_errno(-ENOMEM) is returned.
 */
1333 static int inetdev_event(struct notifier_block *this, unsigned long event,
1334 void *ptr)
1335 {
1336 struct net_device *dev = ptr;
Eric Dumazet748e2d92012-08-22 21:50:59 +00001337 struct in_device *in_dev = __in_dev_get_rtnl(dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001338
1339 ASSERT_RTNL();
1340
1341 if (!in_dev) {
Herbert Xu8030f542007-02-22 01:53:47 +09001342 if (event == NETDEV_REGISTER) {
Linus Torvalds1da177e2005-04-16 15:20:36 -07001343 in_dev = inetdev_init(dev);
Herbert Xub217d612007-07-30 17:04:52 -07001344 if (!in_dev)
1345 return notifier_from_errno(-ENOMEM);
/* Loopback devices get the NOXFRM and NOPOLICY settings switched on. */
Eric W. Biederman0cc217e2007-09-26 22:10:06 -07001346 if (dev->flags & IFF_LOOPBACK) {
Herbert Xu42f811b2007-06-04 23:34:44 -07001347 IN_DEV_CONF_SET(in_dev, NOXFRM, 1);
1348 IN_DEV_CONF_SET(in_dev, NOPOLICY, 1);
Herbert Xu8030f542007-02-22 01:53:47 +09001349 }
Breno Leitao06770842008-09-02 17:28:58 -07001350 } else if (event == NETDEV_CHANGEMTU) {
1351 /* Re-enabling IP */
1352 if (inetdev_valid_mtu(dev->mtu))
1353 in_dev = inetdev_init(dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001354 }
1355 goto out;
1356 }
1357
1358 switch (event) {
1359 case NETDEV_REGISTER:
/* Unexpected: REGISTER for a device that already has an in_device. */
Joe Perches91df42b2012-05-15 14:11:54 +00001360 pr_debug("%s: bug\n", __func__);
Stephen Hemmingera9b3cd72011-08-01 16:19:00 +00001361 RCU_INIT_POINTER(dev->ip_ptr, NULL);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001362 break;
1363 case NETDEV_UP:
Breno Leitao06770842008-09-02 17:28:58 -07001364 if (!inetdev_valid_mtu(dev->mtu))
Linus Torvalds1da177e2005-04-16 15:20:36 -07001365 break;
/* Bringing up a loopback device: configure INADDR_LOOPBACK/8 on it. */
Eric W. Biederman0cc217e2007-09-26 22:10:06 -07001366 if (dev->flags & IFF_LOOPBACK) {
Eric Dumazet9f9354b2009-11-04 22:05:10 -08001367 struct in_ifaddr *ifa = inet_alloc_ifa();
1368
/* Allocation failure is tolerated: the device simply gets no address. */
1369 if (ifa) {
David S. Millerfd23c3b2011-02-18 12:42:28 -08001370 INIT_HLIST_NODE(&ifa->hash);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001371 ifa->ifa_local =
1372 ifa->ifa_address = htonl(INADDR_LOOPBACK);
1373 ifa->ifa_prefixlen = 8;
1374 ifa->ifa_mask = inet_make_mask(8);
1375 in_dev_hold(in_dev);
1376 ifa->ifa_dev = in_dev;
1377 ifa->ifa_scope = RT_SCOPE_HOST;
1378 memcpy(ifa->ifa_label, dev->name, IFNAMSIZ);
Jiri Pirko5c766d62013-01-24 09:41:41 +00001379 set_ifa_lifetime(ifa, INFINITY_LIFE_TIME,
1380 INFINITY_LIFE_TIME);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001381 inet_insert_ifa(ifa);
1382 }
1383 }
1384 ip_mc_up(in_dev);
Stephen Hemmingereefef1c2009-02-01 01:04:33 -08001385 /* fall through */
1386 case NETDEV_CHANGEADDR:
/* UP and CHANGEADDR only announce themselves if ARP_NOTIFY is enabled. */
Ian Campbelld11327ad2011-02-11 07:44:16 +00001387 if (!IN_DEV_ARP_NOTIFY(in_dev))
1388 break;
1389 /* fall through */
1390 case NETDEV_NOTIFY_PEERS:
Stephen Hemmingera21090c2009-10-07 03:18:17 -07001391 /* Send gratuitous ARP to notify of link change */
Ian Campbelld11327ad2011-02-11 07:44:16 +00001392 inetdev_send_gratuitous_arp(dev, in_dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001393 break;
1394 case NETDEV_DOWN:
1395 ip_mc_down(in_dev);
1396 break;
Jiri Pirko93d9b7d2010-03-10 10:28:56 +00001397 case NETDEV_PRE_TYPE_CHANGE:
Moni Shoua75c78502009-09-15 02:37:40 -07001398 ip_mc_unmap(in_dev);
1399 break;
Jiri Pirko93d9b7d2010-03-10 10:28:56 +00001400 case NETDEV_POST_TYPE_CHANGE:
Moni Shoua75c78502009-09-15 02:37:40 -07001401 ip_mc_remap(in_dev);
1402 break;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001403 case NETDEV_CHANGEMTU:
Breno Leitao06770842008-09-02 17:28:58 -07001404 if (inetdev_valid_mtu(dev->mtu))
Linus Torvalds1da177e2005-04-16 15:20:36 -07001405 break;
Breno Leitao06770842008-09-02 17:28:58 -07001406 /* disable IP when MTU is not enough */
/* fall through */
Linus Torvalds1da177e2005-04-16 15:20:36 -07001407 case NETDEV_UNREGISTER:
1408 inetdev_destroy(in_dev);
1409 break;
1410 case NETDEV_CHANGENAME:
1411 /* Do not notify about label change, this event is
1412 * not interesting to applications using netlink.
1413 */
/*
 * NOTE(review): the comment above looks stale - inetdev_changename() in
 * this file sends an RTM_NEWADDR message for every address it relabels.
 */
1414 inetdev_changename(dev, in_dev);
1415
/* Re-register the sysctl entries (presumably keyed by device name - confirm). */
Pavel Emelyanov51602b22007-12-11 02:17:40 -08001416 devinet_sysctl_unregister(in_dev);
Pavel Emelyanov66f27a52007-12-02 00:55:54 +11001417 devinet_sysctl_register(in_dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001418 break;
1419 }
1420out:
1421 return NOTIFY_DONE;
1422}
1423
/* Notifier block whose callback is inetdev_event(). */
1424 static struct notifier_block ip_netdev_notifier = {
Jianjun Kong539afed2008-11-03 02:48:48 -08001425 .notifier_call = inetdev_event,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001426};
1427
Eric Dumazet40384992012-08-03 21:06:50 +00001428static size_t inet_nlmsg_size(void)
Thomas Graf339bf982006-11-10 14:10:15 -08001429{
1430 return NLMSG_ALIGN(sizeof(struct ifaddrmsg))
1431 + nla_total_size(4) /* IFA_ADDRESS */
1432 + nla_total_size(4) /* IFA_LOCAL */
1433 + nla_total_size(4) /* IFA_BROADCAST */
Thomas Graf339bf982006-11-10 14:10:15 -08001434 + nla_total_size(IFNAMSIZ); /* IFA_LABEL */
1435}
1436
Jiri Pirko5c766d62013-01-24 09:41:41 +00001437static inline u32 cstamp_delta(unsigned long cstamp)
1438{
1439 return (cstamp - INITIAL_JIFFIES) * 100UL / HZ;
1440}
1441
1442static int put_cacheinfo(struct sk_buff *skb, unsigned long cstamp,
1443 unsigned long tstamp, u32 preferred, u32 valid)
1444{
1445 struct ifa_cacheinfo ci;
1446
1447 ci.cstamp = cstamp_delta(cstamp);
1448 ci.tstamp = cstamp_delta(tstamp);
1449 ci.ifa_prefered = preferred;
1450 ci.ifa_valid = valid;
1451
1452 return nla_put(skb, IFA_CACHEINFO, sizeof(ci), &ci);
1453}
1454
Linus Torvalds1da177e2005-04-16 15:20:36 -07001455static int inet_fill_ifaddr(struct sk_buff *skb, struct in_ifaddr *ifa,
Eric W. Biederman15e47302012-09-07 20:12:54 +00001456 u32 portid, u32 seq, int event, unsigned int flags)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001457{
1458 struct ifaddrmsg *ifm;
1459 struct nlmsghdr *nlh;
Jiri Pirko5c766d62013-01-24 09:41:41 +00001460 u32 preferred, valid;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001461
Eric W. Biederman15e47302012-09-07 20:12:54 +00001462 nlh = nlmsg_put(skb, portid, seq, event, sizeof(*ifm), flags);
Thomas Graf47f68512006-08-04 23:04:36 -07001463 if (nlh == NULL)
Patrick McHardy26932562007-01-31 23:16:40 -08001464 return -EMSGSIZE;
Thomas Graf47f68512006-08-04 23:04:36 -07001465
1466 ifm = nlmsg_data(nlh);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001467 ifm->ifa_family = AF_INET;
1468 ifm->ifa_prefixlen = ifa->ifa_prefixlen;
Jiri Pirko5c766d62013-01-24 09:41:41 +00001469 ifm->ifa_flags = ifa->ifa_flags;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001470 ifm->ifa_scope = ifa->ifa_scope;
1471 ifm->ifa_index = ifa->ifa_dev->dev->ifindex;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001472
Jiri Pirko5c766d62013-01-24 09:41:41 +00001473 if (!(ifm->ifa_flags & IFA_F_PERMANENT)) {
1474 preferred = ifa->ifa_preferred_lft;
1475 valid = ifa->ifa_valid_lft;
1476 if (preferred != INFINITY_LIFE_TIME) {
1477 long tval = (jiffies - ifa->ifa_tstamp) / HZ;
1478
1479 if (preferred > tval)
1480 preferred -= tval;
1481 else
1482 preferred = 0;
1483 if (valid != INFINITY_LIFE_TIME) {
1484 if (valid > tval)
1485 valid -= tval;
1486 else
1487 valid = 0;
1488 }
1489 }
1490 } else {
1491 preferred = INFINITY_LIFE_TIME;
1492 valid = INFINITY_LIFE_TIME;
1493 }
David S. Millerf3756b72012-04-01 20:39:02 -04001494 if ((ifa->ifa_address &&
1495 nla_put_be32(skb, IFA_ADDRESS, ifa->ifa_address)) ||
1496 (ifa->ifa_local &&
1497 nla_put_be32(skb, IFA_LOCAL, ifa->ifa_local)) ||
1498 (ifa->ifa_broadcast &&
1499 nla_put_be32(skb, IFA_BROADCAST, ifa->ifa_broadcast)) ||
1500 (ifa->ifa_label[0] &&
Jiri Pirko5c766d62013-01-24 09:41:41 +00001501 nla_put_string(skb, IFA_LABEL, ifa->ifa_label)) ||
1502 put_cacheinfo(skb, ifa->ifa_cstamp, ifa->ifa_tstamp,
1503 preferred, valid))
David S. Millerf3756b72012-04-01 20:39:02 -04001504 goto nla_put_failure;
Thomas Graf47f68512006-08-04 23:04:36 -07001505
1506 return nlmsg_end(skb, nlh);
1507
1508nla_put_failure:
Patrick McHardy26932562007-01-31 23:16:40 -08001509 nlmsg_cancel(skb, nlh);
1510 return -EMSGSIZE;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001511}
1512
/*
 * inet_dump_ifaddr - netlink dump callback listing IPv4 addresses.
 *
 * Walks every bucket of net->dev_index_head, every device in the bucket
 * and every address on the device, emitting one RTM_NEWADDR message
 * (NLM_F_MULTI) per address through inet_fill_ifaddr().
 *
 * The position is kept in cb->args so the dump can be resumed:
 *   args[0] - hash bucket, args[1] - device index within the bucket,
 *   args[2] - address index within the device.
 *
 * The walk stops as soon as inet_fill_ifaddr() returns <= 0 (presumably
 * because @skb is full - confirm).  Returns skb->len.
 */
1513 static int inet_dump_ifaddr(struct sk_buff *skb, struct netlink_callback *cb)
1514 {
YOSHIFUJI Hideaki3b1e0a62008-03-26 02:26:21 +09001515 struct net *net = sock_net(skb->sk);
Eric Dumazeteec4df92009-11-12 07:44:25 +00001516 int h, s_h;
1517 int idx, s_idx;
1518 int ip_idx, s_ip_idx;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001519 struct net_device *dev;
1520 struct in_device *in_dev;
1521 struct in_ifaddr *ifa;
Eric Dumazeteec4df92009-11-12 07:44:25 +00001522 struct hlist_head *head;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001523
/* Pick up where the previous invocation stopped. */
Eric Dumazeteec4df92009-11-12 07:44:25 +00001524 s_h = cb->args[0];
1525 s_idx = idx = cb->args[1];
1526 s_ip_idx = ip_idx = cb->args[2];
Linus Torvalds1da177e2005-04-16 15:20:36 -07001527
/* s_idx is reset when moving to the next bucket: start at its first device. */
Eric Dumazeteec4df92009-11-12 07:44:25 +00001528 for (h = s_h; h < NETDEV_HASHENTRIES; h++, s_idx = 0) {
1529 idx = 0;
1530 head = &net->dev_index_head[h];
1531 rcu_read_lock();
/* Sequence value that nl_dump_check_consistent() below checks against. */
Nicolas Dichtel04652772013-03-22 06:28:42 +00001532 cb->seq = atomic_read(&net->ipv4.dev_addr_genid) ^
1533 net->dev_base_seq;
Sasha Levinb67bfe02013-02-27 17:06:00 -08001534 hlist_for_each_entry_rcu(dev, head, index_hlist) {
Eric Dumazeteec4df92009-11-12 07:44:25 +00001535 if (idx < s_idx)
1536 goto cont;
/* Past the resume point: dump this device from its first address. */
Patrick McHardy4b97efd2010-03-26 20:27:49 -07001537 if (h > s_h || idx > s_idx)
Eric Dumazeteec4df92009-11-12 07:44:25 +00001538 s_ip_idx = 0;
1539 in_dev = __in_dev_get_rcu(dev);
1540 if (!in_dev)
1541 goto cont;
1542
1543 for (ifa = in_dev->ifa_list, ip_idx = 0; ifa;
1544 ifa = ifa->ifa_next, ip_idx++) {
1545 if (ip_idx < s_ip_idx)
1546 continue;
1547 if (inet_fill_ifaddr(skb, ifa,
Eric W. Biederman15e47302012-09-07 20:12:54 +00001548 NETLINK_CB(cb->skb).portid,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001549 cb->nlh->nlmsg_seq,
Eric Dumazeteec4df92009-11-12 07:44:25 +00001550 RTM_NEWADDR, NLM_F_MULTI) <= 0) {
1551 rcu_read_unlock();
1552 goto done;
1553 }
Nicolas Dichtel04652772013-03-22 06:28:42 +00001554 nl_dump_check_consistent(cb, nlmsg_hdr(skb));
Eric Dumazeteec4df92009-11-12 07:44:25 +00001555 }
Pavel Emelianov7562f872007-05-03 15:13:45 -07001556cont:
Eric Dumazeteec4df92009-11-12 07:44:25 +00001557 idx++;
1558 }
1559 rcu_read_unlock();
Linus Torvalds1da177e2005-04-16 15:20:36 -07001560 }
1561
/* Save the cursor for the next invocation. */
1562done:
Eric Dumazeteec4df92009-11-12 07:44:25 +00001563 cb->args[0] = h;
1564 cb->args[1] = idx;
1565 cb->args[2] = ip_idx;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001566
1567 return skb->len;
1568}
1569
Jianjun Kong539afed2008-11-03 02:48:48 -08001570static void rtmsg_ifa(int event, struct in_ifaddr *ifa, struct nlmsghdr *nlh,
Eric W. Biederman15e47302012-09-07 20:12:54 +00001571 u32 portid)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001572{
Thomas Graf47f68512006-08-04 23:04:36 -07001573 struct sk_buff *skb;
Thomas Grafd6062cb2006-08-15 00:33:59 -07001574 u32 seq = nlh ? nlh->nlmsg_seq : 0;
1575 int err = -ENOBUFS;
Denis V. Lunev4b8aa9a2008-01-31 18:47:40 -08001576 struct net *net;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001577
YOSHIFUJI Hideakic346dca2008-03-25 21:47:49 +09001578 net = dev_net(ifa->ifa_dev->dev);
Thomas Graf339bf982006-11-10 14:10:15 -08001579 skb = nlmsg_new(inet_nlmsg_size(), GFP_KERNEL);
Thomas Graf47f68512006-08-04 23:04:36 -07001580 if (skb == NULL)
Thomas Grafd6062cb2006-08-15 00:33:59 -07001581 goto errout;
1582
Eric W. Biederman15e47302012-09-07 20:12:54 +00001583 err = inet_fill_ifaddr(skb, ifa, portid, seq, event, 0);
Patrick McHardy26932562007-01-31 23:16:40 -08001584 if (err < 0) {
1585 /* -EMSGSIZE implies BUG in inet_nlmsg_size() */
1586 WARN_ON(err == -EMSGSIZE);
1587 kfree_skb(skb);
1588 goto errout;
1589 }
Eric W. Biederman15e47302012-09-07 20:12:54 +00001590 rtnl_notify(skb, net, portid, RTNLGRP_IPV4_IFADDR, nlh, GFP_KERNEL);
Pablo Neira Ayuso1ce85fe2009-02-24 23:18:28 -08001591 return;
Thomas Grafd6062cb2006-08-15 00:33:59 -07001592errout:
1593 if (err < 0)
Denis V. Lunev4b8aa9a2008-01-31 18:47:40 -08001594 rtnl_set_sk_err(net, RTNLGRP_IPV4_IFADDR, err);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001595}
1596
Thomas Graf9f0f7272010-11-16 04:32:48 +00001597static size_t inet_get_link_af_size(const struct net_device *dev)
1598{
Eric Dumazet1fc19af2011-05-09 20:55:03 -07001599 struct in_device *in_dev = rcu_dereference_rtnl(dev->ip_ptr);
Thomas Graf9f0f7272010-11-16 04:32:48 +00001600
1601 if (!in_dev)
1602 return 0;
1603
1604 return nla_total_size(IPV4_DEVCONF_MAX * 4); /* IFLA_INET_CONF */
1605}
1606
1607static int inet_fill_link_af(struct sk_buff *skb, const struct net_device *dev)
1608{
Eric Dumazet1fc19af2011-05-09 20:55:03 -07001609 struct in_device *in_dev = rcu_dereference_rtnl(dev->ip_ptr);
Thomas Graf9f0f7272010-11-16 04:32:48 +00001610 struct nlattr *nla;
1611 int i;
1612
1613 if (!in_dev)
1614 return -ENODATA;
1615
1616 nla = nla_reserve(skb, IFLA_INET_CONF, IPV4_DEVCONF_MAX * 4);
1617 if (nla == NULL)
1618 return -EMSGSIZE;
1619
1620 for (i = 0; i < IPV4_DEVCONF_MAX; i++)
1621 ((u32 *) nla_data(nla))[i] = in_dev->cnf.data[i];
1622
1623 return 0;
1624}
1625
1626static const struct nla_policy inet_af_policy[IFLA_INET_MAX+1] = {
1627 [IFLA_INET_CONF] = { .type = NLA_NESTED },
1628};
1629
Thomas Grafcf7afbf2010-11-22 01:31:54 +00001630static int inet_validate_link_af(const struct net_device *dev,
1631 const struct nlattr *nla)
Thomas Graf9f0f7272010-11-16 04:32:48 +00001632{
Thomas Graf9f0f7272010-11-16 04:32:48 +00001633 struct nlattr *a, *tb[IFLA_INET_MAX+1];
1634 int err, rem;
1635
Eric Dumazetf7fce742010-12-01 06:03:06 +00001636 if (dev && !__in_dev_get_rtnl(dev))
Thomas Grafcf7afbf2010-11-22 01:31:54 +00001637 return -EAFNOSUPPORT;
Thomas Graf9f0f7272010-11-16 04:32:48 +00001638
1639 err = nla_parse_nested(tb, IFLA_INET_MAX, nla, inet_af_policy);
1640 if (err < 0)
1641 return err;
1642
1643 if (tb[IFLA_INET_CONF]) {
1644 nla_for_each_nested(a, tb[IFLA_INET_CONF], rem) {
1645 int cfgid = nla_type(a);
1646
1647 if (nla_len(a) < 4)
1648 return -EINVAL;
1649
1650 if (cfgid <= 0 || cfgid > IPV4_DEVCONF_MAX)
1651 return -EINVAL;
1652 }
1653 }
1654
Thomas Grafcf7afbf2010-11-22 01:31:54 +00001655 return 0;
1656}
1657
1658static int inet_set_link_af(struct net_device *dev, const struct nlattr *nla)
1659{
Eric Dumazetf7fce742010-12-01 06:03:06 +00001660 struct in_device *in_dev = __in_dev_get_rtnl(dev);
Thomas Grafcf7afbf2010-11-22 01:31:54 +00001661 struct nlattr *a, *tb[IFLA_INET_MAX+1];
1662 int rem;
1663
1664 if (!in_dev)
1665 return -EAFNOSUPPORT;
1666
1667 if (nla_parse_nested(tb, IFLA_INET_MAX, nla, NULL) < 0)
1668 BUG();
1669
Thomas Graf9f0f7272010-11-16 04:32:48 +00001670 if (tb[IFLA_INET_CONF]) {
1671 nla_for_each_nested(a, tb[IFLA_INET_CONF], rem)
1672 ipv4_devconf_set(in_dev, nla_type(a), nla_get_u32(a));
1673 }
1674
1675 return 0;
1676}
1677
Nicolas Dichteledc9e742012-10-25 22:28:52 +00001678static int inet_netconf_msgsize_devconf(int type)
1679{
1680 int size = NLMSG_ALIGN(sizeof(struct netconfmsg))
1681 + nla_total_size(4); /* NETCONFA_IFINDEX */
1682
Nicolas Dichtel9e551112012-10-25 22:28:53 +00001683 /* type -1 is used for ALL */
1684 if (type == -1 || type == NETCONFA_FORWARDING)
Nicolas Dichteledc9e742012-10-25 22:28:52 +00001685 size += nla_total_size(4);
Nicolas Dichtelcc535df2012-10-29 04:53:27 +00001686 if (type == -1 || type == NETCONFA_RP_FILTER)
1687 size += nla_total_size(4);
Nicolas Dichteld67b8c62012-12-04 01:13:35 +00001688 if (type == -1 || type == NETCONFA_MC_FORWARDING)
1689 size += nla_total_size(4);
Nicolas Dichteledc9e742012-10-25 22:28:52 +00001690
1691 return size;
1692}
1693
1694static int inet_netconf_fill_devconf(struct sk_buff *skb, int ifindex,
1695 struct ipv4_devconf *devconf, u32 portid,
1696 u32 seq, int event, unsigned int flags,
1697 int type)
1698{
1699 struct nlmsghdr *nlh;
1700 struct netconfmsg *ncm;
1701
1702 nlh = nlmsg_put(skb, portid, seq, event, sizeof(struct netconfmsg),
1703 flags);
1704 if (nlh == NULL)
1705 return -EMSGSIZE;
1706
1707 ncm = nlmsg_data(nlh);
1708 ncm->ncm_family = AF_INET;
1709
1710 if (nla_put_s32(skb, NETCONFA_IFINDEX, ifindex) < 0)
1711 goto nla_put_failure;
1712
Nicolas Dichtel9e551112012-10-25 22:28:53 +00001713 /* type -1 is used for ALL */
1714 if ((type == -1 || type == NETCONFA_FORWARDING) &&
Nicolas Dichteledc9e742012-10-25 22:28:52 +00001715 nla_put_s32(skb, NETCONFA_FORWARDING,
1716 IPV4_DEVCONF(*devconf, FORWARDING)) < 0)
1717 goto nla_put_failure;
Nicolas Dichtelcc535df2012-10-29 04:53:27 +00001718 if ((type == -1 || type == NETCONFA_RP_FILTER) &&
1719 nla_put_s32(skb, NETCONFA_RP_FILTER,
1720 IPV4_DEVCONF(*devconf, RP_FILTER)) < 0)
1721 goto nla_put_failure;
Nicolas Dichteld67b8c62012-12-04 01:13:35 +00001722 if ((type == -1 || type == NETCONFA_MC_FORWARDING) &&
1723 nla_put_s32(skb, NETCONFA_MC_FORWARDING,
1724 IPV4_DEVCONF(*devconf, MC_FORWARDING)) < 0)
1725 goto nla_put_failure;
Nicolas Dichteledc9e742012-10-25 22:28:52 +00001726
1727 return nlmsg_end(skb, nlh);
1728
1729nla_put_failure:
1730 nlmsg_cancel(skb, nlh);
1731 return -EMSGSIZE;
1732}
1733
Nicolas Dichteld67b8c62012-12-04 01:13:35 +00001734void inet_netconf_notify_devconf(struct net *net, int type, int ifindex,
1735 struct ipv4_devconf *devconf)
Nicolas Dichteledc9e742012-10-25 22:28:52 +00001736{
1737 struct sk_buff *skb;
1738 int err = -ENOBUFS;
1739
1740 skb = nlmsg_new(inet_netconf_msgsize_devconf(type), GFP_ATOMIC);
1741 if (skb == NULL)
1742 goto errout;
1743
1744 err = inet_netconf_fill_devconf(skb, ifindex, devconf, 0, 0,
1745 RTM_NEWNETCONF, 0, type);
1746 if (err < 0) {
1747 /* -EMSGSIZE implies BUG in inet_netconf_msgsize_devconf() */
1748 WARN_ON(err == -EMSGSIZE);
1749 kfree_skb(skb);
1750 goto errout;
1751 }
1752 rtnl_notify(skb, net, 0, RTNLGRP_IPV4_NETCONF, NULL, GFP_ATOMIC);
1753 return;
1754errout:
1755 if (err < 0)
1756 rtnl_set_sk_err(net, RTNLGRP_IPV4_NETCONF, err);
1757}
1758
Nicolas Dichtel9e551112012-10-25 22:28:53 +00001759static const struct nla_policy devconf_ipv4_policy[NETCONFA_MAX+1] = {
1760 [NETCONFA_IFINDEX] = { .len = sizeof(int) },
1761 [NETCONFA_FORWARDING] = { .len = sizeof(int) },
Nicolas Dichtelcc535df2012-10-29 04:53:27 +00001762 [NETCONFA_RP_FILTER] = { .len = sizeof(int) },
Nicolas Dichtel9e551112012-10-25 22:28:53 +00001763};
1764
1765static int inet_netconf_get_devconf(struct sk_buff *in_skb,
Thomas Graf661d2962013-03-21 07:45:29 +00001766 struct nlmsghdr *nlh)
Nicolas Dichtel9e551112012-10-25 22:28:53 +00001767{
1768 struct net *net = sock_net(in_skb->sk);
1769 struct nlattr *tb[NETCONFA_MAX+1];
1770 struct netconfmsg *ncm;
1771 struct sk_buff *skb;
1772 struct ipv4_devconf *devconf;
1773 struct in_device *in_dev;
1774 struct net_device *dev;
1775 int ifindex;
1776 int err;
1777
1778 err = nlmsg_parse(nlh, sizeof(*ncm), tb, NETCONFA_MAX,
1779 devconf_ipv4_policy);
1780 if (err < 0)
1781 goto errout;
1782
1783 err = EINVAL;
1784 if (!tb[NETCONFA_IFINDEX])
1785 goto errout;
1786
1787 ifindex = nla_get_s32(tb[NETCONFA_IFINDEX]);
1788 switch (ifindex) {
1789 case NETCONFA_IFINDEX_ALL:
1790 devconf = net->ipv4.devconf_all;
1791 break;
1792 case NETCONFA_IFINDEX_DEFAULT:
1793 devconf = net->ipv4.devconf_dflt;
1794 break;
1795 default:
1796 dev = __dev_get_by_index(net, ifindex);
1797 if (dev == NULL)
1798 goto errout;
1799 in_dev = __in_dev_get_rtnl(dev);
1800 if (in_dev == NULL)
1801 goto errout;
1802 devconf = &in_dev->cnf;
1803 break;
1804 }
1805
1806 err = -ENOBUFS;
1807 skb = nlmsg_new(inet_netconf_msgsize_devconf(-1), GFP_ATOMIC);
1808 if (skb == NULL)
1809 goto errout;
1810
1811 err = inet_netconf_fill_devconf(skb, ifindex, devconf,
1812 NETLINK_CB(in_skb).portid,
1813 nlh->nlmsg_seq, RTM_NEWNETCONF, 0,
1814 -1);
1815 if (err < 0) {
1816 /* -EMSGSIZE implies BUG in inet_netconf_msgsize_devconf() */
1817 WARN_ON(err == -EMSGSIZE);
1818 kfree_skb(skb);
1819 goto errout;
1820 }
1821 err = rtnl_unicast(skb, net, NETLINK_CB(in_skb).portid);
1822errout:
1823 return err;
1824}
1825
Nicolas Dichtel7a674202013-03-05 23:42:06 +00001826static int inet_netconf_dump_devconf(struct sk_buff *skb,
1827 struct netlink_callback *cb)
1828{
1829 struct net *net = sock_net(skb->sk);
1830 int h, s_h;
1831 int idx, s_idx;
1832 struct net_device *dev;
1833 struct in_device *in_dev;
1834 struct hlist_head *head;
1835
1836 s_h = cb->args[0];
1837 s_idx = idx = cb->args[1];
1838
1839 for (h = s_h; h < NETDEV_HASHENTRIES; h++, s_idx = 0) {
1840 idx = 0;
1841 head = &net->dev_index_head[h];
1842 rcu_read_lock();
Nicolas Dichtel04652772013-03-22 06:28:42 +00001843 cb->seq = atomic_read(&net->ipv4.dev_addr_genid) ^
1844 net->dev_base_seq;
Nicolas Dichtel7a674202013-03-05 23:42:06 +00001845 hlist_for_each_entry_rcu(dev, head, index_hlist) {
1846 if (idx < s_idx)
1847 goto cont;
1848 in_dev = __in_dev_get_rcu(dev);
1849 if (!in_dev)
1850 goto cont;
1851
1852 if (inet_netconf_fill_devconf(skb, dev->ifindex,
1853 &in_dev->cnf,
1854 NETLINK_CB(cb->skb).portid,
1855 cb->nlh->nlmsg_seq,
1856 RTM_NEWNETCONF,
1857 NLM_F_MULTI,
1858 -1) <= 0) {
1859 rcu_read_unlock();
1860 goto done;
1861 }
Nicolas Dichtel04652772013-03-22 06:28:42 +00001862 nl_dump_check_consistent(cb, nlmsg_hdr(skb));
Nicolas Dichtel7a674202013-03-05 23:42:06 +00001863cont:
1864 idx++;
1865 }
1866 rcu_read_unlock();
1867 }
1868 if (h == NETDEV_HASHENTRIES) {
1869 if (inet_netconf_fill_devconf(skb, NETCONFA_IFINDEX_ALL,
1870 net->ipv4.devconf_all,
1871 NETLINK_CB(cb->skb).portid,
1872 cb->nlh->nlmsg_seq,
1873 RTM_NEWNETCONF, NLM_F_MULTI,
1874 -1) <= 0)
1875 goto done;
1876 else
1877 h++;
1878 }
1879 if (h == NETDEV_HASHENTRIES + 1) {
1880 if (inet_netconf_fill_devconf(skb, NETCONFA_IFINDEX_DEFAULT,
1881 net->ipv4.devconf_dflt,
1882 NETLINK_CB(cb->skb).portid,
1883 cb->nlh->nlmsg_seq,
1884 RTM_NEWNETCONF, NLM_F_MULTI,
1885 -1) <= 0)
1886 goto done;
1887 else
1888 h++;
1889 }
1890done:
1891 cb->args[0] = h;
1892 cb->args[1] = idx;
1893
1894 return skb->len;
1895}
1896
Linus Torvalds1da177e2005-04-16 15:20:36 -07001897#ifdef CONFIG_SYSCTL
1898
Pavel Emelyanovc0ce9fb2007-12-16 13:31:14 -08001899static void devinet_copy_dflt_conf(struct net *net, int i)
Herbert Xu31be3082007-06-04 23:35:37 -07001900{
1901 struct net_device *dev;
1902
Eric Dumazetc6d14c82009-11-04 05:43:23 -08001903 rcu_read_lock();
1904 for_each_netdev_rcu(net, dev) {
Herbert Xu31be3082007-06-04 23:35:37 -07001905 struct in_device *in_dev;
Eric Dumazetc6d14c82009-11-04 05:43:23 -08001906
Herbert Xu31be3082007-06-04 23:35:37 -07001907 in_dev = __in_dev_get_rcu(dev);
1908 if (in_dev && !test_bit(i, in_dev->cnf.state))
Pavel Emelyanov9355bbd2007-12-16 13:32:16 -08001909 in_dev->cnf.data[i] = net->ipv4.devconf_dflt->data[i];
Herbert Xu31be3082007-06-04 23:35:37 -07001910 }
Eric Dumazetc6d14c82009-11-04 05:43:23 -08001911 rcu_read_unlock();
Herbert Xu31be3082007-06-04 23:35:37 -07001912}
1913
Eric Dumazetc6d14c82009-11-04 05:43:23 -08001914/* called with RTNL locked */
Pavel Emelyanovc0ce9fb2007-12-16 13:31:14 -08001915static void inet_forward_change(struct net *net)
Pavel Emelyanov68dd2992007-12-05 01:44:58 -08001916{
1917 struct net_device *dev;
Pavel Emelyanov586f1212007-12-16 13:32:48 -08001918 int on = IPV4_DEVCONF_ALL(net, FORWARDING);
Pavel Emelyanov68dd2992007-12-05 01:44:58 -08001919
Pavel Emelyanov586f1212007-12-16 13:32:48 -08001920 IPV4_DEVCONF_ALL(net, ACCEPT_REDIRECTS) = !on;
Pavel Emelyanov9355bbd2007-12-16 13:32:16 -08001921 IPV4_DEVCONF_DFLT(net, FORWARDING) = on;
Nicolas Dichteledc9e742012-10-25 22:28:52 +00001922 inet_netconf_notify_devconf(net, NETCONFA_FORWARDING,
1923 NETCONFA_IFINDEX_ALL,
1924 net->ipv4.devconf_all);
1925 inet_netconf_notify_devconf(net, NETCONFA_FORWARDING,
1926 NETCONFA_IFINDEX_DEFAULT,
1927 net->ipv4.devconf_dflt);
Pavel Emelyanov68dd2992007-12-05 01:44:58 -08001928
Pavel Emelyanovc0ce9fb2007-12-16 13:31:14 -08001929 for_each_netdev(net, dev) {
Pavel Emelyanov68dd2992007-12-05 01:44:58 -08001930 struct in_device *in_dev;
Ben Hutchings0187bdf2008-06-19 16:15:47 -07001931 if (on)
1932 dev_disable_lro(dev);
Pavel Emelyanov68dd2992007-12-05 01:44:58 -08001933 rcu_read_lock();
1934 in_dev = __in_dev_get_rcu(dev);
Nicolas Dichteledc9e742012-10-25 22:28:52 +00001935 if (in_dev) {
Pavel Emelyanov68dd2992007-12-05 01:44:58 -08001936 IN_DEV_CONF_SET(in_dev, FORWARDING, on);
Nicolas Dichteledc9e742012-10-25 22:28:52 +00001937 inet_netconf_notify_devconf(net, NETCONFA_FORWARDING,
1938 dev->ifindex, &in_dev->cnf);
1939 }
Pavel Emelyanov68dd2992007-12-05 01:44:58 -08001940 rcu_read_unlock();
1941 }
Pavel Emelyanov68dd2992007-12-05 01:44:58 -08001942}
1943
Herbert Xu31be3082007-06-04 23:35:37 -07001944static int devinet_conf_proc(ctl_table *ctl, int write,
Alexey Dobriyan8d65af72009-09-23 15:57:19 -07001945 void __user *buffer,
Herbert Xu31be3082007-06-04 23:35:37 -07001946 size_t *lenp, loff_t *ppos)
1947{
Peter Pan(潘卫平)d01ff0a2011-12-01 15:47:06 +00001948 int old_value = *(int *)ctl->data;
Alexey Dobriyan8d65af72009-09-23 15:57:19 -07001949 int ret = proc_dointvec(ctl, write, buffer, lenp, ppos);
Peter Pan(潘卫平)d01ff0a2011-12-01 15:47:06 +00001950 int new_value = *(int *)ctl->data;
Herbert Xu31be3082007-06-04 23:35:37 -07001951
1952 if (write) {
1953 struct ipv4_devconf *cnf = ctl->extra1;
Pavel Emelyanovc0ce9fb2007-12-16 13:31:14 -08001954 struct net *net = ctl->extra2;
Herbert Xu31be3082007-06-04 23:35:37 -07001955 int i = (int *)ctl->data - cnf->data;
1956
1957 set_bit(i, cnf->state);
1958
Pavel Emelyanov9355bbd2007-12-16 13:32:16 -08001959 if (cnf == net->ipv4.devconf_dflt)
Pavel Emelyanovc0ce9fb2007-12-16 13:31:14 -08001960 devinet_copy_dflt_conf(net, i);
Thomas Grafd0daebc32012-06-12 00:44:01 +00001961 if (i == IPV4_DEVCONF_ACCEPT_LOCAL - 1 ||
1962 i == IPV4_DEVCONF_ROUTE_LOCALNET - 1)
Peter Pan(潘卫平)d01ff0a2011-12-01 15:47:06 +00001963 if ((new_value == 0) && (old_value != 0))
Nicolas Dichtel4ccfe6d2012-09-07 00:45:29 +00001964 rt_cache_flush(net);
Nicolas Dichtelcc535df2012-10-29 04:53:27 +00001965 if (i == IPV4_DEVCONF_RP_FILTER - 1 &&
1966 new_value != old_value) {
1967 int ifindex;
1968
1969 if (cnf == net->ipv4.devconf_dflt)
1970 ifindex = NETCONFA_IFINDEX_DEFAULT;
1971 else if (cnf == net->ipv4.devconf_all)
1972 ifindex = NETCONFA_IFINDEX_ALL;
1973 else {
1974 struct in_device *idev =
1975 container_of(cnf, struct in_device,
1976 cnf);
1977 ifindex = idev->dev->ifindex;
1978 }
1979 inet_netconf_notify_devconf(net, NETCONFA_RP_FILTER,
1980 ifindex, cnf);
1981 }
Herbert Xu31be3082007-06-04 23:35:37 -07001982 }
1983
1984 return ret;
1985}
1986
Linus Torvalds1da177e2005-04-16 15:20:36 -07001987static int devinet_sysctl_forward(ctl_table *ctl, int write,
Alexey Dobriyan8d65af72009-09-23 15:57:19 -07001988 void __user *buffer,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001989 size_t *lenp, loff_t *ppos)
1990{
1991 int *valp = ctl->data;
1992 int val = *valp;
Eric W. Biederman88af1822010-02-19 13:22:59 +00001993 loff_t pos = *ppos;
Alexey Dobriyan8d65af72009-09-23 15:57:19 -07001994 int ret = proc_dointvec(ctl, write, buffer, lenp, ppos);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001995
1996 if (write && *valp != val) {
Pavel Emelyanovc0ce9fb2007-12-16 13:31:14 -08001997 struct net *net = ctl->extra2;
1998
Ben Hutchings0187bdf2008-06-19 16:15:47 -07001999 if (valp != &IPV4_DEVCONF_DFLT(net, FORWARDING)) {
Eric W. Biederman88af1822010-02-19 13:22:59 +00002000 if (!rtnl_trylock()) {
2001 /* Restore the original values before restarting */
2002 *valp = val;
2003 *ppos = pos;
Eric W. Biederman9b8adb52009-05-13 16:59:21 +00002004 return restart_syscall();
Eric W. Biederman88af1822010-02-19 13:22:59 +00002005 }
Ben Hutchings0187bdf2008-06-19 16:15:47 -07002006 if (valp == &IPV4_DEVCONF_ALL(net, FORWARDING)) {
2007 inet_forward_change(net);
Nicolas Dichteledc9e742012-10-25 22:28:52 +00002008 } else {
Ben Hutchings0187bdf2008-06-19 16:15:47 -07002009 struct ipv4_devconf *cnf = ctl->extra1;
2010 struct in_device *idev =
2011 container_of(cnf, struct in_device, cnf);
Nicolas Dichteledc9e742012-10-25 22:28:52 +00002012 if (*valp)
2013 dev_disable_lro(idev->dev);
2014 inet_netconf_notify_devconf(net,
2015 NETCONFA_FORWARDING,
2016 idev->dev->ifindex,
2017 cnf);
Ben Hutchings0187bdf2008-06-19 16:15:47 -07002018 }
2019 rtnl_unlock();
Nicolas Dichtel4ccfe6d2012-09-07 00:45:29 +00002020 rt_cache_flush(net);
Nicolas Dichteledc9e742012-10-25 22:28:52 +00002021 } else
2022 inet_netconf_notify_devconf(net, NETCONFA_FORWARDING,
2023 NETCONFA_IFINDEX_DEFAULT,
2024 net->ipv4.devconf_dflt);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002025 }
2026
2027 return ret;
2028}
2029
David S. Miller323e1262010-12-12 21:55:08 -08002030static int ipv4_doint_and_flush(ctl_table *ctl, int write,
2031 void __user *buffer,
2032 size_t *lenp, loff_t *ppos)
Linus Torvalds1da177e2005-04-16 15:20:36 -07002033{
2034 int *valp = ctl->data;
2035 int val = *valp;
Alexey Dobriyan8d65af72009-09-23 15:57:19 -07002036 int ret = proc_dointvec(ctl, write, buffer, lenp, ppos);
Denis V. Lunev76e6ebf2008-07-05 19:00:44 -07002037 struct net *net = ctl->extra2;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002038
2039 if (write && *valp != val)
Nicolas Dichtel4ccfe6d2012-09-07 00:45:29 +00002040 rt_cache_flush(net);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002041
2042 return ret;
2043}
2044
/*
 * Build one ctl_table initializer for devconf attribute IPV4_DEVCONF_<attr>.
 * .data points at slot (IPV4_DEVCONF_<attr> - 1) of the template
 * ipv4_devconf.data[]; .extra1 points at the template devconf itself.
 */
#define DEVINET_SYSCTL_ENTRY(attr, name, mval, proc) \
	{ \
		.procname	= name, \
		.data		= ipv4_devconf.data + \
				  IPV4_DEVCONF_ ## attr - 1, \
		.maxlen		= sizeof(int), \
		.mode		= mval, \
		.proc_handler	= proc, \
		.extra1		= &ipv4_devconf, \
	}

/* Mode 0644 entry handled by devinet_conf_proc(). */
#define DEVINET_SYSCTL_RW_ENTRY(attr, name) \
	DEVINET_SYSCTL_ENTRY(attr, name, 0644, devinet_conf_proc)

/* Mode 0444 entry handled by devinet_conf_proc(). */
#define DEVINET_SYSCTL_RO_ENTRY(attr, name) \
	DEVINET_SYSCTL_ENTRY(attr, name, 0444, devinet_conf_proc)

/* Mode 0644 entry with a caller-supplied handler. */
#define DEVINET_SYSCTL_COMPLEX_ENTRY(attr, name, proc) \
	DEVINET_SYSCTL_ENTRY(attr, name, 0644, proc)

/* Mode 0644 entry handled by ipv4_doint_and_flush(). */
#define DEVINET_SYSCTL_FLUSHING_ENTRY(attr, name) \
	DEVINET_SYSCTL_COMPLEX_ENTRY(attr, name, ipv4_doint_and_flush)
Herbert Xu42f811b2007-06-04 23:34:44 -07002067
Linus Torvalds1da177e2005-04-16 15:20:36 -07002068static struct devinet_sysctl_table {
2069 struct ctl_table_header *sysctl_header;
Eric W. Biederman02291682010-02-14 03:25:51 +00002070 struct ctl_table devinet_vars[__IPV4_DEVCONF_MAX];
Linus Torvalds1da177e2005-04-16 15:20:36 -07002071} devinet_sysctl = {
2072 .devinet_vars = {
Herbert Xu42f811b2007-06-04 23:34:44 -07002073 DEVINET_SYSCTL_COMPLEX_ENTRY(FORWARDING, "forwarding",
Eric W. Biedermanf8572d82009-11-05 13:32:03 -08002074 devinet_sysctl_forward),
Herbert Xu42f811b2007-06-04 23:34:44 -07002075 DEVINET_SYSCTL_RO_ENTRY(MC_FORWARDING, "mc_forwarding"),
2076
2077 DEVINET_SYSCTL_RW_ENTRY(ACCEPT_REDIRECTS, "accept_redirects"),
2078 DEVINET_SYSCTL_RW_ENTRY(SECURE_REDIRECTS, "secure_redirects"),
2079 DEVINET_SYSCTL_RW_ENTRY(SHARED_MEDIA, "shared_media"),
2080 DEVINET_SYSCTL_RW_ENTRY(RP_FILTER, "rp_filter"),
2081 DEVINET_SYSCTL_RW_ENTRY(SEND_REDIRECTS, "send_redirects"),
2082 DEVINET_SYSCTL_RW_ENTRY(ACCEPT_SOURCE_ROUTE,
2083 "accept_source_route"),
Patrick McHardy8153a102009-12-03 01:25:58 +00002084 DEVINET_SYSCTL_RW_ENTRY(ACCEPT_LOCAL, "accept_local"),
Jamal Hadi Salim28f6aee2009-12-25 17:30:22 -08002085 DEVINET_SYSCTL_RW_ENTRY(SRC_VMARK, "src_valid_mark"),
Herbert Xu42f811b2007-06-04 23:34:44 -07002086 DEVINET_SYSCTL_RW_ENTRY(PROXY_ARP, "proxy_arp"),
2087 DEVINET_SYSCTL_RW_ENTRY(MEDIUM_ID, "medium_id"),
2088 DEVINET_SYSCTL_RW_ENTRY(BOOTP_RELAY, "bootp_relay"),
2089 DEVINET_SYSCTL_RW_ENTRY(LOG_MARTIANS, "log_martians"),
2090 DEVINET_SYSCTL_RW_ENTRY(TAG, "tag"),
2091 DEVINET_SYSCTL_RW_ENTRY(ARPFILTER, "arp_filter"),
2092 DEVINET_SYSCTL_RW_ENTRY(ARP_ANNOUNCE, "arp_announce"),
2093 DEVINET_SYSCTL_RW_ENTRY(ARP_IGNORE, "arp_ignore"),
2094 DEVINET_SYSCTL_RW_ENTRY(ARP_ACCEPT, "arp_accept"),
Stephen Hemmingereefef1c2009-02-01 01:04:33 -08002095 DEVINET_SYSCTL_RW_ENTRY(ARP_NOTIFY, "arp_notify"),
Jesper Dangaard Brouer65324142010-01-05 05:50:47 +00002096 DEVINET_SYSCTL_RW_ENTRY(PROXY_ARP_PVLAN, "proxy_arp_pvlan"),
Herbert Xu42f811b2007-06-04 23:34:44 -07002097
2098 DEVINET_SYSCTL_FLUSHING_ENTRY(NOXFRM, "disable_xfrm"),
2099 DEVINET_SYSCTL_FLUSHING_ENTRY(NOPOLICY, "disable_policy"),
2100 DEVINET_SYSCTL_FLUSHING_ENTRY(FORCE_IGMP_VERSION,
2101 "force_igmp_version"),
2102 DEVINET_SYSCTL_FLUSHING_ENTRY(PROMOTE_SECONDARIES,
2103 "promote_secondaries"),
Thomas Grafd0daebc32012-06-12 00:44:01 +00002104 DEVINET_SYSCTL_FLUSHING_ENTRY(ROUTE_LOCALNET,
2105 "route_localnet"),
Linus Torvalds1da177e2005-04-16 15:20:36 -07002106 },
Linus Torvalds1da177e2005-04-16 15:20:36 -07002107};
2108
Pavel Emelyanovea40b322007-12-16 13:30:07 -08002109static int __devinet_sysctl_register(struct net *net, char *dev_name,
Eric W. Biedermanf8572d82009-11-05 13:32:03 -08002110 struct ipv4_devconf *p)
Linus Torvalds1da177e2005-04-16 15:20:36 -07002111{
2112 int i;
Pavel Emelyanov9fa89642007-12-02 00:17:46 +11002113 struct devinet_sysctl_table *t;
Eric W. Biederman8607ddb2012-04-19 13:42:09 +00002114 char path[sizeof("net/ipv4/conf/") + IFNAMSIZ];
Pavel Emelyanovbfada692007-12-02 00:57:08 +11002115
Pavel Emelyanov9fa89642007-12-02 00:17:46 +11002116 t = kmemdup(&devinet_sysctl, sizeof(*t), GFP_KERNEL);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002117 if (!t)
Pavel Emelyanov9fa89642007-12-02 00:17:46 +11002118 goto out;
2119
Linus Torvalds1da177e2005-04-16 15:20:36 -07002120 for (i = 0; i < ARRAY_SIZE(t->devinet_vars) - 1; i++) {
2121 t->devinet_vars[i].data += (char *)p - (char *)&ipv4_devconf;
Herbert Xu31be3082007-06-04 23:35:37 -07002122 t->devinet_vars[i].extra1 = p;
Pavel Emelyanovc0ce9fb2007-12-16 13:31:14 -08002123 t->devinet_vars[i].extra2 = net;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002124 }
2125
Eric W. Biederman8607ddb2012-04-19 13:42:09 +00002126 snprintf(path, sizeof(path), "net/ipv4/conf/%s", dev_name);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002127
Eric W. Biederman8607ddb2012-04-19 13:42:09 +00002128 t->sysctl_header = register_net_sysctl(net, path, t->devinet_vars);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002129 if (!t->sysctl_header)
Eric W. Biederman8607ddb2012-04-19 13:42:09 +00002130 goto free;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002131
2132 p->sysctl = t;
Pavel Emelyanovea40b322007-12-16 13:30:07 -08002133 return 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002134
Pavel Emelyanov9fa89642007-12-02 00:17:46 +11002135free:
Linus Torvalds1da177e2005-04-16 15:20:36 -07002136 kfree(t);
Pavel Emelyanov9fa89642007-12-02 00:17:46 +11002137out:
Pavel Emelyanovea40b322007-12-16 13:30:07 -08002138 return -ENOBUFS;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002139}
2140
Pavel Emelyanov51602b22007-12-11 02:17:40 -08002141static void __devinet_sysctl_unregister(struct ipv4_devconf *cnf)
2142{
2143 struct devinet_sysctl_table *t = cnf->sysctl;
2144
2145 if (t == NULL)
2146 return;
2147
2148 cnf->sysctl = NULL;
Lucian Adrian Grijincuff538812011-05-01 01:44:01 +00002149 unregister_net_sysctl_table(t->sysctl_header);
Pavel Emelyanov51602b22007-12-11 02:17:40 -08002150 kfree(t);
2151}
2152
Pavel Emelyanov66f27a52007-12-02 00:55:54 +11002153static void devinet_sysctl_register(struct in_device *idev)
2154{
Eric W. Biederman54716e32010-02-14 03:27:03 +00002155 neigh_sysctl_register(idev->dev, idev->arp_parms, "ipv4", NULL);
YOSHIFUJI Hideakic346dca2008-03-25 21:47:49 +09002156 __devinet_sysctl_register(dev_net(idev->dev), idev->dev->name,
Eric W. Biedermanf8572d82009-11-05 13:32:03 -08002157 &idev->cnf);
Pavel Emelyanov66f27a52007-12-02 00:55:54 +11002158}
2159
Pavel Emelyanov51602b22007-12-11 02:17:40 -08002160static void devinet_sysctl_unregister(struct in_device *idev)
Linus Torvalds1da177e2005-04-16 15:20:36 -07002161{
Pavel Emelyanov51602b22007-12-11 02:17:40 -08002162 __devinet_sysctl_unregister(&idev->cnf);
2163 neigh_sysctl_unregister(idev->arp_parms);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002164}
Linus Torvalds1da177e2005-04-16 15:20:36 -07002165
Pavel Emelyanov68dd2992007-12-05 01:44:58 -08002166static struct ctl_table ctl_forward_entry[] = {
2167 {
Pavel Emelyanov68dd2992007-12-05 01:44:58 -08002168 .procname = "ip_forward",
2169 .data = &ipv4_devconf.data[
Eric W. Biederman02291682010-02-14 03:25:51 +00002170 IPV4_DEVCONF_FORWARDING - 1],
Pavel Emelyanov68dd2992007-12-05 01:44:58 -08002171 .maxlen = sizeof(int),
2172 .mode = 0644,
2173 .proc_handler = devinet_sysctl_forward,
Pavel Emelyanov68dd2992007-12-05 01:44:58 -08002174 .extra1 = &ipv4_devconf,
Pavel Emelyanovc0ce9fb2007-12-16 13:31:14 -08002175 .extra2 = &init_net,
Pavel Emelyanov68dd2992007-12-05 01:44:58 -08002176 },
2177 { },
2178};
Eric Dumazet2a75de02008-01-05 23:08:49 -08002179#endif
Pavel Emelyanov68dd2992007-12-05 01:44:58 -08002180
Pavel Emelyanov752d14d2007-12-16 13:31:47 -08002181static __net_init int devinet_init_net(struct net *net)
2182{
2183 int err;
Pavel Emelyanov752d14d2007-12-16 13:31:47 -08002184 struct ipv4_devconf *all, *dflt;
Eric Dumazet2a75de02008-01-05 23:08:49 -08002185#ifdef CONFIG_SYSCTL
2186 struct ctl_table *tbl = ctl_forward_entry;
Pavel Emelyanov752d14d2007-12-16 13:31:47 -08002187 struct ctl_table_header *forw_hdr;
Eric Dumazet2a75de02008-01-05 23:08:49 -08002188#endif
Pavel Emelyanov752d14d2007-12-16 13:31:47 -08002189
2190 err = -ENOMEM;
2191 all = &ipv4_devconf;
2192 dflt = &ipv4_devconf_dflt;
Pavel Emelyanov752d14d2007-12-16 13:31:47 -08002193
Octavian Purdila09ad9bc2009-11-25 15:14:13 -08002194 if (!net_eq(net, &init_net)) {
Pavel Emelyanov752d14d2007-12-16 13:31:47 -08002195 all = kmemdup(all, sizeof(ipv4_devconf), GFP_KERNEL);
2196 if (all == NULL)
2197 goto err_alloc_all;
2198
2199 dflt = kmemdup(dflt, sizeof(ipv4_devconf_dflt), GFP_KERNEL);
2200 if (dflt == NULL)
2201 goto err_alloc_dflt;
2202
Eric Dumazet2a75de02008-01-05 23:08:49 -08002203#ifdef CONFIG_SYSCTL
Pavel Emelyanov752d14d2007-12-16 13:31:47 -08002204 tbl = kmemdup(tbl, sizeof(ctl_forward_entry), GFP_KERNEL);
2205 if (tbl == NULL)
2206 goto err_alloc_ctl;
2207
Eric W. Biederman02291682010-02-14 03:25:51 +00002208 tbl[0].data = &all->data[IPV4_DEVCONF_FORWARDING - 1];
Pavel Emelyanov752d14d2007-12-16 13:31:47 -08002209 tbl[0].extra1 = all;
2210 tbl[0].extra2 = net;
Eric Dumazet2a75de02008-01-05 23:08:49 -08002211#endif
Pavel Emelyanov752d14d2007-12-16 13:31:47 -08002212 }
2213
2214#ifdef CONFIG_SYSCTL
Eric W. Biedermanf8572d82009-11-05 13:32:03 -08002215 err = __devinet_sysctl_register(net, "all", all);
Pavel Emelyanov752d14d2007-12-16 13:31:47 -08002216 if (err < 0)
2217 goto err_reg_all;
2218
Eric W. Biedermanf8572d82009-11-05 13:32:03 -08002219 err = __devinet_sysctl_register(net, "default", dflt);
Pavel Emelyanov752d14d2007-12-16 13:31:47 -08002220 if (err < 0)
2221 goto err_reg_dflt;
2222
2223 err = -ENOMEM;
Eric W. Biederman8607ddb2012-04-19 13:42:09 +00002224 forw_hdr = register_net_sysctl(net, "net/ipv4", tbl);
Pavel Emelyanov752d14d2007-12-16 13:31:47 -08002225 if (forw_hdr == NULL)
2226 goto err_reg_ctl;
Eric Dumazet2a75de02008-01-05 23:08:49 -08002227 net->ipv4.forw_hdr = forw_hdr;
Pavel Emelyanov752d14d2007-12-16 13:31:47 -08002228#endif
2229
Pavel Emelyanov752d14d2007-12-16 13:31:47 -08002230 net->ipv4.devconf_all = all;
2231 net->ipv4.devconf_dflt = dflt;
2232 return 0;
2233
2234#ifdef CONFIG_SYSCTL
2235err_reg_ctl:
2236 __devinet_sysctl_unregister(dflt);
2237err_reg_dflt:
2238 __devinet_sysctl_unregister(all);
2239err_reg_all:
2240 if (tbl != ctl_forward_entry)
2241 kfree(tbl);
Pavel Emelyanov752d14d2007-12-16 13:31:47 -08002242err_alloc_ctl:
Eric Dumazet2a75de02008-01-05 23:08:49 -08002243#endif
Pavel Emelyanov752d14d2007-12-16 13:31:47 -08002244 if (dflt != &ipv4_devconf_dflt)
2245 kfree(dflt);
2246err_alloc_dflt:
2247 if (all != &ipv4_devconf)
2248 kfree(all);
2249err_alloc_all:
2250 return err;
2251}
2252
2253static __net_exit void devinet_exit_net(struct net *net)
2254{
Eric Dumazet2a75de02008-01-05 23:08:49 -08002255#ifdef CONFIG_SYSCTL
Pavel Emelyanov752d14d2007-12-16 13:31:47 -08002256 struct ctl_table *tbl;
2257
2258 tbl = net->ipv4.forw_hdr->ctl_table_arg;
Pavel Emelyanov752d14d2007-12-16 13:31:47 -08002259 unregister_net_sysctl_table(net->ipv4.forw_hdr);
2260 __devinet_sysctl_unregister(net->ipv4.devconf_dflt);
2261 __devinet_sysctl_unregister(net->ipv4.devconf_all);
Pavel Emelyanov752d14d2007-12-16 13:31:47 -08002262 kfree(tbl);
Eric Dumazet2a75de02008-01-05 23:08:49 -08002263#endif
Pavel Emelyanov752d14d2007-12-16 13:31:47 -08002264 kfree(net->ipv4.devconf_dflt);
2265 kfree(net->ipv4.devconf_all);
2266}
2267
2268static __net_initdata struct pernet_operations devinet_ops = {
2269 .init = devinet_init_net,
2270 .exit = devinet_exit_net,
2271};
2272
Thomas Graf9f0f7272010-11-16 04:32:48 +00002273static struct rtnl_af_ops inet_af_ops = {
2274 .family = AF_INET,
2275 .fill_link_af = inet_fill_link_af,
2276 .get_link_af_size = inet_get_link_af_size,
Thomas Grafcf7afbf2010-11-22 01:31:54 +00002277 .validate_link_af = inet_validate_link_af,
2278 .set_link_af = inet_set_link_af,
Thomas Graf9f0f7272010-11-16 04:32:48 +00002279};
2280
Linus Torvalds1da177e2005-04-16 15:20:36 -07002281void __init devinet_init(void)
2282{
David S. Millerfd23c3b2011-02-18 12:42:28 -08002283 int i;
2284
2285 for (i = 0; i < IN4_ADDR_HSIZE; i++)
2286 INIT_HLIST_HEAD(&inet_addr_lst[i]);
2287
Pavel Emelyanov752d14d2007-12-16 13:31:47 -08002288 register_pernet_subsys(&devinet_ops);
2289
Linus Torvalds1da177e2005-04-16 15:20:36 -07002290 register_gifconf(PF_INET, inet_gifconf);
2291 register_netdevice_notifier(&ip_netdev_notifier);
Thomas Graf63f34442007-03-22 11:55:17 -07002292
Jiri Pirko5c766d62013-01-24 09:41:41 +00002293 schedule_delayed_work(&check_lifetime_work, 0);
2294
Thomas Graf9f0f7272010-11-16 04:32:48 +00002295 rtnl_af_register(&inet_af_ops);
2296
Greg Rosec7ac8672011-06-10 01:27:09 +00002297 rtnl_register(PF_INET, RTM_NEWADDR, inet_rtm_newaddr, NULL, NULL);
2298 rtnl_register(PF_INET, RTM_DELADDR, inet_rtm_deladdr, NULL, NULL);
2299 rtnl_register(PF_INET, RTM_GETADDR, NULL, inet_dump_ifaddr, NULL);
Nicolas Dichtel9e551112012-10-25 22:28:53 +00002300 rtnl_register(PF_INET, RTM_GETNETCONF, inet_netconf_get_devconf,
Nicolas Dichtel7a674202013-03-05 23:42:06 +00002301 inet_netconf_dump_devconf, NULL);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002302}
2303