blob: 59ebe16d06fc2db1c0a3a1d8d2ac3d1c74646c3b [file] [log] [blame]
/*
 *	NET3	IP device support routines.
 *
 *		This program is free software; you can redistribute it and/or
 *		modify it under the terms of the GNU General Public License
 *		as published by the Free Software Foundation; either version
 *		2 of the License, or (at your option) any later version.
 *
 *	Derived from the IP parts of dev.c 1.0.19
 *		Authors:	Ross Biro
 *				Fred N. van Kempen, <waltje@uWalt.NL.Mugnet.ORG>
 *				Mark Evans, <evansmp@uhura.aston.ac.uk>
 *
 *	Additional Authors:
 *		Alan Cox, <gw4pts@gw4pts.ampr.org>
 *		Alexey Kuznetsov, <kuznet@ms2.inr.ac.ru>
 *
 *	Changes:
 *		Alexey Kuznetsov:	pa_* fields are replaced with ifaddr
 *					lists.
 *		Cyrus Durgin:		updated for kmod
 *		Matthias Andree:	in devinet_ioctl, compare label and
 *					address (4.4BSD alias style support),
 *					fall back to comparing just the label
 *					if no match found.
 */
27
Linus Torvalds1da177e2005-04-16 15:20:36 -070028
29#include <asm/uaccess.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070030#include <linux/bitops.h>
Randy Dunlap4fc268d2006-01-11 12:17:47 -080031#include <linux/capability.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070032#include <linux/module.h>
33#include <linux/types.h>
34#include <linux/kernel.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070035#include <linux/string.h>
36#include <linux/mm.h>
37#include <linux/socket.h>
38#include <linux/sockios.h>
39#include <linux/in.h>
40#include <linux/errno.h>
41#include <linux/interrupt.h>
Thomas Graf18237302006-08-04 23:04:54 -070042#include <linux/if_addr.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070043#include <linux/if_ether.h>
44#include <linux/inet.h>
45#include <linux/netdevice.h>
46#include <linux/etherdevice.h>
47#include <linux/skbuff.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070048#include <linux/init.h>
49#include <linux/notifier.h>
50#include <linux/inetdevice.h>
51#include <linux/igmp.h>
Tejun Heo5a0e3ad2010-03-24 17:04:11 +090052#include <linux/slab.h>
David S. Millerfd23c3b2011-02-18 12:42:28 -080053#include <linux/hash.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070054#ifdef CONFIG_SYSCTL
55#include <linux/sysctl.h>
56#endif
57#include <linux/kmod.h>
Nicolas Dichteledc9e742012-10-25 22:28:52 +000058#include <linux/netconf.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070059
Arnaldo Carvalho de Melo14c85022005-12-27 02:43:12 -020060#include <net/arp.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070061#include <net/ip.h>
62#include <net/route.h>
63#include <net/ip_fib.h>
Thomas Graf63f34442007-03-22 11:55:17 -070064#include <net/rtnetlink.h>
Pavel Emelyanov752d14d2007-12-16 13:31:47 -080065#include <net/net_namespace.h>
Jiri Pirko5c766d62013-01-24 09:41:41 +000066#include <net/addrconf.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070067
David S. Miller406b6f92011-03-22 21:56:23 -070068#include "fib_lookup.h"
69
Adrian Bunk0027ba82008-01-31 17:17:31 -080070static struct ipv4_devconf ipv4_devconf = {
Herbert Xu42f811b2007-06-04 23:34:44 -070071 .data = {
Eric W. Biederman02291682010-02-14 03:25:51 +000072 [IPV4_DEVCONF_ACCEPT_REDIRECTS - 1] = 1,
73 [IPV4_DEVCONF_SEND_REDIRECTS - 1] = 1,
74 [IPV4_DEVCONF_SECURE_REDIRECTS - 1] = 1,
75 [IPV4_DEVCONF_SHARED_MEDIA - 1] = 1,
William Manley26900482013-08-06 19:03:15 +010076 [IPV4_DEVCONF_IGMPV2_UNSOLICITED_REPORT_INTERVAL - 1] = 10000 /*ms*/,
77 [IPV4_DEVCONF_IGMPV3_UNSOLICITED_REPORT_INTERVAL - 1] = 1000 /*ms*/,
Herbert Xu42f811b2007-06-04 23:34:44 -070078 },
Linus Torvalds1da177e2005-04-16 15:20:36 -070079};
80
81static struct ipv4_devconf ipv4_devconf_dflt = {
Herbert Xu42f811b2007-06-04 23:34:44 -070082 .data = {
Eric W. Biederman02291682010-02-14 03:25:51 +000083 [IPV4_DEVCONF_ACCEPT_REDIRECTS - 1] = 1,
84 [IPV4_DEVCONF_SEND_REDIRECTS - 1] = 1,
85 [IPV4_DEVCONF_SECURE_REDIRECTS - 1] = 1,
86 [IPV4_DEVCONF_SHARED_MEDIA - 1] = 1,
87 [IPV4_DEVCONF_ACCEPT_SOURCE_ROUTE - 1] = 1,
William Manley26900482013-08-06 19:03:15 +010088 [IPV4_DEVCONF_IGMPV2_UNSOLICITED_REPORT_INTERVAL - 1] = 10000 /*ms*/,
89 [IPV4_DEVCONF_IGMPV3_UNSOLICITED_REPORT_INTERVAL - 1] = 1000 /*ms*/,
Herbert Xu42f811b2007-06-04 23:34:44 -070090 },
Linus Torvalds1da177e2005-04-16 15:20:36 -070091};
92
/*
 * Read devconf attribute @attr from the devconf_dflt block hanging off the
 * network namespace @net.  @net is parenthesized so that any pointer-valued
 * expression (not just a plain identifier) can be passed safely.
 */
#define IPV4_DEVCONF_DFLT(net, attr) \
	IPV4_DEVCONF((*(net)->ipv4.devconf_dflt), attr)
Herbert Xu42f811b2007-06-04 23:34:44 -070095
Patrick McHardyef7c79e2007-06-05 12:38:30 -070096static const struct nla_policy ifa_ipv4_policy[IFA_MAX+1] = {
Thomas Graf5c753972006-08-04 23:03:53 -070097 [IFA_LOCAL] = { .type = NLA_U32 },
98 [IFA_ADDRESS] = { .type = NLA_U32 },
99 [IFA_BROADCAST] = { .type = NLA_U32 },
Thomas Graf5176f912006-08-26 20:13:18 -0700100 [IFA_LABEL] = { .type = NLA_STRING, .len = IFNAMSIZ - 1 },
Jiri Pirko5c766d62013-01-24 09:41:41 +0000101 [IFA_CACHEINFO] = { .len = sizeof(struct ifa_cacheinfo) },
Jiri Pirkoad6c8132013-12-08 12:16:10 +0100102 [IFA_FLAGS] = { .type = NLA_U32 },
Thomas Graf5c753972006-08-04 23:03:53 -0700103};
104
Eric Dumazet40384992012-08-03 21:06:50 +0000105#define IN4_ADDR_HSIZE_SHIFT 8
106#define IN4_ADDR_HSIZE (1U << IN4_ADDR_HSIZE_SHIFT)
107
David S. Millerfd23c3b2011-02-18 12:42:28 -0800108static struct hlist_head inet_addr_lst[IN4_ADDR_HSIZE];
David S. Millerfd23c3b2011-02-18 12:42:28 -0800109
Eric Dumazet40384992012-08-03 21:06:50 +0000110static u32 inet_addr_hash(struct net *net, __be32 addr)
David S. Millerfd23c3b2011-02-18 12:42:28 -0800111{
Eric Dumazet40384992012-08-03 21:06:50 +0000112 u32 val = (__force u32) addr ^ net_hash_mix(net);
David S. Millerfd23c3b2011-02-18 12:42:28 -0800113
Eric Dumazet40384992012-08-03 21:06:50 +0000114 return hash_32(val, IN4_ADDR_HSIZE_SHIFT);
David S. Millerfd23c3b2011-02-18 12:42:28 -0800115}
116
117static void inet_hash_insert(struct net *net, struct in_ifaddr *ifa)
118{
Eric Dumazet40384992012-08-03 21:06:50 +0000119 u32 hash = inet_addr_hash(net, ifa->ifa_local);
David S. Millerfd23c3b2011-02-18 12:42:28 -0800120
WANG Cong32a4be42014-05-06 11:15:56 -0700121 ASSERT_RTNL();
David S. Millerfd23c3b2011-02-18 12:42:28 -0800122 hlist_add_head_rcu(&ifa->hash, &inet_addr_lst[hash]);
David S. Millerfd23c3b2011-02-18 12:42:28 -0800123}
124
125static void inet_hash_remove(struct in_ifaddr *ifa)
126{
WANG Cong32a4be42014-05-06 11:15:56 -0700127 ASSERT_RTNL();
David S. Millerfd23c3b2011-02-18 12:42:28 -0800128 hlist_del_init_rcu(&ifa->hash);
David S. Millerfd23c3b2011-02-18 12:42:28 -0800129}
130
David S. Miller9435eb12011-02-18 12:43:09 -0800131/**
132 * __ip_dev_find - find the first device with a given source address.
133 * @net: the net namespace
134 * @addr: the source address
135 * @devref: if true, take a reference on the found device
136 *
137 * If a caller uses devref=false, it should be protected by RCU, or RTNL
138 */
139struct net_device *__ip_dev_find(struct net *net, __be32 addr, bool devref)
140{
Eric Dumazet40384992012-08-03 21:06:50 +0000141 u32 hash = inet_addr_hash(net, addr);
David S. Miller9435eb12011-02-18 12:43:09 -0800142 struct net_device *result = NULL;
143 struct in_ifaddr *ifa;
David S. Miller9435eb12011-02-18 12:43:09 -0800144
145 rcu_read_lock();
Sasha Levinb67bfe02013-02-27 17:06:00 -0800146 hlist_for_each_entry_rcu(ifa, &inet_addr_lst[hash], hash) {
David S. Millere0660082011-03-03 11:24:19 -0800147 if (ifa->ifa_local == addr) {
Eric Dumazet40384992012-08-03 21:06:50 +0000148 struct net_device *dev = ifa->ifa_dev->dev;
149
150 if (!net_eq(dev_net(dev), net))
151 continue;
David S. Miller9435eb12011-02-18 12:43:09 -0800152 result = dev;
153 break;
154 }
155 }
David S. Miller406b6f92011-03-22 21:56:23 -0700156 if (!result) {
157 struct flowi4 fl4 = { .daddr = addr };
158 struct fib_result res = { 0 };
159 struct fib_table *local;
160
161 /* Fallback to FIB local table so that communication
162 * over loopback subnets work.
163 */
164 local = fib_get_table(net, RT_TABLE_LOCAL);
165 if (local &&
166 !fib_table_lookup(local, &fl4, &res, FIB_LOOKUP_NOREF) &&
167 res.type == RTN_LOCAL)
168 result = FIB_RES_DEV(res);
169 }
David S. Miller9435eb12011-02-18 12:43:09 -0800170 if (result && devref)
171 dev_hold(result);
172 rcu_read_unlock();
173 return result;
174}
175EXPORT_SYMBOL(__ip_dev_find);
176
Thomas Grafd6062cb2006-08-15 00:33:59 -0700177static void rtmsg_ifa(int event, struct in_ifaddr *, struct nlmsghdr *, u32);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700178
Alan Sterne041c682006-03-27 01:16:30 -0800179static BLOCKING_NOTIFIER_HEAD(inetaddr_chain);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700180static void inet_del_ifa(struct in_device *in_dev, struct in_ifaddr **ifap,
181 int destroy);
182#ifdef CONFIG_SYSCTL
WANG Cong20e61da2014-07-25 15:25:08 -0700183static int devinet_sysctl_register(struct in_device *idev);
Pavel Emelyanov51602b22007-12-11 02:17:40 -0800184static void devinet_sysctl_unregister(struct in_device *idev);
185#else
WANG Cong20e61da2014-07-25 15:25:08 -0700186static int devinet_sysctl_register(struct in_device *idev)
Pavel Emelyanov51602b22007-12-11 02:17:40 -0800187{
WANG Cong20e61da2014-07-25 15:25:08 -0700188 return 0;
Pavel Emelyanov51602b22007-12-11 02:17:40 -0800189}
Eric Dumazet40384992012-08-03 21:06:50 +0000190static void devinet_sysctl_unregister(struct in_device *idev)
Pavel Emelyanov51602b22007-12-11 02:17:40 -0800191{
192}
Linus Torvalds1da177e2005-04-16 15:20:36 -0700193#endif
194
195/* Locks all the inet devices. */
196
197static struct in_ifaddr *inet_alloc_ifa(void)
198{
Alexey Dobriyan93adcc82008-10-28 13:25:09 -0700199 return kzalloc(sizeof(struct in_ifaddr), GFP_KERNEL);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700200}
201
202static void inet_rcu_free_ifa(struct rcu_head *head)
203{
204 struct in_ifaddr *ifa = container_of(head, struct in_ifaddr, rcu_head);
205 if (ifa->ifa_dev)
206 in_dev_put(ifa->ifa_dev);
207 kfree(ifa);
208}
209
Eric Dumazet40384992012-08-03 21:06:50 +0000210static void inet_free_ifa(struct in_ifaddr *ifa)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700211{
212 call_rcu(&ifa->rcu_head, inet_rcu_free_ifa);
213}
214
215void in_dev_finish_destroy(struct in_device *idev)
216{
217 struct net_device *dev = idev->dev;
218
Ilpo Järvinen547b7922008-07-25 21:43:18 -0700219 WARN_ON(idev->ifa_list);
220 WARN_ON(idev->mc_list);
Eric Dumazete9897072013-06-07 08:48:57 -0700221 kfree(rcu_dereference_protected(idev->mc_hash, 1));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700222#ifdef NET_REFCNT_DEBUG
Joe Perches91df42b2012-05-15 14:11:54 +0000223 pr_debug("%s: %p=%s\n", __func__, idev, dev ? dev->name : "NIL");
Linus Torvalds1da177e2005-04-16 15:20:36 -0700224#endif
225 dev_put(dev);
226 if (!idev->dead)
Eric Dumazet9f9354b2009-11-04 22:05:10 -0800227 pr_err("Freeing alive in_device %p\n", idev);
228 else
Linus Torvalds1da177e2005-04-16 15:20:36 -0700229 kfree(idev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700230}
Eric Dumazet9f9354b2009-11-04 22:05:10 -0800231EXPORT_SYMBOL(in_dev_finish_destroy);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700232
Herbert Xu71e27da2007-06-04 23:36:06 -0700233static struct in_device *inetdev_init(struct net_device *dev)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700234{
235 struct in_device *in_dev;
WANG Cong20e61da2014-07-25 15:25:08 -0700236 int err = -ENOMEM;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700237
238 ASSERT_RTNL();
239
Panagiotis Issaris0da974f2006-07-21 14:51:30 -0700240 in_dev = kzalloc(sizeof(*in_dev), GFP_KERNEL);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700241 if (!in_dev)
242 goto out;
YOSHIFUJI Hideakic346dca2008-03-25 21:47:49 +0900243 memcpy(&in_dev->cnf, dev_net(dev)->ipv4.devconf_dflt,
Pavel Emelyanov9355bbd2007-12-16 13:32:16 -0800244 sizeof(in_dev->cnf));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700245 in_dev->cnf.sysctl = NULL;
246 in_dev->dev = dev;
Eric Dumazet9f9354b2009-11-04 22:05:10 -0800247 in_dev->arp_parms = neigh_parms_alloc(dev, &arp_tbl);
248 if (!in_dev->arp_parms)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700249 goto out_kfree;
Ben Hutchings0187bdf2008-06-19 16:15:47 -0700250 if (IPV4_DEVCONF(in_dev->cnf, FORWARDING))
251 dev_disable_lro(dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700252 /* Reference in_dev->dev */
253 dev_hold(dev);
David L Stevens30c4cf52007-01-04 12:31:14 -0800254 /* Account for reference dev->ip_ptr (below) */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700255 in_dev_hold(in_dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700256
WANG Cong20e61da2014-07-25 15:25:08 -0700257 err = devinet_sysctl_register(in_dev);
258 if (err) {
259 in_dev->dead = 1;
260 in_dev_put(in_dev);
261 in_dev = NULL;
262 goto out;
263 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700264 ip_mc_init_dev(in_dev);
265 if (dev->flags & IFF_UP)
266 ip_mc_up(in_dev);
Jarek Poplawski483479e2007-01-09 14:38:31 -0800267
David L Stevens30c4cf52007-01-04 12:31:14 -0800268 /* we can receive as soon as ip_ptr is set -- do this last */
Eric Dumazetcf778b02012-01-12 04:41:32 +0000269 rcu_assign_pointer(dev->ip_ptr, in_dev);
Jarek Poplawski483479e2007-01-09 14:38:31 -0800270out:
WANG Cong20e61da2014-07-25 15:25:08 -0700271 return in_dev ?: ERR_PTR(err);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700272out_kfree:
273 kfree(in_dev);
274 in_dev = NULL;
275 goto out;
276}
277
278static void in_dev_rcu_put(struct rcu_head *head)
279{
280 struct in_device *idev = container_of(head, struct in_device, rcu_head);
281 in_dev_put(idev);
282}
283
284static void inetdev_destroy(struct in_device *in_dev)
285{
286 struct in_ifaddr *ifa;
287 struct net_device *dev;
288
289 ASSERT_RTNL();
290
291 dev = in_dev->dev;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700292
293 in_dev->dead = 1;
294
295 ip_mc_destroy_dev(in_dev);
296
297 while ((ifa = in_dev->ifa_list) != NULL) {
298 inet_del_ifa(in_dev, &in_dev->ifa_list, 0);
299 inet_free_ifa(ifa);
300 }
301
Stephen Hemmingera9b3cd72011-08-01 16:19:00 +0000302 RCU_INIT_POINTER(dev->ip_ptr, NULL);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700303
Pavel Emelyanov51602b22007-12-11 02:17:40 -0800304 devinet_sysctl_unregister(in_dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700305 neigh_parms_release(&arp_tbl, in_dev->arp_parms);
306 arp_ifdown(dev);
307
308 call_rcu(&in_dev->rcu_head, in_dev_rcu_put);
309}
310
Al Viroff428d72006-09-26 22:13:35 -0700311int inet_addr_onlink(struct in_device *in_dev, __be32 a, __be32 b)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700312{
313 rcu_read_lock();
314 for_primary_ifa(in_dev) {
315 if (inet_ifa_match(a, ifa)) {
316 if (!b || inet_ifa_match(b, ifa)) {
317 rcu_read_unlock();
318 return 1;
319 }
320 }
321 } endfor_ifa(in_dev);
322 rcu_read_unlock();
323 return 0;
324}
325
Thomas Grafd6062cb2006-08-15 00:33:59 -0700326static void __inet_del_ifa(struct in_device *in_dev, struct in_ifaddr **ifap,
Eric W. Biederman15e47302012-09-07 20:12:54 +0000327 int destroy, struct nlmsghdr *nlh, u32 portid)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700328{
Harald Welte8f937c62005-05-29 20:23:46 -0700329 struct in_ifaddr *promote = NULL;
Jamal Hadi Salim0ff60a42005-11-22 14:47:37 -0800330 struct in_ifaddr *ifa, *ifa1 = *ifap;
331 struct in_ifaddr *last_prim = in_dev->ifa_list;
332 struct in_ifaddr *prev_prom = NULL;
333 int do_promote = IN_DEV_PROMOTE_SECONDARIES(in_dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700334
335 ASSERT_RTNL();
336
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +0900337 /* 1. Deleting primary ifaddr forces deletion all secondaries
Harald Welte8f937c62005-05-29 20:23:46 -0700338 * unless alias promotion is set
339 **/
Linus Torvalds1da177e2005-04-16 15:20:36 -0700340
341 if (!(ifa1->ifa_flags & IFA_F_SECONDARY)) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700342 struct in_ifaddr **ifap1 = &ifa1->ifa_next;
343
344 while ((ifa = *ifap1) != NULL) {
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +0900345 if (!(ifa->ifa_flags & IFA_F_SECONDARY) &&
Jamal Hadi Salim0ff60a42005-11-22 14:47:37 -0800346 ifa1->ifa_scope <= ifa->ifa_scope)
347 last_prim = ifa;
348
Linus Torvalds1da177e2005-04-16 15:20:36 -0700349 if (!(ifa->ifa_flags & IFA_F_SECONDARY) ||
350 ifa1->ifa_mask != ifa->ifa_mask ||
351 !inet_ifa_match(ifa1->ifa_address, ifa)) {
352 ifap1 = &ifa->ifa_next;
Jamal Hadi Salim0ff60a42005-11-22 14:47:37 -0800353 prev_prom = ifa;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700354 continue;
355 }
356
Jamal Hadi Salim0ff60a42005-11-22 14:47:37 -0800357 if (!do_promote) {
David S. Millerfd23c3b2011-02-18 12:42:28 -0800358 inet_hash_remove(ifa);
Harald Welte8f937c62005-05-29 20:23:46 -0700359 *ifap1 = ifa->ifa_next;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700360
Eric W. Biederman15e47302012-09-07 20:12:54 +0000361 rtmsg_ifa(RTM_DELADDR, ifa, nlh, portid);
Alan Sterne041c682006-03-27 01:16:30 -0800362 blocking_notifier_call_chain(&inetaddr_chain,
363 NETDEV_DOWN, ifa);
Harald Welte8f937c62005-05-29 20:23:46 -0700364 inet_free_ifa(ifa);
365 } else {
366 promote = ifa;
367 break;
368 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700369 }
370 }
371
Julian Anastasov2d230e22011-03-19 12:13:52 +0000372 /* On promotion all secondaries from subnet are changing
373 * the primary IP, we must remove all their routes silently
374 * and later to add them back with new prefsrc. Do this
375 * while all addresses are on the device list.
376 */
377 for (ifa = promote; ifa; ifa = ifa->ifa_next) {
378 if (ifa1->ifa_mask == ifa->ifa_mask &&
379 inet_ifa_match(ifa1->ifa_address, ifa))
380 fib_del_ifaddr(ifa, ifa1);
381 }
382
Linus Torvalds1da177e2005-04-16 15:20:36 -0700383 /* 2. Unlink it */
384
385 *ifap = ifa1->ifa_next;
David S. Millerfd23c3b2011-02-18 12:42:28 -0800386 inet_hash_remove(ifa1);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700387
388 /* 3. Announce address deletion */
389
390 /* Send message first, then call notifier.
391 At first sight, FIB update triggered by notifier
392 will refer to already deleted ifaddr, that could confuse
393 netlink listeners. It is not true: look, gated sees
394 that route deleted and if it still thinks that ifaddr
395 is valid, it will try to restore deleted routes... Grr.
396 So that, this order is correct.
397 */
Eric W. Biederman15e47302012-09-07 20:12:54 +0000398 rtmsg_ifa(RTM_DELADDR, ifa1, nlh, portid);
Alan Sterne041c682006-03-27 01:16:30 -0800399 blocking_notifier_call_chain(&inetaddr_chain, NETDEV_DOWN, ifa1);
Jamal Hadi Salim0ff60a42005-11-22 14:47:37 -0800400
401 if (promote) {
Julian Anastasov04024b92011-03-19 12:13:54 +0000402 struct in_ifaddr *next_sec = promote->ifa_next;
Jamal Hadi Salim0ff60a42005-11-22 14:47:37 -0800403
404 if (prev_prom) {
405 prev_prom->ifa_next = promote->ifa_next;
406 promote->ifa_next = last_prim->ifa_next;
407 last_prim->ifa_next = promote;
408 }
409
410 promote->ifa_flags &= ~IFA_F_SECONDARY;
Eric W. Biederman15e47302012-09-07 20:12:54 +0000411 rtmsg_ifa(RTM_NEWADDR, promote, nlh, portid);
Alan Sterne041c682006-03-27 01:16:30 -0800412 blocking_notifier_call_chain(&inetaddr_chain,
413 NETDEV_UP, promote);
Julian Anastasov04024b92011-03-19 12:13:54 +0000414 for (ifa = next_sec; ifa; ifa = ifa->ifa_next) {
Jamal Hadi Salim0ff60a42005-11-22 14:47:37 -0800415 if (ifa1->ifa_mask != ifa->ifa_mask ||
416 !inet_ifa_match(ifa1->ifa_address, ifa))
417 continue;
418 fib_add_ifaddr(ifa);
419 }
420
421 }
Herbert Xu63630972007-06-07 18:35:38 -0700422 if (destroy)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700423 inet_free_ifa(ifa1);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700424}
425
Thomas Grafd6062cb2006-08-15 00:33:59 -0700426static void inet_del_ifa(struct in_device *in_dev, struct in_ifaddr **ifap,
427 int destroy)
428{
429 __inet_del_ifa(in_dev, ifap, destroy, NULL, 0);
430}
431
/* Delayed work item that runs check_lifetime(), which is defined below. */
static void check_lifetime(struct work_struct *work);
static DECLARE_DELAYED_WORK(check_lifetime_work, check_lifetime);
435
Thomas Grafd6062cb2006-08-15 00:33:59 -0700436static int __inet_insert_ifa(struct in_ifaddr *ifa, struct nlmsghdr *nlh,
Eric W. Biederman15e47302012-09-07 20:12:54 +0000437 u32 portid)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700438{
439 struct in_device *in_dev = ifa->ifa_dev;
440 struct in_ifaddr *ifa1, **ifap, **last_primary;
441
442 ASSERT_RTNL();
443
444 if (!ifa->ifa_local) {
445 inet_free_ifa(ifa);
446 return 0;
447 }
448
449 ifa->ifa_flags &= ~IFA_F_SECONDARY;
450 last_primary = &in_dev->ifa_list;
451
452 for (ifap = &in_dev->ifa_list; (ifa1 = *ifap) != NULL;
453 ifap = &ifa1->ifa_next) {
454 if (!(ifa1->ifa_flags & IFA_F_SECONDARY) &&
455 ifa->ifa_scope <= ifa1->ifa_scope)
456 last_primary = &ifa1->ifa_next;
457 if (ifa1->ifa_mask == ifa->ifa_mask &&
458 inet_ifa_match(ifa1->ifa_address, ifa)) {
459 if (ifa1->ifa_local == ifa->ifa_local) {
460 inet_free_ifa(ifa);
461 return -EEXIST;
462 }
463 if (ifa1->ifa_scope != ifa->ifa_scope) {
464 inet_free_ifa(ifa);
465 return -EINVAL;
466 }
467 ifa->ifa_flags |= IFA_F_SECONDARY;
468 }
469 }
470
471 if (!(ifa->ifa_flags & IFA_F_SECONDARY)) {
Aruna-Hewapathirane63862b52014-01-11 07:15:59 -0500472 prandom_seed((__force u32) ifa->ifa_local);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700473 ifap = last_primary;
474 }
475
476 ifa->ifa_next = *ifap;
477 *ifap = ifa;
478
David S. Millerfd23c3b2011-02-18 12:42:28 -0800479 inet_hash_insert(dev_net(in_dev->dev), ifa);
480
Jiri Pirko5c766d62013-01-24 09:41:41 +0000481 cancel_delayed_work(&check_lifetime_work);
viresh kumar906e0732014-01-22 12:23:32 +0530482 queue_delayed_work(system_power_efficient_wq, &check_lifetime_work, 0);
Jiri Pirko5c766d62013-01-24 09:41:41 +0000483
Linus Torvalds1da177e2005-04-16 15:20:36 -0700484 /* Send message first, then call notifier.
485 Notifier will trigger FIB update, so that
486 listeners of netlink will know about new ifaddr */
Eric W. Biederman15e47302012-09-07 20:12:54 +0000487 rtmsg_ifa(RTM_NEWADDR, ifa, nlh, portid);
Alan Sterne041c682006-03-27 01:16:30 -0800488 blocking_notifier_call_chain(&inetaddr_chain, NETDEV_UP, ifa);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700489
490 return 0;
491}
492
Thomas Grafd6062cb2006-08-15 00:33:59 -0700493static int inet_insert_ifa(struct in_ifaddr *ifa)
494{
495 return __inet_insert_ifa(ifa, NULL, 0);
496}
497
Linus Torvalds1da177e2005-04-16 15:20:36 -0700498static int inet_set_ifa(struct net_device *dev, struct in_ifaddr *ifa)
499{
Herbert Xue5ed6392005-10-03 14:35:55 -0700500 struct in_device *in_dev = __in_dev_get_rtnl(dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700501
502 ASSERT_RTNL();
503
504 if (!in_dev) {
Herbert Xu71e27da2007-06-04 23:36:06 -0700505 inet_free_ifa(ifa);
506 return -ENOBUFS;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700507 }
Herbert Xu71e27da2007-06-04 23:36:06 -0700508 ipv4_devconf_setall(in_dev);
Jiri Pirko1d4c8c22013-12-07 19:26:56 +0100509 neigh_parms_data_state_setall(in_dev->arp_parms);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700510 if (ifa->ifa_dev != in_dev) {
Ilpo Järvinen547b7922008-07-25 21:43:18 -0700511 WARN_ON(ifa->ifa_dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700512 in_dev_hold(in_dev);
513 ifa->ifa_dev = in_dev;
514 }
Joe Perchesf97c1e02007-12-16 13:45:43 -0800515 if (ipv4_is_loopback(ifa->ifa_local))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700516 ifa->ifa_scope = RT_SCOPE_HOST;
517 return inet_insert_ifa(ifa);
518}
519
Eric Dumazet8723e1b2010-10-19 00:39:26 +0000520/* Caller must hold RCU or RTNL :
521 * We dont take a reference on found in_device
522 */
Denis V. Lunev7fee0ca2008-01-21 17:32:38 -0800523struct in_device *inetdev_by_index(struct net *net, int ifindex)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700524{
525 struct net_device *dev;
526 struct in_device *in_dev = NULL;
Eric Dumazetc148fc22009-11-01 19:23:04 +0000527
528 rcu_read_lock();
529 dev = dev_get_by_index_rcu(net, ifindex);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700530 if (dev)
Eric Dumazet8723e1b2010-10-19 00:39:26 +0000531 in_dev = rcu_dereference_rtnl(dev->ip_ptr);
Eric Dumazetc148fc22009-11-01 19:23:04 +0000532 rcu_read_unlock();
Linus Torvalds1da177e2005-04-16 15:20:36 -0700533 return in_dev;
534}
Eric Dumazet9f9354b2009-11-04 22:05:10 -0800535EXPORT_SYMBOL(inetdev_by_index);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700536
537/* Called only from RTNL semaphored context. No locks. */
538
Al Viro60cad5d2006-09-26 22:17:09 -0700539struct in_ifaddr *inet_ifa_byprefix(struct in_device *in_dev, __be32 prefix,
540 __be32 mask)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700541{
542 ASSERT_RTNL();
543
544 for_primary_ifa(in_dev) {
545 if (ifa->ifa_mask == mask && inet_ifa_match(prefix, ifa))
546 return ifa;
547 } endfor_ifa(in_dev);
548 return NULL;
549}
550
Thomas Graf661d2962013-03-21 07:45:29 +0000551static int inet_rtm_deladdr(struct sk_buff *skb, struct nlmsghdr *nlh)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700552{
YOSHIFUJI Hideaki3b1e0a62008-03-26 02:26:21 +0900553 struct net *net = sock_net(skb->sk);
Thomas Grafdfdd5fd2006-08-04 23:04:17 -0700554 struct nlattr *tb[IFA_MAX+1];
Linus Torvalds1da177e2005-04-16 15:20:36 -0700555 struct in_device *in_dev;
Thomas Grafdfdd5fd2006-08-04 23:04:17 -0700556 struct ifaddrmsg *ifm;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700557 struct in_ifaddr *ifa, **ifap;
Thomas Grafdfdd5fd2006-08-04 23:04:17 -0700558 int err = -EINVAL;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700559
560 ASSERT_RTNL();
561
Thomas Grafdfdd5fd2006-08-04 23:04:17 -0700562 err = nlmsg_parse(nlh, sizeof(*ifm), tb, IFA_MAX, ifa_ipv4_policy);
563 if (err < 0)
564 goto errout;
565
566 ifm = nlmsg_data(nlh);
Denis V. Lunev7fee0ca2008-01-21 17:32:38 -0800567 in_dev = inetdev_by_index(net, ifm->ifa_index);
Thomas Grafdfdd5fd2006-08-04 23:04:17 -0700568 if (in_dev == NULL) {
569 err = -ENODEV;
570 goto errout;
571 }
572
Linus Torvalds1da177e2005-04-16 15:20:36 -0700573 for (ifap = &in_dev->ifa_list; (ifa = *ifap) != NULL;
574 ifap = &ifa->ifa_next) {
Thomas Grafdfdd5fd2006-08-04 23:04:17 -0700575 if (tb[IFA_LOCAL] &&
Al Viroa7a628c2006-09-26 22:16:43 -0700576 ifa->ifa_local != nla_get_be32(tb[IFA_LOCAL]))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700577 continue;
Thomas Grafdfdd5fd2006-08-04 23:04:17 -0700578
579 if (tb[IFA_LABEL] && nla_strcmp(tb[IFA_LABEL], ifa->ifa_label))
580 continue;
581
582 if (tb[IFA_ADDRESS] &&
583 (ifm->ifa_prefixlen != ifa->ifa_prefixlen ||
Al Viroa7a628c2006-09-26 22:16:43 -0700584 !inet_ifa_match(nla_get_be32(tb[IFA_ADDRESS]), ifa)))
Thomas Grafdfdd5fd2006-08-04 23:04:17 -0700585 continue;
586
Eric W. Biederman15e47302012-09-07 20:12:54 +0000587 __inet_del_ifa(in_dev, ifap, 1, nlh, NETLINK_CB(skb).portid);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700588 return 0;
589 }
Thomas Grafdfdd5fd2006-08-04 23:04:17 -0700590
591 err = -EADDRNOTAVAIL;
592errout:
593 return err;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700594}
595
/* Lifetime value that check_lifetime() treats as "never expires". */
#define INFINITY_LIFE_TIME	0xFFFFFFFF
597
598static void check_lifetime(struct work_struct *work)
599{
600 unsigned long now, next, next_sec, next_sched;
601 struct in_ifaddr *ifa;
Jiri Pirkoc988d1e2013-04-04 23:39:39 +0000602 struct hlist_node *n;
Jiri Pirko5c766d62013-01-24 09:41:41 +0000603 int i;
604
605 now = jiffies;
606 next = round_jiffies_up(now + ADDR_CHECK_FREQUENCY);
607
Jiri Pirko5c766d62013-01-24 09:41:41 +0000608 for (i = 0; i < IN4_ADDR_HSIZE; i++) {
Jiri Pirkoc988d1e2013-04-04 23:39:39 +0000609 bool change_needed = false;
610
611 rcu_read_lock();
Sasha Levinb67bfe02013-02-27 17:06:00 -0800612 hlist_for_each_entry_rcu(ifa, &inet_addr_lst[i], hash) {
Jiri Pirko5c766d62013-01-24 09:41:41 +0000613 unsigned long age;
614
615 if (ifa->ifa_flags & IFA_F_PERMANENT)
616 continue;
617
618 /* We try to batch several events at once. */
619 age = (now - ifa->ifa_tstamp +
620 ADDRCONF_TIMER_FUZZ_MINUS) / HZ;
621
622 if (ifa->ifa_valid_lft != INFINITY_LIFE_TIME &&
623 age >= ifa->ifa_valid_lft) {
Jiri Pirkoc988d1e2013-04-04 23:39:39 +0000624 change_needed = true;
Jiri Pirko5c766d62013-01-24 09:41:41 +0000625 } else if (ifa->ifa_preferred_lft ==
626 INFINITY_LIFE_TIME) {
627 continue;
628 } else if (age >= ifa->ifa_preferred_lft) {
629 if (time_before(ifa->ifa_tstamp +
630 ifa->ifa_valid_lft * HZ, next))
631 next = ifa->ifa_tstamp +
632 ifa->ifa_valid_lft * HZ;
633
Jiri Pirkoc988d1e2013-04-04 23:39:39 +0000634 if (!(ifa->ifa_flags & IFA_F_DEPRECATED))
635 change_needed = true;
Jiri Pirko5c766d62013-01-24 09:41:41 +0000636 } else if (time_before(ifa->ifa_tstamp +
637 ifa->ifa_preferred_lft * HZ,
638 next)) {
639 next = ifa->ifa_tstamp +
640 ifa->ifa_preferred_lft * HZ;
641 }
642 }
Jiri Pirkoc988d1e2013-04-04 23:39:39 +0000643 rcu_read_unlock();
644 if (!change_needed)
645 continue;
646 rtnl_lock();
647 hlist_for_each_entry_safe(ifa, n, &inet_addr_lst[i], hash) {
648 unsigned long age;
649
650 if (ifa->ifa_flags & IFA_F_PERMANENT)
651 continue;
652
653 /* We try to batch several events at once. */
654 age = (now - ifa->ifa_tstamp +
655 ADDRCONF_TIMER_FUZZ_MINUS) / HZ;
656
657 if (ifa->ifa_valid_lft != INFINITY_LIFE_TIME &&
658 age >= ifa->ifa_valid_lft) {
659 struct in_ifaddr **ifap;
660
661 for (ifap = &ifa->ifa_dev->ifa_list;
662 *ifap != NULL; ifap = &(*ifap)->ifa_next) {
663 if (*ifap == ifa) {
664 inet_del_ifa(ifa->ifa_dev,
665 ifap, 1);
666 break;
667 }
668 }
669 } else if (ifa->ifa_preferred_lft !=
670 INFINITY_LIFE_TIME &&
671 age >= ifa->ifa_preferred_lft &&
672 !(ifa->ifa_flags & IFA_F_DEPRECATED)) {
673 ifa->ifa_flags |= IFA_F_DEPRECATED;
674 rtmsg_ifa(RTM_NEWADDR, ifa, NULL, 0);
675 }
676 }
677 rtnl_unlock();
Jiri Pirko5c766d62013-01-24 09:41:41 +0000678 }
Jiri Pirko5c766d62013-01-24 09:41:41 +0000679
680 next_sec = round_jiffies_up(next);
681 next_sched = next;
682
683 /* If rounded timeout is accurate enough, accept it. */
684 if (time_before(next_sec, next + ADDRCONF_TIMER_FUZZ))
685 next_sched = next_sec;
686
687 now = jiffies;
688 /* And minimum interval is ADDRCONF_TIMER_FUZZ_MAX. */
689 if (time_before(next_sched, now + ADDRCONF_TIMER_FUZZ_MAX))
690 next_sched = now + ADDRCONF_TIMER_FUZZ_MAX;
691
viresh kumar906e0732014-01-22 12:23:32 +0530692 queue_delayed_work(system_power_efficient_wq, &check_lifetime_work,
693 next_sched - now);
Jiri Pirko5c766d62013-01-24 09:41:41 +0000694}
695
696static void set_ifa_lifetime(struct in_ifaddr *ifa, __u32 valid_lft,
697 __u32 prefered_lft)
698{
699 unsigned long timeout;
700
701 ifa->ifa_flags &= ~(IFA_F_PERMANENT | IFA_F_DEPRECATED);
702
703 timeout = addrconf_timeout_fixup(valid_lft, HZ);
704 if (addrconf_finite_timeout(timeout))
705 ifa->ifa_valid_lft = timeout;
706 else
707 ifa->ifa_flags |= IFA_F_PERMANENT;
708
709 timeout = addrconf_timeout_fixup(prefered_lft, HZ);
710 if (addrconf_finite_timeout(timeout)) {
711 if (timeout == 0)
712 ifa->ifa_flags |= IFA_F_DEPRECATED;
713 ifa->ifa_preferred_lft = timeout;
714 }
715 ifa->ifa_tstamp = jiffies;
716 if (!ifa->ifa_cstamp)
717 ifa->ifa_cstamp = ifa->ifa_tstamp;
718}
719
720static struct in_ifaddr *rtm_to_ifaddr(struct net *net, struct nlmsghdr *nlh,
721 __u32 *pvalid_lft, __u32 *pprefered_lft)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700722{
Thomas Graf5c753972006-08-04 23:03:53 -0700723 struct nlattr *tb[IFA_MAX+1];
724 struct in_ifaddr *ifa;
725 struct ifaddrmsg *ifm;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700726 struct net_device *dev;
727 struct in_device *in_dev;
Denis V. Lunev7b218572008-01-31 18:47:00 -0800728 int err;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700729
Thomas Graf5c753972006-08-04 23:03:53 -0700730 err = nlmsg_parse(nlh, sizeof(*ifm), tb, IFA_MAX, ifa_ipv4_policy);
731 if (err < 0)
732 goto errout;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700733
Thomas Graf5c753972006-08-04 23:03:53 -0700734 ifm = nlmsg_data(nlh);
Denis V. Lunev7b218572008-01-31 18:47:00 -0800735 err = -EINVAL;
736 if (ifm->ifa_prefixlen > 32 || tb[IFA_LOCAL] == NULL)
Thomas Graf5c753972006-08-04 23:03:53 -0700737 goto errout;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700738
Denis V. Lunev4b8aa9a2008-01-31 18:47:40 -0800739 dev = __dev_get_by_index(net, ifm->ifa_index);
Denis V. Lunev7b218572008-01-31 18:47:00 -0800740 err = -ENODEV;
741 if (dev == NULL)
Thomas Graf5c753972006-08-04 23:03:53 -0700742 goto errout;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700743
Thomas Graf5c753972006-08-04 23:03:53 -0700744 in_dev = __in_dev_get_rtnl(dev);
Denis V. Lunev7b218572008-01-31 18:47:00 -0800745 err = -ENOBUFS;
746 if (in_dev == NULL)
Herbert Xu71e27da2007-06-04 23:36:06 -0700747 goto errout;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700748
Thomas Graf5c753972006-08-04 23:03:53 -0700749 ifa = inet_alloc_ifa();
Denis V. Lunev7b218572008-01-31 18:47:00 -0800750 if (ifa == NULL)
Thomas Graf5c753972006-08-04 23:03:53 -0700751 /*
752 * A potential indev allocation can be left alive, it stays
753 * assigned to its device and is destroy with it.
754 */
Thomas Graf5c753972006-08-04 23:03:53 -0700755 goto errout;
Thomas Graf5c753972006-08-04 23:03:53 -0700756
Pavel Emelyanova4e65d32007-12-07 23:55:43 -0800757 ipv4_devconf_setall(in_dev);
Jiri Pirko1d4c8c22013-12-07 19:26:56 +0100758 neigh_parms_data_state_setall(in_dev->arp_parms);
Thomas Graf5c753972006-08-04 23:03:53 -0700759 in_dev_hold(in_dev);
760
761 if (tb[IFA_ADDRESS] == NULL)
762 tb[IFA_ADDRESS] = tb[IFA_LOCAL];
763
David S. Millerfd23c3b2011-02-18 12:42:28 -0800764 INIT_HLIST_NODE(&ifa->hash);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700765 ifa->ifa_prefixlen = ifm->ifa_prefixlen;
766 ifa->ifa_mask = inet_make_mask(ifm->ifa_prefixlen);
Jiri Pirkoad6c8132013-12-08 12:16:10 +0100767 ifa->ifa_flags = tb[IFA_FLAGS] ? nla_get_u32(tb[IFA_FLAGS]) :
768 ifm->ifa_flags;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700769 ifa->ifa_scope = ifm->ifa_scope;
Thomas Graf5c753972006-08-04 23:03:53 -0700770 ifa->ifa_dev = in_dev;
771
Al Viroa7a628c2006-09-26 22:16:43 -0700772 ifa->ifa_local = nla_get_be32(tb[IFA_LOCAL]);
773 ifa->ifa_address = nla_get_be32(tb[IFA_ADDRESS]);
Thomas Graf5c753972006-08-04 23:03:53 -0700774
775 if (tb[IFA_BROADCAST])
Al Viroa7a628c2006-09-26 22:16:43 -0700776 ifa->ifa_broadcast = nla_get_be32(tb[IFA_BROADCAST]);
Thomas Graf5c753972006-08-04 23:03:53 -0700777
Thomas Graf5c753972006-08-04 23:03:53 -0700778 if (tb[IFA_LABEL])
779 nla_strlcpy(ifa->ifa_label, tb[IFA_LABEL], IFNAMSIZ);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700780 else
781 memcpy(ifa->ifa_label, dev->name, IFNAMSIZ);
782
Jiri Pirko5c766d62013-01-24 09:41:41 +0000783 if (tb[IFA_CACHEINFO]) {
784 struct ifa_cacheinfo *ci;
785
786 ci = nla_data(tb[IFA_CACHEINFO]);
787 if (!ci->ifa_valid || ci->ifa_prefered > ci->ifa_valid) {
788 err = -EINVAL;
Daniel Borkmann446266b2013-08-02 11:32:43 +0200789 goto errout_free;
Jiri Pirko5c766d62013-01-24 09:41:41 +0000790 }
791 *pvalid_lft = ci->ifa_valid;
792 *pprefered_lft = ci->ifa_prefered;
793 }
794
Thomas Graf5c753972006-08-04 23:03:53 -0700795 return ifa;
796
Daniel Borkmann446266b2013-08-02 11:32:43 +0200797errout_free:
798 inet_free_ifa(ifa);
Thomas Graf5c753972006-08-04 23:03:53 -0700799errout:
800 return ERR_PTR(err);
801}
802
Jiri Pirko5c766d62013-01-24 09:41:41 +0000803static struct in_ifaddr *find_matching_ifa(struct in_ifaddr *ifa)
804{
805 struct in_device *in_dev = ifa->ifa_dev;
806 struct in_ifaddr *ifa1, **ifap;
807
808 if (!ifa->ifa_local)
809 return NULL;
810
811 for (ifap = &in_dev->ifa_list; (ifa1 = *ifap) != NULL;
812 ifap = &ifa1->ifa_next) {
813 if (ifa1->ifa_mask == ifa->ifa_mask &&
814 inet_ifa_match(ifa1->ifa_address, ifa) &&
815 ifa1->ifa_local == ifa->ifa_local)
816 return ifa1;
817 }
818 return NULL;
819}
820
Thomas Graf661d2962013-03-21 07:45:29 +0000821static int inet_rtm_newaddr(struct sk_buff *skb, struct nlmsghdr *nlh)
Thomas Graf5c753972006-08-04 23:03:53 -0700822{
YOSHIFUJI Hideaki3b1e0a62008-03-26 02:26:21 +0900823 struct net *net = sock_net(skb->sk);
Thomas Graf5c753972006-08-04 23:03:53 -0700824 struct in_ifaddr *ifa;
Jiri Pirko5c766d62013-01-24 09:41:41 +0000825 struct in_ifaddr *ifa_existing;
826 __u32 valid_lft = INFINITY_LIFE_TIME;
827 __u32 prefered_lft = INFINITY_LIFE_TIME;
Thomas Graf5c753972006-08-04 23:03:53 -0700828
829 ASSERT_RTNL();
830
Jiri Pirko5c766d62013-01-24 09:41:41 +0000831 ifa = rtm_to_ifaddr(net, nlh, &valid_lft, &prefered_lft);
Thomas Graf5c753972006-08-04 23:03:53 -0700832 if (IS_ERR(ifa))
833 return PTR_ERR(ifa);
834
Jiri Pirko5c766d62013-01-24 09:41:41 +0000835 ifa_existing = find_matching_ifa(ifa);
836 if (!ifa_existing) {
837 /* It would be best to check for !NLM_F_CREATE here but
stephen hemminger614d0562014-05-16 20:46:58 -0700838 * userspace already relies on not having to provide this.
Jiri Pirko5c766d62013-01-24 09:41:41 +0000839 */
840 set_ifa_lifetime(ifa, valid_lft, prefered_lft);
841 return __inet_insert_ifa(ifa, nlh, NETLINK_CB(skb).portid);
842 } else {
843 inet_free_ifa(ifa);
844
845 if (nlh->nlmsg_flags & NLM_F_EXCL ||
846 !(nlh->nlmsg_flags & NLM_F_REPLACE))
847 return -EEXIST;
Jiri Pirko34e2ed32013-04-04 08:33:00 +0000848 ifa = ifa_existing;
849 set_ifa_lifetime(ifa, valid_lft, prefered_lft);
Jiri Pirko05a324b2013-04-04 23:39:38 +0000850 cancel_delayed_work(&check_lifetime_work);
viresh kumar906e0732014-01-22 12:23:32 +0530851 queue_delayed_work(system_power_efficient_wq,
852 &check_lifetime_work, 0);
Jiri Pirko34e2ed32013-04-04 08:33:00 +0000853 rtmsg_ifa(RTM_NEWADDR, ifa, nlh, NETLINK_CB(skb).portid);
854 blocking_notifier_call_chain(&inetaddr_chain, NETDEV_UP, ifa);
Jiri Pirko5c766d62013-01-24 09:41:41 +0000855 }
856 return 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700857}
858
859/*
860 * Determine a default network mask, based on the IP address.
861 */
862
Eric Dumazet40384992012-08-03 21:06:50 +0000863static int inet_abc_len(__be32 addr)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700864{
865 int rc = -1; /* Something else, probably a multicast. */
866
Joe Perchesf97c1e02007-12-16 13:45:43 -0800867 if (ipv4_is_zeronet(addr))
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +0900868 rc = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700869 else {
Al Viro714e85b2006-11-14 20:51:49 -0800870 __u32 haddr = ntohl(addr);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700871
Al Viro714e85b2006-11-14 20:51:49 -0800872 if (IN_CLASSA(haddr))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700873 rc = 8;
Al Viro714e85b2006-11-14 20:51:49 -0800874 else if (IN_CLASSB(haddr))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700875 rc = 16;
Al Viro714e85b2006-11-14 20:51:49 -0800876 else if (IN_CLASSC(haddr))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700877 rc = 24;
878 }
879
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +0900880 return rc;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700881}
882
883
Denis V. Luneve5b13cb2008-02-28 20:51:43 -0800884int devinet_ioctl(struct net *net, unsigned int cmd, void __user *arg)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700885{
886 struct ifreq ifr;
887 struct sockaddr_in sin_orig;
888 struct sockaddr_in *sin = (struct sockaddr_in *)&ifr.ifr_addr;
889 struct in_device *in_dev;
890 struct in_ifaddr **ifap = NULL;
891 struct in_ifaddr *ifa = NULL;
892 struct net_device *dev;
893 char *colon;
894 int ret = -EFAULT;
895 int tryaddrmatch = 0;
896
897 /*
898 * Fetch the caller's info block into kernel space
899 */
900
901 if (copy_from_user(&ifr, arg, sizeof(struct ifreq)))
902 goto out;
903 ifr.ifr_name[IFNAMSIZ - 1] = 0;
904
905 /* save original address for comparison */
906 memcpy(&sin_orig, sin, sizeof(*sin));
907
908 colon = strchr(ifr.ifr_name, ':');
909 if (colon)
910 *colon = 0;
911
Denis V. Luneve5b13cb2008-02-28 20:51:43 -0800912 dev_load(net, ifr.ifr_name);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700913
Stephen Hemminger132adf52007-03-08 20:44:43 -0800914 switch (cmd) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700915 case SIOCGIFADDR: /* Get interface address */
916 case SIOCGIFBRDADDR: /* Get the broadcast address */
917 case SIOCGIFDSTADDR: /* Get the destination address */
918 case SIOCGIFNETMASK: /* Get the netmask for the interface */
919 /* Note that these ioctls will not sleep,
920 so that we do not impose a lock.
921 One day we will be forced to put shlock here (I mean SMP)
922 */
923 tryaddrmatch = (sin_orig.sin_family == AF_INET);
924 memset(sin, 0, sizeof(*sin));
925 sin->sin_family = AF_INET;
926 break;
927
928 case SIOCSIFFLAGS:
Zhao Hongjiangbf5b30b2012-09-20 22:37:25 +0000929 ret = -EPERM;
Eric W. Biederman52e804c2012-11-16 03:03:05 +0000930 if (!ns_capable(net->user_ns, CAP_NET_ADMIN))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700931 goto out;
932 break;
933 case SIOCSIFADDR: /* Set interface address (and family) */
934 case SIOCSIFBRDADDR: /* Set the broadcast address */
935 case SIOCSIFDSTADDR: /* Set the destination address */
936 case SIOCSIFNETMASK: /* Set the netmask for the interface */
Zhao Hongjiangbf5b30b2012-09-20 22:37:25 +0000937 ret = -EPERM;
Eric W. Biederman52e804c2012-11-16 03:03:05 +0000938 if (!ns_capable(net->user_ns, CAP_NET_ADMIN))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700939 goto out;
940 ret = -EINVAL;
941 if (sin->sin_family != AF_INET)
942 goto out;
943 break;
944 default:
945 ret = -EINVAL;
946 goto out;
947 }
948
949 rtnl_lock();
950
951 ret = -ENODEV;
Eric Dumazet9f9354b2009-11-04 22:05:10 -0800952 dev = __dev_get_by_name(net, ifr.ifr_name);
953 if (!dev)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700954 goto done;
955
956 if (colon)
957 *colon = ':';
958
Eric Dumazet9f9354b2009-11-04 22:05:10 -0800959 in_dev = __in_dev_get_rtnl(dev);
960 if (in_dev) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700961 if (tryaddrmatch) {
962 /* Matthias Andree */
963 /* compare label and address (4.4BSD style) */
964 /* note: we only do this for a limited set of ioctls
965 and only if the original address family was AF_INET.
966 This is checked above. */
967 for (ifap = &in_dev->ifa_list; (ifa = *ifap) != NULL;
968 ifap = &ifa->ifa_next) {
969 if (!strcmp(ifr.ifr_name, ifa->ifa_label) &&
970 sin_orig.sin_addr.s_addr ==
David S. Miller6c91afe2011-03-09 13:27:16 -0800971 ifa->ifa_local) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700972 break; /* found */
973 }
974 }
975 }
976 /* we didn't get a match, maybe the application is
977 4.3BSD-style and passed in junk so we fall back to
978 comparing just the label */
979 if (!ifa) {
980 for (ifap = &in_dev->ifa_list; (ifa = *ifap) != NULL;
981 ifap = &ifa->ifa_next)
982 if (!strcmp(ifr.ifr_name, ifa->ifa_label))
983 break;
984 }
985 }
986
987 ret = -EADDRNOTAVAIL;
988 if (!ifa && cmd != SIOCSIFADDR && cmd != SIOCSIFFLAGS)
989 goto done;
990
Stephen Hemminger132adf52007-03-08 20:44:43 -0800991 switch (cmd) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700992 case SIOCGIFADDR: /* Get interface address */
993 sin->sin_addr.s_addr = ifa->ifa_local;
994 goto rarok;
995
996 case SIOCGIFBRDADDR: /* Get the broadcast address */
997 sin->sin_addr.s_addr = ifa->ifa_broadcast;
998 goto rarok;
999
1000 case SIOCGIFDSTADDR: /* Get the destination address */
1001 sin->sin_addr.s_addr = ifa->ifa_address;
1002 goto rarok;
1003
1004 case SIOCGIFNETMASK: /* Get the netmask for the interface */
1005 sin->sin_addr.s_addr = ifa->ifa_mask;
1006 goto rarok;
1007
1008 case SIOCSIFFLAGS:
1009 if (colon) {
1010 ret = -EADDRNOTAVAIL;
1011 if (!ifa)
1012 break;
1013 ret = 0;
1014 if (!(ifr.ifr_flags & IFF_UP))
1015 inet_del_ifa(in_dev, ifap, 1);
1016 break;
1017 }
1018 ret = dev_change_flags(dev, ifr.ifr_flags);
1019 break;
1020
1021 case SIOCSIFADDR: /* Set interface address (and family) */
1022 ret = -EINVAL;
1023 if (inet_abc_len(sin->sin_addr.s_addr) < 0)
1024 break;
1025
1026 if (!ifa) {
1027 ret = -ENOBUFS;
Eric Dumazet9f9354b2009-11-04 22:05:10 -08001028 ifa = inet_alloc_ifa();
1029 if (!ifa)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001030 break;
Xi Wangc7e2e1d2013-01-05 11:19:24 +00001031 INIT_HLIST_NODE(&ifa->hash);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001032 if (colon)
1033 memcpy(ifa->ifa_label, ifr.ifr_name, IFNAMSIZ);
1034 else
1035 memcpy(ifa->ifa_label, dev->name, IFNAMSIZ);
1036 } else {
1037 ret = 0;
1038 if (ifa->ifa_local == sin->sin_addr.s_addr)
1039 break;
1040 inet_del_ifa(in_dev, ifap, 0);
1041 ifa->ifa_broadcast = 0;
Bjorn Mork148f9722008-02-26 18:17:53 -08001042 ifa->ifa_scope = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001043 }
1044
1045 ifa->ifa_address = ifa->ifa_local = sin->sin_addr.s_addr;
1046
1047 if (!(dev->flags & IFF_POINTOPOINT)) {
1048 ifa->ifa_prefixlen = inet_abc_len(ifa->ifa_address);
1049 ifa->ifa_mask = inet_make_mask(ifa->ifa_prefixlen);
1050 if ((dev->flags & IFF_BROADCAST) &&
1051 ifa->ifa_prefixlen < 31)
1052 ifa->ifa_broadcast = ifa->ifa_address |
1053 ~ifa->ifa_mask;
1054 } else {
1055 ifa->ifa_prefixlen = 32;
1056 ifa->ifa_mask = inet_make_mask(32);
1057 }
Jiri Pirko5c766d62013-01-24 09:41:41 +00001058 set_ifa_lifetime(ifa, INFINITY_LIFE_TIME, INFINITY_LIFE_TIME);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001059 ret = inet_set_ifa(dev, ifa);
1060 break;
1061
1062 case SIOCSIFBRDADDR: /* Set the broadcast address */
1063 ret = 0;
1064 if (ifa->ifa_broadcast != sin->sin_addr.s_addr) {
1065 inet_del_ifa(in_dev, ifap, 0);
1066 ifa->ifa_broadcast = sin->sin_addr.s_addr;
1067 inet_insert_ifa(ifa);
1068 }
1069 break;
1070
1071 case SIOCSIFDSTADDR: /* Set the destination address */
1072 ret = 0;
1073 if (ifa->ifa_address == sin->sin_addr.s_addr)
1074 break;
1075 ret = -EINVAL;
1076 if (inet_abc_len(sin->sin_addr.s_addr) < 0)
1077 break;
1078 ret = 0;
1079 inet_del_ifa(in_dev, ifap, 0);
1080 ifa->ifa_address = sin->sin_addr.s_addr;
1081 inet_insert_ifa(ifa);
1082 break;
1083
1084 case SIOCSIFNETMASK: /* Set the netmask for the interface */
1085
1086 /*
1087 * The mask we set must be legal.
1088 */
1089 ret = -EINVAL;
1090 if (bad_mask(sin->sin_addr.s_addr, 0))
1091 break;
1092 ret = 0;
1093 if (ifa->ifa_mask != sin->sin_addr.s_addr) {
Al Viroa144ea42006-09-28 18:00:55 -07001094 __be32 old_mask = ifa->ifa_mask;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001095 inet_del_ifa(in_dev, ifap, 0);
1096 ifa->ifa_mask = sin->sin_addr.s_addr;
1097 ifa->ifa_prefixlen = inet_mask_len(ifa->ifa_mask);
1098
1099 /* See if current broadcast address matches
1100 * with current netmask, then recalculate
1101 * the broadcast address. Otherwise it's a
1102 * funny address, so don't touch it since
1103 * the user seems to know what (s)he's doing...
1104 */
1105 if ((dev->flags & IFF_BROADCAST) &&
1106 (ifa->ifa_prefixlen < 31) &&
1107 (ifa->ifa_broadcast ==
David Engeldcab5e12005-10-21 22:09:16 -05001108 (ifa->ifa_local|~old_mask))) {
Linus Torvalds1da177e2005-04-16 15:20:36 -07001109 ifa->ifa_broadcast = (ifa->ifa_local |
1110 ~sin->sin_addr.s_addr);
1111 }
1112 inet_insert_ifa(ifa);
1113 }
1114 break;
1115 }
1116done:
1117 rtnl_unlock();
1118out:
1119 return ret;
1120rarok:
1121 rtnl_unlock();
1122 ret = copy_to_user(arg, &ifr, sizeof(struct ifreq)) ? -EFAULT : 0;
1123 goto out;
1124}
1125
1126static int inet_gifconf(struct net_device *dev, char __user *buf, int len)
1127{
Herbert Xue5ed6392005-10-03 14:35:55 -07001128 struct in_device *in_dev = __in_dev_get_rtnl(dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001129 struct in_ifaddr *ifa;
1130 struct ifreq ifr;
1131 int done = 0;
1132
Eric Dumazet9f9354b2009-11-04 22:05:10 -08001133 if (!in_dev)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001134 goto out;
1135
Eric Dumazet9f9354b2009-11-04 22:05:10 -08001136 for (ifa = in_dev->ifa_list; ifa; ifa = ifa->ifa_next) {
Linus Torvalds1da177e2005-04-16 15:20:36 -07001137 if (!buf) {
1138 done += sizeof(ifr);
1139 continue;
1140 }
1141 if (len < (int) sizeof(ifr))
1142 break;
1143 memset(&ifr, 0, sizeof(struct ifreq));
Dan Carpenter4299c8a2013-07-29 22:15:19 +03001144 strcpy(ifr.ifr_name, ifa->ifa_label);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001145
1146 (*(struct sockaddr_in *)&ifr.ifr_addr).sin_family = AF_INET;
1147 (*(struct sockaddr_in *)&ifr.ifr_addr).sin_addr.s_addr =
1148 ifa->ifa_local;
1149
1150 if (copy_to_user(buf, &ifr, sizeof(struct ifreq))) {
1151 done = -EFAULT;
1152 break;
1153 }
1154 buf += sizeof(struct ifreq);
1155 len -= sizeof(struct ifreq);
1156 done += sizeof(struct ifreq);
1157 }
1158out:
1159 return done;
1160}
1161
Al Viroa61ced52006-09-26 21:27:54 -07001162__be32 inet_select_addr(const struct net_device *dev, __be32 dst, int scope)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001163{
Al Viroa61ced52006-09-26 21:27:54 -07001164 __be32 addr = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001165 struct in_device *in_dev;
YOSHIFUJI Hideakic346dca2008-03-25 21:47:49 +09001166 struct net *net = dev_net(dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001167
1168 rcu_read_lock();
Herbert Xue5ed6392005-10-03 14:35:55 -07001169 in_dev = __in_dev_get_rcu(dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001170 if (!in_dev)
1171 goto no_in_dev;
1172
1173 for_primary_ifa(in_dev) {
1174 if (ifa->ifa_scope > scope)
1175 continue;
1176 if (!dst || inet_ifa_match(dst, ifa)) {
1177 addr = ifa->ifa_local;
1178 break;
1179 }
1180 if (!addr)
1181 addr = ifa->ifa_local;
1182 } endfor_ifa(in_dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001183
1184 if (addr)
Eric Dumazetc6d14c82009-11-04 05:43:23 -08001185 goto out_unlock;
Eric Dumazet9f9354b2009-11-04 22:05:10 -08001186no_in_dev:
Linus Torvalds1da177e2005-04-16 15:20:36 -07001187
1188 /* Not loopback addresses on loopback should be preferred
1189 in this case. It is importnat that lo is the first interface
1190 in dev_base list.
1191 */
Eric Dumazetc6d14c82009-11-04 05:43:23 -08001192 for_each_netdev_rcu(net, dev) {
Eric Dumazet9f9354b2009-11-04 22:05:10 -08001193 in_dev = __in_dev_get_rcu(dev);
1194 if (!in_dev)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001195 continue;
1196
1197 for_primary_ifa(in_dev) {
1198 if (ifa->ifa_scope != RT_SCOPE_LINK &&
1199 ifa->ifa_scope <= scope) {
1200 addr = ifa->ifa_local;
Eric Dumazetc6d14c82009-11-04 05:43:23 -08001201 goto out_unlock;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001202 }
1203 } endfor_ifa(in_dev);
1204 }
Eric Dumazetc6d14c82009-11-04 05:43:23 -08001205out_unlock:
Linus Torvalds1da177e2005-04-16 15:20:36 -07001206 rcu_read_unlock();
Linus Torvalds1da177e2005-04-16 15:20:36 -07001207 return addr;
1208}
Eric Dumazet9f9354b2009-11-04 22:05:10 -08001209EXPORT_SYMBOL(inet_select_addr);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001210
Al Viro60cad5d2006-09-26 22:17:09 -07001211static __be32 confirm_addr_indev(struct in_device *in_dev, __be32 dst,
1212 __be32 local, int scope)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001213{
1214 int same = 0;
Al Viroa144ea42006-09-28 18:00:55 -07001215 __be32 addr = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001216
1217 for_ifa(in_dev) {
1218 if (!addr &&
1219 (local == ifa->ifa_local || !local) &&
1220 ifa->ifa_scope <= scope) {
1221 addr = ifa->ifa_local;
1222 if (same)
1223 break;
1224 }
1225 if (!same) {
1226 same = (!local || inet_ifa_match(local, ifa)) &&
1227 (!dst || inet_ifa_match(dst, ifa));
1228 if (same && addr) {
1229 if (local || !dst)
1230 break;
1231 /* Is the selected addr into dst subnet? */
1232 if (inet_ifa_match(addr, ifa))
1233 break;
1234 /* No, then can we use new local src? */
1235 if (ifa->ifa_scope <= scope) {
1236 addr = ifa->ifa_local;
1237 break;
1238 }
1239 /* search for large dst subnet for addr */
1240 same = 0;
1241 }
1242 }
1243 } endfor_ifa(in_dev);
1244
Eric Dumazet9f9354b2009-11-04 22:05:10 -08001245 return same ? addr : 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001246}
1247
1248/*
1249 * Confirm that local IP address exists using wildcards:
Nicolas Dichtelb601fa12013-12-10 15:02:40 +01001250 * - net: netns to check, cannot be NULL
1251 * - in_dev: only on this interface, NULL=any interface
Linus Torvalds1da177e2005-04-16 15:20:36 -07001252 * - dst: only in the same subnet as dst, 0=any dst
1253 * - local: address, 0=autoselect the local address
1254 * - scope: maximum allowed scope value for the local address
1255 */
Nicolas Dichtelb601fa12013-12-10 15:02:40 +01001256__be32 inet_confirm_addr(struct net *net, struct in_device *in_dev,
Denis V. Lunev9bd85e32008-01-14 23:05:55 -08001257 __be32 dst, __be32 local, int scope)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001258{
Al Viro60cad5d2006-09-26 22:17:09 -07001259 __be32 addr = 0;
Denis V. Lunev9bd85e32008-01-14 23:05:55 -08001260 struct net_device *dev;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001261
Nicolas Dichtelb601fa12013-12-10 15:02:40 +01001262 if (in_dev != NULL)
Denis V. Lunev9bd85e32008-01-14 23:05:55 -08001263 return confirm_addr_indev(in_dev, dst, local, scope);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001264
Linus Torvalds1da177e2005-04-16 15:20:36 -07001265 rcu_read_lock();
Eric Dumazetc6d14c82009-11-04 05:43:23 -08001266 for_each_netdev_rcu(net, dev) {
Eric Dumazet9f9354b2009-11-04 22:05:10 -08001267 in_dev = __in_dev_get_rcu(dev);
1268 if (in_dev) {
Linus Torvalds1da177e2005-04-16 15:20:36 -07001269 addr = confirm_addr_indev(in_dev, dst, local, scope);
1270 if (addr)
1271 break;
1272 }
1273 }
1274 rcu_read_unlock();
Linus Torvalds1da177e2005-04-16 15:20:36 -07001275
1276 return addr;
1277}
Andy Gospodarekeaddcd72012-03-22 16:14:29 +00001278EXPORT_SYMBOL(inet_confirm_addr);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001279
1280/*
1281 * Device notifier
1282 */
1283
1284int register_inetaddr_notifier(struct notifier_block *nb)
1285{
Alan Sterne041c682006-03-27 01:16:30 -08001286 return blocking_notifier_chain_register(&inetaddr_chain, nb);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001287}
Eric Dumazet9f9354b2009-11-04 22:05:10 -08001288EXPORT_SYMBOL(register_inetaddr_notifier);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001289
1290int unregister_inetaddr_notifier(struct notifier_block *nb)
1291{
Alan Sterne041c682006-03-27 01:16:30 -08001292 return blocking_notifier_chain_unregister(&inetaddr_chain, nb);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001293}
Eric Dumazet9f9354b2009-11-04 22:05:10 -08001294EXPORT_SYMBOL(unregister_inetaddr_notifier);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001295
Eric Dumazet9f9354b2009-11-04 22:05:10 -08001296/* Rename ifa_labels for a device name change. Make some effort to preserve
1297 * existing alias numbering and to create unique labels if possible.
Linus Torvalds1da177e2005-04-16 15:20:36 -07001298*/
1299static void inetdev_changename(struct net_device *dev, struct in_device *in_dev)
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +09001300{
Linus Torvalds1da177e2005-04-16 15:20:36 -07001301 struct in_ifaddr *ifa;
1302 int named = 0;
1303
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +09001304 for (ifa = in_dev->ifa_list; ifa; ifa = ifa->ifa_next) {
1305 char old[IFNAMSIZ], *dot;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001306
1307 memcpy(old, ifa->ifa_label, IFNAMSIZ);
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +09001308 memcpy(ifa->ifa_label, dev->name, IFNAMSIZ);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001309 if (named++ == 0)
Thomas Graf573bf472008-06-10 15:40:04 -07001310 goto skip;
Mark McLoughlin44344b22008-01-04 00:56:25 -08001311 dot = strchr(old, ':');
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +09001312 if (dot == NULL) {
1313 sprintf(old, ":%d", named);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001314 dot = old;
1315 }
Eric Dumazet9f9354b2009-11-04 22:05:10 -08001316 if (strlen(dot) + strlen(dev->name) < IFNAMSIZ)
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +09001317 strcat(ifa->ifa_label, dot);
Eric Dumazet9f9354b2009-11-04 22:05:10 -08001318 else
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +09001319 strcpy(ifa->ifa_label + (IFNAMSIZ - strlen(dot) - 1), dot);
Thomas Graf573bf472008-06-10 15:40:04 -07001320skip:
1321 rtmsg_ifa(RTM_NEWADDR, ifa, NULL, 0);
YOSHIFUJI Hideakie905a9e2007-02-09 23:24:47 +09001322 }
1323}
Linus Torvalds1da177e2005-04-16 15:20:36 -07001324
/* An MTU below 68 bytes is treated as too small to run IPv4 on. */
static bool inetdev_valid_mtu(unsigned int mtu)
{
	if (mtu < 68)
		return false;
	return true;
}
1329
Ian Campbelld11327ad2011-02-11 07:44:16 +00001330static void inetdev_send_gratuitous_arp(struct net_device *dev,
1331 struct in_device *in_dev)
1332
1333{
Zoltan Kissb76d0782011-07-24 13:09:30 +00001334 struct in_ifaddr *ifa;
Ian Campbelld11327ad2011-02-11 07:44:16 +00001335
Zoltan Kissb76d0782011-07-24 13:09:30 +00001336 for (ifa = in_dev->ifa_list; ifa;
1337 ifa = ifa->ifa_next) {
1338 arp_send(ARPOP_REQUEST, ETH_P_ARP,
1339 ifa->ifa_local, dev,
1340 ifa->ifa_local, NULL,
1341 dev->dev_addr, NULL);
1342 }
Ian Campbelld11327ad2011-02-11 07:44:16 +00001343}
1344
Linus Torvalds1da177e2005-04-16 15:20:36 -07001345/* Called only under RTNL semaphore */
1346
1347static int inetdev_event(struct notifier_block *this, unsigned long event,
1348 void *ptr)
1349{
Jiri Pirko351638e2013-05-28 01:30:21 +00001350 struct net_device *dev = netdev_notifier_info_to_dev(ptr);
Eric Dumazet748e2d92012-08-22 21:50:59 +00001351 struct in_device *in_dev = __in_dev_get_rtnl(dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001352
1353 ASSERT_RTNL();
1354
1355 if (!in_dev) {
Herbert Xu8030f542007-02-22 01:53:47 +09001356 if (event == NETDEV_REGISTER) {
Linus Torvalds1da177e2005-04-16 15:20:36 -07001357 in_dev = inetdev_init(dev);
WANG Cong20e61da2014-07-25 15:25:08 -07001358 if (IS_ERR(in_dev))
1359 return notifier_from_errno(PTR_ERR(in_dev));
Eric W. Biederman0cc217e2007-09-26 22:10:06 -07001360 if (dev->flags & IFF_LOOPBACK) {
Herbert Xu42f811b2007-06-04 23:34:44 -07001361 IN_DEV_CONF_SET(in_dev, NOXFRM, 1);
1362 IN_DEV_CONF_SET(in_dev, NOPOLICY, 1);
Herbert Xu8030f542007-02-22 01:53:47 +09001363 }
Breno Leitao06770842008-09-02 17:28:58 -07001364 } else if (event == NETDEV_CHANGEMTU) {
1365 /* Re-enabling IP */
1366 if (inetdev_valid_mtu(dev->mtu))
1367 in_dev = inetdev_init(dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001368 }
1369 goto out;
1370 }
1371
1372 switch (event) {
1373 case NETDEV_REGISTER:
Joe Perches91df42b2012-05-15 14:11:54 +00001374 pr_debug("%s: bug\n", __func__);
Stephen Hemmingera9b3cd72011-08-01 16:19:00 +00001375 RCU_INIT_POINTER(dev->ip_ptr, NULL);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001376 break;
1377 case NETDEV_UP:
Breno Leitao06770842008-09-02 17:28:58 -07001378 if (!inetdev_valid_mtu(dev->mtu))
Linus Torvalds1da177e2005-04-16 15:20:36 -07001379 break;
Eric W. Biederman0cc217e2007-09-26 22:10:06 -07001380 if (dev->flags & IFF_LOOPBACK) {
Eric Dumazet9f9354b2009-11-04 22:05:10 -08001381 struct in_ifaddr *ifa = inet_alloc_ifa();
1382
1383 if (ifa) {
David S. Millerfd23c3b2011-02-18 12:42:28 -08001384 INIT_HLIST_NODE(&ifa->hash);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001385 ifa->ifa_local =
1386 ifa->ifa_address = htonl(INADDR_LOOPBACK);
1387 ifa->ifa_prefixlen = 8;
1388 ifa->ifa_mask = inet_make_mask(8);
1389 in_dev_hold(in_dev);
1390 ifa->ifa_dev = in_dev;
1391 ifa->ifa_scope = RT_SCOPE_HOST;
1392 memcpy(ifa->ifa_label, dev->name, IFNAMSIZ);
Jiri Pirko5c766d62013-01-24 09:41:41 +00001393 set_ifa_lifetime(ifa, INFINITY_LIFE_TIME,
1394 INFINITY_LIFE_TIME);
Jiri Pirkodfd15822014-01-07 15:55:45 +01001395 ipv4_devconf_setall(in_dev);
1396 neigh_parms_data_state_setall(in_dev->arp_parms);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001397 inet_insert_ifa(ifa);
1398 }
1399 }
1400 ip_mc_up(in_dev);
Stephen Hemmingereefef1c2009-02-01 01:04:33 -08001401 /* fall through */
1402 case NETDEV_CHANGEADDR:
Ian Campbelld11327ad2011-02-11 07:44:16 +00001403 if (!IN_DEV_ARP_NOTIFY(in_dev))
1404 break;
1405 /* fall through */
1406 case NETDEV_NOTIFY_PEERS:
Stephen Hemmingera21090c2009-10-07 03:18:17 -07001407 /* Send gratuitous ARP to notify of link change */
Ian Campbelld11327ad2011-02-11 07:44:16 +00001408 inetdev_send_gratuitous_arp(dev, in_dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001409 break;
1410 case NETDEV_DOWN:
1411 ip_mc_down(in_dev);
1412 break;
Jiri Pirko93d9b7d2010-03-10 10:28:56 +00001413 case NETDEV_PRE_TYPE_CHANGE:
Moni Shoua75c78502009-09-15 02:37:40 -07001414 ip_mc_unmap(in_dev);
1415 break;
Jiri Pirko93d9b7d2010-03-10 10:28:56 +00001416 case NETDEV_POST_TYPE_CHANGE:
Moni Shoua75c78502009-09-15 02:37:40 -07001417 ip_mc_remap(in_dev);
1418 break;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001419 case NETDEV_CHANGEMTU:
Breno Leitao06770842008-09-02 17:28:58 -07001420 if (inetdev_valid_mtu(dev->mtu))
Linus Torvalds1da177e2005-04-16 15:20:36 -07001421 break;
Breno Leitao06770842008-09-02 17:28:58 -07001422 /* disable IP when MTU is not enough */
Linus Torvalds1da177e2005-04-16 15:20:36 -07001423 case NETDEV_UNREGISTER:
1424 inetdev_destroy(in_dev);
1425 break;
1426 case NETDEV_CHANGENAME:
1427 /* Do not notify about label change, this event is
1428 * not interesting to applications using netlink.
1429 */
1430 inetdev_changename(dev, in_dev);
1431
Pavel Emelyanov51602b22007-12-11 02:17:40 -08001432 devinet_sysctl_unregister(in_dev);
Pavel Emelyanov66f27a52007-12-02 00:55:54 +11001433 devinet_sysctl_register(in_dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001434 break;
1435 }
1436out:
1437 return NOTIFY_DONE;
1438}
1439
1440static struct notifier_block ip_netdev_notifier = {
Jianjun Kong539afed2008-11-03 02:48:48 -08001441 .notifier_call = inetdev_event,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001442};
1443
Eric Dumazet40384992012-08-03 21:06:50 +00001444static size_t inet_nlmsg_size(void)
Thomas Graf339bf982006-11-10 14:10:15 -08001445{
1446 return NLMSG_ALIGN(sizeof(struct ifaddrmsg))
1447 + nla_total_size(4) /* IFA_ADDRESS */
1448 + nla_total_size(4) /* IFA_LOCAL */
1449 + nla_total_size(4) /* IFA_BROADCAST */
Jiri Pirkoad6c8132013-12-08 12:16:10 +01001450 + nla_total_size(IFNAMSIZ) /* IFA_LABEL */
Geert Uytterhoeven63b5f152014-02-05 08:38:25 +01001451 + nla_total_size(4) /* IFA_FLAGS */
1452 + nla_total_size(sizeof(struct ifa_cacheinfo)); /* IFA_CACHEINFO */
Thomas Graf339bf982006-11-10 14:10:15 -08001453}
1454
Jiri Pirko5c766d62013-01-24 09:41:41 +00001455static inline u32 cstamp_delta(unsigned long cstamp)
1456{
1457 return (cstamp - INITIAL_JIFFIES) * 100UL / HZ;
1458}
1459
1460static int put_cacheinfo(struct sk_buff *skb, unsigned long cstamp,
1461 unsigned long tstamp, u32 preferred, u32 valid)
1462{
1463 struct ifa_cacheinfo ci;
1464
1465 ci.cstamp = cstamp_delta(cstamp);
1466 ci.tstamp = cstamp_delta(tstamp);
1467 ci.ifa_prefered = preferred;
1468 ci.ifa_valid = valid;
1469
1470 return nla_put(skb, IFA_CACHEINFO, sizeof(ci), &ci);
1471}
1472
Linus Torvalds1da177e2005-04-16 15:20:36 -07001473static int inet_fill_ifaddr(struct sk_buff *skb, struct in_ifaddr *ifa,
Eric W. Biederman15e47302012-09-07 20:12:54 +00001474 u32 portid, u32 seq, int event, unsigned int flags)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001475{
1476 struct ifaddrmsg *ifm;
1477 struct nlmsghdr *nlh;
Jiri Pirko5c766d62013-01-24 09:41:41 +00001478 u32 preferred, valid;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001479
Eric W. Biederman15e47302012-09-07 20:12:54 +00001480 nlh = nlmsg_put(skb, portid, seq, event, sizeof(*ifm), flags);
Thomas Graf47f68512006-08-04 23:04:36 -07001481 if (nlh == NULL)
Patrick McHardy26932562007-01-31 23:16:40 -08001482 return -EMSGSIZE;
Thomas Graf47f68512006-08-04 23:04:36 -07001483
1484 ifm = nlmsg_data(nlh);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001485 ifm->ifa_family = AF_INET;
1486 ifm->ifa_prefixlen = ifa->ifa_prefixlen;
Jiri Pirko5c766d62013-01-24 09:41:41 +00001487 ifm->ifa_flags = ifa->ifa_flags;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001488 ifm->ifa_scope = ifa->ifa_scope;
1489 ifm->ifa_index = ifa->ifa_dev->dev->ifindex;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001490
Jiri Pirko5c766d62013-01-24 09:41:41 +00001491 if (!(ifm->ifa_flags & IFA_F_PERMANENT)) {
1492 preferred = ifa->ifa_preferred_lft;
1493 valid = ifa->ifa_valid_lft;
1494 if (preferred != INFINITY_LIFE_TIME) {
1495 long tval = (jiffies - ifa->ifa_tstamp) / HZ;
1496
1497 if (preferred > tval)
1498 preferred -= tval;
1499 else
1500 preferred = 0;
1501 if (valid != INFINITY_LIFE_TIME) {
1502 if (valid > tval)
1503 valid -= tval;
1504 else
1505 valid = 0;
1506 }
1507 }
1508 } else {
1509 preferred = INFINITY_LIFE_TIME;
1510 valid = INFINITY_LIFE_TIME;
1511 }
David S. Millerf3756b72012-04-01 20:39:02 -04001512 if ((ifa->ifa_address &&
1513 nla_put_be32(skb, IFA_ADDRESS, ifa->ifa_address)) ||
1514 (ifa->ifa_local &&
1515 nla_put_be32(skb, IFA_LOCAL, ifa->ifa_local)) ||
1516 (ifa->ifa_broadcast &&
1517 nla_put_be32(skb, IFA_BROADCAST, ifa->ifa_broadcast)) ||
1518 (ifa->ifa_label[0] &&
Jiri Pirko5c766d62013-01-24 09:41:41 +00001519 nla_put_string(skb, IFA_LABEL, ifa->ifa_label)) ||
Jiri Pirkoad6c8132013-12-08 12:16:10 +01001520 nla_put_u32(skb, IFA_FLAGS, ifa->ifa_flags) ||
Jiri Pirko5c766d62013-01-24 09:41:41 +00001521 put_cacheinfo(skb, ifa->ifa_cstamp, ifa->ifa_tstamp,
1522 preferred, valid))
David S. Millerf3756b72012-04-01 20:39:02 -04001523 goto nla_put_failure;
Thomas Graf47f68512006-08-04 23:04:36 -07001524
Johannes Berg053c0952015-01-16 22:09:00 +01001525 nlmsg_end(skb, nlh);
1526 return 0;
Thomas Graf47f68512006-08-04 23:04:36 -07001527
1528nla_put_failure:
Patrick McHardy26932562007-01-31 23:16:40 -08001529 nlmsg_cancel(skb, nlh);
1530 return -EMSGSIZE;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001531}
1532
1533static int inet_dump_ifaddr(struct sk_buff *skb, struct netlink_callback *cb)
1534{
YOSHIFUJI Hideaki3b1e0a62008-03-26 02:26:21 +09001535 struct net *net = sock_net(skb->sk);
Eric Dumazeteec4df92009-11-12 07:44:25 +00001536 int h, s_h;
1537 int idx, s_idx;
1538 int ip_idx, s_ip_idx;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001539 struct net_device *dev;
1540 struct in_device *in_dev;
1541 struct in_ifaddr *ifa;
Eric Dumazeteec4df92009-11-12 07:44:25 +00001542 struct hlist_head *head;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001543
Eric Dumazeteec4df92009-11-12 07:44:25 +00001544 s_h = cb->args[0];
1545 s_idx = idx = cb->args[1];
1546 s_ip_idx = ip_idx = cb->args[2];
Linus Torvalds1da177e2005-04-16 15:20:36 -07001547
Eric Dumazeteec4df92009-11-12 07:44:25 +00001548 for (h = s_h; h < NETDEV_HASHENTRIES; h++, s_idx = 0) {
1549 idx = 0;
1550 head = &net->dev_index_head[h];
1551 rcu_read_lock();
Nicolas Dichtel04652772013-03-22 06:28:42 +00001552 cb->seq = atomic_read(&net->ipv4.dev_addr_genid) ^
1553 net->dev_base_seq;
Sasha Levinb67bfe02013-02-27 17:06:00 -08001554 hlist_for_each_entry_rcu(dev, head, index_hlist) {
Eric Dumazeteec4df92009-11-12 07:44:25 +00001555 if (idx < s_idx)
1556 goto cont;
Patrick McHardy4b97efd2010-03-26 20:27:49 -07001557 if (h > s_h || idx > s_idx)
Eric Dumazeteec4df92009-11-12 07:44:25 +00001558 s_ip_idx = 0;
1559 in_dev = __in_dev_get_rcu(dev);
1560 if (!in_dev)
1561 goto cont;
1562
1563 for (ifa = in_dev->ifa_list, ip_idx = 0; ifa;
1564 ifa = ifa->ifa_next, ip_idx++) {
1565 if (ip_idx < s_ip_idx)
1566 continue;
1567 if (inet_fill_ifaddr(skb, ifa,
Eric W. Biederman15e47302012-09-07 20:12:54 +00001568 NETLINK_CB(cb->skb).portid,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001569 cb->nlh->nlmsg_seq,
Johannes Berg053c0952015-01-16 22:09:00 +01001570 RTM_NEWADDR, NLM_F_MULTI) < 0) {
Eric Dumazeteec4df92009-11-12 07:44:25 +00001571 rcu_read_unlock();
1572 goto done;
1573 }
Nicolas Dichtel04652772013-03-22 06:28:42 +00001574 nl_dump_check_consistent(cb, nlmsg_hdr(skb));
Eric Dumazeteec4df92009-11-12 07:44:25 +00001575 }
Pavel Emelianov7562f872007-05-03 15:13:45 -07001576cont:
Eric Dumazeteec4df92009-11-12 07:44:25 +00001577 idx++;
1578 }
1579 rcu_read_unlock();
Linus Torvalds1da177e2005-04-16 15:20:36 -07001580 }
1581
1582done:
Eric Dumazeteec4df92009-11-12 07:44:25 +00001583 cb->args[0] = h;
1584 cb->args[1] = idx;
1585 cb->args[2] = ip_idx;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001586
1587 return skb->len;
1588}
1589
Jianjun Kong539afed2008-11-03 02:48:48 -08001590static void rtmsg_ifa(int event, struct in_ifaddr *ifa, struct nlmsghdr *nlh,
Eric W. Biederman15e47302012-09-07 20:12:54 +00001591 u32 portid)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001592{
Thomas Graf47f68512006-08-04 23:04:36 -07001593 struct sk_buff *skb;
Thomas Grafd6062cb2006-08-15 00:33:59 -07001594 u32 seq = nlh ? nlh->nlmsg_seq : 0;
1595 int err = -ENOBUFS;
Denis V. Lunev4b8aa9a2008-01-31 18:47:40 -08001596 struct net *net;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001597
YOSHIFUJI Hideakic346dca2008-03-25 21:47:49 +09001598 net = dev_net(ifa->ifa_dev->dev);
Thomas Graf339bf982006-11-10 14:10:15 -08001599 skb = nlmsg_new(inet_nlmsg_size(), GFP_KERNEL);
Thomas Graf47f68512006-08-04 23:04:36 -07001600 if (skb == NULL)
Thomas Grafd6062cb2006-08-15 00:33:59 -07001601 goto errout;
1602
Eric W. Biederman15e47302012-09-07 20:12:54 +00001603 err = inet_fill_ifaddr(skb, ifa, portid, seq, event, 0);
Patrick McHardy26932562007-01-31 23:16:40 -08001604 if (err < 0) {
1605 /* -EMSGSIZE implies BUG in inet_nlmsg_size() */
1606 WARN_ON(err == -EMSGSIZE);
1607 kfree_skb(skb);
1608 goto errout;
1609 }
Eric W. Biederman15e47302012-09-07 20:12:54 +00001610 rtnl_notify(skb, net, portid, RTNLGRP_IPV4_IFADDR, nlh, GFP_KERNEL);
Pablo Neira Ayuso1ce85fe2009-02-24 23:18:28 -08001611 return;
Thomas Grafd6062cb2006-08-15 00:33:59 -07001612errout:
1613 if (err < 0)
Denis V. Lunev4b8aa9a2008-01-31 18:47:40 -08001614 rtnl_set_sk_err(net, RTNLGRP_IPV4_IFADDR, err);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001615}
1616
Thomas Graf9f0f7272010-11-16 04:32:48 +00001617static size_t inet_get_link_af_size(const struct net_device *dev)
1618{
Eric Dumazet1fc19af2011-05-09 20:55:03 -07001619 struct in_device *in_dev = rcu_dereference_rtnl(dev->ip_ptr);
Thomas Graf9f0f7272010-11-16 04:32:48 +00001620
1621 if (!in_dev)
1622 return 0;
1623
1624 return nla_total_size(IPV4_DEVCONF_MAX * 4); /* IFLA_INET_CONF */
1625}
1626
1627static int inet_fill_link_af(struct sk_buff *skb, const struct net_device *dev)
1628{
Eric Dumazet1fc19af2011-05-09 20:55:03 -07001629 struct in_device *in_dev = rcu_dereference_rtnl(dev->ip_ptr);
Thomas Graf9f0f7272010-11-16 04:32:48 +00001630 struct nlattr *nla;
1631 int i;
1632
1633 if (!in_dev)
1634 return -ENODATA;
1635
1636 nla = nla_reserve(skb, IFLA_INET_CONF, IPV4_DEVCONF_MAX * 4);
1637 if (nla == NULL)
1638 return -EMSGSIZE;
1639
1640 for (i = 0; i < IPV4_DEVCONF_MAX; i++)
1641 ((u32 *) nla_data(nla))[i] = in_dev->cnf.data[i];
1642
1643 return 0;
1644}
1645
1646static const struct nla_policy inet_af_policy[IFLA_INET_MAX+1] = {
1647 [IFLA_INET_CONF] = { .type = NLA_NESTED },
1648};
1649
Thomas Grafcf7afbf2010-11-22 01:31:54 +00001650static int inet_validate_link_af(const struct net_device *dev,
1651 const struct nlattr *nla)
Thomas Graf9f0f7272010-11-16 04:32:48 +00001652{
Thomas Graf9f0f7272010-11-16 04:32:48 +00001653 struct nlattr *a, *tb[IFLA_INET_MAX+1];
1654 int err, rem;
1655
Eric Dumazetf7fce742010-12-01 06:03:06 +00001656 if (dev && !__in_dev_get_rtnl(dev))
Thomas Grafcf7afbf2010-11-22 01:31:54 +00001657 return -EAFNOSUPPORT;
Thomas Graf9f0f7272010-11-16 04:32:48 +00001658
1659 err = nla_parse_nested(tb, IFLA_INET_MAX, nla, inet_af_policy);
1660 if (err < 0)
1661 return err;
1662
1663 if (tb[IFLA_INET_CONF]) {
1664 nla_for_each_nested(a, tb[IFLA_INET_CONF], rem) {
1665 int cfgid = nla_type(a);
1666
1667 if (nla_len(a) < 4)
1668 return -EINVAL;
1669
1670 if (cfgid <= 0 || cfgid > IPV4_DEVCONF_MAX)
1671 return -EINVAL;
1672 }
1673 }
1674
Thomas Grafcf7afbf2010-11-22 01:31:54 +00001675 return 0;
1676}
1677
1678static int inet_set_link_af(struct net_device *dev, const struct nlattr *nla)
1679{
Eric Dumazetf7fce742010-12-01 06:03:06 +00001680 struct in_device *in_dev = __in_dev_get_rtnl(dev);
Thomas Grafcf7afbf2010-11-22 01:31:54 +00001681 struct nlattr *a, *tb[IFLA_INET_MAX+1];
1682 int rem;
1683
1684 if (!in_dev)
1685 return -EAFNOSUPPORT;
1686
1687 if (nla_parse_nested(tb, IFLA_INET_MAX, nla, NULL) < 0)
1688 BUG();
1689
Thomas Graf9f0f7272010-11-16 04:32:48 +00001690 if (tb[IFLA_INET_CONF]) {
1691 nla_for_each_nested(a, tb[IFLA_INET_CONF], rem)
1692 ipv4_devconf_set(in_dev, nla_type(a), nla_get_u32(a));
1693 }
1694
1695 return 0;
1696}
1697
Nicolas Dichteledc9e742012-10-25 22:28:52 +00001698static int inet_netconf_msgsize_devconf(int type)
1699{
1700 int size = NLMSG_ALIGN(sizeof(struct netconfmsg))
1701 + nla_total_size(4); /* NETCONFA_IFINDEX */
1702
Nicolas Dichtel9e551112012-10-25 22:28:53 +00001703 /* type -1 is used for ALL */
1704 if (type == -1 || type == NETCONFA_FORWARDING)
Nicolas Dichteledc9e742012-10-25 22:28:52 +00001705 size += nla_total_size(4);
Nicolas Dichtelcc535df2012-10-29 04:53:27 +00001706 if (type == -1 || type == NETCONFA_RP_FILTER)
1707 size += nla_total_size(4);
Nicolas Dichteld67b8c62012-12-04 01:13:35 +00001708 if (type == -1 || type == NETCONFA_MC_FORWARDING)
1709 size += nla_total_size(4);
stephen hemminger09aea5d2013-12-17 22:35:52 -08001710 if (type == -1 || type == NETCONFA_PROXY_NEIGH)
stephen hemmingerf085ff12013-12-12 13:06:50 -08001711 size += nla_total_size(4);
Nicolas Dichteledc9e742012-10-25 22:28:52 +00001712
1713 return size;
1714}
1715
1716static int inet_netconf_fill_devconf(struct sk_buff *skb, int ifindex,
1717 struct ipv4_devconf *devconf, u32 portid,
1718 u32 seq, int event, unsigned int flags,
1719 int type)
1720{
1721 struct nlmsghdr *nlh;
1722 struct netconfmsg *ncm;
1723
1724 nlh = nlmsg_put(skb, portid, seq, event, sizeof(struct netconfmsg),
1725 flags);
1726 if (nlh == NULL)
1727 return -EMSGSIZE;
1728
1729 ncm = nlmsg_data(nlh);
1730 ncm->ncm_family = AF_INET;
1731
1732 if (nla_put_s32(skb, NETCONFA_IFINDEX, ifindex) < 0)
1733 goto nla_put_failure;
1734
Nicolas Dichtel9e551112012-10-25 22:28:53 +00001735 /* type -1 is used for ALL */
1736 if ((type == -1 || type == NETCONFA_FORWARDING) &&
Nicolas Dichteledc9e742012-10-25 22:28:52 +00001737 nla_put_s32(skb, NETCONFA_FORWARDING,
1738 IPV4_DEVCONF(*devconf, FORWARDING)) < 0)
1739 goto nla_put_failure;
Nicolas Dichtelcc535df2012-10-29 04:53:27 +00001740 if ((type == -1 || type == NETCONFA_RP_FILTER) &&
1741 nla_put_s32(skb, NETCONFA_RP_FILTER,
1742 IPV4_DEVCONF(*devconf, RP_FILTER)) < 0)
1743 goto nla_put_failure;
Nicolas Dichteld67b8c62012-12-04 01:13:35 +00001744 if ((type == -1 || type == NETCONFA_MC_FORWARDING) &&
1745 nla_put_s32(skb, NETCONFA_MC_FORWARDING,
1746 IPV4_DEVCONF(*devconf, MC_FORWARDING)) < 0)
1747 goto nla_put_failure;
stephen hemminger09aea5d2013-12-17 22:35:52 -08001748 if ((type == -1 || type == NETCONFA_PROXY_NEIGH) &&
1749 nla_put_s32(skb, NETCONFA_PROXY_NEIGH,
stephen hemmingerf085ff12013-12-12 13:06:50 -08001750 IPV4_DEVCONF(*devconf, PROXY_ARP)) < 0)
1751 goto nla_put_failure;
Nicolas Dichteledc9e742012-10-25 22:28:52 +00001752
Johannes Berg053c0952015-01-16 22:09:00 +01001753 nlmsg_end(skb, nlh);
1754 return 0;
Nicolas Dichteledc9e742012-10-25 22:28:52 +00001755
1756nla_put_failure:
1757 nlmsg_cancel(skb, nlh);
1758 return -EMSGSIZE;
1759}
1760
Nicolas Dichteld67b8c62012-12-04 01:13:35 +00001761void inet_netconf_notify_devconf(struct net *net, int type, int ifindex,
1762 struct ipv4_devconf *devconf)
Nicolas Dichteledc9e742012-10-25 22:28:52 +00001763{
1764 struct sk_buff *skb;
1765 int err = -ENOBUFS;
1766
1767 skb = nlmsg_new(inet_netconf_msgsize_devconf(type), GFP_ATOMIC);
1768 if (skb == NULL)
1769 goto errout;
1770
1771 err = inet_netconf_fill_devconf(skb, ifindex, devconf, 0, 0,
1772 RTM_NEWNETCONF, 0, type);
1773 if (err < 0) {
1774 /* -EMSGSIZE implies BUG in inet_netconf_msgsize_devconf() */
1775 WARN_ON(err == -EMSGSIZE);
1776 kfree_skb(skb);
1777 goto errout;
1778 }
1779 rtnl_notify(skb, net, 0, RTNLGRP_IPV4_NETCONF, NULL, GFP_ATOMIC);
1780 return;
1781errout:
1782 if (err < 0)
1783 rtnl_set_sk_err(net, RTNLGRP_IPV4_NETCONF, err);
1784}
1785
Nicolas Dichtel9e551112012-10-25 22:28:53 +00001786static const struct nla_policy devconf_ipv4_policy[NETCONFA_MAX+1] = {
1787 [NETCONFA_IFINDEX] = { .len = sizeof(int) },
1788 [NETCONFA_FORWARDING] = { .len = sizeof(int) },
Nicolas Dichtelcc535df2012-10-29 04:53:27 +00001789 [NETCONFA_RP_FILTER] = { .len = sizeof(int) },
stephen hemminger09aea5d2013-12-17 22:35:52 -08001790 [NETCONFA_PROXY_NEIGH] = { .len = sizeof(int) },
Nicolas Dichtel9e551112012-10-25 22:28:53 +00001791};
1792
1793static int inet_netconf_get_devconf(struct sk_buff *in_skb,
Thomas Graf661d2962013-03-21 07:45:29 +00001794 struct nlmsghdr *nlh)
Nicolas Dichtel9e551112012-10-25 22:28:53 +00001795{
1796 struct net *net = sock_net(in_skb->sk);
1797 struct nlattr *tb[NETCONFA_MAX+1];
1798 struct netconfmsg *ncm;
1799 struct sk_buff *skb;
1800 struct ipv4_devconf *devconf;
1801 struct in_device *in_dev;
1802 struct net_device *dev;
1803 int ifindex;
1804 int err;
1805
1806 err = nlmsg_parse(nlh, sizeof(*ncm), tb, NETCONFA_MAX,
1807 devconf_ipv4_policy);
1808 if (err < 0)
1809 goto errout;
1810
1811 err = EINVAL;
1812 if (!tb[NETCONFA_IFINDEX])
1813 goto errout;
1814
1815 ifindex = nla_get_s32(tb[NETCONFA_IFINDEX]);
1816 switch (ifindex) {
1817 case NETCONFA_IFINDEX_ALL:
1818 devconf = net->ipv4.devconf_all;
1819 break;
1820 case NETCONFA_IFINDEX_DEFAULT:
1821 devconf = net->ipv4.devconf_dflt;
1822 break;
1823 default:
1824 dev = __dev_get_by_index(net, ifindex);
1825 if (dev == NULL)
1826 goto errout;
1827 in_dev = __in_dev_get_rtnl(dev);
1828 if (in_dev == NULL)
1829 goto errout;
1830 devconf = &in_dev->cnf;
1831 break;
1832 }
1833
1834 err = -ENOBUFS;
1835 skb = nlmsg_new(inet_netconf_msgsize_devconf(-1), GFP_ATOMIC);
1836 if (skb == NULL)
1837 goto errout;
1838
1839 err = inet_netconf_fill_devconf(skb, ifindex, devconf,
1840 NETLINK_CB(in_skb).portid,
1841 nlh->nlmsg_seq, RTM_NEWNETCONF, 0,
1842 -1);
1843 if (err < 0) {
1844 /* -EMSGSIZE implies BUG in inet_netconf_msgsize_devconf() */
1845 WARN_ON(err == -EMSGSIZE);
1846 kfree_skb(skb);
1847 goto errout;
1848 }
1849 err = rtnl_unicast(skb, net, NETLINK_CB(in_skb).portid);
1850errout:
1851 return err;
1852}
1853
Nicolas Dichtel7a674202013-03-05 23:42:06 +00001854static int inet_netconf_dump_devconf(struct sk_buff *skb,
1855 struct netlink_callback *cb)
1856{
1857 struct net *net = sock_net(skb->sk);
1858 int h, s_h;
1859 int idx, s_idx;
1860 struct net_device *dev;
1861 struct in_device *in_dev;
1862 struct hlist_head *head;
1863
1864 s_h = cb->args[0];
1865 s_idx = idx = cb->args[1];
1866
1867 for (h = s_h; h < NETDEV_HASHENTRIES; h++, s_idx = 0) {
1868 idx = 0;
1869 head = &net->dev_index_head[h];
1870 rcu_read_lock();
Nicolas Dichtel04652772013-03-22 06:28:42 +00001871 cb->seq = atomic_read(&net->ipv4.dev_addr_genid) ^
1872 net->dev_base_seq;
Nicolas Dichtel7a674202013-03-05 23:42:06 +00001873 hlist_for_each_entry_rcu(dev, head, index_hlist) {
1874 if (idx < s_idx)
1875 goto cont;
1876 in_dev = __in_dev_get_rcu(dev);
1877 if (!in_dev)
1878 goto cont;
1879
1880 if (inet_netconf_fill_devconf(skb, dev->ifindex,
1881 &in_dev->cnf,
1882 NETLINK_CB(cb->skb).portid,
1883 cb->nlh->nlmsg_seq,
1884 RTM_NEWNETCONF,
1885 NLM_F_MULTI,
David S. Miller7b46a642015-01-18 23:36:08 -05001886 -1) < 0) {
Nicolas Dichtel7a674202013-03-05 23:42:06 +00001887 rcu_read_unlock();
1888 goto done;
1889 }
Nicolas Dichtel04652772013-03-22 06:28:42 +00001890 nl_dump_check_consistent(cb, nlmsg_hdr(skb));
Nicolas Dichtel7a674202013-03-05 23:42:06 +00001891cont:
1892 idx++;
1893 }
1894 rcu_read_unlock();
1895 }
1896 if (h == NETDEV_HASHENTRIES) {
1897 if (inet_netconf_fill_devconf(skb, NETCONFA_IFINDEX_ALL,
1898 net->ipv4.devconf_all,
1899 NETLINK_CB(cb->skb).portid,
1900 cb->nlh->nlmsg_seq,
1901 RTM_NEWNETCONF, NLM_F_MULTI,
David S. Miller7b46a642015-01-18 23:36:08 -05001902 -1) < 0)
Nicolas Dichtel7a674202013-03-05 23:42:06 +00001903 goto done;
1904 else
1905 h++;
1906 }
1907 if (h == NETDEV_HASHENTRIES + 1) {
1908 if (inet_netconf_fill_devconf(skb, NETCONFA_IFINDEX_DEFAULT,
1909 net->ipv4.devconf_dflt,
1910 NETLINK_CB(cb->skb).portid,
1911 cb->nlh->nlmsg_seq,
1912 RTM_NEWNETCONF, NLM_F_MULTI,
David S. Miller7b46a642015-01-18 23:36:08 -05001913 -1) < 0)
Nicolas Dichtel7a674202013-03-05 23:42:06 +00001914 goto done;
1915 else
1916 h++;
1917 }
1918done:
1919 cb->args[0] = h;
1920 cb->args[1] = idx;
1921
1922 return skb->len;
1923}
1924
Linus Torvalds1da177e2005-04-16 15:20:36 -07001925#ifdef CONFIG_SYSCTL
1926
Pavel Emelyanovc0ce9fb2007-12-16 13:31:14 -08001927static void devinet_copy_dflt_conf(struct net *net, int i)
Herbert Xu31be3082007-06-04 23:35:37 -07001928{
1929 struct net_device *dev;
1930
Eric Dumazetc6d14c82009-11-04 05:43:23 -08001931 rcu_read_lock();
1932 for_each_netdev_rcu(net, dev) {
Herbert Xu31be3082007-06-04 23:35:37 -07001933 struct in_device *in_dev;
Eric Dumazetc6d14c82009-11-04 05:43:23 -08001934
Herbert Xu31be3082007-06-04 23:35:37 -07001935 in_dev = __in_dev_get_rcu(dev);
1936 if (in_dev && !test_bit(i, in_dev->cnf.state))
Pavel Emelyanov9355bbd2007-12-16 13:32:16 -08001937 in_dev->cnf.data[i] = net->ipv4.devconf_dflt->data[i];
Herbert Xu31be3082007-06-04 23:35:37 -07001938 }
Eric Dumazetc6d14c82009-11-04 05:43:23 -08001939 rcu_read_unlock();
Herbert Xu31be3082007-06-04 23:35:37 -07001940}
1941
Eric Dumazetc6d14c82009-11-04 05:43:23 -08001942/* called with RTNL locked */
Pavel Emelyanovc0ce9fb2007-12-16 13:31:14 -08001943static void inet_forward_change(struct net *net)
Pavel Emelyanov68dd2992007-12-05 01:44:58 -08001944{
1945 struct net_device *dev;
Pavel Emelyanov586f1212007-12-16 13:32:48 -08001946 int on = IPV4_DEVCONF_ALL(net, FORWARDING);
Pavel Emelyanov68dd2992007-12-05 01:44:58 -08001947
Pavel Emelyanov586f1212007-12-16 13:32:48 -08001948 IPV4_DEVCONF_ALL(net, ACCEPT_REDIRECTS) = !on;
Pavel Emelyanov9355bbd2007-12-16 13:32:16 -08001949 IPV4_DEVCONF_DFLT(net, FORWARDING) = on;
Nicolas Dichteledc9e742012-10-25 22:28:52 +00001950 inet_netconf_notify_devconf(net, NETCONFA_FORWARDING,
1951 NETCONFA_IFINDEX_ALL,
1952 net->ipv4.devconf_all);
1953 inet_netconf_notify_devconf(net, NETCONFA_FORWARDING,
1954 NETCONFA_IFINDEX_DEFAULT,
1955 net->ipv4.devconf_dflt);
Pavel Emelyanov68dd2992007-12-05 01:44:58 -08001956
Pavel Emelyanovc0ce9fb2007-12-16 13:31:14 -08001957 for_each_netdev(net, dev) {
Pavel Emelyanov68dd2992007-12-05 01:44:58 -08001958 struct in_device *in_dev;
Ben Hutchings0187bdf2008-06-19 16:15:47 -07001959 if (on)
1960 dev_disable_lro(dev);
Pavel Emelyanov68dd2992007-12-05 01:44:58 -08001961 rcu_read_lock();
1962 in_dev = __in_dev_get_rcu(dev);
Nicolas Dichteledc9e742012-10-25 22:28:52 +00001963 if (in_dev) {
Pavel Emelyanov68dd2992007-12-05 01:44:58 -08001964 IN_DEV_CONF_SET(in_dev, FORWARDING, on);
Nicolas Dichteledc9e742012-10-25 22:28:52 +00001965 inet_netconf_notify_devconf(net, NETCONFA_FORWARDING,
1966 dev->ifindex, &in_dev->cnf);
1967 }
Pavel Emelyanov68dd2992007-12-05 01:44:58 -08001968 rcu_read_unlock();
1969 }
Pavel Emelyanov68dd2992007-12-05 01:44:58 -08001970}
1971
stephen hemmingerf085ff12013-12-12 13:06:50 -08001972static int devinet_conf_ifindex(struct net *net, struct ipv4_devconf *cnf)
1973{
1974 if (cnf == net->ipv4.devconf_dflt)
1975 return NETCONFA_IFINDEX_DEFAULT;
1976 else if (cnf == net->ipv4.devconf_all)
1977 return NETCONFA_IFINDEX_ALL;
1978 else {
1979 struct in_device *idev
1980 = container_of(cnf, struct in_device, cnf);
1981 return idev->dev->ifindex;
1982 }
1983}
1984
Joe Perchesfe2c6332013-06-11 23:04:25 -07001985static int devinet_conf_proc(struct ctl_table *ctl, int write,
Alexey Dobriyan8d65af72009-09-23 15:57:19 -07001986 void __user *buffer,
Herbert Xu31be3082007-06-04 23:35:37 -07001987 size_t *lenp, loff_t *ppos)
1988{
Peter Pan(潘卫平)d01ff0a2011-12-01 15:47:06 +00001989 int old_value = *(int *)ctl->data;
Alexey Dobriyan8d65af72009-09-23 15:57:19 -07001990 int ret = proc_dointvec(ctl, write, buffer, lenp, ppos);
Peter Pan(潘卫平)d01ff0a2011-12-01 15:47:06 +00001991 int new_value = *(int *)ctl->data;
Herbert Xu31be3082007-06-04 23:35:37 -07001992
1993 if (write) {
1994 struct ipv4_devconf *cnf = ctl->extra1;
Pavel Emelyanovc0ce9fb2007-12-16 13:31:14 -08001995 struct net *net = ctl->extra2;
Herbert Xu31be3082007-06-04 23:35:37 -07001996 int i = (int *)ctl->data - cnf->data;
stephen hemmingerf085ff12013-12-12 13:06:50 -08001997 int ifindex;
Herbert Xu31be3082007-06-04 23:35:37 -07001998
1999 set_bit(i, cnf->state);
2000
Pavel Emelyanov9355bbd2007-12-16 13:32:16 -08002001 if (cnf == net->ipv4.devconf_dflt)
Pavel Emelyanovc0ce9fb2007-12-16 13:31:14 -08002002 devinet_copy_dflt_conf(net, i);
Thomas Grafd0daebc32012-06-12 00:44:01 +00002003 if (i == IPV4_DEVCONF_ACCEPT_LOCAL - 1 ||
2004 i == IPV4_DEVCONF_ROUTE_LOCALNET - 1)
Peter Pan(潘卫平)d01ff0a2011-12-01 15:47:06 +00002005 if ((new_value == 0) && (old_value != 0))
Nicolas Dichtel4ccfe6d2012-09-07 00:45:29 +00002006 rt_cache_flush(net);
stephen hemmingerf085ff12013-12-12 13:06:50 -08002007
Nicolas Dichtelcc535df2012-10-29 04:53:27 +00002008 if (i == IPV4_DEVCONF_RP_FILTER - 1 &&
2009 new_value != old_value) {
stephen hemmingerf085ff12013-12-12 13:06:50 -08002010 ifindex = devinet_conf_ifindex(net, cnf);
Nicolas Dichtelcc535df2012-10-29 04:53:27 +00002011 inet_netconf_notify_devconf(net, NETCONFA_RP_FILTER,
2012 ifindex, cnf);
2013 }
stephen hemmingerf085ff12013-12-12 13:06:50 -08002014 if (i == IPV4_DEVCONF_PROXY_ARP - 1 &&
2015 new_value != old_value) {
2016 ifindex = devinet_conf_ifindex(net, cnf);
stephen hemminger09aea5d2013-12-17 22:35:52 -08002017 inet_netconf_notify_devconf(net, NETCONFA_PROXY_NEIGH,
stephen hemmingerf085ff12013-12-12 13:06:50 -08002018 ifindex, cnf);
2019 }
Herbert Xu31be3082007-06-04 23:35:37 -07002020 }
2021
2022 return ret;
2023}
2024
Joe Perchesfe2c6332013-06-11 23:04:25 -07002025static int devinet_sysctl_forward(struct ctl_table *ctl, int write,
Alexey Dobriyan8d65af72009-09-23 15:57:19 -07002026 void __user *buffer,
Linus Torvalds1da177e2005-04-16 15:20:36 -07002027 size_t *lenp, loff_t *ppos)
2028{
2029 int *valp = ctl->data;
2030 int val = *valp;
Eric W. Biederman88af1822010-02-19 13:22:59 +00002031 loff_t pos = *ppos;
Alexey Dobriyan8d65af72009-09-23 15:57:19 -07002032 int ret = proc_dointvec(ctl, write, buffer, lenp, ppos);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002033
2034 if (write && *valp != val) {
Pavel Emelyanovc0ce9fb2007-12-16 13:31:14 -08002035 struct net *net = ctl->extra2;
2036
Ben Hutchings0187bdf2008-06-19 16:15:47 -07002037 if (valp != &IPV4_DEVCONF_DFLT(net, FORWARDING)) {
Eric W. Biederman88af1822010-02-19 13:22:59 +00002038 if (!rtnl_trylock()) {
2039 /* Restore the original values before restarting */
2040 *valp = val;
2041 *ppos = pos;
Eric W. Biederman9b8adb52009-05-13 16:59:21 +00002042 return restart_syscall();
Eric W. Biederman88af1822010-02-19 13:22:59 +00002043 }
Ben Hutchings0187bdf2008-06-19 16:15:47 -07002044 if (valp == &IPV4_DEVCONF_ALL(net, FORWARDING)) {
2045 inet_forward_change(net);
Nicolas Dichteledc9e742012-10-25 22:28:52 +00002046 } else {
Ben Hutchings0187bdf2008-06-19 16:15:47 -07002047 struct ipv4_devconf *cnf = ctl->extra1;
2048 struct in_device *idev =
2049 container_of(cnf, struct in_device, cnf);
Nicolas Dichteledc9e742012-10-25 22:28:52 +00002050 if (*valp)
2051 dev_disable_lro(idev->dev);
2052 inet_netconf_notify_devconf(net,
2053 NETCONFA_FORWARDING,
2054 idev->dev->ifindex,
2055 cnf);
Ben Hutchings0187bdf2008-06-19 16:15:47 -07002056 }
2057 rtnl_unlock();
Nicolas Dichtel4ccfe6d2012-09-07 00:45:29 +00002058 rt_cache_flush(net);
Nicolas Dichteledc9e742012-10-25 22:28:52 +00002059 } else
2060 inet_netconf_notify_devconf(net, NETCONFA_FORWARDING,
2061 NETCONFA_IFINDEX_DEFAULT,
2062 net->ipv4.devconf_dflt);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002063 }
2064
2065 return ret;
2066}
2067
Joe Perchesfe2c6332013-06-11 23:04:25 -07002068static int ipv4_doint_and_flush(struct ctl_table *ctl, int write,
David S. Miller323e1262010-12-12 21:55:08 -08002069 void __user *buffer,
2070 size_t *lenp, loff_t *ppos)
Linus Torvalds1da177e2005-04-16 15:20:36 -07002071{
2072 int *valp = ctl->data;
2073 int val = *valp;
Alexey Dobriyan8d65af72009-09-23 15:57:19 -07002074 int ret = proc_dointvec(ctl, write, buffer, lenp, ppos);
Denis V. Lunev76e6ebf2008-07-05 19:00:44 -07002075 struct net *net = ctl->extra2;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002076
2077 if (write && *valp != val)
Nicolas Dichtel4ccfe6d2012-09-07 00:45:29 +00002078 rt_cache_flush(net);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002079
2080 return ret;
2081}
2082
/*
 * Build one ctl_table entry for devconf attribute IPV4_DEVCONF_<attr>.
 * The entry points into the global ipv4_devconf template; devconf indexes
 * are 1-based, hence the "- 1" when addressing data[].
 */
#define DEVINET_SYSCTL_ENTRY(attr, name, mval, proc) \
	{ \
		.procname	= name, \
		.data		= &ipv4_devconf.data[IPV4_DEVCONF_ ## attr - 1], \
		.maxlen		= sizeof(int), \
		.mode		= mval, \
		.proc_handler	= proc, \
		.extra1		= &ipv4_devconf, \
	}

/* Read-write entry handled by devinet_conf_proc(). */
#define DEVINET_SYSCTL_RW_ENTRY(attr, name) \
	DEVINET_SYSCTL_ENTRY(attr, name, 0644, devinet_conf_proc)

/* Read-only entry handled by devinet_conf_proc(). */
#define DEVINET_SYSCTL_RO_ENTRY(attr, name) \
	DEVINET_SYSCTL_ENTRY(attr, name, 0444, devinet_conf_proc)

/* Read-write entry with a caller-supplied handler. */
#define DEVINET_SYSCTL_COMPLEX_ENTRY(attr, name, proc) \
	DEVINET_SYSCTL_ENTRY(attr, name, 0644, proc)

/* Read-write entry handled by ipv4_doint_and_flush(). */
#define DEVINET_SYSCTL_FLUSHING_ENTRY(attr, name) \
	DEVINET_SYSCTL_COMPLEX_ENTRY(attr, name, ipv4_doint_and_flush)
Herbert Xu42f811b2007-06-04 23:34:44 -07002105
Linus Torvalds1da177e2005-04-16 15:20:36 -07002106static struct devinet_sysctl_table {
2107 struct ctl_table_header *sysctl_header;
Eric W. Biederman02291682010-02-14 03:25:51 +00002108 struct ctl_table devinet_vars[__IPV4_DEVCONF_MAX];
Linus Torvalds1da177e2005-04-16 15:20:36 -07002109} devinet_sysctl = {
2110 .devinet_vars = {
Herbert Xu42f811b2007-06-04 23:34:44 -07002111 DEVINET_SYSCTL_COMPLEX_ENTRY(FORWARDING, "forwarding",
Eric W. Biedermanf8572d82009-11-05 13:32:03 -08002112 devinet_sysctl_forward),
Herbert Xu42f811b2007-06-04 23:34:44 -07002113 DEVINET_SYSCTL_RO_ENTRY(MC_FORWARDING, "mc_forwarding"),
2114
2115 DEVINET_SYSCTL_RW_ENTRY(ACCEPT_REDIRECTS, "accept_redirects"),
2116 DEVINET_SYSCTL_RW_ENTRY(SECURE_REDIRECTS, "secure_redirects"),
2117 DEVINET_SYSCTL_RW_ENTRY(SHARED_MEDIA, "shared_media"),
2118 DEVINET_SYSCTL_RW_ENTRY(RP_FILTER, "rp_filter"),
2119 DEVINET_SYSCTL_RW_ENTRY(SEND_REDIRECTS, "send_redirects"),
2120 DEVINET_SYSCTL_RW_ENTRY(ACCEPT_SOURCE_ROUTE,
2121 "accept_source_route"),
Patrick McHardy8153a102009-12-03 01:25:58 +00002122 DEVINET_SYSCTL_RW_ENTRY(ACCEPT_LOCAL, "accept_local"),
Jamal Hadi Salim28f6aee2009-12-25 17:30:22 -08002123 DEVINET_SYSCTL_RW_ENTRY(SRC_VMARK, "src_valid_mark"),
Herbert Xu42f811b2007-06-04 23:34:44 -07002124 DEVINET_SYSCTL_RW_ENTRY(PROXY_ARP, "proxy_arp"),
2125 DEVINET_SYSCTL_RW_ENTRY(MEDIUM_ID, "medium_id"),
2126 DEVINET_SYSCTL_RW_ENTRY(BOOTP_RELAY, "bootp_relay"),
2127 DEVINET_SYSCTL_RW_ENTRY(LOG_MARTIANS, "log_martians"),
2128 DEVINET_SYSCTL_RW_ENTRY(TAG, "tag"),
2129 DEVINET_SYSCTL_RW_ENTRY(ARPFILTER, "arp_filter"),
2130 DEVINET_SYSCTL_RW_ENTRY(ARP_ANNOUNCE, "arp_announce"),
2131 DEVINET_SYSCTL_RW_ENTRY(ARP_IGNORE, "arp_ignore"),
2132 DEVINET_SYSCTL_RW_ENTRY(ARP_ACCEPT, "arp_accept"),
Stephen Hemmingereefef1c2009-02-01 01:04:33 -08002133 DEVINET_SYSCTL_RW_ENTRY(ARP_NOTIFY, "arp_notify"),
Jesper Dangaard Brouer65324142010-01-05 05:50:47 +00002134 DEVINET_SYSCTL_RW_ENTRY(PROXY_ARP_PVLAN, "proxy_arp_pvlan"),
William Manley5c6fe012013-08-06 19:03:14 +01002135 DEVINET_SYSCTL_RW_ENTRY(FORCE_IGMP_VERSION,
2136 "force_igmp_version"),
William Manley26900482013-08-06 19:03:15 +01002137 DEVINET_SYSCTL_RW_ENTRY(IGMPV2_UNSOLICITED_REPORT_INTERVAL,
2138 "igmpv2_unsolicited_report_interval"),
2139 DEVINET_SYSCTL_RW_ENTRY(IGMPV3_UNSOLICITED_REPORT_INTERVAL,
2140 "igmpv3_unsolicited_report_interval"),
Herbert Xu42f811b2007-06-04 23:34:44 -07002141
2142 DEVINET_SYSCTL_FLUSHING_ENTRY(NOXFRM, "disable_xfrm"),
2143 DEVINET_SYSCTL_FLUSHING_ENTRY(NOPOLICY, "disable_policy"),
Herbert Xu42f811b2007-06-04 23:34:44 -07002144 DEVINET_SYSCTL_FLUSHING_ENTRY(PROMOTE_SECONDARIES,
2145 "promote_secondaries"),
Thomas Grafd0daebc32012-06-12 00:44:01 +00002146 DEVINET_SYSCTL_FLUSHING_ENTRY(ROUTE_LOCALNET,
2147 "route_localnet"),
Linus Torvalds1da177e2005-04-16 15:20:36 -07002148 },
Linus Torvalds1da177e2005-04-16 15:20:36 -07002149};
2150
Pavel Emelyanovea40b322007-12-16 13:30:07 -08002151static int __devinet_sysctl_register(struct net *net, char *dev_name,
Eric W. Biedermanf8572d82009-11-05 13:32:03 -08002152 struct ipv4_devconf *p)
Linus Torvalds1da177e2005-04-16 15:20:36 -07002153{
2154 int i;
Pavel Emelyanov9fa89642007-12-02 00:17:46 +11002155 struct devinet_sysctl_table *t;
Eric W. Biederman8607ddb2012-04-19 13:42:09 +00002156 char path[sizeof("net/ipv4/conf/") + IFNAMSIZ];
Pavel Emelyanovbfada692007-12-02 00:57:08 +11002157
Pavel Emelyanov9fa89642007-12-02 00:17:46 +11002158 t = kmemdup(&devinet_sysctl, sizeof(*t), GFP_KERNEL);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002159 if (!t)
Pavel Emelyanov9fa89642007-12-02 00:17:46 +11002160 goto out;
2161
Linus Torvalds1da177e2005-04-16 15:20:36 -07002162 for (i = 0; i < ARRAY_SIZE(t->devinet_vars) - 1; i++) {
2163 t->devinet_vars[i].data += (char *)p - (char *)&ipv4_devconf;
Herbert Xu31be3082007-06-04 23:35:37 -07002164 t->devinet_vars[i].extra1 = p;
Pavel Emelyanovc0ce9fb2007-12-16 13:31:14 -08002165 t->devinet_vars[i].extra2 = net;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002166 }
2167
Eric W. Biederman8607ddb2012-04-19 13:42:09 +00002168 snprintf(path, sizeof(path), "net/ipv4/conf/%s", dev_name);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002169
Eric W. Biederman8607ddb2012-04-19 13:42:09 +00002170 t->sysctl_header = register_net_sysctl(net, path, t->devinet_vars);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002171 if (!t->sysctl_header)
Eric W. Biederman8607ddb2012-04-19 13:42:09 +00002172 goto free;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002173
2174 p->sysctl = t;
Pavel Emelyanovea40b322007-12-16 13:30:07 -08002175 return 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002176
Pavel Emelyanov9fa89642007-12-02 00:17:46 +11002177free:
Linus Torvalds1da177e2005-04-16 15:20:36 -07002178 kfree(t);
Pavel Emelyanov9fa89642007-12-02 00:17:46 +11002179out:
Pavel Emelyanovea40b322007-12-16 13:30:07 -08002180 return -ENOBUFS;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002181}
2182
Pavel Emelyanov51602b22007-12-11 02:17:40 -08002183static void __devinet_sysctl_unregister(struct ipv4_devconf *cnf)
2184{
2185 struct devinet_sysctl_table *t = cnf->sysctl;
2186
2187 if (t == NULL)
2188 return;
2189
2190 cnf->sysctl = NULL;
Lucian Adrian Grijincuff538812011-05-01 01:44:01 +00002191 unregister_net_sysctl_table(t->sysctl_header);
Pavel Emelyanov51602b22007-12-11 02:17:40 -08002192 kfree(t);
2193}
2194
WANG Cong20e61da2014-07-25 15:25:08 -07002195static int devinet_sysctl_register(struct in_device *idev)
Pavel Emelyanov66f27a52007-12-02 00:55:54 +11002196{
WANG Cong20e61da2014-07-25 15:25:08 -07002197 int err;
2198
2199 if (!sysctl_dev_name_is_allowed(idev->dev->name))
2200 return -EINVAL;
2201
2202 err = neigh_sysctl_register(idev->dev, idev->arp_parms, NULL);
2203 if (err)
2204 return err;
2205 err = __devinet_sysctl_register(dev_net(idev->dev), idev->dev->name,
Eric W. Biedermanf8572d82009-11-05 13:32:03 -08002206 &idev->cnf);
WANG Cong20e61da2014-07-25 15:25:08 -07002207 if (err)
2208 neigh_sysctl_unregister(idev->arp_parms);
2209 return err;
Pavel Emelyanov66f27a52007-12-02 00:55:54 +11002210}
2211
Pavel Emelyanov51602b22007-12-11 02:17:40 -08002212static void devinet_sysctl_unregister(struct in_device *idev)
Linus Torvalds1da177e2005-04-16 15:20:36 -07002213{
Pavel Emelyanov51602b22007-12-11 02:17:40 -08002214 __devinet_sysctl_unregister(&idev->cnf);
2215 neigh_sysctl_unregister(idev->arp_parms);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002216}
Linus Torvalds1da177e2005-04-16 15:20:36 -07002217
Pavel Emelyanov68dd2992007-12-05 01:44:58 -08002218static struct ctl_table ctl_forward_entry[] = {
2219 {
Pavel Emelyanov68dd2992007-12-05 01:44:58 -08002220 .procname = "ip_forward",
2221 .data = &ipv4_devconf.data[
Eric W. Biederman02291682010-02-14 03:25:51 +00002222 IPV4_DEVCONF_FORWARDING - 1],
Pavel Emelyanov68dd2992007-12-05 01:44:58 -08002223 .maxlen = sizeof(int),
2224 .mode = 0644,
2225 .proc_handler = devinet_sysctl_forward,
Pavel Emelyanov68dd2992007-12-05 01:44:58 -08002226 .extra1 = &ipv4_devconf,
Pavel Emelyanovc0ce9fb2007-12-16 13:31:14 -08002227 .extra2 = &init_net,
Pavel Emelyanov68dd2992007-12-05 01:44:58 -08002228 },
2229 { },
2230};
Eric Dumazet2a75de02008-01-05 23:08:49 -08002231#endif
Pavel Emelyanov68dd2992007-12-05 01:44:58 -08002232
Pavel Emelyanov752d14d2007-12-16 13:31:47 -08002233static __net_init int devinet_init_net(struct net *net)
2234{
2235 int err;
Pavel Emelyanov752d14d2007-12-16 13:31:47 -08002236 struct ipv4_devconf *all, *dflt;
Eric Dumazet2a75de02008-01-05 23:08:49 -08002237#ifdef CONFIG_SYSCTL
2238 struct ctl_table *tbl = ctl_forward_entry;
Pavel Emelyanov752d14d2007-12-16 13:31:47 -08002239 struct ctl_table_header *forw_hdr;
Eric Dumazet2a75de02008-01-05 23:08:49 -08002240#endif
Pavel Emelyanov752d14d2007-12-16 13:31:47 -08002241
2242 err = -ENOMEM;
2243 all = &ipv4_devconf;
2244 dflt = &ipv4_devconf_dflt;
Pavel Emelyanov752d14d2007-12-16 13:31:47 -08002245
Octavian Purdila09ad9bc2009-11-25 15:14:13 -08002246 if (!net_eq(net, &init_net)) {
Pavel Emelyanov752d14d2007-12-16 13:31:47 -08002247 all = kmemdup(all, sizeof(ipv4_devconf), GFP_KERNEL);
2248 if (all == NULL)
2249 goto err_alloc_all;
2250
2251 dflt = kmemdup(dflt, sizeof(ipv4_devconf_dflt), GFP_KERNEL);
2252 if (dflt == NULL)
2253 goto err_alloc_dflt;
2254
Eric Dumazet2a75de02008-01-05 23:08:49 -08002255#ifdef CONFIG_SYSCTL
Pavel Emelyanov752d14d2007-12-16 13:31:47 -08002256 tbl = kmemdup(tbl, sizeof(ctl_forward_entry), GFP_KERNEL);
2257 if (tbl == NULL)
2258 goto err_alloc_ctl;
2259
Eric W. Biederman02291682010-02-14 03:25:51 +00002260 tbl[0].data = &all->data[IPV4_DEVCONF_FORWARDING - 1];
Pavel Emelyanov752d14d2007-12-16 13:31:47 -08002261 tbl[0].extra1 = all;
2262 tbl[0].extra2 = net;
Eric Dumazet2a75de02008-01-05 23:08:49 -08002263#endif
Pavel Emelyanov752d14d2007-12-16 13:31:47 -08002264 }
2265
2266#ifdef CONFIG_SYSCTL
Eric W. Biedermanf8572d82009-11-05 13:32:03 -08002267 err = __devinet_sysctl_register(net, "all", all);
Pavel Emelyanov752d14d2007-12-16 13:31:47 -08002268 if (err < 0)
2269 goto err_reg_all;
2270
Eric W. Biedermanf8572d82009-11-05 13:32:03 -08002271 err = __devinet_sysctl_register(net, "default", dflt);
Pavel Emelyanov752d14d2007-12-16 13:31:47 -08002272 if (err < 0)
2273 goto err_reg_dflt;
2274
2275 err = -ENOMEM;
Eric W. Biederman8607ddb2012-04-19 13:42:09 +00002276 forw_hdr = register_net_sysctl(net, "net/ipv4", tbl);
Pavel Emelyanov752d14d2007-12-16 13:31:47 -08002277 if (forw_hdr == NULL)
2278 goto err_reg_ctl;
Eric Dumazet2a75de02008-01-05 23:08:49 -08002279 net->ipv4.forw_hdr = forw_hdr;
Pavel Emelyanov752d14d2007-12-16 13:31:47 -08002280#endif
2281
Pavel Emelyanov752d14d2007-12-16 13:31:47 -08002282 net->ipv4.devconf_all = all;
2283 net->ipv4.devconf_dflt = dflt;
2284 return 0;
2285
2286#ifdef CONFIG_SYSCTL
2287err_reg_ctl:
2288 __devinet_sysctl_unregister(dflt);
2289err_reg_dflt:
2290 __devinet_sysctl_unregister(all);
2291err_reg_all:
2292 if (tbl != ctl_forward_entry)
2293 kfree(tbl);
Pavel Emelyanov752d14d2007-12-16 13:31:47 -08002294err_alloc_ctl:
Eric Dumazet2a75de02008-01-05 23:08:49 -08002295#endif
Pavel Emelyanov752d14d2007-12-16 13:31:47 -08002296 if (dflt != &ipv4_devconf_dflt)
2297 kfree(dflt);
2298err_alloc_dflt:
2299 if (all != &ipv4_devconf)
2300 kfree(all);
2301err_alloc_all:
2302 return err;
2303}
2304
2305static __net_exit void devinet_exit_net(struct net *net)
2306{
Eric Dumazet2a75de02008-01-05 23:08:49 -08002307#ifdef CONFIG_SYSCTL
Pavel Emelyanov752d14d2007-12-16 13:31:47 -08002308 struct ctl_table *tbl;
2309
2310 tbl = net->ipv4.forw_hdr->ctl_table_arg;
Pavel Emelyanov752d14d2007-12-16 13:31:47 -08002311 unregister_net_sysctl_table(net->ipv4.forw_hdr);
2312 __devinet_sysctl_unregister(net->ipv4.devconf_dflt);
2313 __devinet_sysctl_unregister(net->ipv4.devconf_all);
Pavel Emelyanov752d14d2007-12-16 13:31:47 -08002314 kfree(tbl);
Eric Dumazet2a75de02008-01-05 23:08:49 -08002315#endif
Pavel Emelyanov752d14d2007-12-16 13:31:47 -08002316 kfree(net->ipv4.devconf_dflt);
2317 kfree(net->ipv4.devconf_all);
2318}
2319
2320static __net_initdata struct pernet_operations devinet_ops = {
2321 .init = devinet_init_net,
2322 .exit = devinet_exit_net,
2323};
2324
Thomas Graf9f0f7272010-11-16 04:32:48 +00002325static struct rtnl_af_ops inet_af_ops = {
2326 .family = AF_INET,
2327 .fill_link_af = inet_fill_link_af,
2328 .get_link_af_size = inet_get_link_af_size,
Thomas Grafcf7afbf2010-11-22 01:31:54 +00002329 .validate_link_af = inet_validate_link_af,
2330 .set_link_af = inet_set_link_af,
Thomas Graf9f0f7272010-11-16 04:32:48 +00002331};
2332
Linus Torvalds1da177e2005-04-16 15:20:36 -07002333void __init devinet_init(void)
2334{
David S. Millerfd23c3b2011-02-18 12:42:28 -08002335 int i;
2336
2337 for (i = 0; i < IN4_ADDR_HSIZE; i++)
2338 INIT_HLIST_HEAD(&inet_addr_lst[i]);
2339
Pavel Emelyanov752d14d2007-12-16 13:31:47 -08002340 register_pernet_subsys(&devinet_ops);
2341
Linus Torvalds1da177e2005-04-16 15:20:36 -07002342 register_gifconf(PF_INET, inet_gifconf);
2343 register_netdevice_notifier(&ip_netdev_notifier);
Thomas Graf63f34442007-03-22 11:55:17 -07002344
viresh kumar906e0732014-01-22 12:23:32 +05302345 queue_delayed_work(system_power_efficient_wq, &check_lifetime_work, 0);
Jiri Pirko5c766d62013-01-24 09:41:41 +00002346
Thomas Graf9f0f7272010-11-16 04:32:48 +00002347 rtnl_af_register(&inet_af_ops);
2348
Greg Rosec7ac8672011-06-10 01:27:09 +00002349 rtnl_register(PF_INET, RTM_NEWADDR, inet_rtm_newaddr, NULL, NULL);
2350 rtnl_register(PF_INET, RTM_DELADDR, inet_rtm_deladdr, NULL, NULL);
2351 rtnl_register(PF_INET, RTM_GETADDR, NULL, inet_dump_ifaddr, NULL);
Nicolas Dichtel9e551112012-10-25 22:28:53 +00002352 rtnl_register(PF_INET, RTM_GETNETCONF, inet_netconf_get_devconf,
Nicolas Dichtel7a674202013-03-05 23:42:06 +00002353 inet_netconf_dump_devconf, NULL);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002354}
2355