blob: 86f9b165bbba69482f151010d05ad8fe6243b293 [file] [log] [blame]
Linus Torvalds1da177e2005-04-16 15:20:36 -07001/*
2 * Generic address resolution entity
3 *
4 * Authors:
5 * Pedro Roque <roque@di.fc.ul.pt>
6 * Alexey Kuznetsov <kuznet@ms2.inr.ac.ru>
7 *
8 * This program is free software; you can redistribute it and/or
9 * modify it under the terms of the GNU General Public License
10 * as published by the Free Software Foundation; either version
11 * 2 of the License, or (at your option) any later version.
12 *
13 * Fixes:
14 * Vitaly E. Lavrov releasing NULL neighbor in neigh_add.
15 * Harald Welte Add neighbour cache statistics like rtstat
16 */
17
Joe Perchese005d192012-05-16 19:58:40 +000018#define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
19
Tejun Heo5a0e3ad2010-03-24 17:04:11 +090020#include <linux/slab.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070021#include <linux/types.h>
22#include <linux/kernel.h>
23#include <linux/module.h>
24#include <linux/socket.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070025#include <linux/netdevice.h>
26#include <linux/proc_fs.h>
27#ifdef CONFIG_SYSCTL
28#include <linux/sysctl.h>
29#endif
30#include <linux/times.h>
Eric W. Biederman457c4cb2007-09-12 12:01:34 +020031#include <net/net_namespace.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070032#include <net/neighbour.h>
33#include <net/dst.h>
34#include <net/sock.h>
Tom Tucker8d717402006-07-30 20:43:36 -070035#include <net/netevent.h>
Thomas Grafa14a49d2006-08-07 17:53:08 -070036#include <net/netlink.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070037#include <linux/rtnetlink.h>
38#include <linux/random.h>
Paulo Marques543537b2005-06-23 00:09:02 -070039#include <linux/string.h>
vignesh babuc3609d52007-08-24 22:27:55 -070040#include <linux/log2.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070041
#define DEBUG
#define NEIGH_DEBUG 1
/*
 * neigh_dbg - emit a pr_debug() message when @level does not exceed
 * NEIGH_DEBUG.
 *
 * @level is parenthesized so that an expression argument (for example a
 * conditional expression) is compared against NEIGH_DEBUG as a whole
 * instead of being split by operator precedence.
 */
#define neigh_dbg(level, fmt, ...)		\
do {						\
	if ((level) <= NEIGH_DEBUG)		\
		pr_debug(fmt, ##__VA_ARGS__);	\
} while (0)
Linus Torvalds1da177e2005-04-16 15:20:36 -070049
50#define PNEIGH_HASHMASK 0xF
51
52static void neigh_timer_handler(unsigned long arg);
Thomas Grafd961db32007-08-08 23:12:56 -070053static void __neigh_notify(struct neighbour *n, int type, int flags);
54static void neigh_update_notify(struct neighbour *neigh);
Linus Torvalds1da177e2005-04-16 15:20:36 -070055static int pneigh_ifdown(struct neigh_table *tbl, struct net_device *dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -070056
57static struct neigh_table *neigh_tables;
Amos Waterland45fc3b12005-09-24 16:53:16 -070058#ifdef CONFIG_PROC_FS
Arjan van de Ven9a321442007-02-12 00:55:35 -080059static const struct file_operations neigh_stat_seq_fops;
Amos Waterland45fc3b12005-09-24 16:53:16 -070060#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -070061
62/*
63 Neighbour hash table buckets are protected with rwlock tbl->lock.
64
65 - All the scans/updates to hash buckets MUST be made under this lock.
66 - NOTHING clever should be made under this lock: no callbacks
67 to protocol backends, no attempts to send something to network.
68 It will result in deadlocks, if backend/driver wants to use neighbour
69 cache.
70 - If the entry requires some non-trivial actions, increase
71 its reference count and release table lock.
72
73 Neighbour entries are protected:
74 - with reference count.
75 - with rwlock neigh->lock
76
77 Reference count prevents destruction.
78
79 neigh->lock mainly serializes ll address data and its validity state.
80 However, the same lock is used to protect another entry fields:
81 - timer
82 - resolution queue
83
84 Again, nothing clever shall be made under neigh->lock,
85 the most complicated procedure, which we allow is dev->hard_header.
86 It is supposed, that dev->hard_header is simplistic and does
87 not make callbacks to neighbour tables.
88
   The last lock is neigh_tbl_lock. It is a pure SMP lock, protecting the
   list of neighbour tables. This list is used only in process context.
91 */
92
93static DEFINE_RWLOCK(neigh_tbl_lock);
94
David S. Miller8f40b162011-07-17 13:34:11 -070095static int neigh_blackhole(struct neighbour *neigh, struct sk_buff *skb)
Linus Torvalds1da177e2005-04-16 15:20:36 -070096{
97 kfree_skb(skb);
98 return -ENETDOWN;
99}
100
Thomas Graf4f494552007-08-08 23:12:36 -0700101static void neigh_cleanup_and_release(struct neighbour *neigh)
102{
103 if (neigh->parms->neigh_cleanup)
104 neigh->parms->neigh_cleanup(neigh);
105
Thomas Grafd961db32007-08-08 23:12:56 -0700106 __neigh_notify(neigh, RTM_DELNEIGH, 0);
Thomas Graf4f494552007-08-08 23:12:36 -0700107 neigh_release(neigh);
108}
109
/*
 * Random value in the interval (1/2)*base...(3/2)*base, or 0 when
 * @base is 0.  It corresponds to default IPv6 settings and is not
 * overridable, because it is a really reasonable choice.
 */
unsigned long neigh_rand_reach_time(unsigned long base)
{
	if (!base)
		return 0;

	return (net_random() % base) + (base >> 1);
}
EXPORT_SYMBOL(neigh_rand_reach_time);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700121
122
123static int neigh_forced_gc(struct neigh_table *tbl)
124{
125 int shrunk = 0;
126 int i;
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000127 struct neigh_hash_table *nht;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700128
129 NEIGH_CACHE_STAT_INC(tbl, forced_gc_runs);
130
131 write_lock_bh(&tbl->lock);
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000132 nht = rcu_dereference_protected(tbl->nht,
133 lockdep_is_held(&tbl->lock));
David S. Millercd089332011-07-11 01:28:12 -0700134 for (i = 0; i < (1 << nht->hash_shift); i++) {
Eric Dumazet767e97e2010-10-06 17:49:21 -0700135 struct neighbour *n;
136 struct neighbour __rcu **np;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700137
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000138 np = &nht->hash_buckets[i];
Eric Dumazet767e97e2010-10-06 17:49:21 -0700139 while ((n = rcu_dereference_protected(*np,
140 lockdep_is_held(&tbl->lock))) != NULL) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700141 /* Neighbour record may be discarded if:
142 * - nobody refers to it.
143 * - it is not permanent
144 */
145 write_lock(&n->lock);
146 if (atomic_read(&n->refcnt) == 1 &&
147 !(n->nud_state & NUD_PERMANENT)) {
Eric Dumazet767e97e2010-10-06 17:49:21 -0700148 rcu_assign_pointer(*np,
149 rcu_dereference_protected(n->next,
150 lockdep_is_held(&tbl->lock)));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700151 n->dead = 1;
152 shrunk = 1;
153 write_unlock(&n->lock);
Thomas Graf4f494552007-08-08 23:12:36 -0700154 neigh_cleanup_and_release(n);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700155 continue;
156 }
157 write_unlock(&n->lock);
158 np = &n->next;
159 }
160 }
161
162 tbl->last_flush = jiffies;
163
164 write_unlock_bh(&tbl->lock);
165
166 return shrunk;
167}
168
Pavel Emelyanova43d8992007-12-20 15:49:05 -0800169static void neigh_add_timer(struct neighbour *n, unsigned long when)
170{
171 neigh_hold(n);
172 if (unlikely(mod_timer(&n->timer, when))) {
173 printk("NEIGH: BUG, double timer add, state is %x\n",
174 n->nud_state);
175 dump_stack();
176 }
177}
178
Linus Torvalds1da177e2005-04-16 15:20:36 -0700179static int neigh_del_timer(struct neighbour *n)
180{
181 if ((n->nud_state & NUD_IN_TIMER) &&
182 del_timer(&n->timer)) {
183 neigh_release(n);
184 return 1;
185 }
186 return 0;
187}
188
189static void pneigh_queue_purge(struct sk_buff_head *list)
190{
191 struct sk_buff *skb;
192
193 while ((skb = skb_dequeue(list)) != NULL) {
194 dev_put(skb->dev);
195 kfree_skb(skb);
196 }
197}
198
Herbert Xu49636bb2005-10-23 17:18:00 +1000199static void neigh_flush_dev(struct neigh_table *tbl, struct net_device *dev)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700200{
201 int i;
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000202 struct neigh_hash_table *nht;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700203
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000204 nht = rcu_dereference_protected(tbl->nht,
205 lockdep_is_held(&tbl->lock));
206
David S. Millercd089332011-07-11 01:28:12 -0700207 for (i = 0; i < (1 << nht->hash_shift); i++) {
Eric Dumazet767e97e2010-10-06 17:49:21 -0700208 struct neighbour *n;
209 struct neighbour __rcu **np = &nht->hash_buckets[i];
Linus Torvalds1da177e2005-04-16 15:20:36 -0700210
Eric Dumazet767e97e2010-10-06 17:49:21 -0700211 while ((n = rcu_dereference_protected(*np,
212 lockdep_is_held(&tbl->lock))) != NULL) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700213 if (dev && n->dev != dev) {
214 np = &n->next;
215 continue;
216 }
Eric Dumazet767e97e2010-10-06 17:49:21 -0700217 rcu_assign_pointer(*np,
218 rcu_dereference_protected(n->next,
219 lockdep_is_held(&tbl->lock)));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700220 write_lock(&n->lock);
221 neigh_del_timer(n);
222 n->dead = 1;
223
224 if (atomic_read(&n->refcnt) != 1) {
225 /* The most unpleasant situation.
226 We must destroy neighbour entry,
227 but someone still uses it.
228
229 The destroy will be delayed until
230 the last user releases us, but
231 we must kill timers etc. and move
232 it to safe state.
233 */
234 skb_queue_purge(&n->arp_queue);
Eric Dumazet8b5c1712011-11-09 12:07:14 +0000235 n->arp_queue_len_bytes = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700236 n->output = neigh_blackhole;
237 if (n->nud_state & NUD_VALID)
238 n->nud_state = NUD_NOARP;
239 else
240 n->nud_state = NUD_NONE;
Joe Perchesd5d427c2013-04-15 15:17:19 +0000241 neigh_dbg(2, "neigh %p is stray\n", n);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700242 }
243 write_unlock(&n->lock);
Thomas Graf4f494552007-08-08 23:12:36 -0700244 neigh_cleanup_and_release(n);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700245 }
246 }
Herbert Xu49636bb2005-10-23 17:18:00 +1000247}
Linus Torvalds1da177e2005-04-16 15:20:36 -0700248
Herbert Xu49636bb2005-10-23 17:18:00 +1000249void neigh_changeaddr(struct neigh_table *tbl, struct net_device *dev)
250{
251 write_lock_bh(&tbl->lock);
252 neigh_flush_dev(tbl, dev);
253 write_unlock_bh(&tbl->lock);
254}
YOSHIFUJI Hideaki0a204502008-03-24 18:39:10 +0900255EXPORT_SYMBOL(neigh_changeaddr);
Herbert Xu49636bb2005-10-23 17:18:00 +1000256
257int neigh_ifdown(struct neigh_table *tbl, struct net_device *dev)
258{
259 write_lock_bh(&tbl->lock);
260 neigh_flush_dev(tbl, dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700261 pneigh_ifdown(tbl, dev);
262 write_unlock_bh(&tbl->lock);
263
264 del_timer_sync(&tbl->proxy_timer);
265 pneigh_queue_purge(&tbl->proxy_queue);
266 return 0;
267}
YOSHIFUJI Hideaki0a204502008-03-24 18:39:10 +0900268EXPORT_SYMBOL(neigh_ifdown);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700269
David Miller596b9b62011-07-25 00:01:25 +0000270static struct neighbour *neigh_alloc(struct neigh_table *tbl, struct net_device *dev)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700271{
272 struct neighbour *n = NULL;
273 unsigned long now = jiffies;
274 int entries;
275
276 entries = atomic_inc_return(&tbl->entries) - 1;
277 if (entries >= tbl->gc_thresh3 ||
278 (entries >= tbl->gc_thresh2 &&
279 time_after(now, tbl->last_flush + 5 * HZ))) {
280 if (!neigh_forced_gc(tbl) &&
281 entries >= tbl->gc_thresh3)
282 goto out_entries;
283 }
284
YOSHIFUJI Hideaki / 吉藤英明08433ef2013-01-24 00:44:23 +0000285 n = kzalloc(tbl->entry_size + dev->neigh_priv_len, GFP_ATOMIC);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700286 if (!n)
287 goto out_entries;
288
Linus Torvalds1da177e2005-04-16 15:20:36 -0700289 skb_queue_head_init(&n->arp_queue);
290 rwlock_init(&n->lock);
Eric Dumazet0ed8ddf2010-10-07 10:44:07 +0000291 seqlock_init(&n->ha_lock);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700292 n->updated = n->used = now;
293 n->nud_state = NUD_NONE;
294 n->output = neigh_blackhole;
David S. Millerf6b72b62011-07-14 07:53:20 -0700295 seqlock_init(&n->hh.hh_lock);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700296 n->parms = neigh_parms_clone(&tbl->parms);
Pavel Emelyanovb24b8a22008-01-23 21:20:07 -0800297 setup_timer(&n->timer, neigh_timer_handler, (unsigned long)n);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700298
299 NEIGH_CACHE_STAT_INC(tbl, allocs);
300 n->tbl = tbl;
301 atomic_set(&n->refcnt, 1);
302 n->dead = 1;
303out:
304 return n;
305
306out_entries:
307 atomic_dec(&tbl->entries);
308 goto out;
309}
310
David S. Miller2c2aba62011-12-28 15:06:58 -0500311static void neigh_get_hash_rnd(u32 *x)
312{
313 get_random_bytes(x, sizeof(*x));
314 *x |= 1;
315}
316
David S. Millercd089332011-07-11 01:28:12 -0700317static struct neigh_hash_table *neigh_hash_alloc(unsigned int shift)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700318{
David S. Millercd089332011-07-11 01:28:12 -0700319 size_t size = (1 << shift) * sizeof(struct neighbour *);
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000320 struct neigh_hash_table *ret;
Eric Dumazet6193d2b2011-01-19 22:02:47 +0000321 struct neighbour __rcu **buckets;
David S. Miller2c2aba62011-12-28 15:06:58 -0500322 int i;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700323
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000324 ret = kmalloc(sizeof(*ret), GFP_ATOMIC);
325 if (!ret)
326 return NULL;
327 if (size <= PAGE_SIZE)
328 buckets = kzalloc(size, GFP_ATOMIC);
329 else
Eric Dumazet6193d2b2011-01-19 22:02:47 +0000330 buckets = (struct neighbour __rcu **)
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000331 __get_free_pages(GFP_ATOMIC | __GFP_ZERO,
332 get_order(size));
333 if (!buckets) {
334 kfree(ret);
335 return NULL;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700336 }
Eric Dumazet6193d2b2011-01-19 22:02:47 +0000337 ret->hash_buckets = buckets;
David S. Millercd089332011-07-11 01:28:12 -0700338 ret->hash_shift = shift;
David S. Miller2c2aba62011-12-28 15:06:58 -0500339 for (i = 0; i < NEIGH_NUM_HASH_RND; i++)
340 neigh_get_hash_rnd(&ret->hash_rnd[i]);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700341 return ret;
342}
343
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000344static void neigh_hash_free_rcu(struct rcu_head *head)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700345{
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000346 struct neigh_hash_table *nht = container_of(head,
347 struct neigh_hash_table,
348 rcu);
David S. Millercd089332011-07-11 01:28:12 -0700349 size_t size = (1 << nht->hash_shift) * sizeof(struct neighbour *);
Eric Dumazet6193d2b2011-01-19 22:02:47 +0000350 struct neighbour __rcu **buckets = nht->hash_buckets;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700351
352 if (size <= PAGE_SIZE)
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000353 kfree(buckets);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700354 else
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000355 free_pages((unsigned long)buckets, get_order(size));
356 kfree(nht);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700357}
358
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000359static struct neigh_hash_table *neigh_hash_grow(struct neigh_table *tbl,
David S. Millercd089332011-07-11 01:28:12 -0700360 unsigned long new_shift)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700361{
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000362 unsigned int i, hash;
363 struct neigh_hash_table *new_nht, *old_nht;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700364
365 NEIGH_CACHE_STAT_INC(tbl, hash_grows);
366
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000367 old_nht = rcu_dereference_protected(tbl->nht,
368 lockdep_is_held(&tbl->lock));
David S. Millercd089332011-07-11 01:28:12 -0700369 new_nht = neigh_hash_alloc(new_shift);
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000370 if (!new_nht)
371 return old_nht;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700372
David S. Millercd089332011-07-11 01:28:12 -0700373 for (i = 0; i < (1 << old_nht->hash_shift); i++) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700374 struct neighbour *n, *next;
375
Eric Dumazet767e97e2010-10-06 17:49:21 -0700376 for (n = rcu_dereference_protected(old_nht->hash_buckets[i],
377 lockdep_is_held(&tbl->lock));
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000378 n != NULL;
379 n = next) {
380 hash = tbl->hash(n->primary_key, n->dev,
381 new_nht->hash_rnd);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700382
David S. Millercd089332011-07-11 01:28:12 -0700383 hash >>= (32 - new_nht->hash_shift);
Eric Dumazet767e97e2010-10-06 17:49:21 -0700384 next = rcu_dereference_protected(n->next,
385 lockdep_is_held(&tbl->lock));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700386
Eric Dumazet767e97e2010-10-06 17:49:21 -0700387 rcu_assign_pointer(n->next,
388 rcu_dereference_protected(
389 new_nht->hash_buckets[hash],
390 lockdep_is_held(&tbl->lock)));
391 rcu_assign_pointer(new_nht->hash_buckets[hash], n);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700392 }
393 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700394
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000395 rcu_assign_pointer(tbl->nht, new_nht);
396 call_rcu(&old_nht->rcu, neigh_hash_free_rcu);
397 return new_nht;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700398}
399
400struct neighbour *neigh_lookup(struct neigh_table *tbl, const void *pkey,
401 struct net_device *dev)
402{
403 struct neighbour *n;
404 int key_len = tbl->key_len;
Pavel Emelyanovbc4bf5f2008-02-23 19:57:02 -0800405 u32 hash_val;
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000406 struct neigh_hash_table *nht;
YOSHIFUJI Hideaki4ec93ed2007-02-09 23:24:36 +0900407
Linus Torvalds1da177e2005-04-16 15:20:36 -0700408 NEIGH_CACHE_STAT_INC(tbl, lookups);
409
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000410 rcu_read_lock_bh();
411 nht = rcu_dereference_bh(tbl->nht);
David S. Millercd089332011-07-11 01:28:12 -0700412 hash_val = tbl->hash(pkey, dev, nht->hash_rnd) >> (32 - nht->hash_shift);
Eric Dumazet767e97e2010-10-06 17:49:21 -0700413
414 for (n = rcu_dereference_bh(nht->hash_buckets[hash_val]);
415 n != NULL;
416 n = rcu_dereference_bh(n->next)) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700417 if (dev == n->dev && !memcmp(n->primary_key, pkey, key_len)) {
Eric Dumazet767e97e2010-10-06 17:49:21 -0700418 if (!atomic_inc_not_zero(&n->refcnt))
419 n = NULL;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700420 NEIGH_CACHE_STAT_INC(tbl, hits);
421 break;
422 }
423 }
Eric Dumazet767e97e2010-10-06 17:49:21 -0700424
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000425 rcu_read_unlock_bh();
Linus Torvalds1da177e2005-04-16 15:20:36 -0700426 return n;
427}
YOSHIFUJI Hideaki0a204502008-03-24 18:39:10 +0900428EXPORT_SYMBOL(neigh_lookup);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700429
Eric W. Biederman426b5302008-01-24 00:13:18 -0800430struct neighbour *neigh_lookup_nodev(struct neigh_table *tbl, struct net *net,
431 const void *pkey)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700432{
433 struct neighbour *n;
434 int key_len = tbl->key_len;
Pavel Emelyanovbc4bf5f2008-02-23 19:57:02 -0800435 u32 hash_val;
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000436 struct neigh_hash_table *nht;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700437
438 NEIGH_CACHE_STAT_INC(tbl, lookups);
439
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000440 rcu_read_lock_bh();
441 nht = rcu_dereference_bh(tbl->nht);
David S. Millercd089332011-07-11 01:28:12 -0700442 hash_val = tbl->hash(pkey, NULL, nht->hash_rnd) >> (32 - nht->hash_shift);
Eric Dumazet767e97e2010-10-06 17:49:21 -0700443
444 for (n = rcu_dereference_bh(nht->hash_buckets[hash_val]);
445 n != NULL;
446 n = rcu_dereference_bh(n->next)) {
Eric W. Biederman426b5302008-01-24 00:13:18 -0800447 if (!memcmp(n->primary_key, pkey, key_len) &&
YOSHIFUJI Hideaki878628f2008-03-26 03:57:35 +0900448 net_eq(dev_net(n->dev), net)) {
Eric Dumazet767e97e2010-10-06 17:49:21 -0700449 if (!atomic_inc_not_zero(&n->refcnt))
450 n = NULL;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700451 NEIGH_CACHE_STAT_INC(tbl, hits);
452 break;
453 }
454 }
Eric Dumazet767e97e2010-10-06 17:49:21 -0700455
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000456 rcu_read_unlock_bh();
Linus Torvalds1da177e2005-04-16 15:20:36 -0700457 return n;
458}
YOSHIFUJI Hideaki0a204502008-03-24 18:39:10 +0900459EXPORT_SYMBOL(neigh_lookup_nodev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700460
David S. Millera263b302012-07-02 02:02:15 -0700461struct neighbour *__neigh_create(struct neigh_table *tbl, const void *pkey,
462 struct net_device *dev, bool want_ref)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700463{
464 u32 hash_val;
465 int key_len = tbl->key_len;
466 int error;
David Miller596b9b62011-07-25 00:01:25 +0000467 struct neighbour *n1, *rc, *n = neigh_alloc(tbl, dev);
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000468 struct neigh_hash_table *nht;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700469
470 if (!n) {
471 rc = ERR_PTR(-ENOBUFS);
472 goto out;
473 }
474
475 memcpy(n->primary_key, pkey, key_len);
476 n->dev = dev;
477 dev_hold(dev);
478
479 /* Protocol specific setup. */
480 if (tbl->constructor && (error = tbl->constructor(n)) < 0) {
481 rc = ERR_PTR(error);
482 goto out_neigh_release;
483 }
484
David Millerda6a8fa2011-07-25 00:01:38 +0000485 if (dev->netdev_ops->ndo_neigh_construct) {
486 error = dev->netdev_ops->ndo_neigh_construct(n);
487 if (error < 0) {
488 rc = ERR_PTR(error);
489 goto out_neigh_release;
490 }
491 }
492
David S. Miller447f2192011-12-19 15:04:41 -0500493 /* Device specific setup. */
494 if (n->parms->neigh_setup &&
495 (error = n->parms->neigh_setup(n)) < 0) {
496 rc = ERR_PTR(error);
497 goto out_neigh_release;
498 }
499
Linus Torvalds1da177e2005-04-16 15:20:36 -0700500 n->confirmed = jiffies - (n->parms->base_reachable_time << 1);
501
502 write_lock_bh(&tbl->lock);
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000503 nht = rcu_dereference_protected(tbl->nht,
504 lockdep_is_held(&tbl->lock));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700505
David S. Millercd089332011-07-11 01:28:12 -0700506 if (atomic_read(&tbl->entries) > (1 << nht->hash_shift))
507 nht = neigh_hash_grow(tbl, nht->hash_shift + 1);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700508
David S. Millercd089332011-07-11 01:28:12 -0700509 hash_val = tbl->hash(pkey, dev, nht->hash_rnd) >> (32 - nht->hash_shift);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700510
511 if (n->parms->dead) {
512 rc = ERR_PTR(-EINVAL);
513 goto out_tbl_unlock;
514 }
515
Eric Dumazet767e97e2010-10-06 17:49:21 -0700516 for (n1 = rcu_dereference_protected(nht->hash_buckets[hash_val],
517 lockdep_is_held(&tbl->lock));
518 n1 != NULL;
519 n1 = rcu_dereference_protected(n1->next,
520 lockdep_is_held(&tbl->lock))) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700521 if (dev == n1->dev && !memcmp(n1->primary_key, pkey, key_len)) {
David S. Millera263b302012-07-02 02:02:15 -0700522 if (want_ref)
523 neigh_hold(n1);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700524 rc = n1;
525 goto out_tbl_unlock;
526 }
527 }
528
Linus Torvalds1da177e2005-04-16 15:20:36 -0700529 n->dead = 0;
David S. Millera263b302012-07-02 02:02:15 -0700530 if (want_ref)
531 neigh_hold(n);
Eric Dumazet767e97e2010-10-06 17:49:21 -0700532 rcu_assign_pointer(n->next,
533 rcu_dereference_protected(nht->hash_buckets[hash_val],
534 lockdep_is_held(&tbl->lock)));
535 rcu_assign_pointer(nht->hash_buckets[hash_val], n);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700536 write_unlock_bh(&tbl->lock);
Joe Perchesd5d427c2013-04-15 15:17:19 +0000537 neigh_dbg(2, "neigh %p is created\n", n);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700538 rc = n;
539out:
540 return rc;
541out_tbl_unlock:
542 write_unlock_bh(&tbl->lock);
543out_neigh_release:
544 neigh_release(n);
545 goto out;
546}
David S. Millera263b302012-07-02 02:02:15 -0700547EXPORT_SYMBOL(__neigh_create);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700548
YOSHIFUJI Hideakibe01d652008-03-28 12:46:53 +0900549static u32 pneigh_hash(const void *pkey, int key_len)
Pavel Emelyanovfa86d322008-03-24 14:48:59 -0700550{
Pavel Emelyanovfa86d322008-03-24 14:48:59 -0700551 u32 hash_val = *(u32 *)(pkey + key_len - 4);
Pavel Emelyanovfa86d322008-03-24 14:48:59 -0700552 hash_val ^= (hash_val >> 16);
553 hash_val ^= hash_val >> 8;
554 hash_val ^= hash_val >> 4;
555 hash_val &= PNEIGH_HASHMASK;
YOSHIFUJI Hideakibe01d652008-03-28 12:46:53 +0900556 return hash_val;
557}
Pavel Emelyanovfa86d322008-03-24 14:48:59 -0700558
YOSHIFUJI Hideakibe01d652008-03-28 12:46:53 +0900559static struct pneigh_entry *__pneigh_lookup_1(struct pneigh_entry *n,
560 struct net *net,
561 const void *pkey,
562 int key_len,
563 struct net_device *dev)
564{
565 while (n) {
Pavel Emelyanovfa86d322008-03-24 14:48:59 -0700566 if (!memcmp(n->key, pkey, key_len) &&
YOSHIFUJI Hideakibe01d652008-03-28 12:46:53 +0900567 net_eq(pneigh_net(n), net) &&
Pavel Emelyanovfa86d322008-03-24 14:48:59 -0700568 (n->dev == dev || !n->dev))
YOSHIFUJI Hideakibe01d652008-03-28 12:46:53 +0900569 return n;
570 n = n->next;
Pavel Emelyanovfa86d322008-03-24 14:48:59 -0700571 }
YOSHIFUJI Hideakibe01d652008-03-28 12:46:53 +0900572 return NULL;
573}
Pavel Emelyanovfa86d322008-03-24 14:48:59 -0700574
YOSHIFUJI Hideakibe01d652008-03-28 12:46:53 +0900575struct pneigh_entry *__pneigh_lookup(struct neigh_table *tbl,
576 struct net *net, const void *pkey, struct net_device *dev)
577{
578 int key_len = tbl->key_len;
579 u32 hash_val = pneigh_hash(pkey, key_len);
580
581 return __pneigh_lookup_1(tbl->phash_buckets[hash_val],
582 net, pkey, key_len, dev);
Pavel Emelyanovfa86d322008-03-24 14:48:59 -0700583}
YOSHIFUJI Hideaki0a204502008-03-24 18:39:10 +0900584EXPORT_SYMBOL_GPL(__pneigh_lookup);
Pavel Emelyanovfa86d322008-03-24 14:48:59 -0700585
Eric W. Biederman426b5302008-01-24 00:13:18 -0800586struct pneigh_entry * pneigh_lookup(struct neigh_table *tbl,
587 struct net *net, const void *pkey,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700588 struct net_device *dev, int creat)
589{
590 struct pneigh_entry *n;
591 int key_len = tbl->key_len;
YOSHIFUJI Hideakibe01d652008-03-28 12:46:53 +0900592 u32 hash_val = pneigh_hash(pkey, key_len);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700593
594 read_lock_bh(&tbl->lock);
YOSHIFUJI Hideakibe01d652008-03-28 12:46:53 +0900595 n = __pneigh_lookup_1(tbl->phash_buckets[hash_val],
596 net, pkey, key_len, dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700597 read_unlock_bh(&tbl->lock);
YOSHIFUJI Hideakibe01d652008-03-28 12:46:53 +0900598
599 if (n || !creat)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700600 goto out;
601
Pavel Emelyanov4ae28942007-10-15 12:54:15 -0700602 ASSERT_RTNL();
603
Linus Torvalds1da177e2005-04-16 15:20:36 -0700604 n = kmalloc(sizeof(*n) + key_len, GFP_KERNEL);
605 if (!n)
606 goto out;
607
Eric Dumazete42ea982008-11-12 00:54:54 -0800608 write_pnet(&n->net, hold_net(net));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700609 memcpy(n->key, pkey, key_len);
610 n->dev = dev;
611 if (dev)
612 dev_hold(dev);
613
614 if (tbl->pconstructor && tbl->pconstructor(n)) {
615 if (dev)
616 dev_put(dev);
Denis V. Lunevda12f732008-02-20 00:26:16 -0800617 release_net(net);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700618 kfree(n);
619 n = NULL;
620 goto out;
621 }
622
623 write_lock_bh(&tbl->lock);
624 n->next = tbl->phash_buckets[hash_val];
625 tbl->phash_buckets[hash_val] = n;
626 write_unlock_bh(&tbl->lock);
627out:
628 return n;
629}
YOSHIFUJI Hideaki0a204502008-03-24 18:39:10 +0900630EXPORT_SYMBOL(pneigh_lookup);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700631
632
Eric W. Biederman426b5302008-01-24 00:13:18 -0800633int pneigh_delete(struct neigh_table *tbl, struct net *net, const void *pkey,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700634 struct net_device *dev)
635{
636 struct pneigh_entry *n, **np;
637 int key_len = tbl->key_len;
YOSHIFUJI Hideakibe01d652008-03-28 12:46:53 +0900638 u32 hash_val = pneigh_hash(pkey, key_len);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700639
640 write_lock_bh(&tbl->lock);
641 for (np = &tbl->phash_buckets[hash_val]; (n = *np) != NULL;
642 np = &n->next) {
Eric W. Biederman426b5302008-01-24 00:13:18 -0800643 if (!memcmp(n->key, pkey, key_len) && n->dev == dev &&
YOSHIFUJI Hideaki878628f2008-03-26 03:57:35 +0900644 net_eq(pneigh_net(n), net)) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700645 *np = n->next;
646 write_unlock_bh(&tbl->lock);
647 if (tbl->pdestructor)
648 tbl->pdestructor(n);
649 if (n->dev)
650 dev_put(n->dev);
YOSHIFUJI Hideaki57da52c2008-03-26 03:49:59 +0900651 release_net(pneigh_net(n));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700652 kfree(n);
653 return 0;
654 }
655 }
656 write_unlock_bh(&tbl->lock);
657 return -ENOENT;
658}
659
660static int pneigh_ifdown(struct neigh_table *tbl, struct net_device *dev)
661{
662 struct pneigh_entry *n, **np;
663 u32 h;
664
665 for (h = 0; h <= PNEIGH_HASHMASK; h++) {
666 np = &tbl->phash_buckets[h];
667 while ((n = *np) != NULL) {
668 if (!dev || n->dev == dev) {
669 *np = n->next;
670 if (tbl->pdestructor)
671 tbl->pdestructor(n);
672 if (n->dev)
673 dev_put(n->dev);
YOSHIFUJI Hideaki57da52c2008-03-26 03:49:59 +0900674 release_net(pneigh_net(n));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700675 kfree(n);
676 continue;
677 }
678 np = &n->next;
679 }
680 }
681 return -ENOENT;
682}
683
Denis V. Lunev06f05112008-01-24 00:30:58 -0800684static void neigh_parms_destroy(struct neigh_parms *parms);
685
686static inline void neigh_parms_put(struct neigh_parms *parms)
687{
688 if (atomic_dec_and_test(&parms->refcnt))
689 neigh_parms_destroy(parms);
690}
Linus Torvalds1da177e2005-04-16 15:20:36 -0700691
692/*
693 * neighbour must already be out of the table;
694 *
695 */
696void neigh_destroy(struct neighbour *neigh)
697{
David Millerda6a8fa2011-07-25 00:01:38 +0000698 struct net_device *dev = neigh->dev;
699
Linus Torvalds1da177e2005-04-16 15:20:36 -0700700 NEIGH_CACHE_STAT_INC(neigh->tbl, destroys);
701
702 if (!neigh->dead) {
Joe Perchese005d192012-05-16 19:58:40 +0000703 pr_warn("Destroying alive neighbour %p\n", neigh);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700704 dump_stack();
705 return;
706 }
707
708 if (neigh_del_timer(neigh))
Joe Perchese005d192012-05-16 19:58:40 +0000709 pr_warn("Impossible event\n");
Linus Torvalds1da177e2005-04-16 15:20:36 -0700710
Linus Torvalds1da177e2005-04-16 15:20:36 -0700711 skb_queue_purge(&neigh->arp_queue);
Eric Dumazet8b5c1712011-11-09 12:07:14 +0000712 neigh->arp_queue_len_bytes = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700713
David S. Miller447f2192011-12-19 15:04:41 -0500714 if (dev->netdev_ops->ndo_neigh_destroy)
715 dev->netdev_ops->ndo_neigh_destroy(neigh);
716
David Millerda6a8fa2011-07-25 00:01:38 +0000717 dev_put(dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700718 neigh_parms_put(neigh->parms);
719
Joe Perchesd5d427c2013-04-15 15:17:19 +0000720 neigh_dbg(2, "neigh %p is destroyed\n", neigh);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700721
722 atomic_dec(&neigh->tbl->entries);
David Miller5b8b0062011-07-25 00:01:22 +0000723 kfree_rcu(neigh, rcu);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700724}
YOSHIFUJI Hideaki0a204502008-03-24 18:39:10 +0900725EXPORT_SYMBOL(neigh_destroy);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700726
727/* Neighbour state is suspicious;
728 disable fast path.
729
730 Called with write_locked neigh.
731 */
732static void neigh_suspect(struct neighbour *neigh)
733{
Joe Perchesd5d427c2013-04-15 15:17:19 +0000734 neigh_dbg(2, "neigh %p is suspected\n", neigh);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700735
736 neigh->output = neigh->ops->output;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700737}
738
739/* Neighbour state is OK;
740 enable fast path.
741
742 Called with write_locked neigh.
743 */
744static void neigh_connect(struct neighbour *neigh)
745{
Joe Perchesd5d427c2013-04-15 15:17:19 +0000746 neigh_dbg(2, "neigh %p is connected\n", neigh);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700747
748 neigh->output = neigh->ops->connected_output;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700749}
750
Eric Dumazete4c4e442009-07-30 03:15:07 +0000751static void neigh_periodic_work(struct work_struct *work)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700752{
Eric Dumazete4c4e442009-07-30 03:15:07 +0000753 struct neigh_table *tbl = container_of(work, struct neigh_table, gc_work.work);
Eric Dumazet767e97e2010-10-06 17:49:21 -0700754 struct neighbour *n;
755 struct neighbour __rcu **np;
Eric Dumazete4c4e442009-07-30 03:15:07 +0000756 unsigned int i;
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000757 struct neigh_hash_table *nht;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700758
759 NEIGH_CACHE_STAT_INC(tbl, periodic_gc_runs);
760
Eric Dumazete4c4e442009-07-30 03:15:07 +0000761 write_lock_bh(&tbl->lock);
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000762 nht = rcu_dereference_protected(tbl->nht,
763 lockdep_is_held(&tbl->lock));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700764
YOSHIFUJI Hideaki / 吉藤英明27246802013-01-22 05:20:05 +0000765 if (atomic_read(&tbl->entries) < tbl->gc_thresh1)
766 goto out;
767
Linus Torvalds1da177e2005-04-16 15:20:36 -0700768 /*
769 * periodically recompute ReachableTime from random function
770 */
771
Eric Dumazete4c4e442009-07-30 03:15:07 +0000772 if (time_after(jiffies, tbl->last_rand + 300 * HZ)) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700773 struct neigh_parms *p;
Eric Dumazete4c4e442009-07-30 03:15:07 +0000774 tbl->last_rand = jiffies;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700775 for (p = &tbl->parms; p; p = p->next)
776 p->reachable_time =
777 neigh_rand_reach_time(p->base_reachable_time);
778 }
779
David S. Millercd089332011-07-11 01:28:12 -0700780 for (i = 0 ; i < (1 << nht->hash_shift); i++) {
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000781 np = &nht->hash_buckets[i];
Linus Torvalds1da177e2005-04-16 15:20:36 -0700782
Eric Dumazet767e97e2010-10-06 17:49:21 -0700783 while ((n = rcu_dereference_protected(*np,
784 lockdep_is_held(&tbl->lock))) != NULL) {
Eric Dumazete4c4e442009-07-30 03:15:07 +0000785 unsigned int state;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700786
Eric Dumazete4c4e442009-07-30 03:15:07 +0000787 write_lock(&n->lock);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700788
Eric Dumazete4c4e442009-07-30 03:15:07 +0000789 state = n->nud_state;
790 if (state & (NUD_PERMANENT | NUD_IN_TIMER)) {
791 write_unlock(&n->lock);
792 goto next_elt;
793 }
794
795 if (time_before(n->used, n->confirmed))
796 n->used = n->confirmed;
797
798 if (atomic_read(&n->refcnt) == 1 &&
799 (state == NUD_FAILED ||
800 time_after(jiffies, n->used + n->parms->gc_staletime))) {
801 *np = n->next;
802 n->dead = 1;
803 write_unlock(&n->lock);
804 neigh_cleanup_and_release(n);
805 continue;
806 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700807 write_unlock(&n->lock);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700808
809next_elt:
Eric Dumazete4c4e442009-07-30 03:15:07 +0000810 np = &n->next;
811 }
812 /*
813 * It's fine to release lock here, even if hash table
814 * grows while we are preempted.
815 */
816 write_unlock_bh(&tbl->lock);
817 cond_resched();
818 write_lock_bh(&tbl->lock);
Michel Machado84338a62012-02-21 16:04:13 -0500819 nht = rcu_dereference_protected(tbl->nht,
820 lockdep_is_held(&tbl->lock));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700821 }
YOSHIFUJI Hideaki / 吉藤英明27246802013-01-22 05:20:05 +0000822out:
YOSHIFUJI Hideaki4ec93ed2007-02-09 23:24:36 +0900823 /* Cycle through all hash buckets every base_reachable_time/2 ticks.
824 * ARP entry timeouts range from 1/2 base_reachable_time to 3/2
825 * base_reachable_time.
Linus Torvalds1da177e2005-04-16 15:20:36 -0700826 */
Eric Dumazete4c4e442009-07-30 03:15:07 +0000827 schedule_delayed_work(&tbl->gc_work,
828 tbl->parms.base_reachable_time >> 1);
829 write_unlock_bh(&tbl->lock);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700830}
831
832static __inline__ int neigh_max_probes(struct neighbour *n)
833{
834 struct neigh_parms *p = n->parms;
Eric Dumazeta02cec22010-09-22 20:43:57 +0000835 return (n->nud_state & NUD_PROBE) ?
Linus Torvalds1da177e2005-04-16 15:20:36 -0700836 p->ucast_probes :
Eric Dumazeta02cec22010-09-22 20:43:57 +0000837 p->ucast_probes + p->app_probes + p->mcast_probes;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700838}
839
Timo Teras5ef12d92009-06-11 04:16:28 -0700840static void neigh_invalidate(struct neighbour *neigh)
Eric Dumazet0a141502010-03-09 19:40:54 +0000841 __releases(neigh->lock)
842 __acquires(neigh->lock)
Timo Teras5ef12d92009-06-11 04:16:28 -0700843{
844 struct sk_buff *skb;
845
846 NEIGH_CACHE_STAT_INC(neigh->tbl, res_failed);
Joe Perchesd5d427c2013-04-15 15:17:19 +0000847 neigh_dbg(2, "neigh %p is failed\n", neigh);
Timo Teras5ef12d92009-06-11 04:16:28 -0700848 neigh->updated = jiffies;
849
850 /* It is very thin place. report_unreachable is very complicated
851 routine. Particularly, it can hit the same neighbour entry!
852
853 So that, we try to be accurate and avoid dead loop. --ANK
854 */
855 while (neigh->nud_state == NUD_FAILED &&
856 (skb = __skb_dequeue(&neigh->arp_queue)) != NULL) {
857 write_unlock(&neigh->lock);
858 neigh->ops->error_report(neigh, skb);
859 write_lock(&neigh->lock);
860 }
861 skb_queue_purge(&neigh->arp_queue);
Eric Dumazet8b5c1712011-11-09 12:07:14 +0000862 neigh->arp_queue_len_bytes = 0;
Timo Teras5ef12d92009-06-11 04:16:28 -0700863}
864
Eric Dumazetcd28ca02011-08-09 08:15:58 +0000865static void neigh_probe(struct neighbour *neigh)
866 __releases(neigh->lock)
867{
868 struct sk_buff *skb = skb_peek(&neigh->arp_queue);
869 /* keep skb alive even if arp_queue overflows */
870 if (skb)
871 skb = skb_copy(skb, GFP_ATOMIC);
872 write_unlock(&neigh->lock);
873 neigh->ops->solicit(neigh, skb);
874 atomic_inc(&neigh->probes);
875 kfree_skb(skb);
876}
877
Linus Torvalds1da177e2005-04-16 15:20:36 -0700878/* Called when a timer expires for a neighbour entry. */
879
880static void neigh_timer_handler(unsigned long arg)
881{
882 unsigned long now, next;
883 struct neighbour *neigh = (struct neighbour *)arg;
Eric Dumazet95c96172012-04-15 05:58:06 +0000884 unsigned int state;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700885 int notify = 0;
886
887 write_lock(&neigh->lock);
888
889 state = neigh->nud_state;
890 now = jiffies;
891 next = now + HZ;
892
David S. Miller045f7b32011-11-01 17:45:55 -0400893 if (!(state & NUD_IN_TIMER))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700894 goto out;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700895
896 if (state & NUD_REACHABLE) {
YOSHIFUJI Hideaki4ec93ed2007-02-09 23:24:36 +0900897 if (time_before_eq(now,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700898 neigh->confirmed + neigh->parms->reachable_time)) {
Joe Perchesd5d427c2013-04-15 15:17:19 +0000899 neigh_dbg(2, "neigh %p is still alive\n", neigh);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700900 next = neigh->confirmed + neigh->parms->reachable_time;
901 } else if (time_before_eq(now,
902 neigh->used + neigh->parms->delay_probe_time)) {
Joe Perchesd5d427c2013-04-15 15:17:19 +0000903 neigh_dbg(2, "neigh %p is delayed\n", neigh);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700904 neigh->nud_state = NUD_DELAY;
YOSHIFUJI Hideaki955aaa22006-03-20 16:52:52 -0800905 neigh->updated = jiffies;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700906 neigh_suspect(neigh);
907 next = now + neigh->parms->delay_probe_time;
908 } else {
Joe Perchesd5d427c2013-04-15 15:17:19 +0000909 neigh_dbg(2, "neigh %p is suspected\n", neigh);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700910 neigh->nud_state = NUD_STALE;
YOSHIFUJI Hideaki955aaa22006-03-20 16:52:52 -0800911 neigh->updated = jiffies;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700912 neigh_suspect(neigh);
Tom Tucker8d717402006-07-30 20:43:36 -0700913 notify = 1;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700914 }
915 } else if (state & NUD_DELAY) {
YOSHIFUJI Hideaki4ec93ed2007-02-09 23:24:36 +0900916 if (time_before_eq(now,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700917 neigh->confirmed + neigh->parms->delay_probe_time)) {
Joe Perchesd5d427c2013-04-15 15:17:19 +0000918 neigh_dbg(2, "neigh %p is now reachable\n", neigh);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700919 neigh->nud_state = NUD_REACHABLE;
YOSHIFUJI Hideaki955aaa22006-03-20 16:52:52 -0800920 neigh->updated = jiffies;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700921 neigh_connect(neigh);
Tom Tucker8d717402006-07-30 20:43:36 -0700922 notify = 1;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700923 next = neigh->confirmed + neigh->parms->reachable_time;
924 } else {
Joe Perchesd5d427c2013-04-15 15:17:19 +0000925 neigh_dbg(2, "neigh %p is probed\n", neigh);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700926 neigh->nud_state = NUD_PROBE;
YOSHIFUJI Hideaki955aaa22006-03-20 16:52:52 -0800927 neigh->updated = jiffies;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700928 atomic_set(&neigh->probes, 0);
929 next = now + neigh->parms->retrans_time;
930 }
931 } else {
932 /* NUD_PROBE|NUD_INCOMPLETE */
933 next = now + neigh->parms->retrans_time;
934 }
935
936 if ((neigh->nud_state & (NUD_INCOMPLETE | NUD_PROBE)) &&
937 atomic_read(&neigh->probes) >= neigh_max_probes(neigh)) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700938 neigh->nud_state = NUD_FAILED;
939 notify = 1;
Timo Teras5ef12d92009-06-11 04:16:28 -0700940 neigh_invalidate(neigh);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700941 }
942
943 if (neigh->nud_state & NUD_IN_TIMER) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700944 if (time_before(next, jiffies + HZ/2))
945 next = jiffies + HZ/2;
Herbert Xu6fb99742005-10-23 16:37:48 +1000946 if (!mod_timer(&neigh->timer, next))
947 neigh_hold(neigh);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700948 }
949 if (neigh->nud_state & (NUD_INCOMPLETE | NUD_PROBE)) {
Eric Dumazetcd28ca02011-08-09 08:15:58 +0000950 neigh_probe(neigh);
David S. Miller9ff56602008-02-17 18:39:54 -0800951 } else {
David S. Miller69cc64d2008-02-11 21:45:44 -0800952out:
David S. Miller9ff56602008-02-17 18:39:54 -0800953 write_unlock(&neigh->lock);
954 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700955
Thomas Grafd961db32007-08-08 23:12:56 -0700956 if (notify)
957 neigh_update_notify(neigh);
958
Linus Torvalds1da177e2005-04-16 15:20:36 -0700959 neigh_release(neigh);
960}
961
962int __neigh_event_send(struct neighbour *neigh, struct sk_buff *skb)
963{
964 int rc;
Eric Dumazetcd28ca02011-08-09 08:15:58 +0000965 bool immediate_probe = false;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700966
967 write_lock_bh(&neigh->lock);
968
969 rc = 0;
970 if (neigh->nud_state & (NUD_CONNECTED | NUD_DELAY | NUD_PROBE))
971 goto out_unlock_bh;
972
Linus Torvalds1da177e2005-04-16 15:20:36 -0700973 if (!(neigh->nud_state & (NUD_STALE | NUD_INCOMPLETE))) {
974 if (neigh->parms->mcast_probes + neigh->parms->app_probes) {
Eric Dumazetcd28ca02011-08-09 08:15:58 +0000975 unsigned long next, now = jiffies;
976
Linus Torvalds1da177e2005-04-16 15:20:36 -0700977 atomic_set(&neigh->probes, neigh->parms->ucast_probes);
978 neigh->nud_state = NUD_INCOMPLETE;
Eric Dumazetcd28ca02011-08-09 08:15:58 +0000979 neigh->updated = now;
980 next = now + max(neigh->parms->retrans_time, HZ/2);
981 neigh_add_timer(neigh, next);
982 immediate_probe = true;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700983 } else {
984 neigh->nud_state = NUD_FAILED;
YOSHIFUJI Hideaki955aaa22006-03-20 16:52:52 -0800985 neigh->updated = jiffies;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700986 write_unlock_bh(&neigh->lock);
987
Wei Yongjunf3fbbe02009-02-25 00:37:32 +0000988 kfree_skb(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700989 return 1;
990 }
991 } else if (neigh->nud_state & NUD_STALE) {
Joe Perchesd5d427c2013-04-15 15:17:19 +0000992 neigh_dbg(2, "neigh %p is delayed\n", neigh);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700993 neigh->nud_state = NUD_DELAY;
YOSHIFUJI Hideaki955aaa22006-03-20 16:52:52 -0800994 neigh->updated = jiffies;
David S. Miller667347f2005-09-27 12:07:44 -0700995 neigh_add_timer(neigh,
996 jiffies + neigh->parms->delay_probe_time);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700997 }
998
999 if (neigh->nud_state == NUD_INCOMPLETE) {
1000 if (skb) {
Eric Dumazet8b5c1712011-11-09 12:07:14 +00001001 while (neigh->arp_queue_len_bytes + skb->truesize >
1002 neigh->parms->queue_len_bytes) {
Linus Torvalds1da177e2005-04-16 15:20:36 -07001003 struct sk_buff *buff;
Eric Dumazet8b5c1712011-11-09 12:07:14 +00001004
David S. Millerf72051b2008-09-23 01:11:18 -07001005 buff = __skb_dequeue(&neigh->arp_queue);
Eric Dumazet8b5c1712011-11-09 12:07:14 +00001006 if (!buff)
1007 break;
1008 neigh->arp_queue_len_bytes -= buff->truesize;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001009 kfree_skb(buff);
Neil Horman9a6d2762008-07-16 20:50:49 -07001010 NEIGH_CACHE_STAT_INC(neigh->tbl, unres_discards);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001011 }
Eric Dumazeta4731132010-05-27 16:09:39 -07001012 skb_dst_force(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001013 __skb_queue_tail(&neigh->arp_queue, skb);
Eric Dumazet8b5c1712011-11-09 12:07:14 +00001014 neigh->arp_queue_len_bytes += skb->truesize;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001015 }
1016 rc = 1;
1017 }
1018out_unlock_bh:
Eric Dumazetcd28ca02011-08-09 08:15:58 +00001019 if (immediate_probe)
1020 neigh_probe(neigh);
1021 else
1022 write_unlock(&neigh->lock);
1023 local_bh_enable();
Linus Torvalds1da177e2005-04-16 15:20:36 -07001024 return rc;
1025}
YOSHIFUJI Hideaki0a204502008-03-24 18:39:10 +09001026EXPORT_SYMBOL(__neigh_event_send);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001027
David S. Millerf6b72b62011-07-14 07:53:20 -07001028static void neigh_update_hhs(struct neighbour *neigh)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001029{
1030 struct hh_cache *hh;
Stephen Hemminger3b04ddd2007-10-09 01:40:57 -07001031 void (*update)(struct hh_cache*, const struct net_device*, const unsigned char *)
Doug Kehn91a72a72010-07-14 18:02:16 -07001032 = NULL;
1033
1034 if (neigh->dev->header_ops)
1035 update = neigh->dev->header_ops->cache_update;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001036
1037 if (update) {
David S. Millerf6b72b62011-07-14 07:53:20 -07001038 hh = &neigh->hh;
1039 if (hh->hh_len) {
Stephen Hemminger3644f0c2006-12-07 15:08:17 -08001040 write_seqlock_bh(&hh->hh_lock);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001041 update(hh, neigh->dev, neigh->ha);
Stephen Hemminger3644f0c2006-12-07 15:08:17 -08001042 write_sequnlock_bh(&hh->hh_lock);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001043 }
1044 }
1045}
1046
1047
1048
1049/* Generic update routine.
1050 -- lladdr is new lladdr or NULL, if it is not supplied.
1051 -- new is new state.
1052 -- flags
1053 NEIGH_UPDATE_F_OVERRIDE allows to override existing lladdr,
1054 if it is different.
1055 NEIGH_UPDATE_F_WEAK_OVERRIDE will suspect existing "connected"
YOSHIFUJI Hideaki4ec93ed2007-02-09 23:24:36 +09001056 lladdr instead of overriding it
Linus Torvalds1da177e2005-04-16 15:20:36 -07001057 if it is different.
1058 It also allows to retain current state
1059 if lladdr is unchanged.
1060 NEIGH_UPDATE_F_ADMIN means that the change is administrative.
1061
YOSHIFUJI Hideaki4ec93ed2007-02-09 23:24:36 +09001062 NEIGH_UPDATE_F_OVERRIDE_ISROUTER allows to override existing
Linus Torvalds1da177e2005-04-16 15:20:36 -07001063 NTF_ROUTER flag.
1064 NEIGH_UPDATE_F_ISROUTER indicates if the neighbour is known as
1065 a router.
1066
1067 Caller MUST hold reference count on the entry.
1068 */
1069
1070int neigh_update(struct neighbour *neigh, const u8 *lladdr, u8 new,
1071 u32 flags)
1072{
1073 u8 old;
1074 int err;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001075 int notify = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001076 struct net_device *dev;
1077 int update_isrouter = 0;
1078
1079 write_lock_bh(&neigh->lock);
1080
1081 dev = neigh->dev;
1082 old = neigh->nud_state;
1083 err = -EPERM;
1084
YOSHIFUJI Hideaki4ec93ed2007-02-09 23:24:36 +09001085 if (!(flags & NEIGH_UPDATE_F_ADMIN) &&
Linus Torvalds1da177e2005-04-16 15:20:36 -07001086 (old & (NUD_NOARP | NUD_PERMANENT)))
1087 goto out;
1088
1089 if (!(new & NUD_VALID)) {
1090 neigh_del_timer(neigh);
1091 if (old & NUD_CONNECTED)
1092 neigh_suspect(neigh);
1093 neigh->nud_state = new;
1094 err = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001095 notify = old & NUD_VALID;
Timo Teras5ef12d92009-06-11 04:16:28 -07001096 if ((old & (NUD_INCOMPLETE | NUD_PROBE)) &&
1097 (new & NUD_FAILED)) {
1098 neigh_invalidate(neigh);
1099 notify = 1;
1100 }
Linus Torvalds1da177e2005-04-16 15:20:36 -07001101 goto out;
1102 }
1103
1104 /* Compare new lladdr with cached one */
1105 if (!dev->addr_len) {
1106 /* First case: device needs no address. */
1107 lladdr = neigh->ha;
1108 } else if (lladdr) {
1109 /* The second case: if something is already cached
1110 and a new address is proposed:
1111 - compare new & old
1112 - if they are different, check override flag
1113 */
YOSHIFUJI Hideaki4ec93ed2007-02-09 23:24:36 +09001114 if ((old & NUD_VALID) &&
Linus Torvalds1da177e2005-04-16 15:20:36 -07001115 !memcmp(lladdr, neigh->ha, dev->addr_len))
1116 lladdr = neigh->ha;
1117 } else {
1118 /* No address is supplied; if we know something,
1119 use it, otherwise discard the request.
1120 */
1121 err = -EINVAL;
1122 if (!(old & NUD_VALID))
1123 goto out;
1124 lladdr = neigh->ha;
1125 }
1126
1127 if (new & NUD_CONNECTED)
1128 neigh->confirmed = jiffies;
1129 neigh->updated = jiffies;
1130
1131 /* If entry was valid and address is not changed,
1132 do not change entry state, if new one is STALE.
1133 */
1134 err = 0;
1135 update_isrouter = flags & NEIGH_UPDATE_F_OVERRIDE_ISROUTER;
1136 if (old & NUD_VALID) {
1137 if (lladdr != neigh->ha && !(flags & NEIGH_UPDATE_F_OVERRIDE)) {
1138 update_isrouter = 0;
1139 if ((flags & NEIGH_UPDATE_F_WEAK_OVERRIDE) &&
1140 (old & NUD_CONNECTED)) {
1141 lladdr = neigh->ha;
1142 new = NUD_STALE;
1143 } else
1144 goto out;
1145 } else {
1146 if (lladdr == neigh->ha && new == NUD_STALE &&
1147 ((flags & NEIGH_UPDATE_F_WEAK_OVERRIDE) ||
1148 (old & NUD_CONNECTED))
1149 )
1150 new = old;
1151 }
1152 }
1153
1154 if (new != old) {
1155 neigh_del_timer(neigh);
Pavel Emelyanova43d8992007-12-20 15:49:05 -08001156 if (new & NUD_IN_TIMER)
YOSHIFUJI Hideaki4ec93ed2007-02-09 23:24:36 +09001157 neigh_add_timer(neigh, (jiffies +
1158 ((new & NUD_REACHABLE) ?
David S. Miller667347f2005-09-27 12:07:44 -07001159 neigh->parms->reachable_time :
1160 0)));
Linus Torvalds1da177e2005-04-16 15:20:36 -07001161 neigh->nud_state = new;
1162 }
1163
1164 if (lladdr != neigh->ha) {
Eric Dumazet0ed8ddf2010-10-07 10:44:07 +00001165 write_seqlock(&neigh->ha_lock);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001166 memcpy(&neigh->ha, lladdr, dev->addr_len);
Eric Dumazet0ed8ddf2010-10-07 10:44:07 +00001167 write_sequnlock(&neigh->ha_lock);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001168 neigh_update_hhs(neigh);
1169 if (!(new & NUD_CONNECTED))
1170 neigh->confirmed = jiffies -
1171 (neigh->parms->base_reachable_time << 1);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001172 notify = 1;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001173 }
1174 if (new == old)
1175 goto out;
1176 if (new & NUD_CONNECTED)
1177 neigh_connect(neigh);
1178 else
1179 neigh_suspect(neigh);
1180 if (!(old & NUD_VALID)) {
1181 struct sk_buff *skb;
1182
1183 /* Again: avoid dead loop if something went wrong */
1184
1185 while (neigh->nud_state & NUD_VALID &&
1186 (skb = __skb_dequeue(&neigh->arp_queue)) != NULL) {
David S. Miller69cce1d2011-07-17 23:09:49 -07001187 struct dst_entry *dst = skb_dst(skb);
1188 struct neighbour *n2, *n1 = neigh;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001189 write_unlock_bh(&neigh->lock);
roy.qing.li@gmail.come049f282011-10-17 22:32:42 +00001190
1191 rcu_read_lock();
David S. Miller13a43d92012-07-02 22:15:37 -07001192
1193 /* Why not just use 'neigh' as-is? The problem is that
1194 * things such as shaper, eql, and sch_teql can end up
1195 * using alternative, different, neigh objects to output
1196 * the packet in the output path. So what we need to do
1197 * here is re-lookup the top-level neigh in the path so
1198 * we can reinject the packet there.
1199 */
1200 n2 = NULL;
1201 if (dst) {
1202 n2 = dst_neigh_lookup_skb(dst, skb);
1203 if (n2)
1204 n1 = n2;
1205 }
David S. Miller8f40b162011-07-17 13:34:11 -07001206 n1->output(n1, skb);
David S. Miller13a43d92012-07-02 22:15:37 -07001207 if (n2)
1208 neigh_release(n2);
roy.qing.li@gmail.come049f282011-10-17 22:32:42 +00001209 rcu_read_unlock();
1210
Linus Torvalds1da177e2005-04-16 15:20:36 -07001211 write_lock_bh(&neigh->lock);
1212 }
1213 skb_queue_purge(&neigh->arp_queue);
Eric Dumazet8b5c1712011-11-09 12:07:14 +00001214 neigh->arp_queue_len_bytes = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001215 }
1216out:
1217 if (update_isrouter) {
1218 neigh->flags = (flags & NEIGH_UPDATE_F_ISROUTER) ?
1219 (neigh->flags | NTF_ROUTER) :
1220 (neigh->flags & ~NTF_ROUTER);
1221 }
1222 write_unlock_bh(&neigh->lock);
Tom Tucker8d717402006-07-30 20:43:36 -07001223
1224 if (notify)
Thomas Grafd961db32007-08-08 23:12:56 -07001225 neigh_update_notify(neigh);
1226
Linus Torvalds1da177e2005-04-16 15:20:36 -07001227 return err;
1228}
YOSHIFUJI Hideaki0a204502008-03-24 18:39:10 +09001229EXPORT_SYMBOL(neigh_update);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001230
1231struct neighbour *neigh_event_ns(struct neigh_table *tbl,
1232 u8 *lladdr, void *saddr,
1233 struct net_device *dev)
1234{
1235 struct neighbour *neigh = __neigh_lookup(tbl, saddr, dev,
1236 lladdr || !dev->addr_len);
1237 if (neigh)
YOSHIFUJI Hideaki4ec93ed2007-02-09 23:24:36 +09001238 neigh_update(neigh, lladdr, NUD_STALE,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001239 NEIGH_UPDATE_F_OVERRIDE);
1240 return neigh;
1241}
YOSHIFUJI Hideaki0a204502008-03-24 18:39:10 +09001242EXPORT_SYMBOL(neigh_event_ns);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001243
Eric Dumazet34d101d2010-10-11 09:16:57 -07001244/* called with read_lock_bh(&n->lock); */
David S. Millerf6b72b62011-07-14 07:53:20 -07001245static void neigh_hh_init(struct neighbour *n, struct dst_entry *dst)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001246{
Linus Torvalds1da177e2005-04-16 15:20:36 -07001247 struct net_device *dev = dst->dev;
David S. Millerf6b72b62011-07-14 07:53:20 -07001248 __be16 prot = dst->ops->protocol;
1249 struct hh_cache *hh = &n->hh;
Eric Dumazet0ed8ddf2010-10-07 10:44:07 +00001250
1251 write_lock_bh(&n->lock);
Eric Dumazet34d101d2010-10-11 09:16:57 -07001252
David S. Millerf6b72b62011-07-14 07:53:20 -07001253 /* Only one thread can come in here and initialize the
1254 * hh_cache entry.
1255 */
David S. Millerb23b5452011-07-16 17:45:02 -07001256 if (!hh->hh_len)
1257 dev->header_ops->cache(n, hh, prot);
David S. Millerf6b72b62011-07-14 07:53:20 -07001258
Eric Dumazet0ed8ddf2010-10-07 10:44:07 +00001259 write_unlock_bh(&n->lock);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001260}
1261
1262/* This function can be used in contexts, where only old dev_queue_xmit
Eric Dumazet767e97e2010-10-06 17:49:21 -07001263 * worked, f.e. if you want to override normal output path (eql, shaper),
1264 * but resolution is not made yet.
Linus Torvalds1da177e2005-04-16 15:20:36 -07001265 */
1266
David S. Miller8f40b162011-07-17 13:34:11 -07001267int neigh_compat_output(struct neighbour *neigh, struct sk_buff *skb)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001268{
1269 struct net_device *dev = skb->dev;
1270
Arnaldo Carvalho de Melobbe735e2007-03-10 22:16:10 -03001271 __skb_pull(skb, skb_network_offset(skb));
Linus Torvalds1da177e2005-04-16 15:20:36 -07001272
Stephen Hemminger0c4e8582007-10-09 01:36:32 -07001273 if (dev_hard_header(skb, dev, ntohs(skb->protocol), NULL, NULL,
1274 skb->len) < 0 &&
Stephen Hemminger3b04ddd2007-10-09 01:40:57 -07001275 dev->header_ops->rebuild(skb))
Linus Torvalds1da177e2005-04-16 15:20:36 -07001276 return 0;
1277
1278 return dev_queue_xmit(skb);
1279}
YOSHIFUJI Hideaki0a204502008-03-24 18:39:10 +09001280EXPORT_SYMBOL(neigh_compat_output);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001281
1282/* Slow and careful. */
1283
David S. Miller8f40b162011-07-17 13:34:11 -07001284int neigh_resolve_output(struct neighbour *neigh, struct sk_buff *skb)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001285{
Eric Dumazetadf30902009-06-02 05:19:30 +00001286 struct dst_entry *dst = skb_dst(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001287 int rc = 0;
1288
David S. Miller8f40b162011-07-17 13:34:11 -07001289 if (!dst)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001290 goto discard;
1291
Linus Torvalds1da177e2005-04-16 15:20:36 -07001292 if (!neigh_event_send(neigh, skb)) {
1293 int err;
1294 struct net_device *dev = neigh->dev;
Eric Dumazet0ed8ddf2010-10-07 10:44:07 +00001295 unsigned int seq;
Eric Dumazet34d101d2010-10-11 09:16:57 -07001296
David S. Millerf6b72b62011-07-14 07:53:20 -07001297 if (dev->header_ops->cache && !neigh->hh.hh_len)
1298 neigh_hh_init(neigh, dst);
Eric Dumazet34d101d2010-10-11 09:16:57 -07001299
Eric Dumazet0ed8ddf2010-10-07 10:44:07 +00001300 do {
ramesh.nagappa@gmail.come1f16502012-10-05 19:10:15 +00001301 __skb_pull(skb, skb_network_offset(skb));
Eric Dumazet0ed8ddf2010-10-07 10:44:07 +00001302 seq = read_seqbegin(&neigh->ha_lock);
1303 err = dev_hard_header(skb, dev, ntohs(skb->protocol),
1304 neigh->ha, NULL, skb->len);
1305 } while (read_seqretry(&neigh->ha_lock, seq));
Eric Dumazet34d101d2010-10-11 09:16:57 -07001306
Linus Torvalds1da177e2005-04-16 15:20:36 -07001307 if (err >= 0)
David S. Miller542d4d62011-07-16 18:06:24 -07001308 rc = dev_queue_xmit(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001309 else
1310 goto out_kfree_skb;
1311 }
1312out:
1313 return rc;
1314discard:
Joe Perchesd5d427c2013-04-15 15:17:19 +00001315 neigh_dbg(1, "%s: dst=%p neigh=%p\n", __func__, dst, neigh);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001316out_kfree_skb:
1317 rc = -EINVAL;
1318 kfree_skb(skb);
1319 goto out;
1320}
YOSHIFUJI Hideaki0a204502008-03-24 18:39:10 +09001321EXPORT_SYMBOL(neigh_resolve_output);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001322
1323/* As fast as possible without hh cache */
1324
David S. Miller8f40b162011-07-17 13:34:11 -07001325int neigh_connected_output(struct neighbour *neigh, struct sk_buff *skb)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001326{
Linus Torvalds1da177e2005-04-16 15:20:36 -07001327 struct net_device *dev = neigh->dev;
Eric Dumazet0ed8ddf2010-10-07 10:44:07 +00001328 unsigned int seq;
David S. Miller8f40b162011-07-17 13:34:11 -07001329 int err;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001330
Eric Dumazet0ed8ddf2010-10-07 10:44:07 +00001331 do {
ramesh.nagappa@gmail.come1f16502012-10-05 19:10:15 +00001332 __skb_pull(skb, skb_network_offset(skb));
Eric Dumazet0ed8ddf2010-10-07 10:44:07 +00001333 seq = read_seqbegin(&neigh->ha_lock);
1334 err = dev_hard_header(skb, dev, ntohs(skb->protocol),
1335 neigh->ha, NULL, skb->len);
1336 } while (read_seqretry(&neigh->ha_lock, seq));
1337
Linus Torvalds1da177e2005-04-16 15:20:36 -07001338 if (err >= 0)
David S. Miller542d4d62011-07-16 18:06:24 -07001339 err = dev_queue_xmit(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001340 else {
1341 err = -EINVAL;
1342 kfree_skb(skb);
1343 }
1344 return err;
1345}
YOSHIFUJI Hideaki0a204502008-03-24 18:39:10 +09001346EXPORT_SYMBOL(neigh_connected_output);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001347
/* Output routine that passes @skb straight to dev_queue_xmit(); @neigh
 * is not used.
 */
int neigh_direct_output(struct neighbour *neigh, struct sk_buff *skb)
{
	int rc = dev_queue_xmit(skb);

	return rc;
}
EXPORT_SYMBOL(neigh_direct_output);
1353
Linus Torvalds1da177e2005-04-16 15:20:36 -07001354static void neigh_proxy_process(unsigned long arg)
1355{
1356 struct neigh_table *tbl = (struct neigh_table *)arg;
1357 long sched_next = 0;
1358 unsigned long now = jiffies;
David S. Millerf72051b2008-09-23 01:11:18 -07001359 struct sk_buff *skb, *n;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001360
1361 spin_lock(&tbl->proxy_queue.lock);
1362
David S. Millerf72051b2008-09-23 01:11:18 -07001363 skb_queue_walk_safe(&tbl->proxy_queue, skb, n) {
1364 long tdif = NEIGH_CB(skb)->sched_next - now;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001365
Linus Torvalds1da177e2005-04-16 15:20:36 -07001366 if (tdif <= 0) {
David S. Millerf72051b2008-09-23 01:11:18 -07001367 struct net_device *dev = skb->dev;
Eric Dumazet20e60742011-08-22 19:32:42 +00001368
David S. Millerf72051b2008-09-23 01:11:18 -07001369 __skb_unlink(skb, &tbl->proxy_queue);
Eric Dumazet20e60742011-08-22 19:32:42 +00001370 if (tbl->proxy_redo && netif_running(dev)) {
1371 rcu_read_lock();
David S. Millerf72051b2008-09-23 01:11:18 -07001372 tbl->proxy_redo(skb);
Eric Dumazet20e60742011-08-22 19:32:42 +00001373 rcu_read_unlock();
1374 } else {
David S. Millerf72051b2008-09-23 01:11:18 -07001375 kfree_skb(skb);
Eric Dumazet20e60742011-08-22 19:32:42 +00001376 }
Linus Torvalds1da177e2005-04-16 15:20:36 -07001377
1378 dev_put(dev);
1379 } else if (!sched_next || tdif < sched_next)
1380 sched_next = tdif;
1381 }
1382 del_timer(&tbl->proxy_timer);
1383 if (sched_next)
1384 mod_timer(&tbl->proxy_timer, jiffies + sched_next);
1385 spin_unlock(&tbl->proxy_queue.lock);
1386}
1387
1388void pneigh_enqueue(struct neigh_table *tbl, struct neigh_parms *p,
1389 struct sk_buff *skb)
1390{
1391 unsigned long now = jiffies;
1392 unsigned long sched_next = now + (net_random() % p->proxy_delay);
1393
1394 if (tbl->proxy_queue.qlen > p->proxy_qlen) {
1395 kfree_skb(skb);
1396 return;
1397 }
Patrick McHardya61bbcf2005-08-14 17:24:31 -07001398
1399 NEIGH_CB(skb)->sched_next = sched_next;
1400 NEIGH_CB(skb)->flags |= LOCALLY_ENQUEUED;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001401
1402 spin_lock(&tbl->proxy_queue.lock);
1403 if (del_timer(&tbl->proxy_timer)) {
1404 if (time_before(tbl->proxy_timer.expires, sched_next))
1405 sched_next = tbl->proxy_timer.expires;
1406 }
Eric Dumazetadf30902009-06-02 05:19:30 +00001407 skb_dst_drop(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001408 dev_hold(skb->dev);
1409 __skb_queue_tail(&tbl->proxy_queue, skb);
1410 mod_timer(&tbl->proxy_timer, sched_next);
1411 spin_unlock(&tbl->proxy_queue.lock);
1412}
YOSHIFUJI Hideaki0a204502008-03-24 18:39:10 +09001413EXPORT_SYMBOL(pneigh_enqueue);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001414
Tobias Klauser97fd5bc2009-07-13 11:17:49 -07001415static inline struct neigh_parms *lookup_neigh_parms(struct neigh_table *tbl,
Eric W. Biederman426b5302008-01-24 00:13:18 -08001416 struct net *net, int ifindex)
1417{
1418 struct neigh_parms *p;
1419
1420 for (p = &tbl->parms; p; p = p->next) {
YOSHIFUJI Hideaki878628f2008-03-26 03:57:35 +09001421 if ((p->dev && p->dev->ifindex == ifindex && net_eq(neigh_parms_net(p), net)) ||
Gao feng170d6f92013-06-20 10:01:33 +08001422 (!p->dev && !ifindex && net_eq(net, &init_net)))
Eric W. Biederman426b5302008-01-24 00:13:18 -08001423 return p;
1424 }
1425
1426 return NULL;
1427}
Linus Torvalds1da177e2005-04-16 15:20:36 -07001428
1429struct neigh_parms *neigh_parms_alloc(struct net_device *dev,
1430 struct neigh_table *tbl)
1431{
Gao fengcf89d6b2013-06-20 10:01:32 +08001432 struct neigh_parms *p;
Stephen Hemminger00829822008-11-20 20:14:53 -08001433 struct net *net = dev_net(dev);
1434 const struct net_device_ops *ops = dev->netdev_ops;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001435
Gao fengcf89d6b2013-06-20 10:01:32 +08001436 p = kmemdup(&tbl->parms, sizeof(*p), GFP_KERNEL);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001437 if (p) {
Linus Torvalds1da177e2005-04-16 15:20:36 -07001438 p->tbl = tbl;
1439 atomic_set(&p->refcnt, 1);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001440 p->reachable_time =
1441 neigh_rand_reach_time(p->base_reachable_time);
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001442
Stephen Hemminger00829822008-11-20 20:14:53 -08001443 if (ops->ndo_neigh_setup && ops->ndo_neigh_setup(dev, p)) {
Denis V. Lunev486b51d2008-01-14 22:59:59 -08001444 kfree(p);
1445 return NULL;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001446 }
Denis V. Lunev486b51d2008-01-14 22:59:59 -08001447
1448 dev_hold(dev);
1449 p->dev = dev;
Eric Dumazete42ea982008-11-12 00:54:54 -08001450 write_pnet(&p->net, hold_net(net));
Linus Torvalds1da177e2005-04-16 15:20:36 -07001451 p->sysctl_table = NULL;
1452 write_lock_bh(&tbl->lock);
1453 p->next = tbl->parms.next;
1454 tbl->parms.next = p;
1455 write_unlock_bh(&tbl->lock);
1456 }
1457 return p;
1458}
YOSHIFUJI Hideaki0a204502008-03-24 18:39:10 +09001459EXPORT_SYMBOL(neigh_parms_alloc);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001460
1461static void neigh_rcu_free_parms(struct rcu_head *head)
1462{
1463 struct neigh_parms *parms =
1464 container_of(head, struct neigh_parms, rcu_head);
1465
1466 neigh_parms_put(parms);
1467}
1468
1469void neigh_parms_release(struct neigh_table *tbl, struct neigh_parms *parms)
1470{
1471 struct neigh_parms **p;
1472
1473 if (!parms || parms == &tbl->parms)
1474 return;
1475 write_lock_bh(&tbl->lock);
1476 for (p = &tbl->parms.next; *p; p = &(*p)->next) {
1477 if (*p == parms) {
1478 *p = parms->next;
1479 parms->dead = 1;
1480 write_unlock_bh(&tbl->lock);
David S. Millercecbb632008-01-20 16:39:03 -08001481 if (parms->dev)
1482 dev_put(parms->dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001483 call_rcu(&parms->rcu_head, neigh_rcu_free_parms);
1484 return;
1485 }
1486 }
1487 write_unlock_bh(&tbl->lock);
Joe Perchesd5d427c2013-04-15 15:17:19 +00001488 neigh_dbg(1, "%s: not found\n", __func__);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001489}
YOSHIFUJI Hideaki0a204502008-03-24 18:39:10 +09001490EXPORT_SYMBOL(neigh_parms_release);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001491
/*
 * Final teardown of a parameter set: release the namespace reference
 * recorded in it, then free the memory.
 */
static void neigh_parms_destroy(struct neigh_parms *parms)
{
	struct net *owner = neigh_parms_net(parms);

	release_net(owner);
	kfree(parms);
}
1497
Pavel Emelianovc2ecba72007-04-17 12:45:31 -07001498static struct lock_class_key neigh_table_proxy_queue_class;
1499
Hiroaki SHIMODAdcd2ba92012-04-13 07:34:44 +00001500static void neigh_table_init_no_netlink(struct neigh_table *tbl)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001501{
1502 unsigned long now = jiffies;
1503 unsigned long phsize;
1504
Eric Dumazete42ea982008-11-12 00:54:54 -08001505 write_pnet(&tbl->parms.net, &init_net);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001506 atomic_set(&tbl->parms.refcnt, 1);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001507 tbl->parms.reachable_time =
1508 neigh_rand_reach_time(tbl->parms.base_reachable_time);
1509
Linus Torvalds1da177e2005-04-16 15:20:36 -07001510 tbl->stats = alloc_percpu(struct neigh_statistics);
1511 if (!tbl->stats)
1512 panic("cannot create neighbour cache statistics");
YOSHIFUJI Hideaki4ec93ed2007-02-09 23:24:36 +09001513
Linus Torvalds1da177e2005-04-16 15:20:36 -07001514#ifdef CONFIG_PROC_FS
Alexey Dobriyan9b739ba2008-11-11 16:47:44 -08001515 if (!proc_create_data(tbl->id, 0, init_net.proc_net_stat,
1516 &neigh_stat_seq_fops, tbl))
Linus Torvalds1da177e2005-04-16 15:20:36 -07001517 panic("cannot create neighbour proc dir entry");
Linus Torvalds1da177e2005-04-16 15:20:36 -07001518#endif
1519
David S. Millercd089332011-07-11 01:28:12 -07001520 RCU_INIT_POINTER(tbl->nht, neigh_hash_alloc(3));
Linus Torvalds1da177e2005-04-16 15:20:36 -07001521
1522 phsize = (PNEIGH_HASHMASK + 1) * sizeof(struct pneigh_entry *);
Andrew Morton77d04bd2006-04-07 14:52:59 -07001523 tbl->phash_buckets = kzalloc(phsize, GFP_KERNEL);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001524
Eric Dumazetd6bf7812010-10-04 06:15:44 +00001525 if (!tbl->nht || !tbl->phash_buckets)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001526 panic("cannot allocate neighbour cache hashes");
1527
YOSHIFUJI Hideaki / 吉藤英明08433ef2013-01-24 00:44:23 +00001528 if (!tbl->entry_size)
1529 tbl->entry_size = ALIGN(offsetof(struct neighbour, primary_key) +
1530 tbl->key_len, NEIGH_PRIV_ALIGN);
1531 else
1532 WARN_ON(tbl->entry_size % NEIGH_PRIV_ALIGN);
1533
Linus Torvalds1da177e2005-04-16 15:20:36 -07001534 rwlock_init(&tbl->lock);
Tejun Heo203b42f2012-08-21 13:18:23 -07001535 INIT_DEFERRABLE_WORK(&tbl->gc_work, neigh_periodic_work);
Eric Dumazete4c4e442009-07-30 03:15:07 +00001536 schedule_delayed_work(&tbl->gc_work, tbl->parms.reachable_time);
Pavel Emelyanovb24b8a22008-01-23 21:20:07 -08001537 setup_timer(&tbl->proxy_timer, neigh_proxy_process, (unsigned long)tbl);
Pavel Emelianovc2ecba72007-04-17 12:45:31 -07001538 skb_queue_head_init_class(&tbl->proxy_queue,
1539 &neigh_table_proxy_queue_class);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001540
1541 tbl->last_flush = now;
1542 tbl->last_rand = now + tbl->parms.reachable_time * 20;
Simon Kelleybd89efc2006-05-12 14:56:08 -07001543}
1544
1545void neigh_table_init(struct neigh_table *tbl)
1546{
1547 struct neigh_table *tmp;
1548
1549 neigh_table_init_no_netlink(tbl);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001550 write_lock(&neigh_tbl_lock);
Simon Kelleybd89efc2006-05-12 14:56:08 -07001551 for (tmp = neigh_tables; tmp; tmp = tmp->next) {
1552 if (tmp->family == tbl->family)
1553 break;
1554 }
Linus Torvalds1da177e2005-04-16 15:20:36 -07001555 tbl->next = neigh_tables;
1556 neigh_tables = tbl;
1557 write_unlock(&neigh_tbl_lock);
Simon Kelleybd89efc2006-05-12 14:56:08 -07001558
1559 if (unlikely(tmp)) {
Joe Perchese005d192012-05-16 19:58:40 +00001560 pr_err("Registering multiple tables for family %d\n",
1561 tbl->family);
Simon Kelleybd89efc2006-05-12 14:56:08 -07001562 dump_stack();
1563 }
Linus Torvalds1da177e2005-04-16 15:20:36 -07001564}
YOSHIFUJI Hideaki0a204502008-03-24 18:39:10 +09001565EXPORT_SYMBOL(neigh_table_init);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001566
1567int neigh_table_clear(struct neigh_table *tbl)
1568{
1569 struct neigh_table **tp;
1570
1571 /* It is not clean... Fix it to unload IPv6 module safely */
Tejun Heoa5c30b32010-10-19 06:04:42 +00001572 cancel_delayed_work_sync(&tbl->gc_work);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001573 del_timer_sync(&tbl->proxy_timer);
1574 pneigh_queue_purge(&tbl->proxy_queue);
1575 neigh_ifdown(tbl, NULL);
1576 if (atomic_read(&tbl->entries))
Joe Perchese005d192012-05-16 19:58:40 +00001577 pr_crit("neighbour leakage\n");
Linus Torvalds1da177e2005-04-16 15:20:36 -07001578 write_lock(&neigh_tbl_lock);
1579 for (tp = &neigh_tables; *tp; tp = &(*tp)->next) {
1580 if (*tp == tbl) {
1581 *tp = tbl->next;
1582 break;
1583 }
1584 }
1585 write_unlock(&neigh_tbl_lock);
1586
Eric Dumazet6193d2b2011-01-19 22:02:47 +00001587 call_rcu(&rcu_dereference_protected(tbl->nht, 1)->rcu,
1588 neigh_hash_free_rcu);
Eric Dumazetd6bf7812010-10-04 06:15:44 +00001589 tbl->nht = NULL;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001590
1591 kfree(tbl->phash_buckets);
1592 tbl->phash_buckets = NULL;
1593
Alexey Dobriyan3f192b52007-11-05 21:28:13 -08001594 remove_proc_entry(tbl->id, init_net.proc_net_stat);
1595
Kirill Korotaev3fcde742006-09-01 01:34:10 -07001596 free_percpu(tbl->stats);
1597 tbl->stats = NULL;
1598
Linus Torvalds1da177e2005-04-16 15:20:36 -07001599 return 0;
1600}
YOSHIFUJI Hideaki0a204502008-03-24 18:39:10 +09001601EXPORT_SYMBOL(neigh_table_clear);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001602
Thomas Graf661d2962013-03-21 07:45:29 +00001603static int neigh_delete(struct sk_buff *skb, struct nlmsghdr *nlh)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001604{
YOSHIFUJI Hideaki3b1e0a62008-03-26 02:26:21 +09001605 struct net *net = sock_net(skb->sk);
Thomas Grafa14a49d2006-08-07 17:53:08 -07001606 struct ndmsg *ndm;
1607 struct nlattr *dst_attr;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001608 struct neigh_table *tbl;
1609 struct net_device *dev = NULL;
Thomas Grafa14a49d2006-08-07 17:53:08 -07001610 int err = -EINVAL;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001611
Eric Dumazet110b2492010-10-04 04:27:36 +00001612 ASSERT_RTNL();
Thomas Grafa14a49d2006-08-07 17:53:08 -07001613 if (nlmsg_len(nlh) < sizeof(*ndm))
Linus Torvalds1da177e2005-04-16 15:20:36 -07001614 goto out;
1615
Thomas Grafa14a49d2006-08-07 17:53:08 -07001616 dst_attr = nlmsg_find_attr(nlh, sizeof(*ndm), NDA_DST);
1617 if (dst_attr == NULL)
1618 goto out;
1619
1620 ndm = nlmsg_data(nlh);
1621 if (ndm->ndm_ifindex) {
Eric Dumazet110b2492010-10-04 04:27:36 +00001622 dev = __dev_get_by_index(net, ndm->ndm_ifindex);
Thomas Grafa14a49d2006-08-07 17:53:08 -07001623 if (dev == NULL) {
1624 err = -ENODEV;
1625 goto out;
1626 }
1627 }
1628
Linus Torvalds1da177e2005-04-16 15:20:36 -07001629 read_lock(&neigh_tbl_lock);
1630 for (tbl = neigh_tables; tbl; tbl = tbl->next) {
Thomas Grafa14a49d2006-08-07 17:53:08 -07001631 struct neighbour *neigh;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001632
1633 if (tbl->family != ndm->ndm_family)
1634 continue;
1635 read_unlock(&neigh_tbl_lock);
1636
Thomas Grafa14a49d2006-08-07 17:53:08 -07001637 if (nla_len(dst_attr) < tbl->key_len)
Eric Dumazet110b2492010-10-04 04:27:36 +00001638 goto out;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001639
1640 if (ndm->ndm_flags & NTF_PROXY) {
Eric W. Biederman426b5302008-01-24 00:13:18 -08001641 err = pneigh_delete(tbl, net, nla_data(dst_attr), dev);
Eric Dumazet110b2492010-10-04 04:27:36 +00001642 goto out;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001643 }
1644
Thomas Grafa14a49d2006-08-07 17:53:08 -07001645 if (dev == NULL)
Eric Dumazet110b2492010-10-04 04:27:36 +00001646 goto out;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001647
Thomas Grafa14a49d2006-08-07 17:53:08 -07001648 neigh = neigh_lookup(tbl, nla_data(dst_attr), dev);
1649 if (neigh == NULL) {
1650 err = -ENOENT;
Eric Dumazet110b2492010-10-04 04:27:36 +00001651 goto out;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001652 }
Thomas Grafa14a49d2006-08-07 17:53:08 -07001653
1654 err = neigh_update(neigh, NULL, NUD_FAILED,
1655 NEIGH_UPDATE_F_OVERRIDE |
1656 NEIGH_UPDATE_F_ADMIN);
1657 neigh_release(neigh);
Eric Dumazet110b2492010-10-04 04:27:36 +00001658 goto out;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001659 }
1660 read_unlock(&neigh_tbl_lock);
Thomas Grafa14a49d2006-08-07 17:53:08 -07001661 err = -EAFNOSUPPORT;
1662
Linus Torvalds1da177e2005-04-16 15:20:36 -07001663out:
1664 return err;
1665}
1666
Thomas Graf661d2962013-03-21 07:45:29 +00001667static int neigh_add(struct sk_buff *skb, struct nlmsghdr *nlh)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001668{
YOSHIFUJI Hideaki3b1e0a62008-03-26 02:26:21 +09001669 struct net *net = sock_net(skb->sk);
Thomas Graf5208deb2006-08-07 17:55:40 -07001670 struct ndmsg *ndm;
1671 struct nlattr *tb[NDA_MAX+1];
Linus Torvalds1da177e2005-04-16 15:20:36 -07001672 struct neigh_table *tbl;
1673 struct net_device *dev = NULL;
Thomas Graf5208deb2006-08-07 17:55:40 -07001674 int err;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001675
Eric Dumazet110b2492010-10-04 04:27:36 +00001676 ASSERT_RTNL();
Thomas Graf5208deb2006-08-07 17:55:40 -07001677 err = nlmsg_parse(nlh, sizeof(*ndm), tb, NDA_MAX, NULL);
1678 if (err < 0)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001679 goto out;
1680
Thomas Graf5208deb2006-08-07 17:55:40 -07001681 err = -EINVAL;
1682 if (tb[NDA_DST] == NULL)
1683 goto out;
1684
1685 ndm = nlmsg_data(nlh);
1686 if (ndm->ndm_ifindex) {
Eric Dumazet110b2492010-10-04 04:27:36 +00001687 dev = __dev_get_by_index(net, ndm->ndm_ifindex);
Thomas Graf5208deb2006-08-07 17:55:40 -07001688 if (dev == NULL) {
1689 err = -ENODEV;
1690 goto out;
1691 }
1692
1693 if (tb[NDA_LLADDR] && nla_len(tb[NDA_LLADDR]) < dev->addr_len)
Eric Dumazet110b2492010-10-04 04:27:36 +00001694 goto out;
Thomas Graf5208deb2006-08-07 17:55:40 -07001695 }
1696
Linus Torvalds1da177e2005-04-16 15:20:36 -07001697 read_lock(&neigh_tbl_lock);
1698 for (tbl = neigh_tables; tbl; tbl = tbl->next) {
Thomas Graf5208deb2006-08-07 17:55:40 -07001699 int flags = NEIGH_UPDATE_F_ADMIN | NEIGH_UPDATE_F_OVERRIDE;
1700 struct neighbour *neigh;
1701 void *dst, *lladdr;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001702
1703 if (tbl->family != ndm->ndm_family)
1704 continue;
1705 read_unlock(&neigh_tbl_lock);
1706
Thomas Graf5208deb2006-08-07 17:55:40 -07001707 if (nla_len(tb[NDA_DST]) < tbl->key_len)
Eric Dumazet110b2492010-10-04 04:27:36 +00001708 goto out;
Thomas Graf5208deb2006-08-07 17:55:40 -07001709 dst = nla_data(tb[NDA_DST]);
1710 lladdr = tb[NDA_LLADDR] ? nla_data(tb[NDA_LLADDR]) : NULL;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001711
1712 if (ndm->ndm_flags & NTF_PROXY) {
Ville Nuorvala62dd9312006-09-22 14:43:19 -07001713 struct pneigh_entry *pn;
1714
1715 err = -ENOBUFS;
Eric W. Biederman426b5302008-01-24 00:13:18 -08001716 pn = pneigh_lookup(tbl, net, dst, dev, 1);
Ville Nuorvala62dd9312006-09-22 14:43:19 -07001717 if (pn) {
1718 pn->flags = ndm->ndm_flags;
1719 err = 0;
1720 }
Eric Dumazet110b2492010-10-04 04:27:36 +00001721 goto out;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001722 }
1723
Thomas Graf5208deb2006-08-07 17:55:40 -07001724 if (dev == NULL)
Eric Dumazet110b2492010-10-04 04:27:36 +00001725 goto out;
Thomas Graf5208deb2006-08-07 17:55:40 -07001726
1727 neigh = neigh_lookup(tbl, dst, dev);
1728 if (neigh == NULL) {
1729 if (!(nlh->nlmsg_flags & NLM_F_CREATE)) {
1730 err = -ENOENT;
Eric Dumazet110b2492010-10-04 04:27:36 +00001731 goto out;
Thomas Graf5208deb2006-08-07 17:55:40 -07001732 }
YOSHIFUJI Hideaki4ec93ed2007-02-09 23:24:36 +09001733
Thomas Graf5208deb2006-08-07 17:55:40 -07001734 neigh = __neigh_lookup_errno(tbl, dst, dev);
1735 if (IS_ERR(neigh)) {
1736 err = PTR_ERR(neigh);
Eric Dumazet110b2492010-10-04 04:27:36 +00001737 goto out;
Thomas Graf5208deb2006-08-07 17:55:40 -07001738 }
1739 } else {
Linus Torvalds1da177e2005-04-16 15:20:36 -07001740 if (nlh->nlmsg_flags & NLM_F_EXCL) {
1741 err = -EEXIST;
Thomas Graf5208deb2006-08-07 17:55:40 -07001742 neigh_release(neigh);
Eric Dumazet110b2492010-10-04 04:27:36 +00001743 goto out;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001744 }
Thomas Graf5208deb2006-08-07 17:55:40 -07001745
1746 if (!(nlh->nlmsg_flags & NLM_F_REPLACE))
1747 flags &= ~NEIGH_UPDATE_F_OVERRIDE;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001748 }
1749
Eric Biederman0c5c2d32009-03-04 00:03:08 -08001750 if (ndm->ndm_flags & NTF_USE) {
1751 neigh_event_send(neigh, NULL);
1752 err = 0;
1753 } else
1754 err = neigh_update(neigh, lladdr, ndm->ndm_state, flags);
Thomas Graf5208deb2006-08-07 17:55:40 -07001755 neigh_release(neigh);
Eric Dumazet110b2492010-10-04 04:27:36 +00001756 goto out;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001757 }
1758
1759 read_unlock(&neigh_tbl_lock);
Thomas Graf5208deb2006-08-07 17:55:40 -07001760 err = -EAFNOSUPPORT;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001761out:
1762 return err;
1763}
1764
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001765static int neightbl_fill_parms(struct sk_buff *skb, struct neigh_parms *parms)
1766{
Thomas Grafca860fb2006-08-07 18:00:18 -07001767 struct nlattr *nest;
1768
1769 nest = nla_nest_start(skb, NDTA_PARMS);
1770 if (nest == NULL)
1771 return -ENOBUFS;
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001772
David S. Miller9a6308d2012-04-01 20:06:28 -04001773 if ((parms->dev &&
1774 nla_put_u32(skb, NDTPA_IFINDEX, parms->dev->ifindex)) ||
1775 nla_put_u32(skb, NDTPA_REFCNT, atomic_read(&parms->refcnt)) ||
1776 nla_put_u32(skb, NDTPA_QUEUE_LENBYTES, parms->queue_len_bytes) ||
1777 /* approximative value for deprecated QUEUE_LEN (in packets) */
1778 nla_put_u32(skb, NDTPA_QUEUE_LEN,
Shan Weice46cc62012-12-04 18:49:15 +00001779 parms->queue_len_bytes / SKB_TRUESIZE(ETH_FRAME_LEN)) ||
David S. Miller9a6308d2012-04-01 20:06:28 -04001780 nla_put_u32(skb, NDTPA_PROXY_QLEN, parms->proxy_qlen) ||
1781 nla_put_u32(skb, NDTPA_APP_PROBES, parms->app_probes) ||
1782 nla_put_u32(skb, NDTPA_UCAST_PROBES, parms->ucast_probes) ||
1783 nla_put_u32(skb, NDTPA_MCAST_PROBES, parms->mcast_probes) ||
1784 nla_put_msecs(skb, NDTPA_REACHABLE_TIME, parms->reachable_time) ||
1785 nla_put_msecs(skb, NDTPA_BASE_REACHABLE_TIME,
1786 parms->base_reachable_time) ||
1787 nla_put_msecs(skb, NDTPA_GC_STALETIME, parms->gc_staletime) ||
1788 nla_put_msecs(skb, NDTPA_DELAY_PROBE_TIME,
1789 parms->delay_probe_time) ||
1790 nla_put_msecs(skb, NDTPA_RETRANS_TIME, parms->retrans_time) ||
1791 nla_put_msecs(skb, NDTPA_ANYCAST_DELAY, parms->anycast_delay) ||
1792 nla_put_msecs(skb, NDTPA_PROXY_DELAY, parms->proxy_delay) ||
1793 nla_put_msecs(skb, NDTPA_LOCKTIME, parms->locktime))
1794 goto nla_put_failure;
Thomas Grafca860fb2006-08-07 18:00:18 -07001795 return nla_nest_end(skb, nest);
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001796
Thomas Grafca860fb2006-08-07 18:00:18 -07001797nla_put_failure:
Thomas Grafbc3ed282008-06-03 16:36:54 -07001798 nla_nest_cancel(skb, nest);
1799 return -EMSGSIZE;
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001800}
1801
Thomas Grafca860fb2006-08-07 18:00:18 -07001802static int neightbl_fill_info(struct sk_buff *skb, struct neigh_table *tbl,
1803 u32 pid, u32 seq, int type, int flags)
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001804{
1805 struct nlmsghdr *nlh;
1806 struct ndtmsg *ndtmsg;
1807
Thomas Grafca860fb2006-08-07 18:00:18 -07001808 nlh = nlmsg_put(skb, pid, seq, type, sizeof(*ndtmsg), flags);
1809 if (nlh == NULL)
Patrick McHardy26932562007-01-31 23:16:40 -08001810 return -EMSGSIZE;
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001811
Thomas Grafca860fb2006-08-07 18:00:18 -07001812 ndtmsg = nlmsg_data(nlh);
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001813
1814 read_lock_bh(&tbl->lock);
1815 ndtmsg->ndtm_family = tbl->family;
Patrick McHardy9ef1d4c2005-06-28 12:55:30 -07001816 ndtmsg->ndtm_pad1 = 0;
1817 ndtmsg->ndtm_pad2 = 0;
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001818
David S. Miller9a6308d2012-04-01 20:06:28 -04001819 if (nla_put_string(skb, NDTA_NAME, tbl->id) ||
1820 nla_put_msecs(skb, NDTA_GC_INTERVAL, tbl->gc_interval) ||
1821 nla_put_u32(skb, NDTA_THRESH1, tbl->gc_thresh1) ||
1822 nla_put_u32(skb, NDTA_THRESH2, tbl->gc_thresh2) ||
1823 nla_put_u32(skb, NDTA_THRESH3, tbl->gc_thresh3))
1824 goto nla_put_failure;
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001825 {
1826 unsigned long now = jiffies;
1827 unsigned int flush_delta = now - tbl->last_flush;
1828 unsigned int rand_delta = now - tbl->last_rand;
Eric Dumazetd6bf7812010-10-04 06:15:44 +00001829 struct neigh_hash_table *nht;
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001830 struct ndt_config ndc = {
1831 .ndtc_key_len = tbl->key_len,
1832 .ndtc_entry_size = tbl->entry_size,
1833 .ndtc_entries = atomic_read(&tbl->entries),
1834 .ndtc_last_flush = jiffies_to_msecs(flush_delta),
1835 .ndtc_last_rand = jiffies_to_msecs(rand_delta),
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001836 .ndtc_proxy_qlen = tbl->proxy_queue.qlen,
1837 };
1838
Eric Dumazetd6bf7812010-10-04 06:15:44 +00001839 rcu_read_lock_bh();
1840 nht = rcu_dereference_bh(tbl->nht);
David S. Miller2c2aba62011-12-28 15:06:58 -05001841 ndc.ndtc_hash_rnd = nht->hash_rnd[0];
David S. Millercd089332011-07-11 01:28:12 -07001842 ndc.ndtc_hash_mask = ((1 << nht->hash_shift) - 1);
Eric Dumazetd6bf7812010-10-04 06:15:44 +00001843 rcu_read_unlock_bh();
1844
David S. Miller9a6308d2012-04-01 20:06:28 -04001845 if (nla_put(skb, NDTA_CONFIG, sizeof(ndc), &ndc))
1846 goto nla_put_failure;
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001847 }
1848
1849 {
1850 int cpu;
1851 struct ndt_stats ndst;
1852
1853 memset(&ndst, 0, sizeof(ndst));
1854
KAMEZAWA Hiroyuki6f912042006-04-10 22:52:50 -07001855 for_each_possible_cpu(cpu) {
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001856 struct neigh_statistics *st;
1857
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001858 st = per_cpu_ptr(tbl->stats, cpu);
1859 ndst.ndts_allocs += st->allocs;
1860 ndst.ndts_destroys += st->destroys;
1861 ndst.ndts_hash_grows += st->hash_grows;
1862 ndst.ndts_res_failed += st->res_failed;
1863 ndst.ndts_lookups += st->lookups;
1864 ndst.ndts_hits += st->hits;
1865 ndst.ndts_rcv_probes_mcast += st->rcv_probes_mcast;
1866 ndst.ndts_rcv_probes_ucast += st->rcv_probes_ucast;
1867 ndst.ndts_periodic_gc_runs += st->periodic_gc_runs;
1868 ndst.ndts_forced_gc_runs += st->forced_gc_runs;
1869 }
1870
David S. Miller9a6308d2012-04-01 20:06:28 -04001871 if (nla_put(skb, NDTA_STATS, sizeof(ndst), &ndst))
1872 goto nla_put_failure;
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001873 }
1874
1875 BUG_ON(tbl->parms.dev);
1876 if (neightbl_fill_parms(skb, &tbl->parms) < 0)
Thomas Grafca860fb2006-08-07 18:00:18 -07001877 goto nla_put_failure;
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001878
1879 read_unlock_bh(&tbl->lock);
Thomas Grafca860fb2006-08-07 18:00:18 -07001880 return nlmsg_end(skb, nlh);
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001881
Thomas Grafca860fb2006-08-07 18:00:18 -07001882nla_put_failure:
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001883 read_unlock_bh(&tbl->lock);
Patrick McHardy26932562007-01-31 23:16:40 -08001884 nlmsg_cancel(skb, nlh);
1885 return -EMSGSIZE;
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001886}
1887
Thomas Grafca860fb2006-08-07 18:00:18 -07001888static int neightbl_fill_param_info(struct sk_buff *skb,
1889 struct neigh_table *tbl,
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001890 struct neigh_parms *parms,
Thomas Grafca860fb2006-08-07 18:00:18 -07001891 u32 pid, u32 seq, int type,
1892 unsigned int flags)
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001893{
1894 struct ndtmsg *ndtmsg;
1895 struct nlmsghdr *nlh;
1896
Thomas Grafca860fb2006-08-07 18:00:18 -07001897 nlh = nlmsg_put(skb, pid, seq, type, sizeof(*ndtmsg), flags);
1898 if (nlh == NULL)
Patrick McHardy26932562007-01-31 23:16:40 -08001899 return -EMSGSIZE;
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001900
Thomas Grafca860fb2006-08-07 18:00:18 -07001901 ndtmsg = nlmsg_data(nlh);
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001902
1903 read_lock_bh(&tbl->lock);
1904 ndtmsg->ndtm_family = tbl->family;
Patrick McHardy9ef1d4c2005-06-28 12:55:30 -07001905 ndtmsg->ndtm_pad1 = 0;
1906 ndtmsg->ndtm_pad2 = 0;
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001907
Thomas Grafca860fb2006-08-07 18:00:18 -07001908 if (nla_put_string(skb, NDTA_NAME, tbl->id) < 0 ||
1909 neightbl_fill_parms(skb, parms) < 0)
1910 goto errout;
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001911
1912 read_unlock_bh(&tbl->lock);
Thomas Grafca860fb2006-08-07 18:00:18 -07001913 return nlmsg_end(skb, nlh);
1914errout:
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001915 read_unlock_bh(&tbl->lock);
Patrick McHardy26932562007-01-31 23:16:40 -08001916 nlmsg_cancel(skb, nlh);
1917 return -EMSGSIZE;
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001918}
YOSHIFUJI Hideaki4ec93ed2007-02-09 23:24:36 +09001919
Patrick McHardyef7c79e2007-06-05 12:38:30 -07001920static const struct nla_policy nl_neightbl_policy[NDTA_MAX+1] = {
Thomas Graf6b3f8672006-08-07 17:58:53 -07001921 [NDTA_NAME] = { .type = NLA_STRING },
1922 [NDTA_THRESH1] = { .type = NLA_U32 },
1923 [NDTA_THRESH2] = { .type = NLA_U32 },
1924 [NDTA_THRESH3] = { .type = NLA_U32 },
1925 [NDTA_GC_INTERVAL] = { .type = NLA_U64 },
1926 [NDTA_PARMS] = { .type = NLA_NESTED },
1927};
1928
Patrick McHardyef7c79e2007-06-05 12:38:30 -07001929static const struct nla_policy nl_ntbl_parm_policy[NDTPA_MAX+1] = {
Thomas Graf6b3f8672006-08-07 17:58:53 -07001930 [NDTPA_IFINDEX] = { .type = NLA_U32 },
1931 [NDTPA_QUEUE_LEN] = { .type = NLA_U32 },
1932 [NDTPA_PROXY_QLEN] = { .type = NLA_U32 },
1933 [NDTPA_APP_PROBES] = { .type = NLA_U32 },
1934 [NDTPA_UCAST_PROBES] = { .type = NLA_U32 },
1935 [NDTPA_MCAST_PROBES] = { .type = NLA_U32 },
1936 [NDTPA_BASE_REACHABLE_TIME] = { .type = NLA_U64 },
1937 [NDTPA_GC_STALETIME] = { .type = NLA_U64 },
1938 [NDTPA_DELAY_PROBE_TIME] = { .type = NLA_U64 },
1939 [NDTPA_RETRANS_TIME] = { .type = NLA_U64 },
1940 [NDTPA_ANYCAST_DELAY] = { .type = NLA_U64 },
1941 [NDTPA_PROXY_DELAY] = { .type = NLA_U64 },
1942 [NDTPA_LOCKTIME] = { .type = NLA_U64 },
1943};
1944
Thomas Graf661d2962013-03-21 07:45:29 +00001945static int neightbl_set(struct sk_buff *skb, struct nlmsghdr *nlh)
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001946{
YOSHIFUJI Hideaki3b1e0a62008-03-26 02:26:21 +09001947 struct net *net = sock_net(skb->sk);
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001948 struct neigh_table *tbl;
Thomas Graf6b3f8672006-08-07 17:58:53 -07001949 struct ndtmsg *ndtmsg;
1950 struct nlattr *tb[NDTA_MAX+1];
1951 int err;
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001952
Thomas Graf6b3f8672006-08-07 17:58:53 -07001953 err = nlmsg_parse(nlh, sizeof(*ndtmsg), tb, NDTA_MAX,
1954 nl_neightbl_policy);
1955 if (err < 0)
1956 goto errout;
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001957
Thomas Graf6b3f8672006-08-07 17:58:53 -07001958 if (tb[NDTA_NAME] == NULL) {
1959 err = -EINVAL;
1960 goto errout;
1961 }
1962
1963 ndtmsg = nlmsg_data(nlh);
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001964 read_lock(&neigh_tbl_lock);
1965 for (tbl = neigh_tables; tbl; tbl = tbl->next) {
1966 if (ndtmsg->ndtm_family && tbl->family != ndtmsg->ndtm_family)
1967 continue;
1968
Thomas Graf6b3f8672006-08-07 17:58:53 -07001969 if (nla_strcmp(tb[NDTA_NAME], tbl->id) == 0)
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001970 break;
1971 }
1972
1973 if (tbl == NULL) {
1974 err = -ENOENT;
Thomas Graf6b3f8672006-08-07 17:58:53 -07001975 goto errout_locked;
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001976 }
1977
YOSHIFUJI Hideaki4ec93ed2007-02-09 23:24:36 +09001978 /*
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001979 * We acquire tbl->lock to be nice to the periodic timers and
1980 * make sure they always see a consistent set of values.
1981 */
1982 write_lock_bh(&tbl->lock);
1983
Thomas Graf6b3f8672006-08-07 17:58:53 -07001984 if (tb[NDTA_PARMS]) {
1985 struct nlattr *tbp[NDTPA_MAX+1];
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001986 struct neigh_parms *p;
Thomas Graf6b3f8672006-08-07 17:58:53 -07001987 int i, ifindex = 0;
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001988
Thomas Graf6b3f8672006-08-07 17:58:53 -07001989 err = nla_parse_nested(tbp, NDTPA_MAX, tb[NDTA_PARMS],
1990 nl_ntbl_parm_policy);
1991 if (err < 0)
1992 goto errout_tbl_lock;
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001993
Thomas Graf6b3f8672006-08-07 17:58:53 -07001994 if (tbp[NDTPA_IFINDEX])
1995 ifindex = nla_get_u32(tbp[NDTPA_IFINDEX]);
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001996
Tobias Klauser97fd5bc2009-07-13 11:17:49 -07001997 p = lookup_neigh_parms(tbl, net, ifindex);
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001998 if (p == NULL) {
1999 err = -ENOENT;
Thomas Graf6b3f8672006-08-07 17:58:53 -07002000 goto errout_tbl_lock;
Thomas Grafc7fb64d2005-06-18 22:50:55 -07002001 }
Thomas Grafc7fb64d2005-06-18 22:50:55 -07002002
Thomas Graf6b3f8672006-08-07 17:58:53 -07002003 for (i = 1; i <= NDTPA_MAX; i++) {
2004 if (tbp[i] == NULL)
2005 continue;
Thomas Grafc7fb64d2005-06-18 22:50:55 -07002006
Thomas Graf6b3f8672006-08-07 17:58:53 -07002007 switch (i) {
2008 case NDTPA_QUEUE_LEN:
Eric Dumazet8b5c1712011-11-09 12:07:14 +00002009 p->queue_len_bytes = nla_get_u32(tbp[i]) *
2010 SKB_TRUESIZE(ETH_FRAME_LEN);
2011 break;
2012 case NDTPA_QUEUE_LENBYTES:
2013 p->queue_len_bytes = nla_get_u32(tbp[i]);
Thomas Graf6b3f8672006-08-07 17:58:53 -07002014 break;
2015 case NDTPA_PROXY_QLEN:
2016 p->proxy_qlen = nla_get_u32(tbp[i]);
2017 break;
2018 case NDTPA_APP_PROBES:
2019 p->app_probes = nla_get_u32(tbp[i]);
2020 break;
2021 case NDTPA_UCAST_PROBES:
2022 p->ucast_probes = nla_get_u32(tbp[i]);
2023 break;
2024 case NDTPA_MCAST_PROBES:
2025 p->mcast_probes = nla_get_u32(tbp[i]);
2026 break;
2027 case NDTPA_BASE_REACHABLE_TIME:
2028 p->base_reachable_time = nla_get_msecs(tbp[i]);
2029 break;
2030 case NDTPA_GC_STALETIME:
2031 p->gc_staletime = nla_get_msecs(tbp[i]);
2032 break;
2033 case NDTPA_DELAY_PROBE_TIME:
2034 p->delay_probe_time = nla_get_msecs(tbp[i]);
2035 break;
2036 case NDTPA_RETRANS_TIME:
2037 p->retrans_time = nla_get_msecs(tbp[i]);
2038 break;
2039 case NDTPA_ANYCAST_DELAY:
2040 p->anycast_delay = nla_get_msecs(tbp[i]);
2041 break;
2042 case NDTPA_PROXY_DELAY:
2043 p->proxy_delay = nla_get_msecs(tbp[i]);
2044 break;
2045 case NDTPA_LOCKTIME:
2046 p->locktime = nla_get_msecs(tbp[i]);
2047 break;
2048 }
2049 }
Thomas Grafc7fb64d2005-06-18 22:50:55 -07002050 }
2051
Thomas Graf6b3f8672006-08-07 17:58:53 -07002052 if (tb[NDTA_THRESH1])
2053 tbl->gc_thresh1 = nla_get_u32(tb[NDTA_THRESH1]);
2054
2055 if (tb[NDTA_THRESH2])
2056 tbl->gc_thresh2 = nla_get_u32(tb[NDTA_THRESH2]);
2057
2058 if (tb[NDTA_THRESH3])
2059 tbl->gc_thresh3 = nla_get_u32(tb[NDTA_THRESH3]);
2060
2061 if (tb[NDTA_GC_INTERVAL])
2062 tbl->gc_interval = nla_get_msecs(tb[NDTA_GC_INTERVAL]);
2063
Thomas Grafc7fb64d2005-06-18 22:50:55 -07002064 err = 0;
2065
Thomas Graf6b3f8672006-08-07 17:58:53 -07002066errout_tbl_lock:
Thomas Grafc7fb64d2005-06-18 22:50:55 -07002067 write_unlock_bh(&tbl->lock);
Thomas Graf6b3f8672006-08-07 17:58:53 -07002068errout_locked:
Thomas Grafc7fb64d2005-06-18 22:50:55 -07002069 read_unlock(&neigh_tbl_lock);
Thomas Graf6b3f8672006-08-07 17:58:53 -07002070errout:
Thomas Grafc7fb64d2005-06-18 22:50:55 -07002071 return err;
2072}
2073
Thomas Grafc8822a42007-03-22 11:50:06 -07002074static int neightbl_dump_info(struct sk_buff *skb, struct netlink_callback *cb)
Thomas Grafc7fb64d2005-06-18 22:50:55 -07002075{
YOSHIFUJI Hideaki3b1e0a62008-03-26 02:26:21 +09002076 struct net *net = sock_net(skb->sk);
Thomas Grafca860fb2006-08-07 18:00:18 -07002077 int family, tidx, nidx = 0;
2078 int tbl_skip = cb->args[0];
2079 int neigh_skip = cb->args[1];
Thomas Grafc7fb64d2005-06-18 22:50:55 -07002080 struct neigh_table *tbl;
2081
Thomas Grafca860fb2006-08-07 18:00:18 -07002082 family = ((struct rtgenmsg *) nlmsg_data(cb->nlh))->rtgen_family;
Thomas Grafc7fb64d2005-06-18 22:50:55 -07002083
2084 read_lock(&neigh_tbl_lock);
Thomas Grafca860fb2006-08-07 18:00:18 -07002085 for (tbl = neigh_tables, tidx = 0; tbl; tbl = tbl->next, tidx++) {
Thomas Grafc7fb64d2005-06-18 22:50:55 -07002086 struct neigh_parms *p;
2087
Thomas Grafca860fb2006-08-07 18:00:18 -07002088 if (tidx < tbl_skip || (family && tbl->family != family))
Thomas Grafc7fb64d2005-06-18 22:50:55 -07002089 continue;
2090
Eric W. Biederman15e47302012-09-07 20:12:54 +00002091 if (neightbl_fill_info(skb, tbl, NETLINK_CB(cb->skb).portid,
Thomas Grafca860fb2006-08-07 18:00:18 -07002092 cb->nlh->nlmsg_seq, RTM_NEWNEIGHTBL,
2093 NLM_F_MULTI) <= 0)
Thomas Grafc7fb64d2005-06-18 22:50:55 -07002094 break;
2095
Eric W. Biederman426b5302008-01-24 00:13:18 -08002096 for (nidx = 0, p = tbl->parms.next; p; p = p->next) {
YOSHIFUJI Hideaki878628f2008-03-26 03:57:35 +09002097 if (!net_eq(neigh_parms_net(p), net))
Eric W. Biederman426b5302008-01-24 00:13:18 -08002098 continue;
2099
Gautam Kachrooefc683f2009-02-06 00:52:04 -08002100 if (nidx < neigh_skip)
2101 goto next;
Thomas Grafc7fb64d2005-06-18 22:50:55 -07002102
Thomas Grafca860fb2006-08-07 18:00:18 -07002103 if (neightbl_fill_param_info(skb, tbl, p,
Eric W. Biederman15e47302012-09-07 20:12:54 +00002104 NETLINK_CB(cb->skb).portid,
Thomas Grafca860fb2006-08-07 18:00:18 -07002105 cb->nlh->nlmsg_seq,
2106 RTM_NEWNEIGHTBL,
2107 NLM_F_MULTI) <= 0)
Thomas Grafc7fb64d2005-06-18 22:50:55 -07002108 goto out;
Gautam Kachrooefc683f2009-02-06 00:52:04 -08002109 next:
2110 nidx++;
Thomas Grafc7fb64d2005-06-18 22:50:55 -07002111 }
2112
Thomas Grafca860fb2006-08-07 18:00:18 -07002113 neigh_skip = 0;
Thomas Grafc7fb64d2005-06-18 22:50:55 -07002114 }
2115out:
2116 read_unlock(&neigh_tbl_lock);
Thomas Grafca860fb2006-08-07 18:00:18 -07002117 cb->args[0] = tidx;
2118 cb->args[1] = nidx;
Thomas Grafc7fb64d2005-06-18 22:50:55 -07002119
2120 return skb->len;
2121}
Linus Torvalds1da177e2005-04-16 15:20:36 -07002122
Thomas Graf8b8aec52006-08-07 17:56:37 -07002123static int neigh_fill_info(struct sk_buff *skb, struct neighbour *neigh,
2124 u32 pid, u32 seq, int type, unsigned int flags)
Linus Torvalds1da177e2005-04-16 15:20:36 -07002125{
2126 unsigned long now = jiffies;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002127 struct nda_cacheinfo ci;
Thomas Graf8b8aec52006-08-07 17:56:37 -07002128 struct nlmsghdr *nlh;
2129 struct ndmsg *ndm;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002130
Thomas Graf8b8aec52006-08-07 17:56:37 -07002131 nlh = nlmsg_put(skb, pid, seq, type, sizeof(*ndm), flags);
2132 if (nlh == NULL)
Patrick McHardy26932562007-01-31 23:16:40 -08002133 return -EMSGSIZE;
Thomas Graf8b8aec52006-08-07 17:56:37 -07002134
2135 ndm = nlmsg_data(nlh);
2136 ndm->ndm_family = neigh->ops->family;
Patrick McHardy9ef1d4c2005-06-28 12:55:30 -07002137 ndm->ndm_pad1 = 0;
2138 ndm->ndm_pad2 = 0;
Thomas Graf8b8aec52006-08-07 17:56:37 -07002139 ndm->ndm_flags = neigh->flags;
2140 ndm->ndm_type = neigh->type;
2141 ndm->ndm_ifindex = neigh->dev->ifindex;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002142
David S. Miller9a6308d2012-04-01 20:06:28 -04002143 if (nla_put(skb, NDA_DST, neigh->tbl->key_len, neigh->primary_key))
2144 goto nla_put_failure;
Thomas Graf8b8aec52006-08-07 17:56:37 -07002145
2146 read_lock_bh(&neigh->lock);
2147 ndm->ndm_state = neigh->nud_state;
Eric Dumazet0ed8ddf2010-10-07 10:44:07 +00002148 if (neigh->nud_state & NUD_VALID) {
2149 char haddr[MAX_ADDR_LEN];
2150
2151 neigh_ha_snapshot(haddr, neigh, neigh->dev);
2152 if (nla_put(skb, NDA_LLADDR, neigh->dev->addr_len, haddr) < 0) {
2153 read_unlock_bh(&neigh->lock);
2154 goto nla_put_failure;
2155 }
Thomas Graf8b8aec52006-08-07 17:56:37 -07002156 }
2157
Stephen Hemmingerb9f5f522008-06-03 16:03:15 -07002158 ci.ndm_used = jiffies_to_clock_t(now - neigh->used);
2159 ci.ndm_confirmed = jiffies_to_clock_t(now - neigh->confirmed);
2160 ci.ndm_updated = jiffies_to_clock_t(now - neigh->updated);
Thomas Graf8b8aec52006-08-07 17:56:37 -07002161 ci.ndm_refcnt = atomic_read(&neigh->refcnt) - 1;
2162 read_unlock_bh(&neigh->lock);
2163
David S. Miller9a6308d2012-04-01 20:06:28 -04002164 if (nla_put_u32(skb, NDA_PROBES, atomic_read(&neigh->probes)) ||
2165 nla_put(skb, NDA_CACHEINFO, sizeof(ci), &ci))
2166 goto nla_put_failure;
Thomas Graf8b8aec52006-08-07 17:56:37 -07002167
2168 return nlmsg_end(skb, nlh);
2169
2170nla_put_failure:
Patrick McHardy26932562007-01-31 23:16:40 -08002171 nlmsg_cancel(skb, nlh);
2172 return -EMSGSIZE;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002173}
2174
Tony Zelenoff84920c12012-01-26 22:28:58 +00002175static int pneigh_fill_info(struct sk_buff *skb, struct pneigh_entry *pn,
2176 u32 pid, u32 seq, int type, unsigned int flags,
2177 struct neigh_table *tbl)
2178{
2179 struct nlmsghdr *nlh;
2180 struct ndmsg *ndm;
2181
2182 nlh = nlmsg_put(skb, pid, seq, type, sizeof(*ndm), flags);
2183 if (nlh == NULL)
2184 return -EMSGSIZE;
2185
2186 ndm = nlmsg_data(nlh);
2187 ndm->ndm_family = tbl->family;
2188 ndm->ndm_pad1 = 0;
2189 ndm->ndm_pad2 = 0;
2190 ndm->ndm_flags = pn->flags | NTF_PROXY;
2191 ndm->ndm_type = NDA_DST;
2192 ndm->ndm_ifindex = pn->dev->ifindex;
2193 ndm->ndm_state = NUD_NONE;
2194
David S. Miller9a6308d2012-04-01 20:06:28 -04002195 if (nla_put(skb, NDA_DST, tbl->key_len, pn->key))
2196 goto nla_put_failure;
Tony Zelenoff84920c12012-01-26 22:28:58 +00002197
2198 return nlmsg_end(skb, nlh);
2199
2200nla_put_failure:
2201 nlmsg_cancel(skb, nlh);
2202 return -EMSGSIZE;
2203}
2204
Thomas Grafd961db32007-08-08 23:12:56 -07002205static void neigh_update_notify(struct neighbour *neigh)
2206{
2207 call_netevent_notifiers(NETEVENT_NEIGH_UPDATE, neigh);
2208 __neigh_notify(neigh, RTM_NEWNEIGH, 0);
2209}
Linus Torvalds1da177e2005-04-16 15:20:36 -07002210
2211static int neigh_dump_table(struct neigh_table *tbl, struct sk_buff *skb,
2212 struct netlink_callback *cb)
2213{
Eric Dumazet767e97e2010-10-06 17:49:21 -07002214 struct net *net = sock_net(skb->sk);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002215 struct neighbour *n;
2216 int rc, h, s_h = cb->args[1];
2217 int idx, s_idx = idx = cb->args[2];
Eric Dumazetd6bf7812010-10-04 06:15:44 +00002218 struct neigh_hash_table *nht;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002219
Eric Dumazetd6bf7812010-10-04 06:15:44 +00002220 rcu_read_lock_bh();
2221 nht = rcu_dereference_bh(tbl->nht);
2222
Eric Dumazet4bd6683b2012-06-07 04:58:35 +00002223 for (h = s_h; h < (1 << nht->hash_shift); h++) {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002224 if (h > s_h)
2225 s_idx = 0;
Eric Dumazet767e97e2010-10-06 17:49:21 -07002226 for (n = rcu_dereference_bh(nht->hash_buckets[h]), idx = 0;
2227 n != NULL;
2228 n = rcu_dereference_bh(n->next)) {
Octavian Purdila09ad9bc2009-11-25 15:14:13 -08002229 if (!net_eq(dev_net(n->dev), net))
Eric W. Biederman426b5302008-01-24 00:13:18 -08002230 continue;
Gautam Kachrooefc683f2009-02-06 00:52:04 -08002231 if (idx < s_idx)
2232 goto next;
Eric W. Biederman15e47302012-09-07 20:12:54 +00002233 if (neigh_fill_info(skb, n, NETLINK_CB(cb->skb).portid,
Linus Torvalds1da177e2005-04-16 15:20:36 -07002234 cb->nlh->nlmsg_seq,
Jamal Hadi Salimb6544c02005-06-18 22:54:12 -07002235 RTM_NEWNEIGH,
2236 NLM_F_MULTI) <= 0) {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002237 rc = -1;
2238 goto out;
2239 }
Eric Dumazet767e97e2010-10-06 17:49:21 -07002240next:
Gautam Kachrooefc683f2009-02-06 00:52:04 -08002241 idx++;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002242 }
Linus Torvalds1da177e2005-04-16 15:20:36 -07002243 }
2244 rc = skb->len;
2245out:
Eric Dumazetd6bf7812010-10-04 06:15:44 +00002246 rcu_read_unlock_bh();
Linus Torvalds1da177e2005-04-16 15:20:36 -07002247 cb->args[1] = h;
2248 cb->args[2] = idx;
2249 return rc;
2250}
2251
Tony Zelenoff84920c12012-01-26 22:28:58 +00002252static int pneigh_dump_table(struct neigh_table *tbl, struct sk_buff *skb,
2253 struct netlink_callback *cb)
2254{
2255 struct pneigh_entry *n;
2256 struct net *net = sock_net(skb->sk);
2257 int rc, h, s_h = cb->args[3];
2258 int idx, s_idx = idx = cb->args[4];
2259
2260 read_lock_bh(&tbl->lock);
2261
Eric Dumazet4bd6683b2012-06-07 04:58:35 +00002262 for (h = s_h; h <= PNEIGH_HASHMASK; h++) {
Tony Zelenoff84920c12012-01-26 22:28:58 +00002263 if (h > s_h)
2264 s_idx = 0;
2265 for (n = tbl->phash_buckets[h], idx = 0; n; n = n->next) {
2266 if (dev_net(n->dev) != net)
2267 continue;
2268 if (idx < s_idx)
2269 goto next;
Eric W. Biederman15e47302012-09-07 20:12:54 +00002270 if (pneigh_fill_info(skb, n, NETLINK_CB(cb->skb).portid,
Tony Zelenoff84920c12012-01-26 22:28:58 +00002271 cb->nlh->nlmsg_seq,
2272 RTM_NEWNEIGH,
2273 NLM_F_MULTI, tbl) <= 0) {
2274 read_unlock_bh(&tbl->lock);
2275 rc = -1;
2276 goto out;
2277 }
2278 next:
2279 idx++;
2280 }
2281 }
2282
2283 read_unlock_bh(&tbl->lock);
2284 rc = skb->len;
2285out:
2286 cb->args[3] = h;
2287 cb->args[4] = idx;
2288 return rc;
2289
2290}
2291
Thomas Grafc8822a42007-03-22 11:50:06 -07002292static int neigh_dump_info(struct sk_buff *skb, struct netlink_callback *cb)
Linus Torvalds1da177e2005-04-16 15:20:36 -07002293{
2294 struct neigh_table *tbl;
2295 int t, family, s_t;
Tony Zelenoff84920c12012-01-26 22:28:58 +00002296 int proxy = 0;
Eric Dumazet4bd6683b2012-06-07 04:58:35 +00002297 int err;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002298
2299 read_lock(&neigh_tbl_lock);
Thomas Graf8b8aec52006-08-07 17:56:37 -07002300 family = ((struct rtgenmsg *) nlmsg_data(cb->nlh))->rtgen_family;
Tony Zelenoff84920c12012-01-26 22:28:58 +00002301
2302 /* check for full ndmsg structure presence, family member is
2303 * the same for both structures
2304 */
2305 if (nlmsg_len(cb->nlh) >= sizeof(struct ndmsg) &&
2306 ((struct ndmsg *) nlmsg_data(cb->nlh))->ndm_flags == NTF_PROXY)
2307 proxy = 1;
2308
Linus Torvalds1da177e2005-04-16 15:20:36 -07002309 s_t = cb->args[0];
2310
Eric Dumazet4bd6683b2012-06-07 04:58:35 +00002311 for (tbl = neigh_tables, t = 0; tbl;
Tony Zelenoff84920c12012-01-26 22:28:58 +00002312 tbl = tbl->next, t++) {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002313 if (t < s_t || (family && tbl->family != family))
2314 continue;
2315 if (t > s_t)
2316 memset(&cb->args[1], 0, sizeof(cb->args) -
2317 sizeof(cb->args[0]));
Tony Zelenoff84920c12012-01-26 22:28:58 +00002318 if (proxy)
2319 err = pneigh_dump_table(tbl, skb, cb);
2320 else
2321 err = neigh_dump_table(tbl, skb, cb);
Eric Dumazet4bd6683b2012-06-07 04:58:35 +00002322 if (err < 0)
2323 break;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002324 }
2325 read_unlock(&neigh_tbl_lock);
2326
2327 cb->args[0] = t;
2328 return skb->len;
2329}
2330
2331void neigh_for_each(struct neigh_table *tbl, void (*cb)(struct neighbour *, void *), void *cookie)
2332{
2333 int chain;
Eric Dumazetd6bf7812010-10-04 06:15:44 +00002334 struct neigh_hash_table *nht;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002335
Eric Dumazetd6bf7812010-10-04 06:15:44 +00002336 rcu_read_lock_bh();
2337 nht = rcu_dereference_bh(tbl->nht);
2338
Eric Dumazet767e97e2010-10-06 17:49:21 -07002339 read_lock(&tbl->lock); /* avoid resizes */
David S. Millercd089332011-07-11 01:28:12 -07002340 for (chain = 0; chain < (1 << nht->hash_shift); chain++) {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002341 struct neighbour *n;
2342
Eric Dumazet767e97e2010-10-06 17:49:21 -07002343 for (n = rcu_dereference_bh(nht->hash_buckets[chain]);
2344 n != NULL;
2345 n = rcu_dereference_bh(n->next))
Linus Torvalds1da177e2005-04-16 15:20:36 -07002346 cb(n, cookie);
2347 }
Eric Dumazetd6bf7812010-10-04 06:15:44 +00002348 read_unlock(&tbl->lock);
2349 rcu_read_unlock_bh();
Linus Torvalds1da177e2005-04-16 15:20:36 -07002350}
2351EXPORT_SYMBOL(neigh_for_each);
2352
2353/* The tbl->lock must be held as a writer and BH disabled. */
2354void __neigh_for_each_release(struct neigh_table *tbl,
2355 int (*cb)(struct neighbour *))
2356{
2357 int chain;
Eric Dumazetd6bf7812010-10-04 06:15:44 +00002358 struct neigh_hash_table *nht;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002359
Eric Dumazetd6bf7812010-10-04 06:15:44 +00002360 nht = rcu_dereference_protected(tbl->nht,
2361 lockdep_is_held(&tbl->lock));
David S. Millercd089332011-07-11 01:28:12 -07002362 for (chain = 0; chain < (1 << nht->hash_shift); chain++) {
Eric Dumazet767e97e2010-10-06 17:49:21 -07002363 struct neighbour *n;
2364 struct neighbour __rcu **np;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002365
Eric Dumazetd6bf7812010-10-04 06:15:44 +00002366 np = &nht->hash_buckets[chain];
Eric Dumazet767e97e2010-10-06 17:49:21 -07002367 while ((n = rcu_dereference_protected(*np,
2368 lockdep_is_held(&tbl->lock))) != NULL) {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002369 int release;
2370
2371 write_lock(&n->lock);
2372 release = cb(n);
2373 if (release) {
Eric Dumazet767e97e2010-10-06 17:49:21 -07002374 rcu_assign_pointer(*np,
2375 rcu_dereference_protected(n->next,
2376 lockdep_is_held(&tbl->lock)));
Linus Torvalds1da177e2005-04-16 15:20:36 -07002377 n->dead = 1;
2378 } else
2379 np = &n->next;
2380 write_unlock(&n->lock);
Thomas Graf4f494552007-08-08 23:12:36 -07002381 if (release)
2382 neigh_cleanup_and_release(n);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002383 }
2384 }
2385}
2386EXPORT_SYMBOL(__neigh_for_each_release);
2387
2388#ifdef CONFIG_PROC_FS
2389
2390static struct neighbour *neigh_get_first(struct seq_file *seq)
2391{
2392 struct neigh_seq_state *state = seq->private;
YOSHIFUJI Hideaki12188542008-03-26 02:36:06 +09002393 struct net *net = seq_file_net(seq);
Eric Dumazetd6bf7812010-10-04 06:15:44 +00002394 struct neigh_hash_table *nht = state->nht;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002395 struct neighbour *n = NULL;
2396 int bucket = state->bucket;
2397
2398 state->flags &= ~NEIGH_SEQ_IS_PNEIGH;
David S. Millercd089332011-07-11 01:28:12 -07002399 for (bucket = 0; bucket < (1 << nht->hash_shift); bucket++) {
Eric Dumazet767e97e2010-10-06 17:49:21 -07002400 n = rcu_dereference_bh(nht->hash_buckets[bucket]);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002401
2402 while (n) {
YOSHIFUJI Hideaki878628f2008-03-26 03:57:35 +09002403 if (!net_eq(dev_net(n->dev), net))
Eric W. Biederman426b5302008-01-24 00:13:18 -08002404 goto next;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002405 if (state->neigh_sub_iter) {
2406 loff_t fakep = 0;
2407 void *v;
2408
2409 v = state->neigh_sub_iter(state, n, &fakep);
2410 if (!v)
2411 goto next;
2412 }
2413 if (!(state->flags & NEIGH_SEQ_SKIP_NOARP))
2414 break;
2415 if (n->nud_state & ~NUD_NOARP)
2416 break;
Eric Dumazet767e97e2010-10-06 17:49:21 -07002417next:
2418 n = rcu_dereference_bh(n->next);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002419 }
2420
2421 if (n)
2422 break;
2423 }
2424 state->bucket = bucket;
2425
2426 return n;
2427}
2428
2429static struct neighbour *neigh_get_next(struct seq_file *seq,
2430 struct neighbour *n,
2431 loff_t *pos)
2432{
2433 struct neigh_seq_state *state = seq->private;
YOSHIFUJI Hideaki12188542008-03-26 02:36:06 +09002434 struct net *net = seq_file_net(seq);
Eric Dumazetd6bf7812010-10-04 06:15:44 +00002435 struct neigh_hash_table *nht = state->nht;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002436
2437 if (state->neigh_sub_iter) {
2438 void *v = state->neigh_sub_iter(state, n, pos);
2439 if (v)
2440 return n;
2441 }
Eric Dumazet767e97e2010-10-06 17:49:21 -07002442 n = rcu_dereference_bh(n->next);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002443
2444 while (1) {
2445 while (n) {
YOSHIFUJI Hideaki878628f2008-03-26 03:57:35 +09002446 if (!net_eq(dev_net(n->dev), net))
Eric W. Biederman426b5302008-01-24 00:13:18 -08002447 goto next;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002448 if (state->neigh_sub_iter) {
2449 void *v = state->neigh_sub_iter(state, n, pos);
2450 if (v)
2451 return n;
2452 goto next;
2453 }
2454 if (!(state->flags & NEIGH_SEQ_SKIP_NOARP))
2455 break;
2456
2457 if (n->nud_state & ~NUD_NOARP)
2458 break;
Eric Dumazet767e97e2010-10-06 17:49:21 -07002459next:
2460 n = rcu_dereference_bh(n->next);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002461 }
2462
2463 if (n)
2464 break;
2465
David S. Millercd089332011-07-11 01:28:12 -07002466 if (++state->bucket >= (1 << nht->hash_shift))
Linus Torvalds1da177e2005-04-16 15:20:36 -07002467 break;
2468
Eric Dumazet767e97e2010-10-06 17:49:21 -07002469 n = rcu_dereference_bh(nht->hash_buckets[state->bucket]);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002470 }
2471
2472 if (n && pos)
2473 --(*pos);
2474 return n;
2475}
2476
2477static struct neighbour *neigh_get_idx(struct seq_file *seq, loff_t *pos)
2478{
2479 struct neighbour *n = neigh_get_first(seq);
2480
2481 if (n) {
Chris Larson745e2032008-08-03 01:10:55 -07002482 --(*pos);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002483 while (*pos) {
2484 n = neigh_get_next(seq, n, pos);
2485 if (!n)
2486 break;
2487 }
2488 }
2489 return *pos ? NULL : n;
2490}
2491
2492static struct pneigh_entry *pneigh_get_first(struct seq_file *seq)
2493{
2494 struct neigh_seq_state *state = seq->private;
YOSHIFUJI Hideaki12188542008-03-26 02:36:06 +09002495 struct net *net = seq_file_net(seq);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002496 struct neigh_table *tbl = state->tbl;
2497 struct pneigh_entry *pn = NULL;
2498 int bucket = state->bucket;
2499
2500 state->flags |= NEIGH_SEQ_IS_PNEIGH;
2501 for (bucket = 0; bucket <= PNEIGH_HASHMASK; bucket++) {
2502 pn = tbl->phash_buckets[bucket];
YOSHIFUJI Hideaki878628f2008-03-26 03:57:35 +09002503 while (pn && !net_eq(pneigh_net(pn), net))
Eric W. Biederman426b5302008-01-24 00:13:18 -08002504 pn = pn->next;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002505 if (pn)
2506 break;
2507 }
2508 state->bucket = bucket;
2509
2510 return pn;
2511}
2512
2513static struct pneigh_entry *pneigh_get_next(struct seq_file *seq,
2514 struct pneigh_entry *pn,
2515 loff_t *pos)
2516{
2517 struct neigh_seq_state *state = seq->private;
YOSHIFUJI Hideaki12188542008-03-26 02:36:06 +09002518 struct net *net = seq_file_net(seq);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002519 struct neigh_table *tbl = state->tbl;
2520
Jorge Boncompte [DTI2]df07a942011-11-25 13:24:49 -05002521 do {
2522 pn = pn->next;
2523 } while (pn && !net_eq(pneigh_net(pn), net));
2524
Linus Torvalds1da177e2005-04-16 15:20:36 -07002525 while (!pn) {
2526 if (++state->bucket > PNEIGH_HASHMASK)
2527 break;
2528 pn = tbl->phash_buckets[state->bucket];
YOSHIFUJI Hideaki878628f2008-03-26 03:57:35 +09002529 while (pn && !net_eq(pneigh_net(pn), net))
Eric W. Biederman426b5302008-01-24 00:13:18 -08002530 pn = pn->next;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002531 if (pn)
2532 break;
2533 }
2534
2535 if (pn && pos)
2536 --(*pos);
2537
2538 return pn;
2539}
2540
2541static struct pneigh_entry *pneigh_get_idx(struct seq_file *seq, loff_t *pos)
2542{
2543 struct pneigh_entry *pn = pneigh_get_first(seq);
2544
2545 if (pn) {
Chris Larson745e2032008-08-03 01:10:55 -07002546 --(*pos);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002547 while (*pos) {
2548 pn = pneigh_get_next(seq, pn, pos);
2549 if (!pn)
2550 break;
2551 }
2552 }
2553 return *pos ? NULL : pn;
2554}
2555
2556static void *neigh_get_idx_any(struct seq_file *seq, loff_t *pos)
2557{
2558 struct neigh_seq_state *state = seq->private;
2559 void *rc;
Chris Larson745e2032008-08-03 01:10:55 -07002560 loff_t idxpos = *pos;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002561
Chris Larson745e2032008-08-03 01:10:55 -07002562 rc = neigh_get_idx(seq, &idxpos);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002563 if (!rc && !(state->flags & NEIGH_SEQ_NEIGH_ONLY))
Chris Larson745e2032008-08-03 01:10:55 -07002564 rc = pneigh_get_idx(seq, &idxpos);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002565
2566 return rc;
2567}
2568
2569void *neigh_seq_start(struct seq_file *seq, loff_t *pos, struct neigh_table *tbl, unsigned int neigh_seq_flags)
Eric Dumazetd6bf7812010-10-04 06:15:44 +00002570 __acquires(rcu_bh)
Linus Torvalds1da177e2005-04-16 15:20:36 -07002571{
2572 struct neigh_seq_state *state = seq->private;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002573
2574 state->tbl = tbl;
2575 state->bucket = 0;
2576 state->flags = (neigh_seq_flags & ~NEIGH_SEQ_IS_PNEIGH);
2577
Eric Dumazetd6bf7812010-10-04 06:15:44 +00002578 rcu_read_lock_bh();
2579 state->nht = rcu_dereference_bh(tbl->nht);
Eric Dumazet767e97e2010-10-06 17:49:21 -07002580
Chris Larson745e2032008-08-03 01:10:55 -07002581 return *pos ? neigh_get_idx_any(seq, pos) : SEQ_START_TOKEN;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002582}
2583EXPORT_SYMBOL(neigh_seq_start);
2584
2585void *neigh_seq_next(struct seq_file *seq, void *v, loff_t *pos)
2586{
2587 struct neigh_seq_state *state;
2588 void *rc;
2589
2590 if (v == SEQ_START_TOKEN) {
Chris Larsonbff69732008-08-03 01:02:41 -07002591 rc = neigh_get_first(seq);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002592 goto out;
2593 }
2594
2595 state = seq->private;
2596 if (!(state->flags & NEIGH_SEQ_IS_PNEIGH)) {
2597 rc = neigh_get_next(seq, v, NULL);
2598 if (rc)
2599 goto out;
2600 if (!(state->flags & NEIGH_SEQ_NEIGH_ONLY))
2601 rc = pneigh_get_first(seq);
2602 } else {
2603 BUG_ON(state->flags & NEIGH_SEQ_NEIGH_ONLY);
2604 rc = pneigh_get_next(seq, v, NULL);
2605 }
2606out:
2607 ++(*pos);
2608 return rc;
2609}
2610EXPORT_SYMBOL(neigh_seq_next);
2611
2612void neigh_seq_stop(struct seq_file *seq, void *v)
Eric Dumazetd6bf7812010-10-04 06:15:44 +00002613 __releases(rcu_bh)
Linus Torvalds1da177e2005-04-16 15:20:36 -07002614{
Eric Dumazetd6bf7812010-10-04 06:15:44 +00002615 rcu_read_unlock_bh();
Linus Torvalds1da177e2005-04-16 15:20:36 -07002616}
2617EXPORT_SYMBOL(neigh_seq_stop);
2618
2619/* statistics via seq_file */
2620
2621static void *neigh_stat_seq_start(struct seq_file *seq, loff_t *pos)
2622{
Alexey Dobriyan81c1ebf2010-01-22 10:16:05 +00002623 struct neigh_table *tbl = seq->private;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002624 int cpu;
2625
2626 if (*pos == 0)
2627 return SEQ_START_TOKEN;
YOSHIFUJI Hideaki4ec93ed2007-02-09 23:24:36 +09002628
Rusty Russell0f23174a2008-12-29 12:23:42 +00002629 for (cpu = *pos-1; cpu < nr_cpu_ids; ++cpu) {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002630 if (!cpu_possible(cpu))
2631 continue;
2632 *pos = cpu+1;
2633 return per_cpu_ptr(tbl->stats, cpu);
2634 }
2635 return NULL;
2636}
2637
2638static void *neigh_stat_seq_next(struct seq_file *seq, void *v, loff_t *pos)
2639{
Alexey Dobriyan81c1ebf2010-01-22 10:16:05 +00002640 struct neigh_table *tbl = seq->private;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002641 int cpu;
2642
Rusty Russell0f23174a2008-12-29 12:23:42 +00002643 for (cpu = *pos; cpu < nr_cpu_ids; ++cpu) {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002644 if (!cpu_possible(cpu))
2645 continue;
2646 *pos = cpu+1;
2647 return per_cpu_ptr(tbl->stats, cpu);
2648 }
2649 return NULL;
2650}
2651
/* ->stop for the per-CPU statistics file: intentionally does nothing. */
static void neigh_stat_seq_stop(struct seq_file *seq, void *v)
{
}
2656
2657static int neigh_stat_seq_show(struct seq_file *seq, void *v)
2658{
Alexey Dobriyan81c1ebf2010-01-22 10:16:05 +00002659 struct neigh_table *tbl = seq->private;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002660 struct neigh_statistics *st = v;
2661
2662 if (v == SEQ_START_TOKEN) {
Neil Horman9a6d2762008-07-16 20:50:49 -07002663 seq_printf(seq, "entries allocs destroys hash_grows lookups hits res_failed rcv_probes_mcast rcv_probes_ucast periodic_gc_runs forced_gc_runs unresolved_discards\n");
Linus Torvalds1da177e2005-04-16 15:20:36 -07002664 return 0;
2665 }
2666
2667 seq_printf(seq, "%08x %08lx %08lx %08lx %08lx %08lx %08lx "
Neil Horman9a6d2762008-07-16 20:50:49 -07002668 "%08lx %08lx %08lx %08lx %08lx\n",
Linus Torvalds1da177e2005-04-16 15:20:36 -07002669 atomic_read(&tbl->entries),
2670
2671 st->allocs,
2672 st->destroys,
2673 st->hash_grows,
2674
2675 st->lookups,
2676 st->hits,
2677
2678 st->res_failed,
2679
2680 st->rcv_probes_mcast,
2681 st->rcv_probes_ucast,
2682
2683 st->periodic_gc_runs,
Neil Horman9a6d2762008-07-16 20:50:49 -07002684 st->forced_gc_runs,
2685 st->unres_discards
Linus Torvalds1da177e2005-04-16 15:20:36 -07002686 );
2687
2688 return 0;
2689}
2690
Stephen Hemmingerf6908082007-03-12 14:34:29 -07002691static const struct seq_operations neigh_stat_seq_ops = {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002692 .start = neigh_stat_seq_start,
2693 .next = neigh_stat_seq_next,
2694 .stop = neigh_stat_seq_stop,
2695 .show = neigh_stat_seq_show,
2696};
2697
2698static int neigh_stat_seq_open(struct inode *inode, struct file *file)
2699{
2700 int ret = seq_open(file, &neigh_stat_seq_ops);
2701
2702 if (!ret) {
2703 struct seq_file *sf = file->private_data;
Al Virod9dda782013-03-31 18:16:14 -04002704 sf->private = PDE_DATA(inode);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002705 }
2706 return ret;
2707};
2708
Arjan van de Ven9a321442007-02-12 00:55:35 -08002709static const struct file_operations neigh_stat_seq_fops = {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002710 .owner = THIS_MODULE,
2711 .open = neigh_stat_seq_open,
2712 .read = seq_read,
2713 .llseek = seq_lseek,
2714 .release = seq_release,
2715};
2716
2717#endif /* CONFIG_PROC_FS */
2718
Thomas Graf339bf982006-11-10 14:10:15 -08002719static inline size_t neigh_nlmsg_size(void)
2720{
2721 return NLMSG_ALIGN(sizeof(struct ndmsg))
2722 + nla_total_size(MAX_ADDR_LEN) /* NDA_DST */
2723 + nla_total_size(MAX_ADDR_LEN) /* NDA_LLADDR */
2724 + nla_total_size(sizeof(struct nda_cacheinfo))
2725 + nla_total_size(4); /* NDA_PROBES */
2726}
2727
Thomas Grafb8673312006-08-15 00:33:14 -07002728static void __neigh_notify(struct neighbour *n, int type, int flags)
Linus Torvalds1da177e2005-04-16 15:20:36 -07002729{
YOSHIFUJI Hideakic346dca2008-03-25 21:47:49 +09002730 struct net *net = dev_net(n->dev);
Thomas Graf8b8aec52006-08-07 17:56:37 -07002731 struct sk_buff *skb;
Thomas Grafb8673312006-08-15 00:33:14 -07002732 int err = -ENOBUFS;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002733
Thomas Graf339bf982006-11-10 14:10:15 -08002734 skb = nlmsg_new(neigh_nlmsg_size(), GFP_ATOMIC);
Thomas Graf8b8aec52006-08-07 17:56:37 -07002735 if (skb == NULL)
Thomas Grafb8673312006-08-15 00:33:14 -07002736 goto errout;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002737
Thomas Grafb8673312006-08-15 00:33:14 -07002738 err = neigh_fill_info(skb, n, 0, 0, type, flags);
Patrick McHardy26932562007-01-31 23:16:40 -08002739 if (err < 0) {
2740 /* -EMSGSIZE implies BUG in neigh_nlmsg_size() */
2741 WARN_ON(err == -EMSGSIZE);
2742 kfree_skb(skb);
2743 goto errout;
2744 }
Pablo Neira Ayuso1ce85fe2009-02-24 23:18:28 -08002745 rtnl_notify(skb, net, 0, RTNLGRP_NEIGH, NULL, GFP_ATOMIC);
2746 return;
Thomas Grafb8673312006-08-15 00:33:14 -07002747errout:
2748 if (err < 0)
Eric W. Biederman426b5302008-01-24 00:13:18 -08002749 rtnl_set_sk_err(net, RTNLGRP_NEIGH, err);
Thomas Grafb8673312006-08-15 00:33:14 -07002750}
2751
Thomas Grafd961db32007-08-08 23:12:56 -07002752#ifdef CONFIG_ARPD
Thomas Grafb8673312006-08-15 00:33:14 -07002753void neigh_app_ns(struct neighbour *n)
2754{
2755 __neigh_notify(n, RTM_GETNEIGH, NLM_F_REQUEST);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002756}
YOSHIFUJI Hideaki0a204502008-03-24 18:39:10 +09002757EXPORT_SYMBOL(neigh_app_ns);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002758#endif /* CONFIG_ARPD */
2759
2760#ifdef CONFIG_SYSCTL
Cong Wangb93196d2012-12-06 10:04:04 +08002761static int zero;
2762static int unres_qlen_max = INT_MAX / SKB_TRUESIZE(ETH_FRAME_LEN);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002763
Joe Perchesfe2c6332013-06-11 23:04:25 -07002764static int proc_unres_qlen(struct ctl_table *ctl, int write,
2765 void __user *buffer, size_t *lenp, loff_t *ppos)
Eric Dumazet8b5c1712011-11-09 12:07:14 +00002766{
2767 int size, ret;
Joe Perchesfe2c6332013-06-11 23:04:25 -07002768 struct ctl_table tmp = *ctl;
Eric Dumazet8b5c1712011-11-09 12:07:14 +00002769
Shan Weice46cc62012-12-04 18:49:15 +00002770 tmp.extra1 = &zero;
2771 tmp.extra2 = &unres_qlen_max;
Eric Dumazet8b5c1712011-11-09 12:07:14 +00002772 tmp.data = &size;
Shan Weice46cc62012-12-04 18:49:15 +00002773
2774 size = *(int *)ctl->data / SKB_TRUESIZE(ETH_FRAME_LEN);
2775 ret = proc_dointvec_minmax(&tmp, write, buffer, lenp, ppos);
2776
Eric Dumazet8b5c1712011-11-09 12:07:14 +00002777 if (write && !ret)
2778 *(int *)ctl->data = size * SKB_TRUESIZE(ETH_FRAME_LEN);
2779 return ret;
2780}
2781
/*
 * Slot numbers of the entries in neigh_sysctl_template.neigh_vars.
 * NEIGH_VAR_MAX is the number of real entries, not an entry itself.
 */
enum {
	/* probe counts */
	NEIGH_VAR_MCAST_PROBE,
	NEIGH_VAR_UCAST_PROBE,
	NEIGH_VAR_APP_PROBE,

	/* timers */
	NEIGH_VAR_RETRANS_TIME,
	NEIGH_VAR_BASE_REACHABLE_TIME,
	NEIGH_VAR_DELAY_PROBE_TIME,
	NEIGH_VAR_GC_STALETIME,

	/* queue limits */
	NEIGH_VAR_QUEUE_LEN,
	NEIGH_VAR_QUEUE_LEN_BYTES,
	NEIGH_VAR_PROXY_QLEN,

	/* delays */
	NEIGH_VAR_ANYCAST_DELAY,
	NEIGH_VAR_PROXY_DELAY,
	NEIGH_VAR_LOCKTIME,

	/* millisecond views of the timers */
	NEIGH_VAR_RETRANS_TIME_MS,
	NEIGH_VAR_BASE_REACHABLE_TIME_MS,

	/* garbage collection */
	NEIGH_VAR_GC_INTERVAL,
	NEIGH_VAR_GC_THRESH1,
	NEIGH_VAR_GC_THRESH2,
	NEIGH_VAR_GC_THRESH3,

	NEIGH_VAR_MAX
};
Eric W. Biederman54716e32010-02-14 03:27:03 +00002804
Linus Torvalds1da177e2005-04-16 15:20:36 -07002805static struct neigh_sysctl_table {
2806 struct ctl_table_header *sysctl_header;
Eric Dumazet8b5c1712011-11-09 12:07:14 +00002807 struct ctl_table neigh_vars[NEIGH_VAR_MAX + 1];
Brian Haleyab32ea52006-09-22 14:15:41 -07002808} neigh_sysctl_template __read_mostly = {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002809 .neigh_vars = {
Eric Dumazet8b5c1712011-11-09 12:07:14 +00002810 [NEIGH_VAR_MCAST_PROBE] = {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002811 .procname = "mcast_solicit",
2812 .maxlen = sizeof(int),
2813 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -08002814 .proc_handler = proc_dointvec,
Linus Torvalds1da177e2005-04-16 15:20:36 -07002815 },
Eric Dumazet8b5c1712011-11-09 12:07:14 +00002816 [NEIGH_VAR_UCAST_PROBE] = {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002817 .procname = "ucast_solicit",
2818 .maxlen = sizeof(int),
2819 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -08002820 .proc_handler = proc_dointvec,
Linus Torvalds1da177e2005-04-16 15:20:36 -07002821 },
Eric Dumazet8b5c1712011-11-09 12:07:14 +00002822 [NEIGH_VAR_APP_PROBE] = {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002823 .procname = "app_solicit",
2824 .maxlen = sizeof(int),
2825 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -08002826 .proc_handler = proc_dointvec,
Linus Torvalds1da177e2005-04-16 15:20:36 -07002827 },
Eric Dumazet8b5c1712011-11-09 12:07:14 +00002828 [NEIGH_VAR_RETRANS_TIME] = {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002829 .procname = "retrans_time",
2830 .maxlen = sizeof(int),
2831 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -08002832 .proc_handler = proc_dointvec_userhz_jiffies,
Linus Torvalds1da177e2005-04-16 15:20:36 -07002833 },
Eric Dumazet8b5c1712011-11-09 12:07:14 +00002834 [NEIGH_VAR_BASE_REACHABLE_TIME] = {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002835 .procname = "base_reachable_time",
2836 .maxlen = sizeof(int),
2837 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -08002838 .proc_handler = proc_dointvec_jiffies,
Linus Torvalds1da177e2005-04-16 15:20:36 -07002839 },
Eric Dumazet8b5c1712011-11-09 12:07:14 +00002840 [NEIGH_VAR_DELAY_PROBE_TIME] = {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002841 .procname = "delay_first_probe_time",
2842 .maxlen = sizeof(int),
2843 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -08002844 .proc_handler = proc_dointvec_jiffies,
Linus Torvalds1da177e2005-04-16 15:20:36 -07002845 },
Eric Dumazet8b5c1712011-11-09 12:07:14 +00002846 [NEIGH_VAR_GC_STALETIME] = {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002847 .procname = "gc_stale_time",
2848 .maxlen = sizeof(int),
2849 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -08002850 .proc_handler = proc_dointvec_jiffies,
Linus Torvalds1da177e2005-04-16 15:20:36 -07002851 },
Eric Dumazet8b5c1712011-11-09 12:07:14 +00002852 [NEIGH_VAR_QUEUE_LEN] = {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002853 .procname = "unres_qlen",
2854 .maxlen = sizeof(int),
2855 .mode = 0644,
Eric Dumazet8b5c1712011-11-09 12:07:14 +00002856 .proc_handler = proc_unres_qlen,
2857 },
2858 [NEIGH_VAR_QUEUE_LEN_BYTES] = {
2859 .procname = "unres_qlen_bytes",
2860 .maxlen = sizeof(int),
2861 .mode = 0644,
Shan Weice46cc62012-12-04 18:49:15 +00002862 .extra1 = &zero,
2863 .proc_handler = proc_dointvec_minmax,
Linus Torvalds1da177e2005-04-16 15:20:36 -07002864 },
Eric Dumazet8b5c1712011-11-09 12:07:14 +00002865 [NEIGH_VAR_PROXY_QLEN] = {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002866 .procname = "proxy_qlen",
2867 .maxlen = sizeof(int),
2868 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -08002869 .proc_handler = proc_dointvec,
Linus Torvalds1da177e2005-04-16 15:20:36 -07002870 },
Eric Dumazet8b5c1712011-11-09 12:07:14 +00002871 [NEIGH_VAR_ANYCAST_DELAY] = {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002872 .procname = "anycast_delay",
2873 .maxlen = sizeof(int),
2874 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -08002875 .proc_handler = proc_dointvec_userhz_jiffies,
Linus Torvalds1da177e2005-04-16 15:20:36 -07002876 },
Eric Dumazet8b5c1712011-11-09 12:07:14 +00002877 [NEIGH_VAR_PROXY_DELAY] = {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002878 .procname = "proxy_delay",
2879 .maxlen = sizeof(int),
2880 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -08002881 .proc_handler = proc_dointvec_userhz_jiffies,
Linus Torvalds1da177e2005-04-16 15:20:36 -07002882 },
Eric Dumazet8b5c1712011-11-09 12:07:14 +00002883 [NEIGH_VAR_LOCKTIME] = {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002884 .procname = "locktime",
2885 .maxlen = sizeof(int),
2886 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -08002887 .proc_handler = proc_dointvec_userhz_jiffies,
Linus Torvalds1da177e2005-04-16 15:20:36 -07002888 },
Eric Dumazet8b5c1712011-11-09 12:07:14 +00002889 [NEIGH_VAR_RETRANS_TIME_MS] = {
Eric W. Biedermand12af672007-10-18 03:05:25 -07002890 .procname = "retrans_time_ms",
2891 .maxlen = sizeof(int),
2892 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -08002893 .proc_handler = proc_dointvec_ms_jiffies,
Eric W. Biedermand12af672007-10-18 03:05:25 -07002894 },
Eric Dumazet8b5c1712011-11-09 12:07:14 +00002895 [NEIGH_VAR_BASE_REACHABLE_TIME_MS] = {
Eric W. Biedermand12af672007-10-18 03:05:25 -07002896 .procname = "base_reachable_time_ms",
2897 .maxlen = sizeof(int),
2898 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -08002899 .proc_handler = proc_dointvec_ms_jiffies,
Eric W. Biedermand12af672007-10-18 03:05:25 -07002900 },
Eric Dumazet8b5c1712011-11-09 12:07:14 +00002901 [NEIGH_VAR_GC_INTERVAL] = {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002902 .procname = "gc_interval",
2903 .maxlen = sizeof(int),
2904 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -08002905 .proc_handler = proc_dointvec_jiffies,
Linus Torvalds1da177e2005-04-16 15:20:36 -07002906 },
Eric Dumazet8b5c1712011-11-09 12:07:14 +00002907 [NEIGH_VAR_GC_THRESH1] = {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002908 .procname = "gc_thresh1",
2909 .maxlen = sizeof(int),
2910 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -08002911 .proc_handler = proc_dointvec,
Linus Torvalds1da177e2005-04-16 15:20:36 -07002912 },
Eric Dumazet8b5c1712011-11-09 12:07:14 +00002913 [NEIGH_VAR_GC_THRESH2] = {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002914 .procname = "gc_thresh2",
2915 .maxlen = sizeof(int),
2916 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -08002917 .proc_handler = proc_dointvec,
Linus Torvalds1da177e2005-04-16 15:20:36 -07002918 },
Eric Dumazet8b5c1712011-11-09 12:07:14 +00002919 [NEIGH_VAR_GC_THRESH3] = {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002920 .procname = "gc_thresh3",
2921 .maxlen = sizeof(int),
2922 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -08002923 .proc_handler = proc_dointvec,
Linus Torvalds1da177e2005-04-16 15:20:36 -07002924 },
Pavel Emelyanovc3bac5a2007-12-02 00:08:16 +11002925 {},
Linus Torvalds1da177e2005-04-16 15:20:36 -07002926 },
2927};
2928
2929int neigh_sysctl_register(struct net_device *dev, struct neigh_parms *p,
Eric W. Biederman54716e32010-02-14 03:27:03 +00002930 char *p_name, proc_handler *handler)
Linus Torvalds1da177e2005-04-16 15:20:36 -07002931{
Pavel Emelyanov3c607bb2007-12-02 00:06:34 +11002932 struct neigh_sysctl_table *t;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002933 const char *dev_name_source = NULL;
Eric W. Biederman8f40a1f2012-04-19 13:38:03 +00002934 char neigh_path[ sizeof("net//neigh/") + IFNAMSIZ + IFNAMSIZ ];
Linus Torvalds1da177e2005-04-16 15:20:36 -07002935
Pavel Emelyanov3c607bb2007-12-02 00:06:34 +11002936 t = kmemdup(&neigh_sysctl_template, sizeof(*t), GFP_KERNEL);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002937 if (!t)
Pavel Emelyanov3c607bb2007-12-02 00:06:34 +11002938 goto err;
2939
Eric Dumazet8b5c1712011-11-09 12:07:14 +00002940 t->neigh_vars[NEIGH_VAR_MCAST_PROBE].data = &p->mcast_probes;
2941 t->neigh_vars[NEIGH_VAR_UCAST_PROBE].data = &p->ucast_probes;
2942 t->neigh_vars[NEIGH_VAR_APP_PROBE].data = &p->app_probes;
2943 t->neigh_vars[NEIGH_VAR_RETRANS_TIME].data = &p->retrans_time;
2944 t->neigh_vars[NEIGH_VAR_BASE_REACHABLE_TIME].data = &p->base_reachable_time;
2945 t->neigh_vars[NEIGH_VAR_DELAY_PROBE_TIME].data = &p->delay_probe_time;
2946 t->neigh_vars[NEIGH_VAR_GC_STALETIME].data = &p->gc_staletime;
2947 t->neigh_vars[NEIGH_VAR_QUEUE_LEN].data = &p->queue_len_bytes;
2948 t->neigh_vars[NEIGH_VAR_QUEUE_LEN_BYTES].data = &p->queue_len_bytes;
2949 t->neigh_vars[NEIGH_VAR_PROXY_QLEN].data = &p->proxy_qlen;
2950 t->neigh_vars[NEIGH_VAR_ANYCAST_DELAY].data = &p->anycast_delay;
2951 t->neigh_vars[NEIGH_VAR_PROXY_DELAY].data = &p->proxy_delay;
2952 t->neigh_vars[NEIGH_VAR_LOCKTIME].data = &p->locktime;
2953 t->neigh_vars[NEIGH_VAR_RETRANS_TIME_MS].data = &p->retrans_time;
2954 t->neigh_vars[NEIGH_VAR_BASE_REACHABLE_TIME_MS].data = &p->base_reachable_time;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002955
2956 if (dev) {
2957 dev_name_source = dev->name;
Eric W. Biedermand12af672007-10-18 03:05:25 -07002958 /* Terminate the table early */
Eric Dumazet8b5c1712011-11-09 12:07:14 +00002959 memset(&t->neigh_vars[NEIGH_VAR_GC_INTERVAL], 0,
2960 sizeof(t->neigh_vars[NEIGH_VAR_GC_INTERVAL]));
Linus Torvalds1da177e2005-04-16 15:20:36 -07002961 } else {
Eric W. Biederman8f40a1f2012-04-19 13:38:03 +00002962 dev_name_source = "default";
Eric Dumazet8b5c1712011-11-09 12:07:14 +00002963 t->neigh_vars[NEIGH_VAR_GC_INTERVAL].data = (int *)(p + 1);
2964 t->neigh_vars[NEIGH_VAR_GC_THRESH1].data = (int *)(p + 1) + 1;
2965 t->neigh_vars[NEIGH_VAR_GC_THRESH2].data = (int *)(p + 1) + 2;
2966 t->neigh_vars[NEIGH_VAR_GC_THRESH3].data = (int *)(p + 1) + 3;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002967 }
2968
Linus Torvalds1da177e2005-04-16 15:20:36 -07002969
Eric W. Biedermanf8572d82009-11-05 13:32:03 -08002970 if (handler) {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002971 /* RetransTime */
Eric Dumazet8b5c1712011-11-09 12:07:14 +00002972 t->neigh_vars[NEIGH_VAR_RETRANS_TIME].proc_handler = handler;
2973 t->neigh_vars[NEIGH_VAR_RETRANS_TIME].extra1 = dev;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002974 /* ReachableTime */
Eric Dumazet8b5c1712011-11-09 12:07:14 +00002975 t->neigh_vars[NEIGH_VAR_BASE_REACHABLE_TIME].proc_handler = handler;
2976 t->neigh_vars[NEIGH_VAR_BASE_REACHABLE_TIME].extra1 = dev;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002977 /* RetransTime (in milliseconds)*/
Eric Dumazet8b5c1712011-11-09 12:07:14 +00002978 t->neigh_vars[NEIGH_VAR_RETRANS_TIME_MS].proc_handler = handler;
2979 t->neigh_vars[NEIGH_VAR_RETRANS_TIME_MS].extra1 = dev;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002980 /* ReachableTime (in milliseconds) */
Eric Dumazet8b5c1712011-11-09 12:07:14 +00002981 t->neigh_vars[NEIGH_VAR_BASE_REACHABLE_TIME_MS].proc_handler = handler;
2982 t->neigh_vars[NEIGH_VAR_BASE_REACHABLE_TIME_MS].extra1 = dev;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002983 }
2984
Eric W. Biederman464dc802012-11-16 03:02:59 +00002985 /* Don't export sysctls to unprivileged users */
2986 if (neigh_parms_net(p)->user_ns != &init_user_ns)
2987 t->neigh_vars[0].procname = NULL;
2988
Eric W. Biederman8f40a1f2012-04-19 13:38:03 +00002989 snprintf(neigh_path, sizeof(neigh_path), "net/%s/neigh/%s",
2990 p_name, dev_name_source);
Denis V. Lunev4ab438f2008-02-28 20:48:01 -08002991 t->sysctl_header =
Eric W. Biederman8f40a1f2012-04-19 13:38:03 +00002992 register_net_sysctl(neigh_parms_net(p), neigh_path, t->neigh_vars);
Pavel Emelyanov3c607bb2007-12-02 00:06:34 +11002993 if (!t->sysctl_header)
Eric W. Biederman8f40a1f2012-04-19 13:38:03 +00002994 goto free;
Pavel Emelyanov3c607bb2007-12-02 00:06:34 +11002995
Linus Torvalds1da177e2005-04-16 15:20:36 -07002996 p->sysctl_table = t;
2997 return 0;
2998
Pavel Emelyanov3c607bb2007-12-02 00:06:34 +11002999free:
Linus Torvalds1da177e2005-04-16 15:20:36 -07003000 kfree(t);
Pavel Emelyanov3c607bb2007-12-02 00:06:34 +11003001err:
3002 return -ENOBUFS;
Linus Torvalds1da177e2005-04-16 15:20:36 -07003003}
YOSHIFUJI Hideaki0a204502008-03-24 18:39:10 +09003004EXPORT_SYMBOL(neigh_sysctl_register);
Linus Torvalds1da177e2005-04-16 15:20:36 -07003005
3006void neigh_sysctl_unregister(struct neigh_parms *p)
3007{
3008 if (p->sysctl_table) {
3009 struct neigh_sysctl_table *t = p->sysctl_table;
3010 p->sysctl_table = NULL;
Eric W. Biederman5dd3df12012-04-19 13:24:33 +00003011 unregister_net_sysctl_table(t->sysctl_header);
Linus Torvalds1da177e2005-04-16 15:20:36 -07003012 kfree(t);
3013 }
3014}
YOSHIFUJI Hideaki0a204502008-03-24 18:39:10 +09003015EXPORT_SYMBOL(neigh_sysctl_unregister);
Linus Torvalds1da177e2005-04-16 15:20:36 -07003016
3017#endif /* CONFIG_SYSCTL */
3018
Thomas Grafc8822a42007-03-22 11:50:06 -07003019static int __init neigh_init(void)
3020{
Greg Rosec7ac8672011-06-10 01:27:09 +00003021 rtnl_register(PF_UNSPEC, RTM_NEWNEIGH, neigh_add, NULL, NULL);
3022 rtnl_register(PF_UNSPEC, RTM_DELNEIGH, neigh_delete, NULL, NULL);
3023 rtnl_register(PF_UNSPEC, RTM_GETNEIGH, NULL, neigh_dump_info, NULL);
Thomas Grafc8822a42007-03-22 11:50:06 -07003024
Greg Rosec7ac8672011-06-10 01:27:09 +00003025 rtnl_register(PF_UNSPEC, RTM_GETNEIGHTBL, NULL, neightbl_dump_info,
3026 NULL);
3027 rtnl_register(PF_UNSPEC, RTM_SETNEIGHTBL, neightbl_set, NULL, NULL);
Thomas Grafc8822a42007-03-22 11:50:06 -07003028
3029 return 0;
3030}
3031
3032subsys_initcall(neigh_init);
3033