blob: 5c56b217b999d114ea7954a9e6060a77d906ceff [file] [log] [blame]
Linus Torvalds1da177e2005-04-16 15:20:36 -07001/*
2 * Generic address resolution entity
3 *
4 * Authors:
5 * Pedro Roque <roque@di.fc.ul.pt>
6 * Alexey Kuznetsov <kuznet@ms2.inr.ac.ru>
7 *
8 * This program is free software; you can redistribute it and/or
9 * modify it under the terms of the GNU General Public License
10 * as published by the Free Software Foundation; either version
11 * 2 of the License, or (at your option) any later version.
12 *
13 * Fixes:
14 * Vitaly E. Lavrov releasing NULL neighbor in neigh_add.
15 * Harald Welte Add neighbour cache statistics like rtstat
16 */
17
Joe Perchese005d192012-05-16 19:58:40 +000018#define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
19
Tejun Heo5a0e3ad2010-03-24 17:04:11 +090020#include <linux/slab.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070021#include <linux/types.h>
22#include <linux/kernel.h>
23#include <linux/module.h>
24#include <linux/socket.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070025#include <linux/netdevice.h>
26#include <linux/proc_fs.h>
27#ifdef CONFIG_SYSCTL
28#include <linux/sysctl.h>
29#endif
30#include <linux/times.h>
Eric W. Biederman457c4cb2007-09-12 12:01:34 +020031#include <net/net_namespace.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070032#include <net/neighbour.h>
33#include <net/dst.h>
34#include <net/sock.h>
Tom Tucker8d717402006-07-30 20:43:36 -070035#include <net/netevent.h>
Thomas Grafa14a49d2006-08-07 17:53:08 -070036#include <net/netlink.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070037#include <linux/rtnetlink.h>
38#include <linux/random.h>
Paulo Marques543537b2005-06-23 00:09:02 -070039#include <linux/string.h>
vignesh babuc3609d52007-08-24 22:27:55 -070040#include <linux/log2.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070041
#define DEBUG
#define NEIGH_DEBUG 1
/*
 * neigh_dbg - conditionally emit a debug message.
 * @level: verbosity of this message; it is printed only when
 *         @level <= NEIGH_DEBUG.
 * @fmt:   printf-style format string, followed by its arguments.
 *
 * @level is parenthesized so that an expression argument (for example
 * "a ? b : c") is compared as a whole instead of being split by
 * operator precedence.
 *
 * NOTE(review): DEBUG is defined after the #include block above; confirm
 * that pr_debug() actually observes it at this point.
 */
#define neigh_dbg(level, fmt, ...)		\
do {						\
	if ((level) <= NEIGH_DEBUG)		\
		pr_debug(fmt, ##__VA_ARGS__);	\
} while (0)
Linus Torvalds1da177e2005-04-16 15:20:36 -070049
50#define PNEIGH_HASHMASK 0xF
51
52static void neigh_timer_handler(unsigned long arg);
Thomas Grafd961db32007-08-08 23:12:56 -070053static void __neigh_notify(struct neighbour *n, int type, int flags);
54static void neigh_update_notify(struct neighbour *neigh);
Linus Torvalds1da177e2005-04-16 15:20:36 -070055static int pneigh_ifdown(struct neigh_table *tbl, struct net_device *dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -070056
57static struct neigh_table *neigh_tables;
Amos Waterland45fc3b12005-09-24 16:53:16 -070058#ifdef CONFIG_PROC_FS
Arjan van de Ven9a321442007-02-12 00:55:35 -080059static const struct file_operations neigh_stat_seq_fops;
Amos Waterland45fc3b12005-09-24 16:53:16 -070060#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -070061
/*
   Neighbour hash table buckets are protected with rwlock tbl->lock.

   - All the scans/updates to hash buckets MUST be made under this lock.
   - NOTHING clever should be done under this lock: no callbacks
     to protocol backends, no attempts to send something to the network.
     Doing so will result in deadlocks if a backend/driver wants to use
     the neighbour cache.
   - If the entry requires some non-trivial action, increase
     its reference count and release the table lock.

   Neighbour entries are protected:
   - with a reference count.
   - with rwlock neigh->lock

   The reference count prevents destruction.

   neigh->lock mainly serializes the ll address data and its validity state.
   However, the same lock is also used to protect other entry fields:
    - timer
    - resolution queue

   Again, nothing clever shall be done under neigh->lock;
   the most complicated procedure we allow is dev->hard_header.
   It is assumed that dev->hard_header is simplistic and does
   not make callbacks to neighbour tables.

   The last lock is neigh_tbl_lock. It is a pure SMP lock, protecting
   the list of neighbour tables. This list is used only in process context.
 */
92
93static DEFINE_RWLOCK(neigh_tbl_lock);
94
David S. Miller8f40b162011-07-17 13:34:11 -070095static int neigh_blackhole(struct neighbour *neigh, struct sk_buff *skb)
Linus Torvalds1da177e2005-04-16 15:20:36 -070096{
97 kfree_skb(skb);
98 return -ENETDOWN;
99}
100
Thomas Graf4f494552007-08-08 23:12:36 -0700101static void neigh_cleanup_and_release(struct neighbour *neigh)
102{
103 if (neigh->parms->neigh_cleanup)
104 neigh->parms->neigh_cleanup(neigh);
105
Thomas Grafd961db32007-08-08 23:12:56 -0700106 __neigh_notify(neigh, RTM_DELNEIGH, 0);
Thomas Graf4f494552007-08-08 23:12:36 -0700107 neigh_release(neigh);
108}
109
/*
 * Pick a random reachable time in the interval (1/2)*base...(3/2)*base.
 * This matches the default IPv6 settings and is deliberately not
 * overridable, because it is a really reasonable choice.
 *
 * A @base of zero yields zero (and avoids the modulo by zero).
 */
unsigned long neigh_rand_reach_time(unsigned long base)
{
	if (!base)
		return 0;

	return (net_random() % base) + (base >> 1);
}
EXPORT_SYMBOL(neigh_rand_reach_time);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700121
122
123static int neigh_forced_gc(struct neigh_table *tbl)
124{
125 int shrunk = 0;
126 int i;
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000127 struct neigh_hash_table *nht;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700128
129 NEIGH_CACHE_STAT_INC(tbl, forced_gc_runs);
130
131 write_lock_bh(&tbl->lock);
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000132 nht = rcu_dereference_protected(tbl->nht,
133 lockdep_is_held(&tbl->lock));
David S. Millercd089332011-07-11 01:28:12 -0700134 for (i = 0; i < (1 << nht->hash_shift); i++) {
Eric Dumazet767e97e2010-10-06 17:49:21 -0700135 struct neighbour *n;
136 struct neighbour __rcu **np;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700137
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000138 np = &nht->hash_buckets[i];
Eric Dumazet767e97e2010-10-06 17:49:21 -0700139 while ((n = rcu_dereference_protected(*np,
140 lockdep_is_held(&tbl->lock))) != NULL) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700141 /* Neighbour record may be discarded if:
142 * - nobody refers to it.
143 * - it is not permanent
144 */
145 write_lock(&n->lock);
146 if (atomic_read(&n->refcnt) == 1 &&
147 !(n->nud_state & NUD_PERMANENT)) {
Eric Dumazet767e97e2010-10-06 17:49:21 -0700148 rcu_assign_pointer(*np,
149 rcu_dereference_protected(n->next,
150 lockdep_is_held(&tbl->lock)));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700151 n->dead = 1;
152 shrunk = 1;
153 write_unlock(&n->lock);
Thomas Graf4f494552007-08-08 23:12:36 -0700154 neigh_cleanup_and_release(n);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700155 continue;
156 }
157 write_unlock(&n->lock);
158 np = &n->next;
159 }
160 }
161
162 tbl->last_flush = jiffies;
163
164 write_unlock_bh(&tbl->lock);
165
166 return shrunk;
167}
168
Pavel Emelyanova43d8992007-12-20 15:49:05 -0800169static void neigh_add_timer(struct neighbour *n, unsigned long when)
170{
171 neigh_hold(n);
172 if (unlikely(mod_timer(&n->timer, when))) {
173 printk("NEIGH: BUG, double timer add, state is %x\n",
174 n->nud_state);
175 dump_stack();
176 }
177}
178
Linus Torvalds1da177e2005-04-16 15:20:36 -0700179static int neigh_del_timer(struct neighbour *n)
180{
181 if ((n->nud_state & NUD_IN_TIMER) &&
182 del_timer(&n->timer)) {
183 neigh_release(n);
184 return 1;
185 }
186 return 0;
187}
188
189static void pneigh_queue_purge(struct sk_buff_head *list)
190{
191 struct sk_buff *skb;
192
193 while ((skb = skb_dequeue(list)) != NULL) {
194 dev_put(skb->dev);
195 kfree_skb(skb);
196 }
197}
198
Herbert Xu49636bb2005-10-23 17:18:00 +1000199static void neigh_flush_dev(struct neigh_table *tbl, struct net_device *dev)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700200{
201 int i;
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000202 struct neigh_hash_table *nht;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700203
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000204 nht = rcu_dereference_protected(tbl->nht,
205 lockdep_is_held(&tbl->lock));
206
David S. Millercd089332011-07-11 01:28:12 -0700207 for (i = 0; i < (1 << nht->hash_shift); i++) {
Eric Dumazet767e97e2010-10-06 17:49:21 -0700208 struct neighbour *n;
209 struct neighbour __rcu **np = &nht->hash_buckets[i];
Linus Torvalds1da177e2005-04-16 15:20:36 -0700210
Eric Dumazet767e97e2010-10-06 17:49:21 -0700211 while ((n = rcu_dereference_protected(*np,
212 lockdep_is_held(&tbl->lock))) != NULL) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700213 if (dev && n->dev != dev) {
214 np = &n->next;
215 continue;
216 }
Eric Dumazet767e97e2010-10-06 17:49:21 -0700217 rcu_assign_pointer(*np,
218 rcu_dereference_protected(n->next,
219 lockdep_is_held(&tbl->lock)));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700220 write_lock(&n->lock);
221 neigh_del_timer(n);
222 n->dead = 1;
223
224 if (atomic_read(&n->refcnt) != 1) {
225 /* The most unpleasant situation.
226 We must destroy neighbour entry,
227 but someone still uses it.
228
229 The destroy will be delayed until
230 the last user releases us, but
231 we must kill timers etc. and move
232 it to safe state.
233 */
234 skb_queue_purge(&n->arp_queue);
Eric Dumazet8b5c1712011-11-09 12:07:14 +0000235 n->arp_queue_len_bytes = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700236 n->output = neigh_blackhole;
237 if (n->nud_state & NUD_VALID)
238 n->nud_state = NUD_NOARP;
239 else
240 n->nud_state = NUD_NONE;
Joe Perchesd5d427c2013-04-15 15:17:19 +0000241 neigh_dbg(2, "neigh %p is stray\n", n);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700242 }
243 write_unlock(&n->lock);
Thomas Graf4f494552007-08-08 23:12:36 -0700244 neigh_cleanup_and_release(n);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700245 }
246 }
Herbert Xu49636bb2005-10-23 17:18:00 +1000247}
Linus Torvalds1da177e2005-04-16 15:20:36 -0700248
Herbert Xu49636bb2005-10-23 17:18:00 +1000249void neigh_changeaddr(struct neigh_table *tbl, struct net_device *dev)
250{
251 write_lock_bh(&tbl->lock);
252 neigh_flush_dev(tbl, dev);
253 write_unlock_bh(&tbl->lock);
254}
YOSHIFUJI Hideaki0a204502008-03-24 18:39:10 +0900255EXPORT_SYMBOL(neigh_changeaddr);
Herbert Xu49636bb2005-10-23 17:18:00 +1000256
257int neigh_ifdown(struct neigh_table *tbl, struct net_device *dev)
258{
259 write_lock_bh(&tbl->lock);
260 neigh_flush_dev(tbl, dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700261 pneigh_ifdown(tbl, dev);
262 write_unlock_bh(&tbl->lock);
263
264 del_timer_sync(&tbl->proxy_timer);
265 pneigh_queue_purge(&tbl->proxy_queue);
266 return 0;
267}
YOSHIFUJI Hideaki0a204502008-03-24 18:39:10 +0900268EXPORT_SYMBOL(neigh_ifdown);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700269
David Miller596b9b62011-07-25 00:01:25 +0000270static struct neighbour *neigh_alloc(struct neigh_table *tbl, struct net_device *dev)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700271{
272 struct neighbour *n = NULL;
273 unsigned long now = jiffies;
274 int entries;
275
276 entries = atomic_inc_return(&tbl->entries) - 1;
277 if (entries >= tbl->gc_thresh3 ||
278 (entries >= tbl->gc_thresh2 &&
279 time_after(now, tbl->last_flush + 5 * HZ))) {
280 if (!neigh_forced_gc(tbl) &&
281 entries >= tbl->gc_thresh3)
282 goto out_entries;
283 }
284
YOSHIFUJI Hideaki / 吉藤英明08433ef2013-01-24 00:44:23 +0000285 n = kzalloc(tbl->entry_size + dev->neigh_priv_len, GFP_ATOMIC);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700286 if (!n)
287 goto out_entries;
288
Linus Torvalds1da177e2005-04-16 15:20:36 -0700289 skb_queue_head_init(&n->arp_queue);
290 rwlock_init(&n->lock);
Eric Dumazet0ed8ddf2010-10-07 10:44:07 +0000291 seqlock_init(&n->ha_lock);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700292 n->updated = n->used = now;
293 n->nud_state = NUD_NONE;
294 n->output = neigh_blackhole;
David S. Millerf6b72b62011-07-14 07:53:20 -0700295 seqlock_init(&n->hh.hh_lock);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700296 n->parms = neigh_parms_clone(&tbl->parms);
Pavel Emelyanovb24b8a22008-01-23 21:20:07 -0800297 setup_timer(&n->timer, neigh_timer_handler, (unsigned long)n);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700298
299 NEIGH_CACHE_STAT_INC(tbl, allocs);
300 n->tbl = tbl;
301 atomic_set(&n->refcnt, 1);
302 n->dead = 1;
303out:
304 return n;
305
306out_entries:
307 atomic_dec(&tbl->entries);
308 goto out;
309}
310
David S. Miller2c2aba62011-12-28 15:06:58 -0500311static void neigh_get_hash_rnd(u32 *x)
312{
313 get_random_bytes(x, sizeof(*x));
314 *x |= 1;
315}
316
David S. Millercd089332011-07-11 01:28:12 -0700317static struct neigh_hash_table *neigh_hash_alloc(unsigned int shift)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700318{
David S. Millercd089332011-07-11 01:28:12 -0700319 size_t size = (1 << shift) * sizeof(struct neighbour *);
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000320 struct neigh_hash_table *ret;
Eric Dumazet6193d2b2011-01-19 22:02:47 +0000321 struct neighbour __rcu **buckets;
David S. Miller2c2aba62011-12-28 15:06:58 -0500322 int i;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700323
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000324 ret = kmalloc(sizeof(*ret), GFP_ATOMIC);
325 if (!ret)
326 return NULL;
327 if (size <= PAGE_SIZE)
328 buckets = kzalloc(size, GFP_ATOMIC);
329 else
Eric Dumazet6193d2b2011-01-19 22:02:47 +0000330 buckets = (struct neighbour __rcu **)
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000331 __get_free_pages(GFP_ATOMIC | __GFP_ZERO,
332 get_order(size));
333 if (!buckets) {
334 kfree(ret);
335 return NULL;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700336 }
Eric Dumazet6193d2b2011-01-19 22:02:47 +0000337 ret->hash_buckets = buckets;
David S. Millercd089332011-07-11 01:28:12 -0700338 ret->hash_shift = shift;
David S. Miller2c2aba62011-12-28 15:06:58 -0500339 for (i = 0; i < NEIGH_NUM_HASH_RND; i++)
340 neigh_get_hash_rnd(&ret->hash_rnd[i]);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700341 return ret;
342}
343
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000344static void neigh_hash_free_rcu(struct rcu_head *head)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700345{
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000346 struct neigh_hash_table *nht = container_of(head,
347 struct neigh_hash_table,
348 rcu);
David S. Millercd089332011-07-11 01:28:12 -0700349 size_t size = (1 << nht->hash_shift) * sizeof(struct neighbour *);
Eric Dumazet6193d2b2011-01-19 22:02:47 +0000350 struct neighbour __rcu **buckets = nht->hash_buckets;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700351
352 if (size <= PAGE_SIZE)
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000353 kfree(buckets);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700354 else
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000355 free_pages((unsigned long)buckets, get_order(size));
356 kfree(nht);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700357}
358
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000359static struct neigh_hash_table *neigh_hash_grow(struct neigh_table *tbl,
David S. Millercd089332011-07-11 01:28:12 -0700360 unsigned long new_shift)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700361{
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000362 unsigned int i, hash;
363 struct neigh_hash_table *new_nht, *old_nht;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700364
365 NEIGH_CACHE_STAT_INC(tbl, hash_grows);
366
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000367 old_nht = rcu_dereference_protected(tbl->nht,
368 lockdep_is_held(&tbl->lock));
David S. Millercd089332011-07-11 01:28:12 -0700369 new_nht = neigh_hash_alloc(new_shift);
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000370 if (!new_nht)
371 return old_nht;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700372
David S. Millercd089332011-07-11 01:28:12 -0700373 for (i = 0; i < (1 << old_nht->hash_shift); i++) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700374 struct neighbour *n, *next;
375
Eric Dumazet767e97e2010-10-06 17:49:21 -0700376 for (n = rcu_dereference_protected(old_nht->hash_buckets[i],
377 lockdep_is_held(&tbl->lock));
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000378 n != NULL;
379 n = next) {
380 hash = tbl->hash(n->primary_key, n->dev,
381 new_nht->hash_rnd);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700382
David S. Millercd089332011-07-11 01:28:12 -0700383 hash >>= (32 - new_nht->hash_shift);
Eric Dumazet767e97e2010-10-06 17:49:21 -0700384 next = rcu_dereference_protected(n->next,
385 lockdep_is_held(&tbl->lock));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700386
Eric Dumazet767e97e2010-10-06 17:49:21 -0700387 rcu_assign_pointer(n->next,
388 rcu_dereference_protected(
389 new_nht->hash_buckets[hash],
390 lockdep_is_held(&tbl->lock)));
391 rcu_assign_pointer(new_nht->hash_buckets[hash], n);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700392 }
393 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700394
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000395 rcu_assign_pointer(tbl->nht, new_nht);
396 call_rcu(&old_nht->rcu, neigh_hash_free_rcu);
397 return new_nht;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700398}
399
400struct neighbour *neigh_lookup(struct neigh_table *tbl, const void *pkey,
401 struct net_device *dev)
402{
403 struct neighbour *n;
404 int key_len = tbl->key_len;
Pavel Emelyanovbc4bf5f2008-02-23 19:57:02 -0800405 u32 hash_val;
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000406 struct neigh_hash_table *nht;
YOSHIFUJI Hideaki4ec93ed2007-02-09 23:24:36 +0900407
Linus Torvalds1da177e2005-04-16 15:20:36 -0700408 NEIGH_CACHE_STAT_INC(tbl, lookups);
409
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000410 rcu_read_lock_bh();
411 nht = rcu_dereference_bh(tbl->nht);
David S. Millercd089332011-07-11 01:28:12 -0700412 hash_val = tbl->hash(pkey, dev, nht->hash_rnd) >> (32 - nht->hash_shift);
Eric Dumazet767e97e2010-10-06 17:49:21 -0700413
414 for (n = rcu_dereference_bh(nht->hash_buckets[hash_val]);
415 n != NULL;
416 n = rcu_dereference_bh(n->next)) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700417 if (dev == n->dev && !memcmp(n->primary_key, pkey, key_len)) {
Eric Dumazet767e97e2010-10-06 17:49:21 -0700418 if (!atomic_inc_not_zero(&n->refcnt))
419 n = NULL;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700420 NEIGH_CACHE_STAT_INC(tbl, hits);
421 break;
422 }
423 }
Eric Dumazet767e97e2010-10-06 17:49:21 -0700424
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000425 rcu_read_unlock_bh();
Linus Torvalds1da177e2005-04-16 15:20:36 -0700426 return n;
427}
YOSHIFUJI Hideaki0a204502008-03-24 18:39:10 +0900428EXPORT_SYMBOL(neigh_lookup);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700429
Eric W. Biederman426b5302008-01-24 00:13:18 -0800430struct neighbour *neigh_lookup_nodev(struct neigh_table *tbl, struct net *net,
431 const void *pkey)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700432{
433 struct neighbour *n;
434 int key_len = tbl->key_len;
Pavel Emelyanovbc4bf5f2008-02-23 19:57:02 -0800435 u32 hash_val;
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000436 struct neigh_hash_table *nht;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700437
438 NEIGH_CACHE_STAT_INC(tbl, lookups);
439
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000440 rcu_read_lock_bh();
441 nht = rcu_dereference_bh(tbl->nht);
David S. Millercd089332011-07-11 01:28:12 -0700442 hash_val = tbl->hash(pkey, NULL, nht->hash_rnd) >> (32 - nht->hash_shift);
Eric Dumazet767e97e2010-10-06 17:49:21 -0700443
444 for (n = rcu_dereference_bh(nht->hash_buckets[hash_val]);
445 n != NULL;
446 n = rcu_dereference_bh(n->next)) {
Eric W. Biederman426b5302008-01-24 00:13:18 -0800447 if (!memcmp(n->primary_key, pkey, key_len) &&
YOSHIFUJI Hideaki878628f2008-03-26 03:57:35 +0900448 net_eq(dev_net(n->dev), net)) {
Eric Dumazet767e97e2010-10-06 17:49:21 -0700449 if (!atomic_inc_not_zero(&n->refcnt))
450 n = NULL;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700451 NEIGH_CACHE_STAT_INC(tbl, hits);
452 break;
453 }
454 }
Eric Dumazet767e97e2010-10-06 17:49:21 -0700455
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000456 rcu_read_unlock_bh();
Linus Torvalds1da177e2005-04-16 15:20:36 -0700457 return n;
458}
YOSHIFUJI Hideaki0a204502008-03-24 18:39:10 +0900459EXPORT_SYMBOL(neigh_lookup_nodev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700460
David S. Millera263b302012-07-02 02:02:15 -0700461struct neighbour *__neigh_create(struct neigh_table *tbl, const void *pkey,
462 struct net_device *dev, bool want_ref)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700463{
464 u32 hash_val;
465 int key_len = tbl->key_len;
466 int error;
David Miller596b9b62011-07-25 00:01:25 +0000467 struct neighbour *n1, *rc, *n = neigh_alloc(tbl, dev);
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000468 struct neigh_hash_table *nht;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700469
470 if (!n) {
471 rc = ERR_PTR(-ENOBUFS);
472 goto out;
473 }
474
475 memcpy(n->primary_key, pkey, key_len);
476 n->dev = dev;
477 dev_hold(dev);
478
479 /* Protocol specific setup. */
480 if (tbl->constructor && (error = tbl->constructor(n)) < 0) {
481 rc = ERR_PTR(error);
482 goto out_neigh_release;
483 }
484
David Millerda6a8fa2011-07-25 00:01:38 +0000485 if (dev->netdev_ops->ndo_neigh_construct) {
486 error = dev->netdev_ops->ndo_neigh_construct(n);
487 if (error < 0) {
488 rc = ERR_PTR(error);
489 goto out_neigh_release;
490 }
491 }
492
David S. Miller447f2192011-12-19 15:04:41 -0500493 /* Device specific setup. */
494 if (n->parms->neigh_setup &&
495 (error = n->parms->neigh_setup(n)) < 0) {
496 rc = ERR_PTR(error);
497 goto out_neigh_release;
498 }
499
Linus Torvalds1da177e2005-04-16 15:20:36 -0700500 n->confirmed = jiffies - (n->parms->base_reachable_time << 1);
501
502 write_lock_bh(&tbl->lock);
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000503 nht = rcu_dereference_protected(tbl->nht,
504 lockdep_is_held(&tbl->lock));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700505
David S. Millercd089332011-07-11 01:28:12 -0700506 if (atomic_read(&tbl->entries) > (1 << nht->hash_shift))
507 nht = neigh_hash_grow(tbl, nht->hash_shift + 1);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700508
David S. Millercd089332011-07-11 01:28:12 -0700509 hash_val = tbl->hash(pkey, dev, nht->hash_rnd) >> (32 - nht->hash_shift);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700510
511 if (n->parms->dead) {
512 rc = ERR_PTR(-EINVAL);
513 goto out_tbl_unlock;
514 }
515
Eric Dumazet767e97e2010-10-06 17:49:21 -0700516 for (n1 = rcu_dereference_protected(nht->hash_buckets[hash_val],
517 lockdep_is_held(&tbl->lock));
518 n1 != NULL;
519 n1 = rcu_dereference_protected(n1->next,
520 lockdep_is_held(&tbl->lock))) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700521 if (dev == n1->dev && !memcmp(n1->primary_key, pkey, key_len)) {
David S. Millera263b302012-07-02 02:02:15 -0700522 if (want_ref)
523 neigh_hold(n1);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700524 rc = n1;
525 goto out_tbl_unlock;
526 }
527 }
528
Linus Torvalds1da177e2005-04-16 15:20:36 -0700529 n->dead = 0;
David S. Millera263b302012-07-02 02:02:15 -0700530 if (want_ref)
531 neigh_hold(n);
Eric Dumazet767e97e2010-10-06 17:49:21 -0700532 rcu_assign_pointer(n->next,
533 rcu_dereference_protected(nht->hash_buckets[hash_val],
534 lockdep_is_held(&tbl->lock)));
535 rcu_assign_pointer(nht->hash_buckets[hash_val], n);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700536 write_unlock_bh(&tbl->lock);
Joe Perchesd5d427c2013-04-15 15:17:19 +0000537 neigh_dbg(2, "neigh %p is created\n", n);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700538 rc = n;
539out:
540 return rc;
541out_tbl_unlock:
542 write_unlock_bh(&tbl->lock);
543out_neigh_release:
544 neigh_release(n);
545 goto out;
546}
David S. Millera263b302012-07-02 02:02:15 -0700547EXPORT_SYMBOL(__neigh_create);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700548
YOSHIFUJI Hideakibe01d652008-03-28 12:46:53 +0900549static u32 pneigh_hash(const void *pkey, int key_len)
Pavel Emelyanovfa86d322008-03-24 14:48:59 -0700550{
Pavel Emelyanovfa86d322008-03-24 14:48:59 -0700551 u32 hash_val = *(u32 *)(pkey + key_len - 4);
Pavel Emelyanovfa86d322008-03-24 14:48:59 -0700552 hash_val ^= (hash_val >> 16);
553 hash_val ^= hash_val >> 8;
554 hash_val ^= hash_val >> 4;
555 hash_val &= PNEIGH_HASHMASK;
YOSHIFUJI Hideakibe01d652008-03-28 12:46:53 +0900556 return hash_val;
557}
Pavel Emelyanovfa86d322008-03-24 14:48:59 -0700558
YOSHIFUJI Hideakibe01d652008-03-28 12:46:53 +0900559static struct pneigh_entry *__pneigh_lookup_1(struct pneigh_entry *n,
560 struct net *net,
561 const void *pkey,
562 int key_len,
563 struct net_device *dev)
564{
565 while (n) {
Pavel Emelyanovfa86d322008-03-24 14:48:59 -0700566 if (!memcmp(n->key, pkey, key_len) &&
YOSHIFUJI Hideakibe01d652008-03-28 12:46:53 +0900567 net_eq(pneigh_net(n), net) &&
Pavel Emelyanovfa86d322008-03-24 14:48:59 -0700568 (n->dev == dev || !n->dev))
YOSHIFUJI Hideakibe01d652008-03-28 12:46:53 +0900569 return n;
570 n = n->next;
Pavel Emelyanovfa86d322008-03-24 14:48:59 -0700571 }
YOSHIFUJI Hideakibe01d652008-03-28 12:46:53 +0900572 return NULL;
573}
Pavel Emelyanovfa86d322008-03-24 14:48:59 -0700574
YOSHIFUJI Hideakibe01d652008-03-28 12:46:53 +0900575struct pneigh_entry *__pneigh_lookup(struct neigh_table *tbl,
576 struct net *net, const void *pkey, struct net_device *dev)
577{
578 int key_len = tbl->key_len;
579 u32 hash_val = pneigh_hash(pkey, key_len);
580
581 return __pneigh_lookup_1(tbl->phash_buckets[hash_val],
582 net, pkey, key_len, dev);
Pavel Emelyanovfa86d322008-03-24 14:48:59 -0700583}
YOSHIFUJI Hideaki0a204502008-03-24 18:39:10 +0900584EXPORT_SYMBOL_GPL(__pneigh_lookup);
Pavel Emelyanovfa86d322008-03-24 14:48:59 -0700585
Eric W. Biederman426b5302008-01-24 00:13:18 -0800586struct pneigh_entry * pneigh_lookup(struct neigh_table *tbl,
587 struct net *net, const void *pkey,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700588 struct net_device *dev, int creat)
589{
590 struct pneigh_entry *n;
591 int key_len = tbl->key_len;
YOSHIFUJI Hideakibe01d652008-03-28 12:46:53 +0900592 u32 hash_val = pneigh_hash(pkey, key_len);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700593
594 read_lock_bh(&tbl->lock);
YOSHIFUJI Hideakibe01d652008-03-28 12:46:53 +0900595 n = __pneigh_lookup_1(tbl->phash_buckets[hash_val],
596 net, pkey, key_len, dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700597 read_unlock_bh(&tbl->lock);
YOSHIFUJI Hideakibe01d652008-03-28 12:46:53 +0900598
599 if (n || !creat)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700600 goto out;
601
Pavel Emelyanov4ae28942007-10-15 12:54:15 -0700602 ASSERT_RTNL();
603
Linus Torvalds1da177e2005-04-16 15:20:36 -0700604 n = kmalloc(sizeof(*n) + key_len, GFP_KERNEL);
605 if (!n)
606 goto out;
607
Eric Dumazete42ea982008-11-12 00:54:54 -0800608 write_pnet(&n->net, hold_net(net));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700609 memcpy(n->key, pkey, key_len);
610 n->dev = dev;
611 if (dev)
612 dev_hold(dev);
613
614 if (tbl->pconstructor && tbl->pconstructor(n)) {
615 if (dev)
616 dev_put(dev);
Denis V. Lunevda12f732008-02-20 00:26:16 -0800617 release_net(net);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700618 kfree(n);
619 n = NULL;
620 goto out;
621 }
622
623 write_lock_bh(&tbl->lock);
624 n->next = tbl->phash_buckets[hash_val];
625 tbl->phash_buckets[hash_val] = n;
626 write_unlock_bh(&tbl->lock);
627out:
628 return n;
629}
YOSHIFUJI Hideaki0a204502008-03-24 18:39:10 +0900630EXPORT_SYMBOL(pneigh_lookup);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700631
632
Eric W. Biederman426b5302008-01-24 00:13:18 -0800633int pneigh_delete(struct neigh_table *tbl, struct net *net, const void *pkey,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700634 struct net_device *dev)
635{
636 struct pneigh_entry *n, **np;
637 int key_len = tbl->key_len;
YOSHIFUJI Hideakibe01d652008-03-28 12:46:53 +0900638 u32 hash_val = pneigh_hash(pkey, key_len);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700639
640 write_lock_bh(&tbl->lock);
641 for (np = &tbl->phash_buckets[hash_val]; (n = *np) != NULL;
642 np = &n->next) {
Eric W. Biederman426b5302008-01-24 00:13:18 -0800643 if (!memcmp(n->key, pkey, key_len) && n->dev == dev &&
YOSHIFUJI Hideaki878628f2008-03-26 03:57:35 +0900644 net_eq(pneigh_net(n), net)) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700645 *np = n->next;
646 write_unlock_bh(&tbl->lock);
647 if (tbl->pdestructor)
648 tbl->pdestructor(n);
649 if (n->dev)
650 dev_put(n->dev);
YOSHIFUJI Hideaki57da52c2008-03-26 03:49:59 +0900651 release_net(pneigh_net(n));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700652 kfree(n);
653 return 0;
654 }
655 }
656 write_unlock_bh(&tbl->lock);
657 return -ENOENT;
658}
659
660static int pneigh_ifdown(struct neigh_table *tbl, struct net_device *dev)
661{
662 struct pneigh_entry *n, **np;
663 u32 h;
664
665 for (h = 0; h <= PNEIGH_HASHMASK; h++) {
666 np = &tbl->phash_buckets[h];
667 while ((n = *np) != NULL) {
668 if (!dev || n->dev == dev) {
669 *np = n->next;
670 if (tbl->pdestructor)
671 tbl->pdestructor(n);
672 if (n->dev)
673 dev_put(n->dev);
YOSHIFUJI Hideaki57da52c2008-03-26 03:49:59 +0900674 release_net(pneigh_net(n));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700675 kfree(n);
676 continue;
677 }
678 np = &n->next;
679 }
680 }
681 return -ENOENT;
682}
683
Denis V. Lunev06f05112008-01-24 00:30:58 -0800684static void neigh_parms_destroy(struct neigh_parms *parms);
685
686static inline void neigh_parms_put(struct neigh_parms *parms)
687{
688 if (atomic_dec_and_test(&parms->refcnt))
689 neigh_parms_destroy(parms);
690}
Linus Torvalds1da177e2005-04-16 15:20:36 -0700691
692/*
693 * neighbour must already be out of the table;
694 *
695 */
696void neigh_destroy(struct neighbour *neigh)
697{
David Millerda6a8fa2011-07-25 00:01:38 +0000698 struct net_device *dev = neigh->dev;
699
Linus Torvalds1da177e2005-04-16 15:20:36 -0700700 NEIGH_CACHE_STAT_INC(neigh->tbl, destroys);
701
702 if (!neigh->dead) {
Joe Perchese005d192012-05-16 19:58:40 +0000703 pr_warn("Destroying alive neighbour %p\n", neigh);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700704 dump_stack();
705 return;
706 }
707
708 if (neigh_del_timer(neigh))
Joe Perchese005d192012-05-16 19:58:40 +0000709 pr_warn("Impossible event\n");
Linus Torvalds1da177e2005-04-16 15:20:36 -0700710
Linus Torvalds1da177e2005-04-16 15:20:36 -0700711 skb_queue_purge(&neigh->arp_queue);
Eric Dumazet8b5c1712011-11-09 12:07:14 +0000712 neigh->arp_queue_len_bytes = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700713
David S. Miller447f2192011-12-19 15:04:41 -0500714 if (dev->netdev_ops->ndo_neigh_destroy)
715 dev->netdev_ops->ndo_neigh_destroy(neigh);
716
David Millerda6a8fa2011-07-25 00:01:38 +0000717 dev_put(dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700718 neigh_parms_put(neigh->parms);
719
Joe Perchesd5d427c2013-04-15 15:17:19 +0000720 neigh_dbg(2, "neigh %p is destroyed\n", neigh);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700721
722 atomic_dec(&neigh->tbl->entries);
David Miller5b8b0062011-07-25 00:01:22 +0000723 kfree_rcu(neigh, rcu);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700724}
YOSHIFUJI Hideaki0a204502008-03-24 18:39:10 +0900725EXPORT_SYMBOL(neigh_destroy);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700726
727/* Neighbour state is suspicious;
728 disable fast path.
729
730 Called with write_locked neigh.
731 */
732static void neigh_suspect(struct neighbour *neigh)
733{
Joe Perchesd5d427c2013-04-15 15:17:19 +0000734 neigh_dbg(2, "neigh %p is suspected\n", neigh);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700735
736 neigh->output = neigh->ops->output;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700737}
738
739/* Neighbour state is OK;
740 enable fast path.
741
742 Called with write_locked neigh.
743 */
744static void neigh_connect(struct neighbour *neigh)
745{
Joe Perchesd5d427c2013-04-15 15:17:19 +0000746 neigh_dbg(2, "neigh %p is connected\n", neigh);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700747
748 neigh->output = neigh->ops->connected_output;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700749}
750
Eric Dumazete4c4e442009-07-30 03:15:07 +0000751static void neigh_periodic_work(struct work_struct *work)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700752{
Eric Dumazete4c4e442009-07-30 03:15:07 +0000753 struct neigh_table *tbl = container_of(work, struct neigh_table, gc_work.work);
Eric Dumazet767e97e2010-10-06 17:49:21 -0700754 struct neighbour *n;
755 struct neighbour __rcu **np;
Eric Dumazete4c4e442009-07-30 03:15:07 +0000756 unsigned int i;
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000757 struct neigh_hash_table *nht;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700758
759 NEIGH_CACHE_STAT_INC(tbl, periodic_gc_runs);
760
Eric Dumazete4c4e442009-07-30 03:15:07 +0000761 write_lock_bh(&tbl->lock);
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000762 nht = rcu_dereference_protected(tbl->nht,
763 lockdep_is_held(&tbl->lock));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700764
YOSHIFUJI Hideaki / 吉藤英明27246802013-01-22 05:20:05 +0000765 if (atomic_read(&tbl->entries) < tbl->gc_thresh1)
766 goto out;
767
Linus Torvalds1da177e2005-04-16 15:20:36 -0700768 /*
769 * periodically recompute ReachableTime from random function
770 */
771
Eric Dumazete4c4e442009-07-30 03:15:07 +0000772 if (time_after(jiffies, tbl->last_rand + 300 * HZ)) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700773 struct neigh_parms *p;
Eric Dumazete4c4e442009-07-30 03:15:07 +0000774 tbl->last_rand = jiffies;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700775 for (p = &tbl->parms; p; p = p->next)
776 p->reachable_time =
777 neigh_rand_reach_time(p->base_reachable_time);
778 }
779
David S. Millercd089332011-07-11 01:28:12 -0700780 for (i = 0 ; i < (1 << nht->hash_shift); i++) {
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000781 np = &nht->hash_buckets[i];
Linus Torvalds1da177e2005-04-16 15:20:36 -0700782
Eric Dumazet767e97e2010-10-06 17:49:21 -0700783 while ((n = rcu_dereference_protected(*np,
784 lockdep_is_held(&tbl->lock))) != NULL) {
Eric Dumazete4c4e442009-07-30 03:15:07 +0000785 unsigned int state;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700786
Eric Dumazete4c4e442009-07-30 03:15:07 +0000787 write_lock(&n->lock);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700788
Eric Dumazete4c4e442009-07-30 03:15:07 +0000789 state = n->nud_state;
790 if (state & (NUD_PERMANENT | NUD_IN_TIMER)) {
791 write_unlock(&n->lock);
792 goto next_elt;
793 }
794
795 if (time_before(n->used, n->confirmed))
796 n->used = n->confirmed;
797
798 if (atomic_read(&n->refcnt) == 1 &&
799 (state == NUD_FAILED ||
800 time_after(jiffies, n->used + n->parms->gc_staletime))) {
801 *np = n->next;
802 n->dead = 1;
803 write_unlock(&n->lock);
804 neigh_cleanup_and_release(n);
805 continue;
806 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700807 write_unlock(&n->lock);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700808
809next_elt:
Eric Dumazete4c4e442009-07-30 03:15:07 +0000810 np = &n->next;
811 }
812 /*
813 * It's fine to release lock here, even if hash table
814 * grows while we are preempted.
815 */
816 write_unlock_bh(&tbl->lock);
817 cond_resched();
818 write_lock_bh(&tbl->lock);
Michel Machado84338a62012-02-21 16:04:13 -0500819 nht = rcu_dereference_protected(tbl->nht,
820 lockdep_is_held(&tbl->lock));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700821 }
YOSHIFUJI Hideaki / 吉藤英明27246802013-01-22 05:20:05 +0000822out:
YOSHIFUJI Hideaki4ec93ed2007-02-09 23:24:36 +0900823 /* Cycle through all hash buckets every base_reachable_time/2 ticks.
824 * ARP entry timeouts range from 1/2 base_reachable_time to 3/2
825 * base_reachable_time.
Linus Torvalds1da177e2005-04-16 15:20:36 -0700826 */
Eric Dumazete4c4e442009-07-30 03:15:07 +0000827 schedule_delayed_work(&tbl->gc_work,
828 tbl->parms.base_reachable_time >> 1);
829 write_unlock_bh(&tbl->lock);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700830}
831
832static __inline__ int neigh_max_probes(struct neighbour *n)
833{
834 struct neigh_parms *p = n->parms;
Eric Dumazeta02cec22010-09-22 20:43:57 +0000835 return (n->nud_state & NUD_PROBE) ?
Linus Torvalds1da177e2005-04-16 15:20:36 -0700836 p->ucast_probes :
Eric Dumazeta02cec22010-09-22 20:43:57 +0000837 p->ucast_probes + p->app_probes + p->mcast_probes;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700838}
839
Timo Teras5ef12d92009-06-11 04:16:28 -0700840static void neigh_invalidate(struct neighbour *neigh)
Eric Dumazet0a141502010-03-09 19:40:54 +0000841 __releases(neigh->lock)
842 __acquires(neigh->lock)
Timo Teras5ef12d92009-06-11 04:16:28 -0700843{
844 struct sk_buff *skb;
845
846 NEIGH_CACHE_STAT_INC(neigh->tbl, res_failed);
Joe Perchesd5d427c2013-04-15 15:17:19 +0000847 neigh_dbg(2, "neigh %p is failed\n", neigh);
Timo Teras5ef12d92009-06-11 04:16:28 -0700848 neigh->updated = jiffies;
849
850 /* It is very thin place. report_unreachable is very complicated
851 routine. Particularly, it can hit the same neighbour entry!
852
853 So that, we try to be accurate and avoid dead loop. --ANK
854 */
855 while (neigh->nud_state == NUD_FAILED &&
856 (skb = __skb_dequeue(&neigh->arp_queue)) != NULL) {
857 write_unlock(&neigh->lock);
858 neigh->ops->error_report(neigh, skb);
859 write_lock(&neigh->lock);
860 }
861 skb_queue_purge(&neigh->arp_queue);
Eric Dumazet8b5c1712011-11-09 12:07:14 +0000862 neigh->arp_queue_len_bytes = 0;
Timo Teras5ef12d92009-06-11 04:16:28 -0700863}
864
Eric Dumazetcd28ca02011-08-09 08:15:58 +0000865static void neigh_probe(struct neighbour *neigh)
866 __releases(neigh->lock)
867{
868 struct sk_buff *skb = skb_peek(&neigh->arp_queue);
869 /* keep skb alive even if arp_queue overflows */
870 if (skb)
871 skb = skb_copy(skb, GFP_ATOMIC);
872 write_unlock(&neigh->lock);
873 neigh->ops->solicit(neigh, skb);
874 atomic_inc(&neigh->probes);
875 kfree_skb(skb);
876}
877
Linus Torvalds1da177e2005-04-16 15:20:36 -0700878/* Called when a timer expires for a neighbour entry. */
879
880static void neigh_timer_handler(unsigned long arg)
881{
882 unsigned long now, next;
883 struct neighbour *neigh = (struct neighbour *)arg;
Eric Dumazet95c96172012-04-15 05:58:06 +0000884 unsigned int state;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700885 int notify = 0;
886
887 write_lock(&neigh->lock);
888
889 state = neigh->nud_state;
890 now = jiffies;
891 next = now + HZ;
892
David S. Miller045f7b32011-11-01 17:45:55 -0400893 if (!(state & NUD_IN_TIMER))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700894 goto out;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700895
896 if (state & NUD_REACHABLE) {
YOSHIFUJI Hideaki4ec93ed2007-02-09 23:24:36 +0900897 if (time_before_eq(now,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700898 neigh->confirmed + neigh->parms->reachable_time)) {
Joe Perchesd5d427c2013-04-15 15:17:19 +0000899 neigh_dbg(2, "neigh %p is still alive\n", neigh);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700900 next = neigh->confirmed + neigh->parms->reachable_time;
901 } else if (time_before_eq(now,
902 neigh->used + neigh->parms->delay_probe_time)) {
Joe Perchesd5d427c2013-04-15 15:17:19 +0000903 neigh_dbg(2, "neigh %p is delayed\n", neigh);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700904 neigh->nud_state = NUD_DELAY;
YOSHIFUJI Hideaki955aaa22006-03-20 16:52:52 -0800905 neigh->updated = jiffies;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700906 neigh_suspect(neigh);
907 next = now + neigh->parms->delay_probe_time;
908 } else {
Joe Perchesd5d427c2013-04-15 15:17:19 +0000909 neigh_dbg(2, "neigh %p is suspected\n", neigh);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700910 neigh->nud_state = NUD_STALE;
YOSHIFUJI Hideaki955aaa22006-03-20 16:52:52 -0800911 neigh->updated = jiffies;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700912 neigh_suspect(neigh);
Tom Tucker8d717402006-07-30 20:43:36 -0700913 notify = 1;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700914 }
915 } else if (state & NUD_DELAY) {
YOSHIFUJI Hideaki4ec93ed2007-02-09 23:24:36 +0900916 if (time_before_eq(now,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700917 neigh->confirmed + neigh->parms->delay_probe_time)) {
Joe Perchesd5d427c2013-04-15 15:17:19 +0000918 neigh_dbg(2, "neigh %p is now reachable\n", neigh);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700919 neigh->nud_state = NUD_REACHABLE;
YOSHIFUJI Hideaki955aaa22006-03-20 16:52:52 -0800920 neigh->updated = jiffies;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700921 neigh_connect(neigh);
Tom Tucker8d717402006-07-30 20:43:36 -0700922 notify = 1;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700923 next = neigh->confirmed + neigh->parms->reachable_time;
924 } else {
Joe Perchesd5d427c2013-04-15 15:17:19 +0000925 neigh_dbg(2, "neigh %p is probed\n", neigh);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700926 neigh->nud_state = NUD_PROBE;
YOSHIFUJI Hideaki955aaa22006-03-20 16:52:52 -0800927 neigh->updated = jiffies;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700928 atomic_set(&neigh->probes, 0);
929 next = now + neigh->parms->retrans_time;
930 }
931 } else {
932 /* NUD_PROBE|NUD_INCOMPLETE */
933 next = now + neigh->parms->retrans_time;
934 }
935
936 if ((neigh->nud_state & (NUD_INCOMPLETE | NUD_PROBE)) &&
937 atomic_read(&neigh->probes) >= neigh_max_probes(neigh)) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700938 neigh->nud_state = NUD_FAILED;
939 notify = 1;
Timo Teras5ef12d92009-06-11 04:16:28 -0700940 neigh_invalidate(neigh);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700941 }
942
943 if (neigh->nud_state & NUD_IN_TIMER) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700944 if (time_before(next, jiffies + HZ/2))
945 next = jiffies + HZ/2;
Herbert Xu6fb99742005-10-23 16:37:48 +1000946 if (!mod_timer(&neigh->timer, next))
947 neigh_hold(neigh);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700948 }
949 if (neigh->nud_state & (NUD_INCOMPLETE | NUD_PROBE)) {
Eric Dumazetcd28ca02011-08-09 08:15:58 +0000950 neigh_probe(neigh);
David S. Miller9ff56602008-02-17 18:39:54 -0800951 } else {
David S. Miller69cc64d2008-02-11 21:45:44 -0800952out:
David S. Miller9ff56602008-02-17 18:39:54 -0800953 write_unlock(&neigh->lock);
954 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700955
Thomas Grafd961db32007-08-08 23:12:56 -0700956 if (notify)
957 neigh_update_notify(neigh);
958
Linus Torvalds1da177e2005-04-16 15:20:36 -0700959 neigh_release(neigh);
960}
961
962int __neigh_event_send(struct neighbour *neigh, struct sk_buff *skb)
963{
964 int rc;
Eric Dumazetcd28ca02011-08-09 08:15:58 +0000965 bool immediate_probe = false;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700966
967 write_lock_bh(&neigh->lock);
968
969 rc = 0;
970 if (neigh->nud_state & (NUD_CONNECTED | NUD_DELAY | NUD_PROBE))
971 goto out_unlock_bh;
972
Linus Torvalds1da177e2005-04-16 15:20:36 -0700973 if (!(neigh->nud_state & (NUD_STALE | NUD_INCOMPLETE))) {
974 if (neigh->parms->mcast_probes + neigh->parms->app_probes) {
Eric Dumazetcd28ca02011-08-09 08:15:58 +0000975 unsigned long next, now = jiffies;
976
Linus Torvalds1da177e2005-04-16 15:20:36 -0700977 atomic_set(&neigh->probes, neigh->parms->ucast_probes);
978 neigh->nud_state = NUD_INCOMPLETE;
Eric Dumazetcd28ca02011-08-09 08:15:58 +0000979 neigh->updated = now;
980 next = now + max(neigh->parms->retrans_time, HZ/2);
981 neigh_add_timer(neigh, next);
982 immediate_probe = true;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700983 } else {
984 neigh->nud_state = NUD_FAILED;
YOSHIFUJI Hideaki955aaa22006-03-20 16:52:52 -0800985 neigh->updated = jiffies;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700986 write_unlock_bh(&neigh->lock);
987
Wei Yongjunf3fbbe02009-02-25 00:37:32 +0000988 kfree_skb(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700989 return 1;
990 }
991 } else if (neigh->nud_state & NUD_STALE) {
Joe Perchesd5d427c2013-04-15 15:17:19 +0000992 neigh_dbg(2, "neigh %p is delayed\n", neigh);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700993 neigh->nud_state = NUD_DELAY;
YOSHIFUJI Hideaki955aaa22006-03-20 16:52:52 -0800994 neigh->updated = jiffies;
David S. Miller667347f2005-09-27 12:07:44 -0700995 neigh_add_timer(neigh,
996 jiffies + neigh->parms->delay_probe_time);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700997 }
998
999 if (neigh->nud_state == NUD_INCOMPLETE) {
1000 if (skb) {
Eric Dumazet8b5c1712011-11-09 12:07:14 +00001001 while (neigh->arp_queue_len_bytes + skb->truesize >
1002 neigh->parms->queue_len_bytes) {
Linus Torvalds1da177e2005-04-16 15:20:36 -07001003 struct sk_buff *buff;
Eric Dumazet8b5c1712011-11-09 12:07:14 +00001004
David S. Millerf72051b2008-09-23 01:11:18 -07001005 buff = __skb_dequeue(&neigh->arp_queue);
Eric Dumazet8b5c1712011-11-09 12:07:14 +00001006 if (!buff)
1007 break;
1008 neigh->arp_queue_len_bytes -= buff->truesize;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001009 kfree_skb(buff);
Neil Horman9a6d2762008-07-16 20:50:49 -07001010 NEIGH_CACHE_STAT_INC(neigh->tbl, unres_discards);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001011 }
Eric Dumazeta4731132010-05-27 16:09:39 -07001012 skb_dst_force(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001013 __skb_queue_tail(&neigh->arp_queue, skb);
Eric Dumazet8b5c1712011-11-09 12:07:14 +00001014 neigh->arp_queue_len_bytes += skb->truesize;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001015 }
1016 rc = 1;
1017 }
1018out_unlock_bh:
Eric Dumazetcd28ca02011-08-09 08:15:58 +00001019 if (immediate_probe)
1020 neigh_probe(neigh);
1021 else
1022 write_unlock(&neigh->lock);
1023 local_bh_enable();
Linus Torvalds1da177e2005-04-16 15:20:36 -07001024 return rc;
1025}
YOSHIFUJI Hideaki0a204502008-03-24 18:39:10 +09001026EXPORT_SYMBOL(__neigh_event_send);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001027
David S. Millerf6b72b62011-07-14 07:53:20 -07001028static void neigh_update_hhs(struct neighbour *neigh)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001029{
1030 struct hh_cache *hh;
Stephen Hemminger3b04ddd2007-10-09 01:40:57 -07001031 void (*update)(struct hh_cache*, const struct net_device*, const unsigned char *)
Doug Kehn91a72a72010-07-14 18:02:16 -07001032 = NULL;
1033
1034 if (neigh->dev->header_ops)
1035 update = neigh->dev->header_ops->cache_update;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001036
1037 if (update) {
David S. Millerf6b72b62011-07-14 07:53:20 -07001038 hh = &neigh->hh;
1039 if (hh->hh_len) {
Stephen Hemminger3644f0c2006-12-07 15:08:17 -08001040 write_seqlock_bh(&hh->hh_lock);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001041 update(hh, neigh->dev, neigh->ha);
Stephen Hemminger3644f0c2006-12-07 15:08:17 -08001042 write_sequnlock_bh(&hh->hh_lock);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001043 }
1044 }
1045}
1046
1047
1048
1049/* Generic update routine.
1050 -- lladdr is new lladdr or NULL, if it is not supplied.
1051 -- new is new state.
1052 -- flags
1053 NEIGH_UPDATE_F_OVERRIDE allows to override existing lladdr,
1054 if it is different.
1055 NEIGH_UPDATE_F_WEAK_OVERRIDE will suspect existing "connected"
YOSHIFUJI Hideaki4ec93ed2007-02-09 23:24:36 +09001056 lladdr instead of overriding it
Linus Torvalds1da177e2005-04-16 15:20:36 -07001057 if it is different.
1058 It also allows to retain current state
1059 if lladdr is unchanged.
1060 NEIGH_UPDATE_F_ADMIN means that the change is administrative.
1061
YOSHIFUJI Hideaki4ec93ed2007-02-09 23:24:36 +09001062 NEIGH_UPDATE_F_OVERRIDE_ISROUTER allows to override existing
Linus Torvalds1da177e2005-04-16 15:20:36 -07001063 NTF_ROUTER flag.
1064 NEIGH_UPDATE_F_ISROUTER indicates if the neighbour is known as
1065 a router.
1066
1067 Caller MUST hold reference count on the entry.
1068 */
1069
1070int neigh_update(struct neighbour *neigh, const u8 *lladdr, u8 new,
1071 u32 flags)
1072{
1073 u8 old;
1074 int err;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001075 int notify = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001076 struct net_device *dev;
1077 int update_isrouter = 0;
1078
1079 write_lock_bh(&neigh->lock);
1080
1081 dev = neigh->dev;
1082 old = neigh->nud_state;
1083 err = -EPERM;
1084
YOSHIFUJI Hideaki4ec93ed2007-02-09 23:24:36 +09001085 if (!(flags & NEIGH_UPDATE_F_ADMIN) &&
Linus Torvalds1da177e2005-04-16 15:20:36 -07001086 (old & (NUD_NOARP | NUD_PERMANENT)))
1087 goto out;
1088
1089 if (!(new & NUD_VALID)) {
1090 neigh_del_timer(neigh);
1091 if (old & NUD_CONNECTED)
1092 neigh_suspect(neigh);
1093 neigh->nud_state = new;
1094 err = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001095 notify = old & NUD_VALID;
Timo Teras5ef12d92009-06-11 04:16:28 -07001096 if ((old & (NUD_INCOMPLETE | NUD_PROBE)) &&
1097 (new & NUD_FAILED)) {
1098 neigh_invalidate(neigh);
1099 notify = 1;
1100 }
Linus Torvalds1da177e2005-04-16 15:20:36 -07001101 goto out;
1102 }
1103
1104 /* Compare new lladdr with cached one */
1105 if (!dev->addr_len) {
1106 /* First case: device needs no address. */
1107 lladdr = neigh->ha;
1108 } else if (lladdr) {
1109 /* The second case: if something is already cached
1110 and a new address is proposed:
1111 - compare new & old
1112 - if they are different, check override flag
1113 */
YOSHIFUJI Hideaki4ec93ed2007-02-09 23:24:36 +09001114 if ((old & NUD_VALID) &&
Linus Torvalds1da177e2005-04-16 15:20:36 -07001115 !memcmp(lladdr, neigh->ha, dev->addr_len))
1116 lladdr = neigh->ha;
1117 } else {
1118 /* No address is supplied; if we know something,
1119 use it, otherwise discard the request.
1120 */
1121 err = -EINVAL;
1122 if (!(old & NUD_VALID))
1123 goto out;
1124 lladdr = neigh->ha;
1125 }
1126
1127 if (new & NUD_CONNECTED)
1128 neigh->confirmed = jiffies;
1129 neigh->updated = jiffies;
1130
1131 /* If entry was valid and address is not changed,
1132 do not change entry state, if new one is STALE.
1133 */
1134 err = 0;
1135 update_isrouter = flags & NEIGH_UPDATE_F_OVERRIDE_ISROUTER;
1136 if (old & NUD_VALID) {
1137 if (lladdr != neigh->ha && !(flags & NEIGH_UPDATE_F_OVERRIDE)) {
1138 update_isrouter = 0;
1139 if ((flags & NEIGH_UPDATE_F_WEAK_OVERRIDE) &&
1140 (old & NUD_CONNECTED)) {
1141 lladdr = neigh->ha;
1142 new = NUD_STALE;
1143 } else
1144 goto out;
1145 } else {
1146 if (lladdr == neigh->ha && new == NUD_STALE &&
1147 ((flags & NEIGH_UPDATE_F_WEAK_OVERRIDE) ||
1148 (old & NUD_CONNECTED))
1149 )
1150 new = old;
1151 }
1152 }
1153
1154 if (new != old) {
1155 neigh_del_timer(neigh);
Pavel Emelyanova43d8992007-12-20 15:49:05 -08001156 if (new & NUD_IN_TIMER)
YOSHIFUJI Hideaki4ec93ed2007-02-09 23:24:36 +09001157 neigh_add_timer(neigh, (jiffies +
1158 ((new & NUD_REACHABLE) ?
David S. Miller667347f2005-09-27 12:07:44 -07001159 neigh->parms->reachable_time :
1160 0)));
Linus Torvalds1da177e2005-04-16 15:20:36 -07001161 neigh->nud_state = new;
1162 }
1163
1164 if (lladdr != neigh->ha) {
Eric Dumazet0ed8ddf2010-10-07 10:44:07 +00001165 write_seqlock(&neigh->ha_lock);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001166 memcpy(&neigh->ha, lladdr, dev->addr_len);
Eric Dumazet0ed8ddf2010-10-07 10:44:07 +00001167 write_sequnlock(&neigh->ha_lock);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001168 neigh_update_hhs(neigh);
1169 if (!(new & NUD_CONNECTED))
1170 neigh->confirmed = jiffies -
1171 (neigh->parms->base_reachable_time << 1);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001172 notify = 1;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001173 }
1174 if (new == old)
1175 goto out;
1176 if (new & NUD_CONNECTED)
1177 neigh_connect(neigh);
1178 else
1179 neigh_suspect(neigh);
1180 if (!(old & NUD_VALID)) {
1181 struct sk_buff *skb;
1182
1183 /* Again: avoid dead loop if something went wrong */
1184
1185 while (neigh->nud_state & NUD_VALID &&
1186 (skb = __skb_dequeue(&neigh->arp_queue)) != NULL) {
David S. Miller69cce1d2011-07-17 23:09:49 -07001187 struct dst_entry *dst = skb_dst(skb);
1188 struct neighbour *n2, *n1 = neigh;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001189 write_unlock_bh(&neigh->lock);
roy.qing.li@gmail.come049f282011-10-17 22:32:42 +00001190
1191 rcu_read_lock();
David S. Miller13a43d92012-07-02 22:15:37 -07001192
1193 /* Why not just use 'neigh' as-is? The problem is that
1194 * things such as shaper, eql, and sch_teql can end up
1195 * using alternative, different, neigh objects to output
1196 * the packet in the output path. So what we need to do
1197 * here is re-lookup the top-level neigh in the path so
1198 * we can reinject the packet there.
1199 */
1200 n2 = NULL;
1201 if (dst) {
1202 n2 = dst_neigh_lookup_skb(dst, skb);
1203 if (n2)
1204 n1 = n2;
1205 }
David S. Miller8f40b162011-07-17 13:34:11 -07001206 n1->output(n1, skb);
David S. Miller13a43d92012-07-02 22:15:37 -07001207 if (n2)
1208 neigh_release(n2);
roy.qing.li@gmail.come049f282011-10-17 22:32:42 +00001209 rcu_read_unlock();
1210
Linus Torvalds1da177e2005-04-16 15:20:36 -07001211 write_lock_bh(&neigh->lock);
1212 }
1213 skb_queue_purge(&neigh->arp_queue);
Eric Dumazet8b5c1712011-11-09 12:07:14 +00001214 neigh->arp_queue_len_bytes = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001215 }
1216out:
1217 if (update_isrouter) {
1218 neigh->flags = (flags & NEIGH_UPDATE_F_ISROUTER) ?
1219 (neigh->flags | NTF_ROUTER) :
1220 (neigh->flags & ~NTF_ROUTER);
1221 }
1222 write_unlock_bh(&neigh->lock);
Tom Tucker8d717402006-07-30 20:43:36 -07001223
1224 if (notify)
Thomas Grafd961db32007-08-08 23:12:56 -07001225 neigh_update_notify(neigh);
1226
Linus Torvalds1da177e2005-04-16 15:20:36 -07001227 return err;
1228}
YOSHIFUJI Hideaki0a204502008-03-24 18:39:10 +09001229EXPORT_SYMBOL(neigh_update);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001230
1231struct neighbour *neigh_event_ns(struct neigh_table *tbl,
1232 u8 *lladdr, void *saddr,
1233 struct net_device *dev)
1234{
1235 struct neighbour *neigh = __neigh_lookup(tbl, saddr, dev,
1236 lladdr || !dev->addr_len);
1237 if (neigh)
YOSHIFUJI Hideaki4ec93ed2007-02-09 23:24:36 +09001238 neigh_update(neigh, lladdr, NUD_STALE,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001239 NEIGH_UPDATE_F_OVERRIDE);
1240 return neigh;
1241}
YOSHIFUJI Hideaki0a204502008-03-24 18:39:10 +09001242EXPORT_SYMBOL(neigh_event_ns);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001243
Eric Dumazet34d101d2010-10-11 09:16:57 -07001244/* called with read_lock_bh(&n->lock); */
David S. Millerf6b72b62011-07-14 07:53:20 -07001245static void neigh_hh_init(struct neighbour *n, struct dst_entry *dst)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001246{
Linus Torvalds1da177e2005-04-16 15:20:36 -07001247 struct net_device *dev = dst->dev;
David S. Millerf6b72b62011-07-14 07:53:20 -07001248 __be16 prot = dst->ops->protocol;
1249 struct hh_cache *hh = &n->hh;
Eric Dumazet0ed8ddf2010-10-07 10:44:07 +00001250
1251 write_lock_bh(&n->lock);
Eric Dumazet34d101d2010-10-11 09:16:57 -07001252
David S. Millerf6b72b62011-07-14 07:53:20 -07001253 /* Only one thread can come in here and initialize the
1254 * hh_cache entry.
1255 */
David S. Millerb23b5452011-07-16 17:45:02 -07001256 if (!hh->hh_len)
1257 dev->header_ops->cache(n, hh, prot);
David S. Millerf6b72b62011-07-14 07:53:20 -07001258
Eric Dumazet0ed8ddf2010-10-07 10:44:07 +00001259 write_unlock_bh(&n->lock);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001260}
1261
1262/* This function can be used in contexts, where only old dev_queue_xmit
Eric Dumazet767e97e2010-10-06 17:49:21 -07001263 * worked, f.e. if you want to override normal output path (eql, shaper),
1264 * but resolution is not made yet.
Linus Torvalds1da177e2005-04-16 15:20:36 -07001265 */
1266
David S. Miller8f40b162011-07-17 13:34:11 -07001267int neigh_compat_output(struct neighbour *neigh, struct sk_buff *skb)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001268{
1269 struct net_device *dev = skb->dev;
1270
Arnaldo Carvalho de Melobbe735e2007-03-10 22:16:10 -03001271 __skb_pull(skb, skb_network_offset(skb));
Linus Torvalds1da177e2005-04-16 15:20:36 -07001272
Stephen Hemminger0c4e8582007-10-09 01:36:32 -07001273 if (dev_hard_header(skb, dev, ntohs(skb->protocol), NULL, NULL,
1274 skb->len) < 0 &&
Stephen Hemminger3b04ddd2007-10-09 01:40:57 -07001275 dev->header_ops->rebuild(skb))
Linus Torvalds1da177e2005-04-16 15:20:36 -07001276 return 0;
1277
1278 return dev_queue_xmit(skb);
1279}
YOSHIFUJI Hideaki0a204502008-03-24 18:39:10 +09001280EXPORT_SYMBOL(neigh_compat_output);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001281
1282/* Slow and careful. */
1283
David S. Miller8f40b162011-07-17 13:34:11 -07001284int neigh_resolve_output(struct neighbour *neigh, struct sk_buff *skb)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001285{
Eric Dumazetadf30902009-06-02 05:19:30 +00001286 struct dst_entry *dst = skb_dst(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001287 int rc = 0;
1288
David S. Miller8f40b162011-07-17 13:34:11 -07001289 if (!dst)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001290 goto discard;
1291
Linus Torvalds1da177e2005-04-16 15:20:36 -07001292 if (!neigh_event_send(neigh, skb)) {
1293 int err;
1294 struct net_device *dev = neigh->dev;
Eric Dumazet0ed8ddf2010-10-07 10:44:07 +00001295 unsigned int seq;
Eric Dumazet34d101d2010-10-11 09:16:57 -07001296
David S. Millerf6b72b62011-07-14 07:53:20 -07001297 if (dev->header_ops->cache && !neigh->hh.hh_len)
1298 neigh_hh_init(neigh, dst);
Eric Dumazet34d101d2010-10-11 09:16:57 -07001299
Eric Dumazet0ed8ddf2010-10-07 10:44:07 +00001300 do {
ramesh.nagappa@gmail.come1f16502012-10-05 19:10:15 +00001301 __skb_pull(skb, skb_network_offset(skb));
Eric Dumazet0ed8ddf2010-10-07 10:44:07 +00001302 seq = read_seqbegin(&neigh->ha_lock);
1303 err = dev_hard_header(skb, dev, ntohs(skb->protocol),
1304 neigh->ha, NULL, skb->len);
1305 } while (read_seqretry(&neigh->ha_lock, seq));
Eric Dumazet34d101d2010-10-11 09:16:57 -07001306
Linus Torvalds1da177e2005-04-16 15:20:36 -07001307 if (err >= 0)
David S. Miller542d4d62011-07-16 18:06:24 -07001308 rc = dev_queue_xmit(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001309 else
1310 goto out_kfree_skb;
1311 }
1312out:
1313 return rc;
1314discard:
Joe Perchesd5d427c2013-04-15 15:17:19 +00001315 neigh_dbg(1, "%s: dst=%p neigh=%p\n", __func__, dst, neigh);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001316out_kfree_skb:
1317 rc = -EINVAL;
1318 kfree_skb(skb);
1319 goto out;
1320}
YOSHIFUJI Hideaki0a204502008-03-24 18:39:10 +09001321EXPORT_SYMBOL(neigh_resolve_output);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001322
1323/* As fast as possible without hh cache */
1324
David S. Miller8f40b162011-07-17 13:34:11 -07001325int neigh_connected_output(struct neighbour *neigh, struct sk_buff *skb)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001326{
Linus Torvalds1da177e2005-04-16 15:20:36 -07001327 struct net_device *dev = neigh->dev;
Eric Dumazet0ed8ddf2010-10-07 10:44:07 +00001328 unsigned int seq;
David S. Miller8f40b162011-07-17 13:34:11 -07001329 int err;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001330
Eric Dumazet0ed8ddf2010-10-07 10:44:07 +00001331 do {
ramesh.nagappa@gmail.come1f16502012-10-05 19:10:15 +00001332 __skb_pull(skb, skb_network_offset(skb));
Eric Dumazet0ed8ddf2010-10-07 10:44:07 +00001333 seq = read_seqbegin(&neigh->ha_lock);
1334 err = dev_hard_header(skb, dev, ntohs(skb->protocol),
1335 neigh->ha, NULL, skb->len);
1336 } while (read_seqretry(&neigh->ha_lock, seq));
1337
Linus Torvalds1da177e2005-04-16 15:20:36 -07001338 if (err >= 0)
David S. Miller542d4d62011-07-16 18:06:24 -07001339 err = dev_queue_xmit(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001340 else {
1341 err = -EINVAL;
1342 kfree_skb(skb);
1343 }
1344 return err;
1345}
YOSHIFUJI Hideaki0a204502008-03-24 18:39:10 +09001346EXPORT_SYMBOL(neigh_connected_output);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001347
/* Output routine that hands @skb straight to dev_queue_xmit(); @neigh
 * is not consulted.
 */
int neigh_direct_output(struct neighbour *neigh, struct sk_buff *skb)
{
	return dev_queue_xmit(skb);
}
1352EXPORT_SYMBOL(neigh_direct_output);
1353
Linus Torvalds1da177e2005-04-16 15:20:36 -07001354static void neigh_proxy_process(unsigned long arg)
1355{
1356 struct neigh_table *tbl = (struct neigh_table *)arg;
1357 long sched_next = 0;
1358 unsigned long now = jiffies;
David S. Millerf72051b2008-09-23 01:11:18 -07001359 struct sk_buff *skb, *n;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001360
1361 spin_lock(&tbl->proxy_queue.lock);
1362
David S. Millerf72051b2008-09-23 01:11:18 -07001363 skb_queue_walk_safe(&tbl->proxy_queue, skb, n) {
1364 long tdif = NEIGH_CB(skb)->sched_next - now;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001365
Linus Torvalds1da177e2005-04-16 15:20:36 -07001366 if (tdif <= 0) {
David S. Millerf72051b2008-09-23 01:11:18 -07001367 struct net_device *dev = skb->dev;
Eric Dumazet20e60742011-08-22 19:32:42 +00001368
David S. Millerf72051b2008-09-23 01:11:18 -07001369 __skb_unlink(skb, &tbl->proxy_queue);
Eric Dumazet20e60742011-08-22 19:32:42 +00001370 if (tbl->proxy_redo && netif_running(dev)) {
1371 rcu_read_lock();
David S. Millerf72051b2008-09-23 01:11:18 -07001372 tbl->proxy_redo(skb);
Eric Dumazet20e60742011-08-22 19:32:42 +00001373 rcu_read_unlock();
1374 } else {
David S. Millerf72051b2008-09-23 01:11:18 -07001375 kfree_skb(skb);
Eric Dumazet20e60742011-08-22 19:32:42 +00001376 }
Linus Torvalds1da177e2005-04-16 15:20:36 -07001377
1378 dev_put(dev);
1379 } else if (!sched_next || tdif < sched_next)
1380 sched_next = tdif;
1381 }
1382 del_timer(&tbl->proxy_timer);
1383 if (sched_next)
1384 mod_timer(&tbl->proxy_timer, jiffies + sched_next);
1385 spin_unlock(&tbl->proxy_queue.lock);
1386}
1387
1388void pneigh_enqueue(struct neigh_table *tbl, struct neigh_parms *p,
1389 struct sk_buff *skb)
1390{
1391 unsigned long now = jiffies;
1392 unsigned long sched_next = now + (net_random() % p->proxy_delay);
1393
1394 if (tbl->proxy_queue.qlen > p->proxy_qlen) {
1395 kfree_skb(skb);
1396 return;
1397 }
Patrick McHardya61bbcf2005-08-14 17:24:31 -07001398
1399 NEIGH_CB(skb)->sched_next = sched_next;
1400 NEIGH_CB(skb)->flags |= LOCALLY_ENQUEUED;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001401
1402 spin_lock(&tbl->proxy_queue.lock);
1403 if (del_timer(&tbl->proxy_timer)) {
1404 if (time_before(tbl->proxy_timer.expires, sched_next))
1405 sched_next = tbl->proxy_timer.expires;
1406 }
Eric Dumazetadf30902009-06-02 05:19:30 +00001407 skb_dst_drop(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001408 dev_hold(skb->dev);
1409 __skb_queue_tail(&tbl->proxy_queue, skb);
1410 mod_timer(&tbl->proxy_timer, sched_next);
1411 spin_unlock(&tbl->proxy_queue.lock);
1412}
YOSHIFUJI Hideaki0a204502008-03-24 18:39:10 +09001413EXPORT_SYMBOL(pneigh_enqueue);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001414
Tobias Klauser97fd5bc2009-07-13 11:17:49 -07001415static inline struct neigh_parms *lookup_neigh_parms(struct neigh_table *tbl,
Eric W. Biederman426b5302008-01-24 00:13:18 -08001416 struct net *net, int ifindex)
1417{
1418 struct neigh_parms *p;
1419
1420 for (p = &tbl->parms; p; p = p->next) {
YOSHIFUJI Hideaki878628f2008-03-26 03:57:35 +09001421 if ((p->dev && p->dev->ifindex == ifindex && net_eq(neigh_parms_net(p), net)) ||
Eric W. Biederman426b5302008-01-24 00:13:18 -08001422 (!p->dev && !ifindex))
1423 return p;
1424 }
1425
1426 return NULL;
1427}
Linus Torvalds1da177e2005-04-16 15:20:36 -07001428
1429struct neigh_parms *neigh_parms_alloc(struct net_device *dev,
1430 struct neigh_table *tbl)
1431{
Eric W. Biederman426b5302008-01-24 00:13:18 -08001432 struct neigh_parms *p, *ref;
Stephen Hemminger00829822008-11-20 20:14:53 -08001433 struct net *net = dev_net(dev);
1434 const struct net_device_ops *ops = dev->netdev_ops;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001435
Tobias Klauser97fd5bc2009-07-13 11:17:49 -07001436 ref = lookup_neigh_parms(tbl, net, 0);
Eric W. Biederman426b5302008-01-24 00:13:18 -08001437 if (!ref)
1438 return NULL;
1439
1440 p = kmemdup(ref, sizeof(*p), GFP_KERNEL);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001441 if (p) {
Linus Torvalds1da177e2005-04-16 15:20:36 -07001442 p->tbl = tbl;
1443 atomic_set(&p->refcnt, 1);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001444 p->reachable_time =
1445 neigh_rand_reach_time(p->base_reachable_time);
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001446
Stephen Hemminger00829822008-11-20 20:14:53 -08001447 if (ops->ndo_neigh_setup && ops->ndo_neigh_setup(dev, p)) {
Denis V. Lunev486b51d2008-01-14 22:59:59 -08001448 kfree(p);
1449 return NULL;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001450 }
Denis V. Lunev486b51d2008-01-14 22:59:59 -08001451
1452 dev_hold(dev);
1453 p->dev = dev;
Eric Dumazete42ea982008-11-12 00:54:54 -08001454 write_pnet(&p->net, hold_net(net));
Linus Torvalds1da177e2005-04-16 15:20:36 -07001455 p->sysctl_table = NULL;
1456 write_lock_bh(&tbl->lock);
1457 p->next = tbl->parms.next;
1458 tbl->parms.next = p;
1459 write_unlock_bh(&tbl->lock);
1460 }
1461 return p;
1462}
YOSHIFUJI Hideaki0a204502008-03-24 18:39:10 +09001463EXPORT_SYMBOL(neigh_parms_alloc);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001464
1465static void neigh_rcu_free_parms(struct rcu_head *head)
1466{
1467 struct neigh_parms *parms =
1468 container_of(head, struct neigh_parms, rcu_head);
1469
1470 neigh_parms_put(parms);
1471}
1472
1473void neigh_parms_release(struct neigh_table *tbl, struct neigh_parms *parms)
1474{
1475 struct neigh_parms **p;
1476
1477 if (!parms || parms == &tbl->parms)
1478 return;
1479 write_lock_bh(&tbl->lock);
1480 for (p = &tbl->parms.next; *p; p = &(*p)->next) {
1481 if (*p == parms) {
1482 *p = parms->next;
1483 parms->dead = 1;
1484 write_unlock_bh(&tbl->lock);
David S. Millercecbb632008-01-20 16:39:03 -08001485 if (parms->dev)
1486 dev_put(parms->dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001487 call_rcu(&parms->rcu_head, neigh_rcu_free_parms);
1488 return;
1489 }
1490 }
1491 write_unlock_bh(&tbl->lock);
Joe Perchesd5d427c2013-04-15 15:17:19 +00001492 neigh_dbg(1, "%s: not found\n", __func__);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001493}
YOSHIFUJI Hideaki0a204502008-03-24 18:39:10 +09001494EXPORT_SYMBOL(neigh_parms_release);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001495
/* Release the namespace reference recorded in @parms and free it. */
static void neigh_parms_destroy(struct neigh_parms *parms)
{
	struct net *net = neigh_parms_net(parms);

	release_net(net);
	kfree(parms);
}
1501
Pavel Emelianovc2ecba72007-04-17 12:45:31 -07001502static struct lock_class_key neigh_table_proxy_queue_class;
1503
Hiroaki SHIMODAdcd2ba92012-04-13 07:34:44 +00001504static void neigh_table_init_no_netlink(struct neigh_table *tbl)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001505{
1506 unsigned long now = jiffies;
1507 unsigned long phsize;
1508
Eric Dumazete42ea982008-11-12 00:54:54 -08001509 write_pnet(&tbl->parms.net, &init_net);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001510 atomic_set(&tbl->parms.refcnt, 1);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001511 tbl->parms.reachable_time =
1512 neigh_rand_reach_time(tbl->parms.base_reachable_time);
1513
Linus Torvalds1da177e2005-04-16 15:20:36 -07001514 tbl->stats = alloc_percpu(struct neigh_statistics);
1515 if (!tbl->stats)
1516 panic("cannot create neighbour cache statistics");
YOSHIFUJI Hideaki4ec93ed2007-02-09 23:24:36 +09001517
Linus Torvalds1da177e2005-04-16 15:20:36 -07001518#ifdef CONFIG_PROC_FS
Alexey Dobriyan9b739ba2008-11-11 16:47:44 -08001519 if (!proc_create_data(tbl->id, 0, init_net.proc_net_stat,
1520 &neigh_stat_seq_fops, tbl))
Linus Torvalds1da177e2005-04-16 15:20:36 -07001521 panic("cannot create neighbour proc dir entry");
Linus Torvalds1da177e2005-04-16 15:20:36 -07001522#endif
1523
David S. Millercd089332011-07-11 01:28:12 -07001524 RCU_INIT_POINTER(tbl->nht, neigh_hash_alloc(3));
Linus Torvalds1da177e2005-04-16 15:20:36 -07001525
1526 phsize = (PNEIGH_HASHMASK + 1) * sizeof(struct pneigh_entry *);
Andrew Morton77d04bd2006-04-07 14:52:59 -07001527 tbl->phash_buckets = kzalloc(phsize, GFP_KERNEL);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001528
Eric Dumazetd6bf7812010-10-04 06:15:44 +00001529 if (!tbl->nht || !tbl->phash_buckets)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001530 panic("cannot allocate neighbour cache hashes");
1531
YOSHIFUJI Hideaki / 吉藤英明08433ef2013-01-24 00:44:23 +00001532 if (!tbl->entry_size)
1533 tbl->entry_size = ALIGN(offsetof(struct neighbour, primary_key) +
1534 tbl->key_len, NEIGH_PRIV_ALIGN);
1535 else
1536 WARN_ON(tbl->entry_size % NEIGH_PRIV_ALIGN);
1537
Linus Torvalds1da177e2005-04-16 15:20:36 -07001538 rwlock_init(&tbl->lock);
Tejun Heo203b42f2012-08-21 13:18:23 -07001539 INIT_DEFERRABLE_WORK(&tbl->gc_work, neigh_periodic_work);
Eric Dumazete4c4e442009-07-30 03:15:07 +00001540 schedule_delayed_work(&tbl->gc_work, tbl->parms.reachable_time);
Pavel Emelyanovb24b8a22008-01-23 21:20:07 -08001541 setup_timer(&tbl->proxy_timer, neigh_proxy_process, (unsigned long)tbl);
Pavel Emelianovc2ecba72007-04-17 12:45:31 -07001542 skb_queue_head_init_class(&tbl->proxy_queue,
1543 &neigh_table_proxy_queue_class);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001544
1545 tbl->last_flush = now;
1546 tbl->last_rand = now + tbl->parms.reachable_time * 20;
Simon Kelleybd89efc2006-05-12 14:56:08 -07001547}
1548
1549void neigh_table_init(struct neigh_table *tbl)
1550{
1551 struct neigh_table *tmp;
1552
1553 neigh_table_init_no_netlink(tbl);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001554 write_lock(&neigh_tbl_lock);
Simon Kelleybd89efc2006-05-12 14:56:08 -07001555 for (tmp = neigh_tables; tmp; tmp = tmp->next) {
1556 if (tmp->family == tbl->family)
1557 break;
1558 }
Linus Torvalds1da177e2005-04-16 15:20:36 -07001559 tbl->next = neigh_tables;
1560 neigh_tables = tbl;
1561 write_unlock(&neigh_tbl_lock);
Simon Kelleybd89efc2006-05-12 14:56:08 -07001562
1563 if (unlikely(tmp)) {
Joe Perchese005d192012-05-16 19:58:40 +00001564 pr_err("Registering multiple tables for family %d\n",
1565 tbl->family);
Simon Kelleybd89efc2006-05-12 14:56:08 -07001566 dump_stack();
1567 }
Linus Torvalds1da177e2005-04-16 15:20:36 -07001568}
YOSHIFUJI Hideaki0a204502008-03-24 18:39:10 +09001569EXPORT_SYMBOL(neigh_table_init);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001570
1571int neigh_table_clear(struct neigh_table *tbl)
1572{
1573 struct neigh_table **tp;
1574
1575 /* It is not clean... Fix it to unload IPv6 module safely */
Tejun Heoa5c30b32010-10-19 06:04:42 +00001576 cancel_delayed_work_sync(&tbl->gc_work);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001577 del_timer_sync(&tbl->proxy_timer);
1578 pneigh_queue_purge(&tbl->proxy_queue);
1579 neigh_ifdown(tbl, NULL);
1580 if (atomic_read(&tbl->entries))
Joe Perchese005d192012-05-16 19:58:40 +00001581 pr_crit("neighbour leakage\n");
Linus Torvalds1da177e2005-04-16 15:20:36 -07001582 write_lock(&neigh_tbl_lock);
1583 for (tp = &neigh_tables; *tp; tp = &(*tp)->next) {
1584 if (*tp == tbl) {
1585 *tp = tbl->next;
1586 break;
1587 }
1588 }
1589 write_unlock(&neigh_tbl_lock);
1590
Eric Dumazet6193d2b2011-01-19 22:02:47 +00001591 call_rcu(&rcu_dereference_protected(tbl->nht, 1)->rcu,
1592 neigh_hash_free_rcu);
Eric Dumazetd6bf7812010-10-04 06:15:44 +00001593 tbl->nht = NULL;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001594
1595 kfree(tbl->phash_buckets);
1596 tbl->phash_buckets = NULL;
1597
Alexey Dobriyan3f192b52007-11-05 21:28:13 -08001598 remove_proc_entry(tbl->id, init_net.proc_net_stat);
1599
Kirill Korotaev3fcde742006-09-01 01:34:10 -07001600 free_percpu(tbl->stats);
1601 tbl->stats = NULL;
1602
Linus Torvalds1da177e2005-04-16 15:20:36 -07001603 return 0;
1604}
YOSHIFUJI Hideaki0a204502008-03-24 18:39:10 +09001605EXPORT_SYMBOL(neigh_table_clear);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001606
Thomas Graf661d2962013-03-21 07:45:29 +00001607static int neigh_delete(struct sk_buff *skb, struct nlmsghdr *nlh)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001608{
YOSHIFUJI Hideaki3b1e0a62008-03-26 02:26:21 +09001609 struct net *net = sock_net(skb->sk);
Thomas Grafa14a49d2006-08-07 17:53:08 -07001610 struct ndmsg *ndm;
1611 struct nlattr *dst_attr;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001612 struct neigh_table *tbl;
1613 struct net_device *dev = NULL;
Thomas Grafa14a49d2006-08-07 17:53:08 -07001614 int err = -EINVAL;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001615
Eric Dumazet110b2492010-10-04 04:27:36 +00001616 ASSERT_RTNL();
Thomas Grafa14a49d2006-08-07 17:53:08 -07001617 if (nlmsg_len(nlh) < sizeof(*ndm))
Linus Torvalds1da177e2005-04-16 15:20:36 -07001618 goto out;
1619
Thomas Grafa14a49d2006-08-07 17:53:08 -07001620 dst_attr = nlmsg_find_attr(nlh, sizeof(*ndm), NDA_DST);
1621 if (dst_attr == NULL)
1622 goto out;
1623
1624 ndm = nlmsg_data(nlh);
1625 if (ndm->ndm_ifindex) {
Eric Dumazet110b2492010-10-04 04:27:36 +00001626 dev = __dev_get_by_index(net, ndm->ndm_ifindex);
Thomas Grafa14a49d2006-08-07 17:53:08 -07001627 if (dev == NULL) {
1628 err = -ENODEV;
1629 goto out;
1630 }
1631 }
1632
Linus Torvalds1da177e2005-04-16 15:20:36 -07001633 read_lock(&neigh_tbl_lock);
1634 for (tbl = neigh_tables; tbl; tbl = tbl->next) {
Thomas Grafa14a49d2006-08-07 17:53:08 -07001635 struct neighbour *neigh;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001636
1637 if (tbl->family != ndm->ndm_family)
1638 continue;
1639 read_unlock(&neigh_tbl_lock);
1640
Thomas Grafa14a49d2006-08-07 17:53:08 -07001641 if (nla_len(dst_attr) < tbl->key_len)
Eric Dumazet110b2492010-10-04 04:27:36 +00001642 goto out;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001643
1644 if (ndm->ndm_flags & NTF_PROXY) {
Eric W. Biederman426b5302008-01-24 00:13:18 -08001645 err = pneigh_delete(tbl, net, nla_data(dst_attr), dev);
Eric Dumazet110b2492010-10-04 04:27:36 +00001646 goto out;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001647 }
1648
Thomas Grafa14a49d2006-08-07 17:53:08 -07001649 if (dev == NULL)
Eric Dumazet110b2492010-10-04 04:27:36 +00001650 goto out;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001651
Thomas Grafa14a49d2006-08-07 17:53:08 -07001652 neigh = neigh_lookup(tbl, nla_data(dst_attr), dev);
1653 if (neigh == NULL) {
1654 err = -ENOENT;
Eric Dumazet110b2492010-10-04 04:27:36 +00001655 goto out;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001656 }
Thomas Grafa14a49d2006-08-07 17:53:08 -07001657
1658 err = neigh_update(neigh, NULL, NUD_FAILED,
1659 NEIGH_UPDATE_F_OVERRIDE |
1660 NEIGH_UPDATE_F_ADMIN);
1661 neigh_release(neigh);
Eric Dumazet110b2492010-10-04 04:27:36 +00001662 goto out;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001663 }
1664 read_unlock(&neigh_tbl_lock);
Thomas Grafa14a49d2006-08-07 17:53:08 -07001665 err = -EAFNOSUPPORT;
1666
Linus Torvalds1da177e2005-04-16 15:20:36 -07001667out:
1668 return err;
1669}
1670
Thomas Graf661d2962013-03-21 07:45:29 +00001671static int neigh_add(struct sk_buff *skb, struct nlmsghdr *nlh)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001672{
YOSHIFUJI Hideaki3b1e0a62008-03-26 02:26:21 +09001673 struct net *net = sock_net(skb->sk);
Thomas Graf5208deb2006-08-07 17:55:40 -07001674 struct ndmsg *ndm;
1675 struct nlattr *tb[NDA_MAX+1];
Linus Torvalds1da177e2005-04-16 15:20:36 -07001676 struct neigh_table *tbl;
1677 struct net_device *dev = NULL;
Thomas Graf5208deb2006-08-07 17:55:40 -07001678 int err;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001679
Eric Dumazet110b2492010-10-04 04:27:36 +00001680 ASSERT_RTNL();
Thomas Graf5208deb2006-08-07 17:55:40 -07001681 err = nlmsg_parse(nlh, sizeof(*ndm), tb, NDA_MAX, NULL);
1682 if (err < 0)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001683 goto out;
1684
Thomas Graf5208deb2006-08-07 17:55:40 -07001685 err = -EINVAL;
1686 if (tb[NDA_DST] == NULL)
1687 goto out;
1688
1689 ndm = nlmsg_data(nlh);
1690 if (ndm->ndm_ifindex) {
Eric Dumazet110b2492010-10-04 04:27:36 +00001691 dev = __dev_get_by_index(net, ndm->ndm_ifindex);
Thomas Graf5208deb2006-08-07 17:55:40 -07001692 if (dev == NULL) {
1693 err = -ENODEV;
1694 goto out;
1695 }
1696
1697 if (tb[NDA_LLADDR] && nla_len(tb[NDA_LLADDR]) < dev->addr_len)
Eric Dumazet110b2492010-10-04 04:27:36 +00001698 goto out;
Thomas Graf5208deb2006-08-07 17:55:40 -07001699 }
1700
Linus Torvalds1da177e2005-04-16 15:20:36 -07001701 read_lock(&neigh_tbl_lock);
1702 for (tbl = neigh_tables; tbl; tbl = tbl->next) {
Thomas Graf5208deb2006-08-07 17:55:40 -07001703 int flags = NEIGH_UPDATE_F_ADMIN | NEIGH_UPDATE_F_OVERRIDE;
1704 struct neighbour *neigh;
1705 void *dst, *lladdr;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001706
1707 if (tbl->family != ndm->ndm_family)
1708 continue;
1709 read_unlock(&neigh_tbl_lock);
1710
Thomas Graf5208deb2006-08-07 17:55:40 -07001711 if (nla_len(tb[NDA_DST]) < tbl->key_len)
Eric Dumazet110b2492010-10-04 04:27:36 +00001712 goto out;
Thomas Graf5208deb2006-08-07 17:55:40 -07001713 dst = nla_data(tb[NDA_DST]);
1714 lladdr = tb[NDA_LLADDR] ? nla_data(tb[NDA_LLADDR]) : NULL;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001715
1716 if (ndm->ndm_flags & NTF_PROXY) {
Ville Nuorvala62dd9312006-09-22 14:43:19 -07001717 struct pneigh_entry *pn;
1718
1719 err = -ENOBUFS;
Eric W. Biederman426b5302008-01-24 00:13:18 -08001720 pn = pneigh_lookup(tbl, net, dst, dev, 1);
Ville Nuorvala62dd9312006-09-22 14:43:19 -07001721 if (pn) {
1722 pn->flags = ndm->ndm_flags;
1723 err = 0;
1724 }
Eric Dumazet110b2492010-10-04 04:27:36 +00001725 goto out;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001726 }
1727
Thomas Graf5208deb2006-08-07 17:55:40 -07001728 if (dev == NULL)
Eric Dumazet110b2492010-10-04 04:27:36 +00001729 goto out;
Thomas Graf5208deb2006-08-07 17:55:40 -07001730
1731 neigh = neigh_lookup(tbl, dst, dev);
1732 if (neigh == NULL) {
1733 if (!(nlh->nlmsg_flags & NLM_F_CREATE)) {
1734 err = -ENOENT;
Eric Dumazet110b2492010-10-04 04:27:36 +00001735 goto out;
Thomas Graf5208deb2006-08-07 17:55:40 -07001736 }
YOSHIFUJI Hideaki4ec93ed2007-02-09 23:24:36 +09001737
Thomas Graf5208deb2006-08-07 17:55:40 -07001738 neigh = __neigh_lookup_errno(tbl, dst, dev);
1739 if (IS_ERR(neigh)) {
1740 err = PTR_ERR(neigh);
Eric Dumazet110b2492010-10-04 04:27:36 +00001741 goto out;
Thomas Graf5208deb2006-08-07 17:55:40 -07001742 }
1743 } else {
Linus Torvalds1da177e2005-04-16 15:20:36 -07001744 if (nlh->nlmsg_flags & NLM_F_EXCL) {
1745 err = -EEXIST;
Thomas Graf5208deb2006-08-07 17:55:40 -07001746 neigh_release(neigh);
Eric Dumazet110b2492010-10-04 04:27:36 +00001747 goto out;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001748 }
Thomas Graf5208deb2006-08-07 17:55:40 -07001749
1750 if (!(nlh->nlmsg_flags & NLM_F_REPLACE))
1751 flags &= ~NEIGH_UPDATE_F_OVERRIDE;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001752 }
1753
Eric Biederman0c5c2d32009-03-04 00:03:08 -08001754 if (ndm->ndm_flags & NTF_USE) {
1755 neigh_event_send(neigh, NULL);
1756 err = 0;
1757 } else
1758 err = neigh_update(neigh, lladdr, ndm->ndm_state, flags);
Thomas Graf5208deb2006-08-07 17:55:40 -07001759 neigh_release(neigh);
Eric Dumazet110b2492010-10-04 04:27:36 +00001760 goto out;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001761 }
1762
1763 read_unlock(&neigh_tbl_lock);
Thomas Graf5208deb2006-08-07 17:55:40 -07001764 err = -EAFNOSUPPORT;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001765out:
1766 return err;
1767}
1768
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001769static int neightbl_fill_parms(struct sk_buff *skb, struct neigh_parms *parms)
1770{
Thomas Grafca860fb2006-08-07 18:00:18 -07001771 struct nlattr *nest;
1772
1773 nest = nla_nest_start(skb, NDTA_PARMS);
1774 if (nest == NULL)
1775 return -ENOBUFS;
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001776
David S. Miller9a6308d2012-04-01 20:06:28 -04001777 if ((parms->dev &&
1778 nla_put_u32(skb, NDTPA_IFINDEX, parms->dev->ifindex)) ||
1779 nla_put_u32(skb, NDTPA_REFCNT, atomic_read(&parms->refcnt)) ||
1780 nla_put_u32(skb, NDTPA_QUEUE_LENBYTES, parms->queue_len_bytes) ||
1781 /* approximative value for deprecated QUEUE_LEN (in packets) */
1782 nla_put_u32(skb, NDTPA_QUEUE_LEN,
Shan Weice46cc62012-12-04 18:49:15 +00001783 parms->queue_len_bytes / SKB_TRUESIZE(ETH_FRAME_LEN)) ||
David S. Miller9a6308d2012-04-01 20:06:28 -04001784 nla_put_u32(skb, NDTPA_PROXY_QLEN, parms->proxy_qlen) ||
1785 nla_put_u32(skb, NDTPA_APP_PROBES, parms->app_probes) ||
1786 nla_put_u32(skb, NDTPA_UCAST_PROBES, parms->ucast_probes) ||
1787 nla_put_u32(skb, NDTPA_MCAST_PROBES, parms->mcast_probes) ||
1788 nla_put_msecs(skb, NDTPA_REACHABLE_TIME, parms->reachable_time) ||
1789 nla_put_msecs(skb, NDTPA_BASE_REACHABLE_TIME,
1790 parms->base_reachable_time) ||
1791 nla_put_msecs(skb, NDTPA_GC_STALETIME, parms->gc_staletime) ||
1792 nla_put_msecs(skb, NDTPA_DELAY_PROBE_TIME,
1793 parms->delay_probe_time) ||
1794 nla_put_msecs(skb, NDTPA_RETRANS_TIME, parms->retrans_time) ||
1795 nla_put_msecs(skb, NDTPA_ANYCAST_DELAY, parms->anycast_delay) ||
1796 nla_put_msecs(skb, NDTPA_PROXY_DELAY, parms->proxy_delay) ||
1797 nla_put_msecs(skb, NDTPA_LOCKTIME, parms->locktime))
1798 goto nla_put_failure;
Thomas Grafca860fb2006-08-07 18:00:18 -07001799 return nla_nest_end(skb, nest);
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001800
Thomas Grafca860fb2006-08-07 18:00:18 -07001801nla_put_failure:
Thomas Grafbc3ed282008-06-03 16:36:54 -07001802 nla_nest_cancel(skb, nest);
1803 return -EMSGSIZE;
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001804}
1805
Thomas Grafca860fb2006-08-07 18:00:18 -07001806static int neightbl_fill_info(struct sk_buff *skb, struct neigh_table *tbl,
1807 u32 pid, u32 seq, int type, int flags)
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001808{
1809 struct nlmsghdr *nlh;
1810 struct ndtmsg *ndtmsg;
1811
Thomas Grafca860fb2006-08-07 18:00:18 -07001812 nlh = nlmsg_put(skb, pid, seq, type, sizeof(*ndtmsg), flags);
1813 if (nlh == NULL)
Patrick McHardy26932562007-01-31 23:16:40 -08001814 return -EMSGSIZE;
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001815
Thomas Grafca860fb2006-08-07 18:00:18 -07001816 ndtmsg = nlmsg_data(nlh);
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001817
1818 read_lock_bh(&tbl->lock);
1819 ndtmsg->ndtm_family = tbl->family;
Patrick McHardy9ef1d4c2005-06-28 12:55:30 -07001820 ndtmsg->ndtm_pad1 = 0;
1821 ndtmsg->ndtm_pad2 = 0;
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001822
David S. Miller9a6308d2012-04-01 20:06:28 -04001823 if (nla_put_string(skb, NDTA_NAME, tbl->id) ||
1824 nla_put_msecs(skb, NDTA_GC_INTERVAL, tbl->gc_interval) ||
1825 nla_put_u32(skb, NDTA_THRESH1, tbl->gc_thresh1) ||
1826 nla_put_u32(skb, NDTA_THRESH2, tbl->gc_thresh2) ||
1827 nla_put_u32(skb, NDTA_THRESH3, tbl->gc_thresh3))
1828 goto nla_put_failure;
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001829 {
1830 unsigned long now = jiffies;
1831 unsigned int flush_delta = now - tbl->last_flush;
1832 unsigned int rand_delta = now - tbl->last_rand;
Eric Dumazetd6bf7812010-10-04 06:15:44 +00001833 struct neigh_hash_table *nht;
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001834 struct ndt_config ndc = {
1835 .ndtc_key_len = tbl->key_len,
1836 .ndtc_entry_size = tbl->entry_size,
1837 .ndtc_entries = atomic_read(&tbl->entries),
1838 .ndtc_last_flush = jiffies_to_msecs(flush_delta),
1839 .ndtc_last_rand = jiffies_to_msecs(rand_delta),
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001840 .ndtc_proxy_qlen = tbl->proxy_queue.qlen,
1841 };
1842
Eric Dumazetd6bf7812010-10-04 06:15:44 +00001843 rcu_read_lock_bh();
1844 nht = rcu_dereference_bh(tbl->nht);
David S. Miller2c2aba62011-12-28 15:06:58 -05001845 ndc.ndtc_hash_rnd = nht->hash_rnd[0];
David S. Millercd089332011-07-11 01:28:12 -07001846 ndc.ndtc_hash_mask = ((1 << nht->hash_shift) - 1);
Eric Dumazetd6bf7812010-10-04 06:15:44 +00001847 rcu_read_unlock_bh();
1848
David S. Miller9a6308d2012-04-01 20:06:28 -04001849 if (nla_put(skb, NDTA_CONFIG, sizeof(ndc), &ndc))
1850 goto nla_put_failure;
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001851 }
1852
1853 {
1854 int cpu;
1855 struct ndt_stats ndst;
1856
1857 memset(&ndst, 0, sizeof(ndst));
1858
KAMEZAWA Hiroyuki6f912042006-04-10 22:52:50 -07001859 for_each_possible_cpu(cpu) {
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001860 struct neigh_statistics *st;
1861
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001862 st = per_cpu_ptr(tbl->stats, cpu);
1863 ndst.ndts_allocs += st->allocs;
1864 ndst.ndts_destroys += st->destroys;
1865 ndst.ndts_hash_grows += st->hash_grows;
1866 ndst.ndts_res_failed += st->res_failed;
1867 ndst.ndts_lookups += st->lookups;
1868 ndst.ndts_hits += st->hits;
1869 ndst.ndts_rcv_probes_mcast += st->rcv_probes_mcast;
1870 ndst.ndts_rcv_probes_ucast += st->rcv_probes_ucast;
1871 ndst.ndts_periodic_gc_runs += st->periodic_gc_runs;
1872 ndst.ndts_forced_gc_runs += st->forced_gc_runs;
1873 }
1874
David S. Miller9a6308d2012-04-01 20:06:28 -04001875 if (nla_put(skb, NDTA_STATS, sizeof(ndst), &ndst))
1876 goto nla_put_failure;
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001877 }
1878
1879 BUG_ON(tbl->parms.dev);
1880 if (neightbl_fill_parms(skb, &tbl->parms) < 0)
Thomas Grafca860fb2006-08-07 18:00:18 -07001881 goto nla_put_failure;
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001882
1883 read_unlock_bh(&tbl->lock);
Thomas Grafca860fb2006-08-07 18:00:18 -07001884 return nlmsg_end(skb, nlh);
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001885
Thomas Grafca860fb2006-08-07 18:00:18 -07001886nla_put_failure:
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001887 read_unlock_bh(&tbl->lock);
Patrick McHardy26932562007-01-31 23:16:40 -08001888 nlmsg_cancel(skb, nlh);
1889 return -EMSGSIZE;
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001890}
1891
Thomas Grafca860fb2006-08-07 18:00:18 -07001892static int neightbl_fill_param_info(struct sk_buff *skb,
1893 struct neigh_table *tbl,
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001894 struct neigh_parms *parms,
Thomas Grafca860fb2006-08-07 18:00:18 -07001895 u32 pid, u32 seq, int type,
1896 unsigned int flags)
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001897{
1898 struct ndtmsg *ndtmsg;
1899 struct nlmsghdr *nlh;
1900
Thomas Grafca860fb2006-08-07 18:00:18 -07001901 nlh = nlmsg_put(skb, pid, seq, type, sizeof(*ndtmsg), flags);
1902 if (nlh == NULL)
Patrick McHardy26932562007-01-31 23:16:40 -08001903 return -EMSGSIZE;
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001904
Thomas Grafca860fb2006-08-07 18:00:18 -07001905 ndtmsg = nlmsg_data(nlh);
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001906
1907 read_lock_bh(&tbl->lock);
1908 ndtmsg->ndtm_family = tbl->family;
Patrick McHardy9ef1d4c2005-06-28 12:55:30 -07001909 ndtmsg->ndtm_pad1 = 0;
1910 ndtmsg->ndtm_pad2 = 0;
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001911
Thomas Grafca860fb2006-08-07 18:00:18 -07001912 if (nla_put_string(skb, NDTA_NAME, tbl->id) < 0 ||
1913 neightbl_fill_parms(skb, parms) < 0)
1914 goto errout;
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001915
1916 read_unlock_bh(&tbl->lock);
Thomas Grafca860fb2006-08-07 18:00:18 -07001917 return nlmsg_end(skb, nlh);
1918errout:
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001919 read_unlock_bh(&tbl->lock);
Patrick McHardy26932562007-01-31 23:16:40 -08001920 nlmsg_cancel(skb, nlh);
1921 return -EMSGSIZE;
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001922}
YOSHIFUJI Hideaki4ec93ed2007-02-09 23:24:36 +09001923
Patrick McHardyef7c79e2007-06-05 12:38:30 -07001924static const struct nla_policy nl_neightbl_policy[NDTA_MAX+1] = {
Thomas Graf6b3f8672006-08-07 17:58:53 -07001925 [NDTA_NAME] = { .type = NLA_STRING },
1926 [NDTA_THRESH1] = { .type = NLA_U32 },
1927 [NDTA_THRESH2] = { .type = NLA_U32 },
1928 [NDTA_THRESH3] = { .type = NLA_U32 },
1929 [NDTA_GC_INTERVAL] = { .type = NLA_U64 },
1930 [NDTA_PARMS] = { .type = NLA_NESTED },
1931};
1932
Patrick McHardyef7c79e2007-06-05 12:38:30 -07001933static const struct nla_policy nl_ntbl_parm_policy[NDTPA_MAX+1] = {
Thomas Graf6b3f8672006-08-07 17:58:53 -07001934 [NDTPA_IFINDEX] = { .type = NLA_U32 },
1935 [NDTPA_QUEUE_LEN] = { .type = NLA_U32 },
1936 [NDTPA_PROXY_QLEN] = { .type = NLA_U32 },
1937 [NDTPA_APP_PROBES] = { .type = NLA_U32 },
1938 [NDTPA_UCAST_PROBES] = { .type = NLA_U32 },
1939 [NDTPA_MCAST_PROBES] = { .type = NLA_U32 },
1940 [NDTPA_BASE_REACHABLE_TIME] = { .type = NLA_U64 },
1941 [NDTPA_GC_STALETIME] = { .type = NLA_U64 },
1942 [NDTPA_DELAY_PROBE_TIME] = { .type = NLA_U64 },
1943 [NDTPA_RETRANS_TIME] = { .type = NLA_U64 },
1944 [NDTPA_ANYCAST_DELAY] = { .type = NLA_U64 },
1945 [NDTPA_PROXY_DELAY] = { .type = NLA_U64 },
1946 [NDTPA_LOCKTIME] = { .type = NLA_U64 },
1947};
1948
Thomas Graf661d2962013-03-21 07:45:29 +00001949static int neightbl_set(struct sk_buff *skb, struct nlmsghdr *nlh)
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001950{
YOSHIFUJI Hideaki3b1e0a62008-03-26 02:26:21 +09001951 struct net *net = sock_net(skb->sk);
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001952 struct neigh_table *tbl;
Thomas Graf6b3f8672006-08-07 17:58:53 -07001953 struct ndtmsg *ndtmsg;
1954 struct nlattr *tb[NDTA_MAX+1];
1955 int err;
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001956
Thomas Graf6b3f8672006-08-07 17:58:53 -07001957 err = nlmsg_parse(nlh, sizeof(*ndtmsg), tb, NDTA_MAX,
1958 nl_neightbl_policy);
1959 if (err < 0)
1960 goto errout;
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001961
Thomas Graf6b3f8672006-08-07 17:58:53 -07001962 if (tb[NDTA_NAME] == NULL) {
1963 err = -EINVAL;
1964 goto errout;
1965 }
1966
1967 ndtmsg = nlmsg_data(nlh);
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001968 read_lock(&neigh_tbl_lock);
1969 for (tbl = neigh_tables; tbl; tbl = tbl->next) {
1970 if (ndtmsg->ndtm_family && tbl->family != ndtmsg->ndtm_family)
1971 continue;
1972
Thomas Graf6b3f8672006-08-07 17:58:53 -07001973 if (nla_strcmp(tb[NDTA_NAME], tbl->id) == 0)
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001974 break;
1975 }
1976
1977 if (tbl == NULL) {
1978 err = -ENOENT;
Thomas Graf6b3f8672006-08-07 17:58:53 -07001979 goto errout_locked;
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001980 }
1981
YOSHIFUJI Hideaki4ec93ed2007-02-09 23:24:36 +09001982 /*
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001983 * We acquire tbl->lock to be nice to the periodic timers and
1984 * make sure they always see a consistent set of values.
1985 */
1986 write_lock_bh(&tbl->lock);
1987
Thomas Graf6b3f8672006-08-07 17:58:53 -07001988 if (tb[NDTA_PARMS]) {
1989 struct nlattr *tbp[NDTPA_MAX+1];
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001990 struct neigh_parms *p;
Thomas Graf6b3f8672006-08-07 17:58:53 -07001991 int i, ifindex = 0;
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001992
Thomas Graf6b3f8672006-08-07 17:58:53 -07001993 err = nla_parse_nested(tbp, NDTPA_MAX, tb[NDTA_PARMS],
1994 nl_ntbl_parm_policy);
1995 if (err < 0)
1996 goto errout_tbl_lock;
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001997
Thomas Graf6b3f8672006-08-07 17:58:53 -07001998 if (tbp[NDTPA_IFINDEX])
1999 ifindex = nla_get_u32(tbp[NDTPA_IFINDEX]);
Thomas Grafc7fb64d2005-06-18 22:50:55 -07002000
Tobias Klauser97fd5bc2009-07-13 11:17:49 -07002001 p = lookup_neigh_parms(tbl, net, ifindex);
Thomas Grafc7fb64d2005-06-18 22:50:55 -07002002 if (p == NULL) {
2003 err = -ENOENT;
Thomas Graf6b3f8672006-08-07 17:58:53 -07002004 goto errout_tbl_lock;
Thomas Grafc7fb64d2005-06-18 22:50:55 -07002005 }
Thomas Grafc7fb64d2005-06-18 22:50:55 -07002006
Thomas Graf6b3f8672006-08-07 17:58:53 -07002007 for (i = 1; i <= NDTPA_MAX; i++) {
2008 if (tbp[i] == NULL)
2009 continue;
Thomas Grafc7fb64d2005-06-18 22:50:55 -07002010
Thomas Graf6b3f8672006-08-07 17:58:53 -07002011 switch (i) {
2012 case NDTPA_QUEUE_LEN:
Eric Dumazet8b5c1712011-11-09 12:07:14 +00002013 p->queue_len_bytes = nla_get_u32(tbp[i]) *
2014 SKB_TRUESIZE(ETH_FRAME_LEN);
2015 break;
2016 case NDTPA_QUEUE_LENBYTES:
2017 p->queue_len_bytes = nla_get_u32(tbp[i]);
Thomas Graf6b3f8672006-08-07 17:58:53 -07002018 break;
2019 case NDTPA_PROXY_QLEN:
2020 p->proxy_qlen = nla_get_u32(tbp[i]);
2021 break;
2022 case NDTPA_APP_PROBES:
2023 p->app_probes = nla_get_u32(tbp[i]);
2024 break;
2025 case NDTPA_UCAST_PROBES:
2026 p->ucast_probes = nla_get_u32(tbp[i]);
2027 break;
2028 case NDTPA_MCAST_PROBES:
2029 p->mcast_probes = nla_get_u32(tbp[i]);
2030 break;
2031 case NDTPA_BASE_REACHABLE_TIME:
2032 p->base_reachable_time = nla_get_msecs(tbp[i]);
2033 break;
2034 case NDTPA_GC_STALETIME:
2035 p->gc_staletime = nla_get_msecs(tbp[i]);
2036 break;
2037 case NDTPA_DELAY_PROBE_TIME:
2038 p->delay_probe_time = nla_get_msecs(tbp[i]);
2039 break;
2040 case NDTPA_RETRANS_TIME:
2041 p->retrans_time = nla_get_msecs(tbp[i]);
2042 break;
2043 case NDTPA_ANYCAST_DELAY:
2044 p->anycast_delay = nla_get_msecs(tbp[i]);
2045 break;
2046 case NDTPA_PROXY_DELAY:
2047 p->proxy_delay = nla_get_msecs(tbp[i]);
2048 break;
2049 case NDTPA_LOCKTIME:
2050 p->locktime = nla_get_msecs(tbp[i]);
2051 break;
2052 }
2053 }
Thomas Grafc7fb64d2005-06-18 22:50:55 -07002054 }
2055
Thomas Graf6b3f8672006-08-07 17:58:53 -07002056 if (tb[NDTA_THRESH1])
2057 tbl->gc_thresh1 = nla_get_u32(tb[NDTA_THRESH1]);
2058
2059 if (tb[NDTA_THRESH2])
2060 tbl->gc_thresh2 = nla_get_u32(tb[NDTA_THRESH2]);
2061
2062 if (tb[NDTA_THRESH3])
2063 tbl->gc_thresh3 = nla_get_u32(tb[NDTA_THRESH3]);
2064
2065 if (tb[NDTA_GC_INTERVAL])
2066 tbl->gc_interval = nla_get_msecs(tb[NDTA_GC_INTERVAL]);
2067
Thomas Grafc7fb64d2005-06-18 22:50:55 -07002068 err = 0;
2069
Thomas Graf6b3f8672006-08-07 17:58:53 -07002070errout_tbl_lock:
Thomas Grafc7fb64d2005-06-18 22:50:55 -07002071 write_unlock_bh(&tbl->lock);
Thomas Graf6b3f8672006-08-07 17:58:53 -07002072errout_locked:
Thomas Grafc7fb64d2005-06-18 22:50:55 -07002073 read_unlock(&neigh_tbl_lock);
Thomas Graf6b3f8672006-08-07 17:58:53 -07002074errout:
Thomas Grafc7fb64d2005-06-18 22:50:55 -07002075 return err;
2076}
2077
Thomas Grafc8822a42007-03-22 11:50:06 -07002078static int neightbl_dump_info(struct sk_buff *skb, struct netlink_callback *cb)
Thomas Grafc7fb64d2005-06-18 22:50:55 -07002079{
YOSHIFUJI Hideaki3b1e0a62008-03-26 02:26:21 +09002080 struct net *net = sock_net(skb->sk);
Thomas Grafca860fb2006-08-07 18:00:18 -07002081 int family, tidx, nidx = 0;
2082 int tbl_skip = cb->args[0];
2083 int neigh_skip = cb->args[1];
Thomas Grafc7fb64d2005-06-18 22:50:55 -07002084 struct neigh_table *tbl;
2085
Thomas Grafca860fb2006-08-07 18:00:18 -07002086 family = ((struct rtgenmsg *) nlmsg_data(cb->nlh))->rtgen_family;
Thomas Grafc7fb64d2005-06-18 22:50:55 -07002087
2088 read_lock(&neigh_tbl_lock);
Thomas Grafca860fb2006-08-07 18:00:18 -07002089 for (tbl = neigh_tables, tidx = 0; tbl; tbl = tbl->next, tidx++) {
Thomas Grafc7fb64d2005-06-18 22:50:55 -07002090 struct neigh_parms *p;
2091
Thomas Grafca860fb2006-08-07 18:00:18 -07002092 if (tidx < tbl_skip || (family && tbl->family != family))
Thomas Grafc7fb64d2005-06-18 22:50:55 -07002093 continue;
2094
Eric W. Biederman15e47302012-09-07 20:12:54 +00002095 if (neightbl_fill_info(skb, tbl, NETLINK_CB(cb->skb).portid,
Thomas Grafca860fb2006-08-07 18:00:18 -07002096 cb->nlh->nlmsg_seq, RTM_NEWNEIGHTBL,
2097 NLM_F_MULTI) <= 0)
Thomas Grafc7fb64d2005-06-18 22:50:55 -07002098 break;
2099
Eric W. Biederman426b5302008-01-24 00:13:18 -08002100 for (nidx = 0, p = tbl->parms.next; p; p = p->next) {
YOSHIFUJI Hideaki878628f2008-03-26 03:57:35 +09002101 if (!net_eq(neigh_parms_net(p), net))
Eric W. Biederman426b5302008-01-24 00:13:18 -08002102 continue;
2103
Gautam Kachrooefc683f2009-02-06 00:52:04 -08002104 if (nidx < neigh_skip)
2105 goto next;
Thomas Grafc7fb64d2005-06-18 22:50:55 -07002106
Thomas Grafca860fb2006-08-07 18:00:18 -07002107 if (neightbl_fill_param_info(skb, tbl, p,
Eric W. Biederman15e47302012-09-07 20:12:54 +00002108 NETLINK_CB(cb->skb).portid,
Thomas Grafca860fb2006-08-07 18:00:18 -07002109 cb->nlh->nlmsg_seq,
2110 RTM_NEWNEIGHTBL,
2111 NLM_F_MULTI) <= 0)
Thomas Grafc7fb64d2005-06-18 22:50:55 -07002112 goto out;
Gautam Kachrooefc683f2009-02-06 00:52:04 -08002113 next:
2114 nidx++;
Thomas Grafc7fb64d2005-06-18 22:50:55 -07002115 }
2116
Thomas Grafca860fb2006-08-07 18:00:18 -07002117 neigh_skip = 0;
Thomas Grafc7fb64d2005-06-18 22:50:55 -07002118 }
2119out:
2120 read_unlock(&neigh_tbl_lock);
Thomas Grafca860fb2006-08-07 18:00:18 -07002121 cb->args[0] = tidx;
2122 cb->args[1] = nidx;
Thomas Grafc7fb64d2005-06-18 22:50:55 -07002123
2124 return skb->len;
2125}
Linus Torvalds1da177e2005-04-16 15:20:36 -07002126
Thomas Graf8b8aec52006-08-07 17:56:37 -07002127static int neigh_fill_info(struct sk_buff *skb, struct neighbour *neigh,
2128 u32 pid, u32 seq, int type, unsigned int flags)
Linus Torvalds1da177e2005-04-16 15:20:36 -07002129{
2130 unsigned long now = jiffies;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002131 struct nda_cacheinfo ci;
Thomas Graf8b8aec52006-08-07 17:56:37 -07002132 struct nlmsghdr *nlh;
2133 struct ndmsg *ndm;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002134
Thomas Graf8b8aec52006-08-07 17:56:37 -07002135 nlh = nlmsg_put(skb, pid, seq, type, sizeof(*ndm), flags);
2136 if (nlh == NULL)
Patrick McHardy26932562007-01-31 23:16:40 -08002137 return -EMSGSIZE;
Thomas Graf8b8aec52006-08-07 17:56:37 -07002138
2139 ndm = nlmsg_data(nlh);
2140 ndm->ndm_family = neigh->ops->family;
Patrick McHardy9ef1d4c2005-06-28 12:55:30 -07002141 ndm->ndm_pad1 = 0;
2142 ndm->ndm_pad2 = 0;
Thomas Graf8b8aec52006-08-07 17:56:37 -07002143 ndm->ndm_flags = neigh->flags;
2144 ndm->ndm_type = neigh->type;
2145 ndm->ndm_ifindex = neigh->dev->ifindex;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002146
David S. Miller9a6308d2012-04-01 20:06:28 -04002147 if (nla_put(skb, NDA_DST, neigh->tbl->key_len, neigh->primary_key))
2148 goto nla_put_failure;
Thomas Graf8b8aec52006-08-07 17:56:37 -07002149
2150 read_lock_bh(&neigh->lock);
2151 ndm->ndm_state = neigh->nud_state;
Eric Dumazet0ed8ddf2010-10-07 10:44:07 +00002152 if (neigh->nud_state & NUD_VALID) {
2153 char haddr[MAX_ADDR_LEN];
2154
2155 neigh_ha_snapshot(haddr, neigh, neigh->dev);
2156 if (nla_put(skb, NDA_LLADDR, neigh->dev->addr_len, haddr) < 0) {
2157 read_unlock_bh(&neigh->lock);
2158 goto nla_put_failure;
2159 }
Thomas Graf8b8aec52006-08-07 17:56:37 -07002160 }
2161
Stephen Hemmingerb9f5f522008-06-03 16:03:15 -07002162 ci.ndm_used = jiffies_to_clock_t(now - neigh->used);
2163 ci.ndm_confirmed = jiffies_to_clock_t(now - neigh->confirmed);
2164 ci.ndm_updated = jiffies_to_clock_t(now - neigh->updated);
Thomas Graf8b8aec52006-08-07 17:56:37 -07002165 ci.ndm_refcnt = atomic_read(&neigh->refcnt) - 1;
2166 read_unlock_bh(&neigh->lock);
2167
David S. Miller9a6308d2012-04-01 20:06:28 -04002168 if (nla_put_u32(skb, NDA_PROBES, atomic_read(&neigh->probes)) ||
2169 nla_put(skb, NDA_CACHEINFO, sizeof(ci), &ci))
2170 goto nla_put_failure;
Thomas Graf8b8aec52006-08-07 17:56:37 -07002171
2172 return nlmsg_end(skb, nlh);
2173
2174nla_put_failure:
Patrick McHardy26932562007-01-31 23:16:40 -08002175 nlmsg_cancel(skb, nlh);
2176 return -EMSGSIZE;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002177}
2178
Tony Zelenoff84920c12012-01-26 22:28:58 +00002179static int pneigh_fill_info(struct sk_buff *skb, struct pneigh_entry *pn,
2180 u32 pid, u32 seq, int type, unsigned int flags,
2181 struct neigh_table *tbl)
2182{
2183 struct nlmsghdr *nlh;
2184 struct ndmsg *ndm;
2185
2186 nlh = nlmsg_put(skb, pid, seq, type, sizeof(*ndm), flags);
2187 if (nlh == NULL)
2188 return -EMSGSIZE;
2189
2190 ndm = nlmsg_data(nlh);
2191 ndm->ndm_family = tbl->family;
2192 ndm->ndm_pad1 = 0;
2193 ndm->ndm_pad2 = 0;
2194 ndm->ndm_flags = pn->flags | NTF_PROXY;
2195 ndm->ndm_type = NDA_DST;
2196 ndm->ndm_ifindex = pn->dev->ifindex;
2197 ndm->ndm_state = NUD_NONE;
2198
David S. Miller9a6308d2012-04-01 20:06:28 -04002199 if (nla_put(skb, NDA_DST, tbl->key_len, pn->key))
2200 goto nla_put_failure;
Tony Zelenoff84920c12012-01-26 22:28:58 +00002201
2202 return nlmsg_end(skb, nlh);
2203
2204nla_put_failure:
2205 nlmsg_cancel(skb, nlh);
2206 return -EMSGSIZE;
2207}
2208
Thomas Grafd961db32007-08-08 23:12:56 -07002209static void neigh_update_notify(struct neighbour *neigh)
2210{
2211 call_netevent_notifiers(NETEVENT_NEIGH_UPDATE, neigh);
2212 __neigh_notify(neigh, RTM_NEWNEIGH, 0);
2213}
Linus Torvalds1da177e2005-04-16 15:20:36 -07002214
2215static int neigh_dump_table(struct neigh_table *tbl, struct sk_buff *skb,
2216 struct netlink_callback *cb)
2217{
Eric Dumazet767e97e2010-10-06 17:49:21 -07002218 struct net *net = sock_net(skb->sk);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002219 struct neighbour *n;
2220 int rc, h, s_h = cb->args[1];
2221 int idx, s_idx = idx = cb->args[2];
Eric Dumazetd6bf7812010-10-04 06:15:44 +00002222 struct neigh_hash_table *nht;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002223
Eric Dumazetd6bf7812010-10-04 06:15:44 +00002224 rcu_read_lock_bh();
2225 nht = rcu_dereference_bh(tbl->nht);
2226
Eric Dumazet4bd66832012-06-07 04:58:35 +00002227 for (h = s_h; h < (1 << nht->hash_shift); h++) {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002228 if (h > s_h)
2229 s_idx = 0;
Eric Dumazet767e97e2010-10-06 17:49:21 -07002230 for (n = rcu_dereference_bh(nht->hash_buckets[h]), idx = 0;
2231 n != NULL;
2232 n = rcu_dereference_bh(n->next)) {
Octavian Purdila09ad9bc2009-11-25 15:14:13 -08002233 if (!net_eq(dev_net(n->dev), net))
Eric W. Biederman426b5302008-01-24 00:13:18 -08002234 continue;
Gautam Kachrooefc683f2009-02-06 00:52:04 -08002235 if (idx < s_idx)
2236 goto next;
Eric W. Biederman15e47302012-09-07 20:12:54 +00002237 if (neigh_fill_info(skb, n, NETLINK_CB(cb->skb).portid,
Linus Torvalds1da177e2005-04-16 15:20:36 -07002238 cb->nlh->nlmsg_seq,
Jamal Hadi Salimb6544c02005-06-18 22:54:12 -07002239 RTM_NEWNEIGH,
2240 NLM_F_MULTI) <= 0) {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002241 rc = -1;
2242 goto out;
2243 }
Eric Dumazet767e97e2010-10-06 17:49:21 -07002244next:
Gautam Kachrooefc683f2009-02-06 00:52:04 -08002245 idx++;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002246 }
Linus Torvalds1da177e2005-04-16 15:20:36 -07002247 }
2248 rc = skb->len;
2249out:
Eric Dumazetd6bf7812010-10-04 06:15:44 +00002250 rcu_read_unlock_bh();
Linus Torvalds1da177e2005-04-16 15:20:36 -07002251 cb->args[1] = h;
2252 cb->args[2] = idx;
2253 return rc;
2254}
2255
Tony Zelenoff84920c12012-01-26 22:28:58 +00002256static int pneigh_dump_table(struct neigh_table *tbl, struct sk_buff *skb,
2257 struct netlink_callback *cb)
2258{
2259 struct pneigh_entry *n;
2260 struct net *net = sock_net(skb->sk);
2261 int rc, h, s_h = cb->args[3];
2262 int idx, s_idx = idx = cb->args[4];
2263
2264 read_lock_bh(&tbl->lock);
2265
Eric Dumazet4bd66832012-06-07 04:58:35 +00002266 for (h = s_h; h <= PNEIGH_HASHMASK; h++) {
Tony Zelenoff84920c12012-01-26 22:28:58 +00002267 if (h > s_h)
2268 s_idx = 0;
2269 for (n = tbl->phash_buckets[h], idx = 0; n; n = n->next) {
2270 if (dev_net(n->dev) != net)
2271 continue;
2272 if (idx < s_idx)
2273 goto next;
Eric W. Biederman15e47302012-09-07 20:12:54 +00002274 if (pneigh_fill_info(skb, n, NETLINK_CB(cb->skb).portid,
Tony Zelenoff84920c12012-01-26 22:28:58 +00002275 cb->nlh->nlmsg_seq,
2276 RTM_NEWNEIGH,
2277 NLM_F_MULTI, tbl) <= 0) {
2278 read_unlock_bh(&tbl->lock);
2279 rc = -1;
2280 goto out;
2281 }
2282 next:
2283 idx++;
2284 }
2285 }
2286
2287 read_unlock_bh(&tbl->lock);
2288 rc = skb->len;
2289out:
2290 cb->args[3] = h;
2291 cb->args[4] = idx;
2292 return rc;
2293
2294}
2295
Thomas Grafc8822a42007-03-22 11:50:06 -07002296static int neigh_dump_info(struct sk_buff *skb, struct netlink_callback *cb)
Linus Torvalds1da177e2005-04-16 15:20:36 -07002297{
2298 struct neigh_table *tbl;
2299 int t, family, s_t;
Tony Zelenoff84920c12012-01-26 22:28:58 +00002300 int proxy = 0;
Eric Dumazet4bd66832012-06-07 04:58:35 +00002301 int err;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002302
2303 read_lock(&neigh_tbl_lock);
Thomas Graf8b8aec52006-08-07 17:56:37 -07002304 family = ((struct rtgenmsg *) nlmsg_data(cb->nlh))->rtgen_family;
Tony Zelenoff84920c12012-01-26 22:28:58 +00002305
2306 /* check for full ndmsg structure presence, family member is
2307 * the same for both structures
2308 */
2309 if (nlmsg_len(cb->nlh) >= sizeof(struct ndmsg) &&
2310 ((struct ndmsg *) nlmsg_data(cb->nlh))->ndm_flags == NTF_PROXY)
2311 proxy = 1;
2312
Linus Torvalds1da177e2005-04-16 15:20:36 -07002313 s_t = cb->args[0];
2314
Eric Dumazet4bd66832012-06-07 04:58:35 +00002315 for (tbl = neigh_tables, t = 0; tbl;
Tony Zelenoff84920c12012-01-26 22:28:58 +00002316 tbl = tbl->next, t++) {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002317 if (t < s_t || (family && tbl->family != family))
2318 continue;
2319 if (t > s_t)
2320 memset(&cb->args[1], 0, sizeof(cb->args) -
2321 sizeof(cb->args[0]));
Tony Zelenoff84920c12012-01-26 22:28:58 +00002322 if (proxy)
2323 err = pneigh_dump_table(tbl, skb, cb);
2324 else
2325 err = neigh_dump_table(tbl, skb, cb);
Eric Dumazet4bd66832012-06-07 04:58:35 +00002326 if (err < 0)
2327 break;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002328 }
2329 read_unlock(&neigh_tbl_lock);
2330
2331 cb->args[0] = t;
2332 return skb->len;
2333}
2334
2335void neigh_for_each(struct neigh_table *tbl, void (*cb)(struct neighbour *, void *), void *cookie)
2336{
2337 int chain;
Eric Dumazetd6bf7812010-10-04 06:15:44 +00002338 struct neigh_hash_table *nht;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002339
Eric Dumazetd6bf7812010-10-04 06:15:44 +00002340 rcu_read_lock_bh();
2341 nht = rcu_dereference_bh(tbl->nht);
2342
Eric Dumazet767e97e2010-10-06 17:49:21 -07002343 read_lock(&tbl->lock); /* avoid resizes */
David S. Millercd089332011-07-11 01:28:12 -07002344 for (chain = 0; chain < (1 << nht->hash_shift); chain++) {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002345 struct neighbour *n;
2346
Eric Dumazet767e97e2010-10-06 17:49:21 -07002347 for (n = rcu_dereference_bh(nht->hash_buckets[chain]);
2348 n != NULL;
2349 n = rcu_dereference_bh(n->next))
Linus Torvalds1da177e2005-04-16 15:20:36 -07002350 cb(n, cookie);
2351 }
Eric Dumazetd6bf7812010-10-04 06:15:44 +00002352 read_unlock(&tbl->lock);
2353 rcu_read_unlock_bh();
Linus Torvalds1da177e2005-04-16 15:20:36 -07002354}
2355EXPORT_SYMBOL(neigh_for_each);
2356
2357/* The tbl->lock must be held as a writer and BH disabled. */
2358void __neigh_for_each_release(struct neigh_table *tbl,
2359 int (*cb)(struct neighbour *))
2360{
2361 int chain;
Eric Dumazetd6bf7812010-10-04 06:15:44 +00002362 struct neigh_hash_table *nht;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002363
Eric Dumazetd6bf7812010-10-04 06:15:44 +00002364 nht = rcu_dereference_protected(tbl->nht,
2365 lockdep_is_held(&tbl->lock));
David S. Millercd089332011-07-11 01:28:12 -07002366 for (chain = 0; chain < (1 << nht->hash_shift); chain++) {
Eric Dumazet767e97e2010-10-06 17:49:21 -07002367 struct neighbour *n;
2368 struct neighbour __rcu **np;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002369
Eric Dumazetd6bf7812010-10-04 06:15:44 +00002370 np = &nht->hash_buckets[chain];
Eric Dumazet767e97e2010-10-06 17:49:21 -07002371 while ((n = rcu_dereference_protected(*np,
2372 lockdep_is_held(&tbl->lock))) != NULL) {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002373 int release;
2374
2375 write_lock(&n->lock);
2376 release = cb(n);
2377 if (release) {
Eric Dumazet767e97e2010-10-06 17:49:21 -07002378 rcu_assign_pointer(*np,
2379 rcu_dereference_protected(n->next,
2380 lockdep_is_held(&tbl->lock)));
Linus Torvalds1da177e2005-04-16 15:20:36 -07002381 n->dead = 1;
2382 } else
2383 np = &n->next;
2384 write_unlock(&n->lock);
Thomas Graf4f494552007-08-08 23:12:36 -07002385 if (release)
2386 neigh_cleanup_and_release(n);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002387 }
2388 }
2389}
2390EXPORT_SYMBOL(__neigh_for_each_release);
2391
2392#ifdef CONFIG_PROC_FS
2393
2394static struct neighbour *neigh_get_first(struct seq_file *seq)
2395{
2396 struct neigh_seq_state *state = seq->private;
YOSHIFUJI Hideaki12188542008-03-26 02:36:06 +09002397 struct net *net = seq_file_net(seq);
Eric Dumazetd6bf7812010-10-04 06:15:44 +00002398 struct neigh_hash_table *nht = state->nht;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002399 struct neighbour *n = NULL;
2400 int bucket = state->bucket;
2401
2402 state->flags &= ~NEIGH_SEQ_IS_PNEIGH;
David S. Millercd089332011-07-11 01:28:12 -07002403 for (bucket = 0; bucket < (1 << nht->hash_shift); bucket++) {
Eric Dumazet767e97e2010-10-06 17:49:21 -07002404 n = rcu_dereference_bh(nht->hash_buckets[bucket]);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002405
2406 while (n) {
YOSHIFUJI Hideaki878628f2008-03-26 03:57:35 +09002407 if (!net_eq(dev_net(n->dev), net))
Eric W. Biederman426b5302008-01-24 00:13:18 -08002408 goto next;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002409 if (state->neigh_sub_iter) {
2410 loff_t fakep = 0;
2411 void *v;
2412
2413 v = state->neigh_sub_iter(state, n, &fakep);
2414 if (!v)
2415 goto next;
2416 }
2417 if (!(state->flags & NEIGH_SEQ_SKIP_NOARP))
2418 break;
2419 if (n->nud_state & ~NUD_NOARP)
2420 break;
Eric Dumazet767e97e2010-10-06 17:49:21 -07002421next:
2422 n = rcu_dereference_bh(n->next);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002423 }
2424
2425 if (n)
2426 break;
2427 }
2428 state->bucket = bucket;
2429
2430 return n;
2431}
2432
2433static struct neighbour *neigh_get_next(struct seq_file *seq,
2434 struct neighbour *n,
2435 loff_t *pos)
2436{
2437 struct neigh_seq_state *state = seq->private;
YOSHIFUJI Hideaki12188542008-03-26 02:36:06 +09002438 struct net *net = seq_file_net(seq);
Eric Dumazetd6bf7812010-10-04 06:15:44 +00002439 struct neigh_hash_table *nht = state->nht;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002440
2441 if (state->neigh_sub_iter) {
2442 void *v = state->neigh_sub_iter(state, n, pos);
2443 if (v)
2444 return n;
2445 }
Eric Dumazet767e97e2010-10-06 17:49:21 -07002446 n = rcu_dereference_bh(n->next);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002447
2448 while (1) {
2449 while (n) {
YOSHIFUJI Hideaki878628f2008-03-26 03:57:35 +09002450 if (!net_eq(dev_net(n->dev), net))
Eric W. Biederman426b5302008-01-24 00:13:18 -08002451 goto next;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002452 if (state->neigh_sub_iter) {
2453 void *v = state->neigh_sub_iter(state, n, pos);
2454 if (v)
2455 return n;
2456 goto next;
2457 }
2458 if (!(state->flags & NEIGH_SEQ_SKIP_NOARP))
2459 break;
2460
2461 if (n->nud_state & ~NUD_NOARP)
2462 break;
Eric Dumazet767e97e2010-10-06 17:49:21 -07002463next:
2464 n = rcu_dereference_bh(n->next);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002465 }
2466
2467 if (n)
2468 break;
2469
David S. Millercd089332011-07-11 01:28:12 -07002470 if (++state->bucket >= (1 << nht->hash_shift))
Linus Torvalds1da177e2005-04-16 15:20:36 -07002471 break;
2472
Eric Dumazet767e97e2010-10-06 17:49:21 -07002473 n = rcu_dereference_bh(nht->hash_buckets[state->bucket]);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002474 }
2475
2476 if (n && pos)
2477 --(*pos);
2478 return n;
2479}
2480
2481static struct neighbour *neigh_get_idx(struct seq_file *seq, loff_t *pos)
2482{
2483 struct neighbour *n = neigh_get_first(seq);
2484
2485 if (n) {
Chris Larson745e2032008-08-03 01:10:55 -07002486 --(*pos);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002487 while (*pos) {
2488 n = neigh_get_next(seq, n, pos);
2489 if (!n)
2490 break;
2491 }
2492 }
2493 return *pos ? NULL : n;
2494}
2495
2496static struct pneigh_entry *pneigh_get_first(struct seq_file *seq)
2497{
2498 struct neigh_seq_state *state = seq->private;
YOSHIFUJI Hideaki12188542008-03-26 02:36:06 +09002499 struct net *net = seq_file_net(seq);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002500 struct neigh_table *tbl = state->tbl;
2501 struct pneigh_entry *pn = NULL;
2502 int bucket = state->bucket;
2503
2504 state->flags |= NEIGH_SEQ_IS_PNEIGH;
2505 for (bucket = 0; bucket <= PNEIGH_HASHMASK; bucket++) {
2506 pn = tbl->phash_buckets[bucket];
YOSHIFUJI Hideaki878628f2008-03-26 03:57:35 +09002507 while (pn && !net_eq(pneigh_net(pn), net))
Eric W. Biederman426b5302008-01-24 00:13:18 -08002508 pn = pn->next;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002509 if (pn)
2510 break;
2511 }
2512 state->bucket = bucket;
2513
2514 return pn;
2515}
2516
2517static struct pneigh_entry *pneigh_get_next(struct seq_file *seq,
2518 struct pneigh_entry *pn,
2519 loff_t *pos)
2520{
2521 struct neigh_seq_state *state = seq->private;
YOSHIFUJI Hideaki12188542008-03-26 02:36:06 +09002522 struct net *net = seq_file_net(seq);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002523 struct neigh_table *tbl = state->tbl;
2524
Jorge Boncompte [DTI2]df07a942011-11-25 13:24:49 -05002525 do {
2526 pn = pn->next;
2527 } while (pn && !net_eq(pneigh_net(pn), net));
2528
Linus Torvalds1da177e2005-04-16 15:20:36 -07002529 while (!pn) {
2530 if (++state->bucket > PNEIGH_HASHMASK)
2531 break;
2532 pn = tbl->phash_buckets[state->bucket];
YOSHIFUJI Hideaki878628f2008-03-26 03:57:35 +09002533 while (pn && !net_eq(pneigh_net(pn), net))
Eric W. Biederman426b5302008-01-24 00:13:18 -08002534 pn = pn->next;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002535 if (pn)
2536 break;
2537 }
2538
2539 if (pn && pos)
2540 --(*pos);
2541
2542 return pn;
2543}
2544
2545static struct pneigh_entry *pneigh_get_idx(struct seq_file *seq, loff_t *pos)
2546{
2547 struct pneigh_entry *pn = pneigh_get_first(seq);
2548
2549 if (pn) {
Chris Larson745e2032008-08-03 01:10:55 -07002550 --(*pos);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002551 while (*pos) {
2552 pn = pneigh_get_next(seq, pn, pos);
2553 if (!pn)
2554 break;
2555 }
2556 }
2557 return *pos ? NULL : pn;
2558}
2559
2560static void *neigh_get_idx_any(struct seq_file *seq, loff_t *pos)
2561{
2562 struct neigh_seq_state *state = seq->private;
2563 void *rc;
Chris Larson745e2032008-08-03 01:10:55 -07002564 loff_t idxpos = *pos;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002565
Chris Larson745e2032008-08-03 01:10:55 -07002566 rc = neigh_get_idx(seq, &idxpos);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002567 if (!rc && !(state->flags & NEIGH_SEQ_NEIGH_ONLY))
Chris Larson745e2032008-08-03 01:10:55 -07002568 rc = pneigh_get_idx(seq, &idxpos);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002569
2570 return rc;
2571}
2572
2573void *neigh_seq_start(struct seq_file *seq, loff_t *pos, struct neigh_table *tbl, unsigned int neigh_seq_flags)
Eric Dumazetd6bf7812010-10-04 06:15:44 +00002574 __acquires(rcu_bh)
Linus Torvalds1da177e2005-04-16 15:20:36 -07002575{
2576 struct neigh_seq_state *state = seq->private;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002577
2578 state->tbl = tbl;
2579 state->bucket = 0;
2580 state->flags = (neigh_seq_flags & ~NEIGH_SEQ_IS_PNEIGH);
2581
Eric Dumazetd6bf7812010-10-04 06:15:44 +00002582 rcu_read_lock_bh();
2583 state->nht = rcu_dereference_bh(tbl->nht);
Eric Dumazet767e97e2010-10-06 17:49:21 -07002584
Chris Larson745e2032008-08-03 01:10:55 -07002585 return *pos ? neigh_get_idx_any(seq, pos) : SEQ_START_TOKEN;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002586}
2587EXPORT_SYMBOL(neigh_seq_start);
2588
2589void *neigh_seq_next(struct seq_file *seq, void *v, loff_t *pos)
2590{
2591 struct neigh_seq_state *state;
2592 void *rc;
2593
2594 if (v == SEQ_START_TOKEN) {
Chris Larsonbff69732008-08-03 01:02:41 -07002595 rc = neigh_get_first(seq);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002596 goto out;
2597 }
2598
2599 state = seq->private;
2600 if (!(state->flags & NEIGH_SEQ_IS_PNEIGH)) {
2601 rc = neigh_get_next(seq, v, NULL);
2602 if (rc)
2603 goto out;
2604 if (!(state->flags & NEIGH_SEQ_NEIGH_ONLY))
2605 rc = pneigh_get_first(seq);
2606 } else {
2607 BUG_ON(state->flags & NEIGH_SEQ_NEIGH_ONLY);
2608 rc = pneigh_get_next(seq, v, NULL);
2609 }
2610out:
2611 ++(*pos);
2612 return rc;
2613}
2614EXPORT_SYMBOL(neigh_seq_next);
2615
2616void neigh_seq_stop(struct seq_file *seq, void *v)
Eric Dumazetd6bf7812010-10-04 06:15:44 +00002617 __releases(rcu_bh)
Linus Torvalds1da177e2005-04-16 15:20:36 -07002618{
Eric Dumazetd6bf7812010-10-04 06:15:44 +00002619 rcu_read_unlock_bh();
Linus Torvalds1da177e2005-04-16 15:20:36 -07002620}
2621EXPORT_SYMBOL(neigh_seq_stop);
2622
2623/* statistics via seq_file */
2624
2625static void *neigh_stat_seq_start(struct seq_file *seq, loff_t *pos)
2626{
Alexey Dobriyan81c1ebf2010-01-22 10:16:05 +00002627 struct neigh_table *tbl = seq->private;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002628 int cpu;
2629
2630 if (*pos == 0)
2631 return SEQ_START_TOKEN;
YOSHIFUJI Hideaki4ec93ed2007-02-09 23:24:36 +09002632
Rusty Russell0f23174a2008-12-29 12:23:42 +00002633 for (cpu = *pos-1; cpu < nr_cpu_ids; ++cpu) {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002634 if (!cpu_possible(cpu))
2635 continue;
2636 *pos = cpu+1;
2637 return per_cpu_ptr(tbl->stats, cpu);
2638 }
2639 return NULL;
2640}
2641
2642static void *neigh_stat_seq_next(struct seq_file *seq, void *v, loff_t *pos)
2643{
Alexey Dobriyan81c1ebf2010-01-22 10:16:05 +00002644 struct neigh_table *tbl = seq->private;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002645 int cpu;
2646
Rusty Russell0f23174a2008-12-29 12:23:42 +00002647 for (cpu = *pos; cpu < nr_cpu_ids; ++cpu) {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002648 if (!cpu_possible(cpu))
2649 continue;
2650 *pos = cpu+1;
2651 return per_cpu_ptr(tbl->stats, cpu);
2652 }
2653 return NULL;
2654}
2655
/* ->stop for the per-cpu statistics file: nothing to release. */
static void neigh_stat_seq_stop(struct seq_file *seq, void *v)
{
}
2660
2661static int neigh_stat_seq_show(struct seq_file *seq, void *v)
2662{
Alexey Dobriyan81c1ebf2010-01-22 10:16:05 +00002663 struct neigh_table *tbl = seq->private;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002664 struct neigh_statistics *st = v;
2665
2666 if (v == SEQ_START_TOKEN) {
Neil Horman9a6d2762008-07-16 20:50:49 -07002667 seq_printf(seq, "entries allocs destroys hash_grows lookups hits res_failed rcv_probes_mcast rcv_probes_ucast periodic_gc_runs forced_gc_runs unresolved_discards\n");
Linus Torvalds1da177e2005-04-16 15:20:36 -07002668 return 0;
2669 }
2670
2671 seq_printf(seq, "%08x %08lx %08lx %08lx %08lx %08lx %08lx "
Neil Horman9a6d2762008-07-16 20:50:49 -07002672 "%08lx %08lx %08lx %08lx %08lx\n",
Linus Torvalds1da177e2005-04-16 15:20:36 -07002673 atomic_read(&tbl->entries),
2674
2675 st->allocs,
2676 st->destroys,
2677 st->hash_grows,
2678
2679 st->lookups,
2680 st->hits,
2681
2682 st->res_failed,
2683
2684 st->rcv_probes_mcast,
2685 st->rcv_probes_ucast,
2686
2687 st->periodic_gc_runs,
Neil Horman9a6d2762008-07-16 20:50:49 -07002688 st->forced_gc_runs,
2689 st->unres_discards
Linus Torvalds1da177e2005-04-16 15:20:36 -07002690 );
2691
2692 return 0;
2693}
2694
Stephen Hemmingerf6908082007-03-12 14:34:29 -07002695static const struct seq_operations neigh_stat_seq_ops = {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002696 .start = neigh_stat_seq_start,
2697 .next = neigh_stat_seq_next,
2698 .stop = neigh_stat_seq_stop,
2699 .show = neigh_stat_seq_show,
2700};
2701
2702static int neigh_stat_seq_open(struct inode *inode, struct file *file)
2703{
2704 int ret = seq_open(file, &neigh_stat_seq_ops);
2705
2706 if (!ret) {
2707 struct seq_file *sf = file->private_data;
Al Virod9dda782013-03-31 18:16:14 -04002708 sf->private = PDE_DATA(inode);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002709 }
2710 return ret;
2711};
2712
Arjan van de Ven9a321442007-02-12 00:55:35 -08002713static const struct file_operations neigh_stat_seq_fops = {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002714 .owner = THIS_MODULE,
2715 .open = neigh_stat_seq_open,
2716 .read = seq_read,
2717 .llseek = seq_lseek,
2718 .release = seq_release,
2719};
2720
2721#endif /* CONFIG_PROC_FS */
2722
Thomas Graf339bf982006-11-10 14:10:15 -08002723static inline size_t neigh_nlmsg_size(void)
2724{
2725 return NLMSG_ALIGN(sizeof(struct ndmsg))
2726 + nla_total_size(MAX_ADDR_LEN) /* NDA_DST */
2727 + nla_total_size(MAX_ADDR_LEN) /* NDA_LLADDR */
2728 + nla_total_size(sizeof(struct nda_cacheinfo))
2729 + nla_total_size(4); /* NDA_PROBES */
2730}
2731
Thomas Grafb8673312006-08-15 00:33:14 -07002732static void __neigh_notify(struct neighbour *n, int type, int flags)
Linus Torvalds1da177e2005-04-16 15:20:36 -07002733{
YOSHIFUJI Hideakic346dca2008-03-25 21:47:49 +09002734 struct net *net = dev_net(n->dev);
Thomas Graf8b8aec52006-08-07 17:56:37 -07002735 struct sk_buff *skb;
Thomas Grafb8673312006-08-15 00:33:14 -07002736 int err = -ENOBUFS;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002737
Thomas Graf339bf982006-11-10 14:10:15 -08002738 skb = nlmsg_new(neigh_nlmsg_size(), GFP_ATOMIC);
Thomas Graf8b8aec52006-08-07 17:56:37 -07002739 if (skb == NULL)
Thomas Grafb8673312006-08-15 00:33:14 -07002740 goto errout;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002741
Thomas Grafb8673312006-08-15 00:33:14 -07002742 err = neigh_fill_info(skb, n, 0, 0, type, flags);
Patrick McHardy26932562007-01-31 23:16:40 -08002743 if (err < 0) {
2744 /* -EMSGSIZE implies BUG in neigh_nlmsg_size() */
2745 WARN_ON(err == -EMSGSIZE);
2746 kfree_skb(skb);
2747 goto errout;
2748 }
Pablo Neira Ayuso1ce85fe2009-02-24 23:18:28 -08002749 rtnl_notify(skb, net, 0, RTNLGRP_NEIGH, NULL, GFP_ATOMIC);
2750 return;
Thomas Grafb8673312006-08-15 00:33:14 -07002751errout:
2752 if (err < 0)
Eric W. Biederman426b5302008-01-24 00:13:18 -08002753 rtnl_set_sk_err(net, RTNLGRP_NEIGH, err);
Thomas Grafb8673312006-08-15 00:33:14 -07002754}
2755
Thomas Grafd961db32007-08-08 23:12:56 -07002756#ifdef CONFIG_ARPD
Thomas Grafb8673312006-08-15 00:33:14 -07002757void neigh_app_ns(struct neighbour *n)
2758{
2759 __neigh_notify(n, RTM_GETNEIGH, NLM_F_REQUEST);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002760}
YOSHIFUJI Hideaki0a204502008-03-24 18:39:10 +09002761EXPORT_SYMBOL(neigh_app_ns);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002762#endif /* CONFIG_ARPD */
2763
2764#ifdef CONFIG_SYSCTL
Cong Wangb93196d2012-12-06 10:04:04 +08002765static int zero;
2766static int unres_qlen_max = INT_MAX / SKB_TRUESIZE(ETH_FRAME_LEN);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002767
Eric Dumazet8b5c1712011-11-09 12:07:14 +00002768static int proc_unres_qlen(ctl_table *ctl, int write, void __user *buffer,
2769 size_t *lenp, loff_t *ppos)
2770{
2771 int size, ret;
2772 ctl_table tmp = *ctl;
2773
Shan Weice46cc62012-12-04 18:49:15 +00002774 tmp.extra1 = &zero;
2775 tmp.extra2 = &unres_qlen_max;
Eric Dumazet8b5c1712011-11-09 12:07:14 +00002776 tmp.data = &size;
Shan Weice46cc62012-12-04 18:49:15 +00002777
2778 size = *(int *)ctl->data / SKB_TRUESIZE(ETH_FRAME_LEN);
2779 ret = proc_dointvec_minmax(&tmp, write, buffer, lenp, ppos);
2780
Eric Dumazet8b5c1712011-11-09 12:07:14 +00002781 if (write && !ret)
2782 *(int *)ctl->data = size * SKB_TRUESIZE(ETH_FRAME_LEN);
2783 return ret;
2784}
2785
/*
 * Indices into neigh_sysctl_table.neigh_vars[]; NEIGH_VAR_MAX is the
 * number of real entries (the array has one extra slot after them).
 */
enum {
	/* per-parms variables */
	NEIGH_VAR_MCAST_PROBE,
	NEIGH_VAR_UCAST_PROBE,
	NEIGH_VAR_APP_PROBE,
	NEIGH_VAR_RETRANS_TIME,
	NEIGH_VAR_BASE_REACHABLE_TIME,
	NEIGH_VAR_DELAY_PROBE_TIME,
	NEIGH_VAR_GC_STALETIME,
	NEIGH_VAR_QUEUE_LEN,
	NEIGH_VAR_QUEUE_LEN_BYTES,
	NEIGH_VAR_PROXY_QLEN,
	NEIGH_VAR_ANYCAST_DELAY,
	NEIGH_VAR_PROXY_DELAY,
	NEIGH_VAR_LOCKTIME,
	NEIGH_VAR_RETRANS_TIME_MS,
	NEIGH_VAR_BASE_REACHABLE_TIME_MS,

	/* garbage-collection variables */
	NEIGH_VAR_GC_INTERVAL,
	NEIGH_VAR_GC_THRESH1,
	NEIGH_VAR_GC_THRESH2,
	NEIGH_VAR_GC_THRESH3,

	NEIGH_VAR_MAX
};
Eric W. Biederman54716e32010-02-14 03:27:03 +00002808
Linus Torvalds1da177e2005-04-16 15:20:36 -07002809static struct neigh_sysctl_table {
2810 struct ctl_table_header *sysctl_header;
Eric Dumazet8b5c1712011-11-09 12:07:14 +00002811 struct ctl_table neigh_vars[NEIGH_VAR_MAX + 1];
Brian Haleyab32ea52006-09-22 14:15:41 -07002812} neigh_sysctl_template __read_mostly = {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002813 .neigh_vars = {
Eric Dumazet8b5c1712011-11-09 12:07:14 +00002814 [NEIGH_VAR_MCAST_PROBE] = {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002815 .procname = "mcast_solicit",
2816 .maxlen = sizeof(int),
2817 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -08002818 .proc_handler = proc_dointvec,
Linus Torvalds1da177e2005-04-16 15:20:36 -07002819 },
Eric Dumazet8b5c1712011-11-09 12:07:14 +00002820 [NEIGH_VAR_UCAST_PROBE] = {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002821 .procname = "ucast_solicit",
2822 .maxlen = sizeof(int),
2823 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -08002824 .proc_handler = proc_dointvec,
Linus Torvalds1da177e2005-04-16 15:20:36 -07002825 },
Eric Dumazet8b5c1712011-11-09 12:07:14 +00002826 [NEIGH_VAR_APP_PROBE] = {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002827 .procname = "app_solicit",
2828 .maxlen = sizeof(int),
2829 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -08002830 .proc_handler = proc_dointvec,
Linus Torvalds1da177e2005-04-16 15:20:36 -07002831 },
Eric Dumazet8b5c1712011-11-09 12:07:14 +00002832 [NEIGH_VAR_RETRANS_TIME] = {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002833 .procname = "retrans_time",
2834 .maxlen = sizeof(int),
2835 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -08002836 .proc_handler = proc_dointvec_userhz_jiffies,
Linus Torvalds1da177e2005-04-16 15:20:36 -07002837 },
Eric Dumazet8b5c1712011-11-09 12:07:14 +00002838 [NEIGH_VAR_BASE_REACHABLE_TIME] = {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002839 .procname = "base_reachable_time",
2840 .maxlen = sizeof(int),
2841 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -08002842 .proc_handler = proc_dointvec_jiffies,
Linus Torvalds1da177e2005-04-16 15:20:36 -07002843 },
Eric Dumazet8b5c1712011-11-09 12:07:14 +00002844 [NEIGH_VAR_DELAY_PROBE_TIME] = {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002845 .procname = "delay_first_probe_time",
2846 .maxlen = sizeof(int),
2847 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -08002848 .proc_handler = proc_dointvec_jiffies,
Linus Torvalds1da177e2005-04-16 15:20:36 -07002849 },
Eric Dumazet8b5c1712011-11-09 12:07:14 +00002850 [NEIGH_VAR_GC_STALETIME] = {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002851 .procname = "gc_stale_time",
2852 .maxlen = sizeof(int),
2853 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -08002854 .proc_handler = proc_dointvec_jiffies,
Linus Torvalds1da177e2005-04-16 15:20:36 -07002855 },
Eric Dumazet8b5c1712011-11-09 12:07:14 +00002856 [NEIGH_VAR_QUEUE_LEN] = {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002857 .procname = "unres_qlen",
2858 .maxlen = sizeof(int),
2859 .mode = 0644,
Eric Dumazet8b5c1712011-11-09 12:07:14 +00002860 .proc_handler = proc_unres_qlen,
2861 },
2862 [NEIGH_VAR_QUEUE_LEN_BYTES] = {
2863 .procname = "unres_qlen_bytes",
2864 .maxlen = sizeof(int),
2865 .mode = 0644,
Shan Weice46cc62012-12-04 18:49:15 +00002866 .extra1 = &zero,
2867 .proc_handler = proc_dointvec_minmax,
Linus Torvalds1da177e2005-04-16 15:20:36 -07002868 },
Eric Dumazet8b5c1712011-11-09 12:07:14 +00002869 [NEIGH_VAR_PROXY_QLEN] = {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002870 .procname = "proxy_qlen",
2871 .maxlen = sizeof(int),
2872 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -08002873 .proc_handler = proc_dointvec,
Linus Torvalds1da177e2005-04-16 15:20:36 -07002874 },
Eric Dumazet8b5c1712011-11-09 12:07:14 +00002875 [NEIGH_VAR_ANYCAST_DELAY] = {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002876 .procname = "anycast_delay",
2877 .maxlen = sizeof(int),
2878 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -08002879 .proc_handler = proc_dointvec_userhz_jiffies,
Linus Torvalds1da177e2005-04-16 15:20:36 -07002880 },
Eric Dumazet8b5c1712011-11-09 12:07:14 +00002881 [NEIGH_VAR_PROXY_DELAY] = {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002882 .procname = "proxy_delay",
2883 .maxlen = sizeof(int),
2884 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -08002885 .proc_handler = proc_dointvec_userhz_jiffies,
Linus Torvalds1da177e2005-04-16 15:20:36 -07002886 },
Eric Dumazet8b5c1712011-11-09 12:07:14 +00002887 [NEIGH_VAR_LOCKTIME] = {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002888 .procname = "locktime",
2889 .maxlen = sizeof(int),
2890 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -08002891 .proc_handler = proc_dointvec_userhz_jiffies,
Linus Torvalds1da177e2005-04-16 15:20:36 -07002892 },
Eric Dumazet8b5c1712011-11-09 12:07:14 +00002893 [NEIGH_VAR_RETRANS_TIME_MS] = {
Eric W. Biedermand12af672007-10-18 03:05:25 -07002894 .procname = "retrans_time_ms",
2895 .maxlen = sizeof(int),
2896 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -08002897 .proc_handler = proc_dointvec_ms_jiffies,
Eric W. Biedermand12af672007-10-18 03:05:25 -07002898 },
Eric Dumazet8b5c1712011-11-09 12:07:14 +00002899 [NEIGH_VAR_BASE_REACHABLE_TIME_MS] = {
Eric W. Biedermand12af672007-10-18 03:05:25 -07002900 .procname = "base_reachable_time_ms",
2901 .maxlen = sizeof(int),
2902 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -08002903 .proc_handler = proc_dointvec_ms_jiffies,
Eric W. Biedermand12af672007-10-18 03:05:25 -07002904 },
Eric Dumazet8b5c1712011-11-09 12:07:14 +00002905 [NEIGH_VAR_GC_INTERVAL] = {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002906 .procname = "gc_interval",
2907 .maxlen = sizeof(int),
2908 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -08002909 .proc_handler = proc_dointvec_jiffies,
Linus Torvalds1da177e2005-04-16 15:20:36 -07002910 },
Eric Dumazet8b5c1712011-11-09 12:07:14 +00002911 [NEIGH_VAR_GC_THRESH1] = {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002912 .procname = "gc_thresh1",
2913 .maxlen = sizeof(int),
2914 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -08002915 .proc_handler = proc_dointvec,
Linus Torvalds1da177e2005-04-16 15:20:36 -07002916 },
Eric Dumazet8b5c1712011-11-09 12:07:14 +00002917 [NEIGH_VAR_GC_THRESH2] = {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002918 .procname = "gc_thresh2",
2919 .maxlen = sizeof(int),
2920 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -08002921 .proc_handler = proc_dointvec,
Linus Torvalds1da177e2005-04-16 15:20:36 -07002922 },
Eric Dumazet8b5c1712011-11-09 12:07:14 +00002923 [NEIGH_VAR_GC_THRESH3] = {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002924 .procname = "gc_thresh3",
2925 .maxlen = sizeof(int),
2926 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -08002927 .proc_handler = proc_dointvec,
Linus Torvalds1da177e2005-04-16 15:20:36 -07002928 },
Pavel Emelyanovc3bac5a2007-12-02 00:08:16 +11002929 {},
Linus Torvalds1da177e2005-04-16 15:20:36 -07002930 },
2931};
2932
2933int neigh_sysctl_register(struct net_device *dev, struct neigh_parms *p,
Eric W. Biederman54716e32010-02-14 03:27:03 +00002934 char *p_name, proc_handler *handler)
Linus Torvalds1da177e2005-04-16 15:20:36 -07002935{
Pavel Emelyanov3c607bb2007-12-02 00:06:34 +11002936 struct neigh_sysctl_table *t;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002937 const char *dev_name_source = NULL;
Eric W. Biederman8f40a1f2012-04-19 13:38:03 +00002938 char neigh_path[ sizeof("net//neigh/") + IFNAMSIZ + IFNAMSIZ ];
Linus Torvalds1da177e2005-04-16 15:20:36 -07002939
Pavel Emelyanov3c607bb2007-12-02 00:06:34 +11002940 t = kmemdup(&neigh_sysctl_template, sizeof(*t), GFP_KERNEL);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002941 if (!t)
Pavel Emelyanov3c607bb2007-12-02 00:06:34 +11002942 goto err;
2943
Eric Dumazet8b5c1712011-11-09 12:07:14 +00002944 t->neigh_vars[NEIGH_VAR_MCAST_PROBE].data = &p->mcast_probes;
2945 t->neigh_vars[NEIGH_VAR_UCAST_PROBE].data = &p->ucast_probes;
2946 t->neigh_vars[NEIGH_VAR_APP_PROBE].data = &p->app_probes;
2947 t->neigh_vars[NEIGH_VAR_RETRANS_TIME].data = &p->retrans_time;
2948 t->neigh_vars[NEIGH_VAR_BASE_REACHABLE_TIME].data = &p->base_reachable_time;
2949 t->neigh_vars[NEIGH_VAR_DELAY_PROBE_TIME].data = &p->delay_probe_time;
2950 t->neigh_vars[NEIGH_VAR_GC_STALETIME].data = &p->gc_staletime;
2951 t->neigh_vars[NEIGH_VAR_QUEUE_LEN].data = &p->queue_len_bytes;
2952 t->neigh_vars[NEIGH_VAR_QUEUE_LEN_BYTES].data = &p->queue_len_bytes;
2953 t->neigh_vars[NEIGH_VAR_PROXY_QLEN].data = &p->proxy_qlen;
2954 t->neigh_vars[NEIGH_VAR_ANYCAST_DELAY].data = &p->anycast_delay;
2955 t->neigh_vars[NEIGH_VAR_PROXY_DELAY].data = &p->proxy_delay;
2956 t->neigh_vars[NEIGH_VAR_LOCKTIME].data = &p->locktime;
2957 t->neigh_vars[NEIGH_VAR_RETRANS_TIME_MS].data = &p->retrans_time;
2958 t->neigh_vars[NEIGH_VAR_BASE_REACHABLE_TIME_MS].data = &p->base_reachable_time;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002959
2960 if (dev) {
2961 dev_name_source = dev->name;
Eric W. Biedermand12af672007-10-18 03:05:25 -07002962 /* Terminate the table early */
Eric Dumazet8b5c1712011-11-09 12:07:14 +00002963 memset(&t->neigh_vars[NEIGH_VAR_GC_INTERVAL], 0,
2964 sizeof(t->neigh_vars[NEIGH_VAR_GC_INTERVAL]));
Linus Torvalds1da177e2005-04-16 15:20:36 -07002965 } else {
Eric W. Biederman8f40a1f2012-04-19 13:38:03 +00002966 dev_name_source = "default";
Eric Dumazet8b5c1712011-11-09 12:07:14 +00002967 t->neigh_vars[NEIGH_VAR_GC_INTERVAL].data = (int *)(p + 1);
2968 t->neigh_vars[NEIGH_VAR_GC_THRESH1].data = (int *)(p + 1) + 1;
2969 t->neigh_vars[NEIGH_VAR_GC_THRESH2].data = (int *)(p + 1) + 2;
2970 t->neigh_vars[NEIGH_VAR_GC_THRESH3].data = (int *)(p + 1) + 3;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002971 }
2972
Linus Torvalds1da177e2005-04-16 15:20:36 -07002973
Eric W. Biedermanf8572d82009-11-05 13:32:03 -08002974 if (handler) {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002975 /* RetransTime */
Eric Dumazet8b5c1712011-11-09 12:07:14 +00002976 t->neigh_vars[NEIGH_VAR_RETRANS_TIME].proc_handler = handler;
2977 t->neigh_vars[NEIGH_VAR_RETRANS_TIME].extra1 = dev;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002978 /* ReachableTime */
Eric Dumazet8b5c1712011-11-09 12:07:14 +00002979 t->neigh_vars[NEIGH_VAR_BASE_REACHABLE_TIME].proc_handler = handler;
2980 t->neigh_vars[NEIGH_VAR_BASE_REACHABLE_TIME].extra1 = dev;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002981 /* RetransTime (in milliseconds)*/
Eric Dumazet8b5c1712011-11-09 12:07:14 +00002982 t->neigh_vars[NEIGH_VAR_RETRANS_TIME_MS].proc_handler = handler;
2983 t->neigh_vars[NEIGH_VAR_RETRANS_TIME_MS].extra1 = dev;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002984 /* ReachableTime (in milliseconds) */
Eric Dumazet8b5c1712011-11-09 12:07:14 +00002985 t->neigh_vars[NEIGH_VAR_BASE_REACHABLE_TIME_MS].proc_handler = handler;
2986 t->neigh_vars[NEIGH_VAR_BASE_REACHABLE_TIME_MS].extra1 = dev;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002987 }
2988
Eric W. Biederman464dc802012-11-16 03:02:59 +00002989 /* Don't export sysctls to unprivileged users */
2990 if (neigh_parms_net(p)->user_ns != &init_user_ns)
2991 t->neigh_vars[0].procname = NULL;
2992
Eric W. Biederman8f40a1f2012-04-19 13:38:03 +00002993 snprintf(neigh_path, sizeof(neigh_path), "net/%s/neigh/%s",
2994 p_name, dev_name_source);
Denis V. Lunev4ab438f2008-02-28 20:48:01 -08002995 t->sysctl_header =
Eric W. Biederman8f40a1f2012-04-19 13:38:03 +00002996 register_net_sysctl(neigh_parms_net(p), neigh_path, t->neigh_vars);
Pavel Emelyanov3c607bb2007-12-02 00:06:34 +11002997 if (!t->sysctl_header)
Eric W. Biederman8f40a1f2012-04-19 13:38:03 +00002998 goto free;
Pavel Emelyanov3c607bb2007-12-02 00:06:34 +11002999
Linus Torvalds1da177e2005-04-16 15:20:36 -07003000 p->sysctl_table = t;
3001 return 0;
3002
Pavel Emelyanov3c607bb2007-12-02 00:06:34 +11003003free:
Linus Torvalds1da177e2005-04-16 15:20:36 -07003004 kfree(t);
Pavel Emelyanov3c607bb2007-12-02 00:06:34 +11003005err:
3006 return -ENOBUFS;
Linus Torvalds1da177e2005-04-16 15:20:36 -07003007}
YOSHIFUJI Hideaki0a204502008-03-24 18:39:10 +09003008EXPORT_SYMBOL(neigh_sysctl_register);
Linus Torvalds1da177e2005-04-16 15:20:36 -07003009
3010void neigh_sysctl_unregister(struct neigh_parms *p)
3011{
3012 if (p->sysctl_table) {
3013 struct neigh_sysctl_table *t = p->sysctl_table;
3014 p->sysctl_table = NULL;
Eric W. Biederman5dd3df12012-04-19 13:24:33 +00003015 unregister_net_sysctl_table(t->sysctl_header);
Linus Torvalds1da177e2005-04-16 15:20:36 -07003016 kfree(t);
3017 }
3018}
YOSHIFUJI Hideaki0a204502008-03-24 18:39:10 +09003019EXPORT_SYMBOL(neigh_sysctl_unregister);
Linus Torvalds1da177e2005-04-16 15:20:36 -07003020
3021#endif /* CONFIG_SYSCTL */
3022
Thomas Grafc8822a42007-03-22 11:50:06 -07003023static int __init neigh_init(void)
3024{
Greg Rosec7ac8672011-06-10 01:27:09 +00003025 rtnl_register(PF_UNSPEC, RTM_NEWNEIGH, neigh_add, NULL, NULL);
3026 rtnl_register(PF_UNSPEC, RTM_DELNEIGH, neigh_delete, NULL, NULL);
3027 rtnl_register(PF_UNSPEC, RTM_GETNEIGH, NULL, neigh_dump_info, NULL);
Thomas Grafc8822a42007-03-22 11:50:06 -07003028
Greg Rosec7ac8672011-06-10 01:27:09 +00003029 rtnl_register(PF_UNSPEC, RTM_GETNEIGHTBL, NULL, neightbl_dump_info,
3030 NULL);
3031 rtnl_register(PF_UNSPEC, RTM_SETNEIGHTBL, neightbl_set, NULL, NULL);
Thomas Grafc8822a42007-03-22 11:50:06 -07003032
3033 return 0;
3034}
3035
3036subsys_initcall(neigh_init);
3037