blob: 6072610a8672d1a54a0e7618214f70610fa2a6fa [file] [log] [blame]
Linus Torvalds1da177e2005-04-16 15:20:36 -07001/*
2 * Generic address resolution entity
3 *
4 * Authors:
5 * Pedro Roque <roque@di.fc.ul.pt>
6 * Alexey Kuznetsov <kuznet@ms2.inr.ac.ru>
7 *
8 * This program is free software; you can redistribute it and/or
9 * modify it under the terms of the GNU General Public License
10 * as published by the Free Software Foundation; either version
11 * 2 of the License, or (at your option) any later version.
12 *
13 * Fixes:
14 * Vitaly E. Lavrov releasing NULL neighbor in neigh_add.
15 * Harald Welte Add neighbour cache statistics like rtstat
16 */
17
Joe Perchese005d192012-05-16 19:58:40 +000018#define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
19
Tejun Heo5a0e3ad2010-03-24 17:04:11 +090020#include <linux/slab.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070021#include <linux/types.h>
22#include <linux/kernel.h>
23#include <linux/module.h>
24#include <linux/socket.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070025#include <linux/netdevice.h>
26#include <linux/proc_fs.h>
27#ifdef CONFIG_SYSCTL
28#include <linux/sysctl.h>
29#endif
30#include <linux/times.h>
Eric W. Biederman457c4cb2007-09-12 12:01:34 +020031#include <net/net_namespace.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070032#include <net/neighbour.h>
33#include <net/dst.h>
34#include <net/sock.h>
Tom Tucker8d717402006-07-30 20:43:36 -070035#include <net/netevent.h>
Thomas Grafa14a49d2006-08-07 17:53:08 -070036#include <net/netlink.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070037#include <linux/rtnetlink.h>
38#include <linux/random.h>
Paulo Marques543537b2005-06-23 00:09:02 -070039#include <linux/string.h>
vignesh babuc3609d52007-08-24 22:27:55 -070040#include <linux/log2.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070041
#define DEBUG
#define NEIGH_DEBUG 1
/*
 * neigh_dbg - emit a debug message when @level does not exceed NEIGH_DEBUG.
 *
 * @level is parenthesized so that an expression argument cannot be
 * re-associated with the comparison.  The message itself goes through
 * pr_debug(), so it also picks up the pr_fmt() prefix defined at the top
 * of this file.
 *
 * NOTE(review): DEBUG is defined after the #include lines; confirm that it
 * still influences how pr_debug() is compiled for this file.
 */
#define neigh_dbg(level, fmt, ...)		\
do {						\
	if ((level) <= NEIGH_DEBUG)		\
		pr_debug(fmt, ##__VA_ARGS__);	\
} while (0)
Linus Torvalds1da177e2005-04-16 15:20:36 -070049
50#define PNEIGH_HASHMASK 0xF
51
52static void neigh_timer_handler(unsigned long arg);
Thomas Grafd961db32007-08-08 23:12:56 -070053static void __neigh_notify(struct neighbour *n, int type, int flags);
54static void neigh_update_notify(struct neighbour *neigh);
Linus Torvalds1da177e2005-04-16 15:20:36 -070055static int pneigh_ifdown(struct neigh_table *tbl, struct net_device *dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -070056
57static struct neigh_table *neigh_tables;
Amos Waterland45fc3b12005-09-24 16:53:16 -070058#ifdef CONFIG_PROC_FS
Arjan van de Ven9a321442007-02-12 00:55:35 -080059static const struct file_operations neigh_stat_seq_fops;
Amos Waterland45fc3b12005-09-24 16:53:16 -070060#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -070061
/*
   Neighbour hash table buckets are protected with rwlock tbl->lock.

   - All scans/updates of hash buckets MUST be made under this lock.
   - NOTHING clever should be done under this lock: no callbacks
     to protocol backends, no attempts to send something to the network.
     Doing so will result in deadlocks if a backend/driver wants to use
     the neighbour cache.
   - If an entry requires some non-trivial action, increase
     its reference count and release the table lock.

   Neighbour entries are protected:
   - with a reference count.
   - with rwlock neigh->lock

   The reference count prevents destruction.

   neigh->lock mainly serializes the link-layer address data and its
   validity state.  However, the same lock is also used to protect other
   entry fields:
   - timer
   - resolution queue

   Again, nothing clever shall be done under neigh->lock;
   the most complicated procedure we allow is dev->hard_header.
   It is assumed that dev->hard_header is simplistic and does
   not make callbacks to neighbour tables.

   The last lock is neigh_tbl_lock.  It is a pure SMP lock, protecting
   the list of neighbour tables.  This list is used only in process context.
 */
92
93static DEFINE_RWLOCK(neigh_tbl_lock);
94
David S. Miller8f40b162011-07-17 13:34:11 -070095static int neigh_blackhole(struct neighbour *neigh, struct sk_buff *skb)
Linus Torvalds1da177e2005-04-16 15:20:36 -070096{
97 kfree_skb(skb);
98 return -ENETDOWN;
99}
100
Thomas Graf4f494552007-08-08 23:12:36 -0700101static void neigh_cleanup_and_release(struct neighbour *neigh)
102{
103 if (neigh->parms->neigh_cleanup)
104 neigh->parms->neigh_cleanup(neigh);
105
Thomas Grafd961db32007-08-08 23:12:56 -0700106 __neigh_notify(neigh, RTM_DELNEIGH, 0);
Thomas Graf4f494552007-08-08 23:12:36 -0700107 neigh_release(neigh);
108}
109
/*
 * Pick a random reachable time in the interval (1/2)*base...(3/2)*base.
 * This corresponds to the default IPv6 settings and is deliberately not
 * overridable, because it is a really reasonable choice.
 *
 * A @base of zero yields zero (and avoids a modulo by zero).
 */
unsigned long neigh_rand_reach_time(unsigned long base)
{
	if (!base)
		return 0;

	return (net_random() % base) + (base >> 1);
}
EXPORT_SYMBOL(neigh_rand_reach_time);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700121
122
123static int neigh_forced_gc(struct neigh_table *tbl)
124{
125 int shrunk = 0;
126 int i;
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000127 struct neigh_hash_table *nht;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700128
129 NEIGH_CACHE_STAT_INC(tbl, forced_gc_runs);
130
131 write_lock_bh(&tbl->lock);
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000132 nht = rcu_dereference_protected(tbl->nht,
133 lockdep_is_held(&tbl->lock));
David S. Millercd089332011-07-11 01:28:12 -0700134 for (i = 0; i < (1 << nht->hash_shift); i++) {
Eric Dumazet767e97e2010-10-06 17:49:21 -0700135 struct neighbour *n;
136 struct neighbour __rcu **np;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700137
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000138 np = &nht->hash_buckets[i];
Eric Dumazet767e97e2010-10-06 17:49:21 -0700139 while ((n = rcu_dereference_protected(*np,
140 lockdep_is_held(&tbl->lock))) != NULL) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700141 /* Neighbour record may be discarded if:
142 * - nobody refers to it.
143 * - it is not permanent
144 */
145 write_lock(&n->lock);
146 if (atomic_read(&n->refcnt) == 1 &&
147 !(n->nud_state & NUD_PERMANENT)) {
Eric Dumazet767e97e2010-10-06 17:49:21 -0700148 rcu_assign_pointer(*np,
149 rcu_dereference_protected(n->next,
150 lockdep_is_held(&tbl->lock)));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700151 n->dead = 1;
152 shrunk = 1;
153 write_unlock(&n->lock);
Thomas Graf4f494552007-08-08 23:12:36 -0700154 neigh_cleanup_and_release(n);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700155 continue;
156 }
157 write_unlock(&n->lock);
158 np = &n->next;
159 }
160 }
161
162 tbl->last_flush = jiffies;
163
164 write_unlock_bh(&tbl->lock);
165
166 return shrunk;
167}
168
Pavel Emelyanova43d8992007-12-20 15:49:05 -0800169static void neigh_add_timer(struct neighbour *n, unsigned long when)
170{
171 neigh_hold(n);
172 if (unlikely(mod_timer(&n->timer, when))) {
173 printk("NEIGH: BUG, double timer add, state is %x\n",
174 n->nud_state);
175 dump_stack();
176 }
177}
178
Linus Torvalds1da177e2005-04-16 15:20:36 -0700179static int neigh_del_timer(struct neighbour *n)
180{
181 if ((n->nud_state & NUD_IN_TIMER) &&
182 del_timer(&n->timer)) {
183 neigh_release(n);
184 return 1;
185 }
186 return 0;
187}
188
189static void pneigh_queue_purge(struct sk_buff_head *list)
190{
191 struct sk_buff *skb;
192
193 while ((skb = skb_dequeue(list)) != NULL) {
194 dev_put(skb->dev);
195 kfree_skb(skb);
196 }
197}
198
Herbert Xu49636bb2005-10-23 17:18:00 +1000199static void neigh_flush_dev(struct neigh_table *tbl, struct net_device *dev)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700200{
201 int i;
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000202 struct neigh_hash_table *nht;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700203
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000204 nht = rcu_dereference_protected(tbl->nht,
205 lockdep_is_held(&tbl->lock));
206
David S. Millercd089332011-07-11 01:28:12 -0700207 for (i = 0; i < (1 << nht->hash_shift); i++) {
Eric Dumazet767e97e2010-10-06 17:49:21 -0700208 struct neighbour *n;
209 struct neighbour __rcu **np = &nht->hash_buckets[i];
Linus Torvalds1da177e2005-04-16 15:20:36 -0700210
Eric Dumazet767e97e2010-10-06 17:49:21 -0700211 while ((n = rcu_dereference_protected(*np,
212 lockdep_is_held(&tbl->lock))) != NULL) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700213 if (dev && n->dev != dev) {
214 np = &n->next;
215 continue;
216 }
Eric Dumazet767e97e2010-10-06 17:49:21 -0700217 rcu_assign_pointer(*np,
218 rcu_dereference_protected(n->next,
219 lockdep_is_held(&tbl->lock)));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700220 write_lock(&n->lock);
221 neigh_del_timer(n);
222 n->dead = 1;
223
224 if (atomic_read(&n->refcnt) != 1) {
225 /* The most unpleasant situation.
226 We must destroy neighbour entry,
227 but someone still uses it.
228
229 The destroy will be delayed until
230 the last user releases us, but
231 we must kill timers etc. and move
232 it to safe state.
233 */
Eric Dumazetc9ab4d82013-06-28 02:37:42 -0700234 __skb_queue_purge(&n->arp_queue);
Eric Dumazet8b5c1712011-11-09 12:07:14 +0000235 n->arp_queue_len_bytes = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700236 n->output = neigh_blackhole;
237 if (n->nud_state & NUD_VALID)
238 n->nud_state = NUD_NOARP;
239 else
240 n->nud_state = NUD_NONE;
Joe Perchesd5d427c2013-04-15 15:17:19 +0000241 neigh_dbg(2, "neigh %p is stray\n", n);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700242 }
243 write_unlock(&n->lock);
Thomas Graf4f494552007-08-08 23:12:36 -0700244 neigh_cleanup_and_release(n);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700245 }
246 }
Herbert Xu49636bb2005-10-23 17:18:00 +1000247}
Linus Torvalds1da177e2005-04-16 15:20:36 -0700248
Herbert Xu49636bb2005-10-23 17:18:00 +1000249void neigh_changeaddr(struct neigh_table *tbl, struct net_device *dev)
250{
251 write_lock_bh(&tbl->lock);
252 neigh_flush_dev(tbl, dev);
253 write_unlock_bh(&tbl->lock);
254}
YOSHIFUJI Hideaki0a204502008-03-24 18:39:10 +0900255EXPORT_SYMBOL(neigh_changeaddr);
Herbert Xu49636bb2005-10-23 17:18:00 +1000256
257int neigh_ifdown(struct neigh_table *tbl, struct net_device *dev)
258{
259 write_lock_bh(&tbl->lock);
260 neigh_flush_dev(tbl, dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700261 pneigh_ifdown(tbl, dev);
262 write_unlock_bh(&tbl->lock);
263
264 del_timer_sync(&tbl->proxy_timer);
265 pneigh_queue_purge(&tbl->proxy_queue);
266 return 0;
267}
YOSHIFUJI Hideaki0a204502008-03-24 18:39:10 +0900268EXPORT_SYMBOL(neigh_ifdown);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700269
David Miller596b9b62011-07-25 00:01:25 +0000270static struct neighbour *neigh_alloc(struct neigh_table *tbl, struct net_device *dev)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700271{
272 struct neighbour *n = NULL;
273 unsigned long now = jiffies;
274 int entries;
275
276 entries = atomic_inc_return(&tbl->entries) - 1;
277 if (entries >= tbl->gc_thresh3 ||
278 (entries >= tbl->gc_thresh2 &&
279 time_after(now, tbl->last_flush + 5 * HZ))) {
280 if (!neigh_forced_gc(tbl) &&
281 entries >= tbl->gc_thresh3)
282 goto out_entries;
283 }
284
YOSHIFUJI Hideaki / 吉藤英明08433ef2013-01-24 00:44:23 +0000285 n = kzalloc(tbl->entry_size + dev->neigh_priv_len, GFP_ATOMIC);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700286 if (!n)
287 goto out_entries;
288
Eric Dumazetc9ab4d82013-06-28 02:37:42 -0700289 __skb_queue_head_init(&n->arp_queue);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700290 rwlock_init(&n->lock);
Eric Dumazet0ed8ddf2010-10-07 10:44:07 +0000291 seqlock_init(&n->ha_lock);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700292 n->updated = n->used = now;
293 n->nud_state = NUD_NONE;
294 n->output = neigh_blackhole;
David S. Millerf6b72b62011-07-14 07:53:20 -0700295 seqlock_init(&n->hh.hh_lock);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700296 n->parms = neigh_parms_clone(&tbl->parms);
Pavel Emelyanovb24b8a22008-01-23 21:20:07 -0800297 setup_timer(&n->timer, neigh_timer_handler, (unsigned long)n);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700298
299 NEIGH_CACHE_STAT_INC(tbl, allocs);
300 n->tbl = tbl;
301 atomic_set(&n->refcnt, 1);
302 n->dead = 1;
303out:
304 return n;
305
306out_entries:
307 atomic_dec(&tbl->entries);
308 goto out;
309}
310
David S. Miller2c2aba62011-12-28 15:06:58 -0500311static void neigh_get_hash_rnd(u32 *x)
312{
313 get_random_bytes(x, sizeof(*x));
314 *x |= 1;
315}
316
David S. Millercd089332011-07-11 01:28:12 -0700317static struct neigh_hash_table *neigh_hash_alloc(unsigned int shift)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700318{
David S. Millercd089332011-07-11 01:28:12 -0700319 size_t size = (1 << shift) * sizeof(struct neighbour *);
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000320 struct neigh_hash_table *ret;
Eric Dumazet6193d2b2011-01-19 22:02:47 +0000321 struct neighbour __rcu **buckets;
David S. Miller2c2aba62011-12-28 15:06:58 -0500322 int i;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700323
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000324 ret = kmalloc(sizeof(*ret), GFP_ATOMIC);
325 if (!ret)
326 return NULL;
327 if (size <= PAGE_SIZE)
328 buckets = kzalloc(size, GFP_ATOMIC);
329 else
Eric Dumazet6193d2b2011-01-19 22:02:47 +0000330 buckets = (struct neighbour __rcu **)
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000331 __get_free_pages(GFP_ATOMIC | __GFP_ZERO,
332 get_order(size));
333 if (!buckets) {
334 kfree(ret);
335 return NULL;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700336 }
Eric Dumazet6193d2b2011-01-19 22:02:47 +0000337 ret->hash_buckets = buckets;
David S. Millercd089332011-07-11 01:28:12 -0700338 ret->hash_shift = shift;
David S. Miller2c2aba62011-12-28 15:06:58 -0500339 for (i = 0; i < NEIGH_NUM_HASH_RND; i++)
340 neigh_get_hash_rnd(&ret->hash_rnd[i]);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700341 return ret;
342}
343
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000344static void neigh_hash_free_rcu(struct rcu_head *head)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700345{
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000346 struct neigh_hash_table *nht = container_of(head,
347 struct neigh_hash_table,
348 rcu);
David S. Millercd089332011-07-11 01:28:12 -0700349 size_t size = (1 << nht->hash_shift) * sizeof(struct neighbour *);
Eric Dumazet6193d2b2011-01-19 22:02:47 +0000350 struct neighbour __rcu **buckets = nht->hash_buckets;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700351
352 if (size <= PAGE_SIZE)
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000353 kfree(buckets);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700354 else
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000355 free_pages((unsigned long)buckets, get_order(size));
356 kfree(nht);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700357}
358
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000359static struct neigh_hash_table *neigh_hash_grow(struct neigh_table *tbl,
David S. Millercd089332011-07-11 01:28:12 -0700360 unsigned long new_shift)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700361{
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000362 unsigned int i, hash;
363 struct neigh_hash_table *new_nht, *old_nht;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700364
365 NEIGH_CACHE_STAT_INC(tbl, hash_grows);
366
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000367 old_nht = rcu_dereference_protected(tbl->nht,
368 lockdep_is_held(&tbl->lock));
David S. Millercd089332011-07-11 01:28:12 -0700369 new_nht = neigh_hash_alloc(new_shift);
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000370 if (!new_nht)
371 return old_nht;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700372
David S. Millercd089332011-07-11 01:28:12 -0700373 for (i = 0; i < (1 << old_nht->hash_shift); i++) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700374 struct neighbour *n, *next;
375
Eric Dumazet767e97e2010-10-06 17:49:21 -0700376 for (n = rcu_dereference_protected(old_nht->hash_buckets[i],
377 lockdep_is_held(&tbl->lock));
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000378 n != NULL;
379 n = next) {
380 hash = tbl->hash(n->primary_key, n->dev,
381 new_nht->hash_rnd);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700382
David S. Millercd089332011-07-11 01:28:12 -0700383 hash >>= (32 - new_nht->hash_shift);
Eric Dumazet767e97e2010-10-06 17:49:21 -0700384 next = rcu_dereference_protected(n->next,
385 lockdep_is_held(&tbl->lock));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700386
Eric Dumazet767e97e2010-10-06 17:49:21 -0700387 rcu_assign_pointer(n->next,
388 rcu_dereference_protected(
389 new_nht->hash_buckets[hash],
390 lockdep_is_held(&tbl->lock)));
391 rcu_assign_pointer(new_nht->hash_buckets[hash], n);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700392 }
393 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700394
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000395 rcu_assign_pointer(tbl->nht, new_nht);
396 call_rcu(&old_nht->rcu, neigh_hash_free_rcu);
397 return new_nht;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700398}
399
400struct neighbour *neigh_lookup(struct neigh_table *tbl, const void *pkey,
401 struct net_device *dev)
402{
403 struct neighbour *n;
404 int key_len = tbl->key_len;
Pavel Emelyanovbc4bf5f2008-02-23 19:57:02 -0800405 u32 hash_val;
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000406 struct neigh_hash_table *nht;
YOSHIFUJI Hideaki4ec93ed2007-02-09 23:24:36 +0900407
Linus Torvalds1da177e2005-04-16 15:20:36 -0700408 NEIGH_CACHE_STAT_INC(tbl, lookups);
409
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000410 rcu_read_lock_bh();
411 nht = rcu_dereference_bh(tbl->nht);
David S. Millercd089332011-07-11 01:28:12 -0700412 hash_val = tbl->hash(pkey, dev, nht->hash_rnd) >> (32 - nht->hash_shift);
Eric Dumazet767e97e2010-10-06 17:49:21 -0700413
414 for (n = rcu_dereference_bh(nht->hash_buckets[hash_val]);
415 n != NULL;
416 n = rcu_dereference_bh(n->next)) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700417 if (dev == n->dev && !memcmp(n->primary_key, pkey, key_len)) {
Eric Dumazet767e97e2010-10-06 17:49:21 -0700418 if (!atomic_inc_not_zero(&n->refcnt))
419 n = NULL;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700420 NEIGH_CACHE_STAT_INC(tbl, hits);
421 break;
422 }
423 }
Eric Dumazet767e97e2010-10-06 17:49:21 -0700424
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000425 rcu_read_unlock_bh();
Linus Torvalds1da177e2005-04-16 15:20:36 -0700426 return n;
427}
YOSHIFUJI Hideaki0a204502008-03-24 18:39:10 +0900428EXPORT_SYMBOL(neigh_lookup);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700429
Eric W. Biederman426b5302008-01-24 00:13:18 -0800430struct neighbour *neigh_lookup_nodev(struct neigh_table *tbl, struct net *net,
431 const void *pkey)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700432{
433 struct neighbour *n;
434 int key_len = tbl->key_len;
Pavel Emelyanovbc4bf5f2008-02-23 19:57:02 -0800435 u32 hash_val;
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000436 struct neigh_hash_table *nht;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700437
438 NEIGH_CACHE_STAT_INC(tbl, lookups);
439
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000440 rcu_read_lock_bh();
441 nht = rcu_dereference_bh(tbl->nht);
David S. Millercd089332011-07-11 01:28:12 -0700442 hash_val = tbl->hash(pkey, NULL, nht->hash_rnd) >> (32 - nht->hash_shift);
Eric Dumazet767e97e2010-10-06 17:49:21 -0700443
444 for (n = rcu_dereference_bh(nht->hash_buckets[hash_val]);
445 n != NULL;
446 n = rcu_dereference_bh(n->next)) {
Eric W. Biederman426b5302008-01-24 00:13:18 -0800447 if (!memcmp(n->primary_key, pkey, key_len) &&
YOSHIFUJI Hideaki878628f2008-03-26 03:57:35 +0900448 net_eq(dev_net(n->dev), net)) {
Eric Dumazet767e97e2010-10-06 17:49:21 -0700449 if (!atomic_inc_not_zero(&n->refcnt))
450 n = NULL;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700451 NEIGH_CACHE_STAT_INC(tbl, hits);
452 break;
453 }
454 }
Eric Dumazet767e97e2010-10-06 17:49:21 -0700455
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000456 rcu_read_unlock_bh();
Linus Torvalds1da177e2005-04-16 15:20:36 -0700457 return n;
458}
YOSHIFUJI Hideaki0a204502008-03-24 18:39:10 +0900459EXPORT_SYMBOL(neigh_lookup_nodev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700460
David S. Millera263b302012-07-02 02:02:15 -0700461struct neighbour *__neigh_create(struct neigh_table *tbl, const void *pkey,
462 struct net_device *dev, bool want_ref)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700463{
464 u32 hash_val;
465 int key_len = tbl->key_len;
466 int error;
David Miller596b9b62011-07-25 00:01:25 +0000467 struct neighbour *n1, *rc, *n = neigh_alloc(tbl, dev);
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000468 struct neigh_hash_table *nht;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700469
470 if (!n) {
471 rc = ERR_PTR(-ENOBUFS);
472 goto out;
473 }
474
475 memcpy(n->primary_key, pkey, key_len);
476 n->dev = dev;
477 dev_hold(dev);
478
479 /* Protocol specific setup. */
480 if (tbl->constructor && (error = tbl->constructor(n)) < 0) {
481 rc = ERR_PTR(error);
482 goto out_neigh_release;
483 }
484
David Millerda6a8fa2011-07-25 00:01:38 +0000485 if (dev->netdev_ops->ndo_neigh_construct) {
486 error = dev->netdev_ops->ndo_neigh_construct(n);
487 if (error < 0) {
488 rc = ERR_PTR(error);
489 goto out_neigh_release;
490 }
491 }
492
David S. Miller447f2192011-12-19 15:04:41 -0500493 /* Device specific setup. */
494 if (n->parms->neigh_setup &&
495 (error = n->parms->neigh_setup(n)) < 0) {
496 rc = ERR_PTR(error);
497 goto out_neigh_release;
498 }
499
Linus Torvalds1da177e2005-04-16 15:20:36 -0700500 n->confirmed = jiffies - (n->parms->base_reachable_time << 1);
501
502 write_lock_bh(&tbl->lock);
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000503 nht = rcu_dereference_protected(tbl->nht,
504 lockdep_is_held(&tbl->lock));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700505
David S. Millercd089332011-07-11 01:28:12 -0700506 if (atomic_read(&tbl->entries) > (1 << nht->hash_shift))
507 nht = neigh_hash_grow(tbl, nht->hash_shift + 1);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700508
David S. Millercd089332011-07-11 01:28:12 -0700509 hash_val = tbl->hash(pkey, dev, nht->hash_rnd) >> (32 - nht->hash_shift);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700510
511 if (n->parms->dead) {
512 rc = ERR_PTR(-EINVAL);
513 goto out_tbl_unlock;
514 }
515
Eric Dumazet767e97e2010-10-06 17:49:21 -0700516 for (n1 = rcu_dereference_protected(nht->hash_buckets[hash_val],
517 lockdep_is_held(&tbl->lock));
518 n1 != NULL;
519 n1 = rcu_dereference_protected(n1->next,
520 lockdep_is_held(&tbl->lock))) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700521 if (dev == n1->dev && !memcmp(n1->primary_key, pkey, key_len)) {
David S. Millera263b302012-07-02 02:02:15 -0700522 if (want_ref)
523 neigh_hold(n1);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700524 rc = n1;
525 goto out_tbl_unlock;
526 }
527 }
528
Linus Torvalds1da177e2005-04-16 15:20:36 -0700529 n->dead = 0;
David S. Millera263b302012-07-02 02:02:15 -0700530 if (want_ref)
531 neigh_hold(n);
Eric Dumazet767e97e2010-10-06 17:49:21 -0700532 rcu_assign_pointer(n->next,
533 rcu_dereference_protected(nht->hash_buckets[hash_val],
534 lockdep_is_held(&tbl->lock)));
535 rcu_assign_pointer(nht->hash_buckets[hash_val], n);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700536 write_unlock_bh(&tbl->lock);
Joe Perchesd5d427c2013-04-15 15:17:19 +0000537 neigh_dbg(2, "neigh %p is created\n", n);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700538 rc = n;
539out:
540 return rc;
541out_tbl_unlock:
542 write_unlock_bh(&tbl->lock);
543out_neigh_release:
544 neigh_release(n);
545 goto out;
546}
David S. Millera263b302012-07-02 02:02:15 -0700547EXPORT_SYMBOL(__neigh_create);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700548
YOSHIFUJI Hideakibe01d652008-03-28 12:46:53 +0900549static u32 pneigh_hash(const void *pkey, int key_len)
Pavel Emelyanovfa86d322008-03-24 14:48:59 -0700550{
Pavel Emelyanovfa86d322008-03-24 14:48:59 -0700551 u32 hash_val = *(u32 *)(pkey + key_len - 4);
Pavel Emelyanovfa86d322008-03-24 14:48:59 -0700552 hash_val ^= (hash_val >> 16);
553 hash_val ^= hash_val >> 8;
554 hash_val ^= hash_val >> 4;
555 hash_val &= PNEIGH_HASHMASK;
YOSHIFUJI Hideakibe01d652008-03-28 12:46:53 +0900556 return hash_val;
557}
Pavel Emelyanovfa86d322008-03-24 14:48:59 -0700558
YOSHIFUJI Hideakibe01d652008-03-28 12:46:53 +0900559static struct pneigh_entry *__pneigh_lookup_1(struct pneigh_entry *n,
560 struct net *net,
561 const void *pkey,
562 int key_len,
563 struct net_device *dev)
564{
565 while (n) {
Pavel Emelyanovfa86d322008-03-24 14:48:59 -0700566 if (!memcmp(n->key, pkey, key_len) &&
YOSHIFUJI Hideakibe01d652008-03-28 12:46:53 +0900567 net_eq(pneigh_net(n), net) &&
Pavel Emelyanovfa86d322008-03-24 14:48:59 -0700568 (n->dev == dev || !n->dev))
YOSHIFUJI Hideakibe01d652008-03-28 12:46:53 +0900569 return n;
570 n = n->next;
Pavel Emelyanovfa86d322008-03-24 14:48:59 -0700571 }
YOSHIFUJI Hideakibe01d652008-03-28 12:46:53 +0900572 return NULL;
573}
Pavel Emelyanovfa86d322008-03-24 14:48:59 -0700574
YOSHIFUJI Hideakibe01d652008-03-28 12:46:53 +0900575struct pneigh_entry *__pneigh_lookup(struct neigh_table *tbl,
576 struct net *net, const void *pkey, struct net_device *dev)
577{
578 int key_len = tbl->key_len;
579 u32 hash_val = pneigh_hash(pkey, key_len);
580
581 return __pneigh_lookup_1(tbl->phash_buckets[hash_val],
582 net, pkey, key_len, dev);
Pavel Emelyanovfa86d322008-03-24 14:48:59 -0700583}
YOSHIFUJI Hideaki0a204502008-03-24 18:39:10 +0900584EXPORT_SYMBOL_GPL(__pneigh_lookup);
Pavel Emelyanovfa86d322008-03-24 14:48:59 -0700585
Eric W. Biederman426b5302008-01-24 00:13:18 -0800586struct pneigh_entry * pneigh_lookup(struct neigh_table *tbl,
587 struct net *net, const void *pkey,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700588 struct net_device *dev, int creat)
589{
590 struct pneigh_entry *n;
591 int key_len = tbl->key_len;
YOSHIFUJI Hideakibe01d652008-03-28 12:46:53 +0900592 u32 hash_val = pneigh_hash(pkey, key_len);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700593
594 read_lock_bh(&tbl->lock);
YOSHIFUJI Hideakibe01d652008-03-28 12:46:53 +0900595 n = __pneigh_lookup_1(tbl->phash_buckets[hash_val],
596 net, pkey, key_len, dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700597 read_unlock_bh(&tbl->lock);
YOSHIFUJI Hideakibe01d652008-03-28 12:46:53 +0900598
599 if (n || !creat)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700600 goto out;
601
Pavel Emelyanov4ae28942007-10-15 12:54:15 -0700602 ASSERT_RTNL();
603
Linus Torvalds1da177e2005-04-16 15:20:36 -0700604 n = kmalloc(sizeof(*n) + key_len, GFP_KERNEL);
605 if (!n)
606 goto out;
607
Eric Dumazete42ea982008-11-12 00:54:54 -0800608 write_pnet(&n->net, hold_net(net));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700609 memcpy(n->key, pkey, key_len);
610 n->dev = dev;
611 if (dev)
612 dev_hold(dev);
613
614 if (tbl->pconstructor && tbl->pconstructor(n)) {
615 if (dev)
616 dev_put(dev);
Denis V. Lunevda12f732008-02-20 00:26:16 -0800617 release_net(net);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700618 kfree(n);
619 n = NULL;
620 goto out;
621 }
622
623 write_lock_bh(&tbl->lock);
624 n->next = tbl->phash_buckets[hash_val];
625 tbl->phash_buckets[hash_val] = n;
626 write_unlock_bh(&tbl->lock);
627out:
628 return n;
629}
YOSHIFUJI Hideaki0a204502008-03-24 18:39:10 +0900630EXPORT_SYMBOL(pneigh_lookup);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700631
632
Eric W. Biederman426b5302008-01-24 00:13:18 -0800633int pneigh_delete(struct neigh_table *tbl, struct net *net, const void *pkey,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700634 struct net_device *dev)
635{
636 struct pneigh_entry *n, **np;
637 int key_len = tbl->key_len;
YOSHIFUJI Hideakibe01d652008-03-28 12:46:53 +0900638 u32 hash_val = pneigh_hash(pkey, key_len);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700639
640 write_lock_bh(&tbl->lock);
641 for (np = &tbl->phash_buckets[hash_val]; (n = *np) != NULL;
642 np = &n->next) {
Eric W. Biederman426b5302008-01-24 00:13:18 -0800643 if (!memcmp(n->key, pkey, key_len) && n->dev == dev &&
YOSHIFUJI Hideaki878628f2008-03-26 03:57:35 +0900644 net_eq(pneigh_net(n), net)) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700645 *np = n->next;
646 write_unlock_bh(&tbl->lock);
647 if (tbl->pdestructor)
648 tbl->pdestructor(n);
649 if (n->dev)
650 dev_put(n->dev);
YOSHIFUJI Hideaki57da52c2008-03-26 03:49:59 +0900651 release_net(pneigh_net(n));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700652 kfree(n);
653 return 0;
654 }
655 }
656 write_unlock_bh(&tbl->lock);
657 return -ENOENT;
658}
659
660static int pneigh_ifdown(struct neigh_table *tbl, struct net_device *dev)
661{
662 struct pneigh_entry *n, **np;
663 u32 h;
664
665 for (h = 0; h <= PNEIGH_HASHMASK; h++) {
666 np = &tbl->phash_buckets[h];
667 while ((n = *np) != NULL) {
668 if (!dev || n->dev == dev) {
669 *np = n->next;
670 if (tbl->pdestructor)
671 tbl->pdestructor(n);
672 if (n->dev)
673 dev_put(n->dev);
YOSHIFUJI Hideaki57da52c2008-03-26 03:49:59 +0900674 release_net(pneigh_net(n));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700675 kfree(n);
676 continue;
677 }
678 np = &n->next;
679 }
680 }
681 return -ENOENT;
682}
683
Denis V. Lunev06f05112008-01-24 00:30:58 -0800684static void neigh_parms_destroy(struct neigh_parms *parms);
685
686static inline void neigh_parms_put(struct neigh_parms *parms)
687{
688 if (atomic_dec_and_test(&parms->refcnt))
689 neigh_parms_destroy(parms);
690}
Linus Torvalds1da177e2005-04-16 15:20:36 -0700691
692/*
693 * neighbour must already be out of the table;
694 *
695 */
696void neigh_destroy(struct neighbour *neigh)
697{
David Millerda6a8fa2011-07-25 00:01:38 +0000698 struct net_device *dev = neigh->dev;
699
Linus Torvalds1da177e2005-04-16 15:20:36 -0700700 NEIGH_CACHE_STAT_INC(neigh->tbl, destroys);
701
702 if (!neigh->dead) {
Joe Perchese005d192012-05-16 19:58:40 +0000703 pr_warn("Destroying alive neighbour %p\n", neigh);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700704 dump_stack();
705 return;
706 }
707
708 if (neigh_del_timer(neigh))
Joe Perchese005d192012-05-16 19:58:40 +0000709 pr_warn("Impossible event\n");
Linus Torvalds1da177e2005-04-16 15:20:36 -0700710
Eric Dumazetc9ab4d82013-06-28 02:37:42 -0700711 write_lock_bh(&neigh->lock);
712 __skb_queue_purge(&neigh->arp_queue);
713 write_unlock_bh(&neigh->lock);
Eric Dumazet8b5c1712011-11-09 12:07:14 +0000714 neigh->arp_queue_len_bytes = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700715
David S. Miller447f2192011-12-19 15:04:41 -0500716 if (dev->netdev_ops->ndo_neigh_destroy)
717 dev->netdev_ops->ndo_neigh_destroy(neigh);
718
David Millerda6a8fa2011-07-25 00:01:38 +0000719 dev_put(dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700720 neigh_parms_put(neigh->parms);
721
Joe Perchesd5d427c2013-04-15 15:17:19 +0000722 neigh_dbg(2, "neigh %p is destroyed\n", neigh);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700723
724 atomic_dec(&neigh->tbl->entries);
David Miller5b8b0062011-07-25 00:01:22 +0000725 kfree_rcu(neigh, rcu);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700726}
YOSHIFUJI Hideaki0a204502008-03-24 18:39:10 +0900727EXPORT_SYMBOL(neigh_destroy);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700728
729/* Neighbour state is suspicious;
730 disable fast path.
731
732 Called with write_locked neigh.
733 */
734static void neigh_suspect(struct neighbour *neigh)
735{
Joe Perchesd5d427c2013-04-15 15:17:19 +0000736 neigh_dbg(2, "neigh %p is suspected\n", neigh);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700737
738 neigh->output = neigh->ops->output;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700739}
740
741/* Neighbour state is OK;
742 enable fast path.
743
744 Called with write_locked neigh.
745 */
746static void neigh_connect(struct neighbour *neigh)
747{
Joe Perchesd5d427c2013-04-15 15:17:19 +0000748 neigh_dbg(2, "neigh %p is connected\n", neigh);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700749
750 neigh->output = neigh->ops->connected_output;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700751}
752
Eric Dumazete4c4e442009-07-30 03:15:07 +0000753static void neigh_periodic_work(struct work_struct *work)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700754{
Eric Dumazete4c4e442009-07-30 03:15:07 +0000755 struct neigh_table *tbl = container_of(work, struct neigh_table, gc_work.work);
Eric Dumazet767e97e2010-10-06 17:49:21 -0700756 struct neighbour *n;
757 struct neighbour __rcu **np;
Eric Dumazete4c4e442009-07-30 03:15:07 +0000758 unsigned int i;
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000759 struct neigh_hash_table *nht;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700760
761 NEIGH_CACHE_STAT_INC(tbl, periodic_gc_runs);
762
Eric Dumazete4c4e442009-07-30 03:15:07 +0000763 write_lock_bh(&tbl->lock);
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000764 nht = rcu_dereference_protected(tbl->nht,
765 lockdep_is_held(&tbl->lock));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700766
YOSHIFUJI Hideaki / 吉藤英明27246802013-01-22 05:20:05 +0000767 if (atomic_read(&tbl->entries) < tbl->gc_thresh1)
768 goto out;
769
Linus Torvalds1da177e2005-04-16 15:20:36 -0700770 /*
771 * periodically recompute ReachableTime from random function
772 */
773
Eric Dumazete4c4e442009-07-30 03:15:07 +0000774 if (time_after(jiffies, tbl->last_rand + 300 * HZ)) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700775 struct neigh_parms *p;
Eric Dumazete4c4e442009-07-30 03:15:07 +0000776 tbl->last_rand = jiffies;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700777 for (p = &tbl->parms; p; p = p->next)
778 p->reachable_time =
779 neigh_rand_reach_time(p->base_reachable_time);
780 }
781
David S. Millercd089332011-07-11 01:28:12 -0700782 for (i = 0 ; i < (1 << nht->hash_shift); i++) {
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000783 np = &nht->hash_buckets[i];
Linus Torvalds1da177e2005-04-16 15:20:36 -0700784
Eric Dumazet767e97e2010-10-06 17:49:21 -0700785 while ((n = rcu_dereference_protected(*np,
786 lockdep_is_held(&tbl->lock))) != NULL) {
Eric Dumazete4c4e442009-07-30 03:15:07 +0000787 unsigned int state;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700788
Eric Dumazete4c4e442009-07-30 03:15:07 +0000789 write_lock(&n->lock);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700790
Eric Dumazete4c4e442009-07-30 03:15:07 +0000791 state = n->nud_state;
792 if (state & (NUD_PERMANENT | NUD_IN_TIMER)) {
793 write_unlock(&n->lock);
794 goto next_elt;
795 }
796
797 if (time_before(n->used, n->confirmed))
798 n->used = n->confirmed;
799
800 if (atomic_read(&n->refcnt) == 1 &&
801 (state == NUD_FAILED ||
802 time_after(jiffies, n->used + n->parms->gc_staletime))) {
803 *np = n->next;
804 n->dead = 1;
805 write_unlock(&n->lock);
806 neigh_cleanup_and_release(n);
807 continue;
808 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700809 write_unlock(&n->lock);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700810
811next_elt:
Eric Dumazete4c4e442009-07-30 03:15:07 +0000812 np = &n->next;
813 }
814 /*
815 * It's fine to release lock here, even if hash table
816 * grows while we are preempted.
817 */
818 write_unlock_bh(&tbl->lock);
819 cond_resched();
820 write_lock_bh(&tbl->lock);
Michel Machado84338a62012-02-21 16:04:13 -0500821 nht = rcu_dereference_protected(tbl->nht,
822 lockdep_is_held(&tbl->lock));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700823 }
YOSHIFUJI Hideaki / 吉藤英明27246802013-01-22 05:20:05 +0000824out:
YOSHIFUJI Hideaki4ec93ed2007-02-09 23:24:36 +0900825 /* Cycle through all hash buckets every base_reachable_time/2 ticks.
826 * ARP entry timeouts range from 1/2 base_reachable_time to 3/2
827 * base_reachable_time.
Linus Torvalds1da177e2005-04-16 15:20:36 -0700828 */
Eric Dumazete4c4e442009-07-30 03:15:07 +0000829 schedule_delayed_work(&tbl->gc_work,
830 tbl->parms.base_reachable_time >> 1);
831 write_unlock_bh(&tbl->lock);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700832}
833
834static __inline__ int neigh_max_probes(struct neighbour *n)
835{
836 struct neigh_parms *p = n->parms;
Eric Dumazeta02cec22010-09-22 20:43:57 +0000837 return (n->nud_state & NUD_PROBE) ?
Linus Torvalds1da177e2005-04-16 15:20:36 -0700838 p->ucast_probes :
Eric Dumazeta02cec22010-09-22 20:43:57 +0000839 p->ucast_probes + p->app_probes + p->mcast_probes;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700840}
841
Timo Teras5ef12d92009-06-11 04:16:28 -0700842static void neigh_invalidate(struct neighbour *neigh)
Eric Dumazet0a141502010-03-09 19:40:54 +0000843 __releases(neigh->lock)
844 __acquires(neigh->lock)
Timo Teras5ef12d92009-06-11 04:16:28 -0700845{
846 struct sk_buff *skb;
847
848 NEIGH_CACHE_STAT_INC(neigh->tbl, res_failed);
Joe Perchesd5d427c2013-04-15 15:17:19 +0000849 neigh_dbg(2, "neigh %p is failed\n", neigh);
Timo Teras5ef12d92009-06-11 04:16:28 -0700850 neigh->updated = jiffies;
851
852 /* It is very thin place. report_unreachable is very complicated
853 routine. Particularly, it can hit the same neighbour entry!
854
855 So that, we try to be accurate and avoid dead loop. --ANK
856 */
857 while (neigh->nud_state == NUD_FAILED &&
858 (skb = __skb_dequeue(&neigh->arp_queue)) != NULL) {
859 write_unlock(&neigh->lock);
860 neigh->ops->error_report(neigh, skb);
861 write_lock(&neigh->lock);
862 }
Eric Dumazetc9ab4d82013-06-28 02:37:42 -0700863 __skb_queue_purge(&neigh->arp_queue);
Eric Dumazet8b5c1712011-11-09 12:07:14 +0000864 neigh->arp_queue_len_bytes = 0;
Timo Teras5ef12d92009-06-11 04:16:28 -0700865}
866
Eric Dumazetcd28ca02011-08-09 08:15:58 +0000867static void neigh_probe(struct neighbour *neigh)
868 __releases(neigh->lock)
869{
870 struct sk_buff *skb = skb_peek(&neigh->arp_queue);
871 /* keep skb alive even if arp_queue overflows */
872 if (skb)
873 skb = skb_copy(skb, GFP_ATOMIC);
874 write_unlock(&neigh->lock);
875 neigh->ops->solicit(neigh, skb);
876 atomic_inc(&neigh->probes);
877 kfree_skb(skb);
878}
879
Linus Torvalds1da177e2005-04-16 15:20:36 -0700880/* Called when a timer expires for a neighbour entry. */
881
882static void neigh_timer_handler(unsigned long arg)
883{
884 unsigned long now, next;
885 struct neighbour *neigh = (struct neighbour *)arg;
Eric Dumazet95c96172012-04-15 05:58:06 +0000886 unsigned int state;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700887 int notify = 0;
888
889 write_lock(&neigh->lock);
890
891 state = neigh->nud_state;
892 now = jiffies;
893 next = now + HZ;
894
David S. Miller045f7b32011-11-01 17:45:55 -0400895 if (!(state & NUD_IN_TIMER))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700896 goto out;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700897
898 if (state & NUD_REACHABLE) {
YOSHIFUJI Hideaki4ec93ed2007-02-09 23:24:36 +0900899 if (time_before_eq(now,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700900 neigh->confirmed + neigh->parms->reachable_time)) {
Joe Perchesd5d427c2013-04-15 15:17:19 +0000901 neigh_dbg(2, "neigh %p is still alive\n", neigh);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700902 next = neigh->confirmed + neigh->parms->reachable_time;
903 } else if (time_before_eq(now,
904 neigh->used + neigh->parms->delay_probe_time)) {
Joe Perchesd5d427c2013-04-15 15:17:19 +0000905 neigh_dbg(2, "neigh %p is delayed\n", neigh);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700906 neigh->nud_state = NUD_DELAY;
YOSHIFUJI Hideaki955aaa22006-03-20 16:52:52 -0800907 neigh->updated = jiffies;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700908 neigh_suspect(neigh);
909 next = now + neigh->parms->delay_probe_time;
910 } else {
Joe Perchesd5d427c2013-04-15 15:17:19 +0000911 neigh_dbg(2, "neigh %p is suspected\n", neigh);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700912 neigh->nud_state = NUD_STALE;
YOSHIFUJI Hideaki955aaa22006-03-20 16:52:52 -0800913 neigh->updated = jiffies;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700914 neigh_suspect(neigh);
Tom Tucker8d717402006-07-30 20:43:36 -0700915 notify = 1;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700916 }
917 } else if (state & NUD_DELAY) {
YOSHIFUJI Hideaki4ec93ed2007-02-09 23:24:36 +0900918 if (time_before_eq(now,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700919 neigh->confirmed + neigh->parms->delay_probe_time)) {
Joe Perchesd5d427c2013-04-15 15:17:19 +0000920 neigh_dbg(2, "neigh %p is now reachable\n", neigh);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700921 neigh->nud_state = NUD_REACHABLE;
YOSHIFUJI Hideaki955aaa22006-03-20 16:52:52 -0800922 neigh->updated = jiffies;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700923 neigh_connect(neigh);
Tom Tucker8d717402006-07-30 20:43:36 -0700924 notify = 1;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700925 next = neigh->confirmed + neigh->parms->reachable_time;
926 } else {
Joe Perchesd5d427c2013-04-15 15:17:19 +0000927 neigh_dbg(2, "neigh %p is probed\n", neigh);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700928 neigh->nud_state = NUD_PROBE;
YOSHIFUJI Hideaki955aaa22006-03-20 16:52:52 -0800929 neigh->updated = jiffies;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700930 atomic_set(&neigh->probes, 0);
931 next = now + neigh->parms->retrans_time;
932 }
933 } else {
934 /* NUD_PROBE|NUD_INCOMPLETE */
935 next = now + neigh->parms->retrans_time;
936 }
937
938 if ((neigh->nud_state & (NUD_INCOMPLETE | NUD_PROBE)) &&
939 atomic_read(&neigh->probes) >= neigh_max_probes(neigh)) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700940 neigh->nud_state = NUD_FAILED;
941 notify = 1;
Timo Teras5ef12d92009-06-11 04:16:28 -0700942 neigh_invalidate(neigh);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700943 }
944
945 if (neigh->nud_state & NUD_IN_TIMER) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700946 if (time_before(next, jiffies + HZ/2))
947 next = jiffies + HZ/2;
Herbert Xu6fb99742005-10-23 16:37:48 +1000948 if (!mod_timer(&neigh->timer, next))
949 neigh_hold(neigh);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700950 }
951 if (neigh->nud_state & (NUD_INCOMPLETE | NUD_PROBE)) {
Eric Dumazetcd28ca02011-08-09 08:15:58 +0000952 neigh_probe(neigh);
David S. Miller9ff56602008-02-17 18:39:54 -0800953 } else {
David S. Miller69cc64d2008-02-11 21:45:44 -0800954out:
David S. Miller9ff56602008-02-17 18:39:54 -0800955 write_unlock(&neigh->lock);
956 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700957
Thomas Grafd961db32007-08-08 23:12:56 -0700958 if (notify)
959 neigh_update_notify(neigh);
960
Linus Torvalds1da177e2005-04-16 15:20:36 -0700961 neigh_release(neigh);
962}
963
964int __neigh_event_send(struct neighbour *neigh, struct sk_buff *skb)
965{
966 int rc;
Eric Dumazetcd28ca02011-08-09 08:15:58 +0000967 bool immediate_probe = false;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700968
969 write_lock_bh(&neigh->lock);
970
971 rc = 0;
972 if (neigh->nud_state & (NUD_CONNECTED | NUD_DELAY | NUD_PROBE))
973 goto out_unlock_bh;
974
Linus Torvalds1da177e2005-04-16 15:20:36 -0700975 if (!(neigh->nud_state & (NUD_STALE | NUD_INCOMPLETE))) {
976 if (neigh->parms->mcast_probes + neigh->parms->app_probes) {
Eric Dumazetcd28ca02011-08-09 08:15:58 +0000977 unsigned long next, now = jiffies;
978
Linus Torvalds1da177e2005-04-16 15:20:36 -0700979 atomic_set(&neigh->probes, neigh->parms->ucast_probes);
980 neigh->nud_state = NUD_INCOMPLETE;
Eric Dumazetcd28ca02011-08-09 08:15:58 +0000981 neigh->updated = now;
982 next = now + max(neigh->parms->retrans_time, HZ/2);
983 neigh_add_timer(neigh, next);
984 immediate_probe = true;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700985 } else {
986 neigh->nud_state = NUD_FAILED;
YOSHIFUJI Hideaki955aaa22006-03-20 16:52:52 -0800987 neigh->updated = jiffies;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700988 write_unlock_bh(&neigh->lock);
989
Wei Yongjunf3fbbe02009-02-25 00:37:32 +0000990 kfree_skb(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700991 return 1;
992 }
993 } else if (neigh->nud_state & NUD_STALE) {
Joe Perchesd5d427c2013-04-15 15:17:19 +0000994 neigh_dbg(2, "neigh %p is delayed\n", neigh);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700995 neigh->nud_state = NUD_DELAY;
YOSHIFUJI Hideaki955aaa22006-03-20 16:52:52 -0800996 neigh->updated = jiffies;
David S. Miller667347f2005-09-27 12:07:44 -0700997 neigh_add_timer(neigh,
998 jiffies + neigh->parms->delay_probe_time);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700999 }
1000
1001 if (neigh->nud_state == NUD_INCOMPLETE) {
1002 if (skb) {
Eric Dumazet8b5c1712011-11-09 12:07:14 +00001003 while (neigh->arp_queue_len_bytes + skb->truesize >
1004 neigh->parms->queue_len_bytes) {
Linus Torvalds1da177e2005-04-16 15:20:36 -07001005 struct sk_buff *buff;
Eric Dumazet8b5c1712011-11-09 12:07:14 +00001006
David S. Millerf72051b2008-09-23 01:11:18 -07001007 buff = __skb_dequeue(&neigh->arp_queue);
Eric Dumazet8b5c1712011-11-09 12:07:14 +00001008 if (!buff)
1009 break;
1010 neigh->arp_queue_len_bytes -= buff->truesize;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001011 kfree_skb(buff);
Neil Horman9a6d2762008-07-16 20:50:49 -07001012 NEIGH_CACHE_STAT_INC(neigh->tbl, unres_discards);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001013 }
Eric Dumazeta4731132010-05-27 16:09:39 -07001014 skb_dst_force(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001015 __skb_queue_tail(&neigh->arp_queue, skb);
Eric Dumazet8b5c1712011-11-09 12:07:14 +00001016 neigh->arp_queue_len_bytes += skb->truesize;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001017 }
1018 rc = 1;
1019 }
1020out_unlock_bh:
Eric Dumazetcd28ca02011-08-09 08:15:58 +00001021 if (immediate_probe)
1022 neigh_probe(neigh);
1023 else
1024 write_unlock(&neigh->lock);
1025 local_bh_enable();
Linus Torvalds1da177e2005-04-16 15:20:36 -07001026 return rc;
1027}
YOSHIFUJI Hideaki0a204502008-03-24 18:39:10 +09001028EXPORT_SYMBOL(__neigh_event_send);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001029
David S. Millerf6b72b62011-07-14 07:53:20 -07001030static void neigh_update_hhs(struct neighbour *neigh)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001031{
1032 struct hh_cache *hh;
Stephen Hemminger3b04ddd2007-10-09 01:40:57 -07001033 void (*update)(struct hh_cache*, const struct net_device*, const unsigned char *)
Doug Kehn91a72a72010-07-14 18:02:16 -07001034 = NULL;
1035
1036 if (neigh->dev->header_ops)
1037 update = neigh->dev->header_ops->cache_update;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001038
1039 if (update) {
David S. Millerf6b72b62011-07-14 07:53:20 -07001040 hh = &neigh->hh;
1041 if (hh->hh_len) {
Stephen Hemminger3644f0c2006-12-07 15:08:17 -08001042 write_seqlock_bh(&hh->hh_lock);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001043 update(hh, neigh->dev, neigh->ha);
Stephen Hemminger3644f0c2006-12-07 15:08:17 -08001044 write_sequnlock_bh(&hh->hh_lock);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001045 }
1046 }
1047}
1048
1049
1050
1051/* Generic update routine.
1052 -- lladdr is new lladdr or NULL, if it is not supplied.
1053 -- new is new state.
1054 -- flags
1055 NEIGH_UPDATE_F_OVERRIDE allows to override existing lladdr,
1056 if it is different.
1057 NEIGH_UPDATE_F_WEAK_OVERRIDE will suspect existing "connected"
YOSHIFUJI Hideaki4ec93ed2007-02-09 23:24:36 +09001058 lladdr instead of overriding it
Linus Torvalds1da177e2005-04-16 15:20:36 -07001059 if it is different.
1060 It also allows to retain current state
1061 if lladdr is unchanged.
1062 NEIGH_UPDATE_F_ADMIN means that the change is administrative.
1063
YOSHIFUJI Hideaki4ec93ed2007-02-09 23:24:36 +09001064 NEIGH_UPDATE_F_OVERRIDE_ISROUTER allows to override existing
Linus Torvalds1da177e2005-04-16 15:20:36 -07001065 NTF_ROUTER flag.
1066 NEIGH_UPDATE_F_ISROUTER indicates if the neighbour is known as
1067 a router.
1068
1069 Caller MUST hold reference count on the entry.
1070 */
1071
1072int neigh_update(struct neighbour *neigh, const u8 *lladdr, u8 new,
1073 u32 flags)
1074{
1075 u8 old;
1076 int err;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001077 int notify = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001078 struct net_device *dev;
1079 int update_isrouter = 0;
1080
1081 write_lock_bh(&neigh->lock);
1082
1083 dev = neigh->dev;
1084 old = neigh->nud_state;
1085 err = -EPERM;
1086
YOSHIFUJI Hideaki4ec93ed2007-02-09 23:24:36 +09001087 if (!(flags & NEIGH_UPDATE_F_ADMIN) &&
Linus Torvalds1da177e2005-04-16 15:20:36 -07001088 (old & (NUD_NOARP | NUD_PERMANENT)))
1089 goto out;
1090
1091 if (!(new & NUD_VALID)) {
1092 neigh_del_timer(neigh);
1093 if (old & NUD_CONNECTED)
1094 neigh_suspect(neigh);
1095 neigh->nud_state = new;
1096 err = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001097 notify = old & NUD_VALID;
Timo Teras5ef12d92009-06-11 04:16:28 -07001098 if ((old & (NUD_INCOMPLETE | NUD_PROBE)) &&
1099 (new & NUD_FAILED)) {
1100 neigh_invalidate(neigh);
1101 notify = 1;
1102 }
Linus Torvalds1da177e2005-04-16 15:20:36 -07001103 goto out;
1104 }
1105
1106 /* Compare new lladdr with cached one */
1107 if (!dev->addr_len) {
1108 /* First case: device needs no address. */
1109 lladdr = neigh->ha;
1110 } else if (lladdr) {
1111 /* The second case: if something is already cached
1112 and a new address is proposed:
1113 - compare new & old
1114 - if they are different, check override flag
1115 */
YOSHIFUJI Hideaki4ec93ed2007-02-09 23:24:36 +09001116 if ((old & NUD_VALID) &&
Linus Torvalds1da177e2005-04-16 15:20:36 -07001117 !memcmp(lladdr, neigh->ha, dev->addr_len))
1118 lladdr = neigh->ha;
1119 } else {
1120 /* No address is supplied; if we know something,
1121 use it, otherwise discard the request.
1122 */
1123 err = -EINVAL;
1124 if (!(old & NUD_VALID))
1125 goto out;
1126 lladdr = neigh->ha;
1127 }
1128
1129 if (new & NUD_CONNECTED)
1130 neigh->confirmed = jiffies;
1131 neigh->updated = jiffies;
1132
1133 /* If entry was valid and address is not changed,
1134 do not change entry state, if new one is STALE.
1135 */
1136 err = 0;
1137 update_isrouter = flags & NEIGH_UPDATE_F_OVERRIDE_ISROUTER;
1138 if (old & NUD_VALID) {
1139 if (lladdr != neigh->ha && !(flags & NEIGH_UPDATE_F_OVERRIDE)) {
1140 update_isrouter = 0;
1141 if ((flags & NEIGH_UPDATE_F_WEAK_OVERRIDE) &&
1142 (old & NUD_CONNECTED)) {
1143 lladdr = neigh->ha;
1144 new = NUD_STALE;
1145 } else
1146 goto out;
1147 } else {
1148 if (lladdr == neigh->ha && new == NUD_STALE &&
1149 ((flags & NEIGH_UPDATE_F_WEAK_OVERRIDE) ||
1150 (old & NUD_CONNECTED))
1151 )
1152 new = old;
1153 }
1154 }
1155
1156 if (new != old) {
1157 neigh_del_timer(neigh);
Pavel Emelyanova43d8992007-12-20 15:49:05 -08001158 if (new & NUD_IN_TIMER)
YOSHIFUJI Hideaki4ec93ed2007-02-09 23:24:36 +09001159 neigh_add_timer(neigh, (jiffies +
1160 ((new & NUD_REACHABLE) ?
David S. Miller667347f2005-09-27 12:07:44 -07001161 neigh->parms->reachable_time :
1162 0)));
Linus Torvalds1da177e2005-04-16 15:20:36 -07001163 neigh->nud_state = new;
1164 }
1165
1166 if (lladdr != neigh->ha) {
Eric Dumazet0ed8ddf2010-10-07 10:44:07 +00001167 write_seqlock(&neigh->ha_lock);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001168 memcpy(&neigh->ha, lladdr, dev->addr_len);
Eric Dumazet0ed8ddf2010-10-07 10:44:07 +00001169 write_sequnlock(&neigh->ha_lock);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001170 neigh_update_hhs(neigh);
1171 if (!(new & NUD_CONNECTED))
1172 neigh->confirmed = jiffies -
1173 (neigh->parms->base_reachable_time << 1);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001174 notify = 1;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001175 }
1176 if (new == old)
1177 goto out;
1178 if (new & NUD_CONNECTED)
1179 neigh_connect(neigh);
1180 else
1181 neigh_suspect(neigh);
1182 if (!(old & NUD_VALID)) {
1183 struct sk_buff *skb;
1184
1185 /* Again: avoid dead loop if something went wrong */
1186
1187 while (neigh->nud_state & NUD_VALID &&
1188 (skb = __skb_dequeue(&neigh->arp_queue)) != NULL) {
David S. Miller69cce1d2011-07-17 23:09:49 -07001189 struct dst_entry *dst = skb_dst(skb);
1190 struct neighbour *n2, *n1 = neigh;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001191 write_unlock_bh(&neigh->lock);
roy.qing.li@gmail.come049f282011-10-17 22:32:42 +00001192
1193 rcu_read_lock();
David S. Miller13a43d92012-07-02 22:15:37 -07001194
1195 /* Why not just use 'neigh' as-is? The problem is that
1196 * things such as shaper, eql, and sch_teql can end up
1197 * using alternative, different, neigh objects to output
1198 * the packet in the output path. So what we need to do
1199 * here is re-lookup the top-level neigh in the path so
1200 * we can reinject the packet there.
1201 */
1202 n2 = NULL;
1203 if (dst) {
1204 n2 = dst_neigh_lookup_skb(dst, skb);
1205 if (n2)
1206 n1 = n2;
1207 }
David S. Miller8f40b162011-07-17 13:34:11 -07001208 n1->output(n1, skb);
David S. Miller13a43d92012-07-02 22:15:37 -07001209 if (n2)
1210 neigh_release(n2);
roy.qing.li@gmail.come049f282011-10-17 22:32:42 +00001211 rcu_read_unlock();
1212
Linus Torvalds1da177e2005-04-16 15:20:36 -07001213 write_lock_bh(&neigh->lock);
1214 }
Eric Dumazetc9ab4d82013-06-28 02:37:42 -07001215 __skb_queue_purge(&neigh->arp_queue);
Eric Dumazet8b5c1712011-11-09 12:07:14 +00001216 neigh->arp_queue_len_bytes = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001217 }
1218out:
1219 if (update_isrouter) {
1220 neigh->flags = (flags & NEIGH_UPDATE_F_ISROUTER) ?
1221 (neigh->flags | NTF_ROUTER) :
1222 (neigh->flags & ~NTF_ROUTER);
1223 }
1224 write_unlock_bh(&neigh->lock);
Tom Tucker8d717402006-07-30 20:43:36 -07001225
1226 if (notify)
Thomas Grafd961db32007-08-08 23:12:56 -07001227 neigh_update_notify(neigh);
1228
Linus Torvalds1da177e2005-04-16 15:20:36 -07001229 return err;
1230}
YOSHIFUJI Hideaki0a204502008-03-24 18:39:10 +09001231EXPORT_SYMBOL(neigh_update);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001232
1233struct neighbour *neigh_event_ns(struct neigh_table *tbl,
1234 u8 *lladdr, void *saddr,
1235 struct net_device *dev)
1236{
1237 struct neighbour *neigh = __neigh_lookup(tbl, saddr, dev,
1238 lladdr || !dev->addr_len);
1239 if (neigh)
YOSHIFUJI Hideaki4ec93ed2007-02-09 23:24:36 +09001240 neigh_update(neigh, lladdr, NUD_STALE,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001241 NEIGH_UPDATE_F_OVERRIDE);
1242 return neigh;
1243}
YOSHIFUJI Hideaki0a204502008-03-24 18:39:10 +09001244EXPORT_SYMBOL(neigh_event_ns);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001245
Eric Dumazet34d101d2010-10-11 09:16:57 -07001246/* called with read_lock_bh(&n->lock); */
David S. Millerf6b72b62011-07-14 07:53:20 -07001247static void neigh_hh_init(struct neighbour *n, struct dst_entry *dst)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001248{
Linus Torvalds1da177e2005-04-16 15:20:36 -07001249 struct net_device *dev = dst->dev;
David S. Millerf6b72b62011-07-14 07:53:20 -07001250 __be16 prot = dst->ops->protocol;
1251 struct hh_cache *hh = &n->hh;
Eric Dumazet0ed8ddf2010-10-07 10:44:07 +00001252
1253 write_lock_bh(&n->lock);
Eric Dumazet34d101d2010-10-11 09:16:57 -07001254
David S. Millerf6b72b62011-07-14 07:53:20 -07001255 /* Only one thread can come in here and initialize the
1256 * hh_cache entry.
1257 */
David S. Millerb23b5452011-07-16 17:45:02 -07001258 if (!hh->hh_len)
1259 dev->header_ops->cache(n, hh, prot);
David S. Millerf6b72b62011-07-14 07:53:20 -07001260
Eric Dumazet0ed8ddf2010-10-07 10:44:07 +00001261 write_unlock_bh(&n->lock);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001262}
1263
1264/* This function can be used in contexts, where only old dev_queue_xmit
Eric Dumazet767e97e2010-10-06 17:49:21 -07001265 * worked, f.e. if you want to override normal output path (eql, shaper),
1266 * but resolution is not made yet.
Linus Torvalds1da177e2005-04-16 15:20:36 -07001267 */
1268
David S. Miller8f40b162011-07-17 13:34:11 -07001269int neigh_compat_output(struct neighbour *neigh, struct sk_buff *skb)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001270{
1271 struct net_device *dev = skb->dev;
1272
Arnaldo Carvalho de Melobbe735e2007-03-10 22:16:10 -03001273 __skb_pull(skb, skb_network_offset(skb));
Linus Torvalds1da177e2005-04-16 15:20:36 -07001274
Stephen Hemminger0c4e8582007-10-09 01:36:32 -07001275 if (dev_hard_header(skb, dev, ntohs(skb->protocol), NULL, NULL,
1276 skb->len) < 0 &&
Stephen Hemminger3b04ddd2007-10-09 01:40:57 -07001277 dev->header_ops->rebuild(skb))
Linus Torvalds1da177e2005-04-16 15:20:36 -07001278 return 0;
1279
1280 return dev_queue_xmit(skb);
1281}
YOSHIFUJI Hideaki0a204502008-03-24 18:39:10 +09001282EXPORT_SYMBOL(neigh_compat_output);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001283
1284/* Slow and careful. */
1285
David S. Miller8f40b162011-07-17 13:34:11 -07001286int neigh_resolve_output(struct neighbour *neigh, struct sk_buff *skb)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001287{
Eric Dumazetadf30902009-06-02 05:19:30 +00001288 struct dst_entry *dst = skb_dst(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001289 int rc = 0;
1290
David S. Miller8f40b162011-07-17 13:34:11 -07001291 if (!dst)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001292 goto discard;
1293
Linus Torvalds1da177e2005-04-16 15:20:36 -07001294 if (!neigh_event_send(neigh, skb)) {
1295 int err;
1296 struct net_device *dev = neigh->dev;
Eric Dumazet0ed8ddf2010-10-07 10:44:07 +00001297 unsigned int seq;
Eric Dumazet34d101d2010-10-11 09:16:57 -07001298
David S. Millerf6b72b62011-07-14 07:53:20 -07001299 if (dev->header_ops->cache && !neigh->hh.hh_len)
1300 neigh_hh_init(neigh, dst);
Eric Dumazet34d101d2010-10-11 09:16:57 -07001301
Eric Dumazet0ed8ddf2010-10-07 10:44:07 +00001302 do {
ramesh.nagappa@gmail.come1f16502012-10-05 19:10:15 +00001303 __skb_pull(skb, skb_network_offset(skb));
Eric Dumazet0ed8ddf2010-10-07 10:44:07 +00001304 seq = read_seqbegin(&neigh->ha_lock);
1305 err = dev_hard_header(skb, dev, ntohs(skb->protocol),
1306 neigh->ha, NULL, skb->len);
1307 } while (read_seqretry(&neigh->ha_lock, seq));
Eric Dumazet34d101d2010-10-11 09:16:57 -07001308
Linus Torvalds1da177e2005-04-16 15:20:36 -07001309 if (err >= 0)
David S. Miller542d4d62011-07-16 18:06:24 -07001310 rc = dev_queue_xmit(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001311 else
1312 goto out_kfree_skb;
1313 }
1314out:
1315 return rc;
1316discard:
Joe Perchesd5d427c2013-04-15 15:17:19 +00001317 neigh_dbg(1, "%s: dst=%p neigh=%p\n", __func__, dst, neigh);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001318out_kfree_skb:
1319 rc = -EINVAL;
1320 kfree_skb(skb);
1321 goto out;
1322}
YOSHIFUJI Hideaki0a204502008-03-24 18:39:10 +09001323EXPORT_SYMBOL(neigh_resolve_output);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001324
1325/* As fast as possible without hh cache */
1326
David S. Miller8f40b162011-07-17 13:34:11 -07001327int neigh_connected_output(struct neighbour *neigh, struct sk_buff *skb)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001328{
Linus Torvalds1da177e2005-04-16 15:20:36 -07001329 struct net_device *dev = neigh->dev;
Eric Dumazet0ed8ddf2010-10-07 10:44:07 +00001330 unsigned int seq;
David S. Miller8f40b162011-07-17 13:34:11 -07001331 int err;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001332
Eric Dumazet0ed8ddf2010-10-07 10:44:07 +00001333 do {
ramesh.nagappa@gmail.come1f16502012-10-05 19:10:15 +00001334 __skb_pull(skb, skb_network_offset(skb));
Eric Dumazet0ed8ddf2010-10-07 10:44:07 +00001335 seq = read_seqbegin(&neigh->ha_lock);
1336 err = dev_hard_header(skb, dev, ntohs(skb->protocol),
1337 neigh->ha, NULL, skb->len);
1338 } while (read_seqretry(&neigh->ha_lock, seq));
1339
Linus Torvalds1da177e2005-04-16 15:20:36 -07001340 if (err >= 0)
David S. Miller542d4d62011-07-16 18:06:24 -07001341 err = dev_queue_xmit(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001342 else {
1343 err = -EINVAL;
1344 kfree_skb(skb);
1345 }
1346 return err;
1347}
YOSHIFUJI Hideaki0a204502008-03-24 18:39:10 +09001348EXPORT_SYMBOL(neigh_connected_output);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001349
/* Output handler that ignores @neigh and passes @skb straight to
 * dev_queue_xmit(), returning its result.
 */
int neigh_direct_output(struct neighbour *neigh, struct sk_buff *skb)
{
	return dev_queue_xmit(skb);
}
EXPORT_SYMBOL(neigh_direct_output);
1355
Linus Torvalds1da177e2005-04-16 15:20:36 -07001356static void neigh_proxy_process(unsigned long arg)
1357{
1358 struct neigh_table *tbl = (struct neigh_table *)arg;
1359 long sched_next = 0;
1360 unsigned long now = jiffies;
David S. Millerf72051b2008-09-23 01:11:18 -07001361 struct sk_buff *skb, *n;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001362
1363 spin_lock(&tbl->proxy_queue.lock);
1364
David S. Millerf72051b2008-09-23 01:11:18 -07001365 skb_queue_walk_safe(&tbl->proxy_queue, skb, n) {
1366 long tdif = NEIGH_CB(skb)->sched_next - now;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001367
Linus Torvalds1da177e2005-04-16 15:20:36 -07001368 if (tdif <= 0) {
David S. Millerf72051b2008-09-23 01:11:18 -07001369 struct net_device *dev = skb->dev;
Eric Dumazet20e60742011-08-22 19:32:42 +00001370
David S. Millerf72051b2008-09-23 01:11:18 -07001371 __skb_unlink(skb, &tbl->proxy_queue);
Eric Dumazet20e60742011-08-22 19:32:42 +00001372 if (tbl->proxy_redo && netif_running(dev)) {
1373 rcu_read_lock();
David S. Millerf72051b2008-09-23 01:11:18 -07001374 tbl->proxy_redo(skb);
Eric Dumazet20e60742011-08-22 19:32:42 +00001375 rcu_read_unlock();
1376 } else {
David S. Millerf72051b2008-09-23 01:11:18 -07001377 kfree_skb(skb);
Eric Dumazet20e60742011-08-22 19:32:42 +00001378 }
Linus Torvalds1da177e2005-04-16 15:20:36 -07001379
1380 dev_put(dev);
1381 } else if (!sched_next || tdif < sched_next)
1382 sched_next = tdif;
1383 }
1384 del_timer(&tbl->proxy_timer);
1385 if (sched_next)
1386 mod_timer(&tbl->proxy_timer, jiffies + sched_next);
1387 spin_unlock(&tbl->proxy_queue.lock);
1388}
1389
1390void pneigh_enqueue(struct neigh_table *tbl, struct neigh_parms *p,
1391 struct sk_buff *skb)
1392{
1393 unsigned long now = jiffies;
1394 unsigned long sched_next = now + (net_random() % p->proxy_delay);
1395
1396 if (tbl->proxy_queue.qlen > p->proxy_qlen) {
1397 kfree_skb(skb);
1398 return;
1399 }
Patrick McHardya61bbcf2005-08-14 17:24:31 -07001400
1401 NEIGH_CB(skb)->sched_next = sched_next;
1402 NEIGH_CB(skb)->flags |= LOCALLY_ENQUEUED;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001403
1404 spin_lock(&tbl->proxy_queue.lock);
1405 if (del_timer(&tbl->proxy_timer)) {
1406 if (time_before(tbl->proxy_timer.expires, sched_next))
1407 sched_next = tbl->proxy_timer.expires;
1408 }
Eric Dumazetadf30902009-06-02 05:19:30 +00001409 skb_dst_drop(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001410 dev_hold(skb->dev);
1411 __skb_queue_tail(&tbl->proxy_queue, skb);
1412 mod_timer(&tbl->proxy_timer, sched_next);
1413 spin_unlock(&tbl->proxy_queue.lock);
1414}
YOSHIFUJI Hideaki0a204502008-03-24 18:39:10 +09001415EXPORT_SYMBOL(pneigh_enqueue);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001416
Tobias Klauser97fd5bc2009-07-13 11:17:49 -07001417static inline struct neigh_parms *lookup_neigh_parms(struct neigh_table *tbl,
Eric W. Biederman426b5302008-01-24 00:13:18 -08001418 struct net *net, int ifindex)
1419{
1420 struct neigh_parms *p;
1421
1422 for (p = &tbl->parms; p; p = p->next) {
YOSHIFUJI Hideaki878628f2008-03-26 03:57:35 +09001423 if ((p->dev && p->dev->ifindex == ifindex && net_eq(neigh_parms_net(p), net)) ||
Gao feng170d6f92013-06-20 10:01:33 +08001424 (!p->dev && !ifindex && net_eq(net, &init_net)))
Eric W. Biederman426b5302008-01-24 00:13:18 -08001425 return p;
1426 }
1427
1428 return NULL;
1429}
Linus Torvalds1da177e2005-04-16 15:20:36 -07001430
1431struct neigh_parms *neigh_parms_alloc(struct net_device *dev,
1432 struct neigh_table *tbl)
1433{
Gao fengcf89d6b2013-06-20 10:01:32 +08001434 struct neigh_parms *p;
Stephen Hemminger00829822008-11-20 20:14:53 -08001435 struct net *net = dev_net(dev);
1436 const struct net_device_ops *ops = dev->netdev_ops;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001437
Gao fengcf89d6b2013-06-20 10:01:32 +08001438 p = kmemdup(&tbl->parms, sizeof(*p), GFP_KERNEL);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001439 if (p) {
Linus Torvalds1da177e2005-04-16 15:20:36 -07001440 p->tbl = tbl;
1441 atomic_set(&p->refcnt, 1);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001442 p->reachable_time =
1443 neigh_rand_reach_time(p->base_reachable_time);
Denis V. Lunev486b51d2008-01-14 22:59:59 -08001444 dev_hold(dev);
1445 p->dev = dev;
Eric Dumazete42ea982008-11-12 00:54:54 -08001446 write_pnet(&p->net, hold_net(net));
Linus Torvalds1da177e2005-04-16 15:20:36 -07001447 p->sysctl_table = NULL;
Veaceslav Falico63134802013-08-02 19:07:38 +02001448
1449 if (ops->ndo_neigh_setup && ops->ndo_neigh_setup(dev, p)) {
1450 release_net(net);
1451 dev_put(dev);
1452 kfree(p);
1453 return NULL;
1454 }
1455
Linus Torvalds1da177e2005-04-16 15:20:36 -07001456 write_lock_bh(&tbl->lock);
1457 p->next = tbl->parms.next;
1458 tbl->parms.next = p;
1459 write_unlock_bh(&tbl->lock);
1460 }
1461 return p;
1462}
YOSHIFUJI Hideaki0a204502008-03-24 18:39:10 +09001463EXPORT_SYMBOL(neigh_parms_alloc);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001464
1465static void neigh_rcu_free_parms(struct rcu_head *head)
1466{
1467 struct neigh_parms *parms =
1468 container_of(head, struct neigh_parms, rcu_head);
1469
1470 neigh_parms_put(parms);
1471}
1472
1473void neigh_parms_release(struct neigh_table *tbl, struct neigh_parms *parms)
1474{
1475 struct neigh_parms **p;
1476
1477 if (!parms || parms == &tbl->parms)
1478 return;
1479 write_lock_bh(&tbl->lock);
1480 for (p = &tbl->parms.next; *p; p = &(*p)->next) {
1481 if (*p == parms) {
1482 *p = parms->next;
1483 parms->dead = 1;
1484 write_unlock_bh(&tbl->lock);
David S. Millercecbb632008-01-20 16:39:03 -08001485 if (parms->dev)
1486 dev_put(parms->dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001487 call_rcu(&parms->rcu_head, neigh_rcu_free_parms);
1488 return;
1489 }
1490 }
1491 write_unlock_bh(&tbl->lock);
Joe Perchesd5d427c2013-04-15 15:17:19 +00001492 neigh_dbg(1, "%s: not found\n", __func__);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001493}
YOSHIFUJI Hideaki0a204502008-03-24 18:39:10 +09001494EXPORT_SYMBOL(neigh_parms_release);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001495
/*
 * Final teardown of a parameter set: drop the namespace reference recorded
 * in it and free the memory.
 */
static void neigh_parms_destroy(struct neigh_parms *parms)
{
	struct net *net = neigh_parms_net(parms);

	release_net(net);
	kfree(parms);
}
1501
Pavel Emelianovc2ecba72007-04-17 12:45:31 -07001502static struct lock_class_key neigh_table_proxy_queue_class;
1503
Hiroaki SHIMODAdcd2ba92012-04-13 07:34:44 +00001504static void neigh_table_init_no_netlink(struct neigh_table *tbl)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001505{
1506 unsigned long now = jiffies;
1507 unsigned long phsize;
1508
Eric Dumazete42ea982008-11-12 00:54:54 -08001509 write_pnet(&tbl->parms.net, &init_net);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001510 atomic_set(&tbl->parms.refcnt, 1);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001511 tbl->parms.reachable_time =
1512 neigh_rand_reach_time(tbl->parms.base_reachable_time);
1513
Linus Torvalds1da177e2005-04-16 15:20:36 -07001514 tbl->stats = alloc_percpu(struct neigh_statistics);
1515 if (!tbl->stats)
1516 panic("cannot create neighbour cache statistics");
YOSHIFUJI Hideaki4ec93ed2007-02-09 23:24:36 +09001517
Linus Torvalds1da177e2005-04-16 15:20:36 -07001518#ifdef CONFIG_PROC_FS
Alexey Dobriyan9b739ba2008-11-11 16:47:44 -08001519 if (!proc_create_data(tbl->id, 0, init_net.proc_net_stat,
1520 &neigh_stat_seq_fops, tbl))
Linus Torvalds1da177e2005-04-16 15:20:36 -07001521 panic("cannot create neighbour proc dir entry");
Linus Torvalds1da177e2005-04-16 15:20:36 -07001522#endif
1523
David S. Millercd089332011-07-11 01:28:12 -07001524 RCU_INIT_POINTER(tbl->nht, neigh_hash_alloc(3));
Linus Torvalds1da177e2005-04-16 15:20:36 -07001525
1526 phsize = (PNEIGH_HASHMASK + 1) * sizeof(struct pneigh_entry *);
Andrew Morton77d04bd2006-04-07 14:52:59 -07001527 tbl->phash_buckets = kzalloc(phsize, GFP_KERNEL);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001528
Eric Dumazetd6bf7812010-10-04 06:15:44 +00001529 if (!tbl->nht || !tbl->phash_buckets)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001530 panic("cannot allocate neighbour cache hashes");
1531
YOSHIFUJI Hideaki / 吉藤英明08433ef2013-01-24 00:44:23 +00001532 if (!tbl->entry_size)
1533 tbl->entry_size = ALIGN(offsetof(struct neighbour, primary_key) +
1534 tbl->key_len, NEIGH_PRIV_ALIGN);
1535 else
1536 WARN_ON(tbl->entry_size % NEIGH_PRIV_ALIGN);
1537
Linus Torvalds1da177e2005-04-16 15:20:36 -07001538 rwlock_init(&tbl->lock);
Tejun Heo203b42f2012-08-21 13:18:23 -07001539 INIT_DEFERRABLE_WORK(&tbl->gc_work, neigh_periodic_work);
Eric Dumazete4c4e442009-07-30 03:15:07 +00001540 schedule_delayed_work(&tbl->gc_work, tbl->parms.reachable_time);
Pavel Emelyanovb24b8a22008-01-23 21:20:07 -08001541 setup_timer(&tbl->proxy_timer, neigh_proxy_process, (unsigned long)tbl);
Pavel Emelianovc2ecba72007-04-17 12:45:31 -07001542 skb_queue_head_init_class(&tbl->proxy_queue,
1543 &neigh_table_proxy_queue_class);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001544
1545 tbl->last_flush = now;
1546 tbl->last_rand = now + tbl->parms.reachable_time * 20;
Simon Kelleybd89efc2006-05-12 14:56:08 -07001547}
1548
1549void neigh_table_init(struct neigh_table *tbl)
1550{
1551 struct neigh_table *tmp;
1552
1553 neigh_table_init_no_netlink(tbl);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001554 write_lock(&neigh_tbl_lock);
Simon Kelleybd89efc2006-05-12 14:56:08 -07001555 for (tmp = neigh_tables; tmp; tmp = tmp->next) {
1556 if (tmp->family == tbl->family)
1557 break;
1558 }
Linus Torvalds1da177e2005-04-16 15:20:36 -07001559 tbl->next = neigh_tables;
1560 neigh_tables = tbl;
1561 write_unlock(&neigh_tbl_lock);
Simon Kelleybd89efc2006-05-12 14:56:08 -07001562
1563 if (unlikely(tmp)) {
Joe Perchese005d192012-05-16 19:58:40 +00001564 pr_err("Registering multiple tables for family %d\n",
1565 tbl->family);
Simon Kelleybd89efc2006-05-12 14:56:08 -07001566 dump_stack();
1567 }
Linus Torvalds1da177e2005-04-16 15:20:36 -07001568}
YOSHIFUJI Hideaki0a204502008-03-24 18:39:10 +09001569EXPORT_SYMBOL(neigh_table_init);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001570
1571int neigh_table_clear(struct neigh_table *tbl)
1572{
1573 struct neigh_table **tp;
1574
1575 /* It is not clean... Fix it to unload IPv6 module safely */
Tejun Heoa5c30b32010-10-19 06:04:42 +00001576 cancel_delayed_work_sync(&tbl->gc_work);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001577 del_timer_sync(&tbl->proxy_timer);
1578 pneigh_queue_purge(&tbl->proxy_queue);
1579 neigh_ifdown(tbl, NULL);
1580 if (atomic_read(&tbl->entries))
Joe Perchese005d192012-05-16 19:58:40 +00001581 pr_crit("neighbour leakage\n");
Linus Torvalds1da177e2005-04-16 15:20:36 -07001582 write_lock(&neigh_tbl_lock);
1583 for (tp = &neigh_tables; *tp; tp = &(*tp)->next) {
1584 if (*tp == tbl) {
1585 *tp = tbl->next;
1586 break;
1587 }
1588 }
1589 write_unlock(&neigh_tbl_lock);
1590
Eric Dumazet6193d2b2011-01-19 22:02:47 +00001591 call_rcu(&rcu_dereference_protected(tbl->nht, 1)->rcu,
1592 neigh_hash_free_rcu);
Eric Dumazetd6bf7812010-10-04 06:15:44 +00001593 tbl->nht = NULL;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001594
1595 kfree(tbl->phash_buckets);
1596 tbl->phash_buckets = NULL;
1597
Alexey Dobriyan3f192b52007-11-05 21:28:13 -08001598 remove_proc_entry(tbl->id, init_net.proc_net_stat);
1599
Kirill Korotaev3fcde742006-09-01 01:34:10 -07001600 free_percpu(tbl->stats);
1601 tbl->stats = NULL;
1602
Linus Torvalds1da177e2005-04-16 15:20:36 -07001603 return 0;
1604}
YOSHIFUJI Hideaki0a204502008-03-24 18:39:10 +09001605EXPORT_SYMBOL(neigh_table_clear);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001606
Thomas Graf661d2962013-03-21 07:45:29 +00001607static int neigh_delete(struct sk_buff *skb, struct nlmsghdr *nlh)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001608{
YOSHIFUJI Hideaki3b1e0a62008-03-26 02:26:21 +09001609 struct net *net = sock_net(skb->sk);
Thomas Grafa14a49d2006-08-07 17:53:08 -07001610 struct ndmsg *ndm;
1611 struct nlattr *dst_attr;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001612 struct neigh_table *tbl;
1613 struct net_device *dev = NULL;
Thomas Grafa14a49d2006-08-07 17:53:08 -07001614 int err = -EINVAL;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001615
Eric Dumazet110b2492010-10-04 04:27:36 +00001616 ASSERT_RTNL();
Thomas Grafa14a49d2006-08-07 17:53:08 -07001617 if (nlmsg_len(nlh) < sizeof(*ndm))
Linus Torvalds1da177e2005-04-16 15:20:36 -07001618 goto out;
1619
Thomas Grafa14a49d2006-08-07 17:53:08 -07001620 dst_attr = nlmsg_find_attr(nlh, sizeof(*ndm), NDA_DST);
1621 if (dst_attr == NULL)
1622 goto out;
1623
1624 ndm = nlmsg_data(nlh);
1625 if (ndm->ndm_ifindex) {
Eric Dumazet110b2492010-10-04 04:27:36 +00001626 dev = __dev_get_by_index(net, ndm->ndm_ifindex);
Thomas Grafa14a49d2006-08-07 17:53:08 -07001627 if (dev == NULL) {
1628 err = -ENODEV;
1629 goto out;
1630 }
1631 }
1632
Linus Torvalds1da177e2005-04-16 15:20:36 -07001633 read_lock(&neigh_tbl_lock);
1634 for (tbl = neigh_tables; tbl; tbl = tbl->next) {
Thomas Grafa14a49d2006-08-07 17:53:08 -07001635 struct neighbour *neigh;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001636
1637 if (tbl->family != ndm->ndm_family)
1638 continue;
1639 read_unlock(&neigh_tbl_lock);
1640
Thomas Grafa14a49d2006-08-07 17:53:08 -07001641 if (nla_len(dst_attr) < tbl->key_len)
Eric Dumazet110b2492010-10-04 04:27:36 +00001642 goto out;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001643
1644 if (ndm->ndm_flags & NTF_PROXY) {
Eric W. Biederman426b5302008-01-24 00:13:18 -08001645 err = pneigh_delete(tbl, net, nla_data(dst_attr), dev);
Eric Dumazet110b2492010-10-04 04:27:36 +00001646 goto out;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001647 }
1648
Thomas Grafa14a49d2006-08-07 17:53:08 -07001649 if (dev == NULL)
Eric Dumazet110b2492010-10-04 04:27:36 +00001650 goto out;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001651
Thomas Grafa14a49d2006-08-07 17:53:08 -07001652 neigh = neigh_lookup(tbl, nla_data(dst_attr), dev);
1653 if (neigh == NULL) {
1654 err = -ENOENT;
Eric Dumazet110b2492010-10-04 04:27:36 +00001655 goto out;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001656 }
Thomas Grafa14a49d2006-08-07 17:53:08 -07001657
1658 err = neigh_update(neigh, NULL, NUD_FAILED,
1659 NEIGH_UPDATE_F_OVERRIDE |
1660 NEIGH_UPDATE_F_ADMIN);
1661 neigh_release(neigh);
Eric Dumazet110b2492010-10-04 04:27:36 +00001662 goto out;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001663 }
1664 read_unlock(&neigh_tbl_lock);
Thomas Grafa14a49d2006-08-07 17:53:08 -07001665 err = -EAFNOSUPPORT;
1666
Linus Torvalds1da177e2005-04-16 15:20:36 -07001667out:
1668 return err;
1669}
1670
Thomas Graf661d2962013-03-21 07:45:29 +00001671static int neigh_add(struct sk_buff *skb, struct nlmsghdr *nlh)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001672{
YOSHIFUJI Hideaki3b1e0a62008-03-26 02:26:21 +09001673 struct net *net = sock_net(skb->sk);
Thomas Graf5208deb2006-08-07 17:55:40 -07001674 struct ndmsg *ndm;
1675 struct nlattr *tb[NDA_MAX+1];
Linus Torvalds1da177e2005-04-16 15:20:36 -07001676 struct neigh_table *tbl;
1677 struct net_device *dev = NULL;
Thomas Graf5208deb2006-08-07 17:55:40 -07001678 int err;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001679
Eric Dumazet110b2492010-10-04 04:27:36 +00001680 ASSERT_RTNL();
Thomas Graf5208deb2006-08-07 17:55:40 -07001681 err = nlmsg_parse(nlh, sizeof(*ndm), tb, NDA_MAX, NULL);
1682 if (err < 0)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001683 goto out;
1684
Thomas Graf5208deb2006-08-07 17:55:40 -07001685 err = -EINVAL;
1686 if (tb[NDA_DST] == NULL)
1687 goto out;
1688
1689 ndm = nlmsg_data(nlh);
1690 if (ndm->ndm_ifindex) {
Eric Dumazet110b2492010-10-04 04:27:36 +00001691 dev = __dev_get_by_index(net, ndm->ndm_ifindex);
Thomas Graf5208deb2006-08-07 17:55:40 -07001692 if (dev == NULL) {
1693 err = -ENODEV;
1694 goto out;
1695 }
1696
1697 if (tb[NDA_LLADDR] && nla_len(tb[NDA_LLADDR]) < dev->addr_len)
Eric Dumazet110b2492010-10-04 04:27:36 +00001698 goto out;
Thomas Graf5208deb2006-08-07 17:55:40 -07001699 }
1700
Linus Torvalds1da177e2005-04-16 15:20:36 -07001701 read_lock(&neigh_tbl_lock);
1702 for (tbl = neigh_tables; tbl; tbl = tbl->next) {
Thomas Graf5208deb2006-08-07 17:55:40 -07001703 int flags = NEIGH_UPDATE_F_ADMIN | NEIGH_UPDATE_F_OVERRIDE;
1704 struct neighbour *neigh;
1705 void *dst, *lladdr;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001706
1707 if (tbl->family != ndm->ndm_family)
1708 continue;
1709 read_unlock(&neigh_tbl_lock);
1710
Thomas Graf5208deb2006-08-07 17:55:40 -07001711 if (nla_len(tb[NDA_DST]) < tbl->key_len)
Eric Dumazet110b2492010-10-04 04:27:36 +00001712 goto out;
Thomas Graf5208deb2006-08-07 17:55:40 -07001713 dst = nla_data(tb[NDA_DST]);
1714 lladdr = tb[NDA_LLADDR] ? nla_data(tb[NDA_LLADDR]) : NULL;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001715
1716 if (ndm->ndm_flags & NTF_PROXY) {
Ville Nuorvala62dd9312006-09-22 14:43:19 -07001717 struct pneigh_entry *pn;
1718
1719 err = -ENOBUFS;
Eric W. Biederman426b5302008-01-24 00:13:18 -08001720 pn = pneigh_lookup(tbl, net, dst, dev, 1);
Ville Nuorvala62dd9312006-09-22 14:43:19 -07001721 if (pn) {
1722 pn->flags = ndm->ndm_flags;
1723 err = 0;
1724 }
Eric Dumazet110b2492010-10-04 04:27:36 +00001725 goto out;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001726 }
1727
Thomas Graf5208deb2006-08-07 17:55:40 -07001728 if (dev == NULL)
Eric Dumazet110b2492010-10-04 04:27:36 +00001729 goto out;
Thomas Graf5208deb2006-08-07 17:55:40 -07001730
1731 neigh = neigh_lookup(tbl, dst, dev);
1732 if (neigh == NULL) {
1733 if (!(nlh->nlmsg_flags & NLM_F_CREATE)) {
1734 err = -ENOENT;
Eric Dumazet110b2492010-10-04 04:27:36 +00001735 goto out;
Thomas Graf5208deb2006-08-07 17:55:40 -07001736 }
YOSHIFUJI Hideaki4ec93ed2007-02-09 23:24:36 +09001737
Thomas Graf5208deb2006-08-07 17:55:40 -07001738 neigh = __neigh_lookup_errno(tbl, dst, dev);
1739 if (IS_ERR(neigh)) {
1740 err = PTR_ERR(neigh);
Eric Dumazet110b2492010-10-04 04:27:36 +00001741 goto out;
Thomas Graf5208deb2006-08-07 17:55:40 -07001742 }
1743 } else {
Linus Torvalds1da177e2005-04-16 15:20:36 -07001744 if (nlh->nlmsg_flags & NLM_F_EXCL) {
1745 err = -EEXIST;
Thomas Graf5208deb2006-08-07 17:55:40 -07001746 neigh_release(neigh);
Eric Dumazet110b2492010-10-04 04:27:36 +00001747 goto out;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001748 }
Thomas Graf5208deb2006-08-07 17:55:40 -07001749
1750 if (!(nlh->nlmsg_flags & NLM_F_REPLACE))
1751 flags &= ~NEIGH_UPDATE_F_OVERRIDE;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001752 }
1753
Eric Biederman0c5c2d32009-03-04 00:03:08 -08001754 if (ndm->ndm_flags & NTF_USE) {
1755 neigh_event_send(neigh, NULL);
1756 err = 0;
1757 } else
1758 err = neigh_update(neigh, lladdr, ndm->ndm_state, flags);
Thomas Graf5208deb2006-08-07 17:55:40 -07001759 neigh_release(neigh);
Eric Dumazet110b2492010-10-04 04:27:36 +00001760 goto out;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001761 }
1762
1763 read_unlock(&neigh_tbl_lock);
Thomas Graf5208deb2006-08-07 17:55:40 -07001764 err = -EAFNOSUPPORT;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001765out:
1766 return err;
1767}
1768
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001769static int neightbl_fill_parms(struct sk_buff *skb, struct neigh_parms *parms)
1770{
Thomas Grafca860fb2006-08-07 18:00:18 -07001771 struct nlattr *nest;
1772
1773 nest = nla_nest_start(skb, NDTA_PARMS);
1774 if (nest == NULL)
1775 return -ENOBUFS;
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001776
David S. Miller9a6308d2012-04-01 20:06:28 -04001777 if ((parms->dev &&
1778 nla_put_u32(skb, NDTPA_IFINDEX, parms->dev->ifindex)) ||
1779 nla_put_u32(skb, NDTPA_REFCNT, atomic_read(&parms->refcnt)) ||
1780 nla_put_u32(skb, NDTPA_QUEUE_LENBYTES, parms->queue_len_bytes) ||
1781 /* approximative value for deprecated QUEUE_LEN (in packets) */
1782 nla_put_u32(skb, NDTPA_QUEUE_LEN,
Shan Weice46cc62012-12-04 18:49:15 +00001783 parms->queue_len_bytes / SKB_TRUESIZE(ETH_FRAME_LEN)) ||
David S. Miller9a6308d2012-04-01 20:06:28 -04001784 nla_put_u32(skb, NDTPA_PROXY_QLEN, parms->proxy_qlen) ||
1785 nla_put_u32(skb, NDTPA_APP_PROBES, parms->app_probes) ||
1786 nla_put_u32(skb, NDTPA_UCAST_PROBES, parms->ucast_probes) ||
1787 nla_put_u32(skb, NDTPA_MCAST_PROBES, parms->mcast_probes) ||
1788 nla_put_msecs(skb, NDTPA_REACHABLE_TIME, parms->reachable_time) ||
1789 nla_put_msecs(skb, NDTPA_BASE_REACHABLE_TIME,
1790 parms->base_reachable_time) ||
1791 nla_put_msecs(skb, NDTPA_GC_STALETIME, parms->gc_staletime) ||
1792 nla_put_msecs(skb, NDTPA_DELAY_PROBE_TIME,
1793 parms->delay_probe_time) ||
1794 nla_put_msecs(skb, NDTPA_RETRANS_TIME, parms->retrans_time) ||
1795 nla_put_msecs(skb, NDTPA_ANYCAST_DELAY, parms->anycast_delay) ||
1796 nla_put_msecs(skb, NDTPA_PROXY_DELAY, parms->proxy_delay) ||
1797 nla_put_msecs(skb, NDTPA_LOCKTIME, parms->locktime))
1798 goto nla_put_failure;
Thomas Grafca860fb2006-08-07 18:00:18 -07001799 return nla_nest_end(skb, nest);
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001800
Thomas Grafca860fb2006-08-07 18:00:18 -07001801nla_put_failure:
Thomas Grafbc3ed282008-06-03 16:36:54 -07001802 nla_nest_cancel(skb, nest);
1803 return -EMSGSIZE;
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001804}
1805
Thomas Grafca860fb2006-08-07 18:00:18 -07001806static int neightbl_fill_info(struct sk_buff *skb, struct neigh_table *tbl,
1807 u32 pid, u32 seq, int type, int flags)
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001808{
1809 struct nlmsghdr *nlh;
1810 struct ndtmsg *ndtmsg;
1811
Thomas Grafca860fb2006-08-07 18:00:18 -07001812 nlh = nlmsg_put(skb, pid, seq, type, sizeof(*ndtmsg), flags);
1813 if (nlh == NULL)
Patrick McHardy26932562007-01-31 23:16:40 -08001814 return -EMSGSIZE;
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001815
Thomas Grafca860fb2006-08-07 18:00:18 -07001816 ndtmsg = nlmsg_data(nlh);
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001817
1818 read_lock_bh(&tbl->lock);
1819 ndtmsg->ndtm_family = tbl->family;
Patrick McHardy9ef1d4c2005-06-28 12:55:30 -07001820 ndtmsg->ndtm_pad1 = 0;
1821 ndtmsg->ndtm_pad2 = 0;
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001822
David S. Miller9a6308d2012-04-01 20:06:28 -04001823 if (nla_put_string(skb, NDTA_NAME, tbl->id) ||
1824 nla_put_msecs(skb, NDTA_GC_INTERVAL, tbl->gc_interval) ||
1825 nla_put_u32(skb, NDTA_THRESH1, tbl->gc_thresh1) ||
1826 nla_put_u32(skb, NDTA_THRESH2, tbl->gc_thresh2) ||
1827 nla_put_u32(skb, NDTA_THRESH3, tbl->gc_thresh3))
1828 goto nla_put_failure;
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001829 {
1830 unsigned long now = jiffies;
1831 unsigned int flush_delta = now - tbl->last_flush;
1832 unsigned int rand_delta = now - tbl->last_rand;
Eric Dumazetd6bf7812010-10-04 06:15:44 +00001833 struct neigh_hash_table *nht;
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001834 struct ndt_config ndc = {
1835 .ndtc_key_len = tbl->key_len,
1836 .ndtc_entry_size = tbl->entry_size,
1837 .ndtc_entries = atomic_read(&tbl->entries),
1838 .ndtc_last_flush = jiffies_to_msecs(flush_delta),
1839 .ndtc_last_rand = jiffies_to_msecs(rand_delta),
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001840 .ndtc_proxy_qlen = tbl->proxy_queue.qlen,
1841 };
1842
Eric Dumazetd6bf7812010-10-04 06:15:44 +00001843 rcu_read_lock_bh();
1844 nht = rcu_dereference_bh(tbl->nht);
David S. Miller2c2aba62011-12-28 15:06:58 -05001845 ndc.ndtc_hash_rnd = nht->hash_rnd[0];
David S. Millercd089332011-07-11 01:28:12 -07001846 ndc.ndtc_hash_mask = ((1 << nht->hash_shift) - 1);
Eric Dumazetd6bf7812010-10-04 06:15:44 +00001847 rcu_read_unlock_bh();
1848
David S. Miller9a6308d2012-04-01 20:06:28 -04001849 if (nla_put(skb, NDTA_CONFIG, sizeof(ndc), &ndc))
1850 goto nla_put_failure;
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001851 }
1852
1853 {
1854 int cpu;
1855 struct ndt_stats ndst;
1856
1857 memset(&ndst, 0, sizeof(ndst));
1858
KAMEZAWA Hiroyuki6f912042006-04-10 22:52:50 -07001859 for_each_possible_cpu(cpu) {
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001860 struct neigh_statistics *st;
1861
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001862 st = per_cpu_ptr(tbl->stats, cpu);
1863 ndst.ndts_allocs += st->allocs;
1864 ndst.ndts_destroys += st->destroys;
1865 ndst.ndts_hash_grows += st->hash_grows;
1866 ndst.ndts_res_failed += st->res_failed;
1867 ndst.ndts_lookups += st->lookups;
1868 ndst.ndts_hits += st->hits;
1869 ndst.ndts_rcv_probes_mcast += st->rcv_probes_mcast;
1870 ndst.ndts_rcv_probes_ucast += st->rcv_probes_ucast;
1871 ndst.ndts_periodic_gc_runs += st->periodic_gc_runs;
1872 ndst.ndts_forced_gc_runs += st->forced_gc_runs;
1873 }
1874
David S. Miller9a6308d2012-04-01 20:06:28 -04001875 if (nla_put(skb, NDTA_STATS, sizeof(ndst), &ndst))
1876 goto nla_put_failure;
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001877 }
1878
1879 BUG_ON(tbl->parms.dev);
1880 if (neightbl_fill_parms(skb, &tbl->parms) < 0)
Thomas Grafca860fb2006-08-07 18:00:18 -07001881 goto nla_put_failure;
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001882
1883 read_unlock_bh(&tbl->lock);
Thomas Grafca860fb2006-08-07 18:00:18 -07001884 return nlmsg_end(skb, nlh);
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001885
Thomas Grafca860fb2006-08-07 18:00:18 -07001886nla_put_failure:
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001887 read_unlock_bh(&tbl->lock);
Patrick McHardy26932562007-01-31 23:16:40 -08001888 nlmsg_cancel(skb, nlh);
1889 return -EMSGSIZE;
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001890}
1891
Thomas Grafca860fb2006-08-07 18:00:18 -07001892static int neightbl_fill_param_info(struct sk_buff *skb,
1893 struct neigh_table *tbl,
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001894 struct neigh_parms *parms,
Thomas Grafca860fb2006-08-07 18:00:18 -07001895 u32 pid, u32 seq, int type,
1896 unsigned int flags)
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001897{
1898 struct ndtmsg *ndtmsg;
1899 struct nlmsghdr *nlh;
1900
Thomas Grafca860fb2006-08-07 18:00:18 -07001901 nlh = nlmsg_put(skb, pid, seq, type, sizeof(*ndtmsg), flags);
1902 if (nlh == NULL)
Patrick McHardy26932562007-01-31 23:16:40 -08001903 return -EMSGSIZE;
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001904
Thomas Grafca860fb2006-08-07 18:00:18 -07001905 ndtmsg = nlmsg_data(nlh);
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001906
1907 read_lock_bh(&tbl->lock);
1908 ndtmsg->ndtm_family = tbl->family;
Patrick McHardy9ef1d4c2005-06-28 12:55:30 -07001909 ndtmsg->ndtm_pad1 = 0;
1910 ndtmsg->ndtm_pad2 = 0;
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001911
Thomas Grafca860fb2006-08-07 18:00:18 -07001912 if (nla_put_string(skb, NDTA_NAME, tbl->id) < 0 ||
1913 neightbl_fill_parms(skb, parms) < 0)
1914 goto errout;
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001915
1916 read_unlock_bh(&tbl->lock);
Thomas Grafca860fb2006-08-07 18:00:18 -07001917 return nlmsg_end(skb, nlh);
1918errout:
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001919 read_unlock_bh(&tbl->lock);
Patrick McHardy26932562007-01-31 23:16:40 -08001920 nlmsg_cancel(skb, nlh);
1921 return -EMSGSIZE;
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001922}
YOSHIFUJI Hideaki4ec93ed2007-02-09 23:24:36 +09001923
Patrick McHardyef7c79e2007-06-05 12:38:30 -07001924static const struct nla_policy nl_neightbl_policy[NDTA_MAX+1] = {
Thomas Graf6b3f8672006-08-07 17:58:53 -07001925 [NDTA_NAME] = { .type = NLA_STRING },
1926 [NDTA_THRESH1] = { .type = NLA_U32 },
1927 [NDTA_THRESH2] = { .type = NLA_U32 },
1928 [NDTA_THRESH3] = { .type = NLA_U32 },
1929 [NDTA_GC_INTERVAL] = { .type = NLA_U64 },
1930 [NDTA_PARMS] = { .type = NLA_NESTED },
1931};
1932
Patrick McHardyef7c79e2007-06-05 12:38:30 -07001933static const struct nla_policy nl_ntbl_parm_policy[NDTPA_MAX+1] = {
Thomas Graf6b3f8672006-08-07 17:58:53 -07001934 [NDTPA_IFINDEX] = { .type = NLA_U32 },
1935 [NDTPA_QUEUE_LEN] = { .type = NLA_U32 },
1936 [NDTPA_PROXY_QLEN] = { .type = NLA_U32 },
1937 [NDTPA_APP_PROBES] = { .type = NLA_U32 },
1938 [NDTPA_UCAST_PROBES] = { .type = NLA_U32 },
1939 [NDTPA_MCAST_PROBES] = { .type = NLA_U32 },
1940 [NDTPA_BASE_REACHABLE_TIME] = { .type = NLA_U64 },
1941 [NDTPA_GC_STALETIME] = { .type = NLA_U64 },
1942 [NDTPA_DELAY_PROBE_TIME] = { .type = NLA_U64 },
1943 [NDTPA_RETRANS_TIME] = { .type = NLA_U64 },
1944 [NDTPA_ANYCAST_DELAY] = { .type = NLA_U64 },
1945 [NDTPA_PROXY_DELAY] = { .type = NLA_U64 },
1946 [NDTPA_LOCKTIME] = { .type = NLA_U64 },
1947};
1948
Thomas Graf661d2962013-03-21 07:45:29 +00001949static int neightbl_set(struct sk_buff *skb, struct nlmsghdr *nlh)
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001950{
YOSHIFUJI Hideaki3b1e0a62008-03-26 02:26:21 +09001951 struct net *net = sock_net(skb->sk);
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001952 struct neigh_table *tbl;
Thomas Graf6b3f8672006-08-07 17:58:53 -07001953 struct ndtmsg *ndtmsg;
1954 struct nlattr *tb[NDTA_MAX+1];
1955 int err;
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001956
Thomas Graf6b3f8672006-08-07 17:58:53 -07001957 err = nlmsg_parse(nlh, sizeof(*ndtmsg), tb, NDTA_MAX,
1958 nl_neightbl_policy);
1959 if (err < 0)
1960 goto errout;
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001961
Thomas Graf6b3f8672006-08-07 17:58:53 -07001962 if (tb[NDTA_NAME] == NULL) {
1963 err = -EINVAL;
1964 goto errout;
1965 }
1966
1967 ndtmsg = nlmsg_data(nlh);
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001968 read_lock(&neigh_tbl_lock);
1969 for (tbl = neigh_tables; tbl; tbl = tbl->next) {
1970 if (ndtmsg->ndtm_family && tbl->family != ndtmsg->ndtm_family)
1971 continue;
1972
Thomas Graf6b3f8672006-08-07 17:58:53 -07001973 if (nla_strcmp(tb[NDTA_NAME], tbl->id) == 0)
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001974 break;
1975 }
1976
1977 if (tbl == NULL) {
1978 err = -ENOENT;
Thomas Graf6b3f8672006-08-07 17:58:53 -07001979 goto errout_locked;
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001980 }
1981
YOSHIFUJI Hideaki4ec93ed2007-02-09 23:24:36 +09001982 /*
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001983 * We acquire tbl->lock to be nice to the periodic timers and
1984 * make sure they always see a consistent set of values.
1985 */
1986 write_lock_bh(&tbl->lock);
1987
Thomas Graf6b3f8672006-08-07 17:58:53 -07001988 if (tb[NDTA_PARMS]) {
1989 struct nlattr *tbp[NDTPA_MAX+1];
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001990 struct neigh_parms *p;
Thomas Graf6b3f8672006-08-07 17:58:53 -07001991 int i, ifindex = 0;
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001992
Thomas Graf6b3f8672006-08-07 17:58:53 -07001993 err = nla_parse_nested(tbp, NDTPA_MAX, tb[NDTA_PARMS],
1994 nl_ntbl_parm_policy);
1995 if (err < 0)
1996 goto errout_tbl_lock;
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001997
Thomas Graf6b3f8672006-08-07 17:58:53 -07001998 if (tbp[NDTPA_IFINDEX])
1999 ifindex = nla_get_u32(tbp[NDTPA_IFINDEX]);
Thomas Grafc7fb64d2005-06-18 22:50:55 -07002000
Tobias Klauser97fd5bc2009-07-13 11:17:49 -07002001 p = lookup_neigh_parms(tbl, net, ifindex);
Thomas Grafc7fb64d2005-06-18 22:50:55 -07002002 if (p == NULL) {
2003 err = -ENOENT;
Thomas Graf6b3f8672006-08-07 17:58:53 -07002004 goto errout_tbl_lock;
Thomas Grafc7fb64d2005-06-18 22:50:55 -07002005 }
Thomas Grafc7fb64d2005-06-18 22:50:55 -07002006
Thomas Graf6b3f8672006-08-07 17:58:53 -07002007 for (i = 1; i <= NDTPA_MAX; i++) {
2008 if (tbp[i] == NULL)
2009 continue;
Thomas Grafc7fb64d2005-06-18 22:50:55 -07002010
Thomas Graf6b3f8672006-08-07 17:58:53 -07002011 switch (i) {
2012 case NDTPA_QUEUE_LEN:
Eric Dumazet8b5c1712011-11-09 12:07:14 +00002013 p->queue_len_bytes = nla_get_u32(tbp[i]) *
2014 SKB_TRUESIZE(ETH_FRAME_LEN);
2015 break;
2016 case NDTPA_QUEUE_LENBYTES:
2017 p->queue_len_bytes = nla_get_u32(tbp[i]);
Thomas Graf6b3f8672006-08-07 17:58:53 -07002018 break;
2019 case NDTPA_PROXY_QLEN:
2020 p->proxy_qlen = nla_get_u32(tbp[i]);
2021 break;
2022 case NDTPA_APP_PROBES:
2023 p->app_probes = nla_get_u32(tbp[i]);
2024 break;
2025 case NDTPA_UCAST_PROBES:
2026 p->ucast_probes = nla_get_u32(tbp[i]);
2027 break;
2028 case NDTPA_MCAST_PROBES:
2029 p->mcast_probes = nla_get_u32(tbp[i]);
2030 break;
2031 case NDTPA_BASE_REACHABLE_TIME:
2032 p->base_reachable_time = nla_get_msecs(tbp[i]);
2033 break;
2034 case NDTPA_GC_STALETIME:
2035 p->gc_staletime = nla_get_msecs(tbp[i]);
2036 break;
2037 case NDTPA_DELAY_PROBE_TIME:
2038 p->delay_probe_time = nla_get_msecs(tbp[i]);
2039 break;
2040 case NDTPA_RETRANS_TIME:
2041 p->retrans_time = nla_get_msecs(tbp[i]);
2042 break;
2043 case NDTPA_ANYCAST_DELAY:
2044 p->anycast_delay = nla_get_msecs(tbp[i]);
2045 break;
2046 case NDTPA_PROXY_DELAY:
2047 p->proxy_delay = nla_get_msecs(tbp[i]);
2048 break;
2049 case NDTPA_LOCKTIME:
2050 p->locktime = nla_get_msecs(tbp[i]);
2051 break;
2052 }
2053 }
Thomas Grafc7fb64d2005-06-18 22:50:55 -07002054 }
2055
Gao fengdc25c672013-06-20 10:01:34 +08002056 err = -ENOENT;
2057 if ((tb[NDTA_THRESH1] || tb[NDTA_THRESH2] ||
2058 tb[NDTA_THRESH3] || tb[NDTA_GC_INTERVAL]) &&
2059 !net_eq(net, &init_net))
2060 goto errout_tbl_lock;
2061
Thomas Graf6b3f8672006-08-07 17:58:53 -07002062 if (tb[NDTA_THRESH1])
2063 tbl->gc_thresh1 = nla_get_u32(tb[NDTA_THRESH1]);
2064
2065 if (tb[NDTA_THRESH2])
2066 tbl->gc_thresh2 = nla_get_u32(tb[NDTA_THRESH2]);
2067
2068 if (tb[NDTA_THRESH3])
2069 tbl->gc_thresh3 = nla_get_u32(tb[NDTA_THRESH3]);
2070
2071 if (tb[NDTA_GC_INTERVAL])
2072 tbl->gc_interval = nla_get_msecs(tb[NDTA_GC_INTERVAL]);
2073
Thomas Grafc7fb64d2005-06-18 22:50:55 -07002074 err = 0;
2075
Thomas Graf6b3f8672006-08-07 17:58:53 -07002076errout_tbl_lock:
Thomas Grafc7fb64d2005-06-18 22:50:55 -07002077 write_unlock_bh(&tbl->lock);
Thomas Graf6b3f8672006-08-07 17:58:53 -07002078errout_locked:
Thomas Grafc7fb64d2005-06-18 22:50:55 -07002079 read_unlock(&neigh_tbl_lock);
Thomas Graf6b3f8672006-08-07 17:58:53 -07002080errout:
Thomas Grafc7fb64d2005-06-18 22:50:55 -07002081 return err;
2082}
2083
Thomas Grafc8822a42007-03-22 11:50:06 -07002084static int neightbl_dump_info(struct sk_buff *skb, struct netlink_callback *cb)
Thomas Grafc7fb64d2005-06-18 22:50:55 -07002085{
YOSHIFUJI Hideaki3b1e0a62008-03-26 02:26:21 +09002086 struct net *net = sock_net(skb->sk);
Thomas Grafca860fb2006-08-07 18:00:18 -07002087 int family, tidx, nidx = 0;
2088 int tbl_skip = cb->args[0];
2089 int neigh_skip = cb->args[1];
Thomas Grafc7fb64d2005-06-18 22:50:55 -07002090 struct neigh_table *tbl;
2091
Thomas Grafca860fb2006-08-07 18:00:18 -07002092 family = ((struct rtgenmsg *) nlmsg_data(cb->nlh))->rtgen_family;
Thomas Grafc7fb64d2005-06-18 22:50:55 -07002093
2094 read_lock(&neigh_tbl_lock);
Thomas Grafca860fb2006-08-07 18:00:18 -07002095 for (tbl = neigh_tables, tidx = 0; tbl; tbl = tbl->next, tidx++) {
Thomas Grafc7fb64d2005-06-18 22:50:55 -07002096 struct neigh_parms *p;
2097
Thomas Grafca860fb2006-08-07 18:00:18 -07002098 if (tidx < tbl_skip || (family && tbl->family != family))
Thomas Grafc7fb64d2005-06-18 22:50:55 -07002099 continue;
2100
Eric W. Biederman15e47302012-09-07 20:12:54 +00002101 if (neightbl_fill_info(skb, tbl, NETLINK_CB(cb->skb).portid,
Thomas Grafca860fb2006-08-07 18:00:18 -07002102 cb->nlh->nlmsg_seq, RTM_NEWNEIGHTBL,
2103 NLM_F_MULTI) <= 0)
Thomas Grafc7fb64d2005-06-18 22:50:55 -07002104 break;
2105
Eric W. Biederman426b5302008-01-24 00:13:18 -08002106 for (nidx = 0, p = tbl->parms.next; p; p = p->next) {
YOSHIFUJI Hideaki878628f2008-03-26 03:57:35 +09002107 if (!net_eq(neigh_parms_net(p), net))
Eric W. Biederman426b5302008-01-24 00:13:18 -08002108 continue;
2109
Gautam Kachrooefc683f2009-02-06 00:52:04 -08002110 if (nidx < neigh_skip)
2111 goto next;
Thomas Grafc7fb64d2005-06-18 22:50:55 -07002112
Thomas Grafca860fb2006-08-07 18:00:18 -07002113 if (neightbl_fill_param_info(skb, tbl, p,
Eric W. Biederman15e47302012-09-07 20:12:54 +00002114 NETLINK_CB(cb->skb).portid,
Thomas Grafca860fb2006-08-07 18:00:18 -07002115 cb->nlh->nlmsg_seq,
2116 RTM_NEWNEIGHTBL,
2117 NLM_F_MULTI) <= 0)
Thomas Grafc7fb64d2005-06-18 22:50:55 -07002118 goto out;
Gautam Kachrooefc683f2009-02-06 00:52:04 -08002119 next:
2120 nidx++;
Thomas Grafc7fb64d2005-06-18 22:50:55 -07002121 }
2122
Thomas Grafca860fb2006-08-07 18:00:18 -07002123 neigh_skip = 0;
Thomas Grafc7fb64d2005-06-18 22:50:55 -07002124 }
2125out:
2126 read_unlock(&neigh_tbl_lock);
Thomas Grafca860fb2006-08-07 18:00:18 -07002127 cb->args[0] = tidx;
2128 cb->args[1] = nidx;
Thomas Grafc7fb64d2005-06-18 22:50:55 -07002129
2130 return skb->len;
2131}
Linus Torvalds1da177e2005-04-16 15:20:36 -07002132
Thomas Graf8b8aec52006-08-07 17:56:37 -07002133static int neigh_fill_info(struct sk_buff *skb, struct neighbour *neigh,
2134 u32 pid, u32 seq, int type, unsigned int flags)
Linus Torvalds1da177e2005-04-16 15:20:36 -07002135{
2136 unsigned long now = jiffies;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002137 struct nda_cacheinfo ci;
Thomas Graf8b8aec52006-08-07 17:56:37 -07002138 struct nlmsghdr *nlh;
2139 struct ndmsg *ndm;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002140
Thomas Graf8b8aec52006-08-07 17:56:37 -07002141 nlh = nlmsg_put(skb, pid, seq, type, sizeof(*ndm), flags);
2142 if (nlh == NULL)
Patrick McHardy26932562007-01-31 23:16:40 -08002143 return -EMSGSIZE;
Thomas Graf8b8aec52006-08-07 17:56:37 -07002144
2145 ndm = nlmsg_data(nlh);
2146 ndm->ndm_family = neigh->ops->family;
Patrick McHardy9ef1d4c2005-06-28 12:55:30 -07002147 ndm->ndm_pad1 = 0;
2148 ndm->ndm_pad2 = 0;
Thomas Graf8b8aec52006-08-07 17:56:37 -07002149 ndm->ndm_flags = neigh->flags;
2150 ndm->ndm_type = neigh->type;
2151 ndm->ndm_ifindex = neigh->dev->ifindex;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002152
David S. Miller9a6308d2012-04-01 20:06:28 -04002153 if (nla_put(skb, NDA_DST, neigh->tbl->key_len, neigh->primary_key))
2154 goto nla_put_failure;
Thomas Graf8b8aec52006-08-07 17:56:37 -07002155
2156 read_lock_bh(&neigh->lock);
2157 ndm->ndm_state = neigh->nud_state;
Eric Dumazet0ed8ddf2010-10-07 10:44:07 +00002158 if (neigh->nud_state & NUD_VALID) {
2159 char haddr[MAX_ADDR_LEN];
2160
2161 neigh_ha_snapshot(haddr, neigh, neigh->dev);
2162 if (nla_put(skb, NDA_LLADDR, neigh->dev->addr_len, haddr) < 0) {
2163 read_unlock_bh(&neigh->lock);
2164 goto nla_put_failure;
2165 }
Thomas Graf8b8aec52006-08-07 17:56:37 -07002166 }
2167
Stephen Hemmingerb9f5f522008-06-03 16:03:15 -07002168 ci.ndm_used = jiffies_to_clock_t(now - neigh->used);
2169 ci.ndm_confirmed = jiffies_to_clock_t(now - neigh->confirmed);
2170 ci.ndm_updated = jiffies_to_clock_t(now - neigh->updated);
Thomas Graf8b8aec52006-08-07 17:56:37 -07002171 ci.ndm_refcnt = atomic_read(&neigh->refcnt) - 1;
2172 read_unlock_bh(&neigh->lock);
2173
David S. Miller9a6308d2012-04-01 20:06:28 -04002174 if (nla_put_u32(skb, NDA_PROBES, atomic_read(&neigh->probes)) ||
2175 nla_put(skb, NDA_CACHEINFO, sizeof(ci), &ci))
2176 goto nla_put_failure;
Thomas Graf8b8aec52006-08-07 17:56:37 -07002177
2178 return nlmsg_end(skb, nlh);
2179
2180nla_put_failure:
Patrick McHardy26932562007-01-31 23:16:40 -08002181 nlmsg_cancel(skb, nlh);
2182 return -EMSGSIZE;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002183}
2184
Tony Zelenoff84920c12012-01-26 22:28:58 +00002185static int pneigh_fill_info(struct sk_buff *skb, struct pneigh_entry *pn,
2186 u32 pid, u32 seq, int type, unsigned int flags,
2187 struct neigh_table *tbl)
2188{
2189 struct nlmsghdr *nlh;
2190 struct ndmsg *ndm;
2191
2192 nlh = nlmsg_put(skb, pid, seq, type, sizeof(*ndm), flags);
2193 if (nlh == NULL)
2194 return -EMSGSIZE;
2195
2196 ndm = nlmsg_data(nlh);
2197 ndm->ndm_family = tbl->family;
2198 ndm->ndm_pad1 = 0;
2199 ndm->ndm_pad2 = 0;
2200 ndm->ndm_flags = pn->flags | NTF_PROXY;
2201 ndm->ndm_type = NDA_DST;
2202 ndm->ndm_ifindex = pn->dev->ifindex;
2203 ndm->ndm_state = NUD_NONE;
2204
David S. Miller9a6308d2012-04-01 20:06:28 -04002205 if (nla_put(skb, NDA_DST, tbl->key_len, pn->key))
2206 goto nla_put_failure;
Tony Zelenoff84920c12012-01-26 22:28:58 +00002207
2208 return nlmsg_end(skb, nlh);
2209
2210nla_put_failure:
2211 nlmsg_cancel(skb, nlh);
2212 return -EMSGSIZE;
2213}
2214
Thomas Grafd961db32007-08-08 23:12:56 -07002215static void neigh_update_notify(struct neighbour *neigh)
2216{
2217 call_netevent_notifiers(NETEVENT_NEIGH_UPDATE, neigh);
2218 __neigh_notify(neigh, RTM_NEWNEIGH, 0);
2219}
Linus Torvalds1da177e2005-04-16 15:20:36 -07002220
2221static int neigh_dump_table(struct neigh_table *tbl, struct sk_buff *skb,
2222 struct netlink_callback *cb)
2223{
Eric Dumazet767e97e2010-10-06 17:49:21 -07002224 struct net *net = sock_net(skb->sk);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002225 struct neighbour *n;
2226 int rc, h, s_h = cb->args[1];
2227 int idx, s_idx = idx = cb->args[2];
Eric Dumazetd6bf7812010-10-04 06:15:44 +00002228 struct neigh_hash_table *nht;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002229
Eric Dumazetd6bf7812010-10-04 06:15:44 +00002230 rcu_read_lock_bh();
2231 nht = rcu_dereference_bh(tbl->nht);
2232
Eric Dumazet4bd6683b2012-06-07 04:58:35 +00002233 for (h = s_h; h < (1 << nht->hash_shift); h++) {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002234 if (h > s_h)
2235 s_idx = 0;
Eric Dumazet767e97e2010-10-06 17:49:21 -07002236 for (n = rcu_dereference_bh(nht->hash_buckets[h]), idx = 0;
2237 n != NULL;
2238 n = rcu_dereference_bh(n->next)) {
Octavian Purdila09ad9bc2009-11-25 15:14:13 -08002239 if (!net_eq(dev_net(n->dev), net))
Eric W. Biederman426b5302008-01-24 00:13:18 -08002240 continue;
Gautam Kachrooefc683f2009-02-06 00:52:04 -08002241 if (idx < s_idx)
2242 goto next;
Eric W. Biederman15e47302012-09-07 20:12:54 +00002243 if (neigh_fill_info(skb, n, NETLINK_CB(cb->skb).portid,
Linus Torvalds1da177e2005-04-16 15:20:36 -07002244 cb->nlh->nlmsg_seq,
Jamal Hadi Salimb6544c02005-06-18 22:54:12 -07002245 RTM_NEWNEIGH,
2246 NLM_F_MULTI) <= 0) {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002247 rc = -1;
2248 goto out;
2249 }
Eric Dumazet767e97e2010-10-06 17:49:21 -07002250next:
Gautam Kachrooefc683f2009-02-06 00:52:04 -08002251 idx++;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002252 }
Linus Torvalds1da177e2005-04-16 15:20:36 -07002253 }
2254 rc = skb->len;
2255out:
Eric Dumazetd6bf7812010-10-04 06:15:44 +00002256 rcu_read_unlock_bh();
Linus Torvalds1da177e2005-04-16 15:20:36 -07002257 cb->args[1] = h;
2258 cb->args[2] = idx;
2259 return rc;
2260}
2261
Tony Zelenoff84920c12012-01-26 22:28:58 +00002262static int pneigh_dump_table(struct neigh_table *tbl, struct sk_buff *skb,
2263 struct netlink_callback *cb)
2264{
2265 struct pneigh_entry *n;
2266 struct net *net = sock_net(skb->sk);
2267 int rc, h, s_h = cb->args[3];
2268 int idx, s_idx = idx = cb->args[4];
2269
2270 read_lock_bh(&tbl->lock);
2271
Eric Dumazet4bd6683b2012-06-07 04:58:35 +00002272 for (h = s_h; h <= PNEIGH_HASHMASK; h++) {
Tony Zelenoff84920c12012-01-26 22:28:58 +00002273 if (h > s_h)
2274 s_idx = 0;
2275 for (n = tbl->phash_buckets[h], idx = 0; n; n = n->next) {
2276 if (dev_net(n->dev) != net)
2277 continue;
2278 if (idx < s_idx)
2279 goto next;
Eric W. Biederman15e47302012-09-07 20:12:54 +00002280 if (pneigh_fill_info(skb, n, NETLINK_CB(cb->skb).portid,
Tony Zelenoff84920c12012-01-26 22:28:58 +00002281 cb->nlh->nlmsg_seq,
2282 RTM_NEWNEIGH,
2283 NLM_F_MULTI, tbl) <= 0) {
2284 read_unlock_bh(&tbl->lock);
2285 rc = -1;
2286 goto out;
2287 }
2288 next:
2289 idx++;
2290 }
2291 }
2292
2293 read_unlock_bh(&tbl->lock);
2294 rc = skb->len;
2295out:
2296 cb->args[3] = h;
2297 cb->args[4] = idx;
2298 return rc;
2299
2300}
2301
Thomas Grafc8822a42007-03-22 11:50:06 -07002302static int neigh_dump_info(struct sk_buff *skb, struct netlink_callback *cb)
Linus Torvalds1da177e2005-04-16 15:20:36 -07002303{
2304 struct neigh_table *tbl;
2305 int t, family, s_t;
Tony Zelenoff84920c12012-01-26 22:28:58 +00002306 int proxy = 0;
Eric Dumazet4bd6683b2012-06-07 04:58:35 +00002307 int err;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002308
2309 read_lock(&neigh_tbl_lock);
Thomas Graf8b8aec52006-08-07 17:56:37 -07002310 family = ((struct rtgenmsg *) nlmsg_data(cb->nlh))->rtgen_family;
Tony Zelenoff84920c12012-01-26 22:28:58 +00002311
2312 /* check for full ndmsg structure presence, family member is
2313 * the same for both structures
2314 */
2315 if (nlmsg_len(cb->nlh) >= sizeof(struct ndmsg) &&
2316 ((struct ndmsg *) nlmsg_data(cb->nlh))->ndm_flags == NTF_PROXY)
2317 proxy = 1;
2318
Linus Torvalds1da177e2005-04-16 15:20:36 -07002319 s_t = cb->args[0];
2320
Eric Dumazet4bd6683b2012-06-07 04:58:35 +00002321 for (tbl = neigh_tables, t = 0; tbl;
Tony Zelenoff84920c12012-01-26 22:28:58 +00002322 tbl = tbl->next, t++) {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002323 if (t < s_t || (family && tbl->family != family))
2324 continue;
2325 if (t > s_t)
2326 memset(&cb->args[1], 0, sizeof(cb->args) -
2327 sizeof(cb->args[0]));
Tony Zelenoff84920c12012-01-26 22:28:58 +00002328 if (proxy)
2329 err = pneigh_dump_table(tbl, skb, cb);
2330 else
2331 err = neigh_dump_table(tbl, skb, cb);
Eric Dumazet4bd6683b2012-06-07 04:58:35 +00002332 if (err < 0)
2333 break;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002334 }
2335 read_unlock(&neigh_tbl_lock);
2336
2337 cb->args[0] = t;
2338 return skb->len;
2339}
2340
2341void neigh_for_each(struct neigh_table *tbl, void (*cb)(struct neighbour *, void *), void *cookie)
2342{
2343 int chain;
Eric Dumazetd6bf7812010-10-04 06:15:44 +00002344 struct neigh_hash_table *nht;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002345
Eric Dumazetd6bf7812010-10-04 06:15:44 +00002346 rcu_read_lock_bh();
2347 nht = rcu_dereference_bh(tbl->nht);
2348
Eric Dumazet767e97e2010-10-06 17:49:21 -07002349 read_lock(&tbl->lock); /* avoid resizes */
David S. Millercd089332011-07-11 01:28:12 -07002350 for (chain = 0; chain < (1 << nht->hash_shift); chain++) {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002351 struct neighbour *n;
2352
Eric Dumazet767e97e2010-10-06 17:49:21 -07002353 for (n = rcu_dereference_bh(nht->hash_buckets[chain]);
2354 n != NULL;
2355 n = rcu_dereference_bh(n->next))
Linus Torvalds1da177e2005-04-16 15:20:36 -07002356 cb(n, cookie);
2357 }
Eric Dumazetd6bf7812010-10-04 06:15:44 +00002358 read_unlock(&tbl->lock);
2359 rcu_read_unlock_bh();
Linus Torvalds1da177e2005-04-16 15:20:36 -07002360}
2361EXPORT_SYMBOL(neigh_for_each);
2362
2363/* The tbl->lock must be held as a writer and BH disabled. */
2364void __neigh_for_each_release(struct neigh_table *tbl,
2365 int (*cb)(struct neighbour *))
2366{
2367 int chain;
Eric Dumazetd6bf7812010-10-04 06:15:44 +00002368 struct neigh_hash_table *nht;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002369
Eric Dumazetd6bf7812010-10-04 06:15:44 +00002370 nht = rcu_dereference_protected(tbl->nht,
2371 lockdep_is_held(&tbl->lock));
David S. Millercd089332011-07-11 01:28:12 -07002372 for (chain = 0; chain < (1 << nht->hash_shift); chain++) {
Eric Dumazet767e97e2010-10-06 17:49:21 -07002373 struct neighbour *n;
2374 struct neighbour __rcu **np;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002375
Eric Dumazetd6bf7812010-10-04 06:15:44 +00002376 np = &nht->hash_buckets[chain];
Eric Dumazet767e97e2010-10-06 17:49:21 -07002377 while ((n = rcu_dereference_protected(*np,
2378 lockdep_is_held(&tbl->lock))) != NULL) {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002379 int release;
2380
2381 write_lock(&n->lock);
2382 release = cb(n);
2383 if (release) {
Eric Dumazet767e97e2010-10-06 17:49:21 -07002384 rcu_assign_pointer(*np,
2385 rcu_dereference_protected(n->next,
2386 lockdep_is_held(&tbl->lock)));
Linus Torvalds1da177e2005-04-16 15:20:36 -07002387 n->dead = 1;
2388 } else
2389 np = &n->next;
2390 write_unlock(&n->lock);
Thomas Graf4f494552007-08-08 23:12:36 -07002391 if (release)
2392 neigh_cleanup_and_release(n);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002393 }
2394 }
2395}
2396EXPORT_SYMBOL(__neigh_for_each_release);
2397
2398#ifdef CONFIG_PROC_FS
2399
2400static struct neighbour *neigh_get_first(struct seq_file *seq)
2401{
2402 struct neigh_seq_state *state = seq->private;
YOSHIFUJI Hideaki12188542008-03-26 02:36:06 +09002403 struct net *net = seq_file_net(seq);
Eric Dumazetd6bf7812010-10-04 06:15:44 +00002404 struct neigh_hash_table *nht = state->nht;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002405 struct neighbour *n = NULL;
2406 int bucket = state->bucket;
2407
2408 state->flags &= ~NEIGH_SEQ_IS_PNEIGH;
David S. Millercd089332011-07-11 01:28:12 -07002409 for (bucket = 0; bucket < (1 << nht->hash_shift); bucket++) {
Eric Dumazet767e97e2010-10-06 17:49:21 -07002410 n = rcu_dereference_bh(nht->hash_buckets[bucket]);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002411
2412 while (n) {
YOSHIFUJI Hideaki878628f2008-03-26 03:57:35 +09002413 if (!net_eq(dev_net(n->dev), net))
Eric W. Biederman426b5302008-01-24 00:13:18 -08002414 goto next;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002415 if (state->neigh_sub_iter) {
2416 loff_t fakep = 0;
2417 void *v;
2418
2419 v = state->neigh_sub_iter(state, n, &fakep);
2420 if (!v)
2421 goto next;
2422 }
2423 if (!(state->flags & NEIGH_SEQ_SKIP_NOARP))
2424 break;
2425 if (n->nud_state & ~NUD_NOARP)
2426 break;
Eric Dumazet767e97e2010-10-06 17:49:21 -07002427next:
2428 n = rcu_dereference_bh(n->next);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002429 }
2430
2431 if (n)
2432 break;
2433 }
2434 state->bucket = bucket;
2435
2436 return n;
2437}
2438
2439static struct neighbour *neigh_get_next(struct seq_file *seq,
2440 struct neighbour *n,
2441 loff_t *pos)
2442{
2443 struct neigh_seq_state *state = seq->private;
YOSHIFUJI Hideaki12188542008-03-26 02:36:06 +09002444 struct net *net = seq_file_net(seq);
Eric Dumazetd6bf7812010-10-04 06:15:44 +00002445 struct neigh_hash_table *nht = state->nht;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002446
2447 if (state->neigh_sub_iter) {
2448 void *v = state->neigh_sub_iter(state, n, pos);
2449 if (v)
2450 return n;
2451 }
Eric Dumazet767e97e2010-10-06 17:49:21 -07002452 n = rcu_dereference_bh(n->next);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002453
2454 while (1) {
2455 while (n) {
YOSHIFUJI Hideaki878628f2008-03-26 03:57:35 +09002456 if (!net_eq(dev_net(n->dev), net))
Eric W. Biederman426b5302008-01-24 00:13:18 -08002457 goto next;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002458 if (state->neigh_sub_iter) {
2459 void *v = state->neigh_sub_iter(state, n, pos);
2460 if (v)
2461 return n;
2462 goto next;
2463 }
2464 if (!(state->flags & NEIGH_SEQ_SKIP_NOARP))
2465 break;
2466
2467 if (n->nud_state & ~NUD_NOARP)
2468 break;
Eric Dumazet767e97e2010-10-06 17:49:21 -07002469next:
2470 n = rcu_dereference_bh(n->next);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002471 }
2472
2473 if (n)
2474 break;
2475
David S. Millercd089332011-07-11 01:28:12 -07002476 if (++state->bucket >= (1 << nht->hash_shift))
Linus Torvalds1da177e2005-04-16 15:20:36 -07002477 break;
2478
Eric Dumazet767e97e2010-10-06 17:49:21 -07002479 n = rcu_dereference_bh(nht->hash_buckets[state->bucket]);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002480 }
2481
2482 if (n && pos)
2483 --(*pos);
2484 return n;
2485}
2486
2487static struct neighbour *neigh_get_idx(struct seq_file *seq, loff_t *pos)
2488{
2489 struct neighbour *n = neigh_get_first(seq);
2490
2491 if (n) {
Chris Larson745e2032008-08-03 01:10:55 -07002492 --(*pos);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002493 while (*pos) {
2494 n = neigh_get_next(seq, n, pos);
2495 if (!n)
2496 break;
2497 }
2498 }
2499 return *pos ? NULL : n;
2500}
2501
2502static struct pneigh_entry *pneigh_get_first(struct seq_file *seq)
2503{
2504 struct neigh_seq_state *state = seq->private;
YOSHIFUJI Hideaki12188542008-03-26 02:36:06 +09002505 struct net *net = seq_file_net(seq);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002506 struct neigh_table *tbl = state->tbl;
2507 struct pneigh_entry *pn = NULL;
2508 int bucket = state->bucket;
2509
2510 state->flags |= NEIGH_SEQ_IS_PNEIGH;
2511 for (bucket = 0; bucket <= PNEIGH_HASHMASK; bucket++) {
2512 pn = tbl->phash_buckets[bucket];
YOSHIFUJI Hideaki878628f2008-03-26 03:57:35 +09002513 while (pn && !net_eq(pneigh_net(pn), net))
Eric W. Biederman426b5302008-01-24 00:13:18 -08002514 pn = pn->next;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002515 if (pn)
2516 break;
2517 }
2518 state->bucket = bucket;
2519
2520 return pn;
2521}
2522
2523static struct pneigh_entry *pneigh_get_next(struct seq_file *seq,
2524 struct pneigh_entry *pn,
2525 loff_t *pos)
2526{
2527 struct neigh_seq_state *state = seq->private;
YOSHIFUJI Hideaki12188542008-03-26 02:36:06 +09002528 struct net *net = seq_file_net(seq);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002529 struct neigh_table *tbl = state->tbl;
2530
Jorge Boncompte [DTI2]df07a942011-11-25 13:24:49 -05002531 do {
2532 pn = pn->next;
2533 } while (pn && !net_eq(pneigh_net(pn), net));
2534
Linus Torvalds1da177e2005-04-16 15:20:36 -07002535 while (!pn) {
2536 if (++state->bucket > PNEIGH_HASHMASK)
2537 break;
2538 pn = tbl->phash_buckets[state->bucket];
YOSHIFUJI Hideaki878628f2008-03-26 03:57:35 +09002539 while (pn && !net_eq(pneigh_net(pn), net))
Eric W. Biederman426b5302008-01-24 00:13:18 -08002540 pn = pn->next;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002541 if (pn)
2542 break;
2543 }
2544
2545 if (pn && pos)
2546 --(*pos);
2547
2548 return pn;
2549}
2550
2551static struct pneigh_entry *pneigh_get_idx(struct seq_file *seq, loff_t *pos)
2552{
2553 struct pneigh_entry *pn = pneigh_get_first(seq);
2554
2555 if (pn) {
Chris Larson745e2032008-08-03 01:10:55 -07002556 --(*pos);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002557 while (*pos) {
2558 pn = pneigh_get_next(seq, pn, pos);
2559 if (!pn)
2560 break;
2561 }
2562 }
2563 return *pos ? NULL : pn;
2564}
2565
2566static void *neigh_get_idx_any(struct seq_file *seq, loff_t *pos)
2567{
2568 struct neigh_seq_state *state = seq->private;
2569 void *rc;
Chris Larson745e2032008-08-03 01:10:55 -07002570 loff_t idxpos = *pos;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002571
Chris Larson745e2032008-08-03 01:10:55 -07002572 rc = neigh_get_idx(seq, &idxpos);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002573 if (!rc && !(state->flags & NEIGH_SEQ_NEIGH_ONLY))
Chris Larson745e2032008-08-03 01:10:55 -07002574 rc = pneigh_get_idx(seq, &idxpos);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002575
2576 return rc;
2577}
2578
2579void *neigh_seq_start(struct seq_file *seq, loff_t *pos, struct neigh_table *tbl, unsigned int neigh_seq_flags)
Eric Dumazetd6bf7812010-10-04 06:15:44 +00002580 __acquires(rcu_bh)
Linus Torvalds1da177e2005-04-16 15:20:36 -07002581{
2582 struct neigh_seq_state *state = seq->private;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002583
2584 state->tbl = tbl;
2585 state->bucket = 0;
2586 state->flags = (neigh_seq_flags & ~NEIGH_SEQ_IS_PNEIGH);
2587
Eric Dumazetd6bf7812010-10-04 06:15:44 +00002588 rcu_read_lock_bh();
2589 state->nht = rcu_dereference_bh(tbl->nht);
Eric Dumazet767e97e2010-10-06 17:49:21 -07002590
Chris Larson745e2032008-08-03 01:10:55 -07002591 return *pos ? neigh_get_idx_any(seq, pos) : SEQ_START_TOKEN;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002592}
2593EXPORT_SYMBOL(neigh_seq_start);
2594
2595void *neigh_seq_next(struct seq_file *seq, void *v, loff_t *pos)
2596{
2597 struct neigh_seq_state *state;
2598 void *rc;
2599
2600 if (v == SEQ_START_TOKEN) {
Chris Larsonbff69732008-08-03 01:02:41 -07002601 rc = neigh_get_first(seq);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002602 goto out;
2603 }
2604
2605 state = seq->private;
2606 if (!(state->flags & NEIGH_SEQ_IS_PNEIGH)) {
2607 rc = neigh_get_next(seq, v, NULL);
2608 if (rc)
2609 goto out;
2610 if (!(state->flags & NEIGH_SEQ_NEIGH_ONLY))
2611 rc = pneigh_get_first(seq);
2612 } else {
2613 BUG_ON(state->flags & NEIGH_SEQ_NEIGH_ONLY);
2614 rc = pneigh_get_next(seq, v, NULL);
2615 }
2616out:
2617 ++(*pos);
2618 return rc;
2619}
2620EXPORT_SYMBOL(neigh_seq_next);
2621
2622void neigh_seq_stop(struct seq_file *seq, void *v)
Eric Dumazetd6bf7812010-10-04 06:15:44 +00002623 __releases(rcu_bh)
Linus Torvalds1da177e2005-04-16 15:20:36 -07002624{
Eric Dumazetd6bf7812010-10-04 06:15:44 +00002625 rcu_read_unlock_bh();
Linus Torvalds1da177e2005-04-16 15:20:36 -07002626}
2627EXPORT_SYMBOL(neigh_seq_stop);
2628
2629/* statistics via seq_file */
2630
2631static void *neigh_stat_seq_start(struct seq_file *seq, loff_t *pos)
2632{
Alexey Dobriyan81c1ebf2010-01-22 10:16:05 +00002633 struct neigh_table *tbl = seq->private;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002634 int cpu;
2635
2636 if (*pos == 0)
2637 return SEQ_START_TOKEN;
YOSHIFUJI Hideaki4ec93ed2007-02-09 23:24:36 +09002638
Rusty Russell0f23174a2008-12-29 12:23:42 +00002639 for (cpu = *pos-1; cpu < nr_cpu_ids; ++cpu) {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002640 if (!cpu_possible(cpu))
2641 continue;
2642 *pos = cpu+1;
2643 return per_cpu_ptr(tbl->stats, cpu);
2644 }
2645 return NULL;
2646}
2647
2648static void *neigh_stat_seq_next(struct seq_file *seq, void *v, loff_t *pos)
2649{
Alexey Dobriyan81c1ebf2010-01-22 10:16:05 +00002650 struct neigh_table *tbl = seq->private;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002651 int cpu;
2652
Rusty Russell0f23174a2008-12-29 12:23:42 +00002653 for (cpu = *pos; cpu < nr_cpu_ids; ++cpu) {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002654 if (!cpu_possible(cpu))
2655 continue;
2656 *pos = cpu+1;
2657 return per_cpu_ptr(tbl->stats, cpu);
2658 }
2659 return NULL;
2660}
2661
/* seq_file ->stop for the statistics file: there is nothing to release. */
static void neigh_stat_seq_stop(struct seq_file *seq, void *v)
{
}
2666
2667static int neigh_stat_seq_show(struct seq_file *seq, void *v)
2668{
Alexey Dobriyan81c1ebf2010-01-22 10:16:05 +00002669 struct neigh_table *tbl = seq->private;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002670 struct neigh_statistics *st = v;
2671
2672 if (v == SEQ_START_TOKEN) {
Neil Horman9a6d2762008-07-16 20:50:49 -07002673 seq_printf(seq, "entries allocs destroys hash_grows lookups hits res_failed rcv_probes_mcast rcv_probes_ucast periodic_gc_runs forced_gc_runs unresolved_discards\n");
Linus Torvalds1da177e2005-04-16 15:20:36 -07002674 return 0;
2675 }
2676
2677 seq_printf(seq, "%08x %08lx %08lx %08lx %08lx %08lx %08lx "
Neil Horman9a6d2762008-07-16 20:50:49 -07002678 "%08lx %08lx %08lx %08lx %08lx\n",
Linus Torvalds1da177e2005-04-16 15:20:36 -07002679 atomic_read(&tbl->entries),
2680
2681 st->allocs,
2682 st->destroys,
2683 st->hash_grows,
2684
2685 st->lookups,
2686 st->hits,
2687
2688 st->res_failed,
2689
2690 st->rcv_probes_mcast,
2691 st->rcv_probes_ucast,
2692
2693 st->periodic_gc_runs,
Neil Horman9a6d2762008-07-16 20:50:49 -07002694 st->forced_gc_runs,
2695 st->unres_discards
Linus Torvalds1da177e2005-04-16 15:20:36 -07002696 );
2697
2698 return 0;
2699}
2700
Stephen Hemmingerf6908082007-03-12 14:34:29 -07002701static const struct seq_operations neigh_stat_seq_ops = {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002702 .start = neigh_stat_seq_start,
2703 .next = neigh_stat_seq_next,
2704 .stop = neigh_stat_seq_stop,
2705 .show = neigh_stat_seq_show,
2706};
2707
2708static int neigh_stat_seq_open(struct inode *inode, struct file *file)
2709{
2710 int ret = seq_open(file, &neigh_stat_seq_ops);
2711
2712 if (!ret) {
2713 struct seq_file *sf = file->private_data;
Al Virod9dda782013-03-31 18:16:14 -04002714 sf->private = PDE_DATA(inode);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002715 }
2716 return ret;
2717};
2718
Arjan van de Ven9a321442007-02-12 00:55:35 -08002719static const struct file_operations neigh_stat_seq_fops = {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002720 .owner = THIS_MODULE,
2721 .open = neigh_stat_seq_open,
2722 .read = seq_read,
2723 .llseek = seq_lseek,
2724 .release = seq_release,
2725};
2726
2727#endif /* CONFIG_PROC_FS */
2728
Thomas Graf339bf982006-11-10 14:10:15 -08002729static inline size_t neigh_nlmsg_size(void)
2730{
2731 return NLMSG_ALIGN(sizeof(struct ndmsg))
2732 + nla_total_size(MAX_ADDR_LEN) /* NDA_DST */
2733 + nla_total_size(MAX_ADDR_LEN) /* NDA_LLADDR */
2734 + nla_total_size(sizeof(struct nda_cacheinfo))
2735 + nla_total_size(4); /* NDA_PROBES */
2736}
2737
Thomas Grafb8673312006-08-15 00:33:14 -07002738static void __neigh_notify(struct neighbour *n, int type, int flags)
Linus Torvalds1da177e2005-04-16 15:20:36 -07002739{
YOSHIFUJI Hideakic346dca2008-03-25 21:47:49 +09002740 struct net *net = dev_net(n->dev);
Thomas Graf8b8aec52006-08-07 17:56:37 -07002741 struct sk_buff *skb;
Thomas Grafb8673312006-08-15 00:33:14 -07002742 int err = -ENOBUFS;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002743
Thomas Graf339bf982006-11-10 14:10:15 -08002744 skb = nlmsg_new(neigh_nlmsg_size(), GFP_ATOMIC);
Thomas Graf8b8aec52006-08-07 17:56:37 -07002745 if (skb == NULL)
Thomas Grafb8673312006-08-15 00:33:14 -07002746 goto errout;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002747
Thomas Grafb8673312006-08-15 00:33:14 -07002748 err = neigh_fill_info(skb, n, 0, 0, type, flags);
Patrick McHardy26932562007-01-31 23:16:40 -08002749 if (err < 0) {
2750 /* -EMSGSIZE implies BUG in neigh_nlmsg_size() */
2751 WARN_ON(err == -EMSGSIZE);
2752 kfree_skb(skb);
2753 goto errout;
2754 }
Pablo Neira Ayuso1ce85fe2009-02-24 23:18:28 -08002755 rtnl_notify(skb, net, 0, RTNLGRP_NEIGH, NULL, GFP_ATOMIC);
2756 return;
Thomas Grafb8673312006-08-15 00:33:14 -07002757errout:
2758 if (err < 0)
Eric W. Biederman426b5302008-01-24 00:13:18 -08002759 rtnl_set_sk_err(net, RTNLGRP_NEIGH, err);
Thomas Grafb8673312006-08-15 00:33:14 -07002760}
2761
2762void neigh_app_ns(struct neighbour *n)
2763{
2764 __neigh_notify(n, RTM_GETNEIGH, NLM_F_REQUEST);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002765}
YOSHIFUJI Hideaki0a204502008-03-24 18:39:10 +09002766EXPORT_SYMBOL(neigh_app_ns);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002767
2768#ifdef CONFIG_SYSCTL
Cong Wangb93196d2012-12-06 10:04:04 +08002769static int zero;
Francesco Fusco555445c2013-07-24 10:39:06 +02002770static int int_max = INT_MAX;
Cong Wangb93196d2012-12-06 10:04:04 +08002771static int unres_qlen_max = INT_MAX / SKB_TRUESIZE(ETH_FRAME_LEN);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002772
Joe Perchesfe2c6332013-06-11 23:04:25 -07002773static int proc_unres_qlen(struct ctl_table *ctl, int write,
2774 void __user *buffer, size_t *lenp, loff_t *ppos)
Eric Dumazet8b5c1712011-11-09 12:07:14 +00002775{
2776 int size, ret;
Joe Perchesfe2c6332013-06-11 23:04:25 -07002777 struct ctl_table tmp = *ctl;
Eric Dumazet8b5c1712011-11-09 12:07:14 +00002778
Shan Weice46cc62012-12-04 18:49:15 +00002779 tmp.extra1 = &zero;
2780 tmp.extra2 = &unres_qlen_max;
Eric Dumazet8b5c1712011-11-09 12:07:14 +00002781 tmp.data = &size;
Shan Weice46cc62012-12-04 18:49:15 +00002782
2783 size = *(int *)ctl->data / SKB_TRUESIZE(ETH_FRAME_LEN);
2784 ret = proc_dointvec_minmax(&tmp, write, buffer, lenp, ppos);
2785
Eric Dumazet8b5c1712011-11-09 12:07:14 +00002786 if (write && !ret)
2787 *(int *)ctl->data = size * SKB_TRUESIZE(ETH_FRAME_LEN);
2788 return ret;
2789}
2790
/*
 * Indices into neigh_sysctl_table.neigh_vars[]; the trailing comment on
 * each value is the procname of the entry stored at that index.
 */
enum {
	NEIGH_VAR_MCAST_PROBE,			/* mcast_solicit */
	NEIGH_VAR_UCAST_PROBE,			/* ucast_solicit */
	NEIGH_VAR_APP_PROBE,			/* app_solicit */
	NEIGH_VAR_RETRANS_TIME,			/* retrans_time */
	NEIGH_VAR_BASE_REACHABLE_TIME,		/* base_reachable_time */
	NEIGH_VAR_DELAY_PROBE_TIME,		/* delay_first_probe_time */
	NEIGH_VAR_GC_STALETIME,			/* gc_stale_time */
	NEIGH_VAR_QUEUE_LEN,			/* unres_qlen */
	NEIGH_VAR_QUEUE_LEN_BYTES,		/* unres_qlen_bytes */
	NEIGH_VAR_PROXY_QLEN,			/* proxy_qlen */
	NEIGH_VAR_ANYCAST_DELAY,		/* anycast_delay */
	NEIGH_VAR_PROXY_DELAY,			/* proxy_delay */
	NEIGH_VAR_LOCKTIME,			/* locktime */
	NEIGH_VAR_RETRANS_TIME_MS,		/* retrans_time_ms */
	NEIGH_VAR_BASE_REACHABLE_TIME_MS,	/* base_reachable_time_ms */
	NEIGH_VAR_GC_INTERVAL,			/* gc_interval */
	NEIGH_VAR_GC_THRESH1,			/* gc_thresh1 */
	NEIGH_VAR_GC_THRESH2,			/* gc_thresh2 */
	NEIGH_VAR_GC_THRESH3,			/* gc_thresh3 */
	NEIGH_VAR_MAX				/* number of variables */
};
Eric W. Biederman54716e32010-02-14 03:27:03 +00002813
Linus Torvalds1da177e2005-04-16 15:20:36 -07002814static struct neigh_sysctl_table {
2815 struct ctl_table_header *sysctl_header;
Eric Dumazet8b5c1712011-11-09 12:07:14 +00002816 struct ctl_table neigh_vars[NEIGH_VAR_MAX + 1];
Brian Haleyab32ea52006-09-22 14:15:41 -07002817} neigh_sysctl_template __read_mostly = {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002818 .neigh_vars = {
Eric Dumazet8b5c1712011-11-09 12:07:14 +00002819 [NEIGH_VAR_MCAST_PROBE] = {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002820 .procname = "mcast_solicit",
2821 .maxlen = sizeof(int),
2822 .mode = 0644,
Francesco Fusco555445c2013-07-24 10:39:06 +02002823 .extra1 = &zero,
2824 .extra2 = &int_max,
2825 .proc_handler = proc_dointvec_minmax,
Linus Torvalds1da177e2005-04-16 15:20:36 -07002826 },
Eric Dumazet8b5c1712011-11-09 12:07:14 +00002827 [NEIGH_VAR_UCAST_PROBE] = {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002828 .procname = "ucast_solicit",
2829 .maxlen = sizeof(int),
2830 .mode = 0644,
Francesco Fusco555445c2013-07-24 10:39:06 +02002831 .extra1 = &zero,
2832 .extra2 = &int_max,
2833 .proc_handler = proc_dointvec_minmax,
Linus Torvalds1da177e2005-04-16 15:20:36 -07002834 },
Eric Dumazet8b5c1712011-11-09 12:07:14 +00002835 [NEIGH_VAR_APP_PROBE] = {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002836 .procname = "app_solicit",
2837 .maxlen = sizeof(int),
2838 .mode = 0644,
Francesco Fusco555445c2013-07-24 10:39:06 +02002839 .extra1 = &zero,
2840 .extra2 = &int_max,
2841 .proc_handler = proc_dointvec_minmax,
Linus Torvalds1da177e2005-04-16 15:20:36 -07002842 },
Eric Dumazet8b5c1712011-11-09 12:07:14 +00002843 [NEIGH_VAR_RETRANS_TIME] = {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002844 .procname = "retrans_time",
2845 .maxlen = sizeof(int),
2846 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -08002847 .proc_handler = proc_dointvec_userhz_jiffies,
Linus Torvalds1da177e2005-04-16 15:20:36 -07002848 },
Eric Dumazet8b5c1712011-11-09 12:07:14 +00002849 [NEIGH_VAR_BASE_REACHABLE_TIME] = {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002850 .procname = "base_reachable_time",
2851 .maxlen = sizeof(int),
2852 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -08002853 .proc_handler = proc_dointvec_jiffies,
Linus Torvalds1da177e2005-04-16 15:20:36 -07002854 },
Eric Dumazet8b5c1712011-11-09 12:07:14 +00002855 [NEIGH_VAR_DELAY_PROBE_TIME] = {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002856 .procname = "delay_first_probe_time",
2857 .maxlen = sizeof(int),
2858 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -08002859 .proc_handler = proc_dointvec_jiffies,
Linus Torvalds1da177e2005-04-16 15:20:36 -07002860 },
Eric Dumazet8b5c1712011-11-09 12:07:14 +00002861 [NEIGH_VAR_GC_STALETIME] = {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002862 .procname = "gc_stale_time",
2863 .maxlen = sizeof(int),
2864 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -08002865 .proc_handler = proc_dointvec_jiffies,
Linus Torvalds1da177e2005-04-16 15:20:36 -07002866 },
Eric Dumazet8b5c1712011-11-09 12:07:14 +00002867 [NEIGH_VAR_QUEUE_LEN] = {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002868 .procname = "unres_qlen",
2869 .maxlen = sizeof(int),
2870 .mode = 0644,
Eric Dumazet8b5c1712011-11-09 12:07:14 +00002871 .proc_handler = proc_unres_qlen,
2872 },
2873 [NEIGH_VAR_QUEUE_LEN_BYTES] = {
2874 .procname = "unres_qlen_bytes",
2875 .maxlen = sizeof(int),
2876 .mode = 0644,
Shan Weice46cc62012-12-04 18:49:15 +00002877 .extra1 = &zero,
2878 .proc_handler = proc_dointvec_minmax,
Linus Torvalds1da177e2005-04-16 15:20:36 -07002879 },
Eric Dumazet8b5c1712011-11-09 12:07:14 +00002880 [NEIGH_VAR_PROXY_QLEN] = {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002881 .procname = "proxy_qlen",
2882 .maxlen = sizeof(int),
2883 .mode = 0644,
Francesco Fusco555445c2013-07-24 10:39:06 +02002884 .extra1 = &zero,
2885 .extra2 = &int_max,
2886 .proc_handler = proc_dointvec_minmax,
Linus Torvalds1da177e2005-04-16 15:20:36 -07002887 },
Eric Dumazet8b5c1712011-11-09 12:07:14 +00002888 [NEIGH_VAR_ANYCAST_DELAY] = {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002889 .procname = "anycast_delay",
2890 .maxlen = sizeof(int),
2891 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -08002892 .proc_handler = proc_dointvec_userhz_jiffies,
Linus Torvalds1da177e2005-04-16 15:20:36 -07002893 },
Eric Dumazet8b5c1712011-11-09 12:07:14 +00002894 [NEIGH_VAR_PROXY_DELAY] = {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002895 .procname = "proxy_delay",
2896 .maxlen = sizeof(int),
2897 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -08002898 .proc_handler = proc_dointvec_userhz_jiffies,
Linus Torvalds1da177e2005-04-16 15:20:36 -07002899 },
Eric Dumazet8b5c1712011-11-09 12:07:14 +00002900 [NEIGH_VAR_LOCKTIME] = {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002901 .procname = "locktime",
2902 .maxlen = sizeof(int),
2903 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -08002904 .proc_handler = proc_dointvec_userhz_jiffies,
Linus Torvalds1da177e2005-04-16 15:20:36 -07002905 },
Eric Dumazet8b5c1712011-11-09 12:07:14 +00002906 [NEIGH_VAR_RETRANS_TIME_MS] = {
Eric W. Biedermand12af672007-10-18 03:05:25 -07002907 .procname = "retrans_time_ms",
2908 .maxlen = sizeof(int),
2909 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -08002910 .proc_handler = proc_dointvec_ms_jiffies,
Eric W. Biedermand12af672007-10-18 03:05:25 -07002911 },
Eric Dumazet8b5c1712011-11-09 12:07:14 +00002912 [NEIGH_VAR_BASE_REACHABLE_TIME_MS] = {
Eric W. Biedermand12af672007-10-18 03:05:25 -07002913 .procname = "base_reachable_time_ms",
2914 .maxlen = sizeof(int),
2915 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -08002916 .proc_handler = proc_dointvec_ms_jiffies,
Eric W. Biedermand12af672007-10-18 03:05:25 -07002917 },
Eric Dumazet8b5c1712011-11-09 12:07:14 +00002918 [NEIGH_VAR_GC_INTERVAL] = {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002919 .procname = "gc_interval",
2920 .maxlen = sizeof(int),
2921 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -08002922 .proc_handler = proc_dointvec_jiffies,
Linus Torvalds1da177e2005-04-16 15:20:36 -07002923 },
Eric Dumazet8b5c1712011-11-09 12:07:14 +00002924 [NEIGH_VAR_GC_THRESH1] = {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002925 .procname = "gc_thresh1",
2926 .maxlen = sizeof(int),
2927 .mode = 0644,
Francesco Fusco555445c2013-07-24 10:39:06 +02002928 .extra1 = &zero,
2929 .extra2 = &int_max,
2930 .proc_handler = proc_dointvec_minmax,
Linus Torvalds1da177e2005-04-16 15:20:36 -07002931 },
Eric Dumazet8b5c1712011-11-09 12:07:14 +00002932 [NEIGH_VAR_GC_THRESH2] = {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002933 .procname = "gc_thresh2",
2934 .maxlen = sizeof(int),
2935 .mode = 0644,
Francesco Fusco555445c2013-07-24 10:39:06 +02002936 .extra1 = &zero,
2937 .extra2 = &int_max,
2938 .proc_handler = proc_dointvec_minmax,
Linus Torvalds1da177e2005-04-16 15:20:36 -07002939 },
Eric Dumazet8b5c1712011-11-09 12:07:14 +00002940 [NEIGH_VAR_GC_THRESH3] = {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002941 .procname = "gc_thresh3",
2942 .maxlen = sizeof(int),
2943 .mode = 0644,
Francesco Fusco555445c2013-07-24 10:39:06 +02002944 .extra1 = &zero,
2945 .extra2 = &int_max,
2946 .proc_handler = proc_dointvec_minmax,
Linus Torvalds1da177e2005-04-16 15:20:36 -07002947 },
Pavel Emelyanovc3bac5a2007-12-02 00:08:16 +11002948 {},
Linus Torvalds1da177e2005-04-16 15:20:36 -07002949 },
2950};
2951
2952int neigh_sysctl_register(struct net_device *dev, struct neigh_parms *p,
Eric W. Biederman54716e32010-02-14 03:27:03 +00002953 char *p_name, proc_handler *handler)
Linus Torvalds1da177e2005-04-16 15:20:36 -07002954{
Pavel Emelyanov3c607bb2007-12-02 00:06:34 +11002955 struct neigh_sysctl_table *t;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002956 const char *dev_name_source = NULL;
Eric W. Biederman8f40a1f2012-04-19 13:38:03 +00002957 char neigh_path[ sizeof("net//neigh/") + IFNAMSIZ + IFNAMSIZ ];
Linus Torvalds1da177e2005-04-16 15:20:36 -07002958
Pavel Emelyanov3c607bb2007-12-02 00:06:34 +11002959 t = kmemdup(&neigh_sysctl_template, sizeof(*t), GFP_KERNEL);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002960 if (!t)
Pavel Emelyanov3c607bb2007-12-02 00:06:34 +11002961 goto err;
2962
Eric Dumazet8b5c1712011-11-09 12:07:14 +00002963 t->neigh_vars[NEIGH_VAR_MCAST_PROBE].data = &p->mcast_probes;
2964 t->neigh_vars[NEIGH_VAR_UCAST_PROBE].data = &p->ucast_probes;
2965 t->neigh_vars[NEIGH_VAR_APP_PROBE].data = &p->app_probes;
2966 t->neigh_vars[NEIGH_VAR_RETRANS_TIME].data = &p->retrans_time;
2967 t->neigh_vars[NEIGH_VAR_BASE_REACHABLE_TIME].data = &p->base_reachable_time;
2968 t->neigh_vars[NEIGH_VAR_DELAY_PROBE_TIME].data = &p->delay_probe_time;
2969 t->neigh_vars[NEIGH_VAR_GC_STALETIME].data = &p->gc_staletime;
2970 t->neigh_vars[NEIGH_VAR_QUEUE_LEN].data = &p->queue_len_bytes;
2971 t->neigh_vars[NEIGH_VAR_QUEUE_LEN_BYTES].data = &p->queue_len_bytes;
2972 t->neigh_vars[NEIGH_VAR_PROXY_QLEN].data = &p->proxy_qlen;
2973 t->neigh_vars[NEIGH_VAR_ANYCAST_DELAY].data = &p->anycast_delay;
2974 t->neigh_vars[NEIGH_VAR_PROXY_DELAY].data = &p->proxy_delay;
2975 t->neigh_vars[NEIGH_VAR_LOCKTIME].data = &p->locktime;
2976 t->neigh_vars[NEIGH_VAR_RETRANS_TIME_MS].data = &p->retrans_time;
2977 t->neigh_vars[NEIGH_VAR_BASE_REACHABLE_TIME_MS].data = &p->base_reachable_time;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002978
2979 if (dev) {
2980 dev_name_source = dev->name;
Eric W. Biedermand12af672007-10-18 03:05:25 -07002981 /* Terminate the table early */
Eric Dumazet8b5c1712011-11-09 12:07:14 +00002982 memset(&t->neigh_vars[NEIGH_VAR_GC_INTERVAL], 0,
2983 sizeof(t->neigh_vars[NEIGH_VAR_GC_INTERVAL]));
Linus Torvalds1da177e2005-04-16 15:20:36 -07002984 } else {
Eric W. Biederman8f40a1f2012-04-19 13:38:03 +00002985 dev_name_source = "default";
Eric Dumazet8b5c1712011-11-09 12:07:14 +00002986 t->neigh_vars[NEIGH_VAR_GC_INTERVAL].data = (int *)(p + 1);
2987 t->neigh_vars[NEIGH_VAR_GC_THRESH1].data = (int *)(p + 1) + 1;
2988 t->neigh_vars[NEIGH_VAR_GC_THRESH2].data = (int *)(p + 1) + 2;
2989 t->neigh_vars[NEIGH_VAR_GC_THRESH3].data = (int *)(p + 1) + 3;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002990 }
2991
Linus Torvalds1da177e2005-04-16 15:20:36 -07002992
Eric W. Biedermanf8572d82009-11-05 13:32:03 -08002993 if (handler) {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002994 /* RetransTime */
Eric Dumazet8b5c1712011-11-09 12:07:14 +00002995 t->neigh_vars[NEIGH_VAR_RETRANS_TIME].proc_handler = handler;
2996 t->neigh_vars[NEIGH_VAR_RETRANS_TIME].extra1 = dev;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002997 /* ReachableTime */
Eric Dumazet8b5c1712011-11-09 12:07:14 +00002998 t->neigh_vars[NEIGH_VAR_BASE_REACHABLE_TIME].proc_handler = handler;
2999 t->neigh_vars[NEIGH_VAR_BASE_REACHABLE_TIME].extra1 = dev;
Linus Torvalds1da177e2005-04-16 15:20:36 -07003000 /* RetransTime (in milliseconds)*/
Eric Dumazet8b5c1712011-11-09 12:07:14 +00003001 t->neigh_vars[NEIGH_VAR_RETRANS_TIME_MS].proc_handler = handler;
3002 t->neigh_vars[NEIGH_VAR_RETRANS_TIME_MS].extra1 = dev;
Linus Torvalds1da177e2005-04-16 15:20:36 -07003003 /* ReachableTime (in milliseconds) */
Eric Dumazet8b5c1712011-11-09 12:07:14 +00003004 t->neigh_vars[NEIGH_VAR_BASE_REACHABLE_TIME_MS].proc_handler = handler;
3005 t->neigh_vars[NEIGH_VAR_BASE_REACHABLE_TIME_MS].extra1 = dev;
Linus Torvalds1da177e2005-04-16 15:20:36 -07003006 }
3007
Eric W. Biederman464dc802012-11-16 03:02:59 +00003008 /* Don't export sysctls to unprivileged users */
3009 if (neigh_parms_net(p)->user_ns != &init_user_ns)
3010 t->neigh_vars[0].procname = NULL;
3011
Eric W. Biederman8f40a1f2012-04-19 13:38:03 +00003012 snprintf(neigh_path, sizeof(neigh_path), "net/%s/neigh/%s",
3013 p_name, dev_name_source);
Denis V. Lunev4ab438f2008-02-28 20:48:01 -08003014 t->sysctl_header =
Eric W. Biederman8f40a1f2012-04-19 13:38:03 +00003015 register_net_sysctl(neigh_parms_net(p), neigh_path, t->neigh_vars);
Pavel Emelyanov3c607bb2007-12-02 00:06:34 +11003016 if (!t->sysctl_header)
Eric W. Biederman8f40a1f2012-04-19 13:38:03 +00003017 goto free;
Pavel Emelyanov3c607bb2007-12-02 00:06:34 +11003018
Linus Torvalds1da177e2005-04-16 15:20:36 -07003019 p->sysctl_table = t;
3020 return 0;
3021
Pavel Emelyanov3c607bb2007-12-02 00:06:34 +11003022free:
Linus Torvalds1da177e2005-04-16 15:20:36 -07003023 kfree(t);
Pavel Emelyanov3c607bb2007-12-02 00:06:34 +11003024err:
3025 return -ENOBUFS;
Linus Torvalds1da177e2005-04-16 15:20:36 -07003026}
YOSHIFUJI Hideaki0a204502008-03-24 18:39:10 +09003027EXPORT_SYMBOL(neigh_sysctl_register);
Linus Torvalds1da177e2005-04-16 15:20:36 -07003028
3029void neigh_sysctl_unregister(struct neigh_parms *p)
3030{
3031 if (p->sysctl_table) {
3032 struct neigh_sysctl_table *t = p->sysctl_table;
3033 p->sysctl_table = NULL;
Eric W. Biederman5dd3df12012-04-19 13:24:33 +00003034 unregister_net_sysctl_table(t->sysctl_header);
Linus Torvalds1da177e2005-04-16 15:20:36 -07003035 kfree(t);
3036 }
3037}
YOSHIFUJI Hideaki0a204502008-03-24 18:39:10 +09003038EXPORT_SYMBOL(neigh_sysctl_unregister);
Linus Torvalds1da177e2005-04-16 15:20:36 -07003039
3040#endif /* CONFIG_SYSCTL */
3041
Thomas Grafc8822a42007-03-22 11:50:06 -07003042static int __init neigh_init(void)
3043{
Greg Rosec7ac8672011-06-10 01:27:09 +00003044 rtnl_register(PF_UNSPEC, RTM_NEWNEIGH, neigh_add, NULL, NULL);
3045 rtnl_register(PF_UNSPEC, RTM_DELNEIGH, neigh_delete, NULL, NULL);
3046 rtnl_register(PF_UNSPEC, RTM_GETNEIGH, NULL, neigh_dump_info, NULL);
Thomas Grafc8822a42007-03-22 11:50:06 -07003047
Greg Rosec7ac8672011-06-10 01:27:09 +00003048 rtnl_register(PF_UNSPEC, RTM_GETNEIGHTBL, NULL, neightbl_dump_info,
3049 NULL);
3050 rtnl_register(PF_UNSPEC, RTM_SETNEIGHTBL, neightbl_set, NULL, NULL);
Thomas Grafc8822a42007-03-22 11:50:06 -07003051
3052 return 0;
3053}
3054
3055subsys_initcall(neigh_init);
3056