blob: 2feda6e7a31d22d91c639f88651383a6e154971a [file] [log] [blame]
Linus Torvalds1da177e2005-04-16 15:20:36 -07001/*
2 * Generic address resolution entity
3 *
4 * Authors:
5 * Pedro Roque <roque@di.fc.ul.pt>
6 * Alexey Kuznetsov <kuznet@ms2.inr.ac.ru>
7 *
8 * This program is free software; you can redistribute it and/or
9 * modify it under the terms of the GNU General Public License
10 * as published by the Free Software Foundation; either version
11 * 2 of the License, or (at your option) any later version.
12 *
13 * Fixes:
14 * Vitaly E. Lavrov releasing NULL neighbor in neigh_add.
15 * Harald Welte Add neighbour cache statistics like rtstat
16 */
17
Tejun Heo5a0e3ad2010-03-24 17:04:11 +090018#include <linux/slab.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070019#include <linux/types.h>
20#include <linux/kernel.h>
21#include <linux/module.h>
22#include <linux/socket.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070023#include <linux/netdevice.h>
24#include <linux/proc_fs.h>
25#ifdef CONFIG_SYSCTL
26#include <linux/sysctl.h>
27#endif
28#include <linux/times.h>
Eric W. Biederman457c4cb2007-09-12 12:01:34 +020029#include <net/net_namespace.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070030#include <net/neighbour.h>
31#include <net/dst.h>
32#include <net/sock.h>
Tom Tucker8d717402006-07-30 20:43:36 -070033#include <net/netevent.h>
Thomas Grafa14a49d2006-08-07 17:53:08 -070034#include <net/netlink.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070035#include <linux/rtnetlink.h>
36#include <linux/random.h>
Paulo Marques543537b2005-06-23 00:09:02 -070037#include <linux/string.h>
vignesh babuc3609d52007-08-24 22:27:55 -070038#include <linux/log2.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070039
/*
 * Debug verbosity selector:
 *   0 - NEIGH_PRINTK1 and NEIGH_PRINTK2 both compile to nothing
 *   1 - NEIGH_PRINTK1 prints, NEIGH_PRINTK2 compiles to nothing
 *   2 - both print
 */
#define NEIGH_DEBUG 1

#define NEIGH_PRINTK(x...) printk(x)
#define NEIGH_NOPRINTK(x...) do { ; } while(0)

#if NEIGH_DEBUG >= 1
#define NEIGH_PRINTK1 NEIGH_PRINTK
#else
#define NEIGH_PRINTK1 NEIGH_NOPRINTK
#endif

#if NEIGH_DEBUG >= 2
#define NEIGH_PRINTK2 NEIGH_PRINTK
#else
#define NEIGH_PRINTK2 NEIGH_NOPRINTK
#endif

/* Mask applied to the proxy-neighbour hash value (see pneigh_hash()). */
#define PNEIGH_HASHMASK 0xF
57
/* Forward declarations of static helpers referenced before their definition. */
static void neigh_timer_handler(unsigned long arg);
static void __neigh_notify(struct neighbour *n, int type, int flags);
static void neigh_update_notify(struct neighbour *neigh);
static int pneigh_ifdown(struct neigh_table *tbl, struct net_device *dev);

static struct neigh_table *neigh_tables;
#ifdef CONFIG_PROC_FS
static const struct file_operations neigh_stat_seq_fops;
#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -070067
68/*
69 Neighbour hash table buckets are protected with rwlock tbl->lock.
70
71 - All the scans/updates to hash buckets MUST be made under this lock.
72 - NOTHING clever should be made under this lock: no callbacks
73 to protocol backends, no attempts to send something to network.
74 It will result in deadlocks, if backend/driver wants to use neighbour
75 cache.
76 - If the entry requires some non-trivial actions, increase
77 its reference count and release table lock.
78
79 Neighbour entries are protected:
80 - with reference count.
81 - with rwlock neigh->lock
82
83 Reference count prevents destruction.
84
85 neigh->lock mainly serializes ll address data and its validity state.
   However, the same lock is also used to protect other entry fields:
87 - timer
88 - resolution queue
89
90 Again, nothing clever shall be made under neigh->lock,
91 the most complicated procedure, which we allow is dev->hard_header.
92 It is supposed, that dev->hard_header is simplistic and does
93 not make callbacks to neighbour tables.
94
   The last lock is neigh_tbl_lock. It is a pure SMP lock, protecting the
   list of neighbour tables. This list is used only in process context.
97 */
98
99static DEFINE_RWLOCK(neigh_tbl_lock);
100
101static int neigh_blackhole(struct sk_buff *skb)
102{
103 kfree_skb(skb);
104 return -ENETDOWN;
105}
106
Thomas Graf4f494552007-08-08 23:12:36 -0700107static void neigh_cleanup_and_release(struct neighbour *neigh)
108{
109 if (neigh->parms->neigh_cleanup)
110 neigh->parms->neigh_cleanup(neigh);
111
Thomas Grafd961db32007-08-08 23:12:56 -0700112 __neigh_notify(neigh, RTM_DELNEIGH, 0);
Thomas Graf4f494552007-08-08 23:12:36 -0700113 neigh_release(neigh);
114}
115
/*
 * Pick a random value in the interval (1/2)*base ... (3/2)*base.
 * This matches the default IPv6 settings and is deliberately not
 * overridable.
 *
 * Returns 0 when @base is 0 (which also avoids a modulo by zero).
 */
unsigned long neigh_rand_reach_time(unsigned long base)
{
	if (!base)
		return 0;

	return (net_random() % base) + (base >> 1);
}
EXPORT_SYMBOL(neigh_rand_reach_time);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700127
128
129static int neigh_forced_gc(struct neigh_table *tbl)
130{
131 int shrunk = 0;
132 int i;
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000133 struct neigh_hash_table *nht;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700134
135 NEIGH_CACHE_STAT_INC(tbl, forced_gc_runs);
136
137 write_lock_bh(&tbl->lock);
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000138 nht = rcu_dereference_protected(tbl->nht,
139 lockdep_is_held(&tbl->lock));
David S. Millercd089332011-07-11 01:28:12 -0700140 for (i = 0; i < (1 << nht->hash_shift); i++) {
Eric Dumazet767e97e2010-10-06 17:49:21 -0700141 struct neighbour *n;
142 struct neighbour __rcu **np;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700143
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000144 np = &nht->hash_buckets[i];
Eric Dumazet767e97e2010-10-06 17:49:21 -0700145 while ((n = rcu_dereference_protected(*np,
146 lockdep_is_held(&tbl->lock))) != NULL) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700147 /* Neighbour record may be discarded if:
148 * - nobody refers to it.
149 * - it is not permanent
150 */
151 write_lock(&n->lock);
152 if (atomic_read(&n->refcnt) == 1 &&
153 !(n->nud_state & NUD_PERMANENT)) {
Eric Dumazet767e97e2010-10-06 17:49:21 -0700154 rcu_assign_pointer(*np,
155 rcu_dereference_protected(n->next,
156 lockdep_is_held(&tbl->lock)));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700157 n->dead = 1;
158 shrunk = 1;
159 write_unlock(&n->lock);
Thomas Graf4f494552007-08-08 23:12:36 -0700160 neigh_cleanup_and_release(n);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700161 continue;
162 }
163 write_unlock(&n->lock);
164 np = &n->next;
165 }
166 }
167
168 tbl->last_flush = jiffies;
169
170 write_unlock_bh(&tbl->lock);
171
172 return shrunk;
173}
174
Pavel Emelyanova43d8992007-12-20 15:49:05 -0800175static void neigh_add_timer(struct neighbour *n, unsigned long when)
176{
177 neigh_hold(n);
178 if (unlikely(mod_timer(&n->timer, when))) {
179 printk("NEIGH: BUG, double timer add, state is %x\n",
180 n->nud_state);
181 dump_stack();
182 }
183}
184
Linus Torvalds1da177e2005-04-16 15:20:36 -0700185static int neigh_del_timer(struct neighbour *n)
186{
187 if ((n->nud_state & NUD_IN_TIMER) &&
188 del_timer(&n->timer)) {
189 neigh_release(n);
190 return 1;
191 }
192 return 0;
193}
194
195static void pneigh_queue_purge(struct sk_buff_head *list)
196{
197 struct sk_buff *skb;
198
199 while ((skb = skb_dequeue(list)) != NULL) {
200 dev_put(skb->dev);
201 kfree_skb(skb);
202 }
203}
204
Herbert Xu49636bb2005-10-23 17:18:00 +1000205static void neigh_flush_dev(struct neigh_table *tbl, struct net_device *dev)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700206{
207 int i;
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000208 struct neigh_hash_table *nht;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700209
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000210 nht = rcu_dereference_protected(tbl->nht,
211 lockdep_is_held(&tbl->lock));
212
David S. Millercd089332011-07-11 01:28:12 -0700213 for (i = 0; i < (1 << nht->hash_shift); i++) {
Eric Dumazet767e97e2010-10-06 17:49:21 -0700214 struct neighbour *n;
215 struct neighbour __rcu **np = &nht->hash_buckets[i];
Linus Torvalds1da177e2005-04-16 15:20:36 -0700216
Eric Dumazet767e97e2010-10-06 17:49:21 -0700217 while ((n = rcu_dereference_protected(*np,
218 lockdep_is_held(&tbl->lock))) != NULL) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700219 if (dev && n->dev != dev) {
220 np = &n->next;
221 continue;
222 }
Eric Dumazet767e97e2010-10-06 17:49:21 -0700223 rcu_assign_pointer(*np,
224 rcu_dereference_protected(n->next,
225 lockdep_is_held(&tbl->lock)));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700226 write_lock(&n->lock);
227 neigh_del_timer(n);
228 n->dead = 1;
229
230 if (atomic_read(&n->refcnt) != 1) {
231 /* The most unpleasant situation.
232 We must destroy neighbour entry,
233 but someone still uses it.
234
235 The destroy will be delayed until
236 the last user releases us, but
237 we must kill timers etc. and move
238 it to safe state.
239 */
240 skb_queue_purge(&n->arp_queue);
241 n->output = neigh_blackhole;
242 if (n->nud_state & NUD_VALID)
243 n->nud_state = NUD_NOARP;
244 else
245 n->nud_state = NUD_NONE;
246 NEIGH_PRINTK2("neigh %p is stray.\n", n);
247 }
248 write_unlock(&n->lock);
Thomas Graf4f494552007-08-08 23:12:36 -0700249 neigh_cleanup_and_release(n);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700250 }
251 }
Herbert Xu49636bb2005-10-23 17:18:00 +1000252}
Linus Torvalds1da177e2005-04-16 15:20:36 -0700253
Herbert Xu49636bb2005-10-23 17:18:00 +1000254void neigh_changeaddr(struct neigh_table *tbl, struct net_device *dev)
255{
256 write_lock_bh(&tbl->lock);
257 neigh_flush_dev(tbl, dev);
258 write_unlock_bh(&tbl->lock);
259}
YOSHIFUJI Hideaki0a204502008-03-24 18:39:10 +0900260EXPORT_SYMBOL(neigh_changeaddr);
Herbert Xu49636bb2005-10-23 17:18:00 +1000261
262int neigh_ifdown(struct neigh_table *tbl, struct net_device *dev)
263{
264 write_lock_bh(&tbl->lock);
265 neigh_flush_dev(tbl, dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700266 pneigh_ifdown(tbl, dev);
267 write_unlock_bh(&tbl->lock);
268
269 del_timer_sync(&tbl->proxy_timer);
270 pneigh_queue_purge(&tbl->proxy_queue);
271 return 0;
272}
YOSHIFUJI Hideaki0a204502008-03-24 18:39:10 +0900273EXPORT_SYMBOL(neigh_ifdown);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700274
275static struct neighbour *neigh_alloc(struct neigh_table *tbl)
276{
277 struct neighbour *n = NULL;
278 unsigned long now = jiffies;
279 int entries;
280
281 entries = atomic_inc_return(&tbl->entries) - 1;
282 if (entries >= tbl->gc_thresh3 ||
283 (entries >= tbl->gc_thresh2 &&
284 time_after(now, tbl->last_flush + 5 * HZ))) {
285 if (!neigh_forced_gc(tbl) &&
286 entries >= tbl->gc_thresh3)
287 goto out_entries;
288 }
289
Robert P. J. Dayc3762222007-02-10 01:45:03 -0800290 n = kmem_cache_zalloc(tbl->kmem_cachep, GFP_ATOMIC);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700291 if (!n)
292 goto out_entries;
293
Linus Torvalds1da177e2005-04-16 15:20:36 -0700294 skb_queue_head_init(&n->arp_queue);
295 rwlock_init(&n->lock);
Eric Dumazet0ed8ddf2010-10-07 10:44:07 +0000296 seqlock_init(&n->ha_lock);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700297 n->updated = n->used = now;
298 n->nud_state = NUD_NONE;
299 n->output = neigh_blackhole;
David S. Millerf6b72b62011-07-14 07:53:20 -0700300 seqlock_init(&n->hh.hh_lock);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700301 n->parms = neigh_parms_clone(&tbl->parms);
Pavel Emelyanovb24b8a22008-01-23 21:20:07 -0800302 setup_timer(&n->timer, neigh_timer_handler, (unsigned long)n);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700303
304 NEIGH_CACHE_STAT_INC(tbl, allocs);
305 n->tbl = tbl;
306 atomic_set(&n->refcnt, 1);
307 n->dead = 1;
308out:
309 return n;
310
311out_entries:
312 atomic_dec(&tbl->entries);
313 goto out;
314}
315
David S. Millercd089332011-07-11 01:28:12 -0700316static struct neigh_hash_table *neigh_hash_alloc(unsigned int shift)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700317{
David S. Millercd089332011-07-11 01:28:12 -0700318 size_t size = (1 << shift) * sizeof(struct neighbour *);
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000319 struct neigh_hash_table *ret;
Eric Dumazet6193d2b2011-01-19 22:02:47 +0000320 struct neighbour __rcu **buckets;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700321
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000322 ret = kmalloc(sizeof(*ret), GFP_ATOMIC);
323 if (!ret)
324 return NULL;
325 if (size <= PAGE_SIZE)
326 buckets = kzalloc(size, GFP_ATOMIC);
327 else
Eric Dumazet6193d2b2011-01-19 22:02:47 +0000328 buckets = (struct neighbour __rcu **)
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000329 __get_free_pages(GFP_ATOMIC | __GFP_ZERO,
330 get_order(size));
331 if (!buckets) {
332 kfree(ret);
333 return NULL;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700334 }
Eric Dumazet6193d2b2011-01-19 22:02:47 +0000335 ret->hash_buckets = buckets;
David S. Millercd089332011-07-11 01:28:12 -0700336 ret->hash_shift = shift;
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000337 get_random_bytes(&ret->hash_rnd, sizeof(ret->hash_rnd));
David S. Millerf610b742011-07-11 01:37:28 -0700338 ret->hash_rnd |= 1;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700339 return ret;
340}
341
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000342static void neigh_hash_free_rcu(struct rcu_head *head)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700343{
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000344 struct neigh_hash_table *nht = container_of(head,
345 struct neigh_hash_table,
346 rcu);
David S. Millercd089332011-07-11 01:28:12 -0700347 size_t size = (1 << nht->hash_shift) * sizeof(struct neighbour *);
Eric Dumazet6193d2b2011-01-19 22:02:47 +0000348 struct neighbour __rcu **buckets = nht->hash_buckets;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700349
350 if (size <= PAGE_SIZE)
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000351 kfree(buckets);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700352 else
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000353 free_pages((unsigned long)buckets, get_order(size));
354 kfree(nht);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700355}
356
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000357static struct neigh_hash_table *neigh_hash_grow(struct neigh_table *tbl,
David S. Millercd089332011-07-11 01:28:12 -0700358 unsigned long new_shift)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700359{
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000360 unsigned int i, hash;
361 struct neigh_hash_table *new_nht, *old_nht;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700362
363 NEIGH_CACHE_STAT_INC(tbl, hash_grows);
364
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000365 old_nht = rcu_dereference_protected(tbl->nht,
366 lockdep_is_held(&tbl->lock));
David S. Millercd089332011-07-11 01:28:12 -0700367 new_nht = neigh_hash_alloc(new_shift);
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000368 if (!new_nht)
369 return old_nht;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700370
David S. Millercd089332011-07-11 01:28:12 -0700371 for (i = 0; i < (1 << old_nht->hash_shift); i++) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700372 struct neighbour *n, *next;
373
Eric Dumazet767e97e2010-10-06 17:49:21 -0700374 for (n = rcu_dereference_protected(old_nht->hash_buckets[i],
375 lockdep_is_held(&tbl->lock));
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000376 n != NULL;
377 n = next) {
378 hash = tbl->hash(n->primary_key, n->dev,
379 new_nht->hash_rnd);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700380
David S. Millercd089332011-07-11 01:28:12 -0700381 hash >>= (32 - new_nht->hash_shift);
Eric Dumazet767e97e2010-10-06 17:49:21 -0700382 next = rcu_dereference_protected(n->next,
383 lockdep_is_held(&tbl->lock));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700384
Eric Dumazet767e97e2010-10-06 17:49:21 -0700385 rcu_assign_pointer(n->next,
386 rcu_dereference_protected(
387 new_nht->hash_buckets[hash],
388 lockdep_is_held(&tbl->lock)));
389 rcu_assign_pointer(new_nht->hash_buckets[hash], n);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700390 }
391 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700392
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000393 rcu_assign_pointer(tbl->nht, new_nht);
394 call_rcu(&old_nht->rcu, neigh_hash_free_rcu);
395 return new_nht;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700396}
397
398struct neighbour *neigh_lookup(struct neigh_table *tbl, const void *pkey,
399 struct net_device *dev)
400{
401 struct neighbour *n;
402 int key_len = tbl->key_len;
Pavel Emelyanovbc4bf5f2008-02-23 19:57:02 -0800403 u32 hash_val;
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000404 struct neigh_hash_table *nht;
YOSHIFUJI Hideaki4ec93ed2007-02-09 23:24:36 +0900405
Linus Torvalds1da177e2005-04-16 15:20:36 -0700406 NEIGH_CACHE_STAT_INC(tbl, lookups);
407
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000408 rcu_read_lock_bh();
409 nht = rcu_dereference_bh(tbl->nht);
David S. Millercd089332011-07-11 01:28:12 -0700410 hash_val = tbl->hash(pkey, dev, nht->hash_rnd) >> (32 - nht->hash_shift);
Eric Dumazet767e97e2010-10-06 17:49:21 -0700411
412 for (n = rcu_dereference_bh(nht->hash_buckets[hash_val]);
413 n != NULL;
414 n = rcu_dereference_bh(n->next)) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700415 if (dev == n->dev && !memcmp(n->primary_key, pkey, key_len)) {
Eric Dumazet767e97e2010-10-06 17:49:21 -0700416 if (!atomic_inc_not_zero(&n->refcnt))
417 n = NULL;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700418 NEIGH_CACHE_STAT_INC(tbl, hits);
419 break;
420 }
421 }
Eric Dumazet767e97e2010-10-06 17:49:21 -0700422
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000423 rcu_read_unlock_bh();
Linus Torvalds1da177e2005-04-16 15:20:36 -0700424 return n;
425}
YOSHIFUJI Hideaki0a204502008-03-24 18:39:10 +0900426EXPORT_SYMBOL(neigh_lookup);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700427
Eric W. Biederman426b5302008-01-24 00:13:18 -0800428struct neighbour *neigh_lookup_nodev(struct neigh_table *tbl, struct net *net,
429 const void *pkey)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700430{
431 struct neighbour *n;
432 int key_len = tbl->key_len;
Pavel Emelyanovbc4bf5f2008-02-23 19:57:02 -0800433 u32 hash_val;
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000434 struct neigh_hash_table *nht;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700435
436 NEIGH_CACHE_STAT_INC(tbl, lookups);
437
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000438 rcu_read_lock_bh();
439 nht = rcu_dereference_bh(tbl->nht);
David S. Millercd089332011-07-11 01:28:12 -0700440 hash_val = tbl->hash(pkey, NULL, nht->hash_rnd) >> (32 - nht->hash_shift);
Eric Dumazet767e97e2010-10-06 17:49:21 -0700441
442 for (n = rcu_dereference_bh(nht->hash_buckets[hash_val]);
443 n != NULL;
444 n = rcu_dereference_bh(n->next)) {
Eric W. Biederman426b5302008-01-24 00:13:18 -0800445 if (!memcmp(n->primary_key, pkey, key_len) &&
YOSHIFUJI Hideaki878628f2008-03-26 03:57:35 +0900446 net_eq(dev_net(n->dev), net)) {
Eric Dumazet767e97e2010-10-06 17:49:21 -0700447 if (!atomic_inc_not_zero(&n->refcnt))
448 n = NULL;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700449 NEIGH_CACHE_STAT_INC(tbl, hits);
450 break;
451 }
452 }
Eric Dumazet767e97e2010-10-06 17:49:21 -0700453
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000454 rcu_read_unlock_bh();
Linus Torvalds1da177e2005-04-16 15:20:36 -0700455 return n;
456}
YOSHIFUJI Hideaki0a204502008-03-24 18:39:10 +0900457EXPORT_SYMBOL(neigh_lookup_nodev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700458
459struct neighbour *neigh_create(struct neigh_table *tbl, const void *pkey,
460 struct net_device *dev)
461{
462 u32 hash_val;
463 int key_len = tbl->key_len;
464 int error;
465 struct neighbour *n1, *rc, *n = neigh_alloc(tbl);
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000466 struct neigh_hash_table *nht;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700467
468 if (!n) {
469 rc = ERR_PTR(-ENOBUFS);
470 goto out;
471 }
472
473 memcpy(n->primary_key, pkey, key_len);
474 n->dev = dev;
475 dev_hold(dev);
476
477 /* Protocol specific setup. */
478 if (tbl->constructor && (error = tbl->constructor(n)) < 0) {
479 rc = ERR_PTR(error);
480 goto out_neigh_release;
481 }
482
483 /* Device specific setup. */
484 if (n->parms->neigh_setup &&
485 (error = n->parms->neigh_setup(n)) < 0) {
486 rc = ERR_PTR(error);
487 goto out_neigh_release;
488 }
489
490 n->confirmed = jiffies - (n->parms->base_reachable_time << 1);
491
492 write_lock_bh(&tbl->lock);
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000493 nht = rcu_dereference_protected(tbl->nht,
494 lockdep_is_held(&tbl->lock));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700495
David S. Millercd089332011-07-11 01:28:12 -0700496 if (atomic_read(&tbl->entries) > (1 << nht->hash_shift))
497 nht = neigh_hash_grow(tbl, nht->hash_shift + 1);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700498
David S. Millercd089332011-07-11 01:28:12 -0700499 hash_val = tbl->hash(pkey, dev, nht->hash_rnd) >> (32 - nht->hash_shift);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700500
501 if (n->parms->dead) {
502 rc = ERR_PTR(-EINVAL);
503 goto out_tbl_unlock;
504 }
505
Eric Dumazet767e97e2010-10-06 17:49:21 -0700506 for (n1 = rcu_dereference_protected(nht->hash_buckets[hash_val],
507 lockdep_is_held(&tbl->lock));
508 n1 != NULL;
509 n1 = rcu_dereference_protected(n1->next,
510 lockdep_is_held(&tbl->lock))) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700511 if (dev == n1->dev && !memcmp(n1->primary_key, pkey, key_len)) {
512 neigh_hold(n1);
513 rc = n1;
514 goto out_tbl_unlock;
515 }
516 }
517
Linus Torvalds1da177e2005-04-16 15:20:36 -0700518 n->dead = 0;
519 neigh_hold(n);
Eric Dumazet767e97e2010-10-06 17:49:21 -0700520 rcu_assign_pointer(n->next,
521 rcu_dereference_protected(nht->hash_buckets[hash_val],
522 lockdep_is_held(&tbl->lock)));
523 rcu_assign_pointer(nht->hash_buckets[hash_val], n);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700524 write_unlock_bh(&tbl->lock);
525 NEIGH_PRINTK2("neigh %p is created.\n", n);
526 rc = n;
527out:
528 return rc;
529out_tbl_unlock:
530 write_unlock_bh(&tbl->lock);
531out_neigh_release:
532 neigh_release(n);
533 goto out;
534}
YOSHIFUJI Hideaki0a204502008-03-24 18:39:10 +0900535EXPORT_SYMBOL(neigh_create);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700536
YOSHIFUJI Hideakibe01d652008-03-28 12:46:53 +0900537static u32 pneigh_hash(const void *pkey, int key_len)
Pavel Emelyanovfa86d322008-03-24 14:48:59 -0700538{
Pavel Emelyanovfa86d322008-03-24 14:48:59 -0700539 u32 hash_val = *(u32 *)(pkey + key_len - 4);
Pavel Emelyanovfa86d322008-03-24 14:48:59 -0700540 hash_val ^= (hash_val >> 16);
541 hash_val ^= hash_val >> 8;
542 hash_val ^= hash_val >> 4;
543 hash_val &= PNEIGH_HASHMASK;
YOSHIFUJI Hideakibe01d652008-03-28 12:46:53 +0900544 return hash_val;
545}
Pavel Emelyanovfa86d322008-03-24 14:48:59 -0700546
YOSHIFUJI Hideakibe01d652008-03-28 12:46:53 +0900547static struct pneigh_entry *__pneigh_lookup_1(struct pneigh_entry *n,
548 struct net *net,
549 const void *pkey,
550 int key_len,
551 struct net_device *dev)
552{
553 while (n) {
Pavel Emelyanovfa86d322008-03-24 14:48:59 -0700554 if (!memcmp(n->key, pkey, key_len) &&
YOSHIFUJI Hideakibe01d652008-03-28 12:46:53 +0900555 net_eq(pneigh_net(n), net) &&
Pavel Emelyanovfa86d322008-03-24 14:48:59 -0700556 (n->dev == dev || !n->dev))
YOSHIFUJI Hideakibe01d652008-03-28 12:46:53 +0900557 return n;
558 n = n->next;
Pavel Emelyanovfa86d322008-03-24 14:48:59 -0700559 }
YOSHIFUJI Hideakibe01d652008-03-28 12:46:53 +0900560 return NULL;
561}
Pavel Emelyanovfa86d322008-03-24 14:48:59 -0700562
YOSHIFUJI Hideakibe01d652008-03-28 12:46:53 +0900563struct pneigh_entry *__pneigh_lookup(struct neigh_table *tbl,
564 struct net *net, const void *pkey, struct net_device *dev)
565{
566 int key_len = tbl->key_len;
567 u32 hash_val = pneigh_hash(pkey, key_len);
568
569 return __pneigh_lookup_1(tbl->phash_buckets[hash_val],
570 net, pkey, key_len, dev);
Pavel Emelyanovfa86d322008-03-24 14:48:59 -0700571}
YOSHIFUJI Hideaki0a204502008-03-24 18:39:10 +0900572EXPORT_SYMBOL_GPL(__pneigh_lookup);
Pavel Emelyanovfa86d322008-03-24 14:48:59 -0700573
Eric W. Biederman426b5302008-01-24 00:13:18 -0800574struct pneigh_entry * pneigh_lookup(struct neigh_table *tbl,
575 struct net *net, const void *pkey,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700576 struct net_device *dev, int creat)
577{
578 struct pneigh_entry *n;
579 int key_len = tbl->key_len;
YOSHIFUJI Hideakibe01d652008-03-28 12:46:53 +0900580 u32 hash_val = pneigh_hash(pkey, key_len);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700581
582 read_lock_bh(&tbl->lock);
YOSHIFUJI Hideakibe01d652008-03-28 12:46:53 +0900583 n = __pneigh_lookup_1(tbl->phash_buckets[hash_val],
584 net, pkey, key_len, dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700585 read_unlock_bh(&tbl->lock);
YOSHIFUJI Hideakibe01d652008-03-28 12:46:53 +0900586
587 if (n || !creat)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700588 goto out;
589
Pavel Emelyanov4ae28942007-10-15 12:54:15 -0700590 ASSERT_RTNL();
591
Linus Torvalds1da177e2005-04-16 15:20:36 -0700592 n = kmalloc(sizeof(*n) + key_len, GFP_KERNEL);
593 if (!n)
594 goto out;
595
Eric Dumazete42ea982008-11-12 00:54:54 -0800596 write_pnet(&n->net, hold_net(net));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700597 memcpy(n->key, pkey, key_len);
598 n->dev = dev;
599 if (dev)
600 dev_hold(dev);
601
602 if (tbl->pconstructor && tbl->pconstructor(n)) {
603 if (dev)
604 dev_put(dev);
Denis V. Lunevda12f732008-02-20 00:26:16 -0800605 release_net(net);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700606 kfree(n);
607 n = NULL;
608 goto out;
609 }
610
611 write_lock_bh(&tbl->lock);
612 n->next = tbl->phash_buckets[hash_val];
613 tbl->phash_buckets[hash_val] = n;
614 write_unlock_bh(&tbl->lock);
615out:
616 return n;
617}
YOSHIFUJI Hideaki0a204502008-03-24 18:39:10 +0900618EXPORT_SYMBOL(pneigh_lookup);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700619
620
Eric W. Biederman426b5302008-01-24 00:13:18 -0800621int pneigh_delete(struct neigh_table *tbl, struct net *net, const void *pkey,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700622 struct net_device *dev)
623{
624 struct pneigh_entry *n, **np;
625 int key_len = tbl->key_len;
YOSHIFUJI Hideakibe01d652008-03-28 12:46:53 +0900626 u32 hash_val = pneigh_hash(pkey, key_len);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700627
628 write_lock_bh(&tbl->lock);
629 for (np = &tbl->phash_buckets[hash_val]; (n = *np) != NULL;
630 np = &n->next) {
Eric W. Biederman426b5302008-01-24 00:13:18 -0800631 if (!memcmp(n->key, pkey, key_len) && n->dev == dev &&
YOSHIFUJI Hideaki878628f2008-03-26 03:57:35 +0900632 net_eq(pneigh_net(n), net)) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700633 *np = n->next;
634 write_unlock_bh(&tbl->lock);
635 if (tbl->pdestructor)
636 tbl->pdestructor(n);
637 if (n->dev)
638 dev_put(n->dev);
YOSHIFUJI Hideaki57da52c2008-03-26 03:49:59 +0900639 release_net(pneigh_net(n));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700640 kfree(n);
641 return 0;
642 }
643 }
644 write_unlock_bh(&tbl->lock);
645 return -ENOENT;
646}
647
648static int pneigh_ifdown(struct neigh_table *tbl, struct net_device *dev)
649{
650 struct pneigh_entry *n, **np;
651 u32 h;
652
653 for (h = 0; h <= PNEIGH_HASHMASK; h++) {
654 np = &tbl->phash_buckets[h];
655 while ((n = *np) != NULL) {
656 if (!dev || n->dev == dev) {
657 *np = n->next;
658 if (tbl->pdestructor)
659 tbl->pdestructor(n);
660 if (n->dev)
661 dev_put(n->dev);
YOSHIFUJI Hideaki57da52c2008-03-26 03:49:59 +0900662 release_net(pneigh_net(n));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700663 kfree(n);
664 continue;
665 }
666 np = &n->next;
667 }
668 }
669 return -ENOENT;
670}
671
Denis V. Lunev06f05112008-01-24 00:30:58 -0800672static void neigh_parms_destroy(struct neigh_parms *parms);
673
674static inline void neigh_parms_put(struct neigh_parms *parms)
675{
676 if (atomic_dec_and_test(&parms->refcnt))
677 neigh_parms_destroy(parms);
678}
Linus Torvalds1da177e2005-04-16 15:20:36 -0700679
Eric Dumazet767e97e2010-10-06 17:49:21 -0700680static void neigh_destroy_rcu(struct rcu_head *head)
681{
682 struct neighbour *neigh = container_of(head, struct neighbour, rcu);
683
684 kmem_cache_free(neigh->tbl->kmem_cachep, neigh);
685}
Linus Torvalds1da177e2005-04-16 15:20:36 -0700686/*
687 * neighbour must already be out of the table;
688 *
689 */
690void neigh_destroy(struct neighbour *neigh)
691{
Linus Torvalds1da177e2005-04-16 15:20:36 -0700692 NEIGH_CACHE_STAT_INC(neigh->tbl, destroys);
693
694 if (!neigh->dead) {
695 printk(KERN_WARNING
696 "Destroying alive neighbour %p\n", neigh);
697 dump_stack();
698 return;
699 }
700
701 if (neigh_del_timer(neigh))
702 printk(KERN_WARNING "Impossible event.\n");
703
Linus Torvalds1da177e2005-04-16 15:20:36 -0700704 skb_queue_purge(&neigh->arp_queue);
705
706 dev_put(neigh->dev);
707 neigh_parms_put(neigh->parms);
708
709 NEIGH_PRINTK2("neigh %p is destroyed.\n", neigh);
710
711 atomic_dec(&neigh->tbl->entries);
Eric Dumazet767e97e2010-10-06 17:49:21 -0700712 call_rcu(&neigh->rcu, neigh_destroy_rcu);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700713}
YOSHIFUJI Hideaki0a204502008-03-24 18:39:10 +0900714EXPORT_SYMBOL(neigh_destroy);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700715
716/* Neighbour state is suspicious;
717 disable fast path.
718
719 Called with write_locked neigh.
720 */
721static void neigh_suspect(struct neighbour *neigh)
722{
Linus Torvalds1da177e2005-04-16 15:20:36 -0700723 NEIGH_PRINTK2("neigh %p is suspected.\n", neigh);
724
725 neigh->output = neigh->ops->output;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700726}
727
728/* Neighbour state is OK;
729 enable fast path.
730
731 Called with write_locked neigh.
732 */
733static void neigh_connect(struct neighbour *neigh)
734{
Linus Torvalds1da177e2005-04-16 15:20:36 -0700735 NEIGH_PRINTK2("neigh %p is connected.\n", neigh);
736
737 neigh->output = neigh->ops->connected_output;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700738}
739
Eric Dumazete4c4e442009-07-30 03:15:07 +0000740static void neigh_periodic_work(struct work_struct *work)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700741{
Eric Dumazete4c4e442009-07-30 03:15:07 +0000742 struct neigh_table *tbl = container_of(work, struct neigh_table, gc_work.work);
Eric Dumazet767e97e2010-10-06 17:49:21 -0700743 struct neighbour *n;
744 struct neighbour __rcu **np;
Eric Dumazete4c4e442009-07-30 03:15:07 +0000745 unsigned int i;
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000746 struct neigh_hash_table *nht;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700747
748 NEIGH_CACHE_STAT_INC(tbl, periodic_gc_runs);
749
Eric Dumazete4c4e442009-07-30 03:15:07 +0000750 write_lock_bh(&tbl->lock);
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000751 nht = rcu_dereference_protected(tbl->nht,
752 lockdep_is_held(&tbl->lock));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700753
754 /*
755 * periodically recompute ReachableTime from random function
756 */
757
Eric Dumazete4c4e442009-07-30 03:15:07 +0000758 if (time_after(jiffies, tbl->last_rand + 300 * HZ)) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700759 struct neigh_parms *p;
Eric Dumazete4c4e442009-07-30 03:15:07 +0000760 tbl->last_rand = jiffies;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700761 for (p = &tbl->parms; p; p = p->next)
762 p->reachable_time =
763 neigh_rand_reach_time(p->base_reachable_time);
764 }
765
David S. Millercd089332011-07-11 01:28:12 -0700766 for (i = 0 ; i < (1 << nht->hash_shift); i++) {
Eric Dumazetd6bf7812010-10-04 06:15:44 +0000767 np = &nht->hash_buckets[i];
Linus Torvalds1da177e2005-04-16 15:20:36 -0700768
Eric Dumazet767e97e2010-10-06 17:49:21 -0700769 while ((n = rcu_dereference_protected(*np,
770 lockdep_is_held(&tbl->lock))) != NULL) {
Eric Dumazete4c4e442009-07-30 03:15:07 +0000771 unsigned int state;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700772
Eric Dumazete4c4e442009-07-30 03:15:07 +0000773 write_lock(&n->lock);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700774
Eric Dumazete4c4e442009-07-30 03:15:07 +0000775 state = n->nud_state;
776 if (state & (NUD_PERMANENT | NUD_IN_TIMER)) {
777 write_unlock(&n->lock);
778 goto next_elt;
779 }
780
781 if (time_before(n->used, n->confirmed))
782 n->used = n->confirmed;
783
784 if (atomic_read(&n->refcnt) == 1 &&
785 (state == NUD_FAILED ||
786 time_after(jiffies, n->used + n->parms->gc_staletime))) {
787 *np = n->next;
788 n->dead = 1;
789 write_unlock(&n->lock);
790 neigh_cleanup_and_release(n);
791 continue;
792 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700793 write_unlock(&n->lock);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700794
795next_elt:
Eric Dumazete4c4e442009-07-30 03:15:07 +0000796 np = &n->next;
797 }
798 /*
799 * It's fine to release lock here, even if hash table
800 * grows while we are preempted.
801 */
802 write_unlock_bh(&tbl->lock);
803 cond_resched();
804 write_lock_bh(&tbl->lock);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700805 }
YOSHIFUJI Hideaki4ec93ed2007-02-09 23:24:36 +0900806 /* Cycle through all hash buckets every base_reachable_time/2 ticks.
807 * ARP entry timeouts range from 1/2 base_reachable_time to 3/2
808 * base_reachable_time.
Linus Torvalds1da177e2005-04-16 15:20:36 -0700809 */
Eric Dumazete4c4e442009-07-30 03:15:07 +0000810 schedule_delayed_work(&tbl->gc_work,
811 tbl->parms.base_reachable_time >> 1);
812 write_unlock_bh(&tbl->lock);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700813}
814
815static __inline__ int neigh_max_probes(struct neighbour *n)
816{
817 struct neigh_parms *p = n->parms;
Eric Dumazeta02cec22010-09-22 20:43:57 +0000818 return (n->nud_state & NUD_PROBE) ?
Linus Torvalds1da177e2005-04-16 15:20:36 -0700819 p->ucast_probes :
Eric Dumazeta02cec22010-09-22 20:43:57 +0000820 p->ucast_probes + p->app_probes + p->mcast_probes;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700821}
822
Timo Teras5ef12d92009-06-11 04:16:28 -0700823static void neigh_invalidate(struct neighbour *neigh)
Eric Dumazet0a141502010-03-09 19:40:54 +0000824 __releases(neigh->lock)
825 __acquires(neigh->lock)
Timo Teras5ef12d92009-06-11 04:16:28 -0700826{
827 struct sk_buff *skb;
828
829 NEIGH_CACHE_STAT_INC(neigh->tbl, res_failed);
830 NEIGH_PRINTK2("neigh %p is failed.\n", neigh);
831 neigh->updated = jiffies;
832
833 /* It is very thin place. report_unreachable is very complicated
834 routine. Particularly, it can hit the same neighbour entry!
835
836 So that, we try to be accurate and avoid dead loop. --ANK
837 */
838 while (neigh->nud_state == NUD_FAILED &&
839 (skb = __skb_dequeue(&neigh->arp_queue)) != NULL) {
840 write_unlock(&neigh->lock);
841 neigh->ops->error_report(neigh, skb);
842 write_lock(&neigh->lock);
843 }
844 skb_queue_purge(&neigh->arp_queue);
845}
846
/*
 * Called when a timer expires for a neighbour entry.  @arg is the
 * struct neighbour pointer cast to unsigned long.
 *
 * Under neigh->lock the handler advances the entry's NUD state:
 *   REACHABLE        -> stays REACHABLE while the last confirmation is
 *                       within reachable_time; otherwise DELAY if the entry
 *                       was used within delay_probe_time, else STALE;
 *   DELAY            -> REACHABLE if confirmed within delay_probe_time,
 *                       else PROBE (probe counter reset to 0);
 *   INCOMPLETE/PROBE -> FAILED once the probe counter has reached
 *                       neigh_max_probes().
 * If the resulting state still has a timer, the timer is re-armed; for
 * INCOMPLETE/PROBE a solicitation is sent as well.  The handler ends by
 * dropping one reference on the entry.
 */

static void neigh_timer_handler(unsigned long arg)
{
	unsigned long now, next;
	struct neighbour *neigh = (struct neighbour *)arg;
	unsigned state;
	int notify = 0;	/* set when neigh_update_notify() must be called */

	write_lock(&neigh->lock);

	state = neigh->nud_state;
	now = jiffies;
	next = now + HZ;

	/* Timer fired for an entry that is no longer in a timed state. */
	if (!(state & NUD_IN_TIMER)) {
#ifndef CONFIG_SMP
		printk(KERN_WARNING "neigh: timer & !nud_in_timer\n");
#endif
		goto out;
	}

	if (state & NUD_REACHABLE) {
		if (time_before_eq(now,
				   neigh->confirmed + neigh->parms->reachable_time)) {
			NEIGH_PRINTK2("neigh %p is still alive.\n", neigh);
			next = neigh->confirmed + neigh->parms->reachable_time;
		} else if (time_before_eq(now,
					  neigh->used + neigh->parms->delay_probe_time)) {
			NEIGH_PRINTK2("neigh %p is delayed.\n", neigh);
			neigh->nud_state = NUD_DELAY;
			neigh->updated = jiffies;
			neigh_suspect(neigh);
			next = now + neigh->parms->delay_probe_time;
		} else {
			NEIGH_PRINTK2("neigh %p is suspected.\n", neigh);
			neigh->nud_state = NUD_STALE;
			neigh->updated = jiffies;
			neigh_suspect(neigh);
			notify = 1;
		}
	} else if (state & NUD_DELAY) {
		if (time_before_eq(now,
				   neigh->confirmed + neigh->parms->delay_probe_time)) {
			NEIGH_PRINTK2("neigh %p is now reachable.\n", neigh);
			neigh->nud_state = NUD_REACHABLE;
			neigh->updated = jiffies;
			neigh_connect(neigh);
			notify = 1;
			next = neigh->confirmed + neigh->parms->reachable_time;
		} else {
			NEIGH_PRINTK2("neigh %p is probed.\n", neigh);
			neigh->nud_state = NUD_PROBE;
			neigh->updated = jiffies;
			atomic_set(&neigh->probes, 0);
			next = now + neigh->parms->retrans_time;
		}
	} else {
		/* NUD_PROBE|NUD_INCOMPLETE */
		next = now + neigh->parms->retrans_time;
	}

	/* Probe budget exhausted: give up on this entry. */
	if ((neigh->nud_state & (NUD_INCOMPLETE | NUD_PROBE)) &&
	    atomic_read(&neigh->probes) >= neigh_max_probes(neigh)) {
		neigh->nud_state = NUD_FAILED;
		notify = 1;
		neigh_invalidate(neigh);
	}

	if (neigh->nud_state & NUD_IN_TIMER) {
		/* Never re-arm for sooner than HZ/2 from now. */
		if (time_before(next, jiffies + HZ/2))
			next = jiffies + HZ/2;
		/*
		 * mod_timer() returning 0 means the timer was not pending;
		 * take a reference, presumably on behalf of the newly armed
		 * timer.
		 */
		if (!mod_timer(&neigh->timer, next))
			neigh_hold(neigh);
	}
	if (neigh->nud_state & (NUD_INCOMPLETE | NUD_PROBE)) {
		struct sk_buff *skb = skb_peek(&neigh->arp_queue);
		/* keep skb alive even if arp_queue overflows */
		if (skb)
			skb = skb_copy(skb, GFP_ATOMIC);
		/* solicit() is invoked with neigh->lock released. */
		write_unlock(&neigh->lock);
		neigh->ops->solicit(neigh, skb);
		atomic_inc(&neigh->probes);
		kfree_skb(skb);
	} else {
out:
		write_unlock(&neigh->lock);
	}

	if (notify)
		neigh_update_notify(neigh);

	neigh_release(neigh);
}
941
942int __neigh_event_send(struct neighbour *neigh, struct sk_buff *skb)
943{
944 int rc;
945 unsigned long now;
946
947 write_lock_bh(&neigh->lock);
948
949 rc = 0;
950 if (neigh->nud_state & (NUD_CONNECTED | NUD_DELAY | NUD_PROBE))
951 goto out_unlock_bh;
952
953 now = jiffies;
YOSHIFUJI Hideaki4ec93ed2007-02-09 23:24:36 +0900954
Linus Torvalds1da177e2005-04-16 15:20:36 -0700955 if (!(neigh->nud_state & (NUD_STALE | NUD_INCOMPLETE))) {
956 if (neigh->parms->mcast_probes + neigh->parms->app_probes) {
957 atomic_set(&neigh->probes, neigh->parms->ucast_probes);
958 neigh->nud_state = NUD_INCOMPLETE;
YOSHIFUJI Hideaki955aaa22006-03-20 16:52:52 -0800959 neigh->updated = jiffies;
David S. Miller667347f2005-09-27 12:07:44 -0700960 neigh_add_timer(neigh, now + 1);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700961 } else {
962 neigh->nud_state = NUD_FAILED;
YOSHIFUJI Hideaki955aaa22006-03-20 16:52:52 -0800963 neigh->updated = jiffies;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700964 write_unlock_bh(&neigh->lock);
965
Wei Yongjunf3fbbe02009-02-25 00:37:32 +0000966 kfree_skb(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700967 return 1;
968 }
969 } else if (neigh->nud_state & NUD_STALE) {
970 NEIGH_PRINTK2("neigh %p is delayed.\n", neigh);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700971 neigh->nud_state = NUD_DELAY;
YOSHIFUJI Hideaki955aaa22006-03-20 16:52:52 -0800972 neigh->updated = jiffies;
David S. Miller667347f2005-09-27 12:07:44 -0700973 neigh_add_timer(neigh,
974 jiffies + neigh->parms->delay_probe_time);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700975 }
976
977 if (neigh->nud_state == NUD_INCOMPLETE) {
978 if (skb) {
979 if (skb_queue_len(&neigh->arp_queue) >=
980 neigh->parms->queue_len) {
981 struct sk_buff *buff;
David S. Millerf72051b2008-09-23 01:11:18 -0700982 buff = __skb_dequeue(&neigh->arp_queue);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700983 kfree_skb(buff);
Neil Horman9a6d2762008-07-16 20:50:49 -0700984 NEIGH_CACHE_STAT_INC(neigh->tbl, unres_discards);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700985 }
Eric Dumazeta4731132010-05-27 16:09:39 -0700986 skb_dst_force(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700987 __skb_queue_tail(&neigh->arp_queue, skb);
988 }
989 rc = 1;
990 }
991out_unlock_bh:
992 write_unlock_bh(&neigh->lock);
993 return rc;
994}
YOSHIFUJI Hideaki0a204502008-03-24 18:39:10 +0900995EXPORT_SYMBOL(__neigh_event_send);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700996
David S. Millerf6b72b62011-07-14 07:53:20 -0700997static void neigh_update_hhs(struct neighbour *neigh)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700998{
999 struct hh_cache *hh;
Stephen Hemminger3b04ddd2007-10-09 01:40:57 -07001000 void (*update)(struct hh_cache*, const struct net_device*, const unsigned char *)
Doug Kehn91a72a72010-07-14 18:02:16 -07001001 = NULL;
1002
1003 if (neigh->dev->header_ops)
1004 update = neigh->dev->header_ops->cache_update;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001005
1006 if (update) {
David S. Millerf6b72b62011-07-14 07:53:20 -07001007 hh = &neigh->hh;
1008 if (hh->hh_len) {
Stephen Hemminger3644f0c2006-12-07 15:08:17 -08001009 write_seqlock_bh(&hh->hh_lock);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001010 update(hh, neigh->dev, neigh->ha);
Stephen Hemminger3644f0c2006-12-07 15:08:17 -08001011 write_sequnlock_bh(&hh->hh_lock);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001012 }
1013 }
1014}
1015
1016
1017
/* Generic update routine.
 *
 * @neigh:  entry to update.
 * @lladdr: new link-layer address, or NULL if none is supplied.
 * @new:    new NUD state.
 * @flags:
 *	NEIGH_UPDATE_F_OVERRIDE allows overriding the existing lladdr
 *				if it is different.
 *	NEIGH_UPDATE_F_WEAK_OVERRIDE will suspect an existing "connected"
 *				lladdr instead of overriding it
 *				if it is different.
 *				It also allows the current state to be
 *				retained if lladdr is unchanged.
 *	NEIGH_UPDATE_F_ADMIN	means that the change is administrative.
 *
 *	NEIGH_UPDATE_F_OVERRIDE_ISROUTER allows overriding the existing
 *				NTF_ROUTER flag.
 *	NEIGH_UPDATE_F_ISROUTER	indicates whether the neighbour is known
 *				to be a router.
 *
 * Returns 0 on success, -EPERM when a non-administrative update targets a
 * NUD_NOARP or NUD_PERMANENT entry, and -EINVAL when no address is supplied
 * and the entry has no valid cached one.
 *
 * Caller MUST hold a reference count on the entry.
 */

int neigh_update(struct neighbour *neigh, const u8 *lladdr, u8 new,
		 u32 flags)
{
	u8 old;
	int err;
	int notify = 0;
	struct net_device *dev;
	int update_isrouter = 0;

	write_lock_bh(&neigh->lock);

	dev    = neigh->dev;
	old    = neigh->nud_state;
	err    = -EPERM;

	/* Only administrative updates may touch NOARP/PERMANENT entries. */
	if (!(flags & NEIGH_UPDATE_F_ADMIN) &&
	    (old & (NUD_NOARP | NUD_PERMANENT)))
		goto out;

	/* Transition to a non-valid state: no address handling is needed. */
	if (!(new & NUD_VALID)) {
		neigh_del_timer(neigh);
		if (old & NUD_CONNECTED)
			neigh_suspect(neigh);
		neigh->nud_state = new;
		err = 0;
		notify = old & NUD_VALID;
		if ((old & (NUD_INCOMPLETE | NUD_PROBE)) &&
		    (new & NUD_FAILED)) {
			neigh_invalidate(neigh);
			notify = 1;
		}
		goto out;
	}

	/*
	 * Compare new lladdr with cached one.  From here on, the pointer
	 * equality "lladdr == neigh->ha" means "address unchanged".
	 */
	if (!dev->addr_len) {
		/* First case: device needs no address. */
		lladdr = neigh->ha;
	} else if (lladdr) {
		/* The second case: if something is already cached
		   and a new address is proposed:
		   - compare new & old
		   - if they are different, check override flag
		 */
		if ((old & NUD_VALID) &&
		    !memcmp(lladdr, neigh->ha, dev->addr_len))
			lladdr = neigh->ha;
	} else {
		/* No address is supplied; if we know something,
		   use it, otherwise discard the request.
		 */
		err = -EINVAL;
		if (!(old & NUD_VALID))
			goto out;
		lladdr = neigh->ha;
	}

	if (new & NUD_CONNECTED)
		neigh->confirmed = jiffies;
	neigh->updated = jiffies;

	/* If entry was valid and address is not changed,
	   do not change entry state, if new one is STALE.
	 */
	err = 0;
	update_isrouter = flags & NEIGH_UPDATE_F_OVERRIDE_ISROUTER;
	if (old & NUD_VALID) {
		if (lladdr != neigh->ha && !(flags & NEIGH_UPDATE_F_OVERRIDE)) {
			/* Address differs and overriding is not allowed. */
			update_isrouter = 0;
			if ((flags & NEIGH_UPDATE_F_WEAK_OVERRIDE) &&
			    (old & NUD_CONNECTED)) {
				/* Keep the old address but stop trusting it. */
				lladdr = neigh->ha;
				new = NUD_STALE;
			} else
				goto out;
		} else {
			if (lladdr == neigh->ha && new == NUD_STALE &&
			    ((flags & NEIGH_UPDATE_F_WEAK_OVERRIDE) ||
			     (old & NUD_CONNECTED))
			    )
				new = old;
		}
	}

	if (new != old) {
		neigh_del_timer(neigh);
		/* REACHABLE gets a reachable_time timer, other timed states fire at once. */
		if (new & NUD_IN_TIMER)
			neigh_add_timer(neigh, (jiffies +
						((new & NUD_REACHABLE) ?
						 neigh->parms->reachable_time :
						 0)));
		neigh->nud_state = new;
	}

	if (lladdr != neigh->ha) {
		/* Store the new address under ha_lock and refresh the cached header. */
		write_seqlock(&neigh->ha_lock);
		memcpy(&neigh->ha, lladdr, dev->addr_len);
		write_sequnlock(&neigh->ha_lock);
		neigh_update_hhs(neigh);
		/* Back-date the confirmation when the new state is not connected. */
		if (!(new & NUD_CONNECTED))
			neigh->confirmed = jiffies -
				      (neigh->parms->base_reachable_time << 1);
		notify = 1;
	}
	if (new == old)
		goto out;
	if (new & NUD_CONNECTED)
		neigh_connect(neigh);
	else
		neigh_suspect(neigh);
	if (!(old & NUD_VALID)) {
		struct sk_buff *skb;

		/*
		 * The entry has just become valid: send out the packets that
		 * were queued while it was being resolved.  The lock is
		 * dropped around each output() call.
		 */

		/* Again: avoid dead loop if something went wrong */

		while (neigh->nud_state & NUD_VALID &&
		       (skb = __skb_dequeue(&neigh->arp_queue)) != NULL) {
			struct neighbour *n1 = neigh;
			write_unlock_bh(&neigh->lock);
			/* On shaper/eql skb->dst->neighbour != neigh :( */
			if (skb_dst(skb) && skb_dst(skb)->neighbour)
				n1 = skb_dst(skb)->neighbour;
			n1->output(skb);
			write_lock_bh(&neigh->lock);
		}
		skb_queue_purge(&neigh->arp_queue);
	}
out:
	/* Set or clear NTF_ROUTER according to NEIGH_UPDATE_F_ISROUTER. */
	if (update_isrouter) {
		neigh->flags = (flags & NEIGH_UPDATE_F_ISROUTER) ?
			(neigh->flags | NTF_ROUTER) :
			(neigh->flags & ~NTF_ROUTER);
	}
	write_unlock_bh(&neigh->lock);

	/* Notification is sent after the lock has been released. */
	if (notify)
		neigh_update_notify(neigh);

	return err;
}
EXPORT_SYMBOL(neigh_update);
1181struct neighbour *neigh_event_ns(struct neigh_table *tbl,
1182 u8 *lladdr, void *saddr,
1183 struct net_device *dev)
1184{
1185 struct neighbour *neigh = __neigh_lookup(tbl, saddr, dev,
1186 lladdr || !dev->addr_len);
1187 if (neigh)
YOSHIFUJI Hideaki4ec93ed2007-02-09 23:24:36 +09001188 neigh_update(neigh, lladdr, NUD_STALE,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001189 NEIGH_UPDATE_F_OVERRIDE);
1190 return neigh;
1191}
YOSHIFUJI Hideaki0a204502008-03-24 18:39:10 +09001192EXPORT_SYMBOL(neigh_event_ns);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001193
Eric Dumazet34d101d2010-10-11 09:16:57 -07001194/* called with read_lock_bh(&n->lock); */
David S. Millerf6b72b62011-07-14 07:53:20 -07001195static void neigh_hh_init(struct neighbour *n, struct dst_entry *dst)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001196{
Linus Torvalds1da177e2005-04-16 15:20:36 -07001197 struct net_device *dev = dst->dev;
David S. Millerf6b72b62011-07-14 07:53:20 -07001198 __be16 prot = dst->ops->protocol;
1199 struct hh_cache *hh = &n->hh;
Eric Dumazet0ed8ddf2010-10-07 10:44:07 +00001200
1201 write_lock_bh(&n->lock);
Eric Dumazet34d101d2010-10-11 09:16:57 -07001202
David S. Millerf6b72b62011-07-14 07:53:20 -07001203 /* Only one thread can come in here and initialize the
1204 * hh_cache entry.
1205 */
David S. Millerb23b5452011-07-16 17:45:02 -07001206 if (!hh->hh_len)
1207 dev->header_ops->cache(n, hh, prot);
David S. Millerf6b72b62011-07-14 07:53:20 -07001208
Eric Dumazet0ed8ddf2010-10-07 10:44:07 +00001209 write_unlock_bh(&n->lock);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001210}
1211
1212/* This function can be used in contexts, where only old dev_queue_xmit
Eric Dumazet767e97e2010-10-06 17:49:21 -07001213 * worked, f.e. if you want to override normal output path (eql, shaper),
1214 * but resolution is not made yet.
Linus Torvalds1da177e2005-04-16 15:20:36 -07001215 */
1216
1217int neigh_compat_output(struct sk_buff *skb)
1218{
1219 struct net_device *dev = skb->dev;
1220
Arnaldo Carvalho de Melobbe735e2007-03-10 22:16:10 -03001221 __skb_pull(skb, skb_network_offset(skb));
Linus Torvalds1da177e2005-04-16 15:20:36 -07001222
Stephen Hemminger0c4e8582007-10-09 01:36:32 -07001223 if (dev_hard_header(skb, dev, ntohs(skb->protocol), NULL, NULL,
1224 skb->len) < 0 &&
Stephen Hemminger3b04ddd2007-10-09 01:40:57 -07001225 dev->header_ops->rebuild(skb))
Linus Torvalds1da177e2005-04-16 15:20:36 -07001226 return 0;
1227
1228 return dev_queue_xmit(skb);
1229}
YOSHIFUJI Hideaki0a204502008-03-24 18:39:10 +09001230EXPORT_SYMBOL(neigh_compat_output);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001231
1232/* Slow and careful. */
1233
1234int neigh_resolve_output(struct sk_buff *skb)
1235{
Eric Dumazetadf30902009-06-02 05:19:30 +00001236 struct dst_entry *dst = skb_dst(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001237 struct neighbour *neigh;
1238 int rc = 0;
1239
1240 if (!dst || !(neigh = dst->neighbour))
1241 goto discard;
1242
Arnaldo Carvalho de Melobbe735e2007-03-10 22:16:10 -03001243 __skb_pull(skb, skb_network_offset(skb));
Linus Torvalds1da177e2005-04-16 15:20:36 -07001244
1245 if (!neigh_event_send(neigh, skb)) {
1246 int err;
1247 struct net_device *dev = neigh->dev;
Eric Dumazet0ed8ddf2010-10-07 10:44:07 +00001248 unsigned int seq;
Eric Dumazet34d101d2010-10-11 09:16:57 -07001249
David S. Millerf6b72b62011-07-14 07:53:20 -07001250 if (dev->header_ops->cache && !neigh->hh.hh_len)
1251 neigh_hh_init(neigh, dst);
Eric Dumazet34d101d2010-10-11 09:16:57 -07001252
Eric Dumazet0ed8ddf2010-10-07 10:44:07 +00001253 do {
1254 seq = read_seqbegin(&neigh->ha_lock);
1255 err = dev_hard_header(skb, dev, ntohs(skb->protocol),
1256 neigh->ha, NULL, skb->len);
1257 } while (read_seqretry(&neigh->ha_lock, seq));
Eric Dumazet34d101d2010-10-11 09:16:57 -07001258
Linus Torvalds1da177e2005-04-16 15:20:36 -07001259 if (err >= 0)
1260 rc = neigh->ops->queue_xmit(skb);
1261 else
1262 goto out_kfree_skb;
1263 }
1264out:
1265 return rc;
1266discard:
1267 NEIGH_PRINTK1("neigh_resolve_output: dst=%p neigh=%p\n",
1268 dst, dst ? dst->neighbour : NULL);
1269out_kfree_skb:
1270 rc = -EINVAL;
1271 kfree_skb(skb);
1272 goto out;
1273}
YOSHIFUJI Hideaki0a204502008-03-24 18:39:10 +09001274EXPORT_SYMBOL(neigh_resolve_output);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001275
1276/* As fast as possible without hh cache */
1277
1278int neigh_connected_output(struct sk_buff *skb)
1279{
1280 int err;
Eric Dumazetadf30902009-06-02 05:19:30 +00001281 struct dst_entry *dst = skb_dst(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001282 struct neighbour *neigh = dst->neighbour;
1283 struct net_device *dev = neigh->dev;
Eric Dumazet0ed8ddf2010-10-07 10:44:07 +00001284 unsigned int seq;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001285
Arnaldo Carvalho de Melobbe735e2007-03-10 22:16:10 -03001286 __skb_pull(skb, skb_network_offset(skb));
Linus Torvalds1da177e2005-04-16 15:20:36 -07001287
Eric Dumazet0ed8ddf2010-10-07 10:44:07 +00001288 do {
1289 seq = read_seqbegin(&neigh->ha_lock);
1290 err = dev_hard_header(skb, dev, ntohs(skb->protocol),
1291 neigh->ha, NULL, skb->len);
1292 } while (read_seqretry(&neigh->ha_lock, seq));
1293
Linus Torvalds1da177e2005-04-16 15:20:36 -07001294 if (err >= 0)
1295 err = neigh->ops->queue_xmit(skb);
1296 else {
1297 err = -EINVAL;
1298 kfree_skb(skb);
1299 }
1300 return err;
1301}
YOSHIFUJI Hideaki0a204502008-03-24 18:39:10 +09001302EXPORT_SYMBOL(neigh_connected_output);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001303
1304static void neigh_proxy_process(unsigned long arg)
1305{
1306 struct neigh_table *tbl = (struct neigh_table *)arg;
1307 long sched_next = 0;
1308 unsigned long now = jiffies;
David S. Millerf72051b2008-09-23 01:11:18 -07001309 struct sk_buff *skb, *n;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001310
1311 spin_lock(&tbl->proxy_queue.lock);
1312
David S. Millerf72051b2008-09-23 01:11:18 -07001313 skb_queue_walk_safe(&tbl->proxy_queue, skb, n) {
1314 long tdif = NEIGH_CB(skb)->sched_next - now;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001315
Linus Torvalds1da177e2005-04-16 15:20:36 -07001316 if (tdif <= 0) {
David S. Millerf72051b2008-09-23 01:11:18 -07001317 struct net_device *dev = skb->dev;
1318 __skb_unlink(skb, &tbl->proxy_queue);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001319 if (tbl->proxy_redo && netif_running(dev))
David S. Millerf72051b2008-09-23 01:11:18 -07001320 tbl->proxy_redo(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001321 else
David S. Millerf72051b2008-09-23 01:11:18 -07001322 kfree_skb(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001323
1324 dev_put(dev);
1325 } else if (!sched_next || tdif < sched_next)
1326 sched_next = tdif;
1327 }
1328 del_timer(&tbl->proxy_timer);
1329 if (sched_next)
1330 mod_timer(&tbl->proxy_timer, jiffies + sched_next);
1331 spin_unlock(&tbl->proxy_queue.lock);
1332}
1333
1334void pneigh_enqueue(struct neigh_table *tbl, struct neigh_parms *p,
1335 struct sk_buff *skb)
1336{
1337 unsigned long now = jiffies;
1338 unsigned long sched_next = now + (net_random() % p->proxy_delay);
1339
1340 if (tbl->proxy_queue.qlen > p->proxy_qlen) {
1341 kfree_skb(skb);
1342 return;
1343 }
Patrick McHardya61bbcf2005-08-14 17:24:31 -07001344
1345 NEIGH_CB(skb)->sched_next = sched_next;
1346 NEIGH_CB(skb)->flags |= LOCALLY_ENQUEUED;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001347
1348 spin_lock(&tbl->proxy_queue.lock);
1349 if (del_timer(&tbl->proxy_timer)) {
1350 if (time_before(tbl->proxy_timer.expires, sched_next))
1351 sched_next = tbl->proxy_timer.expires;
1352 }
Eric Dumazetadf30902009-06-02 05:19:30 +00001353 skb_dst_drop(skb);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001354 dev_hold(skb->dev);
1355 __skb_queue_tail(&tbl->proxy_queue, skb);
1356 mod_timer(&tbl->proxy_timer, sched_next);
1357 spin_unlock(&tbl->proxy_queue.lock);
1358}
YOSHIFUJI Hideaki0a204502008-03-24 18:39:10 +09001359EXPORT_SYMBOL(pneigh_enqueue);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001360
Tobias Klauser97fd5bc2009-07-13 11:17:49 -07001361static inline struct neigh_parms *lookup_neigh_parms(struct neigh_table *tbl,
Eric W. Biederman426b5302008-01-24 00:13:18 -08001362 struct net *net, int ifindex)
1363{
1364 struct neigh_parms *p;
1365
1366 for (p = &tbl->parms; p; p = p->next) {
YOSHIFUJI Hideaki878628f2008-03-26 03:57:35 +09001367 if ((p->dev && p->dev->ifindex == ifindex && net_eq(neigh_parms_net(p), net)) ||
Eric W. Biederman426b5302008-01-24 00:13:18 -08001368 (!p->dev && !ifindex))
1369 return p;
1370 }
1371
1372 return NULL;
1373}
Linus Torvalds1da177e2005-04-16 15:20:36 -07001374
1375struct neigh_parms *neigh_parms_alloc(struct net_device *dev,
1376 struct neigh_table *tbl)
1377{
Eric W. Biederman426b5302008-01-24 00:13:18 -08001378 struct neigh_parms *p, *ref;
Stephen Hemminger00829822008-11-20 20:14:53 -08001379 struct net *net = dev_net(dev);
1380 const struct net_device_ops *ops = dev->netdev_ops;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001381
Tobias Klauser97fd5bc2009-07-13 11:17:49 -07001382 ref = lookup_neigh_parms(tbl, net, 0);
Eric W. Biederman426b5302008-01-24 00:13:18 -08001383 if (!ref)
1384 return NULL;
1385
1386 p = kmemdup(ref, sizeof(*p), GFP_KERNEL);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001387 if (p) {
Linus Torvalds1da177e2005-04-16 15:20:36 -07001388 p->tbl = tbl;
1389 atomic_set(&p->refcnt, 1);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001390 p->reachable_time =
1391 neigh_rand_reach_time(p->base_reachable_time);
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001392
Stephen Hemminger00829822008-11-20 20:14:53 -08001393 if (ops->ndo_neigh_setup && ops->ndo_neigh_setup(dev, p)) {
Denis V. Lunev486b51d2008-01-14 22:59:59 -08001394 kfree(p);
1395 return NULL;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001396 }
Denis V. Lunev486b51d2008-01-14 22:59:59 -08001397
1398 dev_hold(dev);
1399 p->dev = dev;
Eric Dumazete42ea982008-11-12 00:54:54 -08001400 write_pnet(&p->net, hold_net(net));
Linus Torvalds1da177e2005-04-16 15:20:36 -07001401 p->sysctl_table = NULL;
1402 write_lock_bh(&tbl->lock);
1403 p->next = tbl->parms.next;
1404 tbl->parms.next = p;
1405 write_unlock_bh(&tbl->lock);
1406 }
1407 return p;
1408}
YOSHIFUJI Hideaki0a204502008-03-24 18:39:10 +09001409EXPORT_SYMBOL(neigh_parms_alloc);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001410
1411static void neigh_rcu_free_parms(struct rcu_head *head)
1412{
1413 struct neigh_parms *parms =
1414 container_of(head, struct neigh_parms, rcu_head);
1415
1416 neigh_parms_put(parms);
1417}
1418
1419void neigh_parms_release(struct neigh_table *tbl, struct neigh_parms *parms)
1420{
1421 struct neigh_parms **p;
1422
1423 if (!parms || parms == &tbl->parms)
1424 return;
1425 write_lock_bh(&tbl->lock);
1426 for (p = &tbl->parms.next; *p; p = &(*p)->next) {
1427 if (*p == parms) {
1428 *p = parms->next;
1429 parms->dead = 1;
1430 write_unlock_bh(&tbl->lock);
David S. Millercecbb632008-01-20 16:39:03 -08001431 if (parms->dev)
1432 dev_put(parms->dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001433 call_rcu(&parms->rcu_head, neigh_rcu_free_parms);
1434 return;
1435 }
1436 }
1437 write_unlock_bh(&tbl->lock);
1438 NEIGH_PRINTK1("neigh_parms_release: not found\n");
1439}
YOSHIFUJI Hideaki0a204502008-03-24 18:39:10 +09001440EXPORT_SYMBOL(neigh_parms_release);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001441
/*
 * Final teardown of @parms: release its network namespace, then free
 * the structure itself.
 */
static void neigh_parms_destroy(struct neigh_parms *parms)
{
	struct net *net = neigh_parms_net(parms);

	release_net(net);
	kfree(parms);
}
1447
Pavel Emelianovc2ecba72007-04-17 12:45:31 -07001448static struct lock_class_key neigh_table_proxy_queue_class;
1449
Simon Kelleybd89efc2006-05-12 14:56:08 -07001450void neigh_table_init_no_netlink(struct neigh_table *tbl)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001451{
1452 unsigned long now = jiffies;
1453 unsigned long phsize;
1454
Eric Dumazete42ea982008-11-12 00:54:54 -08001455 write_pnet(&tbl->parms.net, &init_net);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001456 atomic_set(&tbl->parms.refcnt, 1);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001457 tbl->parms.reachable_time =
1458 neigh_rand_reach_time(tbl->parms.base_reachable_time);
1459
1460 if (!tbl->kmem_cachep)
Alexey Dobriyane5d679f332006-08-26 19:25:52 -07001461 tbl->kmem_cachep =
1462 kmem_cache_create(tbl->id, tbl->entry_size, 0,
1463 SLAB_HWCACHE_ALIGN|SLAB_PANIC,
Paul Mundt20c2df82007-07-20 10:11:58 +09001464 NULL);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001465 tbl->stats = alloc_percpu(struct neigh_statistics);
1466 if (!tbl->stats)
1467 panic("cannot create neighbour cache statistics");
YOSHIFUJI Hideaki4ec93ed2007-02-09 23:24:36 +09001468
Linus Torvalds1da177e2005-04-16 15:20:36 -07001469#ifdef CONFIG_PROC_FS
Alexey Dobriyan9b739ba2008-11-11 16:47:44 -08001470 if (!proc_create_data(tbl->id, 0, init_net.proc_net_stat,
1471 &neigh_stat_seq_fops, tbl))
Linus Torvalds1da177e2005-04-16 15:20:36 -07001472 panic("cannot create neighbour proc dir entry");
Linus Torvalds1da177e2005-04-16 15:20:36 -07001473#endif
1474
David S. Millercd089332011-07-11 01:28:12 -07001475 RCU_INIT_POINTER(tbl->nht, neigh_hash_alloc(3));
Linus Torvalds1da177e2005-04-16 15:20:36 -07001476
1477 phsize = (PNEIGH_HASHMASK + 1) * sizeof(struct pneigh_entry *);
Andrew Morton77d04bd2006-04-07 14:52:59 -07001478 tbl->phash_buckets = kzalloc(phsize, GFP_KERNEL);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001479
Eric Dumazetd6bf7812010-10-04 06:15:44 +00001480 if (!tbl->nht || !tbl->phash_buckets)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001481 panic("cannot allocate neighbour cache hashes");
1482
Linus Torvalds1da177e2005-04-16 15:20:36 -07001483 rwlock_init(&tbl->lock);
Eric Dumazete4c4e442009-07-30 03:15:07 +00001484 INIT_DELAYED_WORK_DEFERRABLE(&tbl->gc_work, neigh_periodic_work);
1485 schedule_delayed_work(&tbl->gc_work, tbl->parms.reachable_time);
Pavel Emelyanovb24b8a22008-01-23 21:20:07 -08001486 setup_timer(&tbl->proxy_timer, neigh_proxy_process, (unsigned long)tbl);
Pavel Emelianovc2ecba72007-04-17 12:45:31 -07001487 skb_queue_head_init_class(&tbl->proxy_queue,
1488 &neigh_table_proxy_queue_class);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001489
1490 tbl->last_flush = now;
1491 tbl->last_rand = now + tbl->parms.reachable_time * 20;
Simon Kelleybd89efc2006-05-12 14:56:08 -07001492}
YOSHIFUJI Hideaki0a204502008-03-24 18:39:10 +09001493EXPORT_SYMBOL(neigh_table_init_no_netlink);
Simon Kelleybd89efc2006-05-12 14:56:08 -07001494
1495void neigh_table_init(struct neigh_table *tbl)
1496{
1497 struct neigh_table *tmp;
1498
1499 neigh_table_init_no_netlink(tbl);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001500 write_lock(&neigh_tbl_lock);
Simon Kelleybd89efc2006-05-12 14:56:08 -07001501 for (tmp = neigh_tables; tmp; tmp = tmp->next) {
1502 if (tmp->family == tbl->family)
1503 break;
1504 }
Linus Torvalds1da177e2005-04-16 15:20:36 -07001505 tbl->next = neigh_tables;
1506 neigh_tables = tbl;
1507 write_unlock(&neigh_tbl_lock);
Simon Kelleybd89efc2006-05-12 14:56:08 -07001508
1509 if (unlikely(tmp)) {
1510 printk(KERN_ERR "NEIGH: Registering multiple tables for "
1511 "family %d\n", tbl->family);
1512 dump_stack();
1513 }
Linus Torvalds1da177e2005-04-16 15:20:36 -07001514}
YOSHIFUJI Hideaki0a204502008-03-24 18:39:10 +09001515EXPORT_SYMBOL(neigh_table_init);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001516
1517int neigh_table_clear(struct neigh_table *tbl)
1518{
1519 struct neigh_table **tp;
1520
1521 /* It is not clean... Fix it to unload IPv6 module safely */
Tejun Heoa5c30b32010-10-19 06:04:42 +00001522 cancel_delayed_work_sync(&tbl->gc_work);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001523 del_timer_sync(&tbl->proxy_timer);
1524 pneigh_queue_purge(&tbl->proxy_queue);
1525 neigh_ifdown(tbl, NULL);
1526 if (atomic_read(&tbl->entries))
1527 printk(KERN_CRIT "neighbour leakage\n");
1528 write_lock(&neigh_tbl_lock);
1529 for (tp = &neigh_tables; *tp; tp = &(*tp)->next) {
1530 if (*tp == tbl) {
1531 *tp = tbl->next;
1532 break;
1533 }
1534 }
1535 write_unlock(&neigh_tbl_lock);
1536
Eric Dumazet6193d2b2011-01-19 22:02:47 +00001537 call_rcu(&rcu_dereference_protected(tbl->nht, 1)->rcu,
1538 neigh_hash_free_rcu);
Eric Dumazetd6bf7812010-10-04 06:15:44 +00001539 tbl->nht = NULL;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001540
1541 kfree(tbl->phash_buckets);
1542 tbl->phash_buckets = NULL;
1543
Alexey Dobriyan3f192b52007-11-05 21:28:13 -08001544 remove_proc_entry(tbl->id, init_net.proc_net_stat);
1545
Kirill Korotaev3fcde742006-09-01 01:34:10 -07001546 free_percpu(tbl->stats);
1547 tbl->stats = NULL;
1548
Randy Dunlapbfb85c92007-10-21 16:24:27 -07001549 kmem_cache_destroy(tbl->kmem_cachep);
1550 tbl->kmem_cachep = NULL;
1551
Linus Torvalds1da177e2005-04-16 15:20:36 -07001552 return 0;
1553}
YOSHIFUJI Hideaki0a204502008-03-24 18:39:10 +09001554EXPORT_SYMBOL(neigh_table_clear);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001555
Thomas Grafc8822a42007-03-22 11:50:06 -07001556static int neigh_delete(struct sk_buff *skb, struct nlmsghdr *nlh, void *arg)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001557{
YOSHIFUJI Hideaki3b1e0a62008-03-26 02:26:21 +09001558 struct net *net = sock_net(skb->sk);
Thomas Grafa14a49d2006-08-07 17:53:08 -07001559 struct ndmsg *ndm;
1560 struct nlattr *dst_attr;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001561 struct neigh_table *tbl;
1562 struct net_device *dev = NULL;
Thomas Grafa14a49d2006-08-07 17:53:08 -07001563 int err = -EINVAL;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001564
Eric Dumazet110b2492010-10-04 04:27:36 +00001565 ASSERT_RTNL();
Thomas Grafa14a49d2006-08-07 17:53:08 -07001566 if (nlmsg_len(nlh) < sizeof(*ndm))
Linus Torvalds1da177e2005-04-16 15:20:36 -07001567 goto out;
1568
Thomas Grafa14a49d2006-08-07 17:53:08 -07001569 dst_attr = nlmsg_find_attr(nlh, sizeof(*ndm), NDA_DST);
1570 if (dst_attr == NULL)
1571 goto out;
1572
1573 ndm = nlmsg_data(nlh);
1574 if (ndm->ndm_ifindex) {
Eric Dumazet110b2492010-10-04 04:27:36 +00001575 dev = __dev_get_by_index(net, ndm->ndm_ifindex);
Thomas Grafa14a49d2006-08-07 17:53:08 -07001576 if (dev == NULL) {
1577 err = -ENODEV;
1578 goto out;
1579 }
1580 }
1581
Linus Torvalds1da177e2005-04-16 15:20:36 -07001582 read_lock(&neigh_tbl_lock);
1583 for (tbl = neigh_tables; tbl; tbl = tbl->next) {
Thomas Grafa14a49d2006-08-07 17:53:08 -07001584 struct neighbour *neigh;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001585
1586 if (tbl->family != ndm->ndm_family)
1587 continue;
1588 read_unlock(&neigh_tbl_lock);
1589
Thomas Grafa14a49d2006-08-07 17:53:08 -07001590 if (nla_len(dst_attr) < tbl->key_len)
Eric Dumazet110b2492010-10-04 04:27:36 +00001591 goto out;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001592
1593 if (ndm->ndm_flags & NTF_PROXY) {
Eric W. Biederman426b5302008-01-24 00:13:18 -08001594 err = pneigh_delete(tbl, net, nla_data(dst_attr), dev);
Eric Dumazet110b2492010-10-04 04:27:36 +00001595 goto out;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001596 }
1597
Thomas Grafa14a49d2006-08-07 17:53:08 -07001598 if (dev == NULL)
Eric Dumazet110b2492010-10-04 04:27:36 +00001599 goto out;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001600
Thomas Grafa14a49d2006-08-07 17:53:08 -07001601 neigh = neigh_lookup(tbl, nla_data(dst_attr), dev);
1602 if (neigh == NULL) {
1603 err = -ENOENT;
Eric Dumazet110b2492010-10-04 04:27:36 +00001604 goto out;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001605 }
Thomas Grafa14a49d2006-08-07 17:53:08 -07001606
1607 err = neigh_update(neigh, NULL, NUD_FAILED,
1608 NEIGH_UPDATE_F_OVERRIDE |
1609 NEIGH_UPDATE_F_ADMIN);
1610 neigh_release(neigh);
Eric Dumazet110b2492010-10-04 04:27:36 +00001611 goto out;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001612 }
1613 read_unlock(&neigh_tbl_lock);
Thomas Grafa14a49d2006-08-07 17:53:08 -07001614 err = -EAFNOSUPPORT;
1615
Linus Torvalds1da177e2005-04-16 15:20:36 -07001616out:
1617 return err;
1618}
1619
Thomas Grafc8822a42007-03-22 11:50:06 -07001620static int neigh_add(struct sk_buff *skb, struct nlmsghdr *nlh, void *arg)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001621{
YOSHIFUJI Hideaki3b1e0a62008-03-26 02:26:21 +09001622 struct net *net = sock_net(skb->sk);
Thomas Graf5208deb2006-08-07 17:55:40 -07001623 struct ndmsg *ndm;
1624 struct nlattr *tb[NDA_MAX+1];
Linus Torvalds1da177e2005-04-16 15:20:36 -07001625 struct neigh_table *tbl;
1626 struct net_device *dev = NULL;
Thomas Graf5208deb2006-08-07 17:55:40 -07001627 int err;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001628
Eric Dumazet110b2492010-10-04 04:27:36 +00001629 ASSERT_RTNL();
Thomas Graf5208deb2006-08-07 17:55:40 -07001630 err = nlmsg_parse(nlh, sizeof(*ndm), tb, NDA_MAX, NULL);
1631 if (err < 0)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001632 goto out;
1633
Thomas Graf5208deb2006-08-07 17:55:40 -07001634 err = -EINVAL;
1635 if (tb[NDA_DST] == NULL)
1636 goto out;
1637
1638 ndm = nlmsg_data(nlh);
1639 if (ndm->ndm_ifindex) {
Eric Dumazet110b2492010-10-04 04:27:36 +00001640 dev = __dev_get_by_index(net, ndm->ndm_ifindex);
Thomas Graf5208deb2006-08-07 17:55:40 -07001641 if (dev == NULL) {
1642 err = -ENODEV;
1643 goto out;
1644 }
1645
1646 if (tb[NDA_LLADDR] && nla_len(tb[NDA_LLADDR]) < dev->addr_len)
Eric Dumazet110b2492010-10-04 04:27:36 +00001647 goto out;
Thomas Graf5208deb2006-08-07 17:55:40 -07001648 }
1649
Linus Torvalds1da177e2005-04-16 15:20:36 -07001650 read_lock(&neigh_tbl_lock);
1651 for (tbl = neigh_tables; tbl; tbl = tbl->next) {
Thomas Graf5208deb2006-08-07 17:55:40 -07001652 int flags = NEIGH_UPDATE_F_ADMIN | NEIGH_UPDATE_F_OVERRIDE;
1653 struct neighbour *neigh;
1654 void *dst, *lladdr;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001655
1656 if (tbl->family != ndm->ndm_family)
1657 continue;
1658 read_unlock(&neigh_tbl_lock);
1659
Thomas Graf5208deb2006-08-07 17:55:40 -07001660 if (nla_len(tb[NDA_DST]) < tbl->key_len)
Eric Dumazet110b2492010-10-04 04:27:36 +00001661 goto out;
Thomas Graf5208deb2006-08-07 17:55:40 -07001662 dst = nla_data(tb[NDA_DST]);
1663 lladdr = tb[NDA_LLADDR] ? nla_data(tb[NDA_LLADDR]) : NULL;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001664
1665 if (ndm->ndm_flags & NTF_PROXY) {
Ville Nuorvala62dd9312006-09-22 14:43:19 -07001666 struct pneigh_entry *pn;
1667
1668 err = -ENOBUFS;
Eric W. Biederman426b5302008-01-24 00:13:18 -08001669 pn = pneigh_lookup(tbl, net, dst, dev, 1);
Ville Nuorvala62dd9312006-09-22 14:43:19 -07001670 if (pn) {
1671 pn->flags = ndm->ndm_flags;
1672 err = 0;
1673 }
Eric Dumazet110b2492010-10-04 04:27:36 +00001674 goto out;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001675 }
1676
Thomas Graf5208deb2006-08-07 17:55:40 -07001677 if (dev == NULL)
Eric Dumazet110b2492010-10-04 04:27:36 +00001678 goto out;
Thomas Graf5208deb2006-08-07 17:55:40 -07001679
1680 neigh = neigh_lookup(tbl, dst, dev);
1681 if (neigh == NULL) {
1682 if (!(nlh->nlmsg_flags & NLM_F_CREATE)) {
1683 err = -ENOENT;
Eric Dumazet110b2492010-10-04 04:27:36 +00001684 goto out;
Thomas Graf5208deb2006-08-07 17:55:40 -07001685 }
YOSHIFUJI Hideaki4ec93ed2007-02-09 23:24:36 +09001686
Thomas Graf5208deb2006-08-07 17:55:40 -07001687 neigh = __neigh_lookup_errno(tbl, dst, dev);
1688 if (IS_ERR(neigh)) {
1689 err = PTR_ERR(neigh);
Eric Dumazet110b2492010-10-04 04:27:36 +00001690 goto out;
Thomas Graf5208deb2006-08-07 17:55:40 -07001691 }
1692 } else {
Linus Torvalds1da177e2005-04-16 15:20:36 -07001693 if (nlh->nlmsg_flags & NLM_F_EXCL) {
1694 err = -EEXIST;
Thomas Graf5208deb2006-08-07 17:55:40 -07001695 neigh_release(neigh);
Eric Dumazet110b2492010-10-04 04:27:36 +00001696 goto out;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001697 }
Thomas Graf5208deb2006-08-07 17:55:40 -07001698
1699 if (!(nlh->nlmsg_flags & NLM_F_REPLACE))
1700 flags &= ~NEIGH_UPDATE_F_OVERRIDE;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001701 }
1702
Eric Biederman0c5c2d32009-03-04 00:03:08 -08001703 if (ndm->ndm_flags & NTF_USE) {
1704 neigh_event_send(neigh, NULL);
1705 err = 0;
1706 } else
1707 err = neigh_update(neigh, lladdr, ndm->ndm_state, flags);
Thomas Graf5208deb2006-08-07 17:55:40 -07001708 neigh_release(neigh);
Eric Dumazet110b2492010-10-04 04:27:36 +00001709 goto out;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001710 }
1711
1712 read_unlock(&neigh_tbl_lock);
Thomas Graf5208deb2006-08-07 17:55:40 -07001713 err = -EAFNOSUPPORT;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001714out:
1715 return err;
1716}
1717
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001718static int neightbl_fill_parms(struct sk_buff *skb, struct neigh_parms *parms)
1719{
Thomas Grafca860fb2006-08-07 18:00:18 -07001720 struct nlattr *nest;
1721
1722 nest = nla_nest_start(skb, NDTA_PARMS);
1723 if (nest == NULL)
1724 return -ENOBUFS;
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001725
1726 if (parms->dev)
Thomas Grafca860fb2006-08-07 18:00:18 -07001727 NLA_PUT_U32(skb, NDTPA_IFINDEX, parms->dev->ifindex);
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001728
Thomas Grafca860fb2006-08-07 18:00:18 -07001729 NLA_PUT_U32(skb, NDTPA_REFCNT, atomic_read(&parms->refcnt));
1730 NLA_PUT_U32(skb, NDTPA_QUEUE_LEN, parms->queue_len);
1731 NLA_PUT_U32(skb, NDTPA_PROXY_QLEN, parms->proxy_qlen);
1732 NLA_PUT_U32(skb, NDTPA_APP_PROBES, parms->app_probes);
1733 NLA_PUT_U32(skb, NDTPA_UCAST_PROBES, parms->ucast_probes);
1734 NLA_PUT_U32(skb, NDTPA_MCAST_PROBES, parms->mcast_probes);
1735 NLA_PUT_MSECS(skb, NDTPA_REACHABLE_TIME, parms->reachable_time);
1736 NLA_PUT_MSECS(skb, NDTPA_BASE_REACHABLE_TIME,
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001737 parms->base_reachable_time);
Thomas Grafca860fb2006-08-07 18:00:18 -07001738 NLA_PUT_MSECS(skb, NDTPA_GC_STALETIME, parms->gc_staletime);
1739 NLA_PUT_MSECS(skb, NDTPA_DELAY_PROBE_TIME, parms->delay_probe_time);
1740 NLA_PUT_MSECS(skb, NDTPA_RETRANS_TIME, parms->retrans_time);
1741 NLA_PUT_MSECS(skb, NDTPA_ANYCAST_DELAY, parms->anycast_delay);
1742 NLA_PUT_MSECS(skb, NDTPA_PROXY_DELAY, parms->proxy_delay);
1743 NLA_PUT_MSECS(skb, NDTPA_LOCKTIME, parms->locktime);
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001744
Thomas Grafca860fb2006-08-07 18:00:18 -07001745 return nla_nest_end(skb, nest);
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001746
Thomas Grafca860fb2006-08-07 18:00:18 -07001747nla_put_failure:
Thomas Grafbc3ed282008-06-03 16:36:54 -07001748 nla_nest_cancel(skb, nest);
1749 return -EMSGSIZE;
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001750}
1751
Thomas Grafca860fb2006-08-07 18:00:18 -07001752static int neightbl_fill_info(struct sk_buff *skb, struct neigh_table *tbl,
1753 u32 pid, u32 seq, int type, int flags)
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001754{
1755 struct nlmsghdr *nlh;
1756 struct ndtmsg *ndtmsg;
1757
Thomas Grafca860fb2006-08-07 18:00:18 -07001758 nlh = nlmsg_put(skb, pid, seq, type, sizeof(*ndtmsg), flags);
1759 if (nlh == NULL)
Patrick McHardy26932562007-01-31 23:16:40 -08001760 return -EMSGSIZE;
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001761
Thomas Grafca860fb2006-08-07 18:00:18 -07001762 ndtmsg = nlmsg_data(nlh);
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001763
1764 read_lock_bh(&tbl->lock);
1765 ndtmsg->ndtm_family = tbl->family;
Patrick McHardy9ef1d4c2005-06-28 12:55:30 -07001766 ndtmsg->ndtm_pad1 = 0;
1767 ndtmsg->ndtm_pad2 = 0;
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001768
Thomas Grafca860fb2006-08-07 18:00:18 -07001769 NLA_PUT_STRING(skb, NDTA_NAME, tbl->id);
1770 NLA_PUT_MSECS(skb, NDTA_GC_INTERVAL, tbl->gc_interval);
1771 NLA_PUT_U32(skb, NDTA_THRESH1, tbl->gc_thresh1);
1772 NLA_PUT_U32(skb, NDTA_THRESH2, tbl->gc_thresh2);
1773 NLA_PUT_U32(skb, NDTA_THRESH3, tbl->gc_thresh3);
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001774
1775 {
1776 unsigned long now = jiffies;
1777 unsigned int flush_delta = now - tbl->last_flush;
1778 unsigned int rand_delta = now - tbl->last_rand;
Eric Dumazetd6bf7812010-10-04 06:15:44 +00001779 struct neigh_hash_table *nht;
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001780 struct ndt_config ndc = {
1781 .ndtc_key_len = tbl->key_len,
1782 .ndtc_entry_size = tbl->entry_size,
1783 .ndtc_entries = atomic_read(&tbl->entries),
1784 .ndtc_last_flush = jiffies_to_msecs(flush_delta),
1785 .ndtc_last_rand = jiffies_to_msecs(rand_delta),
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001786 .ndtc_proxy_qlen = tbl->proxy_queue.qlen,
1787 };
1788
Eric Dumazetd6bf7812010-10-04 06:15:44 +00001789 rcu_read_lock_bh();
1790 nht = rcu_dereference_bh(tbl->nht);
1791 ndc.ndtc_hash_rnd = nht->hash_rnd;
David S. Millercd089332011-07-11 01:28:12 -07001792 ndc.ndtc_hash_mask = ((1 << nht->hash_shift) - 1);
Eric Dumazetd6bf7812010-10-04 06:15:44 +00001793 rcu_read_unlock_bh();
1794
Thomas Grafca860fb2006-08-07 18:00:18 -07001795 NLA_PUT(skb, NDTA_CONFIG, sizeof(ndc), &ndc);
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001796 }
1797
1798 {
1799 int cpu;
1800 struct ndt_stats ndst;
1801
1802 memset(&ndst, 0, sizeof(ndst));
1803
KAMEZAWA Hiroyuki6f912042006-04-10 22:52:50 -07001804 for_each_possible_cpu(cpu) {
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001805 struct neigh_statistics *st;
1806
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001807 st = per_cpu_ptr(tbl->stats, cpu);
1808 ndst.ndts_allocs += st->allocs;
1809 ndst.ndts_destroys += st->destroys;
1810 ndst.ndts_hash_grows += st->hash_grows;
1811 ndst.ndts_res_failed += st->res_failed;
1812 ndst.ndts_lookups += st->lookups;
1813 ndst.ndts_hits += st->hits;
1814 ndst.ndts_rcv_probes_mcast += st->rcv_probes_mcast;
1815 ndst.ndts_rcv_probes_ucast += st->rcv_probes_ucast;
1816 ndst.ndts_periodic_gc_runs += st->periodic_gc_runs;
1817 ndst.ndts_forced_gc_runs += st->forced_gc_runs;
1818 }
1819
Thomas Grafca860fb2006-08-07 18:00:18 -07001820 NLA_PUT(skb, NDTA_STATS, sizeof(ndst), &ndst);
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001821 }
1822
1823 BUG_ON(tbl->parms.dev);
1824 if (neightbl_fill_parms(skb, &tbl->parms) < 0)
Thomas Grafca860fb2006-08-07 18:00:18 -07001825 goto nla_put_failure;
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001826
1827 read_unlock_bh(&tbl->lock);
Thomas Grafca860fb2006-08-07 18:00:18 -07001828 return nlmsg_end(skb, nlh);
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001829
Thomas Grafca860fb2006-08-07 18:00:18 -07001830nla_put_failure:
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001831 read_unlock_bh(&tbl->lock);
Patrick McHardy26932562007-01-31 23:16:40 -08001832 nlmsg_cancel(skb, nlh);
1833 return -EMSGSIZE;
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001834}
1835
Thomas Grafca860fb2006-08-07 18:00:18 -07001836static int neightbl_fill_param_info(struct sk_buff *skb,
1837 struct neigh_table *tbl,
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001838 struct neigh_parms *parms,
Thomas Grafca860fb2006-08-07 18:00:18 -07001839 u32 pid, u32 seq, int type,
1840 unsigned int flags)
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001841{
1842 struct ndtmsg *ndtmsg;
1843 struct nlmsghdr *nlh;
1844
Thomas Grafca860fb2006-08-07 18:00:18 -07001845 nlh = nlmsg_put(skb, pid, seq, type, sizeof(*ndtmsg), flags);
1846 if (nlh == NULL)
Patrick McHardy26932562007-01-31 23:16:40 -08001847 return -EMSGSIZE;
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001848
Thomas Grafca860fb2006-08-07 18:00:18 -07001849 ndtmsg = nlmsg_data(nlh);
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001850
1851 read_lock_bh(&tbl->lock);
1852 ndtmsg->ndtm_family = tbl->family;
Patrick McHardy9ef1d4c2005-06-28 12:55:30 -07001853 ndtmsg->ndtm_pad1 = 0;
1854 ndtmsg->ndtm_pad2 = 0;
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001855
Thomas Grafca860fb2006-08-07 18:00:18 -07001856 if (nla_put_string(skb, NDTA_NAME, tbl->id) < 0 ||
1857 neightbl_fill_parms(skb, parms) < 0)
1858 goto errout;
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001859
1860 read_unlock_bh(&tbl->lock);
Thomas Grafca860fb2006-08-07 18:00:18 -07001861 return nlmsg_end(skb, nlh);
1862errout:
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001863 read_unlock_bh(&tbl->lock);
Patrick McHardy26932562007-01-31 23:16:40 -08001864 nlmsg_cancel(skb, nlh);
1865 return -EMSGSIZE;
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001866}
YOSHIFUJI Hideaki4ec93ed2007-02-09 23:24:36 +09001867
Patrick McHardyef7c79e2007-06-05 12:38:30 -07001868static const struct nla_policy nl_neightbl_policy[NDTA_MAX+1] = {
Thomas Graf6b3f8672006-08-07 17:58:53 -07001869 [NDTA_NAME] = { .type = NLA_STRING },
1870 [NDTA_THRESH1] = { .type = NLA_U32 },
1871 [NDTA_THRESH2] = { .type = NLA_U32 },
1872 [NDTA_THRESH3] = { .type = NLA_U32 },
1873 [NDTA_GC_INTERVAL] = { .type = NLA_U64 },
1874 [NDTA_PARMS] = { .type = NLA_NESTED },
1875};
1876
Patrick McHardyef7c79e2007-06-05 12:38:30 -07001877static const struct nla_policy nl_ntbl_parm_policy[NDTPA_MAX+1] = {
Thomas Graf6b3f8672006-08-07 17:58:53 -07001878 [NDTPA_IFINDEX] = { .type = NLA_U32 },
1879 [NDTPA_QUEUE_LEN] = { .type = NLA_U32 },
1880 [NDTPA_PROXY_QLEN] = { .type = NLA_U32 },
1881 [NDTPA_APP_PROBES] = { .type = NLA_U32 },
1882 [NDTPA_UCAST_PROBES] = { .type = NLA_U32 },
1883 [NDTPA_MCAST_PROBES] = { .type = NLA_U32 },
1884 [NDTPA_BASE_REACHABLE_TIME] = { .type = NLA_U64 },
1885 [NDTPA_GC_STALETIME] = { .type = NLA_U64 },
1886 [NDTPA_DELAY_PROBE_TIME] = { .type = NLA_U64 },
1887 [NDTPA_RETRANS_TIME] = { .type = NLA_U64 },
1888 [NDTPA_ANYCAST_DELAY] = { .type = NLA_U64 },
1889 [NDTPA_PROXY_DELAY] = { .type = NLA_U64 },
1890 [NDTPA_LOCKTIME] = { .type = NLA_U64 },
1891};
1892
Thomas Grafc8822a42007-03-22 11:50:06 -07001893static int neightbl_set(struct sk_buff *skb, struct nlmsghdr *nlh, void *arg)
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001894{
YOSHIFUJI Hideaki3b1e0a62008-03-26 02:26:21 +09001895 struct net *net = sock_net(skb->sk);
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001896 struct neigh_table *tbl;
Thomas Graf6b3f8672006-08-07 17:58:53 -07001897 struct ndtmsg *ndtmsg;
1898 struct nlattr *tb[NDTA_MAX+1];
1899 int err;
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001900
Thomas Graf6b3f8672006-08-07 17:58:53 -07001901 err = nlmsg_parse(nlh, sizeof(*ndtmsg), tb, NDTA_MAX,
1902 nl_neightbl_policy);
1903 if (err < 0)
1904 goto errout;
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001905
Thomas Graf6b3f8672006-08-07 17:58:53 -07001906 if (tb[NDTA_NAME] == NULL) {
1907 err = -EINVAL;
1908 goto errout;
1909 }
1910
1911 ndtmsg = nlmsg_data(nlh);
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001912 read_lock(&neigh_tbl_lock);
1913 for (tbl = neigh_tables; tbl; tbl = tbl->next) {
1914 if (ndtmsg->ndtm_family && tbl->family != ndtmsg->ndtm_family)
1915 continue;
1916
Thomas Graf6b3f8672006-08-07 17:58:53 -07001917 if (nla_strcmp(tb[NDTA_NAME], tbl->id) == 0)
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001918 break;
1919 }
1920
1921 if (tbl == NULL) {
1922 err = -ENOENT;
Thomas Graf6b3f8672006-08-07 17:58:53 -07001923 goto errout_locked;
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001924 }
1925
YOSHIFUJI Hideaki4ec93ed2007-02-09 23:24:36 +09001926 /*
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001927 * We acquire tbl->lock to be nice to the periodic timers and
1928 * make sure they always see a consistent set of values.
1929 */
1930 write_lock_bh(&tbl->lock);
1931
Thomas Graf6b3f8672006-08-07 17:58:53 -07001932 if (tb[NDTA_PARMS]) {
1933 struct nlattr *tbp[NDTPA_MAX+1];
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001934 struct neigh_parms *p;
Thomas Graf6b3f8672006-08-07 17:58:53 -07001935 int i, ifindex = 0;
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001936
Thomas Graf6b3f8672006-08-07 17:58:53 -07001937 err = nla_parse_nested(tbp, NDTPA_MAX, tb[NDTA_PARMS],
1938 nl_ntbl_parm_policy);
1939 if (err < 0)
1940 goto errout_tbl_lock;
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001941
Thomas Graf6b3f8672006-08-07 17:58:53 -07001942 if (tbp[NDTPA_IFINDEX])
1943 ifindex = nla_get_u32(tbp[NDTPA_IFINDEX]);
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001944
Tobias Klauser97fd5bc2009-07-13 11:17:49 -07001945 p = lookup_neigh_parms(tbl, net, ifindex);
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001946 if (p == NULL) {
1947 err = -ENOENT;
Thomas Graf6b3f8672006-08-07 17:58:53 -07001948 goto errout_tbl_lock;
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001949 }
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001950
Thomas Graf6b3f8672006-08-07 17:58:53 -07001951 for (i = 1; i <= NDTPA_MAX; i++) {
1952 if (tbp[i] == NULL)
1953 continue;
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001954
Thomas Graf6b3f8672006-08-07 17:58:53 -07001955 switch (i) {
1956 case NDTPA_QUEUE_LEN:
1957 p->queue_len = nla_get_u32(tbp[i]);
1958 break;
1959 case NDTPA_PROXY_QLEN:
1960 p->proxy_qlen = nla_get_u32(tbp[i]);
1961 break;
1962 case NDTPA_APP_PROBES:
1963 p->app_probes = nla_get_u32(tbp[i]);
1964 break;
1965 case NDTPA_UCAST_PROBES:
1966 p->ucast_probes = nla_get_u32(tbp[i]);
1967 break;
1968 case NDTPA_MCAST_PROBES:
1969 p->mcast_probes = nla_get_u32(tbp[i]);
1970 break;
1971 case NDTPA_BASE_REACHABLE_TIME:
1972 p->base_reachable_time = nla_get_msecs(tbp[i]);
1973 break;
1974 case NDTPA_GC_STALETIME:
1975 p->gc_staletime = nla_get_msecs(tbp[i]);
1976 break;
1977 case NDTPA_DELAY_PROBE_TIME:
1978 p->delay_probe_time = nla_get_msecs(tbp[i]);
1979 break;
1980 case NDTPA_RETRANS_TIME:
1981 p->retrans_time = nla_get_msecs(tbp[i]);
1982 break;
1983 case NDTPA_ANYCAST_DELAY:
1984 p->anycast_delay = nla_get_msecs(tbp[i]);
1985 break;
1986 case NDTPA_PROXY_DELAY:
1987 p->proxy_delay = nla_get_msecs(tbp[i]);
1988 break;
1989 case NDTPA_LOCKTIME:
1990 p->locktime = nla_get_msecs(tbp[i]);
1991 break;
1992 }
1993 }
Thomas Grafc7fb64d2005-06-18 22:50:55 -07001994 }
1995
Thomas Graf6b3f8672006-08-07 17:58:53 -07001996 if (tb[NDTA_THRESH1])
1997 tbl->gc_thresh1 = nla_get_u32(tb[NDTA_THRESH1]);
1998
1999 if (tb[NDTA_THRESH2])
2000 tbl->gc_thresh2 = nla_get_u32(tb[NDTA_THRESH2]);
2001
2002 if (tb[NDTA_THRESH3])
2003 tbl->gc_thresh3 = nla_get_u32(tb[NDTA_THRESH3]);
2004
2005 if (tb[NDTA_GC_INTERVAL])
2006 tbl->gc_interval = nla_get_msecs(tb[NDTA_GC_INTERVAL]);
2007
Thomas Grafc7fb64d2005-06-18 22:50:55 -07002008 err = 0;
2009
Thomas Graf6b3f8672006-08-07 17:58:53 -07002010errout_tbl_lock:
Thomas Grafc7fb64d2005-06-18 22:50:55 -07002011 write_unlock_bh(&tbl->lock);
Thomas Graf6b3f8672006-08-07 17:58:53 -07002012errout_locked:
Thomas Grafc7fb64d2005-06-18 22:50:55 -07002013 read_unlock(&neigh_tbl_lock);
Thomas Graf6b3f8672006-08-07 17:58:53 -07002014errout:
Thomas Grafc7fb64d2005-06-18 22:50:55 -07002015 return err;
2016}
2017
Thomas Grafc8822a42007-03-22 11:50:06 -07002018static int neightbl_dump_info(struct sk_buff *skb, struct netlink_callback *cb)
Thomas Grafc7fb64d2005-06-18 22:50:55 -07002019{
YOSHIFUJI Hideaki3b1e0a62008-03-26 02:26:21 +09002020 struct net *net = sock_net(skb->sk);
Thomas Grafca860fb2006-08-07 18:00:18 -07002021 int family, tidx, nidx = 0;
2022 int tbl_skip = cb->args[0];
2023 int neigh_skip = cb->args[1];
Thomas Grafc7fb64d2005-06-18 22:50:55 -07002024 struct neigh_table *tbl;
2025
Thomas Grafca860fb2006-08-07 18:00:18 -07002026 family = ((struct rtgenmsg *) nlmsg_data(cb->nlh))->rtgen_family;
Thomas Grafc7fb64d2005-06-18 22:50:55 -07002027
2028 read_lock(&neigh_tbl_lock);
Thomas Grafca860fb2006-08-07 18:00:18 -07002029 for (tbl = neigh_tables, tidx = 0; tbl; tbl = tbl->next, tidx++) {
Thomas Grafc7fb64d2005-06-18 22:50:55 -07002030 struct neigh_parms *p;
2031
Thomas Grafca860fb2006-08-07 18:00:18 -07002032 if (tidx < tbl_skip || (family && tbl->family != family))
Thomas Grafc7fb64d2005-06-18 22:50:55 -07002033 continue;
2034
Thomas Grafca860fb2006-08-07 18:00:18 -07002035 if (neightbl_fill_info(skb, tbl, NETLINK_CB(cb->skb).pid,
2036 cb->nlh->nlmsg_seq, RTM_NEWNEIGHTBL,
2037 NLM_F_MULTI) <= 0)
Thomas Grafc7fb64d2005-06-18 22:50:55 -07002038 break;
2039
Eric W. Biederman426b5302008-01-24 00:13:18 -08002040 for (nidx = 0, p = tbl->parms.next; p; p = p->next) {
YOSHIFUJI Hideaki878628f2008-03-26 03:57:35 +09002041 if (!net_eq(neigh_parms_net(p), net))
Eric W. Biederman426b5302008-01-24 00:13:18 -08002042 continue;
2043
Gautam Kachrooefc683f2009-02-06 00:52:04 -08002044 if (nidx < neigh_skip)
2045 goto next;
Thomas Grafc7fb64d2005-06-18 22:50:55 -07002046
Thomas Grafca860fb2006-08-07 18:00:18 -07002047 if (neightbl_fill_param_info(skb, tbl, p,
2048 NETLINK_CB(cb->skb).pid,
2049 cb->nlh->nlmsg_seq,
2050 RTM_NEWNEIGHTBL,
2051 NLM_F_MULTI) <= 0)
Thomas Grafc7fb64d2005-06-18 22:50:55 -07002052 goto out;
Gautam Kachrooefc683f2009-02-06 00:52:04 -08002053 next:
2054 nidx++;
Thomas Grafc7fb64d2005-06-18 22:50:55 -07002055 }
2056
Thomas Grafca860fb2006-08-07 18:00:18 -07002057 neigh_skip = 0;
Thomas Grafc7fb64d2005-06-18 22:50:55 -07002058 }
2059out:
2060 read_unlock(&neigh_tbl_lock);
Thomas Grafca860fb2006-08-07 18:00:18 -07002061 cb->args[0] = tidx;
2062 cb->args[1] = nidx;
Thomas Grafc7fb64d2005-06-18 22:50:55 -07002063
2064 return skb->len;
2065}
Linus Torvalds1da177e2005-04-16 15:20:36 -07002066
Thomas Graf8b8aec52006-08-07 17:56:37 -07002067static int neigh_fill_info(struct sk_buff *skb, struct neighbour *neigh,
2068 u32 pid, u32 seq, int type, unsigned int flags)
Linus Torvalds1da177e2005-04-16 15:20:36 -07002069{
2070 unsigned long now = jiffies;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002071 struct nda_cacheinfo ci;
Thomas Graf8b8aec52006-08-07 17:56:37 -07002072 struct nlmsghdr *nlh;
2073 struct ndmsg *ndm;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002074
Thomas Graf8b8aec52006-08-07 17:56:37 -07002075 nlh = nlmsg_put(skb, pid, seq, type, sizeof(*ndm), flags);
2076 if (nlh == NULL)
Patrick McHardy26932562007-01-31 23:16:40 -08002077 return -EMSGSIZE;
Thomas Graf8b8aec52006-08-07 17:56:37 -07002078
2079 ndm = nlmsg_data(nlh);
2080 ndm->ndm_family = neigh->ops->family;
Patrick McHardy9ef1d4c2005-06-28 12:55:30 -07002081 ndm->ndm_pad1 = 0;
2082 ndm->ndm_pad2 = 0;
Thomas Graf8b8aec52006-08-07 17:56:37 -07002083 ndm->ndm_flags = neigh->flags;
2084 ndm->ndm_type = neigh->type;
2085 ndm->ndm_ifindex = neigh->dev->ifindex;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002086
Thomas Graf8b8aec52006-08-07 17:56:37 -07002087 NLA_PUT(skb, NDA_DST, neigh->tbl->key_len, neigh->primary_key);
2088
2089 read_lock_bh(&neigh->lock);
2090 ndm->ndm_state = neigh->nud_state;
Eric Dumazet0ed8ddf2010-10-07 10:44:07 +00002091 if (neigh->nud_state & NUD_VALID) {
2092 char haddr[MAX_ADDR_LEN];
2093
2094 neigh_ha_snapshot(haddr, neigh, neigh->dev);
2095 if (nla_put(skb, NDA_LLADDR, neigh->dev->addr_len, haddr) < 0) {
2096 read_unlock_bh(&neigh->lock);
2097 goto nla_put_failure;
2098 }
Thomas Graf8b8aec52006-08-07 17:56:37 -07002099 }
2100
Stephen Hemmingerb9f5f522008-06-03 16:03:15 -07002101 ci.ndm_used = jiffies_to_clock_t(now - neigh->used);
2102 ci.ndm_confirmed = jiffies_to_clock_t(now - neigh->confirmed);
2103 ci.ndm_updated = jiffies_to_clock_t(now - neigh->updated);
Thomas Graf8b8aec52006-08-07 17:56:37 -07002104 ci.ndm_refcnt = atomic_read(&neigh->refcnt) - 1;
2105 read_unlock_bh(&neigh->lock);
2106
2107 NLA_PUT_U32(skb, NDA_PROBES, atomic_read(&neigh->probes));
2108 NLA_PUT(skb, NDA_CACHEINFO, sizeof(ci), &ci);
2109
2110 return nlmsg_end(skb, nlh);
2111
2112nla_put_failure:
Patrick McHardy26932562007-01-31 23:16:40 -08002113 nlmsg_cancel(skb, nlh);
2114 return -EMSGSIZE;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002115}
2116
Thomas Grafd961db32007-08-08 23:12:56 -07002117static void neigh_update_notify(struct neighbour *neigh)
2118{
2119 call_netevent_notifiers(NETEVENT_NEIGH_UPDATE, neigh);
2120 __neigh_notify(neigh, RTM_NEWNEIGH, 0);
2121}
Linus Torvalds1da177e2005-04-16 15:20:36 -07002122
2123static int neigh_dump_table(struct neigh_table *tbl, struct sk_buff *skb,
2124 struct netlink_callback *cb)
2125{
Eric Dumazet767e97e2010-10-06 17:49:21 -07002126 struct net *net = sock_net(skb->sk);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002127 struct neighbour *n;
2128 int rc, h, s_h = cb->args[1];
2129 int idx, s_idx = idx = cb->args[2];
Eric Dumazetd6bf7812010-10-04 06:15:44 +00002130 struct neigh_hash_table *nht;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002131
Eric Dumazetd6bf7812010-10-04 06:15:44 +00002132 rcu_read_lock_bh();
2133 nht = rcu_dereference_bh(tbl->nht);
2134
David S. Millercd089332011-07-11 01:28:12 -07002135 for (h = 0; h < (1 << nht->hash_shift); h++) {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002136 if (h < s_h)
2137 continue;
2138 if (h > s_h)
2139 s_idx = 0;
Eric Dumazet767e97e2010-10-06 17:49:21 -07002140 for (n = rcu_dereference_bh(nht->hash_buckets[h]), idx = 0;
2141 n != NULL;
2142 n = rcu_dereference_bh(n->next)) {
Octavian Purdila09ad9bc2009-11-25 15:14:13 -08002143 if (!net_eq(dev_net(n->dev), net))
Eric W. Biederman426b5302008-01-24 00:13:18 -08002144 continue;
Gautam Kachrooefc683f2009-02-06 00:52:04 -08002145 if (idx < s_idx)
2146 goto next;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002147 if (neigh_fill_info(skb, n, NETLINK_CB(cb->skb).pid,
2148 cb->nlh->nlmsg_seq,
Jamal Hadi Salimb6544c02005-06-18 22:54:12 -07002149 RTM_NEWNEIGH,
2150 NLM_F_MULTI) <= 0) {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002151 rc = -1;
2152 goto out;
2153 }
Eric Dumazet767e97e2010-10-06 17:49:21 -07002154next:
Gautam Kachrooefc683f2009-02-06 00:52:04 -08002155 idx++;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002156 }
Linus Torvalds1da177e2005-04-16 15:20:36 -07002157 }
2158 rc = skb->len;
2159out:
Eric Dumazetd6bf7812010-10-04 06:15:44 +00002160 rcu_read_unlock_bh();
Linus Torvalds1da177e2005-04-16 15:20:36 -07002161 cb->args[1] = h;
2162 cb->args[2] = idx;
2163 return rc;
2164}
2165
Thomas Grafc8822a42007-03-22 11:50:06 -07002166static int neigh_dump_info(struct sk_buff *skb, struct netlink_callback *cb)
Linus Torvalds1da177e2005-04-16 15:20:36 -07002167{
2168 struct neigh_table *tbl;
2169 int t, family, s_t;
2170
2171 read_lock(&neigh_tbl_lock);
Thomas Graf8b8aec52006-08-07 17:56:37 -07002172 family = ((struct rtgenmsg *) nlmsg_data(cb->nlh))->rtgen_family;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002173 s_t = cb->args[0];
2174
2175 for (tbl = neigh_tables, t = 0; tbl; tbl = tbl->next, t++) {
2176 if (t < s_t || (family && tbl->family != family))
2177 continue;
2178 if (t > s_t)
2179 memset(&cb->args[1], 0, sizeof(cb->args) -
2180 sizeof(cb->args[0]));
2181 if (neigh_dump_table(tbl, skb, cb) < 0)
2182 break;
2183 }
2184 read_unlock(&neigh_tbl_lock);
2185
2186 cb->args[0] = t;
2187 return skb->len;
2188}
2189
2190void neigh_for_each(struct neigh_table *tbl, void (*cb)(struct neighbour *, void *), void *cookie)
2191{
2192 int chain;
Eric Dumazetd6bf7812010-10-04 06:15:44 +00002193 struct neigh_hash_table *nht;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002194
Eric Dumazetd6bf7812010-10-04 06:15:44 +00002195 rcu_read_lock_bh();
2196 nht = rcu_dereference_bh(tbl->nht);
2197
Eric Dumazet767e97e2010-10-06 17:49:21 -07002198 read_lock(&tbl->lock); /* avoid resizes */
David S. Millercd089332011-07-11 01:28:12 -07002199 for (chain = 0; chain < (1 << nht->hash_shift); chain++) {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002200 struct neighbour *n;
2201
Eric Dumazet767e97e2010-10-06 17:49:21 -07002202 for (n = rcu_dereference_bh(nht->hash_buckets[chain]);
2203 n != NULL;
2204 n = rcu_dereference_bh(n->next))
Linus Torvalds1da177e2005-04-16 15:20:36 -07002205 cb(n, cookie);
2206 }
Eric Dumazetd6bf7812010-10-04 06:15:44 +00002207 read_unlock(&tbl->lock);
2208 rcu_read_unlock_bh();
Linus Torvalds1da177e2005-04-16 15:20:36 -07002209}
2210EXPORT_SYMBOL(neigh_for_each);
2211
2212/* The tbl->lock must be held as a writer and BH disabled. */
2213void __neigh_for_each_release(struct neigh_table *tbl,
2214 int (*cb)(struct neighbour *))
2215{
2216 int chain;
Eric Dumazetd6bf7812010-10-04 06:15:44 +00002217 struct neigh_hash_table *nht;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002218
Eric Dumazetd6bf7812010-10-04 06:15:44 +00002219 nht = rcu_dereference_protected(tbl->nht,
2220 lockdep_is_held(&tbl->lock));
David S. Millercd089332011-07-11 01:28:12 -07002221 for (chain = 0; chain < (1 << nht->hash_shift); chain++) {
Eric Dumazet767e97e2010-10-06 17:49:21 -07002222 struct neighbour *n;
2223 struct neighbour __rcu **np;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002224
Eric Dumazetd6bf7812010-10-04 06:15:44 +00002225 np = &nht->hash_buckets[chain];
Eric Dumazet767e97e2010-10-06 17:49:21 -07002226 while ((n = rcu_dereference_protected(*np,
2227 lockdep_is_held(&tbl->lock))) != NULL) {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002228 int release;
2229
2230 write_lock(&n->lock);
2231 release = cb(n);
2232 if (release) {
Eric Dumazet767e97e2010-10-06 17:49:21 -07002233 rcu_assign_pointer(*np,
2234 rcu_dereference_protected(n->next,
2235 lockdep_is_held(&tbl->lock)));
Linus Torvalds1da177e2005-04-16 15:20:36 -07002236 n->dead = 1;
2237 } else
2238 np = &n->next;
2239 write_unlock(&n->lock);
Thomas Graf4f494552007-08-08 23:12:36 -07002240 if (release)
2241 neigh_cleanup_and_release(n);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002242 }
2243 }
2244}
2245EXPORT_SYMBOL(__neigh_for_each_release);
2246
2247#ifdef CONFIG_PROC_FS
2248
2249static struct neighbour *neigh_get_first(struct seq_file *seq)
2250{
2251 struct neigh_seq_state *state = seq->private;
YOSHIFUJI Hideaki12188542008-03-26 02:36:06 +09002252 struct net *net = seq_file_net(seq);
Eric Dumazetd6bf7812010-10-04 06:15:44 +00002253 struct neigh_hash_table *nht = state->nht;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002254 struct neighbour *n = NULL;
2255 int bucket = state->bucket;
2256
2257 state->flags &= ~NEIGH_SEQ_IS_PNEIGH;
David S. Millercd089332011-07-11 01:28:12 -07002258 for (bucket = 0; bucket < (1 << nht->hash_shift); bucket++) {
Eric Dumazet767e97e2010-10-06 17:49:21 -07002259 n = rcu_dereference_bh(nht->hash_buckets[bucket]);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002260
2261 while (n) {
YOSHIFUJI Hideaki878628f2008-03-26 03:57:35 +09002262 if (!net_eq(dev_net(n->dev), net))
Eric W. Biederman426b5302008-01-24 00:13:18 -08002263 goto next;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002264 if (state->neigh_sub_iter) {
2265 loff_t fakep = 0;
2266 void *v;
2267
2268 v = state->neigh_sub_iter(state, n, &fakep);
2269 if (!v)
2270 goto next;
2271 }
2272 if (!(state->flags & NEIGH_SEQ_SKIP_NOARP))
2273 break;
2274 if (n->nud_state & ~NUD_NOARP)
2275 break;
Eric Dumazet767e97e2010-10-06 17:49:21 -07002276next:
2277 n = rcu_dereference_bh(n->next);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002278 }
2279
2280 if (n)
2281 break;
2282 }
2283 state->bucket = bucket;
2284
2285 return n;
2286}
2287
2288static struct neighbour *neigh_get_next(struct seq_file *seq,
2289 struct neighbour *n,
2290 loff_t *pos)
2291{
2292 struct neigh_seq_state *state = seq->private;
YOSHIFUJI Hideaki12188542008-03-26 02:36:06 +09002293 struct net *net = seq_file_net(seq);
Eric Dumazetd6bf7812010-10-04 06:15:44 +00002294 struct neigh_hash_table *nht = state->nht;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002295
2296 if (state->neigh_sub_iter) {
2297 void *v = state->neigh_sub_iter(state, n, pos);
2298 if (v)
2299 return n;
2300 }
Eric Dumazet767e97e2010-10-06 17:49:21 -07002301 n = rcu_dereference_bh(n->next);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002302
2303 while (1) {
2304 while (n) {
YOSHIFUJI Hideaki878628f2008-03-26 03:57:35 +09002305 if (!net_eq(dev_net(n->dev), net))
Eric W. Biederman426b5302008-01-24 00:13:18 -08002306 goto next;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002307 if (state->neigh_sub_iter) {
2308 void *v = state->neigh_sub_iter(state, n, pos);
2309 if (v)
2310 return n;
2311 goto next;
2312 }
2313 if (!(state->flags & NEIGH_SEQ_SKIP_NOARP))
2314 break;
2315
2316 if (n->nud_state & ~NUD_NOARP)
2317 break;
Eric Dumazet767e97e2010-10-06 17:49:21 -07002318next:
2319 n = rcu_dereference_bh(n->next);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002320 }
2321
2322 if (n)
2323 break;
2324
David S. Millercd089332011-07-11 01:28:12 -07002325 if (++state->bucket >= (1 << nht->hash_shift))
Linus Torvalds1da177e2005-04-16 15:20:36 -07002326 break;
2327
Eric Dumazet767e97e2010-10-06 17:49:21 -07002328 n = rcu_dereference_bh(nht->hash_buckets[state->bucket]);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002329 }
2330
2331 if (n && pos)
2332 --(*pos);
2333 return n;
2334}
2335
2336static struct neighbour *neigh_get_idx(struct seq_file *seq, loff_t *pos)
2337{
2338 struct neighbour *n = neigh_get_first(seq);
2339
2340 if (n) {
Chris Larson745e2032008-08-03 01:10:55 -07002341 --(*pos);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002342 while (*pos) {
2343 n = neigh_get_next(seq, n, pos);
2344 if (!n)
2345 break;
2346 }
2347 }
2348 return *pos ? NULL : n;
2349}
2350
2351static struct pneigh_entry *pneigh_get_first(struct seq_file *seq)
2352{
2353 struct neigh_seq_state *state = seq->private;
YOSHIFUJI Hideaki12188542008-03-26 02:36:06 +09002354 struct net *net = seq_file_net(seq);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002355 struct neigh_table *tbl = state->tbl;
2356 struct pneigh_entry *pn = NULL;
2357 int bucket = state->bucket;
2358
2359 state->flags |= NEIGH_SEQ_IS_PNEIGH;
2360 for (bucket = 0; bucket <= PNEIGH_HASHMASK; bucket++) {
2361 pn = tbl->phash_buckets[bucket];
YOSHIFUJI Hideaki878628f2008-03-26 03:57:35 +09002362 while (pn && !net_eq(pneigh_net(pn), net))
Eric W. Biederman426b5302008-01-24 00:13:18 -08002363 pn = pn->next;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002364 if (pn)
2365 break;
2366 }
2367 state->bucket = bucket;
2368
2369 return pn;
2370}
2371
2372static struct pneigh_entry *pneigh_get_next(struct seq_file *seq,
2373 struct pneigh_entry *pn,
2374 loff_t *pos)
2375{
2376 struct neigh_seq_state *state = seq->private;
YOSHIFUJI Hideaki12188542008-03-26 02:36:06 +09002377 struct net *net = seq_file_net(seq);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002378 struct neigh_table *tbl = state->tbl;
2379
2380 pn = pn->next;
2381 while (!pn) {
2382 if (++state->bucket > PNEIGH_HASHMASK)
2383 break;
2384 pn = tbl->phash_buckets[state->bucket];
YOSHIFUJI Hideaki878628f2008-03-26 03:57:35 +09002385 while (pn && !net_eq(pneigh_net(pn), net))
Eric W. Biederman426b5302008-01-24 00:13:18 -08002386 pn = pn->next;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002387 if (pn)
2388 break;
2389 }
2390
2391 if (pn && pos)
2392 --(*pos);
2393
2394 return pn;
2395}
2396
2397static struct pneigh_entry *pneigh_get_idx(struct seq_file *seq, loff_t *pos)
2398{
2399 struct pneigh_entry *pn = pneigh_get_first(seq);
2400
2401 if (pn) {
Chris Larson745e2032008-08-03 01:10:55 -07002402 --(*pos);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002403 while (*pos) {
2404 pn = pneigh_get_next(seq, pn, pos);
2405 if (!pn)
2406 break;
2407 }
2408 }
2409 return *pos ? NULL : pn;
2410}
2411
2412static void *neigh_get_idx_any(struct seq_file *seq, loff_t *pos)
2413{
2414 struct neigh_seq_state *state = seq->private;
2415 void *rc;
Chris Larson745e2032008-08-03 01:10:55 -07002416 loff_t idxpos = *pos;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002417
Chris Larson745e2032008-08-03 01:10:55 -07002418 rc = neigh_get_idx(seq, &idxpos);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002419 if (!rc && !(state->flags & NEIGH_SEQ_NEIGH_ONLY))
Chris Larson745e2032008-08-03 01:10:55 -07002420 rc = pneigh_get_idx(seq, &idxpos);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002421
2422 return rc;
2423}
2424
2425void *neigh_seq_start(struct seq_file *seq, loff_t *pos, struct neigh_table *tbl, unsigned int neigh_seq_flags)
Eric Dumazetd6bf7812010-10-04 06:15:44 +00002426 __acquires(rcu_bh)
Linus Torvalds1da177e2005-04-16 15:20:36 -07002427{
2428 struct neigh_seq_state *state = seq->private;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002429
2430 state->tbl = tbl;
2431 state->bucket = 0;
2432 state->flags = (neigh_seq_flags & ~NEIGH_SEQ_IS_PNEIGH);
2433
Eric Dumazetd6bf7812010-10-04 06:15:44 +00002434 rcu_read_lock_bh();
2435 state->nht = rcu_dereference_bh(tbl->nht);
Eric Dumazet767e97e2010-10-06 17:49:21 -07002436
Chris Larson745e2032008-08-03 01:10:55 -07002437 return *pos ? neigh_get_idx_any(seq, pos) : SEQ_START_TOKEN;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002438}
2439EXPORT_SYMBOL(neigh_seq_start);
2440
2441void *neigh_seq_next(struct seq_file *seq, void *v, loff_t *pos)
2442{
2443 struct neigh_seq_state *state;
2444 void *rc;
2445
2446 if (v == SEQ_START_TOKEN) {
Chris Larsonbff69732008-08-03 01:02:41 -07002447 rc = neigh_get_first(seq);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002448 goto out;
2449 }
2450
2451 state = seq->private;
2452 if (!(state->flags & NEIGH_SEQ_IS_PNEIGH)) {
2453 rc = neigh_get_next(seq, v, NULL);
2454 if (rc)
2455 goto out;
2456 if (!(state->flags & NEIGH_SEQ_NEIGH_ONLY))
2457 rc = pneigh_get_first(seq);
2458 } else {
2459 BUG_ON(state->flags & NEIGH_SEQ_NEIGH_ONLY);
2460 rc = pneigh_get_next(seq, v, NULL);
2461 }
2462out:
2463 ++(*pos);
2464 return rc;
2465}
2466EXPORT_SYMBOL(neigh_seq_next);
2467
2468void neigh_seq_stop(struct seq_file *seq, void *v)
Eric Dumazetd6bf7812010-10-04 06:15:44 +00002469 __releases(rcu_bh)
Linus Torvalds1da177e2005-04-16 15:20:36 -07002470{
Eric Dumazetd6bf7812010-10-04 06:15:44 +00002471 rcu_read_unlock_bh();
Linus Torvalds1da177e2005-04-16 15:20:36 -07002472}
2473EXPORT_SYMBOL(neigh_seq_stop);
2474
2475/* statistics via seq_file */
2476
2477static void *neigh_stat_seq_start(struct seq_file *seq, loff_t *pos)
2478{
Alexey Dobriyan81c1ebf2010-01-22 10:16:05 +00002479 struct neigh_table *tbl = seq->private;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002480 int cpu;
2481
2482 if (*pos == 0)
2483 return SEQ_START_TOKEN;
YOSHIFUJI Hideaki4ec93ed2007-02-09 23:24:36 +09002484
Rusty Russell0f23174a2008-12-29 12:23:42 +00002485 for (cpu = *pos-1; cpu < nr_cpu_ids; ++cpu) {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002486 if (!cpu_possible(cpu))
2487 continue;
2488 *pos = cpu+1;
2489 return per_cpu_ptr(tbl->stats, cpu);
2490 }
2491 return NULL;
2492}
2493
2494static void *neigh_stat_seq_next(struct seq_file *seq, void *v, loff_t *pos)
2495{
Alexey Dobriyan81c1ebf2010-01-22 10:16:05 +00002496 struct neigh_table *tbl = seq->private;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002497 int cpu;
2498
Rusty Russell0f23174a2008-12-29 12:23:42 +00002499 for (cpu = *pos; cpu < nr_cpu_ids; ++cpu) {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002500 if (!cpu_possible(cpu))
2501 continue;
2502 *pos = cpu+1;
2503 return per_cpu_ptr(tbl->stats, cpu);
2504 }
2505 return NULL;
2506}
2507
/* ->stop for the per-cpu statistics file: intentionally does nothing. */
static void neigh_stat_seq_stop(struct seq_file *seq, void *v)
{
}
2512
2513static int neigh_stat_seq_show(struct seq_file *seq, void *v)
2514{
Alexey Dobriyan81c1ebf2010-01-22 10:16:05 +00002515 struct neigh_table *tbl = seq->private;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002516 struct neigh_statistics *st = v;
2517
2518 if (v == SEQ_START_TOKEN) {
Neil Horman9a6d2762008-07-16 20:50:49 -07002519 seq_printf(seq, "entries allocs destroys hash_grows lookups hits res_failed rcv_probes_mcast rcv_probes_ucast periodic_gc_runs forced_gc_runs unresolved_discards\n");
Linus Torvalds1da177e2005-04-16 15:20:36 -07002520 return 0;
2521 }
2522
2523 seq_printf(seq, "%08x %08lx %08lx %08lx %08lx %08lx %08lx "
Neil Horman9a6d2762008-07-16 20:50:49 -07002524 "%08lx %08lx %08lx %08lx %08lx\n",
Linus Torvalds1da177e2005-04-16 15:20:36 -07002525 atomic_read(&tbl->entries),
2526
2527 st->allocs,
2528 st->destroys,
2529 st->hash_grows,
2530
2531 st->lookups,
2532 st->hits,
2533
2534 st->res_failed,
2535
2536 st->rcv_probes_mcast,
2537 st->rcv_probes_ucast,
2538
2539 st->periodic_gc_runs,
Neil Horman9a6d2762008-07-16 20:50:49 -07002540 st->forced_gc_runs,
2541 st->unres_discards
Linus Torvalds1da177e2005-04-16 15:20:36 -07002542 );
2543
2544 return 0;
2545}
2546
Stephen Hemmingerf6908082007-03-12 14:34:29 -07002547static const struct seq_operations neigh_stat_seq_ops = {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002548 .start = neigh_stat_seq_start,
2549 .next = neigh_stat_seq_next,
2550 .stop = neigh_stat_seq_stop,
2551 .show = neigh_stat_seq_show,
2552};
2553
2554static int neigh_stat_seq_open(struct inode *inode, struct file *file)
2555{
2556 int ret = seq_open(file, &neigh_stat_seq_ops);
2557
2558 if (!ret) {
2559 struct seq_file *sf = file->private_data;
Alexey Dobriyan81c1ebf2010-01-22 10:16:05 +00002560 sf->private = PDE(inode)->data;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002561 }
2562 return ret;
2563};
2564
Arjan van de Ven9a321442007-02-12 00:55:35 -08002565static const struct file_operations neigh_stat_seq_fops = {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002566 .owner = THIS_MODULE,
2567 .open = neigh_stat_seq_open,
2568 .read = seq_read,
2569 .llseek = seq_lseek,
2570 .release = seq_release,
2571};
2572
2573#endif /* CONFIG_PROC_FS */
2574
Thomas Graf339bf982006-11-10 14:10:15 -08002575static inline size_t neigh_nlmsg_size(void)
2576{
2577 return NLMSG_ALIGN(sizeof(struct ndmsg))
2578 + nla_total_size(MAX_ADDR_LEN) /* NDA_DST */
2579 + nla_total_size(MAX_ADDR_LEN) /* NDA_LLADDR */
2580 + nla_total_size(sizeof(struct nda_cacheinfo))
2581 + nla_total_size(4); /* NDA_PROBES */
2582}
2583
Thomas Grafb8673312006-08-15 00:33:14 -07002584static void __neigh_notify(struct neighbour *n, int type, int flags)
Linus Torvalds1da177e2005-04-16 15:20:36 -07002585{
YOSHIFUJI Hideakic346dca2008-03-25 21:47:49 +09002586 struct net *net = dev_net(n->dev);
Thomas Graf8b8aec52006-08-07 17:56:37 -07002587 struct sk_buff *skb;
Thomas Grafb8673312006-08-15 00:33:14 -07002588 int err = -ENOBUFS;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002589
Thomas Graf339bf982006-11-10 14:10:15 -08002590 skb = nlmsg_new(neigh_nlmsg_size(), GFP_ATOMIC);
Thomas Graf8b8aec52006-08-07 17:56:37 -07002591 if (skb == NULL)
Thomas Grafb8673312006-08-15 00:33:14 -07002592 goto errout;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002593
Thomas Grafb8673312006-08-15 00:33:14 -07002594 err = neigh_fill_info(skb, n, 0, 0, type, flags);
Patrick McHardy26932562007-01-31 23:16:40 -08002595 if (err < 0) {
2596 /* -EMSGSIZE implies BUG in neigh_nlmsg_size() */
2597 WARN_ON(err == -EMSGSIZE);
2598 kfree_skb(skb);
2599 goto errout;
2600 }
Pablo Neira Ayuso1ce85fe2009-02-24 23:18:28 -08002601 rtnl_notify(skb, net, 0, RTNLGRP_NEIGH, NULL, GFP_ATOMIC);
2602 return;
Thomas Grafb8673312006-08-15 00:33:14 -07002603errout:
2604 if (err < 0)
Eric W. Biederman426b5302008-01-24 00:13:18 -08002605 rtnl_set_sk_err(net, RTNLGRP_NEIGH, err);
Thomas Grafb8673312006-08-15 00:33:14 -07002606}
2607
#ifdef CONFIG_ARPD
/*
 * Emit an RTM_GETNEIGH message flagged NLM_F_REQUEST for neighbour @n to
 * the neighbour netlink group.
 */
void neigh_app_ns(struct neighbour *n)
{
	__neigh_notify(n, RTM_GETNEIGH, NLM_F_REQUEST);
}
EXPORT_SYMBOL(neigh_app_ns);
#endif /* CONFIG_ARPD */
2615
2616#ifdef CONFIG_SYSCTL
2617
Eric W. Biederman54716e32010-02-14 03:27:03 +00002618#define NEIGH_VARS_MAX 19
2619
Linus Torvalds1da177e2005-04-16 15:20:36 -07002620static struct neigh_sysctl_table {
2621 struct ctl_table_header *sysctl_header;
Eric W. Biederman54716e32010-02-14 03:27:03 +00002622 struct ctl_table neigh_vars[NEIGH_VARS_MAX];
Pavel Emelyanovc3bac5a2007-12-02 00:08:16 +11002623 char *dev_name;
Brian Haleyab32ea52006-09-22 14:15:41 -07002624} neigh_sysctl_template __read_mostly = {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002625 .neigh_vars = {
2626 {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002627 .procname = "mcast_solicit",
2628 .maxlen = sizeof(int),
2629 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -08002630 .proc_handler = proc_dointvec,
Linus Torvalds1da177e2005-04-16 15:20:36 -07002631 },
2632 {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002633 .procname = "ucast_solicit",
2634 .maxlen = sizeof(int),
2635 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -08002636 .proc_handler = proc_dointvec,
Linus Torvalds1da177e2005-04-16 15:20:36 -07002637 },
2638 {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002639 .procname = "app_solicit",
2640 .maxlen = sizeof(int),
2641 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -08002642 .proc_handler = proc_dointvec,
Linus Torvalds1da177e2005-04-16 15:20:36 -07002643 },
2644 {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002645 .procname = "retrans_time",
2646 .maxlen = sizeof(int),
2647 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -08002648 .proc_handler = proc_dointvec_userhz_jiffies,
Linus Torvalds1da177e2005-04-16 15:20:36 -07002649 },
2650 {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002651 .procname = "base_reachable_time",
2652 .maxlen = sizeof(int),
2653 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -08002654 .proc_handler = proc_dointvec_jiffies,
Linus Torvalds1da177e2005-04-16 15:20:36 -07002655 },
2656 {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002657 .procname = "delay_first_probe_time",
2658 .maxlen = sizeof(int),
2659 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -08002660 .proc_handler = proc_dointvec_jiffies,
Linus Torvalds1da177e2005-04-16 15:20:36 -07002661 },
2662 {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002663 .procname = "gc_stale_time",
2664 .maxlen = sizeof(int),
2665 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -08002666 .proc_handler = proc_dointvec_jiffies,
Linus Torvalds1da177e2005-04-16 15:20:36 -07002667 },
2668 {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002669 .procname = "unres_qlen",
2670 .maxlen = sizeof(int),
2671 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -08002672 .proc_handler = proc_dointvec,
Linus Torvalds1da177e2005-04-16 15:20:36 -07002673 },
2674 {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002675 .procname = "proxy_qlen",
2676 .maxlen = sizeof(int),
2677 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -08002678 .proc_handler = proc_dointvec,
Linus Torvalds1da177e2005-04-16 15:20:36 -07002679 },
2680 {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002681 .procname = "anycast_delay",
2682 .maxlen = sizeof(int),
2683 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -08002684 .proc_handler = proc_dointvec_userhz_jiffies,
Linus Torvalds1da177e2005-04-16 15:20:36 -07002685 },
2686 {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002687 .procname = "proxy_delay",
2688 .maxlen = sizeof(int),
2689 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -08002690 .proc_handler = proc_dointvec_userhz_jiffies,
Linus Torvalds1da177e2005-04-16 15:20:36 -07002691 },
2692 {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002693 .procname = "locktime",
2694 .maxlen = sizeof(int),
2695 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -08002696 .proc_handler = proc_dointvec_userhz_jiffies,
Linus Torvalds1da177e2005-04-16 15:20:36 -07002697 },
2698 {
Eric W. Biedermand12af672007-10-18 03:05:25 -07002699 .procname = "retrans_time_ms",
2700 .maxlen = sizeof(int),
2701 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -08002702 .proc_handler = proc_dointvec_ms_jiffies,
Eric W. Biedermand12af672007-10-18 03:05:25 -07002703 },
2704 {
Eric W. Biedermand12af672007-10-18 03:05:25 -07002705 .procname = "base_reachable_time_ms",
2706 .maxlen = sizeof(int),
2707 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -08002708 .proc_handler = proc_dointvec_ms_jiffies,
Eric W. Biedermand12af672007-10-18 03:05:25 -07002709 },
2710 {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002711 .procname = "gc_interval",
2712 .maxlen = sizeof(int),
2713 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -08002714 .proc_handler = proc_dointvec_jiffies,
Linus Torvalds1da177e2005-04-16 15:20:36 -07002715 },
2716 {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002717 .procname = "gc_thresh1",
2718 .maxlen = sizeof(int),
2719 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -08002720 .proc_handler = proc_dointvec,
Linus Torvalds1da177e2005-04-16 15:20:36 -07002721 },
2722 {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002723 .procname = "gc_thresh2",
2724 .maxlen = sizeof(int),
2725 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -08002726 .proc_handler = proc_dointvec,
Linus Torvalds1da177e2005-04-16 15:20:36 -07002727 },
2728 {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002729 .procname = "gc_thresh3",
2730 .maxlen = sizeof(int),
2731 .mode = 0644,
Alexey Dobriyan6d9f2392008-11-03 18:21:05 -08002732 .proc_handler = proc_dointvec,
Linus Torvalds1da177e2005-04-16 15:20:36 -07002733 },
Pavel Emelyanovc3bac5a2007-12-02 00:08:16 +11002734 {},
Linus Torvalds1da177e2005-04-16 15:20:36 -07002735 },
2736};
2737
2738int neigh_sysctl_register(struct net_device *dev, struct neigh_parms *p,
Eric W. Biederman54716e32010-02-14 03:27:03 +00002739 char *p_name, proc_handler *handler)
Linus Torvalds1da177e2005-04-16 15:20:36 -07002740{
Pavel Emelyanov3c607bb2007-12-02 00:06:34 +11002741 struct neigh_sysctl_table *t;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002742 const char *dev_name_source = NULL;
Pavel Emelyanovc3bac5a2007-12-02 00:08:16 +11002743
2744#define NEIGH_CTL_PATH_ROOT 0
2745#define NEIGH_CTL_PATH_PROTO 1
2746#define NEIGH_CTL_PATH_NEIGH 2
2747#define NEIGH_CTL_PATH_DEV 3
2748
2749 struct ctl_path neigh_path[] = {
Eric W. Biedermanf8572d82009-11-05 13:32:03 -08002750 { .procname = "net", },
2751 { .procname = "proto", },
2752 { .procname = "neigh", },
2753 { .procname = "default", },
Pavel Emelyanovc3bac5a2007-12-02 00:08:16 +11002754 { },
2755 };
Linus Torvalds1da177e2005-04-16 15:20:36 -07002756
Pavel Emelyanov3c607bb2007-12-02 00:06:34 +11002757 t = kmemdup(&neigh_sysctl_template, sizeof(*t), GFP_KERNEL);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002758 if (!t)
Pavel Emelyanov3c607bb2007-12-02 00:06:34 +11002759 goto err;
2760
Linus Torvalds1da177e2005-04-16 15:20:36 -07002761 t->neigh_vars[0].data = &p->mcast_probes;
2762 t->neigh_vars[1].data = &p->ucast_probes;
2763 t->neigh_vars[2].data = &p->app_probes;
2764 t->neigh_vars[3].data = &p->retrans_time;
2765 t->neigh_vars[4].data = &p->base_reachable_time;
2766 t->neigh_vars[5].data = &p->delay_probe_time;
2767 t->neigh_vars[6].data = &p->gc_staletime;
2768 t->neigh_vars[7].data = &p->queue_len;
2769 t->neigh_vars[8].data = &p->proxy_qlen;
2770 t->neigh_vars[9].data = &p->anycast_delay;
2771 t->neigh_vars[10].data = &p->proxy_delay;
2772 t->neigh_vars[11].data = &p->locktime;
Eric W. Biedermand12af672007-10-18 03:05:25 -07002773 t->neigh_vars[12].data = &p->retrans_time;
2774 t->neigh_vars[13].data = &p->base_reachable_time;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002775
2776 if (dev) {
2777 dev_name_source = dev->name;
Eric W. Biedermand12af672007-10-18 03:05:25 -07002778 /* Terminate the table early */
2779 memset(&t->neigh_vars[14], 0, sizeof(t->neigh_vars[14]));
Linus Torvalds1da177e2005-04-16 15:20:36 -07002780 } else {
Pavel Emelyanovc3bac5a2007-12-02 00:08:16 +11002781 dev_name_source = neigh_path[NEIGH_CTL_PATH_DEV].procname;
Eric W. Biedermand12af672007-10-18 03:05:25 -07002782 t->neigh_vars[14].data = (int *)(p + 1);
2783 t->neigh_vars[15].data = (int *)(p + 1) + 1;
2784 t->neigh_vars[16].data = (int *)(p + 1) + 2;
2785 t->neigh_vars[17].data = (int *)(p + 1) + 3;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002786 }
2787
Linus Torvalds1da177e2005-04-16 15:20:36 -07002788
Eric W. Biedermanf8572d82009-11-05 13:32:03 -08002789 if (handler) {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002790 /* RetransTime */
2791 t->neigh_vars[3].proc_handler = handler;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002792 t->neigh_vars[3].extra1 = dev;
2793 /* ReachableTime */
2794 t->neigh_vars[4].proc_handler = handler;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002795 t->neigh_vars[4].extra1 = dev;
2796 /* RetransTime (in milliseconds)*/
Eric W. Biedermand12af672007-10-18 03:05:25 -07002797 t->neigh_vars[12].proc_handler = handler;
Eric W. Biedermand12af672007-10-18 03:05:25 -07002798 t->neigh_vars[12].extra1 = dev;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002799 /* ReachableTime (in milliseconds) */
Eric W. Biedermand12af672007-10-18 03:05:25 -07002800 t->neigh_vars[13].proc_handler = handler;
Eric W. Biedermand12af672007-10-18 03:05:25 -07002801 t->neigh_vars[13].extra1 = dev;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002802 }
2803
Pavel Emelyanovc3bac5a2007-12-02 00:08:16 +11002804 t->dev_name = kstrdup(dev_name_source, GFP_KERNEL);
2805 if (!t->dev_name)
Linus Torvalds1da177e2005-04-16 15:20:36 -07002806 goto free;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002807
Pavel Emelyanovc3bac5a2007-12-02 00:08:16 +11002808 neigh_path[NEIGH_CTL_PATH_DEV].procname = t->dev_name;
Pavel Emelyanovc3bac5a2007-12-02 00:08:16 +11002809 neigh_path[NEIGH_CTL_PATH_PROTO].procname = p_name;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002810
Denis V. Lunev4ab438f2008-02-28 20:48:01 -08002811 t->sysctl_header =
YOSHIFUJI Hideaki57da52c2008-03-26 03:49:59 +09002812 register_net_sysctl_table(neigh_parms_net(p), neigh_path, t->neigh_vars);
Pavel Emelyanov3c607bb2007-12-02 00:06:34 +11002813 if (!t->sysctl_header)
Linus Torvalds1da177e2005-04-16 15:20:36 -07002814 goto free_procname;
Pavel Emelyanov3c607bb2007-12-02 00:06:34 +11002815
Linus Torvalds1da177e2005-04-16 15:20:36 -07002816 p->sysctl_table = t;
2817 return 0;
2818
Pavel Emelyanov3c607bb2007-12-02 00:06:34 +11002819free_procname:
Pavel Emelyanovc3bac5a2007-12-02 00:08:16 +11002820 kfree(t->dev_name);
Pavel Emelyanov3c607bb2007-12-02 00:06:34 +11002821free:
Linus Torvalds1da177e2005-04-16 15:20:36 -07002822 kfree(t);
Pavel Emelyanov3c607bb2007-12-02 00:06:34 +11002823err:
2824 return -ENOBUFS;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002825}
YOSHIFUJI Hideaki0a204502008-03-24 18:39:10 +09002826EXPORT_SYMBOL(neigh_sysctl_register);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002827
2828void neigh_sysctl_unregister(struct neigh_parms *p)
2829{
2830 if (p->sysctl_table) {
2831 struct neigh_sysctl_table *t = p->sysctl_table;
2832 p->sysctl_table = NULL;
2833 unregister_sysctl_table(t->sysctl_header);
Pavel Emelyanovc3bac5a2007-12-02 00:08:16 +11002834 kfree(t->dev_name);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002835 kfree(t);
2836 }
2837}
YOSHIFUJI Hideaki0a204502008-03-24 18:39:10 +09002838EXPORT_SYMBOL(neigh_sysctl_unregister);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002839
2840#endif /* CONFIG_SYSCTL */
2841
Thomas Grafc8822a42007-03-22 11:50:06 -07002842static int __init neigh_init(void)
2843{
Greg Rosec7ac8672011-06-10 01:27:09 +00002844 rtnl_register(PF_UNSPEC, RTM_NEWNEIGH, neigh_add, NULL, NULL);
2845 rtnl_register(PF_UNSPEC, RTM_DELNEIGH, neigh_delete, NULL, NULL);
2846 rtnl_register(PF_UNSPEC, RTM_GETNEIGH, NULL, neigh_dump_info, NULL);
Thomas Grafc8822a42007-03-22 11:50:06 -07002847
Greg Rosec7ac8672011-06-10 01:27:09 +00002848 rtnl_register(PF_UNSPEC, RTM_GETNEIGHTBL, NULL, neightbl_dump_info,
2849 NULL);
2850 rtnl_register(PF_UNSPEC, RTM_SETNEIGHTBL, neightbl_set, NULL, NULL);
Thomas Grafc8822a42007-03-22 11:50:06 -07002851
2852 return 0;
2853}
2854
2855subsys_initcall(neigh_init);
2856