allow coexistence of N build and AC build.
[tomato.git] / release / src-rt-6.x / linux / linux-2.6 / net / core / neighbour.c
/*
 *	Generic address resolution entity
 *
 *	Authors:
 *	Pedro Roque		<roque@di.fc.ul.pt>
 *	Alexey Kuznetsov	<kuznet@ms2.inr.ac.ru>
 *
 *	This program is free software; you can redistribute it and/or
 *	modify it under the terms of the GNU General Public License
 *	as published by the Free Software Foundation; either version
 *	2 of the License, or (at your option) any later version.
 *
 *	Fixes:
 *	Vitaly E. Lavrov	releasing NULL neighbor in neigh_add.
 *	Harald Welte		Add neighbour cache statistics like rtstat
 */
#include <linux/types.h>
#include <linux/kernel.h>
#include <linux/module.h>
#include <linux/socket.h>
#include <linux/netdevice.h>
#include <linux/proc_fs.h>
#ifdef CONFIG_SYSCTL
#include <linux/sysctl.h>
#endif
#include <linux/times.h>
#include <net/neighbour.h>
#include <net/dst.h>
#include <net/sock.h>
#include <net/netevent.h>
#include <net/netlink.h>
#include <linux/rtnetlink.h>
#include <linux/random.h>
#include <linux/string.h>

#define NEIGH_DEBUG 1

#define NEIGH_PRINTK(x...) printk(x)
#define NEIGH_NOPRINTK(x...) do { ; } while(0)
#define NEIGH_PRINTK0 NEIGH_PRINTK
#define NEIGH_PRINTK1 NEIGH_NOPRINTK
#define NEIGH_PRINTK2 NEIGH_NOPRINTK

#if NEIGH_DEBUG >= 1
#undef NEIGH_PRINTK1
#define NEIGH_PRINTK1 NEIGH_PRINTK
#endif
#if NEIGH_DEBUG >= 2
#undef NEIGH_PRINTK2
#define NEIGH_PRINTK2 NEIGH_PRINTK
#endif

#define PNEIGH_HASHMASK		0xF

static void neigh_timer_handler(unsigned long arg);
#ifdef CONFIG_ARPD
static void neigh_app_notify(struct neighbour *n);
#endif
static int pneigh_ifdown(struct neigh_table *tbl, struct net_device *dev);
void neigh_changeaddr(struct neigh_table *tbl, struct net_device *dev);

static struct neigh_table *neigh_tables;
#ifdef CONFIG_PROC_FS
static const struct file_operations neigh_stat_seq_fops;
#endif

/*
   Neighbour hash table buckets are protected with rwlock tbl->lock.

   - All the scans/updates to hash buckets MUST be made under this lock.
   - NOTHING clever should be made under this lock: no callbacks
     to protocol backends, no attempts to send something to network.
     It will result in deadlocks, if backend/driver wants to use neighbour
     cache.
   - If the entry requires some non-trivial actions, increase
     its reference count and release table lock.

   Neighbour entries are protected:
   - with reference count.
   - with rwlock neigh->lock

   Reference count prevents destruction.

   neigh->lock mainly serializes ll address data and its validity state.
   However, the same lock is used to protect another entry fields:
    - timer
    - resolution queue

   Again, nothing clever shall be made under neigh->lock,
   the most complicated procedure, which we allow is dev->hard_header.
   It is supposed, that dev->hard_header is simplistic and does
   not make callbacks to neighbour tables.

   The last lock is neigh_tbl_lock. It is pure SMP lock, protecting
   list of neighbour tables. This list is used only in process context,
 */
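/*
 * Illustrative sketch of the reference-count rule above (not called
 * anywhere); this is the pattern neigh_lookup() and its callers follow:
 *
 *	read_lock_bh(&tbl->lock);
 *	n = tbl->hash_buckets[hash_val & tbl->hash_mask];  ...scan chain...
 *	neigh_hold(n);			take a reference under the lock
 *	read_unlock_bh(&tbl->lock);
 *	...now safe to call into drivers or send packets...
 *	neigh_release(n);		drop the reference when done
 */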
static DEFINE_RWLOCK(neigh_tbl_lock);

static int neigh_blackhole(struct sk_buff *skb)
{
	kfree_skb(skb);
	return -ENETDOWN;
}

static void neigh_cleanup_and_release(struct neighbour *neigh)
{
	if (neigh->parms->neigh_cleanup)
		neigh->parms->neigh_cleanup(neigh);

	neigh_release(neigh);
}
/*
 * Returns a value randomly distributed in the interval
 * (1/2)*base...(3/2)*base. It corresponds to the default IPv6 settings
 * and is not overridable, because it is a really reasonable choice.
 */

unsigned long neigh_rand_reach_time(unsigned long base)
{
	return (base ? (net_random() % base) + (base >> 1) : 0);
}
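/*
 * Example: with base = 30 * HZ the result is uniformly distributed in
 * [15 * HZ, 45 * HZ), so ReachableTime averages base while staying
 * randomized.
 */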
static int neigh_forced_gc(struct neigh_table *tbl)
{
	int shrunk = 0;
	int i;

	NEIGH_CACHE_STAT_INC(tbl, forced_gc_runs);

	write_lock_bh(&tbl->lock);
	for (i = 0; i <= tbl->hash_mask; i++) {
		struct neighbour *n, **np;

		np = &tbl->hash_buckets[i];
		while ((n = *np) != NULL) {
			/* Neighbour record may be discarded if:
			 * - nobody refers to it.
			 * - it is not permanent
			 */
			write_lock(&n->lock);
			if (atomic_read(&n->refcnt) == 1 &&
			    !(n->nud_state & NUD_PERMANENT)) {
				*np = n->next;
				n->dead = 1;
				shrunk = 1;
				write_unlock(&n->lock);
				neigh_cleanup_and_release(n);
				continue;
			}
			write_unlock(&n->lock);
			np = &n->next;
		}
	}

	tbl->last_flush = jiffies;

	write_unlock_bh(&tbl->lock);

	return shrunk;
}

static int neigh_del_timer(struct neighbour *n)
{
	if ((n->nud_state & NUD_IN_TIMER) &&
	    del_timer(&n->timer)) {
		neigh_release(n);
		return 1;
	}
	return 0;
}

static void pneigh_queue_purge(struct sk_buff_head *list)
{
	struct sk_buff *skb;

	while ((skb = skb_dequeue(list)) != NULL) {
		dev_put(skb->dev);
		kfree_skb(skb);
	}
}

static void neigh_flush_dev(struct neigh_table *tbl, struct net_device *dev)
{
	int i;

	for (i = 0; i <= tbl->hash_mask; i++) {
		struct neighbour *n, **np = &tbl->hash_buckets[i];

		while ((n = *np) != NULL) {
			if (dev && n->dev != dev) {
				np = &n->next;
				continue;
			}
			*np = n->next;
			write_lock(&n->lock);
			neigh_del_timer(n);
			n->dead = 1;

			if (atomic_read(&n->refcnt) != 1) {
				/* The most unpleasant situation.
				   We must destroy neighbour entry,
				   but someone still uses it.

				   The destroy will be delayed until
				   the last user releases us, but
				   we must kill timers etc. and move
				   it to safe state.
				 */
				skb_queue_purge(&n->arp_queue);
				n->output = neigh_blackhole;
				if (n->nud_state & NUD_VALID)
					n->nud_state = NUD_NOARP;
				else
					n->nud_state = NUD_NONE;
				NEIGH_PRINTK2("neigh %p is stray.\n", n);
			}
			write_unlock(&n->lock);
			neigh_cleanup_and_release(n);
		}
	}
}

void neigh_changeaddr(struct neigh_table *tbl, struct net_device *dev)
{
	write_lock_bh(&tbl->lock);
	neigh_flush_dev(tbl, dev);
	write_unlock_bh(&tbl->lock);
}

int neigh_ifdown(struct neigh_table *tbl, struct net_device *dev)
{
	write_lock_bh(&tbl->lock);
	neigh_flush_dev(tbl, dev);
	pneigh_ifdown(tbl, dev);
	write_unlock_bh(&tbl->lock);

	del_timer_sync(&tbl->proxy_timer);
	pneigh_queue_purge(&tbl->proxy_queue);
	return 0;
}

static struct neighbour *neigh_alloc(struct neigh_table *tbl)
{
	struct neighbour *n = NULL;
	unsigned long now = jiffies;
	int entries;

	entries = atomic_inc_return(&tbl->entries) - 1;
	if (entries >= tbl->gc_thresh3 ||
	    (entries >= tbl->gc_thresh2 &&
	     time_after(now, tbl->last_flush + 5 * HZ))) {
		if (!neigh_forced_gc(tbl) &&
		    entries >= tbl->gc_thresh3)
			goto out_entries;
	}

	n = kmem_cache_zalloc(tbl->kmem_cachep, GFP_ATOMIC);
	if (!n)
		goto out_entries;

	skb_queue_head_init(&n->arp_queue);
	rwlock_init(&n->lock);
	n->updated = n->used = now;
	n->nud_state = NUD_NONE;
	n->output = neigh_blackhole;
	n->parms = neigh_parms_clone(&tbl->parms);
	init_timer(&n->timer);
	n->timer.function = neigh_timer_handler;
	n->timer.data = (unsigned long)n;

	NEIGH_CACHE_STAT_INC(tbl, allocs);
	n->tbl = tbl;
	atomic_set(&n->refcnt, 1);
	n->dead = 1;
out:
	return n;

out_entries:
	atomic_dec(&tbl->entries);
	goto out;
}
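/*
 * Note on the thresholds used above: below gc_thresh2 entries are created
 * freely; between gc_thresh2 and gc_thresh3 a forced GC runs first when
 * the last flush was more than 5 seconds ago; at gc_thresh3 and above the
 * allocation fails unless the forced GC manages to evict something.
 */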
static struct neighbour **neigh_hash_alloc(unsigned int entries)
{
	unsigned long size = entries * sizeof(struct neighbour *);
	struct neighbour **ret;

	if (size <= PAGE_SIZE) {
		ret = kzalloc(size, GFP_ATOMIC);
	} else {
		ret = (struct neighbour **)
		      __get_free_pages(GFP_ATOMIC|__GFP_ZERO, get_order(size));
	}
	return ret;
}

static void neigh_hash_free(struct neighbour **hash, unsigned int entries)
{
	unsigned long size = entries * sizeof(struct neighbour *);

	if (size <= PAGE_SIZE)
		kfree(hash);
	else
		free_pages((unsigned long)hash, get_order(size));
}

static void neigh_hash_grow(struct neigh_table *tbl, unsigned long new_entries)
{
	struct neighbour **new_hash, **old_hash;
	unsigned int i, new_hash_mask, old_entries;

	NEIGH_CACHE_STAT_INC(tbl, hash_grows);

	BUG_ON(new_entries & (new_entries - 1));
	new_hash = neigh_hash_alloc(new_entries);
	if (!new_hash)
		return;

	old_entries = tbl->hash_mask + 1;
	new_hash_mask = new_entries - 1;
	old_hash = tbl->hash_buckets;

	get_random_bytes(&tbl->hash_rnd, sizeof(tbl->hash_rnd));
	for (i = 0; i < old_entries; i++) {
		struct neighbour *n, *next;

		for (n = old_hash[i]; n; n = next) {
			unsigned int hash_val = tbl->hash(n->primary_key, n->dev);

			hash_val &= new_hash_mask;
			next = n->next;

			n->next = new_hash[hash_val];
			new_hash[hash_val] = n;
		}
	}
	tbl->hash_buckets = new_hash;
	tbl->hash_mask = new_hash_mask;

	neigh_hash_free(old_hash, old_entries);
}
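/*
 * The table always grows by powers of two (enforced by the BUG_ON above),
 * so the chain index is simply hash & new_hash_mask. hash_rnd is reseeded
 * on every grow, which also redistributes entries whose keys happened to
 * collide under the old seed.
 */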
struct neighbour *neigh_lookup(struct neigh_table *tbl, const void *pkey,
			       struct net_device *dev)
{
	struct neighbour *n;
	int key_len = tbl->key_len;
	u32 hash_val = tbl->hash(pkey, dev);

	NEIGH_CACHE_STAT_INC(tbl, lookups);

	read_lock_bh(&tbl->lock);
	for (n = tbl->hash_buckets[hash_val & tbl->hash_mask]; n; n = n->next) {
		if (dev == n->dev && !memcmp(n->primary_key, pkey, key_len)) {
			neigh_hold(n);
			NEIGH_CACHE_STAT_INC(tbl, hits);
			break;
		}
	}
	read_unlock_bh(&tbl->lock);
	return n;
}

struct neighbour *neigh_lookup_nodev(struct neigh_table *tbl, const void *pkey)
{
	struct neighbour *n;
	int key_len = tbl->key_len;
	u32 hash_val = tbl->hash(pkey, NULL);

	NEIGH_CACHE_STAT_INC(tbl, lookups);

	read_lock_bh(&tbl->lock);
	for (n = tbl->hash_buckets[hash_val & tbl->hash_mask]; n; n = n->next) {
		if (!memcmp(n->primary_key, pkey, key_len)) {
			neigh_hold(n);
			NEIGH_CACHE_STAT_INC(tbl, hits);
			break;
		}
	}
	read_unlock_bh(&tbl->lock);
	return n;
}

struct neighbour *neigh_create(struct neigh_table *tbl, const void *pkey,
			       struct net_device *dev)
{
	u32 hash_val;
	int key_len = tbl->key_len;
	int error;
	struct neighbour *n1, *rc, *n = neigh_alloc(tbl);

	if (!n) {
		rc = ERR_PTR(-ENOBUFS);
		goto out;
	}

	memcpy(n->primary_key, pkey, key_len);
	n->dev = dev;
	dev_hold(dev);

	/* Protocol specific setup. */
	if (tbl->constructor && (error = tbl->constructor(n)) < 0) {
		rc = ERR_PTR(error);
		goto out_neigh_release;
	}

	/* Device specific setup. */
	if (n->parms->neigh_setup &&
	    (error = n->parms->neigh_setup(n)) < 0) {
		rc = ERR_PTR(error);
		goto out_neigh_release;
	}

	n->confirmed = jiffies - (n->parms->base_reachable_time << 1);

	write_lock_bh(&tbl->lock);

	if (atomic_read(&tbl->entries) > (tbl->hash_mask + 1))
		neigh_hash_grow(tbl, (tbl->hash_mask + 1) << 1);

	hash_val = tbl->hash(pkey, dev) & tbl->hash_mask;

	if (n->parms->dead) {
		rc = ERR_PTR(-EINVAL);
		goto out_tbl_unlock;
	}

	for (n1 = tbl->hash_buckets[hash_val]; n1; n1 = n1->next) {
		if (dev == n1->dev && !memcmp(n1->primary_key, pkey, key_len)) {
			neigh_hold(n1);
			rc = n1;
			goto out_tbl_unlock;
		}
	}

	n->next = tbl->hash_buckets[hash_val];
	tbl->hash_buckets[hash_val] = n;
	n->dead = 0;
	neigh_hold(n);
	write_unlock_bh(&tbl->lock);
	NEIGH_PRINTK2("neigh %p is created.\n", n);
	rc = n;
out:
	return rc;
out_tbl_unlock:
	write_unlock_bh(&tbl->lock);
out_neigh_release:
	neigh_release(n);
	goto out;
}
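/*
 * Note the second chain walk in neigh_create(), done after taking
 * tbl->lock as a writer: a concurrent neigh_create() for the same key may
 * have won the race while the constructors ran unlocked, in which case
 * the fresh entry is released and the existing one returned instead.
 */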
struct pneigh_entry * pneigh_lookup(struct neigh_table *tbl, const void *pkey,
				    struct net_device *dev, int creat)
{
	struct pneigh_entry *n;
	int key_len = tbl->key_len;
	u32 hash_val = *(u32 *)(pkey + key_len - 4);

	hash_val ^= (hash_val >> 16);
	hash_val ^= hash_val >> 8;
	hash_val ^= hash_val >> 4;
	hash_val &= PNEIGH_HASHMASK;

	read_lock_bh(&tbl->lock);

	for (n = tbl->phash_buckets[hash_val]; n; n = n->next) {
		if (!memcmp(n->key, pkey, key_len) &&
		    (n->dev == dev || !n->dev)) {
			read_unlock_bh(&tbl->lock);
			goto out;
		}
	}
	read_unlock_bh(&tbl->lock);
	n = NULL;
	if (!creat)
		goto out;

	n = kmalloc(sizeof(*n) + key_len, GFP_KERNEL);
	if (!n)
		goto out;

	memcpy(n->key, pkey, key_len);
	n->dev = dev;
	if (dev)
		dev_hold(dev);

	if (tbl->pconstructor && tbl->pconstructor(n)) {
		if (dev)
			dev_put(dev);
		kfree(n);
		n = NULL;
		goto out;
	}

	write_lock_bh(&tbl->lock);
	n->next = tbl->phash_buckets[hash_val];
	tbl->phash_buckets[hash_val] = n;
	write_unlock_bh(&tbl->lock);
out:
	return n;
}
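/*
 * The proxy hash above folds the last four bytes of the key with xor
 * shifts down to 4 bits (PNEIGH_HASHMASK is 0xF): a deliberately small
 * table, since proxy entries are normally few.
 */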
int pneigh_delete(struct neigh_table *tbl, const void *pkey,
		  struct net_device *dev)
{
	struct pneigh_entry *n, **np;
	int key_len = tbl->key_len;
	u32 hash_val = *(u32 *)(pkey + key_len - 4);

	hash_val ^= (hash_val >> 16);
	hash_val ^= hash_val >> 8;
	hash_val ^= hash_val >> 4;
	hash_val &= PNEIGH_HASHMASK;

	write_lock_bh(&tbl->lock);
	for (np = &tbl->phash_buckets[hash_val]; (n = *np) != NULL;
	     np = &n->next) {
		if (!memcmp(n->key, pkey, key_len) && n->dev == dev) {
			*np = n->next;
			write_unlock_bh(&tbl->lock);
			if (tbl->pdestructor)
				tbl->pdestructor(n);
			if (n->dev)
				dev_put(n->dev);
			kfree(n);
			return 0;
		}
	}
	write_unlock_bh(&tbl->lock);
	return -ENOENT;
}

static int pneigh_ifdown(struct neigh_table *tbl, struct net_device *dev)
{
	struct pneigh_entry *n, **np;
	u32 h;

	for (h = 0; h <= PNEIGH_HASHMASK; h++) {
		np = &tbl->phash_buckets[h];
		while ((n = *np) != NULL) {
			if (!dev || n->dev == dev) {
				*np = n->next;
				if (tbl->pdestructor)
					tbl->pdestructor(n);
				if (n->dev)
					dev_put(n->dev);
				kfree(n);
				continue;
			}
			np = &n->next;
		}
	}
	return -ENOENT;
}

/*
 *	neighbour must already be out of the table;
 *
 */
void neigh_destroy(struct neighbour *neigh)
{
	struct hh_cache *hh;

	NEIGH_CACHE_STAT_INC(neigh->tbl, destroys);

	if (!neigh->dead) {
		printk(KERN_WARNING
		       "Destroying alive neighbour %p\n", neigh);
		dump_stack();
		return;
	}

	if (neigh_del_timer(neigh))
		printk(KERN_WARNING "Impossible event.\n");

	while ((hh = neigh->hh) != NULL) {
		neigh->hh = hh->hh_next;
		hh->hh_next = NULL;

		write_seqlock_bh(&hh->hh_lock);
		hh->hh_output = neigh_blackhole;
		write_sequnlock_bh(&hh->hh_lock);
		if (atomic_dec_and_test(&hh->hh_refcnt))
			kfree(hh);
	}

	skb_queue_purge(&neigh->arp_queue);

	dev_put(neigh->dev);
	neigh_parms_put(neigh->parms);

	NEIGH_PRINTK2("neigh %p is destroyed.\n", neigh);

	atomic_dec(&neigh->tbl->entries);
	kmem_cache_free(neigh->tbl->kmem_cachep, neigh);
}

/* Neighbour state is suspicious;
   disable fast path.

   Called with write_locked neigh.
 */
static void neigh_suspect(struct neighbour *neigh)
{
	struct hh_cache *hh;

	NEIGH_PRINTK2("neigh %p is suspected.\n", neigh);

	neigh->output = neigh->ops->output;

	for (hh = neigh->hh; hh; hh = hh->hh_next)
		hh->hh_output = neigh->ops->output;
}

/* Neighbour state is OK;
   enable fast path.

   Called with write_locked neigh.
 */
static void neigh_connect(struct neighbour *neigh)
{
	struct hh_cache *hh;

	NEIGH_PRINTK2("neigh %p is connected.\n", neigh);

	neigh->output = neigh->ops->connected_output;

	for (hh = neigh->hh; hh; hh = hh->hh_next)
		hh->hh_output = neigh->ops->hh_output;
}
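/*
 * neigh_suspect() and neigh_connect() simply flip every output hook of
 * the entry, including its cached hardware headers, between the slow
 * verifying path (ops->output) and the fast path (ops->connected_output
 * and ops->hh_output); packets keep flowing either way.
 */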
static void neigh_periodic_work(struct work_struct *work)
{
	struct neigh_table *tbl = container_of(work, struct neigh_table, gc_work.work);
	struct neighbour *n, **np;
	unsigned int i;

	NEIGH_CACHE_STAT_INC(tbl, periodic_gc_runs);

	write_lock_bh(&tbl->lock);

	/*
	 *	periodically recompute ReachableTime from random function
	 */

	if (time_after(jiffies, tbl->last_rand + 300 * HZ)) {
		struct neigh_parms *p;
		tbl->last_rand = jiffies;
		for (p = &tbl->parms; p; p = p->next)
			p->reachable_time =
				neigh_rand_reach_time(p->base_reachable_time);
	}

	for (i = 0 ; i <= tbl->hash_mask; i++) {
		np = &tbl->hash_buckets[i];

		while ((n = *np) != NULL) {
			unsigned int state;

			write_lock(&n->lock);

			state = n->nud_state;
			if (state & (NUD_PERMANENT | NUD_IN_TIMER)) {
				write_unlock(&n->lock);
				goto next_elt;
			}

			if (time_before(n->used, n->confirmed))
				n->used = n->confirmed;

			if (atomic_read(&n->refcnt) == 1 &&
			    (state == NUD_FAILED ||
			     time_after(jiffies, n->used + n->parms->gc_staletime))) {
				*np = n->next;
				n->dead = 1;
				write_unlock(&n->lock);
				neigh_cleanup_and_release(n);
				continue;
			}
			write_unlock(&n->lock);

next_elt:
			np = &n->next;
		}
		/*
		 * It's fine to release lock here, even if hash table
		 * grows while we are preempted.
		 */
		write_unlock_bh(&tbl->lock);
		cond_resched();
		write_lock_bh(&tbl->lock);
	}
	/* Cycle through all hash buckets every base_reachable_time/2 ticks.
	 * ARP entry timeouts range from 1/2 base_reachable_time to 3/2
	 * base_reachable_time.
	 */
	schedule_delayed_work(&tbl->gc_work,
			      tbl->parms.base_reachable_time >> 1);
	write_unlock_bh(&tbl->lock);
}

static __inline__ int neigh_max_probes(struct neighbour *n)
{
	struct neigh_parms *p = n->parms;
	return (n->nud_state & NUD_PROBE ?
		p->ucast_probes :
		p->ucast_probes + p->app_probes + p->mcast_probes);
}

static inline void neigh_add_timer(struct neighbour *n, unsigned long when)
{
	if (unlikely(mod_timer(&n->timer, when))) {
		printk("NEIGH: BUG, double timer add, state is %x\n",
		       n->nud_state);
		dump_stack();
	}
}
/* Called when a timer expires for a neighbour entry. */

static void neigh_timer_handler(unsigned long arg)
{
	unsigned long now, next;
	struct neighbour *neigh = (struct neighbour *)arg;
	unsigned state;
	int notify = 0;

	write_lock(&neigh->lock);

	state = neigh->nud_state;
	now = jiffies;
	next = now + HZ;

	if (!(state & NUD_IN_TIMER)) {
#ifndef CONFIG_SMP
		printk(KERN_WARNING "neigh: timer & !nud_in_timer\n");
#endif
		goto out;
	}

	if (state & NUD_REACHABLE) {
		if (time_before_eq(now,
				   neigh->confirmed + neigh->parms->reachable_time)) {
			NEIGH_PRINTK2("neigh %p is still alive.\n", neigh);
			next = neigh->confirmed + neigh->parms->reachable_time;
		} else if (time_before_eq(now,
					  neigh->used + neigh->parms->delay_probe_time)) {
			NEIGH_PRINTK2("neigh %p is delayed.\n", neigh);
			neigh->nud_state = NUD_DELAY;
			neigh->updated = jiffies;
			neigh_suspect(neigh);
			next = now + neigh->parms->delay_probe_time;
		} else {
			NEIGH_PRINTK2("neigh %p is suspected.\n", neigh);
			neigh->nud_state = NUD_STALE;
			neigh->updated = jiffies;
			neigh_suspect(neigh);
			notify = 1;
		}
	} else if (state & NUD_DELAY) {
		if (time_before_eq(now,
				   neigh->confirmed + neigh->parms->delay_probe_time)) {
			NEIGH_PRINTK2("neigh %p is now reachable.\n", neigh);
			neigh->nud_state = NUD_REACHABLE;
			neigh->updated = jiffies;
			neigh_connect(neigh);
			notify = 1;
			next = neigh->confirmed + neigh->parms->reachable_time;
		} else {
			NEIGH_PRINTK2("neigh %p is probed.\n", neigh);
			neigh->nud_state = NUD_PROBE;
			neigh->updated = jiffies;
			atomic_set(&neigh->probes, 0);
			next = now + neigh->parms->retrans_time;
		}
	} else {
		/* NUD_PROBE|NUD_INCOMPLETE */
		next = now + neigh->parms->retrans_time;
	}

	if ((neigh->nud_state & (NUD_INCOMPLETE | NUD_PROBE)) &&
	    atomic_read(&neigh->probes) >= neigh_max_probes(neigh)) {
		struct sk_buff *skb;

		neigh->nud_state = NUD_FAILED;
		neigh->updated = jiffies;
		notify = 1;
		NEIGH_CACHE_STAT_INC(neigh->tbl, res_failed);
		NEIGH_PRINTK2("neigh %p is failed.\n", neigh);

		/* This is a delicate place. error_report() is a very
		   complicated routine. In particular, it can hit the same
		   neighbour entry!

		   So we try to be careful here and avoid a dead loop. --ANK
		 */
		while (neigh->nud_state == NUD_FAILED &&
		       (skb = __skb_dequeue(&neigh->arp_queue)) != NULL) {
			write_unlock(&neigh->lock);
			neigh->ops->error_report(neigh, skb);
			write_lock(&neigh->lock);
		}
		skb_queue_purge(&neigh->arp_queue);
	}

	if (neigh->nud_state & NUD_IN_TIMER) {
		if (time_before(next, jiffies + HZ/2))
			next = jiffies + HZ/2;
		if (!mod_timer(&neigh->timer, next))
			neigh_hold(neigh);
	}
	if (neigh->nud_state & (NUD_INCOMPLETE | NUD_PROBE)) {
		struct sk_buff *skb = skb_peek(&neigh->arp_queue);
		/* keep skb alive even if arp_queue overflows */
		if (skb)
			skb_get(skb);
		write_unlock(&neigh->lock);
		neigh->ops->solicit(neigh, skb);
		atomic_inc(&neigh->probes);
		if (skb)
			kfree_skb(skb);
	} else {
out:
		write_unlock(&neigh->lock);
	}

	if (notify)
		call_netevent_notifiers(NETEVENT_NEIGH_UPDATE, neigh);
#ifdef CONFIG_ARPD
	if (notify && neigh->parms->app_probes)
		neigh_app_notify(neigh);
#endif
	neigh_release(neigh);
}
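/*
 * Summary of the transitions driven by the handler above:
 * NUD_REACHABLE confirms itself or decays via NUD_DELAY to NUD_STALE;
 * NUD_DELAY either returns to NUD_REACHABLE on a fresh confirmation or
 * escalates to NUD_PROBE; NUD_PROBE/NUD_INCOMPLETE retransmit solicits
 * until neigh_max_probes() is exceeded, after which the entry goes
 * NUD_FAILED and any queued packets get error reports.
 */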
int __neigh_event_send(struct neighbour *neigh, struct sk_buff *skb)
{
	int rc;
	unsigned long now;

	write_lock_bh(&neigh->lock);

	rc = 0;
	if (neigh->nud_state & (NUD_CONNECTED | NUD_DELAY | NUD_PROBE))
		goto out_unlock_bh;

	now = jiffies;

	if (!(neigh->nud_state & (NUD_STALE | NUD_INCOMPLETE))) {
		if (neigh->parms->mcast_probes + neigh->parms->app_probes) {
			atomic_set(&neigh->probes, neigh->parms->ucast_probes);
			neigh->nud_state = NUD_INCOMPLETE;
			neigh->updated = jiffies;
			neigh_hold(neigh);
			neigh_add_timer(neigh, now + 1);
		} else {
			neigh->nud_state = NUD_FAILED;
			neigh->updated = jiffies;
			write_unlock_bh(&neigh->lock);

			if (skb)
				kfree_skb(skb);
			return 1;
		}
	} else if (neigh->nud_state & NUD_STALE) {
		NEIGH_PRINTK2("neigh %p is delayed.\n", neigh);
		neigh_hold(neigh);
		neigh->nud_state = NUD_DELAY;
		neigh->updated = jiffies;
		neigh_add_timer(neigh,
				jiffies + neigh->parms->delay_probe_time);
	}

	if (neigh->nud_state == NUD_INCOMPLETE) {
		if (skb) {
			if (skb_queue_len(&neigh->arp_queue) >=
			    neigh->parms->queue_len) {
				struct sk_buff *buff;
				buff = neigh->arp_queue.next;
				__skb_unlink(buff, &neigh->arp_queue);
				kfree_skb(buff);
			}
			__skb_queue_tail(&neigh->arp_queue, skb);
		}
		rc = 1;
	}
out_unlock_bh:
	write_unlock_bh(&neigh->lock);
	return rc;
}

static void neigh_update_hhs(struct neighbour *neigh)
{
	struct hh_cache *hh;
	void (*update)(struct hh_cache*, struct net_device*, unsigned char *) =
		neigh->dev->header_cache_update;

	if (update) {
		for (hh = neigh->hh; hh; hh = hh->hh_next) {
			write_seqlock_bh(&hh->hh_lock);
			update(hh, neigh->dev, neigh->ha);
			write_sequnlock_bh(&hh->hh_lock);
		}
	}
}
/* Generic update routine.
   -- lladdr is the new lladdr or NULL, if it is not supplied.
   -- new    is the new state.
   -- flags
	NEIGH_UPDATE_F_OVERRIDE allows overriding an existing lladdr,
				if it is different.
	NEIGH_UPDATE_F_WEAK_OVERRIDE will suspect an existing "connected"
				lladdr instead of overriding it
				if it is different.
				It also allows retaining the current state
				if lladdr is unchanged.
	NEIGH_UPDATE_F_ADMIN	means that the change is administrative.

	NEIGH_UPDATE_F_OVERRIDE_ISROUTER allows overriding an existing
				NTF_ROUTER flag.
	NEIGH_UPDATE_F_ISROUTER	indicates if the neighbour is known as
				a router.

   Caller MUST hold a reference count on the entry.
 */
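/*
 * For example, the netlink handlers later in this file administratively
 * replace an entry with
 *	neigh_update(neigh, lladdr, ndm->ndm_state,
 *		     NEIGH_UPDATE_F_OVERRIDE | NEIGH_UPDATE_F_ADMIN);
 * and kill one with
 *	neigh_update(neigh, NULL, NUD_FAILED,
 *		     NEIGH_UPDATE_F_OVERRIDE | NEIGH_UPDATE_F_ADMIN);
 */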
int neigh_update(struct neighbour *neigh, const u8 *lladdr, u8 new,
		 u32 flags)
{
	u8 old;
	int err;
	int notify = 0;
	struct net_device *dev;
	int update_isrouter = 0;

	write_lock_bh(&neigh->lock);

	dev = neigh->dev;
	old = neigh->nud_state;
	err = -EPERM;

	if (!(flags & NEIGH_UPDATE_F_ADMIN) &&
	    (old & (NUD_NOARP | NUD_PERMANENT)))
		goto out;

	if (!(new & NUD_VALID)) {
		neigh_del_timer(neigh);
		if (old & NUD_CONNECTED)
			neigh_suspect(neigh);
		neigh->nud_state = new;
		err = 0;
		notify = old & NUD_VALID;
		goto out;
	}

	/* Compare new lladdr with cached one */
	if (!dev->addr_len) {
		/* First case: device needs no address. */
		lladdr = neigh->ha;
	} else if (lladdr) {
		/* The second case: if something is already cached
		   and a new address is proposed:
		   - compare new & old
		   - if they are different, check override flag
		 */
		if ((old & NUD_VALID) &&
		    !memcmp(lladdr, neigh->ha, dev->addr_len))
			lladdr = neigh->ha;
	} else {
		/* No address is supplied; if we know something,
		   use it, otherwise discard the request.
		 */
		err = -EINVAL;
		if (!(old & NUD_VALID))
			goto out;
		lladdr = neigh->ha;
	}

	if (new & NUD_CONNECTED)
		neigh->confirmed = jiffies;
	neigh->updated = jiffies;

	/* If entry was valid and address is not changed,
	   do not change entry state, if new one is STALE.
	 */
	err = 0;
	update_isrouter = flags & NEIGH_UPDATE_F_OVERRIDE_ISROUTER;
	if (old & NUD_VALID) {
		if (lladdr != neigh->ha && !(flags & NEIGH_UPDATE_F_OVERRIDE)) {
			update_isrouter = 0;
			if ((flags & NEIGH_UPDATE_F_WEAK_OVERRIDE) &&
			    (old & NUD_CONNECTED)) {
				lladdr = neigh->ha;
				new = NUD_STALE;
			} else
				goto out;
		} else {
			if (lladdr == neigh->ha && new == NUD_STALE &&
			    ((flags & NEIGH_UPDATE_F_WEAK_OVERRIDE) ||
			     (old & NUD_CONNECTED))
			    )
				new = old;
		}
	}

	if (new != old) {
		neigh_del_timer(neigh);
		if (new & NUD_IN_TIMER) {
			neigh_hold(neigh);
			neigh_add_timer(neigh, (jiffies +
						((new & NUD_REACHABLE) ?
						 neigh->parms->reachable_time :
						 0)));
		}
		neigh->nud_state = new;
	}

	if (lladdr != neigh->ha) {
		memcpy(&neigh->ha, lladdr, dev->addr_len);
		neigh_update_hhs(neigh);
		if (!(new & NUD_CONNECTED))
			neigh->confirmed = jiffies -
				      (neigh->parms->base_reachable_time << 1);
		notify = 1;
	}
	if (new == old)
		goto out;
	if (new & NUD_CONNECTED)
		neigh_connect(neigh);
	else
		neigh_suspect(neigh);
	if (!(old & NUD_VALID)) {
		struct sk_buff *skb;

		/* Again: avoid dead loop if something went wrong */

		while (neigh->nud_state & NUD_VALID &&
		       (skb = __skb_dequeue(&neigh->arp_queue)) != NULL) {
			struct neighbour *n1 = neigh;
			write_unlock_bh(&neigh->lock);
			/* On shaper/eql skb->dst->neighbour != neigh :( */
			if (skb->dst && skb->dst->neighbour)
				n1 = skb->dst->neighbour;
			n1->output(skb);
			write_lock_bh(&neigh->lock);
		}
		skb_queue_purge(&neigh->arp_queue);
	}
out:
	if (update_isrouter) {
		neigh->flags = (flags & NEIGH_UPDATE_F_ISROUTER) ?
			(neigh->flags | NTF_ROUTER) :
			(neigh->flags & ~NTF_ROUTER);
	}
	write_unlock_bh(&neigh->lock);

	if (notify)
		call_netevent_notifiers(NETEVENT_NEIGH_UPDATE, neigh);
#ifdef CONFIG_ARPD
	if (notify && neigh->parms->app_probes)
		neigh_app_notify(neigh);
#endif
	return err;
}
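/*
 * Note that the arp_queue flush above drops neigh->lock around each
 * n1->output(skb) call: the output path may itself take the lock (or
 * resolve through a different neighbour on shaper/eql), so holding the
 * lock across the callback could deadlock.
 */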
struct neighbour *neigh_event_ns(struct neigh_table *tbl,
				 u8 *lladdr, void *saddr,
				 struct net_device *dev)
{
	struct neighbour *neigh = __neigh_lookup(tbl, saddr, dev,
						 lladdr || !dev->addr_len);
	if (neigh)
		neigh_update(neigh, lladdr, NUD_STALE,
			     NEIGH_UPDATE_F_OVERRIDE);
	return neigh;
}

static void neigh_hh_init(struct neighbour *n, struct dst_entry *dst,
			  __be16 protocol)
{
	struct hh_cache *hh;
	struct net_device *dev = dst->dev;

	for (hh = n->hh; hh; hh = hh->hh_next)
		if (hh->hh_type == protocol)
			break;

	if (!hh && (hh = kzalloc(sizeof(*hh), GFP_ATOMIC)) != NULL) {
		seqlock_init(&hh->hh_lock);
		hh->hh_type = protocol;
		atomic_set(&hh->hh_refcnt, 0);
		hh->hh_next = NULL;
		if (dev->hard_header_cache(n, hh)) {
			kfree(hh);
			hh = NULL;
		} else {
			atomic_inc(&hh->hh_refcnt);
			hh->hh_next = n->hh;
			n->hh = hh;
			if (n->nud_state & NUD_CONNECTED)
				hh->hh_output = n->ops->hh_output;
			else
				hh->hh_output = n->ops->output;
		}
	}
	if (hh) {
		atomic_inc(&hh->hh_refcnt);
		dst->hh = hh;
	}
}

/* This function can be used in contexts, where only old dev_queue_xmit
   worked, f.e. if you want to override normal output path (eql, shaper),
   but resolution is not made yet.
 */

int neigh_compat_output(struct sk_buff *skb)
{
	struct net_device *dev = skb->dev;

	__skb_pull(skb, skb_network_offset(skb));

	if (dev->hard_header &&
	    dev->hard_header(skb, dev, ntohs(skb->protocol), NULL, NULL,
			     skb->len) < 0 &&
	    dev->rebuild_header(skb))
		return 0;

	return dev_queue_xmit(skb);
}

/* Slow and careful. */

int neigh_resolve_output(struct sk_buff *skb)
{
	struct dst_entry *dst = skb->dst;
	struct neighbour *neigh;
	int rc = 0;

	if (!dst || !(neigh = dst->neighbour))
		goto discard;

	__skb_pull(skb, skb_network_offset(skb));

	if (!neigh_event_send(neigh, skb)) {
		int err;
		struct net_device *dev = neigh->dev;
		if (dev->hard_header_cache && !dst->hh) {
			write_lock_bh(&neigh->lock);
			if (!dst->hh)
				neigh_hh_init(neigh, dst, dst->ops->protocol);
			err = dev->hard_header(skb, dev, ntohs(skb->protocol),
					       neigh->ha, NULL, skb->len);
			write_unlock_bh(&neigh->lock);
		} else {
			read_lock_bh(&neigh->lock);
			err = dev->hard_header(skb, dev, ntohs(skb->protocol),
					       neigh->ha, NULL, skb->len);
			read_unlock_bh(&neigh->lock);
		}
		if (err >= 0)
			rc = neigh->ops->queue_xmit(skb);
		else
			goto out_kfree_skb;
	}
out:
	return rc;
discard:
	NEIGH_PRINTK1("neigh_resolve_output: dst=%p neigh=%p\n",
		      dst, dst ? dst->neighbour : NULL);
out_kfree_skb:
	rc = -EINVAL;
	kfree_skb(skb);
	goto out;
}
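/*
 * dst->hh is checked twice in neigh_resolve_output(): once unlocked, then
 * again under neigh->lock, so concurrent callers cannot attach two
 * hardware-header caches to the same dst.
 */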
/* As fast as possible without hh cache */

int neigh_connected_output(struct sk_buff *skb)
{
	int err;
	struct dst_entry *dst = skb->dst;
	struct neighbour *neigh = dst->neighbour;
	struct net_device *dev = neigh->dev;

	__skb_pull(skb, skb_network_offset(skb));

	read_lock_bh(&neigh->lock);
	err = dev->hard_header(skb, dev, ntohs(skb->protocol),
			       neigh->ha, NULL, skb->len);
	read_unlock_bh(&neigh->lock);
	if (err >= 0)
		err = neigh->ops->queue_xmit(skb);
	else {
		err = -EINVAL;
		kfree_skb(skb);
	}
	return err;
}

static void neigh_proxy_process(unsigned long arg)
{
	struct neigh_table *tbl = (struct neigh_table *)arg;
	long sched_next = 0;
	unsigned long now = jiffies;
	struct sk_buff *skb;

	spin_lock(&tbl->proxy_queue.lock);

	skb = tbl->proxy_queue.next;

	while (skb != (struct sk_buff *)&tbl->proxy_queue) {
		struct sk_buff *back = skb;
		long tdif = NEIGH_CB(back)->sched_next - now;

		skb = skb->next;
		if (tdif <= 0) {
			struct net_device *dev = back->dev;
			__skb_unlink(back, &tbl->proxy_queue);
			if (tbl->proxy_redo && netif_running(dev))
				tbl->proxy_redo(back);
			else
				kfree_skb(back);

			dev_put(dev);
		} else if (!sched_next || tdif < sched_next)
			sched_next = tdif;
	}
	del_timer(&tbl->proxy_timer);
	if (sched_next)
		mod_timer(&tbl->proxy_timer, jiffies + sched_next);
	spin_unlock(&tbl->proxy_queue.lock);
}

void pneigh_enqueue(struct neigh_table *tbl, struct neigh_parms *p,
		    struct sk_buff *skb)
{
	unsigned long now = jiffies;
	unsigned long sched_next = now + (net_random() % p->proxy_delay);

	if (tbl->proxy_queue.qlen > p->proxy_qlen) {
		kfree_skb(skb);
		return;
	}

	NEIGH_CB(skb)->sched_next = sched_next;
	NEIGH_CB(skb)->flags |= LOCALLY_ENQUEUED;

	spin_lock(&tbl->proxy_queue.lock);
	if (del_timer(&tbl->proxy_timer)) {
		if (time_before(tbl->proxy_timer.expires, sched_next))
			sched_next = tbl->proxy_timer.expires;
	}
	dst_release(skb->dst);
	skb->dst = NULL;
	dev_hold(skb->dev);
	__skb_queue_tail(&tbl->proxy_queue, skb);
	mod_timer(&tbl->proxy_timer, sched_next);
	spin_unlock(&tbl->proxy_queue.lock);
}
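/*
 * Proxied requests are answered after a random delay in [0, proxy_delay)
 * jiffies; when a new packet is queued, the timer is re-armed to
 * whichever expiry comes first, so earlier-due packets are not delayed by
 * later arrivals.
 */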
struct neigh_parms *neigh_parms_alloc(struct net_device *dev,
				      struct neigh_table *tbl)
{
	struct neigh_parms *p = kmemdup(&tbl->parms, sizeof(*p), GFP_KERNEL);

	if (p) {
		p->tbl = tbl;
		atomic_set(&p->refcnt, 1);
		INIT_RCU_HEAD(&p->rcu_head);
		p->reachable_time =
				neigh_rand_reach_time(p->base_reachable_time);
		if (dev) {
			if (dev->neigh_setup && dev->neigh_setup(dev, p)) {
				kfree(p);
				return NULL;
			}

			dev_hold(dev);
			p->dev = dev;
		}
		p->sysctl_table = NULL;
		write_lock_bh(&tbl->lock);
		p->next = tbl->parms.next;
		tbl->parms.next = p;
		write_unlock_bh(&tbl->lock);
	}
	return p;
}

static void neigh_rcu_free_parms(struct rcu_head *head)
{
	struct neigh_parms *parms =
		container_of(head, struct neigh_parms, rcu_head);

	neigh_parms_put(parms);
}

void neigh_parms_release(struct neigh_table *tbl, struct neigh_parms *parms)
{
	struct neigh_parms **p;

	if (!parms || parms == &tbl->parms)
		return;
	write_lock_bh(&tbl->lock);
	for (p = &tbl->parms.next; *p; p = &(*p)->next) {
		if (*p == parms) {
			*p = parms->next;
			parms->dead = 1;
			write_unlock_bh(&tbl->lock);
			if (parms->dev)
				dev_put(parms->dev);
			call_rcu(&parms->rcu_head, neigh_rcu_free_parms);
			return;
		}
	}
	write_unlock_bh(&tbl->lock);
	NEIGH_PRINTK1("neigh_parms_release: not found\n");
}

void neigh_parms_destroy(struct neigh_parms *parms)
{
	kfree(parms);
}

static struct lock_class_key neigh_table_proxy_queue_class;

void neigh_table_init_no_netlink(struct neigh_table *tbl)
{
	unsigned long now = jiffies;
	unsigned long phsize;

	atomic_set(&tbl->parms.refcnt, 1);
	INIT_RCU_HEAD(&tbl->parms.rcu_head);
	tbl->parms.reachable_time =
			  neigh_rand_reach_time(tbl->parms.base_reachable_time);

	if (!tbl->kmem_cachep)
		tbl->kmem_cachep =
			kmem_cache_create(tbl->id, tbl->entry_size, 0,
					  SLAB_HWCACHE_ALIGN|SLAB_PANIC,
					  NULL, NULL);
	tbl->stats = alloc_percpu(struct neigh_statistics);
	if (!tbl->stats)
		panic("cannot create neighbour cache statistics");

#ifdef CONFIG_PROC_FS
	tbl->pde = create_proc_entry(tbl->id, 0, proc_net_stat);
	if (!tbl->pde)
		panic("cannot create neighbour proc dir entry");
	tbl->pde->proc_fops = &neigh_stat_seq_fops;
	tbl->pde->data = tbl;
#endif

	tbl->hash_mask = 1;
	tbl->hash_buckets = neigh_hash_alloc(tbl->hash_mask + 1);

	phsize = (PNEIGH_HASHMASK + 1) * sizeof(struct pneigh_entry *);
	tbl->phash_buckets = kzalloc(phsize, GFP_KERNEL);

	if (!tbl->hash_buckets || !tbl->phash_buckets)
		panic("cannot allocate neighbour cache hashes");

	get_random_bytes(&tbl->hash_rnd, sizeof(tbl->hash_rnd));

	rwlock_init(&tbl->lock);
	INIT_DELAYED_WORK_DEFERRABLE(&tbl->gc_work, neigh_periodic_work);
	schedule_delayed_work(&tbl->gc_work, tbl->parms.reachable_time);
	init_timer(&tbl->proxy_timer);
	tbl->proxy_timer.data = (unsigned long)tbl;
	tbl->proxy_timer.function = neigh_proxy_process;
	skb_queue_head_init_class(&tbl->proxy_queue,
				  &neigh_table_proxy_queue_class);

	tbl->last_flush = now;
	tbl->last_rand = now + tbl->parms.reachable_time * 20;
}

void neigh_table_init(struct neigh_table *tbl)
{
	struct neigh_table *tmp;

	neigh_table_init_no_netlink(tbl);
	write_lock(&neigh_tbl_lock);
	for (tmp = neigh_tables; tmp; tmp = tmp->next) {
		if (tmp->family == tbl->family)
			break;
	}
	tbl->next = neigh_tables;
	neigh_tables = tbl;
	write_unlock(&neigh_tbl_lock);

	if (unlikely(tmp)) {
		printk(KERN_ERR "NEIGH: Registering multiple tables for "
		       "family %d\n", tbl->family);
		dump_stack();
	}
}

int neigh_table_clear(struct neigh_table *tbl)
{
	struct neigh_table **tp;

	/* It is not clean... Fix it to unload IPv6 module safely */
	cancel_delayed_work(&tbl->gc_work);
	flush_scheduled_work();
	del_timer_sync(&tbl->proxy_timer);
	pneigh_queue_purge(&tbl->proxy_queue);
	neigh_ifdown(tbl, NULL);
	if (atomic_read(&tbl->entries))
		printk(KERN_CRIT "neighbour leakage\n");
	write_lock(&neigh_tbl_lock);
	for (tp = &neigh_tables; *tp; tp = &(*tp)->next) {
		if (*tp == tbl) {
			*tp = tbl->next;
			break;
		}
	}
	write_unlock(&neigh_tbl_lock);

	neigh_hash_free(tbl->hash_buckets, tbl->hash_mask + 1);
	tbl->hash_buckets = NULL;

	kfree(tbl->phash_buckets);
	tbl->phash_buckets = NULL;

	free_percpu(tbl->stats);
	tbl->stats = NULL;

	return 0;
}
static int neigh_delete(struct sk_buff *skb, struct nlmsghdr *nlh, void *arg)
{
	struct ndmsg *ndm;
	struct nlattr *dst_attr;
	struct neigh_table *tbl;
	struct net_device *dev = NULL;
	int err = -EINVAL;

	if (nlmsg_len(nlh) < sizeof(*ndm))
		goto out;

	dst_attr = nlmsg_find_attr(nlh, sizeof(*ndm), NDA_DST);
	if (dst_attr == NULL)
		goto out;

	ndm = nlmsg_data(nlh);
	if (ndm->ndm_ifindex) {
		dev = dev_get_by_index(ndm->ndm_ifindex);
		if (dev == NULL) {
			err = -ENODEV;
			goto out;
		}
	}

	read_lock(&neigh_tbl_lock);
	for (tbl = neigh_tables; tbl; tbl = tbl->next) {
		struct neighbour *neigh;

		if (tbl->family != ndm->ndm_family)
			continue;
		read_unlock(&neigh_tbl_lock);

		if (nla_len(dst_attr) < tbl->key_len)
			goto out_dev_put;

		if (ndm->ndm_flags & NTF_PROXY) {
			err = pneigh_delete(tbl, nla_data(dst_attr), dev);
			goto out_dev_put;
		}

		if (dev == NULL)
			goto out_dev_put;

		neigh = neigh_lookup(tbl, nla_data(dst_attr), dev);
		if (neigh == NULL) {
			err = -ENOENT;
			goto out_dev_put;
		}

		err = neigh_update(neigh, NULL, NUD_FAILED,
				   NEIGH_UPDATE_F_OVERRIDE |
				   NEIGH_UPDATE_F_ADMIN);
		neigh_release(neigh);
		goto out_dev_put;
	}
	read_unlock(&neigh_tbl_lock);
	err = -EAFNOSUPPORT;

out_dev_put:
	if (dev)
		dev_put(dev);
out:
	return err;
}

static int neigh_add(struct sk_buff *skb, struct nlmsghdr *nlh, void *arg)
{
	struct ndmsg *ndm;
	struct nlattr *tb[NDA_MAX+1];
	struct neigh_table *tbl;
	struct net_device *dev = NULL;
	int err;

	err = nlmsg_parse(nlh, sizeof(*ndm), tb, NDA_MAX, NULL);
	if (err < 0)
		goto out;

	err = -EINVAL;
	if (tb[NDA_DST] == NULL)
		goto out;

	ndm = nlmsg_data(nlh);
	if (ndm->ndm_ifindex) {
		dev = dev_get_by_index(ndm->ndm_ifindex);
		if (dev == NULL) {
			err = -ENODEV;
			goto out;
		}

		if (tb[NDA_LLADDR] && nla_len(tb[NDA_LLADDR]) < dev->addr_len)
			goto out_dev_put;
	}

	read_lock(&neigh_tbl_lock);
	for (tbl = neigh_tables; tbl; tbl = tbl->next) {
		int flags = NEIGH_UPDATE_F_ADMIN | NEIGH_UPDATE_F_OVERRIDE;
		struct neighbour *neigh;
		void *dst, *lladdr;

		if (tbl->family != ndm->ndm_family)
			continue;
		read_unlock(&neigh_tbl_lock);

		if (nla_len(tb[NDA_DST]) < tbl->key_len)
			goto out_dev_put;
		dst = nla_data(tb[NDA_DST]);
		lladdr = tb[NDA_LLADDR] ? nla_data(tb[NDA_LLADDR]) : NULL;

		if (ndm->ndm_flags & NTF_PROXY) {
			struct pneigh_entry *pn;

			err = -ENOBUFS;
			pn = pneigh_lookup(tbl, dst, dev, 1);
			if (pn) {
				pn->flags = ndm->ndm_flags;
				err = 0;
			}
			goto out_dev_put;
		}

		if (dev == NULL)
			goto out_dev_put;

		neigh = neigh_lookup(tbl, dst, dev);
		if (neigh == NULL) {
			if (!(nlh->nlmsg_flags & NLM_F_CREATE)) {
				err = -ENOENT;
				goto out_dev_put;
			}

			neigh = __neigh_lookup_errno(tbl, dst, dev);
			if (IS_ERR(neigh)) {
				err = PTR_ERR(neigh);
				goto out_dev_put;
			}
		} else {
			if (nlh->nlmsg_flags & NLM_F_EXCL) {
				err = -EEXIST;
				neigh_release(neigh);
				goto out_dev_put;
			}

			if (!(nlh->nlmsg_flags & NLM_F_REPLACE))
				flags &= ~NEIGH_UPDATE_F_OVERRIDE;
		}

		err = neigh_update(neigh, lladdr, ndm->ndm_state, flags);
		neigh_release(neigh);
		goto out_dev_put;
	}

	read_unlock(&neigh_tbl_lock);
	err = -EAFNOSUPPORT;

out_dev_put:
	if (dev)
		dev_put(dev);
out:
	return err;
}
static int neightbl_fill_parms(struct sk_buff *skb, struct neigh_parms *parms)
{
	struct nlattr *nest;

	nest = nla_nest_start(skb, NDTA_PARMS);
	if (nest == NULL)
		return -ENOBUFS;

	if (parms->dev)
		NLA_PUT_U32(skb, NDTPA_IFINDEX, parms->dev->ifindex);

	NLA_PUT_U32(skb, NDTPA_REFCNT, atomic_read(&parms->refcnt));
	NLA_PUT_U32(skb, NDTPA_QUEUE_LEN, parms->queue_len);
	NLA_PUT_U32(skb, NDTPA_PROXY_QLEN, parms->proxy_qlen);
	NLA_PUT_U32(skb, NDTPA_APP_PROBES, parms->app_probes);
	NLA_PUT_U32(skb, NDTPA_UCAST_PROBES, parms->ucast_probes);
	NLA_PUT_U32(skb, NDTPA_MCAST_PROBES, parms->mcast_probes);
	NLA_PUT_MSECS(skb, NDTPA_REACHABLE_TIME, parms->reachable_time);
	NLA_PUT_MSECS(skb, NDTPA_BASE_REACHABLE_TIME,
		      parms->base_reachable_time);
	NLA_PUT_MSECS(skb, NDTPA_GC_STALETIME, parms->gc_staletime);
	NLA_PUT_MSECS(skb, NDTPA_DELAY_PROBE_TIME, parms->delay_probe_time);
	NLA_PUT_MSECS(skb, NDTPA_RETRANS_TIME, parms->retrans_time);
	NLA_PUT_MSECS(skb, NDTPA_ANYCAST_DELAY, parms->anycast_delay);
	NLA_PUT_MSECS(skb, NDTPA_PROXY_DELAY, parms->proxy_delay);
	NLA_PUT_MSECS(skb, NDTPA_LOCKTIME, parms->locktime);

	return nla_nest_end(skb, nest);

nla_put_failure:
	return nla_nest_cancel(skb, nest);
}
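/*
 * The NLA_PUT*() macros above jump to the nla_put_failure label when the
 * skb runs out of tailroom; that is where the otherwise unreferenced
 * label comes from.
 */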
static int neightbl_fill_info(struct sk_buff *skb, struct neigh_table *tbl,
			      u32 pid, u32 seq, int type, int flags)
{
	struct nlmsghdr *nlh;
	struct ndtmsg *ndtmsg;

	nlh = nlmsg_put(skb, pid, seq, type, sizeof(*ndtmsg), flags);
	if (nlh == NULL)
		return -EMSGSIZE;

	ndtmsg = nlmsg_data(nlh);

	read_lock_bh(&tbl->lock);
	ndtmsg->ndtm_family = tbl->family;
	ndtmsg->ndtm_pad1 = 0;
	ndtmsg->ndtm_pad2 = 0;

	NLA_PUT_STRING(skb, NDTA_NAME, tbl->id);
	NLA_PUT_MSECS(skb, NDTA_GC_INTERVAL, tbl->gc_interval);
	NLA_PUT_U32(skb, NDTA_THRESH1, tbl->gc_thresh1);
	NLA_PUT_U32(skb, NDTA_THRESH2, tbl->gc_thresh2);
	NLA_PUT_U32(skb, NDTA_THRESH3, tbl->gc_thresh3);

	{
		unsigned long now = jiffies;
		unsigned int flush_delta = now - tbl->last_flush;
		unsigned int rand_delta = now - tbl->last_rand;

		struct ndt_config ndc = {
			.ndtc_key_len		= tbl->key_len,
			.ndtc_entry_size	= tbl->entry_size,
			.ndtc_entries		= atomic_read(&tbl->entries),
			.ndtc_last_flush	= jiffies_to_msecs(flush_delta),
			.ndtc_last_rand		= jiffies_to_msecs(rand_delta),
			.ndtc_hash_rnd		= tbl->hash_rnd,
			.ndtc_hash_mask		= tbl->hash_mask,
			.ndtc_proxy_qlen	= tbl->proxy_queue.qlen,
		};

		NLA_PUT(skb, NDTA_CONFIG, sizeof(ndc), &ndc);
	}

	{
		int cpu;
		struct ndt_stats ndst;

		memset(&ndst, 0, sizeof(ndst));

		for_each_possible_cpu(cpu) {
			struct neigh_statistics *st;

			st = per_cpu_ptr(tbl->stats, cpu);
			ndst.ndts_allocs		+= st->allocs;
			ndst.ndts_destroys		+= st->destroys;
			ndst.ndts_hash_grows		+= st->hash_grows;
			ndst.ndts_res_failed		+= st->res_failed;
			ndst.ndts_lookups		+= st->lookups;
			ndst.ndts_hits			+= st->hits;
			ndst.ndts_rcv_probes_mcast	+= st->rcv_probes_mcast;
			ndst.ndts_rcv_probes_ucast	+= st->rcv_probes_ucast;
			ndst.ndts_periodic_gc_runs	+= st->periodic_gc_runs;
			ndst.ndts_forced_gc_runs	+= st->forced_gc_runs;
		}

		NLA_PUT(skb, NDTA_STATS, sizeof(ndst), &ndst);
	}

	BUG_ON(tbl->parms.dev);
	if (neightbl_fill_parms(skb, &tbl->parms) < 0)
		goto nla_put_failure;

	read_unlock_bh(&tbl->lock);
	return nlmsg_end(skb, nlh);

nla_put_failure:
	read_unlock_bh(&tbl->lock);
	nlmsg_cancel(skb, nlh);
	return -EMSGSIZE;
}

static int neightbl_fill_param_info(struct sk_buff *skb,
				    struct neigh_table *tbl,
				    struct neigh_parms *parms,
				    u32 pid, u32 seq, int type,
				    unsigned int flags)
{
	struct ndtmsg *ndtmsg;
	struct nlmsghdr *nlh;

	nlh = nlmsg_put(skb, pid, seq, type, sizeof(*ndtmsg), flags);
	if (nlh == NULL)
		return -EMSGSIZE;

	ndtmsg = nlmsg_data(nlh);

	read_lock_bh(&tbl->lock);
	ndtmsg->ndtm_family = tbl->family;
	ndtmsg->ndtm_pad1 = 0;
	ndtmsg->ndtm_pad2 = 0;

	if (nla_put_string(skb, NDTA_NAME, tbl->id) < 0 ||
	    neightbl_fill_parms(skb, parms) < 0)
		goto errout;

	read_unlock_bh(&tbl->lock);
	return nlmsg_end(skb, nlh);
errout:
	read_unlock_bh(&tbl->lock);
	nlmsg_cancel(skb, nlh);
	return -EMSGSIZE;
}

static inline struct neigh_parms *lookup_neigh_params(struct neigh_table *tbl,
						      int ifindex)
{
	struct neigh_parms *p;

	for (p = &tbl->parms; p; p = p->next)
		if ((p->dev && p->dev->ifindex == ifindex) ||
		    (!p->dev && !ifindex))
			return p;

	return NULL;
}

static const struct nla_policy nl_neightbl_policy[NDTA_MAX+1] = {
	[NDTA_NAME]		= { .type = NLA_STRING },
	[NDTA_THRESH1]		= { .type = NLA_U32 },
	[NDTA_THRESH2]		= { .type = NLA_U32 },
	[NDTA_THRESH3]		= { .type = NLA_U32 },
	[NDTA_GC_INTERVAL]	= { .type = NLA_U64 },
	[NDTA_PARMS]		= { .type = NLA_NESTED },
};

static const struct nla_policy nl_ntbl_parm_policy[NDTPA_MAX+1] = {
	[NDTPA_IFINDEX]			= { .type = NLA_U32 },
	[NDTPA_QUEUE_LEN]		= { .type = NLA_U32 },
	[NDTPA_PROXY_QLEN]		= { .type = NLA_U32 },
	[NDTPA_APP_PROBES]		= { .type = NLA_U32 },
	[NDTPA_UCAST_PROBES]		= { .type = NLA_U32 },
	[NDTPA_MCAST_PROBES]		= { .type = NLA_U32 },
	[NDTPA_BASE_REACHABLE_TIME]	= { .type = NLA_U64 },
	[NDTPA_GC_STALETIME]		= { .type = NLA_U64 },
	[NDTPA_DELAY_PROBE_TIME]	= { .type = NLA_U64 },
	[NDTPA_RETRANS_TIME]		= { .type = NLA_U64 },
	[NDTPA_ANYCAST_DELAY]		= { .type = NLA_U64 },
	[NDTPA_PROXY_DELAY]		= { .type = NLA_U64 },
	[NDTPA_LOCKTIME]		= { .type = NLA_U64 },
};
static int neightbl_set(struct sk_buff *skb, struct nlmsghdr *nlh, void *arg)
{
	struct neigh_table *tbl;
	struct ndtmsg *ndtmsg;
	struct nlattr *tb[NDTA_MAX+1];
	int err;

	err = nlmsg_parse(nlh, sizeof(*ndtmsg), tb, NDTA_MAX,
			  nl_neightbl_policy);
	if (err < 0)
		goto errout;

	if (tb[NDTA_NAME] == NULL) {
		err = -EINVAL;
		goto errout;
	}

	ndtmsg = nlmsg_data(nlh);
	read_lock(&neigh_tbl_lock);
	for (tbl = neigh_tables; tbl; tbl = tbl->next) {
		if (ndtmsg->ndtm_family && tbl->family != ndtmsg->ndtm_family)
			continue;

		if (nla_strcmp(tb[NDTA_NAME], tbl->id) == 0)
			break;
	}

	if (tbl == NULL) {
		err = -ENOENT;
		goto errout_locked;
	}

	/*
	 * We acquire tbl->lock to be nice to the periodic timers and
	 * make sure they always see a consistent set of values.
	 */
	write_lock_bh(&tbl->lock);

	if (tb[NDTA_PARMS]) {
		struct nlattr *tbp[NDTPA_MAX+1];
		struct neigh_parms *p;
		int i, ifindex = 0;

		err = nla_parse_nested(tbp, NDTPA_MAX, tb[NDTA_PARMS],
				       nl_ntbl_parm_policy);
		if (err < 0)
			goto errout_tbl_lock;

		if (tbp[NDTPA_IFINDEX])
			ifindex = nla_get_u32(tbp[NDTPA_IFINDEX]);

		p = lookup_neigh_params(tbl, ifindex);
		if (p == NULL) {
			err = -ENOENT;
			goto errout_tbl_lock;
		}

		for (i = 1; i <= NDTPA_MAX; i++) {
			if (tbp[i] == NULL)
				continue;

			switch (i) {
			case NDTPA_QUEUE_LEN:
				p->queue_len = nla_get_u32(tbp[i]);
				break;
			case NDTPA_PROXY_QLEN:
				p->proxy_qlen = nla_get_u32(tbp[i]);
				break;
			case NDTPA_APP_PROBES:
				p->app_probes = nla_get_u32(tbp[i]);
				break;
			case NDTPA_UCAST_PROBES:
				p->ucast_probes = nla_get_u32(tbp[i]);
				break;
			case NDTPA_MCAST_PROBES:
				p->mcast_probes = nla_get_u32(tbp[i]);
				break;
			case NDTPA_BASE_REACHABLE_TIME:
				p->base_reachable_time = nla_get_msecs(tbp[i]);
				break;
			case NDTPA_GC_STALETIME:
				p->gc_staletime = nla_get_msecs(tbp[i]);
				break;
			case NDTPA_DELAY_PROBE_TIME:
				p->delay_probe_time = nla_get_msecs(tbp[i]);
				break;
			case NDTPA_RETRANS_TIME:
				p->retrans_time = nla_get_msecs(tbp[i]);
				break;
			case NDTPA_ANYCAST_DELAY:
				p->anycast_delay = nla_get_msecs(tbp[i]);
				break;
			case NDTPA_PROXY_DELAY:
				p->proxy_delay = nla_get_msecs(tbp[i]);
				break;
			case NDTPA_LOCKTIME:
				p->locktime = nla_get_msecs(tbp[i]);
				break;
			}
		}
	}

	if (tb[NDTA_THRESH1])
		tbl->gc_thresh1 = nla_get_u32(tb[NDTA_THRESH1]);

	if (tb[NDTA_THRESH2])
		tbl->gc_thresh2 = nla_get_u32(tb[NDTA_THRESH2]);

	if (tb[NDTA_THRESH3])
		tbl->gc_thresh3 = nla_get_u32(tb[NDTA_THRESH3]);

	if (tb[NDTA_GC_INTERVAL])
		tbl->gc_interval = nla_get_msecs(tb[NDTA_GC_INTERVAL]);

	err = 0;

errout_tbl_lock:
	write_unlock_bh(&tbl->lock);
errout_locked:
	read_unlock(&neigh_tbl_lock);
errout:
	return err;
}
static int neightbl_dump_info(struct sk_buff *skb, struct netlink_callback *cb)
{
	int family, tidx, nidx = 0;
	int tbl_skip = cb->args[0];
	int neigh_skip = cb->args[1];
	struct neigh_table *tbl;

	family = ((struct rtgenmsg *) nlmsg_data(cb->nlh))->rtgen_family;

	read_lock(&neigh_tbl_lock);
	for (tbl = neigh_tables, tidx = 0; tbl; tbl = tbl->next, tidx++) {
		struct neigh_parms *p;

		if (tidx < tbl_skip || (family && tbl->family != family))
			continue;

		if (neightbl_fill_info(skb, tbl, NETLINK_CB(cb->skb).pid,
				       cb->nlh->nlmsg_seq, RTM_NEWNEIGHTBL,
				       NLM_F_MULTI) <= 0)
			break;

		for (nidx = 0, p = tbl->parms.next; p; p = p->next, nidx++) {
			if (nidx < neigh_skip)
				continue;

			if (neightbl_fill_param_info(skb, tbl, p,
						     NETLINK_CB(cb->skb).pid,
						     cb->nlh->nlmsg_seq,
						     RTM_NEWNEIGHTBL,
						     NLM_F_MULTI) <= 0)
				goto out;
		}

		neigh_skip = 0;
	}
out:
	read_unlock(&neigh_tbl_lock);
	cb->args[0] = tidx;
	cb->args[1] = nidx;

	return skb->len;
}

static int neigh_fill_info(struct sk_buff *skb, struct neighbour *neigh,
			   u32 pid, u32 seq, int type, unsigned int flags)
{
	unsigned long now = jiffies;
	struct nda_cacheinfo ci;
	struct nlmsghdr *nlh;
	struct ndmsg *ndm;

	nlh = nlmsg_put(skb, pid, seq, type, sizeof(*ndm), flags);
	if (nlh == NULL)
		return -EMSGSIZE;

	ndm = nlmsg_data(nlh);
	ndm->ndm_family = neigh->ops->family;
	ndm->ndm_pad1 = 0;
	ndm->ndm_pad2 = 0;
	ndm->ndm_flags = neigh->flags;
	ndm->ndm_type = neigh->type;
	ndm->ndm_ifindex = neigh->dev->ifindex;

	NLA_PUT(skb, NDA_DST, neigh->tbl->key_len, neigh->primary_key);

	read_lock_bh(&neigh->lock);
	ndm->ndm_state = neigh->nud_state;
	if ((neigh->nud_state & NUD_VALID) &&
	    nla_put(skb, NDA_LLADDR, neigh->dev->addr_len, neigh->ha) < 0) {
		read_unlock_bh(&neigh->lock);
		goto nla_put_failure;
	}

	ci.ndm_used	 = now - neigh->used;
	ci.ndm_confirmed = now - neigh->confirmed;
	ci.ndm_updated	 = now - neigh->updated;
	ci.ndm_refcnt	 = atomic_read(&neigh->refcnt) - 1;
	read_unlock_bh(&neigh->lock);

	NLA_PUT_U32(skb, NDA_PROBES, atomic_read(&neigh->probes));
	NLA_PUT(skb, NDA_CACHEINFO, sizeof(ci), &ci);

	return nlmsg_end(skb, nlh);

nla_put_failure:
	nlmsg_cancel(skb, nlh);
	return -EMSGSIZE;
}
static int neigh_dump_table(struct neigh_table *tbl, struct sk_buff *skb,
			    struct netlink_callback *cb)
{
	struct neighbour *n;
	int rc, h, s_h = cb->args[1];
	int idx, s_idx = idx = cb->args[2];

	read_lock_bh(&tbl->lock);
	for (h = 0; h <= tbl->hash_mask; h++) {
		if (h < s_h)
			continue;
		if (h > s_h)
			s_idx = 0;
		for (n = tbl->hash_buckets[h], idx = 0; n; n = n->next, idx++) {
			if (idx < s_idx)
				continue;
			if (neigh_fill_info(skb, n, NETLINK_CB(cb->skb).pid,
					    cb->nlh->nlmsg_seq,
					    RTM_NEWNEIGH,
					    NLM_F_MULTI) <= 0) {
				read_unlock_bh(&tbl->lock);
				rc = -1;
				goto out;
			}
		}
	}
	read_unlock_bh(&tbl->lock);
	rc = skb->len;
out:
	cb->args[1] = h;
	cb->args[2] = idx;
	return rc;
}

static int neigh_dump_info(struct sk_buff *skb, struct netlink_callback *cb)
{
	struct neigh_table *tbl;
	int t, family, s_t;

	read_lock(&neigh_tbl_lock);
	family = ((struct rtgenmsg *) nlmsg_data(cb->nlh))->rtgen_family;
	s_t = cb->args[0];

	for (tbl = neigh_tables, t = 0; tbl; tbl = tbl->next, t++) {
		if (t < s_t || (family && tbl->family != family))
			continue;
		if (t > s_t)
			memset(&cb->args[1], 0, sizeof(cb->args) -
						sizeof(cb->args[0]));
		if (neigh_dump_table(tbl, skb, cb) < 0)
			break;
	}
	read_unlock(&neigh_tbl_lock);

	cb->args[0] = t;
	return skb->len;
}

void neigh_for_each(struct neigh_table *tbl, void (*cb)(struct neighbour *, void *), void *cookie)
{
	int chain;

	read_lock_bh(&tbl->lock);
	for (chain = 0; chain <= tbl->hash_mask; chain++) {
		struct neighbour *n;

		for (n = tbl->hash_buckets[chain]; n; n = n->next)
			cb(n, cookie);
	}
	read_unlock_bh(&tbl->lock);
}
EXPORT_SYMBOL(neigh_for_each);

/* The tbl->lock must be held as a writer and BH disabled. */
void __neigh_for_each_release(struct neigh_table *tbl,
			      int (*cb)(struct neighbour *))
{
	int chain;

	for (chain = 0; chain <= tbl->hash_mask; chain++) {
		struct neighbour *n, **np;

		np = &tbl->hash_buckets[chain];
		while ((n = *np) != NULL) {
			int release;

			write_lock(&n->lock);
			release = cb(n);
			if (release) {
				*np = n->next;
				n->dead = 1;
			} else
				np = &n->next;
			write_unlock(&n->lock);
			if (release) {
				neigh_cleanup_and_release(n);
			}
		}
	}
}
EXPORT_SYMBOL(__neigh_for_each_release);
2102 #ifdef CONFIG_PROC_FS
2104 static struct neighbour *neigh_get_first(struct seq_file *seq)
2106 struct neigh_seq_state *state = seq->private;
2107 struct neigh_table *tbl = state->tbl;
2108 struct neighbour *n = NULL;
2109 int bucket = state->bucket;
2111 state->flags &= ~NEIGH_SEQ_IS_PNEIGH;
2112 for (bucket = 0; bucket <= tbl->hash_mask; bucket++) {
2113 n = tbl->hash_buckets[bucket];
2115 while (n) {
2116 if (state->neigh_sub_iter) {
2117 loff_t fakep = 0;
2118 void *v;
2120 v = state->neigh_sub_iter(state, n, &fakep);
2121 if (!v)
2122 goto next;
2124 if (!(state->flags & NEIGH_SEQ_SKIP_NOARP))
2125 break;
2126 if (n->nud_state & ~NUD_NOARP)
2127 break;
2128 next:
2129 n = n->next;
2132 if (n)
2133 break;
2135 state->bucket = bucket;
2137 return n;
2140 static struct neighbour *neigh_get_next(struct seq_file *seq,
2141 struct neighbour *n,
2142 loff_t *pos)
2144 struct neigh_seq_state *state = seq->private;
2145 struct neigh_table *tbl = state->tbl;
2147 if (state->neigh_sub_iter) {
2148 void *v = state->neigh_sub_iter(state, n, pos);
2149 if (v)
2150 return n;
2152 n = n->next;
2154 while (1) {
2155 while (n) {
2156 if (state->neigh_sub_iter) {
2157 void *v = state->neigh_sub_iter(state, n, pos);
2158 if (v)
2159 return n;
2160 goto next;
2162 if (!(state->flags & NEIGH_SEQ_SKIP_NOARP))
2163 break;
2165 if (n->nud_state & ~NUD_NOARP)
2166 break;
2167 next:
2168 n = n->next;
2171 if (n)
2172 break;
2174 if (++state->bucket > tbl->hash_mask)
2175 break;
2177 n = tbl->hash_buckets[state->bucket];
2180 if (n && pos)
2181 --(*pos);
2182 return n;
2185 static struct neighbour *neigh_get_idx(struct seq_file *seq, loff_t *pos)
2187 struct neighbour *n = neigh_get_first(seq);
2189 if (n) {
2190 while (*pos) {
2191 n = neigh_get_next(seq, n, pos);
2192 if (!n)
2193 break;
2196 return *pos ? NULL : n;
2199 static struct pneigh_entry *pneigh_get_first(struct seq_file *seq)
2201 struct neigh_seq_state *state = seq->private;
2202 struct neigh_table *tbl = state->tbl;
2203 struct pneigh_entry *pn = NULL;
2204 int bucket = state->bucket;
2206 state->flags |= NEIGH_SEQ_IS_PNEIGH;
2207 for (bucket = 0; bucket <= PNEIGH_HASHMASK; bucket++) {
2208 pn = tbl->phash_buckets[bucket];
2209 if (pn)
2210 break;
2212 state->bucket = bucket;
2214 return pn;
2217 static struct pneigh_entry *pneigh_get_next(struct seq_file *seq,
2218 struct pneigh_entry *pn,
2219 loff_t *pos)
2221 struct neigh_seq_state *state = seq->private;
2222 struct neigh_table *tbl = state->tbl;
2224 pn = pn->next;
2225 while (!pn) {
2226 if (++state->bucket > PNEIGH_HASHMASK)
2227 break;
2228 pn = tbl->phash_buckets[state->bucket];
2229 if (pn)
2230 break;
2233 if (pn && pos)
2234 --(*pos);
2236 return pn;
2239 static struct pneigh_entry *pneigh_get_idx(struct seq_file *seq, loff_t *pos)
2241 struct pneigh_entry *pn = pneigh_get_first(seq);
2243 if (pn) {
2244 while (*pos) {
2245 pn = pneigh_get_next(seq, pn, pos);
2246 if (!pn)
2247 break;
2250 return *pos ? NULL : pn;
2253 static void *neigh_get_idx_any(struct seq_file *seq, loff_t *pos)
2255 struct neigh_seq_state *state = seq->private;
2256 void *rc;
2258 rc = neigh_get_idx(seq, pos);
2259 if (!rc && !(state->flags & NEIGH_SEQ_NEIGH_ONLY))
2260 rc = pneigh_get_idx(seq, pos);
2262 return rc;
void *neigh_seq_start(struct seq_file *seq, loff_t *pos, struct neigh_table *tbl, unsigned int neigh_seq_flags)
{
	struct neigh_seq_state *state = seq->private;
	loff_t pos_minus_one;

	state->tbl = tbl;
	state->bucket = 0;
	state->flags = (neigh_seq_flags & ~NEIGH_SEQ_IS_PNEIGH);

	read_lock_bh(&tbl->lock);

	pos_minus_one = *pos - 1;
	return *pos ? neigh_get_idx_any(seq, &pos_minus_one) : SEQ_START_TOKEN;
}
EXPORT_SYMBOL(neigh_seq_start);

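/*
 * NEIGH_SEQ_IS_PNEIGH in state->flags records which table the cursor
 * is in, letting ->next hand over from the last neighbour entry to
 * the first proxy entry.
 */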
void *neigh_seq_next(struct seq_file *seq, void *v, loff_t *pos)
{
	struct neigh_seq_state *state;
	void *rc;

	if (v == SEQ_START_TOKEN) {
		rc = neigh_get_idx(seq, pos);
		goto out;
	}

	state = seq->private;
	if (!(state->flags & NEIGH_SEQ_IS_PNEIGH)) {
		rc = neigh_get_next(seq, v, NULL);
		if (rc)
			goto out;
		if (!(state->flags & NEIGH_SEQ_NEIGH_ONLY))
			rc = pneigh_get_first(seq);
	} else {
		BUG_ON(state->flags & NEIGH_SEQ_NEIGH_ONLY);
		rc = pneigh_get_next(seq, v, NULL);
	}
out:
	++(*pos);
	return rc;
}
EXPORT_SYMBOL(neigh_seq_next);

void neigh_seq_stop(struct seq_file *seq, void *v)
{
	struct neigh_seq_state *state = seq->private;
	struct neigh_table *tbl = state->tbl;

	read_unlock_bh(&tbl->lock);
}
EXPORT_SYMBOL(neigh_seq_stop);

/* statistics via seq_file */

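/*
 * One output line per possible CPU; *pos encodes cpu + 1, position 0
 * being the header (SEQ_START_TOKEN).  CPUs that are not possible on
 * this machine are simply skipped.
 */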
static void *neigh_stat_seq_start(struct seq_file *seq, loff_t *pos)
{
	struct proc_dir_entry *pde = seq->private;
	struct neigh_table *tbl = pde->data;
	int cpu;

	if (*pos == 0)
		return SEQ_START_TOKEN;

	for (cpu = *pos - 1; cpu < NR_CPUS; ++cpu) {
		if (!cpu_possible(cpu))
			continue;
		*pos = cpu + 1;
		return per_cpu_ptr(tbl->stats, cpu);
	}
	return NULL;
}

static void *neigh_stat_seq_next(struct seq_file *seq, void *v, loff_t *pos)
{
	struct proc_dir_entry *pde = seq->private;
	struct neigh_table *tbl = pde->data;
	int cpu;

	for (cpu = *pos; cpu < NR_CPUS; ++cpu) {
		if (!cpu_possible(cpu))
			continue;
		*pos = cpu + 1;
		return per_cpu_ptr(tbl->stats, cpu);
	}
	return NULL;
}

static void neigh_stat_seq_stop(struct seq_file *seq, void *v)
{
	/* Nothing to undo: unlike neigh_seq_stop(), no lock is held. */
}

static int neigh_stat_seq_show(struct seq_file *seq, void *v)
{
	struct proc_dir_entry *pde = seq->private;
	struct neigh_table *tbl = pde->data;
	struct neigh_statistics *st = v;

	if (v == SEQ_START_TOKEN) {
		seq_printf(seq, "entries allocs destroys hash_grows lookups hits res_failed rcv_probes_mcast rcv_probes_ucast periodic_gc_runs forced_gc_runs\n");
		return 0;
	}

	seq_printf(seq, "%08x %08lx %08lx %08lx %08lx %08lx %08lx "
			"%08lx %08lx %08lx %08lx\n",
		   atomic_read(&tbl->entries),

		   st->allocs,
		   st->destroys,
		   st->hash_grows,

		   st->lookups,
		   st->hits,

		   st->res_failed,

		   st->rcv_probes_mcast,
		   st->rcv_probes_ucast,

		   st->periodic_gc_runs,
		   st->forced_gc_runs
		   );

	return 0;
}

static const struct seq_operations neigh_stat_seq_ops = {
	.start	= neigh_stat_seq_start,
	.next	= neigh_stat_seq_next,
	.stop	= neigh_stat_seq_stop,
	.show	= neigh_stat_seq_show,
};

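/*
 * seq->private is pointed at the proc_dir_entry so that the
 * callbacks above can recover the neigh_table from pde->data.  The
 * resulting files live under /proc/net/stat/ (e.g. arp_cache for
 * the ARP table).
 */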
static int neigh_stat_seq_open(struct inode *inode, struct file *file)
{
	int ret = seq_open(file, &neigh_stat_seq_ops);

	if (!ret) {
		struct seq_file *sf = file->private_data;
		sf->private = PDE(inode);
	}
	return ret;
}

static const struct file_operations neigh_stat_seq_fops = {
	.owner	 = THIS_MODULE,
	.open	 = neigh_stat_seq_open,
	.read	 = seq_read,
	.llseek	 = seq_lseek,
	.release = seq_release,
};

#endif /* CONFIG_PROC_FS */

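/*
 * Netlink notification helpers, built only when CONFIG_ARPD allows a
 * user-space ARP daemon to take part in resolution.  The size below
 * is an upper bound: MAX_ADDR_LEN covers NDA_DST and NDA_LLADDR for
 * any address family, so one allocation always suffices.
 */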
#ifdef CONFIG_ARPD
static inline size_t neigh_nlmsg_size(void)
{
	return NLMSG_ALIGN(sizeof(struct ndmsg))
	       + nla_total_size(MAX_ADDR_LEN) /* NDA_DST */
	       + nla_total_size(MAX_ADDR_LEN) /* NDA_LLADDR */
	       + nla_total_size(sizeof(struct nda_cacheinfo))
	       + nla_total_size(4); /* NDA_PROBES */
}

static void __neigh_notify(struct neighbour *n, int type, int flags)
{
	struct sk_buff *skb;
	int err = -ENOBUFS;

	skb = nlmsg_new(neigh_nlmsg_size(), GFP_ATOMIC);
	if (skb == NULL)
		goto errout;

	err = neigh_fill_info(skb, n, 0, 0, type, flags);
	if (err < 0) {
		/* -EMSGSIZE implies BUG in neigh_nlmsg_size() */
		WARN_ON(err == -EMSGSIZE);
		kfree_skb(skb);
		goto errout;
	}
	err = rtnl_notify(skb, 0, RTNLGRP_NEIGH, NULL, GFP_ATOMIC);
errout:
	if (err < 0)
		rtnl_set_sk_err(RTNLGRP_NEIGH, err);
}

void neigh_app_ns(struct neighbour *n)
{
	__neigh_notify(n, RTM_GETNEIGH, NLM_F_REQUEST);
}

static void neigh_app_notify(struct neighbour *n)
{
	__neigh_notify(n, RTM_NEWNEIGH, 0);
}

#endif /* CONFIG_ARPD */

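/*
 * The sysctl template below is cloned once per (protocol, device)
 * pair.  The four directory tables chain together as
 * net -> <proto> -> neigh -> <dev>, giving paths such as
 * /proc/sys/net/ipv4/neigh/eth0/retrans_time, with "default"
 * standing in for <dev> when the parms are not device-specific.
 */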
#ifdef CONFIG_SYSCTL

static struct neigh_sysctl_table {
	struct ctl_table_header *sysctl_header;
	ctl_table		neigh_vars[__NET_NEIGH_MAX];
	ctl_table		neigh_dev[2];
	ctl_table		neigh_neigh_dir[2];
	ctl_table		neigh_proto_dir[2];
	ctl_table		neigh_root_dir[2];
} neigh_sysctl_template __read_mostly = {
	.neigh_vars = {
		{
			.ctl_name	= NET_NEIGH_MCAST_SOLICIT,
			.procname	= "mcast_solicit",
			.maxlen		= sizeof(int),
			.mode		= 0644,
			.proc_handler	= &proc_dointvec,
		},
		{
			.ctl_name	= NET_NEIGH_UCAST_SOLICIT,
			.procname	= "ucast_solicit",
			.maxlen		= sizeof(int),
			.mode		= 0644,
			.proc_handler	= &proc_dointvec,
		},
		{
			.ctl_name	= NET_NEIGH_APP_SOLICIT,
			.procname	= "app_solicit",
			.maxlen		= sizeof(int),
			.mode		= 0644,
			.proc_handler	= &proc_dointvec,
		},
		{
			.ctl_name	= NET_NEIGH_RETRANS_TIME,
			.procname	= "retrans_time",
			.maxlen		= sizeof(int),
			.mode		= 0644,
			.proc_handler	= &proc_dointvec_userhz_jiffies,
		},
		{
			.ctl_name	= NET_NEIGH_REACHABLE_TIME,
			.procname	= "base_reachable_time",
			.maxlen		= sizeof(int),
			.mode		= 0644,
			.proc_handler	= &proc_dointvec_jiffies,
			.strategy	= &sysctl_jiffies,
		},
		{
			.ctl_name	= NET_NEIGH_DELAY_PROBE_TIME,
			.procname	= "delay_first_probe_time",
			.maxlen		= sizeof(int),
			.mode		= 0644,
			.proc_handler	= &proc_dointvec_jiffies,
			.strategy	= &sysctl_jiffies,
		},
		{
			.ctl_name	= NET_NEIGH_GC_STALE_TIME,
			.procname	= "gc_stale_time",
			.maxlen		= sizeof(int),
			.mode		= 0644,
			.proc_handler	= &proc_dointvec_jiffies,
			.strategy	= &sysctl_jiffies,
		},
		{
			.ctl_name	= NET_NEIGH_UNRES_QLEN,
			.procname	= "unres_qlen",
			.maxlen		= sizeof(int),
			.mode		= 0644,
			.proc_handler	= &proc_dointvec,
		},
		{
			.ctl_name	= NET_NEIGH_PROXY_QLEN,
			.procname	= "proxy_qlen",
			.maxlen		= sizeof(int),
			.mode		= 0644,
			.proc_handler	= &proc_dointvec,
		},
		{
			.ctl_name	= NET_NEIGH_ANYCAST_DELAY,
			.procname	= "anycast_delay",
			.maxlen		= sizeof(int),
			.mode		= 0644,
			.proc_handler	= &proc_dointvec_userhz_jiffies,
		},
		{
			.ctl_name	= NET_NEIGH_PROXY_DELAY,
			.procname	= "proxy_delay",
			.maxlen		= sizeof(int),
			.mode		= 0644,
			.proc_handler	= &proc_dointvec_userhz_jiffies,
		},
		{
			.ctl_name	= NET_NEIGH_LOCKTIME,
			.procname	= "locktime",
			.maxlen		= sizeof(int),
			.mode		= 0644,
			.proc_handler	= &proc_dointvec_userhz_jiffies,
		},
		{
			.ctl_name	= NET_NEIGH_GC_INTERVAL,
			.procname	= "gc_interval",
			.maxlen		= sizeof(int),
			.mode		= 0644,
			.proc_handler	= &proc_dointvec_jiffies,
			.strategy	= &sysctl_jiffies,
		},
		{
			.ctl_name	= NET_NEIGH_GC_THRESH1,
			.procname	= "gc_thresh1",
			.maxlen		= sizeof(int),
			.mode		= 0644,
			.proc_handler	= &proc_dointvec,
		},
		{
			.ctl_name	= NET_NEIGH_GC_THRESH2,
			.procname	= "gc_thresh2",
			.maxlen		= sizeof(int),
			.mode		= 0644,
			.proc_handler	= &proc_dointvec,
		},
		{
			.ctl_name	= NET_NEIGH_GC_THRESH3,
			.procname	= "gc_thresh3",
			.maxlen		= sizeof(int),
			.mode		= 0644,
			.proc_handler	= &proc_dointvec,
		},
		{
			.ctl_name	= NET_NEIGH_RETRANS_TIME_MS,
			.procname	= "retrans_time_ms",
			.maxlen		= sizeof(int),
			.mode		= 0644,
			.proc_handler	= &proc_dointvec_ms_jiffies,
			.strategy	= &sysctl_ms_jiffies,
		},
		{
			.ctl_name	= NET_NEIGH_REACHABLE_TIME_MS,
			.procname	= "base_reachable_time_ms",
			.maxlen		= sizeof(int),
			.mode		= 0644,
			.proc_handler	= &proc_dointvec_ms_jiffies,
			.strategy	= &sysctl_ms_jiffies,
		},
	},
	.neigh_dev = {
		{
			.ctl_name	= NET_PROTO_CONF_DEFAULT,
			.procname	= "default",
			.mode		= 0555,
		},
	},
	.neigh_neigh_dir = {
		{
			.procname	= "neigh",
			.mode		= 0555,
		},
	},
	.neigh_proto_dir = {
		{
			.mode		= 0555,
		},
	},
	.neigh_root_dir = {
		{
			.ctl_name	= CTL_NET,
			.procname	= "net",
			.mode		= 0555,
		},
	},
};

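/*
 * Clone the template and point each entry's .data at the matching
 * field of @p.  neigh_vars[0..11] are per-parms; [12..15]
 * (gc_interval, gc_thresh1..3) are table-wide and therefore hidden
 * in per-device directories; [16..17] are the millisecond views of
 * retrans_time and base_reachable_time.
 */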
int neigh_sysctl_register(struct net_device *dev, struct neigh_parms *p,
			  int p_id, int pdev_id, char *p_name,
			  proc_handler *handler, ctl_handler *strategy)
{
	struct neigh_sysctl_table *t = kmemdup(&neigh_sysctl_template,
					       sizeof(*t), GFP_KERNEL);
	const char *dev_name_source = NULL;
	char *dev_name = NULL;
	int err = 0;

	if (!t)
		return -ENOBUFS;
	t->neigh_vars[0].data  = &p->mcast_probes;
	t->neigh_vars[1].data  = &p->ucast_probes;
	t->neigh_vars[2].data  = &p->app_probes;
	t->neigh_vars[3].data  = &p->retrans_time;
	t->neigh_vars[4].data  = &p->base_reachable_time;
	t->neigh_vars[5].data  = &p->delay_probe_time;
	t->neigh_vars[6].data  = &p->gc_staletime;
	t->neigh_vars[7].data  = &p->queue_len;
	t->neigh_vars[8].data  = &p->proxy_qlen;
	t->neigh_vars[9].data  = &p->anycast_delay;
	t->neigh_vars[10].data = &p->proxy_delay;
	t->neigh_vars[11].data = &p->locktime;

	if (dev) {
		dev_name_source = dev->name;
		t->neigh_dev[0].ctl_name = dev->ifindex;
		t->neigh_vars[12].procname = NULL;
		t->neigh_vars[13].procname = NULL;
		t->neigh_vars[14].procname = NULL;
		t->neigh_vars[15].procname = NULL;
	} else {
		dev_name_source = t->neigh_dev[0].procname;
		t->neigh_vars[12].data = (int *)(p + 1);
		t->neigh_vars[13].data = (int *)(p + 1) + 1;
		t->neigh_vars[14].data = (int *)(p + 1) + 2;
		t->neigh_vars[15].data = (int *)(p + 1) + 3;
	}

	t->neigh_vars[16].data = &p->retrans_time;
	t->neigh_vars[17].data = &p->base_reachable_time;

	if (handler || strategy) {
		/* RetransTime */
		t->neigh_vars[3].proc_handler = handler;
		t->neigh_vars[3].strategy = strategy;
		t->neigh_vars[3].extra1 = dev;
		/* ReachableTime */
		t->neigh_vars[4].proc_handler = handler;
		t->neigh_vars[4].strategy = strategy;
		t->neigh_vars[4].extra1 = dev;
		/* RetransTime (in milliseconds) */
		t->neigh_vars[16].proc_handler = handler;
		t->neigh_vars[16].strategy = strategy;
		t->neigh_vars[16].extra1 = dev;
		/* ReachableTime (in milliseconds) */
		t->neigh_vars[17].proc_handler = handler;
		t->neigh_vars[17].strategy = strategy;
		t->neigh_vars[17].extra1 = dev;
	}

	dev_name = kstrdup(dev_name_source, GFP_KERNEL);
	if (!dev_name) {
		err = -ENOBUFS;
		goto free;
	}

	t->neigh_dev[0].procname = dev_name;

	t->neigh_neigh_dir[0].ctl_name = pdev_id;

	t->neigh_proto_dir[0].procname = p_name;
	t->neigh_proto_dir[0].ctl_name = p_id;

	t->neigh_dev[0].child	    = t->neigh_vars;
	t->neigh_neigh_dir[0].child = t->neigh_dev;
	t->neigh_proto_dir[0].child = t->neigh_neigh_dir;
	t->neigh_root_dir[0].child  = t->neigh_proto_dir;

	t->sysctl_header = register_sysctl_table(t->neigh_root_dir);
	if (!t->sysctl_header) {
		err = -ENOBUFS;
		goto free_procname;
	}
	p->sysctl_table = t;
	return 0;

	/* error path */
free_procname:
	kfree(dev_name);
free:
	kfree(t);

	return err;
}

void neigh_sysctl_unregister(struct neigh_parms *p)
{
	if (p->sysctl_table) {
		struct neigh_sysctl_table *t = p->sysctl_table;
		p->sysctl_table = NULL;
		unregister_sysctl_table(t->sysctl_header);
		kfree(t->neigh_dev[0].procname);
		kfree(t);
	}
}

#endif /* CONFIG_SYSCTL */

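/*
 * Wire the generic neighbour code into rtnetlink: add/delete/dump of
 * individual entries, plus dump and tuning of whole tables via the
 * RTM_*NEIGHTBL messages.
 */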
static int __init neigh_init(void)
{
	rtnl_register(PF_UNSPEC, RTM_NEWNEIGH, neigh_add, NULL);
	rtnl_register(PF_UNSPEC, RTM_DELNEIGH, neigh_delete, NULL);
	rtnl_register(PF_UNSPEC, RTM_GETNEIGH, NULL, neigh_dump_info);

	rtnl_register(PF_UNSPEC, RTM_GETNEIGHTBL, NULL, neightbl_dump_info);
	rtnl_register(PF_UNSPEC, RTM_SETNEIGHTBL, neightbl_set, NULL);

	return 0;
}

subsys_initcall(neigh_init);

EXPORT_SYMBOL(__neigh_event_send);
EXPORT_SYMBOL(neigh_changeaddr);
EXPORT_SYMBOL(neigh_compat_output);
EXPORT_SYMBOL(neigh_connected_output);
EXPORT_SYMBOL(neigh_create);
EXPORT_SYMBOL(neigh_destroy);
EXPORT_SYMBOL(neigh_event_ns);
EXPORT_SYMBOL(neigh_ifdown);
EXPORT_SYMBOL(neigh_lookup);
EXPORT_SYMBOL(neigh_lookup_nodev);
EXPORT_SYMBOL(neigh_parms_alloc);
EXPORT_SYMBOL(neigh_parms_release);
EXPORT_SYMBOL(neigh_rand_reach_time);
EXPORT_SYMBOL(neigh_resolve_output);
EXPORT_SYMBOL(neigh_table_clear);
EXPORT_SYMBOL(neigh_table_init);
EXPORT_SYMBOL(neigh_table_init_no_netlink);
EXPORT_SYMBOL(neigh_update);
EXPORT_SYMBOL(pneigh_enqueue);
EXPORT_SYMBOL(pneigh_lookup);

#ifdef CONFIG_ARPD
EXPORT_SYMBOL(neigh_app_ns);
#endif
#ifdef CONFIG_SYSCTL
EXPORT_SYMBOL(neigh_sysctl_register);
EXPORT_SYMBOL(neigh_sysctl_unregister);
#endif