[PATCH] x86_64: Reename CMOS update warning
[linux-2.6/linux-2.6-openrd.git] / net / core / neighbour.c
blob0c8666872d10fdf0d90fea6b327952c6f6493051
1 /*
2 * Generic address resolution entity
4 * Authors:
5 * Pedro Roque <roque@di.fc.ul.pt>
6 * Alexey Kuznetsov <kuznet@ms2.inr.ac.ru>
8 * This program is free software; you can redistribute it and/or
9 * modify it under the terms of the GNU General Public License
10 * as published by the Free Software Foundation; either version
11 * 2 of the License, or (at your option) any later version.
13 * Fixes:
14 * Vitaly E. Lavrov releasing NULL neighbor in neigh_add.
15 * Harald Welte Add neighbour cache statistics like rtstat
18 #include <linux/config.h>
19 #include <linux/types.h>
20 #include <linux/kernel.h>
21 #include <linux/module.h>
22 #include <linux/socket.h>
23 #include <linux/sched.h>
24 #include <linux/netdevice.h>
25 #include <linux/proc_fs.h>
26 #ifdef CONFIG_SYSCTL
27 #include <linux/sysctl.h>
28 #endif
29 #include <linux/times.h>
30 #include <net/neighbour.h>
31 #include <net/dst.h>
32 #include <net/sock.h>
33 #include <linux/rtnetlink.h>
34 #include <linux/random.h>
35 #include <linux/string.h>
37 #define NEIGH_DEBUG 1
39 #define NEIGH_PRINTK(x...) printk(x)
40 #define NEIGH_NOPRINTK(x...) do { ; } while(0)
41 #define NEIGH_PRINTK0 NEIGH_PRINTK
42 #define NEIGH_PRINTK1 NEIGH_NOPRINTK
43 #define NEIGH_PRINTK2 NEIGH_NOPRINTK
45 #if NEIGH_DEBUG >= 1
46 #undef NEIGH_PRINTK1
47 #define NEIGH_PRINTK1 NEIGH_PRINTK
48 #endif
49 #if NEIGH_DEBUG >= 2
50 #undef NEIGH_PRINTK2
51 #define NEIGH_PRINTK2 NEIGH_PRINTK
52 #endif
54 #define PNEIGH_HASHMASK 0xF
56 static void neigh_timer_handler(unsigned long arg);
57 #ifdef CONFIG_ARPD
58 static void neigh_app_notify(struct neighbour *n);
59 #endif
60 static int pneigh_ifdown(struct neigh_table *tbl, struct net_device *dev);
61 void neigh_changeaddr(struct neigh_table *tbl, struct net_device *dev);
63 static struct neigh_table *neigh_tables;
64 #ifdef CONFIG_PROC_FS
65 static struct file_operations neigh_stat_seq_fops;
66 #endif
69 Neighbour hash table buckets are protected with rwlock tbl->lock.
71 - All the scans/updates to hash buckets MUST be made under this lock.
72 - NOTHING clever should be made under this lock: no callbacks
73 to protocol backends, no attempts to send something to network.
74 It will result in deadlocks, if backend/driver wants to use neighbour
75 cache.
76 - If the entry requires some non-trivial actions, increase
77 its reference count and release table lock.
79 Neighbour entries are protected:
80 - with reference count.
81 - with rwlock neigh->lock
83 Reference count prevents destruction.
85 neigh->lock mainly serializes ll address data and its validity state.
86 However, the same lock is used to protect another entry fields:
87 - timer
88 - resolution queue
90 Again, nothing clever shall be made under neigh->lock,
91 the most complicated procedure, which we allow is dev->hard_header.
92 It is supposed, that dev->hard_header is simplistic and does
93 not make callbacks to neighbour tables.
95 The last lock is neigh_tbl_lock. It is pure SMP lock, protecting
96 list of neighbour tables. This list is used only in process context,
99 static DEFINE_RWLOCK(neigh_tbl_lock);
101 static int neigh_blackhole(struct sk_buff *skb)
103 kfree_skb(skb);
104 return -ENETDOWN;
108 * It is random distribution in the interval (1/2)*base...(3/2)*base.
109 * It corresponds to default IPv6 settings and is not overridable,
110 * because it is really reasonable choice.
113 unsigned long neigh_rand_reach_time(unsigned long base)
115 return (base ? (net_random() % base) + (base >> 1) : 0);
119 static int neigh_forced_gc(struct neigh_table *tbl)
121 int shrunk = 0;
122 int i;
124 NEIGH_CACHE_STAT_INC(tbl, forced_gc_runs);
126 write_lock_bh(&tbl->lock);
127 for (i = 0; i <= tbl->hash_mask; i++) {
128 struct neighbour *n, **np;
130 np = &tbl->hash_buckets[i];
131 while ((n = *np) != NULL) {
132 /* Neighbour record may be discarded if:
133 * - nobody refers to it.
134 * - it is not permanent
136 write_lock(&n->lock);
137 if (atomic_read(&n->refcnt) == 1 &&
138 !(n->nud_state & NUD_PERMANENT)) {
139 *np = n->next;
140 n->dead = 1;
141 shrunk = 1;
142 write_unlock(&n->lock);
143 neigh_release(n);
144 continue;
146 write_unlock(&n->lock);
147 np = &n->next;
151 tbl->last_flush = jiffies;
153 write_unlock_bh(&tbl->lock);
155 return shrunk;
158 static int neigh_del_timer(struct neighbour *n)
160 if ((n->nud_state & NUD_IN_TIMER) &&
161 del_timer(&n->timer)) {
162 neigh_release(n);
163 return 1;
165 return 0;
168 static void pneigh_queue_purge(struct sk_buff_head *list)
170 struct sk_buff *skb;
172 while ((skb = skb_dequeue(list)) != NULL) {
173 dev_put(skb->dev);
174 kfree_skb(skb);
178 static void neigh_flush_dev(struct neigh_table *tbl, struct net_device *dev)
180 int i;
182 for (i = 0; i <= tbl->hash_mask; i++) {
183 struct neighbour *n, **np = &tbl->hash_buckets[i];
185 while ((n = *np) != NULL) {
186 if (dev && n->dev != dev) {
187 np = &n->next;
188 continue;
190 *np = n->next;
191 write_lock(&n->lock);
192 neigh_del_timer(n);
193 n->dead = 1;
195 if (atomic_read(&n->refcnt) != 1) {
196 /* The most unpleasant situation.
197 We must destroy neighbour entry,
198 but someone still uses it.
200 The destroy will be delayed until
201 the last user releases us, but
202 we must kill timers etc. and move
203 it to safe state.
205 skb_queue_purge(&n->arp_queue);
206 n->output = neigh_blackhole;
207 if (n->nud_state & NUD_VALID)
208 n->nud_state = NUD_NOARP;
209 else
210 n->nud_state = NUD_NONE;
211 NEIGH_PRINTK2("neigh %p is stray.\n", n);
213 write_unlock(&n->lock);
214 neigh_release(n);
219 void neigh_changeaddr(struct neigh_table *tbl, struct net_device *dev)
221 write_lock_bh(&tbl->lock);
222 neigh_flush_dev(tbl, dev);
223 write_unlock_bh(&tbl->lock);
226 int neigh_ifdown(struct neigh_table *tbl, struct net_device *dev)
228 write_lock_bh(&tbl->lock);
229 neigh_flush_dev(tbl, dev);
230 pneigh_ifdown(tbl, dev);
231 write_unlock_bh(&tbl->lock);
233 del_timer_sync(&tbl->proxy_timer);
234 pneigh_queue_purge(&tbl->proxy_queue);
235 return 0;
238 static struct neighbour *neigh_alloc(struct neigh_table *tbl)
240 struct neighbour *n = NULL;
241 unsigned long now = jiffies;
242 int entries;
244 entries = atomic_inc_return(&tbl->entries) - 1;
245 if (entries >= tbl->gc_thresh3 ||
246 (entries >= tbl->gc_thresh2 &&
247 time_after(now, tbl->last_flush + 5 * HZ))) {
248 if (!neigh_forced_gc(tbl) &&
249 entries >= tbl->gc_thresh3)
250 goto out_entries;
253 n = kmem_cache_alloc(tbl->kmem_cachep, SLAB_ATOMIC);
254 if (!n)
255 goto out_entries;
257 memset(n, 0, tbl->entry_size);
259 skb_queue_head_init(&n->arp_queue);
260 rwlock_init(&n->lock);
261 n->updated = n->used = now;
262 n->nud_state = NUD_NONE;
263 n->output = neigh_blackhole;
264 n->parms = neigh_parms_clone(&tbl->parms);
265 init_timer(&n->timer);
266 n->timer.function = neigh_timer_handler;
267 n->timer.data = (unsigned long)n;
269 NEIGH_CACHE_STAT_INC(tbl, allocs);
270 n->tbl = tbl;
271 atomic_set(&n->refcnt, 1);
272 n->dead = 1;
273 out:
274 return n;
276 out_entries:
277 atomic_dec(&tbl->entries);
278 goto out;
281 static struct neighbour **neigh_hash_alloc(unsigned int entries)
283 unsigned long size = entries * sizeof(struct neighbour *);
284 struct neighbour **ret;
286 if (size <= PAGE_SIZE) {
287 ret = kmalloc(size, GFP_ATOMIC);
288 } else {
289 ret = (struct neighbour **)
290 __get_free_pages(GFP_ATOMIC, get_order(size));
292 if (ret)
293 memset(ret, 0, size);
295 return ret;
298 static void neigh_hash_free(struct neighbour **hash, unsigned int entries)
300 unsigned long size = entries * sizeof(struct neighbour *);
302 if (size <= PAGE_SIZE)
303 kfree(hash);
304 else
305 free_pages((unsigned long)hash, get_order(size));
308 static void neigh_hash_grow(struct neigh_table *tbl, unsigned long new_entries)
310 struct neighbour **new_hash, **old_hash;
311 unsigned int i, new_hash_mask, old_entries;
313 NEIGH_CACHE_STAT_INC(tbl, hash_grows);
315 BUG_ON(new_entries & (new_entries - 1));
316 new_hash = neigh_hash_alloc(new_entries);
317 if (!new_hash)
318 return;
320 old_entries = tbl->hash_mask + 1;
321 new_hash_mask = new_entries - 1;
322 old_hash = tbl->hash_buckets;
324 get_random_bytes(&tbl->hash_rnd, sizeof(tbl->hash_rnd));
325 for (i = 0; i < old_entries; i++) {
326 struct neighbour *n, *next;
328 for (n = old_hash[i]; n; n = next) {
329 unsigned int hash_val = tbl->hash(n->primary_key, n->dev);
331 hash_val &= new_hash_mask;
332 next = n->next;
334 n->next = new_hash[hash_val];
335 new_hash[hash_val] = n;
338 tbl->hash_buckets = new_hash;
339 tbl->hash_mask = new_hash_mask;
341 neigh_hash_free(old_hash, old_entries);
344 struct neighbour *neigh_lookup(struct neigh_table *tbl, const void *pkey,
345 struct net_device *dev)
347 struct neighbour *n;
348 int key_len = tbl->key_len;
349 u32 hash_val = tbl->hash(pkey, dev) & tbl->hash_mask;
351 NEIGH_CACHE_STAT_INC(tbl, lookups);
353 read_lock_bh(&tbl->lock);
354 for (n = tbl->hash_buckets[hash_val]; n; n = n->next) {
355 if (dev == n->dev && !memcmp(n->primary_key, pkey, key_len)) {
356 neigh_hold(n);
357 NEIGH_CACHE_STAT_INC(tbl, hits);
358 break;
361 read_unlock_bh(&tbl->lock);
362 return n;
365 struct neighbour *neigh_lookup_nodev(struct neigh_table *tbl, const void *pkey)
367 struct neighbour *n;
368 int key_len = tbl->key_len;
369 u32 hash_val = tbl->hash(pkey, NULL) & tbl->hash_mask;
371 NEIGH_CACHE_STAT_INC(tbl, lookups);
373 read_lock_bh(&tbl->lock);
374 for (n = tbl->hash_buckets[hash_val]; n; n = n->next) {
375 if (!memcmp(n->primary_key, pkey, key_len)) {
376 neigh_hold(n);
377 NEIGH_CACHE_STAT_INC(tbl, hits);
378 break;
381 read_unlock_bh(&tbl->lock);
382 return n;
385 struct neighbour *neigh_create(struct neigh_table *tbl, const void *pkey,
386 struct net_device *dev)
388 u32 hash_val;
389 int key_len = tbl->key_len;
390 int error;
391 struct neighbour *n1, *rc, *n = neigh_alloc(tbl);
393 if (!n) {
394 rc = ERR_PTR(-ENOBUFS);
395 goto out;
398 memcpy(n->primary_key, pkey, key_len);
399 n->dev = dev;
400 dev_hold(dev);
402 /* Protocol specific setup. */
403 if (tbl->constructor && (error = tbl->constructor(n)) < 0) {
404 rc = ERR_PTR(error);
405 goto out_neigh_release;
408 /* Device specific setup. */
409 if (n->parms->neigh_setup &&
410 (error = n->parms->neigh_setup(n)) < 0) {
411 rc = ERR_PTR(error);
412 goto out_neigh_release;
415 n->confirmed = jiffies - (n->parms->base_reachable_time << 1);
417 write_lock_bh(&tbl->lock);
419 if (atomic_read(&tbl->entries) > (tbl->hash_mask + 1))
420 neigh_hash_grow(tbl, (tbl->hash_mask + 1) << 1);
422 hash_val = tbl->hash(pkey, dev) & tbl->hash_mask;
424 if (n->parms->dead) {
425 rc = ERR_PTR(-EINVAL);
426 goto out_tbl_unlock;
429 for (n1 = tbl->hash_buckets[hash_val]; n1; n1 = n1->next) {
430 if (dev == n1->dev && !memcmp(n1->primary_key, pkey, key_len)) {
431 neigh_hold(n1);
432 rc = n1;
433 goto out_tbl_unlock;
437 n->next = tbl->hash_buckets[hash_val];
438 tbl->hash_buckets[hash_val] = n;
439 n->dead = 0;
440 neigh_hold(n);
441 write_unlock_bh(&tbl->lock);
442 NEIGH_PRINTK2("neigh %p is created.\n", n);
443 rc = n;
444 out:
445 return rc;
446 out_tbl_unlock:
447 write_unlock_bh(&tbl->lock);
448 out_neigh_release:
449 neigh_release(n);
450 goto out;
453 struct pneigh_entry * pneigh_lookup(struct neigh_table *tbl, const void *pkey,
454 struct net_device *dev, int creat)
456 struct pneigh_entry *n;
457 int key_len = tbl->key_len;
458 u32 hash_val = *(u32 *)(pkey + key_len - 4);
460 hash_val ^= (hash_val >> 16);
461 hash_val ^= hash_val >> 8;
462 hash_val ^= hash_val >> 4;
463 hash_val &= PNEIGH_HASHMASK;
465 read_lock_bh(&tbl->lock);
467 for (n = tbl->phash_buckets[hash_val]; n; n = n->next) {
468 if (!memcmp(n->key, pkey, key_len) &&
469 (n->dev == dev || !n->dev)) {
470 read_unlock_bh(&tbl->lock);
471 goto out;
474 read_unlock_bh(&tbl->lock);
475 n = NULL;
476 if (!creat)
477 goto out;
479 n = kmalloc(sizeof(*n) + key_len, GFP_KERNEL);
480 if (!n)
481 goto out;
483 memcpy(n->key, pkey, key_len);
484 n->dev = dev;
485 if (dev)
486 dev_hold(dev);
488 if (tbl->pconstructor && tbl->pconstructor(n)) {
489 if (dev)
490 dev_put(dev);
491 kfree(n);
492 n = NULL;
493 goto out;
496 write_lock_bh(&tbl->lock);
497 n->next = tbl->phash_buckets[hash_val];
498 tbl->phash_buckets[hash_val] = n;
499 write_unlock_bh(&tbl->lock);
500 out:
501 return n;
505 int pneigh_delete(struct neigh_table *tbl, const void *pkey,
506 struct net_device *dev)
508 struct pneigh_entry *n, **np;
509 int key_len = tbl->key_len;
510 u32 hash_val = *(u32 *)(pkey + key_len - 4);
512 hash_val ^= (hash_val >> 16);
513 hash_val ^= hash_val >> 8;
514 hash_val ^= hash_val >> 4;
515 hash_val &= PNEIGH_HASHMASK;
517 write_lock_bh(&tbl->lock);
518 for (np = &tbl->phash_buckets[hash_val]; (n = *np) != NULL;
519 np = &n->next) {
520 if (!memcmp(n->key, pkey, key_len) && n->dev == dev) {
521 *np = n->next;
522 write_unlock_bh(&tbl->lock);
523 if (tbl->pdestructor)
524 tbl->pdestructor(n);
525 if (n->dev)
526 dev_put(n->dev);
527 kfree(n);
528 return 0;
531 write_unlock_bh(&tbl->lock);
532 return -ENOENT;
535 static int pneigh_ifdown(struct neigh_table *tbl, struct net_device *dev)
537 struct pneigh_entry *n, **np;
538 u32 h;
540 for (h = 0; h <= PNEIGH_HASHMASK; h++) {
541 np = &tbl->phash_buckets[h];
542 while ((n = *np) != NULL) {
543 if (!dev || n->dev == dev) {
544 *np = n->next;
545 if (tbl->pdestructor)
546 tbl->pdestructor(n);
547 if (n->dev)
548 dev_put(n->dev);
549 kfree(n);
550 continue;
552 np = &n->next;
555 return -ENOENT;
560 * neighbour must already be out of the table;
563 void neigh_destroy(struct neighbour *neigh)
565 struct hh_cache *hh;
567 NEIGH_CACHE_STAT_INC(neigh->tbl, destroys);
569 if (!neigh->dead) {
570 printk(KERN_WARNING
571 "Destroying alive neighbour %p\n", neigh);
572 dump_stack();
573 return;
576 if (neigh_del_timer(neigh))
577 printk(KERN_WARNING "Impossible event.\n");
579 while ((hh = neigh->hh) != NULL) {
580 neigh->hh = hh->hh_next;
581 hh->hh_next = NULL;
582 write_lock_bh(&hh->hh_lock);
583 hh->hh_output = neigh_blackhole;
584 write_unlock_bh(&hh->hh_lock);
585 if (atomic_dec_and_test(&hh->hh_refcnt))
586 kfree(hh);
589 if (neigh->parms->neigh_destructor)
590 (neigh->parms->neigh_destructor)(neigh);
592 skb_queue_purge(&neigh->arp_queue);
594 dev_put(neigh->dev);
595 neigh_parms_put(neigh->parms);
597 NEIGH_PRINTK2("neigh %p is destroyed.\n", neigh);
599 atomic_dec(&neigh->tbl->entries);
600 kmem_cache_free(neigh->tbl->kmem_cachep, neigh);
603 /* Neighbour state is suspicious;
604 disable fast path.
606 Called with write_locked neigh.
608 static void neigh_suspect(struct neighbour *neigh)
610 struct hh_cache *hh;
612 NEIGH_PRINTK2("neigh %p is suspected.\n", neigh);
614 neigh->output = neigh->ops->output;
616 for (hh = neigh->hh; hh; hh = hh->hh_next)
617 hh->hh_output = neigh->ops->output;
620 /* Neighbour state is OK;
621 enable fast path.
623 Called with write_locked neigh.
625 static void neigh_connect(struct neighbour *neigh)
627 struct hh_cache *hh;
629 NEIGH_PRINTK2("neigh %p is connected.\n", neigh);
631 neigh->output = neigh->ops->connected_output;
633 for (hh = neigh->hh; hh; hh = hh->hh_next)
634 hh->hh_output = neigh->ops->hh_output;
637 static void neigh_periodic_timer(unsigned long arg)
639 struct neigh_table *tbl = (struct neigh_table *)arg;
640 struct neighbour *n, **np;
641 unsigned long expire, now = jiffies;
643 NEIGH_CACHE_STAT_INC(tbl, periodic_gc_runs);
645 write_lock(&tbl->lock);
648 * periodically recompute ReachableTime from random function
651 if (time_after(now, tbl->last_rand + 300 * HZ)) {
652 struct neigh_parms *p;
653 tbl->last_rand = now;
654 for (p = &tbl->parms; p; p = p->next)
655 p->reachable_time =
656 neigh_rand_reach_time(p->base_reachable_time);
659 np = &tbl->hash_buckets[tbl->hash_chain_gc];
660 tbl->hash_chain_gc = ((tbl->hash_chain_gc + 1) & tbl->hash_mask);
662 while ((n = *np) != NULL) {
663 unsigned int state;
665 write_lock(&n->lock);
667 state = n->nud_state;
668 if (state & (NUD_PERMANENT | NUD_IN_TIMER)) {
669 write_unlock(&n->lock);
670 goto next_elt;
673 if (time_before(n->used, n->confirmed))
674 n->used = n->confirmed;
676 if (atomic_read(&n->refcnt) == 1 &&
677 (state == NUD_FAILED ||
678 time_after(now, n->used + n->parms->gc_staletime))) {
679 *np = n->next;
680 n->dead = 1;
681 write_unlock(&n->lock);
682 neigh_release(n);
683 continue;
685 write_unlock(&n->lock);
687 next_elt:
688 np = &n->next;
691 /* Cycle through all hash buckets every base_reachable_time/2 ticks.
692 * ARP entry timeouts range from 1/2 base_reachable_time to 3/2
693 * base_reachable_time.
695 expire = tbl->parms.base_reachable_time >> 1;
696 expire /= (tbl->hash_mask + 1);
697 if (!expire)
698 expire = 1;
700 mod_timer(&tbl->gc_timer, now + expire);
702 write_unlock(&tbl->lock);
705 static __inline__ int neigh_max_probes(struct neighbour *n)
707 struct neigh_parms *p = n->parms;
708 return (n->nud_state & NUD_PROBE ?
709 p->ucast_probes :
710 p->ucast_probes + p->app_probes + p->mcast_probes);
713 static inline void neigh_add_timer(struct neighbour *n, unsigned long when)
715 if (unlikely(mod_timer(&n->timer, when))) {
716 printk("NEIGH: BUG, double timer add, state is %x\n",
717 n->nud_state);
718 dump_stack();
722 /* Called when a timer expires for a neighbour entry. */
724 static void neigh_timer_handler(unsigned long arg)
726 unsigned long now, next;
727 struct neighbour *neigh = (struct neighbour *)arg;
728 unsigned state;
729 int notify = 0;
731 write_lock(&neigh->lock);
733 state = neigh->nud_state;
734 now = jiffies;
735 next = now + HZ;
737 if (!(state & NUD_IN_TIMER)) {
738 #ifndef CONFIG_SMP
739 printk(KERN_WARNING "neigh: timer & !nud_in_timer\n");
740 #endif
741 goto out;
744 if (state & NUD_REACHABLE) {
745 if (time_before_eq(now,
746 neigh->confirmed + neigh->parms->reachable_time)) {
747 NEIGH_PRINTK2("neigh %p is still alive.\n", neigh);
748 next = neigh->confirmed + neigh->parms->reachable_time;
749 } else if (time_before_eq(now,
750 neigh->used + neigh->parms->delay_probe_time)) {
751 NEIGH_PRINTK2("neigh %p is delayed.\n", neigh);
752 neigh->nud_state = NUD_DELAY;
753 neigh->updated = jiffies;
754 neigh_suspect(neigh);
755 next = now + neigh->parms->delay_probe_time;
756 } else {
757 NEIGH_PRINTK2("neigh %p is suspected.\n", neigh);
758 neigh->nud_state = NUD_STALE;
759 neigh->updated = jiffies;
760 neigh_suspect(neigh);
762 } else if (state & NUD_DELAY) {
763 if (time_before_eq(now,
764 neigh->confirmed + neigh->parms->delay_probe_time)) {
765 NEIGH_PRINTK2("neigh %p is now reachable.\n", neigh);
766 neigh->nud_state = NUD_REACHABLE;
767 neigh->updated = jiffies;
768 neigh_connect(neigh);
769 next = neigh->confirmed + neigh->parms->reachable_time;
770 } else {
771 NEIGH_PRINTK2("neigh %p is probed.\n", neigh);
772 neigh->nud_state = NUD_PROBE;
773 neigh->updated = jiffies;
774 atomic_set(&neigh->probes, 0);
775 next = now + neigh->parms->retrans_time;
777 } else {
778 /* NUD_PROBE|NUD_INCOMPLETE */
779 next = now + neigh->parms->retrans_time;
782 if ((neigh->nud_state & (NUD_INCOMPLETE | NUD_PROBE)) &&
783 atomic_read(&neigh->probes) >= neigh_max_probes(neigh)) {
784 struct sk_buff *skb;
786 neigh->nud_state = NUD_FAILED;
787 neigh->updated = jiffies;
788 notify = 1;
789 NEIGH_CACHE_STAT_INC(neigh->tbl, res_failed);
790 NEIGH_PRINTK2("neigh %p is failed.\n", neigh);
792 /* It is very thin place. report_unreachable is very complicated
793 routine. Particularly, it can hit the same neighbour entry!
795 So that, we try to be accurate and avoid dead loop. --ANK
797 while (neigh->nud_state == NUD_FAILED &&
798 (skb = __skb_dequeue(&neigh->arp_queue)) != NULL) {
799 write_unlock(&neigh->lock);
800 neigh->ops->error_report(neigh, skb);
801 write_lock(&neigh->lock);
803 skb_queue_purge(&neigh->arp_queue);
806 if (neigh->nud_state & NUD_IN_TIMER) {
807 if (time_before(next, jiffies + HZ/2))
808 next = jiffies + HZ/2;
809 if (!mod_timer(&neigh->timer, next))
810 neigh_hold(neigh);
812 if (neigh->nud_state & (NUD_INCOMPLETE | NUD_PROBE)) {
813 struct sk_buff *skb = skb_peek(&neigh->arp_queue);
814 /* keep skb alive even if arp_queue overflows */
815 if (skb)
816 skb_get(skb);
817 write_unlock(&neigh->lock);
818 neigh->ops->solicit(neigh, skb);
819 atomic_inc(&neigh->probes);
820 if (skb)
821 kfree_skb(skb);
822 } else {
823 out:
824 write_unlock(&neigh->lock);
827 #ifdef CONFIG_ARPD
828 if (notify && neigh->parms->app_probes)
829 neigh_app_notify(neigh);
830 #endif
831 neigh_release(neigh);
834 int __neigh_event_send(struct neighbour *neigh, struct sk_buff *skb)
836 int rc;
837 unsigned long now;
839 write_lock_bh(&neigh->lock);
841 rc = 0;
842 if (neigh->nud_state & (NUD_CONNECTED | NUD_DELAY | NUD_PROBE))
843 goto out_unlock_bh;
845 now = jiffies;
847 if (!(neigh->nud_state & (NUD_STALE | NUD_INCOMPLETE))) {
848 if (neigh->parms->mcast_probes + neigh->parms->app_probes) {
849 atomic_set(&neigh->probes, neigh->parms->ucast_probes);
850 neigh->nud_state = NUD_INCOMPLETE;
851 neigh->updated = jiffies;
852 neigh_hold(neigh);
853 neigh_add_timer(neigh, now + 1);
854 } else {
855 neigh->nud_state = NUD_FAILED;
856 neigh->updated = jiffies;
857 write_unlock_bh(&neigh->lock);
859 if (skb)
860 kfree_skb(skb);
861 return 1;
863 } else if (neigh->nud_state & NUD_STALE) {
864 NEIGH_PRINTK2("neigh %p is delayed.\n", neigh);
865 neigh_hold(neigh);
866 neigh->nud_state = NUD_DELAY;
867 neigh->updated = jiffies;
868 neigh_add_timer(neigh,
869 jiffies + neigh->parms->delay_probe_time);
872 if (neigh->nud_state == NUD_INCOMPLETE) {
873 if (skb) {
874 if (skb_queue_len(&neigh->arp_queue) >=
875 neigh->parms->queue_len) {
876 struct sk_buff *buff;
877 buff = neigh->arp_queue.next;
878 __skb_unlink(buff, &neigh->arp_queue);
879 kfree_skb(buff);
881 __skb_queue_tail(&neigh->arp_queue, skb);
883 rc = 1;
885 out_unlock_bh:
886 write_unlock_bh(&neigh->lock);
887 return rc;
890 static __inline__ void neigh_update_hhs(struct neighbour *neigh)
892 struct hh_cache *hh;
893 void (*update)(struct hh_cache*, struct net_device*, unsigned char *) =
894 neigh->dev->header_cache_update;
896 if (update) {
897 for (hh = neigh->hh; hh; hh = hh->hh_next) {
898 write_lock_bh(&hh->hh_lock);
899 update(hh, neigh->dev, neigh->ha);
900 write_unlock_bh(&hh->hh_lock);
907 /* Generic update routine.
908 -- lladdr is new lladdr or NULL, if it is not supplied.
909 -- new is new state.
910 -- flags
911 NEIGH_UPDATE_F_OVERRIDE allows to override existing lladdr,
912 if it is different.
913 NEIGH_UPDATE_F_WEAK_OVERRIDE will suspect existing "connected"
914 lladdr instead of overriding it
915 if it is different.
916 It also allows to retain current state
917 if lladdr is unchanged.
918 NEIGH_UPDATE_F_ADMIN means that the change is administrative.
920 NEIGH_UPDATE_F_OVERRIDE_ISROUTER allows to override existing
921 NTF_ROUTER flag.
922 NEIGH_UPDATE_F_ISROUTER indicates if the neighbour is known as
923 a router.
925 Caller MUST hold reference count on the entry.
928 int neigh_update(struct neighbour *neigh, const u8 *lladdr, u8 new,
929 u32 flags)
931 u8 old;
932 int err;
933 #ifdef CONFIG_ARPD
934 int notify = 0;
935 #endif
936 struct net_device *dev;
937 int update_isrouter = 0;
939 write_lock_bh(&neigh->lock);
941 dev = neigh->dev;
942 old = neigh->nud_state;
943 err = -EPERM;
945 if (!(flags & NEIGH_UPDATE_F_ADMIN) &&
946 (old & (NUD_NOARP | NUD_PERMANENT)))
947 goto out;
949 if (!(new & NUD_VALID)) {
950 neigh_del_timer(neigh);
951 if (old & NUD_CONNECTED)
952 neigh_suspect(neigh);
953 neigh->nud_state = new;
954 err = 0;
955 #ifdef CONFIG_ARPD
956 notify = old & NUD_VALID;
957 #endif
958 goto out;
961 /* Compare new lladdr with cached one */
962 if (!dev->addr_len) {
963 /* First case: device needs no address. */
964 lladdr = neigh->ha;
965 } else if (lladdr) {
966 /* The second case: if something is already cached
967 and a new address is proposed:
968 - compare new & old
969 - if they are different, check override flag
971 if ((old & NUD_VALID) &&
972 !memcmp(lladdr, neigh->ha, dev->addr_len))
973 lladdr = neigh->ha;
974 } else {
975 /* No address is supplied; if we know something,
976 use it, otherwise discard the request.
978 err = -EINVAL;
979 if (!(old & NUD_VALID))
980 goto out;
981 lladdr = neigh->ha;
984 if (new & NUD_CONNECTED)
985 neigh->confirmed = jiffies;
986 neigh->updated = jiffies;
988 /* If entry was valid and address is not changed,
989 do not change entry state, if new one is STALE.
991 err = 0;
992 update_isrouter = flags & NEIGH_UPDATE_F_OVERRIDE_ISROUTER;
993 if (old & NUD_VALID) {
994 if (lladdr != neigh->ha && !(flags & NEIGH_UPDATE_F_OVERRIDE)) {
995 update_isrouter = 0;
996 if ((flags & NEIGH_UPDATE_F_WEAK_OVERRIDE) &&
997 (old & NUD_CONNECTED)) {
998 lladdr = neigh->ha;
999 new = NUD_STALE;
1000 } else
1001 goto out;
1002 } else {
1003 if (lladdr == neigh->ha && new == NUD_STALE &&
1004 ((flags & NEIGH_UPDATE_F_WEAK_OVERRIDE) ||
1005 (old & NUD_CONNECTED))
1007 new = old;
1011 if (new != old) {
1012 neigh_del_timer(neigh);
1013 if (new & NUD_IN_TIMER) {
1014 neigh_hold(neigh);
1015 neigh_add_timer(neigh, (jiffies +
1016 ((new & NUD_REACHABLE) ?
1017 neigh->parms->reachable_time :
1018 0)));
1020 neigh->nud_state = new;
1023 if (lladdr != neigh->ha) {
1024 memcpy(&neigh->ha, lladdr, dev->addr_len);
1025 neigh_update_hhs(neigh);
1026 if (!(new & NUD_CONNECTED))
1027 neigh->confirmed = jiffies -
1028 (neigh->parms->base_reachable_time << 1);
1029 #ifdef CONFIG_ARPD
1030 notify = 1;
1031 #endif
1033 if (new == old)
1034 goto out;
1035 if (new & NUD_CONNECTED)
1036 neigh_connect(neigh);
1037 else
1038 neigh_suspect(neigh);
1039 if (!(old & NUD_VALID)) {
1040 struct sk_buff *skb;
1042 /* Again: avoid dead loop if something went wrong */
1044 while (neigh->nud_state & NUD_VALID &&
1045 (skb = __skb_dequeue(&neigh->arp_queue)) != NULL) {
1046 struct neighbour *n1 = neigh;
1047 write_unlock_bh(&neigh->lock);
1048 /* On shaper/eql skb->dst->neighbour != neigh :( */
1049 if (skb->dst && skb->dst->neighbour)
1050 n1 = skb->dst->neighbour;
1051 n1->output(skb);
1052 write_lock_bh(&neigh->lock);
1054 skb_queue_purge(&neigh->arp_queue);
1056 out:
1057 if (update_isrouter) {
1058 neigh->flags = (flags & NEIGH_UPDATE_F_ISROUTER) ?
1059 (neigh->flags | NTF_ROUTER) :
1060 (neigh->flags & ~NTF_ROUTER);
1062 write_unlock_bh(&neigh->lock);
1063 #ifdef CONFIG_ARPD
1064 if (notify && neigh->parms->app_probes)
1065 neigh_app_notify(neigh);
1066 #endif
1067 return err;
1070 struct neighbour *neigh_event_ns(struct neigh_table *tbl,
1071 u8 *lladdr, void *saddr,
1072 struct net_device *dev)
1074 struct neighbour *neigh = __neigh_lookup(tbl, saddr, dev,
1075 lladdr || !dev->addr_len);
1076 if (neigh)
1077 neigh_update(neigh, lladdr, NUD_STALE,
1078 NEIGH_UPDATE_F_OVERRIDE);
1079 return neigh;
1082 static void neigh_hh_init(struct neighbour *n, struct dst_entry *dst,
1083 u16 protocol)
1085 struct hh_cache *hh;
1086 struct net_device *dev = dst->dev;
1088 for (hh = n->hh; hh; hh = hh->hh_next)
1089 if (hh->hh_type == protocol)
1090 break;
1092 if (!hh && (hh = kmalloc(sizeof(*hh), GFP_ATOMIC)) != NULL) {
1093 memset(hh, 0, sizeof(struct hh_cache));
1094 rwlock_init(&hh->hh_lock);
1095 hh->hh_type = protocol;
1096 atomic_set(&hh->hh_refcnt, 0);
1097 hh->hh_next = NULL;
1098 if (dev->hard_header_cache(n, hh)) {
1099 kfree(hh);
1100 hh = NULL;
1101 } else {
1102 atomic_inc(&hh->hh_refcnt);
1103 hh->hh_next = n->hh;
1104 n->hh = hh;
1105 if (n->nud_state & NUD_CONNECTED)
1106 hh->hh_output = n->ops->hh_output;
1107 else
1108 hh->hh_output = n->ops->output;
1111 if (hh) {
1112 atomic_inc(&hh->hh_refcnt);
1113 dst->hh = hh;
1117 /* This function can be used in contexts, where only old dev_queue_xmit
1118 worked, f.e. if you want to override normal output path (eql, shaper),
1119 but resolution is not made yet.
1122 int neigh_compat_output(struct sk_buff *skb)
1124 struct net_device *dev = skb->dev;
1126 __skb_pull(skb, skb->nh.raw - skb->data);
1128 if (dev->hard_header &&
1129 dev->hard_header(skb, dev, ntohs(skb->protocol), NULL, NULL,
1130 skb->len) < 0 &&
1131 dev->rebuild_header(skb))
1132 return 0;
1134 return dev_queue_xmit(skb);
1137 /* Slow and careful. */
1139 int neigh_resolve_output(struct sk_buff *skb)
1141 struct dst_entry *dst = skb->dst;
1142 struct neighbour *neigh;
1143 int rc = 0;
1145 if (!dst || !(neigh = dst->neighbour))
1146 goto discard;
1148 __skb_pull(skb, skb->nh.raw - skb->data);
1150 if (!neigh_event_send(neigh, skb)) {
1151 int err;
1152 struct net_device *dev = neigh->dev;
1153 if (dev->hard_header_cache && !dst->hh) {
1154 write_lock_bh(&neigh->lock);
1155 if (!dst->hh)
1156 neigh_hh_init(neigh, dst, dst->ops->protocol);
1157 err = dev->hard_header(skb, dev, ntohs(skb->protocol),
1158 neigh->ha, NULL, skb->len);
1159 write_unlock_bh(&neigh->lock);
1160 } else {
1161 read_lock_bh(&neigh->lock);
1162 err = dev->hard_header(skb, dev, ntohs(skb->protocol),
1163 neigh->ha, NULL, skb->len);
1164 read_unlock_bh(&neigh->lock);
1166 if (err >= 0)
1167 rc = neigh->ops->queue_xmit(skb);
1168 else
1169 goto out_kfree_skb;
1171 out:
1172 return rc;
1173 discard:
1174 NEIGH_PRINTK1("neigh_resolve_output: dst=%p neigh=%p\n",
1175 dst, dst ? dst->neighbour : NULL);
1176 out_kfree_skb:
1177 rc = -EINVAL;
1178 kfree_skb(skb);
1179 goto out;
1182 /* As fast as possible without hh cache */
1184 int neigh_connected_output(struct sk_buff *skb)
1186 int err;
1187 struct dst_entry *dst = skb->dst;
1188 struct neighbour *neigh = dst->neighbour;
1189 struct net_device *dev = neigh->dev;
1191 __skb_pull(skb, skb->nh.raw - skb->data);
1193 read_lock_bh(&neigh->lock);
1194 err = dev->hard_header(skb, dev, ntohs(skb->protocol),
1195 neigh->ha, NULL, skb->len);
1196 read_unlock_bh(&neigh->lock);
1197 if (err >= 0)
1198 err = neigh->ops->queue_xmit(skb);
1199 else {
1200 err = -EINVAL;
1201 kfree_skb(skb);
1203 return err;
1206 static void neigh_proxy_process(unsigned long arg)
1208 struct neigh_table *tbl = (struct neigh_table *)arg;
1209 long sched_next = 0;
1210 unsigned long now = jiffies;
1211 struct sk_buff *skb;
1213 spin_lock(&tbl->proxy_queue.lock);
1215 skb = tbl->proxy_queue.next;
1217 while (skb != (struct sk_buff *)&tbl->proxy_queue) {
1218 struct sk_buff *back = skb;
1219 long tdif = NEIGH_CB(back)->sched_next - now;
1221 skb = skb->next;
1222 if (tdif <= 0) {
1223 struct net_device *dev = back->dev;
1224 __skb_unlink(back, &tbl->proxy_queue);
1225 if (tbl->proxy_redo && netif_running(dev))
1226 tbl->proxy_redo(back);
1227 else
1228 kfree_skb(back);
1230 dev_put(dev);
1231 } else if (!sched_next || tdif < sched_next)
1232 sched_next = tdif;
1234 del_timer(&tbl->proxy_timer);
1235 if (sched_next)
1236 mod_timer(&tbl->proxy_timer, jiffies + sched_next);
1237 spin_unlock(&tbl->proxy_queue.lock);
1240 void pneigh_enqueue(struct neigh_table *tbl, struct neigh_parms *p,
1241 struct sk_buff *skb)
1243 unsigned long now = jiffies;
1244 unsigned long sched_next = now + (net_random() % p->proxy_delay);
1246 if (tbl->proxy_queue.qlen > p->proxy_qlen) {
1247 kfree_skb(skb);
1248 return;
1251 NEIGH_CB(skb)->sched_next = sched_next;
1252 NEIGH_CB(skb)->flags |= LOCALLY_ENQUEUED;
1254 spin_lock(&tbl->proxy_queue.lock);
1255 if (del_timer(&tbl->proxy_timer)) {
1256 if (time_before(tbl->proxy_timer.expires, sched_next))
1257 sched_next = tbl->proxy_timer.expires;
1259 dst_release(skb->dst);
1260 skb->dst = NULL;
1261 dev_hold(skb->dev);
1262 __skb_queue_tail(&tbl->proxy_queue, skb);
1263 mod_timer(&tbl->proxy_timer, sched_next);
1264 spin_unlock(&tbl->proxy_queue.lock);
1268 struct neigh_parms *neigh_parms_alloc(struct net_device *dev,
1269 struct neigh_table *tbl)
1271 struct neigh_parms *p = kmalloc(sizeof(*p), GFP_KERNEL);
1273 if (p) {
1274 memcpy(p, &tbl->parms, sizeof(*p));
1275 p->tbl = tbl;
1276 atomic_set(&p->refcnt, 1);
1277 INIT_RCU_HEAD(&p->rcu_head);
1278 p->reachable_time =
1279 neigh_rand_reach_time(p->base_reachable_time);
1280 if (dev) {
1281 if (dev->neigh_setup && dev->neigh_setup(dev, p)) {
1282 kfree(p);
1283 return NULL;
1286 dev_hold(dev);
1287 p->dev = dev;
1289 p->sysctl_table = NULL;
1290 write_lock_bh(&tbl->lock);
1291 p->next = tbl->parms.next;
1292 tbl->parms.next = p;
1293 write_unlock_bh(&tbl->lock);
1295 return p;
1298 static void neigh_rcu_free_parms(struct rcu_head *head)
1300 struct neigh_parms *parms =
1301 container_of(head, struct neigh_parms, rcu_head);
1303 neigh_parms_put(parms);
1306 void neigh_parms_release(struct neigh_table *tbl, struct neigh_parms *parms)
1308 struct neigh_parms **p;
1310 if (!parms || parms == &tbl->parms)
1311 return;
1312 write_lock_bh(&tbl->lock);
1313 for (p = &tbl->parms.next; *p; p = &(*p)->next) {
1314 if (*p == parms) {
1315 *p = parms->next;
1316 parms->dead = 1;
1317 write_unlock_bh(&tbl->lock);
1318 if (parms->dev)
1319 dev_put(parms->dev);
1320 call_rcu(&parms->rcu_head, neigh_rcu_free_parms);
1321 return;
1324 write_unlock_bh(&tbl->lock);
1325 NEIGH_PRINTK1("neigh_parms_release: not found\n");
1328 void neigh_parms_destroy(struct neigh_parms *parms)
1330 kfree(parms);
1334 void neigh_table_init(struct neigh_table *tbl)
1336 unsigned long now = jiffies;
1337 unsigned long phsize;
1339 atomic_set(&tbl->parms.refcnt, 1);
1340 INIT_RCU_HEAD(&tbl->parms.rcu_head);
1341 tbl->parms.reachable_time =
1342 neigh_rand_reach_time(tbl->parms.base_reachable_time);
1344 if (!tbl->kmem_cachep)
1345 tbl->kmem_cachep = kmem_cache_create(tbl->id,
1346 tbl->entry_size,
1347 0, SLAB_HWCACHE_ALIGN,
1348 NULL, NULL);
1350 if (!tbl->kmem_cachep)
1351 panic("cannot create neighbour cache");
1353 tbl->stats = alloc_percpu(struct neigh_statistics);
1354 if (!tbl->stats)
1355 panic("cannot create neighbour cache statistics");
1357 #ifdef CONFIG_PROC_FS
1358 tbl->pde = create_proc_entry(tbl->id, 0, proc_net_stat);
1359 if (!tbl->pde)
1360 panic("cannot create neighbour proc dir entry");
1361 tbl->pde->proc_fops = &neigh_stat_seq_fops;
1362 tbl->pde->data = tbl;
1363 #endif
1365 tbl->hash_mask = 1;
1366 tbl->hash_buckets = neigh_hash_alloc(tbl->hash_mask + 1);
1368 phsize = (PNEIGH_HASHMASK + 1) * sizeof(struct pneigh_entry *);
1369 tbl->phash_buckets = kmalloc(phsize, GFP_KERNEL);
1371 if (!tbl->hash_buckets || !tbl->phash_buckets)
1372 panic("cannot allocate neighbour cache hashes");
1374 memset(tbl->phash_buckets, 0, phsize);
1376 get_random_bytes(&tbl->hash_rnd, sizeof(tbl->hash_rnd));
1378 rwlock_init(&tbl->lock);
1379 init_timer(&tbl->gc_timer);
1380 tbl->gc_timer.data = (unsigned long)tbl;
1381 tbl->gc_timer.function = neigh_periodic_timer;
1382 tbl->gc_timer.expires = now + 1;
1383 add_timer(&tbl->gc_timer);
1385 init_timer(&tbl->proxy_timer);
1386 tbl->proxy_timer.data = (unsigned long)tbl;
1387 tbl->proxy_timer.function = neigh_proxy_process;
1388 skb_queue_head_init(&tbl->proxy_queue);
1390 tbl->last_flush = now;
1391 tbl->last_rand = now + tbl->parms.reachable_time * 20;
1392 write_lock(&neigh_tbl_lock);
1393 tbl->next = neigh_tables;
1394 neigh_tables = tbl;
1395 write_unlock(&neigh_tbl_lock);
1398 int neigh_table_clear(struct neigh_table *tbl)
1400 struct neigh_table **tp;
1402 /* It is not clean... Fix it to unload IPv6 module safely */
1403 del_timer_sync(&tbl->gc_timer);
1404 del_timer_sync(&tbl->proxy_timer);
1405 pneigh_queue_purge(&tbl->proxy_queue);
1406 neigh_ifdown(tbl, NULL);
1407 if (atomic_read(&tbl->entries))
1408 printk(KERN_CRIT "neighbour leakage\n");
1409 write_lock(&neigh_tbl_lock);
1410 for (tp = &neigh_tables; *tp; tp = &(*tp)->next) {
1411 if (*tp == tbl) {
1412 *tp = tbl->next;
1413 break;
1416 write_unlock(&neigh_tbl_lock);
1418 neigh_hash_free(tbl->hash_buckets, tbl->hash_mask + 1);
1419 tbl->hash_buckets = NULL;
1421 kfree(tbl->phash_buckets);
1422 tbl->phash_buckets = NULL;
1424 return 0;
1427 int neigh_delete(struct sk_buff *skb, struct nlmsghdr *nlh, void *arg)
1429 struct ndmsg *ndm = NLMSG_DATA(nlh);
1430 struct rtattr **nda = arg;
1431 struct neigh_table *tbl;
1432 struct net_device *dev = NULL;
1433 int err = -ENODEV;
1435 if (ndm->ndm_ifindex &&
1436 (dev = dev_get_by_index(ndm->ndm_ifindex)) == NULL)
1437 goto out;
1439 read_lock(&neigh_tbl_lock);
1440 for (tbl = neigh_tables; tbl; tbl = tbl->next) {
1441 struct rtattr *dst_attr = nda[NDA_DST - 1];
1442 struct neighbour *n;
1444 if (tbl->family != ndm->ndm_family)
1445 continue;
1446 read_unlock(&neigh_tbl_lock);
1448 err = -EINVAL;
1449 if (!dst_attr || RTA_PAYLOAD(dst_attr) < tbl->key_len)
1450 goto out_dev_put;
1452 if (ndm->ndm_flags & NTF_PROXY) {
1453 err = pneigh_delete(tbl, RTA_DATA(dst_attr), dev);
1454 goto out_dev_put;
1457 if (!dev)
1458 goto out;
1460 n = neigh_lookup(tbl, RTA_DATA(dst_attr), dev);
1461 if (n) {
1462 err = neigh_update(n, NULL, NUD_FAILED,
1463 NEIGH_UPDATE_F_OVERRIDE|
1464 NEIGH_UPDATE_F_ADMIN);
1465 neigh_release(n);
1467 goto out_dev_put;
1469 read_unlock(&neigh_tbl_lock);
1470 err = -EADDRNOTAVAIL;
1471 out_dev_put:
1472 if (dev)
1473 dev_put(dev);
1474 out:
1475 return err;
1478 int neigh_add(struct sk_buff *skb, struct nlmsghdr *nlh, void *arg)
1480 struct ndmsg *ndm = NLMSG_DATA(nlh);
1481 struct rtattr **nda = arg;
1482 struct neigh_table *tbl;
1483 struct net_device *dev = NULL;
1484 int err = -ENODEV;
1486 if (ndm->ndm_ifindex &&
1487 (dev = dev_get_by_index(ndm->ndm_ifindex)) == NULL)
1488 goto out;
1490 read_lock(&neigh_tbl_lock);
1491 for (tbl = neigh_tables; tbl; tbl = tbl->next) {
1492 struct rtattr *lladdr_attr = nda[NDA_LLADDR - 1];
1493 struct rtattr *dst_attr = nda[NDA_DST - 1];
1494 int override = 1;
1495 struct neighbour *n;
1497 if (tbl->family != ndm->ndm_family)
1498 continue;
1499 read_unlock(&neigh_tbl_lock);
1501 err = -EINVAL;
1502 if (!dst_attr || RTA_PAYLOAD(dst_attr) < tbl->key_len)
1503 goto out_dev_put;
1505 if (ndm->ndm_flags & NTF_PROXY) {
1506 err = -ENOBUFS;
1507 if (pneigh_lookup(tbl, RTA_DATA(dst_attr), dev, 1))
1508 err = 0;
1509 goto out_dev_put;
1512 err = -EINVAL;
1513 if (!dev)
1514 goto out;
1515 if (lladdr_attr && RTA_PAYLOAD(lladdr_attr) < dev->addr_len)
1516 goto out_dev_put;
1518 n = neigh_lookup(tbl, RTA_DATA(dst_attr), dev);
1519 if (n) {
1520 if (nlh->nlmsg_flags & NLM_F_EXCL) {
1521 err = -EEXIST;
1522 neigh_release(n);
1523 goto out_dev_put;
1526 override = nlh->nlmsg_flags & NLM_F_REPLACE;
1527 } else if (!(nlh->nlmsg_flags & NLM_F_CREATE)) {
1528 err = -ENOENT;
1529 goto out_dev_put;
1530 } else {
1531 n = __neigh_lookup_errno(tbl, RTA_DATA(dst_attr), dev);
1532 if (IS_ERR(n)) {
1533 err = PTR_ERR(n);
1534 goto out_dev_put;
1538 err = neigh_update(n,
1539 lladdr_attr ? RTA_DATA(lladdr_attr) : NULL,
1540 ndm->ndm_state,
1541 (override ? NEIGH_UPDATE_F_OVERRIDE : 0) |
1542 NEIGH_UPDATE_F_ADMIN);
1544 neigh_release(n);
1545 goto out_dev_put;
1548 read_unlock(&neigh_tbl_lock);
1549 err = -EADDRNOTAVAIL;
1550 out_dev_put:
1551 if (dev)
1552 dev_put(dev);
1553 out:
1554 return err;
1557 static int neightbl_fill_parms(struct sk_buff *skb, struct neigh_parms *parms)
1559 struct rtattr *nest = NULL;
1561 nest = RTA_NEST(skb, NDTA_PARMS);
1563 if (parms->dev)
1564 RTA_PUT_U32(skb, NDTPA_IFINDEX, parms->dev->ifindex);
1566 RTA_PUT_U32(skb, NDTPA_REFCNT, atomic_read(&parms->refcnt));
1567 RTA_PUT_U32(skb, NDTPA_QUEUE_LEN, parms->queue_len);
1568 RTA_PUT_U32(skb, NDTPA_PROXY_QLEN, parms->proxy_qlen);
1569 RTA_PUT_U32(skb, NDTPA_APP_PROBES, parms->app_probes);
1570 RTA_PUT_U32(skb, NDTPA_UCAST_PROBES, parms->ucast_probes);
1571 RTA_PUT_U32(skb, NDTPA_MCAST_PROBES, parms->mcast_probes);
1572 RTA_PUT_MSECS(skb, NDTPA_REACHABLE_TIME, parms->reachable_time);
1573 RTA_PUT_MSECS(skb, NDTPA_BASE_REACHABLE_TIME,
1574 parms->base_reachable_time);
1575 RTA_PUT_MSECS(skb, NDTPA_GC_STALETIME, parms->gc_staletime);
1576 RTA_PUT_MSECS(skb, NDTPA_DELAY_PROBE_TIME, parms->delay_probe_time);
1577 RTA_PUT_MSECS(skb, NDTPA_RETRANS_TIME, parms->retrans_time);
1578 RTA_PUT_MSECS(skb, NDTPA_ANYCAST_DELAY, parms->anycast_delay);
1579 RTA_PUT_MSECS(skb, NDTPA_PROXY_DELAY, parms->proxy_delay);
1580 RTA_PUT_MSECS(skb, NDTPA_LOCKTIME, parms->locktime);
1582 return RTA_NEST_END(skb, nest);
1584 rtattr_failure:
1585 return RTA_NEST_CANCEL(skb, nest);
1588 static int neightbl_fill_info(struct neigh_table *tbl, struct sk_buff *skb,
1589 struct netlink_callback *cb)
1591 struct nlmsghdr *nlh;
1592 struct ndtmsg *ndtmsg;
1594 nlh = NLMSG_NEW_ANSWER(skb, cb, RTM_NEWNEIGHTBL, sizeof(struct ndtmsg),
1595 NLM_F_MULTI);
1597 ndtmsg = NLMSG_DATA(nlh);
1599 read_lock_bh(&tbl->lock);
1600 ndtmsg->ndtm_family = tbl->family;
1601 ndtmsg->ndtm_pad1 = 0;
1602 ndtmsg->ndtm_pad2 = 0;
1604 RTA_PUT_STRING(skb, NDTA_NAME, tbl->id);
1605 RTA_PUT_MSECS(skb, NDTA_GC_INTERVAL, tbl->gc_interval);
1606 RTA_PUT_U32(skb, NDTA_THRESH1, tbl->gc_thresh1);
1607 RTA_PUT_U32(skb, NDTA_THRESH2, tbl->gc_thresh2);
1608 RTA_PUT_U32(skb, NDTA_THRESH3, tbl->gc_thresh3);
1611 unsigned long now = jiffies;
1612 unsigned int flush_delta = now - tbl->last_flush;
1613 unsigned int rand_delta = now - tbl->last_rand;
1615 struct ndt_config ndc = {
1616 .ndtc_key_len = tbl->key_len,
1617 .ndtc_entry_size = tbl->entry_size,
1618 .ndtc_entries = atomic_read(&tbl->entries),
1619 .ndtc_last_flush = jiffies_to_msecs(flush_delta),
1620 .ndtc_last_rand = jiffies_to_msecs(rand_delta),
1621 .ndtc_hash_rnd = tbl->hash_rnd,
1622 .ndtc_hash_mask = tbl->hash_mask,
1623 .ndtc_hash_chain_gc = tbl->hash_chain_gc,
1624 .ndtc_proxy_qlen = tbl->proxy_queue.qlen,
1627 RTA_PUT(skb, NDTA_CONFIG, sizeof(ndc), &ndc);
1631 int cpu;
1632 struct ndt_stats ndst;
1634 memset(&ndst, 0, sizeof(ndst));
1636 for_each_cpu(cpu) {
1637 struct neigh_statistics *st;
1639 st = per_cpu_ptr(tbl->stats, cpu);
1640 ndst.ndts_allocs += st->allocs;
1641 ndst.ndts_destroys += st->destroys;
1642 ndst.ndts_hash_grows += st->hash_grows;
1643 ndst.ndts_res_failed += st->res_failed;
1644 ndst.ndts_lookups += st->lookups;
1645 ndst.ndts_hits += st->hits;
1646 ndst.ndts_rcv_probes_mcast += st->rcv_probes_mcast;
1647 ndst.ndts_rcv_probes_ucast += st->rcv_probes_ucast;
1648 ndst.ndts_periodic_gc_runs += st->periodic_gc_runs;
1649 ndst.ndts_forced_gc_runs += st->forced_gc_runs;
1652 RTA_PUT(skb, NDTA_STATS, sizeof(ndst), &ndst);
1655 BUG_ON(tbl->parms.dev);
1656 if (neightbl_fill_parms(skb, &tbl->parms) < 0)
1657 goto rtattr_failure;
1659 read_unlock_bh(&tbl->lock);
1660 return NLMSG_END(skb, nlh);
1662 rtattr_failure:
1663 read_unlock_bh(&tbl->lock);
1664 return NLMSG_CANCEL(skb, nlh);
1666 nlmsg_failure:
1667 return -1;
1670 static int neightbl_fill_param_info(struct neigh_table *tbl,
1671 struct neigh_parms *parms,
1672 struct sk_buff *skb,
1673 struct netlink_callback *cb)
1675 struct ndtmsg *ndtmsg;
1676 struct nlmsghdr *nlh;
1678 nlh = NLMSG_NEW_ANSWER(skb, cb, RTM_NEWNEIGHTBL, sizeof(struct ndtmsg),
1679 NLM_F_MULTI);
1681 ndtmsg = NLMSG_DATA(nlh);
1683 read_lock_bh(&tbl->lock);
1684 ndtmsg->ndtm_family = tbl->family;
1685 ndtmsg->ndtm_pad1 = 0;
1686 ndtmsg->ndtm_pad2 = 0;
1687 RTA_PUT_STRING(skb, NDTA_NAME, tbl->id);
1689 if (neightbl_fill_parms(skb, parms) < 0)
1690 goto rtattr_failure;
1692 read_unlock_bh(&tbl->lock);
1693 return NLMSG_END(skb, nlh);
1695 rtattr_failure:
1696 read_unlock_bh(&tbl->lock);
1697 return NLMSG_CANCEL(skb, nlh);
1699 nlmsg_failure:
1700 return -1;
1703 static inline struct neigh_parms *lookup_neigh_params(struct neigh_table *tbl,
1704 int ifindex)
1706 struct neigh_parms *p;
1708 for (p = &tbl->parms; p; p = p->next)
1709 if ((p->dev && p->dev->ifindex == ifindex) ||
1710 (!p->dev && !ifindex))
1711 return p;
1713 return NULL;
1716 int neightbl_set(struct sk_buff *skb, struct nlmsghdr *nlh, void *arg)
1718 struct neigh_table *tbl;
1719 struct ndtmsg *ndtmsg = NLMSG_DATA(nlh);
1720 struct rtattr **tb = arg;
1721 int err = -EINVAL;
1723 if (!tb[NDTA_NAME - 1] || !RTA_PAYLOAD(tb[NDTA_NAME - 1]))
1724 return -EINVAL;
1726 read_lock(&neigh_tbl_lock);
1727 for (tbl = neigh_tables; tbl; tbl = tbl->next) {
1728 if (ndtmsg->ndtm_family && tbl->family != ndtmsg->ndtm_family)
1729 continue;
1731 if (!rtattr_strcmp(tb[NDTA_NAME - 1], tbl->id))
1732 break;
1735 if (tbl == NULL) {
1736 err = -ENOENT;
1737 goto errout;
1741 * We acquire tbl->lock to be nice to the periodic timers and
1742 * make sure they always see a consistent set of values.
1744 write_lock_bh(&tbl->lock);
1746 if (tb[NDTA_THRESH1 - 1])
1747 tbl->gc_thresh1 = RTA_GET_U32(tb[NDTA_THRESH1 - 1]);
1749 if (tb[NDTA_THRESH2 - 1])
1750 tbl->gc_thresh2 = RTA_GET_U32(tb[NDTA_THRESH2 - 1]);
1752 if (tb[NDTA_THRESH3 - 1])
1753 tbl->gc_thresh3 = RTA_GET_U32(tb[NDTA_THRESH3 - 1]);
1755 if (tb[NDTA_GC_INTERVAL - 1])
1756 tbl->gc_interval = RTA_GET_MSECS(tb[NDTA_GC_INTERVAL - 1]);
1758 if (tb[NDTA_PARMS - 1]) {
1759 struct rtattr *tbp[NDTPA_MAX];
1760 struct neigh_parms *p;
1761 u32 ifindex = 0;
1763 if (rtattr_parse_nested(tbp, NDTPA_MAX, tb[NDTA_PARMS - 1]) < 0)
1764 goto rtattr_failure;
1766 if (tbp[NDTPA_IFINDEX - 1])
1767 ifindex = RTA_GET_U32(tbp[NDTPA_IFINDEX - 1]);
1769 p = lookup_neigh_params(tbl, ifindex);
1770 if (p == NULL) {
1771 err = -ENOENT;
1772 goto rtattr_failure;
1775 if (tbp[NDTPA_QUEUE_LEN - 1])
1776 p->queue_len = RTA_GET_U32(tbp[NDTPA_QUEUE_LEN - 1]);
1778 if (tbp[NDTPA_PROXY_QLEN - 1])
1779 p->proxy_qlen = RTA_GET_U32(tbp[NDTPA_PROXY_QLEN - 1]);
1781 if (tbp[NDTPA_APP_PROBES - 1])
1782 p->app_probes = RTA_GET_U32(tbp[NDTPA_APP_PROBES - 1]);
1784 if (tbp[NDTPA_UCAST_PROBES - 1])
1785 p->ucast_probes =
1786 RTA_GET_U32(tbp[NDTPA_UCAST_PROBES - 1]);
1788 if (tbp[NDTPA_MCAST_PROBES - 1])
1789 p->mcast_probes =
1790 RTA_GET_U32(tbp[NDTPA_MCAST_PROBES - 1]);
1792 if (tbp[NDTPA_BASE_REACHABLE_TIME - 1])
1793 p->base_reachable_time =
1794 RTA_GET_MSECS(tbp[NDTPA_BASE_REACHABLE_TIME - 1]);
1796 if (tbp[NDTPA_GC_STALETIME - 1])
1797 p->gc_staletime =
1798 RTA_GET_MSECS(tbp[NDTPA_GC_STALETIME - 1]);
1800 if (tbp[NDTPA_DELAY_PROBE_TIME - 1])
1801 p->delay_probe_time =
1802 RTA_GET_MSECS(tbp[NDTPA_DELAY_PROBE_TIME - 1]);
1804 if (tbp[NDTPA_RETRANS_TIME - 1])
1805 p->retrans_time =
1806 RTA_GET_MSECS(tbp[NDTPA_RETRANS_TIME - 1]);
1808 if (tbp[NDTPA_ANYCAST_DELAY - 1])
1809 p->anycast_delay =
1810 RTA_GET_MSECS(tbp[NDTPA_ANYCAST_DELAY - 1]);
1812 if (tbp[NDTPA_PROXY_DELAY - 1])
1813 p->proxy_delay =
1814 RTA_GET_MSECS(tbp[NDTPA_PROXY_DELAY - 1]);
1816 if (tbp[NDTPA_LOCKTIME - 1])
1817 p->locktime = RTA_GET_MSECS(tbp[NDTPA_LOCKTIME - 1]);
1820 err = 0;
1822 rtattr_failure:
1823 write_unlock_bh(&tbl->lock);
1824 errout:
1825 read_unlock(&neigh_tbl_lock);
1826 return err;
1829 int neightbl_dump_info(struct sk_buff *skb, struct netlink_callback *cb)
1831 int idx, family;
1832 int s_idx = cb->args[0];
1833 struct neigh_table *tbl;
1835 family = ((struct rtgenmsg *)NLMSG_DATA(cb->nlh))->rtgen_family;
1837 read_lock(&neigh_tbl_lock);
1838 for (tbl = neigh_tables, idx = 0; tbl; tbl = tbl->next) {
1839 struct neigh_parms *p;
1841 if (idx < s_idx || (family && tbl->family != family))
1842 continue;
1844 if (neightbl_fill_info(tbl, skb, cb) <= 0)
1845 break;
1847 for (++idx, p = tbl->parms.next; p; p = p->next, idx++) {
1848 if (idx < s_idx)
1849 continue;
1851 if (neightbl_fill_param_info(tbl, p, skb, cb) <= 0)
1852 goto out;
1856 out:
1857 read_unlock(&neigh_tbl_lock);
1858 cb->args[0] = idx;
1860 return skb->len;
1863 static int neigh_fill_info(struct sk_buff *skb, struct neighbour *n,
1864 u32 pid, u32 seq, int event, unsigned int flags)
1866 unsigned long now = jiffies;
1867 unsigned char *b = skb->tail;
1868 struct nda_cacheinfo ci;
1869 int locked = 0;
1870 u32 probes;
1871 struct nlmsghdr *nlh = NLMSG_NEW(skb, pid, seq, event,
1872 sizeof(struct ndmsg), flags);
1873 struct ndmsg *ndm = NLMSG_DATA(nlh);
1875 ndm->ndm_family = n->ops->family;
1876 ndm->ndm_pad1 = 0;
1877 ndm->ndm_pad2 = 0;
1878 ndm->ndm_flags = n->flags;
1879 ndm->ndm_type = n->type;
1880 ndm->ndm_ifindex = n->dev->ifindex;
1881 RTA_PUT(skb, NDA_DST, n->tbl->key_len, n->primary_key);
1882 read_lock_bh(&n->lock);
1883 locked = 1;
1884 ndm->ndm_state = n->nud_state;
1885 if (n->nud_state & NUD_VALID)
1886 RTA_PUT(skb, NDA_LLADDR, n->dev->addr_len, n->ha);
1887 ci.ndm_used = now - n->used;
1888 ci.ndm_confirmed = now - n->confirmed;
1889 ci.ndm_updated = now - n->updated;
1890 ci.ndm_refcnt = atomic_read(&n->refcnt) - 1;
1891 probes = atomic_read(&n->probes);
1892 read_unlock_bh(&n->lock);
1893 locked = 0;
1894 RTA_PUT(skb, NDA_CACHEINFO, sizeof(ci), &ci);
1895 RTA_PUT(skb, NDA_PROBES, sizeof(probes), &probes);
1896 nlh->nlmsg_len = skb->tail - b;
1897 return skb->len;
1899 nlmsg_failure:
1900 rtattr_failure:
1901 if (locked)
1902 read_unlock_bh(&n->lock);
1903 skb_trim(skb, b - skb->data);
1904 return -1;
1908 static int neigh_dump_table(struct neigh_table *tbl, struct sk_buff *skb,
1909 struct netlink_callback *cb)
1911 struct neighbour *n;
1912 int rc, h, s_h = cb->args[1];
1913 int idx, s_idx = idx = cb->args[2];
1915 for (h = 0; h <= tbl->hash_mask; h++) {
1916 if (h < s_h)
1917 continue;
1918 if (h > s_h)
1919 s_idx = 0;
1920 read_lock_bh(&tbl->lock);
1921 for (n = tbl->hash_buckets[h], idx = 0; n; n = n->next, idx++) {
1922 if (idx < s_idx)
1923 continue;
1924 if (neigh_fill_info(skb, n, NETLINK_CB(cb->skb).pid,
1925 cb->nlh->nlmsg_seq,
1926 RTM_NEWNEIGH,
1927 NLM_F_MULTI) <= 0) {
1928 read_unlock_bh(&tbl->lock);
1929 rc = -1;
1930 goto out;
1933 read_unlock_bh(&tbl->lock);
1935 rc = skb->len;
1936 out:
1937 cb->args[1] = h;
1938 cb->args[2] = idx;
1939 return rc;
1942 int neigh_dump_info(struct sk_buff *skb, struct netlink_callback *cb)
1944 struct neigh_table *tbl;
1945 int t, family, s_t;
1947 read_lock(&neigh_tbl_lock);
1948 family = ((struct rtgenmsg *)NLMSG_DATA(cb->nlh))->rtgen_family;
1949 s_t = cb->args[0];
1951 for (tbl = neigh_tables, t = 0; tbl; tbl = tbl->next, t++) {
1952 if (t < s_t || (family && tbl->family != family))
1953 continue;
1954 if (t > s_t)
1955 memset(&cb->args[1], 0, sizeof(cb->args) -
1956 sizeof(cb->args[0]));
1957 if (neigh_dump_table(tbl, skb, cb) < 0)
1958 break;
1960 read_unlock(&neigh_tbl_lock);
1962 cb->args[0] = t;
1963 return skb->len;
1966 void neigh_for_each(struct neigh_table *tbl, void (*cb)(struct neighbour *, void *), void *cookie)
1968 int chain;
1970 read_lock_bh(&tbl->lock);
1971 for (chain = 0; chain <= tbl->hash_mask; chain++) {
1972 struct neighbour *n;
1974 for (n = tbl->hash_buckets[chain]; n; n = n->next)
1975 cb(n, cookie);
1977 read_unlock_bh(&tbl->lock);
1979 EXPORT_SYMBOL(neigh_for_each);
1981 /* The tbl->lock must be held as a writer and BH disabled. */
1982 void __neigh_for_each_release(struct neigh_table *tbl,
1983 int (*cb)(struct neighbour *))
1985 int chain;
1987 for (chain = 0; chain <= tbl->hash_mask; chain++) {
1988 struct neighbour *n, **np;
1990 np = &tbl->hash_buckets[chain];
1991 while ((n = *np) != NULL) {
1992 int release;
1994 write_lock(&n->lock);
1995 release = cb(n);
1996 if (release) {
1997 *np = n->next;
1998 n->dead = 1;
1999 } else
2000 np = &n->next;
2001 write_unlock(&n->lock);
2002 if (release)
2003 neigh_release(n);
2007 EXPORT_SYMBOL(__neigh_for_each_release);
2009 #ifdef CONFIG_PROC_FS
2011 static struct neighbour *neigh_get_first(struct seq_file *seq)
2013 struct neigh_seq_state *state = seq->private;
2014 struct neigh_table *tbl = state->tbl;
2015 struct neighbour *n = NULL;
2016 int bucket = state->bucket;
2018 state->flags &= ~NEIGH_SEQ_IS_PNEIGH;
2019 for (bucket = 0; bucket <= tbl->hash_mask; bucket++) {
2020 n = tbl->hash_buckets[bucket];
2022 while (n) {
2023 if (state->neigh_sub_iter) {
2024 loff_t fakep = 0;
2025 void *v;
2027 v = state->neigh_sub_iter(state, n, &fakep);
2028 if (!v)
2029 goto next;
2031 if (!(state->flags & NEIGH_SEQ_SKIP_NOARP))
2032 break;
2033 if (n->nud_state & ~NUD_NOARP)
2034 break;
2035 next:
2036 n = n->next;
2039 if (n)
2040 break;
2042 state->bucket = bucket;
2044 return n;
2047 static struct neighbour *neigh_get_next(struct seq_file *seq,
2048 struct neighbour *n,
2049 loff_t *pos)
2051 struct neigh_seq_state *state = seq->private;
2052 struct neigh_table *tbl = state->tbl;
2054 if (state->neigh_sub_iter) {
2055 void *v = state->neigh_sub_iter(state, n, pos);
2056 if (v)
2057 return n;
2059 n = n->next;
2061 while (1) {
2062 while (n) {
2063 if (state->neigh_sub_iter) {
2064 void *v = state->neigh_sub_iter(state, n, pos);
2065 if (v)
2066 return n;
2067 goto next;
2069 if (!(state->flags & NEIGH_SEQ_SKIP_NOARP))
2070 break;
2072 if (n->nud_state & ~NUD_NOARP)
2073 break;
2074 next:
2075 n = n->next;
2078 if (n)
2079 break;
2081 if (++state->bucket > tbl->hash_mask)
2082 break;
2084 n = tbl->hash_buckets[state->bucket];
2087 if (n && pos)
2088 --(*pos);
2089 return n;
2092 static struct neighbour *neigh_get_idx(struct seq_file *seq, loff_t *pos)
2094 struct neighbour *n = neigh_get_first(seq);
2096 if (n) {
2097 while (*pos) {
2098 n = neigh_get_next(seq, n, pos);
2099 if (!n)
2100 break;
2103 return *pos ? NULL : n;
2106 static struct pneigh_entry *pneigh_get_first(struct seq_file *seq)
2108 struct neigh_seq_state *state = seq->private;
2109 struct neigh_table *tbl = state->tbl;
2110 struct pneigh_entry *pn = NULL;
2111 int bucket = state->bucket;
2113 state->flags |= NEIGH_SEQ_IS_PNEIGH;
2114 for (bucket = 0; bucket <= PNEIGH_HASHMASK; bucket++) {
2115 pn = tbl->phash_buckets[bucket];
2116 if (pn)
2117 break;
2119 state->bucket = bucket;
2121 return pn;
2124 static struct pneigh_entry *pneigh_get_next(struct seq_file *seq,
2125 struct pneigh_entry *pn,
2126 loff_t *pos)
2128 struct neigh_seq_state *state = seq->private;
2129 struct neigh_table *tbl = state->tbl;
2131 pn = pn->next;
2132 while (!pn) {
2133 if (++state->bucket > PNEIGH_HASHMASK)
2134 break;
2135 pn = tbl->phash_buckets[state->bucket];
2136 if (pn)
2137 break;
2140 if (pn && pos)
2141 --(*pos);
2143 return pn;
2146 static struct pneigh_entry *pneigh_get_idx(struct seq_file *seq, loff_t *pos)
2148 struct pneigh_entry *pn = pneigh_get_first(seq);
2150 if (pn) {
2151 while (*pos) {
2152 pn = pneigh_get_next(seq, pn, pos);
2153 if (!pn)
2154 break;
2157 return *pos ? NULL : pn;
2160 static void *neigh_get_idx_any(struct seq_file *seq, loff_t *pos)
2162 struct neigh_seq_state *state = seq->private;
2163 void *rc;
2165 rc = neigh_get_idx(seq, pos);
2166 if (!rc && !(state->flags & NEIGH_SEQ_NEIGH_ONLY))
2167 rc = pneigh_get_idx(seq, pos);
2169 return rc;
2172 void *neigh_seq_start(struct seq_file *seq, loff_t *pos, struct neigh_table *tbl, unsigned int neigh_seq_flags)
2174 struct neigh_seq_state *state = seq->private;
2175 loff_t pos_minus_one;
2177 state->tbl = tbl;
2178 state->bucket = 0;
2179 state->flags = (neigh_seq_flags & ~NEIGH_SEQ_IS_PNEIGH);
2181 read_lock_bh(&tbl->lock);
2183 pos_minus_one = *pos - 1;
2184 return *pos ? neigh_get_idx_any(seq, &pos_minus_one) : SEQ_START_TOKEN;
2186 EXPORT_SYMBOL(neigh_seq_start);
2188 void *neigh_seq_next(struct seq_file *seq, void *v, loff_t *pos)
2190 struct neigh_seq_state *state;
2191 void *rc;
2193 if (v == SEQ_START_TOKEN) {
2194 rc = neigh_get_idx(seq, pos);
2195 goto out;
2198 state = seq->private;
2199 if (!(state->flags & NEIGH_SEQ_IS_PNEIGH)) {
2200 rc = neigh_get_next(seq, v, NULL);
2201 if (rc)
2202 goto out;
2203 if (!(state->flags & NEIGH_SEQ_NEIGH_ONLY))
2204 rc = pneigh_get_first(seq);
2205 } else {
2206 BUG_ON(state->flags & NEIGH_SEQ_NEIGH_ONLY);
2207 rc = pneigh_get_next(seq, v, NULL);
2209 out:
2210 ++(*pos);
2211 return rc;
2213 EXPORT_SYMBOL(neigh_seq_next);
2215 void neigh_seq_stop(struct seq_file *seq, void *v)
2217 struct neigh_seq_state *state = seq->private;
2218 struct neigh_table *tbl = state->tbl;
2220 read_unlock_bh(&tbl->lock);
2222 EXPORT_SYMBOL(neigh_seq_stop);
2224 /* statistics via seq_file */
2226 static void *neigh_stat_seq_start(struct seq_file *seq, loff_t *pos)
2228 struct proc_dir_entry *pde = seq->private;
2229 struct neigh_table *tbl = pde->data;
2230 int cpu;
2232 if (*pos == 0)
2233 return SEQ_START_TOKEN;
2235 for (cpu = *pos-1; cpu < NR_CPUS; ++cpu) {
2236 if (!cpu_possible(cpu))
2237 continue;
2238 *pos = cpu+1;
2239 return per_cpu_ptr(tbl->stats, cpu);
2241 return NULL;
2244 static void *neigh_stat_seq_next(struct seq_file *seq, void *v, loff_t *pos)
2246 struct proc_dir_entry *pde = seq->private;
2247 struct neigh_table *tbl = pde->data;
2248 int cpu;
2250 for (cpu = *pos; cpu < NR_CPUS; ++cpu) {
2251 if (!cpu_possible(cpu))
2252 continue;
2253 *pos = cpu+1;
2254 return per_cpu_ptr(tbl->stats, cpu);
2256 return NULL;
2259 static void neigh_stat_seq_stop(struct seq_file *seq, void *v)
2264 static int neigh_stat_seq_show(struct seq_file *seq, void *v)
2266 struct proc_dir_entry *pde = seq->private;
2267 struct neigh_table *tbl = pde->data;
2268 struct neigh_statistics *st = v;
2270 if (v == SEQ_START_TOKEN) {
2271 seq_printf(seq, "entries allocs destroys hash_grows lookups hits res_failed rcv_probes_mcast rcv_probes_ucast periodic_gc_runs forced_gc_runs\n");
2272 return 0;
2275 seq_printf(seq, "%08x %08lx %08lx %08lx %08lx %08lx %08lx "
2276 "%08lx %08lx %08lx %08lx\n",
2277 atomic_read(&tbl->entries),
2279 st->allocs,
2280 st->destroys,
2281 st->hash_grows,
2283 st->lookups,
2284 st->hits,
2286 st->res_failed,
2288 st->rcv_probes_mcast,
2289 st->rcv_probes_ucast,
2291 st->periodic_gc_runs,
2292 st->forced_gc_runs
2295 return 0;
2298 static struct seq_operations neigh_stat_seq_ops = {
2299 .start = neigh_stat_seq_start,
2300 .next = neigh_stat_seq_next,
2301 .stop = neigh_stat_seq_stop,
2302 .show = neigh_stat_seq_show,
2305 static int neigh_stat_seq_open(struct inode *inode, struct file *file)
2307 int ret = seq_open(file, &neigh_stat_seq_ops);
2309 if (!ret) {
2310 struct seq_file *sf = file->private_data;
2311 sf->private = PDE(inode);
2313 return ret;
2316 static struct file_operations neigh_stat_seq_fops = {
2317 .owner = THIS_MODULE,
2318 .open = neigh_stat_seq_open,
2319 .read = seq_read,
2320 .llseek = seq_lseek,
2321 .release = seq_release,
2324 #endif /* CONFIG_PROC_FS */
2326 #ifdef CONFIG_ARPD
2327 void neigh_app_ns(struct neighbour *n)
2329 struct nlmsghdr *nlh;
2330 int size = NLMSG_SPACE(sizeof(struct ndmsg) + 256);
2331 struct sk_buff *skb = alloc_skb(size, GFP_ATOMIC);
2333 if (!skb)
2334 return;
2336 if (neigh_fill_info(skb, n, 0, 0, RTM_GETNEIGH, 0) < 0) {
2337 kfree_skb(skb);
2338 return;
2340 nlh = (struct nlmsghdr *)skb->data;
2341 nlh->nlmsg_flags = NLM_F_REQUEST;
2342 NETLINK_CB(skb).dst_group = RTNLGRP_NEIGH;
2343 netlink_broadcast(rtnl, skb, 0, RTNLGRP_NEIGH, GFP_ATOMIC);
2346 static void neigh_app_notify(struct neighbour *n)
2348 struct nlmsghdr *nlh;
2349 int size = NLMSG_SPACE(sizeof(struct ndmsg) + 256);
2350 struct sk_buff *skb = alloc_skb(size, GFP_ATOMIC);
2352 if (!skb)
2353 return;
2355 if (neigh_fill_info(skb, n, 0, 0, RTM_NEWNEIGH, 0) < 0) {
2356 kfree_skb(skb);
2357 return;
2359 nlh = (struct nlmsghdr *)skb->data;
2360 NETLINK_CB(skb).dst_group = RTNLGRP_NEIGH;
2361 netlink_broadcast(rtnl, skb, 0, RTNLGRP_NEIGH, GFP_ATOMIC);
2364 #endif /* CONFIG_ARPD */
2366 #ifdef CONFIG_SYSCTL
2368 static struct neigh_sysctl_table {
2369 struct ctl_table_header *sysctl_header;
2370 ctl_table neigh_vars[__NET_NEIGH_MAX];
2371 ctl_table neigh_dev[2];
2372 ctl_table neigh_neigh_dir[2];
2373 ctl_table neigh_proto_dir[2];
2374 ctl_table neigh_root_dir[2];
2375 } neigh_sysctl_template = {
2376 .neigh_vars = {
2378 .ctl_name = NET_NEIGH_MCAST_SOLICIT,
2379 .procname = "mcast_solicit",
2380 .maxlen = sizeof(int),
2381 .mode = 0644,
2382 .proc_handler = &proc_dointvec,
2385 .ctl_name = NET_NEIGH_UCAST_SOLICIT,
2386 .procname = "ucast_solicit",
2387 .maxlen = sizeof(int),
2388 .mode = 0644,
2389 .proc_handler = &proc_dointvec,
2392 .ctl_name = NET_NEIGH_APP_SOLICIT,
2393 .procname = "app_solicit",
2394 .maxlen = sizeof(int),
2395 .mode = 0644,
2396 .proc_handler = &proc_dointvec,
2399 .ctl_name = NET_NEIGH_RETRANS_TIME,
2400 .procname = "retrans_time",
2401 .maxlen = sizeof(int),
2402 .mode = 0644,
2403 .proc_handler = &proc_dointvec_userhz_jiffies,
2406 .ctl_name = NET_NEIGH_REACHABLE_TIME,
2407 .procname = "base_reachable_time",
2408 .maxlen = sizeof(int),
2409 .mode = 0644,
2410 .proc_handler = &proc_dointvec_jiffies,
2411 .strategy = &sysctl_jiffies,
2414 .ctl_name = NET_NEIGH_DELAY_PROBE_TIME,
2415 .procname = "delay_first_probe_time",
2416 .maxlen = sizeof(int),
2417 .mode = 0644,
2418 .proc_handler = &proc_dointvec_jiffies,
2419 .strategy = &sysctl_jiffies,
2422 .ctl_name = NET_NEIGH_GC_STALE_TIME,
2423 .procname = "gc_stale_time",
2424 .maxlen = sizeof(int),
2425 .mode = 0644,
2426 .proc_handler = &proc_dointvec_jiffies,
2427 .strategy = &sysctl_jiffies,
2430 .ctl_name = NET_NEIGH_UNRES_QLEN,
2431 .procname = "unres_qlen",
2432 .maxlen = sizeof(int),
2433 .mode = 0644,
2434 .proc_handler = &proc_dointvec,
2437 .ctl_name = NET_NEIGH_PROXY_QLEN,
2438 .procname = "proxy_qlen",
2439 .maxlen = sizeof(int),
2440 .mode = 0644,
2441 .proc_handler = &proc_dointvec,
2444 .ctl_name = NET_NEIGH_ANYCAST_DELAY,
2445 .procname = "anycast_delay",
2446 .maxlen = sizeof(int),
2447 .mode = 0644,
2448 .proc_handler = &proc_dointvec_userhz_jiffies,
2451 .ctl_name = NET_NEIGH_PROXY_DELAY,
2452 .procname = "proxy_delay",
2453 .maxlen = sizeof(int),
2454 .mode = 0644,
2455 .proc_handler = &proc_dointvec_userhz_jiffies,
2458 .ctl_name = NET_NEIGH_LOCKTIME,
2459 .procname = "locktime",
2460 .maxlen = sizeof(int),
2461 .mode = 0644,
2462 .proc_handler = &proc_dointvec_userhz_jiffies,
2465 .ctl_name = NET_NEIGH_GC_INTERVAL,
2466 .procname = "gc_interval",
2467 .maxlen = sizeof(int),
2468 .mode = 0644,
2469 .proc_handler = &proc_dointvec_jiffies,
2470 .strategy = &sysctl_jiffies,
2473 .ctl_name = NET_NEIGH_GC_THRESH1,
2474 .procname = "gc_thresh1",
2475 .maxlen = sizeof(int),
2476 .mode = 0644,
2477 .proc_handler = &proc_dointvec,
2480 .ctl_name = NET_NEIGH_GC_THRESH2,
2481 .procname = "gc_thresh2",
2482 .maxlen = sizeof(int),
2483 .mode = 0644,
2484 .proc_handler = &proc_dointvec,
2487 .ctl_name = NET_NEIGH_GC_THRESH3,
2488 .procname = "gc_thresh3",
2489 .maxlen = sizeof(int),
2490 .mode = 0644,
2491 .proc_handler = &proc_dointvec,
2494 .ctl_name = NET_NEIGH_RETRANS_TIME_MS,
2495 .procname = "retrans_time_ms",
2496 .maxlen = sizeof(int),
2497 .mode = 0644,
2498 .proc_handler = &proc_dointvec_ms_jiffies,
2499 .strategy = &sysctl_ms_jiffies,
2502 .ctl_name = NET_NEIGH_REACHABLE_TIME_MS,
2503 .procname = "base_reachable_time_ms",
2504 .maxlen = sizeof(int),
2505 .mode = 0644,
2506 .proc_handler = &proc_dointvec_ms_jiffies,
2507 .strategy = &sysctl_ms_jiffies,
2510 .neigh_dev = {
2512 .ctl_name = NET_PROTO_CONF_DEFAULT,
2513 .procname = "default",
2514 .mode = 0555,
2517 .neigh_neigh_dir = {
2519 .procname = "neigh",
2520 .mode = 0555,
2523 .neigh_proto_dir = {
2525 .mode = 0555,
2528 .neigh_root_dir = {
2530 .ctl_name = CTL_NET,
2531 .procname = "net",
2532 .mode = 0555,
2537 int neigh_sysctl_register(struct net_device *dev, struct neigh_parms *p,
2538 int p_id, int pdev_id, char *p_name,
2539 proc_handler *handler, ctl_handler *strategy)
2541 struct neigh_sysctl_table *t = kmalloc(sizeof(*t), GFP_KERNEL);
2542 const char *dev_name_source = NULL;
2543 char *dev_name = NULL;
2544 int err = 0;
2546 if (!t)
2547 return -ENOBUFS;
2548 memcpy(t, &neigh_sysctl_template, sizeof(*t));
2549 t->neigh_vars[0].data = &p->mcast_probes;
2550 t->neigh_vars[1].data = &p->ucast_probes;
2551 t->neigh_vars[2].data = &p->app_probes;
2552 t->neigh_vars[3].data = &p->retrans_time;
2553 t->neigh_vars[4].data = &p->base_reachable_time;
2554 t->neigh_vars[5].data = &p->delay_probe_time;
2555 t->neigh_vars[6].data = &p->gc_staletime;
2556 t->neigh_vars[7].data = &p->queue_len;
2557 t->neigh_vars[8].data = &p->proxy_qlen;
2558 t->neigh_vars[9].data = &p->anycast_delay;
2559 t->neigh_vars[10].data = &p->proxy_delay;
2560 t->neigh_vars[11].data = &p->locktime;
2562 if (dev) {
2563 dev_name_source = dev->name;
2564 t->neigh_dev[0].ctl_name = dev->ifindex;
2565 t->neigh_vars[12].procname = NULL;
2566 t->neigh_vars[13].procname = NULL;
2567 t->neigh_vars[14].procname = NULL;
2568 t->neigh_vars[15].procname = NULL;
2569 } else {
2570 dev_name_source = t->neigh_dev[0].procname;
2571 t->neigh_vars[12].data = (int *)(p + 1);
2572 t->neigh_vars[13].data = (int *)(p + 1) + 1;
2573 t->neigh_vars[14].data = (int *)(p + 1) + 2;
2574 t->neigh_vars[15].data = (int *)(p + 1) + 3;
2577 t->neigh_vars[16].data = &p->retrans_time;
2578 t->neigh_vars[17].data = &p->base_reachable_time;
2580 if (handler || strategy) {
2581 /* RetransTime */
2582 t->neigh_vars[3].proc_handler = handler;
2583 t->neigh_vars[3].strategy = strategy;
2584 t->neigh_vars[3].extra1 = dev;
2585 /* ReachableTime */
2586 t->neigh_vars[4].proc_handler = handler;
2587 t->neigh_vars[4].strategy = strategy;
2588 t->neigh_vars[4].extra1 = dev;
2589 /* RetransTime (in milliseconds)*/
2590 t->neigh_vars[16].proc_handler = handler;
2591 t->neigh_vars[16].strategy = strategy;
2592 t->neigh_vars[16].extra1 = dev;
2593 /* ReachableTime (in milliseconds) */
2594 t->neigh_vars[17].proc_handler = handler;
2595 t->neigh_vars[17].strategy = strategy;
2596 t->neigh_vars[17].extra1 = dev;
2599 dev_name = kstrdup(dev_name_source, GFP_KERNEL);
2600 if (!dev_name) {
2601 err = -ENOBUFS;
2602 goto free;
2605 t->neigh_dev[0].procname = dev_name;
2607 t->neigh_neigh_dir[0].ctl_name = pdev_id;
2609 t->neigh_proto_dir[0].procname = p_name;
2610 t->neigh_proto_dir[0].ctl_name = p_id;
2612 t->neigh_dev[0].child = t->neigh_vars;
2613 t->neigh_neigh_dir[0].child = t->neigh_dev;
2614 t->neigh_proto_dir[0].child = t->neigh_neigh_dir;
2615 t->neigh_root_dir[0].child = t->neigh_proto_dir;
2617 t->sysctl_header = register_sysctl_table(t->neigh_root_dir, 0);
2618 if (!t->sysctl_header) {
2619 err = -ENOBUFS;
2620 goto free_procname;
2622 p->sysctl_table = t;
2623 return 0;
2625 /* error path */
2626 free_procname:
2627 kfree(dev_name);
2628 free:
2629 kfree(t);
2631 return err;
2634 void neigh_sysctl_unregister(struct neigh_parms *p)
2636 if (p->sysctl_table) {
2637 struct neigh_sysctl_table *t = p->sysctl_table;
2638 p->sysctl_table = NULL;
2639 unregister_sysctl_table(t->sysctl_header);
2640 kfree(t->neigh_dev[0].procname);
2641 kfree(t);
2645 #endif /* CONFIG_SYSCTL */
2647 EXPORT_SYMBOL(__neigh_event_send);
2648 EXPORT_SYMBOL(neigh_add);
2649 EXPORT_SYMBOL(neigh_changeaddr);
2650 EXPORT_SYMBOL(neigh_compat_output);
2651 EXPORT_SYMBOL(neigh_connected_output);
2652 EXPORT_SYMBOL(neigh_create);
2653 EXPORT_SYMBOL(neigh_delete);
2654 EXPORT_SYMBOL(neigh_destroy);
2655 EXPORT_SYMBOL(neigh_dump_info);
2656 EXPORT_SYMBOL(neigh_event_ns);
2657 EXPORT_SYMBOL(neigh_ifdown);
2658 EXPORT_SYMBOL(neigh_lookup);
2659 EXPORT_SYMBOL(neigh_lookup_nodev);
2660 EXPORT_SYMBOL(neigh_parms_alloc);
2661 EXPORT_SYMBOL(neigh_parms_release);
2662 EXPORT_SYMBOL(neigh_rand_reach_time);
2663 EXPORT_SYMBOL(neigh_resolve_output);
2664 EXPORT_SYMBOL(neigh_table_clear);
2665 EXPORT_SYMBOL(neigh_table_init);
2666 EXPORT_SYMBOL(neigh_update);
2667 EXPORT_SYMBOL(neigh_update_hhs);
2668 EXPORT_SYMBOL(pneigh_enqueue);
2669 EXPORT_SYMBOL(pneigh_lookup);
2670 EXPORT_SYMBOL(neightbl_dump_info);
2671 EXPORT_SYMBOL(neightbl_set);
2673 #ifdef CONFIG_ARPD
2674 EXPORT_SYMBOL(neigh_app_ns);
2675 #endif
2676 #ifdef CONFIG_SYSCTL
2677 EXPORT_SYMBOL(neigh_sysctl_register);
2678 EXPORT_SYMBOL(neigh_sysctl_unregister);
2679 #endif