[MYRI10GE]: Use LRO.
[linux-2.6-block.git] / net / core / neighbour.c
CommitLineData
1da177e4
LT
1/*
2 * Generic address resolution entity
3 *
4 * Authors:
5 * Pedro Roque <roque@di.fc.ul.pt>
6 * Alexey Kuznetsov <kuznet@ms2.inr.ac.ru>
7 *
8 * This program is free software; you can redistribute it and/or
9 * modify it under the terms of the GNU General Public License
10 * as published by the Free Software Foundation; either version
11 * 2 of the License, or (at your option) any later version.
12 *
13 * Fixes:
14 * Vitaly E. Lavrov releasing NULL neighbor in neigh_add.
15 * Harald Welte Add neighbour cache statistics like rtstat
16 */
17
1da177e4
LT
18#include <linux/types.h>
19#include <linux/kernel.h>
20#include <linux/module.h>
21#include <linux/socket.h>
1da177e4
LT
22#include <linux/netdevice.h>
23#include <linux/proc_fs.h>
24#ifdef CONFIG_SYSCTL
25#include <linux/sysctl.h>
26#endif
27#include <linux/times.h>
28#include <net/neighbour.h>
29#include <net/dst.h>
30#include <net/sock.h>
8d71740c 31#include <net/netevent.h>
a14a49d2 32#include <net/netlink.h>
1da177e4
LT
33#include <linux/rtnetlink.h>
34#include <linux/random.h>
543537bd 35#include <linux/string.h>
c3609d51 36#include <linux/log2.h>
1da177e4
LT
37
38#define NEIGH_DEBUG 1
39
40#define NEIGH_PRINTK(x...) printk(x)
41#define NEIGH_NOPRINTK(x...) do { ; } while(0)
42#define NEIGH_PRINTK0 NEIGH_PRINTK
43#define NEIGH_PRINTK1 NEIGH_NOPRINTK
44#define NEIGH_PRINTK2 NEIGH_NOPRINTK
45
46#if NEIGH_DEBUG >= 1
47#undef NEIGH_PRINTK1
48#define NEIGH_PRINTK1 NEIGH_PRINTK
49#endif
50#if NEIGH_DEBUG >= 2
51#undef NEIGH_PRINTK2
52#define NEIGH_PRINTK2 NEIGH_PRINTK
53#endif
54
55#define PNEIGH_HASHMASK 0xF
56
57static void neigh_timer_handler(unsigned long arg);
58#ifdef CONFIG_ARPD
59static void neigh_app_notify(struct neighbour *n);
60#endif
61static int pneigh_ifdown(struct neigh_table *tbl, struct net_device *dev);
62void neigh_changeaddr(struct neigh_table *tbl, struct net_device *dev);
63
64static struct neigh_table *neigh_tables;
45fc3b11 65#ifdef CONFIG_PROC_FS
9a32144e 66static const struct file_operations neigh_stat_seq_fops;
45fc3b11 67#endif
1da177e4
LT
68
69/*
70 Neighbour hash table buckets are protected with rwlock tbl->lock.
71
72 - All the scans/updates to hash buckets MUST be made under this lock.
73 - NOTHING clever should be made under this lock: no callbacks
74 to protocol backends, no attempts to send something to network.
75 It will result in deadlocks, if backend/driver wants to use neighbour
76 cache.
77 - If the entry requires some non-trivial actions, increase
78 its reference count and release table lock.
79
80 Neighbour entries are protected:
81 - with reference count.
82 - with rwlock neigh->lock
83
84 Reference count prevents destruction.
85
86 neigh->lock mainly serializes ll address data and its validity state.
87 However, the same lock is used to protect another entry fields:
88 - timer
89 - resolution queue
90
91 Again, nothing clever shall be made under neigh->lock,
92 the most complicated procedure, which we allow is dev->hard_header.
93 It is supposed, that dev->hard_header is simplistic and does
94 not make callbacks to neighbour tables.
95
96 The last lock is neigh_tbl_lock. It is pure SMP lock, protecting
97 list of neighbour tables. This list is used only in process context,
98 */
99
100static DEFINE_RWLOCK(neigh_tbl_lock);
101
102static int neigh_blackhole(struct sk_buff *skb)
103{
104 kfree_skb(skb);
105 return -ENETDOWN;
106}
107
108/*
109 * It is random distribution in the interval (1/2)*base...(3/2)*base.
110 * It corresponds to default IPv6 settings and is not overridable,
111 * because it is really reasonable choice.
112 */
113
114unsigned long neigh_rand_reach_time(unsigned long base)
115{
116 return (base ? (net_random() % base) + (base >> 1) : 0);
117}
118
119
120static int neigh_forced_gc(struct neigh_table *tbl)
121{
122 int shrunk = 0;
123 int i;
124
125 NEIGH_CACHE_STAT_INC(tbl, forced_gc_runs);
126
127 write_lock_bh(&tbl->lock);
128 for (i = 0; i <= tbl->hash_mask; i++) {
129 struct neighbour *n, **np;
130
131 np = &tbl->hash_buckets[i];
132 while ((n = *np) != NULL) {
133 /* Neighbour record may be discarded if:
134 * - nobody refers to it.
135 * - it is not permanent
136 */
137 write_lock(&n->lock);
138 if (atomic_read(&n->refcnt) == 1 &&
139 !(n->nud_state & NUD_PERMANENT)) {
140 *np = n->next;
141 n->dead = 1;
142 shrunk = 1;
143 write_unlock(&n->lock);
ecbb4169
AK
144 if (n->parms->neigh_cleanup)
145 n->parms->neigh_cleanup(n);
1da177e4
LT
146 neigh_release(n);
147 continue;
148 }
149 write_unlock(&n->lock);
150 np = &n->next;
151 }
152 }
153
154 tbl->last_flush = jiffies;
155
156 write_unlock_bh(&tbl->lock);
157
158 return shrunk;
159}
160
161static int neigh_del_timer(struct neighbour *n)
162{
163 if ((n->nud_state & NUD_IN_TIMER) &&
164 del_timer(&n->timer)) {
165 neigh_release(n);
166 return 1;
167 }
168 return 0;
169}
170
171static void pneigh_queue_purge(struct sk_buff_head *list)
172{
173 struct sk_buff *skb;
174
175 while ((skb = skb_dequeue(list)) != NULL) {
176 dev_put(skb->dev);
177 kfree_skb(skb);
178 }
179}
180
49636bb1 181static void neigh_flush_dev(struct neigh_table *tbl, struct net_device *dev)
1da177e4
LT
182{
183 int i;
184
1da177e4
LT
185 for (i = 0; i <= tbl->hash_mask; i++) {
186 struct neighbour *n, **np = &tbl->hash_buckets[i];
187
188 while ((n = *np) != NULL) {
189 if (dev && n->dev != dev) {
190 np = &n->next;
191 continue;
192 }
193 *np = n->next;
194 write_lock(&n->lock);
195 neigh_del_timer(n);
196 n->dead = 1;
197
198 if (atomic_read(&n->refcnt) != 1) {
199 /* The most unpleasant situation.
200 We must destroy neighbour entry,
201 but someone still uses it.
202
203 The destroy will be delayed until
204 the last user releases us, but
205 we must kill timers etc. and move
206 it to safe state.
207 */
208 skb_queue_purge(&n->arp_queue);
209 n->output = neigh_blackhole;
210 if (n->nud_state & NUD_VALID)
211 n->nud_state = NUD_NOARP;
212 else
213 n->nud_state = NUD_NONE;
214 NEIGH_PRINTK2("neigh %p is stray.\n", n);
215 }
216 write_unlock(&n->lock);
ecbb4169
AK
217 if (n->parms->neigh_cleanup)
218 n->parms->neigh_cleanup(n);
1da177e4
LT
219 neigh_release(n);
220 }
221 }
49636bb1 222}
1da177e4 223
49636bb1
HX
224void neigh_changeaddr(struct neigh_table *tbl, struct net_device *dev)
225{
226 write_lock_bh(&tbl->lock);
227 neigh_flush_dev(tbl, dev);
228 write_unlock_bh(&tbl->lock);
229}
230
231int neigh_ifdown(struct neigh_table *tbl, struct net_device *dev)
232{
233 write_lock_bh(&tbl->lock);
234 neigh_flush_dev(tbl, dev);
1da177e4
LT
235 pneigh_ifdown(tbl, dev);
236 write_unlock_bh(&tbl->lock);
237
238 del_timer_sync(&tbl->proxy_timer);
239 pneigh_queue_purge(&tbl->proxy_queue);
240 return 0;
241}
242
243static struct neighbour *neigh_alloc(struct neigh_table *tbl)
244{
245 struct neighbour *n = NULL;
246 unsigned long now = jiffies;
247 int entries;
248
249 entries = atomic_inc_return(&tbl->entries) - 1;
250 if (entries >= tbl->gc_thresh3 ||
251 (entries >= tbl->gc_thresh2 &&
252 time_after(now, tbl->last_flush + 5 * HZ))) {
253 if (!neigh_forced_gc(tbl) &&
254 entries >= tbl->gc_thresh3)
255 goto out_entries;
256 }
257
c3762229 258 n = kmem_cache_zalloc(tbl->kmem_cachep, GFP_ATOMIC);
1da177e4
LT
259 if (!n)
260 goto out_entries;
261
1da177e4
LT
262 skb_queue_head_init(&n->arp_queue);
263 rwlock_init(&n->lock);
264 n->updated = n->used = now;
265 n->nud_state = NUD_NONE;
266 n->output = neigh_blackhole;
267 n->parms = neigh_parms_clone(&tbl->parms);
268 init_timer(&n->timer);
269 n->timer.function = neigh_timer_handler;
270 n->timer.data = (unsigned long)n;
271
272 NEIGH_CACHE_STAT_INC(tbl, allocs);
273 n->tbl = tbl;
274 atomic_set(&n->refcnt, 1);
275 n->dead = 1;
276out:
277 return n;
278
279out_entries:
280 atomic_dec(&tbl->entries);
281 goto out;
282}
283
284static struct neighbour **neigh_hash_alloc(unsigned int entries)
285{
286 unsigned long size = entries * sizeof(struct neighbour *);
287 struct neighbour **ret;
288
289 if (size <= PAGE_SIZE) {
77d04bd9 290 ret = kzalloc(size, GFP_ATOMIC);
1da177e4
LT
291 } else {
292 ret = (struct neighbour **)
77d04bd9 293 __get_free_pages(GFP_ATOMIC|__GFP_ZERO, get_order(size));
1da177e4 294 }
1da177e4
LT
295 return ret;
296}
297
298static void neigh_hash_free(struct neighbour **hash, unsigned int entries)
299{
300 unsigned long size = entries * sizeof(struct neighbour *);
301
302 if (size <= PAGE_SIZE)
303 kfree(hash);
304 else
305 free_pages((unsigned long)hash, get_order(size));
306}
307
308static void neigh_hash_grow(struct neigh_table *tbl, unsigned long new_entries)
309{
310 struct neighbour **new_hash, **old_hash;
311 unsigned int i, new_hash_mask, old_entries;
312
313 NEIGH_CACHE_STAT_INC(tbl, hash_grows);
314
c3609d51 315 BUG_ON(!is_power_of_2(new_entries));
1da177e4
LT
316 new_hash = neigh_hash_alloc(new_entries);
317 if (!new_hash)
318 return;
319
320 old_entries = tbl->hash_mask + 1;
321 new_hash_mask = new_entries - 1;
322 old_hash = tbl->hash_buckets;
323
324 get_random_bytes(&tbl->hash_rnd, sizeof(tbl->hash_rnd));
325 for (i = 0; i < old_entries; i++) {
326 struct neighbour *n, *next;
327
328 for (n = old_hash[i]; n; n = next) {
329 unsigned int hash_val = tbl->hash(n->primary_key, n->dev);
330
331 hash_val &= new_hash_mask;
332 next = n->next;
333
334 n->next = new_hash[hash_val];
335 new_hash[hash_val] = n;
336 }
337 }
338 tbl->hash_buckets = new_hash;
339 tbl->hash_mask = new_hash_mask;
340
341 neigh_hash_free(old_hash, old_entries);
342}
343
344struct neighbour *neigh_lookup(struct neigh_table *tbl, const void *pkey,
345 struct net_device *dev)
346{
347 struct neighbour *n;
348 int key_len = tbl->key_len;
c5e29460 349 u32 hash_val = tbl->hash(pkey, dev);
4ec93edb 350
1da177e4
LT
351 NEIGH_CACHE_STAT_INC(tbl, lookups);
352
353 read_lock_bh(&tbl->lock);
c5e29460 354 for (n = tbl->hash_buckets[hash_val & tbl->hash_mask]; n; n = n->next) {
1da177e4
LT
355 if (dev == n->dev && !memcmp(n->primary_key, pkey, key_len)) {
356 neigh_hold(n);
357 NEIGH_CACHE_STAT_INC(tbl, hits);
358 break;
359 }
360 }
361 read_unlock_bh(&tbl->lock);
362 return n;
363}
364
365struct neighbour *neigh_lookup_nodev(struct neigh_table *tbl, const void *pkey)
366{
367 struct neighbour *n;
368 int key_len = tbl->key_len;
c5e29460 369 u32 hash_val = tbl->hash(pkey, NULL);
1da177e4
LT
370
371 NEIGH_CACHE_STAT_INC(tbl, lookups);
372
373 read_lock_bh(&tbl->lock);
c5e29460 374 for (n = tbl->hash_buckets[hash_val & tbl->hash_mask]; n; n = n->next) {
1da177e4
LT
375 if (!memcmp(n->primary_key, pkey, key_len)) {
376 neigh_hold(n);
377 NEIGH_CACHE_STAT_INC(tbl, hits);
378 break;
379 }
380 }
381 read_unlock_bh(&tbl->lock);
382 return n;
383}
384
385struct neighbour *neigh_create(struct neigh_table *tbl, const void *pkey,
386 struct net_device *dev)
387{
388 u32 hash_val;
389 int key_len = tbl->key_len;
390 int error;
391 struct neighbour *n1, *rc, *n = neigh_alloc(tbl);
392
393 if (!n) {
394 rc = ERR_PTR(-ENOBUFS);
395 goto out;
396 }
397
398 memcpy(n->primary_key, pkey, key_len);
399 n->dev = dev;
400 dev_hold(dev);
401
402 /* Protocol specific setup. */
403 if (tbl->constructor && (error = tbl->constructor(n)) < 0) {
404 rc = ERR_PTR(error);
405 goto out_neigh_release;
406 }
407
408 /* Device specific setup. */
409 if (n->parms->neigh_setup &&
410 (error = n->parms->neigh_setup(n)) < 0) {
411 rc = ERR_PTR(error);
412 goto out_neigh_release;
413 }
414
415 n->confirmed = jiffies - (n->parms->base_reachable_time << 1);
416
417 write_lock_bh(&tbl->lock);
418
419 if (atomic_read(&tbl->entries) > (tbl->hash_mask + 1))
420 neigh_hash_grow(tbl, (tbl->hash_mask + 1) << 1);
421
422 hash_val = tbl->hash(pkey, dev) & tbl->hash_mask;
423
424 if (n->parms->dead) {
425 rc = ERR_PTR(-EINVAL);
426 goto out_tbl_unlock;
427 }
428
429 for (n1 = tbl->hash_buckets[hash_val]; n1; n1 = n1->next) {
430 if (dev == n1->dev && !memcmp(n1->primary_key, pkey, key_len)) {
431 neigh_hold(n1);
432 rc = n1;
433 goto out_tbl_unlock;
434 }
435 }
436
437 n->next = tbl->hash_buckets[hash_val];
438 tbl->hash_buckets[hash_val] = n;
439 n->dead = 0;
440 neigh_hold(n);
441 write_unlock_bh(&tbl->lock);
442 NEIGH_PRINTK2("neigh %p is created.\n", n);
443 rc = n;
444out:
445 return rc;
446out_tbl_unlock:
447 write_unlock_bh(&tbl->lock);
448out_neigh_release:
449 neigh_release(n);
450 goto out;
451}
452
453struct pneigh_entry * pneigh_lookup(struct neigh_table *tbl, const void *pkey,
454 struct net_device *dev, int creat)
455{
456 struct pneigh_entry *n;
457 int key_len = tbl->key_len;
458 u32 hash_val = *(u32 *)(pkey + key_len - 4);
459
460 hash_val ^= (hash_val >> 16);
461 hash_val ^= hash_val >> 8;
462 hash_val ^= hash_val >> 4;
463 hash_val &= PNEIGH_HASHMASK;
464
465 read_lock_bh(&tbl->lock);
466
467 for (n = tbl->phash_buckets[hash_val]; n; n = n->next) {
468 if (!memcmp(n->key, pkey, key_len) &&
469 (n->dev == dev || !n->dev)) {
470 read_unlock_bh(&tbl->lock);
471 goto out;
472 }
473 }
474 read_unlock_bh(&tbl->lock);
475 n = NULL;
476 if (!creat)
477 goto out;
478
479 n = kmalloc(sizeof(*n) + key_len, GFP_KERNEL);
480 if (!n)
481 goto out;
482
483 memcpy(n->key, pkey, key_len);
484 n->dev = dev;
485 if (dev)
486 dev_hold(dev);
487
488 if (tbl->pconstructor && tbl->pconstructor(n)) {
489 if (dev)
490 dev_put(dev);
491 kfree(n);
492 n = NULL;
493 goto out;
494 }
495
496 write_lock_bh(&tbl->lock);
497 n->next = tbl->phash_buckets[hash_val];
498 tbl->phash_buckets[hash_val] = n;
499 write_unlock_bh(&tbl->lock);
500out:
501 return n;
502}
503
504
505int pneigh_delete(struct neigh_table *tbl, const void *pkey,
506 struct net_device *dev)
507{
508 struct pneigh_entry *n, **np;
509 int key_len = tbl->key_len;
510 u32 hash_val = *(u32 *)(pkey + key_len - 4);
511
512 hash_val ^= (hash_val >> 16);
513 hash_val ^= hash_val >> 8;
514 hash_val ^= hash_val >> 4;
515 hash_val &= PNEIGH_HASHMASK;
516
517 write_lock_bh(&tbl->lock);
518 for (np = &tbl->phash_buckets[hash_val]; (n = *np) != NULL;
519 np = &n->next) {
520 if (!memcmp(n->key, pkey, key_len) && n->dev == dev) {
521 *np = n->next;
522 write_unlock_bh(&tbl->lock);
523 if (tbl->pdestructor)
524 tbl->pdestructor(n);
525 if (n->dev)
526 dev_put(n->dev);
527 kfree(n);
528 return 0;
529 }
530 }
531 write_unlock_bh(&tbl->lock);
532 return -ENOENT;
533}
534
535static int pneigh_ifdown(struct neigh_table *tbl, struct net_device *dev)
536{
537 struct pneigh_entry *n, **np;
538 u32 h;
539
540 for (h = 0; h <= PNEIGH_HASHMASK; h++) {
541 np = &tbl->phash_buckets[h];
542 while ((n = *np) != NULL) {
543 if (!dev || n->dev == dev) {
544 *np = n->next;
545 if (tbl->pdestructor)
546 tbl->pdestructor(n);
547 if (n->dev)
548 dev_put(n->dev);
549 kfree(n);
550 continue;
551 }
552 np = &n->next;
553 }
554 }
555 return -ENOENT;
556}
557
558
559/*
560 * neighbour must already be out of the table;
561 *
562 */
563void neigh_destroy(struct neighbour *neigh)
564{
565 struct hh_cache *hh;
566
567 NEIGH_CACHE_STAT_INC(neigh->tbl, destroys);
568
569 if (!neigh->dead) {
570 printk(KERN_WARNING
571 "Destroying alive neighbour %p\n", neigh);
572 dump_stack();
573 return;
574 }
575
576 if (neigh_del_timer(neigh))
577 printk(KERN_WARNING "Impossible event.\n");
578
579 while ((hh = neigh->hh) != NULL) {
580 neigh->hh = hh->hh_next;
581 hh->hh_next = NULL;
3644f0ce
SH
582
583 write_seqlock_bh(&hh->hh_lock);
1da177e4 584 hh->hh_output = neigh_blackhole;
3644f0ce 585 write_sequnlock_bh(&hh->hh_lock);
1da177e4
LT
586 if (atomic_dec_and_test(&hh->hh_refcnt))
587 kfree(hh);
588 }
589
1da177e4
LT
590 skb_queue_purge(&neigh->arp_queue);
591
592 dev_put(neigh->dev);
593 neigh_parms_put(neigh->parms);
594
595 NEIGH_PRINTK2("neigh %p is destroyed.\n", neigh);
596
597 atomic_dec(&neigh->tbl->entries);
598 kmem_cache_free(neigh->tbl->kmem_cachep, neigh);
599}
600
601/* Neighbour state is suspicious;
602 disable fast path.
603
604 Called with write_locked neigh.
605 */
606static void neigh_suspect(struct neighbour *neigh)
607{
608 struct hh_cache *hh;
609
610 NEIGH_PRINTK2("neigh %p is suspected.\n", neigh);
611
612 neigh->output = neigh->ops->output;
613
614 for (hh = neigh->hh; hh; hh = hh->hh_next)
615 hh->hh_output = neigh->ops->output;
616}
617
618/* Neighbour state is OK;
619 enable fast path.
620
621 Called with write_locked neigh.
622 */
623static void neigh_connect(struct neighbour *neigh)
624{
625 struct hh_cache *hh;
626
627 NEIGH_PRINTK2("neigh %p is connected.\n", neigh);
628
629 neigh->output = neigh->ops->connected_output;
630
631 for (hh = neigh->hh; hh; hh = hh->hh_next)
632 hh->hh_output = neigh->ops->hh_output;
633}
634
635static void neigh_periodic_timer(unsigned long arg)
636{
637 struct neigh_table *tbl = (struct neigh_table *)arg;
638 struct neighbour *n, **np;
639 unsigned long expire, now = jiffies;
640
641 NEIGH_CACHE_STAT_INC(tbl, periodic_gc_runs);
642
643 write_lock(&tbl->lock);
644
645 /*
646 * periodically recompute ReachableTime from random function
647 */
648
649 if (time_after(now, tbl->last_rand + 300 * HZ)) {
650 struct neigh_parms *p;
651 tbl->last_rand = now;
652 for (p = &tbl->parms; p; p = p->next)
653 p->reachable_time =
654 neigh_rand_reach_time(p->base_reachable_time);
655 }
656
657 np = &tbl->hash_buckets[tbl->hash_chain_gc];
658 tbl->hash_chain_gc = ((tbl->hash_chain_gc + 1) & tbl->hash_mask);
659
660 while ((n = *np) != NULL) {
661 unsigned int state;
662
663 write_lock(&n->lock);
664
665 state = n->nud_state;
666 if (state & (NUD_PERMANENT | NUD_IN_TIMER)) {
667 write_unlock(&n->lock);
668 goto next_elt;
669 }
670
671 if (time_before(n->used, n->confirmed))
672 n->used = n->confirmed;
673
674 if (atomic_read(&n->refcnt) == 1 &&
675 (state == NUD_FAILED ||
676 time_after(now, n->used + n->parms->gc_staletime))) {
677 *np = n->next;
678 n->dead = 1;
679 write_unlock(&n->lock);
ecbb4169
AK
680 if (n->parms->neigh_cleanup)
681 n->parms->neigh_cleanup(n);
1da177e4
LT
682 neigh_release(n);
683 continue;
684 }
685 write_unlock(&n->lock);
686
687next_elt:
688 np = &n->next;
689 }
690
4ec93edb
YH
691 /* Cycle through all hash buckets every base_reachable_time/2 ticks.
692 * ARP entry timeouts range from 1/2 base_reachable_time to 3/2
693 * base_reachable_time.
1da177e4
LT
694 */
695 expire = tbl->parms.base_reachable_time >> 1;
696 expire /= (tbl->hash_mask + 1);
697 if (!expire)
698 expire = 1;
699
f5a6e01c
AV
700 if (expire>HZ)
701 mod_timer(&tbl->gc_timer, round_jiffies(now + expire));
702 else
703 mod_timer(&tbl->gc_timer, now + expire);
1da177e4
LT
704
705 write_unlock(&tbl->lock);
706}
707
708static __inline__ int neigh_max_probes(struct neighbour *n)
709{
710 struct neigh_parms *p = n->parms;
711 return (n->nud_state & NUD_PROBE ?
712 p->ucast_probes :
713 p->ucast_probes + p->app_probes + p->mcast_probes);
714}
715
667347f1
DM
716static inline void neigh_add_timer(struct neighbour *n, unsigned long when)
717{
718 if (unlikely(mod_timer(&n->timer, when))) {
719 printk("NEIGH: BUG, double timer add, state is %x\n",
720 n->nud_state);
20375502 721 dump_stack();
667347f1
DM
722 }
723}
1da177e4
LT
724
725/* Called when a timer expires for a neighbour entry. */
726
727static void neigh_timer_handler(unsigned long arg)
728{
729 unsigned long now, next;
730 struct neighbour *neigh = (struct neighbour *)arg;
731 unsigned state;
732 int notify = 0;
733
734 write_lock(&neigh->lock);
735
736 state = neigh->nud_state;
737 now = jiffies;
738 next = now + HZ;
739
740 if (!(state & NUD_IN_TIMER)) {
741#ifndef CONFIG_SMP
742 printk(KERN_WARNING "neigh: timer & !nud_in_timer\n");
743#endif
744 goto out;
745 }
746
747 if (state & NUD_REACHABLE) {
4ec93edb 748 if (time_before_eq(now,
1da177e4
LT
749 neigh->confirmed + neigh->parms->reachable_time)) {
750 NEIGH_PRINTK2("neigh %p is still alive.\n", neigh);
751 next = neigh->confirmed + neigh->parms->reachable_time;
752 } else if (time_before_eq(now,
753 neigh->used + neigh->parms->delay_probe_time)) {
754 NEIGH_PRINTK2("neigh %p is delayed.\n", neigh);
755 neigh->nud_state = NUD_DELAY;
955aaa2f 756 neigh->updated = jiffies;
1da177e4
LT
757 neigh_suspect(neigh);
758 next = now + neigh->parms->delay_probe_time;
759 } else {
760 NEIGH_PRINTK2("neigh %p is suspected.\n", neigh);
761 neigh->nud_state = NUD_STALE;
955aaa2f 762 neigh->updated = jiffies;
1da177e4 763 neigh_suspect(neigh);
8d71740c 764 notify = 1;
1da177e4
LT
765 }
766 } else if (state & NUD_DELAY) {
4ec93edb 767 if (time_before_eq(now,
1da177e4
LT
768 neigh->confirmed + neigh->parms->delay_probe_time)) {
769 NEIGH_PRINTK2("neigh %p is now reachable.\n", neigh);
770 neigh->nud_state = NUD_REACHABLE;
955aaa2f 771 neigh->updated = jiffies;
1da177e4 772 neigh_connect(neigh);
8d71740c 773 notify = 1;
1da177e4
LT
774 next = neigh->confirmed + neigh->parms->reachable_time;
775 } else {
776 NEIGH_PRINTK2("neigh %p is probed.\n", neigh);
777 neigh->nud_state = NUD_PROBE;
955aaa2f 778 neigh->updated = jiffies;
1da177e4
LT
779 atomic_set(&neigh->probes, 0);
780 next = now + neigh->parms->retrans_time;
781 }
782 } else {
783 /* NUD_PROBE|NUD_INCOMPLETE */
784 next = now + neigh->parms->retrans_time;
785 }
786
787 if ((neigh->nud_state & (NUD_INCOMPLETE | NUD_PROBE)) &&
788 atomic_read(&neigh->probes) >= neigh_max_probes(neigh)) {
789 struct sk_buff *skb;
790
791 neigh->nud_state = NUD_FAILED;
955aaa2f 792 neigh->updated = jiffies;
1da177e4
LT
793 notify = 1;
794 NEIGH_CACHE_STAT_INC(neigh->tbl, res_failed);
795 NEIGH_PRINTK2("neigh %p is failed.\n", neigh);
796
797 /* It is very thin place. report_unreachable is very complicated
798 routine. Particularly, it can hit the same neighbour entry!
799
800 So that, we try to be accurate and avoid dead loop. --ANK
801 */
802 while (neigh->nud_state == NUD_FAILED &&
803 (skb = __skb_dequeue(&neigh->arp_queue)) != NULL) {
804 write_unlock(&neigh->lock);
805 neigh->ops->error_report(neigh, skb);
806 write_lock(&neigh->lock);
807 }
808 skb_queue_purge(&neigh->arp_queue);
809 }
810
811 if (neigh->nud_state & NUD_IN_TIMER) {
1da177e4
LT
812 if (time_before(next, jiffies + HZ/2))
813 next = jiffies + HZ/2;
6fb9974f
HX
814 if (!mod_timer(&neigh->timer, next))
815 neigh_hold(neigh);
1da177e4
LT
816 }
817 if (neigh->nud_state & (NUD_INCOMPLETE | NUD_PROBE)) {
818 struct sk_buff *skb = skb_peek(&neigh->arp_queue);
819 /* keep skb alive even if arp_queue overflows */
820 if (skb)
821 skb_get(skb);
822 write_unlock(&neigh->lock);
823 neigh->ops->solicit(neigh, skb);
824 atomic_inc(&neigh->probes);
825 if (skb)
826 kfree_skb(skb);
827 } else {
828out:
829 write_unlock(&neigh->lock);
830 }
8d71740c
TT
831 if (notify)
832 call_netevent_notifiers(NETEVENT_NEIGH_UPDATE, neigh);
1da177e4
LT
833
834#ifdef CONFIG_ARPD
835 if (notify && neigh->parms->app_probes)
836 neigh_app_notify(neigh);
837#endif
838 neigh_release(neigh);
839}
840
841int __neigh_event_send(struct neighbour *neigh, struct sk_buff *skb)
842{
843 int rc;
844 unsigned long now;
845
846 write_lock_bh(&neigh->lock);
847
848 rc = 0;
849 if (neigh->nud_state & (NUD_CONNECTED | NUD_DELAY | NUD_PROBE))
850 goto out_unlock_bh;
851
852 now = jiffies;
4ec93edb 853
1da177e4
LT
854 if (!(neigh->nud_state & (NUD_STALE | NUD_INCOMPLETE))) {
855 if (neigh->parms->mcast_probes + neigh->parms->app_probes) {
856 atomic_set(&neigh->probes, neigh->parms->ucast_probes);
857 neigh->nud_state = NUD_INCOMPLETE;
955aaa2f 858 neigh->updated = jiffies;
1da177e4 859 neigh_hold(neigh);
667347f1 860 neigh_add_timer(neigh, now + 1);
1da177e4
LT
861 } else {
862 neigh->nud_state = NUD_FAILED;
955aaa2f 863 neigh->updated = jiffies;
1da177e4
LT
864 write_unlock_bh(&neigh->lock);
865
866 if (skb)
867 kfree_skb(skb);
868 return 1;
869 }
870 } else if (neigh->nud_state & NUD_STALE) {
871 NEIGH_PRINTK2("neigh %p is delayed.\n", neigh);
872 neigh_hold(neigh);
873 neigh->nud_state = NUD_DELAY;
955aaa2f 874 neigh->updated = jiffies;
667347f1
DM
875 neigh_add_timer(neigh,
876 jiffies + neigh->parms->delay_probe_time);
1da177e4
LT
877 }
878
879 if (neigh->nud_state == NUD_INCOMPLETE) {
880 if (skb) {
881 if (skb_queue_len(&neigh->arp_queue) >=
882 neigh->parms->queue_len) {
883 struct sk_buff *buff;
884 buff = neigh->arp_queue.next;
885 __skb_unlink(buff, &neigh->arp_queue);
886 kfree_skb(buff);
887 }
888 __skb_queue_tail(&neigh->arp_queue, skb);
889 }
890 rc = 1;
891 }
892out_unlock_bh:
893 write_unlock_bh(&neigh->lock);
894 return rc;
895}
896
e92b43a3 897static void neigh_update_hhs(struct neighbour *neigh)
1da177e4
LT
898{
899 struct hh_cache *hh;
900 void (*update)(struct hh_cache*, struct net_device*, unsigned char *) =
901 neigh->dev->header_cache_update;
902
903 if (update) {
904 for (hh = neigh->hh; hh; hh = hh->hh_next) {
3644f0ce 905 write_seqlock_bh(&hh->hh_lock);
1da177e4 906 update(hh, neigh->dev, neigh->ha);
3644f0ce 907 write_sequnlock_bh(&hh->hh_lock);
1da177e4
LT
908 }
909 }
910}
911
912
913
914/* Generic update routine.
915 -- lladdr is new lladdr or NULL, if it is not supplied.
916 -- new is new state.
917 -- flags
918 NEIGH_UPDATE_F_OVERRIDE allows to override existing lladdr,
919 if it is different.
920 NEIGH_UPDATE_F_WEAK_OVERRIDE will suspect existing "connected"
4ec93edb 921 lladdr instead of overriding it
1da177e4
LT
922 if it is different.
923 It also allows to retain current state
924 if lladdr is unchanged.
925 NEIGH_UPDATE_F_ADMIN means that the change is administrative.
926
4ec93edb 927 NEIGH_UPDATE_F_OVERRIDE_ISROUTER allows to override existing
1da177e4
LT
928 NTF_ROUTER flag.
929 NEIGH_UPDATE_F_ISROUTER indicates if the neighbour is known as
930 a router.
931
932 Caller MUST hold reference count on the entry.
933 */
934
935int neigh_update(struct neighbour *neigh, const u8 *lladdr, u8 new,
936 u32 flags)
937{
938 u8 old;
939 int err;
1da177e4 940 int notify = 0;
1da177e4
LT
941 struct net_device *dev;
942 int update_isrouter = 0;
943
944 write_lock_bh(&neigh->lock);
945
946 dev = neigh->dev;
947 old = neigh->nud_state;
948 err = -EPERM;
949
4ec93edb 950 if (!(flags & NEIGH_UPDATE_F_ADMIN) &&
1da177e4
LT
951 (old & (NUD_NOARP | NUD_PERMANENT)))
952 goto out;
953
954 if (!(new & NUD_VALID)) {
955 neigh_del_timer(neigh);
956 if (old & NUD_CONNECTED)
957 neigh_suspect(neigh);
958 neigh->nud_state = new;
959 err = 0;
1da177e4 960 notify = old & NUD_VALID;
1da177e4
LT
961 goto out;
962 }
963
964 /* Compare new lladdr with cached one */
965 if (!dev->addr_len) {
966 /* First case: device needs no address. */
967 lladdr = neigh->ha;
968 } else if (lladdr) {
969 /* The second case: if something is already cached
970 and a new address is proposed:
971 - compare new & old
972 - if they are different, check override flag
973 */
4ec93edb 974 if ((old & NUD_VALID) &&
1da177e4
LT
975 !memcmp(lladdr, neigh->ha, dev->addr_len))
976 lladdr = neigh->ha;
977 } else {
978 /* No address is supplied; if we know something,
979 use it, otherwise discard the request.
980 */
981 err = -EINVAL;
982 if (!(old & NUD_VALID))
983 goto out;
984 lladdr = neigh->ha;
985 }
986
987 if (new & NUD_CONNECTED)
988 neigh->confirmed = jiffies;
989 neigh->updated = jiffies;
990
991 /* If entry was valid and address is not changed,
992 do not change entry state, if new one is STALE.
993 */
994 err = 0;
995 update_isrouter = flags & NEIGH_UPDATE_F_OVERRIDE_ISROUTER;
996 if (old & NUD_VALID) {
997 if (lladdr != neigh->ha && !(flags & NEIGH_UPDATE_F_OVERRIDE)) {
998 update_isrouter = 0;
999 if ((flags & NEIGH_UPDATE_F_WEAK_OVERRIDE) &&
1000 (old & NUD_CONNECTED)) {
1001 lladdr = neigh->ha;
1002 new = NUD_STALE;
1003 } else
1004 goto out;
1005 } else {
1006 if (lladdr == neigh->ha && new == NUD_STALE &&
1007 ((flags & NEIGH_UPDATE_F_WEAK_OVERRIDE) ||
1008 (old & NUD_CONNECTED))
1009 )
1010 new = old;
1011 }
1012 }
1013
1014 if (new != old) {
1015 neigh_del_timer(neigh);
1016 if (new & NUD_IN_TIMER) {
1017 neigh_hold(neigh);
4ec93edb
YH
1018 neigh_add_timer(neigh, (jiffies +
1019 ((new & NUD_REACHABLE) ?
667347f1
DM
1020 neigh->parms->reachable_time :
1021 0)));
1da177e4
LT
1022 }
1023 neigh->nud_state = new;
1024 }
1025
1026 if (lladdr != neigh->ha) {
1027 memcpy(&neigh->ha, lladdr, dev->addr_len);
1028 neigh_update_hhs(neigh);
1029 if (!(new & NUD_CONNECTED))
1030 neigh->confirmed = jiffies -
1031 (neigh->parms->base_reachable_time << 1);
1da177e4 1032 notify = 1;
1da177e4
LT
1033 }
1034 if (new == old)
1035 goto out;
1036 if (new & NUD_CONNECTED)
1037 neigh_connect(neigh);
1038 else
1039 neigh_suspect(neigh);
1040 if (!(old & NUD_VALID)) {
1041 struct sk_buff *skb;
1042
1043 /* Again: avoid dead loop if something went wrong */
1044
1045 while (neigh->nud_state & NUD_VALID &&
1046 (skb = __skb_dequeue(&neigh->arp_queue)) != NULL) {
1047 struct neighbour *n1 = neigh;
1048 write_unlock_bh(&neigh->lock);
1049 /* On shaper/eql skb->dst->neighbour != neigh :( */
1050 if (skb->dst && skb->dst->neighbour)
1051 n1 = skb->dst->neighbour;
1052 n1->output(skb);
1053 write_lock_bh(&neigh->lock);
1054 }
1055 skb_queue_purge(&neigh->arp_queue);
1056 }
1057out:
1058 if (update_isrouter) {
1059 neigh->flags = (flags & NEIGH_UPDATE_F_ISROUTER) ?
1060 (neigh->flags | NTF_ROUTER) :
1061 (neigh->flags & ~NTF_ROUTER);
1062 }
1063 write_unlock_bh(&neigh->lock);
8d71740c
TT
1064
1065 if (notify)
1066 call_netevent_notifiers(NETEVENT_NEIGH_UPDATE, neigh);
1da177e4
LT
1067#ifdef CONFIG_ARPD
1068 if (notify && neigh->parms->app_probes)
1069 neigh_app_notify(neigh);
1070#endif
1071 return err;
1072}
1073
1074struct neighbour *neigh_event_ns(struct neigh_table *tbl,
1075 u8 *lladdr, void *saddr,
1076 struct net_device *dev)
1077{
1078 struct neighbour *neigh = __neigh_lookup(tbl, saddr, dev,
1079 lladdr || !dev->addr_len);
1080 if (neigh)
4ec93edb 1081 neigh_update(neigh, lladdr, NUD_STALE,
1da177e4
LT
1082 NEIGH_UPDATE_F_OVERRIDE);
1083 return neigh;
1084}
1085
1086static void neigh_hh_init(struct neighbour *n, struct dst_entry *dst,
d77072ec 1087 __be16 protocol)
1da177e4
LT
1088{
1089 struct hh_cache *hh;
1090 struct net_device *dev = dst->dev;
1091
1092 for (hh = n->hh; hh; hh = hh->hh_next)
1093 if (hh->hh_type == protocol)
1094 break;
1095
77d04bd9 1096 if (!hh && (hh = kzalloc(sizeof(*hh), GFP_ATOMIC)) != NULL) {
3644f0ce 1097 seqlock_init(&hh->hh_lock);
1da177e4
LT
1098 hh->hh_type = protocol;
1099 atomic_set(&hh->hh_refcnt, 0);
1100 hh->hh_next = NULL;
1101 if (dev->hard_header_cache(n, hh)) {
1102 kfree(hh);
1103 hh = NULL;
1104 } else {
1105 atomic_inc(&hh->hh_refcnt);
1106 hh->hh_next = n->hh;
1107 n->hh = hh;
1108 if (n->nud_state & NUD_CONNECTED)
1109 hh->hh_output = n->ops->hh_output;
1110 else
1111 hh->hh_output = n->ops->output;
1112 }
1113 }
1114 if (hh) {
1115 atomic_inc(&hh->hh_refcnt);
1116 dst->hh = hh;
1117 }
1118}
1119
1120/* This function can be used in contexts, where only old dev_queue_xmit
1121 worked, f.e. if you want to override normal output path (eql, shaper),
1122 but resolution is not made yet.
1123 */
1124
1125int neigh_compat_output(struct sk_buff *skb)
1126{
1127 struct net_device *dev = skb->dev;
1128
bbe735e4 1129 __skb_pull(skb, skb_network_offset(skb));
1da177e4
LT
1130
1131 if (dev->hard_header &&
1132 dev->hard_header(skb, dev, ntohs(skb->protocol), NULL, NULL,
4ec93edb 1133 skb->len) < 0 &&
1da177e4
LT
1134 dev->rebuild_header(skb))
1135 return 0;
1136
1137 return dev_queue_xmit(skb);
1138}
1139
1140/* Slow and careful. */
1141
1142int neigh_resolve_output(struct sk_buff *skb)
1143{
1144 struct dst_entry *dst = skb->dst;
1145 struct neighbour *neigh;
1146 int rc = 0;
1147
1148 if (!dst || !(neigh = dst->neighbour))
1149 goto discard;
1150
bbe735e4 1151 __skb_pull(skb, skb_network_offset(skb));
1da177e4
LT
1152
1153 if (!neigh_event_send(neigh, skb)) {
1154 int err;
1155 struct net_device *dev = neigh->dev;
1156 if (dev->hard_header_cache && !dst->hh) {
1157 write_lock_bh(&neigh->lock);
1158 if (!dst->hh)
1159 neigh_hh_init(neigh, dst, dst->ops->protocol);
1160 err = dev->hard_header(skb, dev, ntohs(skb->protocol),
1161 neigh->ha, NULL, skb->len);
1162 write_unlock_bh(&neigh->lock);
1163 } else {
1164 read_lock_bh(&neigh->lock);
1165 err = dev->hard_header(skb, dev, ntohs(skb->protocol),
1166 neigh->ha, NULL, skb->len);
1167 read_unlock_bh(&neigh->lock);
1168 }
1169 if (err >= 0)
1170 rc = neigh->ops->queue_xmit(skb);
1171 else
1172 goto out_kfree_skb;
1173 }
1174out:
1175 return rc;
1176discard:
1177 NEIGH_PRINTK1("neigh_resolve_output: dst=%p neigh=%p\n",
1178 dst, dst ? dst->neighbour : NULL);
1179out_kfree_skb:
1180 rc = -EINVAL;
1181 kfree_skb(skb);
1182 goto out;
1183}
1184
1185/* As fast as possible without hh cache */
1186
1187int neigh_connected_output(struct sk_buff *skb)
1188{
1189 int err;
1190 struct dst_entry *dst = skb->dst;
1191 struct neighbour *neigh = dst->neighbour;
1192 struct net_device *dev = neigh->dev;
1193
bbe735e4 1194 __skb_pull(skb, skb_network_offset(skb));
1da177e4
LT
1195
1196 read_lock_bh(&neigh->lock);
1197 err = dev->hard_header(skb, dev, ntohs(skb->protocol),
1198 neigh->ha, NULL, skb->len);
1199 read_unlock_bh(&neigh->lock);
1200 if (err >= 0)
1201 err = neigh->ops->queue_xmit(skb);
1202 else {
1203 err = -EINVAL;
1204 kfree_skb(skb);
1205 }
1206 return err;
1207}
1208
1209static void neigh_proxy_process(unsigned long arg)
1210{
1211 struct neigh_table *tbl = (struct neigh_table *)arg;
1212 long sched_next = 0;
1213 unsigned long now = jiffies;
1214 struct sk_buff *skb;
1215
1216 spin_lock(&tbl->proxy_queue.lock);
1217
1218 skb = tbl->proxy_queue.next;
1219
1220 while (skb != (struct sk_buff *)&tbl->proxy_queue) {
1221 struct sk_buff *back = skb;
a61bbcf2 1222 long tdif = NEIGH_CB(back)->sched_next - now;
1da177e4
LT
1223
1224 skb = skb->next;
1225 if (tdif <= 0) {
1226 struct net_device *dev = back->dev;
1227 __skb_unlink(back, &tbl->proxy_queue);
1228 if (tbl->proxy_redo && netif_running(dev))
1229 tbl->proxy_redo(back);
1230 else
1231 kfree_skb(back);
1232
1233 dev_put(dev);
1234 } else if (!sched_next || tdif < sched_next)
1235 sched_next = tdif;
1236 }
1237 del_timer(&tbl->proxy_timer);
1238 if (sched_next)
1239 mod_timer(&tbl->proxy_timer, jiffies + sched_next);
1240 spin_unlock(&tbl->proxy_queue.lock);
1241}
1242
1243void pneigh_enqueue(struct neigh_table *tbl, struct neigh_parms *p,
1244 struct sk_buff *skb)
1245{
1246 unsigned long now = jiffies;
1247 unsigned long sched_next = now + (net_random() % p->proxy_delay);
1248
1249 if (tbl->proxy_queue.qlen > p->proxy_qlen) {
1250 kfree_skb(skb);
1251 return;
1252 }
a61bbcf2
PM
1253
1254 NEIGH_CB(skb)->sched_next = sched_next;
1255 NEIGH_CB(skb)->flags |= LOCALLY_ENQUEUED;
1da177e4
LT
1256
1257 spin_lock(&tbl->proxy_queue.lock);
1258 if (del_timer(&tbl->proxy_timer)) {
1259 if (time_before(tbl->proxy_timer.expires, sched_next))
1260 sched_next = tbl->proxy_timer.expires;
1261 }
1262 dst_release(skb->dst);
1263 skb->dst = NULL;
1264 dev_hold(skb->dev);
1265 __skb_queue_tail(&tbl->proxy_queue, skb);
1266 mod_timer(&tbl->proxy_timer, sched_next);
1267 spin_unlock(&tbl->proxy_queue.lock);
1268}
1269
1270
1271struct neigh_parms *neigh_parms_alloc(struct net_device *dev,
1272 struct neigh_table *tbl)
1273{
b1a98bf6 1274 struct neigh_parms *p = kmemdup(&tbl->parms, sizeof(*p), GFP_KERNEL);
1da177e4
LT
1275
1276 if (p) {
1da177e4
LT
1277 p->tbl = tbl;
1278 atomic_set(&p->refcnt, 1);
1279 INIT_RCU_HEAD(&p->rcu_head);
1280 p->reachable_time =
1281 neigh_rand_reach_time(p->base_reachable_time);
c7fb64db
TG
1282 if (dev) {
1283 if (dev->neigh_setup && dev->neigh_setup(dev, p)) {
1284 kfree(p);
1285 return NULL;
1286 }
1287
1288 dev_hold(dev);
1289 p->dev = dev;
1da177e4
LT
1290 }
1291 p->sysctl_table = NULL;
1292 write_lock_bh(&tbl->lock);
1293 p->next = tbl->parms.next;
1294 tbl->parms.next = p;
1295 write_unlock_bh(&tbl->lock);
1296 }
1297 return p;
1298}
1299
1300static void neigh_rcu_free_parms(struct rcu_head *head)
1301{
1302 struct neigh_parms *parms =
1303 container_of(head, struct neigh_parms, rcu_head);
1304
1305 neigh_parms_put(parms);
1306}
1307
1308void neigh_parms_release(struct neigh_table *tbl, struct neigh_parms *parms)
1309{
1310 struct neigh_parms **p;
1311
1312 if (!parms || parms == &tbl->parms)
1313 return;
1314 write_lock_bh(&tbl->lock);
1315 for (p = &tbl->parms.next; *p; p = &(*p)->next) {
1316 if (*p == parms) {
1317 *p = parms->next;
1318 parms->dead = 1;
1319 write_unlock_bh(&tbl->lock);
c7fb64db
TG
1320 if (parms->dev)
1321 dev_put(parms->dev);
1da177e4
LT
1322 call_rcu(&parms->rcu_head, neigh_rcu_free_parms);
1323 return;
1324 }
1325 }
1326 write_unlock_bh(&tbl->lock);
1327 NEIGH_PRINTK1("neigh_parms_release: not found\n");
1328}
1329
1330void neigh_parms_destroy(struct neigh_parms *parms)
1331{
1332 kfree(parms);
1333}
1334
c2ecba71
PE
1335static struct lock_class_key neigh_table_proxy_queue_class;
1336
bd89efc5 1337void neigh_table_init_no_netlink(struct neigh_table *tbl)
1da177e4
LT
1338{
1339 unsigned long now = jiffies;
1340 unsigned long phsize;
1341
1342 atomic_set(&tbl->parms.refcnt, 1);
1343 INIT_RCU_HEAD(&tbl->parms.rcu_head);
1344 tbl->parms.reachable_time =
1345 neigh_rand_reach_time(tbl->parms.base_reachable_time);
1346
1347 if (!tbl->kmem_cachep)
e5d679f3
AD
1348 tbl->kmem_cachep =
1349 kmem_cache_create(tbl->id, tbl->entry_size, 0,
1350 SLAB_HWCACHE_ALIGN|SLAB_PANIC,
20c2df83 1351 NULL);
1da177e4
LT
1352 tbl->stats = alloc_percpu(struct neigh_statistics);
1353 if (!tbl->stats)
1354 panic("cannot create neighbour cache statistics");
4ec93edb 1355
1da177e4
LT
1356#ifdef CONFIG_PROC_FS
1357 tbl->pde = create_proc_entry(tbl->id, 0, proc_net_stat);
4ec93edb 1358 if (!tbl->pde)
1da177e4
LT
1359 panic("cannot create neighbour proc dir entry");
1360 tbl->pde->proc_fops = &neigh_stat_seq_fops;
1361 tbl->pde->data = tbl;
1362#endif
1363
1364 tbl->hash_mask = 1;
1365 tbl->hash_buckets = neigh_hash_alloc(tbl->hash_mask + 1);
1366
1367 phsize = (PNEIGH_HASHMASK + 1) * sizeof(struct pneigh_entry *);
77d04bd9 1368 tbl->phash_buckets = kzalloc(phsize, GFP_KERNEL);
1da177e4
LT
1369
1370 if (!tbl->hash_buckets || !tbl->phash_buckets)
1371 panic("cannot allocate neighbour cache hashes");
1372
1da177e4
LT
1373 get_random_bytes(&tbl->hash_rnd, sizeof(tbl->hash_rnd));
1374
1375 rwlock_init(&tbl->lock);
1376 init_timer(&tbl->gc_timer);
1377 tbl->gc_timer.data = (unsigned long)tbl;
1378 tbl->gc_timer.function = neigh_periodic_timer;
1379 tbl->gc_timer.expires = now + 1;
1380 add_timer(&tbl->gc_timer);
1381
1382 init_timer(&tbl->proxy_timer);
1383 tbl->proxy_timer.data = (unsigned long)tbl;
1384 tbl->proxy_timer.function = neigh_proxy_process;
c2ecba71
PE
1385 skb_queue_head_init_class(&tbl->proxy_queue,
1386 &neigh_table_proxy_queue_class);
1da177e4
LT
1387
1388 tbl->last_flush = now;
1389 tbl->last_rand = now + tbl->parms.reachable_time * 20;
bd89efc5
SK
1390}
1391
1392void neigh_table_init(struct neigh_table *tbl)
1393{
1394 struct neigh_table *tmp;
1395
1396 neigh_table_init_no_netlink(tbl);
1da177e4 1397 write_lock(&neigh_tbl_lock);
bd89efc5
SK
1398 for (tmp = neigh_tables; tmp; tmp = tmp->next) {
1399 if (tmp->family == tbl->family)
1400 break;
1401 }
1da177e4
LT
1402 tbl->next = neigh_tables;
1403 neigh_tables = tbl;
1404 write_unlock(&neigh_tbl_lock);
bd89efc5
SK
1405
1406 if (unlikely(tmp)) {
1407 printk(KERN_ERR "NEIGH: Registering multiple tables for "
1408 "family %d\n", tbl->family);
1409 dump_stack();
1410 }
1da177e4
LT
1411}
1412
1413int neigh_table_clear(struct neigh_table *tbl)
1414{
1415 struct neigh_table **tp;
1416
1417 /* It is not clean... Fix it to unload IPv6 module safely */
1418 del_timer_sync(&tbl->gc_timer);
1419 del_timer_sync(&tbl->proxy_timer);
1420 pneigh_queue_purge(&tbl->proxy_queue);
1421 neigh_ifdown(tbl, NULL);
1422 if (atomic_read(&tbl->entries))
1423 printk(KERN_CRIT "neighbour leakage\n");
1424 write_lock(&neigh_tbl_lock);
1425 for (tp = &neigh_tables; *tp; tp = &(*tp)->next) {
1426 if (*tp == tbl) {
1427 *tp = tbl->next;
1428 break;
1429 }
1430 }
1431 write_unlock(&neigh_tbl_lock);
1432
1433 neigh_hash_free(tbl->hash_buckets, tbl->hash_mask + 1);
1434 tbl->hash_buckets = NULL;
1435
1436 kfree(tbl->phash_buckets);
1437 tbl->phash_buckets = NULL;
1438
3fcde74b
KK
1439 free_percpu(tbl->stats);
1440 tbl->stats = NULL;
1441
1da177e4
LT
1442 return 0;
1443}
1444
c8822a4e 1445static int neigh_delete(struct sk_buff *skb, struct nlmsghdr *nlh, void *arg)
1da177e4 1446{
a14a49d2
TG
1447 struct ndmsg *ndm;
1448 struct nlattr *dst_attr;
1da177e4
LT
1449 struct neigh_table *tbl;
1450 struct net_device *dev = NULL;
a14a49d2 1451 int err = -EINVAL;
1da177e4 1452
a14a49d2 1453 if (nlmsg_len(nlh) < sizeof(*ndm))
1da177e4
LT
1454 goto out;
1455
a14a49d2
TG
1456 dst_attr = nlmsg_find_attr(nlh, sizeof(*ndm), NDA_DST);
1457 if (dst_attr == NULL)
1458 goto out;
1459
1460 ndm = nlmsg_data(nlh);
1461 if (ndm->ndm_ifindex) {
1462 dev = dev_get_by_index(ndm->ndm_ifindex);
1463 if (dev == NULL) {
1464 err = -ENODEV;
1465 goto out;
1466 }
1467 }
1468
1da177e4
LT
1469 read_lock(&neigh_tbl_lock);
1470 for (tbl = neigh_tables; tbl; tbl = tbl->next) {
a14a49d2 1471 struct neighbour *neigh;
1da177e4
LT
1472
1473 if (tbl->family != ndm->ndm_family)
1474 continue;
1475 read_unlock(&neigh_tbl_lock);
1476
a14a49d2 1477 if (nla_len(dst_attr) < tbl->key_len)
1da177e4
LT
1478 goto out_dev_put;
1479
1480 if (ndm->ndm_flags & NTF_PROXY) {
a14a49d2 1481 err = pneigh_delete(tbl, nla_data(dst_attr), dev);
1da177e4
LT
1482 goto out_dev_put;
1483 }
1484
a14a49d2
TG
1485 if (dev == NULL)
1486 goto out_dev_put;
1da177e4 1487
a14a49d2
TG
1488 neigh = neigh_lookup(tbl, nla_data(dst_attr), dev);
1489 if (neigh == NULL) {
1490 err = -ENOENT;
1491 goto out_dev_put;
1da177e4 1492 }
a14a49d2
TG
1493
1494 err = neigh_update(neigh, NULL, NUD_FAILED,
1495 NEIGH_UPDATE_F_OVERRIDE |
1496 NEIGH_UPDATE_F_ADMIN);
1497 neigh_release(neigh);
1da177e4
LT
1498 goto out_dev_put;
1499 }
1500 read_unlock(&neigh_tbl_lock);
a14a49d2
TG
1501 err = -EAFNOSUPPORT;
1502
1da177e4
LT
1503out_dev_put:
1504 if (dev)
1505 dev_put(dev);
1506out:
1507 return err;
1508}
1509
c8822a4e 1510static int neigh_add(struct sk_buff *skb, struct nlmsghdr *nlh, void *arg)
1da177e4 1511{
5208debd
TG
1512 struct ndmsg *ndm;
1513 struct nlattr *tb[NDA_MAX+1];
1da177e4
LT
1514 struct neigh_table *tbl;
1515 struct net_device *dev = NULL;
5208debd 1516 int err;
1da177e4 1517
5208debd
TG
1518 err = nlmsg_parse(nlh, sizeof(*ndm), tb, NDA_MAX, NULL);
1519 if (err < 0)
1da177e4
LT
1520 goto out;
1521
5208debd
TG
1522 err = -EINVAL;
1523 if (tb[NDA_DST] == NULL)
1524 goto out;
1525
1526 ndm = nlmsg_data(nlh);
1527 if (ndm->ndm_ifindex) {
1528 dev = dev_get_by_index(ndm->ndm_ifindex);
1529 if (dev == NULL) {
1530 err = -ENODEV;
1531 goto out;
1532 }
1533
1534 if (tb[NDA_LLADDR] && nla_len(tb[NDA_LLADDR]) < dev->addr_len)
1535 goto out_dev_put;
1536 }
1537
1da177e4
LT
1538 read_lock(&neigh_tbl_lock);
1539 for (tbl = neigh_tables; tbl; tbl = tbl->next) {
5208debd
TG
1540 int flags = NEIGH_UPDATE_F_ADMIN | NEIGH_UPDATE_F_OVERRIDE;
1541 struct neighbour *neigh;
1542 void *dst, *lladdr;
1da177e4
LT
1543
1544 if (tbl->family != ndm->ndm_family)
1545 continue;
1546 read_unlock(&neigh_tbl_lock);
1547
5208debd 1548 if (nla_len(tb[NDA_DST]) < tbl->key_len)
1da177e4 1549 goto out_dev_put;
5208debd
TG
1550 dst = nla_data(tb[NDA_DST]);
1551 lladdr = tb[NDA_LLADDR] ? nla_data(tb[NDA_LLADDR]) : NULL;
1da177e4
LT
1552
1553 if (ndm->ndm_flags & NTF_PROXY) {
62dd9318
VN
1554 struct pneigh_entry *pn;
1555
1556 err = -ENOBUFS;
1557 pn = pneigh_lookup(tbl, dst, dev, 1);
1558 if (pn) {
1559 pn->flags = ndm->ndm_flags;
1560 err = 0;
1561 }
1da177e4
LT
1562 goto out_dev_put;
1563 }
1564
5208debd 1565 if (dev == NULL)
1da177e4 1566 goto out_dev_put;
5208debd
TG
1567
1568 neigh = neigh_lookup(tbl, dst, dev);
1569 if (neigh == NULL) {
1570 if (!(nlh->nlmsg_flags & NLM_F_CREATE)) {
1571 err = -ENOENT;
1572 goto out_dev_put;
1573 }
4ec93edb 1574
5208debd
TG
1575 neigh = __neigh_lookup_errno(tbl, dst, dev);
1576 if (IS_ERR(neigh)) {
1577 err = PTR_ERR(neigh);
1da177e4
LT
1578 goto out_dev_put;
1579 }
1da177e4 1580 } else {
5208debd
TG
1581 if (nlh->nlmsg_flags & NLM_F_EXCL) {
1582 err = -EEXIST;
1583 neigh_release(neigh);
1da177e4
LT
1584 goto out_dev_put;
1585 }
1da177e4 1586
5208debd
TG
1587 if (!(nlh->nlmsg_flags & NLM_F_REPLACE))
1588 flags &= ~NEIGH_UPDATE_F_OVERRIDE;
1589 }
1da177e4 1590
5208debd
TG
1591 err = neigh_update(neigh, lladdr, ndm->ndm_state, flags);
1592 neigh_release(neigh);
1da177e4
LT
1593 goto out_dev_put;
1594 }
1595
1596 read_unlock(&neigh_tbl_lock);
5208debd
TG
1597 err = -EAFNOSUPPORT;
1598
1da177e4
LT
1599out_dev_put:
1600 if (dev)
1601 dev_put(dev);
1602out:
1603 return err;
1604}
1605
c7fb64db
TG
1606static int neightbl_fill_parms(struct sk_buff *skb, struct neigh_parms *parms)
1607{
ca860fb3
TG
1608 struct nlattr *nest;
1609
1610 nest = nla_nest_start(skb, NDTA_PARMS);
1611 if (nest == NULL)
1612 return -ENOBUFS;
c7fb64db
TG
1613
1614 if (parms->dev)
ca860fb3
TG
1615 NLA_PUT_U32(skb, NDTPA_IFINDEX, parms->dev->ifindex);
1616
1617 NLA_PUT_U32(skb, NDTPA_REFCNT, atomic_read(&parms->refcnt));
1618 NLA_PUT_U32(skb, NDTPA_QUEUE_LEN, parms->queue_len);
1619 NLA_PUT_U32(skb, NDTPA_PROXY_QLEN, parms->proxy_qlen);
1620 NLA_PUT_U32(skb, NDTPA_APP_PROBES, parms->app_probes);
1621 NLA_PUT_U32(skb, NDTPA_UCAST_PROBES, parms->ucast_probes);
1622 NLA_PUT_U32(skb, NDTPA_MCAST_PROBES, parms->mcast_probes);
1623 NLA_PUT_MSECS(skb, NDTPA_REACHABLE_TIME, parms->reachable_time);
1624 NLA_PUT_MSECS(skb, NDTPA_BASE_REACHABLE_TIME,
c7fb64db 1625 parms->base_reachable_time);
ca860fb3
TG
1626 NLA_PUT_MSECS(skb, NDTPA_GC_STALETIME, parms->gc_staletime);
1627 NLA_PUT_MSECS(skb, NDTPA_DELAY_PROBE_TIME, parms->delay_probe_time);
1628 NLA_PUT_MSECS(skb, NDTPA_RETRANS_TIME, parms->retrans_time);
1629 NLA_PUT_MSECS(skb, NDTPA_ANYCAST_DELAY, parms->anycast_delay);
1630 NLA_PUT_MSECS(skb, NDTPA_PROXY_DELAY, parms->proxy_delay);
1631 NLA_PUT_MSECS(skb, NDTPA_LOCKTIME, parms->locktime);
c7fb64db 1632
ca860fb3 1633 return nla_nest_end(skb, nest);
c7fb64db 1634
ca860fb3
TG
1635nla_put_failure:
1636 return nla_nest_cancel(skb, nest);
c7fb64db
TG
1637}
1638
ca860fb3
TG
1639static int neightbl_fill_info(struct sk_buff *skb, struct neigh_table *tbl,
1640 u32 pid, u32 seq, int type, int flags)
c7fb64db
TG
1641{
1642 struct nlmsghdr *nlh;
1643 struct ndtmsg *ndtmsg;
1644
ca860fb3
TG
1645 nlh = nlmsg_put(skb, pid, seq, type, sizeof(*ndtmsg), flags);
1646 if (nlh == NULL)
26932566 1647 return -EMSGSIZE;
c7fb64db 1648
ca860fb3 1649 ndtmsg = nlmsg_data(nlh);
c7fb64db
TG
1650
1651 read_lock_bh(&tbl->lock);
1652 ndtmsg->ndtm_family = tbl->family;
9ef1d4c7
PM
1653 ndtmsg->ndtm_pad1 = 0;
1654 ndtmsg->ndtm_pad2 = 0;
c7fb64db 1655
ca860fb3
TG
1656 NLA_PUT_STRING(skb, NDTA_NAME, tbl->id);
1657 NLA_PUT_MSECS(skb, NDTA_GC_INTERVAL, tbl->gc_interval);
1658 NLA_PUT_U32(skb, NDTA_THRESH1, tbl->gc_thresh1);
1659 NLA_PUT_U32(skb, NDTA_THRESH2, tbl->gc_thresh2);
1660 NLA_PUT_U32(skb, NDTA_THRESH3, tbl->gc_thresh3);
c7fb64db
TG
1661
1662 {
1663 unsigned long now = jiffies;
1664 unsigned int flush_delta = now - tbl->last_flush;
1665 unsigned int rand_delta = now - tbl->last_rand;
1666
1667 struct ndt_config ndc = {
1668 .ndtc_key_len = tbl->key_len,
1669 .ndtc_entry_size = tbl->entry_size,
1670 .ndtc_entries = atomic_read(&tbl->entries),
1671 .ndtc_last_flush = jiffies_to_msecs(flush_delta),
1672 .ndtc_last_rand = jiffies_to_msecs(rand_delta),
1673 .ndtc_hash_rnd = tbl->hash_rnd,
1674 .ndtc_hash_mask = tbl->hash_mask,
1675 .ndtc_hash_chain_gc = tbl->hash_chain_gc,
1676 .ndtc_proxy_qlen = tbl->proxy_queue.qlen,
1677 };
1678
ca860fb3 1679 NLA_PUT(skb, NDTA_CONFIG, sizeof(ndc), &ndc);
c7fb64db
TG
1680 }
1681
1682 {
1683 int cpu;
1684 struct ndt_stats ndst;
1685
1686 memset(&ndst, 0, sizeof(ndst));
1687
6f912042 1688 for_each_possible_cpu(cpu) {
c7fb64db
TG
1689 struct neigh_statistics *st;
1690
c7fb64db
TG
1691 st = per_cpu_ptr(tbl->stats, cpu);
1692 ndst.ndts_allocs += st->allocs;
1693 ndst.ndts_destroys += st->destroys;
1694 ndst.ndts_hash_grows += st->hash_grows;
1695 ndst.ndts_res_failed += st->res_failed;
1696 ndst.ndts_lookups += st->lookups;
1697 ndst.ndts_hits += st->hits;
1698 ndst.ndts_rcv_probes_mcast += st->rcv_probes_mcast;
1699 ndst.ndts_rcv_probes_ucast += st->rcv_probes_ucast;
1700 ndst.ndts_periodic_gc_runs += st->periodic_gc_runs;
1701 ndst.ndts_forced_gc_runs += st->forced_gc_runs;
1702 }
1703
ca860fb3 1704 NLA_PUT(skb, NDTA_STATS, sizeof(ndst), &ndst);
c7fb64db
TG
1705 }
1706
1707 BUG_ON(tbl->parms.dev);
1708 if (neightbl_fill_parms(skb, &tbl->parms) < 0)
ca860fb3 1709 goto nla_put_failure;
c7fb64db
TG
1710
1711 read_unlock_bh(&tbl->lock);
ca860fb3 1712 return nlmsg_end(skb, nlh);
c7fb64db 1713
ca860fb3 1714nla_put_failure:
c7fb64db 1715 read_unlock_bh(&tbl->lock);
26932566
PM
1716 nlmsg_cancel(skb, nlh);
1717 return -EMSGSIZE;
c7fb64db
TG
1718}
1719
ca860fb3
TG
1720static int neightbl_fill_param_info(struct sk_buff *skb,
1721 struct neigh_table *tbl,
c7fb64db 1722 struct neigh_parms *parms,
ca860fb3
TG
1723 u32 pid, u32 seq, int type,
1724 unsigned int flags)
c7fb64db
TG
1725{
1726 struct ndtmsg *ndtmsg;
1727 struct nlmsghdr *nlh;
1728
ca860fb3
TG
1729 nlh = nlmsg_put(skb, pid, seq, type, sizeof(*ndtmsg), flags);
1730 if (nlh == NULL)
26932566 1731 return -EMSGSIZE;
c7fb64db 1732
ca860fb3 1733 ndtmsg = nlmsg_data(nlh);
c7fb64db
TG
1734
1735 read_lock_bh(&tbl->lock);
1736 ndtmsg->ndtm_family = tbl->family;
9ef1d4c7
PM
1737 ndtmsg->ndtm_pad1 = 0;
1738 ndtmsg->ndtm_pad2 = 0;
c7fb64db 1739
ca860fb3
TG
1740 if (nla_put_string(skb, NDTA_NAME, tbl->id) < 0 ||
1741 neightbl_fill_parms(skb, parms) < 0)
1742 goto errout;
c7fb64db
TG
1743
1744 read_unlock_bh(&tbl->lock);
ca860fb3
TG
1745 return nlmsg_end(skb, nlh);
1746errout:
c7fb64db 1747 read_unlock_bh(&tbl->lock);
26932566
PM
1748 nlmsg_cancel(skb, nlh);
1749 return -EMSGSIZE;
c7fb64db 1750}
4ec93edb 1751
c7fb64db
TG
1752static inline struct neigh_parms *lookup_neigh_params(struct neigh_table *tbl,
1753 int ifindex)
1754{
1755 struct neigh_parms *p;
4ec93edb 1756
c7fb64db
TG
1757 for (p = &tbl->parms; p; p = p->next)
1758 if ((p->dev && p->dev->ifindex == ifindex) ||
1759 (!p->dev && !ifindex))
1760 return p;
1761
1762 return NULL;
1763}
1764
ef7c79ed 1765static const struct nla_policy nl_neightbl_policy[NDTA_MAX+1] = {
6b3f8674
TG
1766 [NDTA_NAME] = { .type = NLA_STRING },
1767 [NDTA_THRESH1] = { .type = NLA_U32 },
1768 [NDTA_THRESH2] = { .type = NLA_U32 },
1769 [NDTA_THRESH3] = { .type = NLA_U32 },
1770 [NDTA_GC_INTERVAL] = { .type = NLA_U64 },
1771 [NDTA_PARMS] = { .type = NLA_NESTED },
1772};
1773
ef7c79ed 1774static const struct nla_policy nl_ntbl_parm_policy[NDTPA_MAX+1] = {
6b3f8674
TG
1775 [NDTPA_IFINDEX] = { .type = NLA_U32 },
1776 [NDTPA_QUEUE_LEN] = { .type = NLA_U32 },
1777 [NDTPA_PROXY_QLEN] = { .type = NLA_U32 },
1778 [NDTPA_APP_PROBES] = { .type = NLA_U32 },
1779 [NDTPA_UCAST_PROBES] = { .type = NLA_U32 },
1780 [NDTPA_MCAST_PROBES] = { .type = NLA_U32 },
1781 [NDTPA_BASE_REACHABLE_TIME] = { .type = NLA_U64 },
1782 [NDTPA_GC_STALETIME] = { .type = NLA_U64 },
1783 [NDTPA_DELAY_PROBE_TIME] = { .type = NLA_U64 },
1784 [NDTPA_RETRANS_TIME] = { .type = NLA_U64 },
1785 [NDTPA_ANYCAST_DELAY] = { .type = NLA_U64 },
1786 [NDTPA_PROXY_DELAY] = { .type = NLA_U64 },
1787 [NDTPA_LOCKTIME] = { .type = NLA_U64 },
1788};
1789
c8822a4e 1790static int neightbl_set(struct sk_buff *skb, struct nlmsghdr *nlh, void *arg)
c7fb64db
TG
1791{
1792 struct neigh_table *tbl;
6b3f8674
TG
1793 struct ndtmsg *ndtmsg;
1794 struct nlattr *tb[NDTA_MAX+1];
1795 int err;
c7fb64db 1796
6b3f8674
TG
1797 err = nlmsg_parse(nlh, sizeof(*ndtmsg), tb, NDTA_MAX,
1798 nl_neightbl_policy);
1799 if (err < 0)
1800 goto errout;
c7fb64db 1801
6b3f8674
TG
1802 if (tb[NDTA_NAME] == NULL) {
1803 err = -EINVAL;
1804 goto errout;
1805 }
1806
1807 ndtmsg = nlmsg_data(nlh);
c7fb64db
TG
1808 read_lock(&neigh_tbl_lock);
1809 for (tbl = neigh_tables; tbl; tbl = tbl->next) {
1810 if (ndtmsg->ndtm_family && tbl->family != ndtmsg->ndtm_family)
1811 continue;
1812
6b3f8674 1813 if (nla_strcmp(tb[NDTA_NAME], tbl->id) == 0)
c7fb64db
TG
1814 break;
1815 }
1816
1817 if (tbl == NULL) {
1818 err = -ENOENT;
6b3f8674 1819 goto errout_locked;
c7fb64db
TG
1820 }
1821
4ec93edb 1822 /*
c7fb64db
TG
1823 * We acquire tbl->lock to be nice to the periodic timers and
1824 * make sure they always see a consistent set of values.
1825 */
1826 write_lock_bh(&tbl->lock);
1827
6b3f8674
TG
1828 if (tb[NDTA_PARMS]) {
1829 struct nlattr *tbp[NDTPA_MAX+1];
c7fb64db 1830 struct neigh_parms *p;
6b3f8674 1831 int i, ifindex = 0;
c7fb64db 1832
6b3f8674
TG
1833 err = nla_parse_nested(tbp, NDTPA_MAX, tb[NDTA_PARMS],
1834 nl_ntbl_parm_policy);
1835 if (err < 0)
1836 goto errout_tbl_lock;
c7fb64db 1837
6b3f8674
TG
1838 if (tbp[NDTPA_IFINDEX])
1839 ifindex = nla_get_u32(tbp[NDTPA_IFINDEX]);
c7fb64db
TG
1840
1841 p = lookup_neigh_params(tbl, ifindex);
1842 if (p == NULL) {
1843 err = -ENOENT;
6b3f8674 1844 goto errout_tbl_lock;
c7fb64db 1845 }
c7fb64db 1846
6b3f8674
TG
1847 for (i = 1; i <= NDTPA_MAX; i++) {
1848 if (tbp[i] == NULL)
1849 continue;
c7fb64db 1850
6b3f8674
TG
1851 switch (i) {
1852 case NDTPA_QUEUE_LEN:
1853 p->queue_len = nla_get_u32(tbp[i]);
1854 break;
1855 case NDTPA_PROXY_QLEN:
1856 p->proxy_qlen = nla_get_u32(tbp[i]);
1857 break;
1858 case NDTPA_APP_PROBES:
1859 p->app_probes = nla_get_u32(tbp[i]);
1860 break;
1861 case NDTPA_UCAST_PROBES:
1862 p->ucast_probes = nla_get_u32(tbp[i]);
1863 break;
1864 case NDTPA_MCAST_PROBES:
1865 p->mcast_probes = nla_get_u32(tbp[i]);
1866 break;
1867 case NDTPA_BASE_REACHABLE_TIME:
1868 p->base_reachable_time = nla_get_msecs(tbp[i]);
1869 break;
1870 case NDTPA_GC_STALETIME:
1871 p->gc_staletime = nla_get_msecs(tbp[i]);
1872 break;
1873 case NDTPA_DELAY_PROBE_TIME:
1874 p->delay_probe_time = nla_get_msecs(tbp[i]);
1875 break;
1876 case NDTPA_RETRANS_TIME:
1877 p->retrans_time = nla_get_msecs(tbp[i]);
1878 break;
1879 case NDTPA_ANYCAST_DELAY:
1880 p->anycast_delay = nla_get_msecs(tbp[i]);
1881 break;
1882 case NDTPA_PROXY_DELAY:
1883 p->proxy_delay = nla_get_msecs(tbp[i]);
1884 break;
1885 case NDTPA_LOCKTIME:
1886 p->locktime = nla_get_msecs(tbp[i]);
1887 break;
1888 }
1889 }
1890 }
c7fb64db 1891
6b3f8674
TG
1892 if (tb[NDTA_THRESH1])
1893 tbl->gc_thresh1 = nla_get_u32(tb[NDTA_THRESH1]);
c7fb64db 1894
6b3f8674
TG
1895 if (tb[NDTA_THRESH2])
1896 tbl->gc_thresh2 = nla_get_u32(tb[NDTA_THRESH2]);
c7fb64db 1897
6b3f8674
TG
1898 if (tb[NDTA_THRESH3])
1899 tbl->gc_thresh3 = nla_get_u32(tb[NDTA_THRESH3]);
c7fb64db 1900
6b3f8674
TG
1901 if (tb[NDTA_GC_INTERVAL])
1902 tbl->gc_interval = nla_get_msecs(tb[NDTA_GC_INTERVAL]);
c7fb64db
TG
1903
1904 err = 0;
1905
6b3f8674 1906errout_tbl_lock:
c7fb64db 1907 write_unlock_bh(&tbl->lock);
6b3f8674 1908errout_locked:
c7fb64db 1909 read_unlock(&neigh_tbl_lock);
6b3f8674 1910errout:
c7fb64db
TG
1911 return err;
1912}
1913
c8822a4e 1914static int neightbl_dump_info(struct sk_buff *skb, struct netlink_callback *cb)
c7fb64db 1915{
ca860fb3
TG
1916 int family, tidx, nidx = 0;
1917 int tbl_skip = cb->args[0];
1918 int neigh_skip = cb->args[1];
c7fb64db
TG
1919 struct neigh_table *tbl;
1920
ca860fb3 1921 family = ((struct rtgenmsg *) nlmsg_data(cb->nlh))->rtgen_family;
c7fb64db
TG
1922
1923 read_lock(&neigh_tbl_lock);
ca860fb3 1924 for (tbl = neigh_tables, tidx = 0; tbl; tbl = tbl->next, tidx++) {
c7fb64db
TG
1925 struct neigh_parms *p;
1926
ca860fb3 1927 if (tidx < tbl_skip || (family && tbl->family != family))
c7fb64db
TG
1928 continue;
1929
ca860fb3
TG
1930 if (neightbl_fill_info(skb, tbl, NETLINK_CB(cb->skb).pid,
1931 cb->nlh->nlmsg_seq, RTM_NEWNEIGHTBL,
1932 NLM_F_MULTI) <= 0)
c7fb64db
TG
1933 break;
1934
ca860fb3
TG
1935 for (nidx = 0, p = tbl->parms.next; p; p = p->next, nidx++) {
1936 if (nidx < neigh_skip)
c7fb64db
TG
1937 continue;
1938
ca860fb3
TG
1939 if (neightbl_fill_param_info(skb, tbl, p,
1940 NETLINK_CB(cb->skb).pid,
1941 cb->nlh->nlmsg_seq,
1942 RTM_NEWNEIGHTBL,
1943 NLM_F_MULTI) <= 0)
c7fb64db
TG
1944 goto out;
1945 }
1946
ca860fb3 1947 neigh_skip = 0;
c7fb64db
TG
1948 }
1949out:
1950 read_unlock(&neigh_tbl_lock);
ca860fb3
TG
1951 cb->args[0] = tidx;
1952 cb->args[1] = nidx;
c7fb64db
TG
1953
1954 return skb->len;
1955}
1da177e4 1956
8b8aec50
TG
1957static int neigh_fill_info(struct sk_buff *skb, struct neighbour *neigh,
1958 u32 pid, u32 seq, int type, unsigned int flags)
1da177e4
LT
1959{
1960 unsigned long now = jiffies;
1da177e4 1961 struct nda_cacheinfo ci;
8b8aec50
TG
1962 struct nlmsghdr *nlh;
1963 struct ndmsg *ndm;
1964
1965 nlh = nlmsg_put(skb, pid, seq, type, sizeof(*ndm), flags);
1966 if (nlh == NULL)
26932566 1967 return -EMSGSIZE;
1da177e4 1968
8b8aec50
TG
1969 ndm = nlmsg_data(nlh);
1970 ndm->ndm_family = neigh->ops->family;
9ef1d4c7
PM
1971 ndm->ndm_pad1 = 0;
1972 ndm->ndm_pad2 = 0;
8b8aec50
TG
1973 ndm->ndm_flags = neigh->flags;
1974 ndm->ndm_type = neigh->type;
1975 ndm->ndm_ifindex = neigh->dev->ifindex;
1da177e4 1976
8b8aec50
TG
1977 NLA_PUT(skb, NDA_DST, neigh->tbl->key_len, neigh->primary_key);
1978
1979 read_lock_bh(&neigh->lock);
1980 ndm->ndm_state = neigh->nud_state;
1981 if ((neigh->nud_state & NUD_VALID) &&
1982 nla_put(skb, NDA_LLADDR, neigh->dev->addr_len, neigh->ha) < 0) {
1983 read_unlock_bh(&neigh->lock);
1984 goto nla_put_failure;
1985 }
1986
1987 ci.ndm_used = now - neigh->used;
1988 ci.ndm_confirmed = now - neigh->confirmed;
1989 ci.ndm_updated = now - neigh->updated;
1990 ci.ndm_refcnt = atomic_read(&neigh->refcnt) - 1;
1991 read_unlock_bh(&neigh->lock);
1992
1993 NLA_PUT_U32(skb, NDA_PROBES, atomic_read(&neigh->probes));
1994 NLA_PUT(skb, NDA_CACHEINFO, sizeof(ci), &ci);
1995
1996 return nlmsg_end(skb, nlh);
1997
1998nla_put_failure:
26932566
PM
1999 nlmsg_cancel(skb, nlh);
2000 return -EMSGSIZE;
1da177e4
LT
2001}
2002
2003
2004static int neigh_dump_table(struct neigh_table *tbl, struct sk_buff *skb,
2005 struct netlink_callback *cb)
2006{
2007 struct neighbour *n;
2008 int rc, h, s_h = cb->args[1];
2009 int idx, s_idx = idx = cb->args[2];
2010
c5e29460 2011 read_lock_bh(&tbl->lock);
1da177e4
LT
2012 for (h = 0; h <= tbl->hash_mask; h++) {
2013 if (h < s_h)
2014 continue;
2015 if (h > s_h)
2016 s_idx = 0;
1da177e4
LT
2017 for (n = tbl->hash_buckets[h], idx = 0; n; n = n->next, idx++) {
2018 if (idx < s_idx)
2019 continue;
2020 if (neigh_fill_info(skb, n, NETLINK_CB(cb->skb).pid,
2021 cb->nlh->nlmsg_seq,
b6544c0b
JHS
2022 RTM_NEWNEIGH,
2023 NLM_F_MULTI) <= 0) {
1da177e4
LT
2024 read_unlock_bh(&tbl->lock);
2025 rc = -1;
2026 goto out;
2027 }
2028 }
1da177e4 2029 }
c5e29460 2030 read_unlock_bh(&tbl->lock);
1da177e4
LT
2031 rc = skb->len;
2032out:
2033 cb->args[1] = h;
2034 cb->args[2] = idx;
2035 return rc;
2036}
2037
c8822a4e 2038static int neigh_dump_info(struct sk_buff *skb, struct netlink_callback *cb)
1da177e4
LT
2039{
2040 struct neigh_table *tbl;
2041 int t, family, s_t;
2042
2043 read_lock(&neigh_tbl_lock);
8b8aec50 2044 family = ((struct rtgenmsg *) nlmsg_data(cb->nlh))->rtgen_family;
1da177e4
LT
2045 s_t = cb->args[0];
2046
2047 for (tbl = neigh_tables, t = 0; tbl; tbl = tbl->next, t++) {
2048 if (t < s_t || (family && tbl->family != family))
2049 continue;
2050 if (t > s_t)
2051 memset(&cb->args[1], 0, sizeof(cb->args) -
2052 sizeof(cb->args[0]));
2053 if (neigh_dump_table(tbl, skb, cb) < 0)
2054 break;
2055 }
2056 read_unlock(&neigh_tbl_lock);
2057
2058 cb->args[0] = t;
2059 return skb->len;
2060}
2061
2062void neigh_for_each(struct neigh_table *tbl, void (*cb)(struct neighbour *, void *), void *cookie)
2063{
2064 int chain;
2065
2066 read_lock_bh(&tbl->lock);
2067 for (chain = 0; chain <= tbl->hash_mask; chain++) {
2068 struct neighbour *n;
2069
2070 for (n = tbl->hash_buckets[chain]; n; n = n->next)
2071 cb(n, cookie);
2072 }
2073 read_unlock_bh(&tbl->lock);
2074}
2075EXPORT_SYMBOL(neigh_for_each);
2076
2077/* The tbl->lock must be held as a writer and BH disabled. */
2078void __neigh_for_each_release(struct neigh_table *tbl,
2079 int (*cb)(struct neighbour *))
2080{
2081 int chain;
2082
2083 for (chain = 0; chain <= tbl->hash_mask; chain++) {
2084 struct neighbour *n, **np;
2085
2086 np = &tbl->hash_buckets[chain];
2087 while ((n = *np) != NULL) {
2088 int release;
2089
2090 write_lock(&n->lock);
2091 release = cb(n);
2092 if (release) {
2093 *np = n->next;
2094 n->dead = 1;
2095 } else
2096 np = &n->next;
2097 write_unlock(&n->lock);
ecbb4169
AK
2098 if (release) {
2099 if (n->parms->neigh_cleanup)
2100 n->parms->neigh_cleanup(n);
1da177e4 2101 neigh_release(n);
ecbb4169 2102 }
1da177e4
LT
2103 }
2104 }
2105}
2106EXPORT_SYMBOL(__neigh_for_each_release);
2107
2108#ifdef CONFIG_PROC_FS
2109
2110static struct neighbour *neigh_get_first(struct seq_file *seq)
2111{
2112 struct neigh_seq_state *state = seq->private;
2113 struct neigh_table *tbl = state->tbl;
2114 struct neighbour *n = NULL;
2115 int bucket = state->bucket;
2116
2117 state->flags &= ~NEIGH_SEQ_IS_PNEIGH;
2118 for (bucket = 0; bucket <= tbl->hash_mask; bucket++) {
2119 n = tbl->hash_buckets[bucket];
2120
2121 while (n) {
2122 if (state->neigh_sub_iter) {
2123 loff_t fakep = 0;
2124 void *v;
2125
2126 v = state->neigh_sub_iter(state, n, &fakep);
2127 if (!v)
2128 goto next;
2129 }
2130 if (!(state->flags & NEIGH_SEQ_SKIP_NOARP))
2131 break;
2132 if (n->nud_state & ~NUD_NOARP)
2133 break;
2134 next:
2135 n = n->next;
2136 }
2137
2138 if (n)
2139 break;
2140 }
2141 state->bucket = bucket;
2142
2143 return n;
2144}
2145
2146static struct neighbour *neigh_get_next(struct seq_file *seq,
2147 struct neighbour *n,
2148 loff_t *pos)
2149{
2150 struct neigh_seq_state *state = seq->private;
2151 struct neigh_table *tbl = state->tbl;
2152
2153 if (state->neigh_sub_iter) {
2154 void *v = state->neigh_sub_iter(state, n, pos);
2155 if (v)
2156 return n;
2157 }
2158 n = n->next;
2159
2160 while (1) {
2161 while (n) {
2162 if (state->neigh_sub_iter) {
2163 void *v = state->neigh_sub_iter(state, n, pos);
2164 if (v)
2165 return n;
2166 goto next;
2167 }
2168 if (!(state->flags & NEIGH_SEQ_SKIP_NOARP))
2169 break;
2170
2171 if (n->nud_state & ~NUD_NOARP)
2172 break;
2173 next:
2174 n = n->next;
2175 }
2176
2177 if (n)
2178 break;
2179
2180 if (++state->bucket > tbl->hash_mask)
2181 break;
2182
2183 n = tbl->hash_buckets[state->bucket];
2184 }
2185
2186 if (n && pos)
2187 --(*pos);
2188 return n;
2189}
2190
2191static struct neighbour *neigh_get_idx(struct seq_file *seq, loff_t *pos)
2192{
2193 struct neighbour *n = neigh_get_first(seq);
2194
2195 if (n) {
2196 while (*pos) {
2197 n = neigh_get_next(seq, n, pos);
2198 if (!n)
2199 break;
2200 }
2201 }
2202 return *pos ? NULL : n;
2203}
2204
2205static struct pneigh_entry *pneigh_get_first(struct seq_file *seq)
2206{
2207 struct neigh_seq_state *state = seq->private;
2208 struct neigh_table *tbl = state->tbl;
2209 struct pneigh_entry *pn = NULL;
2210 int bucket = state->bucket;
2211
2212 state->flags |= NEIGH_SEQ_IS_PNEIGH;
2213 for (bucket = 0; bucket <= PNEIGH_HASHMASK; bucket++) {
2214 pn = tbl->phash_buckets[bucket];
2215 if (pn)
2216 break;
2217 }
2218 state->bucket = bucket;
2219
2220 return pn;
2221}
2222
2223static struct pneigh_entry *pneigh_get_next(struct seq_file *seq,
2224 struct pneigh_entry *pn,
2225 loff_t *pos)
2226{
2227 struct neigh_seq_state *state = seq->private;
2228 struct neigh_table *tbl = state->tbl;
2229
2230 pn = pn->next;
2231 while (!pn) {
2232 if (++state->bucket > PNEIGH_HASHMASK)
2233 break;
2234 pn = tbl->phash_buckets[state->bucket];
2235 if (pn)
2236 break;
2237 }
2238
2239 if (pn && pos)
2240 --(*pos);
2241
2242 return pn;
2243}
2244
2245static struct pneigh_entry *pneigh_get_idx(struct seq_file *seq, loff_t *pos)
2246{
2247 struct pneigh_entry *pn = pneigh_get_first(seq);
2248
2249 if (pn) {
2250 while (*pos) {
2251 pn = pneigh_get_next(seq, pn, pos);
2252 if (!pn)
2253 break;
2254 }
2255 }
2256 return *pos ? NULL : pn;
2257}
2258
2259static void *neigh_get_idx_any(struct seq_file *seq, loff_t *pos)
2260{
2261 struct neigh_seq_state *state = seq->private;
2262 void *rc;
2263
2264 rc = neigh_get_idx(seq, pos);
2265 if (!rc && !(state->flags & NEIGH_SEQ_NEIGH_ONLY))
2266 rc = pneigh_get_idx(seq, pos);
2267
2268 return rc;
2269}
2270
2271void *neigh_seq_start(struct seq_file *seq, loff_t *pos, struct neigh_table *tbl, unsigned int neigh_seq_flags)
2272{
2273 struct neigh_seq_state *state = seq->private;
2274 loff_t pos_minus_one;
2275
2276 state->tbl = tbl;
2277 state->bucket = 0;
2278 state->flags = (neigh_seq_flags & ~NEIGH_SEQ_IS_PNEIGH);
2279
2280 read_lock_bh(&tbl->lock);
2281
2282 pos_minus_one = *pos - 1;
2283 return *pos ? neigh_get_idx_any(seq, &pos_minus_one) : SEQ_START_TOKEN;
2284}
2285EXPORT_SYMBOL(neigh_seq_start);
2286
2287void *neigh_seq_next(struct seq_file *seq, void *v, loff_t *pos)
2288{
2289 struct neigh_seq_state *state;
2290 void *rc;
2291
2292 if (v == SEQ_START_TOKEN) {
2293 rc = neigh_get_idx(seq, pos);
2294 goto out;
2295 }
2296
2297 state = seq->private;
2298 if (!(state->flags & NEIGH_SEQ_IS_PNEIGH)) {
2299 rc = neigh_get_next(seq, v, NULL);
2300 if (rc)
2301 goto out;
2302 if (!(state->flags & NEIGH_SEQ_NEIGH_ONLY))
2303 rc = pneigh_get_first(seq);
2304 } else {
2305 BUG_ON(state->flags & NEIGH_SEQ_NEIGH_ONLY);
2306 rc = pneigh_get_next(seq, v, NULL);
2307 }
2308out:
2309 ++(*pos);
2310 return rc;
2311}
2312EXPORT_SYMBOL(neigh_seq_next);
2313
2314void neigh_seq_stop(struct seq_file *seq, void *v)
2315{
2316 struct neigh_seq_state *state = seq->private;
2317 struct neigh_table *tbl = state->tbl;
2318
2319 read_unlock_bh(&tbl->lock);
2320}
2321EXPORT_SYMBOL(neigh_seq_stop);
2322
2323/* statistics via seq_file */
2324
2325static void *neigh_stat_seq_start(struct seq_file *seq, loff_t *pos)
2326{
2327 struct proc_dir_entry *pde = seq->private;
2328 struct neigh_table *tbl = pde->data;
2329 int cpu;
2330
2331 if (*pos == 0)
2332 return SEQ_START_TOKEN;
4ec93edb 2333
1da177e4
LT
2334 for (cpu = *pos-1; cpu < NR_CPUS; ++cpu) {
2335 if (!cpu_possible(cpu))
2336 continue;
2337 *pos = cpu+1;
2338 return per_cpu_ptr(tbl->stats, cpu);
2339 }
2340 return NULL;
2341}
2342
2343static void *neigh_stat_seq_next(struct seq_file *seq, void *v, loff_t *pos)
2344{
2345 struct proc_dir_entry *pde = seq->private;
2346 struct neigh_table *tbl = pde->data;
2347 int cpu;
2348
2349 for (cpu = *pos; cpu < NR_CPUS; ++cpu) {
2350 if (!cpu_possible(cpu))
2351 continue;
2352 *pos = cpu+1;
2353 return per_cpu_ptr(tbl->stats, cpu);
2354 }
2355 return NULL;
2356}
2357
2358static void neigh_stat_seq_stop(struct seq_file *seq, void *v)
2359{
2360
2361}
2362
2363static int neigh_stat_seq_show(struct seq_file *seq, void *v)
2364{
2365 struct proc_dir_entry *pde = seq->private;
2366 struct neigh_table *tbl = pde->data;
2367 struct neigh_statistics *st = v;
2368
2369 if (v == SEQ_START_TOKEN) {
5bec0039 2370 seq_printf(seq, "entries allocs destroys hash_grows lookups hits res_failed rcv_probes_mcast rcv_probes_ucast periodic_gc_runs forced_gc_runs\n");
1da177e4
LT
2371 return 0;
2372 }
2373
2374 seq_printf(seq, "%08x %08lx %08lx %08lx %08lx %08lx %08lx "
2375 "%08lx %08lx %08lx %08lx\n",
2376 atomic_read(&tbl->entries),
2377
2378 st->allocs,
2379 st->destroys,
2380 st->hash_grows,
2381
2382 st->lookups,
2383 st->hits,
2384
2385 st->res_failed,
2386
2387 st->rcv_probes_mcast,
2388 st->rcv_probes_ucast,
2389
2390 st->periodic_gc_runs,
2391 st->forced_gc_runs
2392 );
2393
2394 return 0;
2395}
2396
f690808e 2397static const struct seq_operations neigh_stat_seq_ops = {
1da177e4
LT
2398 .start = neigh_stat_seq_start,
2399 .next = neigh_stat_seq_next,
2400 .stop = neigh_stat_seq_stop,
2401 .show = neigh_stat_seq_show,
2402};
2403
2404static int neigh_stat_seq_open(struct inode *inode, struct file *file)
2405{
2406 int ret = seq_open(file, &neigh_stat_seq_ops);
2407
2408 if (!ret) {
2409 struct seq_file *sf = file->private_data;
2410 sf->private = PDE(inode);
2411 }
2412 return ret;
2413};
2414
9a32144e 2415static const struct file_operations neigh_stat_seq_fops = {
1da177e4
LT
2416 .owner = THIS_MODULE,
2417 .open = neigh_stat_seq_open,
2418 .read = seq_read,
2419 .llseek = seq_lseek,
2420 .release = seq_release,
2421};
2422
2423#endif /* CONFIG_PROC_FS */
2424
2425#ifdef CONFIG_ARPD
339bf98f
TG
2426static inline size_t neigh_nlmsg_size(void)
2427{
2428 return NLMSG_ALIGN(sizeof(struct ndmsg))
2429 + nla_total_size(MAX_ADDR_LEN) /* NDA_DST */
2430 + nla_total_size(MAX_ADDR_LEN) /* NDA_LLADDR */
2431 + nla_total_size(sizeof(struct nda_cacheinfo))
2432 + nla_total_size(4); /* NDA_PROBES */
2433}
2434
b8673311 2435static void __neigh_notify(struct neighbour *n, int type, int flags)
1da177e4 2436{
8b8aec50 2437 struct sk_buff *skb;
b8673311 2438 int err = -ENOBUFS;
1da177e4 2439
339bf98f 2440 skb = nlmsg_new(neigh_nlmsg_size(), GFP_ATOMIC);
8b8aec50 2441 if (skb == NULL)
b8673311 2442 goto errout;
1da177e4 2443
b8673311 2444 err = neigh_fill_info(skb, n, 0, 0, type, flags);
26932566
PM
2445 if (err < 0) {
2446 /* -EMSGSIZE implies BUG in neigh_nlmsg_size() */
2447 WARN_ON(err == -EMSGSIZE);
2448 kfree_skb(skb);
2449 goto errout;
2450 }
b8673311
TG
2451 err = rtnl_notify(skb, 0, RTNLGRP_NEIGH, NULL, GFP_ATOMIC);
2452errout:
2453 if (err < 0)
2454 rtnl_set_sk_err(RTNLGRP_NEIGH, err);
1da177e4
LT
2455}
2456
b8673311 2457void neigh_app_ns(struct neighbour *n)
1da177e4 2458{
b8673311
TG
2459 __neigh_notify(n, RTM_GETNEIGH, NLM_F_REQUEST);
2460}
1da177e4 2461
b8673311
TG
2462static void neigh_app_notify(struct neighbour *n)
2463{
2464 __neigh_notify(n, RTM_NEWNEIGH, 0);
1da177e4
LT
2465}
2466
2467#endif /* CONFIG_ARPD */
2468
2469#ifdef CONFIG_SYSCTL
2470
2471static struct neigh_sysctl_table {
2472 struct ctl_table_header *sysctl_header;
2473 ctl_table neigh_vars[__NET_NEIGH_MAX];
2474 ctl_table neigh_dev[2];
2475 ctl_table neigh_neigh_dir[2];
2476 ctl_table neigh_proto_dir[2];
2477 ctl_table neigh_root_dir[2];
ab32ea5d 2478} neigh_sysctl_template __read_mostly = {
1da177e4
LT
2479 .neigh_vars = {
2480 {
2481 .ctl_name = NET_NEIGH_MCAST_SOLICIT,
2482 .procname = "mcast_solicit",
2483 .maxlen = sizeof(int),
2484 .mode = 0644,
2485 .proc_handler = &proc_dointvec,
2486 },
2487 {
2488 .ctl_name = NET_NEIGH_UCAST_SOLICIT,
2489 .procname = "ucast_solicit",
2490 .maxlen = sizeof(int),
2491 .mode = 0644,
2492 .proc_handler = &proc_dointvec,
2493 },
2494 {
2495 .ctl_name = NET_NEIGH_APP_SOLICIT,
2496 .procname = "app_solicit",
2497 .maxlen = sizeof(int),
2498 .mode = 0644,
2499 .proc_handler = &proc_dointvec,
2500 },
2501 {
2502 .ctl_name = NET_NEIGH_RETRANS_TIME,
2503 .procname = "retrans_time",
2504 .maxlen = sizeof(int),
2505 .mode = 0644,
2506 .proc_handler = &proc_dointvec_userhz_jiffies,
2507 },
2508 {
2509 .ctl_name = NET_NEIGH_REACHABLE_TIME,
2510 .procname = "base_reachable_time",
2511 .maxlen = sizeof(int),
2512 .mode = 0644,
2513 .proc_handler = &proc_dointvec_jiffies,
2514 .strategy = &sysctl_jiffies,
2515 },
2516 {
2517 .ctl_name = NET_NEIGH_DELAY_PROBE_TIME,
2518 .procname = "delay_first_probe_time",
2519 .maxlen = sizeof(int),
2520 .mode = 0644,
2521 .proc_handler = &proc_dointvec_jiffies,
2522 .strategy = &sysctl_jiffies,
2523 },
2524 {
2525 .ctl_name = NET_NEIGH_GC_STALE_TIME,
2526 .procname = "gc_stale_time",
2527 .maxlen = sizeof(int),
2528 .mode = 0644,
2529 .proc_handler = &proc_dointvec_jiffies,
2530 .strategy = &sysctl_jiffies,
2531 },
2532 {
2533 .ctl_name = NET_NEIGH_UNRES_QLEN,
2534 .procname = "unres_qlen",
2535 .maxlen = sizeof(int),
2536 .mode = 0644,
2537 .proc_handler = &proc_dointvec,
2538 },
2539 {
2540 .ctl_name = NET_NEIGH_PROXY_QLEN,
2541 .procname = "proxy_qlen",
2542 .maxlen = sizeof(int),
2543 .mode = 0644,
2544 .proc_handler = &proc_dointvec,
2545 },
2546 {
2547 .ctl_name = NET_NEIGH_ANYCAST_DELAY,
2548 .procname = "anycast_delay",
2549 .maxlen = sizeof(int),
2550 .mode = 0644,
2551 .proc_handler = &proc_dointvec_userhz_jiffies,
2552 },
2553 {
2554 .ctl_name = NET_NEIGH_PROXY_DELAY,
2555 .procname = "proxy_delay",
2556 .maxlen = sizeof(int),
2557 .mode = 0644,
2558 .proc_handler = &proc_dointvec_userhz_jiffies,
2559 },
2560 {
2561 .ctl_name = NET_NEIGH_LOCKTIME,
2562 .procname = "locktime",
2563 .maxlen = sizeof(int),
2564 .mode = 0644,
2565 .proc_handler = &proc_dointvec_userhz_jiffies,
2566 },
2567 {
2568 .ctl_name = NET_NEIGH_GC_INTERVAL,
2569 .procname = "gc_interval",
2570 .maxlen = sizeof(int),
2571 .mode = 0644,
2572 .proc_handler = &proc_dointvec_jiffies,
2573 .strategy = &sysctl_jiffies,
2574 },
2575 {
2576 .ctl_name = NET_NEIGH_GC_THRESH1,
2577 .procname = "gc_thresh1",
2578 .maxlen = sizeof(int),
2579 .mode = 0644,
2580 .proc_handler = &proc_dointvec,
2581 },
2582 {
2583 .ctl_name = NET_NEIGH_GC_THRESH2,
2584 .procname = "gc_thresh2",
2585 .maxlen = sizeof(int),
2586 .mode = 0644,
2587 .proc_handler = &proc_dointvec,
2588 },
2589 {
2590 .ctl_name = NET_NEIGH_GC_THRESH3,
2591 .procname = "gc_thresh3",
2592 .maxlen = sizeof(int),
2593 .mode = 0644,
2594 .proc_handler = &proc_dointvec,
2595 },
2596 {
2597 .ctl_name = NET_NEIGH_RETRANS_TIME_MS,
2598 .procname = "retrans_time_ms",
2599 .maxlen = sizeof(int),
2600 .mode = 0644,
2601 .proc_handler = &proc_dointvec_ms_jiffies,
2602 .strategy = &sysctl_ms_jiffies,
2603 },
2604 {
2605 .ctl_name = NET_NEIGH_REACHABLE_TIME_MS,
2606 .procname = "base_reachable_time_ms",
2607 .maxlen = sizeof(int),
2608 .mode = 0644,
2609 .proc_handler = &proc_dointvec_ms_jiffies,
2610 .strategy = &sysctl_ms_jiffies,
2611 },
2612 },
2613 .neigh_dev = {
2614 {
2615 .ctl_name = NET_PROTO_CONF_DEFAULT,
2616 .procname = "default",
2617 .mode = 0555,
2618 },
2619 },
2620 .neigh_neigh_dir = {
2621 {
2622 .procname = "neigh",
2623 .mode = 0555,
2624 },
2625 },
2626 .neigh_proto_dir = {
2627 {
2628 .mode = 0555,
2629 },
2630 },
2631 .neigh_root_dir = {
2632 {
2633 .ctl_name = CTL_NET,
2634 .procname = "net",
2635 .mode = 0555,
2636 },
2637 },
2638};
2639
2640int neigh_sysctl_register(struct net_device *dev, struct neigh_parms *p,
4ec93edb 2641 int p_id, int pdev_id, char *p_name,
1da177e4
LT
2642 proc_handler *handler, ctl_handler *strategy)
2643{
b1a98bf6
ACM
2644 struct neigh_sysctl_table *t = kmemdup(&neigh_sysctl_template,
2645 sizeof(*t), GFP_KERNEL);
1da177e4
LT
2646 const char *dev_name_source = NULL;
2647 char *dev_name = NULL;
2648 int err = 0;
2649
2650 if (!t)
2651 return -ENOBUFS;
1da177e4
LT
2652 t->neigh_vars[0].data = &p->mcast_probes;
2653 t->neigh_vars[1].data = &p->ucast_probes;
2654 t->neigh_vars[2].data = &p->app_probes;
2655 t->neigh_vars[3].data = &p->retrans_time;
2656 t->neigh_vars[4].data = &p->base_reachable_time;
2657 t->neigh_vars[5].data = &p->delay_probe_time;
2658 t->neigh_vars[6].data = &p->gc_staletime;
2659 t->neigh_vars[7].data = &p->queue_len;
2660 t->neigh_vars[8].data = &p->proxy_qlen;
2661 t->neigh_vars[9].data = &p->anycast_delay;
2662 t->neigh_vars[10].data = &p->proxy_delay;
2663 t->neigh_vars[11].data = &p->locktime;
2664
2665 if (dev) {
2666 dev_name_source = dev->name;
2667 t->neigh_dev[0].ctl_name = dev->ifindex;
2668 t->neigh_vars[12].procname = NULL;
2669 t->neigh_vars[13].procname = NULL;
2670 t->neigh_vars[14].procname = NULL;
2671 t->neigh_vars[15].procname = NULL;
2672 } else {
4ec93edb 2673 dev_name_source = t->neigh_dev[0].procname;
1da177e4
LT
2674 t->neigh_vars[12].data = (int *)(p + 1);
2675 t->neigh_vars[13].data = (int *)(p + 1) + 1;
2676 t->neigh_vars[14].data = (int *)(p + 1) + 2;
2677 t->neigh_vars[15].data = (int *)(p + 1) + 3;
2678 }
2679
2680 t->neigh_vars[16].data = &p->retrans_time;
2681 t->neigh_vars[17].data = &p->base_reachable_time;
2682
2683 if (handler || strategy) {
2684 /* RetransTime */
2685 t->neigh_vars[3].proc_handler = handler;
2686 t->neigh_vars[3].strategy = strategy;
2687 t->neigh_vars[3].extra1 = dev;
2688 /* ReachableTime */
2689 t->neigh_vars[4].proc_handler = handler;
2690 t->neigh_vars[4].strategy = strategy;
2691 t->neigh_vars[4].extra1 = dev;
2692 /* RetransTime (in milliseconds)*/
2693 t->neigh_vars[16].proc_handler = handler;
2694 t->neigh_vars[16].strategy = strategy;
2695 t->neigh_vars[16].extra1 = dev;
2696 /* ReachableTime (in milliseconds) */
2697 t->neigh_vars[17].proc_handler = handler;
2698 t->neigh_vars[17].strategy = strategy;
2699 t->neigh_vars[17].extra1 = dev;
2700 }
2701
543537bd 2702 dev_name = kstrdup(dev_name_source, GFP_KERNEL);
1da177e4
LT
2703 if (!dev_name) {
2704 err = -ENOBUFS;
2705 goto free;
2706 }
2707
4ec93edb 2708 t->neigh_dev[0].procname = dev_name;
1da177e4
LT
2709
2710 t->neigh_neigh_dir[0].ctl_name = pdev_id;
2711
2712 t->neigh_proto_dir[0].procname = p_name;
2713 t->neigh_proto_dir[0].ctl_name = p_id;
2714
2715 t->neigh_dev[0].child = t->neigh_vars;
2716 t->neigh_neigh_dir[0].child = t->neigh_dev;
2717 t->neigh_proto_dir[0].child = t->neigh_neigh_dir;
2718 t->neigh_root_dir[0].child = t->neigh_proto_dir;
2719
0b4d4147 2720 t->sysctl_header = register_sysctl_table(t->neigh_root_dir);
1da177e4
LT
2721 if (!t->sysctl_header) {
2722 err = -ENOBUFS;
2723 goto free_procname;
2724 }
2725 p->sysctl_table = t;
2726 return 0;
2727
2728 /* error path */
2729 free_procname:
2730 kfree(dev_name);
2731 free:
2732 kfree(t);
2733
2734 return err;
2735}
2736
2737void neigh_sysctl_unregister(struct neigh_parms *p)
2738{
2739 if (p->sysctl_table) {
2740 struct neigh_sysctl_table *t = p->sysctl_table;
2741 p->sysctl_table = NULL;
2742 unregister_sysctl_table(t->sysctl_header);
2743 kfree(t->neigh_dev[0].procname);
2744 kfree(t);
2745 }
2746}
2747
2748#endif /* CONFIG_SYSCTL */
2749
c8822a4e
TG
2750static int __init neigh_init(void)
2751{
2752 rtnl_register(PF_UNSPEC, RTM_NEWNEIGH, neigh_add, NULL);
2753 rtnl_register(PF_UNSPEC, RTM_DELNEIGH, neigh_delete, NULL);
2754 rtnl_register(PF_UNSPEC, RTM_GETNEIGH, NULL, neigh_dump_info);
2755
2756 rtnl_register(PF_UNSPEC, RTM_GETNEIGHTBL, NULL, neightbl_dump_info);
2757 rtnl_register(PF_UNSPEC, RTM_SETNEIGHTBL, neightbl_set, NULL);
2758
2759 return 0;
2760}
2761
2762subsys_initcall(neigh_init);
2763
1da177e4 2764EXPORT_SYMBOL(__neigh_event_send);
1da177e4
LT
2765EXPORT_SYMBOL(neigh_changeaddr);
2766EXPORT_SYMBOL(neigh_compat_output);
2767EXPORT_SYMBOL(neigh_connected_output);
2768EXPORT_SYMBOL(neigh_create);
1da177e4 2769EXPORT_SYMBOL(neigh_destroy);
1da177e4
LT
2770EXPORT_SYMBOL(neigh_event_ns);
2771EXPORT_SYMBOL(neigh_ifdown);
2772EXPORT_SYMBOL(neigh_lookup);
2773EXPORT_SYMBOL(neigh_lookup_nodev);
2774EXPORT_SYMBOL(neigh_parms_alloc);
2775EXPORT_SYMBOL(neigh_parms_release);
2776EXPORT_SYMBOL(neigh_rand_reach_time);
2777EXPORT_SYMBOL(neigh_resolve_output);
2778EXPORT_SYMBOL(neigh_table_clear);
2779EXPORT_SYMBOL(neigh_table_init);
bd89efc5 2780EXPORT_SYMBOL(neigh_table_init_no_netlink);
1da177e4 2781EXPORT_SYMBOL(neigh_update);
1da177e4
LT
2782EXPORT_SYMBOL(pneigh_enqueue);
2783EXPORT_SYMBOL(pneigh_lookup);
2784
2785#ifdef CONFIG_ARPD
2786EXPORT_SYMBOL(neigh_app_ns);
2787#endif
2788#ifdef CONFIG_SYSCTL
2789EXPORT_SYMBOL(neigh_sysctl_register);
2790EXPORT_SYMBOL(neigh_sysctl_unregister);
2791#endif