]> git.proxmox.com Git - mirror_ubuntu-bionic-kernel.git/blame - net/core/neighbour.c
Revert "[RTNETLINK]: Send a single notification on device state changes."
[mirror_ubuntu-bionic-kernel.git] / net / core / neighbour.c
CommitLineData
1da177e4
LT
1/*
2 * Generic address resolution entity
3 *
4 * Authors:
5 * Pedro Roque <roque@di.fc.ul.pt>
6 * Alexey Kuznetsov <kuznet@ms2.inr.ac.ru>
7 *
8 * This program is free software; you can redistribute it and/or
9 * modify it under the terms of the GNU General Public License
10 * as published by the Free Software Foundation; either version
11 * 2 of the License, or (at your option) any later version.
12 *
13 * Fixes:
14 * Vitaly E. Lavrov releasing NULL neighbor in neigh_add.
15 * Harald Welte Add neighbour cache statistics like rtstat
16 */
17
1da177e4
LT
18#include <linux/types.h>
19#include <linux/kernel.h>
20#include <linux/module.h>
21#include <linux/socket.h>
1da177e4
LT
22#include <linux/netdevice.h>
23#include <linux/proc_fs.h>
24#ifdef CONFIG_SYSCTL
25#include <linux/sysctl.h>
26#endif
27#include <linux/times.h>
457c4cbc 28#include <net/net_namespace.h>
1da177e4
LT
29#include <net/neighbour.h>
30#include <net/dst.h>
31#include <net/sock.h>
8d71740c 32#include <net/netevent.h>
a14a49d2 33#include <net/netlink.h>
1da177e4
LT
34#include <linux/rtnetlink.h>
35#include <linux/random.h>
543537bd 36#include <linux/string.h>
c3609d51 37#include <linux/log2.h>
1da177e4
LT
38
39#define NEIGH_DEBUG 1
40
41#define NEIGH_PRINTK(x...) printk(x)
42#define NEIGH_NOPRINTK(x...) do { ; } while(0)
43#define NEIGH_PRINTK0 NEIGH_PRINTK
44#define NEIGH_PRINTK1 NEIGH_NOPRINTK
45#define NEIGH_PRINTK2 NEIGH_NOPRINTK
46
47#if NEIGH_DEBUG >= 1
48#undef NEIGH_PRINTK1
49#define NEIGH_PRINTK1 NEIGH_PRINTK
50#endif
51#if NEIGH_DEBUG >= 2
52#undef NEIGH_PRINTK2
53#define NEIGH_PRINTK2 NEIGH_PRINTK
54#endif
55
56#define PNEIGH_HASHMASK 0xF
57
58static void neigh_timer_handler(unsigned long arg);
d961db35
TG
59static void __neigh_notify(struct neighbour *n, int type, int flags);
60static void neigh_update_notify(struct neighbour *neigh);
1da177e4 61static int pneigh_ifdown(struct neigh_table *tbl, struct net_device *dev);
1da177e4
LT
62
63static struct neigh_table *neigh_tables;
45fc3b11 64#ifdef CONFIG_PROC_FS
9a32144e 65static const struct file_operations neigh_stat_seq_fops;
45fc3b11 66#endif
1da177e4
LT
67
68/*
69 Neighbour hash table buckets are protected with rwlock tbl->lock.
70
71 - All the scans/updates to hash buckets MUST be made under this lock.
72 - NOTHING clever should be made under this lock: no callbacks
73 to protocol backends, no attempts to send something to network.
74 It will result in deadlocks, if backend/driver wants to use neighbour
75 cache.
76 - If the entry requires some non-trivial actions, increase
77 its reference count and release table lock.
78
79 Neighbour entries are protected:
80 - with reference count.
81 - with rwlock neigh->lock
82
83 Reference count prevents destruction.
84
85 neigh->lock mainly serializes ll address data and its validity state.
86 However, the same lock is used to protect another entry fields:
87 - timer
88 - resolution queue
89
90 Again, nothing clever shall be made under neigh->lock,
91 the most complicated procedure, which we allow is dev->hard_header.
92 It is supposed, that dev->hard_header is simplistic and does
93 not make callbacks to neighbour tables.
94
95 The last lock is neigh_tbl_lock. It is pure SMP lock, protecting
96 list of neighbour tables. This list is used only in process context,
97 */
98
99static DEFINE_RWLOCK(neigh_tbl_lock);
100
101static int neigh_blackhole(struct sk_buff *skb)
102{
103 kfree_skb(skb);
104 return -ENETDOWN;
105}
106
4f494554
TG
107static void neigh_cleanup_and_release(struct neighbour *neigh)
108{
109 if (neigh->parms->neigh_cleanup)
110 neigh->parms->neigh_cleanup(neigh);
111
d961db35 112 __neigh_notify(neigh, RTM_DELNEIGH, 0);
4f494554
TG
113 neigh_release(neigh);
114}
115
1da177e4
LT
116/*
117 * It is random distribution in the interval (1/2)*base...(3/2)*base.
118 * It corresponds to default IPv6 settings and is not overridable,
119 * because it is really reasonable choice.
120 */
121
122unsigned long neigh_rand_reach_time(unsigned long base)
123{
124 return (base ? (net_random() % base) + (base >> 1) : 0);
125}
126
127
128static int neigh_forced_gc(struct neigh_table *tbl)
129{
130 int shrunk = 0;
131 int i;
132
133 NEIGH_CACHE_STAT_INC(tbl, forced_gc_runs);
134
135 write_lock_bh(&tbl->lock);
136 for (i = 0; i <= tbl->hash_mask; i++) {
137 struct neighbour *n, **np;
138
139 np = &tbl->hash_buckets[i];
140 while ((n = *np) != NULL) {
141 /* Neighbour record may be discarded if:
142 * - nobody refers to it.
143 * - it is not permanent
144 */
145 write_lock(&n->lock);
146 if (atomic_read(&n->refcnt) == 1 &&
147 !(n->nud_state & NUD_PERMANENT)) {
148 *np = n->next;
149 n->dead = 1;
150 shrunk = 1;
151 write_unlock(&n->lock);
4f494554 152 neigh_cleanup_and_release(n);
1da177e4
LT
153 continue;
154 }
155 write_unlock(&n->lock);
156 np = &n->next;
157 }
158 }
159
160 tbl->last_flush = jiffies;
161
162 write_unlock_bh(&tbl->lock);
163
164 return shrunk;
165}
166
a43d8994
PE
167static void neigh_add_timer(struct neighbour *n, unsigned long when)
168{
169 neigh_hold(n);
170 if (unlikely(mod_timer(&n->timer, when))) {
171 printk("NEIGH: BUG, double timer add, state is %x\n",
172 n->nud_state);
173 dump_stack();
174 }
175}
176
1da177e4
LT
177static int neigh_del_timer(struct neighbour *n)
178{
179 if ((n->nud_state & NUD_IN_TIMER) &&
180 del_timer(&n->timer)) {
181 neigh_release(n);
182 return 1;
183 }
184 return 0;
185}
186
187static void pneigh_queue_purge(struct sk_buff_head *list)
188{
189 struct sk_buff *skb;
190
191 while ((skb = skb_dequeue(list)) != NULL) {
192 dev_put(skb->dev);
193 kfree_skb(skb);
194 }
195}
196
49636bb1 197static void neigh_flush_dev(struct neigh_table *tbl, struct net_device *dev)
1da177e4
LT
198{
199 int i;
200
1da177e4
LT
201 for (i = 0; i <= tbl->hash_mask; i++) {
202 struct neighbour *n, **np = &tbl->hash_buckets[i];
203
204 while ((n = *np) != NULL) {
205 if (dev && n->dev != dev) {
206 np = &n->next;
207 continue;
208 }
209 *np = n->next;
210 write_lock(&n->lock);
211 neigh_del_timer(n);
212 n->dead = 1;
213
214 if (atomic_read(&n->refcnt) != 1) {
215 /* The most unpleasant situation.
216 We must destroy neighbour entry,
217 but someone still uses it.
218
219 The destroy will be delayed until
220 the last user releases us, but
221 we must kill timers etc. and move
222 it to safe state.
223 */
224 skb_queue_purge(&n->arp_queue);
225 n->output = neigh_blackhole;
226 if (n->nud_state & NUD_VALID)
227 n->nud_state = NUD_NOARP;
228 else
229 n->nud_state = NUD_NONE;
230 NEIGH_PRINTK2("neigh %p is stray.\n", n);
231 }
232 write_unlock(&n->lock);
4f494554 233 neigh_cleanup_and_release(n);
1da177e4
LT
234 }
235 }
49636bb1 236}
1da177e4 237
49636bb1
HX
238void neigh_changeaddr(struct neigh_table *tbl, struct net_device *dev)
239{
240 write_lock_bh(&tbl->lock);
241 neigh_flush_dev(tbl, dev);
242 write_unlock_bh(&tbl->lock);
243}
244
245int neigh_ifdown(struct neigh_table *tbl, struct net_device *dev)
246{
247 write_lock_bh(&tbl->lock);
248 neigh_flush_dev(tbl, dev);
1da177e4
LT
249 pneigh_ifdown(tbl, dev);
250 write_unlock_bh(&tbl->lock);
251
252 del_timer_sync(&tbl->proxy_timer);
253 pneigh_queue_purge(&tbl->proxy_queue);
254 return 0;
255}
256
257static struct neighbour *neigh_alloc(struct neigh_table *tbl)
258{
259 struct neighbour *n = NULL;
260 unsigned long now = jiffies;
261 int entries;
262
263 entries = atomic_inc_return(&tbl->entries) - 1;
264 if (entries >= tbl->gc_thresh3 ||
265 (entries >= tbl->gc_thresh2 &&
266 time_after(now, tbl->last_flush + 5 * HZ))) {
267 if (!neigh_forced_gc(tbl) &&
268 entries >= tbl->gc_thresh3)
269 goto out_entries;
270 }
271
c3762229 272 n = kmem_cache_zalloc(tbl->kmem_cachep, GFP_ATOMIC);
1da177e4
LT
273 if (!n)
274 goto out_entries;
275
1da177e4
LT
276 skb_queue_head_init(&n->arp_queue);
277 rwlock_init(&n->lock);
278 n->updated = n->used = now;
279 n->nud_state = NUD_NONE;
280 n->output = neigh_blackhole;
281 n->parms = neigh_parms_clone(&tbl->parms);
b24b8a24 282 setup_timer(&n->timer, neigh_timer_handler, (unsigned long)n);
1da177e4
LT
283
284 NEIGH_CACHE_STAT_INC(tbl, allocs);
285 n->tbl = tbl;
286 atomic_set(&n->refcnt, 1);
287 n->dead = 1;
288out:
289 return n;
290
291out_entries:
292 atomic_dec(&tbl->entries);
293 goto out;
294}
295
296static struct neighbour **neigh_hash_alloc(unsigned int entries)
297{
298 unsigned long size = entries * sizeof(struct neighbour *);
299 struct neighbour **ret;
300
301 if (size <= PAGE_SIZE) {
77d04bd9 302 ret = kzalloc(size, GFP_ATOMIC);
1da177e4
LT
303 } else {
304 ret = (struct neighbour **)
77d04bd9 305 __get_free_pages(GFP_ATOMIC|__GFP_ZERO, get_order(size));
1da177e4 306 }
1da177e4
LT
307 return ret;
308}
309
310static void neigh_hash_free(struct neighbour **hash, unsigned int entries)
311{
312 unsigned long size = entries * sizeof(struct neighbour *);
313
314 if (size <= PAGE_SIZE)
315 kfree(hash);
316 else
317 free_pages((unsigned long)hash, get_order(size));
318}
319
320static void neigh_hash_grow(struct neigh_table *tbl, unsigned long new_entries)
321{
322 struct neighbour **new_hash, **old_hash;
323 unsigned int i, new_hash_mask, old_entries;
324
325 NEIGH_CACHE_STAT_INC(tbl, hash_grows);
326
c3609d51 327 BUG_ON(!is_power_of_2(new_entries));
1da177e4
LT
328 new_hash = neigh_hash_alloc(new_entries);
329 if (!new_hash)
330 return;
331
332 old_entries = tbl->hash_mask + 1;
333 new_hash_mask = new_entries - 1;
334 old_hash = tbl->hash_buckets;
335
336 get_random_bytes(&tbl->hash_rnd, sizeof(tbl->hash_rnd));
337 for (i = 0; i < old_entries; i++) {
338 struct neighbour *n, *next;
339
340 for (n = old_hash[i]; n; n = next) {
341 unsigned int hash_val = tbl->hash(n->primary_key, n->dev);
342
343 hash_val &= new_hash_mask;
344 next = n->next;
345
346 n->next = new_hash[hash_val];
347 new_hash[hash_val] = n;
348 }
349 }
350 tbl->hash_buckets = new_hash;
351 tbl->hash_mask = new_hash_mask;
352
353 neigh_hash_free(old_hash, old_entries);
354}
355
356struct neighbour *neigh_lookup(struct neigh_table *tbl, const void *pkey,
357 struct net_device *dev)
358{
359 struct neighbour *n;
360 int key_len = tbl->key_len;
c5e29460 361 u32 hash_val = tbl->hash(pkey, dev);
4ec93edb 362
1da177e4
LT
363 NEIGH_CACHE_STAT_INC(tbl, lookups);
364
365 read_lock_bh(&tbl->lock);
c5e29460 366 for (n = tbl->hash_buckets[hash_val & tbl->hash_mask]; n; n = n->next) {
1da177e4
LT
367 if (dev == n->dev && !memcmp(n->primary_key, pkey, key_len)) {
368 neigh_hold(n);
369 NEIGH_CACHE_STAT_INC(tbl, hits);
370 break;
371 }
372 }
373 read_unlock_bh(&tbl->lock);
374 return n;
375}
376
426b5303
EB
377struct neighbour *neigh_lookup_nodev(struct neigh_table *tbl, struct net *net,
378 const void *pkey)
1da177e4
LT
379{
380 struct neighbour *n;
381 int key_len = tbl->key_len;
c5e29460 382 u32 hash_val = tbl->hash(pkey, NULL);
1da177e4
LT
383
384 NEIGH_CACHE_STAT_INC(tbl, lookups);
385
386 read_lock_bh(&tbl->lock);
c5e29460 387 for (n = tbl->hash_buckets[hash_val & tbl->hash_mask]; n; n = n->next) {
426b5303
EB
388 if (!memcmp(n->primary_key, pkey, key_len) &&
389 (net == n->dev->nd_net)) {
1da177e4
LT
390 neigh_hold(n);
391 NEIGH_CACHE_STAT_INC(tbl, hits);
392 break;
393 }
394 }
395 read_unlock_bh(&tbl->lock);
396 return n;
397}
398
399struct neighbour *neigh_create(struct neigh_table *tbl, const void *pkey,
400 struct net_device *dev)
401{
402 u32 hash_val;
403 int key_len = tbl->key_len;
404 int error;
405 struct neighbour *n1, *rc, *n = neigh_alloc(tbl);
406
407 if (!n) {
408 rc = ERR_PTR(-ENOBUFS);
409 goto out;
410 }
411
412 memcpy(n->primary_key, pkey, key_len);
413 n->dev = dev;
414 dev_hold(dev);
415
416 /* Protocol specific setup. */
417 if (tbl->constructor && (error = tbl->constructor(n)) < 0) {
418 rc = ERR_PTR(error);
419 goto out_neigh_release;
420 }
421
422 /* Device specific setup. */
423 if (n->parms->neigh_setup &&
424 (error = n->parms->neigh_setup(n)) < 0) {
425 rc = ERR_PTR(error);
426 goto out_neigh_release;
427 }
428
429 n->confirmed = jiffies - (n->parms->base_reachable_time << 1);
430
431 write_lock_bh(&tbl->lock);
432
433 if (atomic_read(&tbl->entries) > (tbl->hash_mask + 1))
434 neigh_hash_grow(tbl, (tbl->hash_mask + 1) << 1);
435
436 hash_val = tbl->hash(pkey, dev) & tbl->hash_mask;
437
438 if (n->parms->dead) {
439 rc = ERR_PTR(-EINVAL);
440 goto out_tbl_unlock;
441 }
442
443 for (n1 = tbl->hash_buckets[hash_val]; n1; n1 = n1->next) {
444 if (dev == n1->dev && !memcmp(n1->primary_key, pkey, key_len)) {
445 neigh_hold(n1);
446 rc = n1;
447 goto out_tbl_unlock;
448 }
449 }
450
451 n->next = tbl->hash_buckets[hash_val];
452 tbl->hash_buckets[hash_val] = n;
453 n->dead = 0;
454 neigh_hold(n);
455 write_unlock_bh(&tbl->lock);
456 NEIGH_PRINTK2("neigh %p is created.\n", n);
457 rc = n;
458out:
459 return rc;
460out_tbl_unlock:
461 write_unlock_bh(&tbl->lock);
462out_neigh_release:
463 neigh_release(n);
464 goto out;
465}
466
426b5303
EB
467struct pneigh_entry * pneigh_lookup(struct neigh_table *tbl,
468 struct net *net, const void *pkey,
1da177e4
LT
469 struct net_device *dev, int creat)
470{
471 struct pneigh_entry *n;
472 int key_len = tbl->key_len;
473 u32 hash_val = *(u32 *)(pkey + key_len - 4);
474
475 hash_val ^= (hash_val >> 16);
476 hash_val ^= hash_val >> 8;
477 hash_val ^= hash_val >> 4;
478 hash_val &= PNEIGH_HASHMASK;
479
480 read_lock_bh(&tbl->lock);
481
482 for (n = tbl->phash_buckets[hash_val]; n; n = n->next) {
483 if (!memcmp(n->key, pkey, key_len) &&
426b5303 484 (n->net == net) &&
1da177e4
LT
485 (n->dev == dev || !n->dev)) {
486 read_unlock_bh(&tbl->lock);
487 goto out;
488 }
489 }
490 read_unlock_bh(&tbl->lock);
491 n = NULL;
492 if (!creat)
493 goto out;
494
4ae28944
PE
495 ASSERT_RTNL();
496
1da177e4
LT
497 n = kmalloc(sizeof(*n) + key_len, GFP_KERNEL);
498 if (!n)
499 goto out;
500
426b5303 501 n->net = hold_net(net);
1da177e4
LT
502 memcpy(n->key, pkey, key_len);
503 n->dev = dev;
504 if (dev)
505 dev_hold(dev);
506
507 if (tbl->pconstructor && tbl->pconstructor(n)) {
508 if (dev)
509 dev_put(dev);
510 kfree(n);
511 n = NULL;
512 goto out;
513 }
514
515 write_lock_bh(&tbl->lock);
516 n->next = tbl->phash_buckets[hash_val];
517 tbl->phash_buckets[hash_val] = n;
518 write_unlock_bh(&tbl->lock);
519out:
520 return n;
521}
522
523
426b5303 524int pneigh_delete(struct neigh_table *tbl, struct net *net, const void *pkey,
1da177e4
LT
525 struct net_device *dev)
526{
527 struct pneigh_entry *n, **np;
528 int key_len = tbl->key_len;
529 u32 hash_val = *(u32 *)(pkey + key_len - 4);
530
531 hash_val ^= (hash_val >> 16);
532 hash_val ^= hash_val >> 8;
533 hash_val ^= hash_val >> 4;
534 hash_val &= PNEIGH_HASHMASK;
535
536 write_lock_bh(&tbl->lock);
537 for (np = &tbl->phash_buckets[hash_val]; (n = *np) != NULL;
538 np = &n->next) {
426b5303
EB
539 if (!memcmp(n->key, pkey, key_len) && n->dev == dev &&
540 (n->net == net)) {
1da177e4
LT
541 *np = n->next;
542 write_unlock_bh(&tbl->lock);
543 if (tbl->pdestructor)
544 tbl->pdestructor(n);
545 if (n->dev)
546 dev_put(n->dev);
426b5303 547 release_net(n->net);
1da177e4
LT
548 kfree(n);
549 return 0;
550 }
551 }
552 write_unlock_bh(&tbl->lock);
553 return -ENOENT;
554}
555
556static int pneigh_ifdown(struct neigh_table *tbl, struct net_device *dev)
557{
558 struct pneigh_entry *n, **np;
559 u32 h;
560
561 for (h = 0; h <= PNEIGH_HASHMASK; h++) {
562 np = &tbl->phash_buckets[h];
563 while ((n = *np) != NULL) {
564 if (!dev || n->dev == dev) {
565 *np = n->next;
566 if (tbl->pdestructor)
567 tbl->pdestructor(n);
568 if (n->dev)
569 dev_put(n->dev);
426b5303 570 release_net(n->net);
1da177e4
LT
571 kfree(n);
572 continue;
573 }
574 np = &n->next;
575 }
576 }
577 return -ENOENT;
578}
579
06f0511d
DL
580static void neigh_parms_destroy(struct neigh_parms *parms);
581
582static inline void neigh_parms_put(struct neigh_parms *parms)
583{
584 if (atomic_dec_and_test(&parms->refcnt))
585 neigh_parms_destroy(parms);
586}
1da177e4
LT
587
588/*
589 * neighbour must already be out of the table;
590 *
591 */
592void neigh_destroy(struct neighbour *neigh)
593{
594 struct hh_cache *hh;
595
596 NEIGH_CACHE_STAT_INC(neigh->tbl, destroys);
597
598 if (!neigh->dead) {
599 printk(KERN_WARNING
600 "Destroying alive neighbour %p\n", neigh);
601 dump_stack();
602 return;
603 }
604
605 if (neigh_del_timer(neigh))
606 printk(KERN_WARNING "Impossible event.\n");
607
608 while ((hh = neigh->hh) != NULL) {
609 neigh->hh = hh->hh_next;
610 hh->hh_next = NULL;
3644f0ce
SH
611
612 write_seqlock_bh(&hh->hh_lock);
1da177e4 613 hh->hh_output = neigh_blackhole;
3644f0ce 614 write_sequnlock_bh(&hh->hh_lock);
1da177e4
LT
615 if (atomic_dec_and_test(&hh->hh_refcnt))
616 kfree(hh);
617 }
618
1da177e4
LT
619 skb_queue_purge(&neigh->arp_queue);
620
621 dev_put(neigh->dev);
622 neigh_parms_put(neigh->parms);
623
624 NEIGH_PRINTK2("neigh %p is destroyed.\n", neigh);
625
626 atomic_dec(&neigh->tbl->entries);
627 kmem_cache_free(neigh->tbl->kmem_cachep, neigh);
628}
629
630/* Neighbour state is suspicious;
631 disable fast path.
632
633 Called with write_locked neigh.
634 */
635static void neigh_suspect(struct neighbour *neigh)
636{
637 struct hh_cache *hh;
638
639 NEIGH_PRINTK2("neigh %p is suspected.\n", neigh);
640
641 neigh->output = neigh->ops->output;
642
643 for (hh = neigh->hh; hh; hh = hh->hh_next)
644 hh->hh_output = neigh->ops->output;
645}
646
647/* Neighbour state is OK;
648 enable fast path.
649
650 Called with write_locked neigh.
651 */
652static void neigh_connect(struct neighbour *neigh)
653{
654 struct hh_cache *hh;
655
656 NEIGH_PRINTK2("neigh %p is connected.\n", neigh);
657
658 neigh->output = neigh->ops->connected_output;
659
660 for (hh = neigh->hh; hh; hh = hh->hh_next)
661 hh->hh_output = neigh->ops->hh_output;
662}
663
664static void neigh_periodic_timer(unsigned long arg)
665{
666 struct neigh_table *tbl = (struct neigh_table *)arg;
667 struct neighbour *n, **np;
668 unsigned long expire, now = jiffies;
669
670 NEIGH_CACHE_STAT_INC(tbl, periodic_gc_runs);
671
672 write_lock(&tbl->lock);
673
674 /*
675 * periodically recompute ReachableTime from random function
676 */
677
678 if (time_after(now, tbl->last_rand + 300 * HZ)) {
679 struct neigh_parms *p;
680 tbl->last_rand = now;
681 for (p = &tbl->parms; p; p = p->next)
682 p->reachable_time =
683 neigh_rand_reach_time(p->base_reachable_time);
684 }
685
686 np = &tbl->hash_buckets[tbl->hash_chain_gc];
687 tbl->hash_chain_gc = ((tbl->hash_chain_gc + 1) & tbl->hash_mask);
688
689 while ((n = *np) != NULL) {
690 unsigned int state;
691
692 write_lock(&n->lock);
693
694 state = n->nud_state;
695 if (state & (NUD_PERMANENT | NUD_IN_TIMER)) {
696 write_unlock(&n->lock);
697 goto next_elt;
698 }
699
700 if (time_before(n->used, n->confirmed))
701 n->used = n->confirmed;
702
703 if (atomic_read(&n->refcnt) == 1 &&
704 (state == NUD_FAILED ||
705 time_after(now, n->used + n->parms->gc_staletime))) {
706 *np = n->next;
707 n->dead = 1;
708 write_unlock(&n->lock);
4f494554 709 neigh_cleanup_and_release(n);
1da177e4
LT
710 continue;
711 }
712 write_unlock(&n->lock);
713
714next_elt:
715 np = &n->next;
716 }
717
4ec93edb
YH
718 /* Cycle through all hash buckets every base_reachable_time/2 ticks.
719 * ARP entry timeouts range from 1/2 base_reachable_time to 3/2
720 * base_reachable_time.
1da177e4
LT
721 */
722 expire = tbl->parms.base_reachable_time >> 1;
723 expire /= (tbl->hash_mask + 1);
724 if (!expire)
725 expire = 1;
726
f5a6e01c
AV
727 if (expire>HZ)
728 mod_timer(&tbl->gc_timer, round_jiffies(now + expire));
729 else
730 mod_timer(&tbl->gc_timer, now + expire);
1da177e4
LT
731
732 write_unlock(&tbl->lock);
733}
734
735static __inline__ int neigh_max_probes(struct neighbour *n)
736{
737 struct neigh_parms *p = n->parms;
738 return (n->nud_state & NUD_PROBE ?
739 p->ucast_probes :
740 p->ucast_probes + p->app_probes + p->mcast_probes);
741}
742
1da177e4
LT
743/* Called when a timer expires for a neighbour entry. */
744
745static void neigh_timer_handler(unsigned long arg)
746{
747 unsigned long now, next;
748 struct neighbour *neigh = (struct neighbour *)arg;
749 unsigned state;
750 int notify = 0;
751
752 write_lock(&neigh->lock);
753
754 state = neigh->nud_state;
755 now = jiffies;
756 next = now + HZ;
757
758 if (!(state & NUD_IN_TIMER)) {
759#ifndef CONFIG_SMP
760 printk(KERN_WARNING "neigh: timer & !nud_in_timer\n");
761#endif
762 goto out;
763 }
764
765 if (state & NUD_REACHABLE) {
4ec93edb 766 if (time_before_eq(now,
1da177e4
LT
767 neigh->confirmed + neigh->parms->reachable_time)) {
768 NEIGH_PRINTK2("neigh %p is still alive.\n", neigh);
769 next = neigh->confirmed + neigh->parms->reachable_time;
770 } else if (time_before_eq(now,
771 neigh->used + neigh->parms->delay_probe_time)) {
772 NEIGH_PRINTK2("neigh %p is delayed.\n", neigh);
773 neigh->nud_state = NUD_DELAY;
955aaa2f 774 neigh->updated = jiffies;
1da177e4
LT
775 neigh_suspect(neigh);
776 next = now + neigh->parms->delay_probe_time;
777 } else {
778 NEIGH_PRINTK2("neigh %p is suspected.\n", neigh);
779 neigh->nud_state = NUD_STALE;
955aaa2f 780 neigh->updated = jiffies;
1da177e4 781 neigh_suspect(neigh);
8d71740c 782 notify = 1;
1da177e4
LT
783 }
784 } else if (state & NUD_DELAY) {
4ec93edb 785 if (time_before_eq(now,
1da177e4
LT
786 neigh->confirmed + neigh->parms->delay_probe_time)) {
787 NEIGH_PRINTK2("neigh %p is now reachable.\n", neigh);
788 neigh->nud_state = NUD_REACHABLE;
955aaa2f 789 neigh->updated = jiffies;
1da177e4 790 neigh_connect(neigh);
8d71740c 791 notify = 1;
1da177e4
LT
792 next = neigh->confirmed + neigh->parms->reachable_time;
793 } else {
794 NEIGH_PRINTK2("neigh %p is probed.\n", neigh);
795 neigh->nud_state = NUD_PROBE;
955aaa2f 796 neigh->updated = jiffies;
1da177e4
LT
797 atomic_set(&neigh->probes, 0);
798 next = now + neigh->parms->retrans_time;
799 }
800 } else {
801 /* NUD_PROBE|NUD_INCOMPLETE */
802 next = now + neigh->parms->retrans_time;
803 }
804
805 if ((neigh->nud_state & (NUD_INCOMPLETE | NUD_PROBE)) &&
806 atomic_read(&neigh->probes) >= neigh_max_probes(neigh)) {
807 struct sk_buff *skb;
808
809 neigh->nud_state = NUD_FAILED;
955aaa2f 810 neigh->updated = jiffies;
1da177e4
LT
811 notify = 1;
812 NEIGH_CACHE_STAT_INC(neigh->tbl, res_failed);
813 NEIGH_PRINTK2("neigh %p is failed.\n", neigh);
814
815 /* It is very thin place. report_unreachable is very complicated
816 routine. Particularly, it can hit the same neighbour entry!
817
818 So that, we try to be accurate and avoid dead loop. --ANK
819 */
820 while (neigh->nud_state == NUD_FAILED &&
821 (skb = __skb_dequeue(&neigh->arp_queue)) != NULL) {
822 write_unlock(&neigh->lock);
823 neigh->ops->error_report(neigh, skb);
824 write_lock(&neigh->lock);
825 }
826 skb_queue_purge(&neigh->arp_queue);
827 }
828
829 if (neigh->nud_state & NUD_IN_TIMER) {
1da177e4
LT
830 if (time_before(next, jiffies + HZ/2))
831 next = jiffies + HZ/2;
6fb9974f
HX
832 if (!mod_timer(&neigh->timer, next))
833 neigh_hold(neigh);
1da177e4
LT
834 }
835 if (neigh->nud_state & (NUD_INCOMPLETE | NUD_PROBE)) {
836 struct sk_buff *skb = skb_peek(&neigh->arp_queue);
69cc64d8 837
1da177e4
LT
838 neigh->ops->solicit(neigh, skb);
839 atomic_inc(&neigh->probes);
1da177e4 840 }
69cc64d8
DM
841out:
842 write_unlock(&neigh->lock);
d961db35 843
8d71740c 844 if (notify)
d961db35 845 neigh_update_notify(neigh);
1da177e4 846
1da177e4
LT
847 neigh_release(neigh);
848}
849
850int __neigh_event_send(struct neighbour *neigh, struct sk_buff *skb)
851{
852 int rc;
853 unsigned long now;
854
855 write_lock_bh(&neigh->lock);
856
857 rc = 0;
858 if (neigh->nud_state & (NUD_CONNECTED | NUD_DELAY | NUD_PROBE))
859 goto out_unlock_bh;
860
861 now = jiffies;
4ec93edb 862
1da177e4
LT
863 if (!(neigh->nud_state & (NUD_STALE | NUD_INCOMPLETE))) {
864 if (neigh->parms->mcast_probes + neigh->parms->app_probes) {
865 atomic_set(&neigh->probes, neigh->parms->ucast_probes);
866 neigh->nud_state = NUD_INCOMPLETE;
955aaa2f 867 neigh->updated = jiffies;
667347f1 868 neigh_add_timer(neigh, now + 1);
1da177e4
LT
869 } else {
870 neigh->nud_state = NUD_FAILED;
955aaa2f 871 neigh->updated = jiffies;
1da177e4
LT
872 write_unlock_bh(&neigh->lock);
873
874 if (skb)
875 kfree_skb(skb);
876 return 1;
877 }
878 } else if (neigh->nud_state & NUD_STALE) {
879 NEIGH_PRINTK2("neigh %p is delayed.\n", neigh);
1da177e4 880 neigh->nud_state = NUD_DELAY;
955aaa2f 881 neigh->updated = jiffies;
667347f1
DM
882 neigh_add_timer(neigh,
883 jiffies + neigh->parms->delay_probe_time);
1da177e4
LT
884 }
885
886 if (neigh->nud_state == NUD_INCOMPLETE) {
887 if (skb) {
888 if (skb_queue_len(&neigh->arp_queue) >=
889 neigh->parms->queue_len) {
890 struct sk_buff *buff;
891 buff = neigh->arp_queue.next;
892 __skb_unlink(buff, &neigh->arp_queue);
893 kfree_skb(buff);
894 }
895 __skb_queue_tail(&neigh->arp_queue, skb);
896 }
897 rc = 1;
898 }
899out_unlock_bh:
900 write_unlock_bh(&neigh->lock);
901 return rc;
902}
903
e92b43a3 904static void neigh_update_hhs(struct neighbour *neigh)
1da177e4
LT
905{
906 struct hh_cache *hh;
3b04ddde
SH
907 void (*update)(struct hh_cache*, const struct net_device*, const unsigned char *)
908 = neigh->dev->header_ops->cache_update;
1da177e4
LT
909
910 if (update) {
911 for (hh = neigh->hh; hh; hh = hh->hh_next) {
3644f0ce 912 write_seqlock_bh(&hh->hh_lock);
1da177e4 913 update(hh, neigh->dev, neigh->ha);
3644f0ce 914 write_sequnlock_bh(&hh->hh_lock);
1da177e4
LT
915 }
916 }
917}
918
919
920
921/* Generic update routine.
922 -- lladdr is new lladdr or NULL, if it is not supplied.
923 -- new is new state.
924 -- flags
925 NEIGH_UPDATE_F_OVERRIDE allows to override existing lladdr,
926 if it is different.
927 NEIGH_UPDATE_F_WEAK_OVERRIDE will suspect existing "connected"
4ec93edb 928 lladdr instead of overriding it
1da177e4
LT
929 if it is different.
930 It also allows to retain current state
931 if lladdr is unchanged.
932 NEIGH_UPDATE_F_ADMIN means that the change is administrative.
933
4ec93edb 934 NEIGH_UPDATE_F_OVERRIDE_ISROUTER allows to override existing
1da177e4
LT
935 NTF_ROUTER flag.
936 NEIGH_UPDATE_F_ISROUTER indicates if the neighbour is known as
937 a router.
938
939 Caller MUST hold reference count on the entry.
940 */
941
942int neigh_update(struct neighbour *neigh, const u8 *lladdr, u8 new,
943 u32 flags)
944{
945 u8 old;
946 int err;
1da177e4 947 int notify = 0;
1da177e4
LT
948 struct net_device *dev;
949 int update_isrouter = 0;
950
951 write_lock_bh(&neigh->lock);
952
953 dev = neigh->dev;
954 old = neigh->nud_state;
955 err = -EPERM;
956
4ec93edb 957 if (!(flags & NEIGH_UPDATE_F_ADMIN) &&
1da177e4
LT
958 (old & (NUD_NOARP | NUD_PERMANENT)))
959 goto out;
960
961 if (!(new & NUD_VALID)) {
962 neigh_del_timer(neigh);
963 if (old & NUD_CONNECTED)
964 neigh_suspect(neigh);
965 neigh->nud_state = new;
966 err = 0;
1da177e4 967 notify = old & NUD_VALID;
1da177e4
LT
968 goto out;
969 }
970
971 /* Compare new lladdr with cached one */
972 if (!dev->addr_len) {
973 /* First case: device needs no address. */
974 lladdr = neigh->ha;
975 } else if (lladdr) {
976 /* The second case: if something is already cached
977 and a new address is proposed:
978 - compare new & old
979 - if they are different, check override flag
980 */
4ec93edb 981 if ((old & NUD_VALID) &&
1da177e4
LT
982 !memcmp(lladdr, neigh->ha, dev->addr_len))
983 lladdr = neigh->ha;
984 } else {
985 /* No address is supplied; if we know something,
986 use it, otherwise discard the request.
987 */
988 err = -EINVAL;
989 if (!(old & NUD_VALID))
990 goto out;
991 lladdr = neigh->ha;
992 }
993
994 if (new & NUD_CONNECTED)
995 neigh->confirmed = jiffies;
996 neigh->updated = jiffies;
997
998 /* If entry was valid and address is not changed,
999 do not change entry state, if new one is STALE.
1000 */
1001 err = 0;
1002 update_isrouter = flags & NEIGH_UPDATE_F_OVERRIDE_ISROUTER;
1003 if (old & NUD_VALID) {
1004 if (lladdr != neigh->ha && !(flags & NEIGH_UPDATE_F_OVERRIDE)) {
1005 update_isrouter = 0;
1006 if ((flags & NEIGH_UPDATE_F_WEAK_OVERRIDE) &&
1007 (old & NUD_CONNECTED)) {
1008 lladdr = neigh->ha;
1009 new = NUD_STALE;
1010 } else
1011 goto out;
1012 } else {
1013 if (lladdr == neigh->ha && new == NUD_STALE &&
1014 ((flags & NEIGH_UPDATE_F_WEAK_OVERRIDE) ||
1015 (old & NUD_CONNECTED))
1016 )
1017 new = old;
1018 }
1019 }
1020
1021 if (new != old) {
1022 neigh_del_timer(neigh);
a43d8994 1023 if (new & NUD_IN_TIMER)
4ec93edb
YH
1024 neigh_add_timer(neigh, (jiffies +
1025 ((new & NUD_REACHABLE) ?
667347f1
DM
1026 neigh->parms->reachable_time :
1027 0)));
1da177e4
LT
1028 neigh->nud_state = new;
1029 }
1030
1031 if (lladdr != neigh->ha) {
1032 memcpy(&neigh->ha, lladdr, dev->addr_len);
1033 neigh_update_hhs(neigh);
1034 if (!(new & NUD_CONNECTED))
1035 neigh->confirmed = jiffies -
1036 (neigh->parms->base_reachable_time << 1);
1da177e4 1037 notify = 1;
1da177e4
LT
1038 }
1039 if (new == old)
1040 goto out;
1041 if (new & NUD_CONNECTED)
1042 neigh_connect(neigh);
1043 else
1044 neigh_suspect(neigh);
1045 if (!(old & NUD_VALID)) {
1046 struct sk_buff *skb;
1047
1048 /* Again: avoid dead loop if something went wrong */
1049
1050 while (neigh->nud_state & NUD_VALID &&
1051 (skb = __skb_dequeue(&neigh->arp_queue)) != NULL) {
1052 struct neighbour *n1 = neigh;
1053 write_unlock_bh(&neigh->lock);
1054 /* On shaper/eql skb->dst->neighbour != neigh :( */
1055 if (skb->dst && skb->dst->neighbour)
1056 n1 = skb->dst->neighbour;
1057 n1->output(skb);
1058 write_lock_bh(&neigh->lock);
1059 }
1060 skb_queue_purge(&neigh->arp_queue);
1061 }
1062out:
1063 if (update_isrouter) {
1064 neigh->flags = (flags & NEIGH_UPDATE_F_ISROUTER) ?
1065 (neigh->flags | NTF_ROUTER) :
1066 (neigh->flags & ~NTF_ROUTER);
1067 }
1068 write_unlock_bh(&neigh->lock);
8d71740c
TT
1069
1070 if (notify)
d961db35
TG
1071 neigh_update_notify(neigh);
1072
1da177e4
LT
1073 return err;
1074}
1075
1076struct neighbour *neigh_event_ns(struct neigh_table *tbl,
1077 u8 *lladdr, void *saddr,
1078 struct net_device *dev)
1079{
1080 struct neighbour *neigh = __neigh_lookup(tbl, saddr, dev,
1081 lladdr || !dev->addr_len);
1082 if (neigh)
4ec93edb 1083 neigh_update(neigh, lladdr, NUD_STALE,
1da177e4
LT
1084 NEIGH_UPDATE_F_OVERRIDE);
1085 return neigh;
1086}
1087
1088static void neigh_hh_init(struct neighbour *n, struct dst_entry *dst,
d77072ec 1089 __be16 protocol)
1da177e4
LT
1090{
1091 struct hh_cache *hh;
1092 struct net_device *dev = dst->dev;
1093
1094 for (hh = n->hh; hh; hh = hh->hh_next)
1095 if (hh->hh_type == protocol)
1096 break;
1097
77d04bd9 1098 if (!hh && (hh = kzalloc(sizeof(*hh), GFP_ATOMIC)) != NULL) {
3644f0ce 1099 seqlock_init(&hh->hh_lock);
1da177e4
LT
1100 hh->hh_type = protocol;
1101 atomic_set(&hh->hh_refcnt, 0);
1102 hh->hh_next = NULL;
3b04ddde
SH
1103
1104 if (dev->header_ops->cache(n, hh)) {
1da177e4
LT
1105 kfree(hh);
1106 hh = NULL;
1107 } else {
1108 atomic_inc(&hh->hh_refcnt);
1109 hh->hh_next = n->hh;
1110 n->hh = hh;
1111 if (n->nud_state & NUD_CONNECTED)
1112 hh->hh_output = n->ops->hh_output;
1113 else
1114 hh->hh_output = n->ops->output;
1115 }
1116 }
1117 if (hh) {
1118 atomic_inc(&hh->hh_refcnt);
1119 dst->hh = hh;
1120 }
1121}
1122
1123/* This function can be used in contexts, where only old dev_queue_xmit
1124 worked, f.e. if you want to override normal output path (eql, shaper),
1125 but resolution is not made yet.
1126 */
1127
1128int neigh_compat_output(struct sk_buff *skb)
1129{
1130 struct net_device *dev = skb->dev;
1131
bbe735e4 1132 __skb_pull(skb, skb_network_offset(skb));
1da177e4 1133
0c4e8581
SH
1134 if (dev_hard_header(skb, dev, ntohs(skb->protocol), NULL, NULL,
1135 skb->len) < 0 &&
3b04ddde 1136 dev->header_ops->rebuild(skb))
1da177e4
LT
1137 return 0;
1138
1139 return dev_queue_xmit(skb);
1140}
1141
1142/* Slow and careful. */
1143
1144int neigh_resolve_output(struct sk_buff *skb)
1145{
1146 struct dst_entry *dst = skb->dst;
1147 struct neighbour *neigh;
1148 int rc = 0;
1149
1150 if (!dst || !(neigh = dst->neighbour))
1151 goto discard;
1152
bbe735e4 1153 __skb_pull(skb, skb_network_offset(skb));
1da177e4
LT
1154
1155 if (!neigh_event_send(neigh, skb)) {
1156 int err;
1157 struct net_device *dev = neigh->dev;
3b04ddde 1158 if (dev->header_ops->cache && !dst->hh) {
1da177e4
LT
1159 write_lock_bh(&neigh->lock);
1160 if (!dst->hh)
1161 neigh_hh_init(neigh, dst, dst->ops->protocol);
0c4e8581
SH
1162 err = dev_hard_header(skb, dev, ntohs(skb->protocol),
1163 neigh->ha, NULL, skb->len);
1da177e4
LT
1164 write_unlock_bh(&neigh->lock);
1165 } else {
1166 read_lock_bh(&neigh->lock);
0c4e8581
SH
1167 err = dev_hard_header(skb, dev, ntohs(skb->protocol),
1168 neigh->ha, NULL, skb->len);
1da177e4
LT
1169 read_unlock_bh(&neigh->lock);
1170 }
1171 if (err >= 0)
1172 rc = neigh->ops->queue_xmit(skb);
1173 else
1174 goto out_kfree_skb;
1175 }
1176out:
1177 return rc;
1178discard:
1179 NEIGH_PRINTK1("neigh_resolve_output: dst=%p neigh=%p\n",
1180 dst, dst ? dst->neighbour : NULL);
1181out_kfree_skb:
1182 rc = -EINVAL;
1183 kfree_skb(skb);
1184 goto out;
1185}
1186
1187/* As fast as possible without hh cache */
1188
1189int neigh_connected_output(struct sk_buff *skb)
1190{
1191 int err;
1192 struct dst_entry *dst = skb->dst;
1193 struct neighbour *neigh = dst->neighbour;
1194 struct net_device *dev = neigh->dev;
1195
bbe735e4 1196 __skb_pull(skb, skb_network_offset(skb));
1da177e4
LT
1197
1198 read_lock_bh(&neigh->lock);
0c4e8581
SH
1199 err = dev_hard_header(skb, dev, ntohs(skb->protocol),
1200 neigh->ha, NULL, skb->len);
1da177e4
LT
1201 read_unlock_bh(&neigh->lock);
1202 if (err >= 0)
1203 err = neigh->ops->queue_xmit(skb);
1204 else {
1205 err = -EINVAL;
1206 kfree_skb(skb);
1207 }
1208 return err;
1209}
1210
1211static void neigh_proxy_process(unsigned long arg)
1212{
1213 struct neigh_table *tbl = (struct neigh_table *)arg;
1214 long sched_next = 0;
1215 unsigned long now = jiffies;
1216 struct sk_buff *skb;
1217
1218 spin_lock(&tbl->proxy_queue.lock);
1219
1220 skb = tbl->proxy_queue.next;
1221
1222 while (skb != (struct sk_buff *)&tbl->proxy_queue) {
1223 struct sk_buff *back = skb;
a61bbcf2 1224 long tdif = NEIGH_CB(back)->sched_next - now;
1da177e4
LT
1225
1226 skb = skb->next;
1227 if (tdif <= 0) {
1228 struct net_device *dev = back->dev;
1229 __skb_unlink(back, &tbl->proxy_queue);
1230 if (tbl->proxy_redo && netif_running(dev))
1231 tbl->proxy_redo(back);
1232 else
1233 kfree_skb(back);
1234
1235 dev_put(dev);
1236 } else if (!sched_next || tdif < sched_next)
1237 sched_next = tdif;
1238 }
1239 del_timer(&tbl->proxy_timer);
1240 if (sched_next)
1241 mod_timer(&tbl->proxy_timer, jiffies + sched_next);
1242 spin_unlock(&tbl->proxy_queue.lock);
1243}
1244
1245void pneigh_enqueue(struct neigh_table *tbl, struct neigh_parms *p,
1246 struct sk_buff *skb)
1247{
1248 unsigned long now = jiffies;
1249 unsigned long sched_next = now + (net_random() % p->proxy_delay);
1250
1251 if (tbl->proxy_queue.qlen > p->proxy_qlen) {
1252 kfree_skb(skb);
1253 return;
1254 }
a61bbcf2
PM
1255
1256 NEIGH_CB(skb)->sched_next = sched_next;
1257 NEIGH_CB(skb)->flags |= LOCALLY_ENQUEUED;
1da177e4
LT
1258
1259 spin_lock(&tbl->proxy_queue.lock);
1260 if (del_timer(&tbl->proxy_timer)) {
1261 if (time_before(tbl->proxy_timer.expires, sched_next))
1262 sched_next = tbl->proxy_timer.expires;
1263 }
1264 dst_release(skb->dst);
1265 skb->dst = NULL;
1266 dev_hold(skb->dev);
1267 __skb_queue_tail(&tbl->proxy_queue, skb);
1268 mod_timer(&tbl->proxy_timer, sched_next);
1269 spin_unlock(&tbl->proxy_queue.lock);
1270}
1271
426b5303
EB
1272static inline struct neigh_parms *lookup_neigh_params(struct neigh_table *tbl,
1273 struct net *net, int ifindex)
1274{
1275 struct neigh_parms *p;
1276
1277 for (p = &tbl->parms; p; p = p->next) {
1278 if (p->net != net)
1279 continue;
1280 if ((p->dev && p->dev->ifindex == ifindex) ||
1281 (!p->dev && !ifindex))
1282 return p;
1283 }
1284
1285 return NULL;
1286}
1da177e4
LT
1287
1288struct neigh_parms *neigh_parms_alloc(struct net_device *dev,
1289 struct neigh_table *tbl)
1290{
426b5303
EB
1291 struct neigh_parms *p, *ref;
1292 struct net *net;
1293
486b51d3 1294 net = dev->nd_net;
426b5303
EB
1295 ref = lookup_neigh_params(tbl, net, 0);
1296 if (!ref)
1297 return NULL;
1da177e4 1298
426b5303 1299 p = kmemdup(ref, sizeof(*p), GFP_KERNEL);
1da177e4 1300 if (p) {
1da177e4
LT
1301 p->tbl = tbl;
1302 atomic_set(&p->refcnt, 1);
1303 INIT_RCU_HEAD(&p->rcu_head);
1304 p->reachable_time =
1305 neigh_rand_reach_time(p->base_reachable_time);
c7fb64db 1306
486b51d3
DL
1307 if (dev->neigh_setup && dev->neigh_setup(dev, p)) {
1308 kfree(p);
1309 return NULL;
1da177e4 1310 }
486b51d3
DL
1311
1312 dev_hold(dev);
1313 p->dev = dev;
426b5303 1314 p->net = hold_net(net);
1da177e4
LT
1315 p->sysctl_table = NULL;
1316 write_lock_bh(&tbl->lock);
1317 p->next = tbl->parms.next;
1318 tbl->parms.next = p;
1319 write_unlock_bh(&tbl->lock);
1320 }
1321 return p;
1322}
1323
1324static void neigh_rcu_free_parms(struct rcu_head *head)
1325{
1326 struct neigh_parms *parms =
1327 container_of(head, struct neigh_parms, rcu_head);
1328
1329 neigh_parms_put(parms);
1330}
1331
1332void neigh_parms_release(struct neigh_table *tbl, struct neigh_parms *parms)
1333{
1334 struct neigh_parms **p;
1335
1336 if (!parms || parms == &tbl->parms)
1337 return;
1338 write_lock_bh(&tbl->lock);
1339 for (p = &tbl->parms.next; *p; p = &(*p)->next) {
1340 if (*p == parms) {
1341 *p = parms->next;
1342 parms->dead = 1;
1343 write_unlock_bh(&tbl->lock);
cecbb639
DM
1344 if (parms->dev)
1345 dev_put(parms->dev);
1da177e4
LT
1346 call_rcu(&parms->rcu_head, neigh_rcu_free_parms);
1347 return;
1348 }
1349 }
1350 write_unlock_bh(&tbl->lock);
1351 NEIGH_PRINTK1("neigh_parms_release: not found\n");
1352}
1353
06f0511d 1354static void neigh_parms_destroy(struct neigh_parms *parms)
1da177e4 1355{
426b5303 1356 release_net(parms->net);
1da177e4
LT
1357 kfree(parms);
1358}
1359
c2ecba71
PE
1360static struct lock_class_key neigh_table_proxy_queue_class;
1361
bd89efc5 1362void neigh_table_init_no_netlink(struct neigh_table *tbl)
1da177e4
LT
1363{
1364 unsigned long now = jiffies;
1365 unsigned long phsize;
1366
426b5303 1367 tbl->parms.net = &init_net;
1da177e4
LT
1368 atomic_set(&tbl->parms.refcnt, 1);
1369 INIT_RCU_HEAD(&tbl->parms.rcu_head);
1370 tbl->parms.reachable_time =
1371 neigh_rand_reach_time(tbl->parms.base_reachable_time);
1372
1373 if (!tbl->kmem_cachep)
e5d679f3
AD
1374 tbl->kmem_cachep =
1375 kmem_cache_create(tbl->id, tbl->entry_size, 0,
1376 SLAB_HWCACHE_ALIGN|SLAB_PANIC,
20c2df83 1377 NULL);
1da177e4
LT
1378 tbl->stats = alloc_percpu(struct neigh_statistics);
1379 if (!tbl->stats)
1380 panic("cannot create neighbour cache statistics");
4ec93edb 1381
1da177e4 1382#ifdef CONFIG_PROC_FS
457c4cbc 1383 tbl->pde = create_proc_entry(tbl->id, 0, init_net.proc_net_stat);
4ec93edb 1384 if (!tbl->pde)
1da177e4
LT
1385 panic("cannot create neighbour proc dir entry");
1386 tbl->pde->proc_fops = &neigh_stat_seq_fops;
1387 tbl->pde->data = tbl;
1388#endif
1389
1390 tbl->hash_mask = 1;
1391 tbl->hash_buckets = neigh_hash_alloc(tbl->hash_mask + 1);
1392
1393 phsize = (PNEIGH_HASHMASK + 1) * sizeof(struct pneigh_entry *);
77d04bd9 1394 tbl->phash_buckets = kzalloc(phsize, GFP_KERNEL);
1da177e4
LT
1395
1396 if (!tbl->hash_buckets || !tbl->phash_buckets)
1397 panic("cannot allocate neighbour cache hashes");
1398
1da177e4
LT
1399 get_random_bytes(&tbl->hash_rnd, sizeof(tbl->hash_rnd));
1400
1401 rwlock_init(&tbl->lock);
b24b8a24 1402 setup_timer(&tbl->gc_timer, neigh_periodic_timer, (unsigned long)tbl);
1da177e4
LT
1403 tbl->gc_timer.expires = now + 1;
1404 add_timer(&tbl->gc_timer);
1405
b24b8a24 1406 setup_timer(&tbl->proxy_timer, neigh_proxy_process, (unsigned long)tbl);
c2ecba71
PE
1407 skb_queue_head_init_class(&tbl->proxy_queue,
1408 &neigh_table_proxy_queue_class);
1da177e4
LT
1409
1410 tbl->last_flush = now;
1411 tbl->last_rand = now + tbl->parms.reachable_time * 20;
bd89efc5
SK
1412}
1413
1414void neigh_table_init(struct neigh_table *tbl)
1415{
1416 struct neigh_table *tmp;
1417
1418 neigh_table_init_no_netlink(tbl);
1da177e4 1419 write_lock(&neigh_tbl_lock);
bd89efc5
SK
1420 for (tmp = neigh_tables; tmp; tmp = tmp->next) {
1421 if (tmp->family == tbl->family)
1422 break;
1423 }
1da177e4
LT
1424 tbl->next = neigh_tables;
1425 neigh_tables = tbl;
1426 write_unlock(&neigh_tbl_lock);
bd89efc5
SK
1427
1428 if (unlikely(tmp)) {
1429 printk(KERN_ERR "NEIGH: Registering multiple tables for "
1430 "family %d\n", tbl->family);
1431 dump_stack();
1432 }
1da177e4
LT
1433}
1434
1435int neigh_table_clear(struct neigh_table *tbl)
1436{
1437 struct neigh_table **tp;
1438
1439 /* It is not clean... Fix it to unload IPv6 module safely */
1440 del_timer_sync(&tbl->gc_timer);
1441 del_timer_sync(&tbl->proxy_timer);
1442 pneigh_queue_purge(&tbl->proxy_queue);
1443 neigh_ifdown(tbl, NULL);
1444 if (atomic_read(&tbl->entries))
1445 printk(KERN_CRIT "neighbour leakage\n");
1446 write_lock(&neigh_tbl_lock);
1447 for (tp = &neigh_tables; *tp; tp = &(*tp)->next) {
1448 if (*tp == tbl) {
1449 *tp = tbl->next;
1450 break;
1451 }
1452 }
1453 write_unlock(&neigh_tbl_lock);
1454
1455 neigh_hash_free(tbl->hash_buckets, tbl->hash_mask + 1);
1456 tbl->hash_buckets = NULL;
1457
1458 kfree(tbl->phash_buckets);
1459 tbl->phash_buckets = NULL;
1460
3f192b5c
AD
1461 remove_proc_entry(tbl->id, init_net.proc_net_stat);
1462
3fcde74b
KK
1463 free_percpu(tbl->stats);
1464 tbl->stats = NULL;
1465
bfb85c9f
RD
1466 kmem_cache_destroy(tbl->kmem_cachep);
1467 tbl->kmem_cachep = NULL;
1468
1da177e4
LT
1469 return 0;
1470}
1471
c8822a4e 1472static int neigh_delete(struct sk_buff *skb, struct nlmsghdr *nlh, void *arg)
1da177e4 1473{
881d966b 1474 struct net *net = skb->sk->sk_net;
a14a49d2
TG
1475 struct ndmsg *ndm;
1476 struct nlattr *dst_attr;
1da177e4
LT
1477 struct neigh_table *tbl;
1478 struct net_device *dev = NULL;
a14a49d2 1479 int err = -EINVAL;
1da177e4 1480
a14a49d2 1481 if (nlmsg_len(nlh) < sizeof(*ndm))
1da177e4
LT
1482 goto out;
1483
a14a49d2
TG
1484 dst_attr = nlmsg_find_attr(nlh, sizeof(*ndm), NDA_DST);
1485 if (dst_attr == NULL)
1486 goto out;
1487
1488 ndm = nlmsg_data(nlh);
1489 if (ndm->ndm_ifindex) {
881d966b 1490 dev = dev_get_by_index(net, ndm->ndm_ifindex);
a14a49d2
TG
1491 if (dev == NULL) {
1492 err = -ENODEV;
1493 goto out;
1494 }
1495 }
1496
1da177e4
LT
1497 read_lock(&neigh_tbl_lock);
1498 for (tbl = neigh_tables; tbl; tbl = tbl->next) {
a14a49d2 1499 struct neighbour *neigh;
1da177e4
LT
1500
1501 if (tbl->family != ndm->ndm_family)
1502 continue;
1503 read_unlock(&neigh_tbl_lock);
1504
a14a49d2 1505 if (nla_len(dst_attr) < tbl->key_len)
1da177e4
LT
1506 goto out_dev_put;
1507
1508 if (ndm->ndm_flags & NTF_PROXY) {
426b5303 1509 err = pneigh_delete(tbl, net, nla_data(dst_attr), dev);
1da177e4
LT
1510 goto out_dev_put;
1511 }
1512
a14a49d2
TG
1513 if (dev == NULL)
1514 goto out_dev_put;
1da177e4 1515
a14a49d2
TG
1516 neigh = neigh_lookup(tbl, nla_data(dst_attr), dev);
1517 if (neigh == NULL) {
1518 err = -ENOENT;
1519 goto out_dev_put;
1da177e4 1520 }
a14a49d2
TG
1521
1522 err = neigh_update(neigh, NULL, NUD_FAILED,
1523 NEIGH_UPDATE_F_OVERRIDE |
1524 NEIGH_UPDATE_F_ADMIN);
1525 neigh_release(neigh);
1da177e4
LT
1526 goto out_dev_put;
1527 }
1528 read_unlock(&neigh_tbl_lock);
a14a49d2
TG
1529 err = -EAFNOSUPPORT;
1530
1da177e4
LT
1531out_dev_put:
1532 if (dev)
1533 dev_put(dev);
1534out:
1535 return err;
1536}
1537
c8822a4e 1538static int neigh_add(struct sk_buff *skb, struct nlmsghdr *nlh, void *arg)
1da177e4 1539{
881d966b 1540 struct net *net = skb->sk->sk_net;
5208debd
TG
1541 struct ndmsg *ndm;
1542 struct nlattr *tb[NDA_MAX+1];
1da177e4
LT
1543 struct neigh_table *tbl;
1544 struct net_device *dev = NULL;
5208debd 1545 int err;
1da177e4 1546
5208debd
TG
1547 err = nlmsg_parse(nlh, sizeof(*ndm), tb, NDA_MAX, NULL);
1548 if (err < 0)
1da177e4
LT
1549 goto out;
1550
5208debd
TG
1551 err = -EINVAL;
1552 if (tb[NDA_DST] == NULL)
1553 goto out;
1554
1555 ndm = nlmsg_data(nlh);
1556 if (ndm->ndm_ifindex) {
881d966b 1557 dev = dev_get_by_index(net, ndm->ndm_ifindex);
5208debd
TG
1558 if (dev == NULL) {
1559 err = -ENODEV;
1560 goto out;
1561 }
1562
1563 if (tb[NDA_LLADDR] && nla_len(tb[NDA_LLADDR]) < dev->addr_len)
1564 goto out_dev_put;
1565 }
1566
1da177e4
LT
1567 read_lock(&neigh_tbl_lock);
1568 for (tbl = neigh_tables; tbl; tbl = tbl->next) {
5208debd
TG
1569 int flags = NEIGH_UPDATE_F_ADMIN | NEIGH_UPDATE_F_OVERRIDE;
1570 struct neighbour *neigh;
1571 void *dst, *lladdr;
1da177e4
LT
1572
1573 if (tbl->family != ndm->ndm_family)
1574 continue;
1575 read_unlock(&neigh_tbl_lock);
1576
5208debd 1577 if (nla_len(tb[NDA_DST]) < tbl->key_len)
1da177e4 1578 goto out_dev_put;
5208debd
TG
1579 dst = nla_data(tb[NDA_DST]);
1580 lladdr = tb[NDA_LLADDR] ? nla_data(tb[NDA_LLADDR]) : NULL;
1da177e4
LT
1581
1582 if (ndm->ndm_flags & NTF_PROXY) {
62dd9318
VN
1583 struct pneigh_entry *pn;
1584
1585 err = -ENOBUFS;
426b5303 1586 pn = pneigh_lookup(tbl, net, dst, dev, 1);
62dd9318
VN
1587 if (pn) {
1588 pn->flags = ndm->ndm_flags;
1589 err = 0;
1590 }
1da177e4
LT
1591 goto out_dev_put;
1592 }
1593
5208debd 1594 if (dev == NULL)
1da177e4 1595 goto out_dev_put;
5208debd
TG
1596
1597 neigh = neigh_lookup(tbl, dst, dev);
1598 if (neigh == NULL) {
1599 if (!(nlh->nlmsg_flags & NLM_F_CREATE)) {
1600 err = -ENOENT;
1601 goto out_dev_put;
1602 }
4ec93edb 1603
5208debd
TG
1604 neigh = __neigh_lookup_errno(tbl, dst, dev);
1605 if (IS_ERR(neigh)) {
1606 err = PTR_ERR(neigh);
1da177e4
LT
1607 goto out_dev_put;
1608 }
1da177e4 1609 } else {
5208debd
TG
1610 if (nlh->nlmsg_flags & NLM_F_EXCL) {
1611 err = -EEXIST;
1612 neigh_release(neigh);
1da177e4
LT
1613 goto out_dev_put;
1614 }
1da177e4 1615
5208debd
TG
1616 if (!(nlh->nlmsg_flags & NLM_F_REPLACE))
1617 flags &= ~NEIGH_UPDATE_F_OVERRIDE;
1618 }
1da177e4 1619
5208debd
TG
1620 err = neigh_update(neigh, lladdr, ndm->ndm_state, flags);
1621 neigh_release(neigh);
1da177e4
LT
1622 goto out_dev_put;
1623 }
1624
1625 read_unlock(&neigh_tbl_lock);
5208debd
TG
1626 err = -EAFNOSUPPORT;
1627
1da177e4
LT
1628out_dev_put:
1629 if (dev)
1630 dev_put(dev);
1631out:
1632 return err;
1633}
1634
c7fb64db
TG
1635static int neightbl_fill_parms(struct sk_buff *skb, struct neigh_parms *parms)
1636{
ca860fb3
TG
1637 struct nlattr *nest;
1638
1639 nest = nla_nest_start(skb, NDTA_PARMS);
1640 if (nest == NULL)
1641 return -ENOBUFS;
c7fb64db
TG
1642
1643 if (parms->dev)
ca860fb3
TG
1644 NLA_PUT_U32(skb, NDTPA_IFINDEX, parms->dev->ifindex);
1645
1646 NLA_PUT_U32(skb, NDTPA_REFCNT, atomic_read(&parms->refcnt));
1647 NLA_PUT_U32(skb, NDTPA_QUEUE_LEN, parms->queue_len);
1648 NLA_PUT_U32(skb, NDTPA_PROXY_QLEN, parms->proxy_qlen);
1649 NLA_PUT_U32(skb, NDTPA_APP_PROBES, parms->app_probes);
1650 NLA_PUT_U32(skb, NDTPA_UCAST_PROBES, parms->ucast_probes);
1651 NLA_PUT_U32(skb, NDTPA_MCAST_PROBES, parms->mcast_probes);
1652 NLA_PUT_MSECS(skb, NDTPA_REACHABLE_TIME, parms->reachable_time);
1653 NLA_PUT_MSECS(skb, NDTPA_BASE_REACHABLE_TIME,
c7fb64db 1654 parms->base_reachable_time);
ca860fb3
TG
1655 NLA_PUT_MSECS(skb, NDTPA_GC_STALETIME, parms->gc_staletime);
1656 NLA_PUT_MSECS(skb, NDTPA_DELAY_PROBE_TIME, parms->delay_probe_time);
1657 NLA_PUT_MSECS(skb, NDTPA_RETRANS_TIME, parms->retrans_time);
1658 NLA_PUT_MSECS(skb, NDTPA_ANYCAST_DELAY, parms->anycast_delay);
1659 NLA_PUT_MSECS(skb, NDTPA_PROXY_DELAY, parms->proxy_delay);
1660 NLA_PUT_MSECS(skb, NDTPA_LOCKTIME, parms->locktime);
c7fb64db 1661
ca860fb3 1662 return nla_nest_end(skb, nest);
c7fb64db 1663
ca860fb3
TG
1664nla_put_failure:
1665 return nla_nest_cancel(skb, nest);
c7fb64db
TG
1666}
1667
ca860fb3
TG
1668static int neightbl_fill_info(struct sk_buff *skb, struct neigh_table *tbl,
1669 u32 pid, u32 seq, int type, int flags)
c7fb64db
TG
1670{
1671 struct nlmsghdr *nlh;
1672 struct ndtmsg *ndtmsg;
1673
ca860fb3
TG
1674 nlh = nlmsg_put(skb, pid, seq, type, sizeof(*ndtmsg), flags);
1675 if (nlh == NULL)
26932566 1676 return -EMSGSIZE;
c7fb64db 1677
ca860fb3 1678 ndtmsg = nlmsg_data(nlh);
c7fb64db
TG
1679
1680 read_lock_bh(&tbl->lock);
1681 ndtmsg->ndtm_family = tbl->family;
9ef1d4c7
PM
1682 ndtmsg->ndtm_pad1 = 0;
1683 ndtmsg->ndtm_pad2 = 0;
c7fb64db 1684
ca860fb3
TG
1685 NLA_PUT_STRING(skb, NDTA_NAME, tbl->id);
1686 NLA_PUT_MSECS(skb, NDTA_GC_INTERVAL, tbl->gc_interval);
1687 NLA_PUT_U32(skb, NDTA_THRESH1, tbl->gc_thresh1);
1688 NLA_PUT_U32(skb, NDTA_THRESH2, tbl->gc_thresh2);
1689 NLA_PUT_U32(skb, NDTA_THRESH3, tbl->gc_thresh3);
c7fb64db
TG
1690
1691 {
1692 unsigned long now = jiffies;
1693 unsigned int flush_delta = now - tbl->last_flush;
1694 unsigned int rand_delta = now - tbl->last_rand;
1695
1696 struct ndt_config ndc = {
1697 .ndtc_key_len = tbl->key_len,
1698 .ndtc_entry_size = tbl->entry_size,
1699 .ndtc_entries = atomic_read(&tbl->entries),
1700 .ndtc_last_flush = jiffies_to_msecs(flush_delta),
1701 .ndtc_last_rand = jiffies_to_msecs(rand_delta),
1702 .ndtc_hash_rnd = tbl->hash_rnd,
1703 .ndtc_hash_mask = tbl->hash_mask,
1704 .ndtc_hash_chain_gc = tbl->hash_chain_gc,
1705 .ndtc_proxy_qlen = tbl->proxy_queue.qlen,
1706 };
1707
ca860fb3 1708 NLA_PUT(skb, NDTA_CONFIG, sizeof(ndc), &ndc);
c7fb64db
TG
1709 }
1710
1711 {
1712 int cpu;
1713 struct ndt_stats ndst;
1714
1715 memset(&ndst, 0, sizeof(ndst));
1716
6f912042 1717 for_each_possible_cpu(cpu) {
c7fb64db
TG
1718 struct neigh_statistics *st;
1719
c7fb64db
TG
1720 st = per_cpu_ptr(tbl->stats, cpu);
1721 ndst.ndts_allocs += st->allocs;
1722 ndst.ndts_destroys += st->destroys;
1723 ndst.ndts_hash_grows += st->hash_grows;
1724 ndst.ndts_res_failed += st->res_failed;
1725 ndst.ndts_lookups += st->lookups;
1726 ndst.ndts_hits += st->hits;
1727 ndst.ndts_rcv_probes_mcast += st->rcv_probes_mcast;
1728 ndst.ndts_rcv_probes_ucast += st->rcv_probes_ucast;
1729 ndst.ndts_periodic_gc_runs += st->periodic_gc_runs;
1730 ndst.ndts_forced_gc_runs += st->forced_gc_runs;
1731 }
1732
ca860fb3 1733 NLA_PUT(skb, NDTA_STATS, sizeof(ndst), &ndst);
c7fb64db
TG
1734 }
1735
1736 BUG_ON(tbl->parms.dev);
1737 if (neightbl_fill_parms(skb, &tbl->parms) < 0)
ca860fb3 1738 goto nla_put_failure;
c7fb64db
TG
1739
1740 read_unlock_bh(&tbl->lock);
ca860fb3 1741 return nlmsg_end(skb, nlh);
c7fb64db 1742
ca860fb3 1743nla_put_failure:
c7fb64db 1744 read_unlock_bh(&tbl->lock);
26932566
PM
1745 nlmsg_cancel(skb, nlh);
1746 return -EMSGSIZE;
c7fb64db
TG
1747}
1748
ca860fb3
TG
1749static int neightbl_fill_param_info(struct sk_buff *skb,
1750 struct neigh_table *tbl,
c7fb64db 1751 struct neigh_parms *parms,
ca860fb3
TG
1752 u32 pid, u32 seq, int type,
1753 unsigned int flags)
c7fb64db
TG
1754{
1755 struct ndtmsg *ndtmsg;
1756 struct nlmsghdr *nlh;
1757
ca860fb3
TG
1758 nlh = nlmsg_put(skb, pid, seq, type, sizeof(*ndtmsg), flags);
1759 if (nlh == NULL)
26932566 1760 return -EMSGSIZE;
c7fb64db 1761
ca860fb3 1762 ndtmsg = nlmsg_data(nlh);
c7fb64db
TG
1763
1764 read_lock_bh(&tbl->lock);
1765 ndtmsg->ndtm_family = tbl->family;
9ef1d4c7
PM
1766 ndtmsg->ndtm_pad1 = 0;
1767 ndtmsg->ndtm_pad2 = 0;
c7fb64db 1768
ca860fb3
TG
1769 if (nla_put_string(skb, NDTA_NAME, tbl->id) < 0 ||
1770 neightbl_fill_parms(skb, parms) < 0)
1771 goto errout;
c7fb64db
TG
1772
1773 read_unlock_bh(&tbl->lock);
ca860fb3
TG
1774 return nlmsg_end(skb, nlh);
1775errout:
c7fb64db 1776 read_unlock_bh(&tbl->lock);
26932566
PM
1777 nlmsg_cancel(skb, nlh);
1778 return -EMSGSIZE;
c7fb64db 1779}
4ec93edb 1780
ef7c79ed 1781static const struct nla_policy nl_neightbl_policy[NDTA_MAX+1] = {
6b3f8674
TG
1782 [NDTA_NAME] = { .type = NLA_STRING },
1783 [NDTA_THRESH1] = { .type = NLA_U32 },
1784 [NDTA_THRESH2] = { .type = NLA_U32 },
1785 [NDTA_THRESH3] = { .type = NLA_U32 },
1786 [NDTA_GC_INTERVAL] = { .type = NLA_U64 },
1787 [NDTA_PARMS] = { .type = NLA_NESTED },
1788};
1789
ef7c79ed 1790static const struct nla_policy nl_ntbl_parm_policy[NDTPA_MAX+1] = {
6b3f8674
TG
1791 [NDTPA_IFINDEX] = { .type = NLA_U32 },
1792 [NDTPA_QUEUE_LEN] = { .type = NLA_U32 },
1793 [NDTPA_PROXY_QLEN] = { .type = NLA_U32 },
1794 [NDTPA_APP_PROBES] = { .type = NLA_U32 },
1795 [NDTPA_UCAST_PROBES] = { .type = NLA_U32 },
1796 [NDTPA_MCAST_PROBES] = { .type = NLA_U32 },
1797 [NDTPA_BASE_REACHABLE_TIME] = { .type = NLA_U64 },
1798 [NDTPA_GC_STALETIME] = { .type = NLA_U64 },
1799 [NDTPA_DELAY_PROBE_TIME] = { .type = NLA_U64 },
1800 [NDTPA_RETRANS_TIME] = { .type = NLA_U64 },
1801 [NDTPA_ANYCAST_DELAY] = { .type = NLA_U64 },
1802 [NDTPA_PROXY_DELAY] = { .type = NLA_U64 },
1803 [NDTPA_LOCKTIME] = { .type = NLA_U64 },
1804};
1805
c8822a4e 1806static int neightbl_set(struct sk_buff *skb, struct nlmsghdr *nlh, void *arg)
c7fb64db 1807{
b854272b 1808 struct net *net = skb->sk->sk_net;
c7fb64db 1809 struct neigh_table *tbl;
6b3f8674
TG
1810 struct ndtmsg *ndtmsg;
1811 struct nlattr *tb[NDTA_MAX+1];
1812 int err;
c7fb64db 1813
6b3f8674
TG
1814 err = nlmsg_parse(nlh, sizeof(*ndtmsg), tb, NDTA_MAX,
1815 nl_neightbl_policy);
1816 if (err < 0)
1817 goto errout;
c7fb64db 1818
6b3f8674
TG
1819 if (tb[NDTA_NAME] == NULL) {
1820 err = -EINVAL;
1821 goto errout;
1822 }
1823
1824 ndtmsg = nlmsg_data(nlh);
c7fb64db
TG
1825 read_lock(&neigh_tbl_lock);
1826 for (tbl = neigh_tables; tbl; tbl = tbl->next) {
1827 if (ndtmsg->ndtm_family && tbl->family != ndtmsg->ndtm_family)
1828 continue;
1829
6b3f8674 1830 if (nla_strcmp(tb[NDTA_NAME], tbl->id) == 0)
c7fb64db
TG
1831 break;
1832 }
1833
1834 if (tbl == NULL) {
1835 err = -ENOENT;
6b3f8674 1836 goto errout_locked;
c7fb64db
TG
1837 }
1838
4ec93edb 1839 /*
c7fb64db
TG
1840 * We acquire tbl->lock to be nice to the periodic timers and
1841 * make sure they always see a consistent set of values.
1842 */
1843 write_lock_bh(&tbl->lock);
1844
6b3f8674
TG
1845 if (tb[NDTA_PARMS]) {
1846 struct nlattr *tbp[NDTPA_MAX+1];
c7fb64db 1847 struct neigh_parms *p;
6b3f8674 1848 int i, ifindex = 0;
c7fb64db 1849
6b3f8674
TG
1850 err = nla_parse_nested(tbp, NDTPA_MAX, tb[NDTA_PARMS],
1851 nl_ntbl_parm_policy);
1852 if (err < 0)
1853 goto errout_tbl_lock;
c7fb64db 1854
6b3f8674
TG
1855 if (tbp[NDTPA_IFINDEX])
1856 ifindex = nla_get_u32(tbp[NDTPA_IFINDEX]);
c7fb64db 1857
426b5303 1858 p = lookup_neigh_params(tbl, net, ifindex);
c7fb64db
TG
1859 if (p == NULL) {
1860 err = -ENOENT;
6b3f8674 1861 goto errout_tbl_lock;
c7fb64db 1862 }
c7fb64db 1863
6b3f8674
TG
1864 for (i = 1; i <= NDTPA_MAX; i++) {
1865 if (tbp[i] == NULL)
1866 continue;
c7fb64db 1867
6b3f8674
TG
1868 switch (i) {
1869 case NDTPA_QUEUE_LEN:
1870 p->queue_len = nla_get_u32(tbp[i]);
1871 break;
1872 case NDTPA_PROXY_QLEN:
1873 p->proxy_qlen = nla_get_u32(tbp[i]);
1874 break;
1875 case NDTPA_APP_PROBES:
1876 p->app_probes = nla_get_u32(tbp[i]);
1877 break;
1878 case NDTPA_UCAST_PROBES:
1879 p->ucast_probes = nla_get_u32(tbp[i]);
1880 break;
1881 case NDTPA_MCAST_PROBES:
1882 p->mcast_probes = nla_get_u32(tbp[i]);
1883 break;
1884 case NDTPA_BASE_REACHABLE_TIME:
1885 p->base_reachable_time = nla_get_msecs(tbp[i]);
1886 break;
1887 case NDTPA_GC_STALETIME:
1888 p->gc_staletime = nla_get_msecs(tbp[i]);
1889 break;
1890 case NDTPA_DELAY_PROBE_TIME:
1891 p->delay_probe_time = nla_get_msecs(tbp[i]);
1892 break;
1893 case NDTPA_RETRANS_TIME:
1894 p->retrans_time = nla_get_msecs(tbp[i]);
1895 break;
1896 case NDTPA_ANYCAST_DELAY:
1897 p->anycast_delay = nla_get_msecs(tbp[i]);
1898 break;
1899 case NDTPA_PROXY_DELAY:
1900 p->proxy_delay = nla_get_msecs(tbp[i]);
1901 break;
1902 case NDTPA_LOCKTIME:
1903 p->locktime = nla_get_msecs(tbp[i]);
1904 break;
1905 }
1906 }
1907 }
c7fb64db 1908
6b3f8674
TG
1909 if (tb[NDTA_THRESH1])
1910 tbl->gc_thresh1 = nla_get_u32(tb[NDTA_THRESH1]);
c7fb64db 1911
6b3f8674
TG
1912 if (tb[NDTA_THRESH2])
1913 tbl->gc_thresh2 = nla_get_u32(tb[NDTA_THRESH2]);
c7fb64db 1914
6b3f8674
TG
1915 if (tb[NDTA_THRESH3])
1916 tbl->gc_thresh3 = nla_get_u32(tb[NDTA_THRESH3]);
c7fb64db 1917
6b3f8674
TG
1918 if (tb[NDTA_GC_INTERVAL])
1919 tbl->gc_interval = nla_get_msecs(tb[NDTA_GC_INTERVAL]);
c7fb64db
TG
1920
1921 err = 0;
1922
6b3f8674 1923errout_tbl_lock:
c7fb64db 1924 write_unlock_bh(&tbl->lock);
6b3f8674 1925errout_locked:
c7fb64db 1926 read_unlock(&neigh_tbl_lock);
6b3f8674 1927errout:
c7fb64db
TG
1928 return err;
1929}
1930
c8822a4e 1931static int neightbl_dump_info(struct sk_buff *skb, struct netlink_callback *cb)
c7fb64db 1932{
b854272b 1933 struct net *net = skb->sk->sk_net;
ca860fb3
TG
1934 int family, tidx, nidx = 0;
1935 int tbl_skip = cb->args[0];
1936 int neigh_skip = cb->args[1];
c7fb64db
TG
1937 struct neigh_table *tbl;
1938
ca860fb3 1939 family = ((struct rtgenmsg *) nlmsg_data(cb->nlh))->rtgen_family;
c7fb64db
TG
1940
1941 read_lock(&neigh_tbl_lock);
ca860fb3 1942 for (tbl = neigh_tables, tidx = 0; tbl; tbl = tbl->next, tidx++) {
c7fb64db
TG
1943 struct neigh_parms *p;
1944
ca860fb3 1945 if (tidx < tbl_skip || (family && tbl->family != family))
c7fb64db
TG
1946 continue;
1947
ca860fb3
TG
1948 if (neightbl_fill_info(skb, tbl, NETLINK_CB(cb->skb).pid,
1949 cb->nlh->nlmsg_seq, RTM_NEWNEIGHTBL,
1950 NLM_F_MULTI) <= 0)
c7fb64db
TG
1951 break;
1952
426b5303
EB
1953 for (nidx = 0, p = tbl->parms.next; p; p = p->next) {
1954 if (net != p->net)
1955 continue;
1956
1957 if (nidx++ < neigh_skip)
c7fb64db
TG
1958 continue;
1959
ca860fb3
TG
1960 if (neightbl_fill_param_info(skb, tbl, p,
1961 NETLINK_CB(cb->skb).pid,
1962 cb->nlh->nlmsg_seq,
1963 RTM_NEWNEIGHTBL,
1964 NLM_F_MULTI) <= 0)
c7fb64db
TG
1965 goto out;
1966 }
1967
ca860fb3 1968 neigh_skip = 0;
c7fb64db
TG
1969 }
1970out:
1971 read_unlock(&neigh_tbl_lock);
ca860fb3
TG
1972 cb->args[0] = tidx;
1973 cb->args[1] = nidx;
c7fb64db
TG
1974
1975 return skb->len;
1976}
1da177e4 1977
8b8aec50
TG
1978static int neigh_fill_info(struct sk_buff *skb, struct neighbour *neigh,
1979 u32 pid, u32 seq, int type, unsigned int flags)
1da177e4
LT
1980{
1981 unsigned long now = jiffies;
1da177e4 1982 struct nda_cacheinfo ci;
8b8aec50
TG
1983 struct nlmsghdr *nlh;
1984 struct ndmsg *ndm;
1985
1986 nlh = nlmsg_put(skb, pid, seq, type, sizeof(*ndm), flags);
1987 if (nlh == NULL)
26932566 1988 return -EMSGSIZE;
1da177e4 1989
8b8aec50
TG
1990 ndm = nlmsg_data(nlh);
1991 ndm->ndm_family = neigh->ops->family;
9ef1d4c7
PM
1992 ndm->ndm_pad1 = 0;
1993 ndm->ndm_pad2 = 0;
8b8aec50
TG
1994 ndm->ndm_flags = neigh->flags;
1995 ndm->ndm_type = neigh->type;
1996 ndm->ndm_ifindex = neigh->dev->ifindex;
1da177e4 1997
8b8aec50
TG
1998 NLA_PUT(skb, NDA_DST, neigh->tbl->key_len, neigh->primary_key);
1999
2000 read_lock_bh(&neigh->lock);
2001 ndm->ndm_state = neigh->nud_state;
2002 if ((neigh->nud_state & NUD_VALID) &&
2003 nla_put(skb, NDA_LLADDR, neigh->dev->addr_len, neigh->ha) < 0) {
2004 read_unlock_bh(&neigh->lock);
2005 goto nla_put_failure;
2006 }
2007
2008 ci.ndm_used = now - neigh->used;
2009 ci.ndm_confirmed = now - neigh->confirmed;
2010 ci.ndm_updated = now - neigh->updated;
2011 ci.ndm_refcnt = atomic_read(&neigh->refcnt) - 1;
2012 read_unlock_bh(&neigh->lock);
2013
2014 NLA_PUT_U32(skb, NDA_PROBES, atomic_read(&neigh->probes));
2015 NLA_PUT(skb, NDA_CACHEINFO, sizeof(ci), &ci);
2016
2017 return nlmsg_end(skb, nlh);
2018
2019nla_put_failure:
26932566
PM
2020 nlmsg_cancel(skb, nlh);
2021 return -EMSGSIZE;
1da177e4
LT
2022}
2023
d961db35
TG
2024static void neigh_update_notify(struct neighbour *neigh)
2025{
2026 call_netevent_notifiers(NETEVENT_NEIGH_UPDATE, neigh);
2027 __neigh_notify(neigh, RTM_NEWNEIGH, 0);
2028}
1da177e4
LT
2029
2030static int neigh_dump_table(struct neigh_table *tbl, struct sk_buff *skb,
2031 struct netlink_callback *cb)
2032{
426b5303 2033 struct net * net = skb->sk->sk_net;
1da177e4
LT
2034 struct neighbour *n;
2035 int rc, h, s_h = cb->args[1];
2036 int idx, s_idx = idx = cb->args[2];
2037
c5e29460 2038 read_lock_bh(&tbl->lock);
1da177e4
LT
2039 for (h = 0; h <= tbl->hash_mask; h++) {
2040 if (h < s_h)
2041 continue;
2042 if (h > s_h)
2043 s_idx = 0;
426b5303
EB
2044 for (n = tbl->hash_buckets[h], idx = 0; n; n = n->next) {
2045 int lidx;
2046 if (n->dev->nd_net != net)
2047 continue;
2048 lidx = idx++;
2049 if (lidx < s_idx)
1da177e4
LT
2050 continue;
2051 if (neigh_fill_info(skb, n, NETLINK_CB(cb->skb).pid,
2052 cb->nlh->nlmsg_seq,
b6544c0b
JHS
2053 RTM_NEWNEIGH,
2054 NLM_F_MULTI) <= 0) {
1da177e4
LT
2055 read_unlock_bh(&tbl->lock);
2056 rc = -1;
2057 goto out;
2058 }
2059 }
1da177e4 2060 }
c5e29460 2061 read_unlock_bh(&tbl->lock);
1da177e4
LT
2062 rc = skb->len;
2063out:
2064 cb->args[1] = h;
2065 cb->args[2] = idx;
2066 return rc;
2067}
2068
c8822a4e 2069static int neigh_dump_info(struct sk_buff *skb, struct netlink_callback *cb)
1da177e4
LT
2070{
2071 struct neigh_table *tbl;
2072 int t, family, s_t;
2073
2074 read_lock(&neigh_tbl_lock);
8b8aec50 2075 family = ((struct rtgenmsg *) nlmsg_data(cb->nlh))->rtgen_family;
1da177e4
LT
2076 s_t = cb->args[0];
2077
2078 for (tbl = neigh_tables, t = 0; tbl; tbl = tbl->next, t++) {
2079 if (t < s_t || (family && tbl->family != family))
2080 continue;
2081 if (t > s_t)
2082 memset(&cb->args[1], 0, sizeof(cb->args) -
2083 sizeof(cb->args[0]));
2084 if (neigh_dump_table(tbl, skb, cb) < 0)
2085 break;
2086 }
2087 read_unlock(&neigh_tbl_lock);
2088
2089 cb->args[0] = t;
2090 return skb->len;
2091}
2092
2093void neigh_for_each(struct neigh_table *tbl, void (*cb)(struct neighbour *, void *), void *cookie)
2094{
2095 int chain;
2096
2097 read_lock_bh(&tbl->lock);
2098 for (chain = 0; chain <= tbl->hash_mask; chain++) {
2099 struct neighbour *n;
2100
2101 for (n = tbl->hash_buckets[chain]; n; n = n->next)
2102 cb(n, cookie);
2103 }
2104 read_unlock_bh(&tbl->lock);
2105}
2106EXPORT_SYMBOL(neigh_for_each);
2107
2108/* The tbl->lock must be held as a writer and BH disabled. */
2109void __neigh_for_each_release(struct neigh_table *tbl,
2110 int (*cb)(struct neighbour *))
2111{
2112 int chain;
2113
2114 for (chain = 0; chain <= tbl->hash_mask; chain++) {
2115 struct neighbour *n, **np;
2116
2117 np = &tbl->hash_buckets[chain];
2118 while ((n = *np) != NULL) {
2119 int release;
2120
2121 write_lock(&n->lock);
2122 release = cb(n);
2123 if (release) {
2124 *np = n->next;
2125 n->dead = 1;
2126 } else
2127 np = &n->next;
2128 write_unlock(&n->lock);
4f494554
TG
2129 if (release)
2130 neigh_cleanup_and_release(n);
1da177e4
LT
2131 }
2132 }
2133}
2134EXPORT_SYMBOL(__neigh_for_each_release);
2135
2136#ifdef CONFIG_PROC_FS
2137
2138static struct neighbour *neigh_get_first(struct seq_file *seq)
2139{
2140 struct neigh_seq_state *state = seq->private;
42508461 2141 struct net *net = state->p.net;
1da177e4
LT
2142 struct neigh_table *tbl = state->tbl;
2143 struct neighbour *n = NULL;
2144 int bucket = state->bucket;
2145
2146 state->flags &= ~NEIGH_SEQ_IS_PNEIGH;
2147 for (bucket = 0; bucket <= tbl->hash_mask; bucket++) {
2148 n = tbl->hash_buckets[bucket];
2149
2150 while (n) {
426b5303
EB
2151 if (n->dev->nd_net != net)
2152 goto next;
1da177e4
LT
2153 if (state->neigh_sub_iter) {
2154 loff_t fakep = 0;
2155 void *v;
2156
2157 v = state->neigh_sub_iter(state, n, &fakep);
2158 if (!v)
2159 goto next;
2160 }
2161 if (!(state->flags & NEIGH_SEQ_SKIP_NOARP))
2162 break;
2163 if (n->nud_state & ~NUD_NOARP)
2164 break;
2165 next:
2166 n = n->next;
2167 }
2168
2169 if (n)
2170 break;
2171 }
2172 state->bucket = bucket;
2173
2174 return n;
2175}
2176
2177static struct neighbour *neigh_get_next(struct seq_file *seq,
2178 struct neighbour *n,
2179 loff_t *pos)
2180{
2181 struct neigh_seq_state *state = seq->private;
42508461 2182 struct net *net = state->p.net;
1da177e4
LT
2183 struct neigh_table *tbl = state->tbl;
2184
2185 if (state->neigh_sub_iter) {
2186 void *v = state->neigh_sub_iter(state, n, pos);
2187 if (v)
2188 return n;
2189 }
2190 n = n->next;
2191
2192 while (1) {
2193 while (n) {
426b5303
EB
2194 if (n->dev->nd_net != net)
2195 goto next;
1da177e4
LT
2196 if (state->neigh_sub_iter) {
2197 void *v = state->neigh_sub_iter(state, n, pos);
2198 if (v)
2199 return n;
2200 goto next;
2201 }
2202 if (!(state->flags & NEIGH_SEQ_SKIP_NOARP))
2203 break;
2204
2205 if (n->nud_state & ~NUD_NOARP)
2206 break;
2207 next:
2208 n = n->next;
2209 }
2210
2211 if (n)
2212 break;
2213
2214 if (++state->bucket > tbl->hash_mask)
2215 break;
2216
2217 n = tbl->hash_buckets[state->bucket];
2218 }
2219
2220 if (n && pos)
2221 --(*pos);
2222 return n;
2223}
2224
2225static struct neighbour *neigh_get_idx(struct seq_file *seq, loff_t *pos)
2226{
2227 struct neighbour *n = neigh_get_first(seq);
2228
2229 if (n) {
2230 while (*pos) {
2231 n = neigh_get_next(seq, n, pos);
2232 if (!n)
2233 break;
2234 }
2235 }
2236 return *pos ? NULL : n;
2237}
2238
2239static struct pneigh_entry *pneigh_get_first(struct seq_file *seq)
2240{
2241 struct neigh_seq_state *state = seq->private;
42508461 2242 struct net * net = state->p.net;
1da177e4
LT
2243 struct neigh_table *tbl = state->tbl;
2244 struct pneigh_entry *pn = NULL;
2245 int bucket = state->bucket;
2246
2247 state->flags |= NEIGH_SEQ_IS_PNEIGH;
2248 for (bucket = 0; bucket <= PNEIGH_HASHMASK; bucket++) {
2249 pn = tbl->phash_buckets[bucket];
426b5303
EB
2250 while (pn && (pn->net != net))
2251 pn = pn->next;
1da177e4
LT
2252 if (pn)
2253 break;
2254 }
2255 state->bucket = bucket;
2256
2257 return pn;
2258}
2259
2260static struct pneigh_entry *pneigh_get_next(struct seq_file *seq,
2261 struct pneigh_entry *pn,
2262 loff_t *pos)
2263{
2264 struct neigh_seq_state *state = seq->private;
42508461 2265 struct net * net = state->p.net;
1da177e4
LT
2266 struct neigh_table *tbl = state->tbl;
2267
2268 pn = pn->next;
2269 while (!pn) {
2270 if (++state->bucket > PNEIGH_HASHMASK)
2271 break;
2272 pn = tbl->phash_buckets[state->bucket];
426b5303
EB
2273 while (pn && (pn->net != net))
2274 pn = pn->next;
1da177e4
LT
2275 if (pn)
2276 break;
2277 }
2278
2279 if (pn && pos)
2280 --(*pos);
2281
2282 return pn;
2283}
2284
2285static struct pneigh_entry *pneigh_get_idx(struct seq_file *seq, loff_t *pos)
2286{
2287 struct pneigh_entry *pn = pneigh_get_first(seq);
2288
2289 if (pn) {
2290 while (*pos) {
2291 pn = pneigh_get_next(seq, pn, pos);
2292 if (!pn)
2293 break;
2294 }
2295 }
2296 return *pos ? NULL : pn;
2297}
2298
2299static void *neigh_get_idx_any(struct seq_file *seq, loff_t *pos)
2300{
2301 struct neigh_seq_state *state = seq->private;
2302 void *rc;
2303
2304 rc = neigh_get_idx(seq, pos);
2305 if (!rc && !(state->flags & NEIGH_SEQ_NEIGH_ONLY))
2306 rc = pneigh_get_idx(seq, pos);
2307
2308 return rc;
2309}
2310
2311void *neigh_seq_start(struct seq_file *seq, loff_t *pos, struct neigh_table *tbl, unsigned int neigh_seq_flags)
9a429c49 2312 __acquires(tbl->lock)
1da177e4
LT
2313{
2314 struct neigh_seq_state *state = seq->private;
2315 loff_t pos_minus_one;
2316
2317 state->tbl = tbl;
2318 state->bucket = 0;
2319 state->flags = (neigh_seq_flags & ~NEIGH_SEQ_IS_PNEIGH);
2320
2321 read_lock_bh(&tbl->lock);
2322
2323 pos_minus_one = *pos - 1;
2324 return *pos ? neigh_get_idx_any(seq, &pos_minus_one) : SEQ_START_TOKEN;
2325}
2326EXPORT_SYMBOL(neigh_seq_start);
2327
2328void *neigh_seq_next(struct seq_file *seq, void *v, loff_t *pos)
2329{
2330 struct neigh_seq_state *state;
2331 void *rc;
2332
2333 if (v == SEQ_START_TOKEN) {
2334 rc = neigh_get_idx(seq, pos);
2335 goto out;
2336 }
2337
2338 state = seq->private;
2339 if (!(state->flags & NEIGH_SEQ_IS_PNEIGH)) {
2340 rc = neigh_get_next(seq, v, NULL);
2341 if (rc)
2342 goto out;
2343 if (!(state->flags & NEIGH_SEQ_NEIGH_ONLY))
2344 rc = pneigh_get_first(seq);
2345 } else {
2346 BUG_ON(state->flags & NEIGH_SEQ_NEIGH_ONLY);
2347 rc = pneigh_get_next(seq, v, NULL);
2348 }
2349out:
2350 ++(*pos);
2351 return rc;
2352}
2353EXPORT_SYMBOL(neigh_seq_next);
2354
2355void neigh_seq_stop(struct seq_file *seq, void *v)
9a429c49 2356 __releases(tbl->lock)
1da177e4
LT
2357{
2358 struct neigh_seq_state *state = seq->private;
2359 struct neigh_table *tbl = state->tbl;
2360
2361 read_unlock_bh(&tbl->lock);
2362}
2363EXPORT_SYMBOL(neigh_seq_stop);
2364
2365/* statistics via seq_file */
2366
2367static void *neigh_stat_seq_start(struct seq_file *seq, loff_t *pos)
2368{
2369 struct proc_dir_entry *pde = seq->private;
2370 struct neigh_table *tbl = pde->data;
2371 int cpu;
2372
2373 if (*pos == 0)
2374 return SEQ_START_TOKEN;
4ec93edb 2375
1da177e4
LT
2376 for (cpu = *pos-1; cpu < NR_CPUS; ++cpu) {
2377 if (!cpu_possible(cpu))
2378 continue;
2379 *pos = cpu+1;
2380 return per_cpu_ptr(tbl->stats, cpu);
2381 }
2382 return NULL;
2383}
2384
2385static void *neigh_stat_seq_next(struct seq_file *seq, void *v, loff_t *pos)
2386{
2387 struct proc_dir_entry *pde = seq->private;
2388 struct neigh_table *tbl = pde->data;
2389 int cpu;
2390
2391 for (cpu = *pos; cpu < NR_CPUS; ++cpu) {
2392 if (!cpu_possible(cpu))
2393 continue;
2394 *pos = cpu+1;
2395 return per_cpu_ptr(tbl->stats, cpu);
2396 }
2397 return NULL;
2398}
2399
2400static void neigh_stat_seq_stop(struct seq_file *seq, void *v)
2401{
2402
2403}
2404
2405static int neigh_stat_seq_show(struct seq_file *seq, void *v)
2406{
2407 struct proc_dir_entry *pde = seq->private;
2408 struct neigh_table *tbl = pde->data;
2409 struct neigh_statistics *st = v;
2410
2411 if (v == SEQ_START_TOKEN) {
5bec0039 2412 seq_printf(seq, "entries allocs destroys hash_grows lookups hits res_failed rcv_probes_mcast rcv_probes_ucast periodic_gc_runs forced_gc_runs\n");
1da177e4
LT
2413 return 0;
2414 }
2415
2416 seq_printf(seq, "%08x %08lx %08lx %08lx %08lx %08lx %08lx "
2417 "%08lx %08lx %08lx %08lx\n",
2418 atomic_read(&tbl->entries),
2419
2420 st->allocs,
2421 st->destroys,
2422 st->hash_grows,
2423
2424 st->lookups,
2425 st->hits,
2426
2427 st->res_failed,
2428
2429 st->rcv_probes_mcast,
2430 st->rcv_probes_ucast,
2431
2432 st->periodic_gc_runs,
2433 st->forced_gc_runs
2434 );
2435
2436 return 0;
2437}
2438
f690808e 2439static const struct seq_operations neigh_stat_seq_ops = {
1da177e4
LT
2440 .start = neigh_stat_seq_start,
2441 .next = neigh_stat_seq_next,
2442 .stop = neigh_stat_seq_stop,
2443 .show = neigh_stat_seq_show,
2444};
2445
2446static int neigh_stat_seq_open(struct inode *inode, struct file *file)
2447{
2448 int ret = seq_open(file, &neigh_stat_seq_ops);
2449
2450 if (!ret) {
2451 struct seq_file *sf = file->private_data;
2452 sf->private = PDE(inode);
2453 }
2454 return ret;
2455};
2456
9a32144e 2457static const struct file_operations neigh_stat_seq_fops = {
1da177e4
LT
2458 .owner = THIS_MODULE,
2459 .open = neigh_stat_seq_open,
2460 .read = seq_read,
2461 .llseek = seq_lseek,
2462 .release = seq_release,
2463};
2464
2465#endif /* CONFIG_PROC_FS */
2466
339bf98f
TG
2467static inline size_t neigh_nlmsg_size(void)
2468{
2469 return NLMSG_ALIGN(sizeof(struct ndmsg))
2470 + nla_total_size(MAX_ADDR_LEN) /* NDA_DST */
2471 + nla_total_size(MAX_ADDR_LEN) /* NDA_LLADDR */
2472 + nla_total_size(sizeof(struct nda_cacheinfo))
2473 + nla_total_size(4); /* NDA_PROBES */
2474}
2475
b8673311 2476static void __neigh_notify(struct neighbour *n, int type, int flags)
1da177e4 2477{
426b5303 2478 struct net *net = n->dev->nd_net;
8b8aec50 2479 struct sk_buff *skb;
b8673311 2480 int err = -ENOBUFS;
1da177e4 2481
339bf98f 2482 skb = nlmsg_new(neigh_nlmsg_size(), GFP_ATOMIC);
8b8aec50 2483 if (skb == NULL)
b8673311 2484 goto errout;
1da177e4 2485
b8673311 2486 err = neigh_fill_info(skb, n, 0, 0, type, flags);
26932566
PM
2487 if (err < 0) {
2488 /* -EMSGSIZE implies BUG in neigh_nlmsg_size() */
2489 WARN_ON(err == -EMSGSIZE);
2490 kfree_skb(skb);
2491 goto errout;
2492 }
426b5303 2493 err = rtnl_notify(skb, net, 0, RTNLGRP_NEIGH, NULL, GFP_ATOMIC);
b8673311
TG
2494errout:
2495 if (err < 0)
426b5303 2496 rtnl_set_sk_err(net, RTNLGRP_NEIGH, err);
1da177e4
LT
2497}
2498
d961db35 2499#ifdef CONFIG_ARPD
b8673311 2500void neigh_app_ns(struct neighbour *n)
1da177e4 2501{
b8673311
TG
2502 __neigh_notify(n, RTM_GETNEIGH, NLM_F_REQUEST);
2503}
1da177e4
LT
2504#endif /* CONFIG_ARPD */
2505
2506#ifdef CONFIG_SYSCTL
2507
2508static struct neigh_sysctl_table {
2509 struct ctl_table_header *sysctl_header;
c3bac5a7
PE
2510 struct ctl_table neigh_vars[__NET_NEIGH_MAX];
2511 char *dev_name;
ab32ea5d 2512} neigh_sysctl_template __read_mostly = {
1da177e4
LT
2513 .neigh_vars = {
2514 {
2515 .ctl_name = NET_NEIGH_MCAST_SOLICIT,
2516 .procname = "mcast_solicit",
2517 .maxlen = sizeof(int),
2518 .mode = 0644,
2519 .proc_handler = &proc_dointvec,
2520 },
2521 {
2522 .ctl_name = NET_NEIGH_UCAST_SOLICIT,
2523 .procname = "ucast_solicit",
2524 .maxlen = sizeof(int),
2525 .mode = 0644,
2526 .proc_handler = &proc_dointvec,
2527 },
2528 {
2529 .ctl_name = NET_NEIGH_APP_SOLICIT,
2530 .procname = "app_solicit",
2531 .maxlen = sizeof(int),
2532 .mode = 0644,
2533 .proc_handler = &proc_dointvec,
2534 },
2535 {
1da177e4
LT
2536 .procname = "retrans_time",
2537 .maxlen = sizeof(int),
2538 .mode = 0644,
2539 .proc_handler = &proc_dointvec_userhz_jiffies,
2540 },
2541 {
2542 .ctl_name = NET_NEIGH_REACHABLE_TIME,
2543 .procname = "base_reachable_time",
2544 .maxlen = sizeof(int),
2545 .mode = 0644,
2546 .proc_handler = &proc_dointvec_jiffies,
2547 .strategy = &sysctl_jiffies,
2548 },
2549 {
2550 .ctl_name = NET_NEIGH_DELAY_PROBE_TIME,
2551 .procname = "delay_first_probe_time",
2552 .maxlen = sizeof(int),
2553 .mode = 0644,
2554 .proc_handler = &proc_dointvec_jiffies,
2555 .strategy = &sysctl_jiffies,
2556 },
2557 {
2558 .ctl_name = NET_NEIGH_GC_STALE_TIME,
2559 .procname = "gc_stale_time",
2560 .maxlen = sizeof(int),
2561 .mode = 0644,
2562 .proc_handler = &proc_dointvec_jiffies,
2563 .strategy = &sysctl_jiffies,
2564 },
2565 {
2566 .ctl_name = NET_NEIGH_UNRES_QLEN,
2567 .procname = "unres_qlen",
2568 .maxlen = sizeof(int),
2569 .mode = 0644,
2570 .proc_handler = &proc_dointvec,
2571 },
2572 {
2573 .ctl_name = NET_NEIGH_PROXY_QLEN,
2574 .procname = "proxy_qlen",
2575 .maxlen = sizeof(int),
2576 .mode = 0644,
2577 .proc_handler = &proc_dointvec,
2578 },
2579 {
1da177e4
LT
2580 .procname = "anycast_delay",
2581 .maxlen = sizeof(int),
2582 .mode = 0644,
2583 .proc_handler = &proc_dointvec_userhz_jiffies,
2584 },
2585 {
1da177e4
LT
2586 .procname = "proxy_delay",
2587 .maxlen = sizeof(int),
2588 .mode = 0644,
2589 .proc_handler = &proc_dointvec_userhz_jiffies,
2590 },
2591 {
1da177e4
LT
2592 .procname = "locktime",
2593 .maxlen = sizeof(int),
2594 .mode = 0644,
2595 .proc_handler = &proc_dointvec_userhz_jiffies,
2596 },
d12af679
EB
2597 {
2598 .ctl_name = NET_NEIGH_RETRANS_TIME_MS,
2599 .procname = "retrans_time_ms",
2600 .maxlen = sizeof(int),
2601 .mode = 0644,
2602 .proc_handler = &proc_dointvec_ms_jiffies,
2603 .strategy = &sysctl_ms_jiffies,
2604 },
2605 {
2606 .ctl_name = NET_NEIGH_REACHABLE_TIME_MS,
2607 .procname = "base_reachable_time_ms",
2608 .maxlen = sizeof(int),
2609 .mode = 0644,
2610 .proc_handler = &proc_dointvec_ms_jiffies,
2611 .strategy = &sysctl_ms_jiffies,
2612 },
1da177e4
LT
2613 {
2614 .ctl_name = NET_NEIGH_GC_INTERVAL,
2615 .procname = "gc_interval",
2616 .maxlen = sizeof(int),
2617 .mode = 0644,
2618 .proc_handler = &proc_dointvec_jiffies,
2619 .strategy = &sysctl_jiffies,
2620 },
2621 {
2622 .ctl_name = NET_NEIGH_GC_THRESH1,
2623 .procname = "gc_thresh1",
2624 .maxlen = sizeof(int),
2625 .mode = 0644,
2626 .proc_handler = &proc_dointvec,
2627 },
2628 {
2629 .ctl_name = NET_NEIGH_GC_THRESH2,
2630 .procname = "gc_thresh2",
2631 .maxlen = sizeof(int),
2632 .mode = 0644,
2633 .proc_handler = &proc_dointvec,
2634 },
2635 {
2636 .ctl_name = NET_NEIGH_GC_THRESH3,
2637 .procname = "gc_thresh3",
2638 .maxlen = sizeof(int),
2639 .mode = 0644,
2640 .proc_handler = &proc_dointvec,
2641 },
c3bac5a7 2642 {},
1da177e4
LT
2643 },
2644};
2645
2646int neigh_sysctl_register(struct net_device *dev, struct neigh_parms *p,
4ec93edb 2647 int p_id, int pdev_id, char *p_name,
1da177e4
LT
2648 proc_handler *handler, ctl_handler *strategy)
2649{
3c607bbb 2650 struct neigh_sysctl_table *t;
1da177e4 2651 const char *dev_name_source = NULL;
c3bac5a7
PE
2652
2653#define NEIGH_CTL_PATH_ROOT 0
2654#define NEIGH_CTL_PATH_PROTO 1
2655#define NEIGH_CTL_PATH_NEIGH 2
2656#define NEIGH_CTL_PATH_DEV 3
2657
2658 struct ctl_path neigh_path[] = {
2659 { .procname = "net", .ctl_name = CTL_NET, },
2660 { .procname = "proto", .ctl_name = 0, },
2661 { .procname = "neigh", .ctl_name = 0, },
2662 { .procname = "default", .ctl_name = NET_PROTO_CONF_DEFAULT, },
2663 { },
2664 };
1da177e4 2665
3c607bbb 2666 t = kmemdup(&neigh_sysctl_template, sizeof(*t), GFP_KERNEL);
1da177e4 2667 if (!t)
3c607bbb
PE
2668 goto err;
2669
1da177e4
LT
2670 t->neigh_vars[0].data = &p->mcast_probes;
2671 t->neigh_vars[1].data = &p->ucast_probes;
2672 t->neigh_vars[2].data = &p->app_probes;
2673 t->neigh_vars[3].data = &p->retrans_time;
2674 t->neigh_vars[4].data = &p->base_reachable_time;
2675 t->neigh_vars[5].data = &p->delay_probe_time;
2676 t->neigh_vars[6].data = &p->gc_staletime;
2677 t->neigh_vars[7].data = &p->queue_len;
2678 t->neigh_vars[8].data = &p->proxy_qlen;
2679 t->neigh_vars[9].data = &p->anycast_delay;
2680 t->neigh_vars[10].data = &p->proxy_delay;
2681 t->neigh_vars[11].data = &p->locktime;
d12af679
EB
2682 t->neigh_vars[12].data = &p->retrans_time;
2683 t->neigh_vars[13].data = &p->base_reachable_time;
1da177e4
LT
2684
2685 if (dev) {
2686 dev_name_source = dev->name;
c3bac5a7 2687 neigh_path[NEIGH_CTL_PATH_DEV].ctl_name = dev->ifindex;
d12af679
EB
2688 /* Terminate the table early */
2689 memset(&t->neigh_vars[14], 0, sizeof(t->neigh_vars[14]));
1da177e4 2690 } else {
c3bac5a7 2691 dev_name_source = neigh_path[NEIGH_CTL_PATH_DEV].procname;
d12af679
EB
2692 t->neigh_vars[14].data = (int *)(p + 1);
2693 t->neigh_vars[15].data = (int *)(p + 1) + 1;
2694 t->neigh_vars[16].data = (int *)(p + 1) + 2;
2695 t->neigh_vars[17].data = (int *)(p + 1) + 3;
1da177e4
LT
2696 }
2697
1da177e4
LT
2698
2699 if (handler || strategy) {
2700 /* RetransTime */
2701 t->neigh_vars[3].proc_handler = handler;
2702 t->neigh_vars[3].strategy = strategy;
2703 t->neigh_vars[3].extra1 = dev;
d12af679
EB
2704 if (!strategy)
2705 t->neigh_vars[3].ctl_name = CTL_UNNUMBERED;
1da177e4
LT
2706 /* ReachableTime */
2707 t->neigh_vars[4].proc_handler = handler;
2708 t->neigh_vars[4].strategy = strategy;
2709 t->neigh_vars[4].extra1 = dev;
d12af679
EB
2710 if (!strategy)
2711 t->neigh_vars[4].ctl_name = CTL_UNNUMBERED;
1da177e4 2712 /* RetransTime (in milliseconds)*/
d12af679
EB
2713 t->neigh_vars[12].proc_handler = handler;
2714 t->neigh_vars[12].strategy = strategy;
2715 t->neigh_vars[12].extra1 = dev;
2716 if (!strategy)
2717 t->neigh_vars[12].ctl_name = CTL_UNNUMBERED;
1da177e4 2718 /* ReachableTime (in milliseconds) */
d12af679
EB
2719 t->neigh_vars[13].proc_handler = handler;
2720 t->neigh_vars[13].strategy = strategy;
2721 t->neigh_vars[13].extra1 = dev;
2722 if (!strategy)
2723 t->neigh_vars[13].ctl_name = CTL_UNNUMBERED;
1da177e4
LT
2724 }
2725
c3bac5a7
PE
2726 t->dev_name = kstrdup(dev_name_source, GFP_KERNEL);
2727 if (!t->dev_name)
1da177e4 2728 goto free;
1da177e4 2729
c3bac5a7
PE
2730 neigh_path[NEIGH_CTL_PATH_DEV].procname = t->dev_name;
2731 neigh_path[NEIGH_CTL_PATH_NEIGH].ctl_name = pdev_id;
2732 neigh_path[NEIGH_CTL_PATH_PROTO].procname = p_name;
2733 neigh_path[NEIGH_CTL_PATH_PROTO].ctl_name = p_id;
1da177e4 2734
c3bac5a7 2735 t->sysctl_header = register_sysctl_paths(neigh_path, t->neigh_vars);
3c607bbb 2736 if (!t->sysctl_header)
1da177e4 2737 goto free_procname;
3c607bbb 2738
1da177e4
LT
2739 p->sysctl_table = t;
2740 return 0;
2741
3c607bbb 2742free_procname:
c3bac5a7 2743 kfree(t->dev_name);
3c607bbb 2744free:
1da177e4 2745 kfree(t);
3c607bbb
PE
2746err:
2747 return -ENOBUFS;
1da177e4
LT
2748}
2749
2750void neigh_sysctl_unregister(struct neigh_parms *p)
2751{
2752 if (p->sysctl_table) {
2753 struct neigh_sysctl_table *t = p->sysctl_table;
2754 p->sysctl_table = NULL;
2755 unregister_sysctl_table(t->sysctl_header);
c3bac5a7 2756 kfree(t->dev_name);
1da177e4
LT
2757 kfree(t);
2758 }
2759}
2760
2761#endif /* CONFIG_SYSCTL */
2762
c8822a4e
TG
2763static int __init neigh_init(void)
2764{
2765 rtnl_register(PF_UNSPEC, RTM_NEWNEIGH, neigh_add, NULL);
2766 rtnl_register(PF_UNSPEC, RTM_DELNEIGH, neigh_delete, NULL);
2767 rtnl_register(PF_UNSPEC, RTM_GETNEIGH, NULL, neigh_dump_info);
2768
2769 rtnl_register(PF_UNSPEC, RTM_GETNEIGHTBL, NULL, neightbl_dump_info);
2770 rtnl_register(PF_UNSPEC, RTM_SETNEIGHTBL, neightbl_set, NULL);
2771
2772 return 0;
2773}
2774
2775subsys_initcall(neigh_init);
2776
1da177e4 2777EXPORT_SYMBOL(__neigh_event_send);
1da177e4
LT
2778EXPORT_SYMBOL(neigh_changeaddr);
2779EXPORT_SYMBOL(neigh_compat_output);
2780EXPORT_SYMBOL(neigh_connected_output);
2781EXPORT_SYMBOL(neigh_create);
1da177e4 2782EXPORT_SYMBOL(neigh_destroy);
1da177e4
LT
2783EXPORT_SYMBOL(neigh_event_ns);
2784EXPORT_SYMBOL(neigh_ifdown);
2785EXPORT_SYMBOL(neigh_lookup);
2786EXPORT_SYMBOL(neigh_lookup_nodev);
2787EXPORT_SYMBOL(neigh_parms_alloc);
2788EXPORT_SYMBOL(neigh_parms_release);
2789EXPORT_SYMBOL(neigh_rand_reach_time);
2790EXPORT_SYMBOL(neigh_resolve_output);
2791EXPORT_SYMBOL(neigh_table_clear);
2792EXPORT_SYMBOL(neigh_table_init);
bd89efc5 2793EXPORT_SYMBOL(neigh_table_init_no_netlink);
1da177e4 2794EXPORT_SYMBOL(neigh_update);
1da177e4
LT
2795EXPORT_SYMBOL(pneigh_enqueue);
2796EXPORT_SYMBOL(pneigh_lookup);
2797
2798#ifdef CONFIG_ARPD
2799EXPORT_SYMBOL(neigh_app_ns);
2800#endif
2801#ifdef CONFIG_SYSCTL
2802EXPORT_SYMBOL(neigh_sysctl_register);
2803EXPORT_SYMBOL(neigh_sysctl_unregister);
2804#endif