]> git.proxmox.com Git - mirror_frr.git/blob - zebra/zebra_rib.c
Merge volatile/cumulus_ospf6d
[mirror_frr.git] / zebra / zebra_rib.c
1 /* Routing Information Base.
2 * Copyright (C) 1997, 98, 99, 2001 Kunihiro Ishiguro
3 *
4 * This file is part of GNU Zebra.
5 *
6 * GNU Zebra is free software; you can redistribute it and/or modify it
7 * under the terms of the GNU General Public License as published by the
8 * Free Software Foundation; either version 2, or (at your option) any
9 * later version.
10 *
11 * GNU Zebra is distributed in the hope that it will be useful, but
12 * WITHOUT ANY WARRANTY; without even the implied warranty of
13 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
14 * General Public License for more details.
15 *
16 * You should have received a copy of the GNU General Public License
17 * along with GNU Zebra; see the file COPYING. If not, write to the Free
18 * Software Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA
19 * 02111-1307, USA.
20 */
21
22 #include <zebra.h>
23
24 #include "prefix.h"
25 #include "table.h"
26 #include "memory.h"
27 #include "str.h"
28 #include "command.h"
29 #include "if.h"
30 #include "log.h"
31 #include "sockunion.h"
32 #include "linklist.h"
33 #include "thread.h"
34 #include "workqueue.h"
35 #include "prefix.h"
36 #include "routemap.h"
37
38 #include "zebra/rib.h"
39 #include "zebra/rt.h"
40 #include "zebra/zserv.h"
41 #include "zebra/redistribute.h"
42 #include "zebra/debug.h"
43 #include "zebra/zebra_fpm.h"
44
45 /* Default rtm_table for all clients */
46 extern struct zebra_t zebrad;
47
48 /* Hold time for RIB process, should be very minimal.
49 * it is useful to able to set it otherwise for testing, hence exported
50 * as global here for test-rig code.
51 */
52 int rib_process_hold_time = 10;
53
54 /* Each route type's string and default distance value. */
55 static const struct
56 {
57 int key;
58 int distance;
59 } route_info[ZEBRA_ROUTE_MAX] =
60 {
61 [ZEBRA_ROUTE_SYSTEM] = {ZEBRA_ROUTE_SYSTEM, 0},
62 [ZEBRA_ROUTE_KERNEL] = {ZEBRA_ROUTE_KERNEL, 0},
63 [ZEBRA_ROUTE_CONNECT] = {ZEBRA_ROUTE_CONNECT, 0},
64 [ZEBRA_ROUTE_STATIC] = {ZEBRA_ROUTE_STATIC, 1},
65 [ZEBRA_ROUTE_RIP] = {ZEBRA_ROUTE_RIP, 120},
66 [ZEBRA_ROUTE_RIPNG] = {ZEBRA_ROUTE_RIPNG, 120},
67 [ZEBRA_ROUTE_OSPF] = {ZEBRA_ROUTE_OSPF, 110},
68 [ZEBRA_ROUTE_OSPF6] = {ZEBRA_ROUTE_OSPF6, 110},
69 [ZEBRA_ROUTE_ISIS] = {ZEBRA_ROUTE_ISIS, 115},
70 [ZEBRA_ROUTE_BGP] = {ZEBRA_ROUTE_BGP, 20 /* IBGP is 200. */},
71 [ZEBRA_ROUTE_BABEL] = {ZEBRA_ROUTE_BABEL, 95},
72 /* no entry/default: 150 */
73 };
74 \f
75 /* Vector for routing table. */
76 static vector vrf_vector;
77
78 /*
79 * vrf_table_create
80 */
81 static void
82 vrf_table_create (struct vrf *vrf, afi_t afi, safi_t safi)
83 {
84 rib_table_info_t *info;
85 struct route_table *table;
86
87 assert (!vrf->table[afi][safi]);
88
89 table = route_table_init ();
90 vrf->table[afi][safi] = table;
91
92 info = XCALLOC (MTYPE_RIB_TABLE_INFO, sizeof (*info));
93 info->vrf = vrf;
94 info->afi = afi;
95 info->safi = safi;
96 table->info = info;
97 }
98
99 /* Allocate new VRF. */
100 static struct vrf *
101 vrf_alloc (const char *name)
102 {
103 struct vrf *vrf;
104
105 vrf = XCALLOC (MTYPE_VRF, sizeof (struct vrf));
106
107 /* Put name. */
108 if (name)
109 vrf->name = XSTRDUP (MTYPE_VRF_NAME, name);
110
111 /* Allocate routing table and static table. */
112 vrf_table_create (vrf, AFI_IP, SAFI_UNICAST);
113 vrf_table_create (vrf, AFI_IP6, SAFI_UNICAST);
114 vrf->stable[AFI_IP][SAFI_UNICAST] = route_table_init ();
115 vrf->stable[AFI_IP6][SAFI_UNICAST] = route_table_init ();
116 vrf_table_create (vrf, AFI_IP, SAFI_MULTICAST);
117 vrf_table_create (vrf, AFI_IP6, SAFI_MULTICAST);
118 vrf->stable[AFI_IP][SAFI_MULTICAST] = route_table_init ();
119 vrf->stable[AFI_IP6][SAFI_MULTICAST] = route_table_init ();
120
121
122 return vrf;
123 }
124
125 /* Lookup VRF by identifier. */
126 struct vrf *
127 vrf_lookup (u_int32_t id)
128 {
129 return vector_lookup (vrf_vector, id);
130 }
131
132 /* Initialize VRF. */
133 static void
134 vrf_init (void)
135 {
136 struct vrf *default_table;
137
138 /* Allocate VRF vector. */
139 vrf_vector = vector_init (1);
140
141 /* Allocate default main table. */
142 default_table = vrf_alloc ("Default-IP-Routing-Table");
143
144 /* Default table index must be 0. */
145 vector_set_index (vrf_vector, 0, default_table);
146 }
147
148 /* Lookup route table. */
149 struct route_table *
150 vrf_table (afi_t afi, safi_t safi, u_int32_t id)
151 {
152 struct vrf *vrf;
153
154 vrf = vrf_lookup (id);
155 if (! vrf)
156 return NULL;
157
158 if( afi >= AFI_MAX || safi >= SAFI_MAX )
159 return NULL;
160
161 return vrf->table[afi][safi];
162 }
163
164 /* Lookup static route table. */
165 struct route_table *
166 vrf_static_table (afi_t afi, safi_t safi, u_int32_t id)
167 {
168 struct vrf *vrf;
169
170 vrf = vrf_lookup (id);
171 if (! vrf)
172 return NULL;
173
174 if( afi >= AFI_MAX || safi >= SAFI_MAX )
175 return NULL;
176
177 return vrf->stable[afi][safi];
178 }
179 \f
180 /*
181 * nexthop_type_to_str
182 */
183 const char *
184 nexthop_type_to_str (enum nexthop_types_t nh_type)
185 {
186 static const char *desc[] = {
187 "none",
188 "Directly connected",
189 "Interface route",
190 "IPv4 nexthop",
191 "IPv4 nexthop with ifindex",
192 "IPv4 nexthop with ifname",
193 "IPv6 nexthop",
194 "IPv6 nexthop with ifindex",
195 "IPv6 nexthop with ifname",
196 "Null0 nexthop",
197 };
198
199 if (nh_type >= ZEBRA_NUM_OF (desc))
200 return "<Invalid nh type>";
201
202 return desc[nh_type];
203 }
204
205 /* Add nexthop to the end of a nexthop list. */
206 static void
207 _nexthop_add (struct nexthop **target, struct nexthop *nexthop)
208 {
209 struct nexthop *last;
210
211 for (last = *target; last && last->next; last = last->next)
212 ;
213 if (last)
214 last->next = nexthop;
215 else
216 *target = nexthop;
217 nexthop->prev = last;
218 }
219
220 /* Add nexthop to the end of a rib node's nexthop list */
221 static void
222 nexthop_add (struct rib *rib, struct nexthop *nexthop)
223 {
224 _nexthop_add(&rib->nexthop, nexthop);
225 rib->nexthop_num++;
226 }
227
228 /* Delete specified nexthop from the list. */
229 static void
230 nexthop_delete (struct rib *rib, struct nexthop *nexthop)
231 {
232 if (nexthop->next)
233 nexthop->next->prev = nexthop->prev;
234 if (nexthop->prev)
235 nexthop->prev->next = nexthop->next;
236 else
237 rib->nexthop = nexthop->next;
238 rib->nexthop_num--;
239 }
240
241 static void nexthops_free(struct nexthop *nexthop);
242
243 /* Free nexthop. */
244 static void
245 nexthop_free (struct nexthop *nexthop)
246 {
247 if (nexthop->ifname)
248 XFREE (0, nexthop->ifname);
249 if (nexthop->resolved)
250 nexthops_free(nexthop->resolved);
251 XFREE (MTYPE_NEXTHOP, nexthop);
252 }
253
254 /* Frees a list of nexthops */
255 static void
256 nexthops_free (struct nexthop *nexthop)
257 {
258 struct nexthop *nh, *next;
259
260 for (nh = nexthop; nh; nh = next)
261 {
262 next = nh->next;
263 nexthop_free (nh);
264 }
265 }
266
267 struct nexthop *
268 nexthop_ifindex_add (struct rib *rib, unsigned int ifindex)
269 {
270 struct nexthop *nexthop;
271
272 nexthop = XCALLOC (MTYPE_NEXTHOP, sizeof (struct nexthop));
273 nexthop->type = NEXTHOP_TYPE_IFINDEX;
274 nexthop->ifindex = ifindex;
275
276 nexthop_add (rib, nexthop);
277
278 return nexthop;
279 }
280
281 struct nexthop *
282 nexthop_ifname_add (struct rib *rib, char *ifname)
283 {
284 struct nexthop *nexthop;
285
286 nexthop = XCALLOC (MTYPE_NEXTHOP, sizeof (struct nexthop));
287 nexthop->type = NEXTHOP_TYPE_IFNAME;
288 nexthop->ifname = XSTRDUP (0, ifname);
289
290 nexthop_add (rib, nexthop);
291
292 return nexthop;
293 }
294
295 struct nexthop *
296 nexthop_ipv4_add (struct rib *rib, struct in_addr *ipv4, struct in_addr *src)
297 {
298 struct nexthop *nexthop;
299
300 nexthop = XCALLOC (MTYPE_NEXTHOP, sizeof (struct nexthop));
301 nexthop->type = NEXTHOP_TYPE_IPV4;
302 nexthop->gate.ipv4 = *ipv4;
303 if (src)
304 nexthop->src.ipv4 = *src;
305
306 nexthop_add (rib, nexthop);
307
308 return nexthop;
309 }
310
311 struct nexthop *
312 nexthop_ipv4_ifindex_add (struct rib *rib, struct in_addr *ipv4,
313 struct in_addr *src, unsigned int ifindex)
314 {
315 struct nexthop *nexthop;
316
317 nexthop = XCALLOC (MTYPE_NEXTHOP, sizeof (struct nexthop));
318 nexthop->type = NEXTHOP_TYPE_IPV4_IFINDEX;
319 nexthop->gate.ipv4 = *ipv4;
320 if (src)
321 nexthop->src.ipv4 = *src;
322 nexthop->ifindex = ifindex;
323
324 nexthop_add (rib, nexthop);
325
326 return nexthop;
327 }
328
329 #ifdef HAVE_IPV6
330 struct nexthop *
331 nexthop_ipv6_add (struct rib *rib, struct in6_addr *ipv6)
332 {
333 struct nexthop *nexthop;
334
335 nexthop = XCALLOC (MTYPE_NEXTHOP, sizeof (struct nexthop));
336 nexthop->type = NEXTHOP_TYPE_IPV6;
337 nexthop->gate.ipv6 = *ipv6;
338
339 nexthop_add (rib, nexthop);
340
341 return nexthop;
342 }
343
344 static struct nexthop *
345 nexthop_ipv6_ifname_add (struct rib *rib, struct in6_addr *ipv6,
346 char *ifname)
347 {
348 struct nexthop *nexthop;
349
350 nexthop = XCALLOC (MTYPE_NEXTHOP, sizeof (struct nexthop));
351 nexthop->type = NEXTHOP_TYPE_IPV6_IFNAME;
352 nexthop->gate.ipv6 = *ipv6;
353 nexthop->ifname = XSTRDUP (0, ifname);
354
355 nexthop_add (rib, nexthop);
356
357 return nexthop;
358 }
359
360 static struct nexthop *
361 nexthop_ipv6_ifindex_add (struct rib *rib, struct in6_addr *ipv6,
362 unsigned int ifindex)
363 {
364 struct nexthop *nexthop;
365
366 nexthop = XCALLOC (MTYPE_NEXTHOP, sizeof (struct nexthop));
367 nexthop->type = NEXTHOP_TYPE_IPV6_IFINDEX;
368 nexthop->gate.ipv6 = *ipv6;
369 nexthop->ifindex = ifindex;
370
371 nexthop_add (rib, nexthop);
372
373 return nexthop;
374 }
375 #endif /* HAVE_IPV6 */
376
377 struct nexthop *
378 nexthop_blackhole_add (struct rib *rib)
379 {
380 struct nexthop *nexthop;
381
382 nexthop = XCALLOC (MTYPE_NEXTHOP, sizeof (struct nexthop));
383 nexthop->type = NEXTHOP_TYPE_BLACKHOLE;
384 SET_FLAG (rib->flags, ZEBRA_FLAG_BLACKHOLE);
385
386 nexthop_add (rib, nexthop);
387
388 return nexthop;
389 }
390
391 /* This method checks whether a recursive nexthop has at
392 * least one resolved nexthop in the fib.
393 */
394 int
395 nexthop_has_fib_child(struct nexthop *nexthop)
396 {
397 struct nexthop *nh;
398
399 if (! CHECK_FLAG (nexthop->flags, NEXTHOP_FLAG_RECURSIVE))
400 return 0;
401
402 for (nh = nexthop->resolved; nh; nh = nh->next)
403 if (CHECK_FLAG (nh->flags, NEXTHOP_FLAG_FIB))
404 return 1;
405
406 return 0;
407 }
408
409 /* If force flag is not set, do not modify falgs at all for uninstall
410 the route from FIB. */
411 static int
412 nexthop_active_ipv4 (struct rib *rib, struct nexthop *nexthop, int set,
413 struct route_node *top)
414 {
415 struct prefix_ipv4 p;
416 struct route_table *table;
417 struct route_node *rn;
418 struct rib *match;
419 int resolved;
420 struct nexthop *newhop;
421 struct nexthop *resolved_hop;
422
423 if (nexthop->type == NEXTHOP_TYPE_IPV4)
424 nexthop->ifindex = 0;
425
426 if (set)
427 {
428 UNSET_FLAG (nexthop->flags, NEXTHOP_FLAG_RECURSIVE);
429 nexthops_free(nexthop->resolved);
430 nexthop->resolved = NULL;
431 }
432
433 /* Make lookup prefix. */
434 memset (&p, 0, sizeof (struct prefix_ipv4));
435 p.family = AF_INET;
436 p.prefixlen = IPV4_MAX_PREFIXLEN;
437 p.prefix = nexthop->gate.ipv4;
438
439 /* Lookup table. */
440 table = vrf_table (AFI_IP, SAFI_UNICAST, 0);
441 if (! table)
442 return 0;
443
444 rn = route_node_match (table, (struct prefix *) &p);
445 while (rn)
446 {
447 route_unlock_node (rn);
448
449 /* If lookup self prefix return immediately. */
450 if (rn == top)
451 return 0;
452
453 /* Pick up selected route. */
454 RNODE_FOREACH_RIB (rn, match)
455 {
456 if (CHECK_FLAG (match->status, RIB_ENTRY_REMOVED))
457 continue;
458 if (CHECK_FLAG (match->flags, ZEBRA_FLAG_SELECTED))
459 break;
460 }
461
462 /* If there is no selected route or matched route is EGP, go up
463 tree. */
464 if (! match
465 || match->type == ZEBRA_ROUTE_BGP)
466 {
467 do {
468 rn = rn->parent;
469 } while (rn && rn->info == NULL);
470 if (rn)
471 route_lock_node (rn);
472 }
473 else
474 {
475 /* If the longest prefix match for the nexthop yields
476 * a blackhole, mark it as inactive. */
477 if (CHECK_FLAG (match->flags, ZEBRA_FLAG_BLACKHOLE)
478 || CHECK_FLAG (match->flags, ZEBRA_FLAG_REJECT))
479 return 0;
480
481 if (match->type == ZEBRA_ROUTE_CONNECT)
482 {
483 /* Directly point connected route. */
484 newhop = match->nexthop;
485 if (newhop && nexthop->type == NEXTHOP_TYPE_IPV4)
486 nexthop->ifindex = newhop->ifindex;
487
488 return 1;
489 }
490 else if (CHECK_FLAG (rib->flags, ZEBRA_FLAG_INTERNAL))
491 {
492 resolved = 0;
493 for (newhop = match->nexthop; newhop; newhop = newhop->next)
494 if (CHECK_FLAG (newhop->flags, NEXTHOP_FLAG_FIB)
495 && ! CHECK_FLAG (newhop->flags, NEXTHOP_FLAG_RECURSIVE))
496 {
497 if (set)
498 {
499 SET_FLAG (nexthop->flags, NEXTHOP_FLAG_RECURSIVE);
500
501 resolved_hop = XCALLOC(MTYPE_NEXTHOP, sizeof (struct nexthop));
502 SET_FLAG (resolved_hop->flags, NEXTHOP_FLAG_ACTIVE);
503 /* If the resolving route specifies a gateway, use it */
504 if (newhop->type == NEXTHOP_TYPE_IPV4
505 || newhop->type == NEXTHOP_TYPE_IPV4_IFINDEX
506 || newhop->type == NEXTHOP_TYPE_IPV4_IFNAME)
507 {
508 resolved_hop->type = newhop->type;
509 resolved_hop->gate.ipv4 = newhop->gate.ipv4;
510
511 if (newhop->ifindex)
512 {
513 resolved_hop->type = NEXTHOP_TYPE_IPV4_IFINDEX;
514 resolved_hop->ifindex = newhop->ifindex;
515 }
516 }
517
518 /* If the resolving route is an interface route,
519 * it means the gateway we are looking up is connected
520 * to that interface. (The actual network is _not_ onlink).
521 * Therefore, the resolved route should have the original
522 * gateway as nexthop as it is directly connected.
523 *
524 * On Linux, we have to set the onlink netlink flag because
525 * otherwise, the kernel won't accept the route. */
526 if (newhop->type == NEXTHOP_TYPE_IFINDEX
527 || newhop->type == NEXTHOP_TYPE_IFNAME)
528 {
529 resolved_hop->flags |= NEXTHOP_FLAG_ONLINK;
530 resolved_hop->type = NEXTHOP_TYPE_IPV4_IFINDEX;
531 resolved_hop->gate.ipv4 = nexthop->gate.ipv4;
532 resolved_hop->ifindex = newhop->ifindex;
533 }
534
535 _nexthop_add(&nexthop->resolved, resolved_hop);
536 }
537 resolved = 1;
538 }
539 return resolved;
540 }
541 else
542 {
543 return 0;
544 }
545 }
546 }
547 return 0;
548 }
549
550 #ifdef HAVE_IPV6
551 /* If force flag is not set, do not modify falgs at all for uninstall
552 the route from FIB. */
553 static int
554 nexthop_active_ipv6 (struct rib *rib, struct nexthop *nexthop, int set,
555 struct route_node *top)
556 {
557 struct prefix_ipv6 p;
558 struct route_table *table;
559 struct route_node *rn;
560 struct rib *match;
561 int resolved;
562 struct nexthop *newhop;
563 struct nexthop *resolved_hop;
564
565 if (nexthop->type == NEXTHOP_TYPE_IPV6)
566 nexthop->ifindex = 0;
567
568 if (set)
569 {
570 UNSET_FLAG (nexthop->flags, NEXTHOP_FLAG_RECURSIVE);
571 nexthops_free(nexthop->resolved);
572 nexthop->resolved = NULL;
573 }
574
575 /* Make lookup prefix. */
576 memset (&p, 0, sizeof (struct prefix_ipv6));
577 p.family = AF_INET6;
578 p.prefixlen = IPV6_MAX_PREFIXLEN;
579 p.prefix = nexthop->gate.ipv6;
580
581 /* Lookup table. */
582 table = vrf_table (AFI_IP6, SAFI_UNICAST, 0);
583 if (! table)
584 return 0;
585
586 rn = route_node_match (table, (struct prefix *) &p);
587 while (rn)
588 {
589 route_unlock_node (rn);
590
591 /* If lookup self prefix return immediately. */
592 if (rn == top)
593 return 0;
594
595 /* Pick up selected route. */
596 RNODE_FOREACH_RIB (rn, match)
597 {
598 if (CHECK_FLAG (match->status, RIB_ENTRY_REMOVED))
599 continue;
600 if (CHECK_FLAG (match->flags, ZEBRA_FLAG_SELECTED))
601 break;
602 }
603
604 /* If there is no selected route or matched route is EGP, go up
605 tree. */
606 if (! match
607 || match->type == ZEBRA_ROUTE_BGP)
608 {
609 do {
610 rn = rn->parent;
611 } while (rn && rn->info == NULL);
612 if (rn)
613 route_lock_node (rn);
614 }
615 else
616 {
617 /* If the longest prefix match for the nexthop yields
618 * a blackhole, mark it as inactive. */
619 if (CHECK_FLAG (match->flags, ZEBRA_FLAG_BLACKHOLE)
620 || CHECK_FLAG (match->flags, ZEBRA_FLAG_REJECT))
621 return 0;
622
623 if (match->type == ZEBRA_ROUTE_CONNECT)
624 {
625 /* Directly point connected route. */
626 newhop = match->nexthop;
627
628 if (newhop && nexthop->type == NEXTHOP_TYPE_IPV6)
629 nexthop->ifindex = newhop->ifindex;
630
631 return 1;
632 }
633 else if (CHECK_FLAG (rib->flags, ZEBRA_FLAG_INTERNAL))
634 {
635 resolved = 0;
636 for (newhop = match->nexthop; newhop; newhop = newhop->next)
637 if (CHECK_FLAG (newhop->flags, NEXTHOP_FLAG_FIB)
638 && ! CHECK_FLAG (newhop->flags, NEXTHOP_FLAG_RECURSIVE))
639 {
640 if (set)
641 {
642 SET_FLAG (nexthop->flags, NEXTHOP_FLAG_RECURSIVE);
643
644 resolved_hop = XCALLOC(MTYPE_NEXTHOP, sizeof (struct nexthop));
645 SET_FLAG (resolved_hop->flags, NEXTHOP_FLAG_ACTIVE);
646 /* See nexthop_active_ipv4 for a description how the
647 * resolved nexthop is constructed. */
648 if (newhop->type == NEXTHOP_TYPE_IPV6
649 || newhop->type == NEXTHOP_TYPE_IPV6_IFINDEX
650 || newhop->type == NEXTHOP_TYPE_IPV6_IFNAME)
651 {
652 resolved_hop->type = newhop->type;
653 resolved_hop->gate.ipv6 = newhop->gate.ipv6;
654
655 if (newhop->ifindex)
656 {
657 resolved_hop->type = NEXTHOP_TYPE_IPV6_IFINDEX;
658 resolved_hop->ifindex = newhop->ifindex;
659 }
660 }
661
662 if (newhop->type == NEXTHOP_TYPE_IFINDEX
663 || newhop->type == NEXTHOP_TYPE_IFNAME)
664 {
665 resolved_hop->flags |= NEXTHOP_FLAG_ONLINK;
666 resolved_hop->type = NEXTHOP_TYPE_IPV6_IFINDEX;
667 resolved_hop->gate.ipv6 = nexthop->gate.ipv6;
668 resolved_hop->ifindex = newhop->ifindex;
669 }
670
671 _nexthop_add(&nexthop->resolved, resolved_hop);
672 }
673 resolved = 1;
674 }
675 return resolved;
676 }
677 else
678 {
679 return 0;
680 }
681 }
682 }
683 return 0;
684 }
685 #endif /* HAVE_IPV6 */
686
687 struct rib *
688 rib_match_ipv4 (struct in_addr addr)
689 {
690 struct prefix_ipv4 p;
691 struct route_table *table;
692 struct route_node *rn;
693 struct rib *match;
694 struct nexthop *newhop, *tnewhop;
695 int recursing;
696
697 /* Lookup table. */
698 table = vrf_table (AFI_IP, SAFI_UNICAST, 0);
699 if (! table)
700 return 0;
701
702 memset (&p, 0, sizeof (struct prefix_ipv4));
703 p.family = AF_INET;
704 p.prefixlen = IPV4_MAX_PREFIXLEN;
705 p.prefix = addr;
706
707 rn = route_node_match (table, (struct prefix *) &p);
708
709 while (rn)
710 {
711 route_unlock_node (rn);
712
713 /* Pick up selected route. */
714 RNODE_FOREACH_RIB (rn, match)
715 {
716 if (CHECK_FLAG (match->status, RIB_ENTRY_REMOVED))
717 continue;
718 if (CHECK_FLAG (match->flags, ZEBRA_FLAG_SELECTED))
719 break;
720 }
721
722 /* If there is no selected route or matched route is EGP, go up
723 tree. */
724 if (! match
725 || match->type == ZEBRA_ROUTE_BGP)
726 {
727 do {
728 rn = rn->parent;
729 } while (rn && rn->info == NULL);
730 if (rn)
731 route_lock_node (rn);
732 }
733 else
734 {
735 if (match->type == ZEBRA_ROUTE_CONNECT)
736 /* Directly point connected route. */
737 return match;
738 else
739 {
740 for (ALL_NEXTHOPS_RO(match->nexthop, newhop, tnewhop, recursing))
741 if (CHECK_FLAG (newhop->flags, NEXTHOP_FLAG_FIB))
742 return match;
743 return NULL;
744 }
745 }
746 }
747 return NULL;
748 }
749
750 struct rib *
751 rib_lookup_ipv4 (struct prefix_ipv4 *p)
752 {
753 struct route_table *table;
754 struct route_node *rn;
755 struct rib *match;
756 struct nexthop *nexthop, *tnexthop;
757 int recursing;
758
759 /* Lookup table. */
760 table = vrf_table (AFI_IP, SAFI_UNICAST, 0);
761 if (! table)
762 return 0;
763
764 rn = route_node_lookup (table, (struct prefix *) p);
765
766 /* No route for this prefix. */
767 if (! rn)
768 return NULL;
769
770 /* Unlock node. */
771 route_unlock_node (rn);
772
773 RNODE_FOREACH_RIB (rn, match)
774 {
775 if (CHECK_FLAG (match->status, RIB_ENTRY_REMOVED))
776 continue;
777 if (CHECK_FLAG (match->flags, ZEBRA_FLAG_SELECTED))
778 break;
779 }
780
781 if (! match || match->type == ZEBRA_ROUTE_BGP)
782 return NULL;
783
784 if (match->type == ZEBRA_ROUTE_CONNECT)
785 return match;
786
787 for (ALL_NEXTHOPS_RO(match->nexthop, nexthop, tnexthop, recursing))
788 if (CHECK_FLAG (nexthop->flags, NEXTHOP_FLAG_FIB))
789 return match;
790
791 return NULL;
792 }
793
794 /*
795 * This clone function, unlike its original rib_lookup_ipv4(), checks
796 * if specified IPv4 route record (prefix/mask -> gate) exists in
797 * the whole RIB and has ZEBRA_FLAG_SELECTED set.
798 *
799 * Return values:
800 * -1: error
801 * 0: exact match found
802 * 1: a match was found with a different gate
803 * 2: connected route found
804 * 3: no matches found
805 */
806 int
807 rib_lookup_ipv4_route (struct prefix_ipv4 *p, union sockunion * qgate)
808 {
809 struct route_table *table;
810 struct route_node *rn;
811 struct rib *match;
812 struct nexthop *nexthop, *tnexthop;
813 int recursing;
814 int nexthops_active;
815
816 /* Lookup table. */
817 table = vrf_table (AFI_IP, SAFI_UNICAST, 0);
818 if (! table)
819 return ZEBRA_RIB_LOOKUP_ERROR;
820
821 /* Scan the RIB table for exactly matching RIB entry. */
822 rn = route_node_lookup (table, (struct prefix *) p);
823
824 /* No route for this prefix. */
825 if (! rn)
826 return ZEBRA_RIB_NOTFOUND;
827
828 /* Unlock node. */
829 route_unlock_node (rn);
830
831 /* Find out if a "selected" RR for the discovered RIB entry exists ever. */
832 RNODE_FOREACH_RIB (rn, match)
833 {
834 if (CHECK_FLAG (match->status, RIB_ENTRY_REMOVED))
835 continue;
836 if (CHECK_FLAG (match->flags, ZEBRA_FLAG_SELECTED))
837 break;
838 }
839
840 /* None such found :( */
841 if (!match)
842 return ZEBRA_RIB_NOTFOUND;
843
844 if (match->type == ZEBRA_ROUTE_CONNECT)
845 return ZEBRA_RIB_FOUND_CONNECTED;
846
847 /* Ok, we have a cood candidate, let's check it's nexthop list... */
848 nexthops_active = 0;
849 for (ALL_NEXTHOPS_RO(match->nexthop, nexthop, tnexthop, recursing))
850 if (CHECK_FLAG (nexthop->flags, NEXTHOP_FLAG_FIB))
851 {
852 nexthops_active = 1;
853 if (nexthop->gate.ipv4.s_addr == sockunion2ip (qgate))
854 return ZEBRA_RIB_FOUND_EXACT;
855 if (IS_ZEBRA_DEBUG_RIB)
856 {
857 char gate_buf[INET_ADDRSTRLEN], qgate_buf[INET_ADDRSTRLEN];
858 inet_ntop (AF_INET, &nexthop->gate.ipv4.s_addr, gate_buf, INET_ADDRSTRLEN);
859 inet_ntop (AF_INET, &sockunion2ip(qgate), qgate_buf, INET_ADDRSTRLEN);
860 zlog_debug ("%s: qgate == %s, %s == %s", __func__,
861 qgate_buf, recursing ? "rgate" : "gate", gate_buf);
862 }
863 }
864
865 if (nexthops_active)
866 return ZEBRA_RIB_FOUND_NOGATE;
867
868 return ZEBRA_RIB_NOTFOUND;
869 }
870
871 #ifdef HAVE_IPV6
872 struct rib *
873 rib_match_ipv6 (struct in6_addr *addr)
874 {
875 struct prefix_ipv6 p;
876 struct route_table *table;
877 struct route_node *rn;
878 struct rib *match;
879 struct nexthop *newhop, *tnewhop;
880 int recursing;
881
882 /* Lookup table. */
883 table = vrf_table (AFI_IP6, SAFI_UNICAST, 0);
884 if (! table)
885 return 0;
886
887 memset (&p, 0, sizeof (struct prefix_ipv6));
888 p.family = AF_INET6;
889 p.prefixlen = IPV6_MAX_PREFIXLEN;
890 IPV6_ADDR_COPY (&p.prefix, addr);
891
892 rn = route_node_match (table, (struct prefix *) &p);
893
894 while (rn)
895 {
896 route_unlock_node (rn);
897
898 /* Pick up selected route. */
899 RNODE_FOREACH_RIB (rn, match)
900 {
901 if (CHECK_FLAG (match->status, RIB_ENTRY_REMOVED))
902 continue;
903 if (CHECK_FLAG (match->flags, ZEBRA_FLAG_SELECTED))
904 break;
905 }
906
907 /* If there is no selected route or matched route is EGP, go up
908 tree. */
909 if (! match
910 || match->type == ZEBRA_ROUTE_BGP)
911 {
912 do {
913 rn = rn->parent;
914 } while (rn && rn->info == NULL);
915 if (rn)
916 route_lock_node (rn);
917 }
918 else
919 {
920 if (match->type == ZEBRA_ROUTE_CONNECT)
921 /* Directly point connected route. */
922 return match;
923 else
924 {
925 for (ALL_NEXTHOPS_RO(match->nexthop, newhop, tnewhop, recursing))
926 if (CHECK_FLAG (newhop->flags, NEXTHOP_FLAG_FIB))
927 return match;
928 return NULL;
929 }
930 }
931 }
932 return NULL;
933 }
934 #endif /* HAVE_IPV6 */
935
936 #define RIB_SYSTEM_ROUTE(R) \
937 ((R)->type == ZEBRA_ROUTE_KERNEL || (R)->type == ZEBRA_ROUTE_CONNECT)
938
939 /* This function verifies reachability of one given nexthop, which can be
940 * numbered or unnumbered, IPv4 or IPv6. The result is unconditionally stored
941 * in nexthop->flags field. If the 4th parameter, 'set', is non-zero,
942 * nexthop->ifindex will be updated appropriately as well.
943 * An existing route map can turn (otherwise active) nexthop into inactive, but
944 * not vice versa.
945 *
946 * The return value is the final value of 'ACTIVE' flag.
947 */
948
949 static unsigned
950 nexthop_active_check (struct route_node *rn, struct rib *rib,
951 struct nexthop *nexthop, int set)
952 {
953 rib_table_info_t *info = rn->table->info;
954 struct interface *ifp;
955 route_map_result_t ret = RMAP_MATCH;
956 extern char *proto_rm[AFI_MAX][ZEBRA_ROUTE_MAX+1];
957 struct route_map *rmap;
958 int family;
959
960 family = 0;
961 switch (nexthop->type)
962 {
963 case NEXTHOP_TYPE_IFINDEX:
964 ifp = if_lookup_by_index (nexthop->ifindex);
965 if (ifp && if_is_operative(ifp))
966 SET_FLAG (nexthop->flags, NEXTHOP_FLAG_ACTIVE);
967 else
968 UNSET_FLAG (nexthop->flags, NEXTHOP_FLAG_ACTIVE);
969 break;
970 case NEXTHOP_TYPE_IPV6_IFNAME:
971 family = AFI_IP6;
972 case NEXTHOP_TYPE_IFNAME:
973 ifp = if_lookup_by_name (nexthop->ifname);
974 if (ifp && if_is_operative(ifp))
975 {
976 if (set)
977 nexthop->ifindex = ifp->ifindex;
978 SET_FLAG (nexthop->flags, NEXTHOP_FLAG_ACTIVE);
979 }
980 else
981 {
982 if (set)
983 nexthop->ifindex = 0;
984 UNSET_FLAG (nexthop->flags, NEXTHOP_FLAG_ACTIVE);
985 }
986 break;
987 case NEXTHOP_TYPE_IPV4:
988 case NEXTHOP_TYPE_IPV4_IFINDEX:
989 family = AFI_IP;
990 if (nexthop_active_ipv4 (rib, nexthop, set, rn))
991 SET_FLAG (nexthop->flags, NEXTHOP_FLAG_ACTIVE);
992 else
993 UNSET_FLAG (nexthop->flags, NEXTHOP_FLAG_ACTIVE);
994 break;
995 #ifdef HAVE_IPV6
996 case NEXTHOP_TYPE_IPV6:
997 family = AFI_IP6;
998 if (nexthop_active_ipv6 (rib, nexthop, set, rn))
999 SET_FLAG (nexthop->flags, NEXTHOP_FLAG_ACTIVE);
1000 else
1001 UNSET_FLAG (nexthop->flags, NEXTHOP_FLAG_ACTIVE);
1002 break;
1003 case NEXTHOP_TYPE_IPV6_IFINDEX:
1004 family = AFI_IP6;
1005 if (IN6_IS_ADDR_LINKLOCAL (&nexthop->gate.ipv6))
1006 {
1007 ifp = if_lookup_by_index (nexthop->ifindex);
1008 if (ifp && if_is_operative(ifp))
1009 SET_FLAG (nexthop->flags, NEXTHOP_FLAG_ACTIVE);
1010 else
1011 UNSET_FLAG (nexthop->flags, NEXTHOP_FLAG_ACTIVE);
1012 }
1013 else
1014 {
1015 if (nexthop_active_ipv6 (rib, nexthop, set, rn))
1016 SET_FLAG (nexthop->flags, NEXTHOP_FLAG_ACTIVE);
1017 else
1018 UNSET_FLAG (nexthop->flags, NEXTHOP_FLAG_ACTIVE);
1019 }
1020 break;
1021 #endif /* HAVE_IPV6 */
1022 case NEXTHOP_TYPE_BLACKHOLE:
1023 SET_FLAG (nexthop->flags, NEXTHOP_FLAG_ACTIVE);
1024 break;
1025 default:
1026 break;
1027 }
1028 if (! CHECK_FLAG (nexthop->flags, NEXTHOP_FLAG_ACTIVE))
1029 return 0;
1030
1031 /* XXX: What exactly do those checks do? Do we support
1032 * e.g. IPv4 routes with IPv6 nexthops or vice versa? */
1033 if (RIB_SYSTEM_ROUTE(rib) ||
1034 (family == AFI_IP && rn->p.family != AF_INET) ||
1035 (family == AFI_IP6 && rn->p.family != AF_INET6))
1036 return CHECK_FLAG (nexthop->flags, NEXTHOP_FLAG_ACTIVE);
1037
1038 /* The original code didn't determine the family correctly
1039 * e.g. for NEXTHOP_TYPE_IFINDEX. Retrieve the correct afi
1040 * from the rib_table_info in those cases.
1041 * Possibly it may be better to use only the rib_table_info
1042 * in every case.
1043 */
1044 if (!family)
1045 family = info->afi;
1046
1047 rmap = 0;
1048 if (rib->type >= 0 && rib->type < ZEBRA_ROUTE_MAX &&
1049 proto_rm[family][rib->type])
1050 rmap = route_map_lookup_by_name (proto_rm[family][rib->type]);
1051 if (!rmap && proto_rm[family][ZEBRA_ROUTE_MAX])
1052 rmap = route_map_lookup_by_name (proto_rm[family][ZEBRA_ROUTE_MAX]);
1053 if (rmap) {
1054 ret = route_map_apply(rmap, &rn->p, RMAP_ZEBRA, nexthop);
1055 }
1056
1057 if (ret == RMAP_DENYMATCH)
1058 UNSET_FLAG (nexthop->flags, NEXTHOP_FLAG_ACTIVE);
1059 return CHECK_FLAG (nexthop->flags, NEXTHOP_FLAG_ACTIVE);
1060 }
1061
1062 /* Iterate over all nexthops of the given RIB entry and refresh their
1063 * ACTIVE flag. rib->nexthop_active_num is updated accordingly. If any
1064 * nexthop is found to toggle the ACTIVE flag, the whole rib structure
1065 * is flagged with ZEBRA_FLAG_CHANGED. The 4th 'set' argument is
1066 * transparently passed to nexthop_active_check().
1067 *
1068 * Return value is the new number of active nexthops.
1069 */
1070
1071 static int
1072 nexthop_active_update (struct route_node *rn, struct rib *rib, int set)
1073 {
1074 struct nexthop *nexthop;
1075 unsigned int prev_active, prev_index, new_active;
1076
1077 rib->nexthop_active_num = 0;
1078 UNSET_FLAG (rib->flags, ZEBRA_FLAG_CHANGED);
1079
1080 for (nexthop = rib->nexthop; nexthop; nexthop = nexthop->next)
1081 {
1082 prev_active = CHECK_FLAG (nexthop->flags, NEXTHOP_FLAG_ACTIVE);
1083 prev_index = nexthop->ifindex;
1084 if ((new_active = nexthop_active_check (rn, rib, nexthop, set)))
1085 rib->nexthop_active_num++;
1086 if (prev_active != new_active ||
1087 prev_index != nexthop->ifindex)
1088 SET_FLAG (rib->flags, ZEBRA_FLAG_CHANGED);
1089 }
1090 return rib->nexthop_active_num;
1091 }
1092
1093 \f
1094
1095 static void
1096 rib_install_kernel (struct route_node *rn, struct rib *rib)
1097 {
1098 int ret = 0;
1099 struct nexthop *nexthop, *tnexthop;
1100 int recursing;
1101
1102 /*
1103 * Make sure we update the FPM any time we send new information to
1104 * the kernel.
1105 */
1106 zfpm_trigger_update (rn, "installing in kernel");
1107 switch (PREFIX_FAMILY (&rn->p))
1108 {
1109 case AF_INET:
1110 ret = kernel_add_ipv4 (&rn->p, rib);
1111 break;
1112 #ifdef HAVE_IPV6
1113 case AF_INET6:
1114 ret = kernel_add_ipv6 (&rn->p, rib);
1115 break;
1116 #endif /* HAVE_IPV6 */
1117 }
1118
1119 /* This condition is never met, if we are using rt_socket.c */
1120 if (ret < 0)
1121 {
1122 for (ALL_NEXTHOPS_RO(rib->nexthop, nexthop, tnexthop, recursing))
1123 UNSET_FLAG (nexthop->flags, NEXTHOP_FLAG_FIB);
1124 }
1125 }
1126
1127 /* Uninstall the route from kernel. */
1128 static int
1129 rib_uninstall_kernel (struct route_node *rn, struct rib *rib)
1130 {
1131 int ret = 0;
1132 struct nexthop *nexthop, *tnexthop;
1133 int recursing;
1134
1135 /*
1136 * Make sure we update the FPM any time we send new information to
1137 * the kernel.
1138 */
1139 zfpm_trigger_update (rn, "uninstalling from kernel");
1140
1141 switch (PREFIX_FAMILY (&rn->p))
1142 {
1143 case AF_INET:
1144 ret = kernel_delete_ipv4 (&rn->p, rib);
1145 break;
1146 #ifdef HAVE_IPV6
1147 case AF_INET6:
1148 ret = kernel_delete_ipv6 (&rn->p, rib);
1149 break;
1150 #endif /* HAVE_IPV6 */
1151 }
1152
1153 for (ALL_NEXTHOPS_RO(rib->nexthop, nexthop, tnexthop, recursing))
1154 UNSET_FLAG (nexthop->flags, NEXTHOP_FLAG_FIB);
1155
1156 return ret;
1157 }
1158
1159 /* Uninstall the route from kernel. */
1160 static void
1161 rib_uninstall (struct route_node *rn, struct rib *rib)
1162 {
1163 if (CHECK_FLAG (rib->flags, ZEBRA_FLAG_SELECTED))
1164 {
1165 zfpm_trigger_update (rn, "rib_uninstall");
1166
1167 redistribute_delete (&rn->p, rib);
1168 if (! RIB_SYSTEM_ROUTE (rib))
1169 rib_uninstall_kernel (rn, rib);
1170 UNSET_FLAG (rib->flags, ZEBRA_FLAG_SELECTED);
1171 }
1172 }
1173
1174 static void rib_unlink (struct route_node *, struct rib *);
1175
1176 /*
1177 * rib_can_delete_dest
1178 *
1179 * Returns TRUE if the given dest can be deleted from the table.
1180 */
1181 static int
1182 rib_can_delete_dest (rib_dest_t *dest)
1183 {
1184 if (dest->routes)
1185 {
1186 return 0;
1187 }
1188
1189 /*
1190 * Don't delete the dest if we have to update the FPM about this
1191 * prefix.
1192 */
1193 if (CHECK_FLAG (dest->flags, RIB_DEST_UPDATE_FPM) ||
1194 CHECK_FLAG (dest->flags, RIB_DEST_SENT_TO_FPM))
1195 return 0;
1196
1197 return 1;
1198 }
1199
1200 /*
1201 * rib_gc_dest
1202 *
1203 * Garbage collect the rib dest corresponding to the given route node
1204 * if appropriate.
1205 *
1206 * Returns TRUE if the dest was deleted, FALSE otherwise.
1207 */
1208 int
1209 rib_gc_dest (struct route_node *rn)
1210 {
1211 rib_dest_t *dest;
1212 char buf[INET6_ADDRSTRLEN];
1213
1214 dest = rib_dest_from_rnode (rn);
1215 if (!dest)
1216 return 0;
1217
1218 if (!rib_can_delete_dest (dest))
1219 return 0;
1220
1221 if (IS_ZEBRA_DEBUG_RIB)
1222 {
1223 inet_ntop (rn->p.family, &rn->p.u.prefix, buf, sizeof (buf));
1224 zlog_debug ("%s: %s/%d: removing dest from table", __func__,
1225 buf, rn->p.prefixlen);
1226 }
1227
1228 dest->rnode = NULL;
1229 XFREE (MTYPE_RIB_DEST, dest);
1230 rn->info = NULL;
1231
1232 /*
1233 * Release the one reference that we keep on the route node.
1234 */
1235 route_unlock_node (rn);
1236 return 1;
1237 }
1238
1239 /* Core function for processing routing information base. */
1240 static void
1241 rib_process (struct route_node *rn)
1242 {
1243 struct rib *rib;
1244 struct rib *next;
1245 struct rib *fib = NULL;
1246 struct rib *select = NULL;
1247 struct rib *del = NULL;
1248 int installed = 0;
1249 struct nexthop *nexthop = NULL, *tnexthop;
1250 int recursing;
1251 char buf[INET6_ADDRSTRLEN];
1252
1253 assert (rn);
1254
1255 if (IS_ZEBRA_DEBUG_RIB || IS_ZEBRA_DEBUG_RIB_Q)
1256 inet_ntop (rn->p.family, &rn->p.u.prefix, buf, INET6_ADDRSTRLEN);
1257
1258 RNODE_FOREACH_RIB_SAFE (rn, rib, next)
1259 {
1260 /* Currently installed rib. */
1261 if (CHECK_FLAG (rib->flags, ZEBRA_FLAG_SELECTED))
1262 {
1263 assert (fib == NULL);
1264 fib = rib;
1265 }
1266
1267 /* Unlock removed routes, so they'll be freed, bar the FIB entry,
1268 * which we need to do do further work with below.
1269 */
1270 if (CHECK_FLAG (rib->status, RIB_ENTRY_REMOVED))
1271 {
1272 if (rib != fib)
1273 {
1274 if (IS_ZEBRA_DEBUG_RIB)
1275 zlog_debug ("%s: %s/%d: rn %p, removing rib %p", __func__,
1276 buf, rn->p.prefixlen, rn, rib);
1277 rib_unlink (rn, rib);
1278 }
1279 else
1280 del = rib;
1281
1282 continue;
1283 }
1284
1285 /* Skip unreachable nexthop. */
1286 if (! nexthop_active_update (rn, rib, 0))
1287 continue;
1288
1289 /* Infinit distance. */
1290 if (rib->distance == DISTANCE_INFINITY)
1291 continue;
1292
1293 /* Newly selected rib, the common case. */
1294 if (!select)
1295 {
1296 select = rib;
1297 continue;
1298 }
1299
1300 /* filter route selection in following order:
1301 * - connected beats other types
1302 * - lower distance beats higher
1303 * - lower metric beats higher for equal distance
1304 * - last, hence oldest, route wins tie break.
1305 */
1306
1307 /* Connected routes. Pick the last connected
1308 * route of the set of lowest metric connected routes.
1309 */
1310 if (rib->type == ZEBRA_ROUTE_CONNECT)
1311 {
1312 if (select->type != ZEBRA_ROUTE_CONNECT
1313 || rib->metric <= select->metric)
1314 select = rib;
1315 continue;
1316 }
1317 else if (select->type == ZEBRA_ROUTE_CONNECT)
1318 continue;
1319
1320 /* higher distance loses */
1321 if (rib->distance > select->distance)
1322 continue;
1323
1324 /* lower wins */
1325 if (rib->distance < select->distance)
1326 {
1327 select = rib;
1328 continue;
1329 }
1330
1331 /* metric tie-breaks equal distance */
1332 if (rib->metric <= select->metric)
1333 select = rib;
1334 } /* RNODE_FOREACH_RIB_SAFE */
1335
1336 /* After the cycle is finished, the following pointers will be set:
1337 * select --- the winner RIB entry, if any was found, otherwise NULL
1338 * fib --- the SELECTED RIB entry, if any, otherwise NULL
1339 * del --- equal to fib, if fib is queued for deletion, NULL otherwise
1340 * rib --- NULL
1341 */
1342
1343 /* Same RIB entry is selected. Update FIB and finish. */
1344 if (select && select == fib)
1345 {
1346 if (IS_ZEBRA_DEBUG_RIB)
1347 zlog_debug ("%s: %s/%d: Updating existing route, select %p, fib %p",
1348 __func__, buf, rn->p.prefixlen, select, fib);
1349 if (CHECK_FLAG (select->flags, ZEBRA_FLAG_CHANGED))
1350 {
1351 zfpm_trigger_update (rn, "updating existing route");
1352
1353 redistribute_delete (&rn->p, select);
1354 if (! RIB_SYSTEM_ROUTE (select))
1355 rib_uninstall_kernel (rn, select);
1356
1357 /* Set real nexthop. */
1358 nexthop_active_update (rn, select, 1);
1359
1360 if (! RIB_SYSTEM_ROUTE (select))
1361 rib_install_kernel (rn, select);
1362 redistribute_add (&rn->p, select);
1363 }
1364 else if (! RIB_SYSTEM_ROUTE (select))
1365 {
1366 /* Housekeeping code to deal with
1367 race conditions in kernel with linux
1368 netlink reporting interface up before IPv4 or IPv6 protocol
1369 is ready to add routes.
1370 This makes sure the routes are IN the kernel.
1371 */
1372
1373 for (ALL_NEXTHOPS_RO(select->nexthop, nexthop, tnexthop, recursing))
1374 if (CHECK_FLAG (nexthop->flags, NEXTHOP_FLAG_FIB))
1375 {
1376 installed = 1;
1377 break;
1378 }
1379 if (! installed)
1380 rib_install_kernel (rn, select);
1381 }
1382 goto end;
1383 }
1384
1385 /* At this point we either haven't found the best RIB entry or it is
1386 * different from what we currently intend to flag with SELECTED. In both
1387 * cases, if a RIB block is present in FIB, it should be withdrawn.
1388 */
1389 if (fib)
1390 {
1391 if (IS_ZEBRA_DEBUG_RIB)
1392 zlog_debug ("%s: %s/%d: Removing existing route, fib %p", __func__,
1393 buf, rn->p.prefixlen, fib);
1394
1395 zfpm_trigger_update (rn, "removing existing route");
1396
1397 redistribute_delete (&rn->p, fib);
1398 if (! RIB_SYSTEM_ROUTE (fib))
1399 rib_uninstall_kernel (rn, fib);
1400 UNSET_FLAG (fib->flags, ZEBRA_FLAG_SELECTED);
1401
1402 /* Set real nexthop. */
1403 nexthop_active_update (rn, fib, 1);
1404 }
1405
1406 /* Regardless of some RIB entry being SELECTED or not before, now we can
1407 * tell, that if a new winner exists, FIB is still not updated with this
1408 * data, but ready to be.
1409 */
1410 if (select)
1411 {
1412 if (IS_ZEBRA_DEBUG_RIB)
1413 zlog_debug ("%s: %s/%d: Adding route, select %p", __func__, buf,
1414 rn->p.prefixlen, select);
1415
1416 zfpm_trigger_update (rn, "new route selected");
1417
1418 /* Set real nexthop. */
1419 nexthop_active_update (rn, select, 1);
1420
1421 if (! RIB_SYSTEM_ROUTE (select))
1422 rib_install_kernel (rn, select);
1423 SET_FLAG (select->flags, ZEBRA_FLAG_SELECTED);
1424 redistribute_add (&rn->p, select);
1425 }
1426
1427 /* FIB route was removed, should be deleted */
1428 if (del)
1429 {
1430 if (IS_ZEBRA_DEBUG_RIB)
1431 zlog_debug ("%s: %s/%d: Deleting fib %p, rn %p", __func__, buf,
1432 rn->p.prefixlen, del, rn);
1433 rib_unlink (rn, del);
1434 }
1435
1436 end:
1437 if (IS_ZEBRA_DEBUG_RIB_Q)
1438 zlog_debug ("%s: %s/%d: rn %p dequeued", __func__, buf, rn->p.prefixlen, rn);
1439
1440 /*
1441 * Check if the dest can be deleted now.
1442 */
1443 rib_gc_dest (rn);
1444 }
1445
1446 /* Take a list of route_node structs and return 1, if there was a record
1447 * picked from it and processed by rib_process(). Don't process more,
1448 * than one RN record; operate only in the specified sub-queue.
1449 */
1450 static unsigned int
1451 process_subq (struct list * subq, u_char qindex)
1452 {
1453 struct listnode *lnode = listhead (subq);
1454 struct route_node *rnode;
1455
1456 if (!lnode)
1457 return 0;
1458
1459 rnode = listgetdata (lnode);
1460 rib_process (rnode);
1461
1462 if (rnode->info)
1463 UNSET_FLAG (rib_dest_from_rnode (rnode)->flags, RIB_ROUTE_QUEUED (qindex));
1464
1465 #if 0
1466 else
1467 {
1468 zlog_debug ("%s: called for route_node (%p, %d) with no ribs",
1469 __func__, rnode, rnode->lock);
1470 zlog_backtrace(LOG_DEBUG);
1471 }
1472 #endif
1473 route_unlock_node (rnode);
1474 list_delete_node (subq, lnode);
1475 return 1;
1476 }
1477
1478 /* Dispatch the meta queue by picking, processing and unlocking the next RN from
1479 * a non-empty sub-queue with lowest priority. wq is equal to zebra->ribq and data
1480 * is pointed to the meta queue structure.
1481 */
1482 static wq_item_status
1483 meta_queue_process (struct work_queue *dummy, void *data)
1484 {
1485 struct meta_queue * mq = data;
1486 unsigned i;
1487
1488 for (i = 0; i < MQ_SIZE; i++)
1489 if (process_subq (mq->subq[i], i))
1490 {
1491 mq->size--;
1492 break;
1493 }
1494 return mq->size ? WQ_REQUEUE : WQ_SUCCESS;
1495 }
1496
1497 /*
1498 * Map from rib types to queue type (priority) in meta queue
1499 */
1500 static const u_char meta_queue_map[ZEBRA_ROUTE_MAX] = {
1501 [ZEBRA_ROUTE_SYSTEM] = 4,
1502 [ZEBRA_ROUTE_KERNEL] = 0,
1503 [ZEBRA_ROUTE_CONNECT] = 0,
1504 [ZEBRA_ROUTE_STATIC] = 1,
1505 [ZEBRA_ROUTE_RIP] = 2,
1506 [ZEBRA_ROUTE_RIPNG] = 2,
1507 [ZEBRA_ROUTE_OSPF] = 2,
1508 [ZEBRA_ROUTE_OSPF6] = 2,
1509 [ZEBRA_ROUTE_ISIS] = 2,
1510 [ZEBRA_ROUTE_BGP] = 3,
1511 [ZEBRA_ROUTE_HSLS] = 4,
1512 [ZEBRA_ROUTE_BABEL] = 2,
1513 };
1514
1515 /* Look into the RN and queue it into one or more priority queues,
1516 * increasing the size for each data push done.
1517 */
1518 static void
1519 rib_meta_queue_add (struct meta_queue *mq, struct route_node *rn)
1520 {
1521 struct rib *rib;
1522 char buf[INET6_ADDRSTRLEN];
1523
1524 if (IS_ZEBRA_DEBUG_RIB_Q)
1525 inet_ntop (rn->p.family, &rn->p.u.prefix, buf, INET6_ADDRSTRLEN);
1526
1527 RNODE_FOREACH_RIB (rn, rib)
1528 {
1529 u_char qindex = meta_queue_map[rib->type];
1530
1531 /* Invariant: at this point we always have rn->info set. */
1532 if (CHECK_FLAG (rib_dest_from_rnode (rn)->flags,
1533 RIB_ROUTE_QUEUED (qindex)))
1534 {
1535 if (IS_ZEBRA_DEBUG_RIB_Q)
1536 zlog_debug ("%s: %s/%d: rn %p is already queued in sub-queue %u",
1537 __func__, buf, rn->p.prefixlen, rn, qindex);
1538 continue;
1539 }
1540
1541 SET_FLAG (rib_dest_from_rnode (rn)->flags, RIB_ROUTE_QUEUED (qindex));
1542 listnode_add (mq->subq[qindex], rn);
1543 route_lock_node (rn);
1544 mq->size++;
1545
1546 if (IS_ZEBRA_DEBUG_RIB_Q)
1547 zlog_debug ("%s: %s/%d: queued rn %p into sub-queue %u",
1548 __func__, buf, rn->p.prefixlen, rn, qindex);
1549 }
1550 }
1551
1552 /* Add route_node to work queue and schedule processing */
1553 static void
1554 rib_queue_add (struct zebra_t *zebra, struct route_node *rn)
1555 {
1556 char buf[INET_ADDRSTRLEN];
1557 assert (zebra && rn);
1558
1559 if (IS_ZEBRA_DEBUG_RIB_Q)
1560 inet_ntop (AF_INET, &rn->p.u.prefix, buf, INET_ADDRSTRLEN);
1561
1562 /* Pointless to queue a route_node with no RIB entries to add or remove */
1563 if (!rnode_to_ribs (rn))
1564 {
1565 zlog_debug ("%s: called for route_node (%p, %d) with no ribs",
1566 __func__, rn, rn->lock);
1567 zlog_backtrace(LOG_DEBUG);
1568 return;
1569 }
1570
1571 if (IS_ZEBRA_DEBUG_RIB_Q)
1572 zlog_info ("%s: %s/%d: work queue added", __func__, buf, rn->p.prefixlen);
1573
1574 assert (zebra);
1575
1576 if (zebra->ribq == NULL)
1577 {
1578 zlog_err ("%s: work_queue does not exist!", __func__);
1579 return;
1580 }
1581
1582 /*
1583 * The RIB queue should normally be either empty or holding the only
1584 * work_queue_item element. In the latter case this element would
1585 * hold a pointer to the meta queue structure, which must be used to
1586 * actually queue the route nodes to process. So create the MQ
1587 * holder, if necessary, then push the work into it in any case.
1588 * This semantics was introduced after 0.99.9 release.
1589 */
1590 if (!zebra->ribq->items->count)
1591 work_queue_add (zebra->ribq, zebra->mq);
1592
1593 rib_meta_queue_add (zebra->mq, rn);
1594
1595 if (IS_ZEBRA_DEBUG_RIB_Q)
1596 zlog_debug ("%s: %s/%d: rn %p queued", __func__, buf, rn->p.prefixlen, rn);
1597
1598 return;
1599 }
1600
1601 /* Create new meta queue.
1602 A destructor function doesn't seem to be necessary here.
1603 */
1604 static struct meta_queue *
1605 meta_queue_new (void)
1606 {
1607 struct meta_queue *new;
1608 unsigned i;
1609
1610 new = XCALLOC (MTYPE_WORK_QUEUE, sizeof (struct meta_queue));
1611 assert(new);
1612
1613 for (i = 0; i < MQ_SIZE; i++)
1614 {
1615 new->subq[i] = list_new ();
1616 assert(new->subq[i]);
1617 }
1618
1619 return new;
1620 }
1621
1622 /* initialise zebra rib work queue */
1623 static void
1624 rib_queue_init (struct zebra_t *zebra)
1625 {
1626 assert (zebra);
1627
1628 if (! (zebra->ribq = work_queue_new (zebra->master,
1629 "route_node processing")))
1630 {
1631 zlog_err ("%s: could not initialise work queue!", __func__);
1632 return;
1633 }
1634
1635 /* fill in the work queue spec */
1636 zebra->ribq->spec.workfunc = &meta_queue_process;
1637 zebra->ribq->spec.errorfunc = NULL;
1638 /* XXX: TODO: These should be runtime configurable via vty */
1639 zebra->ribq->spec.max_retries = 3;
1640 zebra->ribq->spec.hold = rib_process_hold_time;
1641
1642 if (!(zebra->mq = meta_queue_new ()))
1643 {
1644 zlog_err ("%s: could not initialise meta queue!", __func__);
1645 return;
1646 }
1647 return;
1648 }
1649
1650 /* RIB updates are processed via a queue of pointers to route_nodes.
1651 *
1652 * The queue length is bounded by the maximal size of the routing table,
1653 * as a route_node will not be requeued, if already queued.
1654 *
1655 * RIBs are submitted via rib_addnode or rib_delnode which set minimal
1656 * state, or static_install_ipv{4,6} (when an existing RIB is updated)
1657 * and then submit route_node to queue for best-path selection later.
1658 * Order of add/delete state changes are preserved for any given RIB.
1659 *
1660 * Deleted RIBs are reaped during best-path selection.
1661 *
1662 * rib_addnode
1663 * |-> rib_link or unset RIB_ENTRY_REMOVE |->Update kernel with
1664 * |-------->| | best RIB, if required
1665 * | |
1666 * static_install->|->rib_addqueue...... -> rib_process
1667 * | |
1668 * |-------->| |-> rib_unlink
1669 * |-> set RIB_ENTRY_REMOVE |
1670 * rib_delnode (RIB freed)
1671 *
1672 * The 'info' pointer of a route_node points to a rib_dest_t
1673 * ('dest'). Queueing state for a route_node is kept on the dest. The
1674 * dest is created on-demand by rib_link() and is kept around at least
1675 * as long as there are ribs hanging off it (@see rib_gc_dest()).
1676 *
1677 * Refcounting (aka "locking" throughout the GNU Zebra and Quagga code):
1678 *
1679 * - route_nodes: refcounted by:
1680 * - dest attached to route_node:
1681 * - managed by: rib_link/rib_gc_dest
1682 * - route_node processing queue
1683 * - managed by: rib_addqueue, rib_process.
1684 *
1685 */
1686
1687 /* Add RIB to head of the route node. */
1688 static void
1689 rib_link (struct route_node *rn, struct rib *rib)
1690 {
1691 struct rib *head;
1692 rib_dest_t *dest;
1693 char buf[INET6_ADDRSTRLEN];
1694
1695 assert (rib && rn);
1696
1697 if (IS_ZEBRA_DEBUG_RIB)
1698 {
1699 inet_ntop (rn->p.family, &rn->p.u.prefix, buf, INET6_ADDRSTRLEN);
1700 zlog_debug ("%s: %s/%d: rn %p, rib %p", __func__,
1701 buf, rn->p.prefixlen, rn, rib);
1702 }
1703
1704 dest = rib_dest_from_rnode (rn);
1705 if (!dest)
1706 {
1707 if (IS_ZEBRA_DEBUG_RIB)
1708 {
1709 zlog_debug ("%s: %s/%d: adding dest to table", __func__,
1710 buf, rn->p.prefixlen);
1711 }
1712
1713 dest = XCALLOC (MTYPE_RIB_DEST, sizeof (rib_dest_t));
1714 route_lock_node (rn); /* rn route table reference */
1715 rn->info = dest;
1716 dest->rnode = rn;
1717 }
1718
1719 head = dest->routes;
1720 if (head)
1721 {
1722 head->prev = rib;
1723 }
1724 rib->next = head;
1725 dest->routes = rib;
1726 rib_queue_add (&zebrad, rn);
1727 }
1728
1729 static void
1730 rib_addnode (struct route_node *rn, struct rib *rib)
1731 {
1732 /* RIB node has been un-removed before route-node is processed.
1733 * route_node must hence already be on the queue for processing..
1734 */
1735 if (CHECK_FLAG (rib->status, RIB_ENTRY_REMOVED))
1736 {
1737 if (IS_ZEBRA_DEBUG_RIB)
1738 {
1739 char buf[INET6_ADDRSTRLEN];
1740 inet_ntop (rn->p.family, &rn->p.u.prefix, buf, INET6_ADDRSTRLEN);
1741 zlog_debug ("%s: %s/%d: rn %p, un-removed rib %p",
1742 __func__, buf, rn->p.prefixlen, rn, rib);
1743 }
1744 UNSET_FLAG (rib->status, RIB_ENTRY_REMOVED);
1745 return;
1746 }
1747 rib_link (rn, rib);
1748 }
1749
1750 /*
1751 * rib_unlink
1752 *
1753 * Detach a rib structure from a route_node.
1754 *
1755 * Note that a call to rib_unlink() should be followed by a call to
1756 * rib_gc_dest() at some point. This allows a rib_dest_t that is no
1757 * longer required to be deleted.
1758 */
1759 static void
1760 rib_unlink (struct route_node *rn, struct rib *rib)
1761 {
1762 char buf[INET6_ADDRSTRLEN];
1763 rib_dest_t *dest;
1764
1765 assert (rn && rib);
1766
1767 if (IS_ZEBRA_DEBUG_RIB)
1768 {
1769 inet_ntop (rn->p.family, &rn->p.u.prefix, buf, INET6_ADDRSTRLEN);
1770 zlog_debug ("%s: %s/%d: rn %p, rib %p",
1771 __func__, buf, rn->p.prefixlen, rn, rib);
1772 }
1773
1774 dest = rib_dest_from_rnode (rn);
1775
1776 if (rib->next)
1777 rib->next->prev = rib->prev;
1778
1779 if (rib->prev)
1780 rib->prev->next = rib->next;
1781 else
1782 {
1783 dest->routes = rib->next;
1784 }
1785
1786 /* free RIB and nexthops */
1787 nexthops_free(rib->nexthop);
1788 XFREE (MTYPE_RIB, rib);
1789
1790 }
1791
1792 static void
1793 rib_delnode (struct route_node *rn, struct rib *rib)
1794 {
1795 if (IS_ZEBRA_DEBUG_RIB)
1796 {
1797 char buf[INET6_ADDRSTRLEN];
1798 inet_ntop (rn->p.family, &rn->p.u.prefix, buf, INET6_ADDRSTRLEN);
1799 zlog_debug ("%s: %s/%d: rn %p, rib %p, removing", __func__,
1800 buf, rn->p.prefixlen, rn, rib);
1801 }
1802 SET_FLAG (rib->status, RIB_ENTRY_REMOVED);
1803 rib_queue_add (&zebrad, rn);
1804 }
1805
1806 int
1807 rib_add_ipv4 (int type, int flags, struct prefix_ipv4 *p,
1808 struct in_addr *gate, struct in_addr *src,
1809 unsigned int ifindex, u_int32_t vrf_id,
1810 u_int32_t metric, u_char distance, safi_t safi)
1811 {
1812 struct rib *rib;
1813 struct rib *same = NULL;
1814 struct route_table *table;
1815 struct route_node *rn;
1816 struct nexthop *nexthop;
1817
1818 /* Lookup table. */
1819 table = vrf_table (AFI_IP, safi, 0);
1820 if (! table)
1821 return 0;
1822
1823 /* Make it sure prefixlen is applied to the prefix. */
1824 apply_mask_ipv4 (p);
1825
1826 /* Set default distance by route type. */
1827 if (distance == 0)
1828 {
1829 if ((unsigned)type >= array_size(route_info))
1830 distance = 150;
1831 else
1832 distance = route_info[type].distance;
1833
1834 /* iBGP distance is 200. */
1835 if (type == ZEBRA_ROUTE_BGP && CHECK_FLAG (flags, ZEBRA_FLAG_IBGP))
1836 distance = 200;
1837 }
1838
1839 /* Lookup route node.*/
1840 rn = route_node_get (table, (struct prefix *) p);
1841
1842 /* If same type of route are installed, treat it as a implicit
1843 withdraw. */
1844 RNODE_FOREACH_RIB (rn, rib)
1845 {
1846 if (CHECK_FLAG (rib->status, RIB_ENTRY_REMOVED))
1847 continue;
1848
1849 if (rib->type != type)
1850 continue;
1851 if (rib->type != ZEBRA_ROUTE_CONNECT)
1852 {
1853 same = rib;
1854 break;
1855 }
1856 /* Duplicate connected route comes in. */
1857 else if ((nexthop = rib->nexthop) &&
1858 nexthop->type == NEXTHOP_TYPE_IFINDEX &&
1859 nexthop->ifindex == ifindex &&
1860 !CHECK_FLAG (rib->status, RIB_ENTRY_REMOVED))
1861 {
1862 rib->refcnt++;
1863 return 0 ;
1864 }
1865 }
1866
1867 /* Allocate new rib structure. */
1868 rib = XCALLOC (MTYPE_RIB, sizeof (struct rib));
1869 rib->type = type;
1870 rib->distance = distance;
1871 rib->flags = flags;
1872 rib->metric = metric;
1873 rib->table = vrf_id;
1874 rib->nexthop_num = 0;
1875 rib->uptime = time (NULL);
1876
1877 /* Nexthop settings. */
1878 if (gate)
1879 {
1880 if (ifindex)
1881 nexthop_ipv4_ifindex_add (rib, gate, src, ifindex);
1882 else
1883 nexthop_ipv4_add (rib, gate, src);
1884 }
1885 else
1886 nexthop_ifindex_add (rib, ifindex);
1887
1888 /* If this route is kernel route, set FIB flag to the route. */
1889 if (type == ZEBRA_ROUTE_KERNEL || type == ZEBRA_ROUTE_CONNECT)
1890 for (nexthop = rib->nexthop; nexthop; nexthop = nexthop->next)
1891 SET_FLAG (nexthop->flags, NEXTHOP_FLAG_FIB);
1892
1893 /* Link new rib to node.*/
1894 if (IS_ZEBRA_DEBUG_RIB)
1895 zlog_debug ("%s: calling rib_addnode (%p, %p)", __func__, rn, rib);
1896 rib_addnode (rn, rib);
1897
1898 /* Free implicit route.*/
1899 if (same)
1900 {
1901 if (IS_ZEBRA_DEBUG_RIB)
1902 zlog_debug ("%s: calling rib_delnode (%p, %p)", __func__, rn, rib);
1903 rib_delnode (rn, same);
1904 }
1905
1906 route_unlock_node (rn);
1907 return 0;
1908 }
1909
1910 /* This function dumps the contents of a given RIB entry into
1911 * standard debug log. Calling function name and IP prefix in
1912 * question are passed as 1st and 2nd arguments.
1913 */
1914
1915 void rib_dump (const char * func, const struct prefix * p, const struct rib * rib)
1916 {
1917 char straddr[INET6_ADDRSTRLEN];
1918 struct nexthop *nexthop, *tnexthop;
1919 int recursing;
1920
1921 inet_ntop (p->family, &p->u.prefix, straddr, INET6_ADDRSTRLEN);
1922 zlog_debug ("%s: dumping RIB entry %p for %s/%d", func, rib, straddr, p->prefixlen);
1923 zlog_debug
1924 (
1925 "%s: refcnt == %lu, uptime == %lu, type == %u, table == %d",
1926 func,
1927 rib->refcnt,
1928 (unsigned long) rib->uptime,
1929 rib->type,
1930 rib->table
1931 );
1932 zlog_debug
1933 (
1934 "%s: metric == %u, distance == %u, flags == %u, status == %u",
1935 func,
1936 rib->metric,
1937 rib->distance,
1938 rib->flags,
1939 rib->status
1940 );
1941 zlog_debug
1942 (
1943 "%s: nexthop_num == %u, nexthop_active_num == %u, nexthop_fib_num == %u",
1944 func,
1945 rib->nexthop_num,
1946 rib->nexthop_active_num,
1947 rib->nexthop_fib_num
1948 );
1949
1950 for (ALL_NEXTHOPS_RO(rib->nexthop, nexthop, tnexthop, recursing))
1951 {
1952 inet_ntop (p->family, &nexthop->gate, straddr, INET6_ADDRSTRLEN);
1953 zlog_debug
1954 (
1955 "%s: %s %s with flags %s%s%s",
1956 func,
1957 (recursing ? " NH" : "NH"),
1958 straddr,
1959 (CHECK_FLAG (nexthop->flags, NEXTHOP_FLAG_ACTIVE) ? "ACTIVE " : ""),
1960 (CHECK_FLAG (nexthop->flags, NEXTHOP_FLAG_FIB) ? "FIB " : ""),
1961 (CHECK_FLAG (nexthop->flags, NEXTHOP_FLAG_RECURSIVE) ? "RECURSIVE" : "")
1962 );
1963 }
1964 zlog_debug ("%s: dump complete", func);
1965 }
1966
1967 /* This is an exported helper to rtm_read() to dump the strange
1968 * RIB entry found by rib_lookup_ipv4_route()
1969 */
1970
1971 void rib_lookup_and_dump (struct prefix_ipv4 * p)
1972 {
1973 struct route_table *table;
1974 struct route_node *rn;
1975 struct rib *rib;
1976 char prefix_buf[INET_ADDRSTRLEN];
1977
1978 /* Lookup table. */
1979 table = vrf_table (AFI_IP, SAFI_UNICAST, 0);
1980 if (! table)
1981 {
1982 zlog_err ("%s: vrf_table() returned NULL", __func__);
1983 return;
1984 }
1985
1986 inet_ntop (AF_INET, &p->prefix.s_addr, prefix_buf, INET_ADDRSTRLEN);
1987 /* Scan the RIB table for exactly matching RIB entry. */
1988 rn = route_node_lookup (table, (struct prefix *) p);
1989
1990 /* No route for this prefix. */
1991 if (! rn)
1992 {
1993 zlog_debug ("%s: lookup failed for %s/%d", __func__, prefix_buf, p->prefixlen);
1994 return;
1995 }
1996
1997 /* Unlock node. */
1998 route_unlock_node (rn);
1999
2000 /* let's go */
2001 RNODE_FOREACH_RIB (rn, rib)
2002 {
2003 zlog_debug
2004 (
2005 "%s: rn %p, rib %p: %s, %s",
2006 __func__,
2007 rn,
2008 rib,
2009 (CHECK_FLAG (rib->status, RIB_ENTRY_REMOVED) ? "removed" : "NOT removed"),
2010 (CHECK_FLAG (rib->flags, ZEBRA_FLAG_SELECTED) ? "selected" : "NOT selected")
2011 );
2012 rib_dump (__func__, (struct prefix *) p, rib);
2013 }
2014 }
2015
2016 /* Check if requested address assignment will fail due to another
2017 * route being installed by zebra in FIB already. Take necessary
2018 * actions, if needed: remove such a route from FIB and deSELECT
2019 * corresponding RIB entry. Then put affected RN into RIBQ head.
2020 */
2021 void rib_lookup_and_pushup (struct prefix_ipv4 * p)
2022 {
2023 struct route_table *table;
2024 struct route_node *rn;
2025 struct rib *rib;
2026 unsigned changed = 0;
2027
2028 if (NULL == (table = vrf_table (AFI_IP, SAFI_UNICAST, 0)))
2029 {
2030 zlog_err ("%s: vrf_table() returned NULL", __func__);
2031 return;
2032 }
2033
2034 /* No matches would be the simplest case. */
2035 if (NULL == (rn = route_node_lookup (table, (struct prefix *) p)))
2036 return;
2037
2038 /* Unlock node. */
2039 route_unlock_node (rn);
2040
2041 /* Check all RIB entries. In case any changes have to be done, requeue
2042 * the RN into RIBQ head. If the routing message about the new connected
2043 * route (generated by the IP address we are going to assign very soon)
2044 * comes before the RIBQ is processed, the new RIB entry will join
2045 * RIBQ record already on head. This is necessary for proper revalidation
2046 * of the rest of the RIB.
2047 */
2048 RNODE_FOREACH_RIB (rn, rib)
2049 {
2050 if (CHECK_FLAG (rib->flags, ZEBRA_FLAG_SELECTED) &&
2051 ! RIB_SYSTEM_ROUTE (rib))
2052 {
2053 changed = 1;
2054 if (IS_ZEBRA_DEBUG_RIB)
2055 {
2056 char buf[INET_ADDRSTRLEN];
2057 inet_ntop (rn->p.family, &p->prefix, buf, INET_ADDRSTRLEN);
2058 zlog_debug ("%s: freeing way for connected prefix %s/%d", __func__, buf, p->prefixlen);
2059 rib_dump (__func__, &rn->p, rib);
2060 }
2061 rib_uninstall (rn, rib);
2062 }
2063 }
2064 if (changed)
2065 rib_queue_add (&zebrad, rn);
2066 }
2067
2068 int
2069 rib_add_ipv4_multipath (struct prefix_ipv4 *p, struct rib *rib, safi_t safi)
2070 {
2071 struct route_table *table;
2072 struct route_node *rn;
2073 struct rib *same;
2074 struct nexthop *nexthop;
2075
2076 /* Lookup table. */
2077 table = vrf_table (AFI_IP, safi, 0);
2078 if (! table)
2079 return 0;
2080
2081 /* Make it sure prefixlen is applied to the prefix. */
2082 apply_mask_ipv4 (p);
2083
2084 /* Set default distance by route type. */
2085 if (rib->distance == 0)
2086 {
2087 rib->distance = route_info[rib->type].distance;
2088
2089 /* iBGP distance is 200. */
2090 if (rib->type == ZEBRA_ROUTE_BGP
2091 && CHECK_FLAG (rib->flags, ZEBRA_FLAG_IBGP))
2092 rib->distance = 200;
2093 }
2094
2095 /* Lookup route node.*/
2096 rn = route_node_get (table, (struct prefix *) p);
2097
2098 /* If same type of route are installed, treat it as a implicit
2099 withdraw. */
2100 RNODE_FOREACH_RIB (rn, same)
2101 {
2102 if (CHECK_FLAG (same->status, RIB_ENTRY_REMOVED))
2103 continue;
2104
2105 if (same->type == rib->type && same->table == rib->table
2106 && same->type != ZEBRA_ROUTE_CONNECT)
2107 break;
2108 }
2109
2110 /* If this route is kernel route, set FIB flag to the route. */
2111 if (rib->type == ZEBRA_ROUTE_KERNEL || rib->type == ZEBRA_ROUTE_CONNECT)
2112 for (nexthop = rib->nexthop; nexthop; nexthop = nexthop->next)
2113 SET_FLAG (nexthop->flags, NEXTHOP_FLAG_FIB);
2114
2115 /* Link new rib to node.*/
2116 rib_addnode (rn, rib);
2117 if (IS_ZEBRA_DEBUG_RIB)
2118 {
2119 zlog_debug ("%s: called rib_addnode (%p, %p) on new RIB entry",
2120 __func__, rn, rib);
2121 rib_dump (__func__, (struct prefix *) p, rib);
2122 }
2123
2124 /* Free implicit route.*/
2125 if (same)
2126 {
2127 if (IS_ZEBRA_DEBUG_RIB)
2128 {
2129 zlog_debug ("%s: calling rib_delnode (%p, %p) on existing RIB entry",
2130 __func__, rn, same);
2131 rib_dump (__func__, (struct prefix *) p, same);
2132 }
2133 rib_delnode (rn, same);
2134 }
2135
2136 route_unlock_node (rn);
2137 return 0;
2138 }
2139
2140 /* XXX factor with rib_delete_ipv6 */
2141 int
2142 rib_delete_ipv4 (int type, int flags, struct prefix_ipv4 *p,
2143 struct in_addr *gate, unsigned int ifindex, u_int32_t vrf_id, safi_t safi)
2144 {
2145 struct route_table *table;
2146 struct route_node *rn;
2147 struct rib *rib;
2148 struct rib *fib = NULL;
2149 struct rib *same = NULL;
2150 struct nexthop *nexthop, *tnexthop;
2151 int recursing;
2152 char buf1[INET_ADDRSTRLEN];
2153 char buf2[INET_ADDRSTRLEN];
2154
2155 /* Lookup table. */
2156 table = vrf_table (AFI_IP, safi, 0);
2157 if (! table)
2158 return 0;
2159
2160 /* Apply mask. */
2161 apply_mask_ipv4 (p);
2162
2163 if (IS_ZEBRA_DEBUG_KERNEL)
2164 {
2165 if (gate)
2166 zlog_debug ("rib_delete_ipv4(): route delete %s/%d via %s ifindex %d",
2167 inet_ntop (AF_INET, &p->prefix, buf1, INET_ADDRSTRLEN),
2168 p->prefixlen,
2169 inet_ntoa (*gate),
2170 ifindex);
2171 else
2172 zlog_debug ("rib_delete_ipv4(): route delete %s/%d ifindex %d",
2173 inet_ntop (AF_INET, &p->prefix, buf1, INET_ADDRSTRLEN),
2174 p->prefixlen,
2175 ifindex);
2176 }
2177
2178 /* Lookup route node. */
2179 rn = route_node_lookup (table, (struct prefix *) p);
2180 if (! rn)
2181 {
2182 if (IS_ZEBRA_DEBUG_KERNEL)
2183 {
2184 if (gate)
2185 zlog_debug ("route %s/%d via %s ifindex %d doesn't exist in rib",
2186 inet_ntop (AF_INET, &p->prefix, buf1, INET_ADDRSTRLEN),
2187 p->prefixlen,
2188 inet_ntop (AF_INET, gate, buf2, INET_ADDRSTRLEN),
2189 ifindex);
2190 else
2191 zlog_debug ("route %s/%d ifindex %d doesn't exist in rib",
2192 inet_ntop (AF_INET, &p->prefix, buf1, INET_ADDRSTRLEN),
2193 p->prefixlen,
2194 ifindex);
2195 }
2196 return ZEBRA_ERR_RTNOEXIST;
2197 }
2198
2199 /* Lookup same type route. */
2200 RNODE_FOREACH_RIB (rn, rib)
2201 {
2202 if (CHECK_FLAG (rib->status, RIB_ENTRY_REMOVED))
2203 continue;
2204
2205 if (CHECK_FLAG (rib->flags, ZEBRA_FLAG_SELECTED))
2206 fib = rib;
2207
2208 if (rib->type != type)
2209 continue;
2210 if (rib->type == ZEBRA_ROUTE_CONNECT && (nexthop = rib->nexthop) &&
2211 nexthop->type == NEXTHOP_TYPE_IFINDEX)
2212 {
2213 if (nexthop->ifindex != ifindex)
2214 continue;
2215 if (rib->refcnt)
2216 {
2217 rib->refcnt--;
2218 route_unlock_node (rn);
2219 route_unlock_node (rn);
2220 return 0;
2221 }
2222 same = rib;
2223 break;
2224 }
2225 /* Make sure that the route found has the same gateway. */
2226 else
2227 {
2228 if (gate == NULL)
2229 {
2230 same = rib;
2231 break;
2232 }
2233 for (ALL_NEXTHOPS_RO(rib->nexthop, nexthop, tnexthop, recursing))
2234 if (IPV4_ADDR_SAME (&nexthop->gate.ipv4, gate))
2235 {
2236 same = rib;
2237 break;
2238 }
2239 if (same)
2240 break;
2241 }
2242 }
2243 /* If same type of route can't be found and this message is from
2244 kernel. */
2245 if (! same)
2246 {
2247 if (fib && type == ZEBRA_ROUTE_KERNEL)
2248 {
2249 /* Unset flags. */
2250 for (nexthop = fib->nexthop; nexthop; nexthop = nexthop->next)
2251 UNSET_FLAG (nexthop->flags, NEXTHOP_FLAG_FIB);
2252
2253 UNSET_FLAG (fib->flags, ZEBRA_FLAG_SELECTED);
2254 }
2255 else
2256 {
2257 if (IS_ZEBRA_DEBUG_KERNEL)
2258 {
2259 if (gate)
2260 zlog_debug ("route %s/%d via %s ifindex %d type %d doesn't exist in rib",
2261 inet_ntop (AF_INET, &p->prefix, buf1, INET_ADDRSTRLEN),
2262 p->prefixlen,
2263 inet_ntop (AF_INET, gate, buf2, INET_ADDRSTRLEN),
2264 ifindex,
2265 type);
2266 else
2267 zlog_debug ("route %s/%d ifindex %d type %d doesn't exist in rib",
2268 inet_ntop (AF_INET, &p->prefix, buf1, INET_ADDRSTRLEN),
2269 p->prefixlen,
2270 ifindex,
2271 type);
2272 }
2273 route_unlock_node (rn);
2274 return ZEBRA_ERR_RTNOEXIST;
2275 }
2276 }
2277
2278 if (same)
2279 rib_delnode (rn, same);
2280
2281 route_unlock_node (rn);
2282 return 0;
2283 }
2284 \f
2285 /* Install static route into rib. */
2286 static void
2287 static_install_ipv4 (struct prefix *p, struct static_ipv4 *si)
2288 {
2289 struct rib *rib;
2290 struct route_node *rn;
2291 struct route_table *table;
2292
2293 /* Lookup table. */
2294 table = vrf_table (AFI_IP, SAFI_UNICAST, 0);
2295 if (! table)
2296 return;
2297
2298 /* Lookup existing route */
2299 rn = route_node_get (table, p);
2300 RNODE_FOREACH_RIB (rn, rib)
2301 {
2302 if (CHECK_FLAG (rib->status, RIB_ENTRY_REMOVED))
2303 continue;
2304
2305 if (rib->type == ZEBRA_ROUTE_STATIC && rib->distance == si->distance)
2306 break;
2307 }
2308
2309 if (rib)
2310 {
2311 /* Same distance static route is there. Update it with new
2312 nexthop. */
2313 route_unlock_node (rn);
2314 switch (si->type)
2315 {
2316 case STATIC_IPV4_GATEWAY:
2317 nexthop_ipv4_add (rib, &si->gate.ipv4, NULL);
2318 break;
2319 case STATIC_IPV4_IFNAME:
2320 nexthop_ifname_add (rib, si->gate.ifname);
2321 break;
2322 case STATIC_IPV4_BLACKHOLE:
2323 nexthop_blackhole_add (rib);
2324 break;
2325 }
2326 rib_queue_add (&zebrad, rn);
2327 }
2328 else
2329 {
2330 /* This is new static route. */
2331 rib = XCALLOC (MTYPE_RIB, sizeof (struct rib));
2332
2333 rib->type = ZEBRA_ROUTE_STATIC;
2334 rib->distance = si->distance;
2335 rib->metric = 0;
2336 rib->table = zebrad.rtm_table_default;
2337 rib->nexthop_num = 0;
2338
2339 switch (si->type)
2340 {
2341 case STATIC_IPV4_GATEWAY:
2342 nexthop_ipv4_add (rib, &si->gate.ipv4, NULL);
2343 break;
2344 case STATIC_IPV4_IFNAME:
2345 nexthop_ifname_add (rib, si->gate.ifname);
2346 break;
2347 case STATIC_IPV4_BLACKHOLE:
2348 nexthop_blackhole_add (rib);
2349 break;
2350 }
2351
2352 /* Save the flags of this static routes (reject, blackhole) */
2353 rib->flags = si->flags;
2354
2355 /* Link this rib to the tree. */
2356 rib_addnode (rn, rib);
2357 }
2358 }
2359
2360 static int
2361 static_ipv4_nexthop_same (struct nexthop *nexthop, struct static_ipv4 *si)
2362 {
2363 if (nexthop->type == NEXTHOP_TYPE_IPV4
2364 && si->type == STATIC_IPV4_GATEWAY
2365 && IPV4_ADDR_SAME (&nexthop->gate.ipv4, &si->gate.ipv4))
2366 return 1;
2367 if (nexthop->type == NEXTHOP_TYPE_IFNAME
2368 && si->type == STATIC_IPV4_IFNAME
2369 && strcmp (nexthop->ifname, si->gate.ifname) == 0)
2370 return 1;
2371 if (nexthop->type == NEXTHOP_TYPE_BLACKHOLE
2372 && si->type == STATIC_IPV4_BLACKHOLE)
2373 return 1;
2374 return 0;
2375 }
2376
2377 /* Uninstall static route from RIB. */
2378 static void
2379 static_uninstall_ipv4 (struct prefix *p, struct static_ipv4 *si)
2380 {
2381 struct route_node *rn;
2382 struct rib *rib;
2383 struct nexthop *nexthop;
2384 struct route_table *table;
2385
2386 /* Lookup table. */
2387 table = vrf_table (AFI_IP, SAFI_UNICAST, 0);
2388 if (! table)
2389 return;
2390
2391 /* Lookup existing route with type and distance. */
2392 rn = route_node_lookup (table, p);
2393 if (! rn)
2394 return;
2395
2396 RNODE_FOREACH_RIB (rn, rib)
2397 {
2398 if (CHECK_FLAG (rib->status, RIB_ENTRY_REMOVED))
2399 continue;
2400
2401 if (rib->type == ZEBRA_ROUTE_STATIC && rib->distance == si->distance)
2402 break;
2403 }
2404
2405 if (! rib)
2406 {
2407 route_unlock_node (rn);
2408 return;
2409 }
2410
2411 /* Lookup nexthop. */
2412 for (nexthop = rib->nexthop; nexthop; nexthop = nexthop->next)
2413 if (static_ipv4_nexthop_same (nexthop, si))
2414 break;
2415
2416 /* Can't find nexthop. */
2417 if (! nexthop)
2418 {
2419 route_unlock_node (rn);
2420 return;
2421 }
2422
2423 /* Check nexthop. */
2424 if (rib->nexthop_num == 1)
2425 rib_delnode (rn, rib);
2426 else
2427 {
2428 if (CHECK_FLAG (nexthop->flags, NEXTHOP_FLAG_FIB))
2429 rib_uninstall (rn, rib);
2430 nexthop_delete (rib, nexthop);
2431 nexthop_free (nexthop);
2432 rib_queue_add (&zebrad, rn);
2433 }
2434 /* Unlock node. */
2435 route_unlock_node (rn);
2436 }
2437
2438 /* Add static route into static route configuration. */
2439 int
2440 static_add_ipv4 (struct prefix *p, struct in_addr *gate, const char *ifname,
2441 u_char flags, u_char distance, u_int32_t vrf_id)
2442 {
2443 u_char type = 0;
2444 struct route_node *rn;
2445 struct static_ipv4 *si;
2446 struct static_ipv4 *pp;
2447 struct static_ipv4 *cp;
2448 struct static_ipv4 *update = NULL;
2449 struct route_table *stable;
2450
2451 /* Lookup table. */
2452 stable = vrf_static_table (AFI_IP, SAFI_UNICAST, vrf_id);
2453 if (! stable)
2454 return -1;
2455
2456 /* Lookup static route prefix. */
2457 rn = route_node_get (stable, p);
2458
2459 /* Make flags. */
2460 if (gate)
2461 type = STATIC_IPV4_GATEWAY;
2462 else if (ifname)
2463 type = STATIC_IPV4_IFNAME;
2464 else
2465 type = STATIC_IPV4_BLACKHOLE;
2466
2467 /* Do nothing if there is a same static route. */
2468 for (si = rn->info; si; si = si->next)
2469 {
2470 if (type == si->type
2471 && (! gate || IPV4_ADDR_SAME (gate, &si->gate.ipv4))
2472 && (! ifname || strcmp (ifname, si->gate.ifname) == 0))
2473 {
2474 if (distance == si->distance)
2475 {
2476 route_unlock_node (rn);
2477 return 0;
2478 }
2479 else
2480 update = si;
2481 }
2482 }
2483
2484 /* Distance changed. */
2485 if (update)
2486 static_delete_ipv4 (p, gate, ifname, update->distance, vrf_id);
2487
2488 /* Make new static route structure. */
2489 si = XCALLOC (MTYPE_STATIC_IPV4, sizeof (struct static_ipv4));
2490
2491 si->type = type;
2492 si->distance = distance;
2493 si->flags = flags;
2494
2495 if (gate)
2496 si->gate.ipv4 = *gate;
2497 if (ifname)
2498 si->gate.ifname = XSTRDUP (0, ifname);
2499
2500 /* Add new static route information to the tree with sort by
2501 distance value and gateway address. */
2502 for (pp = NULL, cp = rn->info; cp; pp = cp, cp = cp->next)
2503 {
2504 if (si->distance < cp->distance)
2505 break;
2506 if (si->distance > cp->distance)
2507 continue;
2508 if (si->type == STATIC_IPV4_GATEWAY && cp->type == STATIC_IPV4_GATEWAY)
2509 {
2510 if (ntohl (si->gate.ipv4.s_addr) < ntohl (cp->gate.ipv4.s_addr))
2511 break;
2512 if (ntohl (si->gate.ipv4.s_addr) > ntohl (cp->gate.ipv4.s_addr))
2513 continue;
2514 }
2515 }
2516
2517 /* Make linked list. */
2518 if (pp)
2519 pp->next = si;
2520 else
2521 rn->info = si;
2522 if (cp)
2523 cp->prev = si;
2524 si->prev = pp;
2525 si->next = cp;
2526
2527 /* Install into rib. */
2528 static_install_ipv4 (p, si);
2529
2530 return 1;
2531 }
2532
2533 /* Delete static route from static route configuration. */
2534 int
2535 static_delete_ipv4 (struct prefix *p, struct in_addr *gate, const char *ifname,
2536 u_char distance, u_int32_t vrf_id)
2537 {
2538 u_char type = 0;
2539 struct route_node *rn;
2540 struct static_ipv4 *si;
2541 struct route_table *stable;
2542
2543 /* Lookup table. */
2544 stable = vrf_static_table (AFI_IP, SAFI_UNICAST, vrf_id);
2545 if (! stable)
2546 return -1;
2547
2548 /* Lookup static route prefix. */
2549 rn = route_node_lookup (stable, p);
2550 if (! rn)
2551 return 0;
2552
2553 /* Make flags. */
2554 if (gate)
2555 type = STATIC_IPV4_GATEWAY;
2556 else if (ifname)
2557 type = STATIC_IPV4_IFNAME;
2558 else
2559 type = STATIC_IPV4_BLACKHOLE;
2560
2561 /* Find same static route is the tree */
2562 for (si = rn->info; si; si = si->next)
2563 if (type == si->type
2564 && (! gate || IPV4_ADDR_SAME (gate, &si->gate.ipv4))
2565 && (! ifname || strcmp (ifname, si->gate.ifname) == 0))
2566 break;
2567
2568 /* Can't find static route. */
2569 if (! si)
2570 {
2571 route_unlock_node (rn);
2572 return 0;
2573 }
2574
2575 /* Install into rib. */
2576 static_uninstall_ipv4 (p, si);
2577
2578 /* Unlink static route from linked list. */
2579 if (si->prev)
2580 si->prev->next = si->next;
2581 else
2582 rn->info = si->next;
2583 if (si->next)
2584 si->next->prev = si->prev;
2585 route_unlock_node (rn);
2586
2587 /* Free static route configuration. */
2588 if (ifname)
2589 XFREE (0, si->gate.ifname);
2590 XFREE (MTYPE_STATIC_IPV4, si);
2591
2592 route_unlock_node (rn);
2593
2594 return 1;
2595 }
2596
2597 \f
2598 #ifdef HAVE_IPV6
2599 static int
2600 rib_bogus_ipv6 (int type, struct prefix_ipv6 *p,
2601 struct in6_addr *gate, unsigned int ifindex, int table)
2602 {
2603 if (type == ZEBRA_ROUTE_CONNECT && IN6_IS_ADDR_UNSPECIFIED (&p->prefix)) {
2604 #if defined (MUSICA) || defined (LINUX)
2605 /* IN6_IS_ADDR_V4COMPAT(&p->prefix) */
2606 if (p->prefixlen == 96)
2607 return 0;
2608 #endif /* MUSICA */
2609 return 1;
2610 }
2611 if (type == ZEBRA_ROUTE_KERNEL && IN6_IS_ADDR_UNSPECIFIED (&p->prefix)
2612 && p->prefixlen == 96 && gate && IN6_IS_ADDR_UNSPECIFIED (gate))
2613 {
2614 kernel_delete_ipv6_old (p, gate, ifindex, 0, table);
2615 return 1;
2616 }
2617 return 0;
2618 }
2619
2620 int
2621 rib_add_ipv6 (int type, int flags, struct prefix_ipv6 *p,
2622 struct in6_addr *gate, unsigned int ifindex, u_int32_t vrf_id,
2623 u_int32_t metric, u_char distance, safi_t safi)
2624 {
2625 struct rib *rib;
2626 struct rib *same = NULL;
2627 struct route_table *table;
2628 struct route_node *rn;
2629 struct nexthop *nexthop;
2630
2631 /* Lookup table. */
2632 table = vrf_table (AFI_IP6, safi, 0);
2633 if (! table)
2634 return 0;
2635
2636 /* Make sure mask is applied. */
2637 apply_mask_ipv6 (p);
2638
2639 /* Set default distance by route type. */
2640 if (!distance)
2641 distance = route_info[type].distance;
2642
2643 if (type == ZEBRA_ROUTE_BGP && CHECK_FLAG (flags, ZEBRA_FLAG_IBGP))
2644 distance = 200;
2645
2646 /* Filter bogus route. */
2647 if (rib_bogus_ipv6 (type, p, gate, ifindex, 0))
2648 return 0;
2649
2650 /* Lookup route node.*/
2651 rn = route_node_get (table, (struct prefix *) p);
2652
2653 /* If same type of route are installed, treat it as a implicit
2654 withdraw. */
2655 RNODE_FOREACH_RIB (rn, rib)
2656 {
2657 if (CHECK_FLAG (rib->status, RIB_ENTRY_REMOVED))
2658 continue;
2659
2660 if (rib->type != type)
2661 continue;
2662 if (rib->type != ZEBRA_ROUTE_CONNECT)
2663 {
2664 same = rib;
2665 break;
2666 }
2667 else if ((nexthop = rib->nexthop) &&
2668 nexthop->type == NEXTHOP_TYPE_IFINDEX &&
2669 nexthop->ifindex == ifindex)
2670 {
2671 rib->refcnt++;
2672 return 0;
2673 }
2674 }
2675
2676 /* Allocate new rib structure. */
2677 rib = XCALLOC (MTYPE_RIB, sizeof (struct rib));
2678
2679 rib->type = type;
2680 rib->distance = distance;
2681 rib->flags = flags;
2682 rib->metric = metric;
2683 rib->table = vrf_id;
2684 rib->nexthop_num = 0;
2685 rib->uptime = time (NULL);
2686
2687 /* Nexthop settings. */
2688 if (gate)
2689 {
2690 if (ifindex)
2691 nexthop_ipv6_ifindex_add (rib, gate, ifindex);
2692 else
2693 nexthop_ipv6_add (rib, gate);
2694 }
2695 else
2696 nexthop_ifindex_add (rib, ifindex);
2697
2698 /* If this route is kernel route, set FIB flag to the route. */
2699 if (type == ZEBRA_ROUTE_KERNEL || type == ZEBRA_ROUTE_CONNECT)
2700 for (nexthop = rib->nexthop; nexthop; nexthop = nexthop->next)
2701 SET_FLAG (nexthop->flags, NEXTHOP_FLAG_FIB);
2702
2703 /* Link new rib to node.*/
2704 rib_addnode (rn, rib);
2705 if (IS_ZEBRA_DEBUG_RIB)
2706 {
2707 zlog_debug ("%s: called rib_addnode (%p, %p) on new RIB entry",
2708 __func__, rn, rib);
2709 rib_dump (__func__, (struct prefix *) p, rib);
2710 }
2711
2712 /* Free implicit route.*/
2713 if (same)
2714 {
2715 if (IS_ZEBRA_DEBUG_RIB)
2716 {
2717 zlog_debug ("%s: calling rib_delnode (%p, %p) on existing RIB entry",
2718 __func__, rn, same);
2719 rib_dump (__func__, (struct prefix *) p, same);
2720 }
2721 rib_delnode (rn, same);
2722 }
2723
2724 route_unlock_node (rn);
2725 return 0;
2726 }
2727
2728 /* XXX factor with rib_delete_ipv6 */
2729 int
2730 rib_delete_ipv6 (int type, int flags, struct prefix_ipv6 *p,
2731 struct in6_addr *gate, unsigned int ifindex, u_int32_t vrf_id, safi_t safi)
2732 {
2733 struct route_table *table;
2734 struct route_node *rn;
2735 struct rib *rib;
2736 struct rib *fib = NULL;
2737 struct rib *same = NULL;
2738 struct nexthop *nexthop, *tnexthop;
2739 int recursing;
2740 char buf1[INET6_ADDRSTRLEN];
2741 char buf2[INET6_ADDRSTRLEN];
2742
2743 /* Apply mask. */
2744 apply_mask_ipv6 (p);
2745
2746 /* Lookup table. */
2747 table = vrf_table (AFI_IP6, safi, 0);
2748 if (! table)
2749 return 0;
2750
2751 /* Lookup route node. */
2752 rn = route_node_lookup (table, (struct prefix *) p);
2753 if (! rn)
2754 {
2755 if (IS_ZEBRA_DEBUG_KERNEL)
2756 {
2757 if (gate)
2758 zlog_debug ("route %s/%d via %s ifindex %d doesn't exist in rib",
2759 inet_ntop (AF_INET6, &p->prefix, buf1, INET6_ADDRSTRLEN),
2760 p->prefixlen,
2761 inet_ntop (AF_INET6, gate, buf2, INET6_ADDRSTRLEN),
2762 ifindex);
2763 else
2764 zlog_debug ("route %s/%d ifindex %d doesn't exist in rib",
2765 inet_ntop (AF_INET6, &p->prefix, buf1, INET6_ADDRSTRLEN),
2766 p->prefixlen,
2767 ifindex);
2768 }
2769 return ZEBRA_ERR_RTNOEXIST;
2770 }
2771
2772 /* Lookup same type route. */
2773 RNODE_FOREACH_RIB (rn, rib)
2774 {
2775 if (CHECK_FLAG(rib->status, RIB_ENTRY_REMOVED))
2776 continue;
2777
2778 if (CHECK_FLAG (rib->flags, ZEBRA_FLAG_SELECTED))
2779 fib = rib;
2780
2781 if (rib->type != type)
2782 continue;
2783 if (rib->type == ZEBRA_ROUTE_CONNECT && (nexthop = rib->nexthop) &&
2784 nexthop->type == NEXTHOP_TYPE_IFINDEX)
2785 {
2786 if (nexthop->ifindex != ifindex)
2787 continue;
2788 if (rib->refcnt)
2789 {
2790 rib->refcnt--;
2791 route_unlock_node (rn);
2792 route_unlock_node (rn);
2793 return 0;
2794 }
2795 same = rib;
2796 break;
2797 }
2798 /* Make sure that the route found has the same gateway. */
2799 else
2800 {
2801 if (gate == NULL)
2802 {
2803 same = rib;
2804 break;
2805 }
2806 for (ALL_NEXTHOPS_RO(rib->nexthop, nexthop, tnexthop, recursing))
2807 if (IPV6_ADDR_SAME (&nexthop->gate.ipv6, gate))
2808 {
2809 same = rib;
2810 break;
2811 }
2812 if (same)
2813 break;
2814 }
2815 }
2816
2817 /* If same type of route can't be found and this message is from
2818 kernel. */
2819 if (! same)
2820 {
2821 if (fib && type == ZEBRA_ROUTE_KERNEL)
2822 {
2823 /* Unset flags. */
2824 for (nexthop = fib->nexthop; nexthop; nexthop = nexthop->next)
2825 UNSET_FLAG (nexthop->flags, NEXTHOP_FLAG_FIB);
2826
2827 UNSET_FLAG (fib->flags, ZEBRA_FLAG_SELECTED);
2828 }
2829 else
2830 {
2831 if (IS_ZEBRA_DEBUG_KERNEL)
2832 {
2833 if (gate)
2834 zlog_debug ("route %s/%d via %s ifindex %d type %d doesn't exist in rib",
2835 inet_ntop (AF_INET6, &p->prefix, buf1, INET6_ADDRSTRLEN),
2836 p->prefixlen,
2837 inet_ntop (AF_INET6, gate, buf2, INET6_ADDRSTRLEN),
2838 ifindex,
2839 type);
2840 else
2841 zlog_debug ("route %s/%d ifindex %d type %d doesn't exist in rib",
2842 inet_ntop (AF_INET6, &p->prefix, buf1, INET6_ADDRSTRLEN),
2843 p->prefixlen,
2844 ifindex,
2845 type);
2846 }
2847 route_unlock_node (rn);
2848 return ZEBRA_ERR_RTNOEXIST;
2849 }
2850 }
2851
2852 if (same)
2853 rib_delnode (rn, same);
2854
2855 route_unlock_node (rn);
2856 return 0;
2857 }
2858 \f
2859 /* Install static route into rib. */
2860 static void
2861 static_install_ipv6 (struct prefix *p, struct static_ipv6 *si)
2862 {
2863 struct rib *rib;
2864 struct route_table *table;
2865 struct route_node *rn;
2866
2867 /* Lookup table. */
2868 table = vrf_table (AFI_IP6, SAFI_UNICAST, 0);
2869 if (! table)
2870 return;
2871
2872 /* Lookup existing route */
2873 rn = route_node_get (table, p);
2874 RNODE_FOREACH_RIB (rn, rib)
2875 {
2876 if (CHECK_FLAG(rib->status, RIB_ENTRY_REMOVED))
2877 continue;
2878
2879 if (rib->type == ZEBRA_ROUTE_STATIC && rib->distance == si->distance)
2880 break;
2881 }
2882
2883 if (rib)
2884 {
2885 /* Same distance static route is there. Update it with new
2886 nexthop. */
2887 route_unlock_node (rn);
2888
2889 switch (si->type)
2890 {
2891 case STATIC_IPV6_GATEWAY:
2892 nexthop_ipv6_add (rib, &si->ipv6);
2893 break;
2894 case STATIC_IPV6_IFNAME:
2895 nexthop_ifname_add (rib, si->ifname);
2896 break;
2897 case STATIC_IPV6_GATEWAY_IFNAME:
2898 nexthop_ipv6_ifname_add (rib, &si->ipv6, si->ifname);
2899 break;
2900 }
2901 rib_queue_add (&zebrad, rn);
2902 }
2903 else
2904 {
2905 /* This is new static route. */
2906 rib = XCALLOC (MTYPE_RIB, sizeof (struct rib));
2907
2908 rib->type = ZEBRA_ROUTE_STATIC;
2909 rib->distance = si->distance;
2910 rib->metric = 0;
2911 rib->nexthop_num = 0;
2912
2913 switch (si->type)
2914 {
2915 case STATIC_IPV6_GATEWAY:
2916 nexthop_ipv6_add (rib, &si->ipv6);
2917 break;
2918 case STATIC_IPV6_IFNAME:
2919 nexthop_ifname_add (rib, si->ifname);
2920 break;
2921 case STATIC_IPV6_GATEWAY_IFNAME:
2922 nexthop_ipv6_ifname_add (rib, &si->ipv6, si->ifname);
2923 break;
2924 }
2925
2926 /* Save the flags of this static routes (reject, blackhole) */
2927 rib->flags = si->flags;
2928
2929 /* Link this rib to the tree. */
2930 rib_addnode (rn, rib);
2931 }
2932 }
2933
2934 static int
2935 static_ipv6_nexthop_same (struct nexthop *nexthop, struct static_ipv6 *si)
2936 {
2937 if (nexthop->type == NEXTHOP_TYPE_IPV6
2938 && si->type == STATIC_IPV6_GATEWAY
2939 && IPV6_ADDR_SAME (&nexthop->gate.ipv6, &si->ipv6))
2940 return 1;
2941 if (nexthop->type == NEXTHOP_TYPE_IFNAME
2942 && si->type == STATIC_IPV6_IFNAME
2943 && strcmp (nexthop->ifname, si->ifname) == 0)
2944 return 1;
2945 if (nexthop->type == NEXTHOP_TYPE_IPV6_IFNAME
2946 && si->type == STATIC_IPV6_GATEWAY_IFNAME
2947 && IPV6_ADDR_SAME (&nexthop->gate.ipv6, &si->ipv6)
2948 && strcmp (nexthop->ifname, si->ifname) == 0)
2949 return 1;
2950 return 0;
2951 }
2952
2953 static void
2954 static_uninstall_ipv6 (struct prefix *p, struct static_ipv6 *si)
2955 {
2956 struct route_table *table;
2957 struct route_node *rn;
2958 struct rib *rib;
2959 struct nexthop *nexthop;
2960
2961 /* Lookup table. */
2962 table = vrf_table (AFI_IP6, SAFI_UNICAST, 0);
2963 if (! table)
2964 return;
2965
2966 /* Lookup existing route with type and distance. */
2967 rn = route_node_lookup (table, (struct prefix *) p);
2968 if (! rn)
2969 return;
2970
2971 RNODE_FOREACH_RIB (rn, rib)
2972 {
2973 if (CHECK_FLAG (rib->status, RIB_ENTRY_REMOVED))
2974 continue;
2975
2976 if (rib->type == ZEBRA_ROUTE_STATIC && rib->distance == si->distance)
2977 break;
2978 }
2979
2980 if (! rib)
2981 {
2982 route_unlock_node (rn);
2983 return;
2984 }
2985
2986 /* Lookup nexthop. */
2987 for (nexthop = rib->nexthop; nexthop; nexthop = nexthop->next)
2988 if (static_ipv6_nexthop_same (nexthop, si))
2989 break;
2990
2991 /* Can't find nexthop. */
2992 if (! nexthop)
2993 {
2994 route_unlock_node (rn);
2995 return;
2996 }
2997
2998 /* Check nexthop. */
2999 if (rib->nexthop_num == 1)
3000 {
3001 rib_delnode (rn, rib);
3002 }
3003 else
3004 {
3005 if (CHECK_FLAG (nexthop->flags, NEXTHOP_FLAG_FIB))
3006 rib_uninstall (rn, rib);
3007 nexthop_delete (rib, nexthop);
3008 nexthop_free (nexthop);
3009 rib_queue_add (&zebrad, rn);
3010 }
3011 /* Unlock node. */
3012 route_unlock_node (rn);
3013 }
3014
3015 /* Add static route into static route configuration. */
3016 int
3017 static_add_ipv6 (struct prefix *p, u_char type, struct in6_addr *gate,
3018 const char *ifname, u_char flags, u_char distance,
3019 u_int32_t vrf_id)
3020 {
3021 struct route_node *rn;
3022 struct static_ipv6 *si;
3023 struct static_ipv6 *pp;
3024 struct static_ipv6 *cp;
3025 struct route_table *stable;
3026
3027 /* Lookup table. */
3028 stable = vrf_static_table (AFI_IP6, SAFI_UNICAST, vrf_id);
3029 if (! stable)
3030 return -1;
3031
3032 if (!gate &&
3033 (type == STATIC_IPV6_GATEWAY || type == STATIC_IPV6_GATEWAY_IFNAME))
3034 return -1;
3035
3036 if (!ifname &&
3037 (type == STATIC_IPV6_GATEWAY_IFNAME || type == STATIC_IPV6_IFNAME))
3038 return -1;
3039
3040 /* Lookup static route prefix. */
3041 rn = route_node_get (stable, p);
3042
3043 /* Do nothing if there is a same static route. */
3044 for (si = rn->info; si; si = si->next)
3045 {
3046 if (distance == si->distance
3047 && type == si->type
3048 && (! gate || IPV6_ADDR_SAME (gate, &si->ipv6))
3049 && (! ifname || strcmp (ifname, si->ifname) == 0))
3050 {
3051 route_unlock_node (rn);
3052 return 0;
3053 }
3054 }
3055
3056 /* Make new static route structure. */
3057 si = XCALLOC (MTYPE_STATIC_IPV6, sizeof (struct static_ipv6));
3058
3059 si->type = type;
3060 si->distance = distance;
3061 si->flags = flags;
3062
3063 switch (type)
3064 {
3065 case STATIC_IPV6_GATEWAY:
3066 si->ipv6 = *gate;
3067 break;
3068 case STATIC_IPV6_IFNAME:
3069 si->ifname = XSTRDUP (0, ifname);
3070 break;
3071 case STATIC_IPV6_GATEWAY_IFNAME:
3072 si->ipv6 = *gate;
3073 si->ifname = XSTRDUP (0, ifname);
3074 break;
3075 }
3076
3077 /* Add new static route information to the tree with sort by
3078 distance value and gateway address. */
3079 for (pp = NULL, cp = rn->info; cp; pp = cp, cp = cp->next)
3080 {
3081 if (si->distance < cp->distance)
3082 break;
3083 if (si->distance > cp->distance)
3084 continue;
3085 }
3086
3087 /* Make linked list. */
3088 if (pp)
3089 pp->next = si;
3090 else
3091 rn->info = si;
3092 if (cp)
3093 cp->prev = si;
3094 si->prev = pp;
3095 si->next = cp;
3096
3097 /* Install into rib. */
3098 static_install_ipv6 (p, si);
3099
3100 return 1;
3101 }
3102
3103 /* Delete static route from static route configuration. */
3104 int
3105 static_delete_ipv6 (struct prefix *p, u_char type, struct in6_addr *gate,
3106 const char *ifname, u_char distance, u_int32_t vrf_id)
3107 {
3108 struct route_node *rn;
3109 struct static_ipv6 *si;
3110 struct route_table *stable;
3111
3112 /* Lookup table. */
3113 stable = vrf_static_table (AFI_IP6, SAFI_UNICAST, vrf_id);
3114 if (! stable)
3115 return -1;
3116
3117 /* Lookup static route prefix. */
3118 rn = route_node_lookup (stable, p);
3119 if (! rn)
3120 return 0;
3121
3122 /* Find same static route is the tree */
3123 for (si = rn->info; si; si = si->next)
3124 if (distance == si->distance
3125 && type == si->type
3126 && (! gate || IPV6_ADDR_SAME (gate, &si->ipv6))
3127 && (! ifname || strcmp (ifname, si->ifname) == 0))
3128 break;
3129
3130 /* Can't find static route. */
3131 if (! si)
3132 {
3133 route_unlock_node (rn);
3134 return 0;
3135 }
3136
3137 /* Install into rib. */
3138 static_uninstall_ipv6 (p, si);
3139
3140 /* Unlink static route from linked list. */
3141 if (si->prev)
3142 si->prev->next = si->next;
3143 else
3144 rn->info = si->next;
3145 if (si->next)
3146 si->next->prev = si->prev;
3147
3148 /* Free static route configuration. */
3149 if (ifname)
3150 XFREE (0, si->ifname);
3151 XFREE (MTYPE_STATIC_IPV6, si);
3152
3153 return 1;
3154 }
3155 #endif /* HAVE_IPV6 */
3156 \f
3157 /* RIB update function. */
3158 void
3159 rib_update (void)
3160 {
3161 struct route_node *rn;
3162 struct route_table *table;
3163
3164 table = vrf_table (AFI_IP, SAFI_UNICAST, 0);
3165 if (table)
3166 for (rn = route_top (table); rn; rn = route_next (rn))
3167 if (rnode_to_ribs (rn))
3168 rib_queue_add (&zebrad, rn);
3169
3170 table = vrf_table (AFI_IP6, SAFI_UNICAST, 0);
3171 if (table)
3172 for (rn = route_top (table); rn; rn = route_next (rn))
3173 if (rnode_to_ribs (rn))
3174 rib_queue_add (&zebrad, rn);
3175 }
3176
3177 \f
3178 /* Remove all routes which comes from non main table. */
3179 static void
3180 rib_weed_table (struct route_table *table)
3181 {
3182 struct route_node *rn;
3183 struct rib *rib;
3184 struct rib *next;
3185
3186 if (table)
3187 for (rn = route_top (table); rn; rn = route_next (rn))
3188 RNODE_FOREACH_RIB_SAFE (rn, rib, next)
3189 {
3190 if (CHECK_FLAG (rib->status, RIB_ENTRY_REMOVED))
3191 continue;
3192
3193 if (rib->table != zebrad.rtm_table_default &&
3194 rib->table != RT_TABLE_MAIN)
3195 rib_delnode (rn, rib);
3196 }
3197 }
3198
3199 /* Delete all routes from non main table. */
3200 void
3201 rib_weed_tables (void)
3202 {
3203 rib_weed_table (vrf_table (AFI_IP, SAFI_UNICAST, 0));
3204 rib_weed_table (vrf_table (AFI_IP6, SAFI_UNICAST, 0));
3205 }
3206 \f
3207 /* Delete self installed routes after zebra is relaunched. */
3208 static void
3209 rib_sweep_table (struct route_table *table)
3210 {
3211 struct route_node *rn;
3212 struct rib *rib;
3213 struct rib *next;
3214 int ret = 0;
3215
3216 if (table)
3217 for (rn = route_top (table); rn; rn = route_next (rn))
3218 RNODE_FOREACH_RIB_SAFE (rn, rib, next)
3219 {
3220 if (CHECK_FLAG (rib->status, RIB_ENTRY_REMOVED))
3221 continue;
3222
3223 if (rib->type == ZEBRA_ROUTE_KERNEL &&
3224 CHECK_FLAG (rib->flags, ZEBRA_FLAG_SELFROUTE))
3225 {
3226 ret = rib_uninstall_kernel (rn, rib);
3227 if (! ret)
3228 rib_delnode (rn, rib);
3229 }
3230 }
3231 }
3232
3233 /* Sweep all RIB tables. */
3234 void
3235 rib_sweep_route (void)
3236 {
3237 rib_sweep_table (vrf_table (AFI_IP, SAFI_UNICAST, 0));
3238 rib_sweep_table (vrf_table (AFI_IP6, SAFI_UNICAST, 0));
3239 }
3240
3241 /* Remove specific by protocol routes from 'table'. */
3242 static unsigned long
3243 rib_score_proto_table (u_char proto, struct route_table *table)
3244 {
3245 struct route_node *rn;
3246 struct rib *rib;
3247 struct rib *next;
3248 unsigned long n = 0;
3249
3250 if (table)
3251 for (rn = route_top (table); rn; rn = route_next (rn))
3252 RNODE_FOREACH_RIB_SAFE (rn, rib, next)
3253 {
3254 if (CHECK_FLAG (rib->status, RIB_ENTRY_REMOVED))
3255 continue;
3256 if (rib->type == proto)
3257 {
3258 rib_delnode (rn, rib);
3259 n++;
3260 }
3261 }
3262
3263 return n;
3264 }
3265
3266 /* Remove specific by protocol routes. */
3267 unsigned long
3268 rib_score_proto (u_char proto)
3269 {
3270 return rib_score_proto_table (proto, vrf_table (AFI_IP, SAFI_UNICAST, 0))
3271 +rib_score_proto_table (proto, vrf_table (AFI_IP6, SAFI_UNICAST, 0));
3272 }
3273
3274 /* Close RIB and clean up kernel routes. */
3275 static void
3276 rib_close_table (struct route_table *table)
3277 {
3278 struct route_node *rn;
3279 struct rib *rib;
3280
3281 if (table)
3282 for (rn = route_top (table); rn; rn = route_next (rn))
3283 RNODE_FOREACH_RIB (rn, rib)
3284 {
3285 if (!CHECK_FLAG (rib->flags, ZEBRA_FLAG_SELECTED))
3286 continue;
3287
3288 zfpm_trigger_update (rn, NULL);
3289
3290 if (! RIB_SYSTEM_ROUTE (rib))
3291 rib_uninstall_kernel (rn, rib);
3292 }
3293 }
3294
3295 /* Close all RIB tables. */
3296 void
3297 rib_close (void)
3298 {
3299 rib_close_table (vrf_table (AFI_IP, SAFI_UNICAST, 0));
3300 rib_close_table (vrf_table (AFI_IP6, SAFI_UNICAST, 0));
3301 }
3302 \f
3303 /* Routing information base initialize. */
3304 void
3305 rib_init (void)
3306 {
3307 rib_queue_init (&zebrad);
3308 /* VRF initialization. */
3309 vrf_init ();
3310 }
3311
3312 /*
3313 * vrf_id_get_next
3314 *
3315 * Get the first vrf id that is greater than the given vrf id if any.
3316 *
3317 * Returns TRUE if a vrf id was found, FALSE otherwise.
3318 */
3319 static inline int
3320 vrf_id_get_next (uint32_t id, uint32_t *next_id_p)
3321 {
3322 while (++id < vector_active (vrf_vector))
3323 {
3324 if (vrf_lookup (id))
3325 {
3326 *next_id_p = id;
3327 return 1;
3328 }
3329 }
3330
3331 return 0;
3332 }
3333
3334 /*
3335 * rib_tables_iter_next
3336 *
3337 * Returns the next table in the iteration.
3338 */
3339 struct route_table *
3340 rib_tables_iter_next (rib_tables_iter_t *iter)
3341 {
3342 struct route_table *table;
3343
3344 /*
3345 * Array that helps us go over all AFI/SAFI combinations via one
3346 * index.
3347 */
3348 static struct {
3349 afi_t afi;
3350 safi_t safi;
3351 } afi_safis[] = {
3352 { AFI_IP, SAFI_UNICAST },
3353 { AFI_IP, SAFI_MULTICAST },
3354 { AFI_IP6, SAFI_UNICAST },
3355 { AFI_IP6, SAFI_MULTICAST },
3356 };
3357
3358 table = NULL;
3359
3360 switch (iter->state)
3361 {
3362
3363 case RIB_TABLES_ITER_S_INIT:
3364 iter->vrf_id = 0;
3365 iter->afi_safi_ix = -1;
3366
3367 /* Fall through */
3368
3369 case RIB_TABLES_ITER_S_ITERATING:
3370 iter->afi_safi_ix++;
3371 while (1)
3372 {
3373
3374 while (iter->afi_safi_ix < (int) ZEBRA_NUM_OF (afi_safis))
3375 {
3376 table = vrf_table (afi_safis[iter->afi_safi_ix].afi,
3377 afi_safis[iter->afi_safi_ix].safi,
3378 iter->vrf_id);
3379 if (table)
3380 break;
3381
3382 iter->afi_safi_ix++;
3383 }
3384
3385 /*
3386 * Found another table in this vrf.
3387 */
3388 if (table)
3389 break;
3390
3391 /*
3392 * Done with all tables in the current vrf, go to the next
3393 * one.
3394 */
3395 if (!vrf_id_get_next (iter->vrf_id, &iter->vrf_id))
3396 break;
3397
3398 iter->afi_safi_ix = 0;
3399 }
3400
3401 break;
3402
3403 case RIB_TABLES_ITER_S_DONE:
3404 return NULL;
3405 }
3406
3407 if (table)
3408 iter->state = RIB_TABLES_ITER_S_ITERATING;
3409 else
3410 iter->state = RIB_TABLES_ITER_S_DONE;
3411
3412 return table;
3413 }