2 * Kernel routing table updates by routing socket.
3 * Copyright (C) 1997, 98 Kunihiro Ishiguro
5 * This file is part of GNU Zebra.
7 * GNU Zebra is free software; you can redistribute it and/or modify it
8 * under the terms of the GNU General Public License as published by the
9 * Free Software Foundation; either version 2, or (at your option) any
12 * GNU Zebra is distributed in the hope that it will be useful, but
13 * WITHOUT ANY WARRANTY; without even the implied warranty of
14 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
15 * General Public License for more details.
17 * You should have received a copy of the GNU General Public License along
18 * with this program; see the file COPYING; if not, write to the Free Software
19 * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA
27 #include <netmpls/mpls.h>
32 #include "sockunion.h"
36 #include "lib_errors.h"
38 #include "zebra/debug.h"
39 #include "zebra/rib.h"
41 #include "zebra/kernel_socket.h"
42 #include "zebra/zebra_mpls.h"
43 #include "zebra/zebra_errors.h"
45 extern struct zebra_privs_t zserv_privs
;
47 #ifdef HAVE_STRUCT_SOCKADDR_IN_SIN_LEN
48 /* Adjust netmask socket length. Return value is an adjusted sin_len
50 static int sin_masklen(struct in_addr mask
)
54 struct sockaddr_in sin
;
60 len
= sizeof(struct sockaddr_in
);
62 lim
= (char *)&sin
.sin_addr
;
63 p
= lim
+ sizeof(sin
.sin_addr
);
65 while (*--p
== 0 && p
>= lim
)
69 #endif /* HAVE_STRUCT_SOCKADDR_IN_SIN_LEN */
72 static int kernel_rtm_add_labels(struct mpls_label_stack
*nh_label
,
73 struct sockaddr_mpls
*smpls
)
75 if (nh_label
->num_labels
> 1) {
76 flog_warn(EC_ZEBRA_MAX_LABELS_PUSH
,
77 "%s: can't push %u labels at "
78 "once (maximum is 1)",
79 __func__
, nh_label
->num_labels
);
83 memset(smpls
, 0, sizeof(*smpls
));
84 smpls
->smpls_len
= sizeof(*smpls
);
85 smpls
->smpls_family
= AF_MPLS
;
86 smpls
->smpls_label
= htonl(nh_label
->label
[0] << MPLS_LABEL_OFFSET
);
92 /* Interface between zebra message and rtm message. */
93 static int kernel_rtm_ipv4(int cmd
, const struct prefix
*p
,
94 const struct nexthop_group
*ng
, uint32_t metric
)
97 struct sockaddr_in
*mask
= NULL
;
98 struct sockaddr_in sin_dest
, sin_mask
, sin_gate
;
100 struct sockaddr_mpls smpls
;
102 union sockunion
*smplsp
= NULL
;
103 struct nexthop
*nexthop
;
105 ifindex_t ifindex
= 0;
108 char prefix_buf
[PREFIX_STRLEN
];
109 enum blackhole_type bh_type
= BLACKHOLE_UNSPEC
;
111 if (IS_ZEBRA_DEBUG_RIB
)
112 prefix2str(p
, prefix_buf
, sizeof(prefix_buf
));
113 memset(&sin_dest
, 0, sizeof(struct sockaddr_in
));
114 sin_dest
.sin_family
= AF_INET
;
115 #ifdef HAVE_STRUCT_SOCKADDR_IN_SIN_LEN
116 sin_dest
.sin_len
= sizeof(struct sockaddr_in
);
117 #endif /* HAVE_STRUCT_SOCKADDR_IN_SIN_LEN */
118 sin_dest
.sin_addr
= p
->u
.prefix4
;
120 memset(&sin_mask
, 0, sizeof(struct sockaddr_in
));
122 memset(&sin_gate
, 0, sizeof(struct sockaddr_in
));
123 sin_gate
.sin_family
= AF_INET
;
124 #ifdef HAVE_STRUCT_SOCKADDR_IN_SIN_LEN
125 sin_gate
.sin_len
= sizeof(struct sockaddr_in
);
126 #endif /* HAVE_STRUCT_SOCKADDR_IN_SIN_LEN */
129 for (ALL_NEXTHOPS_PTR(ng
, nexthop
)) {
130 if (CHECK_FLAG(nexthop
->flags
, NEXTHOP_FLAG_RECURSIVE
))
134 char gate_buf
[INET_ADDRSTRLEN
] = "NULL";
137 * XXX We need to refrain from kernel operations in some cases,
138 * but this if statement seems overly cautious - what about
139 * commands other than ADD and DELETE?
141 if ((cmd
== RTM_ADD
&& NEXTHOP_IS_ACTIVE(nexthop
->flags
))
142 || (cmd
== RTM_DELETE
)) {
143 if (nexthop
->type
== NEXTHOP_TYPE_IPV4
144 || nexthop
->type
== NEXTHOP_TYPE_IPV4_IFINDEX
) {
145 sin_gate
.sin_addr
= nexthop
->gate
.ipv4
;
148 if (nexthop
->type
== NEXTHOP_TYPE_IFINDEX
149 || nexthop
->type
== NEXTHOP_TYPE_IPV4_IFINDEX
)
150 ifindex
= nexthop
->ifindex
;
151 if (nexthop
->type
== NEXTHOP_TYPE_BLACKHOLE
) {
152 struct in_addr loopback
;
153 loopback
.s_addr
= htonl(INADDR_LOOPBACK
);
154 sin_gate
.sin_addr
= loopback
;
155 bh_type
= nexthop
->bh_type
;
159 if (gate
&& p
->prefixlen
== 32)
162 masklen2ip(p
->prefixlen
, &sin_mask
.sin_addr
);
163 sin_mask
.sin_family
= AF_INET
;
164 #ifdef HAVE_STRUCT_SOCKADDR_IN_SIN_LEN
166 sin_masklen(sin_mask
.sin_addr
);
167 #endif /* HAVE_STRUCT_SOCKADDR_IN_SIN_LEN */
172 if (nexthop
->nh_label
173 && !kernel_rtm_add_labels(nexthop
->nh_label
,
176 smplsp
= (union sockunion
*)&smpls
;
179 error
= rtm_write(cmd
, (union sockunion
*)&sin_dest
,
180 (union sockunion
*)mask
,
181 gate
? (union sockunion
*)&sin_gate
183 smplsp
, ifindex
, bh_type
, metric
);
185 if (IS_ZEBRA_DEBUG_KERNEL
) {
188 "%s: %s: attention! gate not found for re",
189 __func__
, prefix_buf
);
191 inet_ntop(AF_INET
, &sin_gate
.sin_addr
,
192 gate_buf
, INET_ADDRSTRLEN
);
196 /* We only flag nexthops as being in FIB if rtm_write()
198 case ZEBRA_ERR_NOERROR
:
200 if (IS_ZEBRA_DEBUG_KERNEL
)
202 "%s: %s: successfully did NH %s",
203 __func__
, prefix_buf
, gate_buf
);
206 SET_FLAG(nexthop
->flags
,
211 /* The only valid case for this error is kernel's
213 * a multipath route, which is common for FreeBSD. This
215 * ignored silently, but logged as an error otherwise.
217 case ZEBRA_ERR_RTEXIST
:
221 "%s: rtm_write() returned %d for command %d",
222 __func__
, error
, cmd
);
225 /* Note any unexpected status returns */
229 "%s: %s: rtm_write() unexpectedly returned %d for command %s",
231 prefix2str(p
, prefix_buf
,
234 lookup_msg(rtm_type_str
, cmd
, NULL
));
237 } /* if (cmd and flags make sense) */
238 else if (IS_ZEBRA_DEBUG_KERNEL
)
239 zlog_debug("%s: odd command %s for flags %d", __func__
,
240 lookup_msg(rtm_type_str
, cmd
, NULL
),
242 } /* for (ALL_NEXTHOPS(...))*/
244 /* If there was no useful nexthop, then complain. */
245 if (nexthop_num
== 0) {
246 if (IS_ZEBRA_DEBUG_KERNEL
)
247 zlog_debug("%s: No useful nexthops were found in RIB prefix %s",
248 __func__
, prefix2str(p
, prefix_buf
,
249 sizeof(prefix_buf
)));
257 /* Calculate the sin6_len value for a netmask socket address. */
258 static int sin6_masklen(struct in6_addr mask
)
260 struct sockaddr_in6 sin6
;
264 if (IN6_IS_ADDR_UNSPECIFIED(&mask
))
267 sin6
.sin6_addr
= mask
;
268 len
= sizeof(struct sockaddr_in6
);
270 lim
= (char *)&sin6
.sin6_addr
;
271 p
= lim
+ sizeof(sin6
.sin6_addr
);
273 while (*--p
== 0 && p
>= lim
)
278 #endif /* SIN6_LEN */
280 /* Interface between zebra message and rtm message. */
281 static int kernel_rtm_ipv6(int cmd
, const struct prefix
*p
,
282 const struct nexthop_group
*ng
, uint32_t metric
)
284 struct sockaddr_in6
*mask
;
285 struct sockaddr_in6 sin_dest
, sin_mask
, sin_gate
;
287 struct sockaddr_mpls smpls
;
289 union sockunion
*smplsp
= NULL
;
290 struct nexthop
*nexthop
;
292 ifindex_t ifindex
= 0;
295 enum blackhole_type bh_type
= BLACKHOLE_UNSPEC
;
297 memset(&sin_dest
, 0, sizeof(struct sockaddr_in6
));
298 sin_dest
.sin6_family
= AF_INET6
;
300 sin_dest
.sin6_len
= sizeof(struct sockaddr_in6
);
301 #endif /* SIN6_LEN */
302 sin_dest
.sin6_addr
= p
->u
.prefix6
;
304 memset(&sin_mask
, 0, sizeof(struct sockaddr_in6
));
306 memset(&sin_gate
, 0, sizeof(struct sockaddr_in6
));
307 sin_gate
.sin6_family
= AF_INET6
;
308 #ifdef HAVE_STRUCT_SOCKADDR_IN_SIN_LEN
309 sin_gate
.sin6_len
= sizeof(struct sockaddr_in6
);
310 #endif /* HAVE_STRUCT_SOCKADDR_IN_SIN_LEN */
313 for (ALL_NEXTHOPS_PTR(ng
, nexthop
)) {
314 if (CHECK_FLAG(nexthop
->flags
, NEXTHOP_FLAG_RECURSIVE
))
319 if ((cmd
== RTM_ADD
&& NEXTHOP_IS_ACTIVE(nexthop
->flags
))
320 || (cmd
== RTM_DELETE
)) {
321 if (nexthop
->type
== NEXTHOP_TYPE_IPV6
322 || nexthop
->type
== NEXTHOP_TYPE_IPV6_IFINDEX
) {
323 sin_gate
.sin6_addr
= nexthop
->gate
.ipv6
;
326 if (nexthop
->type
== NEXTHOP_TYPE_IFINDEX
327 || nexthop
->type
== NEXTHOP_TYPE_IPV6_IFINDEX
)
328 ifindex
= nexthop
->ifindex
;
330 if (nexthop
->type
== NEXTHOP_TYPE_BLACKHOLE
)
331 bh_type
= nexthop
->bh_type
;
334 /* Under kame set interface index to link local address. */
337 #define SET_IN6_LINKLOCAL_IFINDEX(a, i) \
339 (a).s6_addr[2] = ((i) >> 8) & 0xff; \
340 (a).s6_addr[3] = (i)&0xff; \
343 if (gate
&& IN6_IS_ADDR_LINKLOCAL(&sin_gate
.sin6_addr
))
344 SET_IN6_LINKLOCAL_IFINDEX(sin_gate
.sin6_addr
, ifindex
);
347 if (gate
&& p
->prefixlen
== 128)
350 masklen2ip6(p
->prefixlen
, &sin_mask
.sin6_addr
);
351 sin_mask
.sin6_family
= AF_INET6
;
353 sin_mask
.sin6_len
= sin6_masklen(sin_mask
.sin6_addr
);
354 #endif /* SIN6_LEN */
359 if (nexthop
->nh_label
360 && !kernel_rtm_add_labels(nexthop
->nh_label
, &smpls
))
362 smplsp
= (union sockunion
*)&smpls
;
365 error
= rtm_write(cmd
, (union sockunion
*)&sin_dest
,
366 (union sockunion
*)mask
,
367 gate
? (union sockunion
*)&sin_gate
: NULL
,
368 smplsp
, ifindex
, bh_type
, metric
);
370 /* Update installed nexthop info on success */
371 if ((cmd
== RTM_ADD
) && (error
== ZEBRA_ERR_NOERROR
))
372 SET_FLAG(nexthop
->flags
, NEXTHOP_FLAG_FIB
);
377 /* If there is no useful nexthop then return. */
378 if (nexthop_num
== 0) {
379 if (IS_ZEBRA_DEBUG_KERNEL
)
380 zlog_debug("kernel_rtm_ipv6(): No useful nexthop.");
387 static int kernel_rtm(int cmd
, const struct prefix
*p
,
388 const struct nexthop_group
*ng
, uint32_t metric
)
390 switch (PREFIX_FAMILY(p
)) {
392 return kernel_rtm_ipv4(cmd
, p
, ng
, metric
);
394 return kernel_rtm_ipv6(cmd
, p
, ng
, metric
);
400 * Update or delete a prefix from the kernel,
401 * using info from a dataplane context struct.
403 enum zebra_dplane_result
kernel_route_update(struct zebra_dplane_ctx
*ctx
)
405 enum zebra_dplane_result res
= ZEBRA_DPLANE_REQUEST_SUCCESS
;
407 if (dplane_ctx_get_src(ctx
) != NULL
) {
408 zlog_err("route add: IPv6 sourcedest routes unsupported!");
409 res
= ZEBRA_DPLANE_REQUEST_FAILURE
;
413 frr_elevate_privs(ZPRIVS_RAISE
) {
415 if (dplane_ctx_get_op(ctx
) == DPLANE_OP_ROUTE_DELETE
)
416 kernel_rtm(RTM_DELETE
, dplane_ctx_get_dest(ctx
),
417 dplane_ctx_get_ng(ctx
),
418 dplane_ctx_get_metric(ctx
));
419 else if (dplane_ctx_get_op(ctx
) == DPLANE_OP_ROUTE_INSTALL
)
420 kernel_rtm(RTM_ADD
, dplane_ctx_get_dest(ctx
),
421 dplane_ctx_get_ng(ctx
),
422 dplane_ctx_get_metric(ctx
));
423 else if (dplane_ctx_get_op(ctx
) == DPLANE_OP_ROUTE_UPDATE
) {
424 /* Must do delete and add separately -
425 * no update available
427 kernel_rtm(RTM_DELETE
, dplane_ctx_get_dest(ctx
),
428 dplane_ctx_get_old_ng(ctx
),
429 dplane_ctx_get_old_metric(ctx
));
431 kernel_rtm(RTM_ADD
, dplane_ctx_get_dest(ctx
),
432 dplane_ctx_get_ng(ctx
),
433 dplane_ctx_get_metric(ctx
));
435 zlog_err("Invalid routing socket update op %s (%u)",
436 dplane_op2str(dplane_ctx_get_op(ctx
)),
437 dplane_ctx_get_op(ctx
));
438 res
= ZEBRA_DPLANE_REQUEST_FAILURE
;
440 } /* Elevated privs */
447 int kernel_neigh_update(int add
, int ifindex
, uint32_t addr
, char *lla
,
448 int llalen
, ns_id_t ns_id
)
454 extern int kernel_get_ipmr_sg_stats(struct zebra_vrf
*zvrf
, void *mroute
)
459 int kernel_add_vtep(vni_t vni
, struct interface
*ifp
, struct in_addr
*vtep_ip
)
464 int kernel_del_vtep(vni_t vni
, struct interface
*ifp
, struct in_addr
*vtep_ip
)
469 int kernel_add_mac(struct interface
*ifp
, vlanid_t vid
, struct ethaddr
*mac
,
470 struct in_addr vtep_ip
, bool sticky
)
475 int kernel_del_mac(struct interface
*ifp
, vlanid_t vid
, struct ethaddr
*mac
,
476 struct in_addr vtep_ip
)
481 int kernel_add_neigh(struct interface
*ifp
, struct ipaddr
*ip
,
482 struct ethaddr
*mac
, uint8_t flags
)
487 int kernel_del_neigh(struct interface
*ifp
, struct ipaddr
*ip
)
492 extern int kernel_interface_set_master(struct interface
*master
,
493 struct interface
*slave
)
498 uint32_t kernel_get_speed(struct interface
*ifp
)
503 #endif /* !HAVE_NETLINK */