2 * Code for encoding/decoding FPM messages that are in netlink format.
4 * Copyright (C) 1997, 98, 99 Kunihiro Ishiguro
5 * Copyright (C) 2012 by Open Source Routing.
6 * Copyright (C) 2012 by Internet Systems Consortium, Inc. ("ISC")
8 * This file is part of GNU Zebra.
10 * GNU Zebra is free software; you can redistribute it and/or modify it
11 * under the terms of the GNU General Public License as published by the
12 * Free Software Foundation; either version 2, or (at your option) any
15 * GNU Zebra is distributed in the hope that it will be useful, but
16 * WITHOUT ANY WARRANTY; without even the implied warranty of
17 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
18 * General Public License for more details.
20 * You should have received a copy of the GNU General Public License along
21 * with this program; see the file COPYING; if not, write to the Free Software
22 * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA
34 #include "zebra/zserv.h"
35 #include "zebra/zebra_router.h"
36 #include "zebra/zebra_dplane.h"
37 #include "zebra/zebra_ns.h"
38 #include "zebra/zebra_vrf.h"
39 #include "zebra/kernel_netlink.h"
40 #include "zebra/rt_netlink.h"
43 #include "zebra/zebra_fpm_private.h"
44 #include "zebra/zebra_vxlan_private.h"
49 * The size of an address in a given address family.
/*
 * Returns, as a size_t, the size of an address in address family `af`.
 * NOTE(review): only the signature is visible here; which families are
 * handled and what is returned for an unknown family could not be checked.
 */
51 static size_t af_addr_size(uint8_t af
)
66 * We plan to use RTA_ENCAP_TYPE attribute for VxLAN encap as well.
67 * Currently, values 0 to 8 for this attribute are used by lwtunnel_encap_types
68 * So, we cannot use these values for VxLAN encap.
/*
 * Encapsulation type of a nexthop as sent in the RTA_ENCAP_TYPE attribute.
 * FPM_NH_ENCAP_VXLAN is pinned to 100 so that it does not collide with the
 * values 0 to 8 already used by lwtunnel_encap_types.
 */
70 enum fpm_nh_encap_type_t
{
71 FPM_NH_ENCAP_NONE
= 0,
72 FPM_NH_ENCAP_VXLAN
= 100,
77 * fpm_nh_encap_type_to_str
/*
 * Maps an fpm_nh_encap_type_t value to a constant string. The switch has
 * one case for each of NONE, VXLAN and MAX.
 * NOTE(review): the strings returned by each case are not visible here.
 */
79 static const char *fpm_nh_encap_type_to_str(enum fpm_nh_encap_type_t encap_type
)
82 case FPM_NH_ENCAP_NONE
:
85 case FPM_NH_ENCAP_VXLAN
:
88 case FPM_NH_ENCAP_MAX
:
/*
 * VxLAN-specific encapsulation data for a nexthop. Code in this file reads
 * and writes a `vni` member through `encap_info.vxlan_encap.vni`.
 * NOTE(review): the member declarations are not visible here.
 */
95 struct vxlan_encap_info_t
{
/*
 * Attribute types used inside the nested RTA_ENCAP attribute for VxLAN.
 * NOTE(review): presumably declares VXLAN_VNI, which the encoder uses as
 * the nested attribute type -- the enumerators are not visible here.
 */
99 enum vxlan_encap_info_type_t
{
/*
 * Per-nexthop encapsulation description: the encap type plus the data
 * belonging to that type (currently only VxLAN).
 */
103 struct fpm_nh_encap_info_t
{
/* Selects which encapsulation, if any, applies to the nexthop. */
104 enum fpm_nh_encap_type_t encap_type
;
/* VxLAN data; the encoder reads it when encap_type is FPM_NH_ENCAP_VXLAN. */
106 struct vxlan_encap_info_t vxlan_encap
;
113 * Holds information about a single nexthop for netlink. These info
114 * structures are transient and may contain pointers into rib
115 * data structures for convenience.
/*
 * Information about a single nexthop of a netlink route message. Besides
 * the members visible here, code in this file also uses `if_index` and
 * `recursive` members of this structure.
 */
117 struct netlink_nh_info
{
/* Gateway address; left NULL (after memset) when the nexthop has none. */
119 union g_addr
*gateway
;
122 * Information from the struct nexthop from which this nh was
123 * derived. For debug purposes only.
126 enum nexthop_types_t type
;
/* Encapsulation (e.g. VxLAN) to advertise with this nexthop. */
127 struct fpm_nh_encap_info_t encap_info
;
133 * A structure for holding information for a netlink route message.
/*
 * Everything needed to encode one netlink route message. Besides the
 * members visible here, code in this file also uses af, nlmsg_pid,
 * nlmsg_type, rtm_table, rtm_type and metric members of this structure.
 */
135 struct netlink_route_info
{
/* Routing protocol placed in rtm_protocol of the message. */
140 uint8_t rtm_protocol
;
/* Destination prefix of the route. */
142 struct prefix
*prefix
;
/* Number of valid entries in nhs[]. */
144 unsigned int num_nhs
;
/* Nexthops of the route; capacity is MULTIPATH_NUM entries. */
149 struct netlink_nh_info nhs
[MULTIPATH_NUM
];
/* Preferred source address; NULL when none was recorded. */
150 union g_addr
*pref_src
;
154 * netlink_route_info_add_nh
156 * Add information about the given nexthop to the given route info
159 * Returns true if a nexthop was added, false otherwise.
/*
 * Add information about `nexthop` to the route info `ri`.
 *
 * A local netlink_nh_info is zeroed and then filled from the nexthop:
 * recursive flag, type, ifindex and, for IPv4/IPv6 nexthop types, a pointer
 * to the nexthop's gateway. When `re` is an EVPN route the encap type is
 * set to VxLAN and, if the nexthop's VRF has an operationally-up L3VNI,
 * that VNI is recorded. The finished entry is copied into
 * ri->nhs[ri->num_nhs].
 *
 * Returns true if a nexthop was added, false otherwise.
 */
161 static int netlink_route_info_add_nh(struct netlink_route_info
*ri
,
162 struct nexthop
*nexthop
,
163 struct route_entry
*re
)
165 struct netlink_nh_info nhi
;
167 zebra_l3vni_t
*zl3vni
= NULL
;
169 memset(&nhi
, 0, sizeof(nhi
));
/* Capacity check against the fixed-size nhs[] array. */
172 if (ri
->num_nhs
>= (int)array_size(ri
->nhs
))
/* A nexthop with a resolving parent is flagged as recursive. */
175 nhi
.recursive
= nexthop
->rparent
? 1 : 0;
176 nhi
.type
= nexthop
->type
;
177 nhi
.if_index
= nexthop
->ifindex
;
179 if (nexthop
->type
== NEXTHOP_TYPE_IPV4
180 || nexthop
->type
== NEXTHOP_TYPE_IPV4_IFINDEX
) {
181 nhi
.gateway
= &nexthop
->gate
;
182 if (nexthop
->src
.ipv4
.s_addr
!= INADDR_ANY
)
186 if (nexthop
->type
== NEXTHOP_TYPE_IPV6
187 || nexthop
->type
== NEXTHOP_TYPE_IPV6_IFINDEX
) {
188 nhi
.gateway
= &nexthop
->gate
;
191 if (nexthop
->type
== NEXTHOP_TYPE_IFINDEX
) {
192 if (nexthop
->src
.ipv4
.s_addr
!= INADDR_ANY
)
/* True when the nexthop has neither a gateway nor an interface. */
196 if (!nhi
.gateway
&& nhi
.if_index
== 0)
/* EVPN routes are advertised with VxLAN encapsulation. */
199 if (re
&& CHECK_FLAG(re
->flags
, ZEBRA_FLAG_EVPN_ROUTE
)) {
200 nhi
.encap_info
.encap_type
= FPM_NH_ENCAP_VXLAN
;
202 zl3vni
= zl3vni_from_vrf(nexthop
->vrf_id
);
203 if (zl3vni
&& is_l3vni_oper_up(zl3vni
)) {
205 /* Add VNI to VxLAN encap info */
206 nhi
.encap_info
.vxlan_encap
.vni
= zl3vni
->vni
;
211 * We have a valid nhi. Copy the structure over to the route_info.
213 ri
->nhs
[ri
->num_nhs
] = nhi
;
/* Only the first source address seen is kept as the preferred source. */
216 if (src
&& !ri
->pref_src
)
223 * netlink_proto_from_route_type
/*
 * Translates a zebra route type into the netlink rtm_protocol value.
 * Kernel and connected routes both map to RTPROT_KERNEL.
 * NOTE(review): the mapping for all other route types is not visible here.
 */
225 static uint8_t netlink_proto_from_route_type(int type
)
228 case ZEBRA_ROUTE_KERNEL
:
229 case ZEBRA_ROUTE_CONNECT
:
230 return RTPROT_KERNEL
;
238 * netlink_route_info_fill
240 * Fill out the route information object from the given route.
242 * Returns true on success and false on failure.
/*
 * Fill out the route information object `ri` from the given route.
 *
 * `ri` is zeroed first, then populated with the destination prefix and
 * address family, the netlink pid of the VRF's namespace (when available),
 * the message type `cmd`, the table id and, when `re` is supplied, the
 * protocol, route type, metric and nexthops.
 *
 * Returns true on success and false on failure.
 */
244 static int netlink_route_info_fill(struct netlink_route_info
*ri
, int cmd
,
245 rib_dest_t
*dest
, struct route_entry
*re
)
247 struct nexthop
*nexthop
;
248 struct rib_table_info
*table_info
=
249 rib_table_info(rib_dest_table(dest
));
250 struct zebra_vrf
*zvrf
= table_info
->zvrf
;
252 memset(ri
, 0, sizeof(*ri
));
254 ri
->prefix
= rib_dest_prefix(dest
);
255 ri
->af
= rib_dest_af(dest
);
/* nlmsg_pid stays 0 (from the memset) when no zvrf/zns is available. */
257 if (zvrf
&& zvrf
->zns
)
258 ri
->nlmsg_pid
= zvrf
->zns
->netlink_dplane
.snl
.nl_pid
;
260 ri
->nlmsg_type
= cmd
;
261 ri
->rtm_table
= table_info
->table_id
;
262 ri
->rtm_protocol
= RTPROT_UNSPEC
;
265 * An RTM_DELROUTE need not be accompanied by any nexthops,
266 * particularly in our communication with the FPM.
268 if (cmd
== RTM_DELROUTE
&& !re
)
272 zfpm_debug("%s: Expected non-NULL re pointer", __func__
);
276 ri
->rtm_protocol
= netlink_proto_from_route_type(re
->type
);
277 ri
->rtm_type
= RTN_UNICAST
;
278 ri
->metric
= &re
->metric
;
/* Walk the nexthops of the route entry's nexthop group. */
280 for (ALL_NEXTHOPS(re
->nhe
->nhg
, nexthop
)) {
/* Compared against the configured multipath limit. */
281 if (ri
->num_nhs
>= zrouter
.multipath_num
)
284 if (CHECK_FLAG(nexthop
->flags
, NEXTHOP_FLAG_RECURSIVE
))
/* Blackhole nexthops select the route type instead of adding a nexthop. */
287 if (nexthop
->type
== NEXTHOP_TYPE_BLACKHOLE
) {
288 switch (nexthop
->bh_type
) {
289 case BLACKHOLE_ADMINPROHIB
:
290 ri
->rtm_type
= RTN_PROHIBIT
;
292 case BLACKHOLE_REJECT
:
293 ri
->rtm_type
= RTN_UNREACHABLE
;
297 ri
->rtm_type
= RTN_BLACKHOLE
;
/*
 * A nexthop is recorded for an add when it is active, and for a delete
 * when the route entry is marked installed.
 */
302 if ((cmd
== RTM_NEWROUTE
303 && CHECK_FLAG(nexthop
->flags
, NEXTHOP_FLAG_ACTIVE
))
304 || (cmd
== RTM_DELROUTE
305 && CHECK_FLAG(re
->status
, ROUTE_ENTRY_INSTALLED
))) {
/* NOTE(review): the return value of add_nh is not visibly checked here. */
306 netlink_route_info_add_nh(ri
, nexthop
, re
);
310 if (ri
->num_nhs
== 0) {
311 switch (ri
->rtm_type
) {
313 case RTN_UNREACHABLE
:
317 /* If there is no useful nexthop then return. */
319 "netlink_encode_route(): No useful nexthop.");
328 * netlink_route_info_encode
330 * Returns the number of bytes written to the buffer. 0 or a negative
331 * value indicates an error.
/*
 * Encode the route described by `ri` as a netlink route message in
 * `in_buf` (capacity `in_buf_len`).
 *
 * The netlink and rtmsg headers are written first, followed by the table,
 * destination, priority, gateway/OIF (single nexthop) or RTA_MULTIPATH
 * (several nexthops), optional VxLAN encap attributes and the preferred
 * source.
 *
 * Returns the number of bytes written to the buffer. 0 or a negative
 * value indicates an error.
 */
333 static int netlink_route_info_encode(struct netlink_route_info
*ri
,
334 char *in_buf
, size_t in_buf_len
)
337 unsigned int nexthop_num
= 0;
339 struct netlink_nh_info
*nhi
;
340 enum fpm_nh_encap_type_t encap
;
341 struct rtattr
*nest
, *inner_nest
;
342 struct rtnexthop
*rtnh
;
343 struct vxlan_encap_info_t
*vxlan
;
344 struct in6_addr ipv6
;
/* The message is built in place in the caller's buffer. */
352 req
= (void *)in_buf
;
/* Size of the fixed headers that precede the attribute area. */
354 buf_offset
= ((char *)req
->buf
) - ((char *)req
);
356 if (in_buf_len
< buf_offset
) {
361 memset(req
, 0, buf_offset
);
/* Length of one address for this family; used for address attributes. */
363 bytelen
= af_addr_size(ri
->af
);
365 req
->n
.nlmsg_len
= NLMSG_LENGTH(sizeof(struct rtmsg
));
366 req
->n
.nlmsg_flags
= NLM_F_CREATE
| NLM_F_REQUEST
;
367 req
->n
.nlmsg_pid
= ri
->nlmsg_pid
;
368 req
->n
.nlmsg_type
= ri
->nlmsg_type
;
369 req
->r
.rtm_family
= ri
->af
;
372 * rtm_table field is a uchar field which can accomodate table_id less
374 * To support table id greater than 255, if the table_id is greater than
375 * 255, set rtm_table to RT_TABLE_UNSPEC and add RTA_TABLE attribute
376 * with 32 bit value as the table_id.
378 if (ri
->rtm_table
< 256)
379 req
->r
.rtm_table
= ri
->rtm_table
;
381 req
->r
.rtm_table
= RT_TABLE_UNSPEC
;
382 nl_attr_put32(&req
->n
, in_buf_len
, RTA_TABLE
, ri
->rtm_table
);
385 req
->r
.rtm_dst_len
= ri
->prefix
->prefixlen
;
386 req
->r
.rtm_protocol
= ri
->rtm_protocol
;
387 req
->r
.rtm_scope
= RT_SCOPE_UNIVERSE
;
389 nl_attr_put(&req
->n
, in_buf_len
, RTA_DST
, &ri
->prefix
->u
.prefix
,
392 req
->r
.rtm_type
= ri
->rtm_type
;
/* NOTE(review): ri->metric is dereferenced; confirm it is non-NULL here. */
396 nl_attr_put32(&req
->n
, in_buf_len
, RTA_PRIORITY
, *ri
->metric
);
398 if (ri
->num_nhs
== 0)
/* Single nexthop: gateway/OIF are emitted as top-level attributes. */
401 if (ri
->num_nhs
== 1) {
/* An IPv4 gateway on an IPv6 route is sent as an IPv4-mapped IPv6 address. */
405 if (nhi
->type
== NEXTHOP_TYPE_IPV4_IFINDEX
406 && ri
->af
== AF_INET6
) {
407 ipv4_to_ipv4_mapped_ipv6(&ipv6
,
409 nl_attr_put(&req
->n
, in_buf_len
, RTA_GATEWAY
,
412 nl_attr_put(&req
->n
, in_buf_len
, RTA_GATEWAY
,
413 nhi
->gateway
, bytelen
);
417 nl_attr_put32(&req
->n
, in_buf_len
, RTA_OIF
,
421 encap
= nhi
->encap_info
.encap_type
;
423 case FPM_NH_ENCAP_NONE
:
424 case FPM_NH_ENCAP_MAX
:
/* VxLAN: RTA_ENCAP_TYPE followed by a nested RTA_ENCAP holding the VNI. */
426 case FPM_NH_ENCAP_VXLAN
:
427 nl_attr_put16(&req
->n
, in_buf_len
, RTA_ENCAP_TYPE
,
429 vxlan
= &nhi
->encap_info
.vxlan_encap
;
430 nest
= nl_attr_nest(&req
->n
, in_buf_len
, RTA_ENCAP
);
431 nl_attr_put32(&req
->n
, in_buf_len
, VXLAN_VNI
,
433 nl_attr_nest_end(&req
->n
, nest
);
/* Several nexthops: each becomes an rtnexthop inside RTA_MULTIPATH. */
443 nest
= nl_attr_nest(&req
->n
, in_buf_len
, RTA_MULTIPATH
);
445 for (nexthop_num
= 0; nexthop_num
< ri
->num_nhs
; nexthop_num
++) {
446 rtnh
= nl_attr_rtnh(&req
->n
, in_buf_len
);
447 nhi
= &ri
->nhs
[nexthop_num
];
450 nl_attr_put(&req
->n
, in_buf_len
, RTA_GATEWAY
,
451 nhi
->gateway
, bytelen
);
454 rtnh
->rtnh_ifindex
= nhi
->if_index
;
457 encap
= nhi
->encap_info
.encap_type
;
459 case FPM_NH_ENCAP_NONE
:
460 case FPM_NH_ENCAP_MAX
:
462 case FPM_NH_ENCAP_VXLAN
:
463 nl_attr_put16(&req
->n
, in_buf_len
, RTA_ENCAP_TYPE
,
465 vxlan
= &nhi
->encap_info
.vxlan_encap
;
/*
 * NOTE(review): the result of this nl_attr_nest() call is not visibly
 * assigned, yet nl_attr_nest_end() below is passed inner_nest -- confirm
 * that inner_nest is set to this nest before it is closed.
 */
467 nl_attr_nest(&req
->n
, in_buf_len
, RTA_ENCAP
);
468 nl_attr_put32(&req
->n
, in_buf_len
, VXLAN_VNI
,
470 nl_attr_nest_end(&req
->n
, inner_nest
);
474 nl_attr_rtnh_end(&req
->n
, rtnh
);
477 nl_attr_nest_end(&req
->n
, nest
);
/* The multipath nest must contain at least one nexthop. */
478 assert(nest
->rta_len
> RTA_LENGTH(0));
/*
 * NOTE(review): pref_src is declared as `union g_addr *`, so
 * `&ri->pref_src` is the address of the pointer field itself rather than
 * of the address it points to -- confirm whether `ri->pref_src` was meant.
 */
483 nl_attr_put(&req
->n
, in_buf_len
, RTA_PREFSRC
, &ri
->pref_src
,
/* The encoded message must fit strictly inside the caller's buffer. */
487 assert(req
->n
.nlmsg_len
< in_buf_len
);
488 return req
->n
.nlmsg_len
;
492 * zfpm_log_route_info
494 * Helper function to log the information in a route_info structure.
/*
 * Helper function to log the information in a route_info structure.
 *
 * Emits one zfpm_debug() line for the route (label, message type, prefix,
 * protocol, metric -- 0 when ri->metric is NULL) and one line per nexthop
 * (interface, gateway, recursive flag, nexthop type, encap type).
 */
496 static void zfpm_log_route_info(struct netlink_route_info
*ri
,
499 struct netlink_nh_info
*nhi
;
501 char buf
[PREFIX_STRLEN
];
503 zfpm_debug("%s : %s %pFX, Proto: %s, Metric: %u", label
,
504 nl_msg_type_to_str(ri
->nlmsg_type
), ri
->prefix
,
505 nl_rtproto_to_str(ri
->rtm_protocol
),
506 ri
->metric
? *ri
->metric
: 0);
508 for (i
= 0; i
< ri
->num_nhs
; i
++) {
/*
 * NOTE(review): nhi->gateway is a `union g_addr *`; `&nhi->gateway` hands
 * inet_ntop() the address of the pointer field, not the gateway address
 * it points to -- confirm whether `nhi->gateway` (with a NULL check) was
 * intended. Applies to both inet_ntop() calls below.
 */
511 if (ri
->af
== AF_INET
)
512 inet_ntop(AF_INET
, &nhi
->gateway
, buf
, sizeof(buf
));
514 inet_ntop(AF_INET6
, &nhi
->gateway
, buf
, sizeof(buf
));
516 zfpm_debug(" Intf: %u, Gateway: %s, Recursive: %s, Type: %s, Encap type: %s",
517 nhi
->if_index
, buf
, nhi
->recursive
? "yes" : "no",
518 nexthop_type_to_str(nhi
->type
),
519 fpm_nh_encap_type_to_str(nhi
->encap_info
.encap_type
)
525 * zfpm_netlink_encode_route
527 * Create a netlink message corresponding to the given route in the
528 * given buffer space.
530 * Returns the number of bytes written to the buffer. 0 or a negative
531 * value indicates an error.
/*
 * Create a netlink message corresponding to the given route in the given
 * buffer space: the route info is filled from (cmd, dest, re), logged, and
 * then encoded into in_buf.
 *
 * Returns the number of bytes written to the buffer. 0 or a negative
 * value indicates an error.
 */
533 int zfpm_netlink_encode_route(int cmd
, rib_dest_t
*dest
, struct route_entry
*re
,
534 char *in_buf
, size_t in_buf_len
)
/* The route info lives on the stack for the duration of the call. */
536 struct netlink_route_info ri_space
, *ri
;
/* Taken when netlink_route_info_fill() reports failure. */
540 if (!netlink_route_info_fill(ri
, cmd
, dest
, re
))
543 zfpm_log_route_info(ri
, __func__
);
545 return netlink_route_info_encode(ri
, in_buf
, in_buf_len
);
549 * zfpm_netlink_encode_mac
551 * Create a netlink message corresponding to the given MAC.
553 * Returns the number of bytes written to the buffer. 0 or a negative
554 * value indicates an error.
/*
 * Create a netlink neighbor message (RTM_NEWNEIGH / RTM_DELNEIGH, family
 * AF_BRIDGE) corresponding to the given MAC in in_buf.
 *
 * Returns the number of bytes written to the buffer. 0 or a negative
 * value indicates an error.
 */
556 int zfpm_netlink_encode_mac(struct fpm_mac_info_t
*mac
, char *in_buf
,
/* The message is built in place in the caller's buffer. */
566 req
= (void *)in_buf
;
/* Size of the fixed headers that precede the attribute area. */
568 buf_offset
= offsetof(struct macmsg
, buf
);
569 if (in_buf_len
< buf_offset
)
571 memset(req
, 0, buf_offset
);
573 /* Construct nlmsg header */
574 req
->hdr
.nlmsg_len
= NLMSG_LENGTH(sizeof(struct ndmsg
));
/* A MAC flagged for deletion becomes RTM_DELNEIGH, anything else an add. */
575 req
->hdr
.nlmsg_type
= CHECK_FLAG(mac
->fpm_flags
, ZEBRA_MAC_DELETE_FPM
) ?
576 RTM_DELNEIGH
: RTM_NEWNEIGH
;
577 req
->hdr
.nlmsg_flags
= NLM_F_REQUEST
;
/* Adds create the entry or replace an existing one. */
578 if (req
->hdr
.nlmsg_type
== RTM_NEWNEIGH
)
579 req
->hdr
.nlmsg_flags
|= (NLM_F_CREATE
| NLM_F_REPLACE
);
581 /* Construct ndmsg */
582 req
->ndm
.ndm_family
= AF_BRIDGE
;
583 req
->ndm
.ndm_ifindex
= mac
->vxlan_if
;
585 req
->ndm
.ndm_state
= NUD_REACHABLE
;
586 req
->ndm
.ndm_flags
|= NTF_SELF
| NTF_MASTER
;
/* Sticky and remote default-gateway MACs additionally get NUD_NOARP. */
587 if (CHECK_FLAG(mac
->zebra_flags
,
588 (ZEBRA_MAC_STICKY
| ZEBRA_MAC_REMOTE_DEF_GW
)))
589 req
->ndm
.ndm_state
|= NUD_NOARP
;
591 req
->ndm
.ndm_flags
|= NTF_EXT_LEARNED
;
/* Attribute lengths: 6 bytes of MAC address, 4 bytes of IPv4 VTEP address. */
594 nl_attr_put(&req
->hdr
, in_buf_len
, NDA_LLADDR
, &mac
->macaddr
, 6);
595 nl_attr_put(&req
->hdr
, in_buf_len
, NDA_DST
, &mac
->r_vtep_ip
, 4);
596 nl_attr_put32(&req
->hdr
, in_buf_len
, NDA_MASTER
, mac
->svi_if
);
597 nl_attr_put32(&req
->hdr
, in_buf_len
, NDA_VNI
, mac
->vni
);
/* The encoded message must fit strictly inside the caller's buffer. */
599 assert(req
->hdr
.nlmsg_len
< in_buf_len
);
601 zfpm_debug("Tx %s family %s ifindex %u MAC %pEA DEST %pI4",
602 nl_msg_type_to_str(req
->hdr
.nlmsg_type
),
603 nl_family_to_str(req
->ndm
.ndm_family
), req
->ndm
.ndm_ifindex
,
604 &mac
->macaddr
, &mac
->r_vtep_ip
);
606 return req
->hdr
.nlmsg_len
;
609 #endif /* HAVE_NETLINK */