]> git.proxmox.com Git - mirror_frr.git/blame - vrrpd/vrrp.c
tests: clean up all_proto_startup a bit
[mirror_frr.git] / vrrpd / vrrp.c
CommitLineData
5435a2bf 1/*
63d4bd12
QY
2 * VRRP global definitions and state machine.
3 * Copyright (C) 2018-2019 Cumulus Networks, Inc.
4 * Quentin Young
5435a2bf
QY
5 *
6 * This program is free software; you can redistribute it and/or modify it
7 * under the terms of the GNU General Public License as published by the Free
8 * Software Foundation; either version 2 of the License, or (at your option)
9 * any later version.
10 *
11 * This program is distributed in the hope that it will be useful, but WITHOUT
12 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
13 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
14 * more details.
15 *
16 * You should have received a copy of the GNU General Public License along
17 * with this program; see the file COPYING; if not, write to the Free Software
18 * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA
19 */
41ee5442
QY
20#include <zebra.h>
21
862f2f37
QY
22#include "lib/hash.h"
23#include "lib/hook.h"
40744000
QY
24#include "lib/if.h"
25#include "lib/linklist.h"
862f2f37 26#include "lib/memory.h"
91188ca6 27#include "lib/network.h"
40744000 28#include "lib/prefix.h"
862f2f37 29#include "lib/sockopt.h"
dad18a2f 30#include "lib/sockunion.h"
40744000 31#include "lib/vrf.h"
f828842a 32#include "lib/vty.h"
5435a2bf
QY
33
34#include "vrrp.h"
40744000 35#include "vrrp_arp.h"
b637bcd4 36#include "vrrp_debug.h"
4f52e9a6 37#include "vrrp_ndisc.h"
247aa469 38#include "vrrp_packet.h"
f3fe0047 39#include "vrrp_zebra.h"
5435a2bf 40
4ec94408
QY
41#define VRRP_LOGPFX "[CORE] "
42
bf8d3d6a
DL
43DEFINE_MTYPE_STATIC(VRRPD, VRRP_IP, "VRRP IP address");
44DEFINE_MTYPE_STATIC(VRRPD, VRRP_RTR, "VRRP Router");
7c136b08 45
27fd8827
QY
46/* statics */
47struct hash *vrrp_vrouters_hash;
48bool vrrp_autoconfig_is_on;
49int vrrp_autoconfig_version;
50
8cd1d277
QY
51struct vrrp_defaults vd;
52
2b64873d 53const char *const vrrp_state_names[3] = {
4ec94408
QY
54 [VRRP_STATE_INITIALIZE] = "Initialize",
55 [VRRP_STATE_MASTER] = "Master",
56 [VRRP_STATE_BACKUP] = "Backup",
57};
58
2b64873d 59static const char *const vrrp_event_names[2] = {
4ec94408
QY
60 [VRRP_EVENT_STARTUP] = "Startup",
61 [VRRP_EVENT_SHUTDOWN] = "Shutdown",
62};
63
64
5435a2bf
QY
65/* Utility functions ------------------------------------------------------- */
66
67/*
68 * Sets an ethaddr to RFC-defined Virtual Router MAC address.
69 *
70 * mac
71 * ethaddr to set
72 *
73 * v6
74 * Whether this is a V6 or V4 Virtual Router MAC
75 *
76 * vrid
77 * Virtual Router Identifier
78 */
79static void vrrp_mac_set(struct ethaddr *mac, bool v6, uint8_t vrid)
80{
81 /*
82 * V4: 00-00-5E-00-01-{VRID}
83 * V6: 00-00-5E-00-02-{VRID}
84 */
85 mac->octet[0] = 0x00;
86 mac->octet[1] = 0x00;
87 mac->octet[2] = 0x5E;
88 mac->octet[3] = 0x00;
89 mac->octet[4] = v6 ? 0x02 : 0x01;
90 mac->octet[5] = vrid;
91}
92
1d21789e 93/*
862f2f37 94 * Recalculates and sets skew_time and master_down_interval based
1d21789e
QY
95 * values.
96 *
862f2f37
QY
97 * r
98 * VRRP Router to operate on
1d21789e 99 */
862f2f37 100static void vrrp_recalculate_timers(struct vrrp_router *r)
1d21789e 101{
08671293
QY
102 uint16_t mdiadv = r->vr->version == 3 ? r->master_adver_interval
103 : r->vr->advertisement_interval;
8b28e459 104 uint16_t skm = (r->vr->version == 3) ? r->master_adver_interval : 100;
2fff50ec 105
2884f9bb 106 r->skew_time = ((256 - r->vr->priority) * skm) / 256;
08671293 107 r->master_down_interval = 3 * mdiadv;
862f2f37 108 r->master_down_interval += r->skew_time;
1d21789e
QY
109}
110
5d3730c5
QY
111/*
112 * Determines if a VRRP router is the owner of the specified address.
113 *
dad18a2f 114 * The determining factor for whether an interface is the address owner is
2f1fc30f 115 * simply whether the address is assigned to the VRRP base interface by someone
dad18a2f
QY
116 * other than vrrpd.
117 *
118 * This function should always return the correct answer regardless of
119 * master/backup status.
120 *
2f1fc30f
QY
121 * ifp
122 * The interface to check owernship of. This should be the base interface of
123 * a VRRP router.
124 *
5d3730c5 125 * vr
862f2f37 126 * Virtual Router
5d3730c5
QY
127 *
128 * Returns:
129 * whether or not vr owns the specified address
130 */
7e205b4a 131static bool vrrp_is_owner(struct interface *ifp, struct ipaddr *addr)
5d3730c5 132{
2f1fc30f
QY
133 /*
134 * This code sanity checks implicit ownership configuration. Ideally,
135 * the way we determine address ownership status for this VRRP router
136 * is by looking at whether our VIPs are also assigned to the base
137 * interface, and therefore count as "real" addresses. This frees the
138 * user from having to manually configure priority 255 to indicate
139 * address ownership. However, this means one of the VIPs will be used
140 * as the source address for VRRP advertisements, which in turn means
141 * that other VRRP routers will be receiving packets with a source
142 * address they themselves have. This causes lots of different issues
143 * so for now we're disabling this and forcing the user to configure
144 * priority 255 to indicate ownership.
145 */
146
147 return false;
148
149#if 0
7e205b4a 150 struct prefix p;
5d3730c5 151
7e205b4a
QY
152 p.family = IS_IPADDR_V4(addr) ? AF_INET : AF_INET6;
153 p.prefixlen = IS_IPADDR_V4(addr) ? IPV4_MAX_BITLEN : IPV6_MAX_BITLEN;
154 memcpy(&p.u, &addr->ip, sizeof(addr->ip));
dad18a2f 155
7e205b4a 156 return !!connected_lookup_prefix_exact(ifp, &p);
2f1fc30f 157#endif
5d3730c5
QY
158}
159
6e93585e
QY
160/*
161 * Whether an interface has a MAC address that matches the VRRP RFC.
162 *
163 * ifp
164 * Interface to check
165 *
166 * Returns:
167 * Whether the interface has a VRRP mac or not
168 */
169static bool vrrp_ifp_has_vrrp_mac(struct interface *ifp)
170{
171 struct ethaddr vmac4;
172 struct ethaddr vmac6;
2fff50ec 173
6e93585e
QY
174 vrrp_mac_set(&vmac4, 0, 0x00);
175 vrrp_mac_set(&vmac6, 1, 0x00);
176
177 return !memcmp(ifp->hw_addr, vmac4.octet, sizeof(vmac4.octet) - 1)
178 || !memcmp(ifp->hw_addr, vmac6.octet, sizeof(vmac6.octet) - 1);
179}
180
181/*
182 * Lookup a Virtual Router instance given a macvlan subinterface.
183 *
184 * The VRID is extracted from the interface MAC and the 2-tuple (iface, vrid)
185 * is used to look up any existing instances that match the interface. It does
186 * not matter whether the instance is already bound to the interface or not.
187 *
2681134b
QY
188 * Note that the interface linkages must be correct for this to work. In other
189 * words, the macvlan must have a valid VRRP MAC, and its link_ifindex must be
190 * be equal to the ifindex of another interface in the interface RB trees (its
191 * parent). If these conditions aren't satisfied we won't find the VR.
192 *
6e93585e
QY
193 * mvl_ifp
194 * Interface pointer to use to lookup. Should be a macvlan device.
195 *
196 * Returns:
197 * Virtual Router, if found
198 * NULL otherwise
199 */
200static struct vrrp_vrouter *vrrp_lookup_by_if_mvl(struct interface *mvl_ifp)
201{
202 struct interface *p;
203
c257cce4 204 if (!mvl_ifp || mvl_ifp->link_ifindex == 0
76bcde9e 205 || !vrrp_ifp_has_vrrp_mac(mvl_ifp)) {
c257cce4 206 if (mvl_ifp && mvl_ifp->link_ifindex == 0)
76bcde9e
QY
207 DEBUGD(&vrrp_dbg_zebra,
208 VRRP_LOGPFX
209 "Interface %s has no parent ifindex; disregarding",
210 mvl_ifp->name);
c257cce4 211 if (mvl_ifp && !vrrp_ifp_has_vrrp_mac(mvl_ifp))
76bcde9e
QY
212 DEBUGD(&vrrp_dbg_zebra,
213 VRRP_LOGPFX
214 "Interface %s has a non-VRRP MAC; disregarding",
215 mvl_ifp->name);
6e93585e 216 return NULL;
76bcde9e 217 }
6e93585e 218
490810d5 219 p = if_lookup_by_index(mvl_ifp->link_ifindex, mvl_ifp->vrf_id);
3cb543cf
QY
220
221 if (!p) {
222 DEBUGD(&vrrp_dbg_zebra,
223 VRRP_LOGPFX
224 "Tried to lookup interface %d, parent of %s, but it doesn't exist",
225 mvl_ifp->link_ifindex, mvl_ifp->name);
226 return NULL;
227 }
228
6e93585e
QY
229 uint8_t vrid = mvl_ifp->hw_addr[5];
230
231 return vrrp_lookup(p, vrid);
232}
233
234/*
235 * Lookup the Virtual Router instances configured on a particular interface.
236 *
237 * ifp
238 * Interface pointer to use to lookup. Should not be a macvlan device.
239 *
240 * Returns:
241 * List of virtual routers found
242 */
243static struct list *vrrp_lookup_by_if(struct interface *ifp)
244{
245 struct list *l = hash_to_list(vrrp_vrouters_hash);
246 struct listnode *ln, *nn;
247 struct vrrp_vrouter *vr;
248
249 for (ALL_LIST_ELEMENTS(l, ln, nn, vr))
250 if (vr->ifp != ifp)
251 list_delete_node(l, ln);
252
253 return l;
254}
255
256/*
257 * Lookup any Virtual Router instances associated with a particular interface.
258 * This is a combination of the results from vrrp_lookup_by_if_mvl and
259 * vrrp_lookup_by_if.
260 *
261 * Suppose the system interface list looks like the following:
262 *
263 * eth0
264 * \- eth0-v0 00:00:5e:00:01:01
265 * \- eth0-v1 00:00:5e:00:02:01
266 * \- eth0-v2 00:00:5e:00:01:0a
267 *
268 * Passing eth0-v2 to this function will give you the VRRP instance configured
269 * on eth0 with VRID 10. Passing eth0-v0 or eth0-v1 will give you the VRRP
270 * instance configured on eth0 with VRID 1. Passing eth0 will give you both.
271 *
272 * ifp
273 * Interface pointer to use to lookup. Can be any interface.
274 *
275 * Returns:
276 * List of virtual routers found
277 */
278static struct list *vrrp_lookup_by_if_any(struct interface *ifp)
279{
280 struct vrrp_vrouter *vr;
281 struct list *vrs;
282
283 vr = vrrp_lookup_by_if_mvl(ifp);
284 vrs = vr ? list_new() : vrrp_lookup_by_if(ifp);
285
286 if (vr)
287 listnode_add(vrs, vr);
288
289 return vrs;
290}
291
1d21789e
QY
292/* Configuration controllers ----------------------------------------------- */
293
6e93585e
QY
294void vrrp_check_start(struct vrrp_vrouter *vr)
295{
296 struct vrrp_router *r;
297 bool start;
d8b92c67 298 const char *whynot = NULL;
6e93585e
QY
299
300 if (vr->shutdown || vr->ifp == NULL)
301 return;
302
303 r = vr->v4;
114a413e 304 /* Must not already be started */
6e93585e 305 start = r->fsm.state == VRRP_STATE_INITIALIZE;
d8b92c67 306 whynot = (!start && !whynot) ? "Already running" : whynot;
114a413e 307 /* Must have a parent interface */
6e93585e 308 start = start && (vr->ifp != NULL);
00c3cf9c 309 whynot = (!start && !whynot) ? "No base interface" : whynot;
c16fb340 310#if 0
114a413e 311 /* Parent interface must be up */
b0ec34c8 312 start = start && if_is_operative(vr->ifp);
d8b92c67 313 start = (!start && !whynot) ? "Base interface inoperative" : whynot;
c16fb340 314#endif
114a413e 315 /* Parent interface must have at least one v4 */
457ea8d4 316 start = start && connected_count_by_family(vr->ifp, AF_INET) > 0;
00c3cf9c 317 whynot = (!start && !whynot) ? "No primary IPv4 address" : whynot;
114a413e 318 /* Must have a macvlan interface */
6e93585e 319 start = start && (r->mvl_ifp != NULL);
00c3cf9c 320 whynot = (!start && !whynot) ? "No VRRP interface" : whynot;
c16fb340 321#if 0
b0ec34c8
QY
322 /* Macvlan interface must be admin up */
323 start = start && CHECK_FLAG(r->mvl_ifp->flags, IFF_UP);
d8b92c67 324 start = (!start && !whynot) ? "Macvlan device admin down" : whynot;
c16fb340 325#endif
114a413e 326 /* Must have at least one VIP configured */
6e93585e 327 start = start && r->addrs->count > 0;
00c3cf9c
QY
328 whynot = (!start && !whynot) ? "No Virtual IP address configured"
329 : whynot;
6e93585e
QY
330 if (start)
331 vrrp_event(r, VRRP_EVENT_STARTUP);
6309f71c 332 else if (whynot)
613b45b0
QY
333 zlog_warn(VRRP_LOGPFX VRRP_LOGPFX_VRID VRRP_LOGPFX_FAM
334 "Refusing to start Virtual Router: %s",
335 vr->vrid, family2str(r->family), whynot);
6e93585e 336
d8b92c67
QY
337 whynot = NULL;
338
6e93585e 339 r = vr->v6;
114a413e 340 /* Must not already be started */
6e93585e 341 start = r->fsm.state == VRRP_STATE_INITIALIZE;
d8b92c67 342 whynot = (!start && !whynot) ? "Already running" : whynot;
26c7454b 343 /* Must not be v2 */
bdf16661 344 start = start && vr->version != 2;
00c3cf9c 345 whynot = (!start && !whynot) ? "VRRPv2 does not support v6" : whynot;
114a413e 346 /* Must have a parent interface */
6e93585e 347 start = start && (vr->ifp != NULL);
00c3cf9c 348 whynot = (!start && !whynot) ? "No base interface" : whynot;
c16fb340 349#if 0
114a413e 350 /* Parent interface must be up */
b0ec34c8 351 start = start && if_is_operative(vr->ifp);
d8b92c67 352 start = (!start && !whynot) ? "Base interface inoperative" : whynot;
c16fb340 353#endif
114a413e 354 /* Must have a macvlan interface */
6e93585e 355 start = start && (r->mvl_ifp != NULL);
00c3cf9c 356 whynot = (!start && !whynot) ? "No VRRP interface" : whynot;
c16fb340 357#if 0
b0ec34c8
QY
358 /* Macvlan interface must be admin up */
359 start = start && CHECK_FLAG(r->mvl_ifp->flags, IFF_UP);
d8b92c67 360 start = (!start && !whynot) ? "Macvlan device admin down" : whynot;
114a413e
QY
361 /* Macvlan interface must have a link local */
362 start = start && connected_get_linklocal(r->mvl_ifp);
2fff50ec 363 whynot =
457ea8d4 364 (!start && !whynot) ? "No link local address configured" : whynot;
6309f71c 365 /* Macvlan interface must have a v6 IP besides the link local */
457ea8d4 366 start = start && (connected_count_by_family(r->mvl_ifp, AF_INET6) > 1);
2fff50ec 367 whynot = (!start && !whynot)
457ea8d4
GN
368 ? "No Virtual IPv6 address configured on macvlan device"
369 : whynot;
d5dc62c4 370#endif
114a413e 371 /* Must have at least one VIP configured */
6e93585e 372 start = start && r->addrs->count > 0;
2fff50ec 373 whynot =
457ea8d4 374 (!start && !whynot) ? "No Virtual IP address configured" : whynot;
6e93585e
QY
375 if (start)
376 vrrp_event(r, VRRP_EVENT_STARTUP);
6309f71c 377 else if (whynot)
613b45b0
QY
378 zlog_warn(VRRP_LOGPFX VRRP_LOGPFX_VRID VRRP_LOGPFX_FAM
379 "Refusing to start Virtual Router: %s",
380 vr->vrid, family2str(r->family), whynot);
6e93585e
QY
381}
382
1d21789e 383void vrrp_set_priority(struct vrrp_vrouter *vr, uint8_t priority)
c23edd74 384{
862f2f37 385 vr->priority = priority;
bac08ded
QY
386 vr->v4->priority = priority;
387 vr->v6->priority = priority;
c23edd74
QY
388}
389
1d21789e
QY
390void vrrp_set_advertisement_interval(struct vrrp_vrouter *vr,
391 uint16_t advertisement_interval)
392{
393 if (vr->advertisement_interval == advertisement_interval)
394 return;
395
862f2f37
QY
396 vr->advertisement_interval = advertisement_interval;
397 vrrp_recalculate_timers(vr->v4);
398 vrrp_recalculate_timers(vr->v6);
399}
400
2cd90902 401static bool vrrp_has_ip(struct vrrp_vrouter *vr, struct ipaddr *ip)
862f2f37 402{
2cd90902
QY
403 struct vrrp_router *r = ip->ipa_type == IPADDR_V4 ? vr->v4 : vr->v6;
404 struct listnode *ln;
405 struct ipaddr *iter;
862f2f37 406
2cd90902 407 for (ALL_LIST_ELEMENTS_RO(r->addrs, ln, iter))
e920b0b2 408 if (!memcmp(&iter->ip, &ip->ip, IPADDRSZ(ip)))
2cd90902 409 return true;
10133a59 410
2cd90902
QY
411 return false;
412}
413
671fd2a3 414int vrrp_add_ip(struct vrrp_vrouter *vr, struct ipaddr *ip)
2cd90902 415{
671fd2a3
QY
416 struct vrrp_router *r = IS_IPADDR_V4(ip) ? vr->v4 : vr->v6;
417 int af = r->family;
27fd8827
QY
418
419 assert(r->family == af);
359c72ba 420 assert(!(r->vr->version == 2 && ip->ipa_type == IPADDR_V6));
27fd8827 421
2cd90902
QY
422 if (vrrp_has_ip(r->vr, ip))
423 return 0;
424
425 if (!vrrp_is_owner(r->vr->ifp, ip) && r->is_owner) {
10133a59 426 char ipbuf[INET6_ADDRSTRLEN];
2fff50ec 427
2cd90902 428 inet_ntop(r->family, &ip->ip, ipbuf, sizeof(ipbuf));
10133a59 429 zlog_err(
613b45b0 430 VRRP_LOGPFX VRRP_LOGPFX_VRID VRRP_LOGPFX_FAM
10133a59 431 "This VRRP router is not the address owner of %s, but is the address owner of other addresses; this config is unsupported.",
613b45b0 432 r->vr->vrid, family2str(r->family), ipbuf);
2cd90902 433 return -1;
10133a59
QY
434 }
435
72df9d93 436 struct ipaddr *new = XCALLOC(MTYPE_VRRP_IP, sizeof(struct ipaddr));
2cd90902
QY
437
438 *new = *ip;
439 listnode_add(r->addrs, new);
440
6e93585e 441 if (r->fsm.state == VRRP_STATE_MASTER) {
2cd90902
QY
442 switch (r->family) {
443 case AF_INET:
444 vrrp_garp_send(r, &new->ipaddr_v4);
445 break;
446 case AF_INET6:
447 vrrp_ndisc_una_send(r, new);
448 break;
449 }
450 }
451
6e93585e 452 return 0;
2cd90902
QY
453}
454
6e93585e 455int vrrp_add_ipv4(struct vrrp_vrouter *vr, struct in_addr v4)
2cd90902
QY
456{
457 struct ipaddr ip;
2fff50ec 458
2cd90902
QY
459 ip.ipa_type = IPADDR_V4;
460 ip.ipaddr_v4 = v4;
671fd2a3 461 return vrrp_add_ip(vr, &ip);
2cd90902
QY
462}
463
6e93585e 464int vrrp_add_ipv6(struct vrrp_vrouter *vr, struct in6_addr v6)
2cd90902 465{
359c72ba
QY
466 assert(vr->version != 2);
467
2cd90902 468 struct ipaddr ip;
2fff50ec 469
2cd90902
QY
470 ip.ipa_type = IPADDR_V6;
471 ip.ipaddr_v6 = v6;
671fd2a3 472 return vrrp_add_ip(vr, &ip);
1d21789e
QY
473}
474
671fd2a3 475int vrrp_del_ip(struct vrrp_vrouter *vr, struct ipaddr *ip)
c23edd74 476{
2cd90902
QY
477 struct listnode *ln, *nn;
478 struct ipaddr *iter;
479 int ret = 0;
c23edd74 480
671fd2a3
QY
481 struct vrrp_router *r = IS_IPADDR_V4(ip) ? vr->v4 : vr->v6;
482
2cd90902
QY
483 if (!vrrp_has_ip(r->vr, ip))
484 return 0;
10133a59 485
6e93585e
QY
486 for (ALL_LIST_ELEMENTS(r->addrs, ln, nn, iter))
487 if (!memcmp(&iter->ip, &ip->ip, IPADDRSZ(ip)))
488 list_delete_node(r->addrs, ln);
2cd90902
QY
489
490 /*
6e93585e
QY
491 * NB: Deleting the last address and then issuing a shutdown will cause
492 * transmission of a priority 0 VRRP Advertisement - as per the RFC -
493 * but it will have no addresses. This is not forbidden in the RFC but
494 * might confuse other implementations.
2cd90902 495 */
6e93585e
QY
496 if (r->addrs->count == 0 && r->fsm.state != VRRP_STATE_INITIALIZE)
497 ret = vrrp_event(r, VRRP_EVENT_SHUTDOWN);
10133a59 498
2cd90902
QY
499 return ret;
500}
4f52e9a6 501
6e93585e 502int vrrp_del_ipv6(struct vrrp_vrouter *vr, struct in6_addr v6)
2cd90902
QY
503{
504 struct ipaddr ip;
2fff50ec 505
2cd90902
QY
506 ip.ipa_type = IPADDR_V6;
507 ip.ipaddr_v6 = v6;
671fd2a3 508 return vrrp_del_ip(vr, &ip);
862f2f37
QY
509}
510
6e93585e 511int vrrp_del_ipv4(struct vrrp_vrouter *vr, struct in_addr v4)
862f2f37 512{
2cd90902 513 struct ipaddr ip;
2fff50ec 514
2cd90902
QY
515 ip.ipa_type = IPADDR_V4;
516 ip.ipaddr_v4 = v4;
671fd2a3 517 return vrrp_del_ip(vr, &ip);
c23edd74
QY
518}
519
1d21789e
QY
520
521/* Creation and destruction ------------------------------------------------ */
522
6287cefe
QY
523static void vrrp_router_addr_list_del_cb(void *val)
524{
525 struct ipaddr *ip = val;
2fff50ec 526
72df9d93 527 XFREE(MTYPE_VRRP_IP, ip);
6287cefe
QY
528}
529
85467974
QY
530/*
531 * Search for a suitable macvlan subinterface we can attach to, and if found,
532 * attach to it.
533 *
534 * r
535 * Router to attach to interface
536 *
537 * Returns:
538 * Whether an interface was successfully attached
539 */
540static bool vrrp_attach_interface(struct vrrp_router *r)
862f2f37 541{
dad18a2f
QY
542 /* Search for existing interface with computed MAC address */
543 struct interface **ifps;
2fff50ec 544
490810d5
QY
545 size_t ifps_cnt =
546 if_lookup_by_hwaddr(r->vmac.octet, sizeof(r->vmac.octet), &ifps,
547 r->vr->ifp->vrf_id);
dad18a2f
QY
548
549 /*
1b1f3c43
QY
550 * Filter to only those macvlan interfaces whose parent is the base
551 * interface this VRRP router is configured on.
dad18a2f
QY
552 *
553 * If there are still multiple interfaces we just select the first one,
554 * as it should be functionally identical to the others.
555 */
556 unsigned int candidates = 0;
557 struct interface *selection = NULL;
2fff50ec 558
dad18a2f 559 for (unsigned int i = 0; i < ifps_cnt; i++) {
b0ec34c8 560 if (ifps[i]->link_ifindex != r->vr->ifp->ifindex)
dad18a2f
QY
561 ifps[i] = NULL;
562 else {
563 selection = selection ? selection : ifps[i];
564 candidates++;
565 }
566 }
567
b79640e4
QY
568 if (ifps_cnt)
569 XFREE(MTYPE_TMP, ifps);
dad18a2f
QY
570
571 char ethstr[ETHER_ADDR_STRLEN];
2fff50ec 572
dad18a2f
QY
573 prefix_mac2str(&r->vmac, ethstr, sizeof(ethstr));
574
575 assert(!!selection == !!candidates);
576
577 if (candidates == 0)
613b45b0
QY
578 zlog_warn(VRRP_LOGPFX VRRP_LOGPFX_VRID VRRP_LOGPFX_FAM
579 "Interface: None (no interface found w/ MAC %s)",
e6341d21 580 r->vr->vrid, family2str(r->family), ethstr);
dad18a2f 581 else if (candidates > 1)
613b45b0
QY
582 zlog_warn(VRRP_LOGPFX VRRP_LOGPFX_VRID VRRP_LOGPFX_FAM
583 "Interface: Multiple interfaces found; using %s",
e6341d21 584 r->vr->vrid, family2str(r->family), selection->name);
dad18a2f 585 else
613b45b0
QY
586 zlog_info(VRRP_LOGPFX VRRP_LOGPFX_VRID VRRP_LOGPFX_FAM
587 "Interface: %s",
e6341d21 588 r->vr->vrid, family2str(r->family), selection->name);
dad18a2f 589
7e205b4a 590 r->mvl_ifp = selection;
dad18a2f 591
85467974 592 return !!r->mvl_ifp;
85467974
QY
593}
594
595static struct vrrp_router *vrrp_router_create(struct vrrp_vrouter *vr,
596 int family)
597{
72df9d93
QY
598 struct vrrp_router *r =
599 XCALLOC(MTYPE_VRRP_RTR, sizeof(struct vrrp_router));
85467974
QY
600
601 r->family = family;
602 r->sock_rx = -1;
603 r->sock_tx = -1;
604 r->vr = vr;
605 r->addrs = list_new();
606 r->addrs->del = vrrp_router_addr_list_del_cb;
607 r->priority = vr->priority;
608 r->fsm.state = VRRP_STATE_INITIALIZE;
609 vrrp_mac_set(&r->vmac, family == AF_INET6, vr->vrid);
610
611 vrrp_attach_interface(r);
612
862f2f37
QY
613 return r;
614}
615
616static void vrrp_router_destroy(struct vrrp_router *r)
617{
6287cefe
QY
618 if (r->is_active)
619 vrrp_event(r, VRRP_EVENT_SHUTDOWN);
620
2fff50ec 621 if (r->sock_rx >= 0)
dad18a2f 622 close(r->sock_rx);
2fff50ec 623 if (r->sock_tx >= 0)
dad18a2f 624 close(r->sock_tx);
6287cefe 625
862f2f37
QY
626 /* FIXME: also delete list elements */
627 list_delete(&r->addrs);
72df9d93 628 XFREE(MTYPE_VRRP_RTR, r);
862f2f37
QY
629}
630
99966840
QY
631struct vrrp_vrouter *vrrp_vrouter_create(struct interface *ifp, uint8_t vrid,
632 uint8_t version)
5435a2bf 633{
4f0b6b45 634 struct vrrp_vrouter *vr = vrrp_lookup(ifp, vrid);
6287cefe
QY
635
636 if (vr)
637 return vr;
638
99966840
QY
639 if (version != 2 && version != 3)
640 return NULL;
641
72df9d93 642 vr = XCALLOC(MTYPE_VRRP_RTR, sizeof(struct vrrp_vrouter));
5435a2bf 643
5435a2bf 644 vr->ifp = ifp;
99966840 645 vr->version = version;
5435a2bf 646 vr->vrid = vrid;
8cd1d277
QY
647 vr->priority = vd.priority;
648 vr->preempt_mode = vd.preempt_mode;
649 vr->accept_mode = vd.accept_mode;
650 vr->shutdown = vd.shutdown;
862f2f37
QY
651
652 vr->v4 = vrrp_router_create(vr, AF_INET);
653 vr->v6 = vrrp_router_create(vr, AF_INET6);
654
8cd1d277 655 vrrp_set_advertisement_interval(vr, vd.advertisement_interval);
5435a2bf
QY
656
657 hash_get(vrrp_vrouters_hash, vr, hash_alloc_intern);
658
659 return vr;
660}
661
c23edd74
QY
662void vrrp_vrouter_destroy(struct vrrp_vrouter *vr)
663{
862f2f37
QY
664 vrrp_router_destroy(vr->v4);
665 vrrp_router_destroy(vr->v6);
c23edd74 666 hash_release(vrrp_vrouters_hash, vr);
72df9d93 667 XFREE(MTYPE_VRRP_RTR, vr);
c23edd74
QY
668}
669
fb8b348c 670struct vrrp_vrouter *vrrp_lookup(const struct interface *ifp, uint8_t vrid)
5435a2bf
QY
671{
672 struct vrrp_vrouter vr;
2fff50ec 673
5435a2bf 674 vr.vrid = vrid;
fb8b348c 675 vr.ifp = (struct interface *)ifp;
5435a2bf
QY
676
677 return hash_lookup(vrrp_vrouters_hash, &vr);
678}
679
680/* Network ----------------------------------------------------------------- */
681
10133a59
QY
682/* Forward decls */
683static void vrrp_change_state(struct vrrp_router *r, int to);
684static int vrrp_adver_timer_expire(struct thread *thread);
685static int vrrp_master_down_timer_expire(struct thread *thread);
686
958b1487
QY
687/*
688 * Finds the first connected address of the appropriate family on a VRRP
689 * router's interface and binds the Tx socket of the VRRP router to that
690 * address.
691 *
692 * Also sets src field of vrrp_router.
693 *
694 * r
695 * VRRP router to operate on
696 *
697 * Returns:
698 * 0 on success
699 * -1 on failure
700 */
701static int vrrp_bind_to_primary_connected(struct vrrp_router *r)
702{
958b1487
QY
703 struct interface *ifp;
704
705 /*
706 * A slight quirk: the RFC specifies that advertisements under IPv6 must
707 * be transmitted using the link local address of the source interface
708 */
709 ifp = r->family == AF_INET ? r->vr->ifp : r->mvl_ifp;
710
711 struct listnode *ln;
712 struct connected *c = NULL;
2fff50ec 713
958b1487
QY
714 for (ALL_LIST_ELEMENTS_RO(ifp->connected, ln, c))
715 if (c->address->family == r->family) {
716 if (r->family == AF_INET6
717 && IN6_IS_ADDR_LINKLOCAL(&c->address->u.prefix6))
718 break;
719 else if (r->family == AF_INET)
720 break;
721 }
722
723 if (c == NULL) {
724 zlog_err(VRRP_LOGPFX VRRP_LOGPFX_VRID VRRP_LOGPFX_FAM
725 "Failed to find address to bind on %s",
726 r->vr->vrid, family2str(r->family), ifp->name);
727 return -1;
728 }
729
730 union sockunion su;
2fff50ec 731
958b1487
QY
732 memset(&su, 0x00, sizeof(su));
733
734 switch (r->family) {
735 case AF_INET:
736 r->src.ipa_type = IPADDR_V4;
737 r->src.ipaddr_v4 = c->address->u.prefix4;
738 su.sin.sin_family = AF_INET;
739 su.sin.sin_addr = c->address->u.prefix4;
740 break;
741 case AF_INET6:
742 r->src.ipa_type = IPADDR_V6;
743 r->src.ipaddr_v6 = c->address->u.prefix6;
744 su.sin6.sin6_family = AF_INET6;
745 su.sin6.sin6_scope_id = ifp->ifindex;
746 su.sin6.sin6_addr = c->address->u.prefix6;
747 break;
748 }
749
19c38250
QY
750 int ret = 0;
751
958b1487
QY
752 sockopt_reuseaddr(r->sock_tx);
753 if (bind(r->sock_tx, (const struct sockaddr *)&su, sizeof(su)) < 0) {
754 zlog_err(
755 VRRP_LOGPFX VRRP_LOGPFX_VRID VRRP_LOGPFX_FAM
26b6d034
PR
756 "Failed to bind Tx socket to primary IP address %pFX: %s",
757 r->vr->vrid, family2str(r->family), c->address,
958b1487 758 safe_strerror(errno));
19c38250 759 ret = -1;
958b1487
QY
760 } else {
761 DEBUGD(&vrrp_dbg_sock,
762 VRRP_LOGPFX VRRP_LOGPFX_VRID VRRP_LOGPFX_FAM
26b6d034
PR
763 "Bound Tx socket to primary IP address %pFX",
764 r->vr->vrid, family2str(r->family), c->address);
958b1487
QY
765 }
766
19c38250 767 return ret;
958b1487
QY
768}
769
770
5435a2bf 771/*
91188ca6 772 * Create and multicast a VRRP ADVERTISEMENT message.
5435a2bf 773 *
862f2f37
QY
774 * r
775 * VRRP Router for which to send ADVERTISEMENT
5435a2bf 776 */
862f2f37 777static void vrrp_send_advertisement(struct vrrp_router *r)
5435a2bf 778{
247aa469 779 struct vrrp_pkt *pkt;
d9e01e1c 780 ssize_t pktsz;
862f2f37
QY
781 struct ipaddr *addrs[r->addrs->count];
782 union sockunion dest;
247aa469 783
958b1487
QY
784 if (r->src.ipa_type == IPADDR_NONE
785 && vrrp_bind_to_primary_connected(r) < 0)
786 return;
787
862f2f37 788 list_to_array(r->addrs, (void **)addrs, r->addrs->count);
247aa469 789
99966840
QY
790 pktsz = vrrp_pkt_adver_build(&pkt, &r->src, r->vr->version, r->vr->vrid,
791 r->priority, r->vr->advertisement_interval,
d9e01e1c 792 r->addrs->count, (struct ipaddr **)&addrs);
247aa469 793
b637bcd4
QY
794 if (DEBUG_MODE_CHECK(&vrrp_dbg_pkt, DEBUG_MODE_ALL))
795 zlog_hexdump(pkt, (size_t)pktsz);
247aa469 796
354b49d6
QY
797 const char *group = r->family == AF_INET ? VRRP_MCASTV4_GROUP_STR
798 : VRRP_MCASTV6_GROUP_STR;
ab059def 799 (void)str2sockunion(group, &dest);
247aa469 800
d9e01e1c 801 ssize_t sent = sendto(r->sock_tx, pkt, (size_t)pktsz, 0, &dest.sa,
862f2f37 802 sockunion_sizeof(&dest));
4ec94408 803
7c136b08 804 vrrp_pkt_free(pkt);
bb54fa3a 805
4ec94408 806 if (sent < 0) {
613b45b0 807 zlog_warn(VRRP_LOGPFX VRRP_LOGPFX_VRID VRRP_LOGPFX_FAM
8071d5c3 808 "Failed to send VRRP Advertisement: %s",
613b45b0
QY
809 r->vr->vrid, family2str(r->family),
810 safe_strerror(errno));
6332c77f
QY
811 } else {
812 ++r->stats.adver_tx_cnt;
4ec94408 813 }
5435a2bf
QY
814}
815
10133a59
QY
816/*
817 * Receive and parse VRRP advertisement.
818 *
819 * By the time we get here all fields have been validated for basic correctness
820 * and the packet is a valid VRRP packet.
821 *
822 * However, we have not validated whether the VRID is correct for this virtual
823 * router, nor whether the priority is correct (i.e. is not 255 when we are the
99966840
QY
824 * address owner), nor whether the advertisement interval equals our own
825 * configured value (this check is only performed in VRRPv2).
0f1f98e8
QY
826 *
827 * r
828 * VRRP Router associated with the socket this advertisement was received on
829 *
830 * src
831 * Source address of sender
832 *
833 * pkt
834 * The advertisement they sent
835 *
836 * pktsize
837 * Size of advertisement
838 *
839 * Returns:
840 * -1 if advertisement is invalid
841 * 0 otherwise
10133a59 842 */
0f1f98e8
QY
843static int vrrp_recv_advertisement(struct vrrp_router *r, struct ipaddr *src,
844 struct vrrp_pkt *pkt, size_t pktsize)
5435a2bf 845{
3708883c 846 char sipstr[INET6_ADDRSTRLEN];
c7e65c4f 847 char dipstr[INET6_ADDRSTRLEN];
2fff50ec
QY
848
849 ipaddr2str(src, sipstr, sizeof(sipstr));
c7e65c4f 850 ipaddr2str(&r->src, dipstr, sizeof(dipstr));
3708883c 851
91188ca6 852 char dumpbuf[BUFSIZ];
2fff50ec 853
d9e01e1c 854 vrrp_pkt_adver_dump(dumpbuf, sizeof(dumpbuf), pkt);
b637bcd4 855 DEBUGD(&vrrp_dbg_proto,
613b45b0 856 VRRP_LOGPFX VRRP_LOGPFX_VRID VRRP_LOGPFX_FAM
1d5453d6 857 "Received VRRP Advertisement from %s: %s",
613b45b0 858 r->vr->vrid, family2str(r->family), sipstr, dumpbuf);
10133a59
QY
859
860 /* Check that VRID matches our configured VRID */
861 if (pkt->hdr.vrid != r->vr->vrid) {
b637bcd4 862 DEBUGD(&vrrp_dbg_proto,
613b45b0 863 VRRP_LOGPFX VRRP_LOGPFX_VRID VRRP_LOGPFX_FAM
6cde4b45 864 "Datagram invalid: Advertisement contains VRID %hhu which does not match our instance",
b637bcd4 865 r->vr->vrid, family2str(r->family), pkt->hdr.vrid);
10133a59
QY
866 return -1;
867 }
868
869 /* Verify that we are not the IPvX address owner */
870 if (r->is_owner) {
b637bcd4 871 DEBUGD(&vrrp_dbg_proto,
613b45b0
QY
872 VRRP_LOGPFX VRRP_LOGPFX_VRID VRRP_LOGPFX_FAM
873 "Datagram invalid: Received advertisement but we are the address owner",
b637bcd4 874 r->vr->vrid, family2str(r->family));
10133a59
QY
875 return -1;
876 }
877
99966840
QY
878 /* If v2, verify that adver time matches ours */
879 bool adveq = (pkt->hdr.v2.adver_int
880 == MAX(r->vr->advertisement_interval / 100, 1));
881 if (r->vr->version == 2 && !adveq) {
b637bcd4 882 DEBUGD(&vrrp_dbg_proto,
613b45b0 883 VRRP_LOGPFX VRRP_LOGPFX_VRID VRRP_LOGPFX_FAM
6cde4b45 884 "Datagram invalid: Received advertisement with advertisement interval %hhu unequal to our configured value %u",
b637bcd4
QY
885 r->vr->vrid, family2str(r->family),
886 pkt->hdr.v2.adver_int,
887 MAX(r->vr->advertisement_interval / 100, 1));
99966840
QY
888 return -1;
889 }
890
891
10133a59 892 /* Check that # IPs received matches our # configured IPs */
b637bcd4
QY
893 if (pkt->hdr.naddr != r->addrs->count)
894 DEBUGD(&vrrp_dbg_proto,
613b45b0 895 VRRP_LOGPFX VRRP_LOGPFX_VRID VRRP_LOGPFX_FAM
6cde4b45 896 "Datagram has %hhu addresses, but this VRRP instance has %u",
b637bcd4
QY
897 r->vr->vrid, family2str(r->family), pkt->hdr.naddr,
898 r->addrs->count);
10133a59 899
6332c77f
QY
900 ++r->stats.adver_rx_cnt;
901
0f1f98e8 902 int addrcmp;
0f1f98e8 903
10133a59
QY
904 switch (r->fsm.state) {
905 case VRRP_STATE_MASTER:
e920b0b2 906 addrcmp = memcmp(&src->ip, &r->src.ip, IPADDRSZ(src));
0f1f98e8 907
10133a59
QY
908 if (pkt->hdr.priority == 0) {
909 vrrp_send_advertisement(r);
910 THREAD_OFF(r->t_adver_timer);
911 thread_add_timer_msec(
912 master, vrrp_adver_timer_expire, r,
de7fe61e 913 r->vr->advertisement_interval * CS2MS,
10133a59 914 &r->t_adver_timer);
0f1f98e8 915 } else if (pkt->hdr.priority > r->priority
354b49d6
QY
916 || ((pkt->hdr.priority == r->priority)
917 && addrcmp > 0)) {
3708883c 918 zlog_info(
613b45b0 919 VRRP_LOGPFX VRRP_LOGPFX_VRID VRRP_LOGPFX_FAM
6cde4b45 920 "Received advertisement from %s w/ priority %hhu; switching to Backup",
613b45b0
QY
921 r->vr->vrid, family2str(r->family), sipstr,
922 pkt->hdr.priority);
10133a59 923 THREAD_OFF(r->t_adver_timer);
99966840
QY
924 if (r->vr->version == 3) {
925 r->master_adver_interval =
926 htons(pkt->hdr.v3.adver_int);
927 }
10133a59
QY
928 vrrp_recalculate_timers(r);
929 THREAD_OFF(r->t_master_down_timer);
930 thread_add_timer_msec(master,
931 vrrp_master_down_timer_expire, r,
de7fe61e 932 r->master_down_interval * CS2MS,
10133a59
QY
933 &r->t_master_down_timer);
934 vrrp_change_state(r, VRRP_STATE_BACKUP);
935 } else {
936 /* Discard advertisement */
b637bcd4 937 DEBUGD(&vrrp_dbg_proto,
613b45b0 938 VRRP_LOGPFX VRRP_LOGPFX_VRID VRRP_LOGPFX_FAM
6cde4b45 939 "Discarding advertisement from %s (%hhu <= %hhu & %s <= %s)",
613b45b0
QY
940 r->vr->vrid, family2str(r->family), sipstr,
941 pkt->hdr.priority, r->priority, sipstr, dipstr);
10133a59
QY
942 }
943 break;
944 case VRRP_STATE_BACKUP:
945 if (pkt->hdr.priority == 0) {
946 THREAD_OFF(r->t_master_down_timer);
947 thread_add_timer_msec(
948 master, vrrp_master_down_timer_expire, r,
de7fe61e 949 r->skew_time * CS2MS, &r->t_master_down_timer);
a8f58eb6 950 } else if (!r->vr->preempt_mode
10133a59 951 || pkt->hdr.priority >= r->priority) {
99966840
QY
952 if (r->vr->version == 3) {
953 r->master_adver_interval =
954 ntohs(pkt->hdr.v3.adver_int);
955 }
10133a59
QY
956 vrrp_recalculate_timers(r);
957 THREAD_OFF(r->t_master_down_timer);
958 thread_add_timer_msec(master,
959 vrrp_master_down_timer_expire, r,
de7fe61e 960 r->master_down_interval * CS2MS,
10133a59 961 &r->t_master_down_timer);
a8f58eb6 962 } else if (r->vr->preempt_mode
10133a59
QY
963 && pkt->hdr.priority < r->priority) {
964 /* Discard advertisement */
b637bcd4 965 DEBUGD(&vrrp_dbg_proto,
613b45b0 966 VRRP_LOGPFX VRRP_LOGPFX_VRID VRRP_LOGPFX_FAM
6cde4b45 967 "Discarding advertisement from %s (%hhu < %hhu & preempt = true)",
613b45b0
QY
968 r->vr->vrid, family2str(r->family), sipstr,
969 pkt->hdr.priority, r->priority);
10133a59
QY
970 }
971 break;
972 case VRRP_STATE_INITIALIZE:
613b45b0 973 zlog_err(VRRP_LOGPFX VRRP_LOGPFX_VRID VRRP_LOGPFX_FAM
10133a59 974 "Received ADVERTISEMENT in state %s; this is a bug",
613b45b0
QY
975 r->vr->vrid, family2str(r->family),
976 vrrp_state_names[r->fsm.state]);
10133a59
QY
977 break;
978 }
979
980 return 0;
91188ca6
QY
981}
982
983/*
984 * Read and process next IPvX datagram.
985 */
986static int vrrp_read(struct thread *thread)
987{
988 struct vrrp_router *r = thread->arg;
989
990 struct vrrp_pkt *pkt;
991 ssize_t pktsize;
992 ssize_t nbytes;
993 bool resched;
994 char errbuf[BUFSIZ];
fa211f1c 995 struct sockaddr_storage sa;
91188ca6 996 uint8_t control[64];
d04bb25a 997 struct ipaddr src = {};
91188ca6 998
ab059def 999 struct msghdr m = {};
91188ca6 1000 struct iovec iov;
2fff50ec 1001
91188ca6
QY
1002 iov.iov_base = r->ibuf;
1003 iov.iov_len = sizeof(r->ibuf);
fa211f1c
QY
1004 m.msg_name = &sa;
1005 m.msg_namelen = sizeof(sa);
91188ca6
QY
1006 m.msg_iov = &iov;
1007 m.msg_iovlen = 1;
1008 m.msg_control = control;
1009 m.msg_controllen = sizeof(control);
1010
dad18a2f 1011 nbytes = recvmsg(r->sock_rx, &m, MSG_DONTWAIT);
91188ca6
QY
1012
1013 if ((nbytes < 0 && ERRNO_IO_RETRY(errno))) {
1014 resched = true;
1015 goto done;
1016 } else if (nbytes <= 0) {
1017 vrrp_event(r, VRRP_EVENT_SHUTDOWN);
1018 resched = false;
1019 goto done;
1020 }
1021
b637bcd4
QY
1022 if (DEBUG_MODE_CHECK(&vrrp_dbg_pkt, DEBUG_MODE_ALL)) {
1023 DEBUGD(&vrrp_dbg_pkt,
613b45b0
QY
1024 VRRP_LOGPFX VRRP_LOGPFX_VRID VRRP_LOGPFX_FAM
1025 "Datagram rx: ",
b637bcd4
QY
1026 r->vr->vrid, family2str(r->family));
1027 zlog_hexdump(r->ibuf, nbytes);
1028 }
91188ca6 1029
8cb3d803
QY
1030 pktsize = vrrp_pkt_parse_datagram(r->family, r->vr->version, &m, nbytes,
1031 &src, &pkt, errbuf, sizeof(errbuf));
91188ca6 1032
613b45b0 1033 if (pktsize < 0)
b637bcd4 1034 DEBUGD(&vrrp_dbg_pkt,
613b45b0
QY
1035 VRRP_LOGPFX VRRP_LOGPFX_VRID VRRP_LOGPFX_FAM
1036 "Datagram invalid: %s",
b637bcd4 1037 r->vr->vrid, family2str(r->family), errbuf);
613b45b0 1038 else
0f1f98e8 1039 vrrp_recv_advertisement(r, &src, pkt, pktsize);
91188ca6
QY
1040
1041 resched = true;
1042
1043done:
1044 memset(r->ibuf, 0x00, sizeof(r->ibuf));
1045
1046 if (resched)
dad18a2f
QY
1047 thread_add_read(master, vrrp_read, r, r->sock_rx, &r->t_read);
1048
1049 return 0;
1050}
1051
5435a2bf 1052/*
dad18a2f
QY
1053 * Creates and configures VRRP router sockets.
1054 *
1055 * This function:
1056 * - Creates two sockets, one for Tx, one for Rx
490810d5
QY
1057 * - Binds the Tx socket to the macvlan device, if necessary (VRF case)
1058 * - Binds the Rx socket to the base interface
dad18a2f
QY
1059 * - Joins the Rx socket to the appropriate VRRP multicast group
1060 * - Sets the Tx socket to set the TTL (v4) or Hop Limit (v6) field to 255 for
1061 * all transmitted IPvX packets
1062 * - Requests the kernel to deliver IPv6 header values needed to validate VRRP
1063 * packets
dad18a2f
QY
1064 *
1065 * If any of the above fail, the sockets are closed. The only exception is if
1066 * the TTL / Hop Limit settings fail; these are logged, but configuration
1067 * proceeds.
5435a2bf
QY
1068 *
1069 * The first connected address on the Virtual Router's interface is used as the
1070 * interface address.
1071 *
862f2f37
QY
1072 * r
1073 * VRRP Router for which to create listen socket
dad18a2f
QY
1074 *
1075 * Returns:
1076 * 0 on success
1077 * -1 on failure
5435a2bf 1078 */
862f2f37 1079static int vrrp_socket(struct vrrp_router *r)
5435a2bf 1080{
5435a2bf 1081 int ret;
91188ca6 1082 bool failed = false;
5435a2bf 1083
0cf6db21 1084 frr_with_privs(&vrrp_privs) {
444a06ea
QY
1085 r->sock_rx = vrf_socket(r->family, SOCK_RAW, IPPROTO_VRRP,
1086 r->vr->ifp->vrf_id, NULL);
1087 r->sock_tx = vrf_socket(r->family, SOCK_RAW, IPPROTO_VRRP,
1088 r->vr->ifp->vrf_id, NULL);
5435a2bf
QY
1089 }
1090
dad18a2f
QY
1091 if (r->sock_rx < 0 || r->sock_tx < 0) {
1092 const char *rxtx = r->sock_rx < 0 ? "Rx" : "Tx";
2fff50ec 1093
613b45b0
QY
1094 zlog_warn(VRRP_LOGPFX VRRP_LOGPFX_VRID VRRP_LOGPFX_FAM
1095 "Can't create VRRP %s socket",
dad18a2f 1096 r->vr->vrid, family2str(r->family), rxtx);
91188ca6
QY
1097 failed = true;
1098 goto done;
4ec94408 1099 }
40744000 1100
490810d5
QY
1101 /*
1102 * Bind Tx socket to macvlan device - necessary for VRF support,
1103 * otherwise the kernel will select the vrf device
1104 */
1105 if (r->vr->ifp->vrf_id != VRF_DEFAULT) {
1106 frr_with_privs (&vrrp_privs) {
1107 ret = setsockopt(r->sock_tx, SOL_SOCKET,
1108 SO_BINDTODEVICE, r->mvl_ifp->name,
1109 strlen(r->mvl_ifp->name));
1110 }
1111
1112 if (ret < 0) {
1113 zlog_warn(
1114 VRRP_LOGPFX VRRP_LOGPFX_VRID VRRP_LOGPFX_FAM
1115 "Failed to bind Tx socket to macvlan device '%s'",
1116 r->vr->vrid, family2str(r->family),
1117 r->mvl_ifp->name);
1118 failed = true;
1119 goto done;
1120 }
1121 }
dad18a2f 1122 /* Configure sockets */
91188ca6 1123 if (r->family == AF_INET) {
dad18a2f 1124 /* Set Tx socket to always Tx with TTL set to 255 */
91188ca6 1125 int ttl = 255;
2fff50ec 1126
dad18a2f 1127 ret = setsockopt(r->sock_tx, IPPROTO_IP, IP_MULTICAST_TTL, &ttl,
91188ca6
QY
1128 sizeof(ttl));
1129 if (ret < 0) {
1130 zlog_warn(
613b45b0 1131 VRRP_LOGPFX VRRP_LOGPFX_VRID VRRP_LOGPFX_FAM
91188ca6 1132 "Failed to set outgoing multicast TTL count to 255; RFC 5798 compliant implementations will drop our packets",
613b45b0 1133 r->vr->vrid, family2str(r->family));
91188ca6
QY
1134 }
1135
6ad94d3a
QY
1136 /* Set Tx socket DSCP byte */
1137 setsockopt_ipv4_tos(r->sock_tx, IPTOS_PREC_INTERNETCONTROL);
1138
6e9529ed
QY
1139 /* Turn off multicast loop on Tx */
1140 setsockopt_ipv4_multicast_loop(r->sock_tx, 0);
1141
b523b241 1142 /* Bind Rx socket to exact interface */
0cf6db21 1143 frr_with_privs(&vrrp_privs) {
b523b241
QY
1144 ret = setsockopt(r->sock_rx, SOL_SOCKET,
1145 SO_BINDTODEVICE, r->vr->ifp->name,
1146 strlen(r->vr->ifp->name));
1147 }
b523b241 1148 if (ret) {
613b45b0 1149 zlog_warn(VRRP_LOGPFX VRRP_LOGPFX_VRID VRRP_LOGPFX_FAM
b523b241 1150 "Failed to bind Rx socket to %s: %s",
613b45b0
QY
1151 r->vr->vrid, family2str(r->family),
1152 r->vr->ifp->name, safe_strerror(errno));
b523b241
QY
1153 failed = true;
1154 goto done;
1155 }
b637bcd4 1156 DEBUGD(&vrrp_dbg_sock,
613b45b0
QY
1157 VRRP_LOGPFX VRRP_LOGPFX_VRID VRRP_LOGPFX_FAM
1158 "Bound Rx socket to %s",
1159 r->vr->vrid, family2str(r->family), r->vr->ifp->name);
b523b241
QY
1160
1161 /* Bind Rx socket to v4 multicast address */
1162 struct sockaddr_in sa = {0};
2fff50ec 1163
b523b241
QY
1164 sa.sin_family = AF_INET;
1165 sa.sin_addr.s_addr = htonl(VRRP_MCASTV4_GROUP);
1166 if (bind(r->sock_rx, (struct sockaddr *)&sa, sizeof(sa))) {
1167 zlog_err(
613b45b0
QY
1168 VRRP_LOGPFX VRRP_LOGPFX_VRID VRRP_LOGPFX_FAM
1169 "Failed to bind Rx socket to VRRP multicast group: %s",
b523b241
QY
1170 r->vr->vrid, family2str(r->family),
1171 safe_strerror(errno));
1172 failed = true;
1173 goto done;
1174 }
b637bcd4 1175 DEBUGD(&vrrp_dbg_sock,
613b45b0
QY
1176 VRRP_LOGPFX VRRP_LOGPFX_VRID VRRP_LOGPFX_FAM
1177 "Bound Rx socket to VRRP multicast group",
b637bcd4 1178 r->vr->vrid, family2str(r->family));
b523b241 1179
dad18a2f 1180 /* Join Rx socket to VRRP IPv4 multicast group */
bdf16661 1181 assert(listhead(r->vr->ifp->connected));
dad18a2f 1182 struct connected *c = listhead(r->vr->ifp->connected)->data;
91188ca6 1183 struct in_addr v4 = c->address->u.prefix4;
2fff50ec 1184
dad18a2f
QY
1185 ret = setsockopt_ipv4_multicast(r->sock_rx, IP_ADD_MEMBERSHIP,
1186 v4, htonl(VRRP_MCASTV4_GROUP),
862f2f37 1187 r->vr->ifp->ifindex);
b523b241
QY
1188 if (ret < 0) {
1189 zlog_warn(VRRP_LOGPFX VRRP_LOGPFX_VRID
1190 "Failed to join VRRP %s multicast group",
1191 r->vr->vrid, family2str(r->family));
1192 failed = true;
1193 goto done;
1194 }
b637bcd4 1195 DEBUGD(&vrrp_dbg_sock,
613b45b0
QY
1196 VRRP_LOGPFX VRRP_LOGPFX_VRID VRRP_LOGPFX_FAM
1197 "Joined VRRP multicast group",
b637bcd4 1198 r->vr->vrid, family2str(r->family));
7e205b4a
QY
1199
1200 /* Set outgoing interface for advertisements */
1201 struct ip_mreqn mreqn = {};
2fff50ec 1202
7e205b4a
QY
1203 mreqn.imr_ifindex = r->mvl_ifp->ifindex;
1204 ret = setsockopt(r->sock_tx, IPPROTO_IP, IP_MULTICAST_IF,
1205 (void *)&mreqn, sizeof(mreqn));
1206 if (ret < 0) {
1207 zlog_warn(
613b45b0 1208 VRRP_LOGPFX VRRP_LOGPFX_VRID VRRP_LOGPFX_FAM
7e205b4a 1209 "Could not set %s as outgoing multicast interface",
613b45b0
QY
1210 r->vr->vrid, family2str(r->family),
1211 r->mvl_ifp->name);
7e205b4a
QY
1212 failed = true;
1213 goto done;
1214 }
b637bcd4 1215 DEBUGD(&vrrp_dbg_sock,
613b45b0 1216 VRRP_LOGPFX VRRP_LOGPFX_VRID VRRP_LOGPFX_FAM
b637bcd4 1217 "Set %s as outgoing multicast interface",
613b45b0 1218 r->vr->vrid, family2str(r->family), r->mvl_ifp->name);
1760ce42
QY
1219
1220 /* Select and bind source address */
1221 if (vrrp_bind_to_primary_connected(r) < 0) {
1222 failed = true;
1223 goto done;
1224 }
1225
91188ca6 1226 } else if (r->family == AF_INET6) {
dad18a2f
QY
1227 /* Always transmit IPv6 packets with hop limit set to 255 */
1228 ret = setsockopt_ipv6_multicast_hops(r->sock_tx, 255);
91188ca6
QY
1229 if (ret < 0) {
1230 zlog_warn(
613b45b0 1231 VRRP_LOGPFX VRRP_LOGPFX_VRID VRRP_LOGPFX_FAM
91188ca6 1232 "Failed to set outgoing multicast hop count to 255; RFC 5798 compliant implementations will drop our packets",
613b45b0 1233 r->vr->vrid, family2str(r->family));
91188ca6 1234 }
d04bb25a 1235
6ad94d3a
QY
1236 /* Set Tx socket DSCP byte */
1237 setsockopt_ipv6_tclass(r->sock_tx, IPTOS_PREC_INTERNETCONTROL);
1238
d04bb25a
QY
1239 /* Request hop limit delivery */
1240 setsockopt_ipv6_hoplimit(r->sock_rx, 1);
91188ca6 1241 if (ret < 0) {
613b45b0 1242 zlog_warn(VRRP_LOGPFX VRRP_LOGPFX_VRID VRRP_LOGPFX_FAM
91188ca6 1243 "Failed to request IPv6 Hop Limit delivery",
613b45b0 1244 r->vr->vrid, family2str(r->family));
91188ca6
QY
1245 failed = true;
1246 goto done;
1247 }
1248
6e9529ed
QY
1249 /* Turn off multicast loop on Tx */
1250 setsockopt_ipv6_multicast_loop(r->sock_tx, 0);
1251
b523b241 1252 /* Bind Rx socket to exact interface */
0cf6db21 1253 frr_with_privs(&vrrp_privs) {
b523b241
QY
1254 ret = setsockopt(r->sock_rx, SOL_SOCKET,
1255 SO_BINDTODEVICE, r->vr->ifp->name,
1256 strlen(r->vr->ifp->name));
1257 }
b523b241 1258 if (ret) {
613b45b0 1259 zlog_warn(VRRP_LOGPFX VRRP_LOGPFX_VRID VRRP_LOGPFX_FAM
b523b241 1260 "Failed to bind Rx socket to %s: %s",
613b45b0
QY
1261 r->vr->vrid, family2str(r->family),
1262 r->vr->ifp->name, safe_strerror(errno));
b523b241
QY
1263 failed = true;
1264 goto done;
1265 }
b637bcd4 1266 DEBUGD(&vrrp_dbg_sock,
613b45b0
QY
1267 VRRP_LOGPFX VRRP_LOGPFX_VRID VRRP_LOGPFX_FAM
1268 "Bound Rx socket to %s",
1269 r->vr->vrid, family2str(r->family), r->vr->ifp->name);
b523b241
QY
1270
1271 /* Bind Rx socket to v6 multicast address */
1272 struct sockaddr_in6 sa = {0};
2fff50ec 1273
b523b241
QY
1274 sa.sin6_family = AF_INET6;
1275 inet_pton(AF_INET6, VRRP_MCASTV6_GROUP_STR, &sa.sin6_addr);
1276 if (bind(r->sock_rx, (struct sockaddr *)&sa, sizeof(sa))) {
1277 zlog_err(
613b45b0
QY
1278 VRRP_LOGPFX VRRP_LOGPFX_VRID VRRP_LOGPFX_FAM
1279 "Failed to bind Rx socket to VRRP multicast group: %s",
b523b241
QY
1280 r->vr->vrid, family2str(r->family),
1281 safe_strerror(errno));
1282 failed = true;
1283 goto done;
1284 }
b637bcd4 1285 DEBUGD(&vrrp_dbg_sock,
613b45b0
QY
1286 VRRP_LOGPFX VRRP_LOGPFX_VRID VRRP_LOGPFX_FAM
1287 "Bound Rx socket to VRRP multicast group",
b637bcd4 1288 r->vr->vrid, family2str(r->family));
b523b241 1289
91188ca6 1290 /* Join VRRP IPv6 multicast group */
862f2f37 1291 struct ipv6_mreq mreq;
2fff50ec 1292
dad18a2f
QY
1293 inet_pton(AF_INET6, VRRP_MCASTV6_GROUP_STR,
1294 &mreq.ipv6mr_multiaddr);
862f2f37 1295 mreq.ipv6mr_interface = r->vr->ifp->ifindex;
dad18a2f
QY
1296 ret = setsockopt(r->sock_rx, IPPROTO_IPV6, IPV6_JOIN_GROUP,
1297 &mreq, sizeof(mreq));
b523b241 1298 if (ret < 0) {
613b45b0
QY
1299 zlog_warn(VRRP_LOGPFX VRRP_LOGPFX_VRID VRRP_LOGPFX_FAM
1300 "Failed to join VRRP multicast group",
b523b241
QY
1301 r->vr->vrid, family2str(r->family));
1302 failed = true;
1303 goto done;
1304 }
b637bcd4 1305 DEBUGD(&vrrp_dbg_sock,
613b45b0
QY
1306 VRRP_LOGPFX VRRP_LOGPFX_VRID VRRP_LOGPFX_FAM
1307 "Joined VRRP multicast group",
b637bcd4 1308 r->vr->vrid, family2str(r->family));
7e205b4a
QY
1309
1310 /* Set outgoing interface for advertisements */
1311 ret = setsockopt(r->sock_tx, IPPROTO_IPV6, IPV6_MULTICAST_IF,
1312 &r->mvl_ifp->ifindex, sizeof(ifindex_t));
1313 if (ret < 0) {
1314 zlog_warn(
613b45b0 1315 VRRP_LOGPFX VRRP_LOGPFX_VRID VRRP_LOGPFX_FAM
7e205b4a 1316 "Could not set %s as outgoing multicast interface",
613b45b0
QY
1317 r->vr->vrid, family2str(r->family),
1318 r->mvl_ifp->name);
7e205b4a
QY
1319 failed = true;
1320 goto done;
1321 }
b637bcd4 1322 DEBUGD(&vrrp_dbg_sock,
613b45b0 1323 VRRP_LOGPFX VRRP_LOGPFX_VRID VRRP_LOGPFX_FAM
b637bcd4 1324 "Set %s as outgoing multicast interface",
613b45b0 1325 r->vr->vrid, family2str(r->family), r->mvl_ifp->name);
862f2f37
QY
1326 }
1327
91188ca6
QY
1328done:
1329 ret = 0;
1330 if (failed) {
613b45b0
QY
1331 zlog_warn(VRRP_LOGPFX VRRP_LOGPFX_VRID VRRP_LOGPFX_FAM
1332 "Failed to initialize VRRP router",
91188ca6 1333 r->vr->vrid, family2str(r->family));
1b5e2a22 1334 if (r->sock_rx >= 0) {
dad18a2f 1335 close(r->sock_rx);
1b5e2a22
QY
1336 r->sock_rx = -1;
1337 }
1338 if (r->sock_tx >= 0) {
dad18a2f 1339 close(r->sock_tx);
1b5e2a22
QY
1340 r->sock_tx = -1;
1341 }
91188ca6
QY
1342 ret = -1;
1343 }
1344
1345 return ret;
5435a2bf
QY
1346}
1347
1348
1349/* State machine ----------------------------------------------------------- */
1350
2fff50ec 1351DEFINE_HOOK(vrrp_change_state_hook, (struct vrrp_router *r, int to), (r, to));
5435a2bf
QY
1352
1353/*
1354 * Handle any necessary actions during state change to MASTER state.
1355 *
862f2f37
QY
1356 * r
1357 * VRRP Router to operate on
5435a2bf 1358 */
862f2f37 1359static void vrrp_change_state_master(struct vrrp_router *r)
5435a2bf 1360{
f3fe0047
QY
1361 /* Enable ND Router Advertisements */
1362 if (r->family == AF_INET6)
1363 vrrp_zebra_radv_set(r, true);
c3bd894e 1364
ee5aabb6 1365 /* Set protodown off */
c3bd894e 1366 vrrp_zclient_send_interface_protodown(r->mvl_ifp, false);
ee5aabb6
QY
1367
1368 /*
1369 * If protodown is already off, we can send our stuff, otherwise we
1370 * have to delay until the interface is all the way up
1371 */
1372 if (if_is_operative(r->mvl_ifp)) {
1373 vrrp_send_advertisement(r);
1374
1375 if (r->family == AF_INET)
1376 vrrp_garp_send_all(r);
1377 else if (r->family == AF_INET6)
1378 vrrp_ndisc_una_send_all(r);
1379 } else {
1380 DEBUGD(&vrrp_dbg_proto,
613b45b0 1381 VRRP_LOGPFX VRRP_LOGPFX_VRID VRRP_LOGPFX_FAM
ee5aabb6 1382 "Delaying VRRP advertisement until interface is up",
613b45b0 1383 r->vr->vrid, family2str(r->family));
ee5aabb6
QY
1384 r->advert_pending = true;
1385
1386 if (r->family == AF_INET) {
1387 DEBUGD(&vrrp_dbg_proto,
613b45b0 1388 VRRP_LOGPFX VRRP_LOGPFX_VRID VRRP_LOGPFX_FAM
ee5aabb6 1389 "Delaying VRRP gratuitous ARPs until interface is up",
613b45b0 1390 r->vr->vrid, family2str(r->family));
ee5aabb6
QY
1391 r->garp_pending = true;
1392 } else if (r->family == AF_INET6) {
1393 DEBUGD(&vrrp_dbg_proto,
613b45b0 1394 VRRP_LOGPFX VRRP_LOGPFX_VRID VRRP_LOGPFX_FAM
ee5aabb6 1395 "Delaying VRRP unsolicited neighbor advertisement until interface is up",
613b45b0 1396 r->vr->vrid, family2str(r->family));
ee5aabb6
QY
1397 r->ndisc_pending = true;
1398 }
1399 }
5435a2bf
QY
1400}
1401
1402/*
1403 * Handle any necessary actions during state change to BACKUP state.
1404 *
862f2f37 1405 * r
5435a2bf
QY
1406 * Virtual Router to operate on
1407 */
862f2f37 1408static void vrrp_change_state_backup(struct vrrp_router *r)
5435a2bf 1409{
f3fe0047
QY
1410 /* Disable ND Router Advertisements */
1411 if (r->family == AF_INET6)
1412 vrrp_zebra_radv_set(r, false);
c3bd894e 1413
45505f63
QY
1414 /* Disable Adver_Timer */
1415 THREAD_OFF(r->t_adver_timer);
1416
d60b2ffd
QY
1417 r->advert_pending = false;
1418 r->garp_pending = false;
1419 r->ndisc_pending = false;
958b1487 1420 memset(&r->src, 0x00, sizeof(r->src));
d60b2ffd 1421
c3bd894e 1422 vrrp_zclient_send_interface_protodown(r->mvl_ifp, true);
5435a2bf
QY
1423}
1424
1425/*
1426 * Handle any necessary actions during state change to INITIALIZE state.
1427 *
1428 * This is not called for initial startup, only when transitioning from MASTER
1429 * or BACKUP.
1430 *
862f2f37
QY
1431 * r
1432 * VRRP Router to operate on
5435a2bf 1433 */
862f2f37 1434static void vrrp_change_state_initialize(struct vrrp_router *r)
5435a2bf 1435{
862f2f37
QY
1436 r->master_adver_interval = 0;
1437 vrrp_recalculate_timers(r);
f3fe0047 1438
d60b2ffd
QY
1439 r->advert_pending = false;
1440 r->garp_pending = false;
1441 r->ndisc_pending = false;
1442
f3fe0047 1443 /* Disable ND Router Advertisements */
9323f278 1444 if (r->family == AF_INET6 && r->mvl_ifp)
f3fe0047 1445 vrrp_zebra_radv_set(r, false);
5435a2bf
QY
1446}
1447
2b64873d 1448void (*const vrrp_change_state_handlers[])(struct vrrp_router *vr) = {
5435a2bf
QY
1449 [VRRP_STATE_MASTER] = vrrp_change_state_master,
1450 [VRRP_STATE_BACKUP] = vrrp_change_state_backup,
1451 [VRRP_STATE_INITIALIZE] = vrrp_change_state_initialize,
1452};
1453
1454/*
1455 * Change Virtual Router FSM position. Handles transitional actions and calls
1456 * any subscribers to the state change hook.
1457 *
862f2f37 1458 * r
5435a2bf
QY
1459 * Virtual Router for which to change state
1460 *
1461 * to
1462 * State to change to
1463 */
862f2f37 1464static void vrrp_change_state(struct vrrp_router *r, int to)
5435a2bf 1465{
6287cefe
QY
1466 if (r->fsm.state == to)
1467 return;
1468
5435a2bf 1469 /* Call our handlers, then any subscribers */
862f2f37
QY
1470 vrrp_change_state_handlers[to](r);
1471 hook_call(vrrp_change_state_hook, r, to);
613b45b0
QY
1472 zlog_info(VRRP_LOGPFX VRRP_LOGPFX_VRID VRRP_LOGPFX_FAM "%s -> %s",
1473 r->vr->vrid, family2str(r->family),
862f2f37
QY
1474 vrrp_state_names[r->fsm.state], vrrp_state_names[to]);
1475 r->fsm.state = to;
6332c77f
QY
1476
1477 ++r->stats.trans_cnt;
5435a2bf
QY
1478}
1479
1480/*
1481 * Called when Adver_Timer expires.
1482 */
1483static int vrrp_adver_timer_expire(struct thread *thread)
1484{
862f2f37 1485 struct vrrp_router *r = thread->arg;
5435a2bf 1486
b637bcd4 1487 DEBUGD(&vrrp_dbg_proto,
613b45b0
QY
1488 VRRP_LOGPFX VRRP_LOGPFX_VRID VRRP_LOGPFX_FAM
1489 "Adver_Timer expired",
1490 r->vr->vrid, family2str(r->family));
4ec94408 1491
862f2f37 1492 if (r->fsm.state == VRRP_STATE_MASTER) {
3e7a4043 1493 /* Send an ADVERTISEMENT */
862f2f37 1494 vrrp_send_advertisement(r);
5435a2bf 1495
3e7a4043 1496 /* Reset the Adver_Timer to Advertisement_Interval */
862f2f37 1497 thread_add_timer_msec(master, vrrp_adver_timer_expire, r,
de7fe61e 1498 r->vr->advertisement_interval * CS2MS,
862f2f37 1499 &r->t_adver_timer);
3e7a4043 1500 } else {
613b45b0 1501 zlog_err(VRRP_LOGPFX VRRP_LOGPFX_VRID VRRP_LOGPFX_FAM
b637bcd4 1502 "Adver_Timer expired in state '%s'; this is a bug",
613b45b0
QY
1503 r->vr->vrid, family2str(r->family),
1504 vrrp_state_names[r->fsm.state]);
5435a2bf 1505 }
3e7a4043 1506
5435a2bf
QY
1507 return 0;
1508}
1509
1510/*
4ec94408 1511 * Called when Master_Down_Timer expires.
5435a2bf
QY
1512 */
1513static int vrrp_master_down_timer_expire(struct thread *thread)
1514{
862f2f37 1515 struct vrrp_router *r = thread->arg;
4ec94408 1516
613b45b0
QY
1517 zlog_info(VRRP_LOGPFX VRRP_LOGPFX_VRID VRRP_LOGPFX_FAM
1518 "Master_Down_Timer expired",
1519 r->vr->vrid, family2str(r->family));
5435a2bf 1520
c7e3b83d 1521 thread_add_timer_msec(master, vrrp_adver_timer_expire, r,
de7fe61e 1522 r->vr->advertisement_interval * CS2MS,
c7e3b83d
QY
1523 &r->t_adver_timer);
1524 vrrp_change_state(r, VRRP_STATE_MASTER);
1525
5435a2bf
QY
1526 return 0;
1527}
1528
1529/*
1530 * Event handler for Startup event.
1531 *
1532 * Creates sockets, sends advertisements and ARP requests, starts timers,
1d21789e
QY
1533 * and transitions the Virtual Router to either Master or Backup states.
1534 *
1535 * This function will also initialize the program's global ARP subsystem if it
1536 * has not yet been initialized.
5435a2bf 1537 *
862f2f37
QY
1538 * r
1539 * VRRP Router on which to apply Startup event
1d21789e
QY
1540 *
1541 * Returns:
1542 * < 0 if the session socket could not be created, or the state is not
1543 * Initialize
1544 * 0 on success
5435a2bf 1545 */
862f2f37 1546static int vrrp_startup(struct vrrp_router *r)
5435a2bf 1547{
1d21789e 1548 /* May only be called when the state is Initialize */
862f2f37 1549 if (r->fsm.state != VRRP_STATE_INITIALIZE)
1d21789e
QY
1550 return -1;
1551
7e205b4a 1552 /* Must have a valid macvlan interface available */
85467974 1553 if (r->mvl_ifp == NULL && !vrrp_attach_interface(r)) {
613b45b0
QY
1554 zlog_warn(VRRP_LOGPFX VRRP_LOGPFX_VRID VRRP_LOGPFX_FAM
1555 "No appropriate interface found",
7e205b4a
QY
1556 r->vr->vrid, family2str(r->family));
1557 return -1;
1558 }
1559
40744000 1560 /* Initialize global gratuitous ARP socket if necessary */
862f2f37 1561 if (r->family == AF_INET && !vrrp_garp_is_init())
40744000 1562 vrrp_garp_init();
4f52e9a6
QY
1563 if (r->family == AF_INET6 && !vrrp_ndisc_is_init())
1564 vrrp_ndisc_init();
40744000 1565
5435a2bf 1566 /* Create socket */
dad18a2f 1567 if (r->sock_rx < 0 || r->sock_tx < 0) {
862f2f37 1568 int ret = vrrp_socket(r);
2fff50ec 1569
dad18a2f 1570 if (ret < 0 || r->sock_tx < 0 || r->sock_rx < 0)
862f2f37
QY
1571 return ret;
1572 }
5435a2bf
QY
1573
1574 /* Schedule listener */
dad18a2f 1575 thread_add_read(master, vrrp_read, r, r->sock_rx, &r->t_read);
5435a2bf 1576
91188ca6 1577 /* Configure effective priority */
bdf16661 1578 assert(listhead(r->addrs));
862f2f37 1579 struct ipaddr *primary = (struct ipaddr *)listhead(r->addrs)->data;
862f2f37 1580 char ipbuf[INET6_ADDRSTRLEN];
2fff50ec 1581
862f2f37
QY
1582 inet_ntop(r->family, &primary->ip.addr, ipbuf, sizeof(ipbuf));
1583
2f1fc30f
QY
1584 if (r->vr->priority == VRRP_PRIO_MASTER
1585 || vrrp_is_owner(r->vr->ifp, primary)) {
862f2f37
QY
1586 r->priority = VRRP_PRIO_MASTER;
1587 vrrp_recalculate_timers(r);
1588
5d3730c5 1589 zlog_info(
613b45b0 1590 VRRP_LOGPFX VRRP_LOGPFX_VRID VRRP_LOGPFX_FAM
2f1fc30f 1591 "%s has priority set to 255 or owns primary Virtual Router IP %s; electing self as Master",
613b45b0
QY
1592 r->vr->vrid, family2str(r->family), r->vr->ifp->name,
1593 ipbuf);
5d3730c5
QY
1594 }
1595
862f2f37 1596 if (r->priority == VRRP_PRIO_MASTER) {
862f2f37 1597 thread_add_timer_msec(master, vrrp_adver_timer_expire, r,
de7fe61e 1598 r->vr->advertisement_interval * CS2MS,
862f2f37
QY
1599 &r->t_adver_timer);
1600 vrrp_change_state(r, VRRP_STATE_MASTER);
5435a2bf 1601 } else {
862f2f37
QY
1602 r->master_adver_interval = r->vr->advertisement_interval;
1603 vrrp_recalculate_timers(r);
1604 thread_add_timer_msec(master, vrrp_master_down_timer_expire, r,
de7fe61e 1605 r->master_down_interval * CS2MS,
862f2f37
QY
1606 &r->t_master_down_timer);
1607 vrrp_change_state(r, VRRP_STATE_BACKUP);
5435a2bf 1608 }
a8144d7f 1609
862f2f37
QY
1610 r->is_active = true;
1611
a8144d7f 1612 return 0;
5435a2bf
QY
1613}
1614
1d21789e
QY
1615/*
1616 * Shuts down a Virtual Router and transitions it to Initialize.
1617 *
1618 * This call must be idempotent; it is safe to call multiple times on the same
862f2f37 1619 * VRRP Router.
1d21789e 1620 */
862f2f37 1621static int vrrp_shutdown(struct vrrp_router *r)
5435a2bf 1622{
45505f63
QY
1623 uint8_t saved_prio;
1624
862f2f37
QY
1625 switch (r->fsm.state) {
1626 case VRRP_STATE_MASTER:
862f2f37 1627 /* Send an ADVERTISEMENT with Priority = 0 */
45505f63 1628 saved_prio = r->priority;
862f2f37
QY
1629 r->priority = 0;
1630 vrrp_send_advertisement(r);
1631 r->priority = saved_prio;
1632 break;
1633 case VRRP_STATE_BACKUP:
862f2f37
QY
1634 break;
1635 case VRRP_STATE_INITIALIZE:
b637bcd4 1636 DEBUGD(&vrrp_dbg_proto,
613b45b0 1637 VRRP_LOGPFX VRRP_LOGPFX_VRID VRRP_LOGPFX_FAM
b637bcd4 1638 "Received '%s' event in '%s' state; ignoring",
613b45b0
QY
1639 r->vr->vrid, family2str(r->family),
1640 vrrp_event_names[VRRP_EVENT_SHUTDOWN],
b637bcd4 1641 vrrp_state_names[VRRP_STATE_INITIALIZE]);
2681134b 1642 return 0;
3e7a4043
QY
1643 }
1644
45505f63
QY
1645 /* Cancel all timers */
1646 THREAD_OFF(r->t_adver_timer);
1647 THREAD_OFF(r->t_master_down_timer);
a90edf08
QY
1648 THREAD_OFF(r->t_read);
1649 THREAD_OFF(r->t_write);
45505f63 1650
4d2ea6bf 1651 /* Protodown macvlan */
9323f278
QY
1652 if (r->mvl_ifp)
1653 vrrp_zclient_send_interface_protodown(r->mvl_ifp, true);
4d2ea6bf 1654
958b1487
QY
1655 /* Throw away our source address */
1656 memset(&r->src, 0x00, sizeof(r->src));
1657
b7dc1bbb
QY
1658 if (r->sock_rx > 0) {
1659 close(r->sock_rx);
1660 r->sock_rx = -1;
1661 }
1662 if (r->sock_tx > 0) {
1663 close(r->sock_tx);
1664 r->sock_tx = -1;
1665 }
1666
862f2f37 1667 vrrp_change_state(r, VRRP_STATE_INITIALIZE);
1d21789e 1668
73b5cb19
QY
1669 r->is_active = false;
1670
a8144d7f 1671 return 0;
5435a2bf
QY
1672}
1673
2b64873d 1674static int (*const vrrp_event_handlers[])(struct vrrp_router *r) = {
5435a2bf
QY
1675 [VRRP_EVENT_STARTUP] = vrrp_startup,
1676 [VRRP_EVENT_SHUTDOWN] = vrrp_shutdown,
1677};
1678
1679/*
862f2f37 1680 * Spawn a VRRP FSM event on a VRRP Router.
5435a2bf
QY
1681 *
1682 * vr
862f2f37 1683 * VRRP Router on which to spawn event
5435a2bf
QY
1684 *
1685 * event
1686 * The event to spawn
27fd8827
QY
1687 *
1688 * Returns:
1689 * -1 on failure
1690 * 0 otherwise
5435a2bf 1691 */
862f2f37 1692int vrrp_event(struct vrrp_router *r, int event)
5435a2bf 1693{
613b45b0
QY
1694 zlog_info(VRRP_LOGPFX VRRP_LOGPFX_VRID VRRP_LOGPFX_FAM "'%s' event",
1695 r->vr->vrid, family2str(r->family), vrrp_event_names[event]);
862f2f37 1696 return vrrp_event_handlers[event](r);
5435a2bf
QY
1697}
1698
1699
27fd8827
QY
1700/* Autoconfig -------------------------------------------------------------- */
1701
1702/*
1703 * Set the configured addresses for this VRRP instance to exactly the addresses
1704 * present on its macvlan subinterface(s).
1705 *
1706 * vr
1707 * VRRP router to act on
1708 */
ac1429b9 1709static void vrrp_autoconfig_autoaddrupdate(struct vrrp_router *r)
27fd8827 1710{
27fd8827
QY
1711 struct listnode *ln;
1712 struct connected *c = NULL;
ac1429b9 1713 bool is_v6_ll;
27fd8827 1714
ac1429b9
QY
1715 if (!r->mvl_ifp)
1716 return;
27fd8827 1717
ac1429b9 1718 DEBUGD(&vrrp_dbg_auto,
613b45b0
QY
1719 VRRP_LOGPFX VRRP_LOGPFX_VRID VRRP_LOGPFX_FAM
1720 "Setting Virtual IP list to match IPv4 addresses on %s",
ac1429b9
QY
1721 r->vr->vrid, family2str(r->family), r->mvl_ifp->name);
1722 for (ALL_LIST_ELEMENTS_RO(r->mvl_ifp->connected, ln, c)) {
1723 is_v6_ll = (c->address->family == AF_INET6
1724 && IN6_IS_ADDR_LINKLOCAL(&c->address->u.prefix6));
1725 if (c->address->family == r->family && !is_v6_ll) {
ac1429b9 1726 DEBUGD(&vrrp_dbg_auto,
613b45b0 1727 VRRP_LOGPFX VRRP_LOGPFX_VRID VRRP_LOGPFX_FAM
26b6d034
PR
1728 "Adding %pFX",
1729 r->vr->vrid, family2str(r->family), c->address);
ac1429b9
QY
1730 if (r->family == AF_INET)
1731 vrrp_add_ipv4(r->vr, c->address->u.prefix4);
359c72ba 1732 else if (r->vr->version == 3)
ac1429b9
QY
1733 vrrp_add_ipv6(r->vr, c->address->u.prefix6);
1734 }
b637bcd4 1735 }
27fd8827 1736
ac1429b9 1737 vrrp_check_start(r->vr);
6e93585e 1738
ac1429b9 1739 if (r->addrs->count == 0 && r->fsm.state != VRRP_STATE_INITIALIZE) {
b637bcd4 1740 DEBUGD(&vrrp_dbg_auto,
613b45b0
QY
1741 VRRP_LOGPFX VRRP_LOGPFX_VRID VRRP_LOGPFX_FAM
1742 "Virtual IP list is empty; shutting down",
ac1429b9
QY
1743 r->vr->vrid, family2str(r->family));
1744 vrrp_event(r, VRRP_EVENT_SHUTDOWN);
b637bcd4 1745 }
27fd8827 1746}
5435a2bf 1747
53e60e5c
QY
1748static struct vrrp_vrouter *
1749vrrp_autoconfig_autocreate(struct interface *mvl_ifp)
1750{
1751 struct interface *p;
1752 struct vrrp_vrouter *vr;
1753
490810d5 1754 p = if_lookup_by_index(mvl_ifp->link_ifindex, mvl_ifp->vrf_id);
27fd8827
QY
1755
1756 if (!p)
1757 return NULL;
1758
53e60e5c 1759 uint8_t vrid = mvl_ifp->hw_addr[5];
613b45b0 1760 uint8_t fam = mvl_ifp->hw_addr[4];
53e60e5c 1761
00984df7 1762 DEBUGD(&vrrp_dbg_auto,
613b45b0
QY
1763 VRRP_LOGPFX VRRP_LOGPFX_VRID VRRP_LOGPFX_FAM
1764 "Autoconfiguring VRRP on %s",
1765 vrid, family2str(fam), p->name);
53e60e5c 1766
53e60e5c
QY
1767 vr = vrrp_vrouter_create(p, vrid, vrrp_autoconfig_version);
1768
27fd8827 1769 if (!vr) {
613b45b0
QY
1770 zlog_warn(VRRP_LOGPFX VRRP_LOGPFX_VRID VRRP_LOGPFX_FAM
1771 "Failed to autoconfigure VRRP on %s",
1772 vrid, family2str(fam), p->name);
53e60e5c 1773 return NULL;
27fd8827 1774 }
53e60e5c 1775
d37281cb
QY
1776 vr->autoconf = true;
1777
1778 /*
1779 * If these interfaces are protodown on, we need to un-protodown them
1780 * in order to get Zebra to send us their addresses so we can
1781 * autoconfigure them.
1782 */
1783 if (vr->v4->mvl_ifp)
1784 vrrp_zclient_send_interface_protodown(vr->v4->mvl_ifp, false);
1785 if (vr->v6->mvl_ifp)
1786 vrrp_zclient_send_interface_protodown(vr->v6->mvl_ifp, false);
1787
1788 /* If they're not, we can go ahead and add the addresses we have */
ac1429b9
QY
1789 vrrp_autoconfig_autoaddrupdate(vr->v4);
1790 vrrp_autoconfig_autoaddrupdate(vr->v6);
53e60e5c 1791
53e60e5c
QY
1792 return vr;
1793}
1794
6e93585e
QY
1795/*
1796 * Callback to notify autoconfig of interface add.
1797 *
1798 * If the interface is a VRRP-compatible device, and there is no existing VRRP
1799 * router running on it, one is created. All addresses on the interface are
1800 * added to the router.
1801 *
1802 * ifp
1803 * Interface to operate on
1804 *
1805 * Returns:
1806 * -1 on failure
1807 * 0 otherwise
1808 */
1809static int vrrp_autoconfig_if_add(struct interface *ifp)
27fd8827 1810{
2198a5bb
QY
1811 bool created = false;
1812 struct vrrp_vrouter *vr;
1813
27fd8827
QY
1814 if (!vrrp_autoconfig_is_on)
1815 return 0;
1816
27fd8827
QY
1817 if (!ifp || !ifp->link_ifindex || !vrrp_ifp_has_vrrp_mac(ifp))
1818 return -1;
1819
6e93585e 1820 vr = vrrp_lookup_by_if_mvl(ifp);
27fd8827 1821
2198a5bb 1822 if (!vr) {
27fd8827 1823 vr = vrrp_autoconfig_autocreate(ifp);
d37281cb 1824 created = true;
2198a5bb 1825 }
27fd8827 1826
a8f58eb6 1827 if (!vr || !vr->autoconf)
27fd8827 1828 return 0;
d37281cb
QY
1829
1830 if (!created) {
1831 /*
1832 * We didn't create it, but it has already been autoconfigured.
1833 * Try to attach this interface to the existing instance.
1834 */
1835 if (!vr->v4->mvl_ifp) {
1836 vrrp_attach_interface(vr->v4);
1837 /* If we just attached it, make sure it's turned on */
1838 if (vr->v4->mvl_ifp) {
1839 vrrp_zclient_send_interface_protodown(
1840 vr->v4->mvl_ifp, false);
1841 /*
1842 * If it's already up, we can go ahead and add
1843 * the addresses we have
1844 */
1845 vrrp_autoconfig_autoaddrupdate(vr->v4);
1846 }
1847 }
1848 if (!vr->v6->mvl_ifp) {
1849 vrrp_attach_interface(vr->v6);
1850 /* If we just attached it, make sure it's turned on */
1851 if (vr->v6->mvl_ifp) {
1852 vrrp_zclient_send_interface_protodown(
1853 vr->v6->mvl_ifp, false);
1854 /*
1855 * If it's already up, we can go ahead and add
1856 * the addresses we have
1857 */
1858 vrrp_autoconfig_autoaddrupdate(vr->v6);
1859 }
1860 }
27fd8827
QY
1861 }
1862
1863 return 0;
1864}
1865
6e93585e
QY
1866/*
1867 * Callback to notify autoconfig of interface delete.
1868 *
1869 * If the interface is a VRRP-compatible device, and a VRRP router is running
1870 * on it, and that VRRP router was automatically configured, it will be
1871 * deleted. If that was the last router for the corresponding VRID (i.e., if
1872 * this interface was a v4 VRRP interface and no v6 router is configured for
1873 * the same VRID) then the entire virtual router is deleted.
1874 *
1875 * ifp
1876 * Interface to operate on
1877 *
1878 * Returns:
1879 * -1 on failure
1880 * 0 otherwise
1881 */
1882static int vrrp_autoconfig_if_del(struct interface *ifp)
27fd8827
QY
1883{
1884 if (!vrrp_autoconfig_is_on)
1885 return 0;
1886
6e93585e
QY
1887 struct vrrp_vrouter *vr;
1888 struct listnode *ln;
1889 struct list *vrs;
27fd8827 1890
6e93585e 1891 vrs = vrrp_lookup_by_if_any(ifp);
27fd8827 1892
6e93585e
QY
1893 for (ALL_LIST_ELEMENTS_RO(vrs, ln, vr))
1894 if (vr->autoconf
1895 && (!vr->ifp || (!vr->v4->mvl_ifp && !vr->v6->mvl_ifp))) {
b637bcd4
QY
1896 DEBUGD(&vrrp_dbg_auto,
1897 VRRP_LOGPFX VRRP_LOGPFX_VRID
6e93585e
QY
1898 "All VRRP interfaces for instance deleted; destroying autoconfigured VRRP router",
1899 vr->vrid);
1900 vrrp_vrouter_destroy(vr);
b637bcd4 1901 }
27fd8827 1902
6e93585e 1903 list_delete(&vrs);
27fd8827
QY
1904
1905 return 0;
1906}
1907
6e93585e
QY
1908/*
1909 * Callback to notify autoconfig of interface up.
1910 *
8bceffc7
QY
1911 * Creates VRRP instance on interface if it does not exist. Otherwise does
1912 * nothing.
6e93585e
QY
1913 *
1914 * ifp
1915 * Interface to operate on
1916 *
1917 * Returns:
1918 * -1 on failure
1919 * 0 otherwise
1920 */
1921static int vrrp_autoconfig_if_up(struct interface *ifp)
53e60e5c 1922{
27fd8827
QY
1923 if (!vrrp_autoconfig_is_on)
1924 return 0;
1925
6e93585e 1926 struct vrrp_vrouter *vr = vrrp_lookup_by_if_mvl(ifp);
27fd8827
QY
1927
1928 if (vr && !vr->autoconf)
1929 return 0;
1930
1931 if (!vr) {
1932 vrrp_autoconfig_if_add(ifp);
53e60e5c
QY
1933 return 0;
1934 }
1935
27fd8827
QY
1936 return 0;
1937}
1938
6e93585e
QY
1939/*
1940 * Callback to notify autoconfig of interface down.
1941 *
1942 * Does nothing. An interface down event is accompanied by address deletion
1943 * events for all the addresses on the interface; if an autoconfigured VRRP
1944 * router exists on this interface, then it will have all its addresses deleted
1945 * and end up in Initialize.
1946 *
1947 * ifp
1948 * Interface to operate on
1949 *
1950 * Returns:
1951 * -1 on failure
1952 * 0 otherwise
1953 */
1954static int vrrp_autoconfig_if_down(struct interface *ifp)
27fd8827
QY
1955{
1956 if (!vrrp_autoconfig_is_on)
1957 return 0;
1958
1959 return 0;
1960}
1961
6e93585e
QY
1962/*
1963 * Callback to notify autoconfig of a new interface address.
1964 *
1965 * If a VRRP router exists on this interface, its address list is updated to
1966 * match the new address list. If no addresses remain, a Shutdown event is
1967 * issued to the VRRP router.
1968 *
1969 * ifp
1970 * Interface to operate on
1971 *
1972 * Returns:
1973 * -1 on failure
1974 * 0 otherwise
1975 *
1976 */
1977static int vrrp_autoconfig_if_address_add(struct interface *ifp)
27fd8827
QY
1978{
1979 if (!vrrp_autoconfig_is_on)
1980 return 0;
1981
6e93585e 1982 struct vrrp_vrouter *vr = vrrp_lookup_by_if_mvl(ifp);
27fd8827 1983
ac1429b9
QY
1984 if (vr && vr->autoconf) {
1985 if (vr->v4->mvl_ifp == ifp)
1986 vrrp_autoconfig_autoaddrupdate(vr->v4);
1987 else if (vr->v6->mvl_ifp == ifp)
1988 vrrp_autoconfig_autoaddrupdate(vr->v6);
1989 }
27fd8827
QY
1990
1991 return 0;
1992}
1993
6e93585e
QY
1994/*
1995 * Callback to notify autoconfig of a removed interface address.
1996 *
1997 * If a VRRP router exists on this interface, its address list is updated to
1998 * match the new address list. If no addresses remain, a Shutdown event is
1999 * issued to the VRRP router.
2000 *
2001 * ifp
2002 * Interface to operate on
2003 *
2004 * Returns:
2005 * -1 on failure
2006 * 0 otherwise
2007 *
2008 */
2009static int vrrp_autoconfig_if_address_del(struct interface *ifp)
27fd8827
QY
2010{
2011 if (!vrrp_autoconfig_is_on)
2012 return 0;
2013
6e93585e 2014 struct vrrp_vrouter *vr = vrrp_lookup_by_if_mvl(ifp);
27fd8827 2015
ac1429b9
QY
2016 if (vr && vr->autoconf) {
2017 if (vr->v4->mvl_ifp == ifp)
2018 vrrp_autoconfig_autoaddrupdate(vr->v4);
2019 else if (vr->v6->mvl_ifp == ifp)
2020 vrrp_autoconfig_autoaddrupdate(vr->v6);
2021 }
27fd8827
QY
2022
2023 return 0;
2024}
2025
2026int vrrp_autoconfig(void)
2027{
2028 if (!vrrp_autoconfig_is_on)
2029 return 0;
2030
490810d5 2031 struct vrf *vrf;
27fd8827 2032 struct interface *ifp;
53e60e5c 2033
490810d5
QY
2034 RB_FOREACH (vrf, vrf_name_head, &vrfs_by_name) {
2035 FOR_ALL_INTERFACES (vrf, ifp)
2036 vrrp_autoconfig_if_add(ifp);
2037 }
53e60e5c
QY
2038
2039 return 0;
2040}
2041
27fd8827
QY
2042void vrrp_autoconfig_on(int version)
2043{
2044 vrrp_autoconfig_is_on = true;
2045 vrrp_autoconfig_version = version;
2046
2047 vrrp_autoconfig();
2048}
2049
2050void vrrp_autoconfig_off(void)
2051{
2052 vrrp_autoconfig_is_on = false;
2053
2054 struct list *ll = hash_to_list(vrrp_vrouters_hash);
2055
2056 struct listnode *ln;
2057 struct vrrp_vrouter *vr;
2058
2059 for (ALL_LIST_ELEMENTS_RO(ll, ln, vr))
2060 if (vr->autoconf)
2061 vrrp_vrouter_destroy(vr);
2062
2063 list_delete(&ll);
2064}
2065
6e93585e
QY
2066/* Interface tracking ------------------------------------------------------ */
2067
2068/*
2069 * Bind any pending interfaces.
2070 *
2071 * mvl_ifp
2072 * macvlan interface that some VRRP instances might want to bind to
2073 */
2074static void vrrp_bind_pending(struct interface *mvl_ifp)
2075{
2076 struct vrrp_vrouter *vr;
2077
76bcde9e
QY
2078 DEBUGD(&vrrp_dbg_zebra,
2079 VRRP_LOGPFX
2080 "Searching for instances that could use interface %s",
2081 mvl_ifp->name);
2082
6e93585e
QY
2083 vr = vrrp_lookup_by_if_mvl(mvl_ifp);
2084
2085 if (vr) {
76bcde9e
QY
2086 DEBUGD(&vrrp_dbg_zebra,
2087 VRRP_LOGPFX VRRP_LOGPFX_VRID
2088 "<-- This instance can probably use interface %s",
2089 vr->vrid, mvl_ifp->name);
2090
6e93585e
QY
2091 if (mvl_ifp->hw_addr[4] == 0x01 && !vr->v4->mvl_ifp)
2092 vrrp_attach_interface(vr->v4);
2093 else if (mvl_ifp->hw_addr[4] == 0x02 && !vr->v6->mvl_ifp)
2094 vrrp_attach_interface(vr->v6);
2095 }
2096}
2097
2098void vrrp_if_up(struct interface *ifp)
2099{
2100 struct vrrp_vrouter *vr;
2101 struct listnode *ln;
2102 struct list *vrs;
2103
2104 vrrp_bind_pending(ifp);
2105
2106 vrs = vrrp_lookup_by_if_any(ifp);
2107
d60b2ffd 2108 for (ALL_LIST_ELEMENTS_RO(vrs, ln, vr)) {
6e93585e
QY
2109 vrrp_check_start(vr);
2110
ee5aabb6
QY
2111 if (!if_is_operative(ifp))
2112 continue;
2113
d60b2ffd
QY
2114 /*
2115 * Handle the situation in which we performed a state
2116 * transition on this VRRP router but needed to wait for the
2117 * macvlan interface to come up to perform some actions
2118 */
2119 if (ifp == vr->v4->mvl_ifp) {
2120 if (vr->v4->advert_pending) {
2121 DEBUGD(&vrrp_dbg_proto,
2122 VRRP_LOGPFX VRRP_LOGPFX_VRID
613b45b0 2123 VRRP_LOGPFX_FAM
d60b2ffd 2124 "Interface up; sending pending advertisement",
613b45b0 2125 vr->vrid, family2str(vr->v4->family));
d60b2ffd
QY
2126 vrrp_send_advertisement(vr->v4);
2127 vr->v4->advert_pending = false;
2128 }
2129 if (vr->v4->garp_pending) {
2130 DEBUGD(&vrrp_dbg_proto,
2131 VRRP_LOGPFX VRRP_LOGPFX_VRID
613b45b0 2132 VRRP_LOGPFX_FAM
d60b2ffd 2133 "Interface up; sending pending gratuitous ARP",
613b45b0 2134 vr->vrid, family2str(vr->v4->family));
d60b2ffd
QY
2135 vrrp_garp_send_all(vr->v4);
2136 vr->v4->garp_pending = false;
2137 }
2138 }
2139 if (ifp == vr->v6->mvl_ifp) {
2140 if (vr->v6->advert_pending) {
2141 DEBUGD(&vrrp_dbg_proto,
2142 VRRP_LOGPFX VRRP_LOGPFX_VRID
613b45b0 2143 VRRP_LOGPFX_FAM
d60b2ffd 2144 "Interface up; sending pending advertisement",
613b45b0 2145 vr->vrid, family2str(vr->v6->family));
d60b2ffd
QY
2146 vrrp_send_advertisement(vr->v6);
2147 vr->v6->advert_pending = false;
2148 }
2149 if (vr->v6->ndisc_pending) {
2150 DEBUGD(&vrrp_dbg_proto,
2151 VRRP_LOGPFX VRRP_LOGPFX_VRID
613b45b0 2152 VRRP_LOGPFX_FAM
d60b2ffd 2153 "Interface up; sending pending Unsolicited Neighbor Advertisement",
613b45b0 2154 vr->vrid, family2str(vr->v6->family));
d60b2ffd
QY
2155 vrrp_ndisc_una_send_all(vr->v6);
2156 vr->v6->ndisc_pending = false;
2157 }
2158 }
2159 }
2160
6e93585e
QY
2161 list_delete(&vrs);
2162
2163 vrrp_autoconfig_if_up(ifp);
2164}
2165
2166void vrrp_if_down(struct interface *ifp)
2167{
2168 struct vrrp_vrouter *vr;
2169 struct listnode *ln;
2170 struct list *vrs;
2171
2e3d7564
QY
2172 vrrp_bind_pending(ifp);
2173
6e93585e
QY
2174 vrs = vrrp_lookup_by_if_any(ifp);
2175
2176 for (ALL_LIST_ELEMENTS_RO(vrs, ln, vr)) {
2e3d7564
QY
2177 vrrp_check_start(vr);
2178
c4485ad5
QY
2179 if (vr->ifp == ifp || vr->v4->mvl_ifp == ifp
2180 || vr->v6->mvl_ifp == ifp) {
2181 DEBUGD(&vrrp_dbg_auto,
2182 VRRP_LOGPFX VRRP_LOGPFX_VRID "Interface %s down",
2183 vr->vrid, ifp->name);
6e93585e
QY
2184 }
2185 }
2186
2187 list_delete(&vrs);
2188
2189 vrrp_autoconfig_if_down(ifp);
2190}
2191
2192void vrrp_if_add(struct interface *ifp)
2193{
2194 vrrp_bind_pending(ifp);
2195
2196 /* thanks, zebra */
2197 if (CHECK_FLAG(ifp->flags, IFF_UP))
2198 vrrp_if_up(ifp);
2199
2200 vrrp_autoconfig_if_add(ifp);
2201}
2202
2203void vrrp_if_del(struct interface *ifp)
2204{
2205 struct listnode *ln;
2206 struct vrrp_vrouter *vr;
6e93585e
QY
2207
2208 vrrp_if_down(ifp);
2209
2681134b
QY
2210 /*
2211 * You think we'd be able use vrrp_lookup_by_if_any to find interfaces?
2212 * Nah. FRR's interface management is insane. There are no ordering
2213 * guarantees about what interfaces are deleted when. Maybe this is a
2214 * macvlan and its parent was already deleted, in which case its
2215 * ifindex is now IFINDEX_INTERNAL, so ifp->link_ifindex - while still
2216 * valid - doesn't match any interface on the system, meaning we can't
2217 * use any of the vrrp_lookup* functions since they rely on finding the
2218 * base interface of what they're given by following link_ifindex.
2219 *
2220 * Since we need to actually NULL out pointers in this function to
2221 * avoid a UAF - since the caller will (might) free ifp after we return
2222 * - we need to look up based on pointers.
2223 */
2224 struct list *vrs = hash_to_list(vrrp_vrouters_hash);
2225
6e93585e 2226 for (ALL_LIST_ELEMENTS_RO(vrs, ln, vr)) {
2681134b
QY
2227 if (ifp == vr->ifp) {
2228 vrrp_event(vr->v4, VRRP_EVENT_SHUTDOWN);
2229 vrrp_event(vr->v6, VRRP_EVENT_SHUTDOWN);
61980c71 2230 /*
2681134b
QY
2231 * Stands to reason if the base was deleted, so were
2232 * (or will be) its children
61980c71 2233 */
2681134b
QY
2234 vr->v4->mvl_ifp = NULL;
2235 vr->v6->mvl_ifp = NULL;
61980c71 2236 /*
2681134b
QY
2237 * We shouldn't need to lose the reference if it's the
2238 * primary interface, because that was configured
2239 * explicitly in our config, and thus will be kept as a
2240 * stub; to avoid stupid bugs, double check that
61980c71 2241 */
2681134b
QY
2242 assert(ifp->configured);
2243 } else if (ifp == vr->v4->mvl_ifp) {
2244 vrrp_event(vr->v4, VRRP_EVENT_SHUTDOWN);
61980c71 2245 /*
2681134b
QY
2246 * If this is a macvlan, then it wasn't explicitly
2247 * configured and will be deleted when we return from
2248 * this function, so we need to lose the reference
61980c71 2249 */
2681134b
QY
2250 vr->v4->mvl_ifp = NULL;
2251 } else if (ifp == vr->v6->mvl_ifp) {
2252 vrrp_event(vr->v6, VRRP_EVENT_SHUTDOWN);
61980c71 2253 /*
2681134b 2254 * If this is a macvlan, then it wasn't explicitly
61980c71
QY
2255 * configured and will be deleted when we return from
2256 * this function, so we need to lose the reference
2257 */
2681134b 2258 vr->v6->mvl_ifp = NULL;
62475ecd 2259 }
6e93585e
QY
2260 }
2261
2262 list_delete(&vrs);
2263
2264 vrrp_autoconfig_if_del(ifp);
2265}
2266
2267void vrrp_if_address_add(struct interface *ifp)
2268{
2269 struct vrrp_vrouter *vr;
2270 struct listnode *ln;
2271 struct list *vrs;
2272
2273 /*
2274 * We have to do a wide search here, because we need to know when a v6
2275 * macvlan device gets a new address. This is because the macvlan link
2276 * local is used as the source address for v6 advertisements, and hence
2277 * "do I have a link local" constitutes an activation condition for v6
2278 * virtual routers.
2279 */
2280 vrs = vrrp_lookup_by_if_any(ifp);
2281
2282 for (ALL_LIST_ELEMENTS_RO(vrs, ln, vr))
2283 vrrp_check_start(vr);
2284
2285 list_delete(&vrs);
2286
2287 vrrp_autoconfig_if_address_add(ifp);
2288}
2289
2290void vrrp_if_address_del(struct interface *ifp)
2291{
89f34204
QY
2292 /*
2293 * Zebra is stupid and sends us address deletion notifications
2294 * when any of the following condition sets are met:
2295 *
b0ec34c8
QY
2296 * - if_is_operative && address deleted
2297 * - if_is_operative -> !if_is_operative
89f34204
QY
2298 *
2299 * Note that the second one is nonsense, because Zebra behaves as
2300 * though an interface going down means all the addresses on that
2301 * interface got deleted. Which is a problem for autoconfig because all
2302 * the addresses on an interface going away means the VRRP session goes
2303 * to Initialize. However interfaces go down whenever we transition to
2304 * Backup, so this effectively means that for autoconfigured instances
2305 * we actually end up in Initialize whenever we try to go into Backup.
2306 *
2307 * Also, Zebra does NOT send us notifications when:
b0ec34c8 2308 * - !if_is_operative && address deleted
89f34204
QY
2309 *
2310 * Which means if we're in backup and an address is deleted out from
2311 * under us, we won't even know.
2312 *
2313 * The only solution here is to only resynchronize our address list
2314 * when:
2315 *
2316 * - An interfaces comes up
2317 * - An interface address is added
2318 * - An interface address is deleted AND the interface is up
2319 *
2320 * Even though this is only a problem with autoconfig at the moment I'm
2321 * papering over Zebra's braindead semantics here. Every piece of code
2322 * in this function should be protected by a check that the interface
2323 * is up.
2324 */
2fff50ec 2325 if (if_is_operative(ifp))
89f34204 2326 vrrp_autoconfig_if_address_del(ifp);
6e93585e
QY
2327}
2328
27fd8827
QY
2329/* Other ------------------------------------------------------------------- */
2330
f828842a
QY
2331int vrrp_config_write_global(struct vty *vty)
2332{
8cd1d277
QY
2333 unsigned int writes = 0;
2334
2335 if (vrrp_autoconfig_is_on && ++writes)
f828842a
QY
2336 vty_out(vty, "vrrp autoconfigure%s\n",
2337 vrrp_autoconfig_version == 2 ? " version 2" : "");
2338
f495425b 2339 /* FIXME: needs to be udpated for full YANG conversion. */
8cd1d277 2340 if (vd.priority != VRRP_DEFAULT_PRIORITY && ++writes)
6cde4b45 2341 vty_out(vty, "vrrp default priority %hhu\n", vd.priority);
8cd1d277
QY
2342
2343 if (vd.advertisement_interval != VRRP_DEFAULT_ADVINT && ++writes)
2344 vty_out(vty,
0b1321e2 2345 "vrrp default advertisement-interval %u\n",
33b010a9 2346 vd.advertisement_interval * CS2MS);
8cd1d277
QY
2347
2348 if (vd.preempt_mode != VRRP_DEFAULT_PREEMPT && ++writes)
2349 vty_out(vty, "%svrrp default preempt\n",
2350 !vd.preempt_mode ? "no " : "");
2351
2352 if (vd.accept_mode != VRRP_DEFAULT_ACCEPT && ++writes)
2353 vty_out(vty, "%svrrp default accept\n",
2354 !vd.accept_mode ? "no " : "");
2355
2356 if (vd.shutdown != VRRP_DEFAULT_SHUTDOWN && ++writes)
2357 vty_out(vty, "%svrrp default shutdown\n",
2358 !vd.shutdown ? "no " : "");
2359
2360 return writes;
f828842a
QY
2361}
2362
53ca01e5 2363static unsigned int vrrp_hash_key(const void *arg)
5435a2bf 2364{
53ca01e5 2365 const struct vrrp_vrouter *vr = arg;
4f0b6b45 2366 char key[IFNAMSIZ + 64];
2fff50ec 2367
0b1321e2 2368 snprintf(key, sizeof(key), "%s@%u", vr->ifp->name, vr->vrid);
4f0b6b45
QY
2369
2370 return string_hash_make(key);
5435a2bf
QY
2371}
2372
2373static bool vrrp_hash_cmp(const void *arg1, const void *arg2)
2374{
2375 const struct vrrp_vrouter *vr1 = arg1;
2376 const struct vrrp_vrouter *vr2 = arg2;
2377
4f0b6b45 2378 if (vr1->ifp != vr2->ifp)
f06c4576 2379 return false;
4f0b6b45 2380 if (vr1->vrid != vr2->vrid)
f06c4576 2381 return false;
4f0b6b45 2382
f06c4576 2383 return true;
5435a2bf
QY
2384}
2385
2386void vrrp_init(void)
2387{
8cd1d277 2388 /* Set default defaults */
f495425b
QY
2389 vd.version = yang_get_default_uint8("%s/version", VRRP_XPATH_FULL);
2390 vd.priority = yang_get_default_uint8("%s/priority", VRRP_XPATH_FULL);
2391 vd.advertisement_interval = yang_get_default_uint16(
2392 "%s/advertisement-interval", VRRP_XPATH_FULL);
2393 vd.preempt_mode = yang_get_default_bool("%s/preempt", VRRP_XPATH_FULL);
2394 vd.accept_mode =
2395 yang_get_default_bool("%s/accept-mode", VRRP_XPATH_FULL);
8cd1d277
QY
2396 vd.shutdown = VRRP_DEFAULT_SHUTDOWN;
2397
53e60e5c 2398 vrrp_autoconfig_version = 3;
5435a2bf
QY
2399 vrrp_vrouters_hash = hash_create(&vrrp_hash_key, vrrp_hash_cmp,
2400 "VRRP virtual router hash");
2401 vrf_init(NULL, NULL, NULL, NULL, NULL);
2402}
f1175ba9
QY
2403
2404void vrrp_fini(void)
2405{
2406 /* Destroy all instances */
2407 struct list *vrs = hash_to_list(vrrp_vrouters_hash);
2408
2409 struct listnode *ln;
2410 struct vrrp_vrouter *vr;
2411
19c38250 2412 for (ALL_LIST_ELEMENTS_RO(vrs, ln, vr))
f1175ba9 2413 vrrp_vrouter_destroy(vr);
f1175ba9
QY
2414
2415 list_delete(&vrs);
2416
2417 hash_clean(vrrp_vrouters_hash, NULL);
2418 hash_free(vrrp_vrouters_hash);
2419}