]> git.proxmox.com Git - mirror_frr.git/blob - bgpd/bgp_packet.c
[bgpd] Stability fixes including bugs 397, 492
[mirror_frr.git] / bgpd / bgp_packet.c
1 /* BGP packet management routine.
2 Copyright (C) 1999 Kunihiro Ishiguro
3
4 This file is part of GNU Zebra.
5
6 GNU Zebra is free software; you can redistribute it and/or modify it
7 under the terms of the GNU General Public License as published by the
8 Free Software Foundation; either version 2, or (at your option) any
9 later version.
10
11 GNU Zebra is distributed in the hope that it will be useful, but
12 WITHOUT ANY WARRANTY; without even the implied warranty of
13 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
14 General Public License for more details.
15
16 You should have received a copy of the GNU General Public License
17 along with GNU Zebra; see the file COPYING. If not, write to the Free
18 Software Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA
19 02111-1307, USA. */
20
21 #include <zebra.h>
22
23 #include "thread.h"
24 #include "stream.h"
25 #include "network.h"
26 #include "prefix.h"
27 #include "command.h"
28 #include "log.h"
29 #include "memory.h"
30 #include "sockunion.h" /* for inet_ntop () */
31 #include "linklist.h"
32 #include "plist.h"
33
34 #include "bgpd/bgpd.h"
35 #include "bgpd/bgp_table.h"
36 #include "bgpd/bgp_dump.h"
37 #include "bgpd/bgp_attr.h"
38 #include "bgpd/bgp_debug.h"
39 #include "bgpd/bgp_fsm.h"
40 #include "bgpd/bgp_route.h"
41 #include "bgpd/bgp_packet.h"
42 #include "bgpd/bgp_open.h"
43 #include "bgpd/bgp_aspath.h"
44 #include "bgpd/bgp_community.h"
45 #include "bgpd/bgp_ecommunity.h"
46 #include "bgpd/bgp_network.h"
47 #include "bgpd/bgp_mplsvpn.h"
48 #include "bgpd/bgp_advertise.h"
49 #include "bgpd/bgp_vty.h"
50
51 int stream_put_prefix (struct stream *, struct prefix *);
52 \f
53 /* Set up BGP packet marker and packet type. */
54 static int
55 bgp_packet_set_marker (struct stream *s, u_char type)
56 {
57 int i;
58
59 /* Fill in marker. */
60 for (i = 0; i < BGP_MARKER_SIZE; i++)
61 stream_putc (s, 0xff);
62
63 /* Dummy total length. This field is should be filled in later on. */
64 stream_putw (s, 0);
65
66 /* BGP packet type. */
67 stream_putc (s, type);
68
69 /* Return current stream size. */
70 return stream_get_endp (s);
71 }
72
73 /* Set BGP packet header size entry. If size is zero then use current
74 stream size. */
75 static int
76 bgp_packet_set_size (struct stream *s)
77 {
78 int cp;
79
80 /* Preserve current pointer. */
81 cp = stream_get_endp (s);
82 stream_putw_at (s, BGP_MARKER_SIZE, cp);
83
84 return cp;
85 }
86
87 /* Add new packet to the peer. */
88 static void
89 bgp_packet_add (struct peer *peer, struct stream *s)
90 {
91 /* Add packet to the end of list. */
92 stream_fifo_push (peer->obuf, s);
93 }
94
95 /* Free first packet. */
96 static void
97 bgp_packet_delete (struct peer *peer)
98 {
99 stream_free (stream_fifo_pop (peer->obuf));
100 }
101
102 /* Check file descriptor whether connect is established. */
103 static void
104 bgp_connect_check (struct peer *peer)
105 {
106 int status;
107 socklen_t slen;
108 int ret;
109
110 /* Anyway I have to reset read and write thread. */
111 BGP_READ_OFF (peer->t_read);
112 BGP_WRITE_OFF (peer->t_write);
113
114 /* Check file descriptor. */
115 slen = sizeof (status);
116 ret = getsockopt(peer->fd, SOL_SOCKET, SO_ERROR, (void *) &status, &slen);
117
118 /* If getsockopt is fail, this is fatal error. */
119 if (ret < 0)
120 {
121 zlog (peer->log, LOG_INFO, "can't get sockopt for nonblocking connect");
122 BGP_EVENT_ADD (peer, TCP_fatal_error);
123 return;
124 }
125
126 /* When status is 0 then TCP connection is established. */
127 if (status == 0)
128 {
129 BGP_EVENT_ADD (peer, TCP_connection_open);
130 }
131 else
132 {
133 if (BGP_DEBUG (events, EVENTS))
134 plog_debug (peer->log, "%s [Event] Connect failed (%s)",
135 peer->host, safe_strerror (errno));
136 BGP_EVENT_ADD (peer, TCP_connection_open_failed);
137 }
138 }
139
140 /* Make BGP update packet. */
141 static struct stream *
142 bgp_update_packet (struct peer *peer, afi_t afi, safi_t safi)
143 {
144 struct stream *s;
145 struct bgp_adj_out *adj;
146 struct bgp_advertise *adv;
147 struct stream *packet;
148 struct bgp_node *rn = NULL;
149 struct bgp_info *binfo = NULL;
150 bgp_size_t total_attr_len = 0;
151 unsigned long pos;
152 char buf[BUFSIZ];
153
154 s = peer->work;
155 stream_reset (s);
156
157 adv = FIFO_HEAD (&peer->sync[afi][safi]->update);
158
159 while (adv)
160 {
161 assert (adv->rn);
162 rn = adv->rn;
163 adj = adv->adj;
164 if (adv->binfo)
165 binfo = adv->binfo;
166
167 /* When remaining space can't include NLRI and it's length. */
168 if (STREAM_REMAIN (s) <= BGP_NLRI_LENGTH + PSIZE (rn->p.prefixlen))
169 break;
170
171 /* If packet is empty, set attribute. */
172 if (stream_empty (s))
173 {
174 struct prefix_rd *prd = NULL;
175 u_char *tag = NULL;
176 struct peer *from = NULL;
177
178 if (rn->prn)
179 prd = (struct prefix_rd *) &rn->prn->p;
180 if (binfo && binfo->extra)
181 {
182 tag = binfo->extra->tag;
183 from = binfo->peer;
184 }
185
186 bgp_packet_set_marker (s, BGP_MSG_UPDATE);
187 stream_putw (s, 0);
188 pos = stream_get_endp (s);
189 stream_putw (s, 0);
190 total_attr_len = bgp_packet_attribute (NULL, peer, s,
191 adv->baa->attr,
192 &rn->p, afi, safi,
193 from, prd, tag);
194 stream_putw_at (s, pos, total_attr_len);
195 }
196
197 if (afi == AFI_IP && safi == SAFI_UNICAST)
198 stream_put_prefix (s, &rn->p);
199
200 if (BGP_DEBUG (update, UPDATE_OUT))
201 zlog (peer->log, LOG_DEBUG, "%s send UPDATE %s/%d",
202 peer->host,
203 inet_ntop (rn->p.family, &(rn->p.u.prefix), buf, BUFSIZ),
204 rn->p.prefixlen);
205
206 /* Synchnorize attribute. */
207 if (adj->attr)
208 bgp_attr_unintern (adj->attr);
209 else
210 peer->scount[afi][safi]++;
211
212 adj->attr = bgp_attr_intern (adv->baa->attr);
213
214 adv = bgp_advertise_clean (peer, adj, afi, safi);
215
216 if (! (afi == AFI_IP && safi == SAFI_UNICAST))
217 break;
218 }
219
220 if (! stream_empty (s))
221 {
222 bgp_packet_set_size (s);
223 packet = stream_dup (s);
224 bgp_packet_add (peer, packet);
225 BGP_WRITE_ON (peer->t_write, bgp_write, peer->fd);
226 stream_reset (s);
227 return packet;
228 }
229 return NULL;
230 }
231
232 static struct stream *
233 bgp_update_packet_eor (struct peer *peer, afi_t afi, safi_t safi)
234 {
235 struct stream *s;
236 struct stream *packet;
237
238 if (DISABLE_BGP_ANNOUNCE)
239 return NULL;
240
241 if (BGP_DEBUG (normal, NORMAL))
242 zlog_debug ("send End-of-RIB for %s to %s", afi_safi_print (afi, safi), peer->host);
243
244 s = stream_new (BGP_MAX_PACKET_SIZE);
245
246 /* Make BGP update packet. */
247 bgp_packet_set_marker (s, BGP_MSG_UPDATE);
248
249 /* Unfeasible Routes Length */
250 stream_putw (s, 0);
251
252 if (afi == AFI_IP && safi == SAFI_UNICAST)
253 {
254 /* Total Path Attribute Length */
255 stream_putw (s, 0);
256 }
257 else
258 {
259 /* Total Path Attribute Length */
260 stream_putw (s, 6);
261 stream_putc (s, BGP_ATTR_FLAG_OPTIONAL);
262 stream_putc (s, BGP_ATTR_MP_UNREACH_NLRI);
263 stream_putc (s, 3);
264 stream_putw (s, afi);
265 stream_putc (s, safi);
266 }
267
268 bgp_packet_set_size (s);
269 packet = stream_dup (s);
270 bgp_packet_add (peer, packet);
271 stream_free (s);
272 return packet;
273 }
274
275 /* Make BGP withdraw packet. */
276 static struct stream *
277 bgp_withdraw_packet (struct peer *peer, afi_t afi, safi_t safi)
278 {
279 struct stream *s;
280 struct stream *packet;
281 struct bgp_adj_out *adj;
282 struct bgp_advertise *adv;
283 struct bgp_node *rn;
284 unsigned long pos;
285 bgp_size_t unfeasible_len;
286 bgp_size_t total_attr_len;
287 char buf[BUFSIZ];
288
289 s = peer->work;
290 stream_reset (s);
291
292 while ((adv = FIFO_HEAD (&peer->sync[afi][safi]->withdraw)) != NULL)
293 {
294 assert (adv->rn);
295 adj = adv->adj;
296 rn = adv->rn;
297
298 if (STREAM_REMAIN (s)
299 < (BGP_NLRI_LENGTH + BGP_TOTAL_ATTR_LEN + PSIZE (rn->p.prefixlen)))
300 break;
301
302 if (stream_empty (s))
303 {
304 bgp_packet_set_marker (s, BGP_MSG_UPDATE);
305 stream_putw (s, 0);
306 }
307
308 if (afi == AFI_IP && safi == SAFI_UNICAST)
309 stream_put_prefix (s, &rn->p);
310 else
311 {
312 struct prefix_rd *prd = NULL;
313
314 if (rn->prn)
315 prd = (struct prefix_rd *) &rn->prn->p;
316 pos = stream_get_endp (s);
317 stream_putw (s, 0);
318 total_attr_len
319 = bgp_packet_withdraw (peer, s, &rn->p, afi, safi, prd, NULL);
320
321 /* Set total path attribute length. */
322 stream_putw_at (s, pos, total_attr_len);
323 }
324
325 if (BGP_DEBUG (update, UPDATE_OUT))
326 zlog (peer->log, LOG_DEBUG, "%s send UPDATE %s/%d -- unreachable",
327 peer->host,
328 inet_ntop (rn->p.family, &(rn->p.u.prefix), buf, BUFSIZ),
329 rn->p.prefixlen);
330
331 peer->scount[afi][safi]--;
332
333 bgp_adj_out_remove (rn, adj, peer, afi, safi);
334 bgp_unlock_node (rn);
335
336 if (! (afi == AFI_IP && safi == SAFI_UNICAST))
337 break;
338 }
339
340 if (! stream_empty (s))
341 {
342 if (afi == AFI_IP && safi == SAFI_UNICAST)
343 {
344 unfeasible_len
345 = stream_get_endp (s) - BGP_HEADER_SIZE - BGP_UNFEASIBLE_LEN;
346 stream_putw_at (s, BGP_HEADER_SIZE, unfeasible_len);
347 stream_putw (s, 0);
348 }
349 bgp_packet_set_size (s);
350 packet = stream_dup (s);
351 bgp_packet_add (peer, packet);
352 stream_reset (s);
353 return packet;
354 }
355
356 return NULL;
357 }
358
359 void
360 bgp_default_update_send (struct peer *peer, struct attr *attr,
361 afi_t afi, safi_t safi, struct peer *from)
362 {
363 struct stream *s;
364 struct stream *packet;
365 struct prefix p;
366 unsigned long pos;
367 bgp_size_t total_attr_len;
368 char attrstr[BUFSIZ];
369 char buf[BUFSIZ];
370
371 if (DISABLE_BGP_ANNOUNCE)
372 return;
373
374 if (afi == AFI_IP)
375 str2prefix ("0.0.0.0/0", &p);
376 #ifdef HAVE_IPV6
377 else
378 str2prefix ("::/0", &p);
379 #endif /* HAVE_IPV6 */
380
381 /* Logging the attribute. */
382 if (BGP_DEBUG (update, UPDATE_OUT))
383 {
384 bgp_dump_attr (peer, attr, attrstr, BUFSIZ);
385 zlog (peer->log, LOG_DEBUG, "%s send UPDATE %s/%d %s",
386 peer->host, inet_ntop(p.family, &(p.u.prefix), buf, BUFSIZ),
387 p.prefixlen, attrstr);
388 }
389
390 s = stream_new (BGP_MAX_PACKET_SIZE);
391
392 /* Make BGP update packet. */
393 bgp_packet_set_marker (s, BGP_MSG_UPDATE);
394
395 /* Unfeasible Routes Length. */
396 stream_putw (s, 0);
397
398 /* Make place for total attribute length. */
399 pos = stream_get_endp (s);
400 stream_putw (s, 0);
401 total_attr_len = bgp_packet_attribute (NULL, peer, s, attr, &p, afi, safi, from, NULL, NULL);
402
403 /* Set Total Path Attribute Length. */
404 stream_putw_at (s, pos, total_attr_len);
405
406 /* NLRI set. */
407 if (p.family == AF_INET && safi == SAFI_UNICAST)
408 stream_put_prefix (s, &p);
409
410 /* Set size. */
411 bgp_packet_set_size (s);
412
413 packet = stream_dup (s);
414 stream_free (s);
415
416 /* Dump packet if debug option is set. */
417 #ifdef DEBUG
418 /* bgp_packet_dump (packet); */
419 #endif /* DEBUG */
420
421 /* Add packet to the peer. */
422 bgp_packet_add (peer, packet);
423
424 BGP_WRITE_ON (peer->t_write, bgp_write, peer->fd);
425 }
426
427 void
428 bgp_default_withdraw_send (struct peer *peer, afi_t afi, safi_t safi)
429 {
430 struct stream *s;
431 struct stream *packet;
432 struct prefix p;
433 unsigned long pos;
434 unsigned long cp;
435 bgp_size_t unfeasible_len;
436 bgp_size_t total_attr_len;
437 char buf[BUFSIZ];
438
439 if (DISABLE_BGP_ANNOUNCE)
440 return;
441
442 if (afi == AFI_IP)
443 str2prefix ("0.0.0.0/0", &p);
444 #ifdef HAVE_IPV6
445 else
446 str2prefix ("::/0", &p);
447 #endif /* HAVE_IPV6 */
448
449 total_attr_len = 0;
450 pos = 0;
451
452 if (BGP_DEBUG (update, UPDATE_OUT))
453 zlog (peer->log, LOG_DEBUG, "%s send UPDATE %s/%d -- unreachable",
454 peer->host, inet_ntop(p.family, &(p.u.prefix), buf, BUFSIZ),
455 p.prefixlen);
456
457 s = stream_new (BGP_MAX_PACKET_SIZE);
458
459 /* Make BGP update packet. */
460 bgp_packet_set_marker (s, BGP_MSG_UPDATE);
461
462 /* Unfeasible Routes Length. */;
463 cp = stream_get_endp (s);
464 stream_putw (s, 0);
465
466 /* Withdrawn Routes. */
467 if (p.family == AF_INET && safi == SAFI_UNICAST)
468 {
469 stream_put_prefix (s, &p);
470
471 unfeasible_len = stream_get_endp (s) - cp - 2;
472
473 /* Set unfeasible len. */
474 stream_putw_at (s, cp, unfeasible_len);
475
476 /* Set total path attribute length. */
477 stream_putw (s, 0);
478 }
479 else
480 {
481 pos = stream_get_endp (s);
482 stream_putw (s, 0);
483 total_attr_len = bgp_packet_withdraw (peer, s, &p, afi, safi, NULL, NULL);
484
485 /* Set total path attribute length. */
486 stream_putw_at (s, pos, total_attr_len);
487 }
488
489 bgp_packet_set_size (s);
490
491 packet = stream_dup (s);
492 stream_free (s);
493
494 /* Add packet to the peer. */
495 bgp_packet_add (peer, packet);
496
497 BGP_WRITE_ON (peer->t_write, bgp_write, peer->fd);
498 }
499
500 /* Get next packet to be written. */
501 static struct stream *
502 bgp_write_packet (struct peer *peer)
503 {
504 afi_t afi;
505 safi_t safi;
506 struct stream *s = NULL;
507 struct bgp_advertise *adv;
508
509 s = stream_fifo_head (peer->obuf);
510 if (s)
511 return s;
512
513 for (afi = AFI_IP; afi < AFI_MAX; afi++)
514 for (safi = SAFI_UNICAST; safi < SAFI_MAX; safi++)
515 {
516 adv = FIFO_HEAD (&peer->sync[afi][safi]->withdraw);
517 if (adv)
518 {
519 s = bgp_withdraw_packet (peer, afi, safi);
520 if (s)
521 return s;
522 }
523 }
524
525 for (afi = AFI_IP; afi < AFI_MAX; afi++)
526 for (safi = SAFI_UNICAST; safi < SAFI_MAX; safi++)
527 {
528 adv = FIFO_HEAD (&peer->sync[afi][safi]->update);
529 if (adv)
530 {
531 if (adv->binfo && adv->binfo->uptime < peer->synctime)
532 {
533 if (CHECK_FLAG (adv->binfo->peer->cap, PEER_CAP_RESTART_RCV)
534 && CHECK_FLAG (adv->binfo->peer->cap, PEER_CAP_RESTART_ADV)
535 && ! CHECK_FLAG (adv->binfo->flags, BGP_INFO_STALE)
536 && safi != SAFI_MPLS_VPN)
537 {
538 if (CHECK_FLAG (adv->binfo->peer->af_sflags[afi][safi],
539 PEER_STATUS_EOR_RECEIVED))
540 s = bgp_update_packet (peer, afi, safi);
541 }
542 else
543 s = bgp_update_packet (peer, afi, safi);
544 }
545
546 if (s)
547 return s;
548 }
549
550 if (CHECK_FLAG (peer->cap, PEER_CAP_RESTART_RCV))
551 {
552 if (peer->afc_nego[afi][safi] && peer->synctime
553 && ! CHECK_FLAG (peer->af_sflags[afi][safi], PEER_STATUS_EOR_SEND)
554 && safi != SAFI_MPLS_VPN)
555 {
556 SET_FLAG (peer->af_sflags[afi][safi], PEER_STATUS_EOR_SEND);
557 return bgp_update_packet_eor (peer, afi, safi);
558 }
559 }
560 }
561
562 return NULL;
563 }
564
565 /* Is there partially written packet or updates we can send right
566 now. */
567 static int
568 bgp_write_proceed (struct peer *peer)
569 {
570 afi_t afi;
571 safi_t safi;
572 struct bgp_advertise *adv;
573
574 if (stream_fifo_head (peer->obuf))
575 return 1;
576
577 for (afi = AFI_IP; afi < AFI_MAX; afi++)
578 for (safi = SAFI_UNICAST; safi < SAFI_MAX; safi++)
579 if (FIFO_HEAD (&peer->sync[afi][safi]->withdraw))
580 return 1;
581
582 for (afi = AFI_IP; afi < AFI_MAX; afi++)
583 for (safi = SAFI_UNICAST; safi < SAFI_MAX; safi++)
584 if ((adv = FIFO_HEAD (&peer->sync[afi][safi]->update)) != NULL)
585 if (adv->binfo->uptime < peer->synctime)
586 return 1;
587
588 return 0;
589 }
590
591 /* Write packet to the peer. */
592 int
593 bgp_write (struct thread *thread)
594 {
595 struct peer *peer;
596 u_char type;
597 struct stream *s;
598 int num;
599 unsigned int count = 0;
600 int write_errno;
601
602 /* Yes first of all get peer pointer. */
603 peer = THREAD_ARG (thread);
604 peer->t_write = NULL;
605
606 /* For non-blocking IO check. */
607 if (peer->status == Connect)
608 {
609 bgp_connect_check (peer);
610 return 0;
611 }
612
613 /* Nonblocking write until TCP output buffer is full. */
614 while (1)
615 {
616 int writenum;
617 int val;
618
619 s = bgp_write_packet (peer);
620 if (! s)
621 return 0;
622
623 /* XXX: FIXME, the socket should be NONBLOCK from the start
624 * status shouldnt need to be toggled on each write
625 */
626 val = fcntl (peer->fd, F_GETFL, 0);
627 fcntl (peer->fd, F_SETFL, val|O_NONBLOCK);
628
629 /* Number of bytes to be sent. */
630 writenum = stream_get_endp (s) - stream_get_getp (s);
631
632 /* Call write() system call. */
633 num = write (peer->fd, STREAM_PNT (s), writenum);
634 write_errno = errno;
635 fcntl (peer->fd, F_SETFL, val);
636 if (num <= 0)
637 {
638 /* Partial write. */
639 if (write_errno == EWOULDBLOCK || write_errno == EAGAIN)
640 break;
641
642 BGP_EVENT_ADD (peer, TCP_fatal_error);
643 return 0;
644 }
645 if (num != writenum)
646 {
647 stream_forward_getp (s, num);
648
649 if (write_errno == EAGAIN)
650 break;
651
652 continue;
653 }
654
655 /* Retrieve BGP packet type. */
656 stream_set_getp (s, BGP_MARKER_SIZE + 2);
657 type = stream_getc (s);
658
659 switch (type)
660 {
661 case BGP_MSG_OPEN:
662 peer->open_out++;
663 break;
664 case BGP_MSG_UPDATE:
665 peer->update_out++;
666 break;
667 case BGP_MSG_NOTIFY:
668 peer->notify_out++;
669 /* Double start timer. */
670 peer->v_start *= 2;
671
672 /* Overflow check. */
673 if (peer->v_start >= (60 * 2))
674 peer->v_start = (60 * 2);
675
676 /* Flush any existing events */
677 BGP_EVENT_ADD (peer, BGP_Stop);
678 return 0;
679 case BGP_MSG_KEEPALIVE:
680 peer->keepalive_out++;
681 break;
682 case BGP_MSG_ROUTE_REFRESH_NEW:
683 case BGP_MSG_ROUTE_REFRESH_OLD:
684 peer->refresh_out++;
685 break;
686 case BGP_MSG_CAPABILITY:
687 peer->dynamic_cap_out++;
688 break;
689 }
690
691 /* OK we send packet so delete it. */
692 bgp_packet_delete (peer);
693
694 if (++count >= BGP_WRITE_PACKET_MAX)
695 break;
696 }
697
698 if (bgp_write_proceed (peer))
699 BGP_WRITE_ON (peer->t_write, bgp_write, peer->fd);
700
701 return 0;
702 }
703
704 /* This is only for sending NOTIFICATION message to neighbor. */
705 static int
706 bgp_write_notify (struct peer *peer)
707 {
708 int ret;
709 u_char type;
710 struct stream *s;
711
712 /* There should be at least one packet. */
713 s = stream_fifo_head (peer->obuf);
714 if (!s)
715 return 0;
716 assert (stream_get_endp (s) >= BGP_HEADER_SIZE);
717
718 /* I'm not sure fd is writable. */
719 ret = writen (peer->fd, STREAM_DATA (s), stream_get_endp (s));
720 if (ret <= 0)
721 {
722 BGP_EVENT_ADD (peer, TCP_fatal_error);
723 return 0;
724 }
725
726 /* Retrieve BGP packet type. */
727 stream_set_getp (s, BGP_MARKER_SIZE + 2);
728 type = stream_getc (s);
729
730 assert (type == BGP_MSG_NOTIFY);
731
732 /* Type should be notify. */
733 peer->notify_out++;
734
735 /* Double start timer. */
736 peer->v_start *= 2;
737
738 /* Overflow check. */
739 if (peer->v_start >= (60 * 2))
740 peer->v_start = (60 * 2);
741
742 BGP_EVENT_ADD (peer, BGP_Stop);
743
744 return 0;
745 }
746
747 /* Make keepalive packet and send it to the peer. */
748 void
749 bgp_keepalive_send (struct peer *peer)
750 {
751 struct stream *s;
752 int length;
753
754 s = stream_new (BGP_MAX_PACKET_SIZE);
755
756 /* Make keepalive packet. */
757 bgp_packet_set_marker (s, BGP_MSG_KEEPALIVE);
758
759 /* Set packet size. */
760 length = bgp_packet_set_size (s);
761
762 /* Dump packet if debug option is set. */
763 /* bgp_packet_dump (s); */
764
765 if (BGP_DEBUG (keepalive, KEEPALIVE))
766 zlog_debug ("%s sending KEEPALIVE", peer->host);
767 if (BGP_DEBUG (normal, NORMAL))
768 zlog_debug ("%s send message type %d, length (incl. header) %d",
769 peer->host, BGP_MSG_KEEPALIVE, length);
770
771 /* Add packet to the peer. */
772 bgp_packet_add (peer, s);
773
774 BGP_WRITE_ON (peer->t_write, bgp_write, peer->fd);
775 }
776
777 /* Make open packet and send it to the peer. */
778 void
779 bgp_open_send (struct peer *peer)
780 {
781 struct stream *s;
782 int length;
783 u_int16_t send_holdtime;
784 as_t local_as;
785
786 if (CHECK_FLAG (peer->config, PEER_CONFIG_TIMER))
787 send_holdtime = peer->holdtime;
788 else
789 send_holdtime = peer->bgp->default_holdtime;
790
791 /* local-as Change */
792 if (peer->change_local_as)
793 local_as = peer->change_local_as;
794 else
795 local_as = peer->local_as;
796
797 s = stream_new (BGP_MAX_PACKET_SIZE);
798
799 /* Make open packet. */
800 bgp_packet_set_marker (s, BGP_MSG_OPEN);
801
802 /* Set open packet values. */
803 stream_putc (s, BGP_VERSION_4); /* BGP version */
804 stream_putw (s, (local_as <= BGP_AS_MAX) ? (u_int16_t) local_as
805 : BGP_AS_TRANS);
806 stream_putw (s, send_holdtime); /* Hold Time */
807 stream_put_in_addr (s, &peer->local_id); /* BGP Identifier */
808
809 /* Set capability code. */
810 bgp_open_capability (s, peer);
811
812 /* Set BGP packet length. */
813 length = bgp_packet_set_size (s);
814
815 if (BGP_DEBUG (normal, NORMAL))
816 zlog_debug ("%s sending OPEN, version %d, my as %u, holdtime %d, id %s",
817 peer->host, BGP_VERSION_4, local_as,
818 send_holdtime, inet_ntoa (peer->local_id));
819
820 if (BGP_DEBUG (normal, NORMAL))
821 zlog_debug ("%s send message type %d, length (incl. header) %d",
822 peer->host, BGP_MSG_OPEN, length);
823
824 /* Dump packet if debug option is set. */
825 /* bgp_packet_dump (s); */
826
827 /* Add packet to the peer. */
828 bgp_packet_add (peer, s);
829
830 BGP_WRITE_ON (peer->t_write, bgp_write, peer->fd);
831 }
832
833 /* Send BGP notify packet with data potion. */
834 void
835 bgp_notify_send_with_data (struct peer *peer, u_char code, u_char sub_code,
836 u_char *data, size_t datalen)
837 {
838 struct stream *s;
839 int length;
840
841 /* Allocate new stream. */
842 s = stream_new (BGP_MAX_PACKET_SIZE);
843
844 /* Make nitify packet. */
845 bgp_packet_set_marker (s, BGP_MSG_NOTIFY);
846
847 /* Set notify packet values. */
848 stream_putc (s, code); /* BGP notify code */
849 stream_putc (s, sub_code); /* BGP notify sub_code */
850
851 /* If notify data is present. */
852 if (data)
853 stream_write (s, data, datalen);
854
855 /* Set BGP packet length. */
856 length = bgp_packet_set_size (s);
857
858 /* Add packet to the peer. */
859 stream_fifo_clean (peer->obuf);
860 bgp_packet_add (peer, s);
861
862 /* For debug */
863 {
864 struct bgp_notify bgp_notify;
865 int first = 0;
866 int i;
867 char c[4];
868
869 bgp_notify.code = code;
870 bgp_notify.subcode = sub_code;
871 bgp_notify.data = NULL;
872 bgp_notify.length = length - BGP_MSG_NOTIFY_MIN_SIZE;
873
874 if (bgp_notify.length)
875 {
876 bgp_notify.data = XMALLOC (MTYPE_TMP, bgp_notify.length * 3);
877 for (i = 0; i < bgp_notify.length; i++)
878 if (first)
879 {
880 sprintf (c, " %02x", data[i]);
881 strcat (bgp_notify.data, c);
882 }
883 else
884 {
885 first = 1;
886 sprintf (c, "%02x", data[i]);
887 strcpy (bgp_notify.data, c);
888 }
889 }
890 bgp_notify_print (peer, &bgp_notify, "sending");
891 if (bgp_notify.data)
892 XFREE (MTYPE_TMP, bgp_notify.data);
893 }
894
895 if (BGP_DEBUG (normal, NORMAL))
896 zlog_debug ("%s send message type %d, length (incl. header) %d",
897 peer->host, BGP_MSG_NOTIFY, length);
898
899 /* peer reset cause */
900 if (sub_code != BGP_NOTIFY_CEASE_CONFIG_CHANGE)
901 {
902 if (sub_code == BGP_NOTIFY_CEASE_ADMIN_RESET)
903 peer->last_reset = PEER_DOWN_USER_RESET;
904 else if (sub_code == BGP_NOTIFY_CEASE_ADMIN_SHUTDOWN)
905 peer->last_reset = PEER_DOWN_USER_SHUTDOWN;
906 else
907 peer->last_reset = PEER_DOWN_NOTIFY_SEND;
908 }
909
910 /* Call imidiately. */
911 BGP_WRITE_OFF (peer->t_write);
912
913 bgp_write_notify (peer);
914 }
915
916 /* Send BGP notify packet. */
917 void
918 bgp_notify_send (struct peer *peer, u_char code, u_char sub_code)
919 {
920 bgp_notify_send_with_data (peer, code, sub_code, NULL, 0);
921 }
922
923 static const char *
924 afi2str (afi_t afi)
925 {
926 if (afi == AFI_IP)
927 return "AFI_IP";
928 else if (afi == AFI_IP6)
929 return "AFI_IP6";
930 else
931 return "Unknown AFI";
932 }
933
934 static const char *
935 safi2str (safi_t safi)
936 {
937 if (safi == SAFI_UNICAST)
938 return "SAFI_UNICAST";
939 else if (safi == SAFI_MULTICAST)
940 return "SAFI_MULTICAST";
941 else if (safi == SAFI_MPLS_VPN || safi == BGP_SAFI_VPNV4)
942 return "SAFI_MPLS_VPN";
943 else
944 return "Unknown SAFI";
945 }
946
947 /* Send route refresh message to the peer. */
948 void
949 bgp_route_refresh_send (struct peer *peer, afi_t afi, safi_t safi,
950 u_char orf_type, u_char when_to_refresh, int remove)
951 {
952 struct stream *s;
953 struct stream *packet;
954 int length;
955 struct bgp_filter *filter;
956 int orf_refresh = 0;
957
958 if (DISABLE_BGP_ANNOUNCE)
959 return;
960
961 filter = &peer->filter[afi][safi];
962
963 /* Adjust safi code. */
964 if (safi == SAFI_MPLS_VPN)
965 safi = BGP_SAFI_VPNV4;
966
967 s = stream_new (BGP_MAX_PACKET_SIZE);
968
969 /* Make BGP update packet. */
970 if (CHECK_FLAG (peer->cap, PEER_CAP_REFRESH_NEW_RCV))
971 bgp_packet_set_marker (s, BGP_MSG_ROUTE_REFRESH_NEW);
972 else
973 bgp_packet_set_marker (s, BGP_MSG_ROUTE_REFRESH_OLD);
974
975 /* Encode Route Refresh message. */
976 stream_putw (s, afi);
977 stream_putc (s, 0);
978 stream_putc (s, safi);
979
980 if (orf_type == ORF_TYPE_PREFIX
981 || orf_type == ORF_TYPE_PREFIX_OLD)
982 if (remove || filter->plist[FILTER_IN].plist)
983 {
984 u_int16_t orf_len;
985 unsigned long orfp;
986
987 orf_refresh = 1;
988 stream_putc (s, when_to_refresh);
989 stream_putc (s, orf_type);
990 orfp = stream_get_endp (s);
991 stream_putw (s, 0);
992
993 if (remove)
994 {
995 UNSET_FLAG (peer->af_sflags[afi][safi], PEER_STATUS_ORF_PREFIX_SEND);
996 stream_putc (s, ORF_COMMON_PART_REMOVE_ALL);
997 if (BGP_DEBUG (normal, NORMAL))
998 zlog_debug ("%s sending REFRESH_REQ to remove ORF(%d) (%s) for afi/safi: %d/%d",
999 peer->host, orf_type,
1000 (when_to_refresh == REFRESH_DEFER ? "defer" : "immediate"),
1001 afi, safi);
1002 }
1003 else
1004 {
1005 SET_FLAG (peer->af_sflags[afi][safi], PEER_STATUS_ORF_PREFIX_SEND);
1006 prefix_bgp_orf_entry (s, filter->plist[FILTER_IN].plist,
1007 ORF_COMMON_PART_ADD, ORF_COMMON_PART_PERMIT,
1008 ORF_COMMON_PART_DENY);
1009 if (BGP_DEBUG (normal, NORMAL))
1010 zlog_debug ("%s sending REFRESH_REQ with pfxlist ORF(%d) (%s) for afi/safi: %d/%d",
1011 peer->host, orf_type,
1012 (when_to_refresh == REFRESH_DEFER ? "defer" : "immediate"),
1013 afi, safi);
1014 }
1015
1016 /* Total ORF Entry Len. */
1017 orf_len = stream_get_endp (s) - orfp - 2;
1018 stream_putw_at (s, orfp, orf_len);
1019 }
1020
1021 /* Set packet size. */
1022 length = bgp_packet_set_size (s);
1023
1024 if (BGP_DEBUG (normal, NORMAL))
1025 {
1026 if (! orf_refresh)
1027 zlog_debug ("%s sending REFRESH_REQ for afi/safi: %d/%d",
1028 peer->host, afi, safi);
1029 zlog_debug ("%s send message type %d, length (incl. header) %d",
1030 peer->host, CHECK_FLAG (peer->cap, PEER_CAP_REFRESH_NEW_RCV) ?
1031 BGP_MSG_ROUTE_REFRESH_NEW : BGP_MSG_ROUTE_REFRESH_OLD, length);
1032 }
1033
1034 /* Make real packet. */
1035 packet = stream_dup (s);
1036 stream_free (s);
1037
1038 /* Add packet to the peer. */
1039 bgp_packet_add (peer, packet);
1040
1041 BGP_WRITE_ON (peer->t_write, bgp_write, peer->fd);
1042 }
1043
1044 /* Send capability message to the peer. */
1045 void
1046 bgp_capability_send (struct peer *peer, afi_t afi, safi_t safi,
1047 int capability_code, int action)
1048 {
1049 struct stream *s;
1050 struct stream *packet;
1051 int length;
1052
1053 /* Adjust safi code. */
1054 if (safi == SAFI_MPLS_VPN)
1055 safi = BGP_SAFI_VPNV4;
1056
1057 s = stream_new (BGP_MAX_PACKET_SIZE);
1058
1059 /* Make BGP update packet. */
1060 bgp_packet_set_marker (s, BGP_MSG_CAPABILITY);
1061
1062 /* Encode MP_EXT capability. */
1063 if (capability_code == CAPABILITY_CODE_MP)
1064 {
1065 stream_putc (s, action);
1066 stream_putc (s, CAPABILITY_CODE_MP);
1067 stream_putc (s, CAPABILITY_CODE_MP_LEN);
1068 stream_putw (s, afi);
1069 stream_putc (s, 0);
1070 stream_putc (s, safi);
1071
1072 if (BGP_DEBUG (normal, NORMAL))
1073 zlog_debug ("%s sending CAPABILITY has %s MP_EXT CAP for afi/safi: %d/%d",
1074 peer->host, action == CAPABILITY_ACTION_SET ?
1075 "Advertising" : "Removing", afi, safi);
1076 }
1077
1078 /* Set packet size. */
1079 length = bgp_packet_set_size (s);
1080
1081 /* Make real packet. */
1082 packet = stream_dup (s);
1083 stream_free (s);
1084
1085 /* Add packet to the peer. */
1086 bgp_packet_add (peer, packet);
1087
1088 if (BGP_DEBUG (normal, NORMAL))
1089 zlog_debug ("%s send message type %d, length (incl. header) %d",
1090 peer->host, BGP_MSG_CAPABILITY, length);
1091
1092 BGP_WRITE_ON (peer->t_write, bgp_write, peer->fd);
1093 }
1094 \f
1095 /* RFC1771 6.8 Connection collision detection. */
1096 static int
1097 bgp_collision_detect (struct peer *new, struct in_addr remote_id)
1098 {
1099 struct peer *peer;
1100 struct listnode *node, *nnode;
1101 struct bgp *bgp;
1102
1103 bgp = bgp_get_default ();
1104 if (! bgp)
1105 return 0;
1106
1107 /* Upon receipt of an OPEN message, the local system must examine
1108 all of its connections that are in the OpenConfirm state. A BGP
1109 speaker may also examine connections in an OpenSent state if it
1110 knows the BGP Identifier of the peer by means outside of the
1111 protocol. If among these connections there is a connection to a
1112 remote BGP speaker whose BGP Identifier equals the one in the
1113 OPEN message, then the local system performs the following
1114 collision resolution procedure: */
1115
1116 for (ALL_LIST_ELEMENTS (bgp->peer, node, nnode, peer))
1117 {
1118 /* Under OpenConfirm status, local peer structure already hold
1119 remote router ID. */
1120
1121 if (peer != new
1122 && (peer->status == OpenConfirm || peer->status == OpenSent)
1123 && sockunion_same (&peer->su, &new->su))
1124 {
1125 /* 1. The BGP Identifier of the local system is compared to
1126 the BGP Identifier of the remote system (as specified in
1127 the OPEN message). */
1128
1129 if (ntohl (peer->local_id.s_addr) < ntohl (remote_id.s_addr))
1130 {
1131 /* 2. If the value of the local BGP Identifier is less
1132 than the remote one, the local system closes BGP
1133 connection that already exists (the one that is
1134 already in the OpenConfirm state), and accepts BGP
1135 connection initiated by the remote system. */
1136
1137 if (peer->fd >= 0)
1138 bgp_notify_send (peer, BGP_NOTIFY_CEASE, BGP_NOTIFY_CEASE_COLLISION_RESOLUTION);
1139 return 1;
1140 }
1141 else
1142 {
1143 /* 3. Otherwise, the local system closes newly created
1144 BGP connection (the one associated with the newly
1145 received OPEN message), and continues to use the
1146 existing one (the one that is already in the
1147 OpenConfirm state). */
1148
1149 if (new->fd >= 0)
1150 bgp_notify_send (new, BGP_NOTIFY_CEASE,
1151 BGP_NOTIFY_CEASE_COLLISION_RESOLUTION);
1152 return -1;
1153 }
1154 }
1155 }
1156 return 0;
1157 }
1158
/* Handle a received OPEN message for PEER.
 *
 * Reads the fixed OPEN fields (version, 2-byte AS, hold time, BGP
 * identifier, optional-parameter length) from peer->ibuf, peeks at the
 * optional parameters for a 4-byte AS value, and validates them.  For a
 * peer flagged PEER_STATUS_ACCEPT_PEER the configured peer is looked up
 * with peer_lookup_with_open() and, unless the connection is rejected,
 * the file descriptor, input buffer and status are moved onto it.  On
 * success the hold time / keepalive values are stored, the optional
 * parameters are parsed, Receive_OPEN_message is queued and the input
 * buffer is reset.
 *
 * SIZE is not referenced anywhere in this function.
 *
 * Returns 0 on success.  Returns a negative value when the OPEN is
 * rejected, when bgp_collision_detect() returns a negative value, or
 * when bgp_open_option_parse() fails.
 */
1159 static int
1160 bgp_open_receive (struct peer *peer, bgp_size_t size)
1161 {
1162 int ret;
1163 u_char version;
1164 u_char optlen;
1165 u_int16_t holdtime;
1166 u_int16_t send_holdtime;
1167 as_t remote_as;
1168 as_t as4 = 0;
1169 struct peer *realpeer;
1170 struct in_addr remote_id;
1171 int capability;
1172 u_int8_t notify_data_remote_as[2];
1173 u_int8_t notify_data_remote_id[4];
1174
1175 realpeer = NULL;
1176
1177 /* Parse open packet. */
1178 version = stream_getc (peer->ibuf);
/* Keep the raw AS bytes as received; they are sent back as NOTIFICATION
   data if the AS is rejected below. */
1179 memcpy (notify_data_remote_as, stream_pnt (peer->ibuf), 2);
1180 remote_as = stream_getw (peer->ibuf);
1181 holdtime = stream_getw (peer->ibuf);
/* Same for the raw BGP identifier bytes. */
1182 memcpy (notify_data_remote_id, stream_pnt (peer->ibuf), 4);
1183 remote_id.s_addr = stream_get_ipv4 (peer->ibuf);
1184
1185 /* Receive OPEN message log */
1186 if (BGP_DEBUG (normal, NORMAL))
1187 zlog_debug ("%s rcv OPEN, version %d, remote-as (in open) %u,"
1188 " holdtime %d, id %s",
1189 peer->host, version, remote_as, holdtime,
1190 inet_ntoa (remote_id));
1191
1192 /* BEGIN to read the capability here, but dont do it yet */
1193 capability = 0;
1194 optlen = stream_getc (peer->ibuf);
1195
1196 if (optlen != 0)
1197 {
1198 /* We need the as4 capability value *right now* because
1199 * if it is there, we have not got the remote_as yet, and without
1200 * that we do not know which peer is connecting to us now.
1201 */
1202 as4 = peek_for_as4_capability (peer, optlen);
1203 }
1204
1205 /* Just in case we have a silly peer who sends AS4 capability set to 0 */
1206 if (CHECK_FLAG (peer->cap, PEER_CAP_AS4_RCV) && !as4)
1207 {
1208 zlog_err ("%s bad OPEN, got AS4 capability, but AS4 set to 0",
1209 peer->host);
1210 bgp_notify_send (peer, BGP_NOTIFY_OPEN_ERR,
1211 BGP_NOTIFY_OPEN_BAD_PEER_AS);
1212 return -1;
1213 }
1214
1215 if (remote_as == BGP_AS_TRANS)
1216 {
1217 /* Take the AS4 from the capability. We must have received the
1218 * capability now! Otherwise we have a asn16 peer who uses
1219 * BGP_AS_TRANS, for some unknown reason.
1220 */
1221 if (as4 == BGP_AS_TRANS)
1222 {
1223 zlog_err ("%s [AS4] NEW speaker using AS_TRANS for AS4, not allowed",
1224 peer->host);
1225 bgp_notify_send (peer, BGP_NOTIFY_OPEN_ERR,
1226 BGP_NOTIFY_OPEN_BAD_PEER_AS);
1227 return -1;
1228 }
1229
1230 if (!as4 && BGP_DEBUG (as4, AS4))
1231 zlog_debug ("%s [AS4] OPEN remote_as is AS_TRANS, but no AS4."
1232 " Odd, but proceeding.", peer->host);
1233 else if (as4 < BGP_AS_MAX && BGP_DEBUG (as4, AS4))
1234 zlog_debug ("%s [AS4] OPEN remote_as is AS_TRANS, but AS4 (%u) fits "
1235 "in 2-bytes, very odd peer.", peer->host, as4);
/* A non-zero AS4 value replaces the AS_TRANS placeholder. */
1236 if (as4)
1237 remote_as = as4;
1238 }
1239 else
1240 {
1241 /* We may have a partner with AS4 who has an asno < BGP_AS_MAX */
1242 /* If we have got the capability, peer->as4cap must match remote_as */
1243 if (CHECK_FLAG (peer->cap, PEER_CAP_AS4_RCV)
1244 && as4 != remote_as)
1245 {
1246 /* raise error, log this, close session */
1247 zlog_err ("%s bad OPEN, got AS4 capability, but remote_as %u"
1248 " mismatch with 16bit 'myasn' %u in open",
1249 peer->host, as4, remote_as);
1250 bgp_notify_send (peer, BGP_NOTIFY_OPEN_ERR,
1251 BGP_NOTIFY_OPEN_BAD_PEER_AS);
1252 return -1;
1253 }
1254 }
1255
1256 /* Lookup peer from Open packet. */
1257 if (CHECK_FLAG (peer->sflags, PEER_STATUS_ACCEPT_PEER))
1258 {
/* Passed by address to peer_lookup_with_open(); when the lookup fails,
   a non-zero value selects the bad-identifier NOTIFICATION and zero
   selects the bad-peer-AS NOTIFICATION. */
1259 int as = 0;
1260
1261 realpeer = peer_lookup_with_open (&peer->su, remote_as, &remote_id, &as);
1262
1263 if (! realpeer)
1264 {
1265 /* Peer's source IP address is checked in bgp_accept(), so this
1266 must be AS number mismatch or remote-id configuration
1267 mismatch. */
1268 if (as)
1269 {
1270 if (BGP_DEBUG (normal, NORMAL))
1271 zlog_debug ("%s bad OPEN, wrong router identifier %s",
1272 peer->host, inet_ntoa (remote_id));
1273 bgp_notify_send_with_data (peer, BGP_NOTIFY_OPEN_ERR,
1274 BGP_NOTIFY_OPEN_BAD_BGP_IDENT,
1275 notify_data_remote_id, 4);
1276 }
1277 else
1278 {
1279 if (BGP_DEBUG (normal, NORMAL))
1280 zlog_debug ("%s bad OPEN, remote AS is %u, expected %u",
1281 peer->host, remote_as, peer->as);
1282 bgp_notify_send_with_data (peer, BGP_NOTIFY_OPEN_ERR,
1283 BGP_NOTIFY_OPEN_BAD_PEER_AS,
1284 notify_data_remote_as, 2);
1285 }
1286 return -1;
1287 }
1288 }
1289
1290 /* When collision is detected and this peer is closed. Return
1291 immediately. */
1292 ret = bgp_collision_detect (peer, remote_id);
1293 if (ret < 0)
1294 return ret;
1295
1296 /* Hack part. */
/* realpeer is non-NULL here: the lookup block above returns when the
   lookup fails for an accept peer. */
1297 if (CHECK_FLAG (peer->sflags, PEER_STATUS_ACCEPT_PEER))
1298 {
1299 if (realpeer->status == Established
1300 && CHECK_FLAG (realpeer->sflags, PEER_STATUS_NSF_MODE))
1301 {
1302 realpeer->last_reset = PEER_DOWN_NSF_CLOSE_SESSION;
1303 SET_FLAG (realpeer->sflags, PEER_STATUS_NSF_WAIT);
1304 }
1305 else if (ret == 0 && realpeer->status != Active
1306 && realpeer->status != OpenSent
1307 && realpeer->status != OpenConfirm
1308 && realpeer->status != Connect)
1309 {
1310 /* XXX: This is an awful problem..
1311 *
1312 * According to the RFC we should just let this connection (of the
1313 * accepted 'peer') continue on to Established if the other
1314 * connection (the 'realpeer' one) is in state Connect, and deal
1315 * with the more larval FSM as/when it gets far enough to receive
1316 * an Open. We don't do that though, we instead close the (more
1317 * developed) accepted connection.
1318 *
1319 * This means there's a race, which if hit, can loop:
1320 *
1321 * FSM for A FSM for B
1322 * realpeer accept-peer realpeer accept-peer
1323 *
1324 * Connect Connect
1325 * Active
1326 * OpenSent OpenSent
1327 * <arrive here,
1328 * Notify, delete>
1329 * Idle Active
1330 * OpenSent OpenSent
1331 * <arrive here,
1332 * Notify, delete>
1333 * Idle
1334 * <wait> <wait>
1335 * Connect Connect
1336 *
1337 *
1338 * If both sides are Quagga, they're almost certain to wait for
1339 * the same amount of time of course (which doesn't preclude other
1340 * implementations also waiting for same time). The race is
1341 * exacerbated by high-latency (in bgpd and/or the network).
1342 *
1343 * The reason we do this is because our FSM is tied to our peer
1344 * structure, which carries our configuration information, etc.
1345 * I.e. we can't let the accepted-peer FSM continue on as it is,
1346 * cause it's not associated with any actual peer configuration -
1347 * it's just a dummy.
1348 *
1349 * It's possible we could hack-fix this by just bgp_stop'ing the
1350 * realpeer and continuing on with the 'transfer FSM' below.
1351 * Ideally, we need to separate FSMs from struct peer.
1352 *
1353 * Setting one side to passive avoids the race, as a workaround.
1354 */
1355 if (BGP_DEBUG (events, EVENTS))
1356 zlog_debug ("%s peer status is %s close connection",
1357 realpeer->host, LOOKUP (bgp_status_msg,
1358 realpeer->status));
1359 bgp_notify_send (peer, BGP_NOTIFY_CEASE,
1360 BGP_NOTIFY_CEASE_CONNECT_REJECT);
1361
1362 return -1;
1363 }
1364
1365 if (BGP_DEBUG (events, EVENTS))
1366 zlog_debug ("%s [Event] Transfer accept BGP peer to real (state %s)",
1367 peer->host,
1368 LOOKUP (bgp_status_msg, realpeer->status));
1369
1370 bgp_stop (realpeer);
1371
1372 /* Transfer file descriptor. */
1373 realpeer->fd = peer->fd;
1374 peer->fd = -1;
1375
1376 /* Transfer input buffer. */
1377 stream_free (realpeer->ibuf);
1378 realpeer->ibuf = peer->ibuf;
1379 realpeer->packet_size = peer->packet_size;
1380 peer->ibuf = NULL;
1381
1382 /* Transfer status. */
1383 realpeer->status = peer->status;
1384 bgp_stop (peer);
1385
1386 /* peer pointer change. Open packet send to neighbor. */
/* From here on every use of 'peer' refers to the configured peer. */
1387 peer = realpeer;
1388 bgp_open_send (peer);
1389 if (peer->fd < 0)
1390 {
1391 zlog_err ("bgp_open_receive peer's fd is negative value %d",
1392 peer->fd);
1393 return -1;
1394 }
1395 BGP_READ_ON (peer->t_read, bgp_read, peer->fd);
1396 }
1397
1398 /* remote router-id check. */
/* Rejected identifiers: zero, values >= 0xe0000000 in host byte order,
   and the local identifier itself. */
1399 if (remote_id.s_addr == 0
1400 || ntohl (remote_id.s_addr) >= 0xe0000000
1401 || ntohl (peer->local_id.s_addr) == ntohl (remote_id.s_addr))
1402 {
1403 if (BGP_DEBUG (normal, NORMAL))
1404 zlog_debug ("%s bad OPEN, wrong router identifier %s",
1405 peer->host, inet_ntoa (remote_id));
1406 bgp_notify_send_with_data (peer,
1407 BGP_NOTIFY_OPEN_ERR,
1408 BGP_NOTIFY_OPEN_BAD_BGP_IDENT,
1409 notify_data_remote_id, 4);
1410 return -1;
1411 }
1412
1413 /* Set remote router-id */
1414 peer->remote_id = remote_id;
1415
1416 /* Peer BGP version check. */
1417 if (version != BGP_VERSION_4)
1418 {
/* The NOTIFICATION data carries BGP_VERSION_4 as a single byte. */
1419 u_int8_t maxver = BGP_VERSION_4;
1420 if (BGP_DEBUG (normal, NORMAL))
1421 zlog_debug ("%s bad protocol version, remote requested %d, local request %d",
1422 peer->host, version, BGP_VERSION_4);
1423 bgp_notify_send_with_data (peer,
1424 BGP_NOTIFY_OPEN_ERR,
1425 BGP_NOTIFY_OPEN_UNSUP_VERSION,
1426 &maxver, 1);
1427 return -1;
1428 }
1429
1430 /* Check neighbor as number. */
1431 if (remote_as != peer->as)
1432 {
1433 if (BGP_DEBUG (normal, NORMAL))
1434 zlog_debug ("%s bad OPEN, remote AS is %u, expected %u",
1435 peer->host, remote_as, peer->as);
1436 bgp_notify_send_with_data (peer,
1437 BGP_NOTIFY_OPEN_ERR,
1438 BGP_NOTIFY_OPEN_BAD_PEER_AS,
1439 notify_data_remote_as, 2);
1440 return -1;
1441 }
1442
1443 /* From the rfc: Upon receipt of an OPEN message, a BGP speaker MUST
1444 calculate the value of the Hold Timer by using the smaller of its
1445 configured Hold Time and the Hold Time received in the OPEN message.
1446 The Hold Time MUST be either zero or at least three seconds. An
1447 implementation may reject connections on the basis of the Hold Time. */
1448
1449 if (holdtime < 3 && holdtime != 0)
1450 {
1451 bgp_notify_send (peer,
1452 BGP_NOTIFY_OPEN_ERR,
1453 BGP_NOTIFY_OPEN_UNACEP_HOLDTIME);
1454 return -1;
1455 }
1456
1457 /* From the rfc: A reasonable maximum time between KEEPALIVE messages
1458 would be one third of the Hold Time interval. KEEPALIVE messages
1459 MUST NOT be sent more frequently than one per second. An
1460 implementation MAY adjust the rate at which it sends KEEPALIVE
1461 messages as a function of the Hold Time interval. */
1462
/* Local hold time: the per-peer value when PEER_CONFIG_TIMER is set,
   otherwise the instance default. */
1463 if (CHECK_FLAG (peer->config, PEER_CONFIG_TIMER))
1464 send_holdtime = peer->holdtime;
1465 else
1466 send_holdtime = peer->bgp->default_holdtime;
1467
/* Use the smaller of the received and the local hold time. */
1468 if (holdtime < send_holdtime)
1469 peer->v_holdtime = holdtime;
1470 else
1471 peer->v_holdtime = send_holdtime;
1472
1473 peer->v_keepalive = peer->v_holdtime / 3;
1474
1475 /* Open option part parse. */
1476 if (optlen != 0)
1477 {
1478 ret = bgp_open_option_parse (peer, optlen, &capability);
1479 if (ret < 0)
1480 return ret;
1481 }
1482 else
1483 {
1484 if (BGP_DEBUG (normal, NORMAL))
1485 zlog_debug ("%s rcvd OPEN w/ OPTION parameter len: 0",
1486 peer->host);
1487 }
1488
1489 /* Override capability. */
/* When 'capability' is still zero after option parsing, or override is
   configured, the negotiated families are copied from the locally
   configured ones. */
1490 if (! capability || CHECK_FLAG (peer->flags, PEER_FLAG_OVERRIDE_CAPABILITY))
1491 {
1492 peer->afc_nego[AFI_IP][SAFI_UNICAST] = peer->afc[AFI_IP][SAFI_UNICAST];
1493 peer->afc_nego[AFI_IP][SAFI_MULTICAST] = peer->afc[AFI_IP][SAFI_MULTICAST];
1494 peer->afc_nego[AFI_IP6][SAFI_UNICAST] = peer->afc[AFI_IP6][SAFI_UNICAST];
1495 peer->afc_nego[AFI_IP6][SAFI_MULTICAST] = peer->afc[AFI_IP6][SAFI_MULTICAST];
1496 }
1497
1498 /* Get sockname. */
1499 bgp_getsockname (peer);
1500
1501 BGP_EVENT_ADD (peer, Receive_OPEN_message);
1502
/* The OPEN has been consumed; clear the input state. */
1503 peer->packet_size = 0;
1504 if (peer->ibuf)
1505 stream_reset (peer->ibuf);
1506
1507 return 0;
1508 }
1509
1510 /* Parse BGP Update packet and make attribute object. */
1511 static int
1512 bgp_update_receive (struct peer *peer, bgp_size_t size)
1513 {
1514 int ret;
1515 u_char *end;
1516 struct stream *s;
1517 struct attr attr;
1518 bgp_size_t attribute_len;
1519 bgp_size_t update_len;
1520 bgp_size_t withdraw_len;
1521 struct bgp_nlri update;
1522 struct bgp_nlri withdraw;
1523 struct bgp_nlri mp_update;
1524 struct bgp_nlri mp_withdraw;
1525 char attrstr[BUFSIZ] = "";
1526
1527 /* Status must be Established. */
1528 if (peer->status != Established)
1529 {
1530 zlog_err ("%s [FSM] Update packet received under status %s",
1531 peer->host, LOOKUP (bgp_status_msg, peer->status));
1532 bgp_notify_send (peer, BGP_NOTIFY_FSM_ERR, 0);
1533 return -1;
1534 }
1535
1536 /* Set initial values. */
1537 memset (&attr, 0, sizeof (struct attr));
1538 memset (&update, 0, sizeof (struct bgp_nlri));
1539 memset (&withdraw, 0, sizeof (struct bgp_nlri));
1540 memset (&mp_update, 0, sizeof (struct bgp_nlri));
1541 memset (&mp_withdraw, 0, sizeof (struct bgp_nlri));
1542
1543 s = peer->ibuf;
1544 end = stream_pnt (s) + size;
1545
1546 /* RFC1771 6.3 If the Unfeasible Routes Length or Total Attribute
1547 Length is too large (i.e., if Unfeasible Routes Length + Total
1548 Attribute Length + 23 exceeds the message Length), then the Error
1549 Subcode is set to Malformed Attribute List. */
1550 if (stream_pnt (s) + 2 > end)
1551 {
1552 zlog_err ("%s [Error] Update packet error"
1553 " (packet length is short for unfeasible length)",
1554 peer->host);
1555 bgp_notify_send (peer, BGP_NOTIFY_UPDATE_ERR,
1556 BGP_NOTIFY_UPDATE_MAL_ATTR);
1557 return -1;
1558 }
1559
1560 /* Unfeasible Route Length. */
1561 withdraw_len = stream_getw (s);
1562
1563 /* Unfeasible Route Length check. */
1564 if (stream_pnt (s) + withdraw_len > end)
1565 {
1566 zlog_err ("%s [Error] Update packet error"
1567 " (packet unfeasible length overflow %d)",
1568 peer->host, withdraw_len);
1569 bgp_notify_send (peer, BGP_NOTIFY_UPDATE_ERR,
1570 BGP_NOTIFY_UPDATE_MAL_ATTR);
1571 return -1;
1572 }
1573
1574 /* Unfeasible Route packet format check. */
1575 if (withdraw_len > 0)
1576 {
1577 ret = bgp_nlri_sanity_check (peer, AFI_IP, stream_pnt (s), withdraw_len);
1578 if (ret < 0)
1579 return -1;
1580
1581 if (BGP_DEBUG (packet, PACKET_RECV))
1582 zlog_debug ("%s [Update:RECV] Unfeasible NLRI received", peer->host);
1583
1584 withdraw.afi = AFI_IP;
1585 withdraw.safi = SAFI_UNICAST;
1586 withdraw.nlri = stream_pnt (s);
1587 withdraw.length = withdraw_len;
1588 stream_forward_getp (s, withdraw_len);
1589 }
1590
1591 /* Attribute total length check. */
1592 if (stream_pnt (s) + 2 > end)
1593 {
1594 zlog_warn ("%s [Error] Packet Error"
1595 " (update packet is short for attribute length)",
1596 peer->host);
1597 bgp_notify_send (peer, BGP_NOTIFY_UPDATE_ERR,
1598 BGP_NOTIFY_UPDATE_MAL_ATTR);
1599 return -1;
1600 }
1601
1602 /* Fetch attribute total length. */
1603 attribute_len = stream_getw (s);
1604
1605 /* Attribute length check. */
1606 if (stream_pnt (s) + attribute_len > end)
1607 {
1608 zlog_warn ("%s [Error] Packet Error"
1609 " (update packet attribute length overflow %d)",
1610 peer->host, attribute_len);
1611 bgp_notify_send (peer, BGP_NOTIFY_UPDATE_ERR,
1612 BGP_NOTIFY_UPDATE_MAL_ATTR);
1613 return -1;
1614 }
1615
1616 /* Parse attribute when it exists. */
1617 if (attribute_len)
1618 {
1619 ret = bgp_attr_parse (peer, &attr, attribute_len,
1620 &mp_update, &mp_withdraw);
1621 if (ret < 0)
1622 return -1;
1623 }
1624
1625 /* Logging the attribute. */
1626 if (BGP_DEBUG (update, UPDATE_IN))
1627 {
1628 ret= bgp_dump_attr (peer, &attr, attrstr, BUFSIZ);
1629
1630 if (ret)
1631 zlog (peer->log, LOG_DEBUG, "%s rcvd UPDATE w/ attr: %s",
1632 peer->host, attrstr);
1633 }
1634
1635 /* Network Layer Reachability Information. */
1636 update_len = end - stream_pnt (s);
1637
1638 if (update_len)
1639 {
1640 /* Check NLRI packet format and prefix length. */
1641 ret = bgp_nlri_sanity_check (peer, AFI_IP, stream_pnt (s), update_len);
1642 if (ret < 0)
1643 return -1;
1644
1645 /* Set NLRI portion to structure. */
1646 update.afi = AFI_IP;
1647 update.safi = SAFI_UNICAST;
1648 update.nlri = stream_pnt (s);
1649 update.length = update_len;
1650 stream_forward_getp (s, update_len);
1651 }
1652
1653 /* NLRI is processed only when the peer is configured specific
1654 Address Family and Subsequent Address Family. */
1655 if (peer->afc[AFI_IP][SAFI_UNICAST])
1656 {
1657 if (withdraw.length)
1658 bgp_nlri_parse (peer, NULL, &withdraw);
1659
1660 if (update.length)
1661 {
1662 /* We check well-known attribute only for IPv4 unicast
1663 update. */
1664 ret = bgp_attr_check (peer, &attr);
1665 if (ret < 0)
1666 return -1;
1667
1668 bgp_nlri_parse (peer, &attr, &update);
1669 }
1670
1671 if (mp_update.length
1672 && mp_update.afi == AFI_IP
1673 && mp_update.safi == SAFI_UNICAST)
1674 bgp_nlri_parse (peer, &attr, &mp_update);
1675
1676 if (mp_withdraw.length
1677 && mp_withdraw.afi == AFI_IP
1678 && mp_withdraw.safi == SAFI_UNICAST)
1679 bgp_nlri_parse (peer, NULL, &mp_withdraw);
1680
1681 if (! attribute_len && ! withdraw_len)
1682 {
1683 /* End-of-RIB received */
1684 SET_FLAG (peer->af_sflags[AFI_IP][SAFI_UNICAST],
1685 PEER_STATUS_EOR_RECEIVED);
1686
1687 /* NSF delete stale route */
1688 if (peer->nsf[AFI_IP][SAFI_UNICAST])
1689 bgp_clear_stale_route (peer, AFI_IP, SAFI_UNICAST);
1690
1691 if (BGP_DEBUG (normal, NORMAL))
1692 zlog (peer->log, LOG_DEBUG, "rcvd End-of-RIB for IPv4 Unicast from %s",
1693 peer->host);
1694 }
1695 }
1696 if (peer->afc[AFI_IP][SAFI_MULTICAST])
1697 {
1698 if (mp_update.length
1699 && mp_update.afi == AFI_IP
1700 && mp_update.safi == SAFI_MULTICAST)
1701 bgp_nlri_parse (peer, &attr, &mp_update);
1702
1703 if (mp_withdraw.length
1704 && mp_withdraw.afi == AFI_IP
1705 && mp_withdraw.safi == SAFI_MULTICAST)
1706 bgp_nlri_parse (peer, NULL, &mp_withdraw);
1707
1708 if (! withdraw_len
1709 && mp_withdraw.afi == AFI_IP
1710 && mp_withdraw.safi == SAFI_MULTICAST
1711 && mp_withdraw.length == 0)
1712 {
1713 /* End-of-RIB received */
1714 SET_FLAG (peer->af_sflags[AFI_IP][SAFI_MULTICAST],
1715 PEER_STATUS_EOR_RECEIVED);
1716
1717 /* NSF delete stale route */
1718 if (peer->nsf[AFI_IP][SAFI_MULTICAST])
1719 bgp_clear_stale_route (peer, AFI_IP, SAFI_MULTICAST);
1720
1721 if (BGP_DEBUG (normal, NORMAL))
1722 zlog (peer->log, LOG_DEBUG, "rcvd End-of-RIB for IPv4 Multicast from %s",
1723 peer->host);
1724 }
1725 }
1726 if (peer->afc[AFI_IP6][SAFI_UNICAST])
1727 {
1728 if (mp_update.length
1729 && mp_update.afi == AFI_IP6
1730 && mp_update.safi == SAFI_UNICAST)
1731 bgp_nlri_parse (peer, &attr, &mp_update);
1732
1733 if (mp_withdraw.length
1734 && mp_withdraw.afi == AFI_IP6
1735 && mp_withdraw.safi == SAFI_UNICAST)
1736 bgp_nlri_parse (peer, NULL, &mp_withdraw);
1737
1738 if (! withdraw_len
1739 && mp_withdraw.afi == AFI_IP6
1740 && mp_withdraw.safi == SAFI_UNICAST
1741 && mp_withdraw.length == 0)
1742 {
1743 /* End-of-RIB received */
1744 SET_FLAG (peer->af_sflags[AFI_IP6][SAFI_UNICAST], PEER_STATUS_EOR_RECEIVED);
1745
1746 /* NSF delete stale route */
1747 if (peer->nsf[AFI_IP6][SAFI_UNICAST])
1748 bgp_clear_stale_route (peer, AFI_IP6, SAFI_UNICAST);
1749
1750 if (BGP_DEBUG (normal, NORMAL))
1751 zlog (peer->log, LOG_DEBUG, "rcvd End-of-RIB for IPv6 Unicast from %s",
1752 peer->host);
1753 }
1754 }
1755 if (peer->afc[AFI_IP6][SAFI_MULTICAST])
1756 {
1757 if (mp_update.length
1758 && mp_update.afi == AFI_IP6
1759 && mp_update.safi == SAFI_MULTICAST)
1760 bgp_nlri_parse (peer, &attr, &mp_update);
1761
1762 if (mp_withdraw.length
1763 && mp_withdraw.afi == AFI_IP6
1764 && mp_withdraw.safi == SAFI_MULTICAST)
1765 bgp_nlri_parse (peer, NULL, &mp_withdraw);
1766
1767 if (! withdraw_len
1768 && mp_withdraw.afi == AFI_IP6
1769 && mp_withdraw.safi == SAFI_MULTICAST
1770 && mp_withdraw.length == 0)
1771 {
1772 /* End-of-RIB received */
1773
1774 /* NSF delete stale route */
1775 if (peer->nsf[AFI_IP6][SAFI_MULTICAST])
1776 bgp_clear_stale_route (peer, AFI_IP6, SAFI_MULTICAST);
1777
1778 if (BGP_DEBUG (update, UPDATE_IN))
1779 zlog (peer->log, LOG_DEBUG, "rcvd End-of-RIB for IPv6 Multicast from %s",
1780 peer->host);
1781 }
1782 }
1783 if (peer->afc[AFI_IP][SAFI_MPLS_VPN])
1784 {
1785 if (mp_update.length
1786 && mp_update.afi == AFI_IP
1787 && mp_update.safi == BGP_SAFI_VPNV4)
1788 bgp_nlri_parse_vpnv4 (peer, &attr, &mp_update);
1789
1790 if (mp_withdraw.length
1791 && mp_withdraw.afi == AFI_IP
1792 && mp_withdraw.safi == BGP_SAFI_VPNV4)
1793 bgp_nlri_parse_vpnv4 (peer, NULL, &mp_withdraw);
1794
1795 if (! withdraw_len
1796 && mp_withdraw.afi == AFI_IP
1797 && mp_withdraw.safi == BGP_SAFI_VPNV4
1798 && mp_withdraw.length == 0)
1799 {
1800 /* End-of-RIB received */
1801
1802 if (BGP_DEBUG (update, UPDATE_IN))
1803 zlog (peer->log, LOG_DEBUG, "rcvd End-of-RIB for VPNv4 Unicast from %s",
1804 peer->host);
1805 }
1806 }
1807
1808 /* Everything is done. We unintern temporary structures which
1809 interned in bgp_attr_parse(). */
1810 if (attr.aspath)
1811 aspath_unintern (attr.aspath);
1812 if (attr.community)
1813 community_unintern (attr.community);
1814 if (attr.extra)
1815 {
1816 if (attr.extra->ecommunity)
1817 ecommunity_unintern (attr.extra->ecommunity);
1818 if (attr.extra->cluster)
1819 cluster_unintern (attr.extra->cluster);
1820 if (attr.extra->transit)
1821 transit_unintern (attr.extra->transit);
1822 bgp_attr_extra_free (&attr);
1823 }
1824
1825 /* If peering is stopped due to some reason, do not generate BGP
1826 event. */
1827 if (peer->status != Established)
1828 return 0;
1829
1830 /* Increment packet counter. */
1831 peer->update_in++;
1832 peer->update_time = time (NULL);
1833
1834 /* Generate BGP event. */
1835 BGP_EVENT_ADD (peer, Receive_UPDATE_message);
1836
1837 return 0;
1838 }
1839
1840 /* Notify message treatment function. */
1841 static void
1842 bgp_notify_receive (struct peer *peer, bgp_size_t size)
1843 {
1844 struct bgp_notify bgp_notify;
1845
1846 if (peer->notify.data)
1847 {
1848 XFREE (MTYPE_TMP, peer->notify.data);
1849 peer->notify.data = NULL;
1850 peer->notify.length = 0;
1851 }
1852
1853 bgp_notify.code = stream_getc (peer->ibuf);
1854 bgp_notify.subcode = stream_getc (peer->ibuf);
1855 bgp_notify.length = size - 2;
1856 bgp_notify.data = NULL;
1857
1858 /* Preserv notify code and sub code. */
1859 peer->notify.code = bgp_notify.code;
1860 peer->notify.subcode = bgp_notify.subcode;
1861 /* For further diagnostic record returned Data. */
1862 if (bgp_notify.length)
1863 {
1864 peer->notify.length = size - 2;
1865 peer->notify.data = XMALLOC (MTYPE_TMP, size - 2);
1866 memcpy (peer->notify.data, stream_pnt (peer->ibuf), size - 2);
1867 }
1868
1869 /* For debug */
1870 {
1871 int i;
1872 int first = 0;
1873 char c[4];
1874
1875 if (bgp_notify.length)
1876 {
1877 bgp_notify.data = XMALLOC (MTYPE_TMP, bgp_notify.length * 3);
1878 for (i = 0; i < bgp_notify.length; i++)
1879 if (first)
1880 {
1881 sprintf (c, " %02x", stream_getc (peer->ibuf));
1882 strcat (bgp_notify.data, c);
1883 }
1884 else
1885 {
1886 first = 1;
1887 sprintf (c, "%02x", stream_getc (peer->ibuf));
1888 strcpy (bgp_notify.data, c);
1889 }
1890 }
1891
1892 bgp_notify_print(peer, &bgp_notify, "received");
1893 if (bgp_notify.data)
1894 XFREE (MTYPE_TMP, bgp_notify.data);
1895 }
1896
1897 /* peer count update */
1898 peer->notify_in++;
1899
1900 if (peer->status == Established)
1901 peer->last_reset = PEER_DOWN_NOTIFY_RECEIVED;
1902
1903 /* We have to check for Notify with Unsupported Optional Parameter.
1904 in that case we fallback to open without the capability option.
1905 But this done in bgp_stop. We just mark it here to avoid changing
1906 the fsm tables. */
1907 if (bgp_notify.code == BGP_NOTIFY_OPEN_ERR &&
1908 bgp_notify.subcode == BGP_NOTIFY_OPEN_UNSUP_PARAM )
1909 UNSET_FLAG (peer->sflags, PEER_STATUS_CAPABILITY_OPEN);
1910
1911 /* Also apply to Unsupported Capability until remote router support
1912 capability. */
1913 if (bgp_notify.code == BGP_NOTIFY_OPEN_ERR &&
1914 bgp_notify.subcode == BGP_NOTIFY_OPEN_UNSUP_CAPBL)
1915 UNSET_FLAG (peer->sflags, PEER_STATUS_CAPABILITY_OPEN);
1916
1917 BGP_EVENT_ADD (peer, Receive_NOTIFICATION_message);
1918 }
1919
1920 /* Keepalive treatment function -- get keepalive send keepalive */
1921 static void
1922 bgp_keepalive_receive (struct peer *peer, bgp_size_t size)
1923 {
1924 if (BGP_DEBUG (keepalive, KEEPALIVE))
1925 zlog_debug ("%s KEEPALIVE rcvd", peer->host);
1926
1927 BGP_EVENT_ADD (peer, Receive_KEEPALIVE_message);
1928 }
1929
1930 /* Route refresh message is received. */
1931 static void
1932 bgp_route_refresh_receive (struct peer *peer, bgp_size_t size)
1933 {
1934 afi_t afi;
1935 safi_t safi;
1936 u_char reserved;
1937 struct stream *s;
1938
1939 /* If peer does not have the capability, send notification. */
1940 if (! CHECK_FLAG (peer->cap, PEER_CAP_REFRESH_ADV))
1941 {
1942 plog_err (peer->log, "%s [Error] BGP route refresh is not enabled",
1943 peer->host);
1944 bgp_notify_send (peer,
1945 BGP_NOTIFY_HEADER_ERR,
1946 BGP_NOTIFY_HEADER_BAD_MESTYPE);
1947 return;
1948 }
1949
1950 /* Status must be Established. */
1951 if (peer->status != Established)
1952 {
1953 plog_err (peer->log,
1954 "%s [Error] Route refresh packet received under status %s",
1955 peer->host, LOOKUP (bgp_status_msg, peer->status));
1956 bgp_notify_send (peer, BGP_NOTIFY_FSM_ERR, 0);
1957 return;
1958 }
1959
1960 s = peer->ibuf;
1961
1962 /* Parse packet. */
1963 afi = stream_getw (s);
1964 reserved = stream_getc (s);
1965 safi = stream_getc (s);
1966
1967 if (BGP_DEBUG (normal, NORMAL))
1968 zlog_debug ("%s rcvd REFRESH_REQ for afi/safi: %d/%d",
1969 peer->host, afi, safi);
1970
1971 /* Check AFI and SAFI. */
1972 if ((afi != AFI_IP && afi != AFI_IP6)
1973 || (safi != SAFI_UNICAST && safi != SAFI_MULTICAST
1974 && safi != BGP_SAFI_VPNV4))
1975 {
1976 if (BGP_DEBUG (normal, NORMAL))
1977 {
1978 zlog_debug ("%s REFRESH_REQ for unrecognized afi/safi: %d/%d - ignored",
1979 peer->host, afi, safi);
1980 }
1981 return;
1982 }
1983
1984 /* Adjust safi code. */
1985 if (safi == BGP_SAFI_VPNV4)
1986 safi = SAFI_MPLS_VPN;
1987
1988 if (size != BGP_MSG_ROUTE_REFRESH_MIN_SIZE - BGP_HEADER_SIZE)
1989 {
1990 u_char *end;
1991 u_char when_to_refresh;
1992 u_char orf_type;
1993 u_int16_t orf_len;
1994
1995 if (size - (BGP_MSG_ROUTE_REFRESH_MIN_SIZE - BGP_HEADER_SIZE) < 5)
1996 {
1997 zlog_info ("%s ORF route refresh length error", peer->host);
1998 bgp_notify_send (peer, BGP_NOTIFY_CEASE, 0);
1999 return;
2000 }
2001
2002 when_to_refresh = stream_getc (s);
2003 end = stream_pnt (s) + (size - 5);
2004
2005 while ((stream_pnt (s) + 2) < end)
2006 {
2007 orf_type = stream_getc (s);
2008 orf_len = stream_getw (s);
2009
2010 /* orf_len in bounds? */
2011 if ((stream_pnt (s) + orf_len) > end)
2012 break; /* XXX: Notify instead?? */
2013 if (orf_type == ORF_TYPE_PREFIX
2014 || orf_type == ORF_TYPE_PREFIX_OLD)
2015 {
2016 u_char *p_pnt = stream_pnt (s);
2017 u_char *p_end = stream_pnt (s) + orf_len;
2018 struct orf_prefix orfp;
2019 u_char common = 0;
2020 u_int32_t seq;
2021 int psize;
2022 char name[BUFSIZ];
2023 char buf[BUFSIZ];
2024 int ret;
2025
2026 if (BGP_DEBUG (normal, NORMAL))
2027 {
2028 zlog_debug ("%s rcvd Prefixlist ORF(%d) length %d",
2029 peer->host, orf_type, orf_len);
2030 }
2031
2032 /* we're going to read at least 1 byte of common ORF header,
2033 * and 7 bytes of ORF Address-filter entry from the stream
2034 */
2035 if (orf_len < 7)
2036 break;
2037
2038 /* ORF prefix-list name */
2039 sprintf (name, "%s.%d.%d", peer->host, afi, safi);
2040
2041 while (p_pnt < p_end)
2042 {
2043 memset (&orfp, 0, sizeof (struct orf_prefix));
2044 common = *p_pnt++;
2045 if (common & ORF_COMMON_PART_REMOVE_ALL)
2046 {
2047 if (BGP_DEBUG (normal, NORMAL))
2048 zlog_debug ("%s rcvd Remove-All pfxlist ORF request", peer->host);
2049 prefix_bgp_orf_remove_all (name);
2050 break;
2051 }
2052 memcpy (&seq, p_pnt, sizeof (u_int32_t));
2053 p_pnt += sizeof (u_int32_t);
2054 orfp.seq = ntohl (seq);
2055 orfp.ge = *p_pnt++;
2056 orfp.le = *p_pnt++;
2057 orfp.p.prefixlen = *p_pnt++;
2058 orfp.p.family = afi2family (afi);
2059 psize = PSIZE (orfp.p.prefixlen);
2060 memcpy (&orfp.p.u.prefix, p_pnt, psize);
2061 p_pnt += psize;
2062
2063 if (BGP_DEBUG (normal, NORMAL))
2064 zlog_debug ("%s rcvd %s %s seq %u %s/%d ge %d le %d",
2065 peer->host,
2066 (common & ORF_COMMON_PART_REMOVE ? "Remove" : "Add"),
2067 (common & ORF_COMMON_PART_DENY ? "deny" : "permit"),
2068 orfp.seq,
2069 inet_ntop (orfp.p.family, &orfp.p.u.prefix, buf, BUFSIZ),
2070 orfp.p.prefixlen, orfp.ge, orfp.le);
2071
2072 ret = prefix_bgp_orf_set (name, afi, &orfp,
2073 (common & ORF_COMMON_PART_DENY ? 0 : 1 ),
2074 (common & ORF_COMMON_PART_REMOVE ? 0 : 1));
2075
2076 if (ret != CMD_SUCCESS)
2077 {
2078 if (BGP_DEBUG (normal, NORMAL))
2079 zlog_debug ("%s Received misformatted prefixlist ORF. Remove All pfxlist", peer->host);
2080 prefix_bgp_orf_remove_all (name);
2081 break;
2082 }
2083 }
2084 peer->orf_plist[afi][safi] =
2085 prefix_list_lookup (AFI_ORF_PREFIX, name);
2086 }
2087 stream_forward_getp (s, orf_len);
2088 }
2089 if (BGP_DEBUG (normal, NORMAL))
2090 zlog_debug ("%s rcvd Refresh %s ORF request", peer->host,
2091 when_to_refresh == REFRESH_DEFER ? "Defer" : "Immediate");
2092 if (when_to_refresh == REFRESH_DEFER)
2093 return;
2094 }
2095
2096 /* First update is deferred until ORF or ROUTE-REFRESH is received */
2097 if (CHECK_FLAG (peer->af_sflags[afi][safi], PEER_STATUS_ORF_WAIT_REFRESH))
2098 UNSET_FLAG (peer->af_sflags[afi][safi], PEER_STATUS_ORF_WAIT_REFRESH);
2099
2100 /* Perform route refreshment to the peer */
2101 bgp_announce_route (peer, afi, safi);
2102 }
2103
2104 static int
2105 bgp_capability_msg_parse (struct peer *peer, u_char *pnt, bgp_size_t length)
2106 {
2107 u_char *end;
2108 struct capability_mp_data mpc;
2109 struct capability_header *hdr;
2110 u_char action;
2111 struct bgp *bgp;
2112 afi_t afi;
2113 safi_t safi;
2114
2115 bgp = peer->bgp;
2116 end = pnt + length;
2117
2118 while (pnt < end)
2119 {
2120 /* We need at least action, capability code and capability length. */
2121 if (pnt + 3 > end)
2122 {
2123 zlog_info ("%s Capability length error", peer->host);
2124 bgp_notify_send (peer, BGP_NOTIFY_CEASE, 0);
2125 return -1;
2126 }
2127 action = *pnt;
2128 hdr = (struct capability_header *)(pnt + 1);
2129
2130 /* Action value check. */
2131 if (action != CAPABILITY_ACTION_SET
2132 && action != CAPABILITY_ACTION_UNSET)
2133 {
2134 zlog_info ("%s Capability Action Value error %d",
2135 peer->host, action);
2136 bgp_notify_send (peer, BGP_NOTIFY_CEASE, 0);
2137 return -1;
2138 }
2139
2140 if (BGP_DEBUG (normal, NORMAL))
2141 zlog_debug ("%s CAPABILITY has action: %d, code: %u, length %u",
2142 peer->host, action, hdr->code, hdr->length);
2143
2144 /* Capability length check. */
2145 if ((pnt + hdr->length + 3) > end)
2146 {
2147 zlog_info ("%s Capability length error", peer->host);
2148 bgp_notify_send (peer, BGP_NOTIFY_CEASE, 0);
2149 return -1;
2150 }
2151
2152 /* Fetch structure to the byte stream. */
2153 memcpy (&mpc, pnt + 3, sizeof (struct capability_mp_data));
2154
2155 /* We know MP Capability Code. */
2156 if (hdr->code == CAPABILITY_CODE_MP)
2157 {
2158 afi = ntohs (mpc.afi);
2159 safi = mpc.safi;
2160
2161 /* Ignore capability when override-capability is set. */
2162 if (CHECK_FLAG (peer->flags, PEER_FLAG_OVERRIDE_CAPABILITY))
2163 continue;
2164
2165 if (!bgp_afi_safi_valid_indices (afi, &safi))
2166 {
2167 if (BGP_DEBUG (normal, NORMAL))
2168 zlog_debug ("%s Dynamic Capability MP_EXT afi/safi invalid "
2169 "(%u/%u)", peer->host, afi, safi);
2170 continue;
2171 }
2172
2173 /* Address family check. */
2174 if (BGP_DEBUG (normal, NORMAL))
2175 zlog_debug ("%s CAPABILITY has %s MP_EXT CAP for afi/safi: %u/%u",
2176 peer->host,
2177 action == CAPABILITY_ACTION_SET
2178 ? "Advertising" : "Removing",
2179 ntohs(mpc.afi) , mpc.safi);
2180
2181 if (action == CAPABILITY_ACTION_SET)
2182 {
2183 peer->afc_recv[afi][safi] = 1;
2184 if (peer->afc[afi][safi])
2185 {
2186 peer->afc_nego[afi][safi] = 1;
2187 bgp_announce_route (peer, afi, safi);
2188 }
2189 }
2190 else
2191 {
2192 peer->afc_recv[afi][safi] = 0;
2193 peer->afc_nego[afi][safi] = 0;
2194
2195 if (peer_active_nego (peer))
2196 bgp_clear_route (peer, afi, safi, BGP_CLEAR_ROUTE_NORMAL);
2197 else
2198 BGP_EVENT_ADD (peer, BGP_Stop);
2199 }
2200 }
2201 else
2202 {
2203 zlog_warn ("%s unrecognized capability code: %d - ignored",
2204 peer->host, hdr->code);
2205 }
2206 pnt += hdr->length + 3;
2207 }
2208 return 0;
2209 }
2210
2211 /* Dynamic Capability is received.
2212 *
2213 * This is exported for unit-test purposes
2214 */
2215 int
2216 bgp_capability_receive (struct peer *peer, bgp_size_t size)
2217 {
2218 u_char *pnt;
2219
2220 /* Fetch pointer. */
2221 pnt = stream_pnt (peer->ibuf);
2222
2223 if (BGP_DEBUG (normal, NORMAL))
2224 zlog_debug ("%s rcv CAPABILITY", peer->host);
2225
2226 /* If peer does not have the capability, send notification. */
2227 if (! CHECK_FLAG (peer->cap, PEER_CAP_DYNAMIC_ADV))
2228 {
2229 plog_err (peer->log, "%s [Error] BGP dynamic capability is not enabled",
2230 peer->host);
2231 bgp_notify_send (peer,
2232 BGP_NOTIFY_HEADER_ERR,
2233 BGP_NOTIFY_HEADER_BAD_MESTYPE);
2234 return -1;
2235 }
2236
2237 /* Status must be Established. */
2238 if (peer->status != Established)
2239 {
2240 plog_err (peer->log,
2241 "%s [Error] Dynamic capability packet received under status %s", peer->host, LOOKUP (bgp_status_msg, peer->status));
2242 bgp_notify_send (peer, BGP_NOTIFY_FSM_ERR, 0);
2243 return -1;
2244 }
2245
2246 /* Parse packet. */
2247 return bgp_capability_msg_parse (peer, pnt, size);
2248 }
2249 \f
2250 /* BGP read utility function. */
2251 static int
2252 bgp_read_packet (struct peer *peer)
2253 {
2254 int nbytes;
2255 int readsize;
2256
2257 readsize = peer->packet_size - stream_get_endp (peer->ibuf);
2258
2259 /* If size is zero then return. */
2260 if (! readsize)
2261 return 0;
2262
2263 /* Read packet from fd. */
2264 nbytes = stream_read_unblock (peer->ibuf, peer->fd, readsize);
2265
2266 /* If read byte is smaller than zero then error occured. */
2267 if (nbytes < 0)
2268 {
2269 if (errno == EAGAIN)
2270 return -1;
2271
2272 plog_err (peer->log, "%s [Error] bgp_read_packet error: %s",
2273 peer->host, safe_strerror (errno));
2274
2275 if (peer->status == Established)
2276 {
2277 if (CHECK_FLAG (peer->sflags, PEER_STATUS_NSF_MODE))
2278 {
2279 peer->last_reset = PEER_DOWN_NSF_CLOSE_SESSION;
2280 SET_FLAG (peer->sflags, PEER_STATUS_NSF_WAIT);
2281 }
2282 else
2283 peer->last_reset = PEER_DOWN_CLOSE_SESSION;
2284 }
2285
2286 BGP_EVENT_ADD (peer, TCP_fatal_error);
2287 return -1;
2288 }
2289
2290 /* When read byte is zero : clear bgp peer and return */
2291 if (nbytes == 0)
2292 {
2293 if (BGP_DEBUG (events, EVENTS))
2294 plog_debug (peer->log, "%s [Event] BGP connection closed fd %d",
2295 peer->host, peer->fd);
2296
2297 if (peer->status == Established)
2298 {
2299 if (CHECK_FLAG (peer->sflags, PEER_STATUS_NSF_MODE))
2300 {
2301 peer->last_reset = PEER_DOWN_NSF_CLOSE_SESSION;
2302 SET_FLAG (peer->sflags, PEER_STATUS_NSF_WAIT);
2303 }
2304 else
2305 peer->last_reset = PEER_DOWN_CLOSE_SESSION;
2306 }
2307
2308 BGP_EVENT_ADD (peer, TCP_connection_closed);
2309 return -1;
2310 }
2311
2312 /* We read partial packet. */
2313 if (stream_get_endp (peer->ibuf) != peer->packet_size)
2314 return -1;
2315
2316 return 0;
2317 }
2318
2319 /* Marker check. */
2320 static int
2321 bgp_marker_all_one (struct stream *s, int length)
2322 {
2323 int i;
2324
2325 for (i = 0; i < length; i++)
2326 if (s->data[i] != 0xff)
2327 return 0;
2328
2329 return 1;
2330 }
2331
2332 /* Starting point of packet process function. */
2333 int
2334 bgp_read (struct thread *thread)
2335 {
2336 int ret;
2337 u_char type = 0;
2338 struct peer *peer;
2339 bgp_size_t size;
2340 char notify_data_length[2];
2341
2342 /* Yes first of all get peer pointer. */
2343 peer = THREAD_ARG (thread);
2344 peer->t_read = NULL;
2345
2346 /* For non-blocking IO check. */
2347 if (peer->status == Connect)
2348 {
2349 bgp_connect_check (peer);
2350 goto done;
2351 }
2352 else
2353 {
2354 if (peer->fd < 0)
2355 {
2356 zlog_err ("bgp_read peer's fd is negative value %d", peer->fd);
2357 return -1;
2358 }
2359 BGP_READ_ON (peer->t_read, bgp_read, peer->fd);
2360 }
2361
2362 /* Read packet header to determine type of the packet */
2363 if (peer->packet_size == 0)
2364 peer->packet_size = BGP_HEADER_SIZE;
2365
2366 if (stream_get_endp (peer->ibuf) < BGP_HEADER_SIZE)
2367 {
2368 ret = bgp_read_packet (peer);
2369
2370 /* Header read error or partial read packet. */
2371 if (ret < 0)
2372 goto done;
2373
2374 /* Get size and type. */
2375 stream_forward_getp (peer->ibuf, BGP_MARKER_SIZE);
2376 memcpy (notify_data_length, stream_pnt (peer->ibuf), 2);
2377 size = stream_getw (peer->ibuf);
2378 type = stream_getc (peer->ibuf);
2379
2380 if (BGP_DEBUG (normal, NORMAL) && type != 2 && type != 0)
2381 zlog_debug ("%s rcv message type %d, length (excl. header) %d",
2382 peer->host, type, size - BGP_HEADER_SIZE);
2383
2384 /* Marker check */
2385 if (((type == BGP_MSG_OPEN) || (type == BGP_MSG_KEEPALIVE))
2386 && ! bgp_marker_all_one (peer->ibuf, BGP_MARKER_SIZE))
2387 {
2388 bgp_notify_send (peer,
2389 BGP_NOTIFY_HEADER_ERR,
2390 BGP_NOTIFY_HEADER_NOT_SYNC);
2391 goto done;
2392 }
2393
2394 /* BGP type check. */
2395 if (type != BGP_MSG_OPEN && type != BGP_MSG_UPDATE
2396 && type != BGP_MSG_NOTIFY && type != BGP_MSG_KEEPALIVE
2397 && type != BGP_MSG_ROUTE_REFRESH_NEW
2398 && type != BGP_MSG_ROUTE_REFRESH_OLD
2399 && type != BGP_MSG_CAPABILITY)
2400 {
2401 if (BGP_DEBUG (normal, NORMAL))
2402 plog_debug (peer->log,
2403 "%s unknown message type 0x%02x",
2404 peer->host, type);
2405 bgp_notify_send_with_data (peer,
2406 BGP_NOTIFY_HEADER_ERR,
2407 BGP_NOTIFY_HEADER_BAD_MESTYPE,
2408 &type, 1);
2409 goto done;
2410 }
2411 /* Mimimum packet length check. */
2412 if ((size < BGP_HEADER_SIZE)
2413 || (size > BGP_MAX_PACKET_SIZE)
2414 || (type == BGP_MSG_OPEN && size < BGP_MSG_OPEN_MIN_SIZE)
2415 || (type == BGP_MSG_UPDATE && size < BGP_MSG_UPDATE_MIN_SIZE)
2416 || (type == BGP_MSG_NOTIFY && size < BGP_MSG_NOTIFY_MIN_SIZE)
2417 || (type == BGP_MSG_KEEPALIVE && size != BGP_MSG_KEEPALIVE_MIN_SIZE)
2418 || (type == BGP_MSG_ROUTE_REFRESH_NEW && size < BGP_MSG_ROUTE_REFRESH_MIN_SIZE)
2419 || (type == BGP_MSG_ROUTE_REFRESH_OLD && size < BGP_MSG_ROUTE_REFRESH_MIN_SIZE)
2420 || (type == BGP_MSG_CAPABILITY && size < BGP_MSG_CAPABILITY_MIN_SIZE))
2421 {
2422 if (BGP_DEBUG (normal, NORMAL))
2423 plog_debug (peer->log,
2424 "%s bad message length - %d for %s",
2425 peer->host, size,
2426 type == 128 ? "ROUTE-REFRESH" :
2427 bgp_type_str[(int) type]);
2428 bgp_notify_send_with_data (peer,
2429 BGP_NOTIFY_HEADER_ERR,
2430 BGP_NOTIFY_HEADER_BAD_MESLEN,
2431 (u_char *) notify_data_length, 2);
2432 goto done;
2433 }
2434
2435 /* Adjust size to message length. */
2436 peer->packet_size = size;
2437 }
2438
2439 ret = bgp_read_packet (peer);
2440 if (ret < 0)
2441 goto done;
2442
2443 /* Get size and type again. */
2444 size = stream_getw_from (peer->ibuf, BGP_MARKER_SIZE);
2445 type = stream_getc_from (peer->ibuf, BGP_MARKER_SIZE + 2);
2446
2447 /* BGP packet dump function. */
2448 bgp_dump_packet (peer, type, peer->ibuf);
2449
2450 size = (peer->packet_size - BGP_HEADER_SIZE);
2451
2452 /* Read rest of the packet and call each sort of packet routine */
2453 switch (type)
2454 {
2455 case BGP_MSG_OPEN:
2456 peer->open_in++;
2457 bgp_open_receive (peer, size); /* XXX return value ignored! */
2458 break;
2459 case BGP_MSG_UPDATE:
2460 peer->readtime = time(NULL); /* Last read timer reset */
2461 bgp_update_receive (peer, size);
2462 break;
2463 case BGP_MSG_NOTIFY:
2464 bgp_notify_receive (peer, size);
2465 break;
2466 case BGP_MSG_KEEPALIVE:
2467 peer->readtime = time(NULL); /* Last read timer reset */
2468 bgp_keepalive_receive (peer, size);
2469 break;
2470 case BGP_MSG_ROUTE_REFRESH_NEW:
2471 case BGP_MSG_ROUTE_REFRESH_OLD:
2472 peer->refresh_in++;
2473 bgp_route_refresh_receive (peer, size);
2474 break;
2475 case BGP_MSG_CAPABILITY:
2476 peer->dynamic_cap_in++;
2477 bgp_capability_receive (peer, size);
2478 break;
2479 }
2480
2481 /* Clear input buffer. */
2482 peer->packet_size = 0;
2483 if (peer->ibuf)
2484 stream_reset (peer->ibuf);
2485
2486 done:
2487 if (CHECK_FLAG (peer->sflags, PEER_STATUS_ACCEPT_PEER))
2488 {
2489 if (BGP_DEBUG (events, EVENTS))
2490 zlog_debug ("%s [Event] Accepting BGP peer delete", peer->host);
2491 peer_delete (peer);
2492 }
2493 return 0;
2494 }