3 * Used to advertise routes for upstream (l2tp port, rather than gratuitous
4 * ARP) and downstream--allowing routers to load-balance both.
6 * Implementation limitations:
7 * - We never listen for incoming connections (session always initiated by us).
8 * - Any routes advertised by the peer are accepted, but ignored.
9 * - No password support; neither RFC1771 (which no-one seems to do anyway)
10 * nor RFC2385 (which requires a kernel patch on 2.4 kernels).
13 char const *cvs_id_bgp
= "$Id: bgp.c,v 1.12 2005/09/02 23:39:36 bodea Exp $";
20 #include <sys/socket.h>
21 #include <netinet/in.h>
22 #include <arpa/inet.h>
30 static void bgp_clear(struct bgp_peer
*peer
);
31 static void bgp_set_retry(struct bgp_peer
*peer
);
32 static void bgp_cidr(in_addr_t ip
, in_addr_t mask
, struct bgp_ip_prefix
*pfx
);
33 static struct bgp_route_list
*bgp_insert_route(struct bgp_route_list
*head
,
34 struct bgp_route_list
*new);
35 static struct bgp_route6_list
*bgp_insert_route6(struct bgp_route6_list
*head
,
36 struct bgp_route6_list
*new);
38 static void bgp_free_routes(struct bgp_route_list
*routes
);
39 static void bgp_free_routes6(struct bgp_route6_list
*routes
);
40 static char const *bgp_msg_type_str(uint8_t type
);
41 static int bgp_connect(struct bgp_peer
*peer
);
42 static int bgp_handle_connect(struct bgp_peer
*peer
);
43 static int bgp_write(struct bgp_peer
*peer
);
44 static int bgp_read(struct bgp_peer
*peer
);
45 static int bgp_handle_input(struct bgp_peer
*peer
);
46 static int bgp_send_open(struct bgp_peer
*peer
);
47 static int bgp_send_keepalive(struct bgp_peer
*peer
);
48 static int bgp_send_update(struct bgp_peer
*peer
);
49 static int bgp_send_update6(struct bgp_peer
*peer
);
50 static int bgp_send_notification(struct bgp_peer
*peer
, uint8_t code
,
52 static int bgp_send_notification_full(struct bgp_peer
*peer
, uint8_t code
,
53 uint8_t subcode
, char *notification_data
, uint16_t data_len
);
55 static uint16_t our_as
;
56 static struct bgp_route_list
*bgp_routes
= 0;
57 static struct bgp_route6_list
*bgp_routes6
= 0;
59 int bgp_configured
= 0;
60 struct bgp_peer
*bgp_peers
= 0;
62 /* prepare peer structure, globals */
66 struct bgp_peer
*peer
;
68 for (i
= 0; i
< BGP_NUM_PEERS
; i
++)
71 memset(peer
, 0, sizeof(*peer
));
73 peer
->addr
= INADDR_NONE
;
75 peer
->state
= peer
->next_state
= Disabled
;
77 if (!((peer
->outbuf
= malloc(sizeof(*peer
->outbuf
)))
78 && (peer
->inbuf
= malloc(sizeof(*peer
->inbuf
)))))
80 LOG(0, 0, 0, "Can't allocate buffers for bgp peer (%s)\n",
86 peer
->edata
.type
= FD_TYPE_BGP
;
87 peer
->edata
.index
= i
;
99 bgp_configured
= 0; /* set by bgp_start */
104 /* start connection with a peer */
105 int bgp_start(struct bgp_peer
*peer
, char *name
, int as
, int keepalive
,
106 int hold
, int enable
)
111 struct bgp_path_attr a
;
113 char *p
= path_attrs
;
115 uint32_t metric
= htonl(BGP_METRIC
);
116 uint32_t no_export
= htonl(BGP_COMMUNITY_NO_EXPORT
);
121 if (peer
->state
!= Disabled
)
124 snprintf(peer
->name
, sizeof(peer
->name
), "%s", name
);
126 if (!(h
= gethostbyname(name
)) || h
->h_addrtype
!= AF_INET
)
128 LOG(0, 0, 0, "Can't get address for BGP peer %s (%s)\n",
129 name
, h
? "no address" : hstrerror(h_errno
));
134 memcpy(&peer
->addr
, h
->h_addr
, sizeof(peer
->addr
));
135 peer
->as
= as
> 0 ? as
: our_as
;
136 ibgp
= peer
->as
== our_as
;
138 /* set initial timer values */
139 peer
->init_keepalive
= keepalive
== -1 ? BGP_KEEPALIVE_TIME
: keepalive
;
140 peer
->init_hold
= hold
== -1 ? BGP_HOLD_TIME
: hold
;
142 if (peer
->init_hold
< 3)
145 if (peer
->init_keepalive
* 3 > peer
->init_hold
)
146 peer
->init_keepalive
= peer
->init_hold
/ 3;
148 /* clear buffers, go to Idle state */
149 peer
->next_state
= Idle
;
152 /* set initial routing state */
153 peer
->routing
= enable
;
155 /* all our routes use the same attributes, so prepare it in advance */
156 if (peer
->path_attrs
)
157 free(peer
->path_attrs
);
159 peer
->path_attr_len
= 0;
162 a
.flags
= BGP_PATH_ATTR_FLAG_TRANS
;
163 a
.code
= BGP_PATH_ATTR_CODE_ORIGIN
;
165 a
.data
.s
.value
[0] = BGP_PATH_ATTR_CODE_ORIGIN_IGP
;
167 #define ADD_ATTRIBUTE() do { \
168 i = BGP_PATH_ATTR_SIZE(a); \
171 peer->path_attr_len += i; } while (0)
176 a
.flags
= BGP_PATH_ATTR_FLAG_TRANS
;
177 a
.code
= BGP_PATH_ATTR_CODE_AS_PATH
;
191 BGP_PATH_ATTR_CODE_AS_PATH_AS_SEQUENCE
,
196 a
.data
.s
.len
= sizeof(as_path
);
197 memcpy(&a
.data
.s
.value
, &as_path
, sizeof(as_path
));
202 /* MULTI_EXIT_DISC */
203 a
.flags
= BGP_PATH_ATTR_FLAG_OPTIONAL
;
204 a
.code
= BGP_PATH_ATTR_CODE_MULTI_EXIT_DISC
;
205 a
.data
.s
.len
= sizeof(metric
);
206 memcpy(a
.data
.s
.value
, &metric
, sizeof(metric
));
212 uint32_t local_pref
= htonl(BGP_LOCAL_PREF
);
215 a
.flags
= BGP_PATH_ATTR_FLAG_TRANS
;
216 a
.code
= BGP_PATH_ATTR_CODE_LOCAL_PREF
;
217 a
.data
.s
.len
= sizeof(local_pref
);
218 memcpy(a
.data
.s
.value
, &local_pref
, sizeof(local_pref
));
224 a
.flags
= BGP_PATH_ATTR_FLAG_OPTIONAL
| BGP_PATH_ATTR_FLAG_TRANS
;
225 a
.code
= BGP_PATH_ATTR_CODE_COMMUNITIES
;
226 a
.data
.s
.len
= sizeof(no_export
);
227 memcpy(a
.data
.s
.value
, &no_export
, sizeof(no_export
));
231 /* remember the len before adding NEXT_HOP */
232 peer
->path_attr_len_without_nexthop
= peer
->path_attr_len
;
235 a
.flags
= BGP_PATH_ATTR_FLAG_TRANS
;
236 a
.code
= BGP_PATH_ATTR_CODE_NEXT_HOP
;
237 ip
= my_address
; /* we're it */
238 a
.data
.s
.len
= sizeof(ip
);
239 memcpy(a
.data
.s
.value
, &ip
, sizeof(ip
));
243 if (!(peer
->path_attrs
= malloc(peer
->path_attr_len
)))
245 LOG(0, 0, 0, "Can't allocate path_attrs for %s (%s)\n",
246 name
, strerror(errno
));
251 memcpy(peer
->path_attrs
, path_attrs
, peer
->path_attr_len
);
253 LOG(4, 0, 0, "Initiating BGP connection to %s (routing %s)\n",
254 name
, enable
? "enabled" : "suspended");
256 /* we have at least one peer configured */
260 return bgp_connect(peer
);
263 /* clear counters, timers, routes and buffers; close socket; move to
264 next_state, which may be Disabled or Idle */
265 static void bgp_clear(struct bgp_peer
*peer
)
267 if (peer
->sock
!= -1)
273 peer
->keepalive_time
= 0;
274 peer
->expire_time
= 0;
276 peer
->keepalive
= peer
->init_keepalive
;
277 peer
->hold
= peer
->init_hold
;
279 bgp_free_routes(peer
->routes
);
281 bgp_free_routes6(peer
->routes6
);
284 peer
->outbuf
->packet
.header
.len
= 0;
285 peer
->outbuf
->done
= 0;
286 peer
->inbuf
->packet
.header
.len
= 0;
287 peer
->inbuf
->done
= 0;
292 if (peer
->state
!= peer
->next_state
)
294 peer
->state
= peer
->next_state
;
295 peer
->state_time
= time_now
;
297 LOG(4, 0, 0, "BGP peer %s: state %s\n", peer
->name
,
298 bgp_state_str(peer
->next_state
));
302 /* initiate a clean shutdown */
303 void bgp_stop(struct bgp_peer
*peer
)
305 LOG(4, 0, 0, "Terminating BGP connection to %s\n", peer
->name
);
306 bgp_send_notification(peer
, BGP_ERR_CEASE
, 0);
309 /* drop connection (if any) and set state to Disabled */
310 void bgp_halt(struct bgp_peer
*peer
)
312 LOG(4, 0, 0, "Aborting BGP connection to %s\n", peer
->name
);
313 peer
->next_state
= Disabled
;
317 /* drop connection (if any) and set to Idle for connection retry */
318 int bgp_restart(struct bgp_peer
*peer
)
320 peer
->next_state
= Idle
;
324 peer
->retry_time
= time_now
;
325 peer
->retry_count
= 0;
328 return bgp_connect(peer
);
331 static void bgp_set_retry(struct bgp_peer
*peer
)
333 if (peer
->retry_count
++ < BGP_MAX_RETRY
)
335 peer
->retry_time
= time_now
+ (BGP_RETRY_BACKOFF
* peer
->retry_count
);
336 peer
->next_state
= Idle
;
340 bgp_halt(peer
); /* give up */
343 /* convert ip/mask to CIDR notation */
344 static void bgp_cidr(in_addr_t ip
, in_addr_t mask
, struct bgp_ip_prefix
*pfx
)
349 /* convert to prefix notation */
353 if (!mask
) /* bogus */
356 for (i
= 0; i
< 32 && ((b
= ntohl(1 << i
)), !(mask
& b
)); i
++)
363 /* insert route into list; sorted */
364 static struct bgp_route_list
*bgp_insert_route(struct bgp_route_list
*head
,
365 struct bgp_route_list
*new)
367 struct bgp_route_list
*p
= head
;
368 struct bgp_route_list
*e
= 0;
370 while (p
&& memcmp(&p
->dest
, &new->dest
, sizeof(p
->dest
)) < 0)
390 /* insert route6 into list; sorted */
391 static struct bgp_route6_list
*bgp_insert_route6(struct bgp_route6_list
*head
,
392 struct bgp_route6_list
*new)
394 struct bgp_route6_list
*p
= head
;
395 struct bgp_route6_list
*e
= 0;
397 while (p
&& memcmp(&p
->dest
, &new->dest
, sizeof(p
->dest
)) < 0)
417 /* add route to list for peers */
419 * Note: this doesn't do route aggregation, nor drop routes if a less
420 * specific match already exists (partly because I'm lazy, but also so
421 * that if that route is later deleted we don't have to be concerned
422 * about adding back the more specific one).
424 int bgp_add_route(in_addr_t ip
, in_addr_t mask
)
426 struct bgp_route_list
*r
= bgp_routes
;
427 struct bgp_route_list add
;
430 bgp_cidr(ip
, mask
, &add
.dest
);
433 /* check for duplicate */
436 i
= memcmp(&r
->dest
, &add
.dest
, sizeof(r
->dest
));
438 return 1; /* already covered */
446 /* insert into route list; sorted */
447 if (!(r
= malloc(sizeof(*r
))))
449 LOG(0, 0, 0, "Can't allocate route for %s/%d (%s)\n",
450 fmtaddr(add
.dest
.prefix
, 0), add
.dest
.len
, strerror(errno
));
455 memcpy(r
, &add
, sizeof(*r
));
456 bgp_routes
= bgp_insert_route(bgp_routes
, r
);
458 /* flag established peers for update */
459 for (i
= 0; i
< BGP_NUM_PEERS
; i
++)
460 if (bgp_peers
[i
].state
== Established
)
461 bgp_peers
[i
].update_routes
= 1;
463 LOG(4, 0, 0, "Registered BGP route %s/%d\n",
464 fmtaddr(add
.dest
.prefix
, 0), add
.dest
.len
);
469 /* add route to list for peers */
471 * Note: same provisions as above
473 int bgp_add_route6(struct in6_addr ip
, int prefixlen
)
475 struct bgp_route6_list
*r
= bgp_routes6
;
476 struct bgp_route6_list add
;
478 char ipv6addr
[INET6_ADDRSTRLEN
];
480 memcpy(&add
.dest
.prefix
, &ip
.s6_addr
, 16);
481 add
.dest
.len
= prefixlen
;
484 /* check for duplicate */
487 i
= memcmp(&r
->dest
, &add
.dest
, sizeof(r
->dest
));
489 return 1; /* already covered */
497 /* insert into route list; sorted */
498 if (!(r
= malloc(sizeof(*r
))))
500 LOG(0, 0, 0, "Can't allocate route for %s/%d (%s)\n",
501 inet_ntop(AF_INET6
, &ip
, ipv6addr
, INET6_ADDRSTRLEN
), add
.dest
.len
,
507 memcpy(r
, &add
, sizeof(*r
));
508 bgp_routes6
= bgp_insert_route6(bgp_routes6
, r
);
510 /* flag established peers for update */
511 for (i
= 0; i
< BGP_NUM_PEERS
; i
++)
512 if (bgp_peers
[i
].state
== Established
)
513 bgp_peers
[i
].update_routes6
= 1;
515 LOG(4, 0, 0, "Registered BGP route %s/%d\n",
516 inet_ntop(AF_INET6
, &ip
, ipv6addr
, INET6_ADDRSTRLEN
), add
.dest
.len
);
521 /* remove route from list for peers */
522 int bgp_del_route(in_addr_t ip
, in_addr_t mask
)
524 struct bgp_route_list
*r
= bgp_routes
;
525 struct bgp_route_list
*e
= 0;
526 struct bgp_route_list del
;
529 bgp_cidr(ip
, mask
, &del
.dest
);
532 /* find entry in routes list and remove */
535 i
= memcmp(&r
->dest
, &del
.dest
, sizeof(r
->dest
));
541 bgp_routes
= r
->next
;
559 /* flag established peers for update */
560 for (i
= 0; i
< BGP_NUM_PEERS
; i
++)
561 if (bgp_peers
[i
].state
== Established
)
562 bgp_peers
[i
].update_routes
= 1;
564 LOG(4, 0, 0, "Removed BGP route %s/%d\n",
565 fmtaddr(del
.dest
.prefix
, 0), del
.dest
.len
);
570 /* remove route from list for peers */
571 int bgp_del_route6(struct in6_addr ip
, int prefixlen
)
573 struct bgp_route6_list
*r
= bgp_routes6
;
574 struct bgp_route6_list
*e
= 0;
575 struct bgp_route6_list del
;
577 char ipv6addr
[INET6_ADDRSTRLEN
];
579 memcpy(&del
.dest
.prefix
, &ip
.s6_addr
, 16);
580 del
.dest
.len
= prefixlen
;
583 /* find entry in routes list and remove */
586 i
= memcmp(&r
->dest
, &del
.dest
, sizeof(r
->dest
));
592 bgp_routes6
= r
->next
;
610 /* flag established peers for update */
611 for (i
= 0; i
< BGP_NUM_PEERS
; i
++)
612 if (bgp_peers
[i
].state
== Established
)
613 bgp_peers
[i
].update_routes6
= 1;
615 LOG(4, 0, 0, "Removed BGP route %s/%d\n",
616 inet_ntop(AF_INET6
, &ip
, ipv6addr
, INET6_ADDRSTRLEN
), del
.dest
.len
);
621 /* enable or disable routing */
622 void bgp_enable_routing(int enable
)
626 for (i
= 0; i
< BGP_NUM_PEERS
; i
++)
628 bgp_peers
[i
].routing
= enable
;
630 /* flag established peers for update */
631 if (bgp_peers
[i
].state
== Established
)
632 bgp_peers
[i
].update_routes
= 1;
635 LOG(4, 0, 0, "%s BGP routing\n", enable
? "Enabled" : "Suspended");
639 # include <sys/epoll.h>
641 # include "fake_epoll.h"
644 /* return a bitmask of the events required to poll this peer's fd */
652 for (i
= 0; i
< BGP_NUM_PEERS
; i
++)
654 struct bgp_peer
*peer
= &bgp_peers
[i
];
657 if (peer
->state
== Disabled
|| peer
->state
== Idle
)
660 if (peer
->inbuf
->done
< BGP_MAX_PACKET_SIZE
)
663 if (peer
->state
== Connect
|| /* connection in progress */
664 peer
->update_routes
|| /* routing updates */
665 peer
->outbuf
->packet
.header
.len
) /* pending output */
668 if (peer
->events
!= events
)
670 struct epoll_event ev
;
672 ev
.events
= peer
->events
= events
;
673 ev
.data
.ptr
= &peer
->edata
;
674 epoll_ctl(epollfd
, EPOLL_CTL_MOD
, peer
->sock
, &ev
);
681 /* process bgp events/timers */
682 int bgp_process(uint32_t events
[])
689 for (i
= 0; i
< BGP_NUM_PEERS
; i
++)
691 struct bgp_peer
*peer
= &bgp_peers
[i
];
693 if (*peer
->name
&& peer
->cli_flag
== BGP_CLI_RESTART
)
699 if (peer
->state
== Disabled
)
704 switch (peer
->cli_flag
)
706 case BGP_CLI_SUSPEND
:
710 if (peer
->state
== Established
)
711 peer
->update_routes
= 1;
720 if (peer
->state
== Established
)
721 peer
->update_routes
= 1;
730 /* handle empty/fill of buffers */
731 if (events
[i
] & EPOLLOUT
)
734 if (peer
->state
== Connect
)
735 r
= bgp_handle_connect(peer
);
736 else if (peer
->outbuf
->packet
.header
.len
)
743 if (events
[i
] & (EPOLLIN
|EPOLLHUP
))
749 /* process input buffer contents */
750 while (peer
->inbuf
->done
>= sizeof(peer
->inbuf
->packet
.header
)
751 && !peer
->outbuf
->packet
.header
.len
) /* may need to queue a response */
753 if (bgp_handle_input(peer
) < 0)
757 /* process pending updates */
758 if (peer
->update_routes
759 && !peer
->outbuf
->packet
.header
.len
) /* ditto */
761 if (!bgp_send_update(peer
))
765 /* process pending IPv6 updates */
766 if (peer
->update_routes6
767 && !peer
->outbuf
->packet
.header
.len
) /* ditto */
769 if (!bgp_send_update6(peer
))
774 if (peer
->state
== Established
)
776 if (time_now
> peer
->expire_time
)
778 LOG(1, 0, 0, "No message from BGP peer %s in %ds\n",
779 peer
->name
, peer
->hold
);
781 bgp_send_notification(peer
, BGP_ERR_HOLD_TIMER_EXP
, 0);
785 if (time_now
> peer
->keepalive_time
&& !peer
->outbuf
->packet
.header
.len
)
786 bgp_send_keepalive(peer
);
788 else if (peer
->state
== Idle
)
790 if (time_now
> peer
->retry_time
)
793 else if (time_now
> peer
->state_time
+ BGP_STATE_TIME
)
795 LOG(1, 0, 0, "%s timer expired for BGP peer %s\n",
796 bgp_state_str(peer
->state
), peer
->name
);
805 static void bgp_free_routes(struct bgp_route_list
*routes
)
807 struct bgp_route_list
*tmp
;
809 while ((tmp
= routes
))
816 static void bgp_free_routes6(struct bgp_route6_list
*routes
)
818 struct bgp_route6_list
*tmp
;
820 while ((tmp
= routes
))
827 char const *bgp_state_str(enum bgp_state state
)
831 case Disabled
: return "Disabled";
832 case Idle
: return "Idle";
833 case Connect
: return "Connect";
834 case Active
: return "Active";
835 case OpenSent
: return "OpenSent";
836 case OpenConfirm
: return "OpenConfirm";
837 case Established
: return "Established";
843 static char const *bgp_msg_type_str(uint8_t type
)
847 case BGP_MSG_OPEN
: return "OPEN";
848 case BGP_MSG_UPDATE
: return "UPDATE";
849 case BGP_MSG_NOTIFICATION
: return "NOTIFICATION";
850 case BGP_MSG_KEEPALIVE
: return "KEEPALIVE";
856 /* attempt to connect to peer */
857 static int bgp_connect(struct bgp_peer
*peer
)
859 static int bgp_port
= 0;
860 struct sockaddr_in addr
;
861 struct epoll_event ev
;
865 struct servent
*serv
;
866 if (!(serv
= getservbyname("bgp", "tcp")))
868 LOG(0, 0, 0, "Can't get bgp service (%s)\n", strerror(errno
));
872 bgp_port
= serv
->s_port
;
875 if ((peer
->sock
= socket(PF_INET
, SOCK_STREAM
, IPPROTO_TCP
)) < 0)
877 LOG(0, 0, 0, "Can't create a socket for BGP peer %s (%s)\n",
878 peer
->name
, strerror(errno
));
880 peer
->state
= peer
->next_state
= Disabled
;
884 /* add to poll set */
885 ev
.events
= peer
->events
= EPOLLOUT
;
886 ev
.data
.ptr
= &peer
->edata
;
887 epoll_ctl(epollfd
, EPOLL_CTL_ADD
, peer
->sock
, &ev
);
889 /* set to non-blocking */
890 fcntl(peer
->sock
, F_SETFL
, fcntl(peer
->sock
, F_GETFL
, 0) | O_NONBLOCK
);
893 memset(&addr
, 0, sizeof(addr
));
894 addr
.sin_family
= AF_INET
;
895 addr
.sin_port
= bgp_port
;
896 addr
.sin_addr
.s_addr
= peer
->addr
;
898 while (connect(peer
->sock
, (struct sockaddr
*) &addr
, sizeof(addr
)) == -1)
900 if (errno
== EINTR
) /* SIGALARM handler */
903 if (errno
!= EINPROGRESS
)
905 LOG(1, 0, 0, "Can't connect to BGP peer %s (%s)\n",
906 inet_ntoa(addr
.sin_addr
), strerror(errno
));
912 peer
->state
= Connect
;
913 peer
->state_time
= time_now
;
915 LOG(4, 0, 0, "BGP peer %s: state Connect\n", peer
->name
);
919 peer
->state
= Active
;
920 peer
->state_time
= time_now
;
921 peer
->retry_time
= peer
->retry_count
= 0;
923 LOG(4, 0, 0, "BGP peer %s: state Active\n", inet_ntoa(addr
.sin_addr
));
925 peer
->handle_ipv6_routes
= 0;
927 return bgp_send_open(peer
);
930 /* complete partial connection (state = Connect) */
931 static int bgp_handle_connect(struct bgp_peer
*peer
)
934 socklen_t len
= sizeof(int);
935 getsockopt(peer
->sock
, SOL_SOCKET
, SO_ERROR
, &err
, &len
);
938 LOG(1, 0, 0, "Can't connect to BGP peer %s (%s)\n", peer
->name
,
945 peer
->state
= Active
;
946 peer
->state_time
= time_now
;
948 LOG(4, 0, 0, "BGP peer %s: state Active\n", peer
->name
);
950 peer
->handle_ipv6_routes
= 0;
952 return bgp_send_open(peer
);
955 /* initiate a write */
956 static int bgp_write(struct bgp_peer
*peer
)
958 int len
= htons(peer
->outbuf
->packet
.header
.len
);
961 while ((r
= write(peer
->sock
, &peer
->outbuf
->packet
+ peer
->outbuf
->done
,
962 len
- peer
->outbuf
->done
)) == -1)
971 LOG(1, 0, 0, "Connection to BGP peer %s closed\n", peer
->name
);
973 LOG(1, 0, 0, "Can't write to BGP peer %s (%s)\n", peer
->name
,
982 peer
->outbuf
->done
+= r
;
986 LOG(4, 0, 0, "Sent %s to BGP peer %s\n",
987 bgp_msg_type_str(peer
->outbuf
->packet
.header
.type
), peer
->name
);
989 peer
->outbuf
->packet
.header
.len
= 0;
990 peer
->outbuf
->done
= 0;
992 if (peer
->state
== Established
)
993 peer
->keepalive_time
= time_now
+ peer
->keepalive
;
995 if (peer
->state
!= peer
->next_state
)
997 if (peer
->next_state
== Disabled
|| peer
->next_state
== Idle
)
1003 peer
->state
= peer
->next_state
;
1004 peer
->state_time
= time_now
;
1006 LOG(4, 0, 0, "BGP peer %s: state %s\n", peer
->name
,
1007 bgp_state_str(peer
->state
));
1013 /* initiate a read */
1014 static int bgp_read(struct bgp_peer
*peer
)
1018 while ((r
= read(peer
->sock
, &peer
->inbuf
->packet
+ peer
->inbuf
->done
,
1019 BGP_MAX_PACKET_SIZE
- peer
->inbuf
->done
)) < 1)
1023 LOG(1, 0, 0, "Connection to BGP peer %s closed\n", peer
->name
);
1030 if (errno
== EAGAIN
)
1033 LOG(1, 0, 0, "Can't read from BGP peer %s (%s)\n", peer
->name
,
1037 bgp_set_retry(peer
);
1041 peer
->inbuf
->done
+= r
;
1045 /* process buffered packets */
1046 static int bgp_handle_input(struct bgp_peer
*peer
)
1048 struct bgp_packet
*p
= &peer
->inbuf
->packet
;
1049 int len
= ntohs(p
->header
.len
);
1051 if (len
> BGP_MAX_PACKET_SIZE
)
1053 LOG(1, 0, 0, "Bad header length from BGP %s\n", peer
->name
);
1054 bgp_send_notification(peer
, BGP_ERR_HEADER
, BGP_ERR_HDR_BAD_LEN
);
1058 if (peer
->inbuf
->done
< len
)
1061 LOG(4, 0, 0, "Received %s from BGP peer %s\n",
1062 bgp_msg_type_str(p
->header
.type
), peer
->name
);
1064 switch (p
->header
.type
)
1068 struct bgp_data_open data
;
1071 off_t param_offset
, capability_offset
;
1072 struct bgp_opt_param
*param
;
1073 uint8_t capabilities_len
;
1074 char *capabilities
= NULL
;
1075 struct bgp_capability
*capability
;
1076 struct bgp_mp_cap_param
*mp_cap
;
1078 for (i
= 0; i
< sizeof(p
->header
.marker
); i
++)
1080 if ((unsigned char) p
->header
.marker
[i
] != 0xff)
1082 LOG(1, 0, 0, "Invalid marker from BGP peer %s\n",
1085 bgp_send_notification(peer
, BGP_ERR_HEADER
,
1086 BGP_ERR_HDR_NOT_SYNC
);
1092 if (peer
->state
!= OpenSent
)
1094 LOG(1, 0, 0, "OPEN from BGP peer %s in %s state\n",
1095 peer
->name
, bgp_state_str(peer
->state
));
1097 bgp_send_notification(peer
, BGP_ERR_FSM
, 0);
1101 memcpy(&data
, p
->data
, len
- sizeof(p
->header
));
1103 if (data
.version
!= BGP_VERSION
)
1105 LOG(1, 0, 0, "Bad version (%d) sent by BGP peer %s\n",
1106 (int) data
.version
, peer
->name
);
1108 bgp_send_notification(peer
, BGP_ERR_OPEN
, BGP_ERR_OPN_VERSION
);
1112 if (ntohs(data
.as
) != peer
->as
)
1114 LOG(1, 0, 0, "Bad AS sent by BGP peer %s (got %d, "
1115 "expected %d)\n", peer
->name
, (int) htons(data
.as
),
1118 bgp_send_notification(peer
, BGP_ERR_OPEN
, BGP_ERR_OPN_BAD_AS
);
1122 if ((hold
= ntohs(data
.hold_time
)) < 3)
1124 LOG(1, 0, 0, "Bad hold time (%d) from BGP peer %s\n",
1127 bgp_send_notification(peer
, BGP_ERR_OPEN
, BGP_ERR_OPN_HOLD_TIME
);
1131 /* pick lowest hold time */
1132 if (hold
< peer
->hold
)
1135 /* adjust our keepalive based on negotiated hold value */
1136 if (peer
->keepalive
* 3 > peer
->hold
)
1137 peer
->keepalive
= peer
->hold
/ 3;
1139 /* check for optional parameters */
1140 /* 2 is for the size of type + len (both uint8_t) */
1141 for (param_offset
= 0;
1142 param_offset
< data
.opt_len
;
1143 param_offset
+= 2 + param
->len
)
1145 param
= (struct bgp_opt_param
*)(&data
.opt_params
+ param_offset
);
1147 /* sensible check */
1148 if (data
.opt_len
- param_offset
< 2
1149 || param
->len
> data
.opt_len
- param_offset
- 2)
1151 LOG(1, 0, 0, "Malformed Optional Parameter list from BGP peer %s\n",
1154 bgp_send_notification(peer
, BGP_ERR_OPEN
, BGP_ERR_UNSPEC
);
1158 /* we know only one parameter type */
1159 if (param
->type
!= BGP_PARAM_TYPE_CAPABILITY
)
1161 LOG(1, 0, 0, "Unsupported Optional Parameter type %d from BGP peer %s\n",
1162 param
->type
, peer
->name
);
1164 bgp_send_notification(peer
, BGP_ERR_OPEN
, BGP_ERR_OPN_UNSUP_PARAM
);
1168 capabilities_len
= param
->len
;
1169 capabilities
= (char *)¶m
->value
;
1172 /* look for BGP multiprotocol capability */
1175 for (capability_offset
= 0;
1176 capability_offset
< capabilities_len
;
1177 capability_offset
+= 2 + capability
->len
)
1179 capability
= (struct bgp_capability
*)(capabilities
+ capability_offset
);
1181 /* sensible check */
1182 if (capabilities_len
- capability_offset
< 2
1183 || capability
->len
> capabilities_len
- capability_offset
- 2)
1185 LOG(1, 0, 0, "Malformed Capabilities list from BGP peer %s\n",
1188 bgp_send_notification(peer
, BGP_ERR_OPEN
, BGP_ERR_UNSPEC
);
1192 /* we only know one capability code */
1193 if (capability
->code
!= BGP_CAP_CODE_MP
1194 && capability
->len
!= sizeof(struct bgp_mp_cap_param
))
1196 LOG(4, 0, 0, "Unsupported Capability code %d from BGP peer %s\n",
1197 capability
->code
, peer
->name
);
1199 bgp_send_notification_full(peer
, BGP_ERR_OPEN
, BGP_ERR_OPN_UNSUP_CAP
,
1200 (char *)capability
, 2 + capability
->len
);
1201 /* we don't terminate, still; we just jump to the next one */
1205 mp_cap
= (struct bgp_mp_cap_param
*)&capability
->value
;
1206 /* the only <AFI, SAFI> tuple we support */
1207 if (ntohs(mp_cap
->afi
) != AF_INET6
&& mp_cap
->safi
!= BGP_MP_SAFI_UNICAST
)
1209 LOG(4, 0, 0, "Unsupported multiprotocol AFI %d and SAFI %d from BGP peer %s\n",
1210 mp_cap
->afi
, mp_cap
->safi
, peer
->name
);
1212 bgp_send_notification_full(peer
, BGP_ERR_OPEN
, BGP_ERR_OPN_UNSUP_CAP
,
1213 (char *)capability
, 2 + capability
->len
);
1214 /* we don't terminate, still; we just jump to the next one */
1218 peer
->handle_ipv6_routes
= 1;
1222 /* next transition requires an exchange of keepalives */
1223 bgp_send_keepalive(peer
);
1228 case BGP_MSG_KEEPALIVE
:
1229 if (peer
->state
== OpenConfirm
)
1231 peer
->state
= peer
->next_state
= Established
;
1232 peer
->state_time
= time_now
;
1233 peer
->keepalive_time
= time_now
+ peer
->keepalive
;
1234 peer
->update_routes
= 1;
1235 peer
->retry_count
= 0;
1236 peer
->retry_time
= 0;
1238 LOG(4, 0, 0, "BGP peer %s: state Established\n", peer
->name
);
1243 case BGP_MSG_NOTIFICATION
:
1244 if (len
> sizeof(p
->header
))
1246 struct bgp_data_notification
*notification
=
1247 (struct bgp_data_notification
*) p
->data
;
1249 if (notification
->error_code
== BGP_ERR_CEASE
)
1251 LOG(4, 0, 0, "BGP peer %s sent CEASE\n", peer
->name
);
1256 if (notification
->error_code
== BGP_ERR_OPEN
1257 && notification
->error_subcode
== BGP_ERR_OPN_UNSUP_CAP
)
1259 /* the only capability we advertise is this one, so upon receiving
1260 an "unsupported capability" message, we disable IPv6 routes for
1262 LOG(4, 0, 0, "BGP peer %s doesn't support IPv6 routes advertisement\n", peer
->name
);
1263 peer
->handle_ipv6_routes
= 0;
1267 /* FIXME: should handle more notifications */
1268 LOG(4, 0, 0, "BGP peer %s sent unhandled NOTIFICATION %d\n",
1269 peer
->name
, (int) notification
->error_code
);
1276 peer
->expire_time
= time_now
+ peer
->hold
;
1278 /* see if there's another message in the same packet/buffer */
1279 if (peer
->inbuf
->done
> len
)
1281 peer
->inbuf
->done
-= len
;
1282 memmove(p
, (char *) p
+ len
, peer
->inbuf
->done
);
1286 peer
->inbuf
->packet
.header
.len
= 0;
1287 peer
->inbuf
->done
= 0;
1290 return peer
->inbuf
->done
;
1293 /* send/buffer OPEN message */
1294 static int bgp_send_open(struct bgp_peer
*peer
)
1296 struct bgp_data_open data
;
1297 struct bgp_mp_cap_param mp_ipv6
= { htons(AF_INET6
), 0, BGP_MP_SAFI_UNICAST
};
1298 struct bgp_capability cap_mp_ipv6
;
1299 struct bgp_opt_param param_cap_mp_ipv6
;
1300 uint16_t len
= sizeof(peer
->outbuf
->packet
.header
);
1302 memset(peer
->outbuf
->packet
.header
.marker
, 0xff,
1303 sizeof(peer
->outbuf
->packet
.header
.marker
));
1305 peer
->outbuf
->packet
.header
.type
= BGP_MSG_OPEN
;
1307 data
.version
= BGP_VERSION
;
1308 data
.as
= htons(our_as
);
1309 data
.hold_time
= htons(peer
->hold
);
1310 data
.identifier
= my_address
;
1312 /* construct the param and capability */
1313 cap_mp_ipv6
.code
= BGP_CAP_CODE_MP
;
1314 cap_mp_ipv6
.len
= sizeof(mp_ipv6
);
1315 memcpy(&cap_mp_ipv6
.value
, &mp_ipv6
, cap_mp_ipv6
.len
);
1317 param_cap_mp_ipv6
.type
= BGP_PARAM_TYPE_CAPABILITY
;
1318 param_cap_mp_ipv6
.len
= 2 + sizeof(mp_ipv6
);
1319 memcpy(¶m_cap_mp_ipv6
.value
, &cap_mp_ipv6
, param_cap_mp_ipv6
.len
);
1321 data
.opt_len
= 2 + param_cap_mp_ipv6
.len
;
1322 memcpy(&data
.opt_params
, ¶m_cap_mp_ipv6
, data
.opt_len
);
1324 memcpy(peer
->outbuf
->packet
.data
, &data
, BGP_DATA_OPEN_SIZE
);
1325 len
+= BGP_DATA_OPEN_SIZE
;
1327 peer
->outbuf
->packet
.header
.len
= htons(len
);
1328 peer
->outbuf
->done
= 0;
1329 peer
->next_state
= OpenSent
;
1331 return bgp_write(peer
);
1334 /* send/buffer KEEPALIVE message */
1335 static int bgp_send_keepalive(struct bgp_peer
*peer
)
1337 memset(peer
->outbuf
->packet
.header
.marker
, 0xff,
1338 sizeof(peer
->outbuf
->packet
.header
.marker
));
1340 peer
->outbuf
->packet
.header
.type
= BGP_MSG_KEEPALIVE
;
1341 peer
->outbuf
->packet
.header
.len
=
1342 htons(sizeof(peer
->outbuf
->packet
.header
));
1344 peer
->outbuf
->done
= 0;
1345 peer
->next_state
= (peer
->state
== OpenSent
) ? OpenConfirm
: peer
->state
;
1347 return bgp_write(peer
);
1350 /* send/buffer UPDATE message */
1351 static int bgp_send_update(struct bgp_peer
*peer
)
1353 uint16_t unf_len
= 0;
1355 uint16_t len
= sizeof(peer
->outbuf
->packet
.header
);
1356 struct bgp_route_list
*have
= peer
->routes
;
1357 struct bgp_route_list
*want
= peer
->routing
? bgp_routes
: 0;
1358 struct bgp_route_list
*e
= 0;
1359 struct bgp_route_list
*add
= 0;
1362 char *data
= (char *) &peer
->outbuf
->packet
.data
;
1364 /* need leave room for attr_len, bgp_path_attrs and one prefix */
1365 char *max
= (char *) &peer
->outbuf
->packet
.data
1366 + sizeof(peer
->outbuf
->packet
.data
)
1367 - sizeof(attr_len
) - peer
->path_attr_len
- sizeof(struct bgp_ip_prefix
);
1369 /* skip over unf_len */
1370 data
+= sizeof(unf_len
);
1371 len
+= sizeof(unf_len
);
1373 memset(peer
->outbuf
->packet
.header
.marker
, 0xff,
1374 sizeof(peer
->outbuf
->packet
.header
.marker
));
1376 peer
->outbuf
->packet
.header
.type
= BGP_MSG_UPDATE
;
1378 peer
->update_routes
= 0; /* tentatively clear */
1380 /* find differences */
1381 while ((have
|| want
) && data
< (max
- sizeof(struct bgp_ip_prefix
)))
1385 ? memcmp(&have
->dest
, &want
->dest
, sizeof(have
->dest
))
1390 if (s
< 0) /* found one to delete */
1392 struct bgp_route_list
*tmp
= have
;
1395 s
= BGP_IP_PREFIX_SIZE(tmp
->dest
);
1396 memcpy(data
, &tmp
->dest
, s
);
1401 LOG(5, 0, 0, "Withdrawing route %s/%d from BGP peer %s\n",
1402 fmtaddr(tmp
->dest
.prefix
, 0), tmp
->dest
.len
, peer
->name
);
1409 peer
->routes
= have
;
1415 e
= have
; /* stash the last found to relink above */
1419 else if (s
> 0) /* addition reqd. */
1423 peer
->update_routes
= 1; /* only one add per packet */
1437 peer
->update_routes
= 1; /* more to do */
1439 /* anything changed? */
1440 if (!(unf_len
|| add
))
1443 /* go back and insert unf_len */
1444 unf_len
= htons(unf_len
);
1445 memcpy(&peer
->outbuf
->packet
.data
, &unf_len
, sizeof(unf_len
));
1449 if (!(e
= malloc(sizeof(*e
))))
1451 LOG(0, 0, 0, "Can't allocate route for %s/%d (%s)\n",
1452 fmtaddr(add
->dest
.prefix
, 0), add
->dest
.len
, strerror(errno
));
1457 memcpy(e
, add
, sizeof(*e
));
1459 peer
->routes
= bgp_insert_route(peer
->routes
, e
);
1461 attr_len
= htons(peer
->path_attr_len
);
1462 memcpy(data
, &attr_len
, sizeof(attr_len
));
1463 data
+= sizeof(attr_len
);
1464 len
+= sizeof(attr_len
);
1466 memcpy(data
, peer
->path_attrs
, peer
->path_attr_len
);
1467 data
+= peer
->path_attr_len
;
1468 len
+= peer
->path_attr_len
;
1470 s
= BGP_IP_PREFIX_SIZE(add
->dest
);
1471 memcpy(data
, &add
->dest
, s
);
1475 LOG(5, 0, 0, "Advertising route %s/%d to BGP peer %s\n",
1476 fmtaddr(add
->dest
.prefix
, 0), add
->dest
.len
, peer
->name
);
1481 memcpy(data
, &attr_len
, sizeof(attr_len
));
1482 data
+= sizeof(attr_len
);
1483 len
+= sizeof(attr_len
);
1486 peer
->outbuf
->packet
.header
.len
= htons(len
);
1487 peer
->outbuf
->done
= 0;
1489 return bgp_write(peer
);
1492 /* send/buffer UPDATE message for IPv6 routes */
1493 static int bgp_send_update6(struct bgp_peer
*peer
)
1497 /* send/buffer NOTIFICATION message */
1498 static int bgp_send_notification(struct bgp_peer
*peer
, uint8_t code
,
1501 return bgp_send_notification_full(peer
, code
, subcode
, NULL
, 0);
1504 static int bgp_send_notification_full(struct bgp_peer
*peer
, uint8_t code
,
1505 uint8_t subcode
, char *notification_data
, uint16_t data_len
)
1507 struct bgp_data_notification data
;
1510 data
.error_code
= code
;
1511 len
+= sizeof(data
.error_code
);
1513 data
.error_subcode
= subcode
;
1514 len
+= sizeof(data
.error_code
);
1516 memcpy(data
.data
, notification_data
, data_len
);
1519 memset(peer
->outbuf
->packet
.header
.marker
, 0xff,
1520 sizeof(peer
->outbuf
->packet
.header
.marker
));
1522 peer
->outbuf
->packet
.header
.type
= BGP_MSG_NOTIFICATION
;
1523 peer
->outbuf
->packet
.header
.len
=
1524 htons(sizeof(peer
->outbuf
->packet
.header
) + len
);
1526 memcpy(peer
->outbuf
->packet
.data
, &data
, len
);
1528 peer
->outbuf
->done
= 0;
1529 peer
->next_state
= code
== BGP_ERR_CEASE
? Disabled
: Idle
;
1531 /* we're dying; ignore any pending input */
1532 peer
->inbuf
->packet
.header
.len
= 0;
1533 peer
->inbuf
->done
= 0;
1535 return bgp_write(peer
);