diff options
| author | Donald Sharp <sharpd@cumulusnetworks.com> | 2016-03-31 08:20:53 -0400 |
|---|---|---|
| committer | Donald Sharp <sharpd@cumulusnetworks.com> | 2016-03-31 08:20:53 -0400 |
| commit | 6c12c8ab7629d5b1f11595bf779a1ebb5ba09746 (patch) | |
| tree | 414ba386b4b870e8b988d0292dd04c68ede8d90f | |
| parent | 0974ce9a0d7401829000acae071422888cbd572b (diff) | |
zebra: Fix Startup with > 1k interfaces
Zebra in rt_netlink.c has a while (1) loop that handles
recvmsg from the netlink socket. In early bootup a
situation can occur whereby the netlink messages
take a long time to parse. The parsing time grows
exponentially with the number of netlink
messages that are read in. Eventually a point is reached
where the incoming netlink messages are
arriving at about the same rate that they are processed.
This ends up causing the while (1) loop to never exit.
Eventually this causes quagga to fail when the watchdog message
is never sent to systemd.
This patch attempts to address this deficiency by
pausing the reading of netlink messages
so that other work can be done. This pause drains
the work queue items created by the netlink received
data and allows zebra to respond to other system input.
I believe we will need to come back in and modify zebra
startup a bit more. There are inefficiencies that need
to be addressed as part of boot up.
Ticket: CM-9992
Signed-off-by: Donald Sharp <sharpd@cumulusnetworks.com>
Reviewed-by: Don Slice <dslice@cumulusnetworks.com>
Reviewed-by: Wilson Kok <wkok@cumulusnetworks.com>
| -rw-r--r-- | zebra/rt_netlink.c | 23 |
1 files changed, 14 insertions, 9 deletions
diff --git a/zebra/rt_netlink.c b/zebra/rt_netlink.c index b95ef8462b..5686d8e528 100644 --- a/zebra/rt_netlink.c +++ b/zebra/rt_netlink.c @@ -290,11 +290,12 @@ vrf_lookup_by_table (u_int32_t table_id) static int netlink_parse_info (int (*filter) (struct sockaddr_nl *, struct nlmsghdr *, ns_id_t), - struct nlsock *nl, struct zebra_ns *zns) + struct nlsock *nl, struct zebra_ns *zns, int count) { int status; int ret = 0; int error; + int read_in = 0; while (1) { @@ -312,6 +313,9 @@ netlink_parse_info (int (*filter) (struct sockaddr_nl *, struct nlmsghdr *, }; struct nlmsghdr *h; + if (count && read_in >= count) + return 0; + status = recvmsg (nl->sock, &msg, 0); if (status < 0) { @@ -336,7 +340,8 @@ netlink_parse_info (int (*filter) (struct sockaddr_nl *, struct nlmsghdr *, nl->name, msg.msg_namelen); return -1; } - + + read_in++; for (h = (struct nlmsghdr *) buf; NLMSG_OK (h, (unsigned int) status); h = NLMSG_NEXT (h, status)) { @@ -1464,7 +1469,7 @@ interface_lookup_netlink (struct zebra_ns *zns) ret = netlink_request (AF_PACKET, RTM_GETLINK, &zns->netlink_cmd); if (ret < 0) return ret; - ret = netlink_parse_info (netlink_interface, &zns->netlink_cmd, zns); + ret = netlink_parse_info (netlink_interface, &zns->netlink_cmd, zns, 0); if (ret < 0) return ret; @@ -1472,7 +1477,7 @@ interface_lookup_netlink (struct zebra_ns *zns) ret = netlink_request (AF_INET, RTM_GETADDR, &zns->netlink_cmd); if (ret < 0) return ret; - ret = netlink_parse_info (netlink_interface_addr, &zns->netlink_cmd, zns); + ret = netlink_parse_info (netlink_interface_addr, &zns->netlink_cmd, zns, 0); if (ret < 0) return ret; @@ -1481,7 +1486,7 @@ interface_lookup_netlink (struct zebra_ns *zns) ret = netlink_request (AF_INET6, RTM_GETADDR, &zns->netlink_cmd); if (ret < 0) return ret; - ret = netlink_parse_info (netlink_interface_addr, &zns->netlink_cmd, zns); + ret = netlink_parse_info (netlink_interface_addr, &zns->netlink_cmd, zns, 0); if (ret < 0) return ret; #endif /* HAVE_IPV6 */ @@ -1500,7 
+1505,7 @@ netlink_route_read (struct zebra_ns *zns) ret = netlink_request (AF_INET, RTM_GETROUTE, &zns->netlink_cmd); if (ret < 0) return ret; - ret = netlink_parse_info (netlink_routing_table, &zns->netlink_cmd, zns); + ret = netlink_parse_info (netlink_routing_table, &zns->netlink_cmd, zns, 0); if (ret < 0) return ret; @@ -1509,7 +1514,7 @@ netlink_route_read (struct zebra_ns *zns) ret = netlink_request (AF_INET6, RTM_GETROUTE, &zns->netlink_cmd); if (ret < 0) return ret; - ret = netlink_parse_info (netlink_routing_table, &zns->netlink_cmd, zns); + ret = netlink_parse_info (netlink_routing_table, &zns->netlink_cmd, zns, 0); if (ret < 0) return ret; #endif /* HAVE_IPV6 */ @@ -1642,7 +1647,7 @@ netlink_talk (struct nlmsghdr *n, struct nlsock *nl, struct zebra_ns *zns) * Get reply from netlink socket. * The reply should either be an acknowlegement or an error. */ - return netlink_parse_info (netlink_talk_filter, nl, zns); + return netlink_parse_info (netlink_talk_filter, nl, zns, 0); } /* Routing table change via netlink interface. */ @@ -2471,7 +2476,7 @@ static int kernel_read (struct thread *thread) { struct zebra_ns *zns = (struct zebra_ns *)THREAD_ARG (thread); - netlink_parse_info (netlink_information_fetch, &zns->netlink, zns); + netlink_parse_info (netlink_information_fetch, &zns->netlink, zns, 5); zns->t_netlink = thread_add_read (zebrad.master, kernel_read, zns, zns->netlink.sock); |
