netlink: Always process all responses to a netlink request

A single netlink request can result in multiple response datagrams.  We
process multiple response datagrams in some circumstances, but there are
cases where we exit early and will leave remaining datagrams in the queue.
These will be flushed in nl_send() before we send another request.

This is confusing, and not what we need to reliably check for errors from
netlink operations.  So, instead, make sure we always process all the
response datagrams whenever we send a request (excepting fatal errors).

In most cases this is just a matter of avoiding early exits from nl_foreach
loops.  nl_route_dup() is a bit trickier, because we need to retain all the
routes we're going to try to copy in a single buffer.  Here we instead use
a secondary buffer to flush any remaining datagrams, and report an error
if there are any additional routes in those datagrams.

Link: https://bugs.passt.top/show_bug.cgi?id=67
Link: https://bugs.passt.top/show_bug.cgi?id=60
Signed-off-by: David Gibson <david@gibson.dropbear.id.au>
Signed-off-by: Stefano Brivio <sbrivio@redhat.com>
This commit is contained in:
David Gibson 2023-08-03 17:19:54 +10:00 committed by Stefano Brivio
parent 8de9805224
commit 4d6e9d0816

View file

@ -116,24 +116,9 @@ fail:
static uint16_t nl_send(int s, void *req, uint16_t type, static uint16_t nl_send(int s, void *req, uint16_t type,
uint16_t flags, ssize_t len) uint16_t flags, ssize_t len)
{ {
char flush[NLBUFSIZ];
struct nlmsghdr *nh; struct nlmsghdr *nh;
int done = 0;
ssize_t n; ssize_t n;
while (!done && (n = recv(s, flush, sizeof(flush), MSG_DONTWAIT)) > 0) {
size_t nm = n;
for (nh = (struct nlmsghdr *)flush;
NLMSG_OK(nh, nm); nh = NLMSG_NEXT(nh, nm)) {
if (nh->nlmsg_type == NLMSG_DONE ||
nh->nlmsg_type == NLMSG_ERROR) {
done = 1;
break;
}
}
}
nh = (struct nlmsghdr *)req; nh = (struct nlmsghdr *)req;
nh->nlmsg_type = type; nh->nlmsg_type = type;
nh->nlmsg_flags = NLM_F_REQUEST | NLM_F_ACK | flags; nh->nlmsg_flags = NLM_F_REQUEST | NLM_F_ACK | flags;
@ -269,6 +254,7 @@ unsigned int nl_get_ext_if(int s, sa_family_t af)
.rtm.rtm_type = RTN_UNICAST, .rtm.rtm_type = RTN_UNICAST,
.rtm.rtm_family = af, .rtm.rtm_family = af,
}; };
unsigned int ifi = 0;
struct nlmsghdr *nh; struct nlmsghdr *nh;
struct rtattr *rta; struct rtattr *rta;
char buf[NLBUFSIZ]; char buf[NLBUFSIZ];
@ -280,23 +266,19 @@ unsigned int nl_get_ext_if(int s, sa_family_t af)
nl_foreach_oftype(nh, status, s, buf, seq, RTM_NEWROUTE) { nl_foreach_oftype(nh, status, s, buf, seq, RTM_NEWROUTE) {
struct rtmsg *rtm = (struct rtmsg *)NLMSG_DATA(nh); struct rtmsg *rtm = (struct rtmsg *)NLMSG_DATA(nh);
if (rtm->rtm_dst_len || rtm->rtm_family != af) if (ifi || rtm->rtm_dst_len || rtm->rtm_family != af)
continue; continue;
for (rta = RTM_RTA(rtm), na = RTM_PAYLOAD(nh); RTA_OK(rta, na); for (rta = RTM_RTA(rtm), na = RTM_PAYLOAD(nh); RTA_OK(rta, na);
rta = RTA_NEXT(rta, na)) { rta = RTA_NEXT(rta, na)) {
unsigned int ifi;
if (rta->rta_type != RTA_OIF) if (rta->rta_type != RTA_OIF)
continue; continue;
ifi = *(unsigned int *)RTA_DATA(rta); ifi = *(unsigned int *)RTA_DATA(rta);
}
}
return ifi; return ifi;
}
}
return 0;
} }
/** /**
@ -324,6 +306,7 @@ void nl_route_get_def(int s, unsigned int ifi, sa_family_t af, void *gw)
.ifi = ifi, .ifi = ifi,
}; };
struct nlmsghdr *nh; struct nlmsghdr *nh;
bool found = false;
char buf[NLBUFSIZ]; char buf[NLBUFSIZ];
ssize_t status; ssize_t status;
uint16_t seq; uint16_t seq;
@ -334,7 +317,7 @@ void nl_route_get_def(int s, unsigned int ifi, sa_family_t af, void *gw)
struct rtattr *rta; struct rtattr *rta;
size_t na; size_t na;
if (rtm->rtm_dst_len) if (found || rtm->rtm_dst_len)
continue; continue;
for (rta = RTM_RTA(rtm), na = RTM_PAYLOAD(nh); RTA_OK(rta, na); for (rta = RTM_RTA(rtm), na = RTM_PAYLOAD(nh); RTA_OK(rta, na);
@ -343,7 +326,7 @@ void nl_route_get_def(int s, unsigned int ifi, sa_family_t af, void *gw)
continue; continue;
memcpy(gw, RTA_DATA(rta), RTA_PAYLOAD(rta)); memcpy(gw, RTA_DATA(rta), RTA_PAYLOAD(rta));
return; found = true;
} }
} }
} }
@ -477,6 +460,22 @@ void nl_route_dup(int s_src, unsigned int ifi_src,
} }
} }
if (!NLMSG_OK(nh, status) || status > 0) {
/* Process any remaining datagrams in a different
* buffer so we don't overwrite the first one.
*/
char tail[NLBUFSIZ];
unsigned extra = 0;
nl_foreach_oftype(nh, status, s_src, tail, seq, RTM_NEWROUTE)
extra++;
if (extra) {
err("netlink: Too many routes to duplicate");
return;
}
}
/* Routes might have dependencies between each other, and the kernel /* Routes might have dependencies between each other, and the kernel
* processes RTM_NEWROUTE messages sequentially. For n routes, we might * processes RTM_NEWROUTE messages sequentially. For n routes, we might
* need to send the requests up to n times to get all of them inserted. * need to send the requests up to n times to get all of them inserted.
@ -706,7 +705,6 @@ void nl_link_get_mac(int s, unsigned int ifi, void *mac)
continue; continue;
memcpy(mac, RTA_DATA(rta), ETH_ALEN); memcpy(mac, RTA_DATA(rta), ETH_ALEN);
break;
} }
} }
} }