38b50dba47
Avoid a bunch of syscalls on forwarding paths by: - storing minimum and maximum file descriptor numbers for each protocol, fall back to SO_PROTOCOL query only on overlaps - allocating a larger receive buffer -- this can result in more coalesced packets than sendmmsg() can take (UIO_MAXIOV, i.e. 1024), so make sure we don't exceed that within a single call to protocol tap handlers - nesting the handling loop in tap_handler() in the receive loop, so that we have better chances of filling our receive buffer in fewer calls - skipping the recvfrom() in the UDP handler on EPOLLERR -- there's nothing to be done in that case and while at it: - restore the 20ms timer interval for periodic (TCP) events, I accidentally changed that to 100ms in an earlier commit - attempt using SO_ZEROCOPY for UDP -- if it's not available, sendmmsg() will succeed anyway - fix the handling of the status code from sendmmsg(), if it fails, we'll try to discard the first message, hence return 1 from the UDP handler Signed-off-by: Stefano Brivio <sbrivio@redhat.com>
148 lines
3.5 KiB
C
148 lines
3.5 KiB
C
// SPDX-License-Identifier: AGPL-3.0-or-later
|
|
|
|
/* PASST - Plug A Simple Socket Transport
|
|
*
|
|
* icmp.c - ICMP/ICMPv6 echo proxy
|
|
*
|
|
* Copyright (c) 2021 Red Hat GmbH
|
|
* Author: Stefano Brivio <sbrivio@redhat.com>
|
|
*
|
|
*/
|
|
|
|
#include <stdio.h>
|
|
#include <errno.h>
|
|
#include <limits.h>
|
|
#include <net/ethernet.h>
|
|
#include <net/if.h>
|
|
#include <netinet/in.h>
|
|
#include <stdint.h>
|
|
#include <stddef.h>
|
|
#include <string.h>
|
|
#include <sys/epoll.h>
|
|
#include <sys/types.h>
|
|
#include <sys/socket.h>
|
|
#include <unistd.h>
|
|
#include <linux/ip.h>
|
|
#include <linux/ipv6.h>
|
|
#include <linux/icmp.h>
|
|
#include <linux/icmpv6.h>
|
|
#include <time.h>
|
|
|
|
#include "passt.h"
|
|
#include "tap.h"
|
|
#include "util.h"
|
|
#include "icmp.h"
|
|
|
|
/**
|
|
* icmp_sock_handler() - Handle new data from socket
|
|
* @c: Execution context
|
|
* @s: File descriptor number for socket
|
|
* @events: epoll events bitmap
|
|
*/
|
|
void icmp_sock_handler(struct ctx *c, int s, uint32_t events)
|
|
{
|
|
struct in6_addr a6 = { .s6_addr = { 0, 0, 0, 0,
|
|
0, 0, 0, 0,
|
|
0, 0, 0xff, 0xff,
|
|
0, 0, 0, 0 } };
|
|
struct sockaddr_storage sr, sl;
|
|
socklen_t slen = sizeof(sr);
|
|
char buf[USHRT_MAX];
|
|
ssize_t n;
|
|
|
|
(void)events;
|
|
|
|
n = recvfrom(s, buf, sizeof(buf), MSG_DONTWAIT,
|
|
(struct sockaddr *)&sr, &slen);
|
|
if (n < 0)
|
|
return;
|
|
|
|
if (getsockname(s, (struct sockaddr *)&sl, &slen))
|
|
return;
|
|
|
|
if (sl.ss_family == AF_INET) {
|
|
struct sockaddr_in *sr4 = (struct sockaddr_in *)&sr;
|
|
|
|
memcpy(&a6.s6_addr[12], &sr4->sin_addr, sizeof(sr4->sin_addr));
|
|
|
|
tap_ip_send(c, &a6, IPPROTO_ICMP, buf, n);
|
|
} else if (sl.ss_family == AF_INET6) {
|
|
struct sockaddr_in6 *sr6 = (struct sockaddr_in6 *)&sr;
|
|
|
|
tap_ip_send(c, &sr6->sin6_addr, IPPROTO_ICMPV6, buf, n);
|
|
}
|
|
}
|
|
|
|
/**
|
|
* icmp_tap_handler() - Handle packets from tap
|
|
* @c: Execution context
|
|
* @af: Address family, AF_INET or AF_INET6
|
|
* @msg: Input message
|
|
* @count: Message count (always 1 for ICMP)
|
|
*
|
|
* Return: count of consumed packets (always 1, even if malformed)
|
|
*/
|
|
int icmp_tap_handler(struct ctx *c, int af, void *addr,
|
|
struct tap_msg *msg, int count)
|
|
{
|
|
(void)count;
|
|
|
|
if (af == AF_INET) {
|
|
struct icmphdr *ih = (struct icmphdr *)msg[0].l4h;
|
|
struct sockaddr_in sa = {
|
|
.sin_family = AF_INET,
|
|
.sin_addr.s_addr = htonl(INADDR_ANY),
|
|
};
|
|
|
|
if (msg[0].l4_len < sizeof(*ih) || ih->type != ICMP_ECHO)
|
|
return 1;
|
|
|
|
sa.sin_port = ih->un.echo.id;
|
|
bind(c->icmp.s4, (struct sockaddr *)&sa, sizeof(sa));
|
|
|
|
sa.sin_addr = *(struct in_addr *)addr;
|
|
sendto(c->icmp.s4, msg[0].l4h, msg[0].l4_len,
|
|
MSG_DONTWAIT | MSG_NOSIGNAL,
|
|
(struct sockaddr *)&sa, sizeof(sa));
|
|
} else if (af == AF_INET6) {
|
|
struct sockaddr_in6 sa = {
|
|
.sin6_family = AF_INET6,
|
|
.sin6_addr = IN6ADDR_ANY_INIT,
|
|
};
|
|
struct icmp6hdr *ih = (struct icmp6hdr *)msg[0].l4h;
|
|
|
|
if (msg[0].l4_len < sizeof(*ih) ||
|
|
(ih->icmp6_type != 128 && ih->icmp6_type != 129))
|
|
return 1;
|
|
|
|
sa.sin6_port = ih->icmp6_identifier;
|
|
bind(c->icmp.s6, (struct sockaddr *)&sa, sizeof(sa));
|
|
|
|
sa.sin6_addr = *(struct in6_addr *)addr;
|
|
sendto(c->icmp.s6, msg[0].l4h, msg[0].l4_len,
|
|
MSG_DONTWAIT | MSG_NOSIGNAL,
|
|
(struct sockaddr *)&sa, sizeof(sa));
|
|
}
|
|
|
|
return 1;
|
|
}
|
|
|
|
/**
|
|
* icmp_sock_init() - Create ICMP, ICMPv6 sockets for echo requests and replies
|
|
* @c: Execution context
|
|
*
|
|
* Return: 0 on success, -1 on failure
|
|
*/
|
|
int icmp_sock_init(struct ctx *c)
|
|
{
|
|
c->icmp.fd_min = INT_MAX;
|
|
c->icmp.fd_max = 0;
|
|
|
|
if (c->v4 && (c->icmp.s4 = sock_l4_add(c, 4, IPPROTO_ICMP, 0)) < 0)
|
|
return -1;
|
|
|
|
if (c->v6 && (c->icmp.s6 = sock_l4_add(c, 6, IPPROTO_ICMPV6, 0)) < 0)
|
|
return -1;
|
|
|
|
return 0;
|
|
}
|