17765f8de0
Provide an AVX2-based function using compiler intrinsics for TCP/IP-style checksums. The load/unpack/add idea and implementation is largely based on code from BESS (the Berkeley Extensible Software Switch) licensed as 3-Clause BSD, with a number of modifications to further decrease pipeline stalls and to minimise cache pollution. This speeds up considerably data paths from sockets to tap interfaces, decreasing overhead for checksum computation, with 16-64KiB packet buffers, from approximately 11% to 7%. The rest is just syscalls at this point. While at it, provide convenience targets in the Makefile for avx2, avx2_debug, and debug targets -- these simply add target-specific CFLAGS to the build. Signed-off-by: Stefano Brivio <sbrivio@redhat.com>
128 lines
2.9 KiB
C
128 lines
2.9 KiB
C
void err(const char *format, ...);
|
|
void warn(const char *format, ...);
|
|
void info(const char *format, ...);
|
|
|
|
#ifdef DEBUG
|
|
void debug(const char *format, ...);
|
|
#else
|
|
#define debug(...) { }
|
|
#endif
|
|
|
|
#define CHECK_SET_MIN_MAX(basename, fd) \
|
|
do { \
|
|
if ((fd) < basename##min) \
|
|
basename##min = (fd); \
|
|
if ((fd) > basename##max) \
|
|
basename##max = (fd); \
|
|
} while (0)
|
|
|
|
#define CHECK_SET_MIN_MAX_PROTO_FD(proto, ipproto, proto_ctx, fd) \
|
|
do { \
|
|
if ((proto) == (ipproto)) \
|
|
CHECK_SET_MIN_MAX(c->proto_ctx.fd_, (fd)); \
|
|
} while (0)
|
|
|
|
#ifndef MIN
|
|
#define MIN(x, y) (((x) < (y)) ? (x) : (y))
|
|
#endif
|
|
#ifndef MAX
|
|
#define MAX(x, y) (((x) > (y)) ? (x) : (y))
|
|
#endif
|
|
|
|
#define SWAP(a, b) \
|
|
do { \
|
|
typeof(a) __x = (a); (a) = (b); (b) = __x; \
|
|
} while (0) \
|
|
|
|
#define STRINGIFY(x) #x
|
|
#define STR(x) STRINGIFY(x)
|
|
|
|
#define V4 0
|
|
#define V6 1
|
|
#define IP_VERSIONS 2
|
|
|
|
#define ARRAY_SIZE(a) ((int)(sizeof(a) / sizeof((a)[0])))
|
|
|
|
#define IN_INTERVAL(a, b, x) ((x) >= (a) && (x) <= (b))
|
|
#define FD_PROTO(x, proto) \
|
|
(IN_INTERVAL(c->proto.fd_min, c->proto.fd_max, (x)))
|
|
|
|
#define PORT_EPHEMERAL_MIN ((1 << 15) + (1 << 14)) /* RFC 6335 */
|
|
#define PORT_IS_EPHEMERAL(port) ((port) >= PORT_EPHEMERAL_MIN)
|
|
|
|
#define NS_FN_STACK_SIZE (RLIMIT_STACK_VAL * 1024 / 4)
|
|
|
|
#if __BYTE_ORDER == __BIG_ENDIAN
|
|
#define L2_BUF_ETH_IP4_INIT \
|
|
{ \
|
|
.h_dest = { 0 }, \
|
|
.h_source = { 0 }, \
|
|
.h_proto = ETH_P_IP, \
|
|
}
|
|
#else
|
|
#define L2_BUF_ETH_IP4_INIT \
|
|
{ \
|
|
.h_dest = { 0 }, \
|
|
.h_source = { 0 }, \
|
|
.h_proto = __bswap_constant_16(ETH_P_IP), \
|
|
}
|
|
#endif
|
|
|
|
#if __BYTE_ORDER == __BIG_ENDIAN
|
|
#define L2_BUF_ETH_IP6_INIT \
|
|
{ \
|
|
.h_dest = { 0 }, \
|
|
.h_source = { 0 }, \
|
|
.h_proto = ETH_P_IPV6, \
|
|
}
|
|
#else
|
|
#define L2_BUF_ETH_IP6_INIT \
|
|
{ \
|
|
.h_dest = { 0 }, \
|
|
.h_source = { 0 }, \
|
|
.h_proto = __bswap_constant_16(ETH_P_IPV6), \
|
|
}
|
|
#endif
|
|
|
|
#define L2_BUF_IP4_INIT(proto) \
|
|
{ \
|
|
.version = 4, \
|
|
.ihl = 5, \
|
|
.tos = 0, \
|
|
.tot_len = 0, \
|
|
.id = 0, \
|
|
.frag_off = 0, \
|
|
.ttl = 255, \
|
|
.protocol = (proto), \
|
|
.saddr = 0, \
|
|
.daddr = 0, \
|
|
}
|
|
|
|
#define L2_BUF_IP6_INIT(proto) \
|
|
{ \
|
|
.priority = 0, \
|
|
.version = 6, \
|
|
.flow_lbl = { 0 }, \
|
|
.payload_len = 0, \
|
|
.nexthdr = (proto), \
|
|
.hop_limit = 255, \
|
|
.saddr = IN6ADDR_ANY_INIT, \
|
|
.daddr = IN6ADDR_ANY_INIT, \
|
|
}
|
|
|
|
#include <linux/ipv6.h>
|
|
#include <net/if.h>
|
|
#include <linux/ip.h>
|
|
#include <limits.h>
|
|
|
|
struct ctx;
|
|
|
|
char *ipv6_l4hdr(struct ipv6hdr *ip6h, uint8_t *proto);
|
|
int sock_l4(struct ctx *c, int af, uint8_t proto, uint16_t port, int lo,
|
|
uint32_t data);
|
|
int timespec_diff_ms(struct timespec *a, struct timespec *b);
|
|
void bitmap_set(uint8_t *map, int bit);
|
|
void bitmap_clear(uint8_t *map, int bit);
|
|
int bitmap_isset(uint8_t *map, int bit);
|
|
void procfs_scan_listen(char *name, uint8_t *map);
|
|
int ns_enter(int target_pid);
|